# Makefile.am
  1. # StarPU --- Runtime system for heterogeneous multicore architectures.
  2. #
  3. # Copyright (C) 2009-2020 Université de Bordeaux, CNRS (LaBRI UMR 5800), Inria
  4. #
  5. # StarPU is free software; you can redistribute it and/or modify
  6. # it under the terms of the GNU Lesser General Public License as published by
  7. # the Free Software Foundation; either version 2.1 of the License, or (at
  8. # your option) any later version.
  9. #
  10. # StarPU is distributed in the hope that it will be useful, but
  11. # WITHOUT ANY WARRANTY; without even the implied warranty of
  12. # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
  13. #
  14. # See the GNU Lesser General Public License in COPYING.LGPL for more details.
  15. #
  16. include $(top_srcdir)/starpu.mk
  17. AM_CFLAGS = $(HWLOC_CFLAGS) $(FXT_CFLAGS) -Wall $(STARPU_CUDA_CPPFLAGS) $(STARPU_OPENCL_CPPFLAGS) $(STARPU_FPGA_CPPFLAGS) $(STARPU_COI_CPPFLAGS) $(STARPU_SCIF_CPPFLAGS) $(GLOBAL_AM_CFLAGS) -Wno-unused
  18. AM_CXXFLAGS = $(HWLOC_CFLAGS) $(FXT_CFLAGS) -Wall $(STARPU_CUDA_CPPFLAGS) $(STARPU_OPENCL_CPPFLAGS) $(STARPU_COI_CPPFLAGS) $(STARPU_SCIF_CPPFLAGS) $(GLOBAL_AM_CXXFLAGS) -Wno-unused
  19. AM_CPPFLAGS = -I$(top_srcdir)/include/ -I$(top_builddir)/src -I$(top_srcdir)/src/
  20. AM_LDFLAGS = @STARPU_EXPORT_DYNAMIC@
  21. LIBS += $(top_builddir)/src/@LIBSTARPU_LINK@ $(HWLOC_LIBS) $(FXT_LIBS)
  22. LIBS += $(STARPU_OPENCL_LDFLAGS) $(STARPU_CUDA_LDFLAGS) $(STARPU_COI_LDFLAGS) $(STARPU_SCIF_LDFLAGS) $(FXT_LDFLAGS)
  23. EXTRA_DIST = \
  24. helper.h \
  25. datawizard/locality.sh \
  26. main/increment_codelet.h \
  27. overlap/overlap.sh \
  28. datawizard/scal.h \
  29. datawizard/mpi_like.h \
  30. regression/profiles.in \
  31. regression/regression.sh.in \
  32. regression/profiles.build.only.in \
  33. microbenchs/tasks_data_overhead.sh \
  34. microbenchs/sync_tasks_data_overhead.sh \
  35. microbenchs/async_tasks_data_overhead.sh \
  36. microbenchs/tasks_size_overhead.sh \
  37. microbenchs/tasks_size_overhead_sched.sh \
  38. microbenchs/tasks_size_overhead_scheds.sh \
  39. microbenchs/tasks_size_overhead.gp \
  40. microbenchs/parallel_dependent_homogeneous_tasks_data.sh \
  41. microbenchs/parallel_independent_heterogeneous_tasks_data.sh \
  42. microbenchs/parallel_independent_heterogeneous_tasks.sh \
  43. microbenchs/parallel_independent_homogeneous_tasks_data.sh \
  44. microbenchs/parallel_independent_homogeneous_tasks.sh \
  45. microbenchs/bandwidth_scheds.sh \
  46. energy/static.sh \
  47. energy/dynamic.sh \
  48. energy/perfs.gp \
  49. datawizard/scratch_opencl_kernel.cl \
  50. datawizard/sync_and_notify_data_opencl_codelet.cl\
  51. datawizard/opencl_codelet_unsigned_inc_kernel.cl \
  52. coverage/coverage.sh \
  53. datawizard/acquire_release_opencl_kernel.cl \
  54. datawizard/interfaces/test_interfaces.h \
  55. datawizard/interfaces/bcsr/bcsr_opencl_kernel.cl \
  56. datawizard/interfaces/coo/coo_opencl_kernel.cl \
  57. datawizard/interfaces/matrix/matrix_opencl_kernel.cl \
  58. datawizard/interfaces/variable/variable_opencl_kernel.cl \
  59. datawizard/interfaces/vector/vector_opencl_kernel.cl \
  60. datawizard/interfaces/multiformat/multiformat_types.h \
  61. datawizard/interfaces/multiformat/multiformat_opencl_kernel.cl \
  62. datawizard/interfaces/multiformat/multiformat_conversion_codelets_kernel.cl \
  63. datawizard/interfaces/multiformat/advanced/generic.h \
  64. datawizard/interfaces/csr/csr_opencl_kernel.cl \
  65. datawizard/interfaces/block/block_opencl_kernel.cl \
  66. datawizard/interfaces/tensor/tensor_opencl_kernel.cl \
  67. perfmodels/opencl_memset_kernel.cl \
  68. $(MICROBENCHS:=.sh) \
  69. microbenchs/microbench.sh
  70. CLEANFILES = \
  71. *.gcno *.gcda *.linkinfo core starpu_idle_microsec.log *.mod *.png *.output tasks.rec perfs.rec */perfs.rec */*/perfs.rec perfs2.rec fortran90/starpu_mod.f90 bandwidth-*.dat bandwidth.gp bandwidth.eps bandwidth.svg
  72. BUILT_SOURCES =
  73. SUBDIRS =
  74. examplebindir = $(libdir)/starpu/examples
  75. if STARPU_USE_OPENCL
  76. nobase_STARPU_OPENCL_DATA_DATA =
  77. endif
  78. if STARPU_USE_CUDA
  79. if STARPU_COVERITY
  80. include $(top_srcdir)/starpu-mynvcc.mk
  81. else
  82. NVCCFLAGS += --compiler-options -fno-strict-aliasing $(AM_CPPFLAGS) -I$(top_builddir)/include $(HWLOC_CFLAGS) $(SIMGRID_CFLAGS)
  83. .cu.cubin:
  84. $(V_nvcc) $(NVCC) -cubin $< -o $@ $(NVCCFLAGS)
  85. .cu.o:
  86. $(V_nvcc) $(NVCC) $< -c -o $@ $(NVCCFLAGS)
  87. endif
  88. endif
  89. testbindir = $(libdir)/starpu/tests
  90. #####################################
  91. # What to install and what to check #
  92. #####################################
  93. noinst_PROGRAMS =
  94. if !STARPU_HAVE_WINDOWS
  95. ## test loader program
  96. if !STARPU_CROSS_COMPILING
  97. LOADER = loader
  98. LOADER_BIN = $(abs_top_builddir)/tests/$(LOADER)
  99. noinst_PROGRAMS += loader
  100. else
  101. LOADER =
  102. LOADER_BIN = $(top_builddir)/tests/loader-cross.sh
  103. endif
  104. if STARPU_USE_MPI_MASTER_SLAVE
  105. LOADER_BIN2 = $(MPI_LAUNCHER) $(LOADER_BIN)
  106. else
  107. LOADER_BIN2 = $(LOADER_BIN)
  108. endif
  109. if STARPU_HAVE_AM111
  110. TESTS_ENVIRONMENT = $(MPI_RUN_ARGS) top_builddir="$(abs_top_builddir)" top_srcdir="$(abs_top_srcdir)"
  111. LOG_COMPILER = $(LOADER_BIN2)
  112. else
  113. TESTS_ENVIRONMENT = $(MPI_RUN_ARGS) top_builddir="$(abs_top_builddir)" top_srcdir="$(abs_top_srcdir)" $(LOADER_BIN2)
  114. endif
  115. endif
  116. TESTS = $(SHELL_TESTS) $(myPROGRAMS)
  117. SHELL_TESTS =
  118. if STARPU_COVERAGE_ENABLED
  119. SHELL_TESTS += coverage/coverage.sh
  120. endif
  121. XFAIL_TESTS = \
  122. errorcheck/invalid_blocking_calls
  123. myPROGRAMS =
  124. myPROGRAMS += \
  125. main/callback \
  126. main/bind \
  127. main/mkdtemp \
  128. main/execute_schedule \
  129. main/insert_task_pack \
  130. main/insert_task_nullcodelet \
  131. main/multithreaded_init \
  132. main/empty_task \
  133. main/empty_task_chain \
  134. main/starpu_worker_exists \
  135. main/codelet_null_callback \
  136. datawizard/allocate \
  137. datawizard/acquire_cb \
  138. datawizard/deps \
  139. datawizard/user_interaction_implicit \
  140. datawizard/interfaces/copy_interfaces \
  141. datawizard/numa_overflow \
  142. datawizard/locality \
  143. datawizard/variable_size \
  144. errorcheck/starpu_init_noworker \
  145. errorcheck/invalid_tasks \
  146. helper/cublas_init \
  147. helper/cusparse_init \
  148. helper/pinned_memory \
  149. helper/execute_on_all \
  150. microbenchs/display_structures_size \
  151. microbenchs/local_pingpong \
  152. overlap/overlap \
  153. sched_ctx/sched_ctx_list \
  154. sched_ctx/sched_ctx_policy_data \
  155. openmp/init_exit_01 \
  156. openmp/init_exit_02 \
  157. openmp/environment \
  158. openmp/api_01 \
  159. openmp/parallel_01 \
  160. openmp/parallel_02 \
  161. openmp/parallel_03 \
  162. openmp/parallel_barrier_01 \
  163. openmp/parallel_master_01 \
  164. openmp/parallel_master_inline_01 \
  165. openmp/parallel_single_wait_01 \
  166. openmp/parallel_single_nowait_01 \
  167. openmp/parallel_single_inline_01 \
  168. openmp/parallel_single_copyprivate_01 \
  169. openmp/parallel_single_copyprivate_inline_01 \
  170. openmp/parallel_critical_01 \
  171. openmp/parallel_critical_inline_01 \
  172. openmp/parallel_critical_named_01 \
  173. openmp/parallel_critical_named_inline_01\
  174. openmp/parallel_simple_lock_01 \
  175. openmp/parallel_nested_lock_01 \
  176. openmp/parallel_for_01 \
  177. openmp/parallel_for_02 \
  178. openmp/parallel_for_ordered_01 \
  179. openmp/parallel_sections_01 \
  180. openmp/parallel_sections_combined_01 \
  181. openmp/task_01 \
  182. openmp/task_02 \
  183. openmp/task_03 \
  184. openmp/taskloop \
  185. openmp/taskwait_01 \
  186. openmp/taskgroup_01 \
  187. openmp/taskgroup_02 \
  188. openmp/array_slice_01 \
  189. openmp/cuda_task_01 \
  190. perfmodels/value_nan
  191. if STARPU_SIMGRID
  192. myPROGRAMS += \
  193. energy/energy_efficiency \
  194. datawizard/simgrid-locality
  195. endif
  196. if !STARPU_SIMGRID
  197. myPROGRAMS += \
  198. main/deprecated_func \
  199. main/driver_api/init_run_deinit \
  200. main/driver_api/run_driver \
  201. main/deploop \
  202. main/display_binding \
  203. main/execute_on_a_specific_worker \
  204. main/insert_task \
  205. main/insert_task_value \
  206. main/insert_task_dyn_handles \
  207. main/insert_task_array \
  208. main/insert_task_many \
  209. main/insert_task_where \
  210. main/multithreaded \
  211. main/starpu_task_bundle \
  212. main/starpu_task_wait_for_all \
  213. main/starpu_task_wait \
  214. main/static_restartable \
  215. main/static_restartable_using_initializer\
  216. main/static_restartable_tag \
  217. main/regenerate \
  218. main/regenerate_pipeline \
  219. main/restart \
  220. main/wait_all_regenerable_tasks \
  221. main/subgraph_repeat \
  222. main/subgraph_repeat_tag \
  223. main/subgraph_repeat_regenerate \
  224. main/subgraph_repeat_regenerate_tag \
  225. main/subgraph_repeat_regenerate_tag_cycle \
  226. main/empty_task_sync_point \
  227. main/empty_task_sync_point_tasks \
  228. main/tag_wait_api \
  229. main/tag_get_task \
  230. main/task_wait_api \
  231. main/declare_deps_in_callback \
  232. main/declare_deps_after_submission \
  233. main/declare_deps_after_submission_synchronous \
  234. main/get_current_task \
  235. main/starpu_init \
  236. main/submit \
  237. main/pause_resume \
  238. main/pack \
  239. main/get_children_tasks \
  240. main/hwloc_cpuset \
  241. main/task_end_dep \
  242. datawizard/acquire_cb_insert \
  243. datawizard/acquire_release \
  244. datawizard/acquire_release2 \
  245. datawizard/acquire_release_to \
  246. datawizard/acquire_try \
  247. datawizard/bcsr \
  248. datawizard/cache \
  249. datawizard/commute \
  250. datawizard/commute2 \
  251. datawizard/copy \
  252. datawizard/data_implicit_deps \
  253. datawizard/data_lookup \
  254. datawizard/data_register \
  255. datawizard/scratch \
  256. datawizard/scratch_reuse \
  257. datawizard/sync_and_notify_data \
  258. datawizard/sync_and_notify_data_implicit\
  259. datawizard/dsm_stress \
  260. datawizard/double_parameter \
  261. datawizard/write_only_tmp_buffer \
  262. datawizard/data_invalidation \
  263. datawizard/dining_philosophers \
  264. datawizard/manual_reduction \
  265. datawizard/readers_and_writers \
  266. datawizard/unpartition \
  267. datawizard/sync_with_data_with_mem \
  268. datawizard/sync_with_data_with_mem_non_blocking\
  269. datawizard/sync_with_data_with_mem_non_blocking_implicit\
  270. datawizard/mpi_like \
  271. datawizard/mpi_like_async \
  272. datawizard/critical_section_with_void_interface\
  273. datawizard/increment_init \
  274. datawizard/increment_redux \
  275. datawizard/increment_redux_v2 \
  276. datawizard/increment_redux_lazy \
  277. datawizard/handle_to_pointer \
  278. datawizard/lazy_allocation \
  279. datawizard/lazy_unregister \
  280. datawizard/no_unregister \
  281. datawizard/noreclaim \
  282. datawizard/nowhere \
  283. datawizard/interfaces/block/block_interface \
  284. datawizard/interfaces/bcsr/bcsr_interface \
  285. datawizard/interfaces/coo/coo_interface \
  286. datawizard/interfaces/csr/csr_interface \
  287. datawizard/interfaces/matrix/matrix_interface \
  288. datawizard/interfaces/multiformat/multiformat_interface \
  289. datawizard/interfaces/multiformat/advanced/multiformat_cuda_opencl \
  290. datawizard/interfaces/multiformat/advanced/multiformat_data_release \
  291. datawizard/interfaces/multiformat/advanced/multiformat_worker \
  292. datawizard/interfaces/multiformat/advanced/multiformat_handle_conversion \
  293. datawizard/interfaces/multiformat/advanced/same_handle \
  294. datawizard/interfaces/tensor/tensor_interface \
  295. datawizard/interfaces/variable/variable_interface \
  296. datawizard/interfaces/vector/vector_interface \
  297. datawizard/interfaces/void/void_interface \
  298. datawizard/in_place_partition \
  299. datawizard/partition_dep \
  300. datawizard/partition_lazy \
  301. datawizard/partition_init \
  302. datawizard/partition_wontuse \
  303. datawizard/gpu_register \
  304. datawizard/gpu_ptr_register \
  305. datawizard/variable_parameters \
  306. datawizard/wt_host \
  307. datawizard/wt_broadcast \
  308. datawizard/readonly \
  309. datawizard/specific_node \
  310. datawizard/task_with_multiple_time_the_same_handle \
  311. datawizard/test_arbiter \
  312. datawizard/invalidate_pending_requests \
  313. datawizard/temporary_partition \
  314. datawizard/temporary_partition_implicit \
  315. datawizard/redux_acquire \
  316. disk/disk_copy \
  317. disk/disk_copy_unpack \
  318. disk/disk_copy_to_disk \
  319. disk/disk_compute \
  320. disk/disk_pack \
  321. disk/mem_reclaim \
  322. errorcheck/invalid_blocking_calls \
  323. errorcheck/workers_cpuid \
  324. fault-tolerance/retry \
  325. helper/starpu_data_cpy \
  326. helper/starpu_data_dup_ro \
  327. helper/starpu_create_sync_task \
  328. microbenchs/async_tasks_overhead \
  329. microbenchs/sync_tasks_overhead \
  330. microbenchs/tasks_overhead \
  331. microbenchs/tasks_size_overhead \
  332. microbenchs/prefetch_data_on_node \
  333. microbenchs/redundant_buffer \
  334. microbenchs/matrix_as_vector \
  335. microbenchs/bandwidth \
  336. overlap/gpu_concurrency \
  337. parallel_tasks/explicit_combined_worker \
  338. parallel_tasks/parallel_kernels \
  339. parallel_tasks/parallel_kernels_trivial \
  340. parallel_tasks/parallel_kernels_spmd \
  341. parallel_tasks/spmd_peager \
  342. parallel_tasks/cuda_only \
  343. perfmodels/regression_based_memset \
  344. perfmodels/regression_based_check \
  345. perfmodels/regression_based_multiimpl \
  346. perfmodels/regression_based_energy \
  347. perfmodels/regression_based_gpu \
  348. perfmodels/non_linear_regression_based \
  349. perfmodels/feed \
  350. perfmodels/user_base \
  351. perfmodels/valid_model \
  352. perfmodels/memory \
  353. sched_policies/data_locality \
  354. sched_policies/execute_all_tasks \
  355. sched_policies/prio \
  356. sched_policies/simple_deps \
  357. sched_policies/simple_cpu_gpu_sched \
  358. sched_ctx/sched_ctx_hierarchy
  359. if STARPU_USE_FPGA
  360. myPROGRAMS += \
  361. fpga/max_fpga
  362. endif
  363. endif
  364. MICROBENCHS = \
  365. microbenchs/parallel_independent_homogeneous_tasks \
  366. microbenchs/parallel_independent_heterogeneous_tasks \
  367. microbenchs/parallel_independent_homogeneous_tasks_data \
  368. microbenchs/parallel_independent_heterogeneous_tasks_data \
  369. microbenchs/parallel_redux_homogeneous_tasks_data \
  370. microbenchs/parallel_redux_heterogeneous_tasks_data \
  371. microbenchs/parallel_dependent_homogeneous_tasks_data
  372. if STARPU_HAVE_FC
  373. if !STARPU_SANITIZE
  374. if !STARPU_SIMGRID
  375. myPROGRAMS += \
  376. fortran90/init_01
  377. endif
  378. endif
  379. endif
  380. if !STARPU_SIMGRID
  381. if STARPU_LONG_CHECK
  382. myPROGRAMS += \
  383. main/tag_task_data_deps \
  384. datawizard/reclaim
  385. endif
  386. endif
  387. examplebin_PROGRAMS = \
  388. microbenchs/async_tasks_overhead \
  389. microbenchs/sync_tasks_overhead \
  390. microbenchs/tasks_overhead \
  391. microbenchs/tasks_size_overhead \
  392. microbenchs/local_pingpong
  393. examplebin_SCRIPTS = \
  394. microbenchs/tasks_data_overhead.sh \
  395. microbenchs/sync_tasks_data_overhead.sh \
  396. microbenchs/async_tasks_data_overhead.sh \
  397. microbenchs/tasks_size_overhead.gp \
  398. microbenchs/tasks_size_overhead.sh
  399. if !STARPU_SIMGRID
  400. if !STARPU_USE_MPI_MASTER_SLAVE
  401. examplebin_PROGRAMS += \
  402. microbenchs/bandwidth
  403. SHELL_TESTS += \
  404. microbenchs/tasks_data_overhead.sh \
  405. microbenchs/sync_tasks_data_overhead.sh \
  406. microbenchs/async_tasks_data_overhead.sh \
  407. microbenchs/tasks_size_overhead_scheds.sh
  408. endif
  409. endif
  410. if STARPU_HAVE_WINDOWS
  411. check_PROGRAMS = $(myPROGRAMS)
  412. else
  413. check_PROGRAMS = $(LOADER) $(myPROGRAMS)
  414. endif
  415. noinst_PROGRAMS += $(myPROGRAMS)
  416. noinst_PROGRAMS += $(MICROBENCHS)
  417. if STARPU_SIMGRID
  418. SHELL_TESTS += $(MICROBENCHS:=.sh)
  419. endif
  420. if !STARPU_USE_MPI_MASTER_SLAVE
  421. SHELL_TESTS += \
  422. datawizard/locality.sh \
  423. microbenchs/bandwidth_scheds.sh \
  424. overlap/overlap.sh
  425. endif
  426. ################################
  427. # Simgrid Model Checking tests #
  428. ################################
  429. if STARPU_SIMGRID_MC
  430. SUBDIRS += model-checking
  431. endif
  432. #######################
  433. # Source files #
  434. #######################
  435. datawizard_acquire_release_SOURCES = \
  436. datawizard/acquire_release.c
  437. if STARPU_USE_CUDA
  438. datawizard_acquire_release_SOURCES += \
  439. datawizard/acquire_release_cuda.cu
  440. endif
  441. if STARPU_USE_OPENCL
  442. datawizard_acquire_release_SOURCES += \
  443. datawizard/acquire_release_opencl.c
  444. nobase_STARPU_OPENCL_DATA_DATA += \
  445. datawizard/acquire_release_opencl_kernel.cl
  446. endif
  447. datawizard_acquire_release2_SOURCES = \
  448. datawizard/acquire_release2.c
  449. if STARPU_USE_CUDA
  450. datawizard_acquire_release2_SOURCES += \
  451. datawizard/acquire_release_cuda.cu
  452. endif
  453. if STARPU_USE_OPENCL
  454. datawizard_acquire_release2_SOURCES += \
  455. datawizard/acquire_release_opencl.c
  456. endif
  457. datawizard_acquire_release_to_SOURCES = \
  458. datawizard/acquire_release_to.c
  459. if STARPU_USE_CUDA
  460. datawizard_acquire_release_to_SOURCES += \
  461. datawizard/acquire_release_cuda.cu
  462. endif
  463. if STARPU_USE_OPENCL
  464. datawizard_acquire_release_to_SOURCES += \
  465. datawizard/acquire_release_opencl.c
  466. endif
  467. datawizard_scratch_SOURCES = \
  468. datawizard/scratch.c
  469. if STARPU_USE_CUDA
  470. datawizard_scratch_SOURCES += \
  471. datawizard/scratch_cuda.cu
  472. endif
  473. if STARPU_USE_OPENCL
  474. datawizard_scratch_SOURCES += \
  475. datawizard/scratch_opencl.c
  476. nobase_STARPU_OPENCL_DATA_DATA += \
  477. datawizard/scratch_opencl_kernel.cl
  478. endif
  479. datawizard_mpi_like_SOURCES = \
  480. datawizard/mpi_like.c
  481. if STARPU_USE_CUDA
  482. datawizard_mpi_like_SOURCES += \
  483. datawizard/cuda_codelet_unsigned_inc.cu
  484. endif
  485. if STARPU_USE_OPENCL
  486. datawizard_mpi_like_SOURCES += \
  487. datawizard/opencl_codelet_unsigned_inc.c
  488. nobase_STARPU_OPENCL_DATA_DATA+= \
  489. datawizard/opencl_codelet_unsigned_inc_kernel.cl
  490. endif
  491. datawizard_mpi_like_async_SOURCES = \
  492. datawizard/mpi_like_async.c
  493. if STARPU_USE_CUDA
  494. datawizard_mpi_like_async_SOURCES += \
  495. datawizard/cuda_codelet_unsigned_inc.cu
  496. endif
  497. if STARPU_USE_OPENCL
  498. datawizard_mpi_like_async_SOURCES += \
  499. datawizard/opencl_codelet_unsigned_inc.c
  500. endif
  501. datawizard_sync_and_notify_data_SOURCES = \
  502. datawizard/sync_and_notify_data.c
  503. if STARPU_USE_CUDA
  504. datawizard_sync_and_notify_data_SOURCES += \
  505. datawizard/sync_and_notify_data_kernels.cu
  506. endif
  507. if STARPU_USE_OPENCL
  508. datawizard_sync_and_notify_data_SOURCES += \
  509. datawizard/sync_and_notify_data_opencl.c
  510. nobase_STARPU_OPENCL_DATA_DATA += \
  511. datawizard/sync_and_notify_data_opencl_codelet.cl
  512. endif
  513. datawizard_sync_and_notify_data_implicit_SOURCES = \
  514. datawizard/sync_and_notify_data_implicit.c
  515. if STARPU_USE_CUDA
  516. datawizard_sync_and_notify_data_implicit_SOURCES += \
  517. datawizard/sync_and_notify_data_kernels.cu
  518. endif
  519. if STARPU_USE_OPENCL
  520. datawizard_sync_and_notify_data_implicit_SOURCES += \
  521. datawizard/sync_and_notify_data_opencl.c
  522. endif
  523. datawizard_in_place_partition_SOURCES = \
  524. datawizard/in_place_partition.c \
  525. datawizard/scal.c
  526. if STARPU_USE_CUDA
  527. datawizard_in_place_partition_SOURCES += \
  528. datawizard/scal_cuda.cu
  529. endif
  530. if STARPU_USE_OPENCL
  531. datawizard_in_place_partition_SOURCES += \
  532. datawizard/scal_opencl.cl
  533. endif
  534. datawizard_partition_dep_SOURCES = \
  535. datawizard/partition_dep.c \
  536. datawizard/scal.c
  537. if STARPU_USE_CUDA
  538. datawizard_partition_dep_SOURCES += \
  539. datawizard/scal_cuda.cu
  540. endif
  541. if STARPU_USE_OPENCL
  542. datawizard_partition_dep_SOURCES += \
  543. datawizard/scal_opencl.cl
  544. endif
  545. datawizard_partition_lazy_SOURCES = \
  546. datawizard/partition_lazy.c \
  547. datawizard/scal.c
  548. if STARPU_USE_CUDA
  549. datawizard_partition_lazy_SOURCES += \
  550. datawizard/scal_cuda.cu
  551. endif
  552. if STARPU_USE_OPENCL
  553. datawizard_partition_lazy_SOURCES += \
  554. datawizard/scal_opencl.cl
  555. endif
  556. datawizard_gpu_register_SOURCES = \
  557. datawizard/gpu_register.c \
  558. datawizard/scal.c
  559. if STARPU_USE_CUDA
  560. datawizard_gpu_register_SOURCES += \
  561. datawizard/scal_cuda.cu
  562. endif
  563. if STARPU_USE_OPENCL
  564. datawizard_gpu_register_SOURCES += \
  565. datawizard/scal_opencl.cl
  566. endif
  567. datawizard_gpu_ptr_register_SOURCES = \
  568. datawizard/gpu_ptr_register.c \
  569. datawizard/scal.c
  570. if STARPU_USE_CUDA
  571. datawizard_gpu_ptr_register_SOURCES += \
  572. datawizard/scal_cuda.cu
  573. endif
  574. if STARPU_USE_OPENCL
  575. datawizard_gpu_ptr_register_SOURCES += \
  576. datawizard/scal_opencl.cl
  577. endif
  578. datawizard_wt_host_SOURCES = \
  579. datawizard/wt_host.c
  580. datawizard_wt_broadcast_SOURCES = \
  581. datawizard/wt_broadcast.c
  582. datawizard_specific_node_SOURCES = \
  583. datawizard/specific_node.c
  584. if STARPU_USE_CUDA
  585. datawizard_specific_node_SOURCES += \
  586. datawizard/cuda_codelet_unsigned_inc.cu
  587. endif
  588. if STARPU_USE_OPENCL
  589. datawizard_specific_node_SOURCES += \
  590. datawizard/opencl_codelet_unsigned_inc.c
  591. endif
  592. datawizard_test_arbiter_SOURCES = \
  593. datawizard/test_arbiter.cpp
  594. main_deprecated_func_CFLAGS = $(AM_CFLAGS) -Wno-deprecated-declarations
  595. main_insert_task_where_SOURCES = \
  596. main/insert_task_where.c
  597. if STARPU_USE_CUDA
  598. main_insert_task_where_SOURCES += \
  599. main/increment.cu
  600. endif
  601. main_subgraph_repeat_SOURCES = \
  602. main/subgraph_repeat.c \
  603. main/increment_codelet.c
  604. if STARPU_USE_CUDA
  605. main_subgraph_repeat_SOURCES += \
  606. main/increment.cu
  607. endif
  608. main_subgraph_repeat_tag_SOURCES = \
  609. main/subgraph_repeat_tag.c \
  610. main/increment_codelet.c
  611. if STARPU_USE_CUDA
  612. main_subgraph_repeat_tag_SOURCES += \
  613. main/increment.cu
  614. endif
  615. main_subgraph_repeat_regenerate_SOURCES = \
  616. main/subgraph_repeat_regenerate.c \
  617. main/increment_codelet.c
  618. if STARPU_USE_CUDA
  619. main_subgraph_repeat_regenerate_SOURCES += \
  620. main/increment.cu
  621. endif
  622. main_subgraph_repeat_regenerate_tag_SOURCES = \
  623. main/subgraph_repeat_regenerate_tag.c \
  624. main/increment_codelet.c
  625. if STARPU_USE_CUDA
  626. main_subgraph_repeat_regenerate_tag_SOURCES += \
  627. main/increment.cu
  628. endif
  629. main_subgraph_repeat_regenerate_tag_cycle_SOURCES = \
  630. main/subgraph_repeat_regenerate_tag_cycle.c \
  631. main/increment_codelet.c
  632. if STARPU_USE_CUDA
  633. main_subgraph_repeat_regenerate_tag_cycle_SOURCES += \
  634. main/increment.cu
  635. endif
  636. sched_ctx_sched_ctx_list_SOURCES = \
  637. sched_ctx/sched_ctx_list.c
  638. sched_ctx_sched_ctx_policy_data_SOURCES = \
  639. sched_ctx/sched_ctx_policy_data.c
  640. sched_ctx_sched_ctx_hierarchy_SOURCES = \
  641. sched_ctx/sched_ctx_hierarchy.c
  642. openmp_init_exit_01_SOURCES = \
  643. openmp/init_exit_01.c
  644. openmp_init_exit_02_SOURCES = \
  645. openmp/init_exit_02.c
  646. openmp_environment_SOURCES = \
  647. openmp/environment.c
  648. openmp_api_01_SOURCES = \
  649. openmp/api_01.c
  650. openmp_parallel_01_SOURCES = \
  651. openmp/parallel_01.c
  652. openmp_parallel_02_SOURCES = \
  653. openmp/parallel_02.c
  654. openmp_parallel_03_SOURCES = \
  655. openmp/parallel_03.c
  656. openmp_parallel_barrier_01_SOURCES = \
  657. openmp/parallel_barrier_01.c
  658. openmp_parallel_master_01_SOURCES = \
  659. openmp/parallel_master_01.c
  660. openmp_parallel_master_inline_01_SOURCES = \
  661. openmp/parallel_master_inline_01.c
  662. openmp_parallel_single_wait_01_SOURCES = \
  663. openmp/parallel_single_wait_01.c
  664. openmp_parallel_single_nowait_01_SOURCES = \
  665. openmp/parallel_single_nowait_01.c
  666. openmp_parallel_single_inline_01_SOURCES = \
  667. openmp/parallel_single_inline_01.c
  668. openmp_parallel_single_copyprivate_01_SOURCES = \
  669. openmp/parallel_single_copyprivate_01.c
  670. openmp_parallel_single_copyprivate_inline_01_SOURCES = \
  671. openmp/parallel_single_copyprivate_inline_01.c
  672. openmp_parallel_critical_01_SOURCES = \
  673. openmp/parallel_critical_01.c
  674. openmp_parallel_critical_inline_01_SOURCES = \
  675. openmp/parallel_critical_inline_01.c
  676. openmp_parallel_critical_named_01_SOURCES = \
  677. openmp/parallel_critical_named_01.c
  678. openmp_parallel_critical_named_inline_01_SOURCES = \
  679. openmp/parallel_critical_named_inline_01.c
  680. openmp_parallel_simple_lock_01_SOURCES = \
  681. openmp/parallel_simple_lock_01.c
  682. openmp_parallel_nested_lock_01_SOURCES = \
  683. openmp/parallel_nested_lock_01.c
  684. openmp_parallel_for_01_SOURCES = \
  685. openmp/parallel_for_01.c
  686. openmp_parallel_for_02_SOURCES = \
  687. openmp/parallel_for_02.c
  688. openmp_parallel_for_ordered_01_SOURCES = \
  689. openmp/parallel_for_ordered_01.c
  690. openmp_parallel_sections_01_SOURCES = \
  691. openmp/parallel_sections_01.c
  692. openmp_parallel_sections_combined_01_SOURCES = \
  693. openmp/parallel_sections_combined_01.c
  694. openmp_task_01_SOURCES = \
  695. openmp/task_01.c
  696. openmp_task_02_SOURCES = \
  697. openmp/task_02.c
  698. openmp_task_03_SOURCES = \
  699. openmp/task_03.c
  700. openmp_taskloop_SOURCES = \
  701. openmp/taskloop.c
  702. openmp_taskwait_01_SOURCES = \
  703. openmp/taskwait_01.c
  704. openmp_taskgroup_01_SOURCES = \
  705. openmp/taskgroup_01.c
  706. openmp_taskgroup_02_SOURCES = \
  707. openmp/taskgroup_02.c
  708. openmp_array_slice_01_SOURCES = \
  709. openmp/array_slice_01.c
  710. openmp_cuda_task_01_SOURCES = \
  711. openmp/cuda_task_01.c
  712. if STARPU_HAVE_FC
  713. fortran90_init_01_SOURCES = \
  714. fortran90/starpu_mod.f90 \
  715. fortran90/init_01.f90
  716. endif
  717. helper_starpu_data_dup_ro_SOURCES = \
  718. helper/starpu_data_dup_ro.c \
  719. main/increment_codelet.c
  720. if STARPU_USE_CUDA
  721. helper_starpu_data_dup_ro_SOURCES += \
  722. main/increment.cu
  723. endif
  724. ###################
  725. # Block interface #
  726. ###################
  727. datawizard_interfaces_block_block_interface_SOURCES= \
  728. datawizard/interfaces/test_interfaces.c \
  729. datawizard/interfaces/block/block_interface.c
  730. if STARPU_USE_CUDA
  731. datawizard_interfaces_block_block_interface_SOURCES+= \
  732. datawizard/interfaces/block/block_cuda.cu
  733. endif
  734. if STARPU_USE_OPENCL
  735. datawizard_interfaces_block_block_interface_SOURCES+= \
  736. datawizard/interfaces/block/block_opencl.c
  737. nobase_STARPU_OPENCL_DATA_DATA += \
  738. datawizard/interfaces/block/block_opencl_kernel.cl
  739. endif
####################
# Tensor interface #
####################
  743. datawizard_interfaces_tensor_tensor_interface_SOURCES= \
  744. datawizard/interfaces/test_interfaces.c \
  745. datawizard/interfaces/tensor/tensor_interface.c
  746. if STARPU_USE_CUDA
  747. datawizard_interfaces_tensor_tensor_interface_SOURCES+= \
  748. datawizard/interfaces/tensor/tensor_cuda.cu
  749. endif
  750. if STARPU_USE_OPENCL
  751. datawizard_interfaces_tensor_tensor_interface_SOURCES+= \
  752. datawizard/interfaces/tensor/tensor_opencl.c
  753. nobase_STARPU_OPENCL_DATA_DATA += \
  754. datawizard/interfaces/tensor/tensor_opencl_kernel.cl
  755. endif
##################
# BCSR interface #
##################
  759. datawizard_interfaces_bcsr_bcsr_interface_SOURCES= \
  760. datawizard/interfaces/test_interfaces.c \
  761. datawizard/interfaces/bcsr/bcsr_interface.c
  762. if STARPU_USE_CUDA
  763. datawizard_interfaces_bcsr_bcsr_interface_SOURCES+= \
  764. datawizard/interfaces/bcsr/bcsr_cuda.cu
  765. endif
  766. if STARPU_USE_OPENCL
  767. datawizard_interfaces_bcsr_bcsr_interface_SOURCES+= \
  768. datawizard/interfaces/bcsr/bcsr_opencl.c
  769. nobase_STARPU_OPENCL_DATA_DATA += \
  770. datawizard/interfaces/bcsr/bcsr_opencl_kernel.cl
  771. endif
  772. #################
  773. # COO interface #
  774. #################
  775. datawizard_interfaces_coo_coo_interface_SOURCES= \
  776. datawizard/interfaces/test_interfaces.c \
  777. datawizard/interfaces/coo/coo_interface.c
  778. if STARPU_USE_CUDA
  779. datawizard_interfaces_coo_coo_interface_SOURCES+= \
  780. datawizard/interfaces/coo/coo_cuda.cu
  781. endif
  782. if STARPU_USE_OPENCL
  783. datawizard_interfaces_coo_coo_interface_SOURCES+= \
  784. datawizard/interfaces/coo/coo_opencl.c
  785. nobase_STARPU_OPENCL_DATA_DATA += \
  786. datawizard/interfaces/coo/coo_opencl_kernel.cl
  787. endif
  788. #################
  789. # CSR interface #
  790. #################
  791. datawizard_interfaces_csr_csr_interface_SOURCES= \
  792. datawizard/interfaces/test_interfaces.c \
  793. datawizard/interfaces/csr/csr_interface.c
  794. if STARPU_USE_CUDA
  795. datawizard_interfaces_csr_csr_interface_SOURCES+= \
  796. datawizard/interfaces/csr/csr_cuda.cu
  797. endif
  798. if STARPU_USE_OPENCL
  799. datawizard_interfaces_csr_csr_interface_SOURCES+= \
  800. datawizard/interfaces/csr/csr_opencl.c
  801. nobase_STARPU_OPENCL_DATA_DATA += \
  802. datawizard/interfaces/csr/csr_opencl_kernel.cl
  803. endif
  804. datawizard_interfaces_vector_vector_interface_SOURCES = \
  805. datawizard/interfaces/vector/vector_interface.c \
  806. datawizard/interfaces/test_interfaces.c
  807. if STARPU_USE_CUDA
  808. datawizard_interfaces_vector_vector_interface_SOURCES += \
  809. datawizard/interfaces/vector/vector_cuda.cu
  810. endif
  811. if STARPU_USE_OPENCL
  812. datawizard_interfaces_vector_vector_interface_SOURCES += \
  813. datawizard/interfaces/vector/vector_opencl.c
  814. nobase_STARPU_OPENCL_DATA_DATA += \
  815. datawizard/interfaces/vector/vector_opencl_kernel.cl
  816. endif
  817. ####################
  818. # Matrix interface #
  819. ####################
  820. datawizard_interfaces_matrix_matrix_interface_SOURCES= \
  821. datawizard/interfaces/test_interfaces.c \
  822. datawizard/interfaces/matrix/matrix_interface.c
  823. if STARPU_USE_CUDA
  824. datawizard_interfaces_matrix_matrix_interface_SOURCES+= \
  825. datawizard/interfaces/matrix/matrix_cuda.cu
  826. endif
  827. if STARPU_USE_OPENCL
  828. datawizard_interfaces_matrix_matrix_interface_SOURCES+= \
  829. datawizard/interfaces/matrix/matrix_opencl.c
  830. nobase_STARPU_OPENCL_DATA_DATA+= \
  831. datawizard/interfaces/matrix/matrix_opencl_kernel.cl
  832. endif
  833. #########################
  834. # Multiformat interface #
  835. #########################
  836. datawizard_interfaces_multiformat_multiformat_interface_SOURCES = \
  837. datawizard/interfaces/test_interfaces.c \
  838. datawizard/interfaces/multiformat/multiformat_interface.c \
  839. datawizard/interfaces/multiformat/multiformat_conversion_codelets.c
  840. if STARPU_USE_CUDA
  841. datawizard_interfaces_multiformat_multiformat_interface_SOURCES+= \
  842. datawizard/interfaces/multiformat/multiformat_cuda.cu \
  843. datawizard/interfaces/multiformat/multiformat_conversion_codelets_cuda.cu
  844. endif
  845. if STARPU_USE_OPENCL
  846. datawizard_interfaces_multiformat_multiformat_interface_SOURCES+= \
  847. datawizard/interfaces/multiformat/multiformat_opencl.c \
  848. datawizard/interfaces/multiformat/multiformat_conversion_codelets_opencl.c
  849. nobase_STARPU_OPENCL_DATA_DATA += \
  850. datawizard/interfaces/multiformat/multiformat_opencl_kernel.cl \
  851. datawizard/interfaces/multiformat/multiformat_conversion_codelets_kernel.cl
  852. endif
  853. datawizard_interfaces_multiformat_advanced_multiformat_cuda_opencl_SOURCES=\
  854. datawizard/interfaces/multiformat/advanced/generic.c \
  855. datawizard/interfaces/multiformat/advanced/multiformat_cuda_opencl.c
  856. datawizard_interfaces_multiformat_advanced_multiformat_data_release_SOURCES = \
  857. datawizard/interfaces/multiformat/advanced/generic.c \
  858. datawizard/interfaces/multiformat/advanced/multiformat_data_release.c
  859. datawizard_interfaces_multiformat_advanced_multiformat_worker_SOURCES=\
  860. datawizard/interfaces/multiformat/advanced/generic.c \
  861. datawizard/interfaces/multiformat/advanced/multiformat_worker.c
  862. datawizard_interfaces_multiformat_advanced_multiformat_handle_conversion_SOURCES = \
  863. datawizard/interfaces/multiformat/advanced/generic.c \
  864. datawizard/interfaces/multiformat/advanced/multiformat_handle_conversion.c
  865. datawizard_interfaces_multiformat_advanced_same_handle_SOURCES= \
  866. datawizard/interfaces/multiformat/advanced/generic.c \
  867. datawizard/interfaces/multiformat/advanced/same_handle.c
  868. datawizard_interfaces_variable_variable_interface_SOURCES= \
  869. datawizard/interfaces/test_interfaces.c \
  870. datawizard/interfaces/variable/variable_interface.c
  871. if STARPU_USE_CUDA
  872. datawizard_interfaces_variable_variable_interface_SOURCES+= \
  873. datawizard/interfaces/variable/variable_cuda.cu
  874. endif
  875. if STARPU_USE_OPENCL
  876. datawizard_interfaces_variable_variable_interface_SOURCES+= \
  877. datawizard/interfaces/variable/variable_opencl.c
  878. nobase_STARPU_OPENCL_DATA_DATA += \
  879. datawizard/interfaces/variable/variable_opencl_kernel.cl
  880. endif
  881. ##################
  882. # Void interface #
  883. ##################
  884. datawizard_interfaces_void_void_interface_SOURCES=\
  885. datawizard/interfaces/test_interfaces.c \
  886. datawizard/interfaces/void/void_interface.c
  887. overlap_gpu_concurrency_SOURCES=\
  888. overlap/gpu_concurrency.c
  889. if STARPU_USE_CUDA
  890. overlap_gpu_concurrency_SOURCES+=\
  891. overlap/long_kernel.cu
  892. endif
  893. perfmodels_regression_based_memset_SOURCES=\
  894. perfmodels/regression_based_memset.c
  895. perfmodels_regression_based_check_SOURCES=\
  896. perfmodels/regression_based_check.c
  897. perfmodels_regression_based_multiimpl_SOURCES=\
  898. perfmodels/regression_based_multiimpl.c
  899. perfmodels_regression_based_energy_SOURCES=\
  900. perfmodels/regression_based_energy.c
  901. perfmodels_regression_based_gpu_SOURCES=\
  902. perfmodels/regression_based_gpu.c
  903. fpga_max_fpga_SOURCES=\
  904. fpga/max_fpga.c
  905. fpga_max_fpga_LDADD = $(LDADD) \
  906. fpga/slic_MyTasks.o
  907. fpga/max_fpga.o: fpga/MyTasks.max
  908. if STARPU_USE_OPENCL
  909. perfmodels_regression_based_memset_SOURCES+=\
  910. perfmodels/opencl_memset.c
  911. perfmodels_regression_based_gpu_SOURCES+=\
  912. perfmodels/opencl_memset.c
  913. nobase_STARPU_OPENCL_DATA_DATA += \
  914. perfmodels/opencl_memset_kernel.cl
  915. endif
  916. perfmodels_non_linear_regression_based_SOURCES=\
  917. perfmodels/non_linear_regression_based.c
  918. if STARPU_USE_OPENCL
  919. perfmodels_non_linear_regression_based_SOURCES+=\
  920. perfmodels/opencl_memset.c
  921. endif
  922. perfmodels_feed_SOURCES=\
  923. perfmodels/feed.c
  924. sched_policies_execute_all_tasks_LDFLAGS = $(AM_LDFLAGS) -lm
  925. # Fortran90 tests
  926. # - link over source file to build our own object
  927. fortran90/starpu_mod.f90:
  928. @$(MKDIR_P) $(dir $@)
  929. $(V_ln) $(LN_S) $(abs_top_srcdir)/include/$(notdir $@) $@
  930. if STARPU_HAVE_FC
  931. # - express the creation of .mod along .o
  932. starpu_mod.mod: fortran90/starpu_mod.o
  933. # - list explicit dependences to control proper module files dependencies
  934. fortran90/init_01.o: starpu_mod.mod
  935. endif
  936. # Maxeler compiler
  937. if STARPU_USE_FPGA
  938. MAX_TARGET = DFE_SIM
  939. MAX_DFE = MAX5C_$(MAX_TARGET)
  940. MAXJ=$(wildcard fpga/*.maxj)
  941. CLASS=$(MAXJ:.maxj=.class)
  942. $(CLASS) &: $(MAXJ)
  943. maxjc -1.7 -cp $$MAXCLASSPATH $(dir $<)
  944. %.max: %Manager.class
  945. java -XX:+UseSerialGC -Xmx2048m -cp $$MAXCLASSPATH:. $(shell dirname $*).$(notdir $*)Manager DFEModel=MAIA maxFileName=$(notdir $*) target=$(MAX_TARGET)
  946. cp $(notdir $*)_$(MAX_DFE)/results/$(notdir $*).{max,h} $(dir $@)
  947. slic_%.o: %.max
  948. sliccompile $< $@
  949. CLEANFILES += */*.max */*.class fpga/*.h
  950. endif