123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356 |
- /* StarPU --- Runtime system for heterogeneous multicore architectures.
- *
- * Copyright (C) 2011 INRIA
- * Copyright (C) 2011 Centre National de la Recherche Scientifique
- *
- * StarPU is free software; you can redistribute it and/or modify
- * it under the terms of the GNU Lesser General Public License as published by
- * the Free Software Foundation; either version 2.1 of the License, or (at
- * your option) any later version.
- *
- * StarPU is distributed in the hope that it will be useful, but
- * WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
- *
- * See the GNU Lesser General Public License in COPYING.LGPL for more details.
- */
- #include <starpu.h>
- #include "../helper.h"
/* Number of ints in each vector registered by the tests. */
#define NX 4

/* Set to 1 to trace codelet entry, run tasks synchronously and print stats. */
#define DEBUG 0

#if !DEBUG
#define SYNCHRONOUS 0
#define ENTER()
#else
#define SYNCHRONOUS 1 /* Easier to debug with synchronous tasks */
#define ENTER() do { FPRINTF(stderr, "Entering %s\n", __func__); } while (0)
#endif
/*
 * Call counters: every codelet implementation in this file increments the
 * field that matches it, and the tests compare the totals afterwards.
 * The accelerator fields only exist when the matching backend is compiled in.
 */
struct stats
{
	unsigned cpu;
#ifdef STARPU_USE_CUDA
	unsigned cuda;
	unsigned cpu_to_cuda;
	unsigned cuda_to_cpu;
#endif
#ifdef STARPU_USE_OPENCL
	unsigned opencl;
	unsigned cpu_to_opencl;
	unsigned opencl_to_cpu;
#endif
};

/* Single shared instance; each test zeroes it before submitting tasks. */
struct stats global_stats;
- /* "Fake" conversion codelets */
#ifdef STARPU_USE_CUDA
/* Stand-in for the CPU -> CUDA conversion: it only records that it ran. */
static void cpu_to_cuda_func(void *buffers[], void *args)
{
	(void)buffers;
	(void)args;

	ENTER();
	global_stats.cpu_to_cuda += 1;
}

/* Stand-in for the CUDA -> CPU conversion: it only records that it ran. */
static void cuda_to_cpu_func(void *buffers[], void *args)
{
	(void)buffers;
	(void)args;

	ENTER();
	global_stats.cuda_to_cpu += 1;
}

/* CPU -> CUDA conversion codelet; restricted to CUDA workers. */
struct starpu_codelet cpu_to_cuda_cl =
{
	.nbuffers = 1,
	.cuda_funcs = {cpu_to_cuda_func, NULL},
	.where = STARPU_CUDA
};

/* CUDA -> CPU conversion codelet; restricted to CPU workers. */
struct starpu_codelet cuda_to_cpu_cl =
{
	.nbuffers = 1,
	.cpu_funcs = {cuda_to_cpu_func, NULL},
	.where = STARPU_CPU
};
#endif /* STARPU_USE_CUDA */
#ifdef STARPU_USE_OPENCL
/* Stand-in for the CPU -> OpenCL conversion: it only records that it ran. */
static void cpu_to_opencl_func(void *buffers[], void *args)
{
	(void)buffers;
	(void)args;

	ENTER();
	global_stats.cpu_to_opencl += 1;
}

/* Stand-in for the OpenCL -> CPU conversion: it only records that it ran. */
static void opencl_to_cpu_func(void *buffers[], void *args)
{
	(void)buffers;
	(void)args;

	ENTER();
	global_stats.opencl_to_cpu += 1;
}

/* CPU -> OpenCL conversion codelet; restricted to OpenCL workers. */
struct starpu_codelet cpu_to_opencl_cl =
{
	.nbuffers = 1,
	.opencl_funcs = {cpu_to_opencl_func, NULL},
	.where = STARPU_OPENCL
};

/* OpenCL -> CPU conversion codelet; restricted to CPU workers. */
struct starpu_codelet opencl_to_cpu_cl =
{
	.nbuffers = 1,
	.cpu_funcs = {opencl_to_cpu_func, NULL},
	.where = STARPU_CPU
};
#endif /* STARPU_USE_OPENCL */
- static struct starpu_multiformat_data_interface_ops ops =
- {
- #ifdef STARPU_USE_CUDA
- .cuda_elemsize = sizeof(int),
- .cpu_to_cuda_cl = &cpu_to_cuda_cl,
- .cuda_to_cpu_cl = &cuda_to_cpu_cl,
- #endif
- #ifdef STARPU_USE_OPENCL
- .opencl_elemsize = sizeof(int),
- .cpu_to_opencl_cl = &cpu_to_opencl_cl,
- .opencl_to_cpu_cl = &opencl_to_cpu_cl,
- #endif
- .cpu_elemsize = sizeof(int)
- };
- static void cpu_func(void *buffers[], void *args)
- {
- ENTER();
- global_stats.cpu++;
- }
#ifdef STARPU_USE_CUDA
/* CUDA implementation of the test codelets: counts the call, touches no data. */
static void cuda_func(void *buffers[], void *args)
{
	(void)buffers;
	(void)args;

	ENTER();
	global_stats.cuda += 1;
}
#endif /* STARPU_USE_CUDA */
#ifdef STARPU_USE_OPENCL
/* OpenCL implementation of the test codelets: counts the call, touches no data. */
static void opencl_func(void *buffers[], void *args)
{
	(void)buffers;
	(void)args;

	ENTER();
	global_stats.opencl += 1;
}
#endif /* STARPU_USE_OPENCL */
- static void
- create_and_submit_tasks(int where, starpu_data_handle_t handles[])
- {
- FPRINTF(stderr, "***** Starting Task 1\n");
- static struct starpu_codelet cl =
- {
- .modes = { STARPU_RW },
- #ifdef STARPU_USE_CUDA
- .cuda_funcs = {cuda_func, NULL},
- #endif
- #if STARPU_USE_OPENCL
- .opencl_funcs = {opencl_func, NULL},
- #endif
- .nbuffers = 1
- };
- cl.where = where;
- struct starpu_task *task = starpu_task_create();
- task->synchronous = SYNCHRONOUS;
- task->cl = &cl;
- task->handles[0] = handles[0];
- starpu_task_submit(task);
- FPRINTF(stderr, "***** Starting Task 2\n");
- static struct starpu_codelet cl2 =
- {
- .modes = { STARPU_RW },
- .where = STARPU_CPU,
- .cpu_funcs = {cpu_func, NULL},
- .nbuffers = 1
- };
- struct starpu_task *task2 = starpu_task_create();
- task2->synchronous = SYNCHRONOUS;
- task2->cl = &cl2;
- task2->handles[0] = handles[1];
- starpu_task_submit(task2);
- FPRINTF(stderr, "***** Starting Task 3\n");
- static struct starpu_codelet cl3 =
- {
- .modes = { STARPU_RW, STARPU_RW },
- .cpu_funcs = {cpu_func, NULL},
- #ifdef STARPU_USE_CUDA
- .cuda_funcs = {cuda_func, NULL},
- #endif
- #ifdef STARPU_USE_OPENCL
- .opencl_funcs = {opencl_func, NULL},
- #endif
- .nbuffers = 2
- };
- cl3.where = where;
- struct starpu_task *task3 = starpu_task_create();
- task3->synchronous = SYNCHRONOUS;
- task3->cl = &cl3;
- task3->handles[0] = handles[0];
- task3->handles[1] = handles[1];
- starpu_task_submit(task3);
- starpu_task_wait_for_all();
- FPRINTF(stderr, "***** End of all tasks\n");
- return;
- }
#if DEBUG
/*
 * Print every counter of `s` to stderr (debug builds only).
 *
 *   s - counters to print; must not be NULL.
 *
 * The fields are unsigned int, so they are printed with %u.
 */
static void
print_stats(struct stats *s)
{
	FPRINTF(stderr, "cpu         : %u\n", s->cpu);
#ifdef STARPU_USE_CUDA
	FPRINTF(stderr, "cuda        : %u\n"
			"cpu->cuda   : %u\n"
			"cuda->cpu   : %u\n",
			s->cuda,
			s->cpu_to_cuda,
			s->cuda_to_cpu);
#endif
#ifdef STARPU_USE_OPENCL
	FPRINTF(stderr, "opencl      : %u\n"
			"cpu->opencl : %u\n"
			"opencl->cpu : %u\n",
			s->opencl,
			s->cpu_to_opencl,
			s->opencl_to_cpu);
#endif
}
#endif /* DEBUG */
/* XXX test_cuda() and test_opencl() are near-identical copies of each other. */
#ifdef STARPU_USE_CUDA
/*
 * Run the three-task scenario with CUDA as the accelerator.
 *
 * Returns 0 when the counters show exactly one CPU call, two CUDA calls and
 * two conversions in each direction; returns 1 otherwise.
 */
static int
test_cuda(void)
{
	int first[NX];
	int second[NX];
	starpu_data_handle_t handles[2];
	int idx;

	for (idx = 0; idx < NX; idx++)
		first[idx] = second[idx] = idx;

	starpu_multiformat_data_register(&handles[0], 0, first, NX, &ops);
	starpu_multiformat_data_register(&handles[1], 0, second, NX, &ops);

	/* Start from clean counters so an earlier test cannot skew the check. */
	memset(&global_stats, 0, sizeof(global_stats));
	create_and_submit_tasks(STARPU_CUDA, handles);

	starpu_data_unregister(handles[0]);
	starpu_data_unregister(handles[1]);

#if DEBUG
	print_stats(&global_stats);
#endif

	return global_stats.cpu != 1 ||
	       global_stats.cpu_to_cuda != 2 ||
	       global_stats.cuda_to_cpu != 2 ||
	       global_stats.cuda != 2;
}
#endif /* STARPU_USE_CUDA */
#ifdef STARPU_USE_OPENCL
/*
 * Run the three-task scenario with OpenCL as the accelerator.
 *
 * Returns 0 when the counters show exactly one CPU call, two OpenCL calls
 * and two conversions in each direction; returns 1 otherwise.
 */
static int
test_opencl(void)
{
	int first[NX];
	int second[NX];
	starpu_data_handle_t handles[2];
	int idx;

	for (idx = 0; idx < NX; idx++)
		first[idx] = second[idx] = idx;

	starpu_multiformat_data_register(&handles[0], 0, first, NX, &ops);
	starpu_multiformat_data_register(&handles[1], 0, second, NX, &ops);

	/* Start from clean counters so an earlier test cannot skew the check. */
	memset(&global_stats, 0, sizeof(global_stats));
	create_and_submit_tasks(STARPU_OPENCL, handles);

	starpu_data_unregister(handles[0]);
	starpu_data_unregister(handles[1]);

#if DEBUG
	print_stats(&global_stats);
#endif

	return global_stats.cpu != 1 ||
	       global_stats.cpu_to_opencl != 2 ||
	       global_stats.opencl_to_cpu != 2 ||
	       global_stats.opencl != 2;
}
#endif /* STARPU_USE_OPENCL */
- int
- main(void)
- {
- #ifdef STARPU_USE_CPU
- int ret;
- struct starpu_conf conf =
- {
- .ncpus = -1,
- .ncuda = 2,
- .nopencl = 1
- };
- ret = starpu_init(&conf);
- STARPU_CHECK_RETURN_VALUE(ret, "starpu_init");
- unsigned int ncuda = starpu_cuda_worker_get_count();
- unsigned int nopencl = starpu_opencl_worker_get_count();
- #ifdef STARPU_USE_OPENCL
- if (nopencl > 0 && test_opencl() != 0)
- {
- FPRINTF(stderr, "OPENCL FAILED\n");
- return EXIT_FAILURE;
- }
- #endif
- #ifdef STARPU_USE_CUDA
- if (ncuda > 0 && test_cuda() != 0)
- {
- FPRINTF(stderr, "CUDA FAILED \n");
- return EXIT_FAILURE;
- }
- #endif
- starpu_shutdown();
- if (ncuda == 0 && nopencl == 0)
- return STARPU_TEST_SKIPPED;
- else
- return EXIT_SUCCESS;
- #else /* !STARPU_USE_CPU */
- /* Without the CPU, there is no point in using the multiformat
- * interface, so this test is pointless. */
- return STARPU_TEST_SKIPPED;
- #endif
- }
|