123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236 |
- /* StarPU --- Runtime system for heterogeneous multicore architectures.
- *
- * Copyright (C) 2015-2021 Université de Bordeaux, CNRS (LaBRI UMR 5800), Inria
- *
- * StarPU is free software; you can redistribute it and/or modify
- * it under the terms of the GNU Lesser General Public License as published by
- * the Free Software Foundation; either version 2.1 of the License, or (at
- * your option) any later version.
- *
- * StarPU is distributed in the hope that it will be useful, but
- * WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
- *
- * See the GNU Lesser General Public License in COPYING.LGPL for more details.
- */
- /*
- * This is an example making use of the heteroprio scheduler, it shows how
- * priorities are taken into account.
- */
- #include <starpu.h>
- #include <schedulers/starpu_heteroprio.h>
- #include <unistd.h>
- #define FPRINTF(ofile, fmt, ...) do { if (!getenv("STARPU_SSILENT")) {fprintf(ofile, fmt, ## __VA_ARGS__); }} while(0)
- void initSchedulerCallback(unsigned sched_ctx)
- {
- // CPU uses 3 buckets
- #ifdef STARPU_USE_CPU
- if (starpu_cpu_worker_get_count())
- {
- starpu_heteroprio_set_nb_prios(0, STARPU_CPU_WORKER, 3);
- // It uses direct mapping idx => idx
- unsigned idx;
- for(idx = 0; idx < 3; ++idx)
- {
- starpu_heteroprio_set_mapping(sched_ctx, STARPU_CPU_WORKER, idx, idx);
- starpu_heteroprio_set_faster_arch(sched_ctx, STARPU_CPU_WORKER, idx);
- }
- }
- #endif
- #ifdef STARPU_USE_OPENCL
- // OpenCL is enabled and uses 2 buckets
- starpu_heteroprio_set_nb_prios(sched_ctx, STARPU_OPENCL_WORKER, 2);
- // OpenCL will first look to priority 2
- int prio2 = starpu_cpu_worker_get_count() ? 2 : 1;
- starpu_heteroprio_set_mapping(sched_ctx, STARPU_OPENCL_WORKER, 0, prio2);
- // For this bucket OpenCL is the fastest
- starpu_heteroprio_set_faster_arch(sched_ctx, STARPU_OPENCL_WORKER, prio2);
- // And CPU is 4 times slower
- #ifdef STARPU_USE_CPU
- starpu_heteroprio_set_arch_slow_factor(sched_ctx, STARPU_CPU_WORKER, 2, 4.0f);
- #endif
- int prio1 = starpu_cpu_worker_get_count() ? 1 : 0;
- starpu_heteroprio_set_mapping(sched_ctx, STARPU_OPENCL_WORKER, 1, prio1);
- // We let the CPU as the fastest and tell that OpenCL is 1.7 times slower
- starpu_heteroprio_set_arch_slow_factor(sched_ctx, STARPU_OPENCL_WORKER, prio1, 1.7f);
- #endif
- }
- void callback_a_cpu(void *buffers[], void *cl_arg)
- {
- (void)buffers;
- (void)cl_arg;
- usleep(100000);
- FPRINTF(stderr, "[COMMUTE_LOG] callback %s\n", __FUNCTION__); fflush(stderr);
- }
- void callback_b_cpu(void *buffers[], void *cl_arg)
- {
- (void)buffers;
- (void)cl_arg;
- usleep(100000);
- FPRINTF(stderr, "[COMMUTE_LOG] callback %s\n", __FUNCTION__); fflush(stderr);
- }
- void callback_c_cpu(void *buffers[], void *cl_arg)
- {
- (void)buffers;
- (void)cl_arg;
- usleep(100000);
- FPRINTF(stderr, "[COMMUTE_LOG] callback %s\n", __FUNCTION__); fflush(stderr);
- }
- #ifdef STARPU_USE_OPENCL
- void callback_a_opencl(void *buffers[], void *cl_arg)
- {
- (void)buffers;
- (void)cl_arg;
- usleep(100000);
- FPRINTF(stderr, "[COMMUTE_LOG] callback %s\n", __FUNCTION__); fflush(stderr);
- }
- void callback_b_opencl(void *buffers[], void *cl_arg)
- {
- (void)buffers;
- (void)cl_arg;
- usleep(100000);
- FPRINTF(stderr, "[COMMUTE_LOG] callback %s\n", __FUNCTION__); fflush(stderr);
- }
- void callback_c_opencl(void *buffers[], void *cl_arg)
- {
- (void)buffers;
- (void)cl_arg;
- usleep(100000);
- FPRINTF(stderr, "[COMMUTE_LOG] callback %s\n", __FUNCTION__); fflush(stderr);
- }
- #endif
- int main(void)
- {
- int ret;
- struct starpu_conf conf;
- int ncpus, nopencls;
- ret = starpu_conf_init(&conf);
- STARPU_CHECK_RETURN_VALUE(ret, "starpu_conf_init");
- assert(ret == 0);
- conf.sched_policy_name = "heteroprio";
- conf.sched_policy_callback = &initSchedulerCallback;
- ret = starpu_init(&conf);
- if (ret == -ENODEV)
- return 77;
- ncpus = starpu_cpu_worker_get_count();
- nopencls = starpu_opencl_worker_get_count();
- FPRINTF(stderr, "Worker = %u\n", starpu_worker_get_count());
- FPRINTF(stderr, "Worker CPU = %d\n", ncpus);
- FPRINTF(stderr, "Worker OpenCL = %d\n", nopencls);
- if (ncpus + nopencls == 0)
- {
- FPRINTF(stderr, "Needs at least one CPU or OpenCL device\n");
- starpu_shutdown();
- return 77;
- }
- struct starpu_codelet codeleteA;
- {
- memset(&codeleteA, 0, sizeof(codeleteA));
- codeleteA.nbuffers = 2;
- codeleteA.modes[0] = STARPU_RW;
- codeleteA.modes[1] = STARPU_RW;
- codeleteA.name = "codeleteA";
- #ifdef STARPU_USE_CPU
- codeleteA.cpu_funcs[0] = callback_a_cpu;
- #endif
- #ifdef STARPU_USE_OPENCL
- codeleteA.opencl_funcs[0] = callback_a_opencl;
- #endif
- }
- struct starpu_codelet codeleteB;
- {
- memset(&codeleteB, 0, sizeof(codeleteB));
- codeleteB.nbuffers = 2;
- codeleteB.modes[0] = STARPU_RW;
- codeleteB.modes[1] = STARPU_RW;
- codeleteB.name = "codeleteB";
- codeleteB.cpu_funcs[0] = callback_b_cpu;
- #ifdef STARPU_USE_OPENCL
- codeleteB.opencl_funcs[0] = callback_b_opencl;
- #endif
- }
- struct starpu_codelet codeleteC;
- {
- memset(&codeleteC, 0, sizeof(codeleteC));
- codeleteC.nbuffers = 2;
- codeleteC.modes[0] = STARPU_RW;
- codeleteC.modes[1] = STARPU_RW;
- codeleteC.name = "codeleteC";
- codeleteC.cpu_funcs[0] = callback_c_cpu;
- #ifdef STARPU_USE_OPENCL
- codeleteC.opencl_funcs[0] = callback_c_opencl;
- #endif
- }
- const int nbHandles = 10;
- FPRINTF(stderr, "Nb handles = %d\n", nbHandles);
- starpu_data_handle_t handles[nbHandles];
- memset(handles, 0, sizeof(handles[0])*nbHandles);
- int dataA[nbHandles];
- int idx;
- for(idx = 0; idx < nbHandles; ++idx)
- {
- dataA[idx] = idx;
- }
- int idxHandle;
- for(idxHandle = 0; idxHandle < nbHandles; ++idxHandle)
- {
- starpu_variable_data_register(&handles[idxHandle], 0, (uintptr_t)&dataA[idxHandle], sizeof(dataA[idxHandle]));
- }
- const int nbTasks = 4;
- FPRINTF(stderr, "Submit %d tasks \n", nbTasks);
- int prio2 = starpu_cpu_worker_get_count() ? 2 : 1;
- int idxTask;
- for(idxTask = 0; idxTask < nbTasks; ++idxTask)
- {
- starpu_insert_task(&codeleteA,
- STARPU_PRIORITY, 0,
- (STARPU_RW), handles[(idxTask*2)%nbHandles],
- (STARPU_RW), handles[(idxTask*3+1)%nbHandles],
- 0);
- starpu_insert_task(&codeleteB,
- STARPU_PRIORITY, 1,
- (STARPU_RW), handles[(idxTask*2 +1 )%nbHandles],
- (STARPU_RW), handles[(idxTask*2)%nbHandles],
- 0);
- starpu_insert_task(&codeleteC,
- STARPU_PRIORITY, prio2,
- (STARPU_RW), handles[(idxTask)%nbHandles],
- (STARPU_RW), handles[(idxTask*idxTask)%nbHandles],
- 0);
- }
- FPRINTF(stderr, "Wait task\n");
- starpu_task_wait_for_all();
- FPRINTF(stderr, "Release data\n");
- for(idxHandle = 0 ; idxHandle < nbHandles ; ++idxHandle)
- {
- starpu_data_unregister(handles[idxHandle]);
- }
- FPRINTF(stderr, "Shutdown\n");
- starpu_shutdown();
- return 0;
- }
|