heteroprio_test.c 6.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237
  1. /* StarPU --- Runtime system for heterogeneous multicore architectures.
  2. *
  3. * Copyright (C) 2015 INRIA
  4. * Copyright (C) 2016, 2017 CNRS
  5. *
  6. * StarPU is free software; you can redistribute it and/or modify
  7. * it under the terms of the GNU Lesser General Public License as published by
  8. * the Free Software Foundation; either version 2.1 of the License, or (at
  9. * your option) any later version.
  10. *
  11. * StarPU is distributed in the hope that it will be useful, but
  12. * WITHOUT ANY WARRANTY; without even the implied warranty of
  13. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
  14. *
  15. * See the GNU Lesser General Public License in COPYING.LGPL for more details.
  16. */
  17. /*
  18. * This is an example making use of the heteroprio scheduler, it shows how
  19. * priorities are taken into account.
  20. */
  21. #include <starpu.h>
  22. #include <schedulers/starpu_heteroprio.h>
  23. #include <unistd.h>
  24. #define FPRINTF(ofile, fmt, ...) do { if (!getenv("STARPU_SSILENT")) {fprintf(ofile, fmt, ## __VA_ARGS__); }} while(0)
  25. void initSchedulerCallback(unsigned sched_ctx)
  26. {
  27. // CPU uses 3 buckets
  28. #ifdef STARPU_USE_CPU
  29. if (starpu_cpu_worker_get_count())
  30. {
  31. starpu_heteroprio_set_nb_prios(0, STARPU_CPU_IDX, 3);
  32. // It uses direct mapping idx => idx
  33. unsigned idx;
  34. for(idx = 0; idx < 3; ++idx)
  35. {
  36. starpu_heteroprio_set_mapping(sched_ctx, STARPU_CPU_IDX, idx, idx);
  37. starpu_heteroprio_set_faster_arch(sched_ctx, STARPU_CPU_IDX, idx);
  38. }
  39. }
  40. #endif
  41. #ifdef STARPU_USE_OPENCL
  42. // OpenCL is enabled and uses 2 buckets
  43. starpu_heteroprio_set_nb_prios(sched_ctx, STARPU_OPENCL_IDX, 2);
  44. // OpenCL will first look to priority 2
  45. int prio2 = starpu_cpu_worker_get_count() ? 2 : 1;
  46. starpu_heteroprio_set_mapping(sched_ctx, STARPU_OPENCL_IDX, 0, prio2);
  47. // For this bucket OpenCL is the fastest
  48. starpu_heteroprio_set_faster_arch(sched_ctx, STARPU_OPENCL_IDX, prio2);
  49. // And CPU is 4 times slower
  50. #ifdef STARPU_USE_CPU
  51. starpu_heteroprio_set_arch_slow_factor(sched_ctx, STARPU_CPU_IDX, 2, 4.0f);
  52. #endif
  53. int prio1 = starpu_cpu_worker_get_count() ? 1 : 0;
  54. starpu_heteroprio_set_mapping(sched_ctx, STARPU_OPENCL_IDX, 1, prio1);
  55. // We let the CPU as the fastest and tell that OpenCL is 1.7 times slower
  56. starpu_heteroprio_set_arch_slow_factor(sched_ctx, STARPU_OPENCL_IDX, prio1, 1.7f);
  57. #endif
  58. }
  59. void callback_a_cpu(void *buffers[], void *cl_arg)
  60. {
  61. (void)buffers;
  62. (void)cl_arg;
  63. usleep(100000);
  64. FPRINTF(stderr, "[COMMUTE_LOG] callback %s\n", __FUNCTION__); fflush(stderr);
  65. }
  66. void callback_b_cpu(void *buffers[], void *cl_arg)
  67. {
  68. (void)buffers;
  69. (void)cl_arg;
  70. usleep(100000);
  71. FPRINTF(stderr, "[COMMUTE_LOG] callback %s\n", __FUNCTION__); fflush(stderr);
  72. }
  73. void callback_c_cpu(void *buffers[], void *cl_arg)
  74. {
  75. (void)buffers;
  76. (void)cl_arg;
  77. usleep(100000);
  78. FPRINTF(stderr, "[COMMUTE_LOG] callback %s\n", __FUNCTION__); fflush(stderr);
  79. }
  80. #ifdef STARPU_USE_OPENCL
  81. void callback_a_opencl(void *buffers[], void *cl_arg)
  82. {
  83. (void)buffers;
  84. (void)cl_arg;
  85. usleep(100000);
  86. FPRINTF(stderr, "[COMMUTE_LOG] callback %s\n", __FUNCTION__); fflush(stderr);
  87. }
  88. void callback_b_opencl(void *buffers[], void *cl_arg)
  89. {
  90. (void)buffers;
  91. (void)cl_arg;
  92. usleep(100000);
  93. FPRINTF(stderr, "[COMMUTE_LOG] callback %s\n", __FUNCTION__); fflush(stderr);
  94. }
  95. void callback_c_opencl(void *buffers[], void *cl_arg)
  96. {
  97. (void)buffers;
  98. (void)cl_arg;
  99. usleep(100000);
  100. FPRINTF(stderr, "[COMMUTE_LOG] callback %s\n", __FUNCTION__); fflush(stderr);
  101. }
  102. #endif
  103. int main(void)
  104. {
  105. int ret;
  106. struct starpu_conf conf;
  107. int ncpus, nopencls;
  108. ret = starpu_conf_init(&conf);
  109. STARPU_CHECK_RETURN_VALUE(ret, "starpu_conf_init");
  110. assert(ret == 0);
  111. conf.sched_policy_name = "heteroprio";
  112. conf.sched_policy_init = &initSchedulerCallback;
  113. ret = starpu_init(&conf);
  114. if (ret == -ENODEV)
  115. return 77;
  116. ncpus = starpu_cpu_worker_get_count();
  117. nopencls = starpu_opencl_worker_get_count();
  118. FPRINTF(stderr, "Worker = %u\n", starpu_worker_get_count());
  119. FPRINTF(stderr, "Worker CPU = %d\n", ncpus);
  120. FPRINTF(stderr, "Worker OpenCL = %d\n", nopencls);
  121. if (ncpus + nopencls == 0)
  122. {
  123. FPRINTF(stderr, "Needs at least one CPU or OpenCL device\n");
  124. starpu_shutdown();
  125. return 77;
  126. }
  127. struct starpu_codelet codeleteA;
  128. {
  129. memset(&codeleteA, 0, sizeof(codeleteA));
  130. codeleteA.nbuffers = 2;
  131. codeleteA.modes[0] = STARPU_RW;
  132. codeleteA.modes[1] = STARPU_RW;
  133. codeleteA.name = "codeleteA";
  134. #ifdef STARPU_USE_CPU
  135. codeleteA.cpu_funcs[0] = callback_a_cpu;
  136. #endif
  137. #ifdef STARPU_USE_OPENCL
  138. codeleteA.opencl_funcs[0] = callback_a_opencl;
  139. #endif
  140. }
  141. struct starpu_codelet codeleteB;
  142. {
  143. memset(&codeleteB, 0, sizeof(codeleteB));
  144. codeleteB.nbuffers = 2;
  145. codeleteB.modes[0] = STARPU_RW;
  146. codeleteB.modes[1] = STARPU_RW;
  147. codeleteB.name = "codeleteB";
  148. codeleteB.cpu_funcs[0] = callback_b_cpu;
  149. #ifdef STARPU_USE_OPENCL
  150. codeleteB.opencl_funcs[0] = callback_b_opencl;
  151. #endif
  152. }
  153. struct starpu_codelet codeleteC;
  154. {
  155. memset(&codeleteC, 0, sizeof(codeleteC));
  156. codeleteC.nbuffers = 2;
  157. codeleteC.modes[0] = STARPU_RW;
  158. codeleteC.modes[1] = STARPU_RW;
  159. codeleteC.name = "codeleteC";
  160. codeleteC.cpu_funcs[0] = callback_c_cpu;
  161. #ifdef STARPU_USE_OPENCL
  162. codeleteC.opencl_funcs[0] = callback_c_opencl;
  163. #endif
  164. }
  165. const int nbHandles = 10;
  166. FPRINTF(stderr, "Nb handles = %d\n", nbHandles);
  167. starpu_data_handle_t handles[nbHandles];
  168. memset(handles, 0, sizeof(handles[0])*nbHandles);
  169. int dataA[nbHandles];
  170. int idx;
  171. for(idx = 0; idx < nbHandles; ++idx)
  172. {
  173. dataA[idx] = idx;
  174. }
  175. int idxHandle;
  176. for(idxHandle = 0; idxHandle < nbHandles; ++idxHandle)
  177. {
  178. starpu_variable_data_register(&handles[idxHandle], 0, (uintptr_t)&dataA[idxHandle], sizeof(dataA[idxHandle]));
  179. }
  180. const int nbTasks = 4;
  181. FPRINTF(stderr, "Submit %d tasks \n", nbTasks);
  182. int prio2 = starpu_cpu_worker_get_count() ? 2 : 1;
  183. int idxTask;
  184. for(idxTask = 0; idxTask < nbTasks; ++idxTask)
  185. {
  186. starpu_insert_task(&codeleteA,
  187. STARPU_PRIORITY, 0,
  188. (STARPU_RW), handles[(idxTask*2)%nbHandles],
  189. (STARPU_RW), handles[(idxTask*3+1)%nbHandles],
  190. 0);
  191. starpu_insert_task(&codeleteB,
  192. STARPU_PRIORITY, 1,
  193. (STARPU_RW), handles[(idxTask*2 +1 )%nbHandles],
  194. (STARPU_RW), handles[(idxTask*2)%nbHandles],
  195. 0);
  196. starpu_insert_task(&codeleteC,
  197. STARPU_PRIORITY, prio2,
  198. (STARPU_RW), handles[(idxTask)%nbHandles],
  199. (STARPU_RW), handles[(idxTask*idxTask)%nbHandles],
  200. 0);
  201. }
  202. FPRINTF(stderr, "Wait task\n");
  203. starpu_task_wait_for_all();
  204. FPRINTF(stderr, "Release data\n");
  205. for(idxHandle = 0 ; idxHandle < nbHandles ; ++idxHandle)
  206. {
  207. starpu_data_unregister(handles[idxHandle]);
  208. }
  209. FPRINTF(stderr, "Shutdown\n");
  210. starpu_shutdown();
  211. return 0;
  212. }