sched_policy.c 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522
  1. /* StarPU --- Runtime system for heterogeneous multicore architectures.
  2. *
  3. * Copyright (C) 2010-2012 Université de Bordeaux 1
  4. * Copyright (C) 2010-2012 Centre National de la Recherche Scientifique
  5. *
  6. * StarPU is free software; you can redistribute it and/or modify
  7. * it under the terms of the GNU Lesser General Public License as published by
  8. * the Free Software Foundation; either version 2.1 of the License, or (at
  9. * your option) any later version.
  10. *
  11. * StarPU is distributed in the hope that it will be useful, but
  12. * WITHOUT ANY WARRANTY; without even the implied warranty of
  13. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
  14. *
  15. * See the GNU Lesser General Public License in COPYING.LGPL for more details.
  16. */
  17. #include <pthread.h>
  18. #include <starpu.h>
  19. #include <common/config.h>
  20. #include <common/utils.h>
  21. #include <core/sched_policy.h>
  22. #include <profiling/profiling.h>
  23. #include <common/barrier.h>
  24. static struct starpu_sched_policy policy;
  25. static int use_prefetch = 0;
  26. int starpu_get_prefetch_flag(void)
  27. {
  28. return use_prefetch;
  29. }
  30. /*
  31. * Predefined policies
  32. */
  33. extern struct starpu_sched_policy _starpu_sched_ws_policy;
  34. extern struct starpu_sched_policy _starpu_sched_prio_policy;
  35. extern struct starpu_sched_policy _starpu_sched_random_policy;
  36. extern struct starpu_sched_policy _starpu_sched_dm_policy;
  37. extern struct starpu_sched_policy _starpu_sched_dmda_policy;
  38. extern struct starpu_sched_policy _starpu_sched_dmda_ready_policy;
  39. extern struct starpu_sched_policy _starpu_sched_dmda_sorted_policy;
  40. extern struct starpu_sched_policy _starpu_sched_eager_policy;
  41. extern struct starpu_sched_policy _starpu_sched_parallel_heft_policy;
  42. extern struct starpu_sched_policy _starpu_sched_pgreedy_policy;
  43. extern struct starpu_sched_policy heft_policy;
  44. static struct starpu_sched_policy *predefined_policies[] =
  45. {
  46. &_starpu_sched_ws_policy,
  47. &_starpu_sched_prio_policy,
  48. &_starpu_sched_dm_policy,
  49. &_starpu_sched_dmda_policy,
  50. &heft_policy,
  51. &_starpu_sched_dmda_ready_policy,
  52. &_starpu_sched_dmda_sorted_policy,
  53. &_starpu_sched_random_policy,
  54. &_starpu_sched_eager_policy,
  55. &_starpu_sched_parallel_heft_policy,
  56. &_starpu_sched_pgreedy_policy
  57. };
  58. struct starpu_sched_policy *_starpu_get_sched_policy(void)
  59. {
  60. return &policy;
  61. }
  62. /*
  63. * Methods to initialize the scheduling policy
  64. */
  65. static void load_sched_policy(struct starpu_sched_policy *sched_policy)
  66. {
  67. STARPU_ASSERT(sched_policy);
  68. #ifdef STARPU_VERBOSE
  69. if (sched_policy->policy_name)
  70. {
  71. if (sched_policy->policy_description)
  72. _STARPU_DEBUG("Use %s scheduler (%s)\n", sched_policy->policy_name, sched_policy->policy_description);
  73. else
  74. _STARPU_DEBUG("Use %s scheduler \n", sched_policy->policy_name);
  75. }
  76. #endif
  77. policy.init_sched = sched_policy->init_sched;
  78. policy.deinit_sched = sched_policy->deinit_sched;
  79. policy.push_task = sched_policy->push_task;
  80. policy.push_task_notify = sched_policy->push_task_notify;
  81. policy.pop_task = sched_policy->pop_task;
  82. policy.pre_exec_hook = sched_policy->pre_exec_hook;
  83. policy.post_exec_hook = sched_policy->post_exec_hook;
  84. policy.pop_every_task = sched_policy->pop_every_task;
  85. }
  86. static struct starpu_sched_policy *find_sched_policy_from_name(const char *policy_name)
  87. {
  88. if (!policy_name)
  89. return NULL;
  90. unsigned i;
  91. for (i = 0; i < sizeof(predefined_policies)/sizeof(predefined_policies[0]); i++)
  92. {
  93. struct starpu_sched_policy *p;
  94. p = predefined_policies[i];
  95. if (p->policy_name)
  96. {
  97. if (strcmp(policy_name, p->policy_name) == 0)
  98. {
  99. /* we found a policy with the requested name */
  100. return p;
  101. }
  102. }
  103. }
  104. fprintf(stderr, "Warning: scheduling policy \"%s\" was not found, try \"help\" to get a list\n", policy_name);
  105. /* nothing was found */
  106. return NULL;
  107. }
  108. static void display_sched_help_message(void)
  109. {
  110. const char *sched_env = getenv("STARPU_SCHED");
  111. if (sched_env && (strcmp(sched_env, "help") == 0))
  112. {
  113. fprintf(stderr, "STARPU_SCHED can be either of\n");
  114. /* display the description of all predefined policies */
  115. unsigned i;
  116. for (i = 0; i < sizeof(predefined_policies)/sizeof(predefined_policies[0]); i++)
  117. {
  118. struct starpu_sched_policy *p;
  119. p = predefined_policies[i];
  120. fprintf(stderr, "%s\t-> %s\n", p->policy_name, p->policy_description);
  121. }
  122. }
  123. }
  124. static struct starpu_sched_policy *select_sched_policy(struct _starpu_machine_config *config)
  125. {
  126. struct starpu_sched_policy *selected_policy = NULL;
  127. /* First, we check whether the application explicitely gave a scheduling policy or not */
  128. if (config->conf->sched_policy)
  129. return config->conf->sched_policy;
  130. /* Otherwise, we look if the application specified the name of a policy to load */
  131. if (config->conf->sched_policy_name)
  132. selected_policy = find_sched_policy_from_name(config->conf->sched_policy_name);
  133. /* Perhaps there was no policy that matched the name */
  134. if (selected_policy)
  135. return selected_policy;
  136. /* If no policy was specified, we use the greedy policy as a default */
  137. return &_starpu_sched_eager_policy;
  138. }
  139. void _starpu_init_sched_policy(struct _starpu_machine_config *config)
  140. {
  141. /* Perhaps we have to display some help */
  142. display_sched_help_message();
  143. /* Prefetch is activated by default */
  144. use_prefetch = starpu_get_env_number("STARPU_PREFETCH");
  145. if (use_prefetch == -1)
  146. use_prefetch = 1;
  147. /* Set calibrate flag */
  148. _starpu_set_calibrate_flag(config->conf->calibrate);
  149. struct starpu_sched_policy *selected_policy;
  150. selected_policy = select_sched_policy(config);
  151. load_sched_policy(selected_policy);
  152. policy.init_sched(&config->topology, &policy);
  153. }
  154. void _starpu_deinit_sched_policy(struct _starpu_machine_config *config)
  155. {
  156. if (policy.deinit_sched)
  157. policy.deinit_sched(&config->topology, &policy);
  158. }
  159. /* Enqueue a task into the list of tasks explicitely attached to a worker. In
  160. * case workerid identifies a combined worker, a task will be enqueued into
  161. * each worker of the combination. */
  162. static int _starpu_push_task_on_specific_worker(struct starpu_task *task, int workerid)
  163. {
  164. int nbasic_workers = (int)starpu_worker_get_count();
  165. /* Is this a basic worker or a combined worker ? */
  166. int is_basic_worker = (workerid < nbasic_workers);
  167. unsigned memory_node;
  168. struct _starpu_worker *worker = NULL;
  169. struct _starpu_combined_worker *combined_worker = NULL;
  170. if (is_basic_worker)
  171. {
  172. worker = _starpu_get_worker_struct(workerid);
  173. memory_node = worker->memory_node;
  174. }
  175. else
  176. {
  177. combined_worker = _starpu_get_combined_worker_struct(workerid);
  178. memory_node = combined_worker->memory_node;
  179. }
  180. if (use_prefetch)
  181. starpu_prefetch_task_input_on_node(task, memory_node);
  182. if (policy.push_task_notify)
  183. policy.push_task_notify(task, workerid);
  184. if (is_basic_worker)
  185. {
  186. unsigned node = starpu_worker_get_memory_node(workerid);
  187. if (_starpu_task_uses_multiformat_handles(task))
  188. {
  189. unsigned i;
  190. for (i = 0; i < task->cl->nbuffers; i++)
  191. {
  192. struct starpu_task *conversion_task;
  193. starpu_data_handle_t handle;
  194. handle = task->handles[i];
  195. if (!_starpu_handle_needs_conversion_task(handle, node))
  196. continue;
  197. conversion_task = _starpu_create_conversion_task(handle, node);
  198. conversion_task->mf_skip = 1;
  199. conversion_task->execute_on_a_specific_worker = 1;
  200. conversion_task->workerid = workerid;
  201. _starpu_task_submit_conversion_task(conversion_task, workerid);
  202. //_STARPU_DEBUG("Pushing a conversion task\n");
  203. }
  204. for (i = 0; i < task->cl->nbuffers; i++)
  205. task->handles[i]->mf_node = node;
  206. }
  207. return _starpu_push_local_task(worker, task, 0);
  208. }
  209. else
  210. {
  211. /* This is a combined worker so we create task aliases */
  212. int worker_size = combined_worker->worker_size;
  213. int *combined_workerid = combined_worker->combined_workerid;
  214. int ret = 0;
  215. int i;
  216. struct _starpu_job *j = _starpu_get_job_associated_to_task(task);
  217. j->task_size = worker_size;
  218. j->combined_workerid = workerid;
  219. j->active_task_alias_count = 0;
  220. _STARPU_PTHREAD_BARRIER_INIT(&j->before_work_barrier, NULL, worker_size);
  221. _STARPU_PTHREAD_BARRIER_INIT(&j->after_work_barrier, NULL, worker_size);
  222. for (i = 0; i < worker_size; i++)
  223. {
  224. struct starpu_task *alias = _starpu_create_task_alias(task);
  225. worker = _starpu_get_worker_struct(combined_workerid[i]);
  226. ret |= _starpu_push_local_task(worker, alias, 0);
  227. }
  228. return ret;
  229. }
  230. }
  231. /* the generic interface that call the proper underlying implementation */
  232. int _starpu_push_task(struct _starpu_job *j)
  233. {
  234. struct starpu_task *task = j->task;
  235. _STARPU_LOG_IN();
  236. _starpu_increment_nready_tasks();
  237. task->status = STARPU_TASK_READY;
  238. _starpu_profiling_set_task_push_start_time(task);
  239. /* in case there is no codelet associated to the task (that's a control
  240. * task), we directly execute its callback and enforce the
  241. * corresponding dependencies */
  242. if (task->cl == NULL)
  243. {
  244. _starpu_handle_job_termination(j);
  245. _STARPU_LOG_OUT_TAG("handle_job_termination");
  246. return 0;
  247. }
  248. int ret;
  249. if (STARPU_UNLIKELY(task->execute_on_a_specific_worker))
  250. {
  251. ret = _starpu_push_task_on_specific_worker(task, task->workerid);
  252. }
  253. else
  254. {
  255. STARPU_ASSERT(policy.push_task);
  256. ret = policy.push_task(task);
  257. }
  258. _starpu_profiling_set_task_push_end_time(task);
  259. _STARPU_LOG_OUT();
  260. return ret;
  261. }
  262. /*
  263. * Given a handle that needs to be converted in order to be used on the given
  264. * node, returns a task that takes care of the conversion.
  265. */
  266. struct starpu_task *_starpu_create_conversion_task(starpu_data_handle_t handle,
  267. unsigned int node)
  268. {
  269. struct starpu_task *conversion_task;
  270. struct starpu_multiformat_interface *format_interface;
  271. enum starpu_node_kind node_kind;
  272. conversion_task = starpu_task_create();
  273. conversion_task->synchronous = 0;
  274. conversion_task->handles[0] = handle;
  275. /* The node does not really matter here */
  276. format_interface = (struct starpu_multiformat_interface *) starpu_data_get_interface_on_node(handle, 0);
  277. node_kind = starpu_node_get_kind(node);
  278. _starpu_spin_lock(&handle->header_lock);
  279. handle->refcnt++;
  280. handle->busy_count++;
  281. _starpu_spin_unlock(&handle->header_lock);
  282. struct starpu_multiformat_data_interface_ops *mf_ops;
  283. mf_ops = (struct starpu_multiformat_data_interface_ops *) handle->ops->get_mf_ops(format_interface);
  284. switch(node_kind)
  285. {
  286. case STARPU_CPU_RAM:
  287. switch (starpu_node_get_kind(handle->mf_node))
  288. {
  289. case STARPU_CPU_RAM:
  290. STARPU_ASSERT(0);
  291. #ifdef STARPU_USE_CUDA
  292. case STARPU_CUDA_RAM:
  293. conversion_task->cl = mf_ops->cuda_to_cpu_cl;
  294. break;
  295. #endif
  296. #ifdef STARPU_USE_OPENCL
  297. case STARPU_OPENCL_RAM:
  298. conversion_task->cl = mf_ops->opencl_to_cpu_cl;
  299. break;
  300. #endif
  301. default:
  302. fprintf(stderr, "Oops : %u\n", handle->mf_node);
  303. STARPU_ASSERT(0);
  304. }
  305. break;
  306. #ifdef STARPU_USE_CUDA
  307. case STARPU_CUDA_RAM:
  308. conversion_task->cl = mf_ops->cpu_to_cuda_cl;
  309. break;
  310. #endif
  311. #ifdef STARPU_USE_OPENCL
  312. case STARPU_OPENCL_RAM:
  313. conversion_task->cl = mf_ops->cpu_to_opencl_cl;
  314. break;
  315. #endif
  316. case STARPU_SPU_LS: /* Not supported */
  317. default:
  318. STARPU_ASSERT(0);
  319. }
  320. conversion_task->cl->modes[0] = STARPU_RW;
  321. return conversion_task;
  322. }
  323. struct starpu_task *_starpu_pop_task(struct _starpu_worker *worker)
  324. {
  325. struct starpu_task *task;
  326. int worker_id;
  327. unsigned node;
  328. /* We can't tell in advance which task will be picked up, so we measure
  329. * a timestamp, and will attribute it afterwards to the task. */
  330. int profiling = starpu_profiling_status_get();
  331. struct timespec pop_start_time;
  332. if (profiling)
  333. _starpu_clock_gettime(&pop_start_time);
  334. pick:
  335. /* perhaps there is some local task to be executed first */
  336. task = _starpu_pop_local_task(worker);
  337. if (!task && policy.pop_task)
  338. task = policy.pop_task();
  339. if (!task)
  340. return NULL;
  341. /* Make sure we do not bother with all the multiformat-specific code if
  342. * it is not necessary. */
  343. if (!_starpu_task_uses_multiformat_handles(task))
  344. goto profiling;
  345. /* This is either a conversion task, or a regular task for which the
  346. * conversion tasks have already been created and submitted */
  347. if (task->mf_skip)
  348. goto profiling;
  349. worker_id = starpu_worker_get_id();
  350. if (!starpu_worker_can_execute_task(worker_id, task, 0))
  351. return task;
  352. node = starpu_worker_get_memory_node(worker_id);
  353. /*
  354. * We do have a task that uses multiformat handles. Let's create the
  355. * required conversion tasks.
  356. */
  357. unsigned i;
  358. for (i = 0; i < task->cl->nbuffers; i++)
  359. {
  360. struct starpu_task *conversion_task;
  361. starpu_data_handle_t handle;
  362. handle = task->handles[i];
  363. if (!_starpu_handle_needs_conversion_task(handle, node))
  364. continue;
  365. conversion_task = _starpu_create_conversion_task(handle, node);
  366. conversion_task->mf_skip = 1;
  367. conversion_task->execute_on_a_specific_worker = 1;
  368. conversion_task->workerid = worker_id;
  369. /*
  370. * Next tasks will need to know where these handles have gone.
  371. */
  372. handle->mf_node = node;
  373. _starpu_task_submit_conversion_task(conversion_task, worker_id);
  374. }
  375. task->mf_skip = 1;
  376. starpu_task_list_push_front(&worker->local_tasks, task);
  377. goto pick;
  378. profiling:
  379. if (profiling)
  380. {
  381. struct starpu_task_profiling_info *profiling_info;
  382. profiling_info = task->profiling_info;
  383. /* The task may have been created before profiling was enabled,
  384. * so we check if the profiling_info structure is available
  385. * even though we already tested if profiling is enabled. */
  386. if (profiling_info)
  387. {
  388. memcpy(&profiling_info->pop_start_time,
  389. &pop_start_time, sizeof(struct timespec));
  390. _starpu_clock_gettime(&profiling_info->pop_end_time);
  391. }
  392. }
  393. return task;
  394. }
  395. struct starpu_task *_starpu_pop_every_task(void)
  396. {
  397. STARPU_ASSERT(policy.pop_every_task);
  398. /* TODO set profiling info */
  399. return policy.pop_every_task();
  400. }
  401. void _starpu_sched_pre_exec_hook(struct starpu_task *task)
  402. {
  403. if (policy.pre_exec_hook)
  404. policy.pre_exec_hook(task);
  405. }
  406. void _starpu_sched_post_exec_hook(struct starpu_task *task)
  407. {
  408. if (policy.post_exec_hook)
  409. policy.post_exec_hook(task);
  410. }
  411. void _starpu_wait_on_sched_event(void)
  412. {
  413. struct _starpu_worker *worker = _starpu_get_local_worker_key();
  414. _STARPU_PTHREAD_MUTEX_LOCK(worker->sched_mutex);
  415. _starpu_handle_all_pending_node_data_requests(worker->memory_node);
  416. if (_starpu_machine_is_running())
  417. {
  418. #ifndef STARPU_NON_BLOCKING_DRIVERS
  419. _STARPU_PTHREAD_COND_WAIT(worker->sched_cond,
  420. worker->sched_mutex);
  421. #endif
  422. }
  423. _STARPU_PTHREAD_MUTEX_UNLOCK(worker->sched_mutex);
  424. }
  425. /* The scheduling policy may put tasks directly into a worker's local queue so
  426. * that it is not always necessary to create its own queue when the local queue
  427. * is sufficient. If "back" not null, the task is put at the back of the queue
  428. * where the worker will pop tasks first. Setting "back" to 0 therefore ensures
  429. * a FIFO ordering. */
  430. int starpu_push_local_task(int workerid, struct starpu_task *task, int back)
  431. {
  432. struct _starpu_worker *worker = _starpu_get_worker_struct(workerid);
  433. return _starpu_push_local_task(worker, task, back);
  434. }