sched_ctx.h 9.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265
  1. /* StarPU --- Runtime system for heterogeneous multicore architectures.
  2. *
  3. * Copyright (C) 2011, 2013 INRIA
  4. *
  5. * StarPU is free software; you can redistribute it and/or modify
  6. * it under the terms of the GNU Lesser General Public License as published by
  7. * the Free Software Foundation; either version 2.1 of the License, or (at
  8. * your option) any later version.
  9. *
  10. * StarPU is distributed in the hope that it will be useful, but
  11. * WITHOUT ANY WARRANTY; without even the implied warranty of
  12. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
  13. *
  14. * See the GNU Lesser General Public License in COPYING.LGPL for more details.
  15. */
  16. #ifndef __SCHED_CONTEXT_H__
  17. #define __SCHED_CONTEXT_H__
  18. #include <starpu.h>
  19. #include <starpu_sched_ctx.h>
  20. #include <starpu_sched_ctx_hypervisor.h>
  21. #include <starpu_scheduler.h>
  22. #include <common/config.h>
  23. #include <common/barrier_counter.h>
  24. #include <profiling/profiling.h>
  25. #include <semaphore.h>
  26. #include "sched_ctx_list.h"
  27. #ifdef STARPU_HAVE_HWLOC
  28. #include <hwloc.h>
  29. #endif
  30. #define NO_RESIZE -1
  31. #define REQ_RESIZE 0
  32. #define DO_RESIZE 1
  33. #define STARPU_GLOBAL_SCHED_CTX 0
  34. struct _starpu_sched_ctx
  35. {
  36. /* id of the context used in user mode*/
  37. unsigned id;
  38. /* name of context */
  39. const char *name;
  40. /* policy of the context */
  41. struct starpu_sched_policy *sched_policy;
  42. /* data necessary for the policy */
  43. void *policy_data;
  44. /* pointer for application use */
  45. void *user_data;
  46. struct starpu_worker_collection *workers;
  47. /* we keep an initial sched which we never delete */
  48. unsigned is_initial_sched;
  49. /* wait for the tasks submitted to the context to be executed */
  50. struct _starpu_barrier_counter tasks_barrier;
  51. /* wait for the tasks ready of the context to be executed */
  52. struct _starpu_barrier_counter ready_tasks_barrier;
  53. /* amount of ready flops in a context */
  54. double ready_flops;
  55. /* cond to block push when there are no workers in the ctx */
  56. starpu_pthread_cond_t no_workers_cond;
  57. /* mutex to block push when there are no workers in the ctx */
  58. starpu_pthread_mutex_t no_workers_mutex;
  59. /*ready tasks that couldn't be pushed because the ctx has no workers*/
  60. struct starpu_task_list empty_ctx_tasks;
  61. /* mutext protecting empty_ctx_tasks list */
  62. starpu_pthread_mutex_t empty_ctx_mutex;
  63. /*ready tasks that couldn't be pushed because the the window of tasks was already full*/
  64. struct starpu_task_list waiting_tasks;
  65. /* mutext protecting waiting_tasks list */
  66. starpu_pthread_mutex_t waiting_tasks_mutex;
  67. /* mutext protecting write to all worker's sched_ctx_list structure for this sched_ctx */
  68. starpu_pthread_mutex_t sched_ctx_list_mutex;
  69. /* min CPUs to execute*/
  70. int min_ncpus;
  71. /* max CPUs to execute*/
  72. int max_ncpus;
  73. /* min GPUs to execute*/
  74. int min_ngpus;
  75. /* max GPUs to execute*/
  76. int max_ngpus;
  77. /* in case we delete the context leave resources to the inheritor*/
  78. unsigned inheritor;
  79. /* indicates whether the application finished submitting tasks
  80. to this context*/
  81. unsigned finished_submit;
  82. /* By default we have a binary type of priority: either a task is a priority
  83. * task (level 1) or it is not (level 0). */
  84. int min_priority;
  85. int max_priority;
  86. int min_priority_is_set;
  87. int max_priority_is_set;
  88. /* hwloc tree structure of workers */
  89. #ifdef STARPU_HAVE_HWLOC
  90. hwloc_bitmap_t hwloc_workers_set;
  91. #endif
  92. #ifdef STARPU_USE_SC_HYPERVISOR
  93. /* a structure containing a series of performance counters determining the resize procedure */
  94. struct starpu_sched_ctx_performance_counters *perf_counters;
  95. #endif //STARPU_USE_SC_HYPERVISOR
  96. /* callback called when the context finished executed its submitted tasks */
  97. void (*close_callback)(unsigned sched_ctx_id, void* args);
  98. void *close_args;
  99. /* value placing the contexts in their hierarchy */
  100. unsigned hierarchy_level;
  101. /* if we execute non-StarPU code inside the context
  102. we have a single master worker that stays awake,
  103. if not master is -1 */
  104. int main_master;
  105. /* conditions variables used when parallel sections are executed in contexts */
  106. starpu_pthread_cond_t parallel_sect_cond[STARPU_NMAXWORKERS];
  107. starpu_pthread_mutex_t parallel_sect_mutex[STARPU_NMAXWORKERS];
  108. starpu_pthread_cond_t parallel_sect_cond_busy[STARPU_NMAXWORKERS];
  109. int busy[STARPU_NMAXWORKERS];
  110. /* boolean indicating that workers should block in order to allow
  111. parallel sections to be executed on their allocated resources */
  112. unsigned parallel_sect[STARPU_NMAXWORKERS];
  113. /* id of the master worker */
  114. int master[STARPU_NMAXWORKERS];
  115. /* semaphore that block appl thread until starpu threads are
  116. all blocked and ready to exec the parallel code */
  117. sem_t fall_asleep_sem[STARPU_NMAXWORKERS];
  118. /* semaphore that block appl thread until starpu threads are
  119. all woke up and ready continue appl */
  120. sem_t wake_up_sem[STARPU_NMAXWORKERS];
  121. /* bool indicating if the workers is sleeping in this ctx */
  122. unsigned sleeping[STARPU_NMAXWORKERS];
  123. /* ctx nesting the current ctx */
  124. unsigned nesting_sched_ctx;
  125. /* perf model for the device comb of the ctx */
  126. struct starpu_perfmodel_arch perf_arch;
  127. /* for ctxs without policy: flag to indicate that we want to get
  128. the threads to sleep in order to replace them with other threads or leave
  129. them awake & use them in the parallel code*/
  130. unsigned awake_workers;
  131. /* function called when initializing the scheduler */
  132. void (*init_sched)();
  133. };
  134. struct _starpu_machine_config;
  135. /* init sched_ctx_id of all contextes*/
  136. void _starpu_init_all_sched_ctxs(struct _starpu_machine_config *config);
  137. /* allocate all structures belonging to a context */
  138. struct _starpu_sched_ctx* _starpu_create_sched_ctx(struct starpu_sched_policy *policy, int *workerid, int nworkerids, unsigned is_init_sched, const char *sched_name,
  139. int min_prio_set, int min_prio,
  140. int max_prio_set, int max_prio, unsigned awake_workers, void (*sched_policy_init)(void), void *user_data);
  141. /* delete all sched_ctx */
  142. void _starpu_delete_all_sched_ctxs();
  143. /* This function waits until all the tasks that were already submitted to a specific
  144. * context have been executed. */
  145. int _starpu_wait_for_all_tasks_of_sched_ctx(unsigned sched_ctx_id);
  146. /* This function waits until at most n tasks are still submitted. */
  147. int _starpu_wait_for_n_submitted_tasks_of_sched_ctx(unsigned sched_ctx_id, unsigned n);
  148. /* In order to implement starpu_wait_for_all_tasks_of_ctx, we keep track of the number of
  149. * task currently submitted to the context */
  150. void _starpu_decrement_nsubmitted_tasks_of_sched_ctx(unsigned sched_ctx_id);
  151. void _starpu_increment_nsubmitted_tasks_of_sched_ctx(unsigned sched_ctx_id);
  152. int _starpu_get_nsubmitted_tasks_of_sched_ctx(unsigned sched_ctx_id);
  153. int _starpu_check_nsubmitted_tasks_of_sched_ctx(unsigned sched_ctx_id);
  154. void _starpu_decrement_nready_tasks_of_sched_ctx(unsigned sched_ctx_id, double ready_flops);
  155. unsigned _starpu_increment_nready_tasks_of_sched_ctx(unsigned sched_ctx_id, double ready_flops, struct starpu_task *task);
  156. int _starpu_wait_for_no_ready_of_sched_ctx(unsigned sched_ctx_id);
  157. /* Return the corresponding index of the workerid in the ctx table */
  158. int _starpu_get_index_in_ctx_of_workerid(unsigned sched_ctx, unsigned workerid);
  159. /* Get the mutex corresponding to the global workerid */
  160. starpu_pthread_mutex_t *_starpu_get_sched_mutex(struct _starpu_sched_ctx *sched_ctx, int worker);
  161. /* Get workers belonging to a certain context, it returns the number of workers
  162. take care: no mutex taken, the list of workers might not be updated */
  163. int _starpu_get_workers_of_sched_ctx(unsigned sched_ctx_id, int *pus, enum starpu_worker_archtype arch);
  164. /* Let the worker know it does not belong to the context and that
  165. it should stop poping from it */
  166. void _starpu_worker_gets_out_of_ctx(unsigned sched_ctx_id, struct _starpu_worker *worker);
  167. /* Check if the worker belongs to another sched_ctx */
  168. unsigned _starpu_worker_belongs_to_a_sched_ctx(int workerid, unsigned sched_ctx_id);
  169. /* mutex synchronising several simultaneous modifications of a context */
  170. starpu_pthread_rwlock_t* _starpu_sched_ctx_get_changing_ctx_mutex(unsigned sched_ctx_id);
  171. /* indicates wheather this worker should go to sleep or not
  172. (if it is the last one awake in a context he should better keep awake) */
  173. unsigned _starpu_sched_ctx_last_worker_awake(struct _starpu_worker *worker);
  174. /* let the appl know that the worker blocked to execute parallel code */
  175. void _starpu_sched_ctx_signal_worker_blocked(unsigned sched_ctx_id, int workerid);
  176. /* let the appl know that the worker woke up */
  177. void _starpu_sched_ctx_signal_worker_woke_up(unsigned sched_ctx_id, int workerid);
  178. /* If starpu_sched_ctx_set_context() has been called, returns the context
  179. * id set by its last call, or the id of the initial context */
  180. unsigned _starpu_sched_ctx_get_current_context();
  181. /* verify how many workers can execute a certain task */
  182. int _starpu_nworkers_able_to_execute_task(struct starpu_task *task, struct _starpu_sched_ctx *sched_ctx);
  183. void _starpu_fetch_tasks_from_empty_ctx_list(struct _starpu_sched_ctx *sched_ctx);
  184. unsigned _starpu_sched_ctx_allow_hypervisor(unsigned sched_ctx_id);
  185. struct starpu_perfmodel_arch * _starpu_sched_ctx_get_perf_archtype(unsigned sched_ctx);
  186. #ifdef STARPU_USE_SC_HYPERVISOR
  187. /* Notifies the hypervisor that a tasks was poped from the workers' list */
  188. void _starpu_sched_ctx_post_exec_task_cb(int workerid, struct starpu_task *task, size_t data_size, uint32_t footprint);
  189. #endif //STARPU_USE_SC_HYPERVISOR
  190. /* if the worker is the master of a parallel context, and the job is meant to be executed on this parallel context, return a pointer to the context */
  191. struct _starpu_sched_ctx *__starpu_sched_ctx_get_sched_ctx_for_worker_and_job(struct _starpu_worker *worker, struct _starpu_job *j);
  192. #define _starpu_sched_ctx_get_sched_ctx_for_worker_and_job(w,j) \
  193. (_starpu_get_nsched_ctxs() <= 1 ? _starpu_get_sched_ctx_struct(0) : __starpu_sched_ctx_get_sched_ctx_for_worker_and_job((w),(j)))
  194. #endif // __SCHED_CONTEXT_H__