sc_hypervisor.c 31 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963
  1. /* StarPU --- Runtime system for heterogeneous multicore architectures.
  2. *
  3. * Copyright (C) 2011, 2012 INRIA
  4. *
  5. * StarPU is free software; you can redistribute it and/or modify
  6. * it under the terms of the GNU Lesser General Public License as published by
  7. * the Free Software Foundation; either version 2.1 of the License, or (at
  8. * your option) any later version.
  9. *
  10. * StarPU is distributed in the hope that it will be useful, but
  11. * WITHOUT ANY WARRANTY; without even the implied warranty of
  12. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
  13. *
  14. * See the GNU Lesser General Public License in COPYING.LGPL for more details.
  15. */
  16. #include <sc_hypervisor_intern.h>
  17. #include <sc_hypervisor_policy.h>
  18. #include <common/uthash.h>
  19. #include <starpu_config.h>
  20. unsigned imposed_resize = 0;
  21. unsigned type_of_tasks_known = 0;
  22. struct starpu_sched_ctx_performance_counters* perf_counters = NULL;
  23. static void notify_idle_cycle(unsigned sched_ctx, int worker, double idle_time);
  24. static void notify_pushed_task(unsigned sched_ctx, int worker);
  25. static void notify_poped_task(unsigned sched_ctx, int worker, struct starpu_task *task, size_t data_size, uint32_t footprint);
  26. static void notify_post_exec_hook(unsigned sched_ctx, int taskid);
  27. static void notify_idle_end(unsigned sched_ctx, int worker);
  28. static void notify_submitted_job(struct starpu_task *task, unsigned footprint);
  29. static void notify_delete_context(unsigned sched_ctx);
  30. extern struct sc_hypervisor_policy idle_policy;
  31. extern struct sc_hypervisor_policy app_driven_policy;
  32. extern struct sc_hypervisor_policy gflops_rate_policy;
  33. #ifdef STARPU_HAVE_GLPK_H
  34. extern struct sc_hypervisor_policy feft_lp_policy;
  35. extern struct sc_hypervisor_policy teft_lp_policy;
  36. extern struct sc_hypervisor_policy ispeed_lp_policy;
  37. extern struct sc_hypervisor_policy debit_lp_policy;
  38. #endif // STARPU_HAVE_GLPK_
  39. extern struct sc_hypervisor_policy ispeed_policy;
  40. static struct sc_hypervisor_policy *predefined_policies[] =
  41. {
  42. &idle_policy,
  43. &app_driven_policy,
  44. #ifdef STARPU_HAVE_GLPK_H
  45. &feft_lp_policy,
  46. &teft_lp_policy,
  47. &ispeed_lp_policy,
  48. &debit_lp_policy,
  49. #endif // STARPU_HAVE_GLPK_H
  50. &gflops_rate_policy,
  51. &ispeed_policy
  52. };
  53. static void _load_hypervisor_policy(struct sc_hypervisor_policy *policy)
  54. {
  55. STARPU_ASSERT(policy);
  56. hypervisor.policy.name = policy->name;
  57. hypervisor.policy.size_ctxs = policy->size_ctxs;
  58. hypervisor.policy.handle_poped_task = policy->handle_poped_task;
  59. hypervisor.policy.handle_pushed_task = policy->handle_pushed_task;
  60. hypervisor.policy.handle_idle_cycle = policy->handle_idle_cycle;
  61. hypervisor.policy.handle_idle_end = policy->handle_idle_end;
  62. hypervisor.policy.handle_post_exec_hook = policy->handle_post_exec_hook;
  63. hypervisor.policy.handle_submitted_job = policy->handle_submitted_job;
  64. hypervisor.policy.end_ctx = policy->end_ctx;
  65. }
  66. static struct sc_hypervisor_policy *_find_hypervisor_policy_from_name(const char *policy_name)
  67. {
  68. if (!policy_name)
  69. return NULL;
  70. unsigned i;
  71. for (i = 0; i < sizeof(predefined_policies)/sizeof(predefined_policies[0]); i++)
  72. {
  73. struct sc_hypervisor_policy *p;
  74. p = predefined_policies[i];
  75. if (p->name)
  76. {
  77. if (strcmp(policy_name, p->name) == 0) {
  78. /* we found a policy with the requested name */
  79. return p;
  80. }
  81. }
  82. }
  83. fprintf(stderr, "Warning: hypervisor policy \"%s\" was not found, try \"help\" to get a list\n", policy_name);
  84. /* nothing was found */
  85. return NULL;
  86. }
  87. static struct sc_hypervisor_policy *_select_hypervisor_policy(struct sc_hypervisor_policy* hypervisor_policy)
  88. {
  89. struct sc_hypervisor_policy *selected_policy = NULL;
  90. if(hypervisor_policy && hypervisor_policy->custom)
  91. return hypervisor_policy;
  92. /* we look if the application specified the name of a policy to load */
  93. const char *policy_name;
  94. if (hypervisor_policy && hypervisor_policy->name)
  95. {
  96. policy_name = hypervisor_policy->name;
  97. }
  98. else
  99. {
  100. policy_name = getenv("SC_HYPERVISOR_POLICY");
  101. }
  102. if (policy_name)
  103. selected_policy = _find_hypervisor_policy_from_name(policy_name);
  104. /* Perhaps there was no policy that matched the name */
  105. if (selected_policy)
  106. return selected_policy;
  107. /* If no policy was specified, we use the idle policy as a default */
  108. return &idle_policy;
  109. }
  110. /* initializez the performance counters that starpu will use to retrive hints for resizing */
  111. struct starpu_sched_ctx_performance_counters* sc_hypervisor_init(struct sc_hypervisor_policy *hypervisor_policy)
  112. {
  113. hypervisor.min_tasks = 0;
  114. hypervisor.nsched_ctxs = 0;
  115. char* vel_gap = getenv("SC_HYPERVISOR_MAX_VELOCITY_GAP");
  116. hypervisor.max_velocity_gap = vel_gap ? atof(vel_gap) : SC_VELOCITY_MAX_GAP_DEFAULT;
  117. char* crit = getenv("SC_HYPERVISOR_TRIGGER_RESIZE");
  118. hypervisor.resize_criteria = !crit ? SC_IDLE : strcmp(crit,"idle") == 0 ? SC_IDLE : (strcmp(crit,"speed") == 0 ? SC_VELOCITY : SC_NOTHING);
  119. starpu_pthread_mutex_init(&act_hypervisor_mutex, NULL);
  120. hypervisor.start_executing_time = starpu_timing_now();
  121. int i;
  122. for(i = 0; i < STARPU_NMAX_SCHED_CTXS; i++)
  123. {
  124. hypervisor.resize[i] = 0;
  125. hypervisor.allow_remove[i] = 1;
  126. hypervisor.configurations[i] = NULL;
  127. hypervisor.sr = NULL;
  128. hypervisor.check_min_tasks[i] = 1;
  129. hypervisor.sched_ctxs[i] = STARPU_NMAX_SCHED_CTXS;
  130. hypervisor.sched_ctx_w[i].sched_ctx = STARPU_NMAX_SCHED_CTXS;
  131. hypervisor.sched_ctx_w[i].config = NULL;
  132. hypervisor.sched_ctx_w[i].total_flops = 0.0;
  133. hypervisor.sched_ctx_w[i].submitted_flops = 0.0;
  134. hypervisor.sched_ctx_w[i].remaining_flops = 0.0;
  135. hypervisor.sched_ctx_w[i].start_time = 0.0;
  136. hypervisor.sched_ctx_w[i].real_start_time = 0.0;
  137. hypervisor.sched_ctx_w[i].resize_ack.receiver_sched_ctx = -1;
  138. hypervisor.sched_ctx_w[i].resize_ack.moved_workers = NULL;
  139. hypervisor.sched_ctx_w[i].resize_ack.nmoved_workers = 0;
  140. hypervisor.sched_ctx_w[i].resize_ack.acked_workers = NULL;
  141. starpu_pthread_mutex_init(&hypervisor.sched_ctx_w[i].mutex, NULL);
  142. hypervisor.optimal_v[i] = 0.0;
  143. int j;
  144. for(j = 0; j < STARPU_NMAXWORKERS; j++)
  145. {
  146. hypervisor.sched_ctx_w[i].current_idle_time[j] = 0.0;
  147. hypervisor.sched_ctx_w[i].idle_time[j] = 0.0;
  148. hypervisor.sched_ctx_w[i].idle_start_time[j] = 0.0;
  149. hypervisor.sched_ctx_w[i].pushed_tasks[j] = 0;
  150. hypervisor.sched_ctx_w[i].poped_tasks[j] = 0;
  151. hypervisor.sched_ctx_w[i].elapsed_flops[j] = 0.0;
  152. hypervisor.sched_ctx_w[i].elapsed_data[j] = 0;
  153. hypervisor.sched_ctx_w[i].elapsed_tasks[j] = 0;
  154. hypervisor.sched_ctx_w[i].total_elapsed_flops[j] = 0.0;
  155. hypervisor.sched_ctx_w[i].worker_to_be_removed[j] = 0;
  156. hypervisor.sched_ctx_w[i].ref_velocity[j] = -1.0;
  157. }
  158. }
  159. struct sc_hypervisor_policy *selected_hypervisor_policy = _select_hypervisor_policy(hypervisor_policy);
  160. _load_hypervisor_policy(selected_hypervisor_policy);
  161. perf_counters = (struct starpu_sched_ctx_performance_counters*)malloc(sizeof(struct starpu_sched_ctx_performance_counters));
  162. perf_counters->notify_idle_cycle = notify_idle_cycle;
  163. perf_counters->notify_pushed_task = notify_pushed_task;
  164. perf_counters->notify_poped_task = notify_poped_task;
  165. perf_counters->notify_post_exec_hook = notify_post_exec_hook;
  166. perf_counters->notify_idle_end = notify_idle_end;
  167. perf_counters->notify_submitted_job = notify_submitted_job;
  168. perf_counters->notify_delete_context = notify_delete_context;
  169. starpu_sched_ctx_notify_hypervisor_exists();
  170. return perf_counters;
  171. }
  172. const char* sc_hypervisor_get_policy()
  173. {
  174. return hypervisor.policy.name;
  175. }
  176. /* the user can forbid the resizing process*/
  177. void sc_hypervisor_stop_resize(unsigned sched_ctx)
  178. {
  179. imposed_resize = 1;
  180. hypervisor.resize[sched_ctx] = 0;
  181. }
  182. /* the user can restart the resizing process*/
  183. void sc_hypervisor_start_resize(unsigned sched_ctx)
  184. {
  185. imposed_resize = 1;
  186. hypervisor.resize[sched_ctx] = 1;
  187. }
  188. static void _print_current_time()
  189. {
  190. if(!getenv("SC_HYPERVISOR_STOP_PRINT"))
  191. {
  192. double curr_time = starpu_timing_now();
  193. double elapsed_time = (curr_time - hypervisor.start_executing_time) / 1000000.0; /* in seconds */
  194. fprintf(stdout, "Time: %lf\n", elapsed_time);
  195. int i;
  196. for(i = 0; i < STARPU_NMAX_SCHED_CTXS; i++)
  197. {
  198. if(hypervisor.sched_ctxs[i] != STARPU_NMAX_SCHED_CTXS)
  199. {
  200. struct sc_hypervisor_wrapper *sc_w = &hypervisor.sched_ctx_w[hypervisor.sched_ctxs[i]];
  201. double cpu_speed = sc_hypervisor_get_velocity(sc_w, STARPU_CPU_WORKER);
  202. double cuda_speed = sc_hypervisor_get_velocity(sc_w, STARPU_CUDA_WORKER);
  203. int ncpus = sc_hypervisor_get_nworkers_ctx(sc_w->sched_ctx, STARPU_CPU_WORKER);
  204. int ncuda = sc_hypervisor_get_nworkers_ctx(sc_w->sched_ctx, STARPU_CUDA_WORKER);
  205. fprintf(stdout, "%d: cpu_v = %lf cuda_v = %lf ncpus = %d ncuda = %d\n", hypervisor.sched_ctxs[i], cpu_speed, cuda_speed, ncpus, ncuda);
  206. }
  207. }
  208. }
  209. return;
  210. }
  211. void sc_hypervisor_shutdown(void)
  212. {
  213. // printf("shutdown\n");
  214. int i;
  215. for(i = 0; i < STARPU_NMAX_SCHED_CTXS; i++)
  216. {
  217. if(hypervisor.sched_ctxs[i] != STARPU_NMAX_SCHED_CTXS && hypervisor.nsched_ctxs > 0)
  218. {
  219. sc_hypervisor_stop_resize(hypervisor.sched_ctxs[i]);
  220. sc_hypervisor_unregister_ctx(hypervisor.sched_ctxs[i]);
  221. starpu_pthread_mutex_destroy(&hypervisor.sched_ctx_w[i].mutex);
  222. }
  223. }
  224. perf_counters->notify_idle_cycle = NULL;
  225. perf_counters->notify_pushed_task = NULL;
  226. perf_counters->notify_poped_task = NULL;
  227. perf_counters->notify_post_exec_hook = NULL;
  228. perf_counters->notify_idle_end = NULL;
  229. perf_counters->notify_delete_context = NULL;
  230. free(perf_counters);
  231. perf_counters = NULL;
  232. starpu_pthread_mutex_destroy(&act_hypervisor_mutex);
  233. }
  234. /* the hypervisor is in charge only of the contexts registered to it*/
  235. void sc_hypervisor_register_ctx(unsigned sched_ctx, double total_flops)
  236. {
  237. starpu_pthread_mutex_lock(&act_hypervisor_mutex);
  238. hypervisor.configurations[sched_ctx] = NULL;
  239. hypervisor.resize_requests[sched_ctx] = NULL;
  240. starpu_pthread_mutex_init(&hypervisor.conf_mut[sched_ctx], NULL);
  241. starpu_pthread_mutex_init(&hypervisor.resize_mut[sched_ctx], NULL);
  242. _add_config(sched_ctx);
  243. hypervisor.sched_ctx_w[sched_ctx].sched_ctx = sched_ctx;
  244. hypervisor.sched_ctxs[hypervisor.nsched_ctxs++] = sched_ctx;
  245. hypervisor.sched_ctx_w[sched_ctx].total_flops = total_flops;
  246. hypervisor.sched_ctx_w[sched_ctx].remaining_flops = total_flops;
  247. if(strcmp(hypervisor.policy.name, "app_driven") == 0)
  248. hypervisor.resize[sched_ctx] = 1;
  249. starpu_pthread_mutex_unlock(&act_hypervisor_mutex);
  250. }
  251. static int _get_first_free_sched_ctx(int *sched_ctxs, int nsched_ctxs)
  252. {
  253. int i;
  254. for(i = 0; i < nsched_ctxs; i++)
  255. if(sched_ctxs[i] == STARPU_NMAX_SCHED_CTXS)
  256. return i;
  257. return STARPU_NMAX_SCHED_CTXS;
  258. }
  259. /* rearange array of sched_ctxs in order not to have {MAXVAL, MAXVAL, 5, MAXVAL, 7}
  260. and have instead {5, 7, MAXVAL, MAXVAL, MAXVAL}
  261. it is easier afterwards to iterate the array
  262. */
  263. static void _rearange_sched_ctxs(int *sched_ctxs, int old_nsched_ctxs)
  264. {
  265. int first_free_id = STARPU_NMAX_SCHED_CTXS;
  266. int i;
  267. for(i = 0; i < old_nsched_ctxs; i++)
  268. {
  269. if(sched_ctxs[i] != STARPU_NMAX_SCHED_CTXS)
  270. {
  271. first_free_id = _get_first_free_sched_ctx(sched_ctxs, old_nsched_ctxs);
  272. if(first_free_id != STARPU_NMAX_SCHED_CTXS)
  273. {
  274. sched_ctxs[first_free_id] = sched_ctxs[i];
  275. sched_ctxs[i] = STARPU_NMAX_SCHED_CTXS;
  276. }
  277. }
  278. }
  279. }
  280. /* unregistered contexts will no longer be resized */
  281. void sc_hypervisor_unregister_ctx(unsigned sched_ctx)
  282. {
  283. if(hypervisor.policy.end_ctx)
  284. hypervisor.policy.end_ctx(sched_ctx);
  285. starpu_pthread_mutex_lock(&act_hypervisor_mutex);
  286. unsigned i;
  287. for(i = 0; i < hypervisor.nsched_ctxs; i++)
  288. {
  289. if(hypervisor.sched_ctxs[i] == (int)sched_ctx)
  290. {
  291. hypervisor.sched_ctxs[i] = STARPU_NMAX_SCHED_CTXS;
  292. break;
  293. }
  294. }
  295. _rearange_sched_ctxs(hypervisor.sched_ctxs, hypervisor.nsched_ctxs);
  296. hypervisor.nsched_ctxs--;
  297. hypervisor.sched_ctx_w[sched_ctx].sched_ctx = STARPU_NMAX_SCHED_CTXS;
  298. _remove_config(sched_ctx);
  299. /* free(hypervisor.configurations[sched_ctx]); */
  300. /* free(hypervisor.resize_requests[sched_ctx]); */
  301. starpu_pthread_mutex_destroy(&hypervisor.conf_mut[sched_ctx]);
  302. starpu_pthread_mutex_destroy(&hypervisor.resize_mut[sched_ctx]);
  303. if(hypervisor.nsched_ctxs == 1)
  304. sc_hypervisor_stop_resize(hypervisor.sched_ctxs[0]);
  305. starpu_pthread_mutex_unlock(&act_hypervisor_mutex);
  306. }
  307. double _get_max_velocity_gap()
  308. {
  309. return hypervisor.max_velocity_gap;
  310. }
  311. unsigned sc_hypervisor_get_resize_criteria()
  312. {
  313. return hypervisor.resize_criteria;
  314. }
  315. static int get_ntasks( int *tasks)
  316. {
  317. int ntasks = 0;
  318. int j;
  319. for(j = 0; j < STARPU_NMAXWORKERS; j++)
  320. {
  321. ntasks += tasks[j];
  322. }
  323. return ntasks;
  324. }
  325. static void _get_cpus(int *workers, int nworkers, int *cpus, int *ncpus)
  326. {
  327. int i, worker;
  328. *ncpus = 0;
  329. for(i = 0; i < nworkers; i++)
  330. {
  331. worker = workers[i];
  332. enum starpu_worker_archtype arch = starpu_worker_get_type(worker);
  333. if(arch == STARPU_CPU_WORKER)
  334. cpus[(*ncpus)++] = worker;
  335. }
  336. }
  337. int sc_hypervisor_get_nworkers_ctx(unsigned sched_ctx, enum starpu_worker_archtype arch)
  338. {
  339. int nworkers_ctx = 0;
  340. struct starpu_worker_collection *workers = starpu_sched_ctx_get_worker_collection(sched_ctx);
  341. int worker;
  342. struct starpu_sched_ctx_iterator it;
  343. if(workers->init_iterator)
  344. workers->init_iterator(workers, &it);
  345. while(workers->has_next(workers, &it))
  346. {
  347. worker = workers->get_next(workers, &it);
  348. enum starpu_worker_archtype curr_arch = starpu_worker_get_type(worker);
  349. if(curr_arch == arch || arch == STARPU_ANY_WORKER)
  350. nworkers_ctx++;
  351. }
  352. return nworkers_ctx;
  353. }
  354. static void _set_elapsed_flops_per_sched_ctx(unsigned sched_ctx, double val)
  355. {
  356. int i;
  357. for(i = 0; i < STARPU_NMAXWORKERS; i++)
  358. {
  359. hypervisor.sched_ctx_w[sched_ctx].elapsed_flops[i] = val;
  360. if(val == 0)
  361. {
  362. hypervisor.sched_ctx_w[sched_ctx].elapsed_data[i] = 0;
  363. hypervisor.sched_ctx_w[sched_ctx].elapsed_tasks[i] = 0;
  364. }
  365. }
  366. }
  367. double sc_hypervisor_get_elapsed_flops_per_sched_ctx(struct sc_hypervisor_wrapper* sc_w)
  368. {
  369. double ret_val = 0.0;
  370. int i;
  371. for(i = 0; i < STARPU_NMAXWORKERS; i++)
  372. ret_val += sc_w->elapsed_flops[i];
  373. return ret_val;
  374. }
  375. double sc_hypervisor_get_total_elapsed_flops_per_sched_ctx(struct sc_hypervisor_wrapper* sc_w)
  376. {
  377. double ret_val = 0.0;
  378. int i;
  379. for(i = 0; i < STARPU_NMAXWORKERS; i++)
  380. ret_val += sc_w->total_elapsed_flops[i];
  381. return ret_val;
  382. }
  383. static void _reset_idle_time(unsigned sched_ctx)
  384. {
  385. int i;
  386. for(i = 0; i < STARPU_NMAXWORKERS; i++)
  387. {
  388. hypervisor.sched_ctx_w[sched_ctx].idle_time[i] = 0.0;
  389. }
  390. return;
  391. }
  392. void _reset_resize_sample_info(unsigned sender_sched_ctx, unsigned receiver_sched_ctx)
  393. {
  394. /* info concerning only the gflops_rate strateg */
  395. struct sc_hypervisor_wrapper *sender_sc_w = &hypervisor.sched_ctx_w[sender_sched_ctx];
  396. struct sc_hypervisor_wrapper *receiver_sc_w = &hypervisor.sched_ctx_w[receiver_sched_ctx];
  397. double start_time = starpu_timing_now();
  398. sender_sc_w->start_time = start_time;
  399. _set_elapsed_flops_per_sched_ctx(sender_sched_ctx, 0.0);
  400. _reset_idle_time(sender_sched_ctx);
  401. receiver_sc_w->start_time = start_time;
  402. _set_elapsed_flops_per_sched_ctx(receiver_sched_ctx, 0.0);
  403. _reset_idle_time(receiver_sched_ctx);
  404. }
  405. /* actually move the workers: the cpus are moved, gpus are only shared */
  406. /* forbids another resize request before this one is take into account */
  407. void sc_hypervisor_move_workers(unsigned sender_sched_ctx, unsigned receiver_sched_ctx, int* workers_to_move, unsigned nworkers_to_move, unsigned now)
  408. {
  409. if(nworkers_to_move > 0 && hypervisor.resize[sender_sched_ctx])
  410. {
  411. _print_current_time();
  412. unsigned j;
  413. printf("resize ctx %d with %d workers", sender_sched_ctx, nworkers_to_move);
  414. for(j = 0; j < nworkers_to_move; j++)
  415. printf(" %d", workers_to_move[j]);
  416. printf("\n");
  417. starpu_trace_user_event(1);
  418. hypervisor.allow_remove[receiver_sched_ctx] = 0;
  419. starpu_sched_ctx_add_workers(workers_to_move, nworkers_to_move, receiver_sched_ctx);
  420. if(now)
  421. {
  422. unsigned j;
  423. printf("remove now from ctx %d:", sender_sched_ctx);
  424. for(j = 0; j < nworkers_to_move; j++)
  425. printf(" %d", workers_to_move[j]);
  426. printf("\n");
  427. starpu_sched_ctx_remove_workers(workers_to_move, nworkers_to_move, sender_sched_ctx);
  428. hypervisor.allow_remove[receiver_sched_ctx] = 1;
  429. _reset_resize_sample_info(sender_sched_ctx, receiver_sched_ctx);
  430. }
  431. else
  432. {
  433. int ret = starpu_pthread_mutex_trylock(&hypervisor.sched_ctx_w[sender_sched_ctx].mutex);
  434. if(ret != EBUSY)
  435. {
  436. hypervisor.sched_ctx_w[sender_sched_ctx].resize_ack.receiver_sched_ctx = receiver_sched_ctx;
  437. hypervisor.sched_ctx_w[sender_sched_ctx].resize_ack.moved_workers = (int*)malloc(nworkers_to_move * sizeof(int));
  438. hypervisor.sched_ctx_w[sender_sched_ctx].resize_ack.nmoved_workers = nworkers_to_move;
  439. hypervisor.sched_ctx_w[sender_sched_ctx].resize_ack.acked_workers = (int*)malloc(nworkers_to_move * sizeof(int));
  440. unsigned i;
  441. for(i = 0; i < nworkers_to_move; i++)
  442. {
  443. hypervisor.sched_ctx_w[sender_sched_ctx].current_idle_time[workers_to_move[i]] = 0.0;
  444. hypervisor.sched_ctx_w[sender_sched_ctx].resize_ack.moved_workers[i] = workers_to_move[i];
  445. hypervisor.sched_ctx_w[sender_sched_ctx].resize_ack.acked_workers[i] = 0;
  446. }
  447. hypervisor.resize[sender_sched_ctx] = 0;
  448. starpu_pthread_mutex_unlock(&hypervisor.sched_ctx_w[sender_sched_ctx].mutex);
  449. }
  450. }
  451. struct sc_hypervisor_policy_config *new_config = sc_hypervisor_get_config(receiver_sched_ctx);
  452. unsigned i;
  453. for(i = 0; i < nworkers_to_move; i++)
  454. new_config->max_idle[workers_to_move[i]] = new_config->max_idle[workers_to_move[i]] !=MAX_IDLE_TIME ? new_config->max_idle[workers_to_move[i]] : new_config->new_workers_max_idle;
  455. }
  456. return;
  457. }
  458. void sc_hypervisor_add_workers_to_sched_ctx(int* workers_to_add, unsigned nworkers_to_add, unsigned sched_ctx)
  459. {
  460. if(nworkers_to_add > 0 && hypervisor.resize[sched_ctx])
  461. {
  462. _print_current_time();
  463. unsigned j;
  464. printf("add to ctx %d:", sched_ctx);
  465. for(j = 0; j < nworkers_to_add; j++)
  466. printf(" %d", workers_to_add[j]);
  467. printf("\n");
  468. starpu_sched_ctx_add_workers(workers_to_add, nworkers_to_add, sched_ctx);
  469. struct sc_hypervisor_policy_config *new_config = sc_hypervisor_get_config(sched_ctx);
  470. unsigned i;
  471. for(i = 0; i < nworkers_to_add; i++)
  472. new_config->max_idle[workers_to_add[i]] = new_config->max_idle[workers_to_add[i]] != MAX_IDLE_TIME ? new_config->max_idle[workers_to_add[i]] : new_config->new_workers_max_idle;
  473. }
  474. return;
  475. }
  476. unsigned sc_hypervisor_can_resize(unsigned sched_ctx)
  477. {
  478. return hypervisor.resize[sched_ctx];
  479. }
  480. void sc_hypervisor_remove_workers_from_sched_ctx(int* workers_to_remove, unsigned nworkers_to_remove, unsigned sched_ctx, unsigned now)
  481. {
  482. if(nworkers_to_remove > 0 && hypervisor.resize[sched_ctx] && hypervisor.allow_remove[sched_ctx])
  483. {
  484. _print_current_time();
  485. unsigned nworkers = 0;
  486. int workers[nworkers_to_remove];
  487. if(now)
  488. {
  489. unsigned j;
  490. printf("remove explicitley now from ctx %d:", sched_ctx);
  491. for(j = 0; j < nworkers_to_remove; j++)
  492. printf(" %d", workers_to_remove[j]);
  493. printf("\n");
  494. starpu_sched_ctx_remove_workers(workers_to_remove, nworkers_to_remove, sched_ctx);
  495. }
  496. else
  497. {
  498. printf("try to remove from ctx %d: ", sched_ctx);
  499. unsigned j;
  500. for(j = 0; j < nworkers_to_remove; j++)
  501. printf(" %d", workers_to_remove[j]);
  502. printf("\n");
  503. int ret = starpu_pthread_mutex_trylock(&hypervisor.sched_ctx_w[sched_ctx].mutex);
  504. if(ret != EBUSY)
  505. {
  506. unsigned i;
  507. for(i = 0; i < nworkers_to_remove; i++)
  508. if(starpu_sched_ctx_contains_worker(workers_to_remove[i], sched_ctx))
  509. workers[nworkers++] = workers_to_remove[i];
  510. hypervisor.sched_ctx_w[sched_ctx].resize_ack.receiver_sched_ctx = -1;
  511. hypervisor.sched_ctx_w[sched_ctx].resize_ack.moved_workers = (int*)malloc(nworkers_to_remove * sizeof(int));
  512. hypervisor.sched_ctx_w[sched_ctx].resize_ack.nmoved_workers = (int)nworkers;
  513. hypervisor.sched_ctx_w[sched_ctx].resize_ack.acked_workers = (int*)malloc(nworkers_to_remove * sizeof(int));
  514. for(i = 0; i < nworkers; i++)
  515. {
  516. hypervisor.sched_ctx_w[sched_ctx].current_idle_time[workers[i]] = 0.0;
  517. hypervisor.sched_ctx_w[sched_ctx].resize_ack.moved_workers[i] = workers[i];
  518. hypervisor.sched_ctx_w[sched_ctx].resize_ack.acked_workers[i] = 0;
  519. }
  520. hypervisor.resize[sched_ctx] = 0;
  521. starpu_pthread_mutex_unlock(&hypervisor.sched_ctx_w[sched_ctx].mutex);
  522. }
  523. }
  524. }
  525. return;
  526. }
  527. static unsigned _ack_resize_completed(unsigned sched_ctx, int worker)
  528. {
  529. if(worker != -1 && !starpu_sched_ctx_contains_worker(worker, sched_ctx))
  530. return 0;
  531. struct sc_hypervisor_resize_ack *resize_ack = NULL;
  532. unsigned sender_sched_ctx = STARPU_NMAX_SCHED_CTXS;
  533. int i;
  534. for(i = 0; i < STARPU_NMAX_SCHED_CTXS; i++)
  535. {
  536. if(hypervisor.sched_ctxs[i] != STARPU_NMAX_SCHED_CTXS)
  537. {
  538. struct sc_hypervisor_wrapper *sc_w = &hypervisor.sched_ctx_w[hypervisor.sched_ctxs[i]];
  539. starpu_pthread_mutex_lock(&sc_w->mutex);
  540. unsigned only_remove = 0;
  541. if(sc_w->resize_ack.receiver_sched_ctx == -1 && hypervisor.sched_ctxs[i] != (int)sched_ctx &&
  542. sc_w->resize_ack.nmoved_workers > 0 && starpu_sched_ctx_contains_worker(worker, hypervisor.sched_ctxs[i]))
  543. {
  544. int j;
  545. for(j = 0; j < sc_w->resize_ack.nmoved_workers; j++)
  546. if(sc_w->resize_ack.moved_workers[j] == worker)
  547. {
  548. only_remove = 1;
  549. starpu_pthread_mutex_unlock(&sc_w->mutex);
  550. break;
  551. }
  552. }
  553. if(only_remove ||
  554. (sc_w->resize_ack.receiver_sched_ctx != -1 && sc_w->resize_ack.receiver_sched_ctx == (int)sched_ctx))
  555. {
  556. resize_ack = &sc_w->resize_ack;
  557. sender_sched_ctx = hypervisor.sched_ctxs[i];
  558. starpu_pthread_mutex_unlock(&sc_w->mutex);
  559. break;
  560. }
  561. starpu_pthread_mutex_unlock(&sc_w->mutex);
  562. }
  563. }
  564. /* if there is no ctx waiting for its ack return 1*/
  565. if(resize_ack == NULL)
  566. return 1;
  567. int ret = starpu_pthread_mutex_trylock(&hypervisor.sched_ctx_w[sender_sched_ctx].mutex);
  568. if(ret != EBUSY)
  569. {
  570. int *moved_workers = resize_ack->moved_workers;
  571. int nmoved_workers = resize_ack->nmoved_workers;
  572. int *acked_workers = resize_ack->acked_workers;
  573. if(worker != -1)
  574. {
  575. for(i = 0; i < nmoved_workers; i++)
  576. {
  577. int moved_worker = moved_workers[i];
  578. if(moved_worker == worker && acked_workers[i] == 0)
  579. {
  580. acked_workers[i] = 1;
  581. }
  582. }
  583. }
  584. int nacked_workers = 0;
  585. for(i = 0; i < nmoved_workers; i++)
  586. {
  587. nacked_workers += (acked_workers[i] == 1);
  588. }
  589. unsigned resize_completed = (nacked_workers == nmoved_workers);
  590. int receiver_sched_ctx = sched_ctx;
  591. if(resize_completed)
  592. {
  593. /* if the permission to resize is not allowed by the user don't do it
  594. whatever the application says */
  595. if(!((hypervisor.resize[sender_sched_ctx] == 0 || hypervisor.resize[receiver_sched_ctx] == 0) && imposed_resize))
  596. {
  597. /* int j; */
  598. /* printf("remove after ack from ctx %d:", sender_sched_ctx); */
  599. /* for(j = 0; j < nmoved_workers; j++) */
  600. /* printf(" %d", moved_workers[j]); */
  601. /* printf("\n"); */
  602. starpu_sched_ctx_remove_workers(moved_workers, nmoved_workers, sender_sched_ctx);
  603. _reset_resize_sample_info(sender_sched_ctx, receiver_sched_ctx);
  604. hypervisor.resize[sender_sched_ctx] = 1;
  605. hypervisor.allow_remove[receiver_sched_ctx] = 1;
  606. /* if the user allowed resizing leave the decisions to the application */
  607. if(imposed_resize) imposed_resize = 0;
  608. resize_ack->receiver_sched_ctx = -1;
  609. resize_ack->nmoved_workers = 0;
  610. free(resize_ack->moved_workers);
  611. free(resize_ack->acked_workers);
  612. }
  613. starpu_pthread_mutex_unlock(&hypervisor.sched_ctx_w[sender_sched_ctx].mutex);
  614. return resize_completed;
  615. }
  616. starpu_pthread_mutex_unlock(&hypervisor.sched_ctx_w[sender_sched_ctx].mutex);
  617. }
  618. return 0;
  619. }
  620. /* Enqueue a resize request for 'sched_ctx', to be executed when the
  621. * 'task_tag' tasks of 'sched_ctx' complete. */
  622. void sc_hypervisor_resize(unsigned sched_ctx, int task_tag)
  623. {
  624. struct resize_request_entry *entry;
  625. entry = malloc(sizeof *entry);
  626. STARPU_ASSERT(entry != NULL);
  627. entry->sched_ctx = sched_ctx;
  628. entry->task_tag = task_tag;
  629. starpu_pthread_mutex_lock(&hypervisor.resize_mut[sched_ctx]);
  630. HASH_ADD_INT(hypervisor.resize_requests[sched_ctx], task_tag, entry);
  631. starpu_pthread_mutex_unlock(&hypervisor.resize_mut[sched_ctx]);
  632. }
  633. /* notifies the hypervisor that the worker is no longer idle and a new task was pushed on its queue */
  634. static void notify_idle_end(unsigned sched_ctx, int worker)
  635. {
  636. if(hypervisor.resize[sched_ctx])
  637. hypervisor.sched_ctx_w[sched_ctx].current_idle_time[worker] = 0.0;
  638. struct sc_hypervisor_wrapper *sc_w = &hypervisor.sched_ctx_w[sched_ctx];
  639. if(sc_w->idle_start_time[worker] != 0.0)
  640. {
  641. double end_time = starpu_timing_now();
  642. sc_w->idle_time[worker] += (end_time - sc_w->idle_start_time[worker]) / 1000000.0; /* in seconds */
  643. sc_w->idle_start_time[worker] = 0.0;
  644. }
  645. if(hypervisor.policy.handle_idle_end)
  646. hypervisor.policy.handle_idle_end(sched_ctx, worker);
  647. }
  648. /* notifies the hypervisor that the worker spent another cycle in idle time */
  649. static void notify_idle_cycle(unsigned sched_ctx, int worker, double idle_time)
  650. {
  651. if(hypervisor.resize[sched_ctx])
  652. {
  653. struct sc_hypervisor_wrapper *sc_w = &hypervisor.sched_ctx_w[sched_ctx];
  654. sc_w->current_idle_time[worker] += idle_time;
  655. if(sc_w->idle_start_time[worker] == 0.0)
  656. sc_w->idle_start_time[worker] = starpu_timing_now();
  657. if(hypervisor.policy.handle_idle_cycle)
  658. {
  659. hypervisor.policy.handle_idle_cycle(sched_ctx, worker);
  660. }
  661. }
  662. return;
  663. }
  664. /* notifies the hypervisor that a new task was pushed on the queue of the worker */
  665. static void notify_pushed_task(unsigned sched_ctx, int worker)
  666. {
  667. hypervisor.sched_ctx_w[sched_ctx].pushed_tasks[worker]++;
  668. if(hypervisor.sched_ctx_w[sched_ctx].total_flops != 0.0 && hypervisor.sched_ctx_w[sched_ctx].start_time == 0.0)
  669. hypervisor.sched_ctx_w[sched_ctx].start_time = starpu_timing_now();
  670. if(hypervisor.sched_ctx_w[sched_ctx].total_flops != 0.0 && hypervisor.sched_ctx_w[sched_ctx].real_start_time == 0.0)
  671. hypervisor.sched_ctx_w[sched_ctx].real_start_time = starpu_timing_now();
  672. int ntasks = get_ntasks(hypervisor.sched_ctx_w[sched_ctx].pushed_tasks);
  673. if((hypervisor.min_tasks == 0 || (!(hypervisor.resize[sched_ctx] == 0 && imposed_resize) && ntasks == hypervisor.min_tasks)) && hypervisor.check_min_tasks[sched_ctx])
  674. {
  675. hypervisor.resize[sched_ctx] = 1;
  676. if(imposed_resize) imposed_resize = 0;
  677. hypervisor.check_min_tasks[sched_ctx] = 0;
  678. }
  679. if(hypervisor.policy.handle_pushed_task)
  680. hypervisor.policy.handle_pushed_task(sched_ctx, worker);
  681. }
  682. /* notifies the hypervisor that a task was poped from the queue of the worker */
  683. static void notify_poped_task(unsigned sched_ctx, int worker, struct starpu_task *task, size_t data_size, uint32_t footprint)
  684. {
  685. hypervisor.sched_ctx_w[sched_ctx].poped_tasks[worker]++;
  686. hypervisor.sched_ctx_w[sched_ctx].elapsed_flops[worker] += task->flops;
  687. hypervisor.sched_ctx_w[sched_ctx].elapsed_data[worker] += data_size ;
  688. hypervisor.sched_ctx_w[sched_ctx].elapsed_tasks[worker]++ ;
  689. hypervisor.sched_ctx_w[sched_ctx].total_elapsed_flops[worker] += task->flops;
  690. hypervisor.sched_ctx_w[sched_ctx].remaining_flops -= task->flops; //sc_hypervisor_get_elapsed_flops_per_sched_ctx(&hypervisor.sched_ctx_w[sched_ctx]);
  691. if(hypervisor.resize[sched_ctx])
  692. {
  693. if(hypervisor.policy.handle_poped_task)
  694. hypervisor.policy.handle_poped_task(sched_ctx, worker, task, footprint);
  695. }
  696. _ack_resize_completed(sched_ctx, worker);
  697. if(hypervisor.sched_ctx_w[sched_ctx].poped_tasks[worker] % 200 == 0)
  698. _print_current_time();
  699. }
  700. /* notifies the hypervisor that a tagged task has just been executed */
  701. static void notify_post_exec_hook(unsigned sched_ctx, int task_tag)
  702. {
  703. STARPU_ASSERT(task_tag > 0);
  704. unsigned conf_sched_ctx;
  705. unsigned i;
  706. starpu_pthread_mutex_lock(&act_hypervisor_mutex);
  707. unsigned ns = hypervisor.nsched_ctxs;
  708. starpu_pthread_mutex_unlock(&act_hypervisor_mutex);
  709. for(i = 0; i < ns; i++)
  710. {
  711. struct configuration_entry *entry;
  712. conf_sched_ctx = hypervisor.sched_ctxs[i];
  713. starpu_pthread_mutex_lock(&hypervisor.conf_mut[conf_sched_ctx]);
  714. HASH_FIND_INT(hypervisor.configurations[conf_sched_ctx], &task_tag, entry);
  715. if (entry != NULL)
  716. {
  717. struct sc_hypervisor_policy_config *config = entry->configuration;
  718. sc_hypervisor_set_config(conf_sched_ctx, config);
  719. HASH_DEL(hypervisor.configurations[conf_sched_ctx], entry);
  720. free(config);
  721. }
  722. starpu_pthread_mutex_unlock(&hypervisor.conf_mut[conf_sched_ctx]);
  723. }
  724. if(hypervisor.resize[sched_ctx])
  725. {
  726. starpu_pthread_mutex_lock(&hypervisor.resize_mut[sched_ctx]);
  727. if(hypervisor.policy.handle_post_exec_hook)
  728. {
  729. /* Check whether 'task_tag' is in the 'resize_requests' set. */
  730. struct resize_request_entry *entry;
  731. HASH_FIND_INT(hypervisor.resize_requests[sched_ctx], &task_tag, entry);
  732. if (entry != NULL)
  733. {
  734. hypervisor.policy.handle_post_exec_hook(sched_ctx, task_tag);
  735. HASH_DEL(hypervisor.resize_requests[sched_ctx], entry);
  736. free(entry);
  737. }
  738. }
  739. starpu_pthread_mutex_unlock(&hypervisor.resize_mut[sched_ctx]);
  740. }
  741. return;
  742. }
  743. static void notify_submitted_job(struct starpu_task *task, uint32_t footprint)
  744. {
  745. starpu_pthread_mutex_lock(&act_hypervisor_mutex);
  746. hypervisor.sched_ctx_w[task->sched_ctx].submitted_flops += task->flops;
  747. starpu_pthread_mutex_unlock(&act_hypervisor_mutex);
  748. if(hypervisor.policy.handle_submitted_job && !type_of_tasks_known)
  749. hypervisor.policy.handle_submitted_job(task->cl, task->sched_ctx, footprint);
  750. }
  751. void sc_hypervisor_set_type_of_task(struct starpu_codelet *cl, unsigned sched_ctx, uint32_t footprint)
  752. {
  753. type_of_tasks_known = 1;
  754. if(hypervisor.policy.handle_submitted_job)
  755. hypervisor.policy.handle_submitted_job(cl, sched_ctx, footprint);
  756. }
  757. static void notify_delete_context(unsigned sched_ctx)
  758. {
  759. _print_current_time();
  760. sc_hypervisor_unregister_ctx(sched_ctx);
  761. }
  762. void sc_hypervisor_size_ctxs(int *sched_ctxs, int nsched_ctxs, int *workers, int nworkers)
  763. {
  764. starpu_pthread_mutex_lock(&act_hypervisor_mutex);
  765. unsigned curr_nsched_ctxs = sched_ctxs == NULL ? hypervisor.nsched_ctxs : nsched_ctxs;
  766. int *curr_sched_ctxs = sched_ctxs == NULL ? hypervisor.sched_ctxs : sched_ctxs;
  767. starpu_pthread_mutex_unlock(&act_hypervisor_mutex);
  768. unsigned s;
  769. for(s = 0; s < curr_nsched_ctxs; s++)
  770. hypervisor.resize[curr_sched_ctxs[s]] = 1;
  771. if(hypervisor.policy.size_ctxs)
  772. hypervisor.policy.size_ctxs(curr_sched_ctxs, curr_nsched_ctxs, workers, nworkers);
  773. }
  774. struct sc_hypervisor_wrapper* sc_hypervisor_get_wrapper(unsigned sched_ctx)
  775. {
  776. return &hypervisor.sched_ctx_w[sched_ctx];
  777. }
  778. int* sc_hypervisor_get_sched_ctxs()
  779. {
  780. return hypervisor.sched_ctxs;
  781. }
  782. int sc_hypervisor_get_nsched_ctxs()
  783. {
  784. int ns;
  785. ns = hypervisor.nsched_ctxs;
  786. return ns;
  787. }
  788. void sc_hypervisor_save_size_req(int *sched_ctxs, int nsched_ctxs, int *workers, int nworkers)
  789. {
  790. hypervisor.sr = (struct size_request*)malloc(sizeof(struct size_request));
  791. hypervisor.sr->sched_ctxs = sched_ctxs;
  792. hypervisor.sr->nsched_ctxs = nsched_ctxs;
  793. hypervisor.sr->workers = workers;
  794. hypervisor.sr->nworkers = nworkers;
  795. }
  796. unsigned sc_hypervisor_get_size_req(int **sched_ctxs, int* nsched_ctxs, int **workers, int *nworkers)
  797. {
  798. if(hypervisor.sr != NULL)
  799. {
  800. *sched_ctxs = hypervisor.sr->sched_ctxs;
  801. *nsched_ctxs = hypervisor.sr->nsched_ctxs;
  802. *workers = hypervisor.sr->workers;
  803. *nworkers = hypervisor.sr->nworkers;
  804. return 1;
  805. }
  806. return 0;
  807. }
  808. void sc_hypervisor_free_size_req(void)
  809. {
  810. if(hypervisor.sr != NULL)
  811. {
  812. free(hypervisor.sr);
  813. hypervisor.sr = NULL;
  814. }
  815. }
  816. double _get_optimal_v(unsigned sched_ctx)
  817. {
  818. return hypervisor.optimal_v[sched_ctx];
  819. }
  820. void _set_optimal_v(unsigned sched_ctx, double optimal_v)
  821. {
  822. hypervisor.optimal_v[sched_ctx] = optimal_v;
  823. }