starpurm.c 51 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761277127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418141914201421142214231424142514261427142814291430143114321433143414351436143714381439144014411442144314441445144614471448144914501451145214531454145514561457145814591460146114621463146414651466146714681469147014711472147314741475147614771478147914801481148214831484148514861487148814891490149114921493149414951496149714981499150015011502150315041505150615071508150915101511151215131514151515161517151815191520152115221523152415251526152715281529153015311532153315341535153615371538153915401541154215431544154515461547154815491550155115521553155415551556155715581559156015611562156315641565156615671568156915701571157215731574157515761577157815791580158115821583158415851586158715881589159015911592159315941595159615971598159916001601160216031604160516061607160816091610161116121613161416151616161716181619162016211622162316241625162616271628162916301631163216331634163516361637163816391640164116421643164416451646164716481649165016511652165316541655165616571658165916601661166216631664166516661667166816691670167116721673167416751676167716781679168016811682168316841685168616871688168916901691169216931694169516961697169816991700170117021703170417051706170717081709171017111712171317141715171617171718171917201721172217231724172517261727172817291730
  1. /* StarPU --- Runtime system for heterogeneous multicore architectures.
  2. *
  3. * Copyright (C) 2017-2020 Université de Bordeaux, CNRS (LaBRI UMR 5800), Inria
  4. *
  5. * StarPU is free software; you can redistribute it and/or modify
  6. * it under the terms of the GNU Lesser General Public License as published by
  7. * the Free Software Foundation; either version 2.1 of the License, or (at
  8. * your option) any later version.
  9. *
  10. * StarPU is distributed in the hope that it will be useful, but
  11. * WITHOUT ANY WARRANTY; without even the implied warranty of
  12. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
  13. *
  14. * See the GNU Lesser General Public License in COPYING.LGPL for more details.
  15. */
  16. #include <stdlib.h>
  17. #include <stdio.h>
  18. #include <string.h>
  19. #include <assert.h>
  20. #include <hwloc.h>
  21. #include <starpu.h>
  22. #include <starpurm.h>
  23. #include <common/config.h>
  24. #include <starpurm_private.h>
  25. /*
  26. * #define _DEBUG
  27. */
  28. struct s_starpurm_unit
  29. {
  30. /* Opaque unit id.
  31. *
  32. * For StarPU-RM, this id is used as an index to array starpurm->units[].
  33. */
  34. int id;
  35. /* Id of the unit type. */
  36. int type;
  37. /* Boolean indicating whether the device is currently selected for use by the runtime system. */
  38. int selected;
  39. /* StarPU id of the worker driving the device. */
  40. int workerid;
  41. /* Cpuset of the StarPU worker. */
  42. hwloc_cpuset_t worker_cpuset;
  43. /* Condition variable to notify that a unit is now available to driver a worker waking up. */
  44. pthread_cond_t unit_available_cond;
  45. };
  46. static struct s_starpurm *_starpurm = NULL;
  47. #if 0
  48. static char *bitmap_to_str(hwloc_bitmap_t bitmap)
  49. {
  50. int strl = hwloc_bitmap_snprintf(NULL, 0, bitmap);
  51. char *str = malloc(strl+1);
  52. hwloc_bitmap_snprintf(str, strl+1, bitmap);
  53. return str;
  54. }
  55. #endif
  56. #ifdef STARPURM_STARPU_HAVE_WORKER_CALLBACKS
  57. enum e_starpurm_event
  58. {
  59. starpurm_event_code_min = 0,
  60. starpurm_event_exit = 0,
  61. starpurm_event_worker_going_to_sleep = 1,
  62. starpurm_event_worker_waking_up = 2,
  63. starpurm_event_unit_available = 3,
  64. starpurm_event_code_max = 3
  65. };
  66. const char *_starpurm_event_to_str(int event_code)
  67. {
  68. const char *s = NULL;
  69. switch (event_code)
  70. {
  71. case starpurm_event_exit:
  72. s = "starpurm_event_exit";
  73. break;
  74. case starpurm_event_worker_going_to_sleep:
  75. s = "starpurm_event_worker_going_to_sleep";
  76. break;
  77. case starpurm_event_worker_waking_up:
  78. s = "starpurm_event_worker_waking_up";
  79. break;
  80. case starpurm_event_unit_available:
  81. s = "starpurm_event_unit_available";
  82. break;
  83. default:
  84. s = "<unknown starpurm event>";
  85. break;
  86. }
  87. return s;
  88. }
  89. struct s_starpurm_event
  90. {
  91. struct s_starpurm_event *next;
  92. struct s_starpurm_event *prev;
  93. enum e_starpurm_event code;
  94. unsigned int workerid;
  95. };
  96. static void _enqueue_event(struct s_starpurm_event *event)
  97. {
  98. assert(_starpurm != NULL);
  99. assert(_starpurm->state != state_uninitialized);
  100. struct s_starpurm *rm = _starpurm;
  101. assert(event->next == NULL);
  102. assert(event->prev == NULL);
  103. assert(event->code >= starpurm_event_code_min && event->code <= starpurm_event_code_max);
  104. pthread_mutex_lock(&rm->event_list_mutex);
  105. if (rm->event_processing_ended)
  106. {
  107. pthread_mutex_unlock(&rm->event_list_mutex);
  108. return;
  109. }
  110. assert((rm->event_list_head == NULL && rm->event_list_tail == NULL)
  111. || (rm->event_list_head != NULL && rm->event_list_tail != NULL));
  112. if (rm->event_list_head == NULL)
  113. {
  114. rm->event_list_tail = event;
  115. }
  116. else
  117. {
  118. rm->event_list_head->prev = event;
  119. }
  120. event->next = rm->event_list_head;
  121. rm->event_list_head = event;
  122. if (event->code == starpurm_event_exit)
  123. {
  124. rm->event_processing_ended = 1;
  125. int i;
  126. for (i=0; i<rm->nunits; i++)
  127. {
  128. pthread_cond_broadcast(&rm->units[i].unit_available_cond);
  129. }
  130. }
  131. #ifdef STARPURM_VERBOSE
  132. if (event->code != starpurm_event_worker_waking_up)
  133. fprintf(stderr, "%s: event->code=%d('%s'), workerid=%u\n", __func__, event->code, _starpurm_event_to_str(event->code), event->workerid);
  134. #endif
  135. pthread_cond_broadcast(&rm->event_list_cond);
  136. #ifdef STARPURM_HAVE_DLB
  137. if (event->code == starpurm_event_worker_waking_up)
  138. {
  139. int unit_id = rm->worker_unit_ids[event->workerid];
  140. /* if DLB is in use, wait for the unit to become available from the point of view of DLB, before using it */
  141. #ifdef STARPURM_VERBOSE
  142. fprintf(stderr, "%s: event->code=%d('%s'), workerid=%u - waiting\n", __func__, event->code, _starpurm_event_to_str(event->code), event->workerid);
  143. #endif
  144. pthread_cond_wait(&rm->units[unit_id].unit_available_cond, &rm->event_list_mutex);
  145. #ifdef STARPURM_VERBOSE
  146. fprintf(stderr, "%s: event->code=%d('%s'), workerid=%u - wakeup\n", __func__, event->code, _starpurm_event_to_str(event->code), event->workerid);
  147. #endif
  148. }
  149. #endif
  150. pthread_mutex_unlock(&rm->event_list_mutex);
  151. }
  152. static struct s_starpurm_event *_dequeue_event_no_lock(void)
  153. {
  154. struct s_starpurm *rm = _starpurm;
  155. struct s_starpurm_event *event = NULL;
  156. if (rm->event_list_tail != NULL)
  157. {
  158. event = rm->event_list_tail;
  159. if (event->prev == NULL)
  160. {
  161. rm->event_list_head = NULL;
  162. rm->event_list_tail = NULL;
  163. }
  164. else
  165. {
  166. event->prev->next = NULL;
  167. rm->event_list_tail = event->prev;
  168. }
  169. event->prev = NULL;
  170. event->next = NULL;
  171. }
  172. return event;
  173. }
  174. static struct s_starpurm_event *_wait_event_no_lock(void)
  175. {
  176. struct s_starpurm *rm = _starpurm;
  177. while (rm->event_list_head == NULL)
  178. {
  179. pthread_cond_wait(&rm->event_list_cond, &rm->event_list_mutex);
  180. }
  181. struct s_starpurm_event *event = _dequeue_event_no_lock();
  182. return event;
  183. }
  184. /* unused */
  185. static struct s_starpurm_event *_dequeue_event(void)
  186. {
  187. assert(_starpurm != NULL);
  188. assert(_starpurm->state != state_uninitialized);
  189. struct s_starpurm *rm = _starpurm;
  190. pthread_mutex_lock(&rm->event_list_mutex);
  191. struct s_starpurm_event *event = _dequeue_event_no_lock();
  192. pthread_mutex_unlock(&rm->event_list_mutex);
  193. return event;
  194. }
  195. /* unused */
  196. static struct s_starpurm_event *_wait_event(void)
  197. {
  198. assert(_starpurm != NULL);
  199. assert(_starpurm->state != state_uninitialized);
  200. struct s_starpurm *rm = _starpurm;
  201. pthread_mutex_lock(&rm->event_list_mutex);
  202. struct s_starpurm_event *event = _wait_event_no_lock();
  203. pthread_mutex_unlock(&rm->event_list_mutex);
  204. return event;
  205. }
  206. static void _enqueue_exit_event(void)
  207. {
  208. struct s_starpurm_event *event = calloc(1, sizeof(*event));
  209. event->code = starpurm_event_exit;
  210. event->workerid = 0;
  211. _enqueue_event(event);
  212. }
  213. static void callback_worker_going_to_sleep(unsigned workerid)
  214. {
  215. struct s_starpurm_event *event = calloc(1, sizeof(*event));
  216. event->code = starpurm_event_worker_going_to_sleep;
  217. event->workerid = workerid;
  218. _enqueue_event(event);
  219. }
  220. static void callback_worker_waking_up(unsigned workerid)
  221. {
  222. struct s_starpurm_event *event = calloc(1, sizeof(*event));
  223. event->code = starpurm_event_worker_waking_up;
  224. event->workerid = workerid;
  225. _enqueue_event(event);
  226. }
  227. void starpurm_enqueue_event_cpu_unit_available(int unit_id)
  228. {
  229. assert(_starpurm != NULL);
  230. assert(_starpurm->state != state_uninitialized);
  231. struct s_starpurm *rm = _starpurm;
  232. assert(unit_id >= 0);
  233. /*
  234. * unit_id may exceed the number of CPU units actually used by StarPU,
  235. * if some CPU cores are not used.
  236. *
  237. * //assert(unit_id < rm->nunits_by_type[starpurm_unit_cpu]);
  238. */
  239. unsigned workerid = rm->units[unit_id].workerid; struct
  240. s_starpurm_event *event = calloc(1, sizeof(*event));
  241. event->code = starpurm_event_unit_available; event->workerid =
  242. workerid; _enqueue_event(event); }
  243. static void *event_thread_func(void *_arg)
  244. {
  245. (void)_arg;
  246. assert(_starpurm != NULL);
  247. assert(_starpurm->state != state_uninitialized);
  248. struct s_starpurm *rm = _starpurm;
  249. int need_refresh = 0;
  250. pthread_mutex_lock(&rm->event_list_mutex);
  251. while (rm->event_processing_enabled == 0)
  252. {
  253. pthread_cond_wait(&rm->event_processing_cond, &rm->event_list_mutex);
  254. }
  255. pthread_mutex_unlock(&rm->event_list_mutex);
  256. hwloc_cpuset_t owned_cpuset = hwloc_bitmap_dup(rm->global_cpuset);
  257. hwloc_cpuset_t to_reclaim_cpuset = hwloc_bitmap_alloc();
  258. hwloc_cpuset_t to_lend_cpuset = hwloc_bitmap_alloc();
  259. while (1)
  260. {
  261. struct s_starpurm_event *event = _dequeue_event();
  262. #ifdef STARPURM_HAVE_DLB
  263. if ((event == NULL || event->code == starpurm_event_exit) || need_refresh)
  264. #else
  265. if ((event == NULL || event->code == starpurm_event_exit) && need_refresh)
  266. #endif
  267. {
  268. int did_lend_cpuset = 1;
  269. #ifdef STARPURM_HAVE_DLB
  270. /* notify DLB about changes */
  271. if (!hwloc_bitmap_iszero(to_reclaim_cpuset))
  272. {
  273. starpurm_dlb_notify_starpu_worker_mask_waking_up(to_reclaim_cpuset);
  274. }
  275. did_lend_cpuset = 0;
  276. if (!hwloc_bitmap_iszero(to_lend_cpuset))
  277. {
  278. did_lend_cpuset = starpurm_dlb_notify_starpu_worker_mask_going_to_sleep(to_lend_cpuset);
  279. }
  280. #endif
  281. /* if DLB is not initialized, ignore lend operations */
  282. if (did_lend_cpuset)
  283. {
  284. hwloc_bitmap_andnot(owned_cpuset, owned_cpuset, to_lend_cpuset);
  285. }
  286. hwloc_bitmap_or(owned_cpuset, owned_cpuset, to_reclaim_cpuset);
  287. #if 0
  288. {
  289. char *to_lend_str = bitmap_to_str(to_lend_cpuset);
  290. char *to_reclaim_str = bitmap_to_str(to_reclaim_cpuset);
  291. free(to_lend_str);
  292. free(to_reclaim_str);
  293. }
  294. #endif
  295. need_refresh = 0;
  296. hwloc_bitmap_zero(to_lend_cpuset);
  297. hwloc_bitmap_zero(to_reclaim_cpuset);
  298. }
  299. if (event == NULL)
  300. {
  301. event = _wait_event();
  302. }
  303. if (event->code == starpurm_event_exit)
  304. {
  305. free(event);
  306. break;
  307. }
  308. /* TODO: accumulate state change */
  309. switch (event->code)
  310. {
  311. case starpurm_event_worker_going_to_sleep:
  312. {
  313. if (event->workerid < rm->nunits)
  314. {
  315. int unit_id = rm->worker_unit_ids[event->workerid];
  316. hwloc_bitmap_or(to_lend_cpuset, to_lend_cpuset, rm->units[unit_id].worker_cpuset);
  317. hwloc_bitmap_andnot(to_reclaim_cpuset, to_reclaim_cpuset, rm->units[unit_id].worker_cpuset);
  318. }
  319. }
  320. break;
  321. case starpurm_event_worker_waking_up:
  322. {
  323. if (event->workerid < rm->nunits)
  324. {
  325. int unit_id = rm->worker_unit_ids[event->workerid];
  326. hwloc_bitmap_andnot(to_lend_cpuset, to_lend_cpuset, rm->units[unit_id].worker_cpuset);
  327. #ifdef STARPURM_HAVE_DLB
  328. if (rm->units[unit_id].type == starpurm_unit_cpu && !hwloc_bitmap_intersects(rm->units[unit_id].worker_cpuset, owned_cpuset))
  329. {
  330. /* Only reclaim the unit from DLB if StarPU does not own it already. */
  331. hwloc_bitmap_or(to_reclaim_cpuset, to_reclaim_cpuset, rm->units[unit_id].worker_cpuset);
  332. }
  333. else
  334. {
  335. pthread_cond_broadcast(&rm->units[unit_id].unit_available_cond);
  336. }
  337. #else
  338. hwloc_bitmap_or(to_reclaim_cpuset, to_reclaim_cpuset, rm->units[unit_id].worker_cpuset);
  339. #endif
  340. }
  341. }
  342. break;
  343. #ifdef STARPURM_HAVE_DLB
  344. case starpurm_event_unit_available:
  345. {
  346. if (event->workerid < rm->nunits)
  347. {
  348. /* a reclaimed unit is now available from DLB, unlock the corresponding worker waking up */
  349. int unit_id = rm->worker_unit_ids[event->workerid];
  350. pthread_cond_broadcast(&rm->units[unit_id].unit_available_cond);
  351. }
  352. }
  353. break;
  354. #endif
  355. default:
  356. /* unknown event code */
  357. assert(0);
  358. break;
  359. }
  360. free(event);
  361. need_refresh = 1;
  362. }
  363. pthread_mutex_lock(&rm->event_list_mutex);
  364. /* exit event should be last */
  365. assert(rm->event_list_head == NULL);
  366. assert(rm->event_list_tail == NULL);
  367. hwloc_bitmap_free(owned_cpuset);
  368. hwloc_bitmap_free(to_reclaim_cpuset);
  369. hwloc_bitmap_free(to_lend_cpuset);
  370. pthread_mutex_unlock(&rm->event_list_mutex);
  371. return NULL;
  372. }
  373. #endif /* STARPURM_STARPU_HAVE_WORKER_CALLBACKS */
  374. /* Resource enforcement */
  375. static starpurm_drs_ret_t _starpurm_update_cpuset(hwloc_cpuset_t cpuset)
  376. {
  377. assert(_starpurm != NULL);
  378. assert(_starpurm->state != state_uninitialized);
  379. struct s_starpurm *rm = _starpurm;
  380. if (hwloc_bitmap_isequal(cpuset, rm->selected_cpuset))
  381. {
  382. return starpurm_DRS_SUCCESS;
  383. }
  384. pthread_mutex_lock(&rm->temporary_ctxs_mutex);
  385. if (rm->starpu_in_pause)
  386. {
  387. starpu_resume();
  388. rm->starpu_in_pause = 0;
  389. }
  390. int workers_to_remove[_starpurm->nunits];
  391. unsigned nworkers_to_remove = 0;
  392. int workers_to_add[_starpurm->nunits];
  393. unsigned nworkers_to_add = 0;
  394. int i;
  395. hwloc_cpuset_t temp_cpuset = hwloc_bitmap_alloc();
  396. int new_selected_ncpus = 0;
  397. for (i=0; i<rm->nunits; i++)
  398. {
  399. struct s_starpurm_unit *unit = &rm->units[i];
  400. hwloc_bitmap_and(temp_cpuset, unit->worker_cpuset, cpuset);
  401. if (hwloc_bitmap_iszero(temp_cpuset))
  402. {
  403. workers_to_remove[nworkers_to_remove] = unit->workerid;
  404. unit->selected = 0;
  405. nworkers_to_remove++;
  406. }
  407. else
  408. {
  409. workers_to_add[nworkers_to_add] = unit->workerid;
  410. unit->selected = 1;
  411. nworkers_to_add++;
  412. if (unit->type == starpurm_unit_cpu)
  413. {
  414. new_selected_ncpus++;
  415. }
  416. }
  417. }
  418. hwloc_bitmap_free(temp_cpuset);
  419. rm->selected_nworkers = nworkers_to_add;
  420. rm->selected_ncpus = new_selected_ncpus;
  421. hwloc_bitmap_free(rm->selected_cpuset);
  422. rm->selected_cpuset = hwloc_bitmap_dup(cpuset);
  423. if (nworkers_to_add > 0)
  424. {
  425. #if defined(STARPURM_HAVE_DLB) && !defined(STARPURM_STARPU_HAVE_WORKER_CALLBACKS)
  426. {
  427. /* if StarPU worker callbacks are not enabled, we still
  428. * notify DLB about resource usage changes, but we do
  429. * not wait for the formal DLB go to use the units */
  430. hwloc_cpuset_t to_reclaim_cpuset = hwloc_bitmap_alloc();
  431. for (i=0; i<nworkers_to_add; i++)
  432. {
  433. int unit_id = rm->worker_unit_ids[workers_to_add[i]];
  434. hwloc_bitmap_or(to_reclaim_cpuset, to_reclaim_cpuset, rm->units[unit_id].worker_cpuset);
  435. }
  436. starpurm_dlb_notify_starpu_worker_mask_waking_up(to_reclaim_cpuset);
  437. hwloc_bitmap_free(to_reclaim_cpuset);
  438. }
  439. #endif
  440. starpu_sched_ctx_add_workers(workers_to_add, nworkers_to_add, rm->sched_ctx_id);
  441. }
  442. if (nworkers_to_remove > 0)
  443. {
  444. starpu_sched_ctx_remove_workers(workers_to_remove, nworkers_to_remove, rm->sched_ctx_id);
  445. #if defined(STARPURM_HAVE_DLB) && !defined(STARPURM_STARPU_HAVE_WORKER_CALLBACKS)
  446. {
  447. /* if StarPU worker callbacks are not enabled, we still
  448. * notify DLB about resource usage changes, but we do
  449. * not wait for the workers to become idle */
  450. hwloc_cpuset_t to_lend_cpuset = hwloc_bitmap_alloc();
  451. for (i=0; i<nworkers_to_remove; i++)
  452. {
  453. int unit_id = rm->worker_unit_ids[workers_to_remove[i]];
  454. hwloc_bitmap_or(to_lend_cpuset, to_lend_cpuset, rm->units[unit_id].worker_cpuset);
  455. }
  456. starpurm_dlb_notify_starpu_worker_mask_going_to_sleep(to_lend_cpuset);
  457. hwloc_bitmap_free(to_lend_cpuset);
  458. }
  459. #endif
  460. }
  461. #ifdef _DEBUG
  462. starpu_sched_ctx_display_workers(rm->sched_ctx_id, stderr);
  463. #endif /* DEBUG */
  464. if (rm->selected_nworkers == 0 && rm->avail_temporary_ctxs == rm->max_temporary_ctxs)
  465. {
  466. rm->starpu_in_pause = 1;
  467. starpu_pause();
  468. }
  469. pthread_mutex_unlock(&rm->temporary_ctxs_mutex);
  470. return starpurm_DRS_SUCCESS;
  471. }
  472. static unsigned _starpurm_temporary_context_alloc(hwloc_cpuset_t cpuset)
  473. {
  474. assert(_starpurm != NULL);
  475. assert(_starpurm->state != state_uninitialized);
  476. assert(_starpurm->max_temporary_ctxs > 0);
  477. struct s_starpurm *rm = _starpurm;
  478. pthread_mutex_lock(&rm->temporary_ctxs_mutex);
  479. while(rm->avail_temporary_ctxs == 0)
  480. {
  481. pthread_cond_wait(&rm->temporary_ctxs_cond, &rm->temporary_ctxs_mutex);
  482. }
  483. assert(rm->avail_temporary_ctxs > 0);
  484. rm->avail_temporary_ctxs--;
  485. if (rm->starpu_in_pause)
  486. {
  487. starpu_resume();
  488. rm->starpu_in_pause = 0;
  489. }
  490. pthread_mutex_unlock(&rm->temporary_ctxs_mutex);
  491. unsigned sched_ctx_id = starpu_sched_ctx_create(NULL, -1, "starpurm_temp", STARPU_SCHED_CTX_POLICY_NAME, "eager", 0);
  492. assert(sched_ctx_id != STARPU_NMAX_SCHED_CTXS);
  493. int workers_to_remove[_starpurm->nunits];
  494. unsigned nworkers_to_remove = 0;
  495. int workers_to_add[_starpurm->nunits];
  496. unsigned nworkers_to_add = 0;
  497. int i;
  498. hwloc_cpuset_t temp_cpuset = hwloc_bitmap_alloc();
  499. for (i=0; i<rm->nunits; i++)
  500. {
  501. struct s_starpurm_unit *unit = &rm->units[i];
  502. hwloc_bitmap_and(temp_cpuset, unit->worker_cpuset, cpuset);
  503. if (hwloc_bitmap_iszero(temp_cpuset))
  504. {
  505. workers_to_remove[nworkers_to_remove] = unit->workerid;
  506. nworkers_to_remove++;
  507. }
  508. else
  509. {
  510. workers_to_add[nworkers_to_add] = unit->workerid;
  511. nworkers_to_add++;
  512. }
  513. }
  514. hwloc_bitmap_free(temp_cpuset);
  515. if (nworkers_to_add > 0)
  516. starpu_sched_ctx_add_workers(workers_to_add, nworkers_to_add, sched_ctx_id);
  517. if (nworkers_to_remove > 0)
  518. starpu_sched_ctx_remove_workers(workers_to_remove, nworkers_to_remove, sched_ctx_id);
  519. #ifdef _DEBUG
  520. starpu_sched_ctx_display_workers(sched_ctx_id, stderr);
  521. #endif /* DEBUG */
  522. return sched_ctx_id;
  523. }
  524. static void _starpurm_temporary_context_free(unsigned ctx)
  525. {
  526. assert(_starpurm != NULL);
  527. assert(_starpurm->state != state_uninitialized);
  528. assert(_starpurm->max_temporary_ctxs > 0);
  529. struct s_starpurm *rm = _starpurm;
  530. starpu_sched_ctx_delete(ctx);
  531. pthread_mutex_lock(&rm->temporary_ctxs_mutex);
  532. rm->avail_temporary_ctxs++;
  533. pthread_cond_signal(&rm->temporary_ctxs_cond);
  534. if (rm->selected_nworkers == 0 && rm->avail_temporary_ctxs == rm->max_temporary_ctxs)
  535. {
  536. rm->starpu_in_pause = 1;
  537. starpu_pause();
  538. }
  539. pthread_mutex_unlock(&rm->temporary_ctxs_mutex);
  540. }
  541. static starpurm_drs_ret_t _starpurm_set_ncpus(unsigned int ncpus)
  542. {
  543. assert(_starpurm != NULL);
  544. assert(_starpurm->state != state_uninitialized);
  545. struct s_starpurm *rm = _starpurm;
  546. int i;
  547. if (ncpus > rm->nunits_by_type[starpurm_unit_cpu])
  548. {
  549. ncpus = rm->nunits_by_type[starpurm_unit_cpu];
  550. }
  551. if (ncpus == rm->selected_ncpus)
  552. {
  553. return starpurm_DRS_SUCCESS;
  554. }
  555. pthread_mutex_lock(&rm->temporary_ctxs_mutex);
  556. if (rm->starpu_in_pause)
  557. {
  558. starpu_resume();
  559. rm->starpu_in_pause = 0;
  560. }
  561. int workers_to_remove[_starpurm->nunits];
  562. unsigned nworkers_to_remove = 0;
  563. int workers_to_add[_starpurm->nunits];
  564. unsigned nworkers_to_add = 0;
  565. for (i=0; i<rm->nunits; i++)
  566. {
  567. struct s_starpurm_unit *unit = &rm->units[i];
  568. if (unit->type != starpurm_unit_cpu)
  569. continue;
  570. if (nworkers_to_add < ncpus)
  571. {
  572. workers_to_add[nworkers_to_add] = unit->workerid;
  573. unit->selected = 1;
  574. nworkers_to_add++;
  575. hwloc_bitmap_or(rm->selected_cpuset, rm->selected_cpuset, unit->worker_cpuset);
  576. }
  577. else
  578. {
  579. workers_to_remove[nworkers_to_remove] = unit->workerid;
  580. unit->selected = 0;
  581. hwloc_bitmap_andnot(rm->selected_cpuset, rm->selected_cpuset, unit->worker_cpuset);
  582. nworkers_to_remove++;
  583. }
  584. }
  585. rm->selected_nworkers = nworkers_to_add;
  586. rm->selected_ncpus = nworkers_to_add;
  587. if (nworkers_to_add > 0)
  588. starpu_sched_ctx_add_workers(workers_to_add, nworkers_to_add, rm->sched_ctx_id);
  589. if (nworkers_to_remove > 0)
  590. starpu_sched_ctx_remove_workers(workers_to_remove, nworkers_to_remove, rm->sched_ctx_id);
  591. #if def_DEBUG
  592. starpu_sched_ctx_display_workers(rm->sched_ctx_id, stderr);
  593. #endif /* DEBUG */
  594. if (rm->selected_nworkers == 0 && rm->avail_temporary_ctxs == rm->max_temporary_ctxs)
  595. {
  596. rm->starpu_in_pause = 1;
  597. starpu_pause();
  598. }
  599. pthread_mutex_unlock(&rm->temporary_ctxs_mutex);
  600. return starpurm_DRS_SUCCESS;
  601. }
  602. /* Initialize rm state for StarPU */
  603. void starpurm_initialize_with_cpuset(const hwloc_cpuset_t initially_owned_cpuset)
  604. {
  605. int ret;
  606. assert(_starpurm == NULL);
  607. struct s_starpurm *rm = calloc(1, sizeof(*rm));
  608. pthread_mutex_init(&rm->temporary_ctxs_mutex, NULL);
  609. pthread_cond_init(&rm->temporary_ctxs_cond, NULL);
  610. rm->state = state_init;
  611. /* init hwloc objects */
  612. hwloc_topology_init(&rm->topology);
  613. hwloc_topology_load(rm->topology);
  614. rm->global_cpuset = hwloc_bitmap_alloc();
  615. hwloc_bitmap_zero(rm->global_cpuset);
  616. rm->initially_owned_cpuset_mask = hwloc_bitmap_dup(initially_owned_cpuset);
  617. rm->all_cpu_workers_cpuset = hwloc_bitmap_alloc();
  618. hwloc_bitmap_zero(rm->all_cpu_workers_cpuset);
  619. rm->all_opencl_device_workers_cpuset = hwloc_bitmap_alloc();
  620. hwloc_bitmap_zero(rm->all_opencl_device_workers_cpuset);
  621. rm->all_cuda_device_workers_cpuset = hwloc_bitmap_alloc();
  622. hwloc_bitmap_zero(rm->all_cuda_device_workers_cpuset);
  623. rm->all_mic_device_workers_cpuset = hwloc_bitmap_alloc();
  624. hwloc_bitmap_zero(rm->all_mic_device_workers_cpuset);
  625. rm->all_device_workers_cpuset = hwloc_bitmap_alloc();
  626. hwloc_bitmap_zero(rm->all_device_workers_cpuset);
  627. /* init event list, before StarPU is initialized */
  628. pthread_mutex_init(&rm->event_list_mutex, NULL);
  629. pthread_cond_init(&rm->event_list_cond, NULL);
  630. pthread_cond_init(&rm->event_processing_cond, NULL);
  631. pthread_mutex_lock(&rm->event_list_mutex);
  632. rm->event_processing_enabled = 0;
  633. rm->event_processing_ended = 0;
  634. rm->event_list_head = NULL;
  635. rm->event_list_tail = NULL;
  636. pthread_mutex_unlock(&rm->event_list_mutex);
  637. /* set _starpurm here since StarPU's callbacks may reference it once starpu_init is called */
  638. _starpurm = rm;
  639. #ifdef STARPURM_STARPU_HAVE_WORKER_CALLBACKS
  640. /* launch event thread */
  641. ret = pthread_create(&rm->event_thread, NULL, event_thread_func, rm);
  642. assert(ret == 0);
  643. #endif
  644. /* init StarPU */
  645. struct starpu_conf starpu_conf;
  646. ret = starpu_conf_init(&starpu_conf);
  647. assert(ret == 0);
  648. #ifdef STARPURM_STARPU_HAVE_WORKER_CALLBACKS
  649. starpu_conf.callback_worker_going_to_sleep = callback_worker_going_to_sleep;
  650. starpu_conf.callback_worker_waking_up = callback_worker_waking_up;
  651. #endif
  652. ret = starpu_init(&starpu_conf);
  653. assert(ret == 0);
  654. /* init any worker objects */
  655. rm->nunits = starpu_worker_get_count_by_type(STARPU_ANY_WORKER);
  656. /* init device worker objects */
  657. rm->unit_ntypes = starpurm_unit_ntypes;
  658. rm->nunits_by_type = calloc(rm->unit_ntypes, sizeof(*rm->nunits_by_type));
  659. rm->unit_offsets_by_type = calloc(rm->unit_ntypes, sizeof(*rm->unit_offsets_by_type));
  660. const int cpu_nunits = starpu_worker_get_count_by_type(STARPU_CPU_WORKER);
  661. rm->nunits_by_type[starpurm_unit_cpu] = cpu_nunits;
  662. const int opencl_nunits = starpu_worker_get_count_by_type(STARPU_OPENCL_WORKER);
  663. rm->nunits_by_type[starpurm_unit_opencl] = opencl_nunits;
  664. const int cuda_nunits = starpu_worker_get_count_by_type(STARPU_CUDA_WORKER);
  665. rm->nunits_by_type[starpurm_unit_cuda] = cuda_nunits;
  666. const int mic_nunits = starpu_worker_get_count_by_type(STARPU_MIC_WORKER);
  667. rm->nunits_by_type[starpurm_unit_mic] = mic_nunits;
  668. const int nunits = cpu_nunits + opencl_nunits + cuda_nunits + mic_nunits;
  669. rm->nunits = nunits;
  670. rm->units = calloc(nunits, sizeof(*rm->units));
  671. int unitid = 0;
  672. int cpu_workerids[cpu_nunits];
  673. starpu_worker_get_ids_by_type(STARPU_CPU_WORKER, cpu_workerids, cpu_nunits);
  674. rm->unit_offsets_by_type[starpurm_unit_cpu] = unitid;
  675. unsigned int max_worker_id = 0;
  676. int i;
  677. for (i = 0; i < cpu_nunits; i++)
  678. {
  679. rm->units[unitid].id = unitid;
  680. rm->units[unitid].type = starpurm_unit_cpu;
  681. rm->units[unitid].selected = 1; /* enabled by default */
  682. rm->units[unitid].workerid = cpu_workerids[i];
  683. if (max_worker_id < rm->units[unitid].workerid)
  684. {
  685. max_worker_id = rm->units[unitid].workerid;
  686. }
  687. rm->units[unitid].worker_cpuset = starpu_worker_get_hwloc_cpuset(rm->units[unitid].workerid);
  688. pthread_cond_init(&rm->units[unitid].unit_available_cond, NULL);
  689. hwloc_bitmap_or(rm->global_cpuset, rm->global_cpuset, rm->units[unitid].worker_cpuset);
  690. hwloc_bitmap_or(rm->all_cpu_workers_cpuset, rm->all_cpu_workers_cpuset, rm->units[unitid].worker_cpuset);;
  691. #ifdef STARPURM_VERBOSE
  692. {
  693. char * s_unit = NULL;
  694. hwloc_bitmap_asprintf(&s_unit, rm->units[unitid].worker_cpuset);
  695. fprintf(stderr, "%s: 'cpu', unitid=%d, cpuset=0x%s, workerid=%d\n", __func__, unitid, s_unit, rm->units[unitid].workerid);
  696. free(s_unit);
  697. }
  698. #endif
  699. unitid++;
  700. }
  701. int opencl_workerids[opencl_nunits];
  702. starpu_worker_get_ids_by_type(STARPU_OPENCL_WORKER, opencl_workerids, opencl_nunits);
  703. rm->unit_offsets_by_type[starpurm_unit_opencl] = unitid;
  704. for (i = 0; i < opencl_nunits; i++)
  705. {
  706. rm->units[unitid].id = unitid;
  707. rm->units[unitid].type = starpurm_unit_opencl;
  708. rm->units[unitid].selected = 1; /* enabled by default */
  709. rm->units[unitid].workerid = opencl_workerids[i];
  710. if (max_worker_id < rm->units[unitid].workerid)
  711. {
  712. max_worker_id = rm->units[unitid].workerid;
  713. }
  714. rm->units[unitid].worker_cpuset = starpu_worker_get_hwloc_cpuset(rm->units[unitid].workerid);
  715. pthread_cond_init(&rm->units[unitid].unit_available_cond, NULL);
  716. hwloc_bitmap_or(rm->global_cpuset, rm->global_cpuset, rm->units[unitid].worker_cpuset);
  717. hwloc_bitmap_or(rm->all_opencl_device_workers_cpuset, rm->all_opencl_device_workers_cpuset, rm->units[unitid].worker_cpuset);
  718. hwloc_bitmap_or(rm->all_device_workers_cpuset, rm->all_device_workers_cpuset, rm->units[unitid].worker_cpuset);
  719. unitid++;
  720. }
  721. int cuda_workerids[opencl_nunits];
  722. starpu_worker_get_ids_by_type(STARPU_CUDA_WORKER, cuda_workerids, cuda_nunits);
  723. rm->unit_offsets_by_type[starpurm_unit_cuda] = unitid;
  724. for (i = 0; i < cuda_nunits; i++)
  725. {
  726. rm->units[unitid].id = unitid;
  727. rm->units[unitid].type = starpurm_unit_cuda;
  728. rm->units[unitid].selected = 1; /* enabled by default */
  729. rm->units[unitid].workerid = cuda_workerids[i];
  730. if (max_worker_id < rm->units[unitid].workerid)
  731. {
  732. max_worker_id = rm->units[unitid].workerid;
  733. }
  734. rm->units[unitid].worker_cpuset = starpu_worker_get_hwloc_cpuset(rm->units[unitid].workerid);
  735. pthread_cond_init(&rm->units[unitid].unit_available_cond, NULL);
  736. hwloc_bitmap_or(rm->global_cpuset, rm->global_cpuset, rm->units[unitid].worker_cpuset);
  737. hwloc_bitmap_or(rm->all_cuda_device_workers_cpuset, rm->all_cuda_device_workers_cpuset, rm->units[unitid].worker_cpuset);
  738. hwloc_bitmap_or(rm->all_device_workers_cpuset, rm->all_device_workers_cpuset, rm->units[unitid].worker_cpuset);
  739. unitid++;
  740. }
  741. int mic_workerids[mic_nunits];
  742. starpu_worker_get_ids_by_type(STARPU_MIC_WORKER, mic_workerids, mic_nunits);
  743. rm->unit_offsets_by_type[starpurm_unit_mic] = unitid;
  744. for (i = 0; i < mic_nunits; i++)
  745. {
  746. rm->units[unitid].id = unitid;
  747. rm->units[unitid].type = starpurm_unit_mic;
  748. rm->units[unitid].selected = 1; /* enabled by default */
  749. rm->units[unitid].workerid = mic_workerids[i];
  750. if (max_worker_id < rm->units[unitid].workerid)
  751. {
  752. max_worker_id = rm->units[unitid].workerid;
  753. }
  754. rm->units[unitid].worker_cpuset = starpu_worker_get_hwloc_cpuset(rm->units[unitid].workerid);
  755. pthread_cond_init(&rm->units[unitid].unit_available_cond, NULL);
  756. hwloc_bitmap_or(rm->global_cpuset, rm->global_cpuset, rm->units[unitid].worker_cpuset);
  757. hwloc_bitmap_or(rm->all_mic_device_workers_cpuset, rm->all_mic_device_workers_cpuset, rm->units[unitid].worker_cpuset);
  758. hwloc_bitmap_or(rm->all_device_workers_cpuset, rm->all_device_workers_cpuset, rm->units[unitid].worker_cpuset);
  759. unitid++;
  760. }
  761. rm->max_worker_id = max_worker_id;
  762. {
  763. int *worker_unit_ids = malloc((max_worker_id+1) * sizeof(*worker_unit_ids));
  764. for (i = 0; i < max_worker_id+1; i++)
  765. {
  766. worker_unit_ids[i] = -1;
  767. }
  768. for (i=0; i<rm->nunits; i++)
  769. {
  770. worker_unit_ids[rm->units[i].workerid] = i;
  771. }
  772. rm->worker_unit_ids = worker_unit_ids;
  773. }
  774. /* create StarPU sched_ctx for RM instance */
  775. {
  776. int workerids[rm->nunits];
  777. starpu_worker_get_ids_by_type(STARPU_ANY_WORKER, workerids, rm->nunits);
  778. /* TODO: make sched_ctx policy configurable */
  779. rm->sched_ctx_id = starpu_sched_ctx_create(workerids, rm->nunits, "starpurm", STARPU_SCHED_CTX_POLICY_NAME, "eager", 0);
  780. #ifdef _DEBUG
  781. starpu_sched_ctx_display_workers(rm->sched_ctx_id, stderr);
  782. #endif /* DEBUG */
  783. }
  784. starpu_sched_ctx_set_context(&rm->sched_ctx_id);
  785. /* number selected workers (total) */
  786. rm->selected_nworkers = rm->nunits;
  787. /* number of selected CPUs workers */
  788. rm->selected_ncpus = rm->nunits_by_type[starpurm_unit_cpu];
  789. /* cpuset of all currently selected workers */
  790. rm->selected_cpuset = hwloc_bitmap_dup(rm->global_cpuset);
  791. if (STARPU_NMAX_SCHED_CTXS > 2)
  792. {
  793. /* account for main ctx (0) and default rm ctx (1)
  794. * TODO: check that no other ctxs are allocated by external codes */
  795. rm->max_temporary_ctxs = STARPU_NMAX_SCHED_CTXS - 2;
  796. }
  797. else
  798. {
  799. rm->max_temporary_ctxs = 0;
  800. }
  801. rm->avail_temporary_ctxs = rm->max_temporary_ctxs;
  802. if (rm->selected_nworkers == 0)
  803. {
  804. rm->starpu_in_pause = 1;
  805. starpu_pause();
  806. }
  807. else
  808. {
  809. rm->starpu_in_pause = 0;
  810. }
  811. #ifdef STARPURM_HAVE_DLB
  812. starpurm_dlb_init(rm);
  813. #endif
  814. pthread_mutex_lock(&rm->event_list_mutex);
  815. rm->event_processing_enabled = 1;
  816. pthread_cond_broadcast(&rm->event_processing_cond);
  817. pthread_mutex_unlock(&rm->event_list_mutex);
  818. _starpurm = rm;
  819. }
  820. void starpurm_initialize()
  821. {
  822. hwloc_cpuset_t full_cpuset = hwloc_bitmap_alloc_full();
  823. starpurm_initialize_with_cpuset(full_cpuset);
  824. hwloc_bitmap_free(full_cpuset);
  825. }
  826. /* Free rm struct for StarPU */
  827. void starpurm_shutdown(void)
  828. {
  829. assert(_starpurm != NULL);
  830. assert(_starpurm->state != state_uninitialized);
  831. struct s_starpurm *rm = _starpurm;
  832. if (rm->starpu_in_pause)
  833. {
  834. starpu_resume();
  835. rm->starpu_in_pause = 0;
  836. }
  837. starpu_sched_ctx_delete(rm->sched_ctx_id);
  838. #ifdef STARPURM_STARPU_HAVE_WORKER_CALLBACKS
  839. _enqueue_exit_event();
  840. #endif
  841. starpu_shutdown();
  842. #ifdef STARPURM_HAVE_DLB
  843. starpurm_dlb_exit();
  844. #endif
  845. hwloc_topology_destroy(rm->topology);
  846. #ifdef STARPURM_STARPU_HAVE_WORKER_CALLBACKS
  847. pthread_join(rm->event_thread, NULL);
  848. #endif
  849. assert(rm->event_list_head == NULL);
  850. assert(rm->event_list_tail == NULL);
  851. pthread_cond_destroy(&rm->event_list_cond);
  852. pthread_mutex_destroy(&rm->event_list_mutex);
  853. rm->state = state_uninitialized;
  854. hwloc_bitmap_free(rm->global_cpuset);
  855. hwloc_bitmap_free(rm->all_cpu_workers_cpuset);
  856. hwloc_bitmap_free(rm->all_opencl_device_workers_cpuset);
  857. hwloc_bitmap_free(rm->all_cuda_device_workers_cpuset);
  858. hwloc_bitmap_free(rm->all_mic_device_workers_cpuset);
  859. hwloc_bitmap_free(rm->all_device_workers_cpuset);
  860. hwloc_bitmap_free(rm->selected_cpuset);
  861. hwloc_bitmap_free(rm->initially_owned_cpuset_mask);
  862. int i;
  863. for (i=0; i<rm->nunits; i++)
  864. {
  865. pthread_cond_destroy(&rm->units[i].unit_available_cond);
  866. }
  867. free(rm->units);
  868. rm->units = NULL;
  869. free(rm->nunits_by_type);
  870. rm->nunits_by_type = NULL;
  871. free(rm->unit_offsets_by_type);
  872. rm->unit_offsets_by_type = NULL;
  873. free(rm);
  874. _starpurm = NULL;
  875. }
  876. void starpurm_spawn_kernel_on_cpus(void *data, void(*f)(void *), void *args, hwloc_cpuset_t cpuset)
  877. {
  878. (void) data;
  879. assert(_starpurm != NULL);
  880. assert(_starpurm->state != state_uninitialized);
  881. struct s_starpurm *rm = _starpurm;
  882. unsigned ctx = _starpurm_temporary_context_alloc(cpuset);
  883. starpu_sched_ctx_set_context(&ctx);
  884. f(args);
  885. starpu_sched_ctx_set_context(&rm->sched_ctx_id);
  886. _starpurm_temporary_context_free(ctx);
  887. }
  888. struct s_starpurm__spawn_args
  889. {
  890. void(*f)(void *);
  891. void *args;
  892. void(*cb_f)(void *);
  893. void *cb_args;
  894. hwloc_cpuset_t cpuset;
  895. };
  896. static void *_starpurm_spawn_kernel_thread(void *_spawn_args)
  897. {
  898. struct s_starpurm__spawn_args *spawn_args = _spawn_args;
  899. unsigned ctx = _starpurm_temporary_context_alloc(spawn_args->cpuset);
  900. starpu_sched_ctx_set_context(&ctx);
  901. spawn_args->f(spawn_args->args);
  902. struct s_starpurm *rm = _starpurm;
  903. starpu_sched_ctx_set_context(&rm->sched_ctx_id);
  904. _starpurm_temporary_context_free(ctx);
  905. spawn_args->cb_f(spawn_args->cb_args);
  906. hwloc_bitmap_free(spawn_args->cpuset);
  907. free(spawn_args);
  908. return NULL;
  909. }
  910. void starpurm_spawn_kernel_on_cpus_callback(void *data, void(*f)(void *), void *args, hwloc_cpuset_t cpuset, void(*cb_f)(void *), void *cb_args)
  911. {
  912. (void) data;
  913. struct s_starpurm__spawn_args *spawn_args = calloc(1, sizeof(*spawn_args));
  914. spawn_args->f = f;
  915. spawn_args->args = args;
  916. spawn_args->cb_f = cb_f;
  917. spawn_args->cb_args = cb_args;
  918. spawn_args->cpuset = hwloc_bitmap_dup(cpuset);
  919. pthread_attr_t attr;
  920. int ret;
  921. ret = pthread_attr_init(&attr);
  922. assert(ret == 0);
  923. ret = pthread_attr_setdetachstate(&attr, 1);
  924. assert(ret == 0);
  925. pthread_t t;
  926. ret = pthread_create(&t, &attr, _starpurm_spawn_kernel_thread, spawn_args);
  927. assert(ret == 0);
  928. }
  929. static void *_starpurm_spawn_kernel_in_default_context_thread(void *_spawn_args)
  930. {
  931. struct s_starpurm__spawn_args *spawn_args = _spawn_args;
  932. struct s_starpurm *rm = _starpurm;
  933. starpu_sched_ctx_set_context(&rm->sched_ctx_id);
  934. spawn_args->f(spawn_args->args);
  935. spawn_args->cb_f(spawn_args->cb_args);
  936. free(spawn_args);
  937. return NULL;
  938. }
  939. void starpurm_spawn_kernel_callback(void *data, void(*f)(void *), void *args, void(*cb_f)(void *), void *cb_args)
  940. {
  941. (void) data;
  942. struct s_starpurm__spawn_args *spawn_args = calloc(1, sizeof(*spawn_args));
  943. spawn_args->f = f;
  944. spawn_args->args = args;
  945. spawn_args->cb_f = cb_f;
  946. spawn_args->cb_args = cb_args;
  947. pthread_attr_t attr;
  948. int ret;
  949. ret = pthread_attr_init(&attr);
  950. assert(ret == 0);
  951. ret = pthread_attr_setdetachstate(&attr, 1);
  952. assert(ret == 0);
  953. pthread_t t;
  954. ret = pthread_create(&t, &attr, _starpurm_spawn_kernel_in_default_context_thread, spawn_args);
  955. assert(ret == 0);
  956. }
  957. hwloc_cpuset_t starpurm_get_unit_cpuset(int unitid)
  958. {
  959. assert(_starpurm != NULL);
  960. assert(_starpurm->state != state_uninitialized);
  961. struct s_starpurm *rm = _starpurm;
  962. assert(unitid >= 0 && unitid < rm->nunits);
  963. return hwloc_bitmap_dup(rm->units[unitid].worker_cpuset);
  964. }
  965. hwloc_cpuset_t starpurm_get_cpu_worker_cpuset(int unit_rank)
  966. {
  967. assert(_starpurm != NULL);
  968. assert(_starpurm->state != state_uninitialized);
  969. struct s_starpurm *rm = _starpurm;
  970. assert(unit_rank >= 0 && unit_rank < rm->nunits_by_type[starpurm_unit_cpu]);
  971. return hwloc_bitmap_dup(rm->units[rm->unit_offsets_by_type[starpurm_unit_cpu] + unit_rank].worker_cpuset);
  972. }
  973. /* Dynamic resource sharing */
  974. starpurm_drs_ret_t starpurm_set_drs_enable(starpurm_drs_desc_t *spd)
  975. {
  976. (void)spd;
  977. assert(_starpurm != NULL);
  978. assert(_starpurm->state != state_uninitialized);
  979. struct s_starpurm *rm = _starpurm;
  980. rm->dynamic_resource_sharing = 1;
  981. return starpurm_DRS_SUCCESS;
  982. }
  983. starpurm_drs_ret_t starpurm_set_drs_disable(starpurm_drs_desc_t *spd)
  984. {
  985. (void)spd;
  986. assert(_starpurm != NULL);
  987. assert(_starpurm->state != state_uninitialized);
  988. struct s_starpurm *rm = _starpurm;
  989. rm->dynamic_resource_sharing = 0;
  990. return starpurm_DRS_SUCCESS;
  991. }
  992. int starpurm_drs_enabled_p(void)
  993. {
  994. assert(_starpurm != NULL);
  995. assert(_starpurm->state != state_uninitialized);
  996. struct s_starpurm *rm = _starpurm;
  997. return rm->dynamic_resource_sharing;
  998. }
  999. starpurm_drs_ret_t starpurm_set_max_parallelism(starpurm_drs_desc_t *spd, int ncpus)
  1000. {
  1001. (void)spd;
  1002. assert(_starpurm != NULL);
  1003. assert(_starpurm->state != state_uninitialized);
  1004. struct s_starpurm *rm = _starpurm;
  1005. if (!rm->dynamic_resource_sharing)
  1006. return starpurm_DRS_DISABLD;
  1007. if (ncpus > rm->nunits_by_type[starpurm_unit_cpu])
  1008. {
  1009. ncpus = rm->nunits_by_type[starpurm_unit_cpu];
  1010. }
  1011. rm->max_ncpus = ncpus;
  1012. if (rm->selected_ncpus > ncpus)
  1013. {
  1014. return _starpurm_set_ncpus(ncpus);
  1015. }
  1016. return starpurm_DRS_SUCCESS;
  1017. }
  1018. starpurm_drs_ret_t starpurm_callback_set(starpurm_drs_desc_t *spd, starpurm_drs_cbs_t which, starpurm_drs_cb_t callback)
  1019. {
  1020. (void)spd;
  1021. (void)which;
  1022. (void)callback;
  1023. /* unimplemented */
  1024. assert(0);
  1025. return starpurm_DRS_PERM;
  1026. }
  1027. starpurm_drs_ret_t starpurm_callback_get(starpurm_drs_desc_t *spd, starpurm_drs_cbs_t which, starpurm_drs_cb_t *callback)
  1028. {
  1029. (void)spd;
  1030. (void)which;
  1031. (void)callback;
  1032. /* unimplemented */
  1033. assert(0);
  1034. return starpurm_DRS_PERM;
  1035. }
  1036. starpurm_drs_ret_t starpurm_assign_cpu_to_starpu(starpurm_drs_desc_t *spd, int cpuid)
  1037. {
  1038. assert(_starpurm != NULL);
  1039. assert(_starpurm->state != state_uninitialized);
  1040. struct s_starpurm *rm = _starpurm;
  1041. if (!rm->dynamic_resource_sharing)
  1042. return starpurm_DRS_DISABLD;
  1043. starpurm_drs_ret_t ret = 0;
  1044. assert(hwloc_bitmap_isset(rm->global_cpuset, cpuid));
  1045. if (!hwloc_bitmap_isset(rm->selected_cpuset, cpuid))
  1046. {
  1047. hwloc_cpuset_t temp_cpuset = hwloc_bitmap_dup(rm->selected_cpuset);
  1048. hwloc_bitmap_set(temp_cpuset, cpuid);
  1049. ret = _starpurm_update_cpuset(temp_cpuset);
  1050. hwloc_bitmap_free(temp_cpuset);
  1051. }
  1052. return ret;
  1053. }
  1054. starpurm_drs_ret_t starpurm_assign_cpus_to_starpu(starpurm_drs_desc_t *spd, int ncpus)
  1055. {
  1056. (void)spd;
  1057. assert(_starpurm != NULL);
  1058. assert(_starpurm->state != state_uninitialized);
  1059. struct s_starpurm *rm = _starpurm;
  1060. if (!rm->dynamic_resource_sharing)
  1061. return starpurm_DRS_DISABLD;
  1062. /* add ncpus more CPUs to the CPUs pool */
  1063. return _starpurm_set_ncpus(rm->selected_ncpus+ncpus);
  1064. }
  1065. starpurm_drs_ret_t starpurm_assign_cpu_mask_to_starpu(starpurm_drs_desc_t *spd, const hwloc_cpuset_t mask)
  1066. {
  1067. (void)spd;
  1068. assert(_starpurm != NULL);
  1069. assert(_starpurm->state != state_uninitialized);
  1070. struct s_starpurm *rm = _starpurm;
  1071. if (!rm->dynamic_resource_sharing)
  1072. return starpurm_DRS_DISABLD;
  1073. hwloc_cpuset_t temp_cpuset = hwloc_bitmap_dup(rm->selected_cpuset);
  1074. hwloc_bitmap_or(temp_cpuset, temp_cpuset, mask);
  1075. starpurm_drs_ret_t ret = _starpurm_update_cpuset(temp_cpuset);
  1076. hwloc_bitmap_free(temp_cpuset);
  1077. return ret;
  1078. }
  1079. starpurm_drs_ret_t starpurm_assign_all_cpus_to_starpu(starpurm_drs_desc_t *spd)
  1080. {
  1081. assert(_starpurm != NULL);
  1082. assert(_starpurm->state != state_uninitialized);
  1083. struct s_starpurm *rm = _starpurm;
  1084. if (!rm->dynamic_resource_sharing)
  1085. return starpurm_DRS_DISABLD;
  1086. return starpurm_assign_cpus_to_starpu(spd, rm->nunits_by_type[starpurm_unit_cpu]);
  1087. }
  1088. starpurm_drs_ret_t starpurm_withdraw_cpu_from_starpu(starpurm_drs_desc_t *spd, int cpuid)
  1089. {
  1090. assert(_starpurm != NULL);
  1091. assert(_starpurm->state != state_uninitialized);
  1092. struct s_starpurm *rm = _starpurm;
  1093. if (!rm->dynamic_resource_sharing)
  1094. return starpurm_DRS_DISABLD;
  1095. starpurm_drs_ret_t ret = 0;
  1096. assert(hwloc_bitmap_isset(rm->global_cpuset, cpuid));
  1097. if (hwloc_bitmap_isset(rm->selected_cpuset, cpuid))
  1098. {
  1099. hwloc_cpuset_t temp_cpuset = hwloc_bitmap_dup(rm->selected_cpuset);
  1100. hwloc_bitmap_clr(temp_cpuset, cpuid);
  1101. ret = _starpurm_update_cpuset(temp_cpuset);
  1102. hwloc_bitmap_free(temp_cpuset);
  1103. }
  1104. return ret;
  1105. }
  1106. starpurm_drs_ret_t starpurm_withdraw_cpus_from_starpu(starpurm_drs_desc_t *spd, int ncpus)
  1107. {
  1108. (void)spd;
  1109. assert(_starpurm != NULL);
  1110. assert(_starpurm->state != state_uninitialized);
  1111. struct s_starpurm *rm = _starpurm;
  1112. if (!rm->dynamic_resource_sharing)
  1113. return starpurm_DRS_DISABLD;
  1114. /* add ncpus more CPUs to the CPUs pool */
  1115. starpurm_drs_ret_t ret = 0;
  1116. if (ncpus <= rm->nunits_by_type[starpurm_unit_cpu])
  1117. {
  1118. ret = _starpurm_set_ncpus(rm->nunits_by_type[starpurm_unit_cpu]-ncpus);
  1119. }
  1120. else
  1121. {
  1122. ret = _starpurm_set_ncpus(0);
  1123. }
  1124. return ret;
  1125. }
  1126. starpurm_drs_ret_t starpurm_withdraw_cpu_mask_from_starpu(starpurm_drs_desc_t *spd, const hwloc_cpuset_t mask)
  1127. {
  1128. (void)spd;
  1129. assert(_starpurm != NULL);
  1130. assert(_starpurm->state != state_uninitialized);
  1131. struct s_starpurm *rm = _starpurm;
  1132. if (!rm->dynamic_resource_sharing)
  1133. return starpurm_DRS_DISABLD;
  1134. hwloc_cpuset_t temp_cpuset = hwloc_bitmap_dup(rm->selected_cpuset);
  1135. hwloc_bitmap_andnot(temp_cpuset, temp_cpuset, mask);
  1136. starpurm_drs_ret_t ret = _starpurm_update_cpuset(temp_cpuset);
  1137. hwloc_bitmap_free(temp_cpuset);
  1138. return ret;
  1139. }
  1140. starpurm_drs_ret_t starpurm_withdraw_all_cpus_from_starpu(starpurm_drs_desc_t *spd)
  1141. {
  1142. assert(_starpurm != NULL);
  1143. assert(_starpurm->state != state_uninitialized);
  1144. struct s_starpurm *rm = _starpurm;
  1145. if (!rm->dynamic_resource_sharing)
  1146. return starpurm_DRS_DISABLD;
  1147. return starpurm_withdraw_cpus_from_starpu(spd, rm->nunits_by_type[starpurm_unit_cpu]);
  1148. }
  1149. /* --- */
  1150. starpurm_drs_ret_t starpurm_lend_cpu(starpurm_drs_desc_t *spd, int cpuid)
  1151. {
  1152. return starpurm_assign_cpu_to_starpu(spd, cpuid);
  1153. }
  1154. starpurm_drs_ret_t starpurm_lend_cpus(starpurm_drs_desc_t *spd, int ncpus)
  1155. {
  1156. return starpurm_assign_cpus_to_starpu(spd, ncpus);
  1157. }
  1158. starpurm_drs_ret_t starpurm_lend_cpu_mask(starpurm_drs_desc_t *spd, const hwloc_cpuset_t mask)
  1159. {
  1160. return starpurm_assign_cpu_mask_to_starpu(spd, mask);
  1161. }
  1162. starpurm_drs_ret_t starpurm_lend(starpurm_drs_desc_t *spd)
  1163. {
  1164. return starpurm_assign_all_cpus_to_starpu(spd);
  1165. }
  1166. starpurm_drs_ret_t starpurm_reclaim_cpu(starpurm_drs_desc_t *spd, int cpuid)
  1167. {
  1168. return starpurm_withdraw_cpu_from_starpu(spd, cpuid);
  1169. }
  1170. starpurm_drs_ret_t starpurm_reclaim_cpus(starpurm_drs_desc_t *spd, int ncpus)
  1171. {
  1172. return starpurm_withdraw_cpus_from_starpu(spd, ncpus);
  1173. }
  1174. starpurm_drs_ret_t starpurm_reclaim_cpu_mask(starpurm_drs_desc_t *spd, const hwloc_cpuset_t mask)
  1175. {
  1176. return starpurm_withdraw_cpu_mask_from_starpu(spd, mask);
  1177. }
  1178. starpurm_drs_ret_t starpurm_reclaim(starpurm_drs_desc_t *spd)
  1179. {
  1180. return starpurm_withdraw_all_cpus_from_starpu(spd);
  1181. }
  1182. starpurm_drs_ret_t starpurm_acquire(starpurm_drs_desc_t *spd)
  1183. {
  1184. return starpurm_withdraw_all_cpus_from_starpu(spd);
  1185. }
  1186. starpurm_drs_ret_t starpurm_acquire_cpu(starpurm_drs_desc_t *spd, int cpuid)
  1187. {
  1188. return starpurm_withdraw_cpu_from_starpu(spd, cpuid);
  1189. }
  1190. starpurm_drs_ret_t starpurm_acquire_cpus(starpurm_drs_desc_t *spd, int ncpus)
  1191. {
  1192. return starpurm_withdraw_cpus_from_starpu(spd, ncpus);
  1193. }
  1194. starpurm_drs_ret_t starpurm_acquire_cpu_mask(starpurm_drs_desc_t *spd, const hwloc_cpuset_t mask)
  1195. {
  1196. return starpurm_withdraw_cpu_mask_from_starpu(spd, mask);
  1197. }
  1198. starpurm_drs_ret_t starpurm_return_all(starpurm_drs_desc_t *spd)
  1199. {
  1200. return starpurm_assign_all_cpus_to_starpu(spd);
  1201. }
  1202. starpurm_drs_ret_t starpurm_return_cpu(starpurm_drs_desc_t *spd, int cpuid)
  1203. {
  1204. return starpurm_assign_cpu_to_starpu(spd, cpuid);
  1205. }
  1206. /* Pause/resume */
  1207. starpurm_drs_ret_t starpurm_create_block_condition(starpurm_block_cond_t *cond)
  1208. {
  1209. /* unimplemented */
  1210. assert(0);
  1211. return starpurm_DRS_PERM;
  1212. }
  1213. void starpurm_block_current_task(starpurm_block_cond_t *cond)
  1214. {
  1215. /* unimplemented */
  1216. assert(0);
  1217. }
  1218. void starpurm_signal_block_condition(starpurm_block_cond_t *cond)
  1219. {
  1220. /* unimplemented */
  1221. assert(0);
  1222. }
  1223. void starpurm_register_polling_service(const char *service_name, starpurm_polling_t function, void *data)
  1224. {
  1225. /* unimplemented */
  1226. assert(0);
  1227. }
  1228. void starpurm_unregister_polling_service(const char *service_name, starpurm_polling_t function, void *data)
  1229. {
  1230. /* unimplemented */
  1231. assert(0);
  1232. }
  1233. /* devices */
  1234. int starpurm_get_device_type_id(const char *type_str)
  1235. {
  1236. if (strcmp(type_str, "cpu") == 0)
  1237. return starpurm_unit_cpu;
  1238. if (strcmp(type_str, "opencl") == 0)
  1239. return starpurm_unit_opencl;
  1240. if (strcmp(type_str, "cuda") == 0)
  1241. return starpurm_unit_cuda;
  1242. if (strcmp(type_str, "mic") == 0)
  1243. return starpurm_unit_mic;
  1244. return -1;
  1245. }
  1246. const char *starpurm_get_device_type_name(int type_id)
  1247. {
  1248. if (type_id == starpurm_unit_cpu)
  1249. return "cpu";
  1250. if (type_id == starpurm_unit_opencl)
  1251. return "opencl";
  1252. if (type_id == starpurm_unit_cuda)
  1253. return "cuda";
  1254. if (type_id == starpurm_unit_mic)
  1255. return "mic";
  1256. return NULL;
  1257. }
  1258. int starpurm_get_nb_devices_by_type(int type_id)
  1259. {
  1260. assert(_starpurm != NULL);
  1261. assert(_starpurm->state != state_uninitialized);
  1262. struct s_starpurm *rm = _starpurm;
  1263. if (type_id < 0 || type_id >= starpurm_unit_ntypes)
  1264. return -1;
  1265. return rm->nunits_by_type[type_id];
  1266. }
  1267. int starpurm_get_device_id(int type_id, int unit_rank)
  1268. {
  1269. assert(_starpurm != NULL);
  1270. assert(_starpurm->state != state_uninitialized);
  1271. struct s_starpurm *rm = _starpurm;
  1272. if (type_id < 0 || type_id >= starpurm_unit_ntypes)
  1273. return -1;
  1274. if (unit_rank < 0 || unit_rank >= rm->nunits_by_type[type_id])
  1275. return -1;
  1276. return rm->units[rm->unit_offsets_by_type[type_id] + unit_rank].id;
  1277. }
  1278. starpurm_drs_ret_t starpurm_assign_device_to_starpu(starpurm_drs_desc_t *spd, int type_id, int unit_rank)
  1279. {
  1280. assert(_starpurm != NULL);
  1281. assert(_starpurm->state != state_uninitialized);
  1282. struct s_starpurm *rm = _starpurm;
  1283. if (!rm->dynamic_resource_sharing)
  1284. return starpurm_DRS_DISABLD;
  1285. if (type_id < 0 || type_id >= starpurm_unit_ntypes)
  1286. return starpurm_DRS_EINVAL;
  1287. if (unit_rank < 0 || unit_rank >= rm->nunits_by_type[type_id])
  1288. return starpurm_DRS_EINVAL;
  1289. hwloc_cpuset_t temp_cpuset = hwloc_bitmap_dup(rm->selected_cpuset);
  1290. hwloc_bitmap_or(temp_cpuset, temp_cpuset, rm->units[rm->unit_offsets_by_type[type_id] + unit_rank].worker_cpuset);
  1291. starpurm_drs_ret_t ret = _starpurm_update_cpuset(temp_cpuset);
  1292. hwloc_bitmap_free(temp_cpuset);
  1293. return ret;
  1294. }
  1295. starpurm_drs_ret_t starpurm_assign_devices_to_starpu(starpurm_drs_desc_t *spd, int type_id, int ndevices)
  1296. {
  1297. (void)spd;
  1298. assert(_starpurm != NULL);
  1299. assert(_starpurm->state != state_uninitialized);
  1300. struct s_starpurm *rm = _starpurm;
  1301. if (!rm->dynamic_resource_sharing)
  1302. return starpurm_DRS_DISABLD;
  1303. if (type_id < 0 || type_id >= starpurm_unit_ntypes)
  1304. return starpurm_DRS_EINVAL;
  1305. hwloc_cpuset_t temp_cpuset = hwloc_bitmap_dup(rm->selected_cpuset);
  1306. if (ndevices > rm->nunits_by_type[type_id])
  1307. {
  1308. ndevices = rm->nunits_by_type[type_id];
  1309. }
  1310. int i;
  1311. for (i = 0; i < ndevices; i++)
  1312. {
  1313. hwloc_bitmap_or(temp_cpuset, temp_cpuset, rm->units[rm->unit_offsets_by_type[type_id] + i].worker_cpuset);
  1314. }
  1315. starpurm_drs_ret_t ret = _starpurm_update_cpuset(temp_cpuset);
  1316. hwloc_bitmap_free(temp_cpuset);
  1317. return ret;
  1318. }
  1319. starpurm_drs_ret_t starpurm_assign_device_mask_to_starpu(starpurm_drs_desc_t *spd, const hwloc_cpuset_t mask)
  1320. {
  1321. (void)spd;
  1322. assert(_starpurm != NULL);
  1323. assert(_starpurm->state != state_uninitialized);
  1324. struct s_starpurm *rm = _starpurm;
  1325. if (!rm->dynamic_resource_sharing)
  1326. return starpurm_DRS_DISABLD;
  1327. hwloc_cpuset_t temp_cpuset = hwloc_bitmap_dup(rm->selected_cpuset);
  1328. hwloc_bitmap_or(temp_cpuset, temp_cpuset, mask);
  1329. starpurm_drs_ret_t ret = _starpurm_update_cpuset(temp_cpuset);
  1330. hwloc_bitmap_free(temp_cpuset);
  1331. return ret;
  1332. }
  1333. starpurm_drs_ret_t starpurm_assign_all_devices_to_starpu(starpurm_drs_desc_t *spd, int type_id)
  1334. {
  1335. assert(_starpurm != NULL);
  1336. assert(_starpurm->state != state_uninitialized);
  1337. struct s_starpurm *rm = _starpurm;
  1338. if (!rm->dynamic_resource_sharing)
  1339. return starpurm_DRS_DISABLD;
  1340. if (type_id < 0 || type_id >= starpurm_unit_ntypes)
  1341. return starpurm_DRS_EINVAL;
  1342. return starpurm_assign_devices_to_starpu(spd, type_id, rm->nunits_by_type[type_id]);
  1343. }
  1344. starpurm_drs_ret_t starpurm_withdraw_device_from_starpu(starpurm_drs_desc_t *spd, int type_id, int unit_rank)
  1345. {
  1346. assert(_starpurm != NULL);
  1347. assert(_starpurm->state != state_uninitialized);
  1348. struct s_starpurm *rm = _starpurm;
  1349. if (!rm->dynamic_resource_sharing)
  1350. return starpurm_DRS_DISABLD;
  1351. if (type_id < 0 || type_id >= starpurm_unit_ntypes)
  1352. return starpurm_DRS_EINVAL;
  1353. if (unit_rank < 0 || unit_rank >= rm->nunits_by_type[type_id])
  1354. return starpurm_DRS_EINVAL;
  1355. hwloc_cpuset_t temp_cpuset = hwloc_bitmap_dup(rm->selected_cpuset);
  1356. hwloc_bitmap_andnot(temp_cpuset, temp_cpuset, rm->units[rm->unit_offsets_by_type[type_id] + unit_rank].worker_cpuset);
  1357. starpurm_drs_ret_t ret = _starpurm_update_cpuset(temp_cpuset);
  1358. hwloc_bitmap_free(temp_cpuset);
  1359. return ret;
  1360. }
  1361. starpurm_drs_ret_t starpurm_withdraw_devices_from_starpu(starpurm_drs_desc_t *spd, int type_id, int ndevices)
  1362. {
  1363. (void)spd;
  1364. assert(_starpurm != NULL);
  1365. assert(_starpurm->state != state_uninitialized);
  1366. struct s_starpurm *rm = _starpurm;
  1367. if (!rm->dynamic_resource_sharing)
  1368. return starpurm_DRS_DISABLD;
  1369. if (type_id < 0 || type_id >= starpurm_unit_ntypes)
  1370. return starpurm_DRS_EINVAL;
  1371. hwloc_cpuset_t temp_cpuset = hwloc_bitmap_dup(rm->selected_cpuset);
  1372. if (ndevices > rm->nunits_by_type[type_id])
  1373. {
  1374. ndevices = rm->nunits_by_type[type_id];
  1375. }
  1376. int i;
  1377. for (i = 0; i < ndevices; i++)
  1378. {
  1379. hwloc_bitmap_andnot(temp_cpuset, temp_cpuset, rm->units[rm->unit_offsets_by_type[type_id] + i].worker_cpuset);
  1380. }
  1381. starpurm_drs_ret_t ret = _starpurm_update_cpuset(temp_cpuset);
  1382. hwloc_bitmap_free(temp_cpuset);
  1383. return ret;
  1384. }
  1385. starpurm_drs_ret_t starpurm_withdraw_device_mask_from_starpu(starpurm_drs_desc_t *spd, const hwloc_cpuset_t mask)
  1386. {
  1387. (void)spd;
  1388. assert(_starpurm != NULL);
  1389. assert(_starpurm->state != state_uninitialized);
  1390. struct s_starpurm *rm = _starpurm;
  1391. if (!rm->dynamic_resource_sharing)
  1392. return starpurm_DRS_DISABLD;
  1393. hwloc_cpuset_t temp_cpuset = hwloc_bitmap_dup(rm->selected_cpuset);
  1394. hwloc_bitmap_andnot(temp_cpuset, temp_cpuset, mask);
  1395. starpurm_drs_ret_t ret = _starpurm_update_cpuset(temp_cpuset);
  1396. hwloc_bitmap_free(temp_cpuset);
  1397. return ret;
  1398. }
  1399. starpurm_drs_ret_t starpurm_withdraw_all_devices_from_starpu(starpurm_drs_desc_t *spd, int type_id)
  1400. {
  1401. assert(_starpurm != NULL);
  1402. assert(_starpurm->state != state_uninitialized);
  1403. struct s_starpurm *rm = _starpurm;
  1404. if (!rm->dynamic_resource_sharing)
  1405. return starpurm_DRS_DISABLD;
  1406. if (type_id < 0 || type_id >= starpurm_unit_ntypes)
  1407. return starpurm_DRS_EINVAL;
  1408. return starpurm_withdraw_devices_from_starpu(spd, type_id, rm->nunits_by_type[type_id]);
  1409. }
  1410. /* --- */
  1411. starpurm_drs_ret_t starpurm_lend_device(starpurm_drs_desc_t *spd, int type_id, int unit_rank)
  1412. {
  1413. return starpurm_assign_device_to_starpu(spd, type_id, unit_rank);
  1414. }
  1415. starpurm_drs_ret_t starpurm_lend_devices(starpurm_drs_desc_t *spd, int type_id, int ndevices)
  1416. {
  1417. return starpurm_assign_devices_to_starpu(spd, type_id, ndevices);
  1418. }
  1419. starpurm_drs_ret_t starpurm_lend_device_mask(starpurm_drs_desc_t *spd, const hwloc_cpuset_t mask)
  1420. {
  1421. return starpurm_assign_device_mask_to_starpu(spd, mask);
  1422. }
  1423. starpurm_drs_ret_t starpurm_lend_all_devices(starpurm_drs_desc_t *spd, int type_id)
  1424. {
  1425. return starpurm_assign_all_devices_to_starpu(spd, type_id);
  1426. }
  1427. starpurm_drs_ret_t starpurm_reclaim_device(starpurm_drs_desc_t *spd, int type_id, int unit_rank)
  1428. {
  1429. return starpurm_withdraw_device_from_starpu(spd, type_id, unit_rank);
  1430. }
  1431. starpurm_drs_ret_t starpurm_reclaim_devices(starpurm_drs_desc_t *spd, int type_id, int ndevices)
  1432. {
  1433. return starpurm_withdraw_devices_from_starpu(spd, type_id, ndevices);
  1434. }
  1435. starpurm_drs_ret_t starpurm_reclaim_device_mask(starpurm_drs_desc_t *spd, const hwloc_cpuset_t mask)
  1436. {
  1437. return starpurm_withdraw_device_mask_from_starpu(spd, mask);
  1438. }
  1439. starpurm_drs_ret_t starpurm_reclaim_all_devices(starpurm_drs_desc_t *spd, int type_id)
  1440. {
  1441. return starpurm_withdraw_all_devices_from_starpu(spd, type_id);
  1442. }
  1443. starpurm_drs_ret_t starpurm_acquire_all_devices(starpurm_drs_desc_t *spd, int type_id)
  1444. {
  1445. return starpurm_withdraw_all_devices_from_starpu(spd, type_id);
  1446. }
  1447. starpurm_drs_ret_t starpurm_acquire_device(starpurm_drs_desc_t *spd, int type_id, int unit_rank)
  1448. {
  1449. return starpurm_withdraw_device_from_starpu(spd, type_id, unit_rank);
  1450. }
  1451. starpurm_drs_ret_t starpurm_acquire_devices(starpurm_drs_desc_t *spd, int type_id, int ndevices)
  1452. {
  1453. return starpurm_withdraw_devices_from_starpu(spd, type_id, ndevices);
  1454. }
  1455. starpurm_drs_ret_t starpurm_acquire_device_mask(starpurm_drs_desc_t *spd, const hwloc_cpuset_t mask)
  1456. {
  1457. return starpurm_withdraw_device_mask_from_starpu(spd, mask);
  1458. }
  1459. starpurm_drs_ret_t starpurm_return_all_devices(starpurm_drs_desc_t *spd, int type_id)
  1460. {
  1461. return starpurm_assign_all_devices_to_starpu(spd, type_id);
  1462. }
  1463. starpurm_drs_ret_t starpurm_return_device(starpurm_drs_desc_t *spd, int type_id, int unit_rank)
  1464. {
  1465. return starpurm_assign_device_to_starpu(spd, type_id, unit_rank);
  1466. }
  1467. /* cpusets */
  1468. hwloc_cpuset_t starpurm_get_device_worker_cpuset(int type_id, int unit_rank)
  1469. {
  1470. assert(_starpurm != NULL);
  1471. assert(_starpurm->state != state_uninitialized);
  1472. struct s_starpurm *rm = _starpurm;
  1473. assert(type_id >= 0 && type_id < starpurm_unit_ntypes);
  1474. assert(unit_rank >= 0 && unit_rank < rm->nunits_by_type[type_id]);
  1475. return hwloc_bitmap_dup(rm->units[rm->unit_offsets_by_type[type_id] + unit_rank].worker_cpuset);
  1476. }
  1477. hwloc_cpuset_t starpurm_get_global_cpuset(void)
  1478. {
  1479. assert(_starpurm != NULL);
  1480. assert(_starpurm->state != state_uninitialized);
  1481. struct s_starpurm *rm = _starpurm;
  1482. return hwloc_bitmap_dup(rm->global_cpuset);
  1483. }
  1484. hwloc_cpuset_t starpurm_get_selected_cpuset(void)
  1485. {
  1486. assert(_starpurm != NULL);
  1487. assert(_starpurm->state != state_uninitialized);
  1488. struct s_starpurm *rm = _starpurm;
  1489. return hwloc_bitmap_dup(rm->selected_cpuset);
  1490. }
  1491. hwloc_cpuset_t starpurm_get_all_cpu_workers_cpuset(void)
  1492. {
  1493. assert(_starpurm != NULL);
  1494. assert(_starpurm->state != state_uninitialized);
  1495. struct s_starpurm *rm = _starpurm;
  1496. return hwloc_bitmap_dup(rm->all_cpu_workers_cpuset);
  1497. }
  1498. static hwloc_cpuset_t starpurm_get_all_opencl_device_workers_cpuset(void)
  1499. {
  1500. assert(_starpurm != NULL);
  1501. assert(_starpurm->state != state_uninitialized);
  1502. struct s_starpurm *rm = _starpurm;
  1503. return hwloc_bitmap_dup(rm->all_opencl_device_workers_cpuset);
  1504. }
  1505. static hwloc_cpuset_t starpurm_get_all_cuda_device_workers_cpuset(void)
  1506. {
  1507. assert(_starpurm != NULL);
  1508. assert(_starpurm->state != state_uninitialized);
  1509. struct s_starpurm *rm = _starpurm;
  1510. return hwloc_bitmap_dup(rm->all_cuda_device_workers_cpuset);
  1511. }
  1512. static hwloc_cpuset_t starpurm_get_all_mic_device_workers_cpuset(void)
  1513. {
  1514. assert(_starpurm != NULL);
  1515. assert(_starpurm->state != state_uninitialized);
  1516. struct s_starpurm *rm = _starpurm;
  1517. return hwloc_bitmap_dup(rm->all_mic_device_workers_cpuset);
  1518. }
  1519. hwloc_cpuset_t starpurm_get_all_device_workers_cpuset(void)
  1520. {
  1521. assert(_starpurm != NULL);
  1522. assert(_starpurm->state != state_uninitialized);
  1523. struct s_starpurm *rm = _starpurm;
  1524. return hwloc_bitmap_dup(rm->all_device_workers_cpuset);
  1525. }
  1526. hwloc_cpuset_t starpurm_get_all_device_workers_cpuset_by_type(int typeid)
  1527. {
  1528. assert(_starpurm != NULL);
  1529. assert(_starpurm->state != state_uninitialized);
  1530. assert(typeid != starpurm_unit_cpu);
  1531. if (typeid == starpurm_unit_opencl)
  1532. return starpurm_get_all_opencl_device_workers_cpuset();
  1533. if (typeid == starpurm_unit_cuda)
  1534. return starpurm_get_all_cuda_device_workers_cpuset();
  1535. if (typeid == starpurm_unit_mic)
  1536. return starpurm_get_all_mic_device_workers_cpuset();
  1537. hwloc_cpuset_t empty_bitmap = hwloc_bitmap_alloc();
  1538. hwloc_bitmap_zero(empty_bitmap);
  1539. return empty_bitmap;
  1540. }