starpurm.c 50 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387138813891390139113921393139413951396139713981399140014011402140314041405140614071408140914101411141214131414141514161417141814191420142114221423142414251426142714281429143014311432143314341435143614371438143914401441144214431444144514461447144814491450145114521453145414551456145714581459146014611462146314641465146614671468146914701471147214731474147514761477147814791480148114821483148414851486148714881489149014911492149314941495149614971498149915001501150215031504150515061507150815091510151115121513151415151516151715181519152015211522152315241525152615271528152915301531153215331534153515361537153815391540154115421543154415451546154715481549155015511552155315541555155615571558155915601561156215631564156515661567156815691570157115721573157415751576157715781579158015811582158315841585158615871588158915901591159215931594159515961597159815991600160116021603160416051606160716081609161016111612161316141615161616171618161916201621162216231624162516261627162816291630163116321633163416351636163716381639164016411642164316441645164616471648164916501651165216531654165516561657165816591660166116621663166416651666166716681669167016711672167316741675167616771678167916801681168216831684168516861687
  1. /* StarPU --- Runtime system for heterogeneous multicore architectures.
  2. *
  3. * Copyright (C) 2017-2021 Université de Bordeaux, CNRS (LaBRI UMR 5800), Inria
  4. *
  5. * StarPU is free software; you can redistribute it and/or modify
  6. * it under the terms of the GNU Lesser General Public License as published by
  7. * the Free Software Foundation; either version 2.1 of the License, or (at
  8. * your option) any later version.
  9. *
  10. * StarPU is distributed in the hope that it will be useful, but
  11. * WITHOUT ANY WARRANTY; without even the implied warranty of
  12. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
  13. *
  14. * See the GNU Lesser General Public License in COPYING.LGPL for more details.
  15. */
  16. #include <stdlib.h>
  17. #include <stdio.h>
  18. #include <string.h>
  19. #include <assert.h>
  20. #include <hwloc.h>
  21. #include <starpu.h>
  22. #include <starpurm.h>
  23. #include <common/config.h>
  24. #include <starpurm_private.h>
  25. /*
  26. * #define _DEBUG
  27. */
  28. struct s_starpurm_unit
  29. {
  30. /* Opaque unit id.
  31. *
  32. * For StarPU-RM, this id is used as an index to array starpurm->units[].
  33. */
  34. int id;
  35. /* Id of the unit type. */
  36. int type;
  37. /* Boolean indicating whether the device is currently selected for use by the runtime system. */
  38. int selected;
  39. /* StarPU id of the worker driving the device. */
  40. int workerid;
  41. /* Cpuset of the StarPU worker. */
  42. hwloc_cpuset_t worker_cpuset;
  43. /* Condition variable to notify that a unit is now available to driver a worker waking up. */
  44. pthread_cond_t unit_available_cond;
  45. };
  46. static struct s_starpurm *_starpurm = NULL;
  47. #if 0
  48. static char *bitmap_to_str(hwloc_bitmap_t bitmap)
  49. {
  50. int strl = hwloc_bitmap_snprintf(NULL, 0, bitmap);
  51. char *str = malloc(strl+1);
  52. hwloc_bitmap_snprintf(str, strl+1, bitmap);
  53. return str;
  54. }
  55. #endif
  56. #ifdef STARPURM_STARPU_HAVE_WORKER_CALLBACKS
  57. enum e_starpurm_event
  58. {
  59. starpurm_event_code_min = 0,
  60. starpurm_event_exit = 0,
  61. starpurm_event_worker_going_to_sleep = 1,
  62. starpurm_event_worker_waking_up = 2,
  63. starpurm_event_unit_available = 3,
  64. starpurm_event_code_max = 3
  65. };
  66. const char *_starpurm_event_to_str(int event_code)
  67. {
  68. const char *s = NULL;
  69. switch (event_code)
  70. {
  71. case starpurm_event_exit:
  72. s = "starpurm_event_exit";
  73. break;
  74. case starpurm_event_worker_going_to_sleep:
  75. s = "starpurm_event_worker_going_to_sleep";
  76. break;
  77. case starpurm_event_worker_waking_up:
  78. s = "starpurm_event_worker_waking_up";
  79. break;
  80. case starpurm_event_unit_available:
  81. s = "starpurm_event_unit_available";
  82. break;
  83. default:
  84. s = "<unknown starpurm event>";
  85. break;
  86. }
  87. return s;
  88. }
  89. struct s_starpurm_event
  90. {
  91. struct s_starpurm_event *next;
  92. struct s_starpurm_event *prev;
  93. enum e_starpurm_event code;
  94. unsigned int workerid;
  95. };
  96. static void _enqueue_event(struct s_starpurm_event *event)
  97. {
  98. assert(_starpurm != NULL);
  99. assert(_starpurm->state != state_uninitialized);
  100. struct s_starpurm *rm = _starpurm;
  101. assert(event->next == NULL);
  102. assert(event->prev == NULL);
  103. assert(event->code >= starpurm_event_code_min && event->code <= starpurm_event_code_max);
  104. pthread_mutex_lock(&rm->event_list_mutex);
  105. if (rm->event_processing_ended)
  106. {
  107. pthread_mutex_unlock(&rm->event_list_mutex);
  108. return;
  109. }
  110. assert((rm->event_list_head == NULL && rm->event_list_tail == NULL)
  111. || (rm->event_list_head != NULL && rm->event_list_tail != NULL));
  112. if (rm->event_list_head == NULL)
  113. {
  114. rm->event_list_tail = event;
  115. }
  116. else
  117. {
  118. rm->event_list_head->prev = event;
  119. }
  120. event->next = rm->event_list_head;
  121. rm->event_list_head = event;
  122. if (event->code == starpurm_event_exit)
  123. {
  124. rm->event_processing_ended = 1;
  125. int i;
  126. for (i=0; i<rm->nunits; i++)
  127. {
  128. pthread_cond_broadcast(&rm->units[i].unit_available_cond);
  129. }
  130. }
  131. #ifdef STARPURM_VERBOSE
  132. if (event->code != starpurm_event_worker_waking_up)
  133. fprintf(stderr, "%s: event->code=%d('%s'), workerid=%u\n", __func__, event->code, _starpurm_event_to_str(event->code), event->workerid);
  134. #endif
  135. pthread_cond_broadcast(&rm->event_list_cond);
  136. #ifdef STARPURM_HAVE_DLB
  137. if (event->code == starpurm_event_worker_waking_up)
  138. {
  139. int unit_id = rm->worker_unit_ids[event->workerid];
  140. /* if DLB is in use, wait for the unit to become available from the point of view of DLB, before using it */
  141. #ifdef STARPURM_VERBOSE
  142. fprintf(stderr, "%s: event->code=%d('%s'), workerid=%u - waiting\n", __func__, event->code, _starpurm_event_to_str(event->code), event->workerid);
  143. #endif
  144. pthread_cond_wait(&rm->units[unit_id].unit_available_cond, &rm->event_list_mutex);
  145. #ifdef STARPURM_VERBOSE
  146. fprintf(stderr, "%s: event->code=%d('%s'), workerid=%u - wakeup\n", __func__, event->code, _starpurm_event_to_str(event->code), event->workerid);
  147. #endif
  148. }
  149. #endif
  150. pthread_mutex_unlock(&rm->event_list_mutex);
  151. }
  152. static struct s_starpurm_event *_dequeue_event_no_lock(void)
  153. {
  154. struct s_starpurm *rm = _starpurm;
  155. struct s_starpurm_event *event = NULL;
  156. if (rm->event_list_tail != NULL)
  157. {
  158. event = rm->event_list_tail;
  159. if (event->prev == NULL)
  160. {
  161. rm->event_list_head = NULL;
  162. rm->event_list_tail = NULL;
  163. }
  164. else
  165. {
  166. event->prev->next = NULL;
  167. rm->event_list_tail = event->prev;
  168. }
  169. event->prev = NULL;
  170. event->next = NULL;
  171. }
  172. return event;
  173. }
  174. static struct s_starpurm_event *_wait_event_no_lock(void)
  175. {
  176. struct s_starpurm *rm = _starpurm;
  177. while (rm->event_list_head == NULL)
  178. {
  179. pthread_cond_wait(&rm->event_list_cond, &rm->event_list_mutex);
  180. }
  181. struct s_starpurm_event *event = _dequeue_event_no_lock();
  182. return event;
  183. }
  184. /* unused */
  185. static struct s_starpurm_event *_dequeue_event(void)
  186. {
  187. assert(_starpurm != NULL);
  188. assert(_starpurm->state != state_uninitialized);
  189. struct s_starpurm *rm = _starpurm;
  190. pthread_mutex_lock(&rm->event_list_mutex);
  191. struct s_starpurm_event *event = _dequeue_event_no_lock();
  192. pthread_mutex_unlock(&rm->event_list_mutex);
  193. return event;
  194. }
  195. /* unused */
  196. static struct s_starpurm_event *_wait_event(void)
  197. {
  198. assert(_starpurm != NULL);
  199. assert(_starpurm->state != state_uninitialized);
  200. struct s_starpurm *rm = _starpurm;
  201. pthread_mutex_lock(&rm->event_list_mutex);
  202. struct s_starpurm_event *event = _wait_event_no_lock();
  203. pthread_mutex_unlock(&rm->event_list_mutex);
  204. return event;
  205. }
  206. static void _enqueue_exit_event(void)
  207. {
  208. struct s_starpurm_event *event = calloc(1, sizeof(*event));
  209. event->code = starpurm_event_exit;
  210. event->workerid = 0;
  211. _enqueue_event(event);
  212. }
  213. static void callback_worker_going_to_sleep(unsigned workerid)
  214. {
  215. struct s_starpurm_event *event = calloc(1, sizeof(*event));
  216. event->code = starpurm_event_worker_going_to_sleep;
  217. event->workerid = workerid;
  218. _enqueue_event(event);
  219. }
  220. static void callback_worker_waking_up(unsigned workerid)
  221. {
  222. struct s_starpurm_event *event = calloc(1, sizeof(*event));
  223. event->code = starpurm_event_worker_waking_up;
  224. event->workerid = workerid;
  225. _enqueue_event(event);
  226. }
  227. void starpurm_enqueue_event_cpu_unit_available(int unit_id)
  228. {
  229. assert(_starpurm != NULL);
  230. assert(_starpurm->state != state_uninitialized);
  231. struct s_starpurm *rm = _starpurm;
  232. assert(unit_id >= 0);
  233. /*
  234. * unit_id may exceed the number of CPU units actually used by StarPU,
  235. * if some CPU cores are not used.
  236. *
  237. * //assert(unit_id < rm->nunits_by_type[starpurm_unit_cpu]);
  238. */
  239. unsigned workerid = rm->units[unit_id].workerid; struct
  240. s_starpurm_event *event = calloc(1, sizeof(*event));
  241. event->code = starpurm_event_unit_available; event->workerid =
  242. workerid; _enqueue_event(event); }
  243. static void *event_thread_func(void *_arg)
  244. {
  245. (void)_arg;
  246. assert(_starpurm != NULL);
  247. assert(_starpurm->state != state_uninitialized);
  248. struct s_starpurm *rm = _starpurm;
  249. int need_refresh = 0;
  250. pthread_mutex_lock(&rm->event_list_mutex);
  251. while (rm->event_processing_enabled == 0)
  252. {
  253. pthread_cond_wait(&rm->event_processing_cond, &rm->event_list_mutex);
  254. }
  255. pthread_mutex_unlock(&rm->event_list_mutex);
  256. hwloc_cpuset_t owned_cpuset = hwloc_bitmap_dup(rm->global_cpuset);
  257. hwloc_cpuset_t to_reclaim_cpuset = hwloc_bitmap_alloc();
  258. hwloc_cpuset_t to_lend_cpuset = hwloc_bitmap_alloc();
  259. while (1)
  260. {
  261. struct s_starpurm_event *event = _dequeue_event();
  262. #ifdef STARPURM_HAVE_DLB
  263. if ((event == NULL || event->code == starpurm_event_exit) || need_refresh)
  264. #else
  265. if ((event == NULL || event->code == starpurm_event_exit) && need_refresh)
  266. #endif
  267. {
  268. int did_lend_cpuset = 1;
  269. #ifdef STARPURM_HAVE_DLB
  270. /* notify DLB about changes */
  271. if (!hwloc_bitmap_iszero(to_reclaim_cpuset))
  272. {
  273. starpurm_dlb_notify_starpu_worker_mask_waking_up(to_reclaim_cpuset);
  274. }
  275. did_lend_cpuset = 0;
  276. if (!hwloc_bitmap_iszero(to_lend_cpuset))
  277. {
  278. did_lend_cpuset = starpurm_dlb_notify_starpu_worker_mask_going_to_sleep(to_lend_cpuset);
  279. }
  280. #endif
  281. /* if DLB is not initialized, ignore lend operations */
  282. if (did_lend_cpuset)
  283. {
  284. hwloc_bitmap_andnot(owned_cpuset, owned_cpuset, to_lend_cpuset);
  285. }
  286. hwloc_bitmap_or(owned_cpuset, owned_cpuset, to_reclaim_cpuset);
  287. #if 0
  288. {
  289. char *to_lend_str = bitmap_to_str(to_lend_cpuset);
  290. char *to_reclaim_str = bitmap_to_str(to_reclaim_cpuset);
  291. free(to_lend_str);
  292. free(to_reclaim_str);
  293. }
  294. #endif
  295. need_refresh = 0;
  296. hwloc_bitmap_zero(to_lend_cpuset);
  297. hwloc_bitmap_zero(to_reclaim_cpuset);
  298. }
  299. if (event == NULL)
  300. {
  301. event = _wait_event();
  302. }
  303. if (event->code == starpurm_event_exit)
  304. {
  305. free(event);
  306. break;
  307. }
  308. /* TODO: accumulate state change */
  309. switch (event->code)
  310. {
  311. case starpurm_event_worker_going_to_sleep:
  312. {
  313. if (event->workerid < rm->nunits)
  314. {
  315. int unit_id = rm->worker_unit_ids[event->workerid];
  316. hwloc_bitmap_or(to_lend_cpuset, to_lend_cpuset, rm->units[unit_id].worker_cpuset);
  317. hwloc_bitmap_andnot(to_reclaim_cpuset, to_reclaim_cpuset, rm->units[unit_id].worker_cpuset);
  318. }
  319. }
  320. break;
  321. case starpurm_event_worker_waking_up:
  322. {
  323. if (event->workerid < rm->nunits)
  324. {
  325. int unit_id = rm->worker_unit_ids[event->workerid];
  326. hwloc_bitmap_andnot(to_lend_cpuset, to_lend_cpuset, rm->units[unit_id].worker_cpuset);
  327. #ifdef STARPURM_HAVE_DLB
  328. if (rm->units[unit_id].type == starpurm_unit_cpu && !hwloc_bitmap_intersects(rm->units[unit_id].worker_cpuset, owned_cpuset))
  329. {
  330. /* Only reclaim the unit from DLB if StarPU does not own it already. */
  331. hwloc_bitmap_or(to_reclaim_cpuset, to_reclaim_cpuset, rm->units[unit_id].worker_cpuset);
  332. }
  333. else
  334. {
  335. pthread_cond_broadcast(&rm->units[unit_id].unit_available_cond);
  336. }
  337. #else
  338. hwloc_bitmap_or(to_reclaim_cpuset, to_reclaim_cpuset, rm->units[unit_id].worker_cpuset);
  339. #endif
  340. }
  341. }
  342. break;
  343. #ifdef STARPURM_HAVE_DLB
  344. case starpurm_event_unit_available:
  345. {
  346. if (event->workerid < rm->nunits)
  347. {
  348. /* a reclaimed unit is now available from DLB, unlock the corresponding worker waking up */
  349. int unit_id = rm->worker_unit_ids[event->workerid];
  350. pthread_cond_broadcast(&rm->units[unit_id].unit_available_cond);
  351. }
  352. }
  353. break;
  354. #endif
  355. default:
  356. /* unknown event code */
  357. assert(0);
  358. break;
  359. }
  360. free(event);
  361. need_refresh = 1;
  362. }
  363. pthread_mutex_lock(&rm->event_list_mutex);
  364. /* exit event should be last */
  365. assert(rm->event_list_head == NULL);
  366. assert(rm->event_list_tail == NULL);
  367. hwloc_bitmap_free(owned_cpuset);
  368. hwloc_bitmap_free(to_reclaim_cpuset);
  369. hwloc_bitmap_free(to_lend_cpuset);
  370. pthread_mutex_unlock(&rm->event_list_mutex);
  371. return NULL;
  372. }
  373. #endif /* STARPURM_STARPU_HAVE_WORKER_CALLBACKS */
  374. /* Resource enforcement */
  375. static starpurm_drs_ret_t _starpurm_update_cpuset(hwloc_cpuset_t cpuset)
  376. {
  377. assert(_starpurm != NULL);
  378. assert(_starpurm->state != state_uninitialized);
  379. struct s_starpurm *rm = _starpurm;
  380. if (hwloc_bitmap_isequal(cpuset, rm->selected_cpuset))
  381. {
  382. return starpurm_DRS_SUCCESS;
  383. }
  384. pthread_mutex_lock(&rm->temporary_ctxs_mutex);
  385. if (rm->starpu_in_pause)
  386. {
  387. starpu_resume();
  388. rm->starpu_in_pause = 0;
  389. }
  390. int workers_to_remove[_starpurm->nunits];
  391. unsigned nworkers_to_remove = 0;
  392. int workers_to_add[_starpurm->nunits];
  393. unsigned nworkers_to_add = 0;
  394. int i;
  395. hwloc_cpuset_t temp_cpuset = hwloc_bitmap_alloc();
  396. int new_selected_ncpus = 0;
  397. for (i=0; i<rm->nunits; i++)
  398. {
  399. struct s_starpurm_unit *unit = &rm->units[i];
  400. hwloc_bitmap_and(temp_cpuset, unit->worker_cpuset, cpuset);
  401. if (hwloc_bitmap_iszero(temp_cpuset))
  402. {
  403. workers_to_remove[nworkers_to_remove] = unit->workerid;
  404. unit->selected = 0;
  405. nworkers_to_remove++;
  406. }
  407. else
  408. {
  409. workers_to_add[nworkers_to_add] = unit->workerid;
  410. unit->selected = 1;
  411. nworkers_to_add++;
  412. if (unit->type == starpurm_unit_cpu)
  413. {
  414. new_selected_ncpus++;
  415. }
  416. }
  417. }
  418. hwloc_bitmap_free(temp_cpuset);
  419. rm->selected_nworkers = nworkers_to_add;
  420. rm->selected_ncpus = new_selected_ncpus;
  421. hwloc_bitmap_free(rm->selected_cpuset);
  422. rm->selected_cpuset = hwloc_bitmap_dup(cpuset);
  423. if (nworkers_to_add > 0)
  424. {
  425. #if defined(STARPURM_HAVE_DLB) && !defined(STARPURM_STARPU_HAVE_WORKER_CALLBACKS)
  426. {
  427. /* if StarPU worker callbacks are not enabled, we still
  428. * notify DLB about resource usage changes, but we do
  429. * not wait for the formal DLB go to use the units */
  430. hwloc_cpuset_t to_reclaim_cpuset = hwloc_bitmap_alloc();
  431. for (i=0; i<nworkers_to_add; i++)
  432. {
  433. int unit_id = rm->worker_unit_ids[workers_to_add[i]];
  434. hwloc_bitmap_or(to_reclaim_cpuset, to_reclaim_cpuset, rm->units[unit_id].worker_cpuset);
  435. }
  436. starpurm_dlb_notify_starpu_worker_mask_waking_up(to_reclaim_cpuset);
  437. hwloc_bitmap_free(to_reclaim_cpuset);
  438. }
  439. #endif
  440. starpu_sched_ctx_add_workers(workers_to_add, nworkers_to_add, rm->sched_ctx_id);
  441. }
  442. if (nworkers_to_remove > 0)
  443. {
  444. starpu_sched_ctx_remove_workers(workers_to_remove, nworkers_to_remove, rm->sched_ctx_id);
  445. #if defined(STARPURM_HAVE_DLB) && !defined(STARPURM_STARPU_HAVE_WORKER_CALLBACKS)
  446. {
  447. /* if StarPU worker callbacks are not enabled, we still
  448. * notify DLB about resource usage changes, but we do
  449. * not wait for the workers to become idle */
  450. hwloc_cpuset_t to_lend_cpuset = hwloc_bitmap_alloc();
  451. for (i=0; i<nworkers_to_remove; i++)
  452. {
  453. int unit_id = rm->worker_unit_ids[workers_to_remove[i]];
  454. hwloc_bitmap_or(to_lend_cpuset, to_lend_cpuset, rm->units[unit_id].worker_cpuset);
  455. }
  456. starpurm_dlb_notify_starpu_worker_mask_going_to_sleep(to_lend_cpuset);
  457. hwloc_bitmap_free(to_lend_cpuset);
  458. }
  459. #endif
  460. }
  461. #ifdef _DEBUG
  462. starpu_sched_ctx_display_workers(rm->sched_ctx_id, stderr);
  463. #endif /* DEBUG */
  464. if (rm->selected_nworkers == 0 && rm->avail_temporary_ctxs == rm->max_temporary_ctxs)
  465. {
  466. rm->starpu_in_pause = 1;
  467. starpu_pause();
  468. }
  469. pthread_mutex_unlock(&rm->temporary_ctxs_mutex);
  470. return starpurm_DRS_SUCCESS;
  471. }
  472. static unsigned _starpurm_temporary_context_alloc(hwloc_cpuset_t cpuset)
  473. {
  474. assert(_starpurm != NULL);
  475. assert(_starpurm->state != state_uninitialized);
  476. assert(_starpurm->max_temporary_ctxs > 0);
  477. struct s_starpurm *rm = _starpurm;
  478. pthread_mutex_lock(&rm->temporary_ctxs_mutex);
  479. while(rm->avail_temporary_ctxs == 0)
  480. {
  481. pthread_cond_wait(&rm->temporary_ctxs_cond, &rm->temporary_ctxs_mutex);
  482. }
  483. assert(rm->avail_temporary_ctxs > 0);
  484. rm->avail_temporary_ctxs--;
  485. if (rm->starpu_in_pause)
  486. {
  487. starpu_resume();
  488. rm->starpu_in_pause = 0;
  489. }
  490. pthread_mutex_unlock(&rm->temporary_ctxs_mutex);
  491. unsigned sched_ctx_id = starpu_sched_ctx_create(NULL, -1, "starpurm_temp", STARPU_SCHED_CTX_POLICY_NAME, "eager", 0);
  492. assert(sched_ctx_id != STARPU_NMAX_SCHED_CTXS);
  493. int workers_to_remove[_starpurm->nunits];
  494. unsigned nworkers_to_remove = 0;
  495. int workers_to_add[_starpurm->nunits];
  496. unsigned nworkers_to_add = 0;
  497. int i;
  498. hwloc_cpuset_t temp_cpuset = hwloc_bitmap_alloc();
  499. for (i=0; i<rm->nunits; i++)
  500. {
  501. struct s_starpurm_unit *unit = &rm->units[i];
  502. hwloc_bitmap_and(temp_cpuset, unit->worker_cpuset, cpuset);
  503. if (hwloc_bitmap_iszero(temp_cpuset))
  504. {
  505. workers_to_remove[nworkers_to_remove] = unit->workerid;
  506. nworkers_to_remove++;
  507. }
  508. else
  509. {
  510. workers_to_add[nworkers_to_add] = unit->workerid;
  511. nworkers_to_add++;
  512. }
  513. }
  514. hwloc_bitmap_free(temp_cpuset);
  515. if (nworkers_to_add > 0)
  516. starpu_sched_ctx_add_workers(workers_to_add, nworkers_to_add, sched_ctx_id);
  517. if (nworkers_to_remove > 0)
  518. starpu_sched_ctx_remove_workers(workers_to_remove, nworkers_to_remove, sched_ctx_id);
  519. #ifdef _DEBUG
  520. starpu_sched_ctx_display_workers(sched_ctx_id, stderr);
  521. #endif /* DEBUG */
  522. return sched_ctx_id;
  523. }
  524. static void _starpurm_temporary_context_free(unsigned ctx)
  525. {
  526. assert(_starpurm != NULL);
  527. assert(_starpurm->state != state_uninitialized);
  528. assert(_starpurm->max_temporary_ctxs > 0);
  529. struct s_starpurm *rm = _starpurm;
  530. starpu_sched_ctx_delete(ctx);
  531. pthread_mutex_lock(&rm->temporary_ctxs_mutex);
  532. rm->avail_temporary_ctxs++;
  533. pthread_cond_signal(&rm->temporary_ctxs_cond);
  534. if (rm->selected_nworkers == 0 && rm->avail_temporary_ctxs == rm->max_temporary_ctxs)
  535. {
  536. rm->starpu_in_pause = 1;
  537. starpu_pause();
  538. }
  539. pthread_mutex_unlock(&rm->temporary_ctxs_mutex);
  540. }
  541. static starpurm_drs_ret_t _starpurm_set_ncpus(unsigned int ncpus)
  542. {
  543. assert(_starpurm != NULL);
  544. assert(_starpurm->state != state_uninitialized);
  545. struct s_starpurm *rm = _starpurm;
  546. int i;
  547. if (ncpus > rm->nunits_by_type[starpurm_unit_cpu])
  548. {
  549. ncpus = rm->nunits_by_type[starpurm_unit_cpu];
  550. }
  551. if (ncpus == rm->selected_ncpus)
  552. {
  553. return starpurm_DRS_SUCCESS;
  554. }
  555. pthread_mutex_lock(&rm->temporary_ctxs_mutex);
  556. if (rm->starpu_in_pause)
  557. {
  558. starpu_resume();
  559. rm->starpu_in_pause = 0;
  560. }
  561. int workers_to_remove[_starpurm->nunits];
  562. unsigned nworkers_to_remove = 0;
  563. int workers_to_add[_starpurm->nunits];
  564. unsigned nworkers_to_add = 0;
  565. for (i=0; i<rm->nunits; i++)
  566. {
  567. struct s_starpurm_unit *unit = &rm->units[i];
  568. if (unit->type != starpurm_unit_cpu)
  569. continue;
  570. if (nworkers_to_add < ncpus)
  571. {
  572. workers_to_add[nworkers_to_add] = unit->workerid;
  573. unit->selected = 1;
  574. nworkers_to_add++;
  575. hwloc_bitmap_or(rm->selected_cpuset, rm->selected_cpuset, unit->worker_cpuset);
  576. }
  577. else
  578. {
  579. workers_to_remove[nworkers_to_remove] = unit->workerid;
  580. unit->selected = 0;
  581. hwloc_bitmap_andnot(rm->selected_cpuset, rm->selected_cpuset, unit->worker_cpuset);
  582. nworkers_to_remove++;
  583. }
  584. }
  585. rm->selected_nworkers = nworkers_to_add;
  586. rm->selected_ncpus = nworkers_to_add;
  587. if (nworkers_to_add > 0)
  588. starpu_sched_ctx_add_workers(workers_to_add, nworkers_to_add, rm->sched_ctx_id);
  589. if (nworkers_to_remove > 0)
  590. starpu_sched_ctx_remove_workers(workers_to_remove, nworkers_to_remove, rm->sched_ctx_id);
  591. #if def_DEBUG
  592. starpu_sched_ctx_display_workers(rm->sched_ctx_id, stderr);
  593. #endif /* DEBUG */
  594. if (rm->selected_nworkers == 0 && rm->avail_temporary_ctxs == rm->max_temporary_ctxs)
  595. {
  596. rm->starpu_in_pause = 1;
  597. starpu_pause();
  598. }
  599. pthread_mutex_unlock(&rm->temporary_ctxs_mutex);
  600. return starpurm_DRS_SUCCESS;
  601. }
  602. /* Initialize rm state for StarPU */
  603. void starpurm_initialize_with_cpuset(const hwloc_cpuset_t initially_owned_cpuset)
  604. {
  605. int ret;
  606. assert(_starpurm == NULL);
  607. struct s_starpurm *rm = calloc(1, sizeof(*rm));
  608. pthread_mutex_init(&rm->temporary_ctxs_mutex, NULL);
  609. pthread_cond_init(&rm->temporary_ctxs_cond, NULL);
  610. rm->state = state_init;
  611. /* init hwloc objects */
  612. hwloc_topology_init(&rm->topology);
  613. hwloc_topology_load(rm->topology);
  614. rm->global_cpuset = hwloc_bitmap_alloc();
  615. hwloc_bitmap_zero(rm->global_cpuset);
  616. rm->initially_owned_cpuset_mask = hwloc_bitmap_dup(initially_owned_cpuset);
  617. rm->all_cpu_workers_cpuset = hwloc_bitmap_alloc();
  618. hwloc_bitmap_zero(rm->all_cpu_workers_cpuset);
  619. rm->all_opencl_device_workers_cpuset = hwloc_bitmap_alloc();
  620. hwloc_bitmap_zero(rm->all_opencl_device_workers_cpuset);
  621. rm->all_cuda_device_workers_cpuset = hwloc_bitmap_alloc();
  622. hwloc_bitmap_zero(rm->all_cuda_device_workers_cpuset);
  623. rm->all_device_workers_cpuset = hwloc_bitmap_alloc();
  624. hwloc_bitmap_zero(rm->all_device_workers_cpuset);
  625. /* init event list, before StarPU is initialized */
  626. pthread_mutex_init(&rm->event_list_mutex, NULL);
  627. pthread_cond_init(&rm->event_list_cond, NULL);
  628. pthread_cond_init(&rm->event_processing_cond, NULL);
  629. pthread_mutex_lock(&rm->event_list_mutex);
  630. rm->event_processing_enabled = 0;
  631. rm->event_processing_ended = 0;
  632. rm->event_list_head = NULL;
  633. rm->event_list_tail = NULL;
  634. pthread_mutex_unlock(&rm->event_list_mutex);
  635. /* set _starpurm here since StarPU's callbacks may reference it once starpu_init is called */
  636. _starpurm = rm;
  637. #ifdef STARPURM_STARPU_HAVE_WORKER_CALLBACKS
  638. /* launch event thread */
  639. ret = pthread_create(&rm->event_thread, NULL, event_thread_func, rm);
  640. assert(ret == 0);
  641. #endif
  642. /* init StarPU */
  643. struct starpu_conf starpu_conf;
  644. ret = starpu_conf_init(&starpu_conf);
  645. assert(ret == 0);
  646. #ifdef STARPURM_STARPU_HAVE_WORKER_CALLBACKS
  647. starpu_conf.callback_worker_going_to_sleep = callback_worker_going_to_sleep;
  648. starpu_conf.callback_worker_waking_up = callback_worker_waking_up;
  649. #endif
  650. ret = starpu_init(&starpu_conf);
  651. assert(ret == 0);
  652. /* init any worker objects */
  653. rm->nunits = starpu_worker_get_count_by_type(STARPU_ANY_WORKER);
  654. /* init device worker objects */
  655. rm->unit_ntypes = starpurm_unit_ntypes;
  656. rm->nunits_by_type = calloc(rm->unit_ntypes, sizeof(*rm->nunits_by_type));
  657. rm->unit_offsets_by_type = calloc(rm->unit_ntypes, sizeof(*rm->unit_offsets_by_type));
  658. const int cpu_nunits = starpu_worker_get_count_by_type(STARPU_CPU_WORKER);
  659. rm->nunits_by_type[starpurm_unit_cpu] = cpu_nunits;
  660. const int opencl_nunits = starpu_worker_get_count_by_type(STARPU_OPENCL_WORKER);
  661. rm->nunits_by_type[starpurm_unit_opencl] = opencl_nunits;
  662. const int cuda_nunits = starpu_worker_get_count_by_type(STARPU_CUDA_WORKER);
  663. rm->nunits_by_type[starpurm_unit_cuda] = cuda_nunits;
  664. const int nunits = cpu_nunits + opencl_nunits + cuda_nunits;
  665. rm->nunits = nunits;
  666. rm->units = calloc(nunits, sizeof(*rm->units));
  667. int unitid = 0;
  668. int cpu_workerids[cpu_nunits];
  669. starpu_worker_get_ids_by_type(STARPU_CPU_WORKER, cpu_workerids, cpu_nunits);
  670. rm->unit_offsets_by_type[starpurm_unit_cpu] = unitid;
  671. unsigned int max_worker_id = 0;
  672. int i;
  673. for (i = 0; i < cpu_nunits; i++)
  674. {
  675. rm->units[unitid].id = unitid;
  676. rm->units[unitid].type = starpurm_unit_cpu;
  677. rm->units[unitid].selected = 1; /* enabled by default */
  678. rm->units[unitid].workerid = cpu_workerids[i];
  679. if (max_worker_id < rm->units[unitid].workerid)
  680. {
  681. max_worker_id = rm->units[unitid].workerid;
  682. }
  683. rm->units[unitid].worker_cpuset = starpu_worker_get_hwloc_cpuset(rm->units[unitid].workerid);
  684. pthread_cond_init(&rm->units[unitid].unit_available_cond, NULL);
  685. hwloc_bitmap_or(rm->global_cpuset, rm->global_cpuset, rm->units[unitid].worker_cpuset);
  686. hwloc_bitmap_or(rm->all_cpu_workers_cpuset, rm->all_cpu_workers_cpuset, rm->units[unitid].worker_cpuset);;
  687. #ifdef STARPURM_VERBOSE
  688. {
  689. char * s_unit = NULL;
  690. hwloc_bitmap_asprintf(&s_unit, rm->units[unitid].worker_cpuset);
  691. fprintf(stderr, "%s: 'cpu', unitid=%d, cpuset=0x%s, workerid=%d\n", __func__, unitid, s_unit, rm->units[unitid].workerid);
  692. free(s_unit);
  693. }
  694. #endif
  695. unitid++;
  696. }
  697. int opencl_workerids[opencl_nunits];
  698. starpu_worker_get_ids_by_type(STARPU_OPENCL_WORKER, opencl_workerids, opencl_nunits);
  699. rm->unit_offsets_by_type[starpurm_unit_opencl] = unitid;
  700. for (i = 0; i < opencl_nunits; i++)
  701. {
  702. rm->units[unitid].id = unitid;
  703. rm->units[unitid].type = starpurm_unit_opencl;
  704. rm->units[unitid].selected = 1; /* enabled by default */
  705. rm->units[unitid].workerid = opencl_workerids[i];
  706. if (max_worker_id < rm->units[unitid].workerid)
  707. {
  708. max_worker_id = rm->units[unitid].workerid;
  709. }
  710. rm->units[unitid].worker_cpuset = starpu_worker_get_hwloc_cpuset(rm->units[unitid].workerid);
  711. pthread_cond_init(&rm->units[unitid].unit_available_cond, NULL);
  712. hwloc_bitmap_or(rm->global_cpuset, rm->global_cpuset, rm->units[unitid].worker_cpuset);
  713. hwloc_bitmap_or(rm->all_opencl_device_workers_cpuset, rm->all_opencl_device_workers_cpuset, rm->units[unitid].worker_cpuset);
  714. hwloc_bitmap_or(rm->all_device_workers_cpuset, rm->all_device_workers_cpuset, rm->units[unitid].worker_cpuset);
  715. unitid++;
  716. }
  717. int cuda_workerids[opencl_nunits];
  718. starpu_worker_get_ids_by_type(STARPU_CUDA_WORKER, cuda_workerids, cuda_nunits);
  719. rm->unit_offsets_by_type[starpurm_unit_cuda] = unitid;
  720. for (i = 0; i < cuda_nunits; i++)
  721. {
  722. rm->units[unitid].id = unitid;
  723. rm->units[unitid].type = starpurm_unit_cuda;
  724. rm->units[unitid].selected = 1; /* enabled by default */
  725. rm->units[unitid].workerid = cuda_workerids[i];
  726. if (max_worker_id < rm->units[unitid].workerid)
  727. {
  728. max_worker_id = rm->units[unitid].workerid;
  729. }
  730. rm->units[unitid].worker_cpuset = starpu_worker_get_hwloc_cpuset(rm->units[unitid].workerid);
  731. pthread_cond_init(&rm->units[unitid].unit_available_cond, NULL);
  732. hwloc_bitmap_or(rm->global_cpuset, rm->global_cpuset, rm->units[unitid].worker_cpuset);
  733. hwloc_bitmap_or(rm->all_cuda_device_workers_cpuset, rm->all_cuda_device_workers_cpuset, rm->units[unitid].worker_cpuset);
  734. hwloc_bitmap_or(rm->all_device_workers_cpuset, rm->all_device_workers_cpuset, rm->units[unitid].worker_cpuset);
  735. unitid++;
  736. }
  737. rm->max_worker_id = max_worker_id;
  738. {
  739. int *worker_unit_ids = malloc((max_worker_id+1) * sizeof(*worker_unit_ids));
  740. for (i = 0; i < max_worker_id+1; i++)
  741. {
  742. worker_unit_ids[i] = -1;
  743. }
  744. for (i=0; i<rm->nunits; i++)
  745. {
  746. worker_unit_ids[rm->units[i].workerid] = i;
  747. }
  748. rm->worker_unit_ids = worker_unit_ids;
  749. }
  750. /* create StarPU sched_ctx for RM instance */
  751. {
  752. int workerids[rm->nunits];
  753. starpu_worker_get_ids_by_type(STARPU_ANY_WORKER, workerids, rm->nunits);
  754. /* TODO: make sched_ctx policy configurable */
  755. rm->sched_ctx_id = starpu_sched_ctx_create(workerids, rm->nunits, "starpurm", STARPU_SCHED_CTX_POLICY_NAME, "eager", 0);
  756. #ifdef _DEBUG
  757. starpu_sched_ctx_display_workers(rm->sched_ctx_id, stderr);
  758. #endif /* DEBUG */
  759. }
  760. starpu_sched_ctx_set_context(&rm->sched_ctx_id);
  761. /* number selected workers (total) */
  762. rm->selected_nworkers = rm->nunits;
  763. /* number of selected CPUs workers */
  764. rm->selected_ncpus = rm->nunits_by_type[starpurm_unit_cpu];
  765. /* cpuset of all currently selected workers */
  766. rm->selected_cpuset = hwloc_bitmap_dup(rm->global_cpuset);
  767. if (STARPU_NMAX_SCHED_CTXS > 2)
  768. {
  769. /* account for main ctx (0) and default rm ctx (1)
  770. * TODO: check that no other ctxs are allocated by external codes */
  771. rm->max_temporary_ctxs = STARPU_NMAX_SCHED_CTXS - 2;
  772. }
  773. else
  774. {
  775. rm->max_temporary_ctxs = 0;
  776. }
  777. rm->avail_temporary_ctxs = rm->max_temporary_ctxs;
  778. if (rm->selected_nworkers == 0)
  779. {
  780. rm->starpu_in_pause = 1;
  781. starpu_pause();
  782. }
  783. else
  784. {
  785. rm->starpu_in_pause = 0;
  786. }
  787. #ifdef STARPURM_HAVE_DLB
  788. starpurm_dlb_init(rm);
  789. #endif
  790. pthread_mutex_lock(&rm->event_list_mutex);
  791. rm->event_processing_enabled = 1;
  792. pthread_cond_broadcast(&rm->event_processing_cond);
  793. pthread_mutex_unlock(&rm->event_list_mutex);
  794. _starpurm = rm;
  795. }
  796. void starpurm_initialize()
  797. {
  798. hwloc_cpuset_t full_cpuset = hwloc_bitmap_alloc_full();
  799. starpurm_initialize_with_cpuset(full_cpuset);
  800. hwloc_bitmap_free(full_cpuset);
  801. }
  802. /* Free rm struct for StarPU */
  803. void starpurm_shutdown(void)
  804. {
  805. assert(_starpurm != NULL);
  806. assert(_starpurm->state != state_uninitialized);
  807. struct s_starpurm *rm = _starpurm;
  808. if (rm->starpu_in_pause)
  809. {
  810. starpu_resume();
  811. rm->starpu_in_pause = 0;
  812. }
  813. starpu_sched_ctx_delete(rm->sched_ctx_id);
  814. #ifdef STARPURM_STARPU_HAVE_WORKER_CALLBACKS
  815. _enqueue_exit_event();
  816. #endif
  817. starpu_shutdown();
  818. #ifdef STARPURM_HAVE_DLB
  819. starpurm_dlb_exit();
  820. #endif
  821. hwloc_topology_destroy(rm->topology);
  822. #ifdef STARPURM_STARPU_HAVE_WORKER_CALLBACKS
  823. pthread_join(rm->event_thread, NULL);
  824. #endif
  825. assert(rm->event_list_head == NULL);
  826. assert(rm->event_list_tail == NULL);
  827. pthread_cond_destroy(&rm->event_list_cond);
  828. pthread_mutex_destroy(&rm->event_list_mutex);
  829. rm->state = state_uninitialized;
  830. hwloc_bitmap_free(rm->global_cpuset);
  831. hwloc_bitmap_free(rm->all_cpu_workers_cpuset);
  832. hwloc_bitmap_free(rm->all_opencl_device_workers_cpuset);
  833. hwloc_bitmap_free(rm->all_cuda_device_workers_cpuset);
  834. hwloc_bitmap_free(rm->all_device_workers_cpuset);
  835. hwloc_bitmap_free(rm->selected_cpuset);
  836. hwloc_bitmap_free(rm->initially_owned_cpuset_mask);
  837. int i;
  838. for (i=0; i<rm->nunits; i++)
  839. {
  840. pthread_cond_destroy(&rm->units[i].unit_available_cond);
  841. }
  842. free(rm->units);
  843. rm->units = NULL;
  844. free(rm->nunits_by_type);
  845. rm->nunits_by_type = NULL;
  846. free(rm->unit_offsets_by_type);
  847. rm->unit_offsets_by_type = NULL;
  848. free(rm);
  849. _starpurm = NULL;
  850. }
  851. void starpurm_spawn_kernel_on_cpus(void *data, void(*f)(void *), void *args, hwloc_cpuset_t cpuset)
  852. {
  853. (void) data;
  854. assert(_starpurm != NULL);
  855. assert(_starpurm->state != state_uninitialized);
  856. struct s_starpurm *rm = _starpurm;
  857. unsigned ctx = _starpurm_temporary_context_alloc(cpuset);
  858. starpu_sched_ctx_set_context(&ctx);
  859. f(args);
  860. starpu_sched_ctx_set_context(&rm->sched_ctx_id);
  861. _starpurm_temporary_context_free(ctx);
  862. }
  863. struct s_starpurm__spawn_args
  864. {
  865. void(*f)(void *);
  866. void *args;
  867. void(*cb_f)(void *);
  868. void *cb_args;
  869. hwloc_cpuset_t cpuset;
  870. };
  871. static void *_starpurm_spawn_kernel_thread(void *_spawn_args)
  872. {
  873. struct s_starpurm__spawn_args *spawn_args = _spawn_args;
  874. unsigned ctx = _starpurm_temporary_context_alloc(spawn_args->cpuset);
  875. starpu_sched_ctx_set_context(&ctx);
  876. spawn_args->f(spawn_args->args);
  877. struct s_starpurm *rm = _starpurm;
  878. starpu_sched_ctx_set_context(&rm->sched_ctx_id);
  879. _starpurm_temporary_context_free(ctx);
  880. spawn_args->cb_f(spawn_args->cb_args);
  881. hwloc_bitmap_free(spawn_args->cpuset);
  882. free(spawn_args);
  883. return NULL;
  884. }
  885. void starpurm_spawn_kernel_on_cpus_callback(void *data, void(*f)(void *), void *args, hwloc_cpuset_t cpuset, void(*cb_f)(void *), void *cb_args)
  886. {
  887. (void) data;
  888. struct s_starpurm__spawn_args *spawn_args = calloc(1, sizeof(*spawn_args));
  889. spawn_args->f = f;
  890. spawn_args->args = args;
  891. spawn_args->cb_f = cb_f;
  892. spawn_args->cb_args = cb_args;
  893. spawn_args->cpuset = hwloc_bitmap_dup(cpuset);
  894. pthread_attr_t attr;
  895. int ret;
  896. ret = pthread_attr_init(&attr);
  897. assert(ret == 0);
  898. ret = pthread_attr_setdetachstate(&attr, 1);
  899. assert(ret == 0);
  900. pthread_t t;
  901. ret = pthread_create(&t, &attr, _starpurm_spawn_kernel_thread, spawn_args);
  902. assert(ret == 0);
  903. }
  904. static void *_starpurm_spawn_kernel_in_default_context_thread(void *_spawn_args)
  905. {
  906. struct s_starpurm__spawn_args *spawn_args = _spawn_args;
  907. struct s_starpurm *rm = _starpurm;
  908. starpu_sched_ctx_set_context(&rm->sched_ctx_id);
  909. spawn_args->f(spawn_args->args);
  910. spawn_args->cb_f(spawn_args->cb_args);
  911. free(spawn_args);
  912. return NULL;
  913. }
  914. void starpurm_spawn_kernel_callback(void *data, void(*f)(void *), void *args, void(*cb_f)(void *), void *cb_args)
  915. {
  916. (void) data;
  917. struct s_starpurm__spawn_args *spawn_args = calloc(1, sizeof(*spawn_args));
  918. spawn_args->f = f;
  919. spawn_args->args = args;
  920. spawn_args->cb_f = cb_f;
  921. spawn_args->cb_args = cb_args;
  922. pthread_attr_t attr;
  923. int ret;
  924. ret = pthread_attr_init(&attr);
  925. assert(ret == 0);
  926. ret = pthread_attr_setdetachstate(&attr, 1);
  927. assert(ret == 0);
  928. pthread_t t;
  929. ret = pthread_create(&t, &attr, _starpurm_spawn_kernel_in_default_context_thread, spawn_args);
  930. assert(ret == 0);
  931. }
  932. hwloc_cpuset_t starpurm_get_unit_cpuset(int unitid)
  933. {
  934. assert(_starpurm != NULL);
  935. assert(_starpurm->state != state_uninitialized);
  936. struct s_starpurm *rm = _starpurm;
  937. assert(unitid >= 0 && unitid < rm->nunits);
  938. return hwloc_bitmap_dup(rm->units[unitid].worker_cpuset);
  939. }
  940. hwloc_cpuset_t starpurm_get_cpu_worker_cpuset(int unit_rank)
  941. {
  942. assert(_starpurm != NULL);
  943. assert(_starpurm->state != state_uninitialized);
  944. struct s_starpurm *rm = _starpurm;
  945. assert(unit_rank >= 0 && unit_rank < rm->nunits_by_type[starpurm_unit_cpu]);
  946. return hwloc_bitmap_dup(rm->units[rm->unit_offsets_by_type[starpurm_unit_cpu] + unit_rank].worker_cpuset);
  947. }
  948. /* Dynamic resource sharing */
  949. starpurm_drs_ret_t starpurm_set_drs_enable(starpurm_drs_desc_t *spd)
  950. {
  951. (void)spd;
  952. assert(_starpurm != NULL);
  953. assert(_starpurm->state != state_uninitialized);
  954. struct s_starpurm *rm = _starpurm;
  955. rm->dynamic_resource_sharing = 1;
  956. return starpurm_DRS_SUCCESS;
  957. }
  958. starpurm_drs_ret_t starpurm_set_drs_disable(starpurm_drs_desc_t *spd)
  959. {
  960. (void)spd;
  961. assert(_starpurm != NULL);
  962. assert(_starpurm->state != state_uninitialized);
  963. struct s_starpurm *rm = _starpurm;
  964. rm->dynamic_resource_sharing = 0;
  965. return starpurm_DRS_SUCCESS;
  966. }
  967. int starpurm_drs_enabled_p(void)
  968. {
  969. assert(_starpurm != NULL);
  970. assert(_starpurm->state != state_uninitialized);
  971. struct s_starpurm *rm = _starpurm;
  972. return rm->dynamic_resource_sharing;
  973. }
  974. starpurm_drs_ret_t starpurm_set_max_parallelism(starpurm_drs_desc_t *spd, int ncpus)
  975. {
  976. (void)spd;
  977. assert(_starpurm != NULL);
  978. assert(_starpurm->state != state_uninitialized);
  979. struct s_starpurm *rm = _starpurm;
  980. if (!rm->dynamic_resource_sharing)
  981. return starpurm_DRS_DISABLD;
  982. if (ncpus > rm->nunits_by_type[starpurm_unit_cpu])
  983. {
  984. ncpus = rm->nunits_by_type[starpurm_unit_cpu];
  985. }
  986. rm->max_ncpus = ncpus;
  987. if (rm->selected_ncpus > ncpus)
  988. {
  989. return _starpurm_set_ncpus(ncpus);
  990. }
  991. return starpurm_DRS_SUCCESS;
  992. }
  993. starpurm_drs_ret_t starpurm_callback_set(starpurm_drs_desc_t *spd, starpurm_drs_cbs_t which, starpurm_drs_cb_t callback)
  994. {
  995. (void)spd;
  996. (void)which;
  997. (void)callback;
  998. /* unimplemented */
  999. assert(0);
  1000. return starpurm_DRS_PERM;
  1001. }
  1002. starpurm_drs_ret_t starpurm_callback_get(starpurm_drs_desc_t *spd, starpurm_drs_cbs_t which, starpurm_drs_cb_t *callback)
  1003. {
  1004. (void)spd;
  1005. (void)which;
  1006. (void)callback;
  1007. /* unimplemented */
  1008. assert(0);
  1009. return starpurm_DRS_PERM;
  1010. }
  1011. starpurm_drs_ret_t starpurm_assign_cpu_to_starpu(starpurm_drs_desc_t *spd, int cpuid)
  1012. {
  1013. assert(_starpurm != NULL);
  1014. assert(_starpurm->state != state_uninitialized);
  1015. struct s_starpurm *rm = _starpurm;
  1016. if (!rm->dynamic_resource_sharing)
  1017. return starpurm_DRS_DISABLD;
  1018. starpurm_drs_ret_t ret = 0;
  1019. assert(hwloc_bitmap_isset(rm->global_cpuset, cpuid));
  1020. if (!hwloc_bitmap_isset(rm->selected_cpuset, cpuid))
  1021. {
  1022. hwloc_cpuset_t temp_cpuset = hwloc_bitmap_dup(rm->selected_cpuset);
  1023. hwloc_bitmap_set(temp_cpuset, cpuid);
  1024. ret = _starpurm_update_cpuset(temp_cpuset);
  1025. hwloc_bitmap_free(temp_cpuset);
  1026. }
  1027. return ret;
  1028. }
  1029. starpurm_drs_ret_t starpurm_assign_cpus_to_starpu(starpurm_drs_desc_t *spd, int ncpus)
  1030. {
  1031. (void)spd;
  1032. assert(_starpurm != NULL);
  1033. assert(_starpurm->state != state_uninitialized);
  1034. struct s_starpurm *rm = _starpurm;
  1035. if (!rm->dynamic_resource_sharing)
  1036. return starpurm_DRS_DISABLD;
  1037. /* add ncpus more CPUs to the CPUs pool */
  1038. return _starpurm_set_ncpus(rm->selected_ncpus+ncpus);
  1039. }
  1040. starpurm_drs_ret_t starpurm_assign_cpu_mask_to_starpu(starpurm_drs_desc_t *spd, const hwloc_cpuset_t mask)
  1041. {
  1042. (void)spd;
  1043. assert(_starpurm != NULL);
  1044. assert(_starpurm->state != state_uninitialized);
  1045. struct s_starpurm *rm = _starpurm;
  1046. if (!rm->dynamic_resource_sharing)
  1047. return starpurm_DRS_DISABLD;
  1048. hwloc_cpuset_t temp_cpuset = hwloc_bitmap_dup(rm->selected_cpuset);
  1049. hwloc_bitmap_or(temp_cpuset, temp_cpuset, mask);
  1050. starpurm_drs_ret_t ret = _starpurm_update_cpuset(temp_cpuset);
  1051. hwloc_bitmap_free(temp_cpuset);
  1052. return ret;
  1053. }
  1054. starpurm_drs_ret_t starpurm_assign_all_cpus_to_starpu(starpurm_drs_desc_t *spd)
  1055. {
  1056. assert(_starpurm != NULL);
  1057. assert(_starpurm->state != state_uninitialized);
  1058. struct s_starpurm *rm = _starpurm;
  1059. if (!rm->dynamic_resource_sharing)
  1060. return starpurm_DRS_DISABLD;
  1061. return starpurm_assign_cpus_to_starpu(spd, rm->nunits_by_type[starpurm_unit_cpu]);
  1062. }
  1063. starpurm_drs_ret_t starpurm_withdraw_cpu_from_starpu(starpurm_drs_desc_t *spd, int cpuid)
  1064. {
  1065. assert(_starpurm != NULL);
  1066. assert(_starpurm->state != state_uninitialized);
  1067. struct s_starpurm *rm = _starpurm;
  1068. if (!rm->dynamic_resource_sharing)
  1069. return starpurm_DRS_DISABLD;
  1070. starpurm_drs_ret_t ret = 0;
  1071. assert(hwloc_bitmap_isset(rm->global_cpuset, cpuid));
  1072. if (hwloc_bitmap_isset(rm->selected_cpuset, cpuid))
  1073. {
  1074. hwloc_cpuset_t temp_cpuset = hwloc_bitmap_dup(rm->selected_cpuset);
  1075. hwloc_bitmap_clr(temp_cpuset, cpuid);
  1076. ret = _starpurm_update_cpuset(temp_cpuset);
  1077. hwloc_bitmap_free(temp_cpuset);
  1078. }
  1079. return ret;
  1080. }
  1081. starpurm_drs_ret_t starpurm_withdraw_cpus_from_starpu(starpurm_drs_desc_t *spd, int ncpus)
  1082. {
  1083. (void)spd;
  1084. assert(_starpurm != NULL);
  1085. assert(_starpurm->state != state_uninitialized);
  1086. struct s_starpurm *rm = _starpurm;
  1087. if (!rm->dynamic_resource_sharing)
  1088. return starpurm_DRS_DISABLD;
  1089. /* add ncpus more CPUs to the CPUs pool */
  1090. starpurm_drs_ret_t ret = 0;
  1091. if (ncpus <= rm->nunits_by_type[starpurm_unit_cpu])
  1092. {
  1093. ret = _starpurm_set_ncpus(rm->nunits_by_type[starpurm_unit_cpu]-ncpus);
  1094. }
  1095. else
  1096. {
  1097. ret = _starpurm_set_ncpus(0);
  1098. }
  1099. return ret;
  1100. }
  1101. starpurm_drs_ret_t starpurm_withdraw_cpu_mask_from_starpu(starpurm_drs_desc_t *spd, const hwloc_cpuset_t mask)
  1102. {
  1103. (void)spd;
  1104. assert(_starpurm != NULL);
  1105. assert(_starpurm->state != state_uninitialized);
  1106. struct s_starpurm *rm = _starpurm;
  1107. if (!rm->dynamic_resource_sharing)
  1108. return starpurm_DRS_DISABLD;
  1109. hwloc_cpuset_t temp_cpuset = hwloc_bitmap_dup(rm->selected_cpuset);
  1110. hwloc_bitmap_andnot(temp_cpuset, temp_cpuset, mask);
  1111. starpurm_drs_ret_t ret = _starpurm_update_cpuset(temp_cpuset);
  1112. hwloc_bitmap_free(temp_cpuset);
  1113. return ret;
  1114. }
  1115. starpurm_drs_ret_t starpurm_withdraw_all_cpus_from_starpu(starpurm_drs_desc_t *spd)
  1116. {
  1117. assert(_starpurm != NULL);
  1118. assert(_starpurm->state != state_uninitialized);
  1119. struct s_starpurm *rm = _starpurm;
  1120. if (!rm->dynamic_resource_sharing)
  1121. return starpurm_DRS_DISABLD;
  1122. return starpurm_withdraw_cpus_from_starpu(spd, rm->nunits_by_type[starpurm_unit_cpu]);
  1123. }
  1124. /* --- */
  1125. starpurm_drs_ret_t starpurm_lend_cpu(starpurm_drs_desc_t *spd, int cpuid)
  1126. {
  1127. return starpurm_assign_cpu_to_starpu(spd, cpuid);
  1128. }
  1129. starpurm_drs_ret_t starpurm_lend_cpus(starpurm_drs_desc_t *spd, int ncpus)
  1130. {
  1131. return starpurm_assign_cpus_to_starpu(spd, ncpus);
  1132. }
  1133. starpurm_drs_ret_t starpurm_lend_cpu_mask(starpurm_drs_desc_t *spd, const hwloc_cpuset_t mask)
  1134. {
  1135. return starpurm_assign_cpu_mask_to_starpu(spd, mask);
  1136. }
  1137. starpurm_drs_ret_t starpurm_lend(starpurm_drs_desc_t *spd)
  1138. {
  1139. return starpurm_assign_all_cpus_to_starpu(spd);
  1140. }
  1141. starpurm_drs_ret_t starpurm_reclaim_cpu(starpurm_drs_desc_t *spd, int cpuid)
  1142. {
  1143. return starpurm_withdraw_cpu_from_starpu(spd, cpuid);
  1144. }
  1145. starpurm_drs_ret_t starpurm_reclaim_cpus(starpurm_drs_desc_t *spd, int ncpus)
  1146. {
  1147. return starpurm_withdraw_cpus_from_starpu(spd, ncpus);
  1148. }
  1149. starpurm_drs_ret_t starpurm_reclaim_cpu_mask(starpurm_drs_desc_t *spd, const hwloc_cpuset_t mask)
  1150. {
  1151. return starpurm_withdraw_cpu_mask_from_starpu(spd, mask);
  1152. }
  1153. starpurm_drs_ret_t starpurm_reclaim(starpurm_drs_desc_t *spd)
  1154. {
  1155. return starpurm_withdraw_all_cpus_from_starpu(spd);
  1156. }
  1157. starpurm_drs_ret_t starpurm_acquire(starpurm_drs_desc_t *spd)
  1158. {
  1159. return starpurm_withdraw_all_cpus_from_starpu(spd);
  1160. }
  1161. starpurm_drs_ret_t starpurm_acquire_cpu(starpurm_drs_desc_t *spd, int cpuid)
  1162. {
  1163. return starpurm_withdraw_cpu_from_starpu(spd, cpuid);
  1164. }
  1165. starpurm_drs_ret_t starpurm_acquire_cpus(starpurm_drs_desc_t *spd, int ncpus)
  1166. {
  1167. return starpurm_withdraw_cpus_from_starpu(spd, ncpus);
  1168. }
  1169. starpurm_drs_ret_t starpurm_acquire_cpu_mask(starpurm_drs_desc_t *spd, const hwloc_cpuset_t mask)
  1170. {
  1171. return starpurm_withdraw_cpu_mask_from_starpu(spd, mask);
  1172. }
  1173. starpurm_drs_ret_t starpurm_return_all(starpurm_drs_desc_t *spd)
  1174. {
  1175. return starpurm_assign_all_cpus_to_starpu(spd);
  1176. }
  1177. starpurm_drs_ret_t starpurm_return_cpu(starpurm_drs_desc_t *spd, int cpuid)
  1178. {
  1179. return starpurm_assign_cpu_to_starpu(spd, cpuid);
  1180. }
  1181. /* Pause/resume */
  1182. starpurm_drs_ret_t starpurm_create_block_condition(starpurm_block_cond_t *cond)
  1183. {
  1184. /* unimplemented */
  1185. assert(0);
  1186. return starpurm_DRS_PERM;
  1187. }
  1188. void starpurm_block_current_task(starpurm_block_cond_t *cond)
  1189. {
  1190. /* unimplemented */
  1191. assert(0);
  1192. }
  1193. void starpurm_signal_block_condition(starpurm_block_cond_t *cond)
  1194. {
  1195. /* unimplemented */
  1196. assert(0);
  1197. }
  1198. void starpurm_register_polling_service(const char *service_name, starpurm_polling_t function, void *data)
  1199. {
  1200. /* unimplemented */
  1201. assert(0);
  1202. }
  1203. void starpurm_unregister_polling_service(const char *service_name, starpurm_polling_t function, void *data)
  1204. {
  1205. /* unimplemented */
  1206. assert(0);
  1207. }
  1208. /* devices */
  1209. int starpurm_get_device_type_id(const char *type_str)
  1210. {
  1211. if (strcmp(type_str, "cpu") == 0)
  1212. return starpurm_unit_cpu;
  1213. if (strcmp(type_str, "opencl") == 0)
  1214. return starpurm_unit_opencl;
  1215. if (strcmp(type_str, "cuda") == 0)
  1216. return starpurm_unit_cuda;
  1217. return -1;
  1218. }
  1219. const char *starpurm_get_device_type_name(int type_id)
  1220. {
  1221. if (type_id == starpurm_unit_cpu)
  1222. return "cpu";
  1223. if (type_id == starpurm_unit_opencl)
  1224. return "opencl";
  1225. if (type_id == starpurm_unit_cuda)
  1226. return "cuda";
  1227. return NULL;
  1228. }
  1229. int starpurm_get_nb_devices_by_type(int type_id)
  1230. {
  1231. assert(_starpurm != NULL);
  1232. assert(_starpurm->state != state_uninitialized);
  1233. struct s_starpurm *rm = _starpurm;
  1234. if (type_id < 0 || type_id >= starpurm_unit_ntypes)
  1235. return -1;
  1236. return rm->nunits_by_type[type_id];
  1237. }
  1238. int starpurm_get_device_id(int type_id, int unit_rank)
  1239. {
  1240. assert(_starpurm != NULL);
  1241. assert(_starpurm->state != state_uninitialized);
  1242. struct s_starpurm *rm = _starpurm;
  1243. if (type_id < 0 || type_id >= starpurm_unit_ntypes)
  1244. return -1;
  1245. if (unit_rank < 0 || unit_rank >= rm->nunits_by_type[type_id])
  1246. return -1;
  1247. return rm->units[rm->unit_offsets_by_type[type_id] + unit_rank].id;
  1248. }
  1249. starpurm_drs_ret_t starpurm_assign_device_to_starpu(starpurm_drs_desc_t *spd, int type_id, int unit_rank)
  1250. {
  1251. assert(_starpurm != NULL);
  1252. assert(_starpurm->state != state_uninitialized);
  1253. struct s_starpurm *rm = _starpurm;
  1254. if (!rm->dynamic_resource_sharing)
  1255. return starpurm_DRS_DISABLD;
  1256. if (type_id < 0 || type_id >= starpurm_unit_ntypes)
  1257. return starpurm_DRS_EINVAL;
  1258. if (unit_rank < 0 || unit_rank >= rm->nunits_by_type[type_id])
  1259. return starpurm_DRS_EINVAL;
  1260. hwloc_cpuset_t temp_cpuset = hwloc_bitmap_dup(rm->selected_cpuset);
  1261. hwloc_bitmap_or(temp_cpuset, temp_cpuset, rm->units[rm->unit_offsets_by_type[type_id] + unit_rank].worker_cpuset);
  1262. starpurm_drs_ret_t ret = _starpurm_update_cpuset(temp_cpuset);
  1263. hwloc_bitmap_free(temp_cpuset);
  1264. return ret;
  1265. }
  1266. starpurm_drs_ret_t starpurm_assign_devices_to_starpu(starpurm_drs_desc_t *spd, int type_id, int ndevices)
  1267. {
  1268. (void)spd;
  1269. assert(_starpurm != NULL);
  1270. assert(_starpurm->state != state_uninitialized);
  1271. struct s_starpurm *rm = _starpurm;
  1272. if (!rm->dynamic_resource_sharing)
  1273. return starpurm_DRS_DISABLD;
  1274. if (type_id < 0 || type_id >= starpurm_unit_ntypes)
  1275. return starpurm_DRS_EINVAL;
  1276. hwloc_cpuset_t temp_cpuset = hwloc_bitmap_dup(rm->selected_cpuset);
  1277. if (ndevices > rm->nunits_by_type[type_id])
  1278. {
  1279. ndevices = rm->nunits_by_type[type_id];
  1280. }
  1281. int i;
  1282. for (i = 0; i < ndevices; i++)
  1283. {
  1284. hwloc_bitmap_or(temp_cpuset, temp_cpuset, rm->units[rm->unit_offsets_by_type[type_id] + i].worker_cpuset);
  1285. }
  1286. starpurm_drs_ret_t ret = _starpurm_update_cpuset(temp_cpuset);
  1287. hwloc_bitmap_free(temp_cpuset);
  1288. return ret;
  1289. }
  1290. starpurm_drs_ret_t starpurm_assign_device_mask_to_starpu(starpurm_drs_desc_t *spd, const hwloc_cpuset_t mask)
  1291. {
  1292. (void)spd;
  1293. assert(_starpurm != NULL);
  1294. assert(_starpurm->state != state_uninitialized);
  1295. struct s_starpurm *rm = _starpurm;
  1296. if (!rm->dynamic_resource_sharing)
  1297. return starpurm_DRS_DISABLD;
  1298. hwloc_cpuset_t temp_cpuset = hwloc_bitmap_dup(rm->selected_cpuset);
  1299. hwloc_bitmap_or(temp_cpuset, temp_cpuset, mask);
  1300. starpurm_drs_ret_t ret = _starpurm_update_cpuset(temp_cpuset);
  1301. hwloc_bitmap_free(temp_cpuset);
  1302. return ret;
  1303. }
  1304. starpurm_drs_ret_t starpurm_assign_all_devices_to_starpu(starpurm_drs_desc_t *spd, int type_id)
  1305. {
  1306. assert(_starpurm != NULL);
  1307. assert(_starpurm->state != state_uninitialized);
  1308. struct s_starpurm *rm = _starpurm;
  1309. if (!rm->dynamic_resource_sharing)
  1310. return starpurm_DRS_DISABLD;
  1311. if (type_id < 0 || type_id >= starpurm_unit_ntypes)
  1312. return starpurm_DRS_EINVAL;
  1313. return starpurm_assign_devices_to_starpu(spd, type_id, rm->nunits_by_type[type_id]);
  1314. }
  1315. starpurm_drs_ret_t starpurm_withdraw_device_from_starpu(starpurm_drs_desc_t *spd, int type_id, int unit_rank)
  1316. {
  1317. assert(_starpurm != NULL);
  1318. assert(_starpurm->state != state_uninitialized);
  1319. struct s_starpurm *rm = _starpurm;
  1320. if (!rm->dynamic_resource_sharing)
  1321. return starpurm_DRS_DISABLD;
  1322. if (type_id < 0 || type_id >= starpurm_unit_ntypes)
  1323. return starpurm_DRS_EINVAL;
  1324. if (unit_rank < 0 || unit_rank >= rm->nunits_by_type[type_id])
  1325. return starpurm_DRS_EINVAL;
  1326. hwloc_cpuset_t temp_cpuset = hwloc_bitmap_dup(rm->selected_cpuset);
  1327. hwloc_bitmap_andnot(temp_cpuset, temp_cpuset, rm->units[rm->unit_offsets_by_type[type_id] + unit_rank].worker_cpuset);
  1328. starpurm_drs_ret_t ret = _starpurm_update_cpuset(temp_cpuset);
  1329. hwloc_bitmap_free(temp_cpuset);
  1330. return ret;
  1331. }
  1332. starpurm_drs_ret_t starpurm_withdraw_devices_from_starpu(starpurm_drs_desc_t *spd, int type_id, int ndevices)
  1333. {
  1334. (void)spd;
  1335. assert(_starpurm != NULL);
  1336. assert(_starpurm->state != state_uninitialized);
  1337. struct s_starpurm *rm = _starpurm;
  1338. if (!rm->dynamic_resource_sharing)
  1339. return starpurm_DRS_DISABLD;
  1340. if (type_id < 0 || type_id >= starpurm_unit_ntypes)
  1341. return starpurm_DRS_EINVAL;
  1342. hwloc_cpuset_t temp_cpuset = hwloc_bitmap_dup(rm->selected_cpuset);
  1343. if (ndevices > rm->nunits_by_type[type_id])
  1344. {
  1345. ndevices = rm->nunits_by_type[type_id];
  1346. }
  1347. int i;
  1348. for (i = 0; i < ndevices; i++)
  1349. {
  1350. hwloc_bitmap_andnot(temp_cpuset, temp_cpuset, rm->units[rm->unit_offsets_by_type[type_id] + i].worker_cpuset);
  1351. }
  1352. starpurm_drs_ret_t ret = _starpurm_update_cpuset(temp_cpuset);
  1353. hwloc_bitmap_free(temp_cpuset);
  1354. return ret;
  1355. }
  1356. starpurm_drs_ret_t starpurm_withdraw_device_mask_from_starpu(starpurm_drs_desc_t *spd, const hwloc_cpuset_t mask)
  1357. {
  1358. (void)spd;
  1359. assert(_starpurm != NULL);
  1360. assert(_starpurm->state != state_uninitialized);
  1361. struct s_starpurm *rm = _starpurm;
  1362. if (!rm->dynamic_resource_sharing)
  1363. return starpurm_DRS_DISABLD;
  1364. hwloc_cpuset_t temp_cpuset = hwloc_bitmap_dup(rm->selected_cpuset);
  1365. hwloc_bitmap_andnot(temp_cpuset, temp_cpuset, mask);
  1366. starpurm_drs_ret_t ret = _starpurm_update_cpuset(temp_cpuset);
  1367. hwloc_bitmap_free(temp_cpuset);
  1368. return ret;
  1369. }
  1370. starpurm_drs_ret_t starpurm_withdraw_all_devices_from_starpu(starpurm_drs_desc_t *spd, int type_id)
  1371. {
  1372. assert(_starpurm != NULL);
  1373. assert(_starpurm->state != state_uninitialized);
  1374. struct s_starpurm *rm = _starpurm;
  1375. if (!rm->dynamic_resource_sharing)
  1376. return starpurm_DRS_DISABLD;
  1377. if (type_id < 0 || type_id >= starpurm_unit_ntypes)
  1378. return starpurm_DRS_EINVAL;
  1379. return starpurm_withdraw_devices_from_starpu(spd, type_id, rm->nunits_by_type[type_id]);
  1380. }
  1381. /* --- */
  1382. starpurm_drs_ret_t starpurm_lend_device(starpurm_drs_desc_t *spd, int type_id, int unit_rank)
  1383. {
  1384. return starpurm_assign_device_to_starpu(spd, type_id, unit_rank);
  1385. }
  1386. starpurm_drs_ret_t starpurm_lend_devices(starpurm_drs_desc_t *spd, int type_id, int ndevices)
  1387. {
  1388. return starpurm_assign_devices_to_starpu(spd, type_id, ndevices);
  1389. }
  1390. starpurm_drs_ret_t starpurm_lend_device_mask(starpurm_drs_desc_t *spd, const hwloc_cpuset_t mask)
  1391. {
  1392. return starpurm_assign_device_mask_to_starpu(spd, mask);
  1393. }
  1394. starpurm_drs_ret_t starpurm_lend_all_devices(starpurm_drs_desc_t *spd, int type_id)
  1395. {
  1396. return starpurm_assign_all_devices_to_starpu(spd, type_id);
  1397. }
  1398. starpurm_drs_ret_t starpurm_reclaim_device(starpurm_drs_desc_t *spd, int type_id, int unit_rank)
  1399. {
  1400. return starpurm_withdraw_device_from_starpu(spd, type_id, unit_rank);
  1401. }
  1402. starpurm_drs_ret_t starpurm_reclaim_devices(starpurm_drs_desc_t *spd, int type_id, int ndevices)
  1403. {
  1404. return starpurm_withdraw_devices_from_starpu(spd, type_id, ndevices);
  1405. }
  1406. starpurm_drs_ret_t starpurm_reclaim_device_mask(starpurm_drs_desc_t *spd, const hwloc_cpuset_t mask)
  1407. {
  1408. return starpurm_withdraw_device_mask_from_starpu(spd, mask);
  1409. }
  1410. starpurm_drs_ret_t starpurm_reclaim_all_devices(starpurm_drs_desc_t *spd, int type_id)
  1411. {
  1412. return starpurm_withdraw_all_devices_from_starpu(spd, type_id);
  1413. }
  1414. starpurm_drs_ret_t starpurm_acquire_all_devices(starpurm_drs_desc_t *spd, int type_id)
  1415. {
  1416. return starpurm_withdraw_all_devices_from_starpu(spd, type_id);
  1417. }
  1418. starpurm_drs_ret_t starpurm_acquire_device(starpurm_drs_desc_t *spd, int type_id, int unit_rank)
  1419. {
  1420. return starpurm_withdraw_device_from_starpu(spd, type_id, unit_rank);
  1421. }
  1422. starpurm_drs_ret_t starpurm_acquire_devices(starpurm_drs_desc_t *spd, int type_id, int ndevices)
  1423. {
  1424. return starpurm_withdraw_devices_from_starpu(spd, type_id, ndevices);
  1425. }
  1426. starpurm_drs_ret_t starpurm_acquire_device_mask(starpurm_drs_desc_t *spd, const hwloc_cpuset_t mask)
  1427. {
  1428. return starpurm_withdraw_device_mask_from_starpu(spd, mask);
  1429. }
  1430. starpurm_drs_ret_t starpurm_return_all_devices(starpurm_drs_desc_t *spd, int type_id)
  1431. {
  1432. return starpurm_assign_all_devices_to_starpu(spd, type_id);
  1433. }
  1434. starpurm_drs_ret_t starpurm_return_device(starpurm_drs_desc_t *spd, int type_id, int unit_rank)
  1435. {
  1436. return starpurm_assign_device_to_starpu(spd, type_id, unit_rank);
  1437. }
  1438. /* cpusets */
  1439. hwloc_cpuset_t starpurm_get_device_worker_cpuset(int type_id, int unit_rank)
  1440. {
  1441. assert(_starpurm != NULL);
  1442. assert(_starpurm->state != state_uninitialized);
  1443. struct s_starpurm *rm = _starpurm;
  1444. assert(type_id >= 0 && type_id < starpurm_unit_ntypes);
  1445. assert(unit_rank >= 0 && unit_rank < rm->nunits_by_type[type_id]);
  1446. return hwloc_bitmap_dup(rm->units[rm->unit_offsets_by_type[type_id] + unit_rank].worker_cpuset);
  1447. }
  1448. hwloc_cpuset_t starpurm_get_global_cpuset(void)
  1449. {
  1450. assert(_starpurm != NULL);
  1451. assert(_starpurm->state != state_uninitialized);
  1452. struct s_starpurm *rm = _starpurm;
  1453. return hwloc_bitmap_dup(rm->global_cpuset);
  1454. }
  1455. hwloc_cpuset_t starpurm_get_selected_cpuset(void)
  1456. {
  1457. assert(_starpurm != NULL);
  1458. assert(_starpurm->state != state_uninitialized);
  1459. struct s_starpurm *rm = _starpurm;
  1460. return hwloc_bitmap_dup(rm->selected_cpuset);
  1461. }
  1462. hwloc_cpuset_t starpurm_get_all_cpu_workers_cpuset(void)
  1463. {
  1464. assert(_starpurm != NULL);
  1465. assert(_starpurm->state != state_uninitialized);
  1466. struct s_starpurm *rm = _starpurm;
  1467. return hwloc_bitmap_dup(rm->all_cpu_workers_cpuset);
  1468. }
  1469. static hwloc_cpuset_t starpurm_get_all_opencl_device_workers_cpuset(void)
  1470. {
  1471. assert(_starpurm != NULL);
  1472. assert(_starpurm->state != state_uninitialized);
  1473. struct s_starpurm *rm = _starpurm;
  1474. return hwloc_bitmap_dup(rm->all_opencl_device_workers_cpuset);
  1475. }
  1476. static hwloc_cpuset_t starpurm_get_all_cuda_device_workers_cpuset(void)
  1477. {
  1478. assert(_starpurm != NULL);
  1479. assert(_starpurm->state != state_uninitialized);
  1480. struct s_starpurm *rm = _starpurm;
  1481. return hwloc_bitmap_dup(rm->all_cuda_device_workers_cpuset);
  1482. }
  1483. hwloc_cpuset_t starpurm_get_all_device_workers_cpuset(void)
  1484. {
  1485. assert(_starpurm != NULL);
  1486. assert(_starpurm->state != state_uninitialized);
  1487. struct s_starpurm *rm = _starpurm;
  1488. return hwloc_bitmap_dup(rm->all_device_workers_cpuset);
  1489. }
  1490. hwloc_cpuset_t starpurm_get_all_device_workers_cpuset_by_type(int typeid)
  1491. {
  1492. assert(_starpurm != NULL);
  1493. assert(_starpurm->state != state_uninitialized);
  1494. assert(typeid != starpurm_unit_cpu);
  1495. if (typeid == starpurm_unit_opencl)
  1496. return starpurm_get_all_opencl_device_workers_cpuset();
  1497. if (typeid == starpurm_unit_cuda)
  1498. return starpurm_get_all_cuda_device_workers_cpuset();
  1499. hwloc_cpuset_t empty_bitmap = hwloc_bitmap_alloc();
  1500. hwloc_bitmap_zero(empty_bitmap);
  1501. return empty_bitmap;
  1502. }