starpurm.c 48 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263126412651266126712681269127012711272127312741275127612771278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620
  1. /* StarPU --- Resource Management Layer.
  2. *
  3. * Copyright (C) 2017, 2018 Inria
  4. *
  5. * StarPU is free software; you can redistribute it and/or modify
  6. * it under the terms of the GNU Lesser General Public License as published by
  7. * the Free Software Foundation; either version 2.1 of the License, or (at
  8. * your option) any later version.
  9. *
  10. * StarPU is distributed in the hope that it will be useful, but
  11. * WITHOUT ANY WARRANTY; without even the implied warranty of
  12. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
  13. *
  14. * See the GNU Lesser General Public License in COPYING.LGPL for more details.
  15. */
  16. #include <stdlib.h>
  17. #include <stdio.h>
  18. #include <string.h>
  19. #include <assert.h>
  20. #include <hwloc.h>
  21. #include <starpu.h>
  22. #include <starpurm.h>
  23. #include <config.h>
  24. #include <starpurm_private.h>
  25. /*
  26. * #define _DEBUG
  27. */
  28. struct s_starpurm_unit
  29. {
  30. /* Opaque unit id.
  31. *
  32. * For StarPU-RM, this id is used as an index to array starpurm->units[].
  33. */
  34. int id;
  35. /* Id of the unit type. */
  36. int type;
  37. /* Boolean indicating whether the device is currently selected for use by the runtime system. */
  38. int selected;
  39. /* StarPU id of the worker driving the device. */
  40. int workerid;
  41. /* Cpuset of the StarPU worker. */
  42. hwloc_cpuset_t worker_cpuset;
  43. /* Condition variable to notify that a unit is now available to driver a worker waking up. */
  44. pthread_cond_t unit_available_cond;
  45. };
  46. static struct s_starpurm *_starpurm = NULL;
  47. #if 0
  48. static char *bitmap_to_str(hwloc_bitmap_t bitmap)
  49. {
  50. int strl = hwloc_bitmap_snprintf(NULL, 0, bitmap);
  51. char *str = malloc(strl+1);
  52. hwloc_bitmap_snprintf(str, strl+1, bitmap);
  53. return str;
  54. }
  55. #endif
  56. #ifdef STARPURM_STARPU_HAVE_WORKER_CALLBACKS
  57. enum e_starpurm_event
  58. {
  59. starpurm_event_code_min = 0,
  60. starpurm_event_exit = 0,
  61. starpurm_event_worker_going_to_sleep = 1,
  62. starpurm_event_worker_waking_up = 2,
  63. starpurm_event_unit_available = 3,
  64. starpurm_event_code_max = 3
  65. };
  66. struct s_starpurm_event
  67. {
  68. struct s_starpurm_event *next;
  69. struct s_starpurm_event *prev;
  70. enum e_starpurm_event code;
  71. unsigned int workerid;
  72. };
  73. static void _enqueue_event(struct s_starpurm_event *event)
  74. {
  75. assert(_starpurm != NULL);
  76. assert(_starpurm->state != state_uninitialized);
  77. struct s_starpurm *rm = _starpurm;
  78. assert(event->next == NULL);
  79. assert(event->prev == NULL);
  80. assert(event->code >= starpurm_event_code_min && event->code <= starpurm_event_code_max);
  81. pthread_mutex_lock(&rm->event_list_mutex);
  82. if (rm->event_processing_ended)
  83. {
  84. pthread_mutex_unlock(&rm->event_list_mutex);
  85. return;
  86. }
  87. assert((rm->event_list_head == NULL && rm->event_list_tail == NULL)
  88. || (rm->event_list_head != NULL && rm->event_list_tail != NULL));
  89. if (rm->event_list_head == NULL)
  90. {
  91. rm->event_list_tail = event;
  92. }
  93. else
  94. {
  95. rm->event_list_head->prev = event;
  96. }
  97. event->next = rm->event_list_head;
  98. rm->event_list_head = event;
  99. if (event->code == starpurm_event_exit)
  100. {
  101. rm->event_processing_ended = 1;
  102. int i;
  103. for (i=0; i<rm->nunits; i++)
  104. {
  105. pthread_cond_broadcast(&rm->units[i].unit_available_cond);
  106. }
  107. }
  108. pthread_cond_broadcast(&rm->event_list_cond);
  109. #ifdef STARPURM_HAVE_DLB
  110. if (event->code == starpurm_event_worker_waking_up)
  111. {
  112. int unit_id = rm->worker_unit_ids[event->workerid];
  113. /* if DLB is in use, wait for the unit to become available from the point of view of DLB, before using it */
  114. pthread_cond_wait(&rm->units[unit_id].unit_available_cond, &rm->event_list_mutex);
  115. }
  116. #endif
  117. pthread_mutex_unlock(&rm->event_list_mutex);
  118. }
  119. static struct s_starpurm_event *_dequeue_event_no_lock(void)
  120. {
  121. struct s_starpurm *rm = _starpurm;
  122. struct s_starpurm_event *event = NULL;
  123. if (rm->event_list_tail != NULL)
  124. {
  125. event = rm->event_list_tail;
  126. if (event->prev == NULL)
  127. {
  128. rm->event_list_head = NULL;
  129. rm->event_list_tail = NULL;
  130. }
  131. else
  132. {
  133. event->prev->next = NULL;
  134. rm->event_list_tail = event->prev;
  135. }
  136. event->prev = NULL;
  137. event->next = NULL;
  138. }
  139. return event;
  140. }
  141. static struct s_starpurm_event *_wait_event_no_lock(void)
  142. {
  143. struct s_starpurm *rm = _starpurm;
  144. while (rm->event_list_head == NULL)
  145. {
  146. pthread_cond_wait(&rm->event_list_cond, &rm->event_list_mutex);
  147. }
  148. struct s_starpurm_event *event = _dequeue_event_no_lock();
  149. return event;
  150. }
  151. /* unused */
  152. static struct s_starpurm_event *_dequeue_event(void)
  153. {
  154. assert(_starpurm != NULL);
  155. assert(_starpurm->state != state_uninitialized);
  156. struct s_starpurm *rm = _starpurm;
  157. pthread_mutex_lock(&rm->event_list_mutex);
  158. struct s_starpurm_event *event = _dequeue_event_no_lock();
  159. pthread_mutex_unlock(&rm->event_list_mutex);
  160. return event;
  161. }
  162. /* unused */
  163. static struct s_starpurm_event *_wait_event(void)
  164. {
  165. assert(_starpurm != NULL);
  166. assert(_starpurm->state != state_uninitialized);
  167. struct s_starpurm *rm = _starpurm;
  168. pthread_mutex_lock(&rm->event_list_mutex);
  169. struct s_starpurm_event *event = _wait_event_no_lock();
  170. pthread_mutex_unlock(&rm->event_list_mutex);
  171. return event;
  172. }
  173. static void _enqueue_exit_event(void)
  174. {
  175. struct s_starpurm_event *event = calloc(1, sizeof(*event));
  176. event->code = starpurm_event_exit;
  177. event->workerid = 0;
  178. _enqueue_event(event);
  179. }
  180. static void callback_worker_going_to_sleep(unsigned workerid)
  181. {
  182. struct s_starpurm_event *event = calloc(1, sizeof(*event));
  183. event->code = starpurm_event_worker_going_to_sleep;
  184. event->workerid = workerid;
  185. _enqueue_event(event);
  186. }
  187. static void callback_worker_waking_up(unsigned workerid)
  188. {
  189. struct s_starpurm_event *event = calloc(1, sizeof(*event));
  190. event->code = starpurm_event_worker_waking_up;
  191. event->workerid = workerid;
  192. _enqueue_event(event);
  193. }
  194. void starpurm_enqueue_event_cpu_unit_available(int unit_id)
  195. {
  196. assert(_starpurm != NULL);
  197. assert(_starpurm->state != state_uninitialized);
  198. struct s_starpurm *rm = _starpurm;
  199. assert(unit_id >= 0);
  200. assert(unit_id < rm->nunits_by_type[starpurm_unit_cpu]);
  201. unsigned workerid = rm->units[unit_id].workerid;
  202. struct s_starpurm_event *event = calloc(1, sizeof(*event));
  203. event->code = starpurm_event_unit_available;
  204. event->workerid = workerid;
  205. _enqueue_event(event);
  206. }
  207. static void *event_thread_func(void *_arg)
  208. {
  209. (void)_arg;
  210. assert(_starpurm != NULL);
  211. assert(_starpurm->state != state_uninitialized);
  212. struct s_starpurm *rm = _starpurm;
  213. int need_refresh = 0;
  214. pthread_mutex_lock(&rm->event_list_mutex);
  215. while (rm->event_processing_enabled == 0)
  216. {
  217. pthread_cond_wait(&rm->event_processing_cond, &rm->event_list_mutex);
  218. }
  219. pthread_mutex_unlock(&rm->event_list_mutex);
  220. hwloc_cpuset_t owned_cpuset = hwloc_bitmap_dup(rm->global_cpuset);
  221. hwloc_cpuset_t to_reclaim_cpuset = hwloc_bitmap_alloc();
  222. hwloc_cpuset_t to_lend_cpuset = hwloc_bitmap_alloc();
  223. while (1)
  224. {
  225. struct s_starpurm_event *event = _dequeue_event();
  226. if ((event == NULL || event->code == starpurm_event_exit) && need_refresh)
  227. {
  228. #ifdef STARPURM_HAVE_DLB
  229. /* notify DLB about changes */
  230. if (!hwloc_bitmap_iszero(to_reclaim_cpuset))
  231. {
  232. starpurm_dlb_notify_starpu_worker_mask_waking_up(to_reclaim_cpuset);
  233. }
  234. int did_lend_cpuset = 0;
  235. if (!hwloc_bitmap_iszero(to_lend_cpuset))
  236. {
  237. did_lend_cpuset = starpurm_dlb_notify_starpu_worker_mask_going_to_sleep(to_lend_cpuset);
  238. }
  239. #endif
  240. /* if DLB is not initialized, ignore lend operations */
  241. if (did_lend_cpuset)
  242. {
  243. hwloc_bitmap_andnot(owned_cpuset, owned_cpuset, to_lend_cpuset);
  244. }
  245. hwloc_bitmap_or(owned_cpuset, owned_cpuset, to_reclaim_cpuset);
  246. #if 0
  247. {
  248. char *to_lend_str = bitmap_to_str(to_lend_cpuset);
  249. char *to_reclaim_str = bitmap_to_str(to_reclaim_cpuset);
  250. free(to_lend_str);
  251. free(to_reclaim_str);
  252. }
  253. #endif
  254. need_refresh = 0;
  255. hwloc_bitmap_zero(to_lend_cpuset);
  256. hwloc_bitmap_zero(to_reclaim_cpuset);
  257. }
  258. if (event == NULL)
  259. {
  260. event = _wait_event();
  261. }
  262. if (event->code == starpurm_event_exit)
  263. {
  264. free(event);
  265. break;
  266. }
  267. /* TODO: accumulate state change */
  268. switch (event->code)
  269. {
  270. case starpurm_event_worker_going_to_sleep:
  271. {
  272. int unit_id = rm->worker_unit_ids[event->workerid];
  273. hwloc_bitmap_or(to_lend_cpuset, to_lend_cpuset, rm->units[unit_id].worker_cpuset);
  274. hwloc_bitmap_andnot(to_reclaim_cpuset, to_reclaim_cpuset, rm->units[unit_id].worker_cpuset);
  275. }
  276. break;
  277. case starpurm_event_worker_waking_up:
  278. {
  279. int unit_id = rm->worker_unit_ids[event->workerid];
  280. hwloc_bitmap_andnot(to_lend_cpuset, to_lend_cpuset, rm->units[unit_id].worker_cpuset);
  281. #ifdef STARPURM_HAVE_DLB
  282. if (rm->units[unit_id].type == starpurm_unit_cpu && !hwloc_bitmap_intersects(rm->units[unit_id].worker_cpuset, owned_cpuset))
  283. {
  284. /* Only reclaim the unit from DLB if StarPU does not own it already. */
  285. hwloc_bitmap_or(to_reclaim_cpuset, to_reclaim_cpuset, rm->units[unit_id].worker_cpuset);
  286. }
  287. else
  288. {
  289. pthread_cond_broadcast(&rm->units[unit_id].unit_available_cond);
  290. }
  291. #else
  292. hwloc_bitmap_or(to_reclaim_cpuset, to_reclaim_cpuset, rm->units[unit_id].worker_cpuset);
  293. #endif
  294. }
  295. break;
  296. #ifdef STARPURM_HAVE_DLB
  297. case starpurm_event_unit_available:
  298. {
  299. /* a reclaimed unit is now available from DLB, unlock the corresponding worker waking up */
  300. int unit_id = rm->worker_unit_ids[event->workerid];
  301. pthread_cond_broadcast(&rm->units[unit_id].unit_available_cond);
  302. }
  303. break;
  304. #endif
  305. default:
  306. /* unknown event code */
  307. assert(0);
  308. break;
  309. }
  310. free(event);
  311. need_refresh = 1;
  312. }
  313. pthread_mutex_lock(&rm->event_list_mutex);
  314. /* exit event should be last */
  315. assert(rm->event_list_head == NULL);
  316. assert(rm->event_list_tail == NULL);
  317. hwloc_bitmap_free(owned_cpuset);
  318. hwloc_bitmap_free(to_reclaim_cpuset);
  319. hwloc_bitmap_free(to_lend_cpuset);
  320. pthread_mutex_unlock(&rm->event_list_mutex);
  321. return NULL;
  322. }
  323. #endif /* STARPURM_STARPU_HAVE_WORKER_CALLBACKS */
  324. /* Resource enforcement */
  325. static starpurm_drs_ret_t _starpurm_update_cpuset(hwloc_cpuset_t cpuset)
  326. {
  327. assert(_starpurm != NULL);
  328. assert(_starpurm->state != state_uninitialized);
  329. struct s_starpurm *rm = _starpurm;
  330. if (hwloc_bitmap_isequal(cpuset, rm->selected_cpuset))
  331. {
  332. return starpurm_DRS_SUCCESS;
  333. }
  334. pthread_mutex_lock(&rm->temporary_ctxs_mutex);
  335. if (rm->starpu_in_pause)
  336. {
  337. starpu_resume();
  338. rm->starpu_in_pause = 0;
  339. }
  340. int workers_to_remove[_starpurm->nunits];
  341. unsigned nworkers_to_remove = 0;
  342. int workers_to_add[_starpurm->nunits];
  343. unsigned nworkers_to_add = 0;
  344. int i;
  345. hwloc_cpuset_t temp_cpuset = hwloc_bitmap_alloc();
  346. int new_selected_ncpus = 0;
  347. for (i=0; i<rm->nunits; i++)
  348. {
  349. struct s_starpurm_unit *unit = &rm->units[i];
  350. hwloc_bitmap_and(temp_cpuset, unit->worker_cpuset, cpuset);
  351. if (hwloc_bitmap_iszero(temp_cpuset))
  352. {
  353. workers_to_remove[nworkers_to_remove] = unit->workerid;
  354. unit->selected = 0;
  355. nworkers_to_remove++;
  356. }
  357. else
  358. {
  359. workers_to_add[nworkers_to_add] = unit->workerid;
  360. unit->selected = 1;
  361. nworkers_to_add++;
  362. if (unit->type == starpurm_unit_cpu)
  363. {
  364. new_selected_ncpus++;
  365. }
  366. }
  367. }
  368. hwloc_bitmap_free(temp_cpuset);
  369. rm->selected_nworkers = nworkers_to_add;
  370. rm->selected_ncpus = new_selected_ncpus;
  371. hwloc_bitmap_free(rm->selected_cpuset);
  372. rm->selected_cpuset = hwloc_bitmap_dup(cpuset);
  373. if (nworkers_to_add > 0)
  374. {
  375. #if defined(STARPURM_HAVE_DLB) && !defined(STARPURM_STARPU_HAVE_WORKER_CALLBACKS)
  376. {
  377. /* if StarPU worker callbacks are not enabled, we still
  378. * notify DLB about resource usage changes, but we do
  379. * not wait for the formal DLB go to use the units */
  380. hwloc_cpuset_t to_reclaim_cpuset = hwloc_bitmap_alloc();
  381. for (i=0; i<nworkers_to_add; i++)
  382. {
  383. int unit_id = rm->worker_unit_ids[workers_to_add[i]];
  384. hwloc_bitmap_or(to_reclaim_cpuset, to_reclaim_cpuset, rm->units[unit_id].worker_cpuset);
  385. }
  386. starpurm_dlb_notify_starpu_worker_mask_waking_up(to_reclaim_cpuset);
  387. hwloc_bitmap_free(to_reclaim_cpuset);
  388. }
  389. #endif
  390. starpu_sched_ctx_add_workers(workers_to_add, nworkers_to_add, rm->sched_ctx_id);
  391. }
  392. if (nworkers_to_remove > 0)
  393. {
  394. starpu_sched_ctx_remove_workers(workers_to_remove, nworkers_to_remove, rm->sched_ctx_id);
  395. #if defined(STARPURM_HAVE_DLB) && !defined(STARPURM_STARPU_HAVE_WORKER_CALLBACKS)
  396. {
  397. /* if StarPU worker callbacks are not enabled, we still
  398. * notify DLB about resource usage changes, but we do
  399. * not wait for the workers to become idle */
  400. hwloc_cpuset_t to_lend_cpuset = hwloc_bitmap_alloc();
  401. for (i=0; i<nworkers_to_remove; i++)
  402. {
  403. int unit_id = rm->worker_unit_ids[workers_to_remove[i]];
  404. hwloc_bitmap_or(to_lend_cpuset, to_lend_cpuset, rm->units[unit_id].worker_cpuset);
  405. }
  406. starpurm_dlb_notify_starpu_worker_mask_going_to_sleep(to_lend_cpuset);
  407. hwloc_bitmap_free(to_lend_cpuset);
  408. }
  409. #endif
  410. }
  411. #ifdef _DEBUG
  412. starpu_sched_ctx_display_workers(rm->sched_ctx_id, stderr);
  413. #endif /* DEBUG */
  414. if (rm->selected_nworkers == 0 && rm->avail_temporary_ctxs == rm->max_temporary_ctxs)
  415. {
  416. rm->starpu_in_pause = 1;
  417. starpu_pause();
  418. }
  419. pthread_mutex_unlock(&rm->temporary_ctxs_mutex);
  420. return starpurm_DRS_SUCCESS;
  421. }
  422. static unsigned _starpurm_temporary_context_alloc(hwloc_cpuset_t cpuset)
  423. {
  424. assert(_starpurm != NULL);
  425. assert(_starpurm->state != state_uninitialized);
  426. assert(_starpurm->max_temporary_ctxs > 0);
  427. struct s_starpurm *rm = _starpurm;
  428. pthread_mutex_lock(&rm->temporary_ctxs_mutex);
  429. while(rm->avail_temporary_ctxs == 0)
  430. {
  431. pthread_cond_wait(&rm->temporary_ctxs_cond, &rm->temporary_ctxs_mutex);
  432. }
  433. assert(rm->avail_temporary_ctxs > 0);
  434. rm->avail_temporary_ctxs--;
  435. if (rm->starpu_in_pause)
  436. {
  437. starpu_resume();
  438. rm->starpu_in_pause = 0;
  439. }
  440. pthread_mutex_unlock(&rm->temporary_ctxs_mutex);
  441. unsigned sched_ctx_id = starpu_sched_ctx_create(NULL, -1, "starpurm_temp", STARPU_SCHED_CTX_POLICY_NAME, "eager", 0);
  442. assert(sched_ctx_id != STARPU_NMAX_SCHED_CTXS);
  443. int workers_to_remove[_starpurm->nunits];
  444. unsigned nworkers_to_remove = 0;
  445. int workers_to_add[_starpurm->nunits];
  446. unsigned nworkers_to_add = 0;
  447. int i;
  448. hwloc_cpuset_t temp_cpuset = hwloc_bitmap_alloc();
  449. for (i=0; i<rm->nunits; i++)
  450. {
  451. struct s_starpurm_unit *unit = &rm->units[i];
  452. hwloc_bitmap_and(temp_cpuset, unit->worker_cpuset, cpuset);
  453. if (hwloc_bitmap_iszero(temp_cpuset))
  454. {
  455. workers_to_remove[nworkers_to_remove] = unit->workerid;
  456. nworkers_to_remove++;
  457. }
  458. else
  459. {
  460. workers_to_add[nworkers_to_add] = unit->workerid;
  461. nworkers_to_add++;
  462. }
  463. }
  464. hwloc_bitmap_free(temp_cpuset);
  465. if (nworkers_to_add > 0)
  466. starpu_sched_ctx_add_workers(workers_to_add, nworkers_to_add, sched_ctx_id);
  467. if (nworkers_to_remove > 0)
  468. starpu_sched_ctx_remove_workers(workers_to_remove, nworkers_to_remove, sched_ctx_id);
  469. #ifdef _DEBUG
  470. starpu_sched_ctx_display_workers(sched_ctx_id, stderr);
  471. #endif /* DEBUG */
  472. return sched_ctx_id;
  473. }
  474. static void _starpurm_temporary_context_free(unsigned ctx)
  475. {
  476. assert(_starpurm != NULL);
  477. assert(_starpurm->state != state_uninitialized);
  478. assert(_starpurm->max_temporary_ctxs > 0);
  479. struct s_starpurm *rm = _starpurm;
  480. starpu_sched_ctx_delete(ctx);
  481. pthread_mutex_lock(&rm->temporary_ctxs_mutex);
  482. rm->avail_temporary_ctxs++;
  483. pthread_cond_signal(&rm->temporary_ctxs_cond);
  484. if (rm->selected_nworkers == 0 && rm->avail_temporary_ctxs == rm->max_temporary_ctxs)
  485. {
  486. rm->starpu_in_pause = 1;
  487. starpu_pause();
  488. }
  489. pthread_mutex_unlock(&rm->temporary_ctxs_mutex);
  490. }
  491. static starpurm_drs_ret_t _starpurm_set_ncpus(unsigned int ncpus)
  492. {
  493. assert(_starpurm != NULL);
  494. assert(_starpurm->state != state_uninitialized);
  495. struct s_starpurm *rm = _starpurm;
  496. int i;
  497. if (ncpus > rm->nunits_by_type[starpurm_unit_cpu])
  498. {
  499. ncpus = rm->nunits_by_type[starpurm_unit_cpu];
  500. }
  501. if (ncpus == rm->selected_ncpus)
  502. {
  503. return starpurm_DRS_SUCCESS;
  504. }
  505. pthread_mutex_lock(&rm->temporary_ctxs_mutex);
  506. if (rm->starpu_in_pause)
  507. {
  508. starpu_resume();
  509. rm->starpu_in_pause = 0;
  510. }
  511. int workers_to_remove[_starpurm->nunits];
  512. unsigned nworkers_to_remove = 0;
  513. int workers_to_add[_starpurm->nunits];
  514. unsigned nworkers_to_add = 0;
  515. for (i=0; i<rm->nunits; i++)
  516. {
  517. struct s_starpurm_unit *unit = &rm->units[i];
  518. if (unit->type != starpurm_unit_cpu)
  519. continue;
  520. if (nworkers_to_add < ncpus)
  521. {
  522. workers_to_add[nworkers_to_add] = unit->workerid;
  523. unit->selected = 1;
  524. nworkers_to_add++;
  525. hwloc_bitmap_or(rm->selected_cpuset, rm->selected_cpuset, unit->worker_cpuset);
  526. }
  527. else
  528. {
  529. workers_to_remove[nworkers_to_remove] = unit->workerid;
  530. unit->selected = 0;
  531. hwloc_bitmap_andnot(rm->selected_cpuset, rm->selected_cpuset, unit->worker_cpuset);
  532. nworkers_to_remove++;
  533. }
  534. }
  535. rm->selected_nworkers = nworkers_to_add;
  536. rm->selected_ncpus = nworkers_to_add;
  537. if (nworkers_to_add > 0)
  538. starpu_sched_ctx_add_workers(workers_to_add, nworkers_to_add, rm->sched_ctx_id);
  539. if (nworkers_to_remove > 0)
  540. starpu_sched_ctx_remove_workers(workers_to_remove, nworkers_to_remove, rm->sched_ctx_id);
  541. #if def_DEBUG
  542. starpu_sched_ctx_display_workers(rm->sched_ctx_id, stderr);
  543. #endif /* DEBUG */
  544. if (rm->selected_nworkers == 0 && rm->avail_temporary_ctxs == rm->max_temporary_ctxs)
  545. {
  546. rm->starpu_in_pause = 1;
  547. starpu_pause();
  548. }
  549. pthread_mutex_unlock(&rm->temporary_ctxs_mutex);
  550. return starpurm_DRS_SUCCESS;
  551. }
  552. /* Initialize rm state for StarPU */
  553. void starpurm_initialize(void)
  554. {
  555. int ret;
  556. assert(_starpurm == NULL);
  557. struct s_starpurm *rm = calloc(1, sizeof(*rm));
  558. pthread_mutex_init(&rm->temporary_ctxs_mutex, NULL);
  559. pthread_cond_init(&rm->temporary_ctxs_cond, NULL);
  560. rm->state = state_init;
  561. /* init hwloc objects */
  562. hwloc_topology_init(&rm->topology);
  563. hwloc_topology_load(rm->topology);
  564. rm->global_cpuset = hwloc_bitmap_alloc();
  565. hwloc_bitmap_zero(rm->global_cpuset);
  566. rm->all_cpu_workers_cpuset = hwloc_bitmap_alloc();
  567. hwloc_bitmap_zero(rm->all_cpu_workers_cpuset);
  568. rm->all_opencl_device_workers_cpuset = hwloc_bitmap_alloc();
  569. hwloc_bitmap_zero(rm->all_opencl_device_workers_cpuset);
  570. rm->all_cuda_device_workers_cpuset = hwloc_bitmap_alloc();
  571. hwloc_bitmap_zero(rm->all_cuda_device_workers_cpuset);
  572. rm->all_mic_device_workers_cpuset = hwloc_bitmap_alloc();
  573. hwloc_bitmap_zero(rm->all_mic_device_workers_cpuset);
  574. rm->all_device_workers_cpuset = hwloc_bitmap_alloc();
  575. hwloc_bitmap_zero(rm->all_device_workers_cpuset);
  576. /* init event list, before StarPU is initialized */
  577. pthread_mutex_init(&rm->event_list_mutex, NULL);
  578. pthread_cond_init(&rm->event_list_cond, NULL);
  579. pthread_cond_init(&rm->event_processing_cond, NULL);
  580. pthread_mutex_lock(&rm->event_list_mutex);
  581. rm->event_processing_enabled = 0;
  582. rm->event_processing_ended = 0;
  583. rm->event_list_head = NULL;
  584. rm->event_list_tail = NULL;
  585. pthread_mutex_unlock(&rm->event_list_mutex);
  586. /* set _starpurm here since StarPU's callbacks may reference it once starpu_init is called */
  587. _starpurm = rm;
  588. #ifdef STARPURM_STARPU_HAVE_WORKER_CALLBACKS
  589. /* launch event thread */
  590. ret = pthread_create(&rm->event_thread, NULL, event_thread_func, rm);
  591. assert(ret == 0);
  592. #endif
  593. /* init StarPU */
  594. struct starpu_conf starpu_conf;
  595. ret = starpu_conf_init(&starpu_conf);
  596. assert(ret == 0);
  597. #ifdef STARPURM_STARPU_HAVE_WORKER_CALLBACKS
  598. starpu_conf.callback_worker_going_to_sleep = callback_worker_going_to_sleep;
  599. starpu_conf.callback_worker_waking_up = callback_worker_waking_up;
  600. #endif
  601. ret = starpu_init(&starpu_conf);
  602. assert(ret == 0);
  603. /* init any worker objects */
  604. rm->nunits = starpu_worker_get_count_by_type(STARPU_ANY_WORKER);
  605. /* init device worker objects */
  606. rm->unit_ntypes = starpurm_unit_ntypes;
  607. rm->nunits_by_type = calloc(rm->unit_ntypes, sizeof(*rm->nunits_by_type));
  608. rm->unit_offsets_by_type = calloc(rm->unit_ntypes, sizeof(*rm->unit_offsets_by_type));
  609. const int cpu_nunits = starpu_worker_get_count_by_type(STARPU_CPU_WORKER);
  610. rm->nunits_by_type[starpurm_unit_cpu] = cpu_nunits;
  611. const int opencl_nunits = starpu_worker_get_count_by_type(STARPU_OPENCL_WORKER);
  612. rm->nunits_by_type[starpurm_unit_opencl] = opencl_nunits;
  613. const int cuda_nunits = starpu_worker_get_count_by_type(STARPU_CUDA_WORKER);
  614. rm->nunits_by_type[starpurm_unit_cuda] = cuda_nunits;
  615. const int mic_nunits = starpu_worker_get_count_by_type(STARPU_MIC_WORKER);
  616. rm->nunits_by_type[starpurm_unit_mic] = mic_nunits;
  617. const int nunits = cpu_nunits + opencl_nunits + cuda_nunits + mic_nunits;
  618. rm->nunits = nunits;
  619. rm->units = calloc(nunits, sizeof(*rm->units));
  620. int unitid = 0;
  621. int cpu_workerids[cpu_nunits];
  622. starpu_worker_get_ids_by_type(STARPU_CPU_WORKER, cpu_workerids, cpu_nunits);
  623. rm->unit_offsets_by_type[starpurm_unit_cpu] = unitid;
  624. unsigned int max_worker_id = 0;
  625. int i;
  626. for (i = 0; i < cpu_nunits; i++)
  627. {
  628. rm->units[unitid].id = unitid;
  629. rm->units[unitid].type = starpurm_unit_cpu;
  630. rm->units[unitid].selected = 1; /* enabled by default */
  631. rm->units[unitid].workerid = cpu_workerids[i];
  632. if (max_worker_id < rm->units[unitid].workerid)
  633. {
  634. max_worker_id = rm->units[unitid].workerid;
  635. }
  636. rm->units[unitid].worker_cpuset = starpu_worker_get_hwloc_cpuset(rm->units[unitid].workerid);
  637. pthread_cond_init(&rm->units[unitid].unit_available_cond, NULL);
  638. hwloc_bitmap_or(rm->global_cpuset, rm->global_cpuset, rm->units[unitid].worker_cpuset);
  639. hwloc_bitmap_or(rm->all_cpu_workers_cpuset, rm->all_cpu_workers_cpuset, rm->units[unitid].worker_cpuset);;
  640. unitid++;
  641. }
  642. int opencl_workerids[opencl_nunits];
  643. starpu_worker_get_ids_by_type(STARPU_OPENCL_WORKER, opencl_workerids, opencl_nunits);
  644. rm->unit_offsets_by_type[starpurm_unit_opencl] = unitid;
  645. for (i = 0; i < opencl_nunits; i++)
  646. {
  647. rm->units[unitid].id = unitid;
  648. rm->units[unitid].type = starpurm_unit_opencl;
  649. rm->units[unitid].selected = 1; /* enabled by default */
  650. rm->units[unitid].workerid = opencl_workerids[i];
  651. if (max_worker_id < rm->units[unitid].workerid)
  652. {
  653. max_worker_id = rm->units[unitid].workerid;
  654. }
  655. rm->units[unitid].worker_cpuset = starpu_worker_get_hwloc_cpuset(rm->units[unitid].workerid);
  656. pthread_cond_init(&rm->units[unitid].unit_available_cond, NULL);
  657. hwloc_bitmap_or(rm->global_cpuset, rm->global_cpuset, rm->units[unitid].worker_cpuset);
  658. hwloc_bitmap_or(rm->all_opencl_device_workers_cpuset, rm->all_opencl_device_workers_cpuset, rm->units[unitid].worker_cpuset);
  659. hwloc_bitmap_or(rm->all_device_workers_cpuset, rm->all_device_workers_cpuset, rm->units[unitid].worker_cpuset);
  660. unitid++;
  661. }
  662. int cuda_workerids[opencl_nunits];
  663. starpu_worker_get_ids_by_type(STARPU_CUDA_WORKER, cuda_workerids, cuda_nunits);
  664. rm->unit_offsets_by_type[starpurm_unit_cuda] = unitid;
  665. for (i = 0; i < cuda_nunits; i++)
  666. {
  667. rm->units[unitid].id = unitid;
  668. rm->units[unitid].type = starpurm_unit_cuda;
  669. rm->units[unitid].selected = 1; /* enabled by default */
  670. rm->units[unitid].workerid = cuda_workerids[i];
  671. if (max_worker_id < rm->units[unitid].workerid)
  672. {
  673. max_worker_id = rm->units[unitid].workerid;
  674. }
  675. rm->units[unitid].worker_cpuset = starpu_worker_get_hwloc_cpuset(rm->units[unitid].workerid);
  676. pthread_cond_init(&rm->units[unitid].unit_available_cond, NULL);
  677. hwloc_bitmap_or(rm->global_cpuset, rm->global_cpuset, rm->units[unitid].worker_cpuset);
  678. hwloc_bitmap_or(rm->all_cuda_device_workers_cpuset, rm->all_cuda_device_workers_cpuset, rm->units[unitid].worker_cpuset);
  679. hwloc_bitmap_or(rm->all_device_workers_cpuset, rm->all_device_workers_cpuset, rm->units[unitid].worker_cpuset);
  680. unitid++;
  681. }
  682. int mic_workerids[mic_nunits];
  683. starpu_worker_get_ids_by_type(STARPU_MIC_WORKER, mic_workerids, mic_nunits);
  684. rm->unit_offsets_by_type[starpurm_unit_mic] = unitid;
  685. for (i = 0; i < mic_nunits; i++)
  686. {
  687. rm->units[unitid].id = unitid;
  688. rm->units[unitid].type = starpurm_unit_mic;
  689. rm->units[unitid].selected = 1; /* enabled by default */
  690. rm->units[unitid].workerid = mic_workerids[i];
  691. if (max_worker_id < rm->units[unitid].workerid)
  692. {
  693. max_worker_id = rm->units[unitid].workerid;
  694. }
  695. rm->units[unitid].worker_cpuset = starpu_worker_get_hwloc_cpuset(rm->units[unitid].workerid);
  696. pthread_cond_init(&rm->units[unitid].unit_available_cond, NULL);
  697. hwloc_bitmap_or(rm->global_cpuset, rm->global_cpuset, rm->units[unitid].worker_cpuset);
  698. hwloc_bitmap_or(rm->all_mic_device_workers_cpuset, rm->all_mic_device_workers_cpuset, rm->units[unitid].worker_cpuset);
  699. hwloc_bitmap_or(rm->all_device_workers_cpuset, rm->all_device_workers_cpuset, rm->units[unitid].worker_cpuset);
  700. unitid++;
  701. }
  702. rm->max_worker_id = max_worker_id;
  703. {
  704. int *worker_unit_ids = malloc((max_worker_id+1) * sizeof(*worker_unit_ids));
  705. for (i = 0; i < max_worker_id+1; i++)
  706. {
  707. worker_unit_ids[i] = -1;
  708. }
  709. for (i=0; i<rm->nunits; i++)
  710. {
  711. worker_unit_ids[rm->units[i].workerid] = i;
  712. }
  713. rm->worker_unit_ids = worker_unit_ids;
  714. }
  715. /* create StarPU sched_ctx for RM instance */
  716. {
  717. int workerids[rm->nunits];
  718. starpu_worker_get_ids_by_type(STARPU_ANY_WORKER, workerids, rm->nunits);
  719. /* TODO: make sched_ctx policy configurable */
  720. rm->sched_ctx_id = starpu_sched_ctx_create(workerids, rm->nunits, "starpurm", STARPU_SCHED_CTX_POLICY_NAME, "eager", 0);
  721. #ifdef _DEBUG
  722. starpu_sched_ctx_display_workers(rm->sched_ctx_id, stderr);
  723. #endif /* DEBUG */
  724. }
  725. starpu_sched_ctx_set_context(&rm->sched_ctx_id);
  726. /* number selected workers (total) */
  727. rm->selected_nworkers = rm->nunits;
  728. /* number of selected CPUs workers */
  729. rm->selected_ncpus = rm->nunits_by_type[starpurm_unit_cpu];
  730. /* cpuset of all currently selected workers */
  731. rm->selected_cpuset = hwloc_bitmap_dup(rm->global_cpuset);
  732. if (STARPU_NMAX_SCHED_CTXS > 2)
  733. {
  734. /* account for main ctx (0) and default rm ctx (1)
  735. * TODO: check that no other ctxs are allocated by external codes */
  736. rm->max_temporary_ctxs = STARPU_NMAX_SCHED_CTXS - 2;
  737. }
  738. else
  739. {
  740. rm->max_temporary_ctxs = 0;
  741. }
  742. rm->avail_temporary_ctxs = rm->max_temporary_ctxs;
  743. if (rm->selected_nworkers == 0)
  744. {
  745. rm->starpu_in_pause = 1;
  746. starpu_pause();
  747. }
  748. else
  749. {
  750. rm->starpu_in_pause = 0;
  751. }
  752. pthread_mutex_lock(&rm->event_list_mutex);
  753. rm->event_processing_enabled = 1;
  754. pthread_cond_broadcast(&rm->event_processing_cond);
  755. pthread_mutex_unlock(&rm->event_list_mutex);
  756. _starpurm = rm;
  757. #ifdef STARPURM_HAVE_DLB
  758. starpurm_dlb_init(rm);
  759. #endif
  760. }
  761. /* Free rm struct for StarPU */
  762. void starpurm_shutdown(void)
  763. {
  764. assert(_starpurm != NULL);
  765. assert(_starpurm->state != state_uninitialized);
  766. struct s_starpurm *rm = _starpurm;
  767. if (rm->starpu_in_pause)
  768. {
  769. starpu_resume();
  770. rm->starpu_in_pause = 0;
  771. }
  772. starpu_sched_ctx_delete(rm->sched_ctx_id);
  773. #ifdef STARPURM_STARPU_HAVE_WORKER_CALLBACKS
  774. _enqueue_exit_event();
  775. #endif
  776. starpu_shutdown();
  777. #ifdef STARPURM_HAVE_DLB
  778. starpurm_dlb_exit();
  779. #endif
  780. hwloc_topology_destroy(rm->topology);
  781. #ifdef STARPURM_STARPU_HAVE_WORKER_CALLBACKS
  782. pthread_join(rm->event_thread, NULL);
  783. #endif
  784. assert(rm->event_list_head == NULL);
  785. assert(rm->event_list_tail == NULL);
  786. pthread_cond_destroy(&rm->event_list_cond);
  787. pthread_mutex_destroy(&rm->event_list_mutex);
  788. rm->state = state_uninitialized;
  789. hwloc_bitmap_free(rm->global_cpuset);
  790. hwloc_bitmap_free(rm->all_cpu_workers_cpuset);
  791. hwloc_bitmap_free(rm->all_opencl_device_workers_cpuset);
  792. hwloc_bitmap_free(rm->all_cuda_device_workers_cpuset);
  793. hwloc_bitmap_free(rm->all_mic_device_workers_cpuset);
  794. hwloc_bitmap_free(rm->all_device_workers_cpuset);
  795. hwloc_bitmap_free(rm->selected_cpuset);
  796. int i;
  797. for (i=0; i<rm->nunits; i++)
  798. {
  799. pthread_cond_destroy(&rm->units[i].unit_available_cond);
  800. }
  801. free(rm->units);
  802. rm->units = NULL;
  803. free(rm->nunits_by_type);
  804. rm->nunits_by_type = NULL;
  805. free(rm->unit_offsets_by_type);
  806. rm->unit_offsets_by_type = NULL;
  807. free(rm);
  808. _starpurm = NULL;
  809. }
  810. void starpurm_spawn_kernel_on_cpus(void *data, void(*f)(void *), void *args, hwloc_cpuset_t cpuset)
  811. {
  812. (void) data;
  813. assert(_starpurm != NULL);
  814. assert(_starpurm->state != state_uninitialized);
  815. struct s_starpurm *rm = _starpurm;
  816. unsigned ctx = _starpurm_temporary_context_alloc(cpuset);
  817. starpu_sched_ctx_set_context(&ctx);
  818. f(args);
  819. starpu_sched_ctx_set_context(&rm->sched_ctx_id);
  820. _starpurm_temporary_context_free(ctx);
  821. }
  822. struct s_starpurm__spawn_args
  823. {
  824. void(*f)(void *);
  825. void *args;
  826. void(*cb_f)(void *);
  827. void *cb_args;
  828. hwloc_cpuset_t cpuset;
  829. };
  830. static void *_starpurm_spawn_kernel_thread(void *_spawn_args)
  831. {
  832. struct s_starpurm__spawn_args *spawn_args = _spawn_args;
  833. unsigned ctx = _starpurm_temporary_context_alloc(spawn_args->cpuset);
  834. starpu_sched_ctx_set_context(&ctx);
  835. spawn_args->f(spawn_args->args);
  836. struct s_starpurm *rm = _starpurm;
  837. starpu_sched_ctx_set_context(&rm->sched_ctx_id);
  838. _starpurm_temporary_context_free(ctx);
  839. spawn_args->cb_f(spawn_args->cb_args);
  840. hwloc_bitmap_free(spawn_args->cpuset);
  841. free(spawn_args);
  842. return NULL;
  843. }
  844. void starpurm_spawn_kernel_on_cpus_callback(void *data, void(*f)(void *), void *args, hwloc_cpuset_t cpuset, void(*cb_f)(void *), void *cb_args)
  845. {
  846. (void) data;
  847. struct s_starpurm__spawn_args *spawn_args = calloc(1, sizeof(*spawn_args));
  848. spawn_args->f = f;
  849. spawn_args->args = args;
  850. spawn_args->cb_f = cb_f;
  851. spawn_args->cb_args = cb_args;
  852. spawn_args->cpuset = hwloc_bitmap_dup(cpuset);
  853. pthread_attr_t attr;
  854. int ret;
  855. ret = pthread_attr_init(&attr);
  856. assert(ret == 0);
  857. ret = pthread_attr_setdetachstate(&attr, 1);
  858. assert(ret == 0);
  859. pthread_t t;
  860. ret = pthread_create(&t, &attr, _starpurm_spawn_kernel_thread, spawn_args);
  861. assert(ret == 0);
  862. }
  863. hwloc_cpuset_t starpurm_get_cpu_worker_cpuset(int unit_rank)
  864. {
  865. assert(_starpurm != NULL);
  866. assert(_starpurm->state != state_uninitialized);
  867. struct s_starpurm *rm = _starpurm;
  868. assert(unit_rank >= 0 && unit_rank < rm->nunits_by_type[starpurm_unit_cpu]);
  869. return hwloc_bitmap_dup(rm->units[rm->unit_offsets_by_type[starpurm_unit_cpu] + unit_rank].worker_cpuset);
  870. }
  871. /* Dynamic resource sharing */
  872. starpurm_drs_ret_t starpurm_set_drs_enable(starpurm_drs_desc_t *spd)
  873. {
  874. (void)spd;
  875. assert(_starpurm != NULL);
  876. assert(_starpurm->state != state_uninitialized);
  877. struct s_starpurm *rm = _starpurm;
  878. rm->dynamic_resource_sharing = 1;
  879. return starpurm_DRS_SUCCESS;
  880. }
  881. starpurm_drs_ret_t starpurm_set_drs_disable(starpurm_drs_desc_t *spd)
  882. {
  883. (void)spd;
  884. assert(_starpurm != NULL);
  885. assert(_starpurm->state != state_uninitialized);
  886. struct s_starpurm *rm = _starpurm;
  887. rm->dynamic_resource_sharing = 0;
  888. return starpurm_DRS_SUCCESS;
  889. }
  890. int starpurm_drs_enabled_p(void)
  891. {
  892. assert(_starpurm != NULL);
  893. assert(_starpurm->state != state_uninitialized);
  894. struct s_starpurm *rm = _starpurm;
  895. return rm->dynamic_resource_sharing;
  896. }
  897. starpurm_drs_ret_t starpurm_set_max_parallelism(starpurm_drs_desc_t *spd, int ncpus)
  898. {
  899. (void)spd;
  900. assert(_starpurm != NULL);
  901. assert(_starpurm->state != state_uninitialized);
  902. struct s_starpurm *rm = _starpurm;
  903. if (!rm->dynamic_resource_sharing)
  904. return starpurm_DRS_DISABLD;
  905. if (ncpus > rm->nunits_by_type[starpurm_unit_cpu])
  906. {
  907. ncpus = rm->nunits_by_type[starpurm_unit_cpu];
  908. }
  909. rm->max_ncpus = ncpus;
  910. if (rm->selected_ncpus > ncpus)
  911. {
  912. return _starpurm_set_ncpus(ncpus);
  913. }
  914. return starpurm_DRS_SUCCESS;
  915. }
  916. starpurm_drs_ret_t starpurm_callback_set(starpurm_drs_desc_t *spd, starpurm_drs_cbs_t which, starpurm_drs_cb_t callback)
  917. {
  918. (void)spd;
  919. (void)which;
  920. (void)callback;
  921. /* unimplemented */
  922. assert(0);
  923. return starpurm_DRS_PERM;
  924. }
  925. starpurm_drs_ret_t starpurm_callback_get(starpurm_drs_desc_t *spd, starpurm_drs_cbs_t which, starpurm_drs_cb_t *callback)
  926. {
  927. (void)spd;
  928. (void)which;
  929. (void)callback;
  930. /* unimplemented */
  931. assert(0);
  932. return starpurm_DRS_PERM;
  933. }
  934. starpurm_drs_ret_t starpurm_assign_cpu_to_starpu(starpurm_drs_desc_t *spd, int cpuid)
  935. {
  936. assert(_starpurm != NULL);
  937. assert(_starpurm->state != state_uninitialized);
  938. struct s_starpurm *rm = _starpurm;
  939. if (!rm->dynamic_resource_sharing)
  940. return starpurm_DRS_DISABLD;
  941. starpurm_drs_ret_t ret = 0;
  942. assert(hwloc_bitmap_isset(rm->global_cpuset, cpuid));
  943. if (!hwloc_bitmap_isset(rm->selected_cpuset, cpuid))
  944. {
  945. hwloc_cpuset_t temp_cpuset = hwloc_bitmap_dup(rm->selected_cpuset);
  946. hwloc_bitmap_set(temp_cpuset, cpuid);
  947. ret = _starpurm_update_cpuset(temp_cpuset);
  948. hwloc_bitmap_free(temp_cpuset);
  949. }
  950. return ret;
  951. }
  952. starpurm_drs_ret_t starpurm_assign_cpus_to_starpu(starpurm_drs_desc_t *spd, int ncpus)
  953. {
  954. (void)spd;
  955. assert(_starpurm != NULL);
  956. assert(_starpurm->state != state_uninitialized);
  957. struct s_starpurm *rm = _starpurm;
  958. if (!rm->dynamic_resource_sharing)
  959. return starpurm_DRS_DISABLD;
  960. /* add ncpus more CPUs to the CPUs pool */
  961. return _starpurm_set_ncpus(rm->selected_ncpus+ncpus);
  962. }
  963. starpurm_drs_ret_t starpurm_assign_cpu_mask_to_starpu(starpurm_drs_desc_t *spd, const hwloc_cpuset_t mask)
  964. {
  965. (void)spd;
  966. assert(_starpurm != NULL);
  967. assert(_starpurm->state != state_uninitialized);
  968. struct s_starpurm *rm = _starpurm;
  969. if (!rm->dynamic_resource_sharing)
  970. return starpurm_DRS_DISABLD;
  971. hwloc_cpuset_t temp_cpuset = hwloc_bitmap_dup(rm->selected_cpuset);
  972. hwloc_bitmap_or(temp_cpuset, temp_cpuset, mask);
  973. starpurm_drs_ret_t ret = _starpurm_update_cpuset(temp_cpuset);
  974. hwloc_bitmap_free(temp_cpuset);
  975. return ret;
  976. }
  977. starpurm_drs_ret_t starpurm_assign_all_cpus_to_starpu(starpurm_drs_desc_t *spd)
  978. {
  979. assert(_starpurm != NULL);
  980. assert(_starpurm->state != state_uninitialized);
  981. struct s_starpurm *rm = _starpurm;
  982. if (!rm->dynamic_resource_sharing)
  983. return starpurm_DRS_DISABLD;
  984. return starpurm_assign_cpus_to_starpu(spd, rm->nunits_by_type[starpurm_unit_cpu]);
  985. }
  986. starpurm_drs_ret_t starpurm_withdraw_cpu_from_starpu(starpurm_drs_desc_t *spd, int cpuid)
  987. {
  988. assert(_starpurm != NULL);
  989. assert(_starpurm->state != state_uninitialized);
  990. struct s_starpurm *rm = _starpurm;
  991. if (!rm->dynamic_resource_sharing)
  992. return starpurm_DRS_DISABLD;
  993. starpurm_drs_ret_t ret = 0;
  994. assert(hwloc_bitmap_isset(rm->global_cpuset, cpuid));
  995. if (hwloc_bitmap_isset(rm->selected_cpuset, cpuid))
  996. {
  997. hwloc_cpuset_t temp_cpuset = hwloc_bitmap_dup(rm->selected_cpuset);
  998. hwloc_bitmap_clr(temp_cpuset, cpuid);
  999. ret = _starpurm_update_cpuset(temp_cpuset);
  1000. hwloc_bitmap_free(temp_cpuset);
  1001. }
  1002. return ret;
  1003. }
  1004. starpurm_drs_ret_t starpurm_withdraw_cpus_from_starpu(starpurm_drs_desc_t *spd, int ncpus)
  1005. {
  1006. (void)spd;
  1007. assert(_starpurm != NULL);
  1008. assert(_starpurm->state != state_uninitialized);
  1009. struct s_starpurm *rm = _starpurm;
  1010. if (!rm->dynamic_resource_sharing)
  1011. return starpurm_DRS_DISABLD;
  1012. /* add ncpus more CPUs to the CPUs pool */
  1013. starpurm_drs_ret_t ret = 0;
  1014. if (ncpus <= rm->nunits_by_type[starpurm_unit_cpu])
  1015. {
  1016. ret = _starpurm_set_ncpus(rm->nunits_by_type[starpurm_unit_cpu]-ncpus);
  1017. }
  1018. else
  1019. {
  1020. ret = _starpurm_set_ncpus(0);
  1021. }
  1022. return ret;
  1023. }
  1024. starpurm_drs_ret_t starpurm_withdraw_cpu_mask_from_starpu(starpurm_drs_desc_t *spd, const hwloc_cpuset_t mask)
  1025. {
  1026. (void)spd;
  1027. assert(_starpurm != NULL);
  1028. assert(_starpurm->state != state_uninitialized);
  1029. struct s_starpurm *rm = _starpurm;
  1030. if (!rm->dynamic_resource_sharing)
  1031. return starpurm_DRS_DISABLD;
  1032. hwloc_cpuset_t temp_cpuset = hwloc_bitmap_dup(rm->selected_cpuset);
  1033. hwloc_bitmap_andnot(temp_cpuset, temp_cpuset, mask);
  1034. starpurm_drs_ret_t ret = _starpurm_update_cpuset(temp_cpuset);
  1035. hwloc_bitmap_free(temp_cpuset);
  1036. return ret;
  1037. }
  1038. starpurm_drs_ret_t starpurm_withdraw_all_cpus_from_starpu(starpurm_drs_desc_t *spd)
  1039. {
  1040. assert(_starpurm != NULL);
  1041. assert(_starpurm->state != state_uninitialized);
  1042. struct s_starpurm *rm = _starpurm;
  1043. if (!rm->dynamic_resource_sharing)
  1044. return starpurm_DRS_DISABLD;
  1045. return starpurm_withdraw_cpus_from_starpu(spd, rm->nunits_by_type[starpurm_unit_cpu]);
  1046. }
  1047. /* --- */
  1048. starpurm_drs_ret_t starpurm_lend_cpu(starpurm_drs_desc_t *spd, int cpuid)
  1049. {
  1050. return starpurm_assign_cpu_to_starpu(spd, cpuid);
  1051. }
  1052. starpurm_drs_ret_t starpurm_lend_cpus(starpurm_drs_desc_t *spd, int ncpus)
  1053. {
  1054. return starpurm_assign_cpus_to_starpu(spd, ncpus);
  1055. }
  1056. starpurm_drs_ret_t starpurm_lend_cpu_mask(starpurm_drs_desc_t *spd, const hwloc_cpuset_t mask)
  1057. {
  1058. return starpurm_assign_cpu_mask_to_starpu(spd, mask);
  1059. }
  1060. starpurm_drs_ret_t starpurm_lend(starpurm_drs_desc_t *spd)
  1061. {
  1062. return starpurm_assign_all_cpus_to_starpu(spd);
  1063. }
  1064. starpurm_drs_ret_t starpurm_reclaim_cpu(starpurm_drs_desc_t *spd, int cpuid)
  1065. {
  1066. return starpurm_withdraw_cpu_from_starpu(spd, cpuid);
  1067. }
  1068. starpurm_drs_ret_t starpurm_reclaim_cpus(starpurm_drs_desc_t *spd, int ncpus)
  1069. {
  1070. return starpurm_withdraw_cpus_from_starpu(spd, ncpus);
  1071. }
  1072. starpurm_drs_ret_t starpurm_reclaim_cpu_mask(starpurm_drs_desc_t *spd, const hwloc_cpuset_t mask)
  1073. {
  1074. return starpurm_withdraw_cpu_mask_from_starpu(spd, mask);
  1075. }
  1076. starpurm_drs_ret_t starpurm_reclaim(starpurm_drs_desc_t *spd)
  1077. {
  1078. return starpurm_withdraw_all_cpus_from_starpu(spd);
  1079. }
  1080. starpurm_drs_ret_t starpurm_acquire(starpurm_drs_desc_t *spd)
  1081. {
  1082. return starpurm_withdraw_all_cpus_from_starpu(spd);
  1083. }
  1084. starpurm_drs_ret_t starpurm_acquire_cpu(starpurm_drs_desc_t *spd, int cpuid)
  1085. {
  1086. return starpurm_withdraw_cpu_from_starpu(spd, cpuid);
  1087. }
  1088. starpurm_drs_ret_t starpurm_acquire_cpus(starpurm_drs_desc_t *spd, int ncpus)
  1089. {
  1090. return starpurm_withdraw_cpus_from_starpu(spd, ncpus);
  1091. }
  1092. starpurm_drs_ret_t starpurm_acquire_cpu_mask(starpurm_drs_desc_t *spd, const hwloc_cpuset_t mask)
  1093. {
  1094. return starpurm_withdraw_cpu_mask_from_starpu(spd, mask);
  1095. }
  1096. starpurm_drs_ret_t starpurm_return_all(starpurm_drs_desc_t *spd)
  1097. {
  1098. return starpurm_assign_all_cpus_to_starpu(spd);
  1099. }
  1100. starpurm_drs_ret_t starpurm_return_cpu(starpurm_drs_desc_t *spd, int cpuid)
  1101. {
  1102. return starpurm_assign_cpu_to_starpu(spd, cpuid);
  1103. }
  1104. /* Pause/resume */
  1105. starpurm_drs_ret_t starpurm_create_block_condition(starpurm_block_cond_t *cond)
  1106. {
  1107. /* unimplemented */
  1108. assert(0);
  1109. return starpurm_DRS_PERM;
  1110. }
  1111. void starpurm_block_current_task(starpurm_block_cond_t *cond)
  1112. {
  1113. /* unimplemented */
  1114. assert(0);
  1115. }
  1116. void starpurm_signal_block_condition(starpurm_block_cond_t *cond)
  1117. {
  1118. /* unimplemented */
  1119. assert(0);
  1120. }
  1121. void starpurm_register_polling_service(const char *service_name, starpurm_polling_t function, void *data)
  1122. {
  1123. /* unimplemented */
  1124. assert(0);
  1125. }
  1126. void starpurm_unregister_polling_service(const char *service_name, starpurm_polling_t function, void *data)
  1127. {
  1128. /* unimplemented */
  1129. assert(0);
  1130. }
  1131. /* devices */
  1132. int starpurm_get_device_type_id(const char *type_str)
  1133. {
  1134. if (strcmp(type_str, "cpu") == 0)
  1135. return starpurm_unit_cpu;
  1136. if (strcmp(type_str, "opencl") == 0)
  1137. return starpurm_unit_opencl;
  1138. if (strcmp(type_str, "cuda") == 0)
  1139. return starpurm_unit_cuda;
  1140. if (strcmp(type_str, "mic") == 0)
  1141. return starpurm_unit_mic;
  1142. return -1;
  1143. }
  1144. const char *starpurm_get_device_type_name(int type_id)
  1145. {
  1146. if (type_id == starpurm_unit_cpu)
  1147. return "cpu";
  1148. if (type_id == starpurm_unit_opencl)
  1149. return "opencl";
  1150. if (type_id == starpurm_unit_cuda)
  1151. return "cuda";
  1152. if (type_id == starpurm_unit_mic)
  1153. return "mic";
  1154. return NULL;
  1155. }
  1156. int starpurm_get_nb_devices_by_type(int type_id)
  1157. {
  1158. assert(_starpurm != NULL);
  1159. assert(_starpurm->state != state_uninitialized);
  1160. struct s_starpurm *rm = _starpurm;
  1161. if (type_id < 0 || type_id >= starpurm_unit_ntypes)
  1162. return -1;
  1163. return rm->nunits_by_type[type_id];
  1164. }
  1165. int starpurm_get_device_id(int type_id, int unit_rank)
  1166. {
  1167. assert(_starpurm != NULL);
  1168. assert(_starpurm->state != state_uninitialized);
  1169. struct s_starpurm *rm = _starpurm;
  1170. if (type_id < 0 || type_id >= starpurm_unit_ntypes)
  1171. return -1;
  1172. if (unit_rank < 0 || unit_rank >= rm->nunits_by_type[type_id])
  1173. return -1;
  1174. return rm->units[rm->unit_offsets_by_type[type_id] + unit_rank].id;
  1175. }
  1176. starpurm_drs_ret_t starpurm_assign_device_to_starpu(starpurm_drs_desc_t *spd, int type_id, int unit_rank)
  1177. {
  1178. assert(_starpurm != NULL);
  1179. assert(_starpurm->state != state_uninitialized);
  1180. struct s_starpurm *rm = _starpurm;
  1181. if (!rm->dynamic_resource_sharing)
  1182. return starpurm_DRS_DISABLD;
  1183. if (type_id < 0 || type_id >= starpurm_unit_ntypes)
  1184. return starpurm_DRS_EINVAL;
  1185. if (unit_rank < 0 || unit_rank >= rm->nunits_by_type[type_id])
  1186. return starpurm_DRS_EINVAL;
  1187. hwloc_cpuset_t temp_cpuset = hwloc_bitmap_dup(rm->selected_cpuset);
  1188. hwloc_bitmap_or(temp_cpuset, temp_cpuset, rm->units[rm->unit_offsets_by_type[type_id] + unit_rank].worker_cpuset);
  1189. starpurm_drs_ret_t ret = _starpurm_update_cpuset(temp_cpuset);
  1190. hwloc_bitmap_free(temp_cpuset);
  1191. return ret;
  1192. }
  1193. starpurm_drs_ret_t starpurm_assign_devices_to_starpu(starpurm_drs_desc_t *spd, int type_id, int ndevices)
  1194. {
  1195. (void)spd;
  1196. assert(_starpurm != NULL);
  1197. assert(_starpurm->state != state_uninitialized);
  1198. struct s_starpurm *rm = _starpurm;
  1199. if (!rm->dynamic_resource_sharing)
  1200. return starpurm_DRS_DISABLD;
  1201. if (type_id < 0 || type_id >= starpurm_unit_ntypes)
  1202. return starpurm_DRS_EINVAL;
  1203. hwloc_cpuset_t temp_cpuset = hwloc_bitmap_dup(rm->selected_cpuset);
  1204. if (ndevices > rm->nunits_by_type[type_id])
  1205. {
  1206. ndevices = rm->nunits_by_type[type_id];
  1207. }
  1208. int i;
  1209. for (i = 0; i < ndevices; i++)
  1210. {
  1211. hwloc_bitmap_or(temp_cpuset, temp_cpuset, rm->units[rm->unit_offsets_by_type[type_id] + i].worker_cpuset);
  1212. }
  1213. starpurm_drs_ret_t ret = _starpurm_update_cpuset(temp_cpuset);
  1214. hwloc_bitmap_free(temp_cpuset);
  1215. return ret;
  1216. }
  1217. starpurm_drs_ret_t starpurm_assign_device_mask_to_starpu(starpurm_drs_desc_t *spd, const hwloc_cpuset_t mask)
  1218. {
  1219. (void)spd;
  1220. assert(_starpurm != NULL);
  1221. assert(_starpurm->state != state_uninitialized);
  1222. struct s_starpurm *rm = _starpurm;
  1223. if (!rm->dynamic_resource_sharing)
  1224. return starpurm_DRS_DISABLD;
  1225. hwloc_cpuset_t temp_cpuset = hwloc_bitmap_dup(rm->selected_cpuset);
  1226. hwloc_bitmap_or(temp_cpuset, temp_cpuset, mask);
  1227. starpurm_drs_ret_t ret = _starpurm_update_cpuset(temp_cpuset);
  1228. hwloc_bitmap_free(temp_cpuset);
  1229. return ret;
  1230. }
  1231. starpurm_drs_ret_t starpurm_assign_all_devices_to_starpu(starpurm_drs_desc_t *spd, int type_id)
  1232. {
  1233. assert(_starpurm != NULL);
  1234. assert(_starpurm->state != state_uninitialized);
  1235. struct s_starpurm *rm = _starpurm;
  1236. if (!rm->dynamic_resource_sharing)
  1237. return starpurm_DRS_DISABLD;
  1238. if (type_id < 0 || type_id >= starpurm_unit_ntypes)
  1239. return starpurm_DRS_EINVAL;
  1240. return starpurm_assign_devices_to_starpu(spd, type_id, rm->nunits_by_type[type_id]);
  1241. }
  1242. starpurm_drs_ret_t starpurm_withdraw_device_from_starpu(starpurm_drs_desc_t *spd, int type_id, int unit_rank)
  1243. {
  1244. assert(_starpurm != NULL);
  1245. assert(_starpurm->state != state_uninitialized);
  1246. struct s_starpurm *rm = _starpurm;
  1247. if (!rm->dynamic_resource_sharing)
  1248. return starpurm_DRS_DISABLD;
  1249. if (type_id < 0 || type_id >= starpurm_unit_ntypes)
  1250. return starpurm_DRS_EINVAL;
  1251. if (unit_rank < 0 || unit_rank >= rm->nunits_by_type[type_id])
  1252. return starpurm_DRS_EINVAL;
  1253. hwloc_cpuset_t temp_cpuset = hwloc_bitmap_dup(rm->selected_cpuset);
  1254. hwloc_bitmap_andnot(temp_cpuset, temp_cpuset, rm->units[rm->unit_offsets_by_type[type_id] + unit_rank].worker_cpuset);
  1255. starpurm_drs_ret_t ret = _starpurm_update_cpuset(temp_cpuset);
  1256. hwloc_bitmap_free(temp_cpuset);
  1257. return ret;
  1258. }
  1259. starpurm_drs_ret_t starpurm_withdraw_devices_from_starpu(starpurm_drs_desc_t *spd, int type_id, int ndevices)
  1260. {
  1261. (void)spd;
  1262. assert(_starpurm != NULL);
  1263. assert(_starpurm->state != state_uninitialized);
  1264. struct s_starpurm *rm = _starpurm;
  1265. if (!rm->dynamic_resource_sharing)
  1266. return starpurm_DRS_DISABLD;
  1267. if (type_id < 0 || type_id >= starpurm_unit_ntypes)
  1268. return starpurm_DRS_EINVAL;
  1269. hwloc_cpuset_t temp_cpuset = hwloc_bitmap_dup(rm->selected_cpuset);
  1270. if (ndevices > rm->nunits_by_type[type_id])
  1271. {
  1272. ndevices = rm->nunits_by_type[type_id];
  1273. }
  1274. int i;
  1275. for (i = 0; i < ndevices; i++)
  1276. {
  1277. hwloc_bitmap_andnot(temp_cpuset, temp_cpuset, rm->units[rm->unit_offsets_by_type[type_id] + i].worker_cpuset);
  1278. }
  1279. starpurm_drs_ret_t ret = _starpurm_update_cpuset(temp_cpuset);
  1280. hwloc_bitmap_free(temp_cpuset);
  1281. return ret;
  1282. }
  1283. starpurm_drs_ret_t starpurm_withdraw_device_mask_from_starpu(starpurm_drs_desc_t *spd, const hwloc_cpuset_t mask)
  1284. {
  1285. (void)spd;
  1286. assert(_starpurm != NULL);
  1287. assert(_starpurm->state != state_uninitialized);
  1288. struct s_starpurm *rm = _starpurm;
  1289. if (!rm->dynamic_resource_sharing)
  1290. return starpurm_DRS_DISABLD;
  1291. hwloc_cpuset_t temp_cpuset = hwloc_bitmap_dup(rm->selected_cpuset);
  1292. hwloc_bitmap_andnot(temp_cpuset, temp_cpuset, mask);
  1293. starpurm_drs_ret_t ret = _starpurm_update_cpuset(temp_cpuset);
  1294. hwloc_bitmap_free(temp_cpuset);
  1295. return ret;
  1296. }
  1297. starpurm_drs_ret_t starpurm_withdraw_all_devices_from_starpu(starpurm_drs_desc_t *spd, int type_id)
  1298. {
  1299. assert(_starpurm != NULL);
  1300. assert(_starpurm->state != state_uninitialized);
  1301. struct s_starpurm *rm = _starpurm;
  1302. if (!rm->dynamic_resource_sharing)
  1303. return starpurm_DRS_DISABLD;
  1304. if (type_id < 0 || type_id >= starpurm_unit_ntypes)
  1305. return starpurm_DRS_EINVAL;
  1306. return starpurm_withdraw_devices_from_starpu(spd, type_id, rm->nunits_by_type[type_id]);
  1307. }
  1308. /* --- */
  1309. starpurm_drs_ret_t starpurm_lend_device(starpurm_drs_desc_t *spd, int type_id, int unit_rank)
  1310. {
  1311. return starpurm_assign_device_to_starpu(spd, type_id, unit_rank);
  1312. }
  1313. starpurm_drs_ret_t starpurm_lend_devices(starpurm_drs_desc_t *spd, int type_id, int ndevices)
  1314. {
  1315. return starpurm_assign_devices_to_starpu(spd, type_id, ndevices);
  1316. }
  1317. starpurm_drs_ret_t starpurm_lend_device_mask(starpurm_drs_desc_t *spd, const hwloc_cpuset_t mask)
  1318. {
  1319. return starpurm_assign_device_mask_to_starpu(spd, mask);
  1320. }
  1321. starpurm_drs_ret_t starpurm_lend_all_devices(starpurm_drs_desc_t *spd, int type_id)
  1322. {
  1323. return starpurm_assign_all_devices_to_starpu(spd, type_id);
  1324. }
  1325. starpurm_drs_ret_t starpurm_reclaim_device(starpurm_drs_desc_t *spd, int type_id, int unit_rank)
  1326. {
  1327. return starpurm_withdraw_device_from_starpu(spd, type_id, unit_rank);
  1328. }
  1329. starpurm_drs_ret_t starpurm_reclaim_devices(starpurm_drs_desc_t *spd, int type_id, int ndevices)
  1330. {
  1331. return starpurm_withdraw_devices_from_starpu(spd, type_id, ndevices);
  1332. }
  1333. starpurm_drs_ret_t starpurm_reclaim_device_mask(starpurm_drs_desc_t *spd, const hwloc_cpuset_t mask)
  1334. {
  1335. return starpurm_withdraw_device_mask_from_starpu(spd, mask);
  1336. }
  1337. starpurm_drs_ret_t starpurm_reclaim_all_devices(starpurm_drs_desc_t *spd, int type_id)
  1338. {
  1339. return starpurm_withdraw_all_devices_from_starpu(spd, type_id);
  1340. }
  1341. starpurm_drs_ret_t starpurm_acquire_all_devices(starpurm_drs_desc_t *spd, int type_id)
  1342. {
  1343. return starpurm_withdraw_all_devices_from_starpu(spd, type_id);
  1344. }
  1345. starpurm_drs_ret_t starpurm_acquire_device(starpurm_drs_desc_t *spd, int type_id, int unit_rank)
  1346. {
  1347. return starpurm_withdraw_device_from_starpu(spd, type_id, unit_rank);
  1348. }
  1349. starpurm_drs_ret_t starpurm_acquire_devices(starpurm_drs_desc_t *spd, int type_id, int ndevices)
  1350. {
  1351. return starpurm_withdraw_devices_from_starpu(spd, type_id, ndevices);
  1352. }
  1353. starpurm_drs_ret_t starpurm_acquire_device_mask(starpurm_drs_desc_t *spd, const hwloc_cpuset_t mask)
  1354. {
  1355. return starpurm_withdraw_device_mask_from_starpu(spd, mask);
  1356. }
  1357. starpurm_drs_ret_t starpurm_return_all_devices(starpurm_drs_desc_t *spd, int type_id)
  1358. {
  1359. return starpurm_assign_all_devices_to_starpu(spd, type_id);
  1360. }
  1361. starpurm_drs_ret_t starpurm_return_device(starpurm_drs_desc_t *spd, int type_id, int unit_rank)
  1362. {
  1363. return starpurm_assign_device_to_starpu(spd, type_id, unit_rank);
  1364. }
  1365. /* cpusets */
  1366. hwloc_cpuset_t starpurm_get_device_worker_cpuset(int type_id, int unit_rank)
  1367. {
  1368. assert(_starpurm != NULL);
  1369. assert(_starpurm->state != state_uninitialized);
  1370. struct s_starpurm *rm = _starpurm;
  1371. assert(type_id >= 0 && type_id < starpurm_unit_ntypes);
  1372. assert(unit_rank >= 0 && unit_rank < rm->nunits_by_type[type_id]);
  1373. return hwloc_bitmap_dup(rm->units[rm->unit_offsets_by_type[type_id] + unit_rank].worker_cpuset);
  1374. }
  1375. hwloc_cpuset_t starpurm_get_global_cpuset(void)
  1376. {
  1377. assert(_starpurm != NULL);
  1378. assert(_starpurm->state != state_uninitialized);
  1379. struct s_starpurm *rm = _starpurm;
  1380. return hwloc_bitmap_dup(rm->global_cpuset);
  1381. }
  1382. hwloc_cpuset_t starpurm_get_selected_cpuset(void)
  1383. {
  1384. assert(_starpurm != NULL);
  1385. assert(_starpurm->state != state_uninitialized);
  1386. struct s_starpurm *rm = _starpurm;
  1387. return hwloc_bitmap_dup(rm->selected_cpuset);
  1388. }
  1389. hwloc_cpuset_t starpurm_get_all_cpu_workers_cpuset(void)
  1390. {
  1391. assert(_starpurm != NULL);
  1392. assert(_starpurm->state != state_uninitialized);
  1393. struct s_starpurm *rm = _starpurm;
  1394. return hwloc_bitmap_dup(rm->all_cpu_workers_cpuset);
  1395. }
  1396. static hwloc_cpuset_t starpurm_get_all_opencl_device_workers_cpuset(void)
  1397. {
  1398. assert(_starpurm != NULL);
  1399. assert(_starpurm->state != state_uninitialized);
  1400. struct s_starpurm *rm = _starpurm;
  1401. return hwloc_bitmap_dup(rm->all_opencl_device_workers_cpuset);
  1402. }
  1403. static hwloc_cpuset_t starpurm_get_all_cuda_device_workers_cpuset(void)
  1404. {
  1405. assert(_starpurm != NULL);
  1406. assert(_starpurm->state != state_uninitialized);
  1407. struct s_starpurm *rm = _starpurm;
  1408. return hwloc_bitmap_dup(rm->all_cuda_device_workers_cpuset);
  1409. }
  1410. static hwloc_cpuset_t starpurm_get_all_mic_device_workers_cpuset(void)
  1411. {
  1412. assert(_starpurm != NULL);
  1413. assert(_starpurm->state != state_uninitialized);
  1414. struct s_starpurm *rm = _starpurm;
  1415. return hwloc_bitmap_dup(rm->all_mic_device_workers_cpuset);
  1416. }
  1417. hwloc_cpuset_t starpurm_get_all_device_workers_cpuset(void)
  1418. {
  1419. assert(_starpurm != NULL);
  1420. assert(_starpurm->state != state_uninitialized);
  1421. struct s_starpurm *rm = _starpurm;
  1422. return hwloc_bitmap_dup(rm->all_device_workers_cpuset);
  1423. }
  1424. hwloc_cpuset_t starpurm_get_all_device_workers_cpuset_by_type(int typeid)
  1425. {
  1426. assert(_starpurm != NULL);
  1427. assert(_starpurm->state != state_uninitialized);
  1428. assert(typeid != starpurm_unit_cpu);
  1429. if (typeid == starpurm_unit_opencl)
  1430. return starpurm_get_all_opencl_device_workers_cpuset();
  1431. if (typeid == starpurm_unit_cuda)
  1432. return starpurm_get_all_cuda_device_workers_cpuset();
  1433. if (typeid == starpurm_unit_mic)
  1434. return starpurm_get_all_mic_device_workers_cpuset();
  1435. hwloc_cpuset_t empty_bitmap = hwloc_bitmap_alloc();
  1436. hwloc_bitmap_zero(empty_bitmap);
  1437. return empty_bitmap;
  1438. }