starpu_replay_sched.c 10 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430
  1. /* StarPU --- Runtime system for heterogeneous multicore architectures.
  2. *
  3. * Copyright (C) 2016-2017 Université de Bordeaux
  4. * Copyright (C) 2017 Erwan Leria
  5. *
  6. * StarPU is free software; you can redistribute it and/or modify
  7. * it under the terms of the GNU Lesser General Public License as published by
  8. * the Free Software Foundation; either version 2.1 of the License, or (at
  9. * your option) any later version.
  10. *
  11. * StarPU is distributed in the hope that it will be useful, but
  12. * WITHOUT ANY WARRANTY; without even the implied warranty of
  13. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
  14. *
  15. * See the GNU Lesser General Public License in COPYING.LGPL for more details.
  16. */
  17. /*
  18. * This reads a sched.rec file and mangles submitted tasks according to the hint
  19. * from that file.
  20. */
  21. #include <starpu.h>
  22. #include <unistd.h>
  23. #include <stdio.h>
  24. #include <math.h>
  25. #include <common/uthash.h>
  26. #include <common/list.h>
  27. #include <common/utils.h>
  28. #include <limits.h>
/*
 * sched.rec files are made of "Field: value" lines grouped into records; an
 * empty line terminates a record.  They look like this:
 *
 * SubmitOrder: 1234
 * Priority: 12
 * SpecificWorker: 1
 * Workers: 0 1 2
 * DependsOn: 1235
 *
 * Prefetch: 1234
 * DependsOn: 1233
 * MemoryNode: 1
 * Parameters: 1
 */
  41. #define CPY(src, dst, n) memcpy(dst, src, n * sizeof(*dst))
  42. #if 0
  43. #define debug(fmt, ...) fprintf(stderr, fmt, ##__VA_ARGS__)
  44. #else
  45. #define debug(fmt, ...) (void)0
  46. #endif
  47. static unsigned long submitorder; /* Also use as prefetchtag */
  48. static int priority;
  49. static int eosw;
  50. static unsigned workerorder;
  51. static int memnode;
  52. /* FIXME: MAXs */
  53. static uint32_t workers[STARPU_NMAXWORKERS/32];
  54. static unsigned nworkers;
  55. static unsigned dependson[STARPU_NMAXBUFS];
  56. static unsigned ndependson;
  57. static unsigned params[STARPU_NMAXBUFS];
  58. static unsigned nparams;
  59. static enum sched_type {
  60. NormalTask,
  61. PrefetchTask,
  62. } sched_type;
  63. static struct starpu_codelet cl_prefetch = {
  64. .where = STARPU_NOWHERE,
  65. .nbuffers = 1,
  66. .modes = { STARPU_R },
  67. };
  68. static struct task
  69. {
  70. UT_hash_handle hh;
  71. unsigned long submitorder;
  72. int priority;
  73. int memnode;
  74. unsigned dependson[STARPU_NMAXBUFS];
  75. unsigned ndependson;
  76. struct starpu_task *depends_tasks[STARPU_NMAXBUFS];
  77. /* For real tasks */
  78. int eosw;
  79. unsigned workerorder;
  80. uint32_t workers[STARPU_NMAXWORKERS/32];
  81. unsigned nworkers;
  82. /* For prefetch tasks */
  83. unsigned params[STARPU_NMAXBUFS];
  84. unsigned nparams;
  85. struct starpu_task *pref_task; /* Actual prefetch task */
  86. } *mangled_tasks, *prefetch_tasks;
  87. LIST_TYPE(dep,
  88. struct task *task;
  89. unsigned i;
  90. );
  91. struct deps {
  92. UT_hash_handle hh;
  93. unsigned long submitorder;
  94. struct dep_list list;
  95. } *dependencies = NULL;
  96. static void reset(void) {
  97. submitorder = 0;
  98. priority = INT_MIN;
  99. eosw = -1;
  100. memset(&workers, 0, sizeof(workers));
  101. nworkers = 0;
  102. ndependson = 0;
  103. sched_type = NormalTask;
  104. nparams = 0;
  105. memnode = -1;
  106. workerorder = 0;
  107. }
/* TODO: honour the submission order of tasks (SubmitOrder) */
  109. static void checkField(char * s)
  110. {
  111. /* Record various information */
  112. #define TEST(field) (!strncmp(s, field": ", strlen(field) + 2))
  113. if (TEST("SubmitOrder"))
  114. {
  115. s = s + strlen("SubmitOrder: ");
  116. submitorder = strtol(s, NULL, 10);
  117. }
  118. else if (TEST("Priority"))
  119. {
  120. s = s + strlen("Priority: ");
  121. priority = strtol(s, NULL, 10);
  122. }
  123. else if (TEST("SpecificWorker"))
  124. {
  125. s = s + strlen("SpecificWorker: ");
  126. eosw = strtol(s, NULL, 10);
  127. }
  128. else if (TEST("Workers"))
  129. {
  130. s = s + strlen("Workers: ");
  131. char * delim = " ";
  132. char * token = strtok(s, delim);
  133. int i = 0;
  134. while (token != NULL)
  135. {
  136. int k = strtol(token, NULL, 10);
  137. STARPU_ASSERT_MSG(k < STARPU_NMAXWORKERS, "%d is bigger than maximum %d\n", k, STARPU_NMAXWORKERS);
  138. workers[k/(sizeof(*workers)*8)] |= (1 << (k%(sizeof(*workers)*8)));
  139. i++;
  140. token = strtok(NULL, delim);
  141. }
  142. nworkers = i;
  143. }
  144. else if (TEST("DependsOn"))
  145. {
  146. /* NOTE : dependsons (in the sched.rec) should be the submit orders of the dependencies,
  147. otherwise it can occur an undefined behaviour
  148. (contrary to the tasks.rec where dependencies are jobids */
  149. unsigned i = 0;
  150. char * delim = " ";
  151. char * token = strtok(s+strlen("DependsOn: "), delim);
  152. while (token != NULL)
  153. {
  154. dependson[i] = strtol(token, NULL, 10);
  155. i++;
  156. token = strtok(NULL, delim);
  157. }
  158. ndependson = i;
  159. }
  160. else if (TEST("Prefetch"))
  161. {
  162. s = s + strlen("Prefetch: ");
  163. submitorder = strtol(s, NULL, 10);
  164. sched_type = PrefetchTask;
  165. }
  166. else if (TEST("Parameters"))
  167. {
  168. s = s + strlen("Parameters: ");
  169. char * delim = " ";
  170. char * token = strtok(s, delim);
  171. int i = 0;
  172. while (token != NULL)
  173. {
  174. params[i] = strtol(token, NULL, 10);
  175. i++;
  176. token = strtok(NULL, delim);
  177. }
  178. nparams = i;
  179. }
  180. else if (TEST("MemoryNode"))
  181. {
  182. s = s + strlen("MemoryNode: ");
  183. memnode = strtol(s, NULL, 10);
  184. }
  185. else if (TEST("Workerorder"))
  186. {
  187. s = s + strlen("Workerorder: ");
  188. workerorder = strtol(s, NULL, 10);
  189. }
  190. }
  191. void schedRecInit(const char * filename)
  192. {
  193. FILE * f = fopen(filename, "r");
  194. if(f == NULL)
  195. {
  196. fprintf(stderr,"unable to open file %s: %s\n", filename, strerror(errno));
  197. return;
  198. }
  199. size_t lnsize = 128;
  200. char * s = malloc(sizeof(*s) * lnsize);
  201. int eof = 0;
  202. reset();
  203. while(!eof && !feof(f))
  204. {
  205. char *ln;
  206. /* Get the line */
  207. if (!fgets(s, lnsize, f))
  208. {
  209. eof = 1;
  210. }
  211. while (!(ln = strchr(s, '\n')))
  212. {
  213. _STARPU_REALLOC(s, lnsize * 2);
  214. if (!fgets(s + lnsize-1, lnsize+1, f))
  215. {
  216. eof = 1;
  217. break;
  218. }
  219. lnsize *= 2;
  220. }
  221. if ((ln == s || eof) && submitorder)
  222. {
  223. /* Empty line, doit */
  224. struct task * task;
  225. unsigned i;
  226. _STARPU_MALLOC(task, sizeof(*task));
  227. task->submitorder = submitorder;
  228. task->priority = priority;
  229. task->memnode = memnode;
  230. CPY(dependson, task->dependson, ndependson);
  231. task->ndependson = ndependson;
  232. /* Also record submitorder of tasks that this one will need to depend on */
  233. for (i = 0; i < ndependson; i++) {
  234. struct dep *dep;
  235. struct starpu_task *starpu_task;
  236. _STARPU_MALLOC(dep, sizeof(*dep));
  237. dep->task = task;
  238. dep->i = i;
  239. struct deps *deps;
  240. HASH_FIND(hh, dependencies, &task->dependson[i], sizeof(submitorder), deps);
  241. if (!deps) {
  242. /* No task depends on this one yet, add a cell for it */
  243. _STARPU_MALLOC(deps, sizeof(*deps));
  244. dep_list_init(&deps->list);
  245. deps->submitorder = task->dependson[i];
  246. HASH_ADD(hh, dependencies, submitorder, sizeof(submitorder), deps);
  247. }
  248. dep_list_push_back(&deps->list, dep);
  249. /* Create the intermediate task */
  250. starpu_task = dep->task->depends_tasks[i] = starpu_task_create();
  251. starpu_task->cl = NULL;
  252. starpu_task->destroy = 0;
  253. starpu_task->no_submitorder = 1;
  254. }
  255. switch (sched_type)
  256. {
  257. case NormalTask:
  258. /* A new task to mangle, record what needs to be done */
  259. task->eosw = eosw;
  260. task->workerorder = workerorder;
  261. CPY(workers, task->workers, nworkers);
  262. task->nworkers = nworkers;
  263. STARPU_ASSERT(nparams == 0);
  264. debug("adding mangled task %lu\n", submitorder);
  265. HASH_ADD(hh, mangled_tasks, submitorder, sizeof(submitorder), task);
  266. break;
  267. case PrefetchTask:
  268. STARPU_ASSERT(memnode >= 0);
  269. STARPU_ASSERT(eosw == -1);
  270. STARPU_ASSERT(workerorder == 0);
  271. STARPU_ASSERT(nworkers == 0);
  272. CPY(params, task->params, nparams);
  273. task->nparams = nparams;
  274. /* TODO: more params */
  275. STARPU_ASSERT_MSG(nparams == 1, "only supports one parameter at a time");
  276. debug("adding prefetch task for %lu\n", submitorder);
  277. HASH_ADD(hh, prefetch_tasks, submitorder, sizeof(submitorder), task);
  278. break;
  279. default:
  280. STARPU_ASSERT(0);
  281. break;
  282. }
  283. reset();
  284. }
  285. else checkField(s);
  286. }
  287. }
  288. static void do_prefetch(void *arg)
  289. {
  290. unsigned node = (uintptr_t) arg;
  291. starpu_data_idle_prefetch_on_node(starpu_task_get_current()->handles[0], node, 1);
  292. }
  293. void applySchedRec(struct starpu_task *starpu_task, unsigned long submit_order)
  294. {
  295. struct task *task;
  296. struct deps *deps;
  297. int ret;
  298. HASH_FIND(hh, dependencies, &submit_order, sizeof(submit_order), deps);
  299. if (deps)
  300. {
  301. struct dep *dep;
  302. for (dep = dep_list_begin(&deps->list);
  303. dep != dep_list_end(&deps->list);
  304. dep = dep_list_next(dep))
  305. {
  306. debug("task %lu is %d-th dep for %lu\n", submit_order, dep->i, dep->task->submitorder);
  307. /* Some task will depend on this one, make the dependency */
  308. starpu_task_declare_deps_array(dep->task->depends_tasks[dep->i], 1, &starpu_task);
  309. ret = starpu_task_submit(dep->task->depends_tasks[dep->i]);
  310. STARPU_ASSERT(ret == 0);
  311. }
  312. }
  313. HASH_FIND(hh, prefetch_tasks, &submit_order, sizeof(submit_order), task);
  314. if (task) {
  315. /* We want to submit a prefetch for this task */
  316. debug("task %lu has a prefetch for parameter %d to node %d\n", submit_order, task->params[0], task->memnode);
  317. struct starpu_task *pref_task;
  318. pref_task = task->pref_task = starpu_task_create();
  319. pref_task->cl = &cl_prefetch;
  320. pref_task->destroy = 1;
  321. pref_task->no_submitorder = 1;
  322. pref_task->callback_arg = (void*)(uintptr_t) task->memnode;
  323. pref_task->callback_func = do_prefetch;
  324. /* TODO: more params */
  325. pref_task->handles[0] = starpu_task->handles[task->params[0]];
  326. /* Make it depend on intermediate tasks */
  327. if (task->ndependson)
  328. {
  329. debug("%u dependencies\n", task->ndependson);
  330. starpu_task_declare_deps_array(pref_task, task->ndependson, task->depends_tasks);
  331. }
  332. ret = starpu_task_submit(pref_task);
  333. STARPU_ASSERT(ret == 0);
  334. }
  335. HASH_FIND(hh, mangled_tasks, &submit_order, sizeof(submit_order), task);
  336. if (task == NULL)
  337. /* Nothing to do for this */
  338. return;
  339. debug("mangling task %lu\n", submit_order);
  340. if (task->eosw >= 0)
  341. {
  342. debug("execute on a specific worker %d\n", task->eosw);
  343. starpu_task->workerid = task->eosw;
  344. starpu_task->execute_on_a_specific_worker = 1;
  345. }
  346. if (task->workerorder > 0)
  347. {
  348. debug("workerorder %d\n", task->workerorder);
  349. starpu_task->workerorder = task->workerorder;
  350. }
  351. if (task->priority != INT_MIN)
  352. {
  353. debug("priority %d\n", task->priority);
  354. starpu_task->priority = task->priority;
  355. }
  356. if (task->nworkers)
  357. {
  358. debug("%u workers %x\n", task->nworkers, task->workers[0]);
  359. starpu_task->workerids_len = sizeof(task->workers) / sizeof(task->workers[0]);
  360. _STARPU_MALLOC(starpu_task->workerids, task->nworkers * sizeof(*starpu_task->workerids));
  361. CPY(task->workers, starpu_task->workerids, task->nworkers);
  362. }
  363. if (task->ndependson)
  364. {
  365. debug("%u dependencies\n", task->ndependson);
  366. starpu_task_declare_deps_array(starpu_task, task->ndependson, task->depends_tasks);
  367. }
  368. /* And now, let it go! */
  369. }