starpu_replay_sched.c 10 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439
  1. /* StarPU --- Runtime system for heterogeneous multicore architectures.
  2. *
  3. * Copyright (C) 2016-2017 Université de Bordeaux
  4. * Copyright (C) 2017 Erwan Leria
  5. *
  6. * StarPU is free software; you can redistribute it and/or modify
  7. * it under the terms of the GNU Lesser General Public License as published by
  8. * the Free Software Foundation; either version 2.1 of the License, or (at
  9. * your option) any later version.
  10. *
  11. * StarPU is distributed in the hope that it will be useful, but
  12. * WITHOUT ANY WARRANTY; without even the implied warranty of
  13. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
  14. *
  15. * See the GNU Lesser General Public License in COPYING.LGPL for more details.
  16. */
  17. /*
  18. * This reads a sched.rec file and mangles submitted tasks according to the hint
  19. * from that file.
  20. */
  21. #include <starpu.h>
  22. #include <unistd.h>
  23. #include <stdio.h>
  24. #include <math.h>
  25. #include <common/uthash.h>
  26. #include <common/list.h>
  27. #include <common/utils.h>
  28. #include <limits.h>
/*
 sched.rec files are made of records separated by an empty line.
 A record describes either a task to mangle (SubmitOrder) or a prefetch
 to issue (Prefetch), and looks like this:

 SubmitOrder: 1234
 Priority: 12
 SpecificWorker: 1
 Workers: 0 1 2
 DependsOn: 1235

 Prefetch: 1234
 DependsOn: 1233
 MemoryNode: 1
 Parameters: 1
*/
  41. #define CPY(src, dst, n) memcpy(dst, src, n * sizeof(*dst))
  42. #if 0
  43. #define debug(fmt, ...) fprintf(stderr, fmt, ##__VA_ARGS__)
  44. #else
  45. #define debug(fmt, ...) (void)0
  46. #endif
  47. static unsigned long submitorder; /* Also use as prefetchtag */
  48. static int priority;
  49. static int eosw;
  50. static unsigned workerorder;
  51. static int memnode;
  52. /* FIXME: MAXs */
  53. static uint32_t workers[STARPU_NMAXWORKERS/32];
  54. static unsigned nworkers;
  55. static unsigned dependson[STARPU_NMAXBUFS];
  56. static unsigned ndependson;
  57. static unsigned params[STARPU_NMAXBUFS];
  58. static unsigned nparams;
  59. static enum sched_type
  60. {
  61. NormalTask,
  62. PrefetchTask,
  63. } sched_type;
  64. static struct starpu_codelet cl_prefetch =
  65. {
  66. .where = STARPU_NOWHERE,
  67. .nbuffers = 1,
  68. .modes = { STARPU_R },
  69. };
  70. static struct task
  71. {
  72. UT_hash_handle hh;
  73. unsigned long submitorder;
  74. int priority;
  75. int memnode;
  76. unsigned dependson[STARPU_NMAXBUFS];
  77. unsigned ndependson;
  78. struct starpu_task *depends_tasks[STARPU_NMAXBUFS];
  79. /* For real tasks */
  80. int eosw;
  81. unsigned workerorder;
  82. uint32_t workers[STARPU_NMAXWORKERS/32];
  83. unsigned nworkers;
  84. /* For prefetch tasks */
  85. unsigned params[STARPU_NMAXBUFS];
  86. unsigned nparams;
  87. struct starpu_task *pref_task; /* Actual prefetch task */
  88. } *mangled_tasks, *prefetch_tasks;
  89. LIST_TYPE(dep,
  90. struct task *task;
  91. unsigned i;
  92. );
  93. struct deps
  94. {
  95. UT_hash_handle hh;
  96. unsigned long submitorder;
  97. struct dep_list list;
  98. } *dependencies = NULL;
  99. static void reset(void)
  100. {
  101. submitorder = 0;
  102. priority = INT_MIN;
  103. eosw = -1;
  104. memset(&workers, 0, sizeof(workers));
  105. nworkers = 0;
  106. ndependson = 0;
  107. sched_type = NormalTask;
  108. nparams = 0;
  109. memnode = -1;
  110. workerorder = 0;
  111. }
/* TODO: honor the task submission order given by SubmitOrder */
  113. static void checkField(char * s)
  114. {
  115. /* Record various information */
  116. #define TEST(field) (!strncmp(s, field": ", strlen(field) + 2))
  117. if (TEST("SubmitOrder"))
  118. {
  119. s = s + strlen("SubmitOrder: ");
  120. submitorder = strtol(s, NULL, 10);
  121. }
  122. else if (TEST("Priority"))
  123. {
  124. s = s + strlen("Priority: ");
  125. priority = strtol(s, NULL, 10);
  126. }
  127. else if (TEST("SpecificWorker"))
  128. {
  129. s = s + strlen("SpecificWorker: ");
  130. eosw = strtol(s, NULL, 10);
  131. }
  132. else if (TEST("Workers"))
  133. {
  134. s = s + strlen("Workers: ");
  135. char * delim = " ";
  136. char * token = strtok(s, delim);
  137. int i = 0;
  138. while (token != NULL)
  139. {
  140. int k = strtol(token, NULL, 10);
  141. STARPU_ASSERT_MSG(k < STARPU_NMAXWORKERS, "%d is bigger than maximum %d\n", k, STARPU_NMAXWORKERS);
  142. workers[k/(sizeof(*workers)*8)] |= (1 << (k%(sizeof(*workers)*8)));
  143. i++;
  144. token = strtok(NULL, delim);
  145. }
  146. nworkers = i;
  147. }
  148. else if (TEST("DependsOn"))
  149. {
  150. /* NOTE : dependsons (in the sched.rec) should be the submit orders of the dependencies,
  151. otherwise it can occur an undefined behaviour
  152. (contrary to the tasks.rec where dependencies are jobids */
  153. unsigned i = 0;
  154. char * delim = " ";
  155. char * token = strtok(s+strlen("DependsOn: "), delim);
  156. while (token != NULL)
  157. {
  158. dependson[i] = strtol(token, NULL, 10);
  159. i++;
  160. token = strtok(NULL, delim);
  161. }
  162. ndependson = i;
  163. }
  164. else if (TEST("Prefetch"))
  165. {
  166. s = s + strlen("Prefetch: ");
  167. submitorder = strtol(s, NULL, 10);
  168. sched_type = PrefetchTask;
  169. }
  170. else if (TEST("Parameters"))
  171. {
  172. s = s + strlen("Parameters: ");
  173. char * delim = " ";
  174. char * token = strtok(s, delim);
  175. int i = 0;
  176. while (token != NULL)
  177. {
  178. params[i] = strtol(token, NULL, 10);
  179. i++;
  180. token = strtok(NULL, delim);
  181. }
  182. nparams = i;
  183. }
  184. else if (TEST("MemoryNode"))
  185. {
  186. s = s + strlen("MemoryNode: ");
  187. memnode = strtol(s, NULL, 10);
  188. }
  189. else if (TEST("Workerorder"))
  190. {
  191. s = s + strlen("Workerorder: ");
  192. workerorder = strtol(s, NULL, 10);
  193. }
  194. }
  195. void schedRecInit(const char * filename)
  196. {
  197. FILE * f = fopen(filename, "r");
  198. if(f == NULL)
  199. {
  200. fprintf(stderr,"unable to open file %s: %s\n", filename, strerror(errno));
  201. return;
  202. }
  203. size_t lnsize = 128;
  204. char * s = malloc(sizeof(*s) * lnsize);
  205. int eof = 0;
  206. reset();
  207. while(!eof && !feof(f))
  208. {
  209. char *ln;
  210. /* Get the line */
  211. if (!fgets(s, lnsize, f))
  212. {
  213. eof = 1;
  214. }
  215. while (!(ln = strchr(s, '\n')))
  216. {
  217. _STARPU_REALLOC(s, lnsize * 2);
  218. if (!fgets(s + lnsize-1, lnsize+1, f))
  219. {
  220. eof = 1;
  221. break;
  222. }
  223. lnsize *= 2;
  224. }
  225. if ((ln == s || eof) && submitorder)
  226. {
  227. /* Empty line, doit */
  228. struct task * task;
  229. unsigned i;
  230. _STARPU_MALLOC(task, sizeof(*task));
  231. task->submitorder = submitorder;
  232. task->priority = priority;
  233. task->memnode = memnode;
  234. CPY(dependson, task->dependson, ndependson);
  235. task->ndependson = ndependson;
  236. /* Also record submitorder of tasks that this one will need to depend on */
  237. for (i = 0; i < ndependson; i++)
  238. {
  239. struct dep *dep;
  240. struct starpu_task *starpu_task;
  241. _STARPU_MALLOC(dep, sizeof(*dep));
  242. dep->task = task;
  243. dep->i = i;
  244. struct deps *deps;
  245. HASH_FIND(hh, dependencies, &task->dependson[i], sizeof(submitorder), deps);
  246. if (!deps)
  247. {
  248. /* No task depends on this one yet, add a cell for it */
  249. _STARPU_MALLOC(deps, sizeof(*deps));
  250. dep_list_init(&deps->list);
  251. deps->submitorder = task->dependson[i];
  252. HASH_ADD(hh, dependencies, submitorder, sizeof(submitorder), deps);
  253. }
  254. dep_list_push_back(&deps->list, dep);
  255. /* Create the intermediate task */
  256. starpu_task = dep->task->depends_tasks[i] = starpu_task_create();
  257. starpu_task->cl = NULL;
  258. starpu_task->destroy = 0;
  259. starpu_task->no_submitorder = 1;
  260. }
  261. switch (sched_type)
  262. {
  263. case NormalTask:
  264. /* A new task to mangle, record what needs to be done */
  265. task->eosw = eosw;
  266. task->workerorder = workerorder;
  267. CPY(workers, task->workers, nworkers);
  268. task->nworkers = nworkers;
  269. STARPU_ASSERT(nparams == 0);
  270. debug("adding mangled task %lu\n", submitorder);
  271. HASH_ADD(hh, mangled_tasks, submitorder, sizeof(submitorder), task);
  272. break;
  273. case PrefetchTask:
  274. STARPU_ASSERT(memnode >= 0);
  275. STARPU_ASSERT(eosw == -1);
  276. STARPU_ASSERT(workerorder == 0);
  277. STARPU_ASSERT(nworkers == 0);
  278. CPY(params, task->params, nparams);
  279. task->nparams = nparams;
  280. /* TODO: more params */
  281. STARPU_ASSERT_MSG(nparams == 1, "only supports one parameter at a time");
  282. debug("adding prefetch task for %lu\n", submitorder);
  283. HASH_ADD(hh, prefetch_tasks, submitorder, sizeof(submitorder), task);
  284. break;
  285. default:
  286. STARPU_ASSERT(0);
  287. break;
  288. }
  289. reset();
  290. }
  291. else checkField(s);
  292. }
  293. fclose(f);
  294. }
  295. static void do_prefetch(void *arg)
  296. {
  297. unsigned node = (uintptr_t) arg;
  298. starpu_data_idle_prefetch_on_node(starpu_task_get_current()->handles[0], node, 1);
  299. }
  300. void applySchedRec(struct starpu_task *starpu_task, unsigned long submit_order)
  301. {
  302. struct task *task;
  303. struct deps *deps;
  304. int ret;
  305. HASH_FIND(hh, dependencies, &submit_order, sizeof(submit_order), deps);
  306. if (deps)
  307. {
  308. struct dep *dep;
  309. for (dep = dep_list_begin(&deps->list);
  310. dep != dep_list_end(&deps->list);
  311. dep = dep_list_next(dep))
  312. {
  313. debug("task %lu is %d-th dep for %lu\n", submit_order, dep->i, dep->task->submitorder);
  314. /* Some task will depend on this one, make the dependency */
  315. starpu_task_declare_deps_array(dep->task->depends_tasks[dep->i], 1, &starpu_task);
  316. ret = starpu_task_submit(dep->task->depends_tasks[dep->i]);
  317. STARPU_ASSERT(ret == 0);
  318. }
  319. }
  320. HASH_FIND(hh, prefetch_tasks, &submit_order, sizeof(submit_order), task);
  321. if (task)
  322. {
  323. /* We want to submit a prefetch for this task */
  324. debug("task %lu has a prefetch for parameter %d to node %d\n", submit_order, task->params[0], task->memnode);
  325. struct starpu_task *pref_task;
  326. pref_task = task->pref_task = starpu_task_create();
  327. pref_task->cl = &cl_prefetch;
  328. pref_task->destroy = 1;
  329. pref_task->no_submitorder = 1;
  330. pref_task->callback_arg = (void*)(uintptr_t) task->memnode;
  331. pref_task->callback_func = do_prefetch;
  332. /* TODO: more params */
  333. pref_task->handles[0] = starpu_task->handles[task->params[0]];
  334. /* Make it depend on intermediate tasks */
  335. if (task->ndependson)
  336. {
  337. debug("%u dependencies\n", task->ndependson);
  338. starpu_task_declare_deps_array(pref_task, task->ndependson, task->depends_tasks);
  339. }
  340. ret = starpu_task_submit(pref_task);
  341. STARPU_ASSERT(ret == 0);
  342. }
  343. HASH_FIND(hh, mangled_tasks, &submit_order, sizeof(submit_order), task);
  344. if (task == NULL)
  345. /* Nothing to do for this */
  346. return;
  347. debug("mangling task %lu\n", submit_order);
  348. if (task->eosw >= 0)
  349. {
  350. debug("execute on a specific worker %d\n", task->eosw);
  351. starpu_task->workerid = task->eosw;
  352. starpu_task->execute_on_a_specific_worker = 1;
  353. }
  354. if (task->workerorder > 0)
  355. {
  356. debug("workerorder %d\n", task->workerorder);
  357. starpu_task->workerorder = task->workerorder;
  358. }
  359. if (task->priority != INT_MIN)
  360. {
  361. debug("priority %d\n", task->priority);
  362. starpu_task->priority = task->priority;
  363. }
  364. if (task->nworkers)
  365. {
  366. debug("%u workers %x\n", task->nworkers, task->workers[0]);
  367. starpu_task->workerids_len = sizeof(task->workers) / sizeof(task->workers[0]);
  368. _STARPU_MALLOC(starpu_task->workerids, task->nworkers * sizeof(*starpu_task->workerids));
  369. CPY(task->workers, starpu_task->workerids, task->nworkers);
  370. }
  371. if (task->ndependson)
  372. {
  373. debug("%u dependencies\n", task->ndependson);
  374. starpu_task_declare_deps_array(starpu_task, task->ndependson, task->depends_tasks);
  375. }
  376. /* And now, let it go! */
  377. }