memory_nodes.c 5.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199
  1. /* StarPU --- Runtime system for heterogeneous multicore architectures.
  2. *
  3. * Copyright (C) 2009-2017,2019 Université de Bordeaux
  4. * Copyright (C) 2011-2013,2016,2017 Inria
  5. * Copyright (C) 2010-2015,2017,2018 CNRS
  6. *
  7. * StarPU is free software; you can redistribute it and/or modify
  8. * it under the terms of the GNU Lesser General Public License as published by
  9. * the Free Software Foundation; either version 2.1 of the License, or (at
  10. * your option) any later version.
  11. *
  12. * StarPU is distributed in the hope that it will be useful, but
  13. * WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
  15. *
  16. * See the GNU Lesser General Public License in COPYING.LGPL for more details.
  17. */
  18. #include <common/config.h>
  19. #include <core/sched_policy.h>
  20. #include <datawizard/datastats.h>
  21. #include <datawizard/memory_manager.h>
  22. #include <datawizard/memory_nodes.h>
  23. #include <datawizard/malloc.h>
  24. #include <common/fxt.h>
  25. #include "copy_driver.h"
  26. #include "memalloc.h"
  /* Per-worker, per-memory-node flags, indexed as [workerid][memnode].
   * An entry is set to 1 by _starpu_worker_drives_memory_node() the first
   * time the worker is declared as driving that node. Race-detector
   * checking is explicitly disabled on this array in
   * _starpu_memory_nodes_init(). */
  27. char _starpu_worker_drives_memory[STARPU_NMAXWORKERS][STARPU_MAXNODES];
  /* Global description of the registered memory nodes. In this file it
   * holds the node count, each node's kind and device id, the per-node
   * and global lists of registered condition variables, and the rwlock
   * protecting those lists. */
  28. struct _starpu_memory_node_descr _starpu_descr;
  29. void _starpu_memory_nodes_init(void)
  30. {
  31. /* there is no node yet, subsequent nodes will be
  32. * added using _starpu_memory_node_register */
  33. _starpu_descr.nnodes = 0;
  34. unsigned i;
  35. for (i = 0; i < STARPU_MAXNODES; i++)
  36. {
  37. _starpu_descr.nodes[i] = STARPU_UNUSED;
  38. _starpu_descr.nworkers[i] = 0;
  39. }
  40. STARPU_HG_DISABLE_CHECKING(_starpu_worker_drives_memory);
  41. _starpu_init_mem_chunk_lists();
  42. _starpu_init_data_request_lists();
  43. _starpu_memory_manager_init();
  44. STARPU_PTHREAD_RWLOCK_INIT(&_starpu_descr.conditions_rwlock, NULL);
  45. _starpu_descr.total_condition_count = 0;
  46. }
  47. void _starpu_memory_nodes_deinit(void)
  48. {
  49. _starpu_deinit_data_request_lists();
  50. _starpu_deinit_mem_chunk_lists();
  51. STARPU_PTHREAD_RWLOCK_DESTROY(&_starpu_descr.conditions_rwlock);
  52. }
  53. #undef starpu_node_get_kind
  54. enum starpu_node_kind starpu_node_get_kind(unsigned node)
  55. {
  56. return _starpu_node_get_kind(node);
  57. }
  /* Drop any macro of the same name (presumably provided by a header) so
   * that a real, linkable function can be defined here. */
  #undef starpu_memory_nodes_get_count
  /* Return the number of memory nodes, as reported by
   * _starpu_memory_nodes_get_count(). */
  unsigned starpu_memory_nodes_get_count(void)
  {
      const unsigned count = _starpu_memory_nodes_get_count();

      return count;
  }
  63. int starpu_memory_node_get_name(unsigned node, char *name, size_t size)
  64. {
  65. const char *prefix;
  66. switch (_starpu_descr.nodes[node])
  67. {
  68. case STARPU_CPU_RAM:
  69. prefix = "NUMA";
  70. break;
  71. case STARPU_CUDA_RAM:
  72. prefix = "CUDA";
  73. break;
  74. case STARPU_OPENCL_RAM:
  75. prefix = "OpenCL";
  76. break;
  77. case STARPU_DISK_RAM:
  78. prefix = "Disk";
  79. break;
  80. case STARPU_MIC_RAM:
  81. prefix = "MIC";
  82. break;
  83. case STARPU_MPI_MS_RAM:
  84. prefix = "MPI_MS";
  85. break;
  86. case STARPU_SCC_RAM:
  87. prefix = "SCC_RAM";
  88. break;
  89. case STARPU_SCC_SHM:
  90. prefix = "SCC_shared";
  91. break;
  92. case STARPU_UNUSED:
  93. default:
  94. prefix = "unknown";
  95. STARPU_ASSERT(0);
  96. }
  97. return snprintf(name, size, "%s %d", prefix, _starpu_descr.devid[node]);
  98. }
  99. unsigned _starpu_memory_node_register(enum starpu_node_kind kind, int devid)
  100. {
  101. unsigned node;
  102. /* ATOMIC_ADD returns the new value ... */
  103. node = STARPU_ATOMIC_ADD(&_starpu_descr.nnodes, 1) - 1;
  104. STARPU_ASSERT_MSG(node < STARPU_MAXNODES,"Too many nodes (%u) for maximum %d. Use configure option --enable-maxnodes=xxx to update the maximum number of nodes.", node, STARPU_MAXNODES);
  105. _starpu_descr.nodes[node] = kind;
  106. _STARPU_TRACE_NEW_MEM_NODE(node);
  107. _starpu_descr.devid[node] = devid;
  108. /* for now, there is no condition associated to that newly created node */
  109. _starpu_descr.condition_count[node] = 0;
  110. _starpu_malloc_init(node);
  111. return node;
  112. }
  113. /* TODO move in a more appropriate file !! */
  114. /* Register a condition variable associated to worker which is associated to a
  115. * memory node itself. */
  116. void _starpu_memory_node_register_condition(struct _starpu_worker *worker, starpu_pthread_cond_t *cond, unsigned nodeid)
  117. {
  118. unsigned cond_id;
  119. unsigned nconds_total, nconds;
  120. STARPU_PTHREAD_RWLOCK_WRLOCK(&_starpu_descr.conditions_rwlock);
  121. /* we only insert the queue if it's not already in the list */
  122. nconds = _starpu_descr.condition_count[nodeid];
  123. for (cond_id = 0; cond_id < nconds; cond_id++)
  124. {
  125. if (_starpu_descr.conditions_attached_to_node[nodeid][cond_id].cond == cond)
  126. {
  127. STARPU_ASSERT(_starpu_descr.conditions_attached_to_node[nodeid][cond_id].worker == worker);
  128. /* the condition is already in the list */
  129. STARPU_PTHREAD_RWLOCK_UNLOCK(&_starpu_descr.conditions_rwlock);
  130. return;
  131. }
  132. }
  133. /* it was not found locally */
  134. _starpu_descr.conditions_attached_to_node[nodeid][cond_id].cond = cond;
  135. _starpu_descr.conditions_attached_to_node[nodeid][cond_id].worker = worker;
  136. _starpu_descr.condition_count[nodeid]++;
  137. /* do we have to add it in the global list as well ? */
  138. nconds_total = _starpu_descr.total_condition_count;
  139. for (cond_id = 0; cond_id < nconds_total; cond_id++)
  140. {
  141. if (_starpu_descr.conditions_all[cond_id].cond == cond)
  142. {
  143. /* the queue is already in the global list */
  144. STARPU_PTHREAD_RWLOCK_UNLOCK(&_starpu_descr.conditions_rwlock);
  145. return;
  146. }
  147. }
  148. /* it was not in the global list either */
  149. _starpu_descr.conditions_all[nconds_total].cond = cond;
  150. _starpu_descr.conditions_all[nconds_total].worker = worker;
  151. _starpu_descr.total_condition_count++;
  152. STARPU_PTHREAD_RWLOCK_UNLOCK(&_starpu_descr.conditions_rwlock);
  153. }
  /* Drop any macro of the same name (presumably provided by a header) so
   * that a real, linkable function can be defined here. */
  #undef starpu_worker_get_memory_node
  /* Return the memory node associated with worker `workerid`, as reported
   * by _starpu_worker_get_memory_node(). */
  unsigned starpu_worker_get_memory_node(unsigned workerid)
  {
      const unsigned memnode = _starpu_worker_get_memory_node(workerid);

      return memnode;
  }
  159. /* same utility as _starpu_memory_node_add_nworkers */
  160. void _starpu_worker_drives_memory_node(struct _starpu_worker *worker, unsigned memnode)
  161. {
  162. if (! _starpu_worker_drives_memory[worker->workerid][memnode])
  163. {
  164. _starpu_worker_drives_memory[worker->workerid][memnode] = 1;
  165. #ifdef STARPU_SIMGRID
  166. starpu_pthread_queue_register(&worker->wait, &_starpu_simgrid_transfer_queue[memnode]);
  167. #endif
  168. }
  169. }