memory_nodes.c 5.6 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198
  1. /* StarPU --- Runtime system for heterogeneous multicore architectures.
  2. *
  3. * Copyright (C) 2009-2017 Université de Bordeaux
  4. * Copyright (C) 2010, 2011, 2012, 2013, 2014, 2015 CNRS
  5. * Copyright (C) 2017 Inria
  6. *
  7. * StarPU is free software; you can redistribute it and/or modify
  8. * it under the terms of the GNU Lesser General Public License as published by
  9. * the Free Software Foundation; either version 2.1 of the License, or (at
  10. * your option) any later version.
  11. *
  12. * StarPU is distributed in the hope that it will be useful, but
  13. * WITHOUT ANY WARRANTY; without even the implied warranty of
  14. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
  15. *
  16. * See the GNU Lesser General Public License in COPYING.LGPL for more details.
  17. */
  18. #include <common/config.h>
  19. #include <core/sched_policy.h>
  20. #include <datawizard/datastats.h>
  21. #include <datawizard/memory_manager.h>
  22. #include <datawizard/memory_nodes.h>
  23. #include <datawizard/malloc.h>
  24. #include <common/fxt.h>
  25. #include "copy_driver.h"
  26. #include "memalloc.h"
  27. char _starpu_worker_drives_memory[STARPU_NMAXWORKERS][STARPU_MAXNODES];
  28. struct _starpu_memory_node_descr _starpu_descr;
  29. void _starpu_memory_nodes_init(void)
  30. {
  31. /* there is no node yet, subsequent nodes will be
  32. * added using _starpu_memory_node_register */
  33. _starpu_descr.nnodes = 0;
  34. unsigned i;
  35. for (i = 0; i < STARPU_MAXNODES; i++)
  36. {
  37. _starpu_descr.nodes[i] = STARPU_UNUSED;
  38. _starpu_descr.nworkers[i] = 0;
  39. }
  40. _starpu_init_mem_chunk_lists();
  41. _starpu_init_data_request_lists();
  42. _starpu_memory_manager_init();
  43. STARPU_PTHREAD_RWLOCK_INIT(&_starpu_descr.conditions_rwlock, NULL);
  44. _starpu_descr.total_condition_count = 0;
  45. }
  46. void _starpu_memory_nodes_deinit(void)
  47. {
  48. _starpu_deinit_data_request_lists();
  49. _starpu_deinit_mem_chunk_lists();
  50. STARPU_PTHREAD_RWLOCK_DESTROY(&_starpu_descr.conditions_rwlock);
  51. }
  52. #undef starpu_node_get_kind
  53. enum starpu_node_kind starpu_node_get_kind(unsigned node)
  54. {
  55. return _starpu_node_get_kind(node);
  56. }
  /* Drop any macro of the same name so that a real function is defined
   * below (presumably a header provides a macro shortcut -- confirm). */
  #undef starpu_memory_nodes_get_count
  /*
   * Return the number of memory nodes, as reported by
   * _starpu_memory_nodes_get_count().
   */
  unsigned starpu_memory_nodes_get_count(void)
  {
      unsigned count = _starpu_memory_nodes_get_count();

      return count;
  }
  62. void _starpu_memory_node_get_name(unsigned node, char *name, int size)
  63. {
  64. const char *prefix;
  65. switch (_starpu_descr.nodes[node])
  66. {
  67. case STARPU_CPU_RAM:
  68. prefix = "NUMA";
  69. break;
  70. case STARPU_CUDA_RAM:
  71. prefix = "CUDA";
  72. break;
  73. case STARPU_OPENCL_RAM:
  74. prefix = "OpenCL";
  75. break;
  76. case STARPU_DISK_RAM:
  77. prefix = "Disk";
  78. break;
  79. case STARPU_MIC_RAM:
  80. prefix = "MIC";
  81. break;
  82. case STARPU_MPI_MS_RAM:
  83. prefix = "MPI_MS";
  84. break;
  85. case STARPU_SCC_RAM:
  86. prefix = "SCC_RAM";
  87. break;
  88. case STARPU_SCC_SHM:
  89. prefix = "SCC_shared";
  90. break;
  91. case STARPU_UNUSED:
  92. default:
  93. prefix = "unknown";
  94. STARPU_ASSERT(0);
  95. }
  96. snprintf(name, size, "%s %u", prefix, _starpu_descr.devid[node]);
  97. }
  98. unsigned _starpu_memory_node_register(enum starpu_node_kind kind, int devid)
  99. {
  100. unsigned node;
  101. /* ATOMIC_ADD returns the new value ... */
  102. node = STARPU_ATOMIC_ADD(&_starpu_descr.nnodes, 1) - 1;
  103. STARPU_ASSERT_MSG(node < STARPU_MAXNODES,"Too many nodes (%u) for maximum %u. Use configure option --enable-maxnodes=xxx to update the maximum number of nodes.", node, STARPU_MAXNODES);
  104. _starpu_descr.nodes[node] = kind;
  105. _STARPU_TRACE_NEW_MEM_NODE(node);
  106. _starpu_descr.devid[node] = devid;
  107. /* for now, there is no condition associated to that newly created node */
  108. _starpu_descr.condition_count[node] = 0;
  109. _starpu_malloc_init(node);
  110. return node;
  111. }
  112. /* TODO move in a more appropriate file !! */
  113. /* Register a condition variable associated to worker which is associated to a
  114. * memory node itself. */
  115. void _starpu_memory_node_register_condition(starpu_pthread_cond_t *cond, starpu_pthread_mutex_t *mutex, unsigned nodeid)
  116. {
  117. unsigned cond_id;
  118. unsigned nconds_total, nconds;
  119. STARPU_PTHREAD_RWLOCK_WRLOCK(&_starpu_descr.conditions_rwlock);
  120. /* we only insert the queue if it's not already in the list */
  121. nconds = _starpu_descr.condition_count[nodeid];
  122. for (cond_id = 0; cond_id < nconds; cond_id++)
  123. {
  124. if (_starpu_descr.conditions_attached_to_node[nodeid][cond_id].cond == cond)
  125. {
  126. STARPU_ASSERT(_starpu_descr.conditions_attached_to_node[nodeid][cond_id].mutex == mutex);
  127. /* the condition is already in the list */
  128. STARPU_PTHREAD_RWLOCK_UNLOCK(&_starpu_descr.conditions_rwlock);
  129. return;
  130. }
  131. }
  132. /* it was not found locally */
  133. _starpu_descr.conditions_attached_to_node[nodeid][cond_id].cond = cond;
  134. _starpu_descr.conditions_attached_to_node[nodeid][cond_id].mutex = mutex;
  135. _starpu_descr.condition_count[nodeid]++;
  136. /* do we have to add it in the global list as well ? */
  137. nconds_total = _starpu_descr.total_condition_count;
  138. for (cond_id = 0; cond_id < nconds_total; cond_id++)
  139. {
  140. if (_starpu_descr.conditions_all[cond_id].cond == cond)
  141. {
  142. /* the queue is already in the global list */
  143. STARPU_PTHREAD_RWLOCK_UNLOCK(&_starpu_descr.conditions_rwlock);
  144. return;
  145. }
  146. }
  147. /* it was not in the global list either */
  148. _starpu_descr.conditions_all[nconds_total].cond = cond;
  149. _starpu_descr.conditions_all[nconds_total].mutex = mutex;
  150. _starpu_descr.total_condition_count++;
  151. STARPU_PTHREAD_RWLOCK_UNLOCK(&_starpu_descr.conditions_rwlock);
  152. }
  /* Drop any macro of the same name so that a real function is defined
   * below (presumably a header provides a macro shortcut -- confirm). */
  #undef starpu_worker_get_memory_node
  /*
   * Return the memory node of worker `workerid`, as reported by
   * _starpu_worker_get_memory_node().
   */
  unsigned starpu_worker_get_memory_node(unsigned workerid)
  {
      unsigned memnode = _starpu_worker_get_memory_node(workerid);

      return memnode;
  }
  158. /* same utility as _starpu_memory_node_add_nworkers */
  159. void _starpu_worker_drives_memory_node(struct _starpu_worker *worker, unsigned memnode)
  160. {
  161. if (! _starpu_worker_drives_memory[worker->workerid][memnode])
  162. {
  163. _starpu_worker_drives_memory[worker->workerid][memnode] = 1;
  164. #ifdef STARPU_SIMGRID
  165. starpu_pthread_queue_register(&worker->wait, &_starpu_simgrid_transfer_queue[memnode]);
  166. #endif
  167. }
  168. }