memory_manager.c 5.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222
  1. /* StarPU --- Runtime system for heterogeneous multicore architectures.
  2. *
  3. * Copyright (C) 2012-2013, 2015, 2016, 2017 CNRS
  4. *
  5. * StarPU is free software; you can redistribute it and/or modify
  6. * it under the terms of the GNU Lesser General Public License as published by
  7. * the Free Software Foundation; either version 2.1 of the License, or (at
  8. * your option) any later version.
  9. *
  10. * StarPU is distributed in the hope that it will be useful, but
  11. * WITHOUT ANY WARRANTY; without even the implied warranty of
  12. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
  13. *
  14. * See the GNU Lesser General Public License in COPYING.LGPL for more details.
  15. */
  16. #include <starpu.h>
  17. #include <common/utils.h>
  18. #include <common/thread.h>
  19. #include <common/fxt.h>
  20. #include <datawizard/memory_manager.h>
  21. #include <core/workers.h>
  22. #include <starpu_stdlib.h>
  23. static size_t global_size[STARPU_MAXNODES];
  24. static size_t used_size[STARPU_MAXNODES];
  25. /* This is used as an optimization to avoid to wake up allocating threads for
  26. * each and every deallocation, only to find that there is still not enough
  27. * room. */
  28. /* Minimum amount being waited for */
  29. static size_t waiting_size[STARPU_MAXNODES];
  30. static starpu_pthread_mutex_t lock_nodes[STARPU_MAXNODES];
  31. static starpu_pthread_cond_t cond_nodes[STARPU_MAXNODES];
  32. int _starpu_memory_manager_init()
  33. {
  34. int i;
  35. for(i=0 ; i<STARPU_MAXNODES ; i++)
  36. {
  37. global_size[i] = 0;
  38. used_size[i] = 0;
  39. /* This is accessed for statistics outside the lock, don't care
  40. * about that */
  41. STARPU_HG_DISABLE_CHECKING(used_size[i]);
  42. waiting_size[i] = 0;
  43. STARPU_PTHREAD_MUTEX_INIT(&lock_nodes[i], NULL);
  44. STARPU_PTHREAD_COND_INIT(&cond_nodes[i], NULL);
  45. }
  46. return 0;
  47. }
  48. void _starpu_memory_manager_set_global_memory_size(unsigned node, size_t size)
  49. {
  50. STARPU_PTHREAD_MUTEX_LOCK(&lock_nodes[node]);
  51. if (!global_size[node])
  52. {
  53. global_size[node] = size;
  54. _STARPU_DEBUG("Global size for node %u is %ld\n", node, (long)global_size[node]);
  55. }
  56. else
  57. {
  58. STARPU_ASSERT(global_size[node] == size);
  59. }
  60. STARPU_PTHREAD_MUTEX_UNLOCK(&lock_nodes[node]);
  61. }
  62. size_t _starpu_memory_manager_get_global_memory_size(unsigned node)
  63. {
  64. return global_size[node];
  65. }
  66. int starpu_memory_allocate(unsigned node, size_t size, int flags)
  67. {
  68. int ret;
  69. STARPU_PTHREAD_MUTEX_LOCK(&lock_nodes[node]);
  70. if (flags & STARPU_MEMORY_WAIT)
  71. {
  72. struct _starpu_worker *worker = _starpu_get_local_worker_key();
  73. enum _starpu_worker_status old_status = STATUS_UNKNOWN;
  74. if (worker)
  75. {
  76. old_status = worker->status;
  77. _starpu_set_worker_status(worker, STATUS_WAITING);
  78. }
  79. while (used_size[node] + size > global_size[node])
  80. {
  81. /* Tell deallocators we need this amount */
  82. if (!waiting_size[node] || size < waiting_size[node])
  83. waiting_size[node] = size;
  84. /* Wait for it */
  85. STARPU_PTHREAD_COND_WAIT(&cond_nodes[node], &lock_nodes[node]);
  86. }
  87. if (worker)
  88. {
  89. _starpu_set_worker_status(worker, old_status);
  90. }
  91. /* And take it */
  92. used_size[node] += size;
  93. _STARPU_TRACE_USED_MEM(node, used_size[node]);
  94. ret = 0;
  95. }
  96. else if (flags & STARPU_MEMORY_OVERFLOW
  97. || global_size[node] == 0
  98. || used_size[node] + size <= global_size[node])
  99. {
  100. used_size[node] += size;
  101. _STARPU_TRACE_USED_MEM(node, used_size[node]);
  102. ret = 0;
  103. }
  104. else
  105. {
  106. ret = -ENOMEM;
  107. }
  108. STARPU_PTHREAD_MUTEX_UNLOCK(&lock_nodes[node]);
  109. return ret;
  110. }
  111. void starpu_memory_deallocate(unsigned node, size_t size)
  112. {
  113. STARPU_PTHREAD_MUTEX_LOCK(&lock_nodes[node]);
  114. used_size[node] -= size;
  115. _STARPU_TRACE_USED_MEM(node, used_size[node]);
  116. /* If there's now room for waiters, wake them */
  117. if (waiting_size[node] &&
  118. global_size[node] - used_size[node] >= waiting_size[node])
  119. {
  120. /* And have those not happy enough tell us the size again */
  121. waiting_size[node] = 0;
  122. STARPU_PTHREAD_COND_BROADCAST(&cond_nodes[node]);
  123. }
  124. STARPU_PTHREAD_MUTEX_UNLOCK(&lock_nodes[node]);
  125. }
  126. starpu_ssize_t starpu_memory_get_total(unsigned node)
  127. {
  128. if (global_size[node] == 0)
  129. return -1;
  130. else
  131. return global_size[node];
  132. }
  133. starpu_ssize_t starpu_memory_get_total_all_nodes()
  134. {
  135. unsigned memnodes, i;
  136. memnodes = starpu_memory_nodes_get_count();
  137. starpu_ssize_t total = 0;
  138. for(i=0 ; i<memnodes ; i++)
  139. {
  140. starpu_ssize_t node = starpu_memory_get_total(i);
  141. if (node != -1)
  142. total += node;
  143. }
  144. return total;
  145. }
  146. starpu_ssize_t starpu_memory_get_available(unsigned node)
  147. {
  148. starpu_ssize_t ret;
  149. if (global_size[node] == 0)
  150. return -1;
  151. ret = global_size[node] - used_size[node];
  152. return ret;
  153. }
  154. starpu_ssize_t starpu_memory_get_available_all_nodes()
  155. {
  156. unsigned memnodes, i;
  157. memnodes = starpu_memory_nodes_get_count();
  158. starpu_ssize_t avail = 0;
  159. for(i=0 ; i<memnodes ; i++)
  160. {
  161. starpu_ssize_t node = starpu_memory_get_available(i);
  162. if (node != -1)
  163. avail += node;
  164. }
  165. return avail;
  166. }
  167. void starpu_memory_wait_available(unsigned node, size_t size)
  168. {
  169. STARPU_PTHREAD_MUTEX_LOCK(&lock_nodes[node]);
  170. while (used_size[node] + size > global_size[node])
  171. {
  172. /* Tell deallocators we need this amount */
  173. if (!waiting_size[node] || size < waiting_size[node])
  174. waiting_size[node] = size;
  175. /* Wait for it */
  176. STARPU_PTHREAD_COND_WAIT(&cond_nodes[node], &lock_nodes[node]);
  177. }
  178. STARPU_PTHREAD_MUTEX_UNLOCK(&lock_nodes[node]);
  179. }
  180. int _starpu_memory_manager_test_allocate_size(unsigned node, size_t size)
  181. {
  182. int ret;
  183. STARPU_PTHREAD_MUTEX_LOCK(&lock_nodes[node]);
  184. if (global_size[node] == 0)
  185. ret = 1;
  186. else if (used_size[node] + size <= global_size[node])
  187. ret = 1;
  188. else
  189. ret = 0;
  190. STARPU_PTHREAD_MUTEX_UNLOCK(&lock_nodes[node]);
  191. return ret;
  192. }