|
@@ -18,6 +18,7 @@
|
|
|
|
|
|
#include <starpu.h>
|
|
|
#include <common/uthash.h>
|
|
|
+#include <datawizard/coherency.h>
|
|
|
|
|
|
#include <starpu_mpi_cache.h>
|
|
|
#include <starpu_mpi_cache_stats.h>
|
|
@@ -27,16 +28,14 @@
|
|
|
struct _starpu_data_entry
|
|
|
{
|
|
|
UT_hash_handle hh;
|
|
|
- starpu_data_handle_t data;
|
|
|
+ starpu_data_handle_t data_handle;
|
|
|
};
|
|
|
|
|
|
-static starpu_pthread_mutex_t *_cache_sent_mutex;
|
|
|
-static starpu_pthread_mutex_t *_cache_received_mutex;
|
|
|
-static struct _starpu_data_entry **_cache_sent_data = NULL;
|
|
|
-static struct _starpu_data_entry **_cache_received_data = NULL;
|
|
|
+static starpu_pthread_mutex_t _cache_mutex;
|
|
|
+static struct _starpu_data_entry *_cache_data = NULL;
|
|
|
int _starpu_cache_enabled=1;
|
|
|
-MPI_Comm _starpu_cache_comm;
|
|
|
-int _starpu_cache_comm_size;
|
|
|
+static MPI_Comm _starpu_cache_comm;
|
|
|
+static int _starpu_cache_comm_size;
|
|
|
|
|
|
int starpu_mpi_cache_is_enabled()
|
|
|
{
|
|
@@ -55,7 +54,7 @@ int starpu_mpi_cache_set(int enabled)
|
|
|
{
|
|
|
|
|
|
starpu_mpi_cache_flush_all_data(_starpu_cache_comm);
|
|
|
- _starpu_mpi_cache_shutdown(_starpu_cache_comm_size);
|
|
|
+ _starpu_mpi_cache_shutdown();
|
|
|
}
|
|
|
_starpu_cache_enabled = 0;
|
|
|
}
|
|
@@ -64,8 +63,6 @@ int starpu_mpi_cache_set(int enabled)
|
|
|
|
|
|
void _starpu_mpi_cache_init(MPI_Comm comm)
|
|
|
{
|
|
|
- int i;
|
|
|
-
|
|
|
_starpu_cache_enabled = starpu_get_env_number("STARPU_MPI_CACHE");
|
|
|
if (_starpu_cache_enabled == -1)
|
|
|
{
|
|
@@ -80,295 +77,301 @@ void _starpu_mpi_cache_init(MPI_Comm comm)
|
|
|
|
|
|
_starpu_cache_comm = comm;
|
|
|
starpu_mpi_comm_size(comm, &_starpu_cache_comm_size);
|
|
|
- _STARPU_MPI_DEBUG(2, "Initialising htable for cache\n");
|
|
|
+ _starpu_mpi_cache_stats_init(comm);
|
|
|
+ STARPU_PTHREAD_MUTEX_INIT(&_cache_mutex, NULL);
|
|
|
+}
|
|
|
|
|
|
- _STARPU_MPI_MALLOC(_cache_sent_data, _starpu_cache_comm_size * sizeof(struct _starpu_data_entry *));
|
|
|
- _STARPU_MPI_MALLOC(_cache_received_data, _starpu_cache_comm_size * sizeof(struct _starpu_data_entry *));
|
|
|
- _STARPU_MPI_MALLOC(_cache_sent_mutex, _starpu_cache_comm_size * sizeof(starpu_pthread_mutex_t));
|
|
|
- _STARPU_MPI_MALLOC(_cache_received_mutex, _starpu_cache_comm_size * sizeof(starpu_pthread_mutex_t));
|
|
|
+void _starpu_mpi_cache_shutdown()
|
|
|
+{
|
|
|
+ if (_starpu_cache_enabled == 0) return;
|
|
|
|
|
|
- for(i=0 ; i<_starpu_cache_comm_size ; i++)
|
|
|
+ struct _starpu_data_entry *entry, *tmp;
|
|
|
+
|
|
|
+ STARPU_PTHREAD_MUTEX_LOCK(&_cache_mutex);
|
|
|
+ HASH_ITER(hh, _cache_data, entry, tmp)
|
|
|
{
|
|
|
- _cache_sent_data[i] = NULL;
|
|
|
- _cache_received_data[i] = NULL;
|
|
|
- STARPU_PTHREAD_MUTEX_INIT(&_cache_sent_mutex[i], NULL);
|
|
|
- STARPU_PTHREAD_MUTEX_INIT(&_cache_received_mutex[i], NULL);
|
|
|
+ HASH_DEL(_cache_data, entry);
|
|
|
+ free(entry);
|
|
|
}
|
|
|
- _starpu_mpi_cache_stats_init(comm);
|
|
|
+ STARPU_PTHREAD_MUTEX_UNLOCK(&_cache_mutex);
|
|
|
+ STARPU_PTHREAD_MUTEX_DESTROY(&_cache_mutex);
|
|
|
+ free(_cache_data);
|
|
|
+ _starpu_mpi_cache_stats_shutdown();
|
|
|
}
|
|
|
|
|
|
-static
|
|
|
-void _starpu_mpi_cache_empty_tables(int world_size)
|
|
|
+void _starpu_mpi_cache_data_clear(starpu_data_handle_t data_handle)
|
|
|
{
|
|
|
int i;
|
|
|
+ struct _starpu_mpi_data *mpi_data = data_handle->mpi_data;
|
|
|
|
|
|
- if (_starpu_cache_enabled == 0) return;
|
|
|
-
|
|
|
- _STARPU_MPI_DEBUG(2, "Clearing htable for cache\n");
|
|
|
+ if (_starpu_cache_enabled == 0) return 0;
|
|
|
|
|
|
- for(i=0 ; i<world_size ; i++)
|
|
|
+ _starpu_mpi_cache_flush(data_handle);
|
|
|
+ for(i=0 ; i<_starpu_cache_comm_size ; i++)
|
|
|
{
|
|
|
- struct _starpu_data_entry *entry, *tmp;
|
|
|
-
|
|
|
- STARPU_PTHREAD_MUTEX_LOCK(&_cache_sent_mutex[i]);
|
|
|
- HASH_ITER(hh, _cache_sent_data[i], entry, tmp)
|
|
|
- {
|
|
|
- HASH_DEL(_cache_sent_data[i], entry);
|
|
|
- free(entry);
|
|
|
- }
|
|
|
- STARPU_PTHREAD_MUTEX_UNLOCK(&_cache_sent_mutex[i]);
|
|
|
-
|
|
|
- STARPU_PTHREAD_MUTEX_LOCK(&_cache_received_mutex[i]);
|
|
|
- HASH_ITER(hh, _cache_received_data[i], entry, tmp)
|
|
|
- {
|
|
|
- HASH_DEL(_cache_received_data[i], entry);
|
|
|
- _starpu_mpi_cache_stats_dec(i, entry->data);
|
|
|
- free(entry);
|
|
|
- }
|
|
|
- STARPU_PTHREAD_MUTEX_UNLOCK(&_cache_received_mutex[i]);
|
|
|
+ STARPU_PTHREAD_MUTEX_DESTROY(&mpi_data->cache_sent_mutex[i]);
|
|
|
}
|
|
|
+ free(mpi_data->cache_sent);
|
|
|
+ free(mpi_data->cache_sent_mutex);
|
|
|
}
|
|
|
|
|
|
-void _starpu_mpi_cache_shutdown()
|
|
|
+void _starpu_mpi_cache_data_init(starpu_data_handle_t data_handle)
|
|
|
{
|
|
|
int i;
|
|
|
+ struct _starpu_mpi_data *mpi_data = data_handle->mpi_data;
|
|
|
|
|
|
- if (_starpu_cache_enabled == 0) return;
|
|
|
-
|
|
|
- _starpu_mpi_cache_empty_tables(_starpu_cache_comm_size);
|
|
|
- free(_cache_sent_data);
|
|
|
- free(_cache_received_data);
|
|
|
+ if (_starpu_cache_enabled == 0) return 0;
|
|
|
|
|
|
+ STARPU_PTHREAD_MUTEX_INIT(&mpi_data->cache_received_mutex, NULL);
|
|
|
+ mpi_data->cache_received = 0;
|
|
|
+ _STARPU_MALLOC(mpi_data->cache_sent_mutex, _starpu_cache_comm_size*sizeof(mpi_data->cache_sent_mutex[0]));
|
|
|
+ _STARPU_MALLOC(mpi_data->cache_sent, _starpu_cache_comm_size*sizeof(mpi_data->cache_sent[0]));
|
|
|
for(i=0 ; i<_starpu_cache_comm_size ; i++)
|
|
|
{
|
|
|
- STARPU_PTHREAD_MUTEX_DESTROY(&_cache_sent_mutex[i]);
|
|
|
- STARPU_PTHREAD_MUTEX_DESTROY(&_cache_received_mutex[i]);
|
|
|
+ STARPU_PTHREAD_MUTEX_INIT(&mpi_data->cache_sent_mutex[i], NULL);
|
|
|
+ mpi_data->cache_sent[i] = 0;
|
|
|
}
|
|
|
- free(_cache_sent_mutex);
|
|
|
- free(_cache_received_mutex);
|
|
|
-
|
|
|
- _starpu_mpi_cache_stats_shutdown();
|
|
|
}
|
|
|
|
|
|
-void _starpu_mpi_cache_sent_data_clear(MPI_Comm comm, starpu_data_handle_t data)
|
|
|
+static void _starpu_mpi_cache_data_add(starpu_data_handle_t data_handle)
|
|
|
{
|
|
|
- int n, size;
|
|
|
- starpu_mpi_comm_size(comm, &size);
|
|
|
+ struct _starpu_data_entry *entry;
|
|
|
|
|
|
- for(n=0 ; n<size ; n++)
|
|
|
+ if (_starpu_cache_enabled == 0) return 0;
|
|
|
+
|
|
|
+ STARPU_PTHREAD_MUTEX_LOCK(&_cache_mutex);
|
|
|
+ HASH_FIND_PTR(_cache_data, &data_handle, entry);
|
|
|
+ if (entry == NULL)
|
|
|
{
|
|
|
- struct _starpu_data_entry *already_sent;
|
|
|
+ _STARPU_MPI_MALLOC(entry, sizeof(*entry));
|
|
|
+ entry->data_handle = data_handle;
|
|
|
+ HASH_ADD_PTR(_cache_data, data_handle, entry);
|
|
|
+ }
|
|
|
+ STARPU_PTHREAD_MUTEX_UNLOCK(&_cache_mutex);
|
|
|
+}
|
|
|
|
|
|
- STARPU_PTHREAD_MUTEX_LOCK(&_cache_sent_mutex[n]);
|
|
|
- HASH_FIND_PTR(_cache_sent_data[n], &data, already_sent);
|
|
|
- if (already_sent)
|
|
|
- {
|
|
|
- _STARPU_MPI_DEBUG(2, "Clearing send cache for data %p\n", data);
|
|
|
- HASH_DEL(_cache_sent_data[n], already_sent);
|
|
|
- free(already_sent);
|
|
|
- }
|
|
|
- STARPU_PTHREAD_MUTEX_UNLOCK(&_cache_sent_mutex[n]);
|
|
|
+static void _starpu_mpi_cache_data_remove(starpu_data_handle_t data_handle)
|
|
|
+{
|
|
|
+ struct _starpu_data_entry *entry;
|
|
|
+
|
|
|
+ if (_starpu_cache_enabled == 0) return 0;
|
|
|
+
|
|
|
+ STARPU_PTHREAD_MUTEX_LOCK(&_cache_mutex);
|
|
|
+ HASH_FIND_PTR(_cache_data, &data_handle, entry);
|
|
|
+ if (entry)
|
|
|
+ {
|
|
|
+ HASH_DEL(_cache_data, entry);
|
|
|
+ free(entry);
|
|
|
}
|
|
|
+ STARPU_PTHREAD_MUTEX_UNLOCK(&_cache_mutex);
|
|
|
}
|
|
|
|
|
|
-void _starpu_mpi_cache_received_data_clear(starpu_data_handle_t data)
|
|
|
+
|
|
|
+ * Received cache
|
|
|
+ **************************************/
|
|
|
+void _starpu_mpi_cache_received_data_clear(starpu_data_handle_t data_handle)
|
|
|
{
|
|
|
- int mpi_rank = starpu_mpi_data_get_rank(data);
|
|
|
- struct _starpu_data_entry *already_received;
|
|
|
+ int mpi_rank = starpu_mpi_data_get_rank(data_handle);
|
|
|
+ struct _starpu_mpi_data *mpi_data = data_handle->mpi_data;
|
|
|
+
|
|
|
+ if (_starpu_cache_enabled == 0) return 0;
|
|
|
|
|
|
+ STARPU_ASSERT(mpi_data->magic == 42);
|
|
|
STARPU_MPI_ASSERT_MSG(mpi_rank < _starpu_cache_comm_size, "Node %d invalid. Max node is %d\n", mpi_rank, _starpu_cache_comm_size);
|
|
|
|
|
|
- STARPU_PTHREAD_MUTEX_LOCK(&_cache_received_mutex[mpi_rank]);
|
|
|
- HASH_FIND_PTR(_cache_received_data[mpi_rank], &data, already_received);
|
|
|
- if (already_received)
|
|
|
+ STARPU_PTHREAD_MUTEX_LOCK(&mpi_data->cache_received_mutex);
|
|
|
+ if (mpi_data->cache_received == 1)
|
|
|
{
|
|
|
#ifdef STARPU_DEVEL
|
|
|
# warning TODO: Somebody else will write to the data, so discard our cached copy if any. starpu_mpi could just remember itself.
|
|
|
#endif
|
|
|
- _STARPU_MPI_DEBUG(2, "Clearing receive cache for data %p\n", data);
|
|
|
- HASH_DEL(_cache_received_data[mpi_rank], already_received);
|
|
|
- _starpu_mpi_cache_stats_dec(mpi_rank, data);
|
|
|
- free(already_received);
|
|
|
- starpu_data_invalidate_submit(data);
|
|
|
+ _STARPU_MPI_DEBUG(2, "Clearing receive cache for data %p\n", data_handle);
|
|
|
+ mpi_data->cache_received = 0;
|
|
|
+ starpu_data_invalidate_submit(data_handle);
|
|
|
+ _starpu_mpi_cache_data_remove(data_handle);
|
|
|
+ _starpu_mpi_cache_stats_dec(mpi_rank, data_handle);
|
|
|
}
|
|
|
- STARPU_PTHREAD_MUTEX_UNLOCK(&_cache_received_mutex[mpi_rank]);
|
|
|
+ STARPU_PTHREAD_MUTEX_UNLOCK(&mpi_data->cache_received_mutex);
|
|
|
}
|
|
|
|
|
|
-void starpu_mpi_cache_flush_all_data(MPI_Comm comm)
|
|
|
+int _starpu_mpi_cache_received_data_set(starpu_data_handle_t data_handle)
|
|
|
{
|
|
|
- int nb_nodes, i;
|
|
|
- int mpi_rank, my_rank;
|
|
|
+ int mpi_rank = starpu_mpi_data_get_rank(data_handle);
|
|
|
+ struct _starpu_mpi_data *mpi_data = data_handle->mpi_data;
|
|
|
|
|
|
- if (_starpu_cache_enabled == 0) return;
|
|
|
+ if (_starpu_cache_enabled == 0) return 0;
|
|
|
|
|
|
- starpu_mpi_comm_size(comm, &nb_nodes);
|
|
|
- starpu_mpi_comm_rank(comm, &my_rank);
|
|
|
+ STARPU_ASSERT(mpi_data->magic == 42);
|
|
|
+ STARPU_MPI_ASSERT_MSG(mpi_rank < _starpu_cache_comm_size, "Node %d invalid. Max node is %d\n", mpi_rank, _starpu_cache_comm_size);
|
|
|
|
|
|
- for(i=0 ; i<nb_nodes ; i++)
|
|
|
+ STARPU_PTHREAD_MUTEX_LOCK(&mpi_data->cache_received_mutex);
|
|
|
+ int already_received = mpi_data->cache_received;
|
|
|
+ if (already_received == 0)
|
|
|
{
|
|
|
- struct _starpu_data_entry *entry, *tmp;
|
|
|
-
|
|
|
- STARPU_PTHREAD_MUTEX_LOCK(&_cache_sent_mutex[i]);
|
|
|
- HASH_ITER(hh, _cache_sent_data[i], entry, tmp)
|
|
|
- {
|
|
|
- mpi_rank = starpu_mpi_data_get_rank(entry->data);
|
|
|
- if (mpi_rank != my_rank && mpi_rank != -1)
|
|
|
- starpu_data_invalidate_submit(entry->data);
|
|
|
- HASH_DEL(_cache_sent_data[i], entry);
|
|
|
- free(entry);
|
|
|
- }
|
|
|
- STARPU_PTHREAD_MUTEX_UNLOCK(&_cache_sent_mutex[i]);
|
|
|
-
|
|
|
- STARPU_PTHREAD_MUTEX_LOCK(&_cache_received_mutex[i]);
|
|
|
- HASH_ITER(hh, _cache_received_data[i], entry, tmp)
|
|
|
- {
|
|
|
- mpi_rank = starpu_mpi_data_get_rank(entry->data);
|
|
|
- if (mpi_rank != my_rank && mpi_rank != -1)
|
|
|
- starpu_data_invalidate_submit(entry->data);
|
|
|
- HASH_DEL(_cache_received_data[i], entry);
|
|
|
- _starpu_mpi_cache_stats_dec(i, entry->data);
|
|
|
- free(entry);
|
|
|
- }
|
|
|
- STARPU_PTHREAD_MUTEX_UNLOCK(&_cache_received_mutex[i]);
|
|
|
+ _STARPU_MPI_DEBUG(2, "Noting that data %p has already been received by %d\n", data_handle, mpi_rank);
|
|
|
+ mpi_data->cache_received = 1;
|
|
|
+ _starpu_mpi_cache_data_add(data_handle);
|
|
|
+ _starpu_mpi_cache_stats_inc(mpi_rank, data_handle);
|
|
|
+ }
|
|
|
+ else
|
|
|
+ {
|
|
|
+ _STARPU_MPI_DEBUG(2, "Do not receive data %p from node %d as it is already available\n", data_handle, mpi_rank);
|
|
|
}
|
|
|
+ STARPU_PTHREAD_MUTEX_UNLOCK(&mpi_data->cache_received_mutex);
|
|
|
+ return already_received;
|
|
|
}
|
|
|
|
|
|
-void _starpu_mpi_cache_flush(MPI_Comm comm, starpu_data_handle_t data_handle)
|
|
|
+int _starpu_mpi_cache_received_data_get(starpu_data_handle_t data_handle)
|
|
|
{
|
|
|
- struct _starpu_data_entry *avail;
|
|
|
- int i, nb_nodes;
|
|
|
+ int already_received;
|
|
|
+ struct _starpu_mpi_data *mpi_data = data_handle->mpi_data;
|
|
|
|
|
|
- if (_starpu_cache_enabled == 0) return;
|
|
|
+ if (_starpu_cache_enabled == 0) return 0;
|
|
|
|
|
|
- starpu_mpi_comm_size(comm, &nb_nodes);
|
|
|
- for(i=0 ; i<nb_nodes ; i++)
|
|
|
- {
|
|
|
- STARPU_PTHREAD_MUTEX_LOCK(&_cache_sent_mutex[i]);
|
|
|
- HASH_FIND_PTR(_cache_sent_data[i], &data_handle, avail);
|
|
|
- if (avail)
|
|
|
- {
|
|
|
- _STARPU_MPI_DEBUG(2, "Clearing send cache for data %p\n", data_handle);
|
|
|
- HASH_DEL(_cache_sent_data[i], avail);
|
|
|
- free(avail);
|
|
|
- }
|
|
|
- STARPU_PTHREAD_MUTEX_UNLOCK(&_cache_sent_mutex[i]);
|
|
|
+ STARPU_ASSERT(mpi_data->magic == 42);
|
|
|
|
|
|
- STARPU_PTHREAD_MUTEX_LOCK(&_cache_received_mutex[i]);
|
|
|
- HASH_FIND_PTR(_cache_received_data[i], &data_handle, avail);
|
|
|
- if (avail)
|
|
|
- {
|
|
|
- _STARPU_MPI_DEBUG(2, "Clearing send cache for data %p\n", data_handle);
|
|
|
- HASH_DEL(_cache_received_data[i], avail);
|
|
|
- _starpu_mpi_cache_stats_dec(i, data_handle);
|
|
|
- free(avail);
|
|
|
- }
|
|
|
- STARPU_PTHREAD_MUTEX_UNLOCK(&_cache_received_mutex[i]);
|
|
|
- }
|
|
|
+ STARPU_PTHREAD_MUTEX_LOCK(&mpi_data->cache_received_mutex);
|
|
|
+ already_received = mpi_data->cache_received;
|
|
|
+ STARPU_PTHREAD_MUTEX_UNLOCK(&mpi_data->cache_received_mutex);
|
|
|
+ return already_received;
|
|
|
}
|
|
|
|
|
|
-void starpu_mpi_cache_flush(MPI_Comm comm, starpu_data_handle_t data_handle)
|
|
|
+int starpu_mpi_cached_receive(starpu_data_handle_t data_handle)
|
|
|
{
|
|
|
- int my_rank, mpi_rank;
|
|
|
+ return _starpu_mpi_cache_received_data_get(data_handle);
|
|
|
+}
|
|
|
+
|
|
|
+
|
|
|
+ * Send cache
|
|
|
+ **************************************/
|
|
|
+void _starpu_mpi_cache_sent_data_clear(starpu_data_handle_t data_handle)
|
|
|
+{
|
|
|
+ int n, size;
|
|
|
+ struct _starpu_mpi_data *mpi_data = data_handle->mpi_data;
|
|
|
|
|
|
- _starpu_mpi_cache_flush(comm, data_handle);
|
|
|
+ if (_starpu_cache_enabled == 0) return 0;
|
|
|
|
|
|
- starpu_mpi_comm_rank(comm, &my_rank);
|
|
|
- mpi_rank = starpu_mpi_data_get_rank(data_handle);
|
|
|
- if (mpi_rank != my_rank && mpi_rank != -1)
|
|
|
- starpu_data_invalidate_submit(data_handle);
|
|
|
+ starpu_mpi_comm_size(mpi_data->node_tag.comm, &size);
|
|
|
+ for(n=0 ; n<size ; n++)
|
|
|
+ {
|
|
|
+ STARPU_PTHREAD_MUTEX_LOCK(&mpi_data->cache_sent_mutex[n]);
|
|
|
+ if (mpi_data->cache_sent[n] == 1)
|
|
|
+ {
|
|
|
+ _STARPU_MPI_DEBUG(2, "Clearing send cache for data %p\n", data_handle);
|
|
|
+ mpi_data->cache_sent[n] = 0;
|
|
|
+ _starpu_mpi_cache_data_remove(data_handle);
|
|
|
+ }
|
|
|
+ STARPU_PTHREAD_MUTEX_UNLOCK(&mpi_data->cache_sent_mutex[n]);
|
|
|
+ }
|
|
|
}
|
|
|
|
|
|
-void *_starpu_mpi_cache_received_data_set(starpu_data_handle_t data, int mpi_rank)
|
|
|
+int _starpu_mpi_cache_sent_data_set(starpu_data_handle_t data_handle, int dest)
|
|
|
{
|
|
|
- struct _starpu_data_entry *already_received;
|
|
|
+ struct _starpu_mpi_data *mpi_data = data_handle->mpi_data;
|
|
|
|
|
|
- if (_starpu_cache_enabled == 0) return NULL;
|
|
|
+ if (_starpu_cache_enabled == 0) return 0;
|
|
|
|
|
|
- STARPU_MPI_ASSERT_MSG(mpi_rank < _starpu_cache_comm_size, "Node %d invalid. Max node is %d\n", mpi_rank, _starpu_cache_comm_size);
|
|
|
+ STARPU_MPI_ASSERT_MSG(dest < _starpu_cache_comm_size, "Node %d invalid. Max node is %d\n", dest, _starpu_cache_comm_size);
|
|
|
|
|
|
- STARPU_PTHREAD_MUTEX_LOCK(&_cache_received_mutex[mpi_rank]);
|
|
|
- HASH_FIND_PTR(_cache_received_data[mpi_rank], &data, already_received);
|
|
|
- if (already_received == NULL)
|
|
|
+ STARPU_PTHREAD_MUTEX_LOCK(&mpi_data->cache_sent_mutex[dest]);
|
|
|
+ int already_sent = mpi_data->cache_sent[dest];
|
|
|
+ if (mpi_data->cache_sent[dest] == 0)
|
|
|
{
|
|
|
- struct _starpu_data_entry *entry;
|
|
|
- _STARPU_MPI_MALLOC(entry, sizeof(*entry));
|
|
|
- entry->data = data;
|
|
|
- HASH_ADD_PTR(_cache_received_data[mpi_rank], data, entry);
|
|
|
- _STARPU_MPI_DEBUG(2, "Noting that data %p has already been received by %d\n", data, mpi_rank);
|
|
|
- _starpu_mpi_cache_stats_inc(mpi_rank, data);
|
|
|
+ mpi_data->cache_sent[dest] = 1;
|
|
|
+ _starpu_mpi_cache_data_add(data_handle);
|
|
|
+ _STARPU_MPI_DEBUG(2, "Noting that data %p has already been sent to %d\n", data_handle, dest);
|
|
|
}
|
|
|
else
|
|
|
{
|
|
|
- _STARPU_MPI_DEBUG(2, "Do not receive data %p from node %d as it is already available\n", data, mpi_rank);
|
|
|
+ _STARPU_MPI_DEBUG(2, "Do not send data %p to node %d as it has already been sent\n", data_handle, dest);
|
|
|
}
|
|
|
- STARPU_PTHREAD_MUTEX_UNLOCK(&_cache_received_mutex[mpi_rank]);
|
|
|
- return already_received;
|
|
|
+ STARPU_PTHREAD_MUTEX_UNLOCK(&mpi_data->cache_sent_mutex[dest]);
|
|
|
+ return already_sent;
|
|
|
}
|
|
|
|
|
|
-void *_starpu_mpi_cache_received_data_get(starpu_data_handle_t data, int mpi_rank)
|
|
|
+int _starpu_mpi_cache_sent_data_get(starpu_data_handle_t data_handle, int dest)
|
|
|
{
|
|
|
- struct _starpu_data_entry *already_received;
|
|
|
+ struct _starpu_mpi_data *mpi_data = data_handle->mpi_data;
|
|
|
+ int already_sent;
|
|
|
|
|
|
- if (_starpu_cache_enabled == 0) return NULL;
|
|
|
+ if (_starpu_cache_enabled == 0) return 0;
|
|
|
|
|
|
- STARPU_MPI_ASSERT_MSG(mpi_rank < _starpu_cache_comm_size, "Node %d invalid. Max node is %d\n", mpi_rank, _starpu_cache_comm_size);
|
|
|
+ STARPU_MPI_ASSERT_MSG(dest < _starpu_cache_comm_size, "Node %d invalid. Max node is %d\n", dest, _starpu_cache_comm_size);
|
|
|
|
|
|
- STARPU_PTHREAD_MUTEX_LOCK(&_cache_received_mutex[mpi_rank]);
|
|
|
- HASH_FIND_PTR(_cache_received_data[mpi_rank], &data, already_received);
|
|
|
- STARPU_PTHREAD_MUTEX_UNLOCK(&_cache_received_mutex[mpi_rank]);
|
|
|
- return already_received;
|
|
|
+ STARPU_PTHREAD_MUTEX_LOCK(&mpi_data->cache_sent_mutex[dest]);
|
|
|
+ already_sent = mpi_data->cache_sent[dest];
|
|
|
+ STARPU_PTHREAD_MUTEX_UNLOCK(&mpi_data->cache_sent_mutex[dest]);
|
|
|
+ return already_sent;
|
|
|
}
|
|
|
|
|
|
-int starpu_mpi_cached_receive(starpu_data_handle_t data_handle)
|
|
|
+int starpu_mpi_cached_send(starpu_data_handle_t data_handle, int dest)
|
|
|
{
|
|
|
- int owner = starpu_mpi_data_get_rank(data_handle);
|
|
|
- void *already_received = _starpu_mpi_cache_received_data_get(data_handle, owner);
|
|
|
- return already_received != NULL;
|
|
|
+ return _starpu_mpi_cache_sent_data_get(data_handle, dest);
|
|
|
}
|
|
|
|
|
|
-void *_starpu_mpi_cache_sent_data_set(starpu_data_handle_t data, int dest)
|
|
|
+void _starpu_mpi_cache_flush(starpu_data_handle_t data_handle)
|
|
|
{
|
|
|
- struct _starpu_data_entry *already_sent;
|
|
|
-
|
|
|
- if (_starpu_cache_enabled == 0) return NULL;
|
|
|
+ struct _starpu_mpi_data *mpi_data = data_handle->mpi_data;
|
|
|
+ int i, nb_nodes;
|
|
|
|
|
|
- STARPU_MPI_ASSERT_MSG(dest < _starpu_cache_comm_size, "Node %d invalid. Max node is %d\n", dest, _starpu_cache_comm_size);
|
|
|
+ if (_starpu_cache_enabled == 0) return;
|
|
|
|
|
|
- STARPU_PTHREAD_MUTEX_LOCK(&_cache_sent_mutex[dest]);
|
|
|
- HASH_FIND_PTR(_cache_sent_data[dest], &data, already_sent);
|
|
|
- if (already_sent == NULL)
|
|
|
+ starpu_mpi_comm_size(mpi_data->node_tag.comm, &nb_nodes);
|
|
|
+ for(i=0 ; i<nb_nodes ; i++)
|
|
|
{
|
|
|
- struct _starpu_data_entry *entry;
|
|
|
- _STARPU_MPI_MALLOC(entry, sizeof(*entry));
|
|
|
- entry->data = data;
|
|
|
- HASH_ADD_PTR(_cache_sent_data[dest], data, entry);
|
|
|
- _STARPU_MPI_DEBUG(2, "Noting that data %p has already been sent to %d\n", data, dest);
|
|
|
+ STARPU_PTHREAD_MUTEX_LOCK(&mpi_data->cache_sent_mutex[i]);
|
|
|
+ if (mpi_data->cache_sent[i] == 1)
|
|
|
+ {
|
|
|
+ _STARPU_MPI_DEBUG(2, "Clearing send cache for data %p\n", data_handle);
|
|
|
+ mpi_data->cache_sent[i] = 0;
|
|
|
+ _starpu_mpi_cache_stats_dec(i, data_handle);
|
|
|
+ }
|
|
|
+ STARPU_PTHREAD_MUTEX_UNLOCK(&mpi_data->cache_sent_mutex[i]);
|
|
|
}
|
|
|
- else
|
|
|
+
|
|
|
+ STARPU_PTHREAD_MUTEX_LOCK(&mpi_data->cache_received_mutex);
|
|
|
+ if (mpi_data->cache_received == 1)
|
|
|
{
|
|
|
- _STARPU_MPI_DEBUG(2, "Do not send data %p to node %d as it has already been sent\n", data, dest);
|
|
|
+ int mpi_rank = starpu_mpi_data_get_rank(data_handle);
|
|
|
+ _STARPU_MPI_DEBUG(2, "Clearing received cache for data %p\n", data_handle);
|
|
|
+ mpi_data->cache_received = 0;
|
|
|
+ _starpu_mpi_cache_stats_dec(mpi_rank, data_handle);
|
|
|
}
|
|
|
- STARPU_PTHREAD_MUTEX_UNLOCK(&_cache_sent_mutex[dest]);
|
|
|
- return already_sent;
|
|
|
+ STARPU_PTHREAD_MUTEX_UNLOCK(&mpi_data->cache_received_mutex);
|
|
|
}
|
|
|
|
|
|
-void *_starpu_mpi_cache_sent_data_get(starpu_data_handle_t data, int dest)
|
|
|
+static void _starpu_mpi_cache_flush_and_invalidate(MPI_Comm comm, starpu_data_handle_t data_handle)
|
|
|
{
|
|
|
- struct _starpu_data_entry *already_sent;
|
|
|
-
|
|
|
- if (_starpu_cache_enabled == 0) return NULL;
|
|
|
+ int my_rank, mpi_rank;
|
|
|
|
|
|
- STARPU_MPI_ASSERT_MSG(dest < _starpu_cache_comm_size, "Node %d invalid. Max node is %d\n", dest, _starpu_cache_comm_size);
|
|
|
+ _starpu_mpi_cache_flush(data_handle);
|
|
|
|
|
|
- STARPU_PTHREAD_MUTEX_LOCK(&_cache_sent_mutex[dest]);
|
|
|
- HASH_FIND_PTR(_cache_sent_data[dest], &data, already_sent);
|
|
|
- STARPU_PTHREAD_MUTEX_UNLOCK(&_cache_sent_mutex[dest]);
|
|
|
- return already_sent;
|
|
|
+ starpu_mpi_comm_rank(comm, &my_rank);
|
|
|
+ mpi_rank = starpu_mpi_data_get_rank(data_handle);
|
|
|
+ if (mpi_rank != my_rank && mpi_rank != -1)
|
|
|
+ starpu_data_invalidate_submit(data_handle);
|
|
|
}
|
|
|
|
|
|
-int starpu_mpi_cached_send(starpu_data_handle_t data_handle, int dest)
|
|
|
+void starpu_mpi_cache_flush(MPI_Comm comm, starpu_data_handle_t data_handle)
|
|
|
{
|
|
|
- void *already_sent = _starpu_mpi_cache_sent_data_get(data_handle, dest);
|
|
|
- return already_sent != NULL;
|
|
|
+ if (_starpu_cache_enabled == 0) return 0;
|
|
|
+
|
|
|
+ _starpu_mpi_cache_flush_and_invalidate(comm, data_handle);
|
|
|
+ _starpu_mpi_cache_data_remove(data_handle);
|
|
|
}
|
|
|
|
|
|
+void starpu_mpi_cache_flush_all_data(MPI_Comm comm)
|
|
|
+{
|
|
|
+ struct _starpu_data_entry *entry, *tmp;
|
|
|
+
|
|
|
+ if (_starpu_cache_enabled == 0) return;
|
|
|
+
|
|
|
+ STARPU_PTHREAD_MUTEX_LOCK(&_cache_mutex);
|
|
|
+ HASH_ITER(hh, _cache_data, entry, tmp)
|
|
|
+ {
|
|
|
+ _starpu_mpi_cache_flush_and_invalidate(comm, entry->data_handle);
|
|
|
+ HASH_DEL(_cache_data, entry);
|
|
|
+ free(entry);
|
|
|
+ }
|
|
|
+ STARPU_PTHREAD_MUTEX_UNLOCK(&_cache_mutex);
|
|
|
+}
|