лет назад: 13 · f60eb1288d
--- a/ChangeLog
+++ b/ChangeLog
@@ -56,6 +56,8 @@ New features:
 
				         - When exchanging user-defined data interfaces, the size of
			
 
				 	  the data is the size returned by the pack operation, i.e
			
 
				 	  data with dynamic size can now be exchanged with StarPU-MPI.
			
 
				+  * Add experimental simgrid support, to simulate execution with various
			
 
				+    number of CPUs, GPUs, amount of memory, etc.
			
 
				 
			
 
				 Changes:
			
 
				   * Fix the block filter functions.
			
--- a/configure.ac
+++ b/configure.ac
@@ -777,6 +777,25 @@ AC_DEFINE_UNQUOTED(STARPU_MAXGORDONDEVS, [1], [maximum number of GORDON devices]
 
				 #                                                                             #
			
 
				 ###############################################################################
			
 
				 
			
 
				+AC_ARG_ENABLE(simgrid, [AS_HELP_STRING([--enable-simgrid],
			
 
				+			[Enable simulating execution in simgrid])],
			
 
				+			enable_simgrid=$enableval, enable_simgrid=no)
			
 
				+if test x$enable_simgrid = xyes ; then
			
 
				+	AC_HAVE_LIBRARY([simgrid], [],
			
 
				+		[
			
 
				+			AC_MSG_ERROR(Simgrid support needs simgrid installed)
			
 
				+		]
			
 
				+	)
			
 
				+	SIMGRID_LIBS=-lsimgrid
			
 
				+	AC_DEFINE(STARPU_SIMGRID, 1, [Define this to enable simgrid execution])
			
 
				+	# Avoid the starpu top thread compilation
			
 
				+	enable_starpu_top=no
			
 
				+	# We won't bind or detect anything
			
 
				+	with_hwloc=no
			
 
				+	# In simgrid, it's much better to let workers block than spinlock
			
 
				+	enable_blocking=yes
			
 
				+fi
			
 
				+
			
 
				 AC_MSG_CHECKING(whether blocking drivers should be disabled)
			
 
				 AC_ARG_ENABLE(blocking-drivers, [AS_HELP_STRING([--enable-blocking-drivers], [enable blocking drivers])],
			
 
				 				enable_blocking=$enableval, enable_blocking=$enable_simgrid)
			
@@ -1183,10 +1202,6 @@ else
 
				   build_starpu_top=no
			
 
				 fi
			
 
				 
			
 
				-if test "x$build_starpu_top" != "xno" ; then
			
 
				-	AC_DEFINE(STARPU_TOP, [1], [Define this to 1 to enable building StarPU Top])
			
 
				-fi
			
 
				-
			
 
				 AM_CONDITIONAL(BUILD_STARPU_TOP, test x$build_starpu_top = xyes)
			
 
				 
			
 
				 ###############################################################################
			
@@ -1712,7 +1727,7 @@ AC_SUBST([LIBSTARPU_LDFLAGS])
 
				 
			
 
				 LIBSTARPU_LINK=libstarpu-$STARPU_EFFECTIVE_VERSION.la
			
 
				 if test x$enable_perf_debug = xyes; then
			
 
				-	LIBSTARPU_LINK=".libs/libstarpu-$STARPU_EFFECTIVE_VERSION.a $LIBSTARPU_LDFLAGS $HWLOC_LIBS $STARPU_CUDA_LDFLAGS $STARPU_OPENCL_LDFLAGS"
			
 
				+	LIBSTARPU_LINK=".libs/libstarpu-$STARPU_EFFECTIVE_VERSION.a $LIBSTARPU_LDFLAGS $HWLOC_LIBS $SIMGRID_LIBS $STARPU_CUDA_LDFLAGS $STARPU_OPENCL_LDFLAGS"
			
 
				 fi
			
 
				 AC_SUBST([LIBSTARPU_LINK])
			
 
				 
			
@@ -1808,6 +1823,7 @@ AC_MSG_NOTICE([
 
				 	       GCC plug-in test suite (requires GNU Guile): $run_gcc_plugin_test_suite
			
 
				 	       SOCL enabled:                                $build_socl
			
 
				                SOCL test suite:                             $run_socl_check
			
 
				+               simgrid enabled:                             $enable_simgrid
			
 
				 ])
			
 
				 
			
 
				 if test "$build_socl" = "yes" -a "$run_socl_check" = "no" ; then
			
--- a/doc/chapters/configuration.texi
+++ b/doc/chapters/configuration.texi
@@ -283,6 +283,11 @@ Disable the build of examples.
 
				 Enable memory statistics (@pxref{Memory feedback}).
			
 
				 @end defvr
			
 
				 
			
 
				+@defvr {Configure option} --enable-simgrid
			
 
				+Enable simulation of execution in simgrid, to allow easy experimentation with
			
 
				+various numbers of cores and GPUs, or amount of memory, etc. Experimental.
			
 
				+@end defvr
			
 
				+
			
 
				 @node Execution configuration through environment variables
			
 
				 @section Execution configuration through environment variables
			
 
				 
			
--- a/doc/chapters/perf-optimization.texi
+++ b/doc/chapters/perf-optimization.texi
@@ -21,6 +21,7 @@ TODO: improve!
 
				 * Profiling::
			
 
				 * CUDA-specific optimizations::
			
 
				 * Performance debugging::
			
 
				+* Simulated performance::
			
 
				 @end menu
			
 
				 
			
 
				 Simply encapsulating application kernels into tasks already permits to
			
@@ -422,3 +423,21 @@ detailed in the next chapter. The various informations should be checked for.
 
				   greedy algorithm which thus performs badly.
			
 
				 @end itemize
			
 
				 @end itemize
			
 
				+
			
 
				+@node Simulated performance
			
 
				+@section Simulated performance
			
 
				+
			
 
				+StarPU can use Simgrid in order to simulate execution on an arbitrary
			
 
				+platform. The idea is to first compile StarPU normally, and run the application,
			
 
				+so as to automatically benchmark the bus and the codelets. Then, recompile
			
 
				+StarPU, passing @code{--enable-simgrid} to @code{./configure}, and re-run the
			
 
				+application, specifying the requested number of devices:
			
 
				+
			
 
				+@cartouche
			
 
				+@smallexample
			
 
				+STARPU_NCPU=12 STARPU_NCUDA=2 STARPU_NOPENCL=0 ./example
			
 
				+@end smallexample
			
 
				+@end cartouche
			
 
				+
			
 
				+For now, only the number of CPUs can be arbitrarily chosen. The numbers of CUDA
			
 
				+and OpenCL devices have to be lower than the real number on the current machine.
			
--- a/include/starpu.h
+++ b/include/starpu.h
@@ -66,6 +66,10 @@ extern "C"
 
				 {
			
 
				 #endif
			
 
				 
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+#define main starpu_main
			
 
				+#endif
			
 
				+
			
 
				 enum starpu_archtype
			
 
				 {
			
 
				 	STARPU_CPU_WORKER,    /* CPU core */
			
--- a/include/starpu_config.h.in
+++ b/include/starpu_config.h.in
@@ -26,6 +26,8 @@
 
				 #undef STARPU_USE_OPENCL
			
 
				 #undef STARPU_USE_GORDON
			
 
				 
			
 
				+#undef STARPU_SIMGRID
			
 
				+
			
 
				 #undef STARPU_HAVE_ICC
			
 
				 
			
 
				 #undef STARPU_USE_MPI
			
--- a/include/starpu_perfmodel.h
+++ b/include/starpu_perfmodel.h
@@ -188,7 +188,7 @@ struct starpu_perfmodel
 
				 	unsigned is_loaded;
			
 
				 	unsigned benchmarking;
			
 
				 
			
 
				-#if defined(_MSC_VER)
			
 
				+#if defined(_MSC_VER) || defined(STARPU_SIMGRID)
			
 
				 	void *model_rwlock;
			
 
				 #else
			
 
				 	pthread_rwlock_t model_rwlock;
			
--- a/include/starpu_scheduler.h
+++ b/include/starpu_scheduler.h
@@ -118,7 +118,7 @@ multiple workers may use the same condition variable. For instance, in the case
 
				 of a scheduling strategy with a single task queue, the same condition variable
			
 
				 would be used to block and wake up all workers.  The initialization method of a
			
 
				 scheduling strategy (init_sched) must call this function once per worker. */
			
 
				-#if !defined(_MSC_VER)
			
 
				+#if !defined(_MSC_VER) && !defined(STARPU_SIMGRID)
			
 
				 void starpu_worker_set_sched_condition(int workerid, pthread_cond_t *sched_cond, pthread_mutex_t *sched_mutex);
			
 
				 #endif
			
 
				 
			
--- a/mpi/src/starpu_mpi.c
+++ b/mpi/src/starpu_mpi.c
@@ -855,7 +855,7 @@ int _starpu_mpi_initialize(int *argc, char ***argv)
 
				 	struct _starpu_mpi_argc_argv *argc_argv = malloc(sizeof(struct _starpu_mpi_argc_argv));
			
 
				 	argc_argv->argc = argc;
			
 
				 	argc_argv->argv = argv;
			
 
				-	_STARPU_PTHREAD_CREATE(&progress_thread, NULL, _starpu_mpi_progress_thread_func, argc_argv);
			
 
				+	_STARPU_PTHREAD_CREATE("MPI progress", &progress_thread, NULL, _starpu_mpi_progress_thread_func, argc_argv);
			
 
				 
			
 
				 	_STARPU_PTHREAD_MUTEX_LOCK(&mutex);
			
 
				 	while (!running)
			
--- a/src/Makefile.am
+++ b/src/Makefile.am
@@ -72,6 +72,7 @@ noinst_HEADERS = 						\
 
				 	core/errorcheck.h					\
			
 
				 	core/combined_workers.h					\
			
 
				 	core/parallel_task.h					\
			
 
				+	core/simgrid.h						\
			
 
				 	core/task_bundle.h					\
			
 
				 	sched_policies/detect_combined_workers.h		\
			
 
				 	sched_policies/fifo_queues.h				\
			
@@ -147,6 +148,7 @@ libstarpu_@STARPU_EFFECTIVE_VERSION@_la_SOURCES = 						\
 
				 	core/perfmodel/perfmodel_print.c			\
			
 
				 	core/perfmodel/regression.c				\
			
 
				 	core/sched_policy.c					\
			
 
				+	core/simgrid.c						\
			
 
				 	core/priorities.c					\
			
 
				 	core/parallel_task.c					\
			
 
				 	sched_policies/eager_central_policy.c			\
			
--- a/src/common/barrier.h
+++ b/src/common/barrier.h
@@ -17,6 +17,11 @@
 
				 #ifndef __COMMON_BARRIER_H__
			
 
				 #define __COMMON_BARRIER_H__
			
 
				 
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+/* Force using our implementation of barriers, so it can be simgridish */
			
 
				+#undef PTHREAD_BARRIER_SERIAL_THREAD
			
 
				+#endif
			
 
				+
			
 
				 #include <pthread.h>
			
 
				 #include <common/utils.h>
			
 
				 
			
--- a/src/common/starpu_spinlock.c
+++ b/src/common/starpu_spinlock.c
@@ -20,6 +20,10 @@
 
				 #include <common/utils.h>
			
 
				 #include <starpu_util.h>
			
 
				 
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+#include <msg/msg.h>
			
 
				+#endif
			
 
				+
			
 
				 int _starpu_spin_init(struct _starpu_spinlock *lock)
			
 
				 {
			
 
				 #ifdef STARPU_SPINLOCK_CHECK
			
@@ -70,9 +74,22 @@ int _starpu_spin_lock(struct _starpu_spinlock *lock)
 
				 	return ret;
			
 
				 #else
			
 
				 #ifdef HAVE_PTHREAD_SPIN_LOCK
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+	while (1) {
			
 
				+		int ret = pthread_spin_trylock(&lock->lock);
			
 
				+		if (ret <= 0)
			
 
				+			return ret;
			
 
				+#ifdef STARPU_DEVEL
			
 
				+#warning FIXME: better way to spinlock?
			
 
				+#endif
			
 
				+		/* Sleep for 10µs */
			
 
				+		MSG_process_sleep(0.000010);
			
 
				+	}
			
 
				+#else
			
 
				 	int ret = pthread_spin_lock(&lock->lock);
			
 
				 	STARPU_ASSERT(!ret);
			
 
				 	return ret;
			
 
				+#endif
			
 
				 #else
			
 
				 	uint32_t prev;
			
 
				 	do
			
--- a/src/common/timing.c
+++ b/src/common/timing.c
@@ -21,7 +21,23 @@
 
				 #include <profiling/profiling.h>
			
 
				 #include <common/timing.h>
			
 
				 
			
 
				-#if defined(HAVE_CLOCK_GETTIME) && defined(CLOCK_MONOTONIC)
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+#include <msg/msg.h>
			
 
				+#endif
			
 
				+
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+void _starpu_timing_init(void)
			
 
				+{
			
 
				+}
			
 
				+
			
 
				+void _starpu_clock_gettime(struct timespec *ts)
			
 
				+{
			
 
				+	double now = MSG_get_clock();
			
 
				+	ts->tv_sec = floor(now);
			
 
				+	ts->tv_nsec = floor((now - ts->tv_sec) * 1000000000);
			
 
				+}
			
 
				+
			
 
				+#elif defined(HAVE_CLOCK_GETTIME) && defined(CLOCK_MONOTONIC)
			
 
				 #include <time.h>
			
 
				 #ifndef _POSIX_C_SOURCE
			
 
				 /* for clock_gettime */
			
@@ -193,8 +209,12 @@ double starpu_timing_timespec_to_us(struct timespec *ts)
 
				 
			
 
				 double starpu_timing_now(void)
			
 
				 {
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+	return MSG_get_clock()*1000000;
			
 
				+#else
			
 
				 	struct timespec now;
			
 
				 	_starpu_clock_gettime(&now);
			
 
				 
			
 
				 	return starpu_timing_timespec_to_us(&now);
			
 
				+#endif
			
 
				 }
			
--- a/src/common/utils.h
+++ b/src/common/utils.h
@@ -26,6 +26,11 @@
 
				 #include <stdlib.h>
			
 
				 #include <math.h>
			
 
				 
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+#include <xbt/synchro_core.h>
			
 
				+#include <msg/msg.h>
			
 
				+#endif
			
 
				+
			
 
				 #ifdef STARPU_VERBOSE
			
 
				 #  define _STARPU_DEBUG(fmt, args ...) do { if (!getenv("STARPU_SILENT")) {fprintf(stderr, "[starpu][%s] " fmt ,__func__ ,##args); fflush(stderr); }} while(0)
			
 
				 #else
			
@@ -52,7 +57,11 @@
 
				 
			
 
				 #define _STARPU_IS_ZERO(a) (fpclassify(a) == FP_ZERO)
			
 
				 
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+typedef xbt_mutex_t _starpu_pthread_mutex_t;
			
 
				+#else
			
 
				 typedef pthread_mutex_t _starpu_pthread_mutex_t;
			
 
				+#endif
			
 
				 int _starpu_mkpath(const char *s, mode_t mode);
			
 
				 void _starpu_mkpath_and_check(const char *s, mode_t mode);
			
 
				 int _starpu_check_mutex_deadlock(_starpu_pthread_mutex_t *mutex);
			
@@ -69,7 +78,25 @@ struct starpu_codelet;
 
				 /* Returns the symbol associated to that job if any. */
			
 
				 const char *_starpu_codelet_get_model_name(struct starpu_codelet *cl);
			
 
				 
			
 
				-#define _STARPU_PTHREAD_CREATE(thread, attr, routine, arg) do {                \
			
 
				+struct _starpu_pthread_args {
			
 
				+	void *(*f)(void*);
			
 
				+	void *arg;
			
 
				+};
			
 
				+
			
 
				+int _starpu_simgrid_thread_start(int argc, char *argv[]);
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+#define _STARPU_PTHREAD_CREATE_ON(name, thread, attr, routine, threadarg, where) do {\
			
 
				+	struct _starpu_pthread_args *_args = malloc(sizeof(*_args));           \
			
 
				+	xbt_dynar_t _hosts;                                                    \
			
 
				+	_args->f = routine;                                                    \
			
 
				+	_args->arg = threadarg;                                                \
			
 
				+	_hosts = MSG_hosts_as_dynar();                                         \
			
 
				+	MSG_process_create((name), _starpu_simgrid_thread_start, _args,        \
			
 
				+			xbt_dynar_get_as(_hosts, (where), msg_host_t));        \
			
 
				+	xbt_dynar_free(&_hosts);                                               \
			
 
				+} while (0)
			
 
				+#else
			
 
				+#define _STARPU_PTHREAD_CREATE_ON(name, thread, attr, routine, arg, where) do {\
			
 
				 	int p_ret = pthread_create((thread), (attr), (routine), (arg));	       \
			
 
				 	if (STARPU_UNLIKELY(p_ret != 0)) {                                     \
			
 
				 		fprintf(stderr,                                                \
			
@@ -77,10 +104,24 @@ const char *_starpu_codelet_get_model_name(struct starpu_codelet *cl);
 
				 			__FILE__, __LINE__, strerror(p_ret));                  \
			
 
				 	}                                                                      \
			
 
				 } while (0)
			
 
				+#endif
			
 
				+#define _STARPU_PTHREAD_CREATE(name, thread, attr, routine, arg)               \
			
 
				+	_STARPU_PTHREAD_CREATE_ON(name, thread, attr, routine, arg, 0)
			
 
				 
			
 
				 /*
			
 
				  * Encapsulation of the pthread_key_* functions.
			
 
				  */
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+typedef int _starpu_pthread_key_t;
			
 
				+int _starpu_pthread_key_create(_starpu_pthread_key_t *key);
			
 
				+#define _STARPU_PTHREAD_KEY_CREATE(key, destr) _starpu_pthread_key_create(key)
			
 
				+int _starpu_pthread_key_delete(_starpu_pthread_key_t key);
			
 
				+#define _STARPU_PTHREAD_KEY_DELETE(key) _starpu_pthread_key_delete(key)
			
 
				+int _starpu_pthread_setspecific(_starpu_pthread_key_t key, void *ptr);
			
 
				+#define _STARPU_PTHREAD_SETSPECIFIC(key, ptr) _starpu_pthread_setspecific(key, ptr)
			
 
				+void *_starpu_pthread_getspecific(_starpu_pthread_key_t key);
			
 
				+#define _STARPU_PTHREAD_GETSPECIFIC(key) _starpu_pthread_getspecific(key)
			
 
				+#else
			
 
				 typedef pthread_key_t _starpu_pthread_key_t;
			
 
				 #define _STARPU_PTHREAD_KEY_CREATE(key, destr) do {                            \
			
 
				 	int p_ret = pthread_key_create((key), (destr));	                       \
			
@@ -110,10 +151,17 @@ typedef pthread_key_t _starpu_pthread_key_t;
 
				 } while (0)
			
 
				 
			
 
				 #define _STARPU_PTHREAD_GETSPECIFIC(key) pthread_getspecific((key))
			
 
				+#endif
			
 
				 
			
 
				 /*
			
 
				  * Encapsulation of the pthread_mutex_* functions.
			
 
				  */
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+#define _STARPU_PTHREAD_MUTEX_INITIALIZER NULL
			
 
				+#define _STARPU_PTHREAD_MUTEX_INIT(mutex, attr) do {                           \
			
 
				+	(*mutex) = xbt_mutex_init();                                           \
			
 
				+} while (0)
			
 
				+#else
			
 
				 #define _STARPU_PTHREAD_MUTEX_INITIALIZER PTHREAD_MUTEX_INITIALIZER
			
 
				 #define _STARPU_PTHREAD_MUTEX_INIT(mutex, attr) do {                           \
			
 
				 	int p_ret = pthread_mutex_init((mutex), (attr));                       \
			
@@ -124,7 +172,14 @@ typedef pthread_key_t _starpu_pthread_key_t;
 
				 		STARPU_ABORT();                                                \
			
 
				 	}                                                                      \
			
 
				 } while (0)
			
 
				+#endif
			
 
				 
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+#define _STARPU_PTHREAD_MUTEX_DESTROY(mutex) do {                              \
			
 
				+	if (*mutex)                                                            \
			
 
				+		xbt_mutex_destroy((*mutex));                                   \
			
 
				+} while (0)
			
 
				+#else
			
 
				 #define _STARPU_PTHREAD_MUTEX_DESTROY(mutex) do {                              \
			
 
				 	int p_ret = pthread_mutex_destroy(mutex);                              \
			
 
				 	if (STARPU_UNLIKELY(p_ret)) {                                          \
			
@@ -134,7 +189,14 @@ typedef pthread_key_t _starpu_pthread_key_t;
 
				 		STARPU_ABORT();                                                \
			
 
				 	}                                                                      \
			
 
				 } while(0)
			
 
				+#endif
			
 
				 
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+#define _STARPU_PTHREAD_MUTEX_LOCK(mutex) do {                                 \
			
 
				+	if (!(*mutex)) _STARPU_PTHREAD_MUTEX_INIT((mutex), NULL);              \
			
 
				+	xbt_mutex_acquire((*mutex));                                           \
			
 
				+} while (0)
			
 
				+#else
			
 
				 #define _STARPU_PTHREAD_MUTEX_LOCK(mutex) do {                                 \
			
 
				 	int p_ret = pthread_mutex_lock(mutex);                                 \
			
 
				 	if (STARPU_UNLIKELY(p_ret)) {                                          \
			
@@ -144,9 +206,19 @@ typedef pthread_key_t _starpu_pthread_key_t;
 
				 		STARPU_ABORT();                                                \
			
 
				 	}                                                                      \
			
 
				 } while (0)
			
 
				+#endif
			
 
				 
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+#define _STARPU_PTHREAD_MUTEX_TRYLOCK(mutex) ((void) (*(mutex) || (*(mutex) = xbt_mutex_init())), xbt_mutex_acquire(*(mutex)), 0)
			
 
				+#else
			
 
				 #define _STARPU_PTHREAD_MUTEX_TRYLOCK(mutex) pthread_mutex_trylock(mutex)
			
 
				+#endif
			
 
				 
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+#define _STARPU_PTHREAD_MUTEX_UNLOCK(mutex) do {                               \
			
 
				+	xbt_mutex_release((*mutex));                                           \
			
 
				+} while (0)
			
 
				+#else
			
 
				 #define _STARPU_PTHREAD_MUTEX_UNLOCK(mutex) do {                               \
			
 
				 	int p_ret = pthread_mutex_unlock(mutex);                               \
			
 
				 	if (STARPU_UNLIKELY(p_ret)) {                                          \
			
@@ -156,11 +228,19 @@ typedef pthread_key_t _starpu_pthread_key_t;
 
				 		STARPU_ABORT();                                                \
			
 
				 	}                                                                      \
			
 
				 } while (0)
			
 
				+#endif
			
 
				 
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+typedef xbt_mutex_t _starpu_pthread_rwlock_t;
			
 
				+#else
			
 
				 typedef pthread_rwlock_t _starpu_pthread_rwlock_t;
			
 
				+#endif
			
 
				 /*
			
 
				  * Encapsulation of the pthread_rwlock_* functions.
			
 
				  */
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+#define _STARPU_PTHREAD_RWLOCK_INIT(rwlock, attr) _STARPU_PTHREAD_MUTEX_INIT(rwlock, attr)
			
 
				+#else
			
 
				 #define _STARPU_PTHREAD_RWLOCK_INIT(rwlock, attr) do {                         \
			
 
				 	int p_ret = pthread_rwlock_init((rwlock), (attr));                     \
			
 
				 	if (STARPU_UNLIKELY(p_ret)) {                                          \
			
@@ -170,7 +250,11 @@ typedef pthread_rwlock_t _starpu_pthread_rwlock_t;
 
				 		STARPU_ABORT();                                                \
			
 
				 	}                                                                      \
			
 
				 } while (0)
			
 
				+#endif
			
 
				 
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+#define _STARPU_PTHREAD_RWLOCK_RDLOCK(rwlock) _STARPU_PTHREAD_MUTEX_LOCK(rwlock)
			
 
				+#else
			
 
				 #define _STARPU_PTHREAD_RWLOCK_RDLOCK(rwlock) do {                             \
			
 
				 	int p_ret = pthread_rwlock_rdlock(rwlock);                             \
			
 
				 	if (STARPU_UNLIKELY(p_ret)) {                                          \
			
@@ -180,7 +264,11 @@ typedef pthread_rwlock_t _starpu_pthread_rwlock_t;
 
				 		STARPU_ABORT();                                                \
			
 
				 	}                                                                      \
			
 
				 } while (0)
			
 
				+#endif
			
 
				 
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+#define _STARPU_PTHREAD_RWLOCK_WRLOCK(rwlock) _STARPU_PTHREAD_MUTEX_LOCK(rwlock)
			
 
				+#else
			
 
				 #define _STARPU_PTHREAD_RWLOCK_WRLOCK(rwlock) do {                             \
			
 
				 	int p_ret = pthread_rwlock_wrlock(rwlock);                             \
			
 
				 	if (STARPU_UNLIKELY(p_ret)) {                                          \
			
@@ -190,7 +278,11 @@ typedef pthread_rwlock_t _starpu_pthread_rwlock_t;
 
				 		STARPU_ABORT();                                                \
			
 
				 	}                                                                      \
			
 
				 } while (0)
			
 
				+#endif
			
 
				 
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+#define _STARPU_PTHREAD_RWLOCK_UNLOCK(rwlock) _STARPU_PTHREAD_MUTEX_UNLOCK(rwlock)
			
 
				+#else
			
 
				 #define _STARPU_PTHREAD_RWLOCK_UNLOCK(rwlock) do {                             \
			
 
				 	int p_ret = pthread_rwlock_unlock(rwlock);                             \
			
 
				 	if (STARPU_UNLIKELY(p_ret)) {                                          \
			
@@ -200,7 +292,11 @@ typedef pthread_rwlock_t _starpu_pthread_rwlock_t;
 
				 		STARPU_ABORT();                                                \
			
 
				 	}                                                                      \
			
 
				 } while (0)
			
 
				+#endif
			
 
				 
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+#define _STARPU_PTHREAD_RWLOCK_DESTROY(rwlock) _STARPU_PTHREAD_MUTEX_DESTROY(rwlock)
			
 
				+#else
			
 
				 #define _STARPU_PTHREAD_RWLOCK_DESTROY(rwlock) do {                            \
			
 
				 	int p_ret = pthread_rwlock_destroy(rwlock);                            \
			
 
				 	if (STARPU_UNLIKELY(p_ret)) {                                          \
			
@@ -210,11 +306,22 @@ typedef pthread_rwlock_t _starpu_pthread_rwlock_t;
 
				 		STARPU_ABORT();                                                \
			
 
				 	}                                                                      \
			
 
				 } while (0)
			
 
				+#endif
			
 
				 
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+typedef xbt_cond_t _starpu_pthread_cond_t;
			
 
				+#else
			
 
				 typedef pthread_cond_t _starpu_pthread_cond_t;
			
 
				+#endif
			
 
				 /*
			
 
				  * Encapsulation of the pthread_cond_* functions.
			
 
				  */
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+#define _STARPU_PTHREAD_COND_INITIALIZER NULL
			
 
				+#define _STARPU_PTHREAD_COND_INIT(cond, attr) do {                             \
			
 
				+	(*cond) = xbt_cond_init();                                             \
			
 
				+} while (0)
			
 
				+#else
			
 
				 #define _STARPU_PTHREAD_COND_INITIALIZER PTHREAD_COND_INITIALIZER
			
 
				 #define _STARPU_PTHREAD_COND_INIT(cond, attr) do {                             \
			
 
				 	int p_ret = pthread_cond_init((cond), (attr));                         \
			
@@ -225,7 +332,14 @@ typedef pthread_cond_t _starpu_pthread_cond_t;
 
				 		STARPU_ABORT();                                                \
			
 
				 	}                                                                      \
			
 
				 } while (0)
			
 
				+#endif
			
 
				 
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+#define _STARPU_PTHREAD_COND_DESTROY(cond) do {                                \
			
 
				+	if (*cond)                                                             \
			
 
				+		xbt_cond_destroy((*cond));                                     \
			
 
				+} while (0)
			
 
				+#else
			
 
				 #define _STARPU_PTHREAD_COND_DESTROY(cond) do {                                \
			
 
				 	int p_ret = pthread_cond_destroy(cond);                                \
			
 
				 	if (STARPU_UNLIKELY(p_ret)) {                                          \
			
@@ -235,7 +349,15 @@ typedef pthread_cond_t _starpu_pthread_cond_t;
 
				 			STARPU_ABORT();                                        \
			
 
				 	}                                                                      \
			
 
				 } while (0)
			
 
				+#endif
			
 
				 
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+#define _STARPU_PTHREAD_COND_SIGNAL(cond) do {                                 \
			
 
				+	if (!*cond)                                                            \
			
 
				+		_STARPU_PTHREAD_COND_INIT(cond, NULL);                         \
			
 
				+	xbt_cond_signal((*cond));                                              \
			
 
				+} while (0)
			
 
				+#else
			
 
				 #define _STARPU_PTHREAD_COND_SIGNAL(cond) do {                                 \
			
 
				 	int p_ret = pthread_cond_signal(cond);                                 \
			
 
				 	if (STARPU_UNLIKELY(p_ret)) {                                          \
			
@@ -245,7 +367,15 @@ typedef pthread_cond_t _starpu_pthread_cond_t;
 
				 		STARPU_ABORT();                                                \
			
 
				 	}                                                                      \
			
 
				 } while (0)
			
 
				+#endif
			
 
				 
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+#define _STARPU_PTHREAD_COND_BROADCAST(cond) do {                              \
			
 
				+	if (!*cond)                                                            \
			
 
				+		_STARPU_PTHREAD_COND_INIT(cond, NULL);                         \
			
 
				+	xbt_cond_broadcast((*cond));                                           \
			
 
				+} while (0)
			
 
				+#else
			
 
				 #define _STARPU_PTHREAD_COND_BROADCAST(cond) do {                              \
			
 
				 	int p_ret = pthread_cond_broadcast(cond);                              \
			
 
				 	if (STARPU_UNLIKELY(p_ret)) {                                          \
			
@@ -255,7 +385,15 @@ typedef pthread_cond_t _starpu_pthread_cond_t;
 
				 		STARPU_ABORT();                                                \
			
 
				 	}                                                                      \
			
 
				 } while (0)
			
 
				+#endif
			
 
				 
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+#define _STARPU_PTHREAD_COND_WAIT(cond, mutex) do {                            \
			
 
				+	if (!*cond)                                                            \
			
 
				+		_STARPU_PTHREAD_COND_INIT(cond, NULL);                         \
			
 
				+	xbt_cond_wait((*cond), (*mutex));                                      \
			
 
				+} while (0)
			
 
				+#else
			
 
				 #define _STARPU_PTHREAD_COND_WAIT(cond, mutex) do {                            \
			
 
				 	int p_ret = pthread_cond_wait((cond), (mutex));                        \
			
 
				 	if (STARPU_UNLIKELY(p_ret)) {                                          \
			
@@ -265,6 +403,7 @@ typedef pthread_cond_t _starpu_pthread_cond_t;
 
				 		STARPU_ABORT();                                                \
			
 
				 	}                                                                      \
			
 
				 } while (0)
			
 
				+#endif
			
 
				 
			
 
				 #include <common/barrier.h>
			
 
				 
			
--- a/src/core/perfmodel/perfmodel.h
+++ b/src/core/perfmodel/perfmodel.h
@@ -1,6 +1,6 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				- * Copyright (C) 2009, 2010, 2011  Université de Bordeaux 1
			
 
				+ * Copyright (C) 2009-2012  Université de Bordeaux 1
			
 
				  * Copyright (C) 2010, 2011, 2012  Centre National de la Recherche Scientifique
			
 
				  * Copyright (C) 2011  Télécom-SudParis
			
 
				  *
			
@@ -60,6 +60,8 @@ void _starpu_update_perfmodel_history(struct _starpu_job *j, struct starpu_perfm
 
				 void _starpu_create_sampling_directory_if_needed(void);
			
 
				 
			
 
				 void _starpu_load_bus_performance_files(void);
			
 
				+double _starpu_transfer_bandwidth(unsigned src_node, unsigned dst_node);
			
 
				+double _starpu_transfer_latency(unsigned src_node, unsigned dst_node);
			
 
				 double _starpu_predict_transfer_time(unsigned src_node, unsigned dst_node, size_t size);
			
 
				 
			
 
				 
			
--- a/src/core/perfmodel/perfmodel_bus.c
+++ b/src/core/perfmodel/perfmodel_bus.c
@@ -44,7 +44,9 @@
 
				 #define SIZE	(32*1024*1024*sizeof(char))
			
 
				 #define NITER	128
			
 
				 
			
 
				+#ifndef STARPU_SIMGRID
			
 
				 static void starpu_force_bus_sampling(void);
			
 
				+#endif
			
 
				 
			
 
				 /* timing is in µs per byte (i.e. slowness, inverse of bandwidth) */
			
 
				 struct dev_timing
			
@@ -84,7 +86,7 @@ static struct dev_timing opencldev_timing_per_cpu[STARPU_MAXNODES*STARPU_MAXCPUS
 
				 static hwloc_topology_t hwtopology;
			
 
				 #endif
			
 
				 
			
 
				-#if defined(STARPU_USE_CUDA) || defined(STARPU_USE_OPENCL)
			
 
				+#if (defined(STARPU_USE_CUDA) || defined(STARPU_USE_OPENCL)) && !defined(STARPU_SIMGRID)
			
 
				 
			
 
				 #ifdef STARPU_USE_CUDA
			
 
				 
			
@@ -529,6 +531,10 @@ static void measure_bandwidth_between_host_and_dev(int dev, double *dev_timing_h
 
				 
			
 
				 static void benchmark_all_gpu_devices(void)
			
 
				 {
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+	_STARPU_DISP("can not measure bus in simgrid mode\n");
			
 
				+	STARPU_ABORT();
			
 
				+#else /* !SIMGRID */
			
 
				 #if defined(STARPU_USE_CUDA) || defined(STARPU_USE_OPENCL)
			
 
				 	int i;
			
 
				 #endif
			
@@ -611,6 +617,7 @@ static void benchmark_all_gpu_devices(void)
 
				 	_STARPU_DEBUG("Benchmarking the speed of the bus is done.\n");
			
 
				 
			
 
				 	was_benchmarked = 1;
			
 
				+#endif /* !SIMGRID */
			
 
				 }
			
 
				 
			
 
				 static void get_bus_path(const char *type, char *path, size_t maxlen)
			
@@ -632,6 +639,7 @@ static void get_bus_path(const char *type, char *path, size_t maxlen)
 
				  *	Affinity
			
 
				  */
			
 
				 
			
 
				+#ifndef STARPU_SIMGRID
			
 
				 static void get_affinity_path(char *path, size_t maxlen)
			
 
				 {
			
 
				 	get_bus_path("affinity", path, maxlen);
			
@@ -788,6 +796,7 @@ static void load_bus_affinity_file(void)
 
				 
			
 
				 	load_bus_affinity_file_content();
			
 
				 }
			
 
				+#endif /* !SIMGRID */
			
 
				 
			
 
				 #ifdef STARPU_USE_CUDA
			
 
				 int *_starpu_get_cuda_affinity_vector(unsigned gpuid)
			
@@ -1213,6 +1222,7 @@ static void load_bus_bandwidth_file(void)
 
				 	}
			
 
				 }
			
 
				 
			
 
				+#ifndef STARPU_SIMGRID
			
 
				 /*
			
 
				  *	Config
			
 
				  */
			
@@ -1329,17 +1339,32 @@ static void starpu_force_bus_sampling(void)
 
				 	generate_bus_bandwidth_file();
			
 
				         generate_bus_config_file();
			
 
				 }
			
 
				+#endif /* !SIMGRID */
			
 
				 
			
 
				 void _starpu_load_bus_performance_files(void) /* load the bus performance files (affinity, latency, bandwidth) */
				 {
				 	_starpu_create_sampling_directory_if_needed(); /* runs first, ahead of every load below */
				 
				+#ifndef STARPU_SIMGRID /* the config check and the affinity load are compiled out of simgrid builds */
				         check_bus_config_file();
				 	load_bus_affinity_file();
				+#endif
				 	load_bus_latency_file(); /* latency and bandwidth are loaded in every build, simgrid included */
				 	load_bus_bandwidth_file();
				 }
			
 
				 
			
 
				+/* Return the bandwidth_matrix entry for the (src_node, dst_node) pair (in MB/s); the node indices are not range-checked */
				+double _starpu_transfer_bandwidth(unsigned src_node, unsigned dst_node)
				+{
				+	return bandwidth_matrix[src_node][dst_node];
				+}
			
 
				+
			
 
				+/* Return the latency_matrix entry for the (src_node, dst_node) pair (in µs); the node indices are not range-checked */
				+double _starpu_transfer_latency(unsigned src_node, unsigned dst_node)
				+{
				+	return latency_matrix[src_node][dst_node];
				+}
			
 
				+
			
 
				 /* (in µs) */
			
 
				 double _starpu_predict_transfer_time(unsigned src_node, unsigned dst_node, size_t size)
			
 
				 {
			
--- a/src/core/simgrid.c
+++ b/src/core/simgrid.c
@@ -0,0 +1,275 @@
 
				+/* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				+ *
			
 
				+ * Copyright (C) 2012  Université de Bordeaux 1
			
 
				+ *
			
 
				+ * StarPU is free software; you can redistribute it and/or modify
			
 
				+ * it under the terms of the GNU Lesser General Public License as published by
			
 
				+ * the Free Software Foundation; either version 2.1 of the License, or (at
			
 
				+ * your option) any later version.
			
 
				+ *
			
 
				+ * StarPU is distributed in the hope that it will be useful, but
			
 
				+ * WITHOUT ANY WARRANTY; without even the implied warranty of
			
 
				+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
			
 
				+ *
			
 
				+ * See the GNU Lesser General Public License in COPYING.LGPL for more details.
			
 
				+ */
			
 
				+
			
 
				+#include <starpu.h>
			
 
				+#include <datawizard/memory_nodes.h>
			
 
				+#include <unistd.h>
			
 
				+#include <core/perfmodel/perfmodel.h>
			
 
				+#include <core/workers.h>
			
 
				+
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+#include <msg/msg.h>
			
 
				+
			
 
				+#define MAX_TSD 16
			
 
				+
			
 
				+#pragma weak starpu_main
			
 
				+extern int starpu_main(int argc, char *argv[]);
			
 
				+
			
 
				+/*
				+ * Write into s (at most size bytes, NUL included) the platform name of
				+ * bus end-point number num: 0 is "RAM", 1..conf->ncuda are "CUDA<n>"
				+ * counted from 0, and anything above is "OpenCL<n>" counted from 0.
				+ */
				+static void bus_name(struct starpu_conf *conf, char *s, size_t size, int num)
				+{
				+	if (num == 0)
				+	{
				+		snprintf(s, size, "RAM");
				+		return;
				+	}
				+
				+	if (num < conf->ncuda + 1)
				+	{
				+		int cuda_index = num - 1;
				+		snprintf(s, size, "CUDA%d", cuda_index);
				+		return;
				+	}
				+
				+	/* Past the CUDA range: number the OpenCL devices from 0 again */
				+	int opencl_index = num - conf->ncuda - 1;
				+	snprintf(s, size, "OpenCL%d", opencl_index);
				+}
			
 
				+
			
 
				+#ifdef STARPU_DEVEL
			
 
				+#warning TODO: use another way to start main, when simgrid provides it, and then include the application-provided configuration for platform numbers
			
 
				+#endif
			
 
				+#undef main
			
 
				+/*
				+ * Simulation entry point.  It takes the place of the application's main(),
				+ * which must be reachable through the weak symbol starpu_main.  It
				+ * initializes MSG, writes a temporary simgrid platform file (hosts, links
				+ * and routes built from the StarPU configuration and from the bus
				+ * bandwidth/latency values), loads that file, and starts starpu_main as
				+ * the "main" process on the host at index 0 of MSG_hosts_as_dynar().
				+ *
				+ * Returns 0 once MSG_main() returns.  Exits with EXIT_FAILURE when
				+ * starpu_main is not defined, when one of the STARPU_NCPUS / STARPU_NCUDA /
				+ * STARPU_NOPENCL variables required by this build is not set, or when the
				+ * platform file cannot be created or written.
				+ */
				+int main(int argc, char **argv)
				+{
				+	xbt_dynar_t hosts;
				+	int i, j;
				+	char name[] = "/tmp/starpu-simgrid-platform.xml.XXXXXX";
				+	int fd;
				+	FILE *file;
				+	struct starpu_machine_topology *topology = &_starpu_get_machine_config()->topology;
				+
				+	if (!starpu_main)
				+	{
				+		fprintf(stderr,"The main file of this application needs to be compiled with starpu.h included, to properly define starpu_main\n");
				+		exit(EXIT_FAILURE);
				+	}
				+
				+	MSG_init(&argc, argv);
				+	MSG_config("workstation/model", "ptask_L07");
				+
				+	/* Create platform file */
				+	struct starpu_conf conf;
				+	starpu_conf_init(&conf);
				+	if (!getenv("STARPU_NCPUS")
				+#ifdef STARPU_USE_CUDA
				+	 || !getenv("STARPU_NCUDA")
				+#endif
				+#ifdef STARPU_USE_OPENCL
				+	 || !getenv("STARPU_NOPENCL")
				+#endif
				+			)
				+	{
				+		fprintf(stderr,"Please specify the number of cpus and gpus\n");
				+		exit(EXIT_FAILURE);
				+	}
				+	_starpu_conf_check_environment(&conf);
				+
				+	_starpu_load_bus_performance_files();
				+
				+	topology->ncpus = conf.ncpus;
				+	topology->ncudagpus = conf.ncuda;
				+	topology->nopenclgpus = conf.nopencl;
				+
				+	fd = mkstemp(name);
				+	if (fd < 0)
				+	{
				+		perror("mkstemp");
				+		exit(EXIT_FAILURE);
				+	}
				+	file = fdopen(fd, "w");
				+	if (!file)
				+	{
				+		perror("fdopen");
				+		/* The stream was not created, so the descriptor is still ours to close */
				+		close(fd);
				+		unlink(name);
				+		exit(EXIT_FAILURE);
				+	}
				+	fprintf(file,
				+"<?xml version='1.0'?>\n"
				+" <!DOCTYPE platform SYSTEM 'http://simgrid.gforge.inria.fr/simgrid.dtd'>\n"
				+" <platform version='3'>\n"
				+" <AS  id='AS0'  routing='Full'>\n"
				+"   <host id='MAIN' power='1'/>\n"
				+		);
				+
				+	for (i = 0; i < conf.ncpus; i++)
				+		fprintf(file, "   <host id='CPU%d' power='2000000000'/>\n", i);
				+
				+	for (i = 0; i < conf.ncuda; i++)
				+		fprintf(file, "   <host id='CUDA%d' power='2000000000'/>\n", i);
				+
				+	for (i = 0; i < conf.nopencl; i++)
				+		fprintf(file, "   <host id='OpenCL%d' power='2000000000'/>\n", i);
				+
				+	fprintf(file, "\n   <host id='RAM' power='1'/>\n");
				+
				+	/* Compute maximum bandwidth, taken as machine bandwidth */
				+	double max_bandwidth = 0;
				+	for (i = 1; i < conf.ncuda + conf.nopencl + 1; i++)
				+	{
				+		if (max_bandwidth < _starpu_transfer_bandwidth(0, i))
				+			max_bandwidth = _starpu_transfer_bandwidth(0, i);
				+		if (max_bandwidth < _starpu_transfer_bandwidth(i, 0))
				+			max_bandwidth = _starpu_transfer_bandwidth(i, 0);
				+	}
				+	/* Bandwidths are scaled by 1000000 and latencies divided by 1000000 when written to the platform file */
				+	fprintf(file, "\n   <link id='Share' bandwidth='%f' latency='0.000000'/>\n\n", max_bandwidth*1000000);
				+
				+	/* One directed link per ordered pair of distinct bus end-points */
				+	for (i = 0; i < conf.ncuda + conf.nopencl + 1; i++)
				+	{
				+		char i_name[16];
				+		bus_name(&conf, i_name, sizeof(i_name), i);
				+
				+		for (j = 0; j < conf.ncuda + conf.nopencl + 1; j++)
				+		{
				+			char j_name[16];
				+			if (j == i)
				+				continue;
				+			bus_name(&conf, j_name, sizeof(j_name), j);
				+			fprintf(file, "   <link id='%s-%s' bandwidth='%f' latency='%f'/>\n",
				+				i_name, j_name,
				+				_starpu_transfer_bandwidth(i, j) * 1000000,
				+				_starpu_transfer_latency(i, j) / 1000000);
				+		}
				+	}
				+
				+	/* One route per ordered pair, going through its own link and the shared one */
				+	for (i = 0; i < conf.ncuda + conf.nopencl + 1; i++)
				+	{
				+		char i_name[16];
				+		bus_name(&conf, i_name, sizeof(i_name), i);
				+
				+		for (j = 0; j < conf.ncuda + conf.nopencl + 1; j++)
				+		{
				+			char j_name[16];
				+			if (j == i)
				+				continue;
				+			bus_name(&conf, j_name, sizeof(j_name), j);
				+			fprintf(file,
				+"   <route src='%s' dst='%s' symmetrical='NO'><link_ctn id='%s-%s'/><link_ctn id='Share'/></route>\n",
				+				i_name, j_name, i_name, j_name);
				+		}
				+	}
				+
				+	fprintf(file,
				+" </AS>\n"
				+" </platform>\n"
				+		);
				+	/* fclose() flushes the stream and closes fd as well, so fd must not be
				+	 * closed a second time; a failure here means the file is incomplete */
				+	if (fclose(file) != 0)
				+	{
				+		perror("fclose");
				+		unlink(name);
				+		exit(EXIT_FAILURE);
				+	}
				+
				+	/* and load it */
				+	MSG_create_environment(name);
				+	unlink(name);
				+
				+	hosts = MSG_hosts_as_dynar();
				+	int nb = xbt_dynar_length(hosts);
				+	/* Each host gets a zeroed array of MAX_TSD slots as its data; it backs _starpu_pthread_{set,get}specific */
				+	for (i = 0; i < nb; i++)
				+		MSG_host_set_data(xbt_dynar_get_as(hosts, i, msg_host_t), calloc(MAX_TSD, sizeof(void*)));
				+	MSG_process_create("main", &starpu_main, NULL, xbt_dynar_get_as(hosts, 0, msg_host_t));
				+	xbt_dynar_free(&hosts);
				+
				+	MSG_main();
				+	return 0;
				+}
			
 
				+
			
 
				+/*
				+ * Simulate the execution of job j on the calling simulated host.
				+ *
				+ * The duration is the length expected by the performance model for
				+ * perf_arch and implementation j->nimpl.  It is divided by 1000000 and
				+ * multiplied by the speed of the current host to obtain the amount of
				+ * computation given to the MSG task.  Aborts through STARPU_ASSERT_MSG
				+ * when the expected length is zero or NaN.
				+ */
				+void _starpu_simgrid_execute_job(struct _starpu_job *j, enum starpu_perf_archtype perf_arch)
				+{
				+	struct starpu_task *task = j->task;
				+	msg_task_t simgrid_task;
				+	double length = starpu_task_expected_length(task, perf_arch, j->nimpl);
				+
				+	STARPU_ASSERT_MSG(!_STARPU_IS_ZERO(length) && !isnan(length), "Codelets need to have a calibrated perfmodel");
				+
				+	simgrid_task = MSG_task_create(_starpu_job_get_model_name(j),
				+			length/1000000.0*MSG_get_host_speed(MSG_host_self()),
				+			0, NULL);
				+	MSG_task_execute(simgrid_task);
				+	/* Release the task once it has run, as transfer_execute() does for
				+	 * transfer tasks; otherwise one task is leaked per executed job */
				+	MSG_task_destroy(simgrid_task);
				+}
			
 
				+
			
 
				+/*
				+ * Build the MSG parallel task "copy" that models the transfer of size
				+ * bytes from memory node src_node to memory node dst_node.
				+ *
				+ * The task spans the two hosts attached to these memory nodes, with no
				+ * computation and a single non-zero entry in the 2x2 communication
				+ * array: index 1, i.e. from hosts[0] (source) to hosts[1] (destination).
				+ * The task is returned without being executed.
				+ */
				+msg_task_t _starpu_simgrid_transfer_task_create(unsigned src_node, unsigned dst_node, size_t size)
				+{
				+	/* Each array is sized from its own element type: the amounts are
				+	 * doubles, which need not be as wide as a msg_host_t */
				+	msg_host_t *hosts = calloc(2, sizeof(*hosts));
				+	double *computation = calloc(2, sizeof(*computation));
				+	double *communication = calloc(4, sizeof(*communication));
				+
				+	STARPU_ASSERT(hosts && computation && communication);
				+
				+	hosts[0] = _starpu_simgrid_memory_node_get_host(src_node);
				+	hosts[1] = _starpu_simgrid_memory_node_get_host(dst_node);
				+	communication[1] = size;
				+
				+	/* NOTE(review): the three arrays are handed to the task and not freed
				+	 * here -- presumably MSG releases them with the task; confirm */
				+	return MSG_parallel_task_create("copy", 2, hosts, computation, communication, NULL);
				+}
			
 
				+
			
 
				+struct completion { /* what a "transfer task" process needs to run a task and report that it is done */
				+	msg_task_t task; /* executed, then destroyed, by transfer_execute() */
				+	unsigned *finished; /* set to 1 by transfer_execute() once the task has been executed */
				+	_starpu_pthread_mutex_t *mutex; /* held while *finished is written and cond is broadcast */
				+	_starpu_pthread_cond_t *cond; /* broadcast after *finished is set */
				+};
			
 
				+
			
 
				+int transfer_execute(int argc STARPU_ATTRIBUTE_UNUSED, char *argv[] STARPU_ATTRIBUTE_UNUSED) /* body of the "transfer task" process created by _starpu_simgrid_post_task(); always returns 0 */
				+{
				+	struct completion *completion = MSG_process_get_data(MSG_process_self()); /* the struct completion attached as process data */
				+	MSG_task_execute(completion->task);
				+	MSG_task_destroy(completion->task); /* the task is not used past this point */
				+	_STARPU_PTHREAD_MUTEX_LOCK(completion->mutex);
				+	*completion->finished = 1; /* flag and broadcast both happen with the mutex held */
				+	fprintf(stderr, "transfer finished\n");
				+	_STARPU_PTHREAD_COND_BROADCAST(completion->cond);
				+	_STARPU_PTHREAD_MUTEX_UNLOCK(completion->mutex);
				+	free(completion); /* was allocated with malloc() in _starpu_simgrid_post_task() */
				+	return 0;
				+}
			
 
				+
			
 
				+/*
				+ * Run task asynchronously: a "transfer task" process is created on the
				+ * host at index 0 of MSG_hosts_as_dynar() with transfer_execute() as its
				+ * body.  That process executes the task, then sets *finished to 1 and
				+ * broadcasts cond while holding mutex.  The bookkeeping structure
				+ * allocated here is freed by transfer_execute().
				+ */
				+void _starpu_simgrid_post_task(msg_task_t task, unsigned *finished, _starpu_pthread_mutex_t *mutex, _starpu_pthread_cond_t *cond)
				+{
				+	xbt_dynar_t all_hosts;
				+	struct completion *pending = malloc(sizeof (struct completion));
				+
				+	/* Everything the process needs to run the task and signal its end */
				+	pending->cond = cond;
				+	pending->mutex = mutex;
				+	pending->finished = finished;
				+	pending->task = task;
				+
				+	all_hosts = MSG_hosts_as_dynar();
				+	MSG_process_create("transfer task", transfer_execute, pending, xbt_dynar_get_as(all_hosts, 0, msg_host_t));
				+	fprintf(stderr,"process started\n");
				+	xbt_dynar_free(&all_hosts);
				+}
			
 
				+
			
 
				+static int last_key;
			
 
				+
			
 
				+/*
				+ * Hand out the next unused key, i.e. the next index into the per-host
				+ * arrays of MAX_TSD slots.  Asserts that fewer than MAX_TSD keys have been
				+ * handed out so far.  Always returns 0.
				+ */
				+int _starpu_pthread_key_create(_starpu_pthread_key_t *key)
				+{
				+	/* Note: no synchronization here, we are actually monothreaded anyway. */
				+	STARPU_ASSERT(last_key < MAX_TSD);
				+
				+	*key = last_key;
				+	last_key++;
				+
				+	return 0;
				+}
			
 
				+
			
 
				+int _starpu_pthread_key_delete(_starpu_pthread_key_t key) /* placeholder: key is ignored and nothing is released, see the TODO below */
				+{
				+#ifdef STARPU_DEVEL
				+#warning TODO: implement pthread_key_delete so simgridified starpu can be restarted at will
				+#endif
				+	return 0; /* always reports success */
				+}
			
 
				+
			
 
				+/*
				+ * Store ptr in slot key of the array attached as data to the current
				+ * host.  key is not range-checked.  Always returns 0.
				+ */
				+int _starpu_pthread_setspecific(_starpu_pthread_key_t key, void *ptr)
				+{
				+	msg_host_t self = MSG_host_self();
				+	void **slots = MSG_host_get_data(self);
				+
				+	slots[key] = ptr;
				+	return 0;
				+}
			
 
				+
			
 
				+/*
				+ * Return the pointer held in slot key of the array attached as data to
				+ * the current host.  key is not range-checked.
				+ */
				+void* _starpu_pthread_getspecific(_starpu_pthread_key_t key)
				+{
				+	msg_host_t self = MSG_host_self();
				+	void **slots = MSG_host_get_data(self);
				+
				+	return slots[key];
				+}
			
 
				+
			
 
				+int
				+_starpu_simgrid_thread_start(int argc STARPU_ATTRIBUTE_UNUSED, char *argv[] STARPU_ATTRIBUTE_UNUSED) /* process body: runs args->f(args->arg) for the args attached as process data; always returns 0 */
				+{
				+	struct _starpu_pthread_args *args = MSG_process_get_data(MSG_process_self());
				+	args->f(args->arg); /* whatever f returns is not used */
				+	free(args); /* args is released here, after f has returned */
				+	return 0;
				+}
			
 
				+#endif
			
--- a/src/core/simgrid.h
+++ b/src/core/simgrid.h
@@ -0,0 +1,28 @@
 
				+/* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				+ *
			
 
				+ * Copyright (C) 2012  Université de Bordeaux 1
			
 
				+ *
			
 
				+ * StarPU is free software; you can redistribute it and/or modify
			
 
				+ * it under the terms of the GNU Lesser General Public License as published by
			
 
				+ * the Free Software Foundation; either version 2.1 of the License, or (at
			
 
				+ * your option) any later version.
			
 
				+ *
			
 
				+ * StarPU is distributed in the hope that it will be useful, but
			
 
				+ * WITHOUT ANY WARRANTY; without even the implied warranty of
			
 
				+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
			
 
				+ *
			
 
				+ * See the GNU Lesser General Public License in COPYING.LGPL for more details.
			
 
				+ */
			
 
				+
			
 
				+#ifndef __SIMGRID_H__
			
 
				+#define __SIMGRID_H__
			
 
				+
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+#include <msg/msg.h>
			
 
				+
			
 
				+void _starpu_simgrid_execute_job(struct _starpu_job *job, enum starpu_perf_archtype perf_arch);
			
 
				+msg_task_t _starpu_simgrid_transfer_task_create(unsigned src_node, unsigned dst_node, size_t size);
			
 
				+void _starpu_simgrid_post_task(msg_task_t task, unsigned *finished, _starpu_pthread_mutex_t *mutex, _starpu_pthread_cond_t *cond);
			
 
				+#endif
			
 
				+
			
 
				+#endif // __SIMGRID_H__
			
--- a/src/core/topology.c
+++ b/src/core/topology.c
@@ -37,6 +37,11 @@
 
				 #include <windows.h>
			
 
				 #endif
			
 
				 
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+#include <msg/msg.h>
			
 
				+#include <core/simgrid.h>
			
 
				+#endif
			
 
				+
			
 
				 static unsigned topology_is_initialized = 0;
			
 
				 
			
 
				 #if defined(STARPU_USE_CUDA) || defined(STARPU_USE_OPENCL)
			
@@ -266,6 +271,12 @@ _starpu_init_topology (struct _starpu_machine_config *config)
 
				 	if (topology_is_initialized)
			
 
				 		return;
			
 
				 
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+	struct starpu_conf *conf = config->conf;
			
 
				+	topology->nhwcpus = conf->ncpus;
			
 
				+	topology->nhwcudagpus = conf->ncuda;
			
 
				+	topology->nhwopenclgpus = conf->nopencl;
			
 
				+#else
			
 
				 	topology->nhwcpus = 0;
			
 
				 
			
 
				 #ifdef STARPU_HAVE_HWLOC
			
@@ -276,6 +287,7 @@ _starpu_init_topology (struct _starpu_machine_config *config)
 
				 	_starpu_cpu_discover_devices(config);
			
 
				 	_starpu_cuda_discover_devices(config);
			
 
				 	_starpu_opencl_discover_devices(config);
			
 
				+#endif
			
 
				 
			
 
				 	topology_is_initialized = 1;
			
 
				 }
			
@@ -450,6 +462,7 @@ _starpu_init_machine_config (struct _starpu_machine_config *config)
 
				 #ifdef STARPU_USE_CUDA
			
 
				 	int ncuda = config->conf->ncuda;
			
 
				 
			
 
				+#ifndef STARPU_SIMGRID
			
 
				 	if (ncuda != 0)
			
 
				 	{
			
 
				 		/* The user did not disable CUDA. We need to initialize CUDA
			
@@ -473,6 +486,7 @@ _starpu_init_machine_config (struct _starpu_machine_config *config)
 
				 			}
			
 
				 		}
			
 
				 	}
			
 
				+#endif
			
 
				 
			
 
				 	/* Now we know how many CUDA devices will be used */
			
 
				 	topology->ncudagpus = ncuda;
			
@@ -506,6 +520,7 @@ _starpu_init_machine_config (struct _starpu_machine_config *config)
 
				 #ifdef STARPU_USE_OPENCL
			
 
				 	int nopencl = config->conf->nopencl;
			
 
				 
			
 
				+#ifndef STARPU_SIMGRID
			
 
				 	if (nopencl != 0)
			
 
				 	{
			
 
				 		/* The user did not disable OPENCL. We need to initialize
			
@@ -542,6 +557,7 @@ _starpu_init_machine_config (struct _starpu_machine_config *config)
 
				 			}
			
 
				 		}
			
 
				 	}
			
 
				+#endif
			
 
				 
			
 
				 	topology->nopenclgpus = nopencl;
			
 
				 	STARPU_ASSERT(topology->nopenclgpus + topology->nworkers <= STARPU_NMAXWORKERS);
			
@@ -669,6 +685,9 @@ _starpu_bind_thread_on_cpu (
 
				 	struct _starpu_machine_config *config STARPU_ATTRIBUTE_UNUSED,
			
 
				 	unsigned cpuid)
			
 
				 {
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+	return;
			
 
				+#endif
			
 
				 	if (starpu_get_env_number("STARPU_WORKERS_NOBIND") > 0)
			
 
				 		return;
			
 
				 #ifdef STARPU_HAVE_HWLOC
			
@@ -732,8 +751,11 @@ _starpu_bind_thread_on_cpu (
 
				 void
			
 
				 _starpu_bind_thread_on_cpus (
			
 
				 	struct _starpu_machine_config *config STARPU_ATTRIBUTE_UNUSED,
			
 
				-	struct _starpu_combined_worker *combined_worker)
			
 
				+	struct _starpu_combined_worker *combined_worker STARPU_ATTRIBUTE_UNUSED)
			
 
				 {
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+	return;
			
 
				+#endif
			
 
				 #ifdef STARPU_HAVE_HWLOC
			
 
				 	const struct hwloc_topology_support *support;
			
 
				 
			
@@ -779,6 +801,18 @@ _starpu_init_workers_binding (struct _starpu_machine_config *config)
 
				 	/* TODO : support NUMA  ;) */
			
 
				 	ram_memory_node = _starpu_register_memory_node(STARPU_CPU_RAM, -1);
			
 
				 
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+	xbt_dynar_t hosts = MSG_hosts_as_dynar();
			
 
				+	int nb = xbt_dynar_length(hosts), i;
			
 
				+	for (i = 0; i < nb; i++) {
			
 
				+		msg_host_t host = xbt_dynar_get_as(hosts, i, msg_host_t);
			
 
				+		if (!memcmp(MSG_host_get_name(host), "RAM", 4)) {
			
 
				+			_starpu_simgrid_memory_node_set_host(0, host);
			
 
				+			break;
			
 
				+		}
			
 
				+	}
			
 
				+#endif
			
 
				+
			
 
				 	/* We will store all the busid of the different (src, dst)
			
 
				 	 * combinations in a matrix which we initialize here. */
			
 
				 	_starpu_initialize_busid_matrix();
			
@@ -820,6 +854,9 @@ _starpu_init_workers_binding (struct _starpu_machine_config *config)
 
				 				}
			
 
				 				is_a_set_of_accelerators = 0;
			
 
				 				memory_node = _starpu_register_memory_node(STARPU_CUDA_RAM, workerarg->devid);
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+				_starpu_simgrid_memory_node_set_host(memory_node, xbt_dynar_get_as(hosts, worker+1, msg_host_t));
			
 
				+#endif
			
 
				 				_starpu_memory_node_worker_add(memory_node);
			
 
				 
			
 
				 				_starpu_register_bus(0, memory_node);
			
@@ -850,6 +887,9 @@ _starpu_init_workers_binding (struct _starpu_machine_config *config)
 
				 				}
			
 
				 				is_a_set_of_accelerators = 0;
			
 
				 				memory_node = _starpu_register_memory_node(STARPU_OPENCL_RAM, workerarg->devid);
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+				_starpu_simgrid_memory_node_set_host(memory_node, xbt_dynar_get_as(hosts, worker+1, msg_host_t));
			
 
				+#endif
			
 
				 				_starpu_memory_node_worker_add(memory_node);
			
 
				 				_starpu_register_bus(0, memory_node);
			
 
				 				_starpu_register_bus(memory_node, 0);
			
@@ -899,6 +939,9 @@ _starpu_init_workers_binding (struct _starpu_machine_config *config)
 
				 			hwloc_bitmap_dup (worker_obj->cpuset);
			
 
				 #endif
			
 
				 	}
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+	xbt_dynar_free(&hosts);
			
 
				+#endif
			
 
				 }
			
 
				 
			
 
				 
			
--- a/src/core/workers.c
+++ b/src/core/workers.c
@@ -32,6 +32,10 @@
 
				 #include <drivers/cuda/driver_cuda.h>
			
 
				 #include <drivers/opencl/driver_opencl.h>
			
 
				 
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+#include <msg/msg.h>
			
 
				+#endif
			
 
				+
			
 
				 #ifdef __MINGW32__
			
 
				 #include <windows.h>
			
 
				 #endif
			
@@ -383,11 +387,13 @@ static void _starpu_launch_drivers(struct _starpu_machine_config *config)
 
				 				driver.id.cpu_id = cpu;
			
 
				 				if (_starpu_may_launch_driver(config->conf, &driver))
			
 
				 				{
			
 
				-					_STARPU_PTHREAD_CREATE(
			
 
				+					_STARPU_PTHREAD_CREATE_ON(
			
 
				+						workerarg->name,
			
 
				 						&workerarg->worker_thread,
			
 
				 						NULL,
			
 
				 						_starpu_cpu_worker,
			
 
				-						workerarg);
			
 
				+						workerarg,
			
 
				+						worker+1);
			
 
				 				}
			
 
				 				else
			
 
				 				{
			
@@ -403,11 +409,13 @@ static void _starpu_launch_drivers(struct _starpu_machine_config *config)
 
				 				driver.id.cuda_id = cuda;
			
 
				 				if (_starpu_may_launch_driver(config->conf, &driver))
			
 
				 				{
			
 
				-					_STARPU_PTHREAD_CREATE(
			
 
				+					_STARPU_PTHREAD_CREATE_ON(
			
 
				+						workerarg->name,
			
 
				 						&workerarg->worker_thread,
			
 
				 						NULL,
			
 
				 						_starpu_cuda_worker,
			
 
				-						workerarg);
			
 
				+						workerarg,
			
 
				+						worker+1);
			
 
				 				}
			
 
				 				else
			
 
				 				{
			
@@ -426,11 +434,13 @@ static void _starpu_launch_drivers(struct _starpu_machine_config *config)
 
				 				}
			
 
				 				workerarg->set = NULL;
			
 
				 				workerarg->worker_is_initialized = 0;
			
 
				-				_STARPU_PTHREAD_CREATE(
			
 
				+				_STARPU_PTHREAD_CREATE_ON(
			
 
				+					workerarg->name,
			
 
				 					&workerarg->worker_thread,
			
 
				 					NULL,
			
 
				 					_starpu_opencl_worker,
			
 
				-					workerarg);
			
 
				+					workerarg,
			
 
				+					worker+1);
			
 
				 				break;
			
 
				 #endif
			
 
				 #ifdef STARPU_USE_GORDON
			
@@ -444,11 +454,13 @@ static void _starpu_launch_drivers(struct _starpu_machine_config *config)
 
				 
			
 
				 					gordon_worker_set.set_is_initialized = 0;
			
 
				 
			
 
				-					_STARPU_PTHREAD_CREATE(
			
 
				+					_STARPU_PTHREAD_CREATE_ON(
			
 
				+						workerarg->name, /* name argument, as for the other drivers */
			
 
				 						&gordon_worker_set.worker_thread,
			
 
				 						NULL,
			
 
				 						_starpu_gordon_worker,
			
 
				-						&gordon_worker_set);
			
 
				+						&gordon_worker_set,
			
 
				+						worker+1);
			
 
				 
			
 
				 					_STARPU_PTHREAD_MUTEX_LOCK(&gordon_worker_set.mutex);
			
 
				 					while (!gordon_worker_set.set_is_initialized)
			
@@ -615,7 +627,7 @@ static void _starpu_conf_set_value_against_environment(char *name, int *value)
 
				 	}
			
 
				 }
			
 
				 
			
 
				-static void _starpu_conf_check_environment(struct starpu_conf *conf)
			
 
				+void _starpu_conf_check_environment(struct starpu_conf *conf)
			
 
				 {
			
 
				 	char *sched = getenv("STARPU_SCHED");
			
 
				 	if (sched)
			
@@ -787,6 +799,12 @@ static void _starpu_terminate_workers(struct _starpu_machine_config *config)
 
				 		{
			
 
				 			if (!set->joined)
			
 
				 			{
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+#ifdef STARPU_DEVEL
			
 
				+#warning TODO: use a simgrid_join when it becomes available
			
 
				+#endif
			
 
				+				MSG_process_sleep(1);
			
 
				+#else
			
 
				 				if (!pthread_equal(pthread_self(), set->worker_thread))
			
 
				 				{
			
 
				 					status = pthread_join(set->worker_thread, NULL);
			
@@ -797,6 +815,7 @@ static void _starpu_terminate_workers(struct _starpu_machine_config *config)
 
				                                         }
			
 
				 #endif
			
 
				 				}
			
 
				+#endif
			
 
				 
			
 
				 				set->joined = 1;
			
 
				 			}
			
@@ -806,6 +825,9 @@ static void _starpu_terminate_workers(struct _starpu_machine_config *config)
 
				 			if (!worker->run_by_starpu)
			
 
				 				goto out;
			
 
				 
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+			MSG_process_sleep(1);
			
 
				+#else
			
 
				 			if (!pthread_equal(pthread_self(), worker->worker_thread))
			
 
				 			{
			
 
				 				status = pthread_join(worker->worker_thread, NULL);
			
@@ -816,6 +838,7 @@ static void _starpu_terminate_workers(struct _starpu_machine_config *config)
 
				                                 }
			
 
				 #endif
			
 
				 			}
			
 
				+#endif
			
 
				 		}
			
 
				 
			
 
				 out:
			
--- a/src/core/workers.h
+++ b/src/core/workers.h
@@ -166,6 +166,9 @@ struct _starpu_machine_config
 
				 	unsigned submitting;
			
 
				 };
			
 
				 
			
 
				+/* Fill conf with environment variables */
			
 
				+void _starpu_conf_check_environment(struct starpu_conf *conf);
			
 
				+
			
 
				 /* Has starpu_shutdown already been called ? */
			
 
				 unsigned _starpu_machine_is_running(void);
			
 
				 
			
--- a/src/datawizard/copy_driver.c
+++ b/src/datawizard/copy_driver.c
@@ -27,6 +27,11 @@
 
				 #include <starpu_cuda.h>
			
 
				 #include <profiling/profiling.h>
			
 
				 
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+#include <core/simgrid.h>
			
 
				+#include <msg/msg.h>
			
 
				+#endif
			
 
				+
			
 
				 void _starpu_wake_all_blocked_workers_on_node(unsigned nodeid)
			
 
				 {
			
 
				 	/* wake up all workers on that memory node */
			
@@ -87,29 +92,47 @@ static int copy_data_1_to_1_generic(starpu_data_handle_t handle,
 
				 				    struct _starpu_data_replicate *dst_replicate,
			
 
				 				    struct _starpu_data_request *req STARPU_ATTRIBUTE_UNUSED)
			
 
				 {
			
 
				-	int ret = 0;
			
 
				-
			
 
				-	const struct starpu_data_copy_methods *copy_methods = handle->ops->copy_methods;
			
 
				-
			
 
				 	unsigned src_node = src_replicate->memory_node;
			
 
				 	unsigned dst_node = dst_replicate->memory_node;
			
 
				 
			
 
				-	enum starpu_node_kind src_kind = starpu_node_get_kind(src_node);
			
 
				-	enum starpu_node_kind dst_kind = starpu_node_get_kind(dst_node);
			
 
				-
			
 
				 	STARPU_ASSERT(src_replicate->refcnt);
			
 
				 	STARPU_ASSERT(dst_replicate->refcnt);
			
 
				 
			
 
				 	STARPU_ASSERT(src_replicate->allocated);
			
 
				 	STARPU_ASSERT(dst_replicate->allocated);
			
 
				 
			
 
				+	_starpu_comm_amounts_inc(src_node, dst_node, handle->ops->get_size(handle));
			
 
				+
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+	msg_task_t task = _starpu_simgrid_transfer_task_create(src_node, dst_node, handle->ops->get_size(handle));
			
 
				+	if (!req) {
			
 
				+		/* this is not associated to a request so it's synchronous */
			
 
				+		MSG_task_execute(task);
			
 
				+		MSG_task_destroy(task);
			
 
				+		return 0;
			
 
				+	}
			
 
				+	_STARPU_TRACE_START_DRIVER_COPY_ASYNC(src_node, dst_node);
			
 
				+	req->async_channel.event.finished = 0;
			
 
				+	_STARPU_PTHREAD_MUTEX_INIT(&req->async_channel.event.mutex, NULL);
			
 
				+	_STARPU_PTHREAD_COND_INIT(&req->async_channel.event.cond, NULL);
			
 
				+	_starpu_simgrid_post_task(task, &req->async_channel.event.finished, &req->async_channel.event.mutex, &req->async_channel.event.cond);
			
 
				+	_STARPU_TRACE_END_DRIVER_COPY_ASYNC(src_node, dst_node);
			
 
				+	_STARPU_TRACE_DATA_COPY(src_node, dst_node, handle->ops->get_size(handle));
			
 
				+	return -EAGAIN;
			
 
				+#else /* !SIMGRID */
			
 
				+
			
 
				+	int ret = 0;
			
 
				+
			
 
				+	const struct starpu_data_copy_methods *copy_methods = handle->ops->copy_methods;
			
 
				+
			
 
				+	enum starpu_node_kind src_kind = starpu_node_get_kind(src_node);
			
 
				+	enum starpu_node_kind dst_kind = starpu_node_get_kind(dst_node);
			
 
				+
			
 
				 #ifdef STARPU_USE_CUDA
			
 
				 	cudaError_t cures;
			
 
				 	cudaStream_t stream;
			
 
				 #endif
			
 
				 
			
 
				-	_starpu_comm_amounts_inc(src_node, dst_node, handle->ops->get_size(handle));
			
 
				-
			
 
				 	void *src_interface = src_replicate->data_interface;
			
 
				 	void *dst_interface = dst_replicate->data_interface;
			
 
				 
			
@@ -248,6 +271,7 @@ static int copy_data_1_to_1_generic(starpu_data_handle_t handle,
 
				 	}
			
 
				 
			
 
				 	return ret;
			
 
				+#endif /* !SIMGRID */
			
 
				 }
			
 
				 
			
 
				 int __attribute__((warn_unused_result)) _starpu_driver_copy_data_1_to_1(starpu_data_handle_t handle,
			
@@ -315,6 +339,14 @@ int __attribute__((warn_unused_result)) _starpu_driver_copy_data_1_to_1(starpu_d
 
				 
			
 
				 void _starpu_driver_wait_request_completion(struct _starpu_async_channel *async_channel)
			
 
				 {
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+	if (async_channel->event.finished)
			
 
				+		return;
			
 
				+	_STARPU_PTHREAD_MUTEX_LOCK(&async_channel->event.mutex);
			
 
				+	while (!async_channel->event.finished)
			
 
				+		_STARPU_PTHREAD_COND_WAIT(&async_channel->event.cond, &async_channel->event.mutex);
			
 
				+	_STARPU_PTHREAD_MUTEX_UNLOCK(&async_channel->event.mutex);
			
 
				+#else /* !SIMGRID */
			
 
				 	enum starpu_node_kind kind = async_channel->type;
			
 
				 #ifdef STARPU_USE_CUDA
			
 
				 	cudaEvent_t event;
			
@@ -351,10 +383,14 @@ void _starpu_driver_wait_request_completion(struct _starpu_async_channel *async_
 
				 	default:
			
 
				 		STARPU_ABORT();
			
 
				 	}
			
 
				+#endif /* !SIMGRID */
			
 
				 }
			
 
				 
			
 
				 unsigned _starpu_driver_test_request_completion(struct _starpu_async_channel *async_channel)
			
 
				 {
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+	return async_channel->event.finished;
			
 
				+#else /* !SIMGRID */
			
 
				 	enum starpu_node_kind kind = async_channel->type;
			
 
				 	unsigned success = 0;
			
 
				 #ifdef STARPU_USE_CUDA
			
@@ -396,4 +432,5 @@ unsigned _starpu_driver_test_request_completion(struct _starpu_async_channel *as
 
				 	}
			
 
				 
			
 
				 	return success;
			
 
				+#endif /* !SIMGRID */
			
 
				 }
			
--- a/src/datawizard/copy_driver.h
+++ b/src/datawizard/copy_driver.h
@@ -1,6 +1,6 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				- * Copyright (C) 2010  Université de Bordeaux 1
			
 
				+ * Copyright (C) 2010, 2012  Université de Bordeaux 1
			
 
				  * Copyright (C) 2010, 2011  Centre National de la Recherche Scientifique
			
 
				  *
			
 
				  * StarPU is free software; you can redistribute it and/or modify
			
@@ -41,6 +41,13 @@ struct _starpu_data_replicate;
 
				 union _starpu_async_channel_event
			
 
				 {
			
 
				 	int dummy;
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+	struct {
			
 
				+		unsigned finished;
			
 
				+		_starpu_pthread_mutex_t mutex;
			
 
				+		_starpu_pthread_cond_t cond;
			
 
				+	};
			
 
				+#endif
			
 
				 #ifdef STARPU_USE_CUDA
			
 
				 	cudaEvent_t cuda_event;
			
 
				 #endif
			
--- a/src/datawizard/memalloc.c
+++ b/src/datawizard/memalloc.c
@@ -242,7 +242,7 @@ static size_t free_memory_on_node(struct _starpu_mem_chunk *mc, uint32_t node)
 
				 		if (handle && !data_was_deleted)
			
 
				 			STARPU_ASSERT(replicate->allocated);
			
 
				 
			
 
				-#if defined(STARPU_USE_CUDA) && defined(HAVE_CUDA_MEMCPY_PEER)
			
 
				+#if defined(STARPU_USE_CUDA) && defined(HAVE_CUDA_MEMCPY_PEER) && !defined(STARPU_SIMGRID)
			
 
				 		if (starpu_node_get_kind(node) == STARPU_CUDA_RAM)
			
 
				 		{
			
 
				 			/* To facilitate the design of interface, we set the
			
@@ -750,6 +750,11 @@ static size_t _starpu_get_global_mem_size(int dst_node)
 
				 	return global_mem_size;
			
 
				 }
			
 
				 
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+static _starpu_pthread_mutex_t cuda_alloc_mutex = _STARPU_PTHREAD_MUTEX_INITIALIZER;
			
 
				+static _starpu_pthread_mutex_t opencl_alloc_mutex = _STARPU_PTHREAD_MUTEX_INITIALIZER;
			
 
				+#endif
			
 
				+
			
 
				 uintptr_t
			
 
				 starpu_allocate_buffer_on_node(uint32_t dst_node, size_t size)
			
 
				 {
			
@@ -766,7 +771,19 @@ starpu_allocate_buffer_on_node(uint32_t dst_node, size_t size)
 
				 			break;
			
 
				 #ifdef STARPU_USE_CUDA
			
 
				 		case STARPU_CUDA_RAM:
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+#ifdef STARPU_DEVEL
			
 
				+#warning TODO: record used memory, using a simgrid property to know the available memory
			
 
				+#endif
			
 
				+			/* Sleep 10µs for the allocation */
			
 
				+			_STARPU_PTHREAD_MUTEX_LOCK(&cuda_alloc_mutex);
			
 
				+			MSG_process_sleep(0.000010);
			
 
				+			addr = 1;
			
 
				+			status = cudaSuccess;
			
 
				+			_STARPU_PTHREAD_MUTEX_UNLOCK(&cuda_alloc_mutex);
			
 
				+#else
			
 
				 			status = cudaMalloc((void **)&addr, size);
			
 
				+#endif
			
 
				 			if (!addr || (status != cudaSuccess))
			
 
				 			{
			
 
				 				if (STARPU_UNLIKELY(status != cudaErrorMemoryAllocation))
			
@@ -781,7 +798,16 @@ starpu_allocate_buffer_on_node(uint32_t dst_node, size_t size)
 
				 			{
			
 
				                                 int ret;
			
 
				 				cl_mem ptr;
			
 
				-                                ret = starpu_opencl_allocate_memory(&ptr, size, CL_MEM_READ_WRITE);
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+				/* Sleep 10µs for the allocation */
			
 
				+				_STARPU_PTHREAD_MUTEX_LOCK(&opencl_alloc_mutex);
			
 
				+				MSG_process_sleep(0.000010);
			
 
				+				ptr = (cl_mem) 1;
			
 
				+				ret = CL_SUCCESS;
			
 
				+				_STARPU_PTHREAD_MUTEX_UNLOCK(&opencl_alloc_mutex);
			
 
				+#else
			
 
				+				ret = starpu_opencl_allocate_memory(&ptr, size, CL_MEM_READ_WRITE);
			
 
				+#endif
			
 
				 				if (ret)
			
 
				 					addr = 0;
			
 
				 				else
			
@@ -809,7 +835,15 @@ starpu_free_buffer_on_node(uint32_t dst_node, uintptr_t addr)
 
				 		case STARPU_CUDA_RAM:
			
 
				 		{
			
 
				 			cudaError_t err;
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+			_STARPU_PTHREAD_MUTEX_LOCK(&cuda_alloc_mutex);
			
 
				+			/* Sleep 10µs for the free */
			
 
				+			MSG_process_sleep(0.000010);
			
 
				+			err = cudaSuccess;
			
 
				+			_STARPU_PTHREAD_MUTEX_UNLOCK(&cuda_alloc_mutex);
			
 
				+#else
			
 
				 			err = cudaFree((void*)addr);
			
 
				+#endif
			
 
				 			if (STARPU_UNLIKELY(err != cudaSuccess))
			
 
				 				STARPU_CUDA_REPORT_ERROR(err);
			
 
				 			break;
			
@@ -819,7 +853,15 @@ starpu_free_buffer_on_node(uint32_t dst_node, uintptr_t addr)
 
				                 case STARPU_OPENCL_RAM:
			
 
				 		{
			
 
				 			cl_int err;
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+			_STARPU_PTHREAD_MUTEX_LOCK(&opencl_alloc_mutex);
			
 
				+			/* Sleep 10µs for the free */
			
 
				+			MSG_process_sleep(0.000010);
			
 
				+			err = CL_SUCCESS;
			
 
				+			_STARPU_PTHREAD_MUTEX_UNLOCK(&opencl_alloc_mutex);
			
 
				+#else
			
 
				                         err = clReleaseMemObject((void*)addr);
			
 
				+#endif
			
 
				 			if (STARPU_UNLIKELY(err != CL_SUCCESS))
			
 
				 				STARPU_OPENCL_REPORT_ERROR(err);
			
 
				                         break;
			
@@ -878,7 +920,7 @@ static ssize_t _starpu_allocate_interface(starpu_data_handle_t handle, struct _s
 
				 		_STARPU_TRACE_START_ALLOC(dst_node);
			
 
				 		STARPU_ASSERT(replicate->data_interface);
			
 
				 
			
 
				-#if defined(STARPU_USE_CUDA) && defined(HAVE_CUDA_MEMCPY_PEER)
			
 
				+#if defined(STARPU_USE_CUDA) && defined(HAVE_CUDA_MEMCPY_PEER) && !defined(STARPU_SIMGRID)
			
 
				 		if (starpu_node_get_kind(dst_node) == STARPU_CUDA_RAM)
			
 
				 		{
			
 
				 			/* To facilitate the design of interface, we set the
			
--- a/src/datawizard/memory_nodes.c
+++ b/src/datawizard/memory_nodes.c
@@ -1,6 +1,6 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				- * Copyright (C) 2009-2011  Université de Bordeaux 1
			
 
				+ * Copyright (C) 2009-2012  Université de Bordeaux 1
			
 
				  * Copyright (C) 2010, 2011  Centre National de la Recherche Scientifique
			
 
				  *
			
 
				  * StarPU is free software; you can redistribute it and/or modify
			
@@ -121,6 +121,18 @@ unsigned _starpu_register_memory_node(enum starpu_node_kind kind, int devid)
 
				 	return (nnodes-1);
			
 
				 }
			
 
				 
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+void _starpu_simgrid_memory_node_set_host(unsigned node, msg_host_t host)
			
 
				+{
			
 
				+	descr.host[node] = host;
			
 
				+}
			
 
				+
			
 
				+msg_host_t _starpu_simgrid_memory_node_get_host(unsigned node)
			
 
				+{
			
 
				+	return descr.host[node];
			
 
				+}
			
 
				+#endif
			
 
				+
			
 
				 /* TODO move in a more appropriate file  !! */
			
 
				 /* Register a condition variable associated to worker which is associated to a
			
 
				  * memory node itself. */
			
--- a/src/datawizard/memory_nodes.h
+++ b/src/datawizard/memory_nodes.h
@@ -24,6 +24,9 @@
 
				 #include <datawizard/memalloc.h>
			
 
				 #include <common/utils.h>
			
 
				 
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+#include <msg/msg.h>
			
 
				+#endif
			
 
				 
			
 
				 #define _STARPU_MEMORY_NODE_TUPLE(node1,node2) (node1 | (node2 << 4))
			
 
				 #define _STARPU_MEMORY_NODE_TUPLE_FIRST(tuple) (tuple & 0x0F)
			
@@ -45,6 +48,10 @@ struct _starpu_mem_node_descr
 
				 
			
 
				 	unsigned nworkers[STARPU_MAXNODES];
			
 
				 
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+	msg_host_t host[STARPU_MAXNODES];
			
 
				+#endif
			
 
				+
			
 
				 	// TODO move this 2 lists outside struct _starpu_mem_node_descr
			
 
				 	/* Every worker is associated to a condition variable on which the
			
 
				 	 * worker waits when there is task available. It is possible that
			
@@ -66,6 +73,10 @@ void _starpu_set_local_memory_node_key(unsigned *node);
 
				 unsigned _starpu_get_local_memory_node(void);
			
 
				 void _starpu_memory_node_worker_add(unsigned node);
			
 
				 unsigned _starpu_memory_node_workers(unsigned node);
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+void _starpu_simgrid_memory_node_set_host(unsigned node, msg_host_t host);
			
 
				+msg_host_t _starpu_simgrid_memory_node_get_host(unsigned node);
			
 
				+#endif
			
 
				 unsigned _starpu_register_memory_node(enum starpu_node_kind kind, int devid);
			
 
				 //void _starpu_memory_node_attach_queue(struct starpu_jobq_s *q, unsigned nodeid);
			
 
				 void _starpu_memory_node_register_condition(_starpu_pthread_cond_t *cond, _starpu_pthread_mutex_t *mutex, unsigned memory_node);
			
--- a/src/datawizard/progress.c
+++ b/src/datawizard/progress.c
@@ -1,6 +1,6 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				- * Copyright (C) 2009, 2010  Université de Bordeaux 1
			
 
				+ * Copyright (C) 2009, 2010, 2012  Université de Bordeaux 1
			
 
				  * Copyright (C) 2010, 2011  Centre National de la Recherche Scientifique
			
 
				  *
			
 
				  * StarPU is free software; you can redistribute it and/or modify
			
@@ -19,9 +19,18 @@
 
				 #include <common/config.h>
			
 
				 #include <datawizard/datawizard.h>
			
 
				 #include <core/workers.h>
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+#include <msg/msg.h>
			
 
				+#endif
			
 
				 
			
 
				 void _starpu_datawizard_progress(uint32_t memory_node, unsigned may_alloc)
			
 
				 {
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+#if STARPU_DEVEL
			
 
				+#warning FIXME
			
 
				+#endif
			
 
				+	MSG_process_sleep(0.000010);
			
 
				+#endif
			
 
				 	/* in case some other driver requested data */
			
 
				 	_starpu_handle_pending_node_data_requests(memory_node);
			
 
				 	_starpu_handle_node_data_requests(memory_node, may_alloc);
			
--- a/src/drivers/cpu/driver_cpu.c
+++ b/src/drivers/cpu/driver_cpu.c
@@ -40,6 +40,11 @@
 
				 #include <windows.h>
			
 
				 #endif
			
 
				 
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+#include <core/simgrid.h>
			
 
				+#endif
			
 
				+
			
 
				+#ifndef STARPU_SIMGRID
			
 
				 #ifdef STARPU_HAVE_HWLOC
			
 
				 void
			
 
				 _starpu_cpu_discover_devices(struct _starpu_machine_config *config)
			
@@ -92,6 +97,7 @@ _starpu_cpu_discover_devices(struct _starpu_machine_config *config)
 
				 	config->topology.nhwcpus = 1;
			
 
				 }
			
 
				 #endif
			
 
				+#endif
			
 
				 
			
 
				 
			
 
				 /* Actually launch the job on a cpu worker.
			
@@ -142,7 +148,11 @@ static int execute_job_on_cpu(struct _starpu_job *j, struct starpu_task *worker_
 
				 			/* bind to parallel worker */
			
 
				 			_starpu_bind_thread_on_cpus(cpu_args->config, _starpu_get_combined_worker_struct(j->combined_workerid));
			
 
				 		STARPU_ASSERT(func);
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+		_starpu_simgrid_execute_job(j, perf_arch);
			
 
				+#else
			
 
				 		func(task->interfaces, task->cl_arg);
			
 
				+#endif
			
 
				 		if (is_parallel_task && cl->type == STARPU_FORKJOIN)
			
 
				 			/* rebind to single CPU */
			
 
				 			_starpu_bind_thread_on_cpu(cpu_args->config, cpu_args->bindid);
			
--- a/src/drivers/cuda/driver_cuda.c
+++ b/src/drivers/cuda/driver_cuda.c
@@ -30,6 +30,10 @@
 
				 #include <cuda_gl_interop.h>
			
 
				 #endif
			
 
				 
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+#include <core/simgrid.h>
			
 
				+#endif
			
 
				+
			
 
				 /* the number of CUDA devices */
			
 
				 static int ncudagpus;
			
 
				 
			
@@ -37,11 +41,7 @@ static cudaStream_t streams[STARPU_NMAXWORKERS];
 
				 static cudaStream_t transfer_streams[STARPU_NMAXWORKERS];
			
 
				 static struct cudaDeviceProp props[STARPU_MAXCUDADEVS];
			
 
				 
			
 
				-/* In case we want to cap the amount of memory available on the GPUs by the
			
 
				- * mean of the STARPU_LIMIT_GPU_MEM, we allocate a big buffer when the driver
			
 
				- * is launched. */
			
 
				-static char *wasted_memory[STARPU_NMAXWORKERS];
			
 
				-
			
 
				+#ifndef STARPU_SIMGRID
			
 
				 void
			
 
				 _starpu_cuda_discover_devices (struct _starpu_machine_config *config)
			
 
				 {
			
@@ -56,6 +56,11 @@ _starpu_cuda_discover_devices (struct _starpu_machine_config *config)
 
				 	config->topology.nhwcudagpus = cnt;
			
 
				 }
			
 
				 
			
 
				+/* In case we want to cap the amount of memory available on the GPUs by the
			
 
				+ * mean of the STARPU_LIMIT_GPU_MEM, we allocate a big buffer when the driver
			
 
				+ * is launched. */
			
 
				+static char *wasted_memory[STARPU_NMAXWORKERS];
			
 
				+
			
 
				 static void limit_gpu_mem_if_needed(unsigned devid)
			
 
				 {
			
 
				 	cudaError_t cures;
			
@@ -98,6 +103,7 @@ static void unlimit_gpu_mem_if_needed(unsigned devid)
 
				 		wasted_memory[devid] = NULL;
			
 
				 	}
			
 
				 }
			
 
				+#endif
			
 
				 
			
 
				 size_t starpu_cuda_get_global_mem_size(unsigned devid)
			
 
				 {
			
@@ -125,8 +131,11 @@ const struct cudaDeviceProp *starpu_cuda_get_device_properties(unsigned workerid
 
				 	return &props[devid];
			
 
				 }
			
 
				 
			
 
				-void starpu_cuda_set_device(unsigned devid)
			
 
				+void starpu_cuda_set_device(unsigned devid STARPU_ATTRIBUTE_UNUSED)
			
 
				 {
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+	STARPU_ABORT();
			
 
				+#else
			
 
				 	cudaError_t cures;
			
 
				 	struct starpu_conf *conf = _starpu_get_machine_config()->conf;
			
 
				 #if !defined(HAVE_CUDA_MEMCPY_PEER) && defined(HAVE_CUDA_GL_INTEROP_H)
			
@@ -158,8 +167,10 @@ done:
 
				 #endif
			
 
				 	if (STARPU_UNLIKELY(cures))
			
 
				 		STARPU_CUDA_REPORT_ERROR(cures);
			
 
				+#endif
			
 
				 }
			
 
				 
			
 
				+#ifndef STARPU_SIMGRID
			
 
				 static void init_context(unsigned devid)
			
 
				 {
			
 
				 	cudaError_t cures;
			
@@ -234,7 +245,7 @@ static void deinit_context(int workerid, unsigned devid)
 
				 	if (cures)
			
 
				 		STARPU_CUDA_REPORT_ERROR(cures);
			
 
				 }
			
 
				-
			
 
				+#endif /* !SIMGRID */
			
 
				 
			
 
				 /* Return the number of devices usable in the system.
			
 
				  * The value returned cannot be greater than MAXCUDADEVS */
			
@@ -289,14 +300,19 @@ static int execute_job_on_cuda(struct _starpu_job *j, struct _starpu_worker *arg
 
				 
			
 
				 	_starpu_driver_start_job(args, j, &codelet_start, 0, profiling);
			
 
				 
			
 
				-#ifdef HAVE_CUDA_MEMCPY_PEER
			
 
				+#if defined(HAVE_CUDA_MEMCPY_PEER) && !defined(STARPU_SIMGRID)
			
 
				 	/* We make sure we do manipulate the proper device */
			
 
				 	starpu_cuda_set_device(args->devid);
			
 
				 #endif
			
 
				 
			
 
				 	starpu_cuda_func_t func = _starpu_task_get_cuda_nth_implementation(cl, j->nimpl);
			
 
				 	STARPU_ASSERT(func);
			
 
				+
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+	_starpu_simgrid_execute_job(j, args->perf_arch);
			
 
				+#else
			
 
				 	func(task->interfaces, task->cl_arg);
			
 
				+#endif
			
 
				 
			
 
				 	_starpu_driver_end_job(args, j, args->perf_arch, &codelet_end, 0, profiling);
			
 
				 
			
@@ -332,17 +348,23 @@ int _starpu_cuda_driver_init(struct starpu_driver *d)
 
				 	struct _starpu_worker* args = _starpu_get_worker_from_driver(d);
			
 
				 	STARPU_ASSERT(args);
			
 
				 
			
 
				-	unsigned devid = args->devid;
			
 
				-
			
 
				 	_starpu_worker_init(args, _STARPU_FUT_CUDA_KEY);
			
 
				 
			
 
				+#ifndef STARPU_SIMGRID
			
 
				+	unsigned devid = args->devid;
			
 
				+
			
 
				 	init_context(devid);
			
 
				+#endif
			
 
				 
			
 
				 	/* one more time to avoid hacks from third party lib :) */
			
 
				 	_starpu_bind_thread_on_cpu(args->config, args->bindid);
			
 
				 
			
 
				 	args->status = STATUS_UNKNOWN;
			
 
				 
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+	const char *devname = "Simgrid";
			
 
				+	snprintf(args->name, sizeof(args->name), "CUDA %u (%s TODO GiB)", args->devid, devname);
			
 
				+#else
			
 
				 	/* get the device's name */
			
 
				 	char devname[128];
			
 
				 	strncpy(devname, props[devid].name, 128);
			
@@ -358,6 +380,7 @@ int _starpu_cuda_driver_init(struct starpu_driver *d)
 
				 #else
			
 
				 	snprintf(args->name, sizeof(args->name), "CUDA %u (%s %.1f GiB)", args->devid, devname, size);
			
 
				 #endif
			
 
				+#endif
			
 
				 	snprintf(args->short_name, sizeof(args->short_name), "CUDA %u", args->devid);
			
 
				 	_STARPU_DEBUG("cuda (%s) dev id %u thread is ready to run on CPU %d !\n", devname, devid, args->bindid);
			
 
				 
			
@@ -443,7 +466,9 @@ int _starpu_cuda_driver_deinit(struct starpu_driver *d)
 
				 	 * coherency is not maintained anymore at that point ! */
			
 
				 	_starpu_free_all_automatically_allocated_buffers(memnode);
			
 
				 
			
 
				+#ifndef STARPU_SIMGRID
			
 
				 	deinit_context(args->workerid, args->devid);
			
 
				+#endif
			
 
				 
			
 
				 	_STARPU_TRACE_WORKER_DEINIT_END(_STARPU_FUT_CUDA_KEY);
			
 
				 
			
--- a/src/drivers/gordon/driver_gordon.c
+++ b/src/drivers/gordon/driver_gordon.c
@@ -464,7 +464,7 @@ void *_starpu_gordon_worker(void *arg)
 
				 	_STARPU_PTHREAD_MUTEX_INIT(&progress_mutex, NULL);
			
 
				 	_STARPU_PTHREAD_COND_INIT(&progress_cond, NULL);
			
 
				 
			
 
				-	_STARPU_PTHREAD_CREATE(&progress_thread, NULL,
			
 
				+	_STARPU_PTHREAD_CREATE("Gordon progress", &progress_thread, NULL,
			
 
				 			       gordon_worker_progress, gordon_set_arg);
			
 
				 
			
 
				 	/* wait for the progression thread to be ready */
			
--- a/src/drivers/opencl/driver_opencl.c
+++ b/src/drivers/opencl/driver_opencl.c
@@ -29,6 +29,10 @@
 
				 #include "driver_opencl_utils.h"
			
 
				 #include <common/utils.h>
			
 
				 
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+#include <core/simgrid.h>
			
 
				+#endif
			
 
				+
			
 
				 static _starpu_pthread_mutex_t big_lock = _STARPU_PTHREAD_MUTEX_INITIALIZER;
			
 
				 
			
 
				 static cl_context contexts[STARPU_MAXOPENCLDEVS];
			
@@ -38,6 +42,7 @@ static cl_command_queue transfer_queues[STARPU_MAXOPENCLDEVS];
 
				 static cl_uint nb_devices = -1;
			
 
				 static int init_done = 0;
			
 
				 
			
 
				+#ifndef STARPU_SIMGRID
			
 
				 void
			
 
				 _starpu_opencl_discover_devices(struct _starpu_machine_config *config)
			
 
				 {
			
@@ -92,6 +97,7 @@ static void unlimit_gpu_mem_if_needed(int devid)
 
				 		wasted_memory[devid] = NULL;
			
 
				 	}
			
 
				 }
			
 
				+#endif
			
 
				 
			
 
				 size_t starpu_opencl_get_global_mem_size(int devid)
			
 
				 {
			
@@ -135,6 +141,7 @@ void starpu_opencl_get_current_context(cl_context *context)
 
				         *context = contexts[worker->devid];
			
 
				 }
			
 
				 
			
 
				+#ifndef STARPU_SIMGRID
			
 
				 cl_int _starpu_opencl_init_context(int devid)
			
 
				 {
			
 
				 	cl_int err;
			
@@ -193,9 +200,13 @@ cl_int _starpu_opencl_deinit_context(int devid)
 
				 
			
 
				         return CL_SUCCESS;
			
 
				 }
			
 
				+#endif
			
 
				 
			
 
				-cl_int starpu_opencl_allocate_memory(cl_mem *mem, size_t size, cl_mem_flags flags)
			
 
				+cl_int starpu_opencl_allocate_memory(cl_mem *mem STARPU_ATTRIBUTE_UNUSED, size_t size STARPU_ATTRIBUTE_UNUSED, cl_mem_flags flags STARPU_ATTRIBUTE_UNUSED)
			
 
				 {
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+	STARPU_ABORT();
			
 
				+#else
			
 
				 	cl_int err;
			
 
				         cl_mem memory;
			
 
				         struct _starpu_worker *worker = _starpu_get_local_worker_key();
			
@@ -223,6 +234,7 @@ cl_int starpu_opencl_allocate_memory(cl_mem *mem, size_t size, cl_mem_flags flag
 
				 
			
 
				         *mem = memory;
			
 
				         return CL_SUCCESS;
			
 
				+#endif
			
 
				 }
			
 
				 
			
 
				 cl_int starpu_opencl_copy_ram_to_opencl(void *ptr, unsigned src_node STARPU_ATTRIBUTE_UNUSED, cl_mem buffer, unsigned dst_node STARPU_ATTRIBUTE_UNUSED, size_t size, size_t offset, cl_event *event, int *ret)
			
@@ -410,7 +422,9 @@ void _starpu_opencl_init(void)
 
				 	_STARPU_PTHREAD_MUTEX_UNLOCK(&big_lock);
			
 
				 }
			
 
				 
			
 
				+#ifndef STARPU_SIMGRID
			
 
				 static unsigned _starpu_opencl_get_device_name(int dev, char *name, int lname);
			
 
				+#endif
			
 
				 static int _starpu_opencl_execute_job(struct _starpu_job *j, struct _starpu_worker *args);
			
 
				 
			
 
				 static struct _starpu_worker*
			
@@ -444,20 +458,26 @@ int _starpu_opencl_driver_init(struct starpu_driver *d)
 
				 	args = _starpu_opencl_get_worker_from_driver(d);
			
 
				 	STARPU_ASSERT(args);
			
 
				 
			
 
				-	int devid = args->devid;
			
 
				-
			
 
				 	_starpu_worker_init(args, _STARPU_FUT_OPENCL_KEY);
			
 
				 
			
 
				+#ifndef STARPU_SIMGRID
			
 
				+	int devid = args->devid;
			
 
				+
			
 
				 	_starpu_opencl_init_context(devid);
			
 
				+#endif
			
 
				 
			
 
				 	/* one more time to avoid hacks from third party lib :) */
			
 
				 	_starpu_bind_thread_on_cpu(args->config, args->bindid);
			
 
				 
			
 
				 	args->status = STATUS_UNKNOWN;
			
 
				 
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+	const char *devname = "Simgrid";
			
 
				+#else
			
 
				 	/* get the device's name */
			
 
				 	char devname[128];
			
 
				 	_starpu_opencl_get_device_name(devid, devname, 128);
			
 
				+#endif
			
 
				 	snprintf(args->name, sizeof(args->name), "OpenCL %u (%s)", args->devid, devname);
			
 
				 	snprintf(args->short_name, sizeof(args->short_name), "OpenCL %u", args->devid);
			
 
				 
			
@@ -540,11 +560,13 @@ int _starpu_opencl_driver_deinit(struct starpu_driver *d)
 
				 	args = _starpu_opencl_get_worker_from_driver(d);
			
 
				 	STARPU_ASSERT(args);
			
 
				 
			
 
				-	unsigned devid   = args->devid;
			
 
				 	unsigned memnode = args->memory_node;
			
 
				 
			
 
				 	_starpu_handle_all_pending_node_data_requests(memnode);
			
 
				+#ifndef STARPU_SIMGRID
			
 
				+	unsigned devid   = args->devid;
			
 
				         _starpu_opencl_deinit_context(devid);
			
 
				+#endif
			
 
				 
			
 
				 	return 0;
			
 
				 }
			
@@ -568,6 +590,7 @@ void *_starpu_opencl_worker(void *arg)
 
				 	return NULL;
			
 
				 }
			
 
				 
			
 
				+#ifndef STARPU_SIMGRID
			
 
				 static unsigned _starpu_opencl_get_device_name(int dev, char *name, int lname)
			
 
				 {
			
 
				 	int err;
			
@@ -584,6 +607,7 @@ static unsigned _starpu_opencl_get_device_name(int dev, char *name, int lname)
 
				 	_STARPU_DEBUG("Device %d : [%s]\n", dev, name);
			
 
				 	return EXIT_SUCCESS;
			
 
				 }
			
 
				+#endif
			
 
				 
			
 
				 unsigned _starpu_opencl_get_device_count(void)
			
 
				 {
			
@@ -637,7 +661,12 @@ static int _starpu_opencl_execute_job(struct _starpu_job *j, struct _starpu_work
 
				 
			
 
				 	starpu_opencl_func_t func = _starpu_task_get_opencl_nth_implementation(cl, j->nimpl);
			
 
				 	STARPU_ASSERT(func);
			
 
				+
			
 
				+#ifdef STARPU_SIMGRID
			
 
				+	_starpu_simgrid_execute_job(j, args->perf_arch);
			
 
				+#else
			
 
				 	func(task->interfaces, task->cl_arg);
			
 
				+#endif
			
 
				 
			
 
				 	_starpu_driver_end_job(args, j, args->perf_arch, &codelet_end, 0, profiling);
			
 
				 
			
--- a/src/top/starpu_top_connection.c
+++ b/src/top/starpu_top_connection.c
@@ -100,7 +100,6 @@ void * message_to_ui(void * p)
 
				 
			
 
				 void _starpu_top_communications_threads_launcher(void)
			
 
				 {
			
 
				-#ifdef STARPU_TOP
			
 
				 	pthread_t from_ui;
			
 
				 	pthread_t to_ui;
			
 
				 	pthread_attr_t threads_attr;
			
@@ -163,8 +162,7 @@ void _starpu_top_communications_threads_launcher(void)
 
				 	pthread_attr_init(&threads_attr);
			
 
				 	pthread_attr_setdetachstate(&threads_attr, PTHREAD_CREATE_DETACHED);
			
 
				 
			
 
				-	_STARPU_PTHREAD_CREATE(&from_ui, &threads_attr, message_from_ui, NULL);
			
 
				-	_STARPU_PTHREAD_CREATE(&to_ui, &threads_attr, message_to_ui, NULL);
			
 
				-#endif
			
 
				+	_STARPU_PTHREAD_CREATE("StarPU-Top from", &from_ui, &threads_attr, message_from_ui, NULL);
			
 
				+	_STARPU_PTHREAD_CREATE("StarPU-Top to", &to_ui, &threads_attr, message_to_ui, NULL);
			
 
				 }
			
 
				 
			
--- a/src/util/malloc.c
+++ b/src/util/malloc.c
@@ -41,7 +41,7 @@ struct malloc_pinned_codelet_struct
 
				 //}
			
 
				 //#endif
			
 
				 
			
 
				-#if defined(STARPU_USE_CUDA) && !defined(HAVE_CUDA_MEMCPY_PEER)
			
 
				+#if defined(STARPU_USE_CUDA) && !defined(HAVE_CUDA_MEMCPY_PEER) && !defined(STARPU_SIMGRID)
			
 
				 static void malloc_pinned_cuda_codelet(void *buffers[] STARPU_ATTRIBUTE_UNUSED, void *arg)
			
 
				 {
			
 
				 	struct malloc_pinned_codelet_struct *s = arg;
			
@@ -53,7 +53,7 @@ static void malloc_pinned_cuda_codelet(void *buffers[] STARPU_ATTRIBUTE_UNUSED,
 
				 }
			
 
				 #endif
			
 
				 
			
 
				-#if (defined(STARPU_USE_CUDA) && !defined(HAVE_CUDA_MEMCPY_PEER))// || defined(STARPU_USE_OPENCL)
			
 
				+#if (defined(STARPU_USE_CUDA) && !defined(HAVE_CUDA_MEMCPY_PEER)) && !defined(STARPU_SIMGRID)// || defined(STARPU_USE_OPENCL)
			
 
				 static struct starpu_perfmodel malloc_pinned_model =
			
 
				 {
			
 
				 	.type = STARPU_HISTORY_BASED,
			
@@ -78,6 +78,7 @@ int starpu_malloc(void **A, size_t dim)
 
				 
			
 
				 	STARPU_ASSERT(A);
			
 
				 
			
 
				+#ifndef STARPU_SIMGRID
			
 
				 	if (_starpu_can_submit_cuda_task())
			
 
				 	{
			
 
				 #ifdef STARPU_USE_CUDA
			
@@ -136,6 +137,7 @@ int starpu_malloc(void **A, size_t dim)
 
				 //#endif
			
 
				 //        }
			
 
				         else
			
 
				+#endif
			
 
				 	{
			
 
				 		*A = malloc(dim);
			
 
				 	}
			
@@ -145,7 +147,7 @@ int starpu_malloc(void **A, size_t dim)
 
				 	return 0;
			
 
				 }
			
 
				 
			
 
				-#if defined(STARPU_USE_CUDA) && !defined(HAVE_CUDA_MEMCPY_PEER)
			
 
				+#if defined(STARPU_USE_CUDA) && !defined(HAVE_CUDA_MEMCPY_PEER) && !defined(STARPU_SIMGRID)
			
 
				 static void free_pinned_cuda_codelet(void *buffers[] STARPU_ATTRIBUTE_UNUSED, void *arg)
			
 
				 {
			
 
				 	cudaError_t cures;
			
@@ -187,6 +189,7 @@ int starpu_free(void *A)
 
				 	if (STARPU_UNLIKELY(!_starpu_worker_may_perform_blocking_calls()))
			
 
				 		return -EDEADLK;
			
 
				 
			
 
				+#ifndef STARPU_SIMGRID
			
 
				 #ifdef STARPU_USE_CUDA
			
 
				 	if (_starpu_can_submit_cuda_task())
			
 
				 	{
			
@@ -241,6 +244,7 @@ int starpu_free(void *A)
 
				 //	}
			
 
				 	} else
			
 
				 #endif
			
 
				+#endif
			
 
				 	{
			
 
				 		free(A);
			
 
				 	}