9 years ago · a4530061c2
--- a/ChangeLog
+++ b/ChangeLog
@@ -42,6 +42,8 @@ New features:
 
				     files.
			
 
				   * Add STARPU_FXT_TRACE environment variable.
			
 
				   * Add starpu_data_set_user_data and starpu_data_get_user_data.
			
 
				+  * Add STARPU_MPI_FAKE_SIZE and STARPU_MPI_FAKE_RANK to allow simulating
			
 
				+    execution of just one MPI node.
			
 
				 
			
 
				 StarPU 1.2.0 (svn revision 18521)
			
 
				 ==============================================
			
--- a/configure.ac
+++ b/configure.ac
@@ -86,7 +86,7 @@ AC_OPENMP
 
				 #c++11 detection
			
 
				 AX_CXX_COMPILE_STDCXX(11,noext,optional)
			
 
				 
			
 
				-AC_SUBST([STARPU_HAVE_CXX11], [test "$HAVE_CXX11" -eq 1])
			
 
				+AC_SUBST([STARPU_HAVE_CXX11], $HAVE_CXX11)
			
 
				 AM_CONDITIONAL([STARPU_HAVE_CXX11], [test "$HAVE_CXX11" -eq 1])
			
 
				 if test $HAVE_CXX11 -eq 1; then
			
 
				   AC_DEFINE(STARPU_HAVE_CXX11, [1], [compiler supports cxx11])
			
--- a/doc/doxygen/chapters/301_tasks.doxy
+++ b/doc/doxygen/chapters/301_tasks.doxy
@@ -1,7 +1,7 @@
 
				 /*
			
 
				  * This file is part of the StarPU Handbook.
			
 
				  * Copyright (C) 2009--2011  Universit@'e de Bordeaux
			
 
				- * Copyright (C) 2010, 2011, 2012, 2013, 2014, 2016  CNRS
			
 
				+ * Copyright (C) 2010, 2011, 2012, 2013, 2014, 2016, 2017  CNRS
			
 
				  * Copyright (C) 2011, 2012 INRIA
			
 
				  * See the file version.doxy for copying conditions.
			
 
				  */
			
@@ -371,7 +371,7 @@ void func_cpu(void *descr[], void *_args)
 
				         int ifactor;
			
 
				         float ffactor;
			
 
				 
			
 
				-        starpu_codelet_unpack_args(_args, &ifactor, NULL);
			
 
				+        starpu_codelet_unpack_args(_args, &ifactor, 0);
			
 
				         starpu_codelet_unpack_args(_args, &ifactor, &ffactor);
			
 
				 }
			
 
				 \endcode
			
@@ -383,7 +383,7 @@ void func_cpu(void *descr[], void *_args)
 
				         float ffactor;
			
 
				 	char buffer[100];
			
 
				 
			
 
				-        starpu_codelet_unpack_args_and_copyleft(_args, buffer, 100, &ifactor, NULL);
			
 
				+        starpu_codelet_unpack_args_and_copyleft(_args, buffer, 100, &ifactor, 0);
			
 
				         starpu_codelet_unpack_args(buffer, &ffactor);
			
 
				 }
			
 
				 \endcode
			
--- a/doc/doxygen/chapters/390_faq.doxy
+++ b/doc/doxygen/chapters/390_faq.doxy
@@ -226,6 +226,21 @@ starpu_resume();
 
				 starpu_shutdown();
			
 
				 \endcode
			
 
				 
			
 
				+\section GPUEatingCores When running with CUDA or OpenCL devices, I am seeing fewer CPU cores
			
 
				+
			
 
				+Yes, this is on purpose.
			
 
				+
			
 
				+Since GPU devices are way faster than CPUs, StarPU needs to react quickly when
			
 
				+a task is finished, to feed the GPU with another task (StarPU actually submits
			
 
				+a couple of tasks in advance so as to pipeline this, but filling the pipeline
			
 
				+still has to be happening often enough), and thus it has to dedicate threads for
			
 
				+this, and this is a very CPU-consuming duty. StarPU thus dedicates one CPU core
			
 
				+for driving each GPU.
			
 
				+
			
 
				+Such dedication is also useful when a codelet is hybrid, i.e. while kernels are
			
 
				+running on the GPU, the codelet can run some computation, which will thus be run by
			
 
				+the CPU core instead of driving the GPU.
			
 
				+
			
 
				 \section CUDADrivers StarPU does not see my CUDA device
			
 
				 
			
 
				 First make sure that CUDA is properly running outside StarPU: build and
			
--- a/doc/doxygen/chapters/410_mpi_support.doxy
+++ b/doc/doxygen/chapters/410_mpi_support.doxy
@@ -501,6 +501,21 @@ If the distribution function is not too complex and the compiler is very good,
 
				 the latter can even optimize the <c>for</c> loops, thus dramatically reducing
			
 
				 the cost of task submission.
			
 
				 
			
 
				+To estimate quickly how long task submission takes, and notably how much pruning
			
 
				+saves, a quick and easy way is to measure the submission time of just one of the
			
 
				+MPI nodes. This can be achieved by running the application on just one MPI node
			
 
				+with the following environment variables:
			
 
				+
			
 
				+\code
			
 
				+export STARPU_DISABLE_KERNELS=1
			
 
				+export STARPU_MPI_FAKE_RANK=2
			
 
				+export STARPU_MPI_FAKE_SIZE=1024
			
 
				+\endcode
			
 
				+
			
 
				+Here we have disabled the kernel function call to skip the actual computation
			
 
				+time and only keep submission time, and we have asked StarPU to fake running on
			
 
				+MPI node 2 out of 1024 nodes.
			
 
				+
			
 
				 A function starpu_mpi_task_build() is also provided with the aim to
			
 
				 only construct the task structure. All MPI nodes need to call the
			
 
				 function, only the node which is to execute the task will return a
			
--- a/doc/doxygen/chapters/501_environment_variables.doxy
+++ b/doc/doxygen/chapters/501_environment_variables.doxy
@@ -521,6 +521,26 @@ it prints messages on the standard output when data are added or removed from th
 
				 communication cache.
			
 
				 </dd>
			
 
				 
			
 
				+<dt>STARPU_MPI_FAKE_SIZE</dt>
			
 
				+<dd>
			
 
				+\anchor STARPU_MPI_FAKE_SIZE
			
 
				+\addindex __env__STARPU_MPI_FAKE_SIZE
			
 
				+Setting this to a number makes StarPU believe that there are that many MPI nodes, even
			
 
				+if it was run on only one MPI node. This allows e.g. to simulate the execution
			
 
				+of one of the nodes of a big cluster without actually running the rest.
			
 
				+It of course does not provide computation results and timing.
			
 
				+</dd>
			
 
				+
			
 
				+<dt>STARPU_MPI_FAKE_RANK</dt>
			
 
				+<dd>
			
 
				+\anchor STARPU_MPI_FAKE_RANK
			
 
				+\addindex __env__STARPU_MPI_FAKE_RANK
			
 
				+Setting this to a number makes StarPU believe that it is the MPI node with that rank, even
			
 
				+if it was run on only one MPI node. This allows e.g. to simulate the execution
			
 
				+of one of the nodes of a big cluster without actually running the rest.
			
 
				+It of course does not provide computation results and timing.
			
 
				+</dd>
			
 
				+
			
 
				 <dt>STARPU_SIMGRID_CUDA_MALLOC_COST</dt>
			
 
				 <dd>
			
 
				 \anchor STARPU_SIMGRID_CUDA_MALLOC_COST
			
@@ -743,6 +763,15 @@ GPUs (or in main memory, when using out of core), when performing an asynchronou
 
				 writeback pass. The default is 10%.
			
 
				 </dd>
			
 
				 
			
 
				+<dt>STARPU_DIDUSE_BARRIER</dt>
			
 
				+<dd>
			
 
				+\anchor STARPU_DIDUSE_BARRIER
			
 
				+\addindex __env__STARPU_DIDUSE_BARRIER
			
 
				+When set to 1, StarPU will never evict a piece of data if it has not been used
			
 
				+by at least one task. This avoids odd behaviors under high memory pressure, but
			
 
				+can lead to deadlocks, so is to be considered experimental only.
			
 
				+</dd>
			
 
				+
			
 
				 <dt>STARPU_DISK_SWAP</dt>
			
 
				 <dd>
			
 
				 \anchor STARPU_DISK_SWAP
			
--- a/doc/doxygen/chapters/api/codelet_and_tasks.doxy
+++ b/doc/doxygen/chapters/api/codelet_and_tasks.doxy
@@ -853,6 +853,15 @@ This function returns the task currently executed by the
 
				 worker, or <c>NULL</c> if it is called either from a thread that is not a
			
 
				 task or simply because there is no task being executed at the moment.
			
 
				 
			
 
				+\fn const char *starpu_task_get_name(struct starpu_task *task)
			
 
				+\ingroup API_Codelet_And_Tasks
			
 
				+This function returns the name of \p task, i.e. either its task->name field, or
			
 
				+the name of the corresponding performance model.
			
 
				+
			
 
				+\fn const char *starpu_task_get_model_name(struct starpu_task *task)
			
 
				+\ingroup API_Codelet_And_Tasks
			
 
				+This function returns the name of the performance model of \p task.
			
 
				+
			
 
				 \fn void starpu_codelet_display_stats(struct starpu_codelet *cl)
			
 
				 \ingroup API_Codelet_And_Tasks
			
 
				 Output on stderr some statistics on the codelet \p cl.
			
--- a/doc/doxygen/chapters/api/insert_task.doxy
+++ b/doc/doxygen/chapters/api/insert_task.doxy
@@ -1,7 +1,7 @@
 
				 /*
			
 
				  * This file is part of the StarPU Handbook.
			
 
				  * Copyright (C) 2009--2011  Universit@'e de Bordeaux
			
 
				- * Copyright (C) 2010, 2011, 2012, 2013, 2014, 2015, 2016  CNRS
			
 
				+ * Copyright (C) 2010, 2011, 2012, 2013, 2014, 2015, 2016, 2017  CNRS
			
 
				  * Copyright (C) 2011, 2012 INRIA
			
 
				  * See the file version.doxy for copying conditions.
			
 
				  */
			
@@ -140,13 +140,13 @@ starpu_codelet_unpack_args().
 
				 \ingroup API_Insert_Task
			
 
				 Retrieve the arguments of type ::STARPU_VALUE associated to a
			
 
				 task automatically created using the function starpu_task_insert(). If
			
 
				-some parameter is NULL, unpacking will stop there and ignore the remaining
			
 
				+any parameter's value is 0, unpacking will stop there and ignore the remaining
			
 
				 parameters.
			
 
				 
			
 
				 \fn void starpu_codelet_unpack_args_and_copyleft(void *cl_arg, void *buffer, size_t buffer_size, ...)
			
 
				 \ingroup API_Insert_Task
			
 
				-Similar to starpu_codelet_unpack_args(), but if some parameter is
			
 
				-NULL, copy the part of cl_arg that has not been read in buffer which
			
 
				+Similar to starpu_codelet_unpack_args(), but if any parameter is
			
 
				+0, copy the part of cl_arg that has not been read in buffer which
			
 
				 can then be used in a later call to one of the unpack functions.
			
 
				 
			
 
				 \fn struct starpu_task *starpu_task_build(struct starpu_codelet *cl, ...)
			
--- a/examples/Makefile.am
+++ b/examples/Makefile.am
@@ -1,6 +1,6 @@
 
				 # StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				 #
			
 
				-# Copyright (C) 2009-2016  Université de Bordeaux
			
 
				+# Copyright (C) 2009-2017  Université de Bordeaux
			
 
				 # Copyright (C) 2010, 2011, 2012, 2013, 2014, 2015  CNRS
			
 
				 # Copyright (C) 2011  Télécom-SudParis
			
 
				 # Copyright (C) 2011-2012  INRIA
			
@@ -23,8 +23,10 @@ include $(top_srcdir)/starpu.mk
 
				 if STARPU_SIMGRID
			
 
				 STARPU_PERF_MODEL_DIR=$(abs_top_srcdir)/tools/perfmodels/sampling
			
 
				 STARPU_HOSTNAME=mirage
			
 
				+MALLOC_PERTURB_=0
			
 
				 export STARPU_PERF_MODEL_DIR
			
 
				 export STARPU_HOSTNAME
			
 
				+export MALLOC_PERTURB_
			
 
				 endif
			
 
				 
			
 
				 AM_CFLAGS = $(MAGMA_CFLAGS) $(HWLOC_CFLAGS) -Wall $(STARPU_CUDA_CPPFLAGS) $(STARPU_OPENCL_CPPFLAGS) $(GLOBAL_AM_CFLAGS) -Wno-unused
			
--- a/examples/mlr/mlr.c
+++ b/examples/mlr/mlr.c
@@ -119,14 +119,14 @@ static struct starpu_perfmodel cl_model_final = {
 
				 
			
 
				 static struct starpu_codelet cl_init = {
			
 
				 	.cpu_funcs = { cpu_func },
			
 
				-	.cpu_funcs_name = { "mlr_codelet_init" },
			
 
				+	.cpu_funcs_name = { "cpu_func" },
			
 
				 	.nbuffers = 0,
			
 
				 	.model = &cl_model_init,
			
 
				 };
			
 
				 
			
 
				 static struct starpu_codelet cl_final = {
			
 
				 	.cpu_funcs = { cpu_func },
			
 
				-	.cpu_funcs_name = { "mlr_codelet_final" },
			
 
				+	.cpu_funcs_name = { "cpu_func" },
			
 
				 	.nbuffers = 0,
			
 
				 	.model = &cl_model_final,
			
 
				 };
			
--- a/examples/pi/pi.c
+++ b/examples/pi/pi.c
@@ -2,7 +2,7 @@
 
				  *
			
 
				  * Copyright (C) 2010-2011, 2013-2015  Université de Bordeaux
			
 
				  * Copyright (C) 2010  Mehdi Juhoor <mjuhoor@gmail.com>
			
 
				- * Copyright (C) 2010, 2011, 2012, 2013, 2016  CNRS
			
 
				+ * Copyright (C) 2010, 2011, 2012, 2013, 2016, 2017  CNRS
			
 
				  *
			
 
				  * StarPU is free software; you can redistribute it and/or modify
			
 
				  * it under the terms of the GNU Lesser General Public License as published by
			
@@ -146,7 +146,7 @@ int main(int argc, char **argv)
 
				 	starpu_vector_data_register(&sobol_qrng_direction_handle, STARPU_MAIN_RAM,
			
 
				 		(uintptr_t)sobol_qrng_directions, n_dimensions*n_directions, sizeof(unsigned));
			
 
				 
			
 
				-	unsigned *cnt_array = malloc(ntasks*sizeof(unsigned));
			
 
				+	unsigned *cnt_array = calloc(ntasks, sizeof(unsigned));
			
 
				 	STARPU_ASSERT(cnt_array);
			
 
				 	starpu_data_handle_t cnt_array_handle;
			
 
				 	starpu_vector_data_register(&cnt_array_handle, STARPU_MAIN_RAM, (uintptr_t)cnt_array, ntasks, sizeof(unsigned));
			
@@ -161,7 +161,7 @@ int main(int argc, char **argv)
 
				 		.filter_func = starpu_vector_filter_block,
			
 
				 		.nchildren = ntasks
			
 
				 	};
			
 
				-	
			
 
				+
			
 
				 	starpu_data_partition(cnt_array_handle, &f);
			
 
				 
			
 
				 	double start;
			
--- a/examples/pi/pi_redux.c
+++ b/examples/pi/pi_redux.c
@@ -1,6 +1,6 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				- * Copyright (C) 2010-2015  Université de Bordeaux
			
 
				+ * Copyright (C) 2010-2015, 2017  Université de Bordeaux
			
 
				  * Copyright (C) 2016  CNRS
			
 
				  *
			
 
				  * StarPU is free software; you can redistribute it and/or modify
			
@@ -158,7 +158,7 @@ void pi_func_cpu(void *descr[], void *cl_arg STARPU_ATTRIBUTE_UNUSED)
 
				 	unsigned short *worker_xsub;
			
 
				 	worker_xsub = &xsubi[PADDING*workerid];
			
 
				 
			
 
				-	struct drand48_data *buffer;
			
 
				+	starpu_drand48_data *buffer;
			
 
				 	buffer = &randbuffer[PADDING*workerid];
			
 
				 
			
 
				 	unsigned long local_cnt = 0;
			
--- a/examples/sched_ctx/nested_sched_ctxs.c
+++ b/examples/sched_ctx/nested_sched_ctxs.c
@@ -1,7 +1,7 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				  * Copyright (C) 2010-2015  Université de Bordeaux
			
 
				- * Copyright (C) 2010-2014, 2016  CNRS
			
 
				+ * Copyright (C) 2010-2014, 2016, 2017  CNRS
			
 
				  *
			
 
				  * StarPU is free software; you can redistribute it and/or modify
			
 
				  * it under the terms of the GNU Lesser General Public License as published by
			
@@ -51,8 +51,10 @@ int parallel_code(int sched_ctx)
 
				 static void sched_ctx_func(void *descr[] STARPU_ATTRIBUTE_UNUSED, void *arg)
			
 
				 {
			
 
				 	int w = starpu_worker_get_id();
			
 
				+	(void) w;
			
 
				 	unsigned sched_ctx = (uintptr_t)arg;
			
 
				 	int n = parallel_code(sched_ctx);
			
 
				+	(void) n;
			
 
				 	//printf("w %d executed %d it \n", w, n);
			
 
				 }
			
 
				 
			
--- a/examples/sched_ctx/parallel_code.c
+++ b/examples/sched_ctx/parallel_code.c
@@ -1,7 +1,7 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				  * Copyright (C) 2010-2014, 2016  Université de Bordeaux
			
 
				- * Copyright (C) 2010-2016  CNRS
			
 
				+ * Copyright (C) 2010-2017  CNRS
			
 
				  *
			
 
				  * StarPU is free software; you can redistribute it and/or modify
			
 
				  * it under the terms of the GNU Lesser General Public License as published by
			
@@ -87,8 +87,8 @@ int main(int argc, char **argv)
 
				 		return 77;
			
 
				 	STARPU_CHECK_RETURN_VALUE(ret, "starpu_init");
			
 
				 
			
 
				-	int nprocs1 = 1;
			
 
				-	int nprocs2 = 1;
			
 
				+	int nprocs1;
			
 
				+	int nprocs2;
			
 
				 	int *procs1, *procs2;
			
 
				 
			
 
				 #ifdef STARPU_USE_CPU
			
@@ -103,6 +103,8 @@ int main(int argc, char **argv)
 
				 	for(j = nprocs1; j < nprocs1+nprocs2; j++)
			
 
				 		procs2[k++] = j;
			
 
				 #else
			
 
				+	nprocs1 = 1;
			
 
				+	nprocs2 = 1;
			
 
				 	procs1 = (int*)malloc(nprocs1*sizeof(int));
			
 
				 	procs2 = (int*)malloc(nprocs2*sizeof(int));
			
 
				 	procs1[0] = 0;
			
--- a/examples/sched_ctx/two_cpu_contexts.c
+++ b/examples/sched_ctx/two_cpu_contexts.c
@@ -85,14 +85,14 @@ int main(int argc, char **argv)
 
				 	for (i=0; i < n; i++)
			
 
				 	{
			
 
				 		int arg_id = 1*1000 + i;
			
 
				-		ret = starpu_insert_task(&sched_ctx_codelet, STARPU_VALUE, &arg_id, sizeof(int), STARPU_SCHED_CTX, sched_ctx1, NULL);
			
 
				+		ret = starpu_task_insert(&sched_ctx_codelet, STARPU_VALUE, &arg_id, sizeof(int), STARPU_SCHED_CTX, sched_ctx1, 0);
			
 
				 		STARPU_CHECK_RETURN_VALUE(ret, "starpu_task_submit");
			
 
				 	}
			
 
				 
			
 
				 	for (i=0; i < n; i++)
			
 
				 	{
			
 
				 		int arg_id = 2*1000 + i;
			
 
				-		ret = starpu_insert_task(&sched_ctx_codelet, STARPU_VALUE, &arg_id, sizeof(int), STARPU_SCHED_CTX, sched_ctx2, NULL);
			
 
				+		ret = starpu_task_insert(&sched_ctx_codelet, STARPU_VALUE, &arg_id, sizeof(int), STARPU_SCHED_CTX, sched_ctx2, 0);
			
 
				 		STARPU_CHECK_RETURN_VALUE(ret, "starpu_task_submit");
			
 
				 	}
			
 
				 
			
@@ -101,7 +101,7 @@ int main(int argc, char **argv)
 
				 	for (i=0; i < n; i++)
			
 
				 	{
			
 
				 		int arg_id = 1*10000 + i;
			
 
				-		ret = starpu_insert_task(&sched_ctx_codelet, STARPU_VALUE, &arg_id, sizeof(int), STARPU_SCHED_CTX, sched_ctx1, NULL);
			
 
				+		ret = starpu_task_insert(&sched_ctx_codelet, STARPU_VALUE, &arg_id, sizeof(int), STARPU_SCHED_CTX, sched_ctx1, 0);
			
 
				 		STARPU_CHECK_RETURN_VALUE(ret, "starpu_task_submit");
			
 
				 	}
			
 
				 
			
--- a/examples/spmv/matrix_market/example_read.c
+++ b/examples/spmv/matrix_market/example_read.c
@@ -1,6 +1,6 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				- * Copyright (C) 2010  CNRS
			
 
				+ * Copyright (C) 2010, 2017  CNRS
			
 
				  *
			
 
				  * StarPU is free software; you can redistribute it and/or modify
			
 
				  * it under the terms of the GNU Lesser General Public License as published by
			
@@ -13,6 +13,7 @@
 
				  *
			
 
				  * See the GNU Lesser General Public License in COPYING.LGPL for more details.
			
 
				  */
			
 
				+
			
 
				 #include "mm_to_bcsr.h"
			
 
				 
			
 
				 int main(int argc, char *argv[])
			
@@ -30,6 +31,7 @@ int main(int argc, char *argv[])
 
				 
			
 
				 	bcsr_t *bcsr;
			
 
				 	bcsr = mm_file_to_bcsr(argv[1], c, r);
			
 
				+	(void) bcsr;
			
 
				 
			
 
				 	return 0;
			
 
				 }
			
--- a/examples/stencil/implicit-stencil-kernels.c
+++ b/examples/stencil/implicit-stencil-kernels.c
@@ -1,7 +1,7 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				  * Copyright (C) 2010-2015  Université de Bordeaux
			
 
				- * Copyright (C) 2012, 2013, 2016  CNRS
			
 
				+ * Copyright (C) 2012, 2013, 2016, 2017  CNRS
			
 
				  *
			
 
				  * StarPU is free software; you can redistribute it and/or modify
			
 
				  * it under the terms of the GNU Lesser General Public License as published by
			
@@ -571,6 +571,7 @@ static void dummy_func_bottom_cuda(void *descr[] STARPU_ATTRIBUTE_UNUSED, void *
 
				 	unsigned z;
			
 
				 	starpu_codelet_unpack_args(arg, &z);
			
 
				 	struct block_description *block = get_block_description(z);
			
 
				+	(void) block;
			
 
				 
			
 
				 	int workerid = starpu_worker_get_id_check();
			
 
				 	bottom_per_worker[workerid]++;
			
@@ -605,9 +606,10 @@ static void dummy_func_top_opencl(void *descr[] STARPU_ATTRIBUTE_UNUSED, void *a
 
				 /* bottom save, OPENCL version */
			
 
				 static void dummy_func_bottom_opencl(void *descr[] STARPU_ATTRIBUTE_UNUSED, void *arg)
			
 
				 {
			
 
				-    unsigned z;
			
 
				-    starpu_codelet_unpack_args(arg, &z);
			
 
				+	unsigned z;
			
 
				+	starpu_codelet_unpack_args(arg, &z);
			
 
				 	struct block_description *block = get_block_description(z);
			
 
				+	(void) block;
			
 
				 
			
 
				 	int workerid = starpu_worker_get_id_check();
			
 
				 	bottom_per_worker[workerid]++;
			
--- a/examples/stencil/life_opencl.c
+++ b/examples/stencil/life_opencl.c
@@ -1,7 +1,7 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				  * Copyright (C) 2010-2011, 2013-2014  Université de Bordeaux
			
 
				- * Copyright (C) 2016  CNRS
			
 
				+ * Copyright (C) 2016, 2017  CNRS
			
 
				  *
			
 
				  * StarPU is free software; you can redistribute it and/or modify
			
 
				  * it under the terms of the GNU Lesser General Public License as published by
			
--- a/examples/stencil/stencil-kernels.c
+++ b/examples/stencil/stencil-kernels.c
@@ -1,7 +1,7 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				  * Copyright (C) 2010-2015  Université de Bordeaux
			
 
				- * Copyright (C) 2012, 2013, 2016  CNRS
			
 
				+ * Copyright (C) 2012, 2013, 2016, 2017  CNRS
			
 
				  *
			
 
				  * StarPU is free software; you can redistribute it and/or modify
			
 
				  * it under the terms of the GNU Lesser General Public License as published by
			
@@ -520,6 +520,7 @@ void dummy_func_top_cpu(void *descr[] STARPU_ATTRIBUTE_UNUSED, void *arg)
 
				 void dummy_func_bottom_cpu(void *descr[] STARPU_ATTRIBUTE_UNUSED, void *arg)
			
 
				 {
			
 
				 	struct block_description *block = (struct block_description *) arg;
			
 
				+	(void) block;
			
 
				 	int workerid = starpu_worker_get_id_check();
			
 
				 	bottom_per_worker[workerid]++;
			
 
				 
			
@@ -550,6 +551,7 @@ static void dummy_func_top_cuda(void *descr[] STARPU_ATTRIBUTE_UNUSED, void *arg
 
				 static void dummy_func_bottom_cuda(void *descr[] STARPU_ATTRIBUTE_UNUSED, void *arg)
			
 
				 {
			
 
				 	struct block_description *block = (struct block_description *) arg;
			
 
				+	(void) block;
			
 
				 	int workerid = starpu_worker_get_id_check();
			
 
				 	bottom_per_worker[workerid]++;
			
 
				 
			
@@ -565,6 +567,7 @@ static void dummy_func_bottom_cuda(void *descr[] STARPU_ATTRIBUTE_UNUSED, void *
 
				 static void dummy_func_top_opencl(void *descr[] STARPU_ATTRIBUTE_UNUSED, void *arg)
			
 
				 {
			
 
				 	struct block_description *block = (struct block_description *) arg;
			
 
				+	(void) block;
			
 
				 	int workerid = starpu_worker_get_id_check();
			
 
				 	top_per_worker[workerid]++;
			
 
				 
			
@@ -581,6 +584,7 @@ static void dummy_func_top_opencl(void *descr[] STARPU_ATTRIBUTE_UNUSED, void *a
 
				 static void dummy_func_bottom_opencl(void *descr[] STARPU_ATTRIBUTE_UNUSED, void *arg)
			
 
				 {
			
 
				 	struct block_description *block = (struct block_description *) arg;
			
 
				+	(void) block;
			
 
				 	int workerid = starpu_worker_get_id_check();
			
 
				 	bottom_per_worker[workerid]++;
			
 
				 
			
--- a/examples/stencil/stencil-tasks.c
+++ b/examples/stencil/stencil-tasks.c
@@ -1,7 +1,7 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				  * Copyright (C) 2010, 2013-2015  Université de Bordeaux
			
 
				- * Copyright (C) 2012, 2013, 2015  CNRS
			
 
				+ * Copyright (C) 2012, 2013, 2015, 2017  CNRS
			
 
				  *
			
 
				  * StarPU is free software; you can redistribute it and/or modify
			
 
				  * it under the terms of the GNU Lesser General Public License as published by
			
@@ -78,6 +78,7 @@ static void create_task_save_local(unsigned iter, unsigned z, int dir, int local
 
				 static void send_done(void *arg)
			
 
				 {
			
 
				 	uintptr_t z = (uintptr_t) arg;
			
 
				+	(void) z;
			
 
				 	DEBUG("DO SEND %d\n", (int)z);
			
 
				 }
			
 
				 
			
@@ -106,6 +107,7 @@ static void create_task_save_mpi_send(unsigned iter, unsigned z, int dir, int lo
 
				 static void recv_done(void *arg)
			
 
				 {
			
 
				 	uintptr_t z = (uintptr_t) arg;
			
 
				+	(void) z;
			
 
				 	DEBUG("DO RECV %d\n", (int)z);
			
 
				 }
			
 
				 
			
--- a/gcc-plugin/examples/cholesky/cholesky.c
+++ b/gcc-plugin/examples/cholesky/cholesky.c
@@ -137,7 +137,7 @@ int main(int argc, char **argv)
 
				 		{
			
 
				 			for(x=0 ; x<nblocks ; x++)
			
 
				 			{
			
 
				-                                printf("Block %d,%d :\n", x, y);
			
 
				+                                printf("Block %u,%u :\n", x, y);
			
 
				 				for (j = 0; j < BLOCKSIZE; j++)
			
 
				 				{
			
 
				 					for (i = 0; i < BLOCKSIZE; i++)
			
@@ -163,7 +163,7 @@ int main(int argc, char **argv)
 
				 		{
			
 
				 			for(x=0 ; x<nblocks ; x++)
			
 
				 			{
			
 
				-                                printf("Block %d,%d :\n", x, y);
			
 
				+                                printf("Block %u,%u :\n", x, y);
			
 
				 				for (j = 0; j < BLOCKSIZE; j++)
			
 
				 				{
			
 
				 					for (i = 0; i < BLOCKSIZE; i++)
			
@@ -237,7 +237,7 @@ int main(int argc, char **argv)
 
				 									float orig = (1.0f/(1.0f+i+j)) + ((i == j)?1.0f*size:0.0f);
			
 
				 									float err = abs(test_mat[j +i*size] - orig);
			
 
				 									if (err > 0.00001) {
			
 
				-										fprintf(stderr, "Error[%d, %d] --> %2.2f != %2.2f (err %2.2f)\n", i, j, test_mat[j +i*size], orig, err);
			
 
				+										fprintf(stderr, "Error[%u, %u] --> %2.2f != %2.2f (err %2.2f)\n", i, j, test_mat[j +i*size], orig, err);
			
 
				 										correctness = 0;
			
 
				 										break;
			
 
				 									}
			
--- a/include/starpu_rand.h
+++ b/include/starpu_rand.h
@@ -1,6 +1,6 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				- * Copyright (C) 2012, 2013  CNRS
			
 
				+ * Copyright (C) 2012, 2013, 2017  CNRS
			
 
				  *
			
 
				  * StarPU is free software; you can redistribute it and/or modify
			
 
				  * it under the terms of the GNU Lesser General Public License as published by
			
@@ -48,7 +48,7 @@ typedef int starpu_drand48_data;
 
				 #    define starpu_srand48_r(seed, buffer)		srand48(starpu_seed(seed))
			
 
				 #    define starpu_drand48_r(buffer, result)		do {*(result) = drand48(); } while (0)
			
 
				 #    define starpu_lrand48_r(buffer, result)		do {*(result) = lrand48(); } while (0)
			
 
				-#    define starpu_erand48_r(xsubi, buffer, result)	do {*(result) = erand48(xsubi); } while (0)
			
 
				+#    define starpu_erand48_r(xsubi, buffer, result)	do {(void) buffer; *(result) = erand48(xsubi); } while (0)
			
 
				 #  endif
			
 
				 #else
			
 
				 typedef int starpu_drand48_data;
			
@@ -57,7 +57,7 @@ typedef int starpu_drand48_data;
 
				 #  define starpu_lrand48() 				rand()
			
 
				 #  define starpu_erand48(xsubi)				starpu_drand48()
			
 
				 #  define starpu_srand48_r(seed, buffer) 		srand(starpu_seed(seed))
			
 
				-#  define starpu_erand48_r(xsubi, buffer, result)	do {*(result) = ((double)(rand()) / RAND_MAX);} while (0)
			
 
				+#  define starpu_erand48_r(xsubi, buffer, result)	do {(void) xsubi; (void) buffer; *(result) = ((double)(rand()) / RAND_MAX);} while (0)
			
 
				 #endif
			
 
				 
			
 
				 #ifdef __cplusplus
			
--- a/include/starpu_task.h
+++ b/include/starpu_task.h
@@ -1,6 +1,6 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				- * Copyright (C) 2010-2016  Université de Bordeaux
			
 
				+ * Copyright (C) 2010-2017  Université de Bordeaux
			
 
				  * Copyright (C) 2010, 2011, 2012, 2013, 2014  CNRS
			
 
				  * Copyright (C) 2011  Télécom-SudParis
			
 
				  * Copyright (C) 2011, 2014, 2016  INRIA
			
@@ -322,6 +322,9 @@ void starpu_codelet_display_stats(struct starpu_codelet *cl);
 
				 
			
 
				 struct starpu_task *starpu_task_get_current(void);
			
 
				 
			
 
				+const char *starpu_task_get_model_name(struct starpu_task *task);
			
 
				+const char *starpu_task_get_name(struct starpu_task *task);
			
 
				+
			
 
				 void starpu_parallel_task_barrier_init(struct starpu_task *task, int workerid);
			
 
				 void starpu_parallel_task_barrier_init_n(struct starpu_task *task, int worker_size);
			
 
				 
			
--- a/mpi/src/starpu_mpi.c
+++ b/mpi/src/starpu_mpi.c
@@ -1,6 +1,6 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				- * Copyright (C) 2009, 2010-2016  Université de Bordeaux
			
 
				+ * Copyright (C) 2009, 2010-2017  Université de Bordeaux
			
 
				  * Copyright (C) 2010, 2011, 2012, 2013, 2014, 2015, 2016  CNRS
			
 
				  * Copyright (C) 2016  Inria
			
 
				  *
			
@@ -77,6 +77,8 @@ static int running = 0;
 
				 static int _mpi_world_size;
			
 
				 static int _mpi_world_rank;
			
 
				 #endif
			
 
				+int _starpu_mpi_fake_world_size = -1;
			
 
				+int _starpu_mpi_fake_world_rank = -1;
			
 
				 
			
 
				 /* Count requests posted by the application and not yet submitted to MPI */
			
 
				 static starpu_pthread_mutex_t mutex_posted_requests;
			
@@ -296,6 +298,11 @@ static void _starpu_mpi_submit_ready_request(void *arg)
 
				 	_STARPU_MPI_LOG_OUT();
			
 
				 }
			
 
				 
			
 
				+static void nop_acquire_cb(void *arg)
			
 
				+{
			
 
				+	starpu_data_release(arg);
			
 
				+}
			
 
				+
			
 
				 static struct _starpu_mpi_req *_starpu_mpi_isend_irecv_common(starpu_data_handle_t data_handle,
			
 
				 							      int srcdst, int data_tag, MPI_Comm comm,
			
 
				 							      unsigned detached, unsigned sync, void (*callback)(void *), void *arg,
			
@@ -307,6 +314,12 @@ static struct _starpu_mpi_req *_starpu_mpi_isend_irecv_common(starpu_data_handle
 
				 {
			
 
				 	struct _starpu_mpi_req *req;
			
 
				 
			
 
				+	if (_starpu_mpi_fake_world_size != -1)
			
 
				+	{
			
 
				+		starpu_data_acquire_cb_sequential_consistency(data_handle, mode, nop_acquire_cb, data_handle, sequential_consistency);
			
 
				+		return NULL;
			
 
				+	}
			
 
				+
			
 
				 	_STARPU_MPI_LOG_IN();
			
 
				 	_STARPU_MPI_INC_POSTED_REQUESTS(1);
			
 
				 
			
@@ -1292,6 +1305,8 @@ static void *_starpu_mpi_progress_thread_func(void *arg)
 
				 	_mpi_world_size = worldsize;
			
 
				 	_mpi_world_rank = rank;
			
 
				 #endif
			
 
				+	_starpu_mpi_fake_world_size = starpu_get_env_number("STARPU_MPI_FAKE_SIZE");
			
 
				+	_starpu_mpi_fake_world_rank = starpu_get_env_number("STARPU_MPI_FAKE_RANK");
			
 
				 
			
 
				 #ifdef STARPU_SIMGRID
			
 
				 	/* Now that MPI is set up, let the rest of simgrid get initialized */
			
@@ -1898,6 +1913,11 @@ void starpu_mpi_data_migrate(MPI_Comm comm, starpu_data_handle_t data, int new_r
 
				 
			
 
				 int starpu_mpi_comm_size(MPI_Comm comm, int *size)
			
 
				 {
			
 
				+	if (_starpu_mpi_fake_world_size != -1)
			
 
				+	{
			
 
				+		*size = _starpu_mpi_fake_world_size;
			
 
				+		return 0;
			
 
				+	}
			
 
				 #ifdef STARPU_SIMGRID
			
 
				 	STARPU_MPI_ASSERT_MSG(comm == MPI_COMM_WORLD, "StarPU-SMPI only works with MPI_COMM_WORLD for now");
			
 
				 	*size = _mpi_world_size;
			
@@ -1909,6 +1929,11 @@ int starpu_mpi_comm_size(MPI_Comm comm, int *size)
 
				 
			
 
				 int starpu_mpi_comm_rank(MPI_Comm comm, int *rank)
			
 
				 {
			
 
				+	if (_starpu_mpi_fake_world_rank != -1)
			
 
				+	{
			
 
				+		*rank = _starpu_mpi_fake_world_rank;
			
 
				+		return 0;
			
 
				+	}
			
 
				 #ifdef STARPU_SIMGRID
			
 
				 	STARPU_MPI_ASSERT_MSG(comm == MPI_COMM_WORLD, "StarPU-SMPI only works with MPI_COMM_WORLD for now");
			
 
				 	*rank = _mpi_world_rank;
			
--- a/mpi/src/starpu_mpi_private.h
+++ b/mpi/src/starpu_mpi_private.h
@@ -39,6 +39,8 @@ extern int _starpu_debug_level_max;
 
				 void _starpu_mpi_set_debug_level_min(int level);
			
 
				 void _starpu_mpi_set_debug_level_max(int level);
			
 
				 #endif
			
 
				+extern int _starpu_mpi_fake_world_size;
			
 
				+extern int _starpu_mpi_fake_world_rank;
			
 
				 
			
 
				 #ifdef STARPU_NO_ASSERT
			
 
				 #  define STARPU_MPI_ASSERT_MSG(x, msg, ...)	do { if (0) { (void) (x); }} while(0)
			
--- a/socl/examples/basicsplit/basicsplit.c
+++ b/socl/examples/basicsplit/basicsplit.c
@@ -203,7 +203,7 @@ int main(int UNUSED(argc), char** UNUSED(argv)) {
 
				   cl_uint niter = 15;
			
 
				 
			
 
				    for (i=0; i<niter; i++) {
			
 
				-      printf("Iteration %d...\n", i);
			
 
				+      printf("Iteration %u...\n", i);
			
 
				      add(cq, SIZE, s1, s2, d, 0, NULL, NULL);
			
 
				       printf("Finishing iteration...\n");
			
 
				       clFinish(cq);
			
--- a/socl/examples/clinfo/clinfo.c
+++ b/socl/examples/clinfo/clinfo.c
@@ -1,6 +1,6 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				- * Copyright (C) 2010,2011 University of Bordeaux
			
 
				+ * Copyright (C) 2010,2011, 2017 University of Bordeaux
			
 
				  *
			
 
				  * StarPU is free software; you can redistribute it and/or modify
			
 
				  * it under the terms of the GNU Lesser General Public License as published by
			
@@ -92,7 +92,7 @@ main(void) {
 
				          printf("  Plaform Name:\t\t\t\t\t %s\n", str);
			
 
				 
			
 
				          err = clGetDeviceIDs(platforms[i], CL_DEVICE_TYPE_ALL, 0, NULL, &num_devices);
			
 
				-         checkErr(err, "clGetDeviceIds(CL_DEVICE_TYPE_ALL)");
			
 
				+         checkErr(err, "clGetDeviceIDs(CL_DEVICE_TYPE_ALL)");
			
 
				          if (num_devices == 0) {
			
 
				             printf("  No devices found\n");
			
 
				             continue;
			
@@ -101,7 +101,10 @@ main(void) {
 
				          cl_device_id devices[num_devices];
			
 
				 
			
 
				          err = clGetDeviceIDs(platforms[i], CL_DEVICE_TYPE_ALL, num_devices, devices, NULL);
			
 
				-         checkErr(err, "clGetDeviceIds(CL_DEVICE_TYPE_ALL)");
			
 
				+         if (err == CL_DEVICE_NOT_FOUND)
			
 
				+            num_devices = 0;
			
 
				+         else
			
 
				+            checkErr(err, "clGetDeviceIDs(CL_DEVICE_TYPE_ALL)");
			
 
				 
			
 
				          printf("  Number of devices:\t\t\t\t %d\n", num_devices);
			
 
				          {
			
--- a/socl/src/cl_createbuffer.c
+++ b/socl/src/cl_createbuffer.c
@@ -127,8 +127,8 @@ soclCreateBuffer(cl_context   context,
 
				    }
			
 
				 
			
 
				    // Access mode
			
 
				-   mem->mode = flags & CL_MEM_READ_ONLY  ? CL_MEM_READ_ONLY :
			
 
				-               flags & CL_MEM_WRITE_ONLY ? CL_MEM_WRITE_ONLY : CL_MEM_READ_WRITE;
			
 
				+   mem->mode = (flags & CL_MEM_READ_ONLY) ? CL_MEM_READ_ONLY :
			
 
				+	   (flags & CL_MEM_WRITE_ONLY) ? CL_MEM_WRITE_ONLY : CL_MEM_READ_WRITE;
			
 
				 
			
 
				    // Perform data copy if necessary
			
 
				    if (flags & CL_MEM_COPY_HOST_PTR)
			
--- a/src/common/utils.h
+++ b/src/common/utils.h
@@ -1,7 +1,7 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				  * Copyright (C) 2010, 2012-2016  Université de Bordeaux
			
 
				- * Copyright (C) 2010, 2011, 2012, 2013, 2015, 2016  CNRS
			
 
				+ * Copyright (C) 2010, 2011, 2012, 2013, 2015, 2016, 2017  CNRS
			
 
				  *
			
 
				  * StarPU is free software; you can redistribute it and/or modify
			
 
				  * it under the terms of the GNU Lesser General Public License as published by
			
@@ -107,6 +107,7 @@
 
				 #endif
			
 
				 
			
 
				 /* TODO: cache */
			
 
				+#define _STARPU_MSG(fmt, ...) do { fprintf(stderr, STARPU_DEBUG_PREFIX"[%s] " fmt ,__starpu_func__ ,## __VA_ARGS__); } while(0)
			
 
				 #define _STARPU_DISP(fmt, ...) do { if (!_starpu_silent) {fprintf(stderr, STARPU_DEBUG_PREFIX"[%s] " fmt ,__starpu_func__ ,## __VA_ARGS__); }} while(0)
			
 
				 #define _STARPU_ERROR(fmt, ...)                                                  \
			
 
				 	do {                                                                          \
			
--- a/src/core/dependencies/tags.c
+++ b/src/core/dependencies/tags.c
@@ -1,7 +1,7 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				  * Copyright (C) 2009-2013, 2016  Université de Bordeaux
			
 
				- * Copyright (C) 2010, 2011, 2012, 2013, 2016  CNRS
			
 
				+ * Copyright (C) 2010, 2011, 2012, 2013, 2016, 2017  CNRS
			
 
				  * Copyright (C) 2016  Inria
			
 
				  *
			
 
				  * StarPU is free software; you can redistribute it and/or modify
			
@@ -108,7 +108,7 @@ static void _starpu_tag_free(void *_tag)
 
				 			struct _starpu_cg *cg = tag->tag_successors.succ[succ];
			
 
				 
			
 
				 			unsigned ntags = STARPU_ATOMIC_ADD(&cg->ntags, -1);
			
 
				-			unsigned remaining STARPU_ATTRIBUTE_UNUSED = STARPU_ATOMIC_ADD(&cg->remaining, -1);
			
 
				+			unsigned STARPU_ATTRIBUTE_UNUSED remaining = STARPU_ATOMIC_ADD(&cg->remaining, -1);
			
 
				 
			
 
				 			if (!ntags && (cg->cg_type == STARPU_CG_TAG))
			
 
				 				/* Last tag this cg depends on, cg becomes unreferenced */
			
--- a/src/core/sched_ctx.c
+++ b/src/core/sched_ctx.c
@@ -2682,7 +2682,7 @@ unsigned starpu_sched_ctx_has_starpu_scheduler(unsigned sched_ctx_id, unsigned *
 
				 	return sched_ctx->sched_policy != NULL;
			
 
				 }
			
 
				 
			
 
				-void *starpu_sched_ctx_get_used_data(unsigned sched_ctx_id)
			
 
				+void *starpu_sched_ctx_get_user_data(unsigned sched_ctx_id)
			
 
				 {
			
 
				 	struct _starpu_sched_ctx *sched_ctx = _starpu_get_sched_ctx_struct(sched_ctx_id);
			
 
				 	STARPU_ASSERT(sched_ctx != NULL);
			
--- a/src/core/sched_policy.c
+++ b/src/core/sched_policy.c
@@ -1,7 +1,7 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				  * Copyright (C) 2010-2016  Université de Bordeaux
			
 
				- * Copyright (C) 2010-2016  CNRS
			
 
				+ * Copyright (C) 2010-2017  CNRS
			
 
				  * Copyright (C) 2011, 2016  INRIA
			
 
				  * Copyright (C) 2016  Uppsala University
			
 
				  *
			
@@ -115,9 +115,12 @@ static struct starpu_sched_policy *find_sched_policy_from_name(const char *polic
 
				 	if (!policy_name)
			
 
				 		return NULL;
			
 
				 
			
 
				-	if (strncmp(policy_name, "heft", 5) == 0)
			
 
				+	if (strcmp(policy_name, "") == 0)
			
 
				+		return NULL;
			
 
				+
			
 
				+	if (strncmp(policy_name, "heft", 4) == 0)
			
 
				 	{
			
 
				-		_STARPU_DISP("Warning: heft is now called \"dmda\".\n");
			
 
				+		_STARPU_MSG("Warning: heft is now called \"dmda\".\n");
			
 
				 		return &_starpu_sched_dmda_policy;
			
 
				 	}
			
 
				 
			
@@ -135,7 +138,7 @@ static struct starpu_sched_policy *find_sched_policy_from_name(const char *polic
 
				 		}
			
 
				 	}
			
 
				 	if (strcmp(policy_name, "help") != 0)
			
 
				-	     fprintf(stderr, "Warning: scheduling policy \"%s\" was not found, try \"help\" to get a list\n", policy_name);
			
 
				+		_STARPU_MSG("Warning: scheduling policy '%s' was not found, try 'help' to get a list\n", policy_name);
			
 
				 
			
 
				 	/* nothing was found */
			
 
				 	return NULL;
			
@@ -167,8 +170,12 @@ struct starpu_sched_policy *_starpu_select_sched_policy(struct _starpu_machine_c
 
				 	if(required_policy)
			
 
				 		selected_policy = find_sched_policy_from_name(required_policy);
			
 
				 
			
 
				+	/* If there is a policy that matches the required name, return it */
			
 
				+	if (selected_policy)
			
 
				+		return selected_policy;
			
 
				+
			
 
				 	/* First, we check whether the application explicitely gave a scheduling policy or not */
			
 
				-	if (!selected_policy && user_conf && (user_conf->sched_policy))
			
 
				+	if (user_conf && (user_conf->sched_policy))
			
 
				 		return user_conf->sched_policy;
			
 
				 
			
 
				 	/* Otherwise, we look if the application specified the name of a policy to load */
			
@@ -176,15 +183,14 @@ struct starpu_sched_policy *_starpu_select_sched_policy(struct _starpu_machine_c
 
				 	sched_pol_name = starpu_getenv("STARPU_SCHED");
			
 
				 	if (sched_pol_name == NULL && user_conf && user_conf->sched_policy_name)
			
 
				 		sched_pol_name = user_conf->sched_policy_name;
			
 
				-
			
 
				-	if (!selected_policy && sched_pol_name)
			
 
				+	if (sched_pol_name)
			
 
				 		selected_policy = find_sched_policy_from_name(sched_pol_name);
			
 
				 
			
 
				-	/* Perhaps there was no policy that matched the name */
			
 
				+	/* If there is a policy that matches the name, return it */
			
 
				 	if (selected_policy)
			
 
				 		return selected_policy;
			
 
				 
			
 
				-	/* If no policy was specified, we use the greedy policy as a default */
			
 
				+	/* If no policy was specified, we use the eager policy by default */
			
 
				 	return &_starpu_sched_eager_policy;
			
 
				 }
			
 
				 
			
--- a/src/core/simgrid.c
+++ b/src/core/simgrid.c
@@ -1,8 +1,8 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				- * Copyright (C) 2012-2016  Université de Bordeaux
			
 
				+ * Copyright (C) 2012-2017  Université de Bordeaux
			
 
				  * Copyright (C) 2016  	    Inria
			
 
				- * Copyright (C) 2016  	    CNRS
			
 
				+ * Copyright (C) 2016, 2017  	    CNRS
			
 
				  *
			
 
				  * StarPU is free software; you can redistribute it and/or modify
			
 
				  * it under the terms of the GNU Lesser General Public License as published by
			
@@ -25,6 +25,9 @@
 
				 #include <core/perfmodel/perfmodel.h>
			
 
				 #include <core/workers.h>
			
 
				 #include <core/simgrid.h>
			
 
				+#if defined(HAVE_SG_LINK_NAME) && (SIMGRID_VERSION_MAJOR >= 4 || (SIMGRID_VERSION_MAJOR == 3 && SIMGRID_VERSION_MINOR >= 13))
			
 
				+#include <simgrid/simdag.h>
			
 
				+#endif
			
 
				 
			
 
				 #ifdef STARPU_SIMGRID
			
 
				 #include <sys/resource.h>
			
@@ -101,7 +104,7 @@ int _starpu_simgrid_get_nbhosts(const char *prefix)
 
				 		STARPU_ASSERT(starpu_mpi_world_rank);
			
 
				 		snprintf(name, sizeof(name), STARPU_MPI_AS_PREFIX"%u", starpu_mpi_world_rank());
			
 
				 		hosts = MSG_environment_as_get_hosts(_starpu_simgrid_get_as_by_name(name));
			
 
				-		len = snprintf(new_prefix, sizeof(new_prefix), "%s-%s", name, prefix);
			
 
				+		snprintf(new_prefix, sizeof(new_prefix), "%s-%s", name, prefix);
			
 
				 		prefix = new_prefix;
			
 
				 		len = strlen(prefix);
			
 
				 	}
			
@@ -719,7 +722,7 @@ _starpu_simgrid_get_memnode_host(unsigned node)
 
				 
			
 
				 void _starpu_simgrid_count_ngpus(void)
			
 
				 {
			
 
				-#if defined(HAVE_SG_LINK_NAME) && SIMGRID_VERSION_MAJOR >= 4 || (SIMGRID_VERSION_MAJOR == 3 && SIMGRID_VERSION_MINOR >= 13)
			
 
				+#if defined(HAVE_SG_LINK_NAME) && (SIMGRID_VERSION_MAJOR >= 4 || (SIMGRID_VERSION_MAJOR == 3 && SIMGRID_VERSION_MINOR >= 13))
			
 
				 	unsigned src, dst;
			
 
				 	msg_host_t ramhost = _starpu_simgrid_get_host_by_name("RAM");
			
 
				 
			
--- a/src/core/topology.c
+++ b/src/core/topology.c
@@ -1,7 +1,7 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				  * Copyright (C) 2009-2016  Université de Bordeaux
			
 
				- * Copyright (C) 2010, 2011, 2012, 2013, 2014, 2015, 2016 CNRS
			
 
				+ * Copyright (C) 2010, 2011, 2012, 2013, 2014, 2015, 2016, 2017 CNRS
			
 
				  * Copyright (C) 2011, 2016  INRIA
			
 
				  * Copyright (C) 2016  Uppsala University
			
 
				  *
			
@@ -128,6 +128,7 @@ _starpu_get_worker_from_driver(struct starpu_driver *d)
 
				 #endif
			
 
				 
			
 
				 			default:
			
 
				+				(void) worker;
			
 
				 				_STARPU_DEBUG("Invalid device type\n");
			
 
				 				return NULL;
			
 
				 			}
			
@@ -530,7 +531,7 @@ _starpu_deallocate_topology_userdata(hwloc_obj_t obj)
 
				 	STARPU_ASSERT(!data->worker_list || data->worker_list == (void*)-1);
			
 
				 	free(data);
			
 
				 	for (i = 0; i < obj->arity; i++)
			
 
				-		_starpu_allocate_topology_userdata(obj->children[i]);
			
 
				+		_starpu_deallocate_topology_userdata(obj->children[i]);
			
 
				 }
			
 
				 #endif
			
 
				 #endif
			
@@ -556,7 +557,11 @@ _starpu_init_topology (struct _starpu_machine_config *config)
 
				 #ifndef STARPU_SIMGRID
			
 
				 #ifdef STARPU_HAVE_HWLOC
			
 
				 	hwloc_topology_init(&topology->hwtopology);
			
 
				+#if HWLOC_API_VERSION >= 0x20000
			
 
				+	hwloc_topology_set_io_types_filter(topology->hwtopology, HWLOC_TYPE_FILTER_KEEP_IMPORTANT);
			
 
				+#else
			
 
				 	hwloc_topology_set_flags(topology->hwtopology, HWLOC_TOPOLOGY_FLAG_IO_DEVICES | HWLOC_TOPOLOGY_FLAG_IO_BRIDGES);
			
 
				+#endif
			
 
				 	hwloc_topology_load(topology->hwtopology);
			
 
				 	_starpu_allocate_topology_userdata(hwloc_get_root_obj(topology->hwtopology));
			
 
				 #endif
			
--- a/src/core/workers.c
+++ b/src/core/workers.c
@@ -1,7 +1,7 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				- * Copyright (C) 2009-2016  Université de Bordeaux
			
 
				- * Copyright (C) 2010, 2011, 2012, 2013, 2014, 2015, 2016  CNRS
			
 
				+ * Copyright (C) 2009-2017  Université de Bordeaux
			
 
				+ * Copyright (C) 2010, 2011, 2012, 2013, 2014, 2015, 2016, 2017  CNRS
			
 
				  * Copyright (C) 2010, 2011  INRIA
			
 
				  * Copyright (C) 2011  Télécom-SudParis
			
 
				  * Copyright (C) 2011-2012, 2016  INRIA
			
@@ -21,6 +21,9 @@
 
				 
			
 
				 #include <stdlib.h>
			
 
				 #include <stdio.h>
			
 
				+#ifdef __linux__
			
 
				+#include <sys/utsname.h>
			
 
				+#endif
			
 
				 #include <common/config.h>
			
 
				 #include <common/utils.h>
			
 
				 #include <common/graph.h>
			
@@ -1145,18 +1148,27 @@ static void _fill_tree(struct starpu_tree *tree, hwloc_obj_t curr_obj, unsigned
 
				 static void _starpu_build_tree(void)
			
 
				 {
			
 
				 #ifdef STARPU_HAVE_HWLOC
			
 
				+	hwloc_topology_t cpu_topo;
			
 
				 	struct starpu_tree *tree;
			
 
				 	_STARPU_MALLOC(tree, sizeof(struct starpu_tree));
			
 
				 	_starpu_config.topology.tree = tree;
			
 
				 
			
 
				-	hwloc_obj_t root = hwloc_get_root_obj(_starpu_config.topology.hwtopology);
			
 
				+	hwloc_topology_init(&cpu_topo);
			
 
				+#if HWLOC_API_VERSION >= 0x20000
			
 
				+	hwloc_topology_set_all_types_filter(cpu_topo, HWLOC_TYPE_FILTER_KEEP_STRUCTURE);
			
 
				+#else
			
 
				+	hwloc_topology_ignore_all_keep_structure(cpu_topo);
			
 
				+#endif
			
 
				+	hwloc_topology_load(cpu_topo);
			
 
				+	hwloc_obj_t root = hwloc_get_root_obj(cpu_topo);
			
 
				 
			
 
				 /* 	char string[128]; */
			
 
				 /* 	hwloc_obj_snprintf(string, sizeof(string), topology, root, "#", 0); */
			
 
				 /* 	printf("%*s%s %d is_pu = %d \n", 0, "", string, root->logical_index, root->type == HWLOC_OBJ_PU); */
			
 
				 
			
 
				-	/* level, is_pu, is in the tree (it will be true only after add*/
			
 
				-	_fill_tree(tree, root, 0, _starpu_config.topology.hwtopology, NULL);
			
 
				+	/* level, is_pu, is in the tree (it will be true only after add) */
			
 
				+	_fill_tree(tree, root, 0, cpu_topo, NULL);
			
 
				+	hwloc_topology_destroy(cpu_topo);
			
 
				 #endif
			
 
				 }
			
 
				 
			
@@ -1265,6 +1277,15 @@ int starpu_initialize(struct starpu_conf *user_conf, int *argc, char ***argv)
 
				 #ifdef STARPU_MODEL_DEBUG
			
 
				 	_STARPU_DISP("Warning: StarPU was configured with --enable-model-debug, which slows down a bit\n");
			
 
				 #endif
			
 
				+#ifdef __linux__
			
 
				+	{
			
 
				+		struct utsname buf;
			
 
				+		if (uname(&buf) == 0
			
 
				+		 && (!strncmp(buf.release, "4.7.", 4)
			
 
				+		  || !strncmp(buf.release, "4.8.", 4)))
			
 
				+			_STARPU_DISP("Warning: This system is running a 4.7 or 4.8 kernel. These have a severe scheduling performance regression issue, please upgrade to at least 4.9.\n");
			
 
				+	}
			
 
				+#endif
			
 
				 #endif
			
 
				 
			
 
				 	if (starpu_getenv("STARPU_ENABLE_STATS"))
			
@@ -1759,6 +1780,13 @@ int starpu_worker_get_count_by_type(enum starpu_worker_archtype type)
 
				         case STARPU_MPI_WORKER:
			
 
				             return _starpu_config.topology.nmpidevices;
			
 
				 
			
 
				+		case STARPU_ANY_WORKER:
			
 
				+			return _starpu_config.topology.ncpus+
			
 
				+			       _starpu_config.topology.ncudagpus+
			
 
				+			       _starpu_config.topology.nopenclgpus+
			
 
				+			       _starpu_config.topology.nmicdevices+
			
 
				+			       _starpu_config.topology.nsccdevices+
			
 
				+		           _starpu_config.topology.nmpidevices;
			
 
				 		default:
			
 
				 			return -EINVAL;
			
 
				 	}
			
@@ -1953,7 +1981,7 @@ unsigned starpu_worker_get_ids_by_type(enum starpu_worker_archtype type, int *wo
 
				 	unsigned id;
			
 
				 	for (id = 0; id < nworkers; id++)
			
 
				 	{
			
 
				-		if (starpu_worker_get_type(id) == type)
			
 
				+		if (type == STARPU_ANY_WORKER || starpu_worker_get_type(id) == type)
			
 
				 		{
			
 
				 			/* Perhaps the array is too small ? */
			
 
				 			if (cnt >= maxsize)
			
@@ -1975,7 +2003,7 @@ int starpu_worker_get_by_type(enum starpu_worker_archtype type, int num)
 
				 	unsigned id;
			
 
				 	for (id = 0; id < nworkers; id++)
			
 
				 	{
			
 
				-		if (starpu_worker_get_type(id) == type)
			
 
				+		if (type == STARPU_ANY_WORKER || starpu_worker_get_type(id) == type)
			
 
				 		{
			
 
				 			if (num == cnt)
			
 
				 				return id;
			
@@ -2069,7 +2097,8 @@ int starpu_worker_get_stream_workerids(unsigned devid, int *workerids, enum star
 
				 	unsigned id;
			
 
				 	for (id = 0; id < nworkers; id++)
			
 
				 	{
			
 
				-		if (_starpu_config.workers[id].devid == devid && _starpu_config.workers[id].arch == type)
			
 
				+		if (_starpu_config.workers[id].devid == devid &&
			
 
				+		    (type == STARPU_ANY_WORKER || _starpu_config.workers[id].arch == type))
			
 
				 			workerids[nw++] = id;
			
 
				 	}
			
 
				 	return nw;
			
@@ -2129,7 +2158,7 @@ int starpu_worker_get_nids_by_type(enum starpu_worker_archtype type, int *worker
 
				 	unsigned id;
			
 
				 	for (id = 0; id < nworkers; id++)
			
 
				 	{
			
 
				-		if (starpu_worker_get_type(id) == type)
			
 
				+		if (type == STARPU_ANY_WORKER || starpu_worker_get_type(id) == type)
			
 
				 		{
			
 
				 			/* Perhaps the array is too small ? */
			
 
				 			if (cnt >= maxsize)
			
@@ -2150,7 +2179,7 @@ int starpu_worker_get_nids_ctx_free_by_type(enum starpu_worker_archtype type, in
 
				 
			
 
				 	for (id = 0; id < nworkers; id++)
			
 
				 	{
			
 
				-		if (starpu_worker_get_type(id) == type)
			
 
				+		if (type == STARPU_ANY_WORKER || starpu_worker_get_type(id) == type)
			
 
				 		{
			
 
				 			/* Perhaps the array is too small ? */
			
 
				 			if (cnt >= maxsize)
			
@@ -2213,6 +2242,7 @@ starpu_driver_run(struct starpu_driver *d)
 
				 		return _starpu_run_opencl(worker);
			
 
				 #endif
			
 
				 	default:
			
 
				+		(void) worker;
			
 
				 		_STARPU_DEBUG("Invalid device type\n");
			
 
				 		return -EINVAL;
			
 
				 	}
			
@@ -2239,6 +2269,7 @@ starpu_driver_init(struct starpu_driver *d)
 
				 		return _starpu_opencl_driver_init(worker);
			
 
				 #endif
			
 
				 	default:
			
 
				+		(void) worker;
			
 
				 		return -EINVAL;
			
 
				 	}
			
 
				 }
			
@@ -2264,6 +2295,7 @@ starpu_driver_run_once(struct starpu_driver *d)
 
				 		return _starpu_opencl_driver_run_once(worker);
			
 
				 #endif
			
 
				 	default:
			
 
				+		(void) worker;
			
 
				 		return -EINVAL;
			
 
				 	}
			
 
				 }
			
@@ -2289,6 +2321,7 @@ starpu_driver_deinit(struct starpu_driver *d)
 
				 		return _starpu_opencl_driver_deinit(worker);
			
 
				 #endif
			
 
				 	default:
			
 
				+		(void) worker;
			
 
				 		return -EINVAL;
			
 
				 	}
			
 
				 }
			
--- a/src/datawizard/memalloc.c
+++ b/src/datawizard/memalloc.c
@@ -1,6 +1,6 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				- * Copyright (C) 2009-2016  Université de Bordeaux
			
 
				+ * Copyright (C) 2009-2017  Université de Bordeaux
			
 
				  * Copyright (C) 2010, 2011, 2012, 2013, 2014, 2015, 2016  CNRS
			
 
				  * Copyright (C) 2016  Inria
			
 
				  *
			
@@ -33,6 +33,9 @@ static unsigned target_clean_p;
 
				 /* Whether CPU memory has been explicitly limited by user */
			
 
				 static int limit_cpu_mem;
			
 
				 
			
 
				+/* Prevent memchunks from being evicted from memory before they are actually used */
			
 
				+static int diduse_barrier;
			
 
				+
			
 
				 /* This per-node RW-locks protect mc_list and memchunk_cache entries */
			
 
				 /* Note: handle header lock is always taken before this (normal add/remove case) */
			
 
				 static struct _starpu_spinlock mc_lock[STARPU_MAXNODES];
			
@@ -133,6 +136,7 @@ void _starpu_init_mem_chunk_lists(void)
 
				 	minimum_clean_p = starpu_get_env_number_default("STARPU_MINIMUM_CLEAN_BUFFERS", 5);
			
 
				 	target_clean_p = starpu_get_env_number_default("STARPU_TARGET_CLEAN_BUFFERS", 10);
			
 
				 	limit_cpu_mem = starpu_get_env_number("STARPU_LIMIT_CPU_MEM");
			
 
				+	diduse_barrier = starpu_get_env_number_default("STARPU_DIDUSE_BARRIER", 0);
			
 
				 }
			
 
				 
			
 
				 void _starpu_deinit_mem_chunk_lists(void)
			
@@ -443,6 +447,10 @@ static size_t try_to_free_mem_chunk(struct _starpu_mem_chunk *mc, unsigned node)
 
				 	if ((int) node == handle->home_node)
			
 
				 		return 0;
			
 
				 
			
 
				+	if (diduse_barrier && !mc->diduse)
			
 
				+		/* Hasn't been used yet, avoid evicting it */
			
 
				+		return 0;
			
 
				+
			
 
				 	/* REDUX memchunk */
			
 
				 	if (mc->relaxed_coherency == 2)
			
 
				 	{
			
@@ -1160,6 +1168,7 @@ static struct _starpu_mem_chunk *_starpu_memchunk_init(struct _starpu_data_repli
 
				 	mc->chunk_interface = NULL;
			
 
				 	mc->size_interface = interface_size;
			
 
				 	mc->remove_notify = NULL;
			
 
				+	mc->diduse = 0;
			
 
				 
			
 
				 	return mc;
			
 
				 }
			
@@ -1455,6 +1464,7 @@ void _starpu_memchunk_recently_used(struct _starpu_mem_chunk *mc, unsigned node)
 
				 		/* user-allocated memory */
			
 
				 		return;
			
 
				 	_starpu_spin_lock(&mc_lock[node]);
			
 
				+	mc->diduse = 1;
			
 
				 	MC_LIST_ERASE(node, mc);
			
 
				 	MC_LIST_PUSH_BACK(node, mc);
			
 
				 	_starpu_spin_unlock(&mc_lock[node]);
			
@@ -1468,6 +1478,8 @@ void _starpu_memchunk_wont_use(struct _starpu_mem_chunk *mc, unsigned node)
 
				 		/* user-allocated memory */
			
 
				 		return;
			
 
				 	_starpu_spin_lock(&mc_lock[node]);
			
 
				+	/* Avoid preventing it from being evicted */
			
 
				+	mc->diduse = 1;
			
 
				 	MC_LIST_ERASE(node, mc);
			
 
				 	/* Caller will schedule a clean transfer */
			
 
				 	mc->clean = 1;
			
--- a/src/datawizard/memalloc.h
+++ b/src/datawizard/memalloc.h
@@ -1,6 +1,6 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				- * Copyright (C) 2009-2010, 2012-2015  Université de Bordeaux
			
 
				+ * Copyright (C) 2009-2010, 2012-2015, 2017  Université de Bordeaux
			
 
				  * Copyright (C) 2010, 2011, 2012, 2013  CNRS
			
 
				  *
			
 
				  * StarPU is free software; you can redistribute it and/or modify
			
@@ -73,6 +73,9 @@ LIST_TYPE(_starpu_mem_chunk,
 
				 	 * remove this entry from the mc_list, so we know we have to restart
			
 
				 	 * from zero. This is protected by the corresponding mc_lock.  */
			
 
				 	struct _starpu_mem_chunk **remove_notify;
			
 
				+
			
 
				+	/* Was this chunk used since it got allocated?  */
			
 
				+	int diduse;
			
 
				 )
			
 
				 
			
 
				 void _starpu_init_mem_chunk_lists(void);
			
--- a/src/drivers/cuda/driver_cuda.c
+++ b/src/drivers/cuda/driver_cuda.c
@@ -2,7 +2,7 @@
 
				  *
			
 
				  * Copyright (C) 2009-2016  Université de Bordeaux
			
 
				  * Copyright (C) 2010  Mehdi Juhoor <mjuhoor@gmail.com>
			
 
				- * Copyright (C) 2010, 2011, 2012, 2013, 2014, 2016  CNRS
			
 
				+ * Copyright (C) 2010, 2011, 2012, 2013, 2014, 2016, 2017  CNRS
			
 
				  * Copyright (C) 2011  Télécom-SudParis
			
 
				  * Copyright (C) 2016  Uppsala University
			
 
				  *
			
@@ -267,8 +267,6 @@ done:
 
				 
			
 
				 static void init_device_context(unsigned devid, unsigned memnode)
			
 
				 {
			
 
				-	unsigned i;
			
 
				-
			
 
				 #ifndef STARPU_SIMGRID
			
 
				 	cudaError_t cures;
			
 
				 
			
@@ -351,6 +349,7 @@ static void init_device_context(unsigned devid, unsigned memnode)
 
				 	if (STARPU_UNLIKELY(cures))
			
 
				 		STARPU_CUDA_REPORT_ERROR(cures);
			
 
				 
			
 
				+	unsigned i;
			
 
				 	for (i = 0; i < ncudagpus; i++)
			
 
				 	{
			
 
				 		cures = starpu_cudaStreamCreate(&in_peer_transfer_streams[i][devid]);
			
--- a/src/drivers/driver_common/driver_common.c
+++ b/src/drivers/driver_common/driver_common.c
@@ -1,7 +1,7 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				- * Copyright (C) 2010-2016  Université de Bordeaux
			
 
				- * Copyright (C) 2010, 2011, 2012, 2013, 2014, 2015, 2016  CNRS
			
 
				+ * Copyright (C) 2010-2017  Université de Bordeaux
			
 
				+ * Copyright (C) 2010, 2011, 2012, 2013, 2014, 2015, 2016, 2017  CNRS
			
 
				  * Copyright (C) 2011  Télécom-SudParis
			
 
				  * Copyright (C) 2014, 2016  INRIA
			
 
				  *
			
@@ -428,10 +428,7 @@ struct starpu_task *_starpu_get_worker_task(struct _starpu_worker *worker, int w
 
				 		_starpu_worker_set_status_sleeping(workerid);
			
 
				 
			
 
				 		if (_starpu_worker_can_block(memnode, worker)
			
 
				-#ifndef STARPU_SIMGRID
			
 
				-				&& !_starpu_sched_ctx_last_worker_awake(worker)
			
 
				-#endif
			
 
				-				)
			
 
				+			&& !_starpu_sched_ctx_last_worker_awake(worker))
			
 
				 		{
			
 
				 			STARPU_PTHREAD_COND_WAIT(&worker->sched_cond, &worker->sched_mutex);
			
 
				 			STARPU_PTHREAD_MUTEX_UNLOCK_SCHED(&worker->sched_mutex);
			
@@ -440,18 +437,7 @@ struct starpu_task *_starpu_get_worker_task(struct _starpu_worker *worker, int w
 
				 		{
			
 
				 			STARPU_PTHREAD_MUTEX_UNLOCK_SCHED(&worker->sched_mutex);
			
 
				 			if (_starpu_machine_is_running())
			
 
				-			{
			
 
				 				_starpu_exponential_backoff(worker);
			
 
				-#ifdef STARPU_SIMGRID
			
 
				-				static int warned;
			
 
				-				if (!warned)
			
 
				-				{
			
 
				-					warned = 1;
			
 
				-					_STARPU_DISP("Has to make simgrid spin for CPU idle time.  You can try to pass --enable-blocking-drivers to ./configure to avoid this\n");
			
 
				-				}
			
 
				-				MSG_process_sleep(0.000010);
			
 
				-#endif
			
 
				-			}
			
 
				 		}
			
 
				 
			
 
				 		return NULL;
			
@@ -583,10 +569,7 @@ int _starpu_get_multi_worker_task(struct _starpu_worker *workers, struct starpu_
 
				 		_starpu_worker_set_status_sleeping(workerid);
			
 
				 
			
 
				 		if (_starpu_worker_can_block(memnode, worker)
			
 
				-#ifndef STARPU_SIMGRID
			
 
				-				&& !_starpu_sched_ctx_last_worker_awake(worker)
			
 
				-#endif
			
 
				-				)
			
 
				+				&& !_starpu_sched_ctx_last_worker_awake(worker))
			
 
				 		{
			
 
				 			STARPU_PTHREAD_COND_WAIT(&worker->sched_cond, &worker->sched_mutex);
			
 
				 			STARPU_PTHREAD_MUTEX_UNLOCK_SCHED(&worker->sched_mutex);
			
@@ -595,25 +578,14 @@ int _starpu_get_multi_worker_task(struct _starpu_worker *workers, struct starpu_
 
				 		{
			
 
				 			STARPU_PTHREAD_MUTEX_UNLOCK_SCHED(&worker->sched_mutex);
			
 
				 			if (_starpu_machine_is_running())
			
 
				-			{
			
 
				 				_starpu_exponential_backoff(worker);
			
 
				-#ifdef STARPU_SIMGRID
			
 
				-				static int warned;
			
 
				-				if (!warned)
			
 
				-				{
			
 
				-					warned = 1;
			
 
				-					_STARPU_DISP("Has to make simgrid spin for CPU idle time.  You can try to pass --enable-blocking-drivers to ./configure to avoid this\n");
			
 
				-				}
			
 
				-				MSG_process_sleep(0.000010);
			
 
				-#endif
			
 
				-			}
			
 
				 		}
			
 
				 		return 0;
			
 
				 	}
			
 
				 
			
 
				 	_starpu_worker_set_status_wakeup(workerid);
			
 
				 	worker->spinning_backoff = BACKOFF_MIN;
			
 
				-#endif /* STARPU_SIMGRID */
			
 
				+#endif /* !STARPU_SIMGRID */
			
 
				 
			
 
				 	STARPU_PTHREAD_MUTEX_UNLOCK_SCHED(&workers[0].sched_mutex);
			
 
				 #endif /* !STARPU_NON_BLOCKING_DRIVERS */
			
--- a/src/sched_policies/component_perfmodel_select.c
+++ b/src/sched_policies/component_perfmodel_select.c
@@ -44,7 +44,14 @@ static int perfmodel_select_push_task(struct starpu_sched_component * component,
 
				 	if(can_execute)
			
 
				 	{
			
 
				 		if(isnan(length))
			
 
				+		{
			
 
				+			static int warned;
			
 
				+			if (!warned) {
			
 
				+				warned = 1;
			
 
				+				_STARPU_DISP("Warning: performance model for %s not finished calibrating, using a dumb scheduling heuristic for now\n",starpu_task_get_name(task));
			
 
				+			}
			
 
				 			return starpu_sched_component_push_task(component,data->calibrator_component,task);
			
 
				+		}
			
 
				 		if(_STARPU_IS_ZERO(length))
			
 
				 			return starpu_sched_component_push_task(component,data->no_perfmodel_component,task);
			
 
				 		return starpu_sched_component_push_task(component,data->perfmodel_component,task);
			
--- a/src/sched_policies/component_worker.c
+++ b/src/sched_policies/component_worker.c
@@ -1,7 +1,7 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				  * Copyright (C) 2010-2016  Université de Bordeaux
			
 
				- * Copyright (C) 2010, 2011, 2012, 2014, 2015, 2016  CNRS
			
 
				+ * Copyright (C) 2010, 2011, 2012, 2014, 2015, 2016, 2017  CNRS
			
 
				  * Copyright (C) 2011  Télécom-SudParis
			
 
				  * Copyright (C) 2011-2013  INRIA
			
 
				  * Copyright (C) 2013  Simon Archipoff
			
@@ -683,7 +683,7 @@ static int combined_worker_push_task(struct starpu_sched_component * component,
 
				 		task_alias[i]->task->workerid = combined_worker->combined_workerid[i];
			
 
				 		task_alias[i]->left = task_alias[i-1];
			
 
				 		task_alias[i - 1]->right = task_alias[i];
			
 
				-		task_alias[i]->pntasks = &task_alias[0]->ntasks;
			
 
				+		task_alias[i]->pntasks = &(task_alias[0]->ntasks);
			
 
				 	}
			
 
				 
			
 
				 	starpu_pthread_mutex_t * mutex_to_unlock = NULL;
			
--- a/src/sched_policies/deque_modeling_policy_data_aware.c
+++ b/src/sched_policies/deque_modeling_policy_data_aware.c
@@ -1,6 +1,6 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				- * Copyright (C) 2010-2016  Université de Bordeaux
			
 
				+ * Copyright (C) 2010-2017  Université de Bordeaux
			
 
				  * Copyright (C) 2010, 2011, 2012, 2013, 2015, 2016  CNRS
			
 
				  * Copyright (C) 2011  Télécom-SudParis
			
 
				  * Copyright (C) 2011-2012, 2016  INRIA
			
@@ -562,11 +562,17 @@ static int _dm_push_task(struct starpu_task *task, unsigned prio, unsigned sched
 
				 				best_impl = nimpl;
			
 
				 			}
			
 
				 
			
 
				-			if (isnan(local_length))
			
 
				+			if (isnan(local_length)) {
			
 
				 				/* we are calibrating, we want to speed-up calibration time
			
 
				 				 * so we privilege non-calibrated tasks (but still
			
 
				 				 * greedily distribute them to avoid dumb schedules) */
			
 
				+				static int warned;
			
 
				+				if (!warned) {
			
 
				+					warned = 1;
			
 
				+					_STARPU_DISP("Warning: performance model for %s not finished calibrating on worker %u, using a dumb scheduling heuristic for now\n", starpu_task_get_name(task), worker);
			
 
				+				}
			
 
				 				calibrating = 1;
			
 
				+			}
			
 
				 
			
 
				 			if (isnan(local_length) || _STARPU_IS_ZERO(local_length))
			
 
				 				/* there is no prediction available for that task
			
--- a/src/sched_policies/graph_test_policy.c
+++ b/src/sched_policies/graph_test_policy.c
@@ -1,6 +1,6 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				- * Copyright (C) 2010-2016  Université de Bordeaux
			
 
				+ * Copyright (C) 2010-2017  Université de Bordeaux
			
 
				  * Copyright (C) 2010-2013, 2016  CNRS
			
 
				  * Copyright (C) 2011  INRIA
			
 
				  *
			
@@ -124,7 +124,7 @@ static struct _starpu_prio_deque *select_prio(unsigned sched_ctx_id, struct _sta
 
				 		if (length == 0.)
			
 
				 		{
			
 
				 			_STARPU_DISP("Warning: graph_test needs performance models for all tasks, including %s\n",
			
 
				-					_starpu_job_get_task_name(_starpu_get_job_associated_to_task(task)));
			
 
				+					starpu_task_get_name(task));
			
 
				 			power = 0.;
			
 
				 		}
			
 
				 		else
			
--- a/src/sched_policies/parallel_heft.c
+++ b/src/sched_policies/parallel_heft.c
@@ -1,7 +1,7 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				  * Copyright (C) 2012 INRIA
			
 
				- * Copyright (C) 2010-2016  Université de Bordeaux
			
 
				+ * Copyright (C) 2010-2017  Université de Bordeaux
			
 
				  * Copyright (C) 2011  Télécom-SudParis
			
 
				  * Copyright (C) 2016  CNRS
			
 
				  *
			
@@ -374,11 +374,17 @@ static int _parallel_heft_push_task(struct starpu_task *task, unsigned prio, uns
 
				 				nimpl_best = nimpl;
			
 
				 			}
			
 
				 
			
 
				-			if (isnan(local_task_length[worker_ctx][nimpl]))
			
 
				+			if (isnan(local_task_length[worker_ctx][nimpl])) {
			
 
				+				static int warned;
			
 
				+				if (!warned) {
			
 
				+					warned = 1;
			
 
				+					_STARPU_DISP("Warning: performance model for %s not finished calibrating on %u, using a dumb scheduling heuristic for now\n", starpu_task_get_name(task), worker);
			
 
				+				}
			
 
				 				/* we are calibrating, we want to speed-up calibration time
			
 
				 				 * so we privilege non-calibrated tasks (but still
			
 
				 				 * greedily distribute them to avoid dumb schedules) */
			
 
				 				calibrating = 1;
			
 
				+			}
			
 
				 
			
 
				 			if (isnan(local_task_length[worker_ctx][nimpl])
			
 
				 					|| _STARPU_IS_ZERO(local_task_length[worker_ctx][nimpl]))
			
--- a/src/sched_policies/work_stealing_policy.c
+++ b/src/sched_policies/work_stealing_policy.c
@@ -1,7 +1,7 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				  * Copyright (C) 2010-2016  Université de Bordeaux
			
 
				- * Copyright (C) 2010, 2011, 2012, 2013, 2016  CNRS
			
 
				+ * Copyright (C) 2010, 2011, 2012, 2013, 2016, 2017  CNRS
			
 
				  * Copyright (C) 2011, 2012, 2016  INRIA
			
 
				  *
			
 
				  * StarPU is free software; you can redistribute it and/or modify
			
@@ -133,7 +133,8 @@ static int select_victim_round_robin(struct _starpu_work_stealing_data *ws, unsi
 
				 		 * estimation */
			
 
				 		ntasks = ws->per_worker[workerids[worker]].queue_array->ntasks;
			
 
				 
			
 
				-		if (ntasks && ws->per_worker[workerids[worker]].busy)
			
 
				+		if (ntasks && (ws->per_worker[workerids[worker]].busy
			
 
				+					   || starpu_worker_is_blocked(workerids[worker])))
			
 
				 			break;
			
 
				 
			
 
				 		worker = (worker + 1) % nworkers;
			
@@ -538,6 +539,14 @@ static struct starpu_task *ws_pop_task(unsigned sched_ctx_id)
 
				 	{
			
 
				 		/* there was a local task */
			
 
				 		ws->per_worker[workerid].busy = 1;
			
 
				+		starpu_sched_ctx_list_task_counters_decrement(sched_ctx_id, workerid);
			
 
				+		unsigned child_sched_ctx = starpu_sched_ctx_worker_is_master_for_child_ctx(workerid, sched_ctx_id);
			
 
				+		if(child_sched_ctx != STARPU_NMAX_SCHED_CTXS)
			
 
				+		{
			
 
				+			starpu_sched_ctx_move_task_to_ctx(task, child_sched_ctx, 1, 1);
			
 
				+			starpu_sched_ctx_revert_task_counters(sched_ctx_id, task->flops);
			
 
				+			return NULL;
			
 
				+		}
			
 
				 		return task;
			
 
				 	}
			
 
				 
			
@@ -571,6 +580,7 @@ static struct starpu_task *ws_pop_task(unsigned sched_ctx_id)
 
				 	{
			
 
				 		_STARPU_TRACE_WORK_STEALING(workerid, victim);
			
 
				 		_STARPU_TASK_BREAK_ON(task, sched);
			
 
				+		starpu_sched_ctx_list_task_counters_decrement(sched_ctx_id, victim);
			
 
				 		record_data_locality(task, workerid);
			
 
				 		record_worker_locality(ws, task, workerid, sched_ctx_id);
			
 
				 		locality_popped_task(ws, task, victim, sched_ctx_id);
			
@@ -580,6 +590,16 @@ static struct starpu_task *ws_pop_task(unsigned sched_ctx_id)
 
				 	/* Done with stealing, resynchronize with core */
			
 
				 	STARPU_PTHREAD_MUTEX_LOCK_SCHED(sched_mutex);
			
 
				 
			
 
				+	if (task)
			
 
				+	{
			
 
				+		unsigned child_sched_ctx = starpu_sched_ctx_worker_is_master_for_child_ctx(workerid, sched_ctx_id);
			
 
				+		if(child_sched_ctx != STARPU_NMAX_SCHED_CTXS)
			
 
				+		{
			
 
				+			starpu_sched_ctx_move_task_to_ctx(task, child_sched_ctx, 1, 1);
			
 
				+			starpu_sched_ctx_revert_task_counters(sched_ctx_id, task->flops);
			
 
				+			return NULL;
			
 
				+		}
			
 
				+	}
			
 
				 	ws->per_worker[workerid].busy = !!task;
			
 
				 	return task;
			
 
				 }
			
@@ -589,10 +609,12 @@ int ws_push_task(struct starpu_task *task)
 
				 {
			
 
				 	unsigned sched_ctx_id = task->sched_ctx;
			
 
				 	struct _starpu_work_stealing_data *ws = (struct _starpu_work_stealing_data*)starpu_sched_ctx_get_policy_data(sched_ctx_id);
			
 
				-	int workerid = -1;
			
 
				+	int workerid;
			
 
				 
			
 
				 #ifdef USE_LOCALITY
			
 
				 	workerid = select_worker_locality(ws, task, sched_ctx_id);
			
 
				+#else
			
 
				+	workerid = -1;
			
 
				 #endif
			
 
				 	if (workerid == -1)
			
 
				 		workerid = starpu_worker_get_id();
			
@@ -618,6 +640,7 @@ int ws_push_task(struct starpu_task *task)
 
				 
			
 
				 	starpu_push_task_end(task);
			
 
				 	STARPU_PTHREAD_MUTEX_UNLOCK_SCHED(sched_mutex);
			
 
				+	starpu_sched_ctx_list_task_counters_increment(sched_ctx_id, workerid);
			
 
				 
			
 
				 #if !defined(STARPU_NON_BLOCKING_DRIVERS) || defined(STARPU_SIMGRID)
			
 
				 	/* TODO: implement fine-grain signaling, similar to what eager does */
			
@@ -724,7 +747,8 @@ static int lws_select_victim(struct _starpu_work_stealing_data *ws, unsigned sch
 
				 	{
			
 
				 		int neighbor = ws->per_worker[workerid].proxlist[i];
			
 
				 		int ntasks = ws->per_worker[neighbor].queue_array->ntasks;
			
 
				-		if (ntasks && ws->per_worker[neighbor].busy)
			
 
				+		if (ntasks && (ws->per_worker[neighbor].busy
			
 
				+					   || starpu_worker_is_blocked(neighbor)))
			
 
				 			return neighbor;
			
 
				 	}
			
 
				 	return -1;
			
--- a/src/util/misc.c
+++ b/src/util/misc.c
@@ -1,6 +1,6 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				- * Copyright (C) 2012, 2015  Université de Bordeaux
			
 
				+ * Copyright (C) 2012, 2015, 2017  Université de Bordeaux
			
 
				  *
			
 
				  * StarPU is free software; you can redistribute it and/or modify
			
 
				  * it under the terms of the GNU Lesser General Public License as published by
			
@@ -55,3 +55,21 @@ const char *_starpu_job_get_task_name(struct _starpu_job *j)
 
				 	else
			
 
				 		return _starpu_job_get_model_name(j);
			
 
				 }
			
 
				+
			
 
				+const char *starpu_task_get_model_name(struct starpu_task *task)
			
 
				+{
			
 
				+	if (!task)
			
 
				+		return NULL;
			
 
				+
			
 
				+	return _starpu_codelet_get_model_name(task->cl);
			
 
				+}
			
 
				+
			
 
				+const char *starpu_task_get_name(struct starpu_task *task)
			
 
				+{
			
 
				+	if (!task)
			
 
				+		return NULL;
			
 
				+	if (task->name)
			
 
				+		return task->name;
			
 
				+	else
			
 
				+		return starpu_task_get_model_name(task);
			
 
				+}
			
--- a/src/util/starpu_task_insert.c
+++ b/src/util/starpu_task_insert.c
@@ -1,7 +1,7 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				- * Copyright (C) 2010, 2012, 2014-2016  Université de Bordeaux
			
 
				- * Copyright (C) 2011, 2012, 2013, 2014, 2015, 2016  CNRS
			
 
				+ * Copyright (C) 2010, 2012, 2014-2017  Université de Bordeaux
			
 
				+ * Copyright (C) 2011, 2012, 2013, 2014, 2015, 2016, 2017  CNRS
			
 
				  *
			
 
				  * StarPU is free software; you can redistribute it and/or modify
			
 
				  * it under the terms of the GNU Lesser General Public License as published by
			
@@ -46,7 +46,10 @@ void _starpu_codelet_unpack_args_and_copyleft(char *cl_arg, void *_buffer, size_
 
				 		void *argptr = va_arg(varg_list, void *);
			
 
				 
			
 
				 		/* If not reading all cl_args */
			
 
				-		if(argptr == NULL)
			
 
				+		// NULL was the initial end marker, we now use 0
			
 
				+		// 0 and NULL should be the same value, but we
			
 
				+		// keep both equalities for systems on which they could be different
			
 
				+		if(argptr == 0 || argptr == NULL)
			
 
				 			break;
			
 
				 
			
 
				 		size_t arg_size;
			
--- a/tests/Makefile.am
+++ b/tests/Makefile.am
@@ -1,6 +1,6 @@
 
				 # StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				 #
			
 
				-# Copyright (C) 2009-2016  Université de Bordeaux
			
 
				+# Copyright (C) 2009-2017  Université de Bordeaux
			
 
				 # Copyright (C) 2010, 2011, 2012, 2013, 2014, 2015, 2016  CNRS
			
 
				 # Copyright (C) 2010, 2011, 2012  INRIA
			
 
				 #
			
@@ -20,8 +20,10 @@ include $(top_srcdir)/starpu.mk
 
				 if STARPU_SIMGRID
			
 
				 STARPU_PERF_MODEL_DIR=$(abs_top_srcdir)/tools/perfmodels/sampling
			
 
				 STARPU_HOSTNAME=mirage
			
 
				+MALLOC_PERTURB_=0
			
 
				 export STARPU_PERF_MODEL_DIR
			
 
				 export STARPU_HOSTNAME
			
 
				+export MALLOC_PERTURB_
			
 
				 endif
			
 
				 
			
 
				 AM_CFLAGS = $(HWLOC_CFLAGS) $(FXT_CFLAGS) -Wall $(STARPU_CUDA_CPPFLAGS) $(STARPU_OPENCL_CPPFLAGS) $(STARPU_COI_CPPFLAGS) $(STARPU_SCIF_CPPFLAGS) $(GLOBAL_AM_CFLAGS) -Wno-unused
			
--- a/tests/coverage/coverage.sh
+++ b/tests/coverage/coverage.sh
@@ -2,7 +2,7 @@
 
				 
			
 
				 # StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				 #
			
 
				-# Copyright (C) 2010  Université de Bordeaux
			
 
				+# Copyright (C) 2010, 2017  Université de Bordeaux
			
 
				 # Copyright (C) 2010, 2011  CNRS
			
 
				 #
			
 
				 # StarPU is free software; you can redistribute it and/or modify
			
@@ -28,33 +28,43 @@ check_success()
 
				 
			
 
				 apps()
			
 
				 {
			
 
				-    echo "block opencl"
			
 
				-    STARPU_NCUDA=0 STARPU_NCPUS=0 $exampledir/basic_examples/block
			
 
				-    check_success $?
			
 
				+    if [ -f $exampledir/basic_examples/block ] ; then
			
 
				+	echo "block opencl"
			
 
				+	STARPU_NCUDA=0 STARPU_NCPUS=0 $exampledir/basic_examples/block
			
 
				+	check_success $?
			
 
				+    fi
			
 
				 
			
 
				-    echo "variable opencl"
			
 
				-    STARPU_NCUDA=0 STARPU_NCPUS=0 $exampledir/basic_examples/variable 100
			
 
				-    check_success $?
			
 
				+    if [ -f $exampledir/basic_examples/variable ] ; then
			
 
				+	echo "variable opencl"
			
 
				+	STARPU_NCUDA=0 STARPU_NCPUS=0 $exampledir/basic_examples/variable 100
			
 
				+	check_success $?
			
 
				 
			
 
				-    echo "variable no worker"
			
 
				-    STARPU_NCUDA=0 STARPU_NOPENCL=0 STARPU_NCPUS=0 $exampledir/basic_examples/variable
			
 
				-    check_success $?
			
 
				+	echo "variable no worker"
			
 
				+	STARPU_NCUDA=0 STARPU_NOPENCL=0 STARPU_NCPUS=0 $exampledir/basic_examples/variable
			
 
				+	check_success $?
			
 
				+    fi
			
 
				 
			
 
				-    echo "incrementer opencl"
			
 
				-    STARPU_NCUDA=0 STARPU_NCPUS=0 $exampledir/incrementer/incrementer 10
			
 
				-    check_success $?
			
 
				+    if [ -f $exampledir/incrementer/incrementer ] ; then
			
 
				+	echo "incrementer opencl"
			
 
				+	STARPU_NCUDA=0 STARPU_NCPUS=0 $exampledir/incrementer/incrementer 10
			
 
				+	check_success $?
			
 
				 
			
 
				-    echo "incrementer no worker"
			
 
				-    STARPU_NCUDA=0 STARPU_NOPENCL=0 STARPU_NCPUS=0 $exampledir/incrementer/incrementer
			
 
				-    check_success $?
			
 
				+	echo "incrementer no worker"
			
 
				+	STARPU_NCUDA=0 STARPU_NOPENCL=0 STARPU_NCPUS=0 $exampledir/incrementer/incrementer
			
 
				+	check_success $?
			
 
				+    fi
			
 
				 
			
 
				-    echo "tag_example"
			
 
				-    $exampledir/tag_example/tag_example -iter 64 -i 128 -j 24
			
 
				-    check_success $?
			
 
				+    if [ -f $exampledir/tag_example/tag_example ] ; then
			
 
				+	echo "tag_example"
			
 
				+	$exampledir/tag_example/tag_example -iter 64 -i 128 -j 24
			
 
				+	check_success $?
			
 
				+    fi
			
 
				 
			
 
				-    echo "tag_example2"
			
 
				-    $exampledir/tag_example/tag_example2 -iter 64 -i 128
			
 
				-    check_success $?
			
 
				+    if [ -f $exampledir/tag_example/tag_example2 ] ; then
			
 
				+	echo "tag_example2"
			
 
				+	$exampledir/tag_example/tag_example2 -iter 64 -i 128
			
 
				+	check_success $?
			
 
				+    fi
			
 
				 
			
 
				     if [ -f $exampledir/cholesky/dw_cholesky ] ; then
			
 
				 	echo "chol.dm"
			
--- a/tests/datawizard/allocate.c
+++ b/tests/datawizard/allocate.c
@@ -42,6 +42,10 @@ int test_prefetch(unsigned memnodes)
 
				 	unsigned i;
			
 
				 	starpu_ssize_t available_size;
			
 
				 
			
 
				+	if (starpu_get_env_number_default("STARPU_DIDUSE_BARRIER", 0))
			
 
				+		/* This would hang */
			
 
				+		return STARPU_TEST_SKIPPED;
			
 
				+
			
 
				 	buffers[0] = malloc(SIZE_ALLOC*1024*512);
			
 
				 	STARPU_ASSERT(buffers[0]);
			
 
				 
			
--- a/tests/datawizard/simgrid-locality.c
+++ b/tests/datawizard/simgrid-locality.c
@@ -1,6 +1,6 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				- * Copyright (C) 2016 Université de Bordeaux
			
 
				+ * Copyright (C) 2016-2017 Université de Bordeaux
			
 
				  *
			
 
				  * StarPU is free software; you can redistribute it and/or modify
			
 
				  * it under the terms of the GNU Lesser General Public License as published by
			
@@ -17,7 +17,7 @@
 
				 /* Check that defining a main makes starpu use MSG_process_attach. */
			
 
				 #include "locality.c"
			
 
				 #include <config.h>
			
 
				-#if defined(HAVE_MSG_PROCESS_ATTACH) && SIMGRID_VERSION_MAJOR > 3 || (SIMGRID_VERSION_MAJOR == 3 && SIMGRID_VERSION_MINOR >= 14)
			
 
				+#if defined(HAVE_MSG_PROCESS_ATTACH) && SIMGRID_VERSION_MAJOR > 3 || (SIMGRID_VERSION_MAJOR == 3 && SIMGRID_VERSION_MINOR >= 15)
			
 
				 #undef main
			
 
				 int main(int argc, char *argv[]) {
			
 
				 	return starpu_main(argc, argv);
			
--- a/tests/disk/mem_reclaim.c
+++ b/tests/disk/mem_reclaim.c
@@ -142,6 +142,10 @@ int dotest(struct starpu_disk_ops *ops, char *base, void (*vector_data_register)
 
				 	int *A, *C;
			
 
				 	starpu_data_handle_t handles[NDATA];
			
 
				 
			
 
				+	if (starpu_get_env_number_default("STARPU_DIDUSE_BARRIER", 0))
			
 
				+		/* This would hang */
			
 
				+		return STARPU_TEST_SKIPPED;
			
 
				+
			
 
				 	FPRINTF(stderr, "Testing <%s>\n", text);
			
 
				 	/* Initialize StarPU without GPU devices to make sure the memory of the GPU devices will not be used */
			
 
				 	struct starpu_conf conf;
			
--- a/tests/loader.c
+++ b/tests/loader.c
@@ -237,13 +237,12 @@ int main(int argc, char *argv[])
 
				 		test_args = (char *) calloc(150, sizeof(char));
			
 
				 		sprintf(test_args, "%s/examples/spmv/matrix_market/examples/fidapm05.mtx", STARPU_SRC_DIR);
			
 
				 	}
			
 
				-
			
 
				-	if (strstr(test_name, "starpu_perfmodel_display"))
			
 
				+	else if (strstr(test_name, "starpu_perfmodel_display"))
			
 
				 	{
			
 
				 		test_args = (char *) calloc(5, sizeof(char));
			
 
				 		sprintf(test_args, "-l");
			
 
				 	}
			
 
				-	if (strstr(test_name, "starpu_perfmodel_plot"))
			
 
				+	else if (strstr(test_name, "starpu_perfmodel_plot"))
			
 
				 	{
			
 
				 		test_args = (char *) calloc(5, sizeof(char));
			
 
				 		sprintf(test_args, "-l");
			
--- a/tests/main/combined_workers/bfs/bfs.cpp
+++ b/tests/main/combined_workers/bfs/bfs.cpp
@@ -54,10 +54,10 @@ void read_file(char *input_f, unsigned int *nb_nodes, unsigned int *nb_edges,
 
				 	fscanf(fp, "%u", nb_nodes);
			
 
				 
			
 
				 	// allocate host memory
			
 
				-	*origin_graph_nodes = (Node *) malloc(sizeof(Node) * (*nb_nodes));
			
 
				-	*origin_graph_mask = (bool *) malloc(sizeof(bool) * (*nb_nodes));
			
 
				-	*origin_updating_graph_mask = (bool *) malloc(sizeof(bool) * (*nb_nodes));
			
 
				-	*origin_graph_visited = (bool *) malloc(sizeof(bool) * (*nb_nodes));
			
 
				+	*origin_graph_nodes = malloc(sizeof(Node) * (*nb_nodes));
			
 
				+	*origin_graph_mask = malloc(sizeof(bool) * (*nb_nodes));
			
 
				+	*origin_updating_graph_mask = malloc(sizeof(bool) * (*nb_nodes));
			
 
				+	*origin_graph_visited = malloc(sizeof(bool) * (*nb_nodes));
			
 
				 
			
 
				 	int start, edgeno;
			
 
				 	// initalize the memory
			
@@ -156,12 +156,12 @@ int main( int argc, char** argv)
 
				 		  &origin_graph_mask, &origin_updating_graph_mask,
			
 
				 		  &origin_graph_visited, &origin_graph_edges, &origin_cost);
			
 
				 
			
 
				-	graph_nodes = (Node *) calloc(nb_nodes, sizeof(Node));
			
 
				-	graph_mask = (bool *) calloc(nb_nodes, sizeof(bool));
			
 
				-	updating_graph_mask = (bool *) calloc(nb_nodes, sizeof(bool));
			
 
				-	graph_visited = (bool *) calloc(nb_nodes, sizeof(bool));
			
 
				-	graph_edges = (int*) calloc(nb_edges, sizeof(int));
			
 
				-	cost = (int*) calloc(nb_nodes, sizeof(int));
			
 
				+	graph_nodes = calloc(nb_nodes, sizeof(Node));
			
 
				+	graph_mask = calloc(nb_nodes, sizeof(bool));
			
 
				+	updating_graph_mask = calloc(nb_nodes, sizeof(bool));
			
 
				+	graph_visited = calloc(nb_nodes, sizeof(bool));
			
 
				+	graph_edges = calloc(nb_edges, sizeof(int));
			
 
				+	cost = calloc(nb_nodes, sizeof(int));
			
 
				 
			
 
				 	memcpy(graph_nodes, origin_graph_nodes, nb_nodes*sizeof(Node));
			
 
				 	memcpy(graph_edges, origin_graph_edges, nb_edges*sizeof(int));
			
--- a/tests/main/insert_task_value.c
+++ b/tests/main/insert_task_value.c
@@ -1,6 +1,6 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				- * Copyright (C) 2015, 2016  CNRS
			
 
				+ * Copyright (C) 2015, 2016, 2017  CNRS
			
 
				  *
			
 
				  * StarPU is free software; you can redistribute it and/or modify
			
 
				  * it under the terms of the GNU Lesser General Public License as published by
			
@@ -43,7 +43,7 @@ void func_cpu_int_float_multiple_unpack(void *descr[], void *_args)
 
				 	float ffactor;
			
 
				 	(void) descr;
			
 
				 
			
 
				-	starpu_codelet_unpack_args(_args, ifactor, NULL);
			
 
				+	starpu_codelet_unpack_args(_args, ifactor, 0);
			
 
				 	starpu_codelet_unpack_args(_args, ifactor, &ffactor);
			
 
				 
			
 
				 	FPRINTF(stderr, "[func_cpu_int_float_multiple_unpack] Values %d - %3.2f\n", ifactor[0], ffactor);
			
@@ -60,7 +60,7 @@ void func_cpu_int_float_unpack_copyleft(void *descr[], void *_args)
 
				 
			
 
				 	buffer_size = sizeof(int)+sizeof(float)+sizeof(size_t);
			
 
				 	buffer = calloc(buffer_size, 1);
			
 
				-	starpu_codelet_unpack_args_and_copyleft(_args, buffer, buffer_size, ifactor, NULL);
			
 
				+	starpu_codelet_unpack_args_and_copyleft(_args, buffer, buffer_size, ifactor, 0);
			
 
				 	starpu_codelet_unpack_args(buffer, &ffactor);
			
 
				 
			
 
				 	FPRINTF(stderr, "[func_cpu_int_float_unpack_copyleft] Values %d - %3.2f\n", ifactor[0], ffactor);
			
@@ -86,7 +86,7 @@ void func_cpu_float_int_multiple_unpack(void *descr[], void *_args)
 
				 	float ffactor;
			
 
				 	(void) descr;
			
 
				 
			
 
				-	starpu_codelet_unpack_args(_args, &ffactor, NULL);
			
 
				+	starpu_codelet_unpack_args(_args, &ffactor, 0);
			
 
				 	starpu_codelet_unpack_args(_args, &ffactor, ifactor);
			
 
				 
			
 
				 	FPRINTF(stderr, "[func_cpu_float_int_multiple_unpack] Values %d - %3.2f\n", ifactor[0], ffactor);
			
@@ -103,7 +103,7 @@ void func_cpu_float_int_unpack_copyleft(void *descr[], void *_args)
 
				 
			
 
				 	buffer_size = sizeof(int)+2048*sizeof(int)+sizeof(size_t);
			
 
				 	buffer = calloc(buffer_size, 1);
			
 
				-	starpu_codelet_unpack_args_and_copyleft(_args, buffer, buffer_size, &ffactor, NULL);
			
 
				+	starpu_codelet_unpack_args_and_copyleft(_args, buffer, buffer_size, &ffactor, 0);
			
 
				 	starpu_codelet_unpack_args(buffer, ifactor);
			
 
				 
			
 
				 	FPRINTF(stderr, "[func_cpu_float_int_multiple_unpack] Values %d - %3.2f\n", ifactor[0], ffactor);
			
--- a/tools/Makefile.am
+++ b/tools/Makefile.am
@@ -1,7 +1,7 @@
 
				 # StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				 #
			
 
				-# Copyright (C) 2009-2016  Université de Bordeaux
			
 
				-# Copyright (C) 2010, 2011, 2012, 2013, 2014, 2015, 2016  CNRS
			
 
				+# Copyright (C) 2009-2017  Université de Bordeaux
			
 
				+# Copyright (C) 2010, 2011, 2012, 2013, 2014, 2015, 2016, 2017  CNRS
			
 
				 # Copyright (C) 2016  Inria
			
 
				 #
			
 
				 # StarPU is free software; you can redistribute it and/or modify
			
@@ -20,8 +20,10 @@ include $(top_srcdir)/starpu.mk
 
				 if STARPU_SIMGRID
			
 
				 STARPU_PERF_MODEL_DIR=$(abs_top_srcdir)/tools/perfmodels/sampling
			
 
				 STARPU_HOSTNAME=mirage
			
 
				+MALLOC_PERTURB_=0
			
 
				 export STARPU_PERF_MODEL_DIR
			
 
				 export STARPU_HOSTNAME
			
 
				+export MALLOC_PERTURB_
			
 
				 endif
			
 
				 
			
 
				 SUBDIRS =
			
@@ -154,7 +156,8 @@ EXTRA_DIST =				\
 
				 	msvc/starpu_exec.bat		\
			
 
				 	msvc/starpu_var.bat		\
			
 
				 	msvc/starpu.sln			\
			
 
				-	msvc/starpu/starpu.vcxproj
			
 
				+	msvc/starpu/starpu.vcxproj	\
			
 
				+	cppcheck/suppressions.txt
			
 
				 
			
 
				 CLEANFILES = *.gcno *.gcda *.linkinfo starpu_idle_microsec.log figure/* mlr_*
			
 
				 
			
--- a/tools/cppcheck/suppressions.txt
+++ b/tools/cppcheck/suppressions.txt
@@ -0,0 +1,66 @@
 
				+memleakOnRealloc
			
 
				+knownConditionTrueFalse
			
 
				+variableScope
			
 
				+unusedStructMember
			
 
				+ConfigurationNotChecked
			
 
				+
			
 
				+*:tools/dev/*
			
 
				+*:starpufft/*
			
 
				+*:min-dgels/*
			
 
				+*:starpu-top/*
			
 
				+*:socl/src/CL/*
			
 
				+
			
 
				+// TODO. We should cppcheck the code
			
 
				+*:sc_hypervisor/*
			
 
				+
			
 
				+varFuncNullUB:examples/sched_ctx/two_cpu_contexts.c:76
			
 
				+negativeIndex:examples/stencil/stencil-tasks.c:200
			
 
				+negativeIndex:examples/stencil/stencil-tasks.c:203
			
 
				+constStatement:examples/stencil/*
			
 
				+
			
 
				+unreadVariable:tests/openmp/*
			
 
				+unusedLabel:tests/datawizard/gpu_register.c
			
 
				+unusedLabel:tests/datawizard/gpu_ptr_register.c
			
 
				+redundantAssignment:tests/datawizard/interfaces/test_interfaces.c:752
			
 
				+redundantAssignment:tests/datawizard/mpi_like_async.c:165
			
 
				+redundantAssignment:tests/datawizard/mpi_like_async.c:211
			
 
				+unusedPrivateFunction:tests/main/combined_workers/bfs/timer.h:45
			
 
				+redundantAssignment:tests/main/driver_api/init_run_deinit.c
			
 
				+redundantAssignment:tests/main/driver_api/run_driver.c
			
 
				+
			
 
				+uselessAssignmentPtrArg:mpi/src/starpu_mpi.c:155
			
 
				+unreadVariable:mpi/src/starpu_mpi.c:849
			
 
				+redundantAssignment:src/core/workers.c
			
 
				+
			
 
				+invalidPointerCast:src/core/perfmodel/perfmodel_nan.c:74
			
 
				+unreadVariable:src/core/dependencies/tags.c:111
			
 
				+uselessAssignmentPtrArg:src/core/sched_ctx_list.c:144
			
 
				+unusedStructMember:src/core/perfmodel/perfmodel_bus.c:62
			
 
				+unusedStructMember:src/core/perfmodel/perfmodel_bus.c:63
			
 
				+unusedStructMember:src/core/perfmodel/perfmodel_bus.c:64
			
 
				+unusedStructMember:src/core/perfmodel/perfmodel_bus.c:65
			
 
				+unusedStructMember:src/core/perfmodel/perfmodel_bus.c:66
			
 
				+unusedStructMember:src/core/simgrid.c:225
			
 
				+unusedStructMember:src/core/simgrid.c:226
			
 
				+duplicateExpression:src/util/starpu_task_insert.c:52
			
 
				+
			
 
				+// TODO: this could be an error?
			
 
				+redundantCopy:src/core/disk_ops/disk_leveldb.cpp:192
			
 
				+
			
 
				+nullPointerRedundantCheck:src/common/rbtree.c
			
 
				+wrongPrintfScanfArgNum:src/core/simgrid.c:715
			
 
				+unreadVariable:src/datawizard/interfaces/*
			
 
				+unreadVariable:src/drivers/driver_common/driver_common.c:482
			
 
				+clarifyCondition:src/drivers/opencl/driver_opencl.c:936
			
 
				+unreadVariable:src/drivers/opencl/driver_opencl.c:767
			
 
				+clarifyCondition:src/drivers/cuda/driver_cuda.c:506
			
 
				+arithOperationsOnVoidPointer:src/drivers/scc/*
			
 
				+nullPointerRedundantCheck:src/sched_policies/deque_modeling_policy_data_aware.c:197
			
 
				+sizeofDereferencedVoidPointer:src/util/fstarpu.c
			
 
				+
			
 
				+allocaCalled:gcc-plugin/src/*
			
 
				+unusedVariable:gcc-plugin/tests/*
			
 
				+unreadVariable:gcc-plugin/tests/*
			
 
				+duplicateExpression:gcc-plugin/src/*
			
 
				+
			
 
				+pointerSize:socl/src/cl_getcontextinfo.c:33
			
--- a/tools/starpu_fxt_stats.c
+++ b/tools/starpu_fxt_stats.c
@@ -1,6 +1,6 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				- * Copyright (C) 2011, 2012, 2013, 2014  CNRS
			
 
				+ * Copyright (C) 2011, 2012, 2013, 2014, 2017  CNRS
			
 
				  *
			
 
				  * StarPU is free software; you can redistribute it and/or modify
			
 
				  * it under the terms of the GNU Lesser General Public License as published by
			
@@ -193,12 +193,14 @@ int main(int argc, char **argv)
 
				 		{
			
 
				 			if (transfers[src][dst] != 0)
			
 
				 			{
			
 
				-				fprintf(fd_out, "%d -> %d \t %ld MB\n", src, dst, transfers[src][dst]/(1024*1024));
			
 
				+				fprintf(fd_out, "%u -> %u \t %lu MB\n", src, dst, (unsigned long)(transfers[src][dst]/(1024*1024)));
			
 
				 			}
			
 
				 		}
			
 
				 	}
			
 
				 
			
 
				-	fprintf(fd_out, "There was %d tasks and %d work stealing\n", njob, nws);
			
 
				+	fprintf(fd_out, "There was %u tasks and %u work stealing\n", njob, nws);
			
 
				+	if (fd_out != stdout)
			
 
				+		fclose(fd_out);
			
 
				 
			
 
				 	return 0;
			
 
				 }
			
--- a/tools/starpu_lp2paje.c
+++ b/tools/starpu_lp2paje.c
@@ -1,7 +1,7 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				  * Copyright (C) 2010-2011, 2013-2014  Université de Bordeaux
			
 
				- * Copyright (C) 2014, 2015, 2016                  CNRS
			
 
				+ * Copyright (C) 2014, 2015, 2016, 2017                  CNRS
			
 
				  *
			
 
				  * StarPU is free software; you can redistribute it and/or modify
			
 
				  * it under the terms of the GNU Lesser General Public License as published by
			
@@ -35,7 +35,7 @@ int main(int argc, char *argv[])
 
				 {
			
 
				 	int nw, nt;
			
 
				 	double tmax;
			
 
				-	int i, w, ww, t, tt, t2;
			
 
				+	int i, w, ww, t, tt;
			
 
				 	int foo;
			
 
				 	double bar;
			
 
				 
			
@@ -142,6 +142,7 @@ int main(int argc, char *argv[])
 
				 
			
 
				 		for (t = 0; t < nt; t++)
			
 
				 		{
			
 
				+			int t2;
			
 
				 			for (t2 = 0; t2 < nt; t2++)
			
 
				 			{
			
 
				 				if (t != t2 && task[t].worker == task[t2].worker)
			
--- a/tools/starpu_machine_display.c
+++ b/tools/starpu_machine_display.c
@@ -178,7 +178,7 @@ int main(int argc, char **argv)
 
				 	display_worker_names(STARPU_OPENCL_WORKER);
			
 
				 
			
 
				 #ifdef STARPU_USE_MIC
			
 
				-	fprintf(stdout, "\t%d MIC cores (from %d devices)\n", nmiccores, nmicdevs);
			
 
				+	fprintf(stdout, "\t%u MIC cores (from %u devices)\n", nmiccores, nmicdevs);
			
 
				 	display_worker_names(STARPU_MIC_WORKER);
			
 
				 #endif