9 years ago · 548ff4b4c6
--- a/examples/sched_ctx/parallel_tasks_with_cluster_api.c
+++ b/examples/sched_ctx/parallel_tasks_with_cluster_api.c
@@ -101,7 +101,14 @@ int main(int argc, char **argv)
 
				 				    STARPU_VALUE,&size,sizeof(int),
			
 
				 				    0);
			
 
				 		t->destroy = 1;
			
 
				-		t->possibly_parallel = 1;
			
 
				+		/* For two tasks (i == 5 and i == 6), try out the case where the task isn't
			
 
				+			 parallel: the configuration is expected to become sequential for them,
			
 
				+			 and then to be changed back automatically to the parallel one */
			
 
				+		if (i<=4 || i > 6)
			
 
				+			t->possibly_parallel = 1;
			
 
				+		/* Note that, for this mode to be taken into account, every task must be
			
 
				+			 given a prologue callback that manages it. */
			
 
				+		t->prologue_callback_pop_func = &starpu_openmp_prologue;
			
 
				 
			
 
				 		ret=starpu_task_submit(t);
			
 
				 		if (ret == -ENODEV)
			
--- a/include/starpu_clusters_util.h
+++ b/include/starpu_clusters_util.h
@@ -72,10 +72,10 @@ int starpu_uncluster_machine(struct starpu_cluster_machine* clusters);
 
				 int starpu_cluster_print(struct starpu_cluster_machine* clusters);
			
 
				 
			
 
				 /* Prologue functions */
			
 
				-void starpu_openmp_prologue(void * sched_ctx_id);
			
 
				+void starpu_openmp_prologue(void*);
			
 
				 #define starpu_intel_openmp_mkl_prologue starpu_openmp_prologue
			
 
				 #ifdef STARPU_MKL
			
 
				-void starpu_gnu_openmp_mkl_prologue(void * sched_ctx_id);
			
 
				+void starpu_gnu_openmp_mkl_prologue(void*);
			
 
				 #endif /* STARPU_MKL */
			
 
				 
			
 
				 #ifdef __cplusplus
			
--- a/src/core/sched_ctx.c
+++ b/src/core/sched_ctx.c
@@ -566,6 +566,7 @@ struct _starpu_sched_ctx* _starpu_create_sched_ctx(struct starpu_sched_policy *p
 
				 		sched_ctx->sleeping[w] = 0;
			
 
				 	}
			
 
				 
			
 
				+	sched_ctx->parallel_view = 0;
			
 
				 
			
 
				         /* init the strategy structs and the worker_collection of the resources of the context */
			
 
				 	if(policy)
			
--- a/src/core/sched_ctx.h
+++ b/src/core/sched_ctx.h
@@ -168,6 +168,10 @@ struct _starpu_sched_ctx
 
				 	/* perf model for the device comb of the ctx */
			
 
				 	struct starpu_perfmodel_arch perf_arch;
			
 
				 
			
 
				+	/* For parallel workers, record whether the context is currently viewed as
			
 
				+		 parallel (non-zero) or sequential (0). This is a helper for the prologue code. */
			
 
				+	unsigned parallel_view;
			
 
				+
			
 
				 	/* for ctxs without policy: flag to indicate that we want to get
			
 
				 	   the threads to sleep in order to replace them with other threads or leave
			
 
				 	   them awake & use them in the parallel code*/
			
--- a/src/core/sched_policy.c
+++ b/src/core/sched_policy.c
@@ -989,7 +989,11 @@ profiling:
 
				 	}
			
 
				 
			
 
				 	if(task->prologue_callback_pop_func)
			
 
				+	{
			
 
				+		_starpu_set_current_task(task);
			
 
				 		task->prologue_callback_pop_func(task->prologue_callback_pop_arg);
			
 
				+		_starpu_set_current_task(NULL);
			
 
				+	}
			
 
				 
			
 
				 	return task;
			
 
				 }
			
--- a/src/util/starpu_clusters_create.c
+++ b/src/util/starpu_clusters_create.c
@@ -45,45 +45,67 @@ starpu_binding_function _starpu_cluster_type_get_func(starpu_cluster_types type)
 
				 	return prologue_func;
			
 
				 }
			
 
				 
			
 
				-void starpu_openmp_prologue(void *sched_ctx_id)
			
 
				+void starpu_openmp_prologue(void* arg)
			
 
				 {
			
 
				-	int sched_ctx = *(int*)sched_ctx_id;
			
 
				-	int *cpuids = NULL;
			
 
				-	int ncpuids = 0;
			
 
				 	int workerid = starpu_worker_get_id_check();
			
 
				 
			
 
				 	if (starpu_worker_get_type(workerid) == STARPU_CPU_WORKER)
			
 
				 	{
			
 
				-		starpu_sched_ctx_get_available_cpuids(sched_ctx, &cpuids, &ncpuids);
			
 
				-		omp_set_num_threads(ncpuids);
			
 
				-#pragma omp parallel
			
 
				+		struct starpu_task *task = starpu_task_get_current();
			
 
				+		int sched_ctx = task->sched_ctx;
			
 
				+		struct _starpu_sched_ctx *ctx_struct = _starpu_get_sched_ctx_struct(sched_ctx);
			
 
				+		/* If the view of the worker doesn't correspond to the view of the task,
			
 
				+			 adapt the thread team */
			
 
				+		if (ctx_struct->parallel_view != task->possibly_parallel)
			
 
				 		{
			
 
				-			starpu_sched_ctx_bind_current_thread_to_cpuid(cpuids[omp_get_thread_num()]);
			
 
				+			int *cpuids = NULL;
			
 
				+			int ncpuids = 0;
			
 
				+
			
 
				+			starpu_sched_ctx_get_available_cpuids(sched_ctx, &cpuids, &ncpuids);
			
 
				+			if (!task->possibly_parallel)
			
 
				+				ncpuids=1;
			
 
				+			omp_set_num_threads(ncpuids);
			
 
				+#pragma omp parallel
			
 
				+			{
			
 
				+				starpu_sched_ctx_bind_current_thread_to_cpuid(cpuids[omp_get_thread_num()]);
			
 
				+			}
			
 
				+			free(cpuids);
			
 
				+			ctx_struct->parallel_view = !ctx_struct->parallel_view;
			
 
				 		}
			
 
				-		free(cpuids);
			
 
				 	}
			
 
				 	return;
			
 
				 }
			
 
				 
			
 
				 #ifdef STARPU_MKL
			
 
				-void starpu_gnu_openmp_mkl_prologue(void *sched_ctx_id)
			
 
				+void starpu_gnu_openmp_mkl_prologue(void* arg)
			
 
				 {
			
 
				-	int sched_ctx = *(int*)sched_ctx_id;
			
 
				-	int *cpuids = NULL;
			
 
				-	int ncpuids = 0;
			
 
				 	int workerid = starpu_worker_get_id();
			
 
				 
			
 
				 	if (starpu_worker_get_type(workerid) == STARPU_CPU_WORKER)
			
 
				 	{
			
 
				-		starpu_sched_ctx_get_available_cpuids(sched_ctx, &cpuids, &ncpuids);
			
 
				-		omp_set_num_threads(ncpuids);
			
 
				-		mkl_set_num_threads(ncpuids);
			
 
				-		mkl_set_dynamic(0);
			
 
				-#pragma omp parallel
			
 
				+		struct starpu_task *task = starpu_task_get_current();
			
 
				+		int sched_ctx = task->sched_ctx;
			
 
				+		struct _starpu_sched_ctx *ctx_struct = _starpu_get_sched_ctx_struct(sched_ctx);
			
 
				+		/* If the view of the worker doesn't correspond to the view of the task,
			
 
				+			 adapt the thread team */
			
 
				+		if (ctx_struct->parallel_view != task->possibly_parallel)
			
 
				 		{
			
 
				-			starpu_sched_ctx_bind_current_thread_to_cpuid(cpuids[omp_get_thread_num()]);
			
 
				+			int *cpuids = NULL;
			
 
				+			int ncpuids = 0;
			
 
				+
			
 
				+			starpu_sched_ctx_get_available_cpuids(sched_ctx, &cpuids, &ncpuids);
			
 
				+			if (!task->possibly_parallel)
			
 
				+				ncpuids=1;
			
 
				+			omp_set_num_threads(ncpuids);
			
 
				+			mkl_set_num_threads(ncpuids);
			
 
				+			mkl_set_dynamic(0);
			
 
				+#pragma omp parallel
			
 
				+			{
			
 
				+				starpu_sched_ctx_bind_current_thread_to_cpuid(cpuids[omp_get_thread_num()]);
			
 
				+			}
			
 
				+			free(cpuids);
			
 
				+			ctx_struct->parallel_view = !ctx_struct->parallel_view;
			
 
				 		}
			
 
				-		free(cpuids);
			
 
				 	}
			
 
				 	return;
			
 
				 }
			
@@ -324,8 +346,8 @@ int _starpu_cluster_bind(struct _starpu_cluster *cluster)
 
				 	else
			
 
				 	{
			
 
				 		func = _starpu_cluster_type_get_func(cluster->params->type);
			
 
				-		func_arg = (void*) &cluster->id;
			
 
				-		}
			
 
				+		func_arg = NULL;
			
 
				+	}
			
 
				 
			
 
				 	return starpu_task_insert(&_starpu_cluster_bind_cl,
			
 
				 				  STARPU_SCHED_CTX, cluster->id,