12 年之前 · 9d2589a240
--- a/ChangeLog
+++ b/ChangeLog
@@ -1,6 +1,6 @@
 
				 # StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				 #
			
 
				-# Copyright (C) 2009-2012  Université de Bordeaux 1
			
 
				+# Copyright (C) 2009-2013  Université de Bordeaux 1
			
 
				 # Copyright (C) 2010, 2011, 2012, 2013  Centre National de la Recherche Scientifique
			
 
				 #
			
 
				 # StarPU is free software; you can redistribute it and/or modify
			
@@ -114,6 +114,9 @@ Changes:
 
				   * StarPU can now use poti to generate paje traces.
			
 
				   * Rename scheduling policy "parallel greedy" to "parallel eager"
			
 
				 
			
 
				+Small features:
			
 
				+  * Add starpu_worker_get_by_type and starpu_worker_get_by_devid
			
 
				+
			
 
				 Small changes:
			
 
				   * STARPU_NCPU should now be used instead of STARPU_NCPUS. STARPU_NCPUS is
			
 
				 	still available for compatibility reasons.
			
--- a/doc/chapters/basic-api.texi
+++ b/doc/chapters/basic-api.texi
@@ -286,6 +286,17 @@ chosen by the means of the @code{starpu_worker_get_count_by_type} function, or
 
				 by passing a value greater or equal to @code{STARPU_NMAXWORKERS}.
			
 
				 @end deftypefun
			
 
				 
			
 
				+@deftypefun int starpu_worker_get_by_type ({enum starpu_archtype} @var{type}, int @var{n})
			
 
				+This returns the identifier of the @var{n}-th worker that has the specified type
			
 
				+@var{type}. If there are no such worker, -1 is returned.
			
 
				+@end deftypefun
			
 
				+
			
 
				+@deftypefun int starpu_worker_get_by_devid ({enum starpu_archtype} @var{type}, int @var{devid})
			
 
				+This returns the identifier of the worker that has the specified type
			
 
				+@var{type} and devid @var{devid} (which may not be the n-th, if some devices are
			
 
				+skipped for instance). If there are no such worker, -1 is returned.
			
 
				+@end deftypefun
			
 
				+
			
 
				 @deftypefun int starpu_worker_get_devid (int @var{id})
			
 
				 This functions returns the device id of the given worker. The worker
			
 
				 should be identified with the value returned by the @code{starpu_worker_get_id} function. In the case of a
			
--- a/doc/chapters/perf-optimization.texi
+++ b/doc/chapters/perf-optimization.texi
@@ -19,6 +19,7 @@ TODO: improve!
 
				 * Task distribution vs Data transfer::
			
 
				 * Data prefetch::
			
 
				 * Power-based scheduling::
			
 
				+* Forcing scheduling::
			
 
				 * Profiling::
			
 
				 * CUDA-specific optimizations::
			
 
				 * Performance debugging::
			
@@ -402,6 +403,20 @@ consumption for that series of tasks, divide it by a thousand, repeat for
 
				 varying kinds of tasks and task sizes, and eventually feed StarPU
			
 
				 with these manual measurements through @code{starpu_perfmodel_update_history}.
			
 
				 
			
 
				+@node Static scheduling
			
 
				+@section Static scheduling
			
 
				+
			
 
				+In some cases, one may want to force some scheduling, for instance force a given
			
 
				+set of tasks to GPU0, another set to GPU1, etc. while letting some other tasks
			
 
				+be scheduled on any other device. This can indeed be useful to guide StarPU into
			
 
				+some work distribution, while still letting some degree of dynamism. For
			
 
				+instance, to force execution of a task on CUDA0:
			
 
				+
			
 
				+@example
			
 
				+task->execute_on_a_specific_worker = 1;
			
 
				+task->worker = starpu_worker_get_by_type(STARPU_CUDA_WORKER, 0);
			
 
				+@end example
			
 
				+
			
 
				 @node Profiling
			
 
				 @section Profiling
			
 
				 
			
--- a/include/starpu_worker.h
+++ b/include/starpu_worker.h
@@ -1,6 +1,6 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				- * Copyright (C) 2009-2012  Université de Bordeaux 1
			
 
				+ * Copyright (C) 2009-2013  Université de Bordeaux 1
			
 
				  * Copyright (C) 2010, 2011, 2012  Centre National de la Recherche Scientifique
			
 
				  *
			
 
				  * StarPU is free software; you can redistribute it and/or modify
			
@@ -79,6 +79,12 @@ int starpu_worker_get_count_by_type(enum starpu_archtype type);
 
				  * equal to STARPU_NMAXWORKERS. */
			
 
				 int starpu_worker_get_ids_by_type(enum starpu_archtype type, int *workerids, int maxsize);
			
 
				 
			
 
				+/* Return the identifier of the n-th worker of a specific type */
			
 
				+int starpu_worker_get_by_type(enum starpu_archtype type, int num);
			
 
				+
			
 
				+/* Return the identifier of the worker devid of a specific type */
			
 
				+int starpu_worker_get_by_devid(enum starpu_archtype type, int devid);
			
 
				+
			
 
				 /* StarPU associates a unique human readable string to each processing unit.
			
 
				  * This function copies at most the "maxlen" first bytes of the unique
			
 
				  * string associated to a worker identified by its identifier "id" into
			
--- a/src/core/perfmodel/perfmodel.c
+++ b/src/core/perfmodel/perfmodel.c
@@ -1,6 +1,6 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				- * Copyright (C) 2009-2012  Université de Bordeaux 1
			
 
				+ * Copyright (C) 2009-2013  Université de Bordeaux 1
			
 
				  * Copyright (C) 2010, 2011, 2012  Centre National de la Recherche Scientifique
			
 
				  * Copyright (C) 2011  Télécom-SudParis
			
 
				  *
			
@@ -224,7 +224,6 @@ double starpu_task_expected_conversion_time(struct starpu_task *task,
 
				 					    unsigned nimpl)
			
 
				 {
			
 
				 	unsigned i;
			
 
				-	int err;
			
 
				 	double sum = 0.0;
			
 
				 	int node;
			
 
				 
			
@@ -235,25 +234,22 @@ double starpu_task_expected_conversion_time(struct starpu_task *task,
 
				 	 */
			
 
				 #ifdef STARPU_USE_CPU
			
 
				 	int cpu_worker, cpu_node;
			
 
				-	err = starpu_worker_get_ids_by_type(STARPU_CPU_WORKER,
			
 
				-					    &cpu_worker, 1);
			
 
				-	if (err != 1 && err != -ERANGE)
			
 
				+	cpu_worker = starpu_worker_get_by_type(STARPU_CPU_WORKER, 0);
			
 
				+	if (cpu_worker == -1)
			
 
				 		return 0.0;
			
 
				 	cpu_node = starpu_worker_get_memory_node(cpu_worker);
			
 
				 #endif
			
 
				 #ifdef STARPU_USE_CUDA
			
 
				 	int cuda_worker, cuda_node;
			
 
				-	err = starpu_worker_get_ids_by_type(STARPU_CUDA_WORKER,
			
 
				-					    &cuda_worker, 1);
			
 
				-	if (err != 1 && err != -ERANGE)
			
 
				+	cuda_worker = starpu_worker_get_by_type(STARPU_CUDA_WORKER, 0);
			
 
				+	if (cuda_worker == -1)
			
 
				 		return 0.0;
			
 
				 	cuda_node = starpu_worker_get_memory_node(cuda_worker);
			
 
				 #endif
			
 
				 #ifdef STARPU_USE_OPENCL
			
 
				 	int opencl_worker, opencl_node;
			
 
				-	err = starpu_worker_get_ids_by_type(STARPU_OPENCL_WORKER,
			
 
				-					    &opencl_worker, 1);
			
 
				-	if (err != 1 && err != -ERANGE)
			
 
				+	opencl_worker = starpu_worker_get_by_type(STARPU_OPENCL_WORKER, 0);
			
 
				+	if (opencl_worker == -1)
			
 
				 		return 0.0;
			
 
				 
			
 
				 	opencl_node = starpu_worker_get_memory_node(opencl_worker);
			
--- a/src/core/workers.c
+++ b/src/core/workers.c
@@ -1243,6 +1243,40 @@ int starpu_worker_get_ids_by_type(enum starpu_archtype type, int *workerids, int
 
				 	return cnt;
			
 
				 }
			
 
				 
			
 
				+int starpu_worker_get_by_type(enum starpu_archtype type, int num)
			
 
				+{
			
 
				+	unsigned nworkers = starpu_worker_get_count();
			
 
				+
			
 
				+	int cnt = 0;
			
 
				+
			
 
				+	unsigned id;
			
 
				+	for (id = 0; id < nworkers; id++)
			
 
				+	{
			
 
				+		if (starpu_worker_get_type(id) == type)
			
 
				+		{
			
 
				+			if (num == cnt)
			
 
				+				return id;
			
 
				+			cnt++;
			
 
				+		}
			
 
				+	}
			
 
				+
			
 
				+	/* Not found */
			
 
				+	return -1;
			
 
				+}
			
 
				+
			
 
				+int starpu_worker_get_by_devid(enum starpu_archtype type, int devid)
			
 
				+{
			
 
				+	unsigned nworkers = starpu_worker_get_count();
			
 
				+
			
 
				+	unsigned id;
			
 
				+	for (id = 0; id < nworkers; id++)
			
 
				+		if (starpu_worker_get_type(id) == type && starpu_worker_get_devid(id) == devid)
			
 
				+			return id;
			
 
				+
			
 
				+	/* Not found */
			
 
				+	return -1;
			
 
				+}
			
 
				+
			
 
				 void starpu_worker_get_name(int id, char *dst, size_t maxlen)
			
 
				 {
			
 
				 	char *name = config.workers[id].name;
			
--- a/src/drivers/cpu/driver_cpu.c
+++ b/src/drivers/cpu/driver_cpu.c
@@ -178,13 +178,10 @@ static int execute_job_on_cpu(struct _starpu_job *j, struct starpu_task *worker_
 
				 static struct _starpu_worker*
			
 
				 _starpu_get_worker_from_driver(struct starpu_driver *d)
			
 
				 {
			
 
				-	int workers[d->id.cpu_id + 1];
			
 
				-	int nworkers;
			
 
				-	nworkers = starpu_worker_get_ids_by_type(STARPU_CPU_WORKER, workers, d->id.cpu_id+1);
			
 
				-	if (nworkers >= 0 && (unsigned) nworkers < d->id.cpu_id)
			
 
				-		return NULL; // No device was found.
			
 
				-
			
 
				-	return _starpu_get_worker_struct(workers[d->id.cpu_id]);
			
 
				+	int n = starpu_worker_get_by_devid(STARPU_CPU_WORKER, d->id.cpu_id);
			
 
				+	if (n == -1)
			
 
				+		return NULL;
			
 
				+	return _starpu_get_worker_struct(n);
			
 
				 }
			
 
				 
			
 
				 int _starpu_cpu_driver_init(struct starpu_driver *d)
			
--- a/src/drivers/cuda/driver_cuda.c
+++ b/src/drivers/cuda/driver_cuda.c
@@ -1,6 +1,6 @@
 
				 /* StarPU --- Runtime system for heterogeneous multicore architectures.
			
 
				  *
			
 
				- * Copyright (C) 2009-2012  Université de Bordeaux 1
			
 
				+ * Copyright (C) 2009-2013  Université de Bordeaux 1
			
 
				  * Copyright (C) 2010  Mehdi Juhoor <mjuhoor@gmail.com>
			
 
				  * Copyright (C) 2010, 2011, 2012  Centre National de la Recherche Scientifique
			
 
				  * Copyright (C) 2011  Télécom-SudParis
			
@@ -629,15 +629,11 @@ int _starpu_run_cuda(struct starpu_driver *d)
 
				 {
			
 
				 	STARPU_ASSERT(d && d->type == STARPU_CUDA_WORKER);
			
 
				 
			
 
				-	int workers[d->id.cuda_id + 1];
			
 
				-	int nworkers;
			
 
				-	nworkers = starpu_worker_get_ids_by_type(STARPU_CUDA_WORKER, workers, d->id.cuda_id+1);
			
 
				-	if (nworkers >= 0 && (unsigned) nworkers < d->id.cuda_id)
			
 
				-		return -ENODEV;
			
 
				-	
			
 
				+	int workerid = starpu_worker_get_by_devid(STARPU_CUDA_WORKER, d->id.cuda_id);
			
 
				+
			
 
				 	_STARPU_DEBUG("Running cuda %u from the application\n", d->id.cuda_id);
			
 
				 
			
 
				-	struct _starpu_worker *workerarg = _starpu_get_worker_struct(workers[d->id.cuda_id]);
			
 
				+	struct _starpu_worker *workerarg = _starpu_get_worker_struct(workerid);
			
 
				 
			
 
				 	workerarg->set = NULL;
			
 
				 	workerarg->worker_is_initialized = 0;