
The parallel greedy ("pgreedy") scheduling policy is a variation of the greedy
strategy that aggregates CPUs so that they can execute parallel tasks. Note
that if 8 CPUs are aggregated and a task uses only 4 of them, the remaining
4 CPUs stay idle.
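
For reference, a minimal sketch of how an application would select this
policy. It assumes the usual STARPU_SCHED environment variable, the
sched_policy_name field of struct starpu_conf, and starpu_conf_init(), none
of which appear in this diff:

	#include <starpu.h>

	int main(void)
	{
		struct starpu_conf conf;
		starpu_conf_init(&conf);

		/* Select the parallel greedy policy by name; equivalently,
		 * launch the application with STARPU_SCHED=pgreedy. */
		conf.sched_policy_name = "pgreedy";

		starpu_init(&conf);

		/* ... create and submit tasks as usual ... */

		starpu_shutdown();
		return 0;
	}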

Cédric Augonnet, 14 years ago
Parent commit: a59c85d82a
3 changed files with 252 additions and 2 deletions
  1. src/Makefile.am (+1, -0)
  2. src/core/sched_policy.c (+4, -2)
  3. src/sched_policies/parallel_greedy.c (+247, -0)

src/Makefile.am (+1, -0)

@@ -146,6 +146,7 @@ libstarpu_la_SOURCES = 						\
 	sched_policies/fifo_queues.c				\
 	sched_policies/detect_combined_workers.c		\
 	sched_policies/parallel_heft.c				\
+	sched_policies/parallel_greedy.c			\
 	drivers/driver_common/driver_common.c			\
 	datawizard/memory_nodes.c				\
 	datawizard/write_back.c					\

src/core/sched_policy.c (+4, -2)

@@ -46,8 +46,9 @@ extern struct starpu_sched_policy_s _starpu_sched_dmda_ready_policy;
 extern struct starpu_sched_policy_s _starpu_sched_dmda_sorted_policy;
 extern struct starpu_sched_policy_s _starpu_sched_eager_policy;
 extern struct starpu_sched_policy_s _starpu_sched_parallel_heft_policy;
+extern struct starpu_sched_policy_s _starpu_sched_pgreedy_policy;
 
-#define NPREDEFINED_POLICIES	10
+#define NPREDEFINED_POLICIES	11
 
 static struct starpu_sched_policy_s *predefined_policies[NPREDEFINED_POLICIES] = {
 	&_starpu_sched_ws_policy,
@@ -59,7 +60,8 @@ static struct starpu_sched_policy_s *predefined_policies[NPREDEFINED_POLICIES] =
 	&_starpu_sched_dmda_sorted_policy,
 	&_starpu_sched_random_policy,
 	&_starpu_sched_eager_policy,
-	&_starpu_sched_parallel_heft_policy
+	&_starpu_sched_parallel_heft_policy,
+	&_starpu_sched_pgreedy_policy
 };
 
 struct starpu_sched_policy_s *_starpu_get_sched_policy(void)

src/sched_policies/parallel_greedy.c (+247, -0)

@@ -0,0 +1,247 @@
+/*
+ * StarPU
+ * Copyright (C) Université Bordeaux 1, CNRS 2008-2010 (see AUTHORS file)
+ *
+ * This program is free software; you can redistribute it and/or modify
+ * it under the terms of the GNU Lesser General Public License as published by
+ * the Free Software Foundation; either version 2.1 of the License, or (at
+ * your option) any later version.
+ *
+ * This program is distributed in the hope that it will be useful, but
+ * WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
+ *
+ * See the GNU Lesser General Public License in COPYING.LGPL for more details.
+ */
+
+#include <core/workers.h>
+#include <sched_policies/fifo_queues.h>
+
+/* masters pick tasks from the central fifo; each local_fifo is the
+ * per-worker queue that a master fills for its slaves */
+static struct starpu_fifo_taskq_s *fifo;
+static struct starpu_fifo_taskq_s *local_fifo[STARPU_NMAXWORKERS];
+
+static int master_id[STARPU_NMAXWORKERS];
+
+static pthread_cond_t sched_cond;
+static pthread_mutex_t sched_mutex;
+
+static pthread_cond_t master_sched_cond[STARPU_NMAXWORKERS];
+static pthread_mutex_t master_sched_mutex[STARPU_NMAXWORKERS];
+
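+/* For each basic worker, record every combination it belongs to (the worker
+ * alone counts as a combination of size 1), together with the size of each
+ * combination. */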
+/* XXX instead of 10, we should use some "MAX combination .."*/
+static int possible_combinations_cnt[STARPU_NMAXWORKERS];
+static int possible_combinations[STARPU_NMAXWORKERS][10];
+static int possible_combinations_size[STARPU_NMAXWORKERS][10];
+
+static void initialize_pgreedy_policy(struct starpu_machine_topology_s *topology, 
+		   __attribute__ ((unused)) struct starpu_sched_policy_s *_policy) 
+{
+	/* masters pick tasks from that queue */
+	fifo = _starpu_create_fifo();
+
+	_starpu_sched_find_worker_combinations(topology);
+
+	unsigned workerid;
+	unsigned ncombinedworkers, nworkers;
+
+	nworkers = topology->nworkers;
+	ncombinedworkers = starpu_combined_worker_get_count();
+
+	/* Find the master of each worker. We first assign the worker as its
+	 * own master, and then iterate over the different worker combinations
+	 * to find the biggest combination containing this worker. */
+
+	for (workerid = 0; workerid < nworkers; workerid++)
+	{
+		int cnt = possible_combinations_cnt[workerid]++;
+		possible_combinations[workerid][cnt] = workerid;
+		possible_combinations_size[workerid][cnt] = 1;
+
+		master_id[workerid] = workerid;
+	}
+
+	unsigned i;
+	
+	for (i = 0; i < ncombinedworkers; i++)
+	{
+		int workerid = nworkers + i;
+
+		/* Note that we ASSUME that the workers are sorted by size! */
+		int *workers;
+		int size;
+		starpu_combined_worker_get_description(workerid, &size, &workers);
+
+		int master = workers[0];
+
+		int j;
+		for (j = 0; j < size; j++)
+		{
+			if (master_id[workers[j]] > master)
+				master_id[workers[j]] = master;
+
+			int cnt = possible_combinations_cnt[workers[j]]++;
+			possible_combinations[workers[j]][cnt] = workerid;
+			possible_combinations_size[workers[j]][cnt] = size;
+		}
+	}
+
+	PTHREAD_MUTEX_INIT(&sched_mutex, NULL);
+	PTHREAD_COND_INIT(&sched_cond, NULL);
+
+	for (workerid = 0; workerid < nworkers; workerid++)
+	{
+		PTHREAD_MUTEX_INIT(&master_sched_mutex[workerid], NULL);
+		PTHREAD_COND_INIT(&master_sched_cond[workerid], NULL);
+	}
+
+	for (workerid = 0; workerid < nworkers; workerid++)
+	{
+		/* slaves pick up tasks from their local queue; their master
+		 * puts tasks directly into that local list when a parallel
+		 * task comes in. */
+		local_fifo[workerid] = _starpu_create_fifo();
+
+		unsigned master = master_id[workerid];
+
+		/* All masters use the same condition/mutex */
+		if (master == workerid)
+		{
+			starpu_worker_set_sched_condition(workerid,
+				&sched_cond, &sched_mutex);
+		}
+		else {
+			starpu_worker_set_sched_condition(workerid,
+				&master_sched_cond[master],
+				&master_sched_mutex[master]);
+		}
+	}
+
+#if 0
+	for (workerid = 0; workerid < nworkers; workerid++)
+	{
+		fprintf(stderr, "MASTER of %d = %d\n", workerid, master_id[workerid]);
+	}
+#endif
+}
+
+static void deinitialize_pgreedy_policy(struct starpu_machine_topology_s *topology, 
+		   __attribute__ ((unused)) struct starpu_sched_policy_s *_policy) 
+{
+	/* TODO check that there is no task left in the queues */
+
+	unsigned workerid;
+
+	/* deallocate the per-worker queues and the central job queue */
+	for (workerid = 0; workerid < topology->nworkers; workerid++)
+		_starpu_destroy_fifo(local_fifo[workerid]);
+
+	_starpu_destroy_fifo(fifo);
+}
+
+static int push_task_pgreedy_policy(struct starpu_task *task)
+{
+	return _starpu_fifo_push_task(fifo, &sched_mutex, &sched_cond, task);
+}
+
+static struct starpu_task *pop_task_pgreedy_policy(void)
+{
+	int workerid = starpu_worker_get_id();
+
+	/* If this is not a CPU, then the worker simply grabs tasks from the fifo */
+	if (starpu_worker_get_type(workerid) != STARPU_CPU_WORKER)
+		return _starpu_fifo_pop_task(fifo, workerid);
+
+	int master = master_id[workerid];
+
+	if (master == workerid)
+	{
+		/* The worker is a master */
+		struct starpu_task *task = _starpu_fifo_pop_task(fifo, workerid);
+
+		if (!task)
+			return NULL;
+
+		/* Find the largest compatible worker combination */
+		int best_size = -1;
+		int best_workerid = -1;
+		int i;
+		for (i = 0; i < possible_combinations_cnt[workerid]; i++)
+		{
+			if (possible_combinations_size[workerid][i] > best_size)
+			{
+				int combined_worker = possible_combinations[workerid][i];
+				if (starpu_combined_worker_may_execute_task(combined_worker, task))
+				{
+					best_size = possible_combinations_size[workerid][i];
+					best_workerid = combined_worker;
+				}
+			}
+		} 
+
+		/* In case nobody can execute this task, we let the master
+		 * worker take it anyway, so that it can discard it
+		 * afterward. */
+		if (best_workerid == -1)
+			return task;
+		
+		/* Is this a basic worker or a combined worker? */
+		int nbasic_workers = (int)starpu_worker_get_count();
+		int is_basic_worker = (best_workerid < nbasic_workers);
+
+		if (is_basic_worker)
+		{
+			/* The master is alone */
+			return task;
+		}
+		else {
+			/* The master needs to dispatch the task between the
+			 * different combined workers */
+			struct starpu_combined_worker_s *combined_worker;
+			combined_worker = _starpu_get_combined_worker_struct(best_workerid);
+			int worker_size = combined_worker->worker_size;
+			int *combined_workerid = combined_worker->combined_workerid;
+
+			starpu_job_t j = _starpu_get_job_associated_to_task(task);
+			j->task_size = worker_size;
+			j->combined_workerid = best_workerid;
+			j->active_task_alias_count = 0;
+
+			//fprintf(stderr, "POP -> size %d best_size %d\n", worker_size, best_size);
+
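+			/* Every member of the combined worker synchronizes
+			 * on these barriers before and after running the
+			 * parallel task. */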
+			PTHREAD_BARRIER_INIT(&j->before_work_barrier, NULL, worker_size);
+			PTHREAD_BARRIER_INIT(&j->after_work_barrier, NULL, worker_size);
+
+			struct starpu_task *master_alias = NULL;
+
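+			/* Create one alias of the task per member of the
+			 * combined worker: the rank-0 alias is returned to
+			 * the master itself, the others are pushed to the
+			 * slaves' local queues. */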
+			for (i = 0; i < worker_size; i++)
+			{
+				struct starpu_task *alias = _starpu_create_task_alias(task);
+				int local_worker = combined_workerid[i];
+
+				if (i > 0)
+				{
+			//		fprintf(stderr, "push alias for rank i %d in fifo %p\n", i, local_fifo[local_worker]);
+					_starpu_fifo_push_task(local_fifo[local_worker], &master_sched_mutex[master], &master_sched_cond[master], alias);
+				}
+				else {
+					master_alias = alias;
+				}
+			}
+
+			return master_alias;
+		}
+
+	}
+	else {
+		/* The worker is a slave */
+		return _starpu_fifo_pop_task(local_fifo[workerid], workerid);
+	}
+}
+
+struct starpu_sched_policy_s _starpu_sched_pgreedy_policy = {
+	.init_sched = initialize_pgreedy_policy,
+	.deinit_sched = deinitialize_pgreedy_policy,
+	.push_task = push_task_pgreedy_policy,
+	.push_prio_task = push_task_pgreedy_policy,
+	.pop_task = pop_task_pgreedy_policy,
+	.post_exec_hook = NULL,
+	.pop_every_task = NULL,
+	.policy_name = "pgreedy",
+	.policy_description = "parallel greedy policy"
+};