| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533 |
- /* StarPU --- Runtime system for heterogeneous multicore architectures.
- *
- * Copyright (C) 2010-2011 Université de Bordeaux 1
- * Copyright (C) 2010-2011 Centre National de la Recherche Scientifique
- *
- * StarPU is free software; you can redistribute it and/or modify
- * it under the terms of the GNU Lesser General Public License as published by
- * the Free Software Foundation; either version 2.1 of the License, or (at
- * your option) any later version.
- *
- * StarPU is distributed in the hope that it will be useful, but
- * WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
- *
- * See the GNU Lesser General Public License in COPYING.LGPL for more details.
- */
- #include <pthread.h>
- #include <starpu.h>
- #include <common/config.h>
- #include <common/utils.h>
- #include <core/sched_policy.h>
- #include <profiling/profiling.h>
- #include <common/barrier.h>
- static struct starpu_sched_policy policy; /* The active scheduling policy: its method pointers are filled in by load_sched_policy() and it is handed out by _starpu_get_sched_policy(). */
/* Non-zero when task inputs should be prefetched on the memory node of the
 * worker a task is pushed to. */
static int use_prefetch = 0;

/* Return the current value of the prefetch flag. */
int starpu_get_prefetch_flag(void)
{
	const int prefetch_enabled = use_prefetch;

	return prefetch_enabled;
}
- /*
- * Predefined policies
- */
- extern struct starpu_sched_policy _starpu_sched_ws_policy;
- extern struct starpu_sched_policy _starpu_sched_prio_policy;
- extern struct starpu_sched_policy _starpu_sched_random_policy;
- extern struct starpu_sched_policy _starpu_sched_dm_policy;
- extern struct starpu_sched_policy _starpu_sched_dmda_policy;
- extern struct starpu_sched_policy _starpu_sched_dmda_ready_policy;
- extern struct starpu_sched_policy _starpu_sched_dmda_sorted_policy;
- extern struct starpu_sched_policy _starpu_sched_eager_policy;
- extern struct starpu_sched_policy _starpu_sched_parallel_heft_policy;
- extern struct starpu_sched_policy _starpu_sched_pgreedy_policy;
- extern struct starpu_sched_policy heft_policy;
- static struct starpu_sched_policy *predefined_policies[] =
- {
- &_starpu_sched_ws_policy,
- &_starpu_sched_prio_policy,
- &_starpu_sched_dm_policy,
- &_starpu_sched_dmda_policy,
- &heft_policy,
- &_starpu_sched_dmda_ready_policy,
- &_starpu_sched_dmda_sorted_policy,
- &_starpu_sched_random_policy,
- &_starpu_sched_eager_policy,
- &_starpu_sched_parallel_heft_policy,
- &_starpu_sched_pgreedy_policy
- };
- struct starpu_sched_policy *_starpu_get_sched_policy(void)
- {
- return &policy;
- }
- /*
- * Methods to initialize the scheduling policy
- */
- static void load_sched_policy(struct starpu_sched_policy *sched_policy)
- {
- STARPU_ASSERT(sched_policy);
- #ifdef STARPU_VERBOSE
- if (sched_policy->policy_name)
- {
- if (sched_policy->policy_description)
- _STARPU_DEBUG("Use %s scheduler (%s)\n", sched_policy->policy_name, sched_policy->policy_description);
- else
- _STARPU_DEBUG("Use %s scheduler \n", sched_policy->policy_name);
- }
- #endif
- policy.init_sched = sched_policy->init_sched;
- policy.deinit_sched = sched_policy->deinit_sched;
- policy.push_task = sched_policy->push_task;
- policy.push_task_notify = sched_policy->push_task_notify;
- policy.pop_task = sched_policy->pop_task;
- policy.post_exec_hook = sched_policy->post_exec_hook;
- policy.pop_every_task = sched_policy->pop_every_task;
- }
- static struct starpu_sched_policy *find_sched_policy_from_name(const char *policy_name)
- {
- if (!policy_name)
- return NULL;
- unsigned i;
- for (i = 0; i < sizeof(predefined_policies)/sizeof(predefined_policies[0]); i++)
- {
- struct starpu_sched_policy *p;
- p = predefined_policies[i];
- if (p->policy_name)
- {
- if (strcmp(policy_name, p->policy_name) == 0)
- {
- /* we found a policy with the requested name */
- return p;
- }
- }
- }
- fprintf(stderr, "Warning: scheduling policy \"%s\" was not found, try \"help\" to get a list\n", policy_name);
- /* nothing was found */
- return NULL;
- }
- static void display_sched_help_message(void)
- {
- const char *sched_env = getenv("STARPU_SCHED");
- if (sched_env && (strcmp(sched_env, "help") == 0))
- {
- fprintf(stderr, "STARPU_SCHED can be either of\n");
- /* display the description of all predefined policies */
- unsigned i;
- for (i = 0; i < sizeof(predefined_policies)/sizeof(predefined_policies[0]); i++)
- {
- struct starpu_sched_policy *p;
- p = predefined_policies[i];
- fprintf(stderr, "%s\t-> %s\n", p->policy_name, p->policy_description);
- }
- }
- }
- static struct starpu_sched_policy *select_sched_policy(struct _starpu_machine_config *config)
- {
- struct starpu_sched_policy *selected_policy = NULL;
- struct starpu_conf *user_conf = config->user_conf;
- /* First, we check whether the application explicitely gave a scheduling policy or not */
- if (user_conf && (user_conf->sched_policy))
- return user_conf->sched_policy;
- /* Otherwise, we look if the application specified the name of a policy to load */
- const char *sched_pol_name;
- if (user_conf && (user_conf->sched_policy_name))
- {
- sched_pol_name = user_conf->sched_policy_name;
- }
- else
- {
- sched_pol_name = getenv("STARPU_SCHED");
- }
- if (sched_pol_name)
- selected_policy = find_sched_policy_from_name(sched_pol_name);
- /* Perhaps there was no policy that matched the name */
- if (selected_policy)
- return selected_policy;
- /* If no policy was specified, we use the greedy policy as a default */
- return &_starpu_sched_eager_policy;
- }
- void _starpu_init_sched_policy(struct _starpu_machine_config *config)
- {
- /* Perhaps we have to display some help */
- display_sched_help_message();
- /* Prefetch is activated by default */
- use_prefetch = starpu_get_env_number("STARPU_PREFETCH");
- if (use_prefetch == -1)
- use_prefetch = 1;
- /* By default, we don't calibrate */
- unsigned do_calibrate = 0;
- if (config->user_conf && (config->user_conf->calibrate != -1))
- {
- do_calibrate = config->user_conf->calibrate;
- }
- else
- {
- int res = starpu_get_env_number("STARPU_CALIBRATE");
- do_calibrate = (res < 0)?0:(unsigned)res;
- }
- _starpu_set_calibrate_flag(do_calibrate);
- struct starpu_sched_policy *selected_policy;
- selected_policy = select_sched_policy(config);
- load_sched_policy(selected_policy);
- policy.init_sched(&config->topology, &policy);
- }
- void _starpu_deinit_sched_policy(struct _starpu_machine_config *config)
- {
- if (policy.deinit_sched)
- policy.deinit_sched(&config->topology, &policy);
- }
- /* Enqueue a task into the list of tasks explicitely attached to a worker. In
- * case workerid identifies a combined worker, a task will be enqueued into
- * each worker of the combination. */
- static int _starpu_push_task_on_specific_worker(struct starpu_task *task, int workerid)
- {
- int nbasic_workers = (int)starpu_worker_get_count();
- /* Is this a basic worker or a combined worker ? */
- int is_basic_worker = (workerid < nbasic_workers);
- unsigned memory_node;
- struct _starpu_worker *worker = NULL;
- struct _starpu_combined_worker *combined_worker = NULL;
- if (is_basic_worker)
- {
- worker = _starpu_get_worker_struct(workerid);
- memory_node = worker->memory_node;
- }
- else
- {
- combined_worker = _starpu_get_combined_worker_struct(workerid);
- memory_node = combined_worker->memory_node;
- }
- if (use_prefetch)
- starpu_prefetch_task_input_on_node(task, memory_node);
- if (policy.push_task_notify)
- policy.push_task_notify(task, workerid);
- if (is_basic_worker)
- {
- unsigned node = starpu_worker_get_memory_node(workerid);
- if (_starpu_task_uses_multiformat_handles(task))
- {
- unsigned i;
- for (i = 0; i < task->cl->nbuffers; i++)
- {
- struct starpu_task *conversion_task;
- starpu_data_handle_t handle;
- handle = task->handles[i];
- if (!_starpu_handle_needs_conversion_task(handle, node))
- continue;
- conversion_task = _starpu_create_conversion_task(handle, node);
- conversion_task->mf_skip = 1;
- conversion_task->execute_on_a_specific_worker = 1;
- conversion_task->workerid = workerid;
- _starpu_task_submit_conversion_task(conversion_task, workerid);
- //_STARPU_DEBUG("Pushing a conversion task\n");
- }
- for (i = 0; i < task->cl->nbuffers; i++)
- task->handles[i]->mf_node = node;
- }
- return _starpu_push_local_task(worker, task, 0);
- }
- else
- {
- /* This is a combined worker so we create task aliases */
- int worker_size = combined_worker->worker_size;
- int *combined_workerid = combined_worker->combined_workerid;
- int ret = 0;
- int i;
- struct _starpu_job *j = _starpu_get_job_associated_to_task(task);
- j->task_size = worker_size;
- j->combined_workerid = workerid;
- j->active_task_alias_count = 0;
- _STARPU_PTHREAD_BARRIER_INIT(&j->before_work_barrier, NULL, worker_size);
- _STARPU_PTHREAD_BARRIER_INIT(&j->after_work_barrier, NULL, worker_size);
- for (i = 0; i < worker_size; i++)
- {
- struct starpu_task *alias = _starpu_create_task_alias(task);
- worker = _starpu_get_worker_struct(combined_workerid[i]);
- ret |= _starpu_push_local_task(worker, alias, 0);
- }
- return ret;
- }
- }
- /* the generic interface that call the proper underlying implementation */
- int _starpu_push_task(struct _starpu_job *j, unsigned job_is_already_locked)
- {
- struct starpu_task *task = j->task;
- _STARPU_LOG_IN();
- _starpu_increment_nready_tasks();
- task->status = STARPU_TASK_READY;
- _starpu_profiling_set_task_push_start_time(task);
- /* in case there is no codelet associated to the task (that's a control
- * task), we directly execute its callback and enforce the
- * corresponding dependencies */
- if (task->cl == NULL)
- {
- _starpu_handle_job_termination(j, job_is_already_locked);
- _STARPU_LOG_OUT_TAG("handle_job_termination");
- return 0;
- }
- int ret;
- if (STARPU_UNLIKELY(task->execute_on_a_specific_worker))
- {
- ret = _starpu_push_task_on_specific_worker(task, task->workerid);
- }
- else
- {
- STARPU_ASSERT(policy.push_task);
- ret = policy.push_task(task);
- }
- _starpu_profiling_set_task_push_end_time(task);
- _STARPU_LOG_OUT();
- return ret;
- }
- /*
- * Given a handle that needs to be converted in order to be used on the given
- * node, returns a task that takes care of the conversion.
- */
- struct starpu_task *_starpu_create_conversion_task(starpu_data_handle_t handle,
- unsigned int node)
- {
- struct starpu_task *conversion_task;
- struct starpu_multiformat_interface *format_interface;
- enum _starpu_node_kind node_kind;
- conversion_task = starpu_task_create();
- conversion_task->synchronous = 0;
- conversion_task->buffers[0].handle = handle;
- conversion_task->buffers[0].mode = STARPU_RW;
- /* The node does not really matter here */
- format_interface = (struct starpu_multiformat_interface *) starpu_data_get_interface_on_node(handle, 0);
- node_kind = _starpu_get_node_kind(node);
- handle->refcnt++;
- handle->busy_count++;
- switch(node_kind)
- {
- case STARPU_CPU_RAM:
- switch (_starpu_get_node_kind(handle->mf_node))
- {
- case STARPU_CPU_RAM:
- STARPU_ASSERT(0);
- #ifdef STARPU_USE_CUDA
- case STARPU_CUDA_RAM:
- conversion_task->cl = format_interface->ops->cuda_to_cpu_cl;
- break;
- #endif
- #ifdef STARPU_USE_OPENCL
- case STARPU_OPENCL_RAM:
- conversion_task->cl = format_interface->ops->opencl_to_cpu_cl;
- break;
- #endif
- default:
- fprintf(stderr, "Oops : %d\n", handle->mf_node);
- STARPU_ASSERT(0);
- }
- break;
- #ifdef STARPU_USE_CUDA
- case STARPU_CUDA_RAM:
- conversion_task->cl = format_interface->ops->cpu_to_cuda_cl;
- break;
- #endif
- #ifdef STARPU_USE_OPENCL
- case STARPU_OPENCL_RAM:
- conversion_task->cl = format_interface->ops->cpu_to_opencl_cl;
- break;
- #endif
- case STARPU_SPU_LS: /* Not supported */
- default:
- STARPU_ASSERT(0);
- }
- return conversion_task;
- }
- struct starpu_task *_starpu_pop_task(struct _starpu_worker *worker)
- {
- struct starpu_task *task;
- /* We can't tell in advance which task will be picked up, so we measure
- * a timestamp, and will attribute it afterwards to the task. */
- int profiling = starpu_profiling_status_get();
- struct timespec pop_start_time;
- if (profiling)
- _starpu_clock_gettime(&pop_start_time);
- pick:
- /* perhaps there is some local task to be executed first */
- task = _starpu_pop_local_task(worker);
- if (!task && policy.pop_task)
- task = policy.pop_task();
- if (!task)
- return NULL;
- /* Make sure we do not bother with all the multiformat-specific code if
- * it is not necessary. */
- if (!_starpu_task_uses_multiformat_handles(task))
- goto profiling;
- /* This is either a conversion task, or a regular task for which the
- * conversion tasks have already been created and submitted */
- if (task->mf_skip)
- goto profiling;
- int worker_id = starpu_worker_get_id();
- if (!starpu_worker_can_execute_task(worker_id, task, 0))
- return task;
- unsigned node = starpu_worker_get_memory_node(worker_id);
- /*
- * We do have a task that uses multiformat handles. Let's create the
- * required conversion tasks.
- */
- unsigned i;
- for (i = 0; i < task->cl->nbuffers; i++)
- {
- struct starpu_task *conversion_task;
- starpu_data_handle_t handle;
- handle = task->handles[i];
- if (!_starpu_handle_needs_conversion_task(handle, node))
- continue;
- conversion_task = _starpu_create_conversion_task(handle, node);
- conversion_task->mf_skip = 1;
- conversion_task->execute_on_a_specific_worker = 1;
- conversion_task->workerid = worker_id;
- /*
- * Next tasks will need to know where these handles have gone.
- */
- handle->mf_node = node;
- _starpu_task_submit_conversion_task(conversion_task, worker_id);
- }
- task->mf_skip = 1;
- starpu_task_list_push_front(&worker->local_tasks, task);
- goto pick;
- profiling:
- /* Note that we may get a NULL task in case the scheduler was unlocked
- * for some reason. */
- if (profiling)
- {
- struct starpu_task_profiling_info *profiling_info;
- profiling_info = task->profiling_info;
- /* The task may have been created before profiling was enabled,
- * so we check if the profiling_info structure is available
- * even though we already tested if profiling is enabled. */
- if (profiling_info)
- {
- memcpy(&profiling_info->pop_start_time,
- &pop_start_time, sizeof(struct timespec));
- _starpu_clock_gettime(&profiling_info->pop_end_time);
- }
- }
- return task;
- }
- struct starpu_task *_starpu_pop_every_task(void)
- {
- STARPU_ASSERT(policy.pop_every_task);
- /* TODO set profiling info */
- return policy.pop_every_task();
- }
- void _starpu_sched_post_exec_hook(struct starpu_task *task)
- {
- if (policy.post_exec_hook)
- policy.post_exec_hook(task);
- }
- void _starpu_wait_on_sched_event(void)
- {
- struct _starpu_worker *worker = _starpu_get_local_worker_key();
- _STARPU_PTHREAD_MUTEX_LOCK(worker->sched_mutex);
- _starpu_handle_all_pending_node_data_requests(worker->memory_node);
- if (_starpu_machine_is_running())
- {
- #ifndef STARPU_NON_BLOCKING_DRIVERS
- _STARPU_PTHREAD_COND_WAIT(worker->sched_cond,
- worker->sched_mutex);
- #endif
- }
- _STARPU_PTHREAD_MUTEX_UNLOCK(worker->sched_mutex);
- }
/* Put TASK directly into the local queue of the worker identified by
 * WORKERID. This lets a scheduling policy rely on the local queues of the
 * workers instead of creating its own queues when the former are sufficient.
 *
 * If BACK is not null, the task is put at the back of the queue, where the
 * worker will pop tasks first. Setting BACK to 0 therefore ensures a FIFO
 * ordering.
 *
 * Returns the value of _starpu_push_local_task(). */
int starpu_push_local_task(int workerid, struct starpu_task *task, int back)
{
	return _starpu_push_local_task(_starpu_get_worker_struct(workerid), task, back);
}
|