123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819 |
- /* StarPU --- Runtime system for heterogeneous multicore architectures.
- *
- * Copyright (C) 2012, 2016, 2017 INRIA
- *
- * StarPU is free software; you can redistribute it and/or modify
- * it under the terms of the GNU Lesser General Public License as published by
- * the Free Software Foundation; either version 2.1 of the License, or (at
- * your option) any later version.
- *
- * StarPU is distributed in the hope that it will be useful, but
- * WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
- *
- * See the GNU Lesser General Public License in COPYING.LGPL for more details.
- */
- #include <starpu.h>
- #include <common/config.h>
- #include <common/utils.h>
- #include <drivers/mp_common/mp_common.h>
- #include <drivers/mpi/driver_mpi_common.h>
- #include <datawizard/interfaces/data_interface.h>
- #include <common/barrier.h>
- #include <core/workers.h>
- #include <common/barrier_counter.h>
- #ifdef STARPU_USE_MIC
- #include <common/COISysInfo_common.h>
- #endif
- #include "sink_common.h"
- /* Return the sink kind of the running process, based on the value of the
- * STARPU_SINK environment variable.
- * If there is no valid value retrieved, return STARPU_INVALID_KIND
- */
- static enum _starpu_mp_node_kind _starpu_sink_common_get_kind(void)
- {
- /* Environment varible STARPU_SINK must be defined when running on sink
- * side : let's use it to get the kind of node we're running on */
- char *node_kind = starpu_getenv("STARPU_SINK");
- STARPU_ASSERT(node_kind);
- if (!strcmp(node_kind, "STARPU_MIC"))
- return STARPU_NODE_MIC_SINK;
- else if (!strcmp(node_kind, "STARPU_SCC"))
- return STARPU_NODE_SCC_SINK;
- else if (!strcmp(node_kind, "STARPU_MPI_MS"))
- return STARPU_NODE_MPI_SINK;
- else
- return STARPU_NODE_INVALID_KIND;
- }
- /* Send to host the number of cores of the sink device
- */
- static void _starpu_sink_common_get_nb_cores (struct _starpu_mp_node *node)
- {
- // Process packet received from `_starpu_src_common_sink_cores'.
- _starpu_mp_common_send_command (node, STARPU_MP_COMMAND_ANSWER_SINK_NBCORES,
- &node->nb_cores, sizeof (int));
- }
- /* Send to host the address of the function given in parameter
- */
- static void _starpu_sink_common_lookup(const struct _starpu_mp_node *node,
- char *func_name)
- {
- void (*func)(void);
- func = node->lookup(node,func_name);
- //_STARPU_DEBUG("Looked up %s, got %p\n", func_name, func);
- /* If we couldn't find the function, let's send an error to the host.
- * The user probably made a mistake in the name */
- if (func)
- _starpu_mp_common_send_command(node, STARPU_MP_COMMAND_ANSWER_LOOKUP,
- &func, sizeof(func));
- else
- _starpu_mp_common_send_command(node, STARPU_MP_COMMAND_ERROR_LOOKUP,
- NULL, 0);
- }
- /* Allocate a memory space and send the address of this space to the host
- */
- void _starpu_sink_common_allocate(const struct _starpu_mp_node *mp_node,
- void *arg, int arg_size)
- {
- STARPU_ASSERT(arg_size == sizeof(size_t));
- void *addr;
- _STARPU_MALLOC(addr, *(size_t *)(arg));
- /* If the allocation fail, let's send an error to the host.
- */
- if (addr)
- _starpu_mp_common_send_command(mp_node, STARPU_MP_COMMAND_ANSWER_ALLOCATE,
- &addr, sizeof(addr));
- else
- _starpu_mp_common_send_command(mp_node, STARPU_MP_COMMAND_ERROR_ALLOCATE,
- NULL, 0);
- }
- void _starpu_sink_common_free(const struct _starpu_mp_node *mp_node STARPU_ATTRIBUTE_UNUSED,
- void *arg, int arg_size)
- {
- STARPU_ASSERT(arg_size == sizeof(void *));
- free(*(void **)(arg));
- }
- static void _starpu_sink_common_copy_from_host_sync(const struct _starpu_mp_node *mp_node,
- void *arg, int arg_size)
- {
- STARPU_ASSERT(arg_size == sizeof(struct _starpu_mp_transfer_command));
- struct _starpu_mp_transfer_command *cmd = (struct _starpu_mp_transfer_command *)arg;
- mp_node->dt_recv(mp_node, cmd->addr, cmd->size, NULL);
- }
- static void _starpu_sink_common_copy_from_host_async(struct _starpu_mp_node *mp_node,
- void *arg, int arg_size)
- {
- STARPU_ASSERT(arg_size == sizeof(struct _starpu_mp_transfer_command));
- struct _starpu_mp_transfer_command *cmd = (struct _starpu_mp_transfer_command *)arg;
- /* For asynchronous transfers, we store events to test them later when they are finished */
- struct _starpu_mp_event * sink_event = _starpu_mp_event_new();
- /* Save the command to send */
- sink_event->answer_cmd = STARPU_MP_COMMAND_RECV_FROM_HOST_ASYNC_COMPLETED;
- sink_event->remote_event = cmd->event;
- /* Set the sender (host) ready because we don't want to wait its ack */
- struct _starpu_async_channel * async_channel = &sink_event->event;
- async_channel->type = STARPU_UNUSED;
- async_channel->starpu_mp_common_finished_sender = -1;
- async_channel->starpu_mp_common_finished_receiver = 0;
- async_channel->polling_node_receiver = NULL;
- async_channel->polling_node_sender = NULL;
- mp_node->dt_recv(mp_node, cmd->addr, cmd->size, &sink_event->event);
- /* Push event on the list */
- _starpu_mp_event_list_push_back(&mp_node->event_list, sink_event);
- }
- static void _starpu_sink_common_copy_to_host_sync(const struct _starpu_mp_node *mp_node,
- void *arg, int arg_size)
- {
- STARPU_ASSERT(arg_size == sizeof(struct _starpu_mp_transfer_command));
- struct _starpu_mp_transfer_command *cmd = (struct _starpu_mp_transfer_command *)arg;
- /* Save values before sending command to prevent the overwriting */
- size_t size = cmd->size;
- void * addr = cmd->addr;
- _starpu_mp_common_send_command(mp_node, STARPU_MP_COMMAND_SEND_TO_HOST, NULL, 0);
- mp_node->dt_send(mp_node, addr, size, NULL);
- }
- static void _starpu_sink_common_copy_to_host_async(struct _starpu_mp_node *mp_node,
- void *arg, int arg_size)
- {
- STARPU_ASSERT(arg_size == sizeof(struct _starpu_mp_transfer_command));
- struct _starpu_mp_transfer_command *cmd = (struct _starpu_mp_transfer_command *)arg;
- /* For asynchronous transfers, we need to say dt_send that we are in async mode
- * but we don't push event on list because we don't need to know if it's finished
- */
- struct _starpu_mp_event * sink_event = _starpu_mp_event_new();
- /* Save the command to send */
- sink_event->answer_cmd = STARPU_MP_COMMAND_SEND_TO_HOST_ASYNC_COMPLETED;
- sink_event->remote_event = cmd->event;
- /* Set the receiver (host) ready because we don't want to wait its ack */
- struct _starpu_async_channel * async_channel = &sink_event->event;
- async_channel->type = STARPU_UNUSED;
- async_channel->starpu_mp_common_finished_sender = 0;
- async_channel->starpu_mp_common_finished_receiver = -1;
- async_channel->polling_node_receiver = NULL;
- async_channel->polling_node_sender = NULL;
- mp_node->dt_send(mp_node, cmd->addr, cmd->size, &sink_event->event);
- /* Push event on the list */
- _starpu_mp_event_list_push_back(&mp_node->event_list, sink_event);
- }
- static void _starpu_sink_common_copy_from_sink_sync(const struct _starpu_mp_node *mp_node,
- void *arg, int arg_size)
- {
- STARPU_ASSERT(arg_size == sizeof(struct _starpu_mp_transfer_command_to_device));
- struct _starpu_mp_transfer_command_to_device *cmd = (struct _starpu_mp_transfer_command_to_device *)arg;
- mp_node->dt_recv_from_device(mp_node, cmd->devid, cmd->addr, cmd->size, NULL);
- _starpu_mp_common_send_command(mp_node, STARPU_MP_COMMAND_TRANSFER_COMPLETE, NULL, 0);
- }
- static void _starpu_sink_common_copy_from_sink_async(struct _starpu_mp_node *mp_node,
- void *arg, int arg_size)
- {
- STARPU_ASSERT(arg_size == sizeof(struct _starpu_mp_transfer_command_to_device));
- struct _starpu_mp_transfer_command_to_device *cmd = (struct _starpu_mp_transfer_command_to_device *)arg;
- /* For asynchronous transfers, we store events to test them later when they are finished
- */
- struct _starpu_mp_event * sink_event = _starpu_mp_event_new();
- /* Save the command to send */
- sink_event->answer_cmd = STARPU_MP_COMMAND_RECV_FROM_SINK_ASYNC_COMPLETED;
- sink_event->remote_event = cmd->event;
- /* Set the sender ready because we don't want to wait its ack */
- struct _starpu_async_channel * async_channel = &sink_event->event;
- async_channel->type = STARPU_UNUSED;
- async_channel->starpu_mp_common_finished_sender = -1;
- async_channel->starpu_mp_common_finished_receiver = 0;
- async_channel->polling_node_receiver = NULL;
- async_channel->polling_node_sender = NULL;
- mp_node->dt_recv_from_device(mp_node, cmd->devid, cmd->addr, cmd->size, &sink_event->event);
- /* Push event on the list */
- _starpu_mp_event_list_push_back(&mp_node->event_list, sink_event);
- }
- static void _starpu_sink_common_copy_to_sink_sync(const struct _starpu_mp_node *mp_node,
- void *arg, int arg_size)
- {
- STARPU_ASSERT(arg_size == sizeof(struct _starpu_mp_transfer_command_to_device));
- struct _starpu_mp_transfer_command_to_device *cmd = (struct _starpu_mp_transfer_command_to_device *)arg;
- mp_node->dt_send_to_device(mp_node, cmd->devid, cmd->addr, cmd->size, NULL);
- }
- static void _starpu_sink_common_copy_to_sink_async(struct _starpu_mp_node *mp_node,
- void *arg, int arg_size)
- {
- STARPU_ASSERT(arg_size == sizeof(struct _starpu_mp_transfer_command_to_device));
- struct _starpu_mp_transfer_command_to_device *cmd = (struct _starpu_mp_transfer_command_to_device *)arg;
- /* For asynchronous transfers, we need to say dt_send that we are in async mode
- * but we don't push event on list because we don't need to know if it's finished
- */
- struct _starpu_mp_event * sink_event = _starpu_mp_event_new();
- /* Save the command to send */
- sink_event->answer_cmd = STARPU_MP_COMMAND_SEND_TO_SINK_ASYNC_COMPLETED;
- sink_event->remote_event = cmd->event;
- /* Set the receiver ready because we don't want to wait its ack */
- struct _starpu_async_channel * async_channel = &sink_event->event;
- async_channel->type = STARPU_UNUSED;
- async_channel->starpu_mp_common_finished_sender = 0;
- async_channel->starpu_mp_common_finished_receiver = -1;
- async_channel->polling_node_receiver = NULL;
- async_channel->polling_node_sender = NULL;
- mp_node->dt_send_to_device(mp_node, cmd->devid, cmd->addr, cmd->size, &sink_event->event);
- /* Push event on the list */
- _starpu_mp_event_list_push_back(&mp_node->event_list, sink_event);
- }
- /* Receive workers and combined workers and store them into the struct config
- */
- static void _starpu_sink_common_recv_workers(struct _starpu_mp_node * node, void *arg, int arg_size)
- {
- /* Retrieve information from the message */
- STARPU_ASSERT(arg_size == (sizeof(int)*5));
- uintptr_t arg_ptr = (uintptr_t) arg;
- int i;
- int nworkers = *(int *)arg_ptr;
- arg_ptr += sizeof(nworkers);
- int worker_size = *(int *)arg_ptr;
- arg_ptr += sizeof(worker_size);
- int combined_worker_size = *(int *)arg_ptr;
- arg_ptr += sizeof(combined_worker_size);
- int baseworkerid = *(int *)arg_ptr;
- arg_ptr += sizeof(baseworkerid);
- struct _starpu_machine_config *config = _starpu_get_machine_config();
- config->topology.nworkers = *(int *)arg_ptr;
- /* Retrieve workers */
- struct _starpu_worker * workers = &config->workers[baseworkerid];
- node->dt_recv(node,workers,worker_size, NULL);
- /* Update workers to have coherent field */
- for(i=0; i<nworkers; i++)
- {
- workers[i].config = config;
- STARPU_PTHREAD_MUTEX_INIT(&workers[i].mutex,NULL);
- STARPU_PTHREAD_MUTEX_DESTROY(&workers[i].mutex);
- STARPU_PTHREAD_COND_INIT(&workers[i].started_cond,NULL);
- STARPU_PTHREAD_COND_DESTROY(&workers[i].started_cond);
- STARPU_PTHREAD_COND_INIT(&workers[i].ready_cond,NULL);
- STARPU_PTHREAD_COND_DESTROY(&workers[i].ready_cond);
- STARPU_PTHREAD_MUTEX_INIT(&workers[i].sched_mutex,NULL);
- STARPU_PTHREAD_MUTEX_DESTROY(&workers[i].sched_mutex);
- STARPU_PTHREAD_COND_INIT(&workers[i].sched_cond,NULL);
- STARPU_PTHREAD_COND_DESTROY(&workers[i].sched_cond);
- workers[i].current_task = NULL;
- workers[i].set = NULL;
- }
- /* Retrieve combined workers */
- struct _starpu_combined_worker * combined_workers = config->combined_workers;
- node->dt_recv(node, combined_workers, combined_worker_size, NULL);
- node->baseworkerid = baseworkerid;
- STARPU_PTHREAD_BARRIER_WAIT(&node->init_completed_barrier);
- }
- /* Function looping on the sink, waiting for tasks to execute.
- * If the caller is the host, don't do anything.
- */
- void _starpu_sink_common_worker(void)
- {
- struct _starpu_mp_node *node = NULL;
- enum _starpu_mp_command command = STARPU_MP_COMMAND_EXIT;
- int arg_size = 0;
- void *arg = NULL;
- int exit_starpu = 0;
- enum _starpu_mp_node_kind node_kind = _starpu_sink_common_get_kind();
- if (node_kind == STARPU_NODE_INVALID_KIND)
- _STARPU_ERROR("No valid sink kind retrieved, use the"
- "STARPU_SINK environment variable to specify"
- "this\n");
- /* Create and initialize the node */
- node = _starpu_mp_common_node_create(node_kind, -1);
- starpu_pthread_key_t worker_key;
- STARPU_PTHREAD_KEY_CREATE(&worker_key, NULL);
- while (!exit_starpu)
- {
- /* If we have received a message */
- if(node->mp_recv_is_ready(node))
- {
- command = _starpu_mp_common_recv_command(node, &arg, &arg_size);
- switch(command)
- {
- case STARPU_MP_COMMAND_EXIT:
- exit_starpu = 1;
- break;
- case STARPU_MP_COMMAND_EXECUTE_DETACHED:
- case STARPU_MP_COMMAND_EXECUTE:
- node->execute(node, arg, arg_size);
- break;
- case STARPU_MP_COMMAND_SINK_NBCORES:
- _starpu_sink_common_get_nb_cores(node);
- break;
- case STARPU_MP_COMMAND_LOOKUP:
- _starpu_sink_common_lookup(node, (char *) arg);
- break;
- case STARPU_MP_COMMAND_ALLOCATE:
- node->allocate(node, arg, arg_size);
- break;
- case STARPU_MP_COMMAND_FREE:
- node->free(node, arg, arg_size);
- break;
- case STARPU_MP_COMMAND_RECV_FROM_HOST:
- _starpu_sink_common_copy_from_host_sync(node, arg, arg_size);
- break;
- case STARPU_MP_COMMAND_SEND_TO_HOST:
- _starpu_sink_common_copy_to_host_sync(node, arg, arg_size);
- break;
- case STARPU_MP_COMMAND_RECV_FROM_SINK:
- _starpu_sink_common_copy_from_sink_sync(node, arg, arg_size);
- break;
- case STARPU_MP_COMMAND_SEND_TO_SINK:
- _starpu_sink_common_copy_to_sink_sync(node, arg, arg_size);
- break;
- case STARPU_MP_COMMAND_RECV_FROM_HOST_ASYNC:
- _starpu_sink_common_copy_from_host_async(node, arg, arg_size);
- break;
- case STARPU_MP_COMMAND_SEND_TO_HOST_ASYNC:
- _starpu_sink_common_copy_to_host_async(node, arg, arg_size);
- break;
- case STARPU_MP_COMMAND_RECV_FROM_SINK_ASYNC:
- _starpu_sink_common_copy_from_sink_async(node, arg, arg_size);
- break;
- case STARPU_MP_COMMAND_SEND_TO_SINK_ASYNC:
- _starpu_sink_common_copy_to_sink_async(node, arg, arg_size);
- break;
- case STARPU_MP_COMMAND_SYNC_WORKERS:
- _starpu_sink_common_recv_workers(node, arg, arg_size);
- break;
- default:
- _STARPU_MSG("Oops, command %x unrecognized\n", command);
- }
- }
- STARPU_PTHREAD_MUTEX_LOCK(&node->message_queue_mutex);
- /* If the list is not empty */
- if(!mp_message_list_empty(&node->message_queue))
- {
- /* We pop a message and send it to the host */
- struct mp_message * message = mp_message_list_pop_back(&node->message_queue);
- STARPU_PTHREAD_MUTEX_UNLOCK(&node->message_queue_mutex);
- //_STARPU_DEBUG("telling host that we have finished the task %p sur %d.\n", task->kernel, task->coreid);
- _starpu_mp_common_send_command(node, message->type,
- message->buffer, message->size);
- free(message->buffer);
- mp_message_delete(message);
- }
- else
- {
- STARPU_PTHREAD_MUTEX_UNLOCK(&node->message_queue_mutex);
- }
- if(!_starpu_mp_event_list_empty(&node->event_list))
- {
- struct _starpu_mp_event * sink_event = _starpu_mp_event_list_pop_front(&node->event_list);
- if (node->dt_test(&sink_event->event))
- {
- /* send ACK to host */
- _starpu_mp_common_send_command(node, sink_event->answer_cmd , &sink_event->remote_event, sizeof(sink_event->remote_event));
- _starpu_mp_event_delete(sink_event);
- }
- else
- {
- /* try later */
- _starpu_mp_event_list_push_back(&node->event_list, sink_event);
- }
-
- }
- }
- STARPU_PTHREAD_KEY_DELETE(worker_key);
- /* Deinitialize the node and release it */
- _starpu_mp_common_node_destroy(node);
- #ifdef STARPU_USE_MPI_MASTER_SLAVE
- _starpu_mpi_common_mp_deinit();
- #endif
- exit(0);
- }
- /* Search for the mp_barrier correspondind to the specified combined worker
- * and create it if it doesn't exist
- */
- static struct mp_barrier * _starpu_sink_common_get_barrier(struct _starpu_mp_node * node, int cb_workerid, int cb_workersize)
- {
- struct mp_barrier * b = NULL;
- STARPU_PTHREAD_MUTEX_LOCK(&node->barrier_mutex);
- /* Search if the barrier already exist */
- for(b = mp_barrier_list_begin(&node->barrier_list);
- b != mp_barrier_list_end(&node->barrier_list) && b->id != cb_workerid;
- b = mp_barrier_list_next(b));
- /* If we found the barrier */
- if(b != NULL)
- {
- STARPU_PTHREAD_MUTEX_UNLOCK(&node->barrier_mutex);
- return b;
- }
- else
- {
- /* Else we create, initialize and add it to the list*/
- b = mp_barrier_new();
- b->id = cb_workerid;
- STARPU_PTHREAD_BARRIER_INIT(&b->before_work_barrier,NULL,cb_workersize);
- STARPU_PTHREAD_BARRIER_INIT(&b->after_work_barrier,NULL,cb_workersize);
- mp_barrier_list_push_back(&node->barrier_list,b);
- STARPU_PTHREAD_MUTEX_UNLOCK(&node->barrier_mutex);
- return b;
- }
- }
- /* Erase for the mp_barrier correspondind to the specified combined worker
- */
- static void _starpu_sink_common_erase_barrier(struct _starpu_mp_node * node, struct mp_barrier *barrier)
- {
- STARPU_PTHREAD_MUTEX_LOCK(&node->barrier_mutex);
- mp_barrier_list_erase(&node->barrier_list,barrier);
- STARPU_PTHREAD_MUTEX_UNLOCK(&node->barrier_mutex);
- }
- /* Append the message given in parameter to the message list
- */
- static void _starpu_sink_common_append_message(struct _starpu_mp_node *node, struct mp_message * message)
- {
- STARPU_PTHREAD_MUTEX_LOCK(&node->message_queue_mutex);
- mp_message_list_push_front(&node->message_queue,message);
- STARPU_PTHREAD_MUTEX_UNLOCK(&node->message_queue_mutex);
- }
- /* Append to the message list a "STARPU_PRE_EXECUTION" message
- */
- static void _starpu_sink_common_pre_execution_message(struct _starpu_mp_node *node, struct mp_task *task)
- {
- /* Init message to tell the sink that the execution has begun */
- struct mp_message * message = mp_message_new();
- message->type = STARPU_MP_COMMAND_PRE_EXECUTION;
- _STARPU_MALLOC(message->buffer, sizeof(int));
- *(int *) message->buffer = task->combined_workerid;
- message->size = sizeof(int);
- /* Append the message to the queue */
- _starpu_sink_common_append_message(node, message);
- }
- /* Append to the message list a "STARPU_EXECUTION_COMPLETED" message
- */
- static void _starpu_sink_common_execution_completed_message(struct _starpu_mp_node *node, struct mp_task *task)
- {
- /* Init message to tell the sink that the execution is completed */
- struct mp_message * message = mp_message_new();
- if (task->detached)
- message->type = STARPU_MP_COMMAND_EXECUTION_DETACHED_COMPLETED;
- else
- message->type = STARPU_MP_COMMAND_EXECUTION_COMPLETED;
- _STARPU_MALLOC(message->buffer, sizeof(int));
- *(int*) message->buffer = task->coreid;
- message->size = sizeof(int);
- /* Append the message to the queue */
- _starpu_sink_common_append_message(node, message);
- }
- /* Bind the thread which is running on the specified core to the combined worker */
- static void _starpu_sink_common_bind_to_combined_worker(struct _starpu_mp_node *node, int coreid, struct _starpu_combined_worker * combined_worker)
- {
- int i;
- int * bind_set;
- _STARPU_MALLOC(bind_set, sizeof(int)*combined_worker->worker_size);
- for(i=0;i<combined_worker->worker_size;i++)
- bind_set[i] = combined_worker->combined_workerid[i] - node->baseworkerid;
- node->bind_thread(node, coreid, bind_set, combined_worker->worker_size);
- }
- /* Get the current rank of the worker in the combined worker
- */
- static int _starpu_sink_common_get_current_rank(int workerid, struct _starpu_combined_worker * combined_worker)
- {
- int i;
- for(i=0; i<combined_worker->worker_size; i++)
- if(workerid == combined_worker->combined_workerid[i])
- return i;
- STARPU_ASSERT(0);
- return -1;
- }
- /* Execute the task
- */
- static void _starpu_sink_common_execute_kernel(struct _starpu_mp_node *node, int coreid, struct _starpu_worker * worker, int detached)
- {
- struct _starpu_combined_worker * combined_worker = NULL;
- struct mp_task* task;
- if (detached)
- task = node->run_table_detached[coreid];
- else
- task = node->run_table[coreid];
- /* If it's a parallel task */
- if(task->is_parallel_task)
- {
- combined_worker = _starpu_get_combined_worker_struct(task->combined_workerid);
- worker->current_rank = _starpu_sink_common_get_current_rank(worker->workerid, combined_worker);
- worker->combined_workerid = task->combined_workerid;
- worker->worker_size = combined_worker->worker_size;
- /* Synchronize with others threads of the combined worker*/
- STARPU_PTHREAD_BARRIER_WAIT(&task->mp_barrier->before_work_barrier);
- /* The first thread of the combined worker */
- if(worker->current_rank == 0)
- {
- /* tell the sink that the execution has begun */
- _starpu_sink_common_pre_execution_message(node,task);
- /* If the mode is FORKJOIN,
- * the first thread binds himself
- * on all core of the combined worker*/
- if(task->type == STARPU_FORKJOIN)
- {
- _starpu_sink_common_bind_to_combined_worker(node, coreid, combined_worker);
- }
- }
- }
- else
- {
- worker->current_rank = 0;
- worker->combined_workerid = 0;
- worker->worker_size = 1;
- }
- if(task->type != STARPU_FORKJOIN || worker->current_rank == 0)
- {
- if (_starpu_get_disable_kernels() <= 0)
- {
- /* execute the task */
- task->kernel(task->interfaces,task->cl_arg);
- }
- }
- /* If it's a parallel task */
- if(task->is_parallel_task)
- {
- /* Synchronize with others threads of the combined worker*/
- STARPU_PTHREAD_BARRIER_WAIT(&task->mp_barrier->after_work_barrier);
- /* The fisrt thread of the combined */
- if(worker->current_rank == 0)
- {
- /* Erase the barrier from the list */
- _starpu_sink_common_erase_barrier(node,task->mp_barrier);
- /* If the mode is FORKJOIN,
- * the first thread rebinds himself on his own core */
- if(task->type == STARPU_FORKJOIN)
- node->bind_thread(node, coreid, &coreid, 1);
- }
- }
- if (detached)
- node->run_table_detached[coreid] = NULL;
- else
- node->run_table[coreid] = NULL;
- /* tell the sink that the execution is completed */
- _starpu_sink_common_execution_completed_message(node,task);
- /*free the task*/
- unsigned i;
- for (i = 0; i < task->nb_interfaces; i++)
- free(task->interfaces[i]);
- free(task->interfaces);
- if (task->cl_arg != NULL)
- free(task->cl_arg);
- free(task);
- }
- /* The main function executed by the thread
- * thread_arg is a structure containing the information needed by the thread
- */
- void* _starpu_sink_thread(void * thread_arg)
- {
- /* Retrieve the information from the structure */
- struct _starpu_mp_node *node = ((struct arg_sink_thread *)thread_arg)->node;
- int coreid =((struct arg_sink_thread *)thread_arg)->coreid;
- /* free the structure */
- free(thread_arg);
- STARPU_PTHREAD_BARRIER_WAIT(&node->init_completed_barrier);
- struct _starpu_worker *worker = &_starpu_get_machine_config()->workers[node->baseworkerid + coreid];
- node->bind_thread(node, coreid, &coreid, 1);
- _starpu_set_local_worker_key(worker);
- while(node->is_running)
- {
- /*Wait there is a task available */
- sem_wait(&node->sem_run_table[coreid]);
- if (node->run_table_detached[coreid] != NULL)
- _starpu_sink_common_execute_kernel(node, coreid, worker, 1);
- if (node->run_table[coreid] != NULL)
- _starpu_sink_common_execute_kernel(node, coreid, worker, 0);
- }
- starpu_pthread_exit(NULL);
- }
- /* Add the task to the specific thread and wake him up
- */
- static void _starpu_sink_common_execute_thread(struct _starpu_mp_node *node, struct mp_task *task)
- {
- int detached = task->detached;
- /* Add the task to the specific thread */
- if (detached)
- node->run_table_detached[task->coreid] = task;
- else
- node->run_table[task->coreid] = task;
- /* Unlock the mutex to wake up the thread which will execute the task */
- sem_post(&node->sem_run_table[task->coreid]);
- }
- /* Receive paquet from _starpu_src_common_execute_kernel in the form below :
- * [Function pointer on sink, number of interfaces, interfaces
- * (union _starpu_interface), cl_arg]
- * Then call the function given, passing as argument an array containing the
- * addresses of the received interfaces
- */
- void _starpu_sink_common_execute(struct _starpu_mp_node *node,
- void *arg, int arg_size)
- {
- unsigned i;
- uintptr_t arg_ptr = (uintptr_t) arg;
- struct mp_task *task;
- _STARPU_MALLOC(task, sizeof(struct mp_task));
- task->kernel = *(void(**)(void **, void *)) arg_ptr;
- arg_ptr += sizeof(task->kernel);
- task->type = *(enum starpu_codelet_type *) arg_ptr;
- arg_ptr += sizeof(task->type);
- task->is_parallel_task = *(int *) arg_ptr;
- arg_ptr += sizeof(task->is_parallel_task);
- if(task->is_parallel_task)
- {
- task->combined_workerid= *(int *) arg_ptr;
- arg_ptr += sizeof(task->combined_workerid);
- task->mp_barrier = _starpu_sink_common_get_barrier(node,task->combined_workerid,_starpu_get_combined_worker_struct(task->combined_workerid)->worker_size);
- }
- task->coreid = *(unsigned *) arg_ptr;
- arg_ptr += sizeof(task->coreid);
- task->nb_interfaces = *(unsigned *) arg_ptr;
- arg_ptr += sizeof(task->nb_interfaces);
- task->detached = *(int *) arg_ptr;
- arg_ptr += sizeof(task->detached);
- _STARPU_MALLOC(task->interfaces, task->nb_interfaces * sizeof(*task->interfaces));
- /* The function needs an array pointing to each interface it needs
- * during execution. As in sink-side there is no mean to know which
- * kind of interface to expect, the array is composed of unions of
- * interfaces, thus we expect the same size anyway */
- for (i = 0; i < task->nb_interfaces; i++)
- {
- union _starpu_interface * interface;
- _STARPU_MALLOC(interface, sizeof(union _starpu_interface));
- memcpy(interface, (void*) arg_ptr, sizeof(union _starpu_interface));
- task->interfaces[i] = interface;
- arg_ptr += sizeof(union _starpu_interface);
- }
- /* Was cl_arg sent ? */
- if (arg_size > arg_ptr - (uintptr_t) arg)
- {
- /* Copy cl_arg to prevent overwriting by an other task */
- unsigned cl_arg_size = arg_size - (arg_ptr - (uintptr_t) arg);
- _STARPU_MALLOC(task->cl_arg, cl_arg_size);
- memcpy(task->cl_arg, (void *) arg_ptr, cl_arg_size);
- }
- else
- task->cl_arg = NULL;
- //_STARPU_DEBUG("telling host that we have submitted the task %p.\n", task->kernel);
- if (task->detached)
- _starpu_mp_common_send_command(node, STARPU_MP_COMMAND_EXECUTION_DETACHED_SUBMITTED,
- NULL, 0);
- else
- _starpu_mp_common_send_command(node, STARPU_MP_COMMAND_EXECUTION_SUBMITTED,
- NULL, 0);
- //_STARPU_DEBUG("executing the task %p\n", task->kernel);
- _starpu_sink_common_execute_thread(node, task);
- }
|