/* StarPU --- Runtime system for heterogeneous multicore architectures.
 *
 * Copyright (C) 2011,2013-2014                           Inria
 * Copyright (C) 2015                                     Mathieu Lirzin
 * Copyright (C) 2013,2017                                CNRS
 *
 * StarPU is free software; you can redistribute it and/or modify
 * it under the terms of the GNU Lesser General Public License as published by
 * the Free Software Foundation; either version 2.1 of the License, or (at
 * your option) any later version.
 *
 * StarPU is distributed in the hope that it will be useful, but
 * WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
 *
 * See the GNU Lesser General Public License in COPYING.LGPL for more details.
 */
 
- #ifndef SC_HYPERVISOR_MONITORING_H
 
- #define SC_HYPERVISOR_MONITORING_H
 
- #include <sc_hypervisor.h>
 
- #ifdef __cplusplus
 
- extern "C"
 
- {
 
- #endif
 
/* Structure indicating when the move of workers has actually been done
   (i.e. the moved workers can be seen in the new context). */
struct sc_hypervisor_resize_ack
{
	/* receiver context */
	int receiver_sched_ctx;

	/* list of workers required to be moved */
	int *moved_workers;

	/* number of workers required to be moved */
	int nmoved_workers;

	/* list of workers that actually got into the receiver context */
	int *acked_workers;
};
 
- /* wrapper attached to a sched_ctx storing monitoring information */
 
- struct sc_hypervisor_wrapper
 
- {
 
- 	/* the sched_ctx it monitors */
 
- 	unsigned sched_ctx;
 
- 	/* user configuration meant to limit resizing */
 
- 	struct sc_hypervisor_policy_config *config;
 
- 	/* the start time of the resizing sample of the workers of this context*/
 
- 	double start_time_w[STARPU_NMAXWORKERS];
 
- 	/* idle time of workers in this context */
 
- 	double current_idle_time[STARPU_NMAXWORKERS];
 
- 	/* idle time from the last resize */
 
- 	double idle_time[STARPU_NMAXWORKERS];
 
- 	/* time when the idle started */
 
- 	double idle_start_time[STARPU_NMAXWORKERS];
 
- 	
 
- 	/* time during which the worker executed tasks */
 
- 	double exec_time[STARPU_NMAXWORKERS];
 
- 	/* time when the worker started executing a task */
 
- 	double exec_start_time[STARPU_NMAXWORKERS];
 
- 	/* list of workers that will leave this contexts (lazy resizing process) */
 
- 	int worker_to_be_removed[STARPU_NMAXWORKERS];
 
- 	/* number of tasks pushed on each worker in this ctx */
 
- 	int pushed_tasks[STARPU_NMAXWORKERS];
 
- 	/* number of tasks poped from each worker in this ctx */
 
- 	int poped_tasks[STARPU_NMAXWORKERS];
 
- 	/* number of flops the context has to execute */
 
- 	double total_flops;
 
- 	/* number of flops executed since the beginning until now */
 
- 	double total_elapsed_flops[STARPU_NMAXWORKERS];
 
- 	/* number of flops executed since last resizing */
 
- 	double elapsed_flops[STARPU_NMAXWORKERS];
 
- 	/* data quantity executed on each worker in this ctx */
 
- 	size_t elapsed_data[STARPU_NMAXWORKERS];
 
- 	/* nr of tasks executed on each worker in this ctx */
 
- 	int elapsed_tasks[STARPU_NMAXWORKERS];
 
- 	/* the average speed of the type of workers when they belonged to this context */
 
- 	/* 0 - cuda 1 - cpu */
 
- 	double ref_speed[2];
 
- 	/* number of flops submitted to this ctx */
 
- 	double submitted_flops;
 
- 	/* number of flops that still have to be executed in this ctx */
 
- 	double remaining_flops;
 
- 	
 
- 	/* the start time of the resizing sample of this context*/
 
- 	double start_time;
 
- 	/* the first time a task was pushed to this context*/
 
- 	double real_start_time;
 
- 	
 
- 	/* the start time for sample in which the hyp is not allowed to react
 
- 	   bc too expensive */
 
- 	double hyp_react_start_time;
 
- 	/* the workers don't leave the current ctx until the receiver ctx 
 
- 	   doesn't ack the receive of these workers */
 
- 	struct sc_hypervisor_resize_ack resize_ack;
 
- 	/* mutex to protect the ack of workers */
 
- 	starpu_pthread_mutex_t mutex;
 
- 	/* boolean indicating if the resizing strategy can see the
 
- 	   flops of all the execution or not */
 
- 	unsigned total_flops_available;
 
- 	/* boolean indicating that a context is being sized */
 
- 	unsigned to_be_sized;
 
- 	/* boolean indicating if we add the idle of this worker to 
 
- 	   the idle of the context */
 
- 	unsigned compute_idle[STARPU_NMAXWORKERS];
 
- 	/* boolean indicating if we add the entiere idle of this 
 
- 	   worker to the idle of the context or just half*/
 
- 	unsigned compute_partial_idle[STARPU_NMAXWORKERS];
 
- 	/* consider the max in the lp */
 
- 	unsigned consider_max;
 
- };
 
/* Return the wrapper of the context sched_ctx, i.e. the structure that
   saves its monitoring information. */
struct sc_hypervisor_wrapper *sc_hypervisor_get_wrapper(unsigned sched_ctx);
 
/* Get the list of registered contexts.
   Declared with (void) so that this is a real prototype: in C, an empty
   parameter list leaves the arguments unchecked. */
unsigned *sc_hypervisor_get_sched_ctxs(void);
 
/* Get the number of registered contexts.
   Declared with (void) so that this is a real prototype: in C, an empty
   parameter list leaves the arguments unchecked. */
int sc_hypervisor_get_nsched_ctxs(void);
 
/* Get the number of workers of a certain architecture (arch) in the
   context sched_ctx. */
int sc_hypervisor_get_nworkers_ctx(unsigned sched_ctx, enum starpu_worker_archtype arch);
 
/* Get the number of flops executed by a context since the last resizing
   (reset to 0 when a resizing is done). sc_w is the wrapper of the context. */
double sc_hypervisor_get_elapsed_flops_per_sched_ctx(struct sc_hypervisor_wrapper *sc_w);
 
/* Get the number of flops executed by a context since the beginning.
   sc_w is the wrapper of the context. */
double sc_hypervisor_get_total_elapsed_flops_per_sched_ctx(struct sc_hypervisor_wrapper *sc_w);
 
/* Compute an average value of the cpu/cuda speed for the workers of type
   arch in the context wrapped by sc_w.
   NOTE(review): the "sc_hypervisor" prefix is doubled in this name, unlike
   every other function declared in this header; it looks like a typo for
   sc_hypervisor_get_speed_per_worker_type. The name is left unchanged here
   so existing references keep working -- confirm against the definition
   before renaming. */
double sc_hypervisorsc_hypervisor_get_speed_per_worker_type(struct sc_hypervisor_wrapper *sc_w, enum starpu_worker_archtype arch);
 
/* Compute the actual speed of all workers of a specific type (arch) in the
   context wrapped by sc_w. */
double sc_hypervisor_get_speed(struct sc_hypervisor_wrapper *sc_w, enum starpu_worker_archtype arch);
 
- #ifdef __cplusplus
 
- }
 
- #endif
 
- #endif
 
 
  |