лет назад: 13 · a0074841dc
--- a/sched_ctx_hypervisor/src/hypervisor_policies/ispeed_lp_policy.c
+++ b/sched_ctx_hypervisor/src/hypervisor_policies/ispeed_lp_policy.c
@@ -49,6 +49,16 @@ static unsigned _compute_flops_distribution_over_ctxs(int ns, int nw, double w_i
 
																 			{
															
 
																 				enum starpu_archtype arch = starpu_worker_get_type(worker);
															
 
																 				velocity[s][w] = sched_ctx_hypervisor_get_velocity(sc_w, arch);
															
 
																+				if(arch == STARPU_CUDA_WORKER)
															
 
																+				{
															
 
																+					unsigned worker_in_ctx = starpu_sched_ctx_contains_worker(worker, sc_w->sched_ctx);
															
 
																+					if(!worker_in_ctx)
															
 
																+					{
															
 
																+						double transfer_velocity = starpu_get_bandwidth_RAM_CUDA(worker) / 1000;
															
 
																+						velocity[s][w] = (velocity[s][w] * transfer_velocity) / (velocity[s][w] + transfer_velocity);
															
 
																+					}
															
 
																+				}
															
 
																+
															
 
																 			}
															
 
																 //			printf("v[w%d][s%d] = %lf\n",w, s, velocity[s][w]);
															
--- a/sched_ctx_hypervisor/src/hypervisor_policies/policy_tools.c
+++ b/sched_ctx_hypervisor/src/hypervisor_policies/policy_tools.c
@@ -454,12 +454,18 @@ double _get_velocity_per_worker(struct sched_ctx_hypervisor_wrapper *sc_w, unsig
 
																         if( elapsed_flops != 0.0)
															
 
																         {
															
 
																                 double curr_time = starpu_timing_now();
															
 
																+		size_t elapsed_data_used = sc_w->elapsed_data[worker];
															
 
																                 double elapsed_time = (curr_time - sc_w->start_time) / 1000000.0; /* in seconds */
															
 
																  		enum starpu_archtype arch = starpu_worker_get_type(worker);
															
 
																 		if(arch == STARPU_CUDA_WORKER)
															
 
																 		{
															
 
																-			double transfer_velocity = starpu_get_bandwidth_RAM_CUDA(worker);
															
 
																-			elapsed_time +=  (elapsed_data_used / transfer_velocity) / 1000000 ;
															
 
																+/* 			unsigned worker_in_ctx = starpu_sched_ctx_contains_worker(worker, sc_w->sched_ctx); */
															
 
																+/* 			if(!worker_in_ctx) */
															
 
																+/* 			{ */
															
 
																+
															
 
																+/* 				double transfer_velocity = starpu_get_bandwidth_RAM_CUDA(worker); */
															
 
																+/* 				elapsed_time +=  (elapsed_data_used / transfer_velocity) / 1000000 ; */
															
 
																+/* 			} */
															
 
																 			double latency = starpu_get_latency_RAM_CUDA(worker);
															
 
																 //			printf("%d/%d: latency %lf elapsed_time before %lf ntasks %d\n", worker, sc_w->sched_ctx, latency, elapsed_time, elapsed_tasks);
															
 
																 			elapsed_time += (elapsed_tasks * latency)/1000000;