Pārlūkot izejas kodu

Port r11537 from 1.1: cudaFree takes much longer than 125µs on average; 750µs is the average measured on the cholesky example. This value still needs to be tuned.

Samuel Thibault 12 gadi atpakaļ
vecāks
revīzija
14016e793f
1 mainīts fails ar 2 papildinājumiem un 2 dzēšanām
  1. 2 2
      src/datawizard/malloc.c

+ 2 - 2
src/datawizard/malloc.c

@@ -501,7 +501,7 @@ _starpu_free_on_node(unsigned dst_node, uintptr_t addr, size_t size)
 #ifdef STARPU_SIMGRID
 			STARPU_PTHREAD_MUTEX_LOCK(&cuda_alloc_mutex);
 			/* Sleep for the free */
-			MSG_process_sleep(0.000125);
+			MSG_process_sleep(0.000750);
 			STARPU_PTHREAD_MUTEX_UNLOCK(&cuda_alloc_mutex);
 #else
 			cudaError_t err;
@@ -518,7 +518,7 @@ _starpu_free_on_node(unsigned dst_node, uintptr_t addr, size_t size)
 #ifdef STARPU_SIMGRID
 			STARPU_PTHREAD_MUTEX_LOCK(&opencl_alloc_mutex);
 			/* Sleep for the free */
-			MSG_process_sleep(0.000125);
+			MSG_process_sleep(0.000750);
 			STARPU_PTHREAD_MUTEX_UNLOCK(&opencl_alloc_mutex);
 #else
 			cl_int err;