瀏覽代碼

Port r11537 from 1.1: cudaFree takes much more than 125µs on average; 750µs is the average measured on the cholesky example. This value still needs to be tuned.

Samuel Thibault 11 年之前
父節點
當前提交
14016e793f
共有 1 個文件被更改,包括 2 次插入和 2 次刪除
  1. 2 2
      src/datawizard/malloc.c

+ 2 - 2
src/datawizard/malloc.c

@@ -501,7 +501,7 @@ _starpu_free_on_node(unsigned dst_node, uintptr_t addr, size_t size)
 #ifdef STARPU_SIMGRID
 			STARPU_PTHREAD_MUTEX_LOCK(&cuda_alloc_mutex);
 			/* Sleep for the free */
-			MSG_process_sleep(0.000125);
+			MSG_process_sleep(0.000750);
 			STARPU_PTHREAD_MUTEX_UNLOCK(&cuda_alloc_mutex);
 #else
 			cudaError_t err;
@@ -518,7 +518,7 @@ _starpu_free_on_node(unsigned dst_node, uintptr_t addr, size_t size)
 #ifdef STARPU_SIMGRID
 			STARPU_PTHREAD_MUTEX_LOCK(&opencl_alloc_mutex);
 			/* Sleep for the free */
-			MSG_process_sleep(0.000125);
+			MSG_process_sleep(0.000750);
 			STARPU_PTHREAD_MUTEX_UNLOCK(&opencl_alloc_mutex);
 #else
 			cl_int err;