瀏覽代碼

Use a memcpy operation that relies on a stream

Cédric Augonnet 14 年之前
父節點
當前提交
339892a2a6
共有 1 個文件被更改,包括 2 次插入2 次删除
  1. 2 2
      examples/cg/cg_kernels.c

+ 2 - 2
examples/cg/cg_kernels.c

@@ -582,8 +582,8 @@ static void copy_handle_cuda(void *descr[], void *cl_arg)
 	unsigned nx = STARPU_VECTOR_GET_NX(descr[0]);
 	size_t elemsize = STARPU_VECTOR_GET_ELEMSIZE(descr[0]);
 
-	cudaMemcpy(dst, src, nx*elemsize, cudaMemcpyDeviceToDevice);
-	cudaThreadSynchronize();
+	cudaMemcpyAsync(dst, src, nx*elemsize, cudaMemcpyDeviceToDevice, starpu_cuda_get_local_stream());
+	cudaStreamSynchronize(starpu_cuda_get_local_stream());
 }
 #endif