12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394 |
- /* StarPU --- Runtime system for heterogeneous multicore architectures.
- *
- * Copyright (C) 2010-2012,2014 Université de Bordeaux
- * Copyright (C) 2011 Inria
- * Copyright (C) 2010-2013,2015,2017,2019 CNRS
- *
- * StarPU is free software; you can redistribute it and/or modify
- * it under the terms of the GNU Lesser General Public License as published by
- * the Free Software Foundation; either version 2.1 of the License, or (at
- * your option) any later version.
- *
- * StarPU is distributed in the hope that it will be useful, but
- * WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
- *
- * See the GNU Lesser General Public License in COPYING.LGPL for more details.
- */
- #ifndef __STARPU_CUDA_H__
- #define __STARPU_CUDA_H__
- /** @defgroup API_CUDA_Extensions CUDA Extensions
- @{
- */
- #include <starpu_config.h>
- #if defined STARPU_USE_CUDA && !defined STARPU_DONT_INCLUDE_CUDA_HEADERS
- #include <cuda.h>
- #include <cuda_runtime.h>
- #include <cuda_runtime_api.h>
- #ifdef __cplusplus
- extern "C"
- {
- #endif
- /**
- Report a CUBLAS error.
- \p func, \p file and \p line identify the source position the error is
- attributed to (STARPU_CUBLAS_REPORT_ERROR() fills them in from its call
- site), and \p status is the error status to report.
- */
- void starpu_cublas_report_error(const char *func, const char *file, int line, int status);
- /**
- Call starpu_cublas_report_error() with \p status, passing the current
- function, file and line position of the macro invocation.
- */
- #define STARPU_CUBLAS_REPORT_ERROR(status) starpu_cublas_report_error(__starpu_func__, __FILE__, __LINE__, status)
- /**
- Report a CUDA error.
- \p func, \p file and \p line identify the source position the error is
- attributed to (STARPU_CUDA_REPORT_ERROR() fills them in from its call
- site), and \p status is the CUDA runtime error code to report.
- */
- void starpu_cuda_report_error(const char *func, const char *file, int line, cudaError_t status);
- /**
- Call starpu_cuda_report_error() with \p status, passing the current
- function, file and line position of the macro invocation.
- */
- #define STARPU_CUDA_REPORT_ERROR(status) starpu_cuda_report_error(__starpu_func__, __FILE__, __LINE__, status)
- /**
- Return the current worker's CUDA stream. StarPU provides a stream for
- every CUDA device it controls. This function is only provided for
- convenience, so that programmers can easily use asynchronous operations
- within codelets without having to create a stream by hand. The
- application is not forced to use the stream returned by
- starpu_cuda_get_local_stream() and may also create its own streams.
- Synchronizing with <c>cudaThreadSynchronize()</c> is allowed, but will
- reduce the likelihood of having all transfers overlapped. Note that the
- CUDA runtime documents <c>cudaThreadSynchronize()</c> as deprecated in
- favor of <c>cudaDeviceSynchronize()</c>.
- */
- cudaStream_t starpu_cuda_get_local_stream(void);
- /**
- Return a pointer to the device properties for worker \p workerid.
- \p workerid is assumed to designate a CUDA worker.
- */
- const struct cudaDeviceProp *starpu_cuda_get_device_properties(unsigned workerid);
- /**
- Copy \p ssize bytes from the pointer \p src_ptr on \p src_node
- to the pointer \p dst_ptr on \p dst_node. The function first tries to
- copy the data asynchronously (unless \p stream is <c>NULL</c>). If the
- asynchronous copy fails or if \p stream is <c>NULL</c>, it copies the
- data synchronously. The function returns <c>-EAGAIN</c> if the
- asynchronous launch was successful. It returns 0 if the synchronous
- copy was successful, or fails otherwise.
- NOTE(review): \p kind is presumably the CUDA transfer direction handed
- to the underlying copy call -- confirm against the implementation.
- */
- int starpu_cuda_copy_async_sync(void *src_ptr, unsigned src_node, void *dst_ptr, unsigned dst_node, size_t ssize, cudaStream_t stream, enum cudaMemcpyKind kind);
- /**
- Call <c>cudaSetDevice(\p devid)</c> or <c>cudaGLSetGLDevice(\p devid)</c>,
- according to whether \p devid is listed in the field
- starpu_conf::cuda_opengl_interoperability.
- */
- void starpu_cuda_set_device(unsigned devid);
- #ifdef __cplusplus
- }
- #endif
- #endif /* STARPU_USE_CUDA && !STARPU_DONT_INCLUDE_CUDA_HEADERS */
- /** @} */
- #endif /* __STARPU_CUDA_H__ */
|