| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263 | /* * This file is part of the StarPU Handbook. * Copyright (C) 2009--2011  Universit@'e de Bordeaux * Copyright (C) 2010, 2011, 2012, 2013, 2014, 2016, 2017  CNRS * Copyright (C) 2011, 2012 INRIA * See the file version.doxy for copying conditions. *//*! \defgroup API_OpenCL_Extensions OpenCL Extensions\def STARPU_USE_OPENCL\ingroup API_OpenCL_ExtensionsDefined when StarPU has been installed withOpenCL support. It should be used in your code to detect theavailability of OpenCL as shown in \ref FullSourceCodeVectorScal.\def STARPU_MAXOPENCLDEVS\ingroup API_OpenCL_ExtensionsDefine the maximum number of OpenCL devices that aresupported by StarPU.\def STARPU_OPENCL_DATADIR\ingroup API_OpenCL_ExtensionsDefine the directory in which the OpenCL codelets of theapplications provided with StarPU have been installed.\struct starpu_opencl_program\ingroup API_OpenCL_ExtensionsStore the OpenCL programs as compiled for the different OpenCLdevices.\var cl_program starpu_opencl_program::programs[STARPU_MAXOPENCLDEVS]    Store each program for each OpenCL device.@name Writing OpenCL kernels\ingroup API_OpenCL_Extensions\fn void starpu_opencl_get_context(int devid, cl_context *context)\ingroup API_OpenCL_ExtensionsReturn the OpenCL context of the device designated by \p devidin \p context.\fn void starpu_opencl_get_device(int devid, cl_device_id *device)\ingroup API_OpenCL_ExtensionsReturn the cl_device_id corresponding to \p devid in \p device.\fn void starpu_opencl_get_queue(int devid, cl_command_queue *queue)\ingroup API_OpenCL_ExtensionsReturn the command queue of the device designated by \p devidinto \p queue.\fn void starpu_opencl_get_current_context(cl_context *context)\ingroup API_OpenCL_ExtensionsReturn the context of the current worker.\fn void starpu_opencl_get_current_queue(cl_command_queue *queue)\ingroup API_OpenCL_ExtensionsReturn the computation kernel command queue of the currentworker.\fn int starpu_opencl_set_kernel_args(cl_int *err, cl_kernel *kernel, ...)\ingroup API_OpenCL_ExtensionsSet the arguments of a given kernel. The list of argumentsmust be given as <c>(size_t size_of_the_argument, cl_mem *pointer_to_the_argument)</c>. The last argument must be 0. Return thenumber of arguments that were successfully set. In case of failure,return the id of the argument that could not be set and \p err is set tothe error returned by OpenCL. Otherwise, return the number ofarguments that were set.Here an example:\code{.c}int n;cl_int err;cl_kernel kernel;n = starpu_opencl_set_kernel_args(&err, 2, &kernel,                                  sizeof(foo), &foo,                                  sizeof(bar), &bar,                                  0);if (n != 2)   fprintf(stderr, "Error : %d\n", err);\endcode@name Compiling OpenCL kernels\ingroup API_OpenCL_ExtensionsSource codes for OpenCL kernels can be stored in a file or in astring. StarPU provides functions to build the program executable foreach available OpenCL device as a cl_program object. This programexecutable can then be loaded within a specific queue as explained inthe next section. These are only helpers, Applications can also fill astarpu_opencl_program array by hand for more advanced use (e.g.different programs on the different OpenCL devices, for relocationpurpose for instance).\fn int starpu_opencl_load_opencl_from_file(const char *source_file_name, struct starpu_opencl_program *opencl_programs, const char *build_options)\ingroup API_OpenCL_ExtensionsCompile an OpenCL source code stored in a file.\fn int starpu_opencl_load_opencl_from_string(const char *opencl_program_source, struct starpu_opencl_program *opencl_programs, const char *build_options)\ingroup API_OpenCL_ExtensionsCompile an OpenCL source code stored in a string.\fn int starpu_opencl_unload_opencl(struct starpu_opencl_program *opencl_programs)\ingroup API_OpenCL_ExtensionsUnload an OpenCL compiled code.\fn void starpu_opencl_load_program_source(const char *source_file_name, char *located_file_name, char *located_dir_name, char *opencl_program_source)\ingroup API_OpenCL_ExtensionsStore the contents of the file \p source_file_name in the buffer\p opencl_program_source. The file \p source_file_name can be located in thecurrent directory, or in the directory specified by the environmentvariable \ref STARPU_OPENCL_PROGRAM_DIR, orin the directory <c>share/starpu/opencl</c> of the installationdirectory of StarPU, or in the source directory of StarPU. When thefile is found, \p located_file_name is the full name of the file as ithas been located on the system, \p located_dir_name the directorywhere it has been located. Otherwise, they are both set to the emptystring.\fn void starpu_opencl_load_program_source_malloc(const char *source_file_name, char **located_file_name, char **located_dir_name, char **opencl_program_source)\ingroup API_OpenCL_ExtensionsSimilar to function starpu_opencl_load_program_source() but allocate the buffers \p located_file_name, \p located_dir_name and \p opencl_program_source.\fn int starpu_opencl_compile_opencl_from_file(const char *source_file_name, const char *build_options)\ingroup API_OpenCL_ExtensionsCompile the OpenCL kernel stored in the file \p source_file_namewith the given options \p build_options and store the result in thedirectory <c>$STARPU_HOME/.starpu/opencl</c> with the same filename as\p source_file_name. The compilation is done for every OpenCL device,and the filename is suffixed with the vendor id and the device id ofthe OpenCL device.\fn int starpu_opencl_compile_opencl_from_string(const char *opencl_program_source, const char *file_name, const char *build_options)\ingroup API_OpenCL_ExtensionsCompile the OpenCL kernel in the string \p opencl_program_sourcewith the given options \p build_options and store the result in thedirectory <c>$STARPU_HOME/.starpu/opencl</c> with the filename \pfile_name. The compilation is done for every OpenCL device, and thefilename is suffixed with the vendor id and the device id of theOpenCL device.\fn int starpu_opencl_load_binary_opencl(const char *kernel_id, struct starpu_opencl_program *opencl_programs)\ingroup API_OpenCL_ExtensionsCompile the binary OpenCL kernel identified with \p kernel_id.For every OpenCL device, the binary OpenCL kernel will be loaded fromthe file<c>$STARPU_HOME/.starpu/opencl/\<kernel_id\>.\<device_type\>.vendor_id_\<vendor_id\>_device_id_\<device_id\></c>.@name Loading OpenCL kernels\ingroup API_OpenCL_Extensions\fn int starpu_opencl_load_kernel(cl_kernel *kernel, cl_command_queue *queue, struct starpu_opencl_program *opencl_programs, const char *kernel_name, int devid)\ingroup API_OpenCL_ExtensionsCreate a kernel \p kernel for device \p devid, on its computationcommand queue returned in \p queue, using program \p opencl_programsand name \p kernel_name.\fn int starpu_opencl_release_kernel(cl_kernel kernel)\ingroup API_OpenCL_ExtensionsRelease the given \p kernel, to be called after kernel execution.@name OpenCL statistics\fn int starpu_opencl_collect_stats(cl_event event)\ingroup API_OpenCL_ExtensionsCollect statistics on a kernel execution.After termination of the kernels, the OpenCL codelet should call thisfunction with the event returned by \c clEnqueueNDRangeKernel(), tolet StarPU collect statistics about the kernel execution (used cycles,consumed energy).@name OpenCL utilities\ingroup API_OpenCL_Extensions\fn const char *starpu_opencl_error_string(cl_int status)\ingroup API_OpenCL_ExtensionsReturn the error message in English corresponding to \p status, an OpenCLerror code.\fn void starpu_opencl_display_error(const char *func, const char *file, int line, const char *msg, cl_int status)\ingroup API_OpenCL_ExtensionsGiven a valid error status, print the corresponding error message on\c stdout, along with the function name \p func, the filename\p file, the line number \p line and the message \p msg.\def STARPU_OPENCL_DISPLAY_ERROR(status)\ingroup API_OpenCL_ExtensionsCall the function starpu_opencl_display_error() with the error\p status, the current function name, current file and line number,and a empty message.\fn void starpu_opencl_report_error(const char *func, const char *file, int line, const char *msg, cl_int status)\ingroup API_OpenCL_ExtensionsCall the function starpu_opencl_display_error() and abort.\def STARPU_OPENCL_REPORT_ERROR(status)\ingroup API_OpenCL_ExtensionsCall the function starpu_opencl_report_error() with the error \pstatus, the current function name, current file and line number,and a empty message.\def STARPU_OPENCL_REPORT_ERROR_WITH_MSG(msg, status)\ingroup API_OpenCL_ExtensionsCall the function starpu_opencl_report_error() with \p msgand \p status, the current function name, current file and line number.\fn cl_int starpu_opencl_allocate_memory(int devid, cl_mem *addr, size_t size, cl_mem_flags flags)\ingroup API_OpenCL_ExtensionsAllocate \p size bytes of memory, stored in \p addr. \p flags must be a validcombination of \c cl_mem_flags values.\fn cl_int starpu_opencl_copy_ram_to_opencl(void *ptr, unsigned src_node, cl_mem buffer, unsigned dst_node, size_t size, size_t offset, cl_event *event, int *ret)\ingroup API_OpenCL_ExtensionsCopy \p size bytes from the given \p ptr on RAM \p src_node to thegiven \p buffer on OpenCL \p dst_node. \p offset is the offset, inbytes, in \p buffer. if \p event is <c>NULL</c>, the copy issynchronous, i.e the queue is synchronised before returning. If not<c>NULL</c>, \p event can be used after the call to wait for thisparticular copy to complete. This function returns <c>CL_SUCCESS</c>if the copy was successful, or a valid OpenCL error code otherwise.The integer pointed to by \p ret is set to <c>-EAGAIN</c> if theasynchronous launch was successful, or to 0 if \p event was<c>NULL</c>.\fn cl_int starpu_opencl_copy_opencl_to_ram(cl_mem buffer, unsigned src_node, void *ptr, unsigned dst_node, size_t size, size_t offset, cl_event *event, int *ret)\ingroup API_OpenCL_ExtensionsCopy \p size bytes asynchronously from the given \p buffer on OpenCL\p src_node to the given \p ptr on RAM \p dst_node. \p offset is theoffset, in bytes, in \p buffer. if \p event is <c>NULL</c>, the copyis synchronous, i.e the queue is synchronised before returning. If not<c>NULL</c>, \p event can be used after the call to wait for thisparticular copy to complete. This function returns <c>CL_SUCCESS</c>if the copy was successful, or a valid OpenCL error code otherwise.The integer pointed to by \p ret is set to <c>-EAGAIN</c> if theasynchronous launch was successful, or to 0 if \p event was<c>NULL</c>.\fn cl_int starpu_opencl_copy_opencl_to_opencl(cl_mem src, unsigned src_node, size_t src_offset, cl_mem dst, unsigned dst_node, size_t dst_offset, size_t size, cl_event *event, int *ret)\ingroup API_OpenCL_ExtensionsCopy \p size bytes asynchronously from byte offset \p src_offset of \psrc on OpenCL \p src_node to byte offset \p dst_offset of \p dst onOpenCL \p dst_node. if \p event is <c>NULL</c>, the copy issynchronous, i.e. the queue is synchronised before returning. If not<c>NULL</c>, \p event can be used after the call to wait for thisparticular copy to complete. This function returns <c>CL_SUCCESS</c>if the copy was successful, or a valid OpenCL error code otherwise.The integer pointed to by \p ret is set to <c>-EAGAIN</c> if theasynchronous launch was successful, or to 0 if \p event was<c>NULL</c>.\fn cl_int starpu_opencl_copy_async_sync(uintptr_t src, size_t src_offset, unsigned src_node, uintptr_t dst, size_t dst_offset, unsigned dst_node, size_t size, cl_event *event)\ingroup API_OpenCL_ExtensionsCopy \p size bytes from byte offset \p src_offset of \p src on \psrc_node to byte offset \p dst_offset of \p dst on \p dst_node. if \pevent is <c>NULL</c>, the copy is synchronous, i.e. the queue issynchronised before returning. If not <c>NULL</c>, \p event can beused after the call to wait for this particular copy to complete. Thefunction returns <c>-EAGAIN</c> if the asynchronous launch wassuccessfull. It returns 0 if the synchronous copy was successful, orfails otherwise.*/
 |