12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
7177817791780178117821783178417851786178717881789179017911792179317941795179617971798179918001801180218031804180518061807180818091810181118121813181418151816181718181819182018211822182318241825182618271828182918301831183218331834183518361837183818391840184118421843184418451846184718481849185018511852185318541855185618571858185918601861186218631864186518661867186818691870187118721873187418751876187718781879188018811882188318841885188618871888188918901891189218931894189518961897189818991900190119021903190419051906190719081909191019111912191319141915191619171918191919201921192219231924192519261927192819291930193119321933193419351936193719381939194019411942194319441945194619471948194919501951195219531954195519561957195819591960196119621963196419651966196719681969197019711972197319741975197619771978197919801981198219831984198519861987198819891990199119921993199419951996199719981999200020012002200320042005200620072008200920102011201220132014201520162017201820192020202120222023202420252026202720282029203020312032203320342035203620372038203920402041204220432044204520462047204820492050205120522053205420552056205720582059206020612062206320642065206620672068206920702071207220732074207520762077207820792080208120822083208420852086208720882089209020912092209320942095209620972098209921002101210221032104210521062107210821092110211121122113211421152116 |
- /* StarPU --- Runtime system for heterogeneous multicore architectures.
- *
- * Copyright (C) 2009-2020 Université de Bordeaux, CNRS (LaBRI UMR 5800), Inria
- *
- * StarPU is free software; you can redistribute it and/or modify
- * it under the terms of the GNU Lesser General Public License as published by
- * the Free Software Foundation; either version 2.1 of the License, or (at
- * your option) any later version.
- *
- * StarPU is distributed in the hope that it will be useful, but
- * WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
- *
- * See the GNU Lesser General Public License in COPYING.LGPL for more details.
- */
- #ifndef __STARPU_DATA_INTERFACES_H__
- #define __STARPU_DATA_INTERFACES_H__
- #include <starpu.h>
#ifdef STARPU_USE_CUDA
/*
 * starpu_cudaStream_t is the stream type taken by the asynchronous CUDA copy
 * methods. When STARPU_DONT_INCLUDE_CUDA_HEADERS is defined it is a plain
 * void * so that <cuda_runtime.h> does not have to be included; otherwise it
 * is an alias of cudaStream_t.
 */
# ifdef STARPU_DONT_INCLUDE_CUDA_HEADERS
typedef void *starpu_cudaStream_t;
# else
#  include <cuda_runtime.h>
typedef cudaStream_t starpu_cudaStream_t;
# endif
#endif
- #ifdef __cplusplus
- extern "C"
- {
- #endif
/**
   @defgroup API_Data_Interfaces Data Interfaces

   @brief Data management is done at a high-level in StarPU: rather than
   accessing a mere list of contiguous buffers, the tasks may manipulate
   data that are described by a high-level construct which we call data
   interface.

   An example of data interface is the "vector" interface which describes
   a contiguous data array on a specific memory node. This interface is a
   simple structure containing the number of elements in the array, the
   size of the elements, and the address of the array in the appropriate
   address space (this address may be invalid if there is no valid copy
   of the array in the memory node). More information on the data
   interfaces provided by StarPU is given in \ref API_Data_Interfaces.

   When a piece of data managed by StarPU is used by a task, the task
   implementation is given a pointer to an interface describing a valid
   copy of the data that is accessible from the current processing unit.

   Every worker is associated to a memory node which is a logical
   abstraction of the address space from which the processing unit gets
   its data. For instance, the memory node associated to the different
   CPU workers represents main memory (RAM), the memory node associated
   to a GPU is DRAM embedded on the device. Every memory node is
   identified by a logical index which is accessible from the
   function starpu_worker_get_memory_node(). When registering a piece of
   data to StarPU, the specified memory node indicates where the piece of
   data initially resides (we also call this memory node the home node of
   a piece of data).

   In the case of NUMA systems, functions starpu_memory_nodes_numa_devid_to_id()
   and starpu_memory_nodes_numa_id_to_devid() can be used to convert between NUMA node
   numbers as seen by the Operating System and NUMA node numbers as seen by StarPU.

   There are several ways to register a memory region so that it can be
   managed by StarPU. StarPU provides data interfaces for vectors, 2D
   matrices, 3D matrices as well as BCSR and CSR sparse matrices.

   Each data interface is provided with a set of field access functions.
   The ones using a <c>void *</c> parameter are meant to be used in codelet
   implementations (see for example the code in
   \ref VectorScalingUsingStarPUAPI).

   Applications can provide their own interface as shown in \ref DefiningANewDataInterface.

   @{
*/
/**
   Define the per-interface copy methods. If the
   starpu_data_copy_methods::any_to_any method is provided, it will be
   used by default if no more specific method is provided. It can still
   be useful to provide a more specific method, e.g. to take advantage of
   particular CUDA or OpenCL support.

   All synchronous methods return 0 on success. All asynchronous methods
   return 0 if the transfer was completed synchronously, or
   <c>-EAGAIN</c> if at least some transfers are still ongoing and should
   be awaited for by the core.
*/
struct starpu_data_copy_methods
{
	/**
	   If defined, allow the interface to declare whether it supports
	   transferring from \p src_interface on node \p src_node to \p
	   dst_interface on node \p dst_node, run from node \p handling_node.
	   If not defined, it is assumed that the interface supports all
	   transfers.
	*/
	int (*can_copy)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node, unsigned handling_node);

	/**
	   Define how to copy data from the \p src_interface interface on the
	   \p src_node CPU node to the \p dst_interface interface on the \p
	   dst_node CPU node. Return 0 on success.
	*/
	int (*ram_to_ram)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);

	/**
	   Define how to copy data from the \p src_interface interface on the
	   \p src_node CPU node to the \p dst_interface interface on the \p
	   dst_node CUDA node. Return 0 on success.
	*/
	int (*ram_to_cuda)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);

	/**
	   Define how to copy data from the \p src_interface interface on the
	   \p src_node CPU node to the \p dst_interface interface on the \p
	   dst_node OpenCL node. Return 0 on success.
	*/
	int (*ram_to_opencl)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);

	/**
	   Define how to copy data from the \p src_interface interface on the
	   \p src_node CPU node to the \p dst_interface interface on the \p
	   dst_node FPGA node. Return 0 on success.
	*/
	int (*ram_to_fpga)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);

	/**
	   Define how to copy data from the \p src_interface interface on the
	   \p src_node CPU node to the \p dst_interface interface on the \p
	   dst_node MIC node. Return 0 on success.
	*/
	int (*ram_to_mic)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);

	/**
	   Define how to copy data from the \p src_interface interface on the
	   \p src_node CUDA node to the \p dst_interface interface on the \p
	   dst_node CPU node. Return 0 on success.
	*/
	int (*cuda_to_ram)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);

	/**
	   Define how to copy data from the \p src_interface interface on the
	   \p src_node CUDA node to the \p dst_interface interface on the \p
	   dst_node CUDA node. Return 0 on success.
	*/
	int (*cuda_to_cuda)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);

	/**
	   Define how to copy data from the \p src_interface interface on the
	   \p src_node CUDA node to the \p dst_interface interface on the \p
	   dst_node OpenCL node. Return 0 on success.
	*/
	int (*cuda_to_opencl)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);

	/**
	   Define how to copy data from the \p src_interface interface on the
	   \p src_node OpenCL node to the \p dst_interface interface on the
	   \p dst_node CPU node. Return 0 on success.
	*/
	int (*opencl_to_ram)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);

	/**
	   Define how to copy data from the \p src_interface interface on the
	   \p src_node OpenCL node to the \p dst_interface interface on the
	   \p dst_node CUDA node. Return 0 on success.
	*/
	int (*opencl_to_cuda)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);

	/**
	   Define how to copy data from the \p src_interface interface on the
	   \p src_node OpenCL node to the \p dst_interface interface on the
	   \p dst_node OpenCL node. Return 0 on success.
	*/
	int (*opencl_to_opencl)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);

	/**
	   Define how to copy data from the \p src_interface interface on the
	   \p src_node FPGA node to the \p dst_interface interface on the \p
	   dst_node CPU node. Return 0 on success.
	*/
	int (*fpga_to_ram)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);

	/**
	   Define how to copy data from the \p src_interface interface on the
	   \p src_node MIC node to the \p dst_interface interface on the \p
	   dst_node CPU node. Return 0 on success.
	*/
	int (*mic_to_ram)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);

	/**
	   Define how to copy data from the \p src_interface interface on the
	   \p src_node CPU node to the \p dst_interface interface on the \p
	   dst_node MPI Slave node. Return 0 on success.
	*/
	int (*ram_to_mpi_ms)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);

	/**
	   Define how to copy data from the \p src_interface interface on the
	   \p src_node MPI Slave node to the \p dst_interface interface on
	   the \p dst_node CPU node. Return 0 on success.
	*/
	int (*mpi_ms_to_ram)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);

	/**
	   Define how to copy data from the \p src_interface interface on the
	   \p src_node MPI Slave node to the \p dst_interface interface on
	   the \p dst_node MPI Slave node. Return 0 on success.
	*/
	int (*mpi_ms_to_mpi_ms)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);

#ifdef STARPU_USE_CUDA
	/**
	   Define how to copy data from the \p src_interface interface on the
	   \p src_node CPU node to the \p dst_interface interface on the \p
	   dst_node CUDA node, using the given \p stream. Must return 0 if the
	   transfer was actually completed synchronously, or
	   <c>-EAGAIN</c> if at least some transfers are still ongoing and
	   should be awaited for by the core.
	*/
	int (*ram_to_cuda_async)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node, starpu_cudaStream_t stream);

	/**
	   Define how to copy data from the \p src_interface interface on the
	   \p src_node CUDA node to the \p dst_interface interface on the \p
	   dst_node CPU node, using the given \p stream. Must return 0 if the
	   transfer was actually completed synchronously, or
	   <c>-EAGAIN</c> if at least some transfers are still ongoing and
	   should be awaited for by the core.
	*/
	int (*cuda_to_ram_async)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node, starpu_cudaStream_t stream);

	/**
	   Define how to copy data from the \p src_interface interface on the
	   \p src_node CUDA node to the \p dst_interface interface on the \p
	   dst_node CUDA node, using the given \p stream. Must return 0 if the
	   transfer was actually completed synchronously, or
	   <c>-EAGAIN</c> if at least some transfers are still ongoing and
	   should be awaited for by the core.
	*/
	int (*cuda_to_cuda_async)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node, starpu_cudaStream_t stream);
#else
	/* Without CUDA support the same members are still declared, with a
	 * parameterless signature, so that the member names and their number
	 * do not depend on the build configuration. */
	int (*ram_to_cuda_async)(void);
	int (*cuda_to_ram_async)(void);
	int (*cuda_to_cuda_async)(void);
#endif

#if defined(STARPU_USE_OPENCL) && !defined(__CUDACC__)
	/**
	   Define how to copy data from the \p src_interface interface on the
	   \p src_node CPU node to the \p dst_interface interface on the \p
	   dst_node OpenCL node, by recording in \p event, a pointer to a
	   <c>cl_event</c>, the event of the last submitted transfer. Must
	   return 0 if the transfer was actually completed
	   synchronously, or <c>-EAGAIN</c> if at least some transfers are
	   still ongoing and should be awaited for by the core.
	*/
	int (*ram_to_opencl_async)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node, cl_event *event);

	/**
	   Define how to copy data from the \p src_interface interface on the
	   \p src_node OpenCL node to the \p dst_interface interface on the
	   \p dst_node CPU node, by recording in \p event, a pointer to a
	   <c>cl_event</c>, the event of the last submitted transfer. Must
	   return 0 if the transfer was actually completed
	   synchronously, or <c>-EAGAIN</c> if at least some transfers are
	   still ongoing and should be awaited for by the core.
	*/
	int (*opencl_to_ram_async)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node, cl_event *event);

	/**
	   Define how to copy data from the \p src_interface interface on the
	   \p src_node OpenCL node to the \p dst_interface interface on the
	   \p dst_node OpenCL node, by recording in \p event, a pointer to a
	   <c>cl_event</c>, the event of the last submitted transfer. Must
	   return 0 if the transfer was actually completed
	   synchronously, or <c>-EAGAIN</c> if at least some transfers are
	   still ongoing and should be awaited for by the core.
	*/
	int (*opencl_to_opencl_async)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node, cl_event *event);
#else
	/* Same members with a parameterless signature when OpenCL support is
	 * disabled or when the header is compiled by nvcc (__CUDACC__). */
	int (*ram_to_opencl_async)(void);
	int (*opencl_to_ram_async)(void);
	int (*opencl_to_opencl_async)(void);
#endif

	/**
	   Define how to copy data from the \p src_interface interface on the
	   \p src_node CPU node to the \p dst_interface interface on the \p
	   dst_node FPGA node. Must return 0 if the transfer was actually
	   completed synchronously, or <c>-EAGAIN</c> if at least
	   some transfers are still ongoing and should be awaited for by the
	   core.
	*/
	int (*ram_to_fpga_async)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);

	/**
	   Define how to copy data from the \p src_interface interface on the
	   \p src_node FPGA node to the \p dst_interface interface on the \p
	   dst_node CPU node. Must return 0 if the transfer was actually
	   completed synchronously, or <c>-EAGAIN</c> if at least
	   some transfers are still ongoing and should be awaited for by the
	   core.
	*/
	int (*fpga_to_ram_async)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);

	/**
	   Define how to copy data from the \p src_interface interface on the
	   \p src_node CPU node to the \p dst_interface interface on the \p
	   dst_node MIC node. Must return 0 if the transfer was actually
	   completed synchronously, or <c>-EAGAIN</c> if at least
	   some transfers are still ongoing and should be awaited for by the
	   core.
	*/
	int (*ram_to_mic_async)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);

	/**
	   Define how to copy data from the \p src_interface interface on the
	   \p src_node MIC node to the \p dst_interface interface on the \p
	   dst_node CPU node. Must return 0 if the transfer was actually
	   completed synchronously, or <c>-EAGAIN</c> if at least
	   some transfers are still ongoing and should be awaited for by the
	   core.
	*/
	int (*mic_to_ram_async)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node);

	/**
	   Define how to copy data from the \p src_interface interface on the
	   \p src_node CPU node to the \p dst_interface interface on the \p
	   dst_node MPI Slave node, with the given \p event. Must return 0 if
	   the transfer was actually completed synchronously, or
	   <c>-EAGAIN</c> if at least some transfers are still ongoing and
	   should be awaited for by the core.
	*/
	int (*ram_to_mpi_ms_async)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node, void *event);

	/**
	   Define how to copy data from the \p src_interface interface on the
	   \p src_node MPI Slave node to the \p dst_interface interface on
	   the \p dst_node CPU node, with the given \p event. Must return 0 if
	   the transfer was actually completed synchronously, or
	   <c>-EAGAIN</c> if at least some transfers are still ongoing and
	   should be awaited for by the core.
	*/
	int (*mpi_ms_to_ram_async)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node, void *event);

	/**
	   Define how to copy data from the \p src_interface interface on the
	   \p src_node MPI Slave node to the \p dst_interface interface on
	   the \p dst_node MPI Slave node, with the given \p event. Must
	   return 0 if the transfer was actually completed
	   synchronously, or <c>-EAGAIN</c> if at least some transfers are
	   still ongoing and should be awaited for by the core.
	*/
	int (*mpi_ms_to_mpi_ms_async)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node, void *event);

	/**
	   Define how to copy data from the \p src_interface interface on the
	   \p src_node node to the \p dst_interface interface on the \p
	   dst_node node. This is meant to be implemented through the
	   starpu_interface_copy() helper, to which \p async_data should be
	   passed as such, and will be used to manage asynchronicity. This
	   must return <c>-EAGAIN</c> if any of the starpu_interface_copy()
	   calls has returned <c>-EAGAIN</c> (i.e. at least some transfer is
	   still ongoing), and return 0 otherwise.

	   This can only be implemented if the interface has ready-to-send
	   data blocks. If the interface is more involved than
	   this, i.e. it needs to collect pieces of data before
	   transferring, starpu_data_interface_ops::pack_data and
	   starpu_data_interface_ops::unpack_data should be implemented instead,
	   and the core will just transfer the resulting data buffer.
	*/
	int (*any_to_any)(void *src_interface, unsigned src_node, void *dst_interface, unsigned dst_node, void *async_data);
};
/**
   Identifier for all predefined StarPU data interfaces
*/
enum starpu_data_interface_id
{
	STARPU_UNKNOWN_INTERFACE_ID = -1,    /**< Unknown interface */
	STARPU_MATRIX_INTERFACE_ID = 0,      /**< Identifier for the matrix data interface */
	STARPU_BLOCK_INTERFACE_ID = 1,       /**< Identifier for the block data interface */
	STARPU_VECTOR_INTERFACE_ID = 2,      /**< Identifier for the vector data interface */
	STARPU_CSR_INTERFACE_ID = 3,         /**< Identifier for the CSR data interface */
	STARPU_BCSR_INTERFACE_ID = 4,        /**< Identifier for the BCSR data interface */
	STARPU_VARIABLE_INTERFACE_ID = 5,    /**< Identifier for the variable data interface */
	STARPU_VOID_INTERFACE_ID = 6,        /**< Identifier for the void data interface */
	STARPU_MULTIFORMAT_INTERFACE_ID = 7, /**< Identifier for the multiformat data interface */
	STARPU_COO_INTERFACE_ID = 8,         /**< Identifier for the COO data interface */
	STARPU_TENSOR_INTERFACE_ID = 9,      /**< Identifier for the tensor data interface */
	STARPU_MAX_INTERFACE_ID = 10         /**< Maximum number of data interfaces */
};
- /**
- Per-interface data management methods.
- */
- struct starpu_data_interface_ops
- {
- /**
- Register an existing interface into a data handle.
- This iterates over all memory nodes to initialize all fields of the data
- interface on each of them. Since data is not allocated yet except on the
- home node, pointers should be left as NULL except on the \p home_node, for
- which the pointers should be copied from the given \p data_interface, which
- was filled with the application's pointers.
- This method is mandatory.
- */
- void (*register_data_handle) (starpu_data_handle_t handle, unsigned home_node, void *data_interface);
- /**
- Allocate data for the interface on a given node. This should use
- starpu_malloc_on_node() to perform the allocation(s), and fill the pointers
- in the data interface. It should return the size of the allocated memory, or
- -ENOMEM if memory could not be allocated.
- Note that the memory node can be CPU memory, GPU memory, or even disk
- area. The result returned by starpu_malloc_on_node() should be just
- stored as uintptr_t without trying to interpret it since it may be a
- GPU pointer, a disk descriptor, etc.
- This method is mandatory to be able to support memory nodes.
- */
- starpu_ssize_t (*allocate_data_on_node) (void *data_interface, unsigned node);
- /**
- Free data of the interface on a given node.
- This method is mandatory to be able to support memory nodes.
- */
- void (*free_data_on_node) (void *data_interface, unsigned node);
- /**
- Initialize the interface.
- This method is optional. It is called when initializing the
- handler on all the memory nodes.
- */
- void (*init) (void *data_interface);
- /**
- Struct with pointer to functions for performing ram/cuda/opencl synchronous and asynchronous transfers.
- This field is mandatory to be able to support memory
- nodes, except disk nodes which can be supported by just
- implementing starpu_data_interface_ops::pack_data and
- starpu_data_interface_ops::unpack_data.
- */
- const struct starpu_data_copy_methods *copy_methods;
- /**
- @deprecated
- Use starpu_data_interface_ops::to_pointer instead.
- Return the current pointer (if any) for the handle on the given node.
- This method is only required if starpu_data_interface_ops::to_pointer
- is not implemented.
- */
- void * (*handle_to_pointer) (starpu_data_handle_t handle, unsigned node);
- /**
- Return the current pointer (if any) for the given interface on the given node.
- This method is only required for starpu_data_handle_to_pointer()
- and starpu_data_get_local_ptr(), and for disk support.
- */
- void * (*to_pointer) (void *data_interface, unsigned node);
- /**
- Return whether the given \p ptr is within the data for the given interface on the given node.
- This method is optional, as it is only used for coherency checks.
- */
- int (*pointer_is_inside) (void *data_interface, unsigned node, void *ptr);
- /**
- Return an estimation of the size of data, for performance models and tracing feedback.
- */
- size_t (*get_size) (starpu_data_handle_t handle);
- /**
- Return an estimation of the size of allocated data, for allocation
- management.
- If not specified, the starpu_data_interface_ops::get_size method is
- used instead.
- */
- size_t (*get_alloc_size) (starpu_data_handle_t handle);
- /**
- Return the maximum size that the data may need to increase to. For
- instance, in the case of compressed matrix tiles this is the size
- when the block is fully dense.
- This is currently only used for feedback tools.
- */
- size_t (*get_max_size) (starpu_data_handle_t handle);
- /**
- Return a 32bit footprint which characterizes the data size and layout (nx, ny, ld, elemsize, etc.), required for indexing performance models.
- starpu_hash_crc32c_be() and alike can be used to produce this 32bit value from various types of values.
- */
- uint32_t (*footprint) (starpu_data_handle_t handle);
- /**
- Return a 32bit footprint which characterizes the data allocation, to be used
- for indexing allocation cache.
- If not specified, the starpu_data_interface_ops::footprint method is
- used instead.
- */
- uint32_t (*alloc_footprint) (starpu_data_handle_t handle);
- /**
- Compare the data size and layout of two interfaces (nx, ny, ld, elemsize,
- etc.), to be used for indexing performance models. It should return 1 if
- the two interfaces size and layout match computation-wise, and 0 otherwise.
- It does *not* compare the actual content of the interfaces.
- */
- int (*compare) (void *data_interface_a, void *data_interface_b);
- /**
- Compare the data allocation of two interfaces etc.), to be used for indexing
- allocation cache. It should return
- 1 if the two interfaces are allocation-compatible, i.e. basically have the same alloc_size, and 0 otherwise.
- If not specified, the starpu_data_interface_ops::compare method is
- used instead.
- */
- int (*alloc_compare) (void *data_interface_a, void *data_interface_b);
- /**
- Dump the sizes of a handle to a file.
- This is required for performance models
- */
- void (*display) (starpu_data_handle_t handle, FILE *f);
- /**
- Describe the data into a string in a brief way, such as one
- letter to describe the type of data, and the data
- dimensions.
- This is required for tracing feedback.
- */
- starpu_ssize_t (*describe) (void *data_interface, char *buf, size_t size);
- /**
- An identifier that is unique to each interface.
- */
- enum starpu_data_interface_id interfaceid;
- /**
- Size of the interface data descriptor.
- */
- size_t interface_size;
- /**
- */
- char is_multiformat;
- /**
- If set to non-zero, StarPU will never try to reuse an allocated
- buffer for a different handle. This can be notably useful for
- application-defined interfaces which have a dynamic size, and for
- which it thus does not make sense to reuse the buffer since will
- probably not have the proper size.
- */
- char dontcache;
- /**
- */
- struct starpu_multiformat_data_interface_ops* (*get_mf_ops)(void *data_interface);
- /**
- Pack the data handle into a contiguous buffer at the address
- allocated with <c>starpu_malloc_flags(ptr, size, 0)</c> (and thus
- returned in \p ptr) and set the size of the newly created buffer
- in \p count. If \p ptr is <c>NULL</c>, the function should not
- copy the data in the buffer but just set count to the size of the
- buffer which would have been allocated. The special value -1
- indicates the size is yet unknown.
- This method (and starpu_data_interface_ops::unpack_data) is required
- for disk support if the starpu_data_copy_methods::any_to_any method
- is not implemented (because the in-memory data layout is too
- complex).
- This is also required for MPI support if there is no registered MPI data type.
- */
- int (*pack_data) (starpu_data_handle_t handle, unsigned node, void **ptr, starpu_ssize_t *count);
- /**
- Unpack the data handle from the contiguous buffer at the address
- \p ptr of size \p count.
- The memory at the address \p ptr should be freed after the data unpacking operation.
- */
- int (*unpack_data) (starpu_data_handle_t handle, unsigned node, void *ptr, size_t count);
- /**
- Name of the interface
- */
- char *name;
- };
- /**
- @name Basic API
- @{
- */
- /**
- Register a piece of data into the handle located at the
- \p handleptr address. The \p data_interface buffer contains the initial
- description of the data in the \p home_node. The \p ops argument is a
- pointer to a structure describing the different methods used to
- manipulate this type of interface. See starpu_data_interface_ops for
- more details on this structure.
- If \p home_node is -1, StarPU will automatically allocate the memory when
- it is used for the first time in write-only mode. Once such data
- handle has been automatically allocated, it is possible to access it
- using any access mode.
- Note that StarPU supplies a set of predefined types of interface (e.g.
- vector or matrix) which can be registered by the means of helper
- functions (e.g. starpu_vector_data_register() or
- starpu_matrix_data_register()).
- */
- void starpu_data_register(starpu_data_handle_t *handleptr, int home_node, void *data_interface, struct starpu_data_interface_ops *ops);
- /**
- Register that a buffer for \p handle on \p node will be set. This is typically
- used by starpu_*_ptr_register helpers before setting the interface pointers for
- this node, to tell the core that it is now allocated.
- */
- void starpu_data_ptr_register(starpu_data_handle_t handle, unsigned node);
- /**
- Register a new piece of data into the handle \p handledst with the
- same interface as the handle \p handlesrc.
- */
- void starpu_data_register_same(starpu_data_handle_t *handledst, starpu_data_handle_t handlesrc);
- /**
- Return the pointer associated with \p handle on node \p node or <c>NULL</c>
- if handle’s interface does not support this operation or data for this
- \p handle is not allocated on that \p node.
- */
- void *starpu_data_handle_to_pointer(starpu_data_handle_t handle, unsigned node);
- /**
- Return whether the given \p ptr is within the data for \p handle on node \p
- node (1) or not (0). If the handle interface does not support this operation,
- and thus the result is unknown, -1 is returned.
- */
- int starpu_data_pointer_is_inside(starpu_data_handle_t handle, unsigned node, void *ptr);
- /**
- Return the local pointer associated with \p handle or <c>NULL</c> if
- \p handle’s interface does not have any data allocated locally.
- */
- void *starpu_data_get_local_ptr(starpu_data_handle_t handle);
- /**
- Return the interface associated with \p handle on \p memory_node.
- */
- void *starpu_data_get_interface_on_node(starpu_data_handle_t handle, unsigned memory_node);
- /**
- Return the unique identifier of the interface associated with
- the given \p handle.
- */
- enum starpu_data_interface_id starpu_data_get_interface_id(starpu_data_handle_t handle);
- /**
- Execute the packing operation of the interface of the data
- registered at \p handle (see starpu_data_interface_ops). This
- packing operation must allocate a buffer large enough at \p ptr and copy
- into the newly allocated buffer the data associated to \p handle. \p count
- will be set to the size of the allocated buffer. If \p ptr is <c>NULL</c>, the
- function should not copy the data in the buffer but just set \p count to
- the size of the buffer which would have been allocated. The special
- value -1 indicates the size is yet unknown.
- */
- int starpu_data_pack(starpu_data_handle_t handle, void **ptr, starpu_ssize_t *count);
- /**
- Unpack into \p handle the data located at \p ptr of size \p count, as
- described by the interface of the data. The interface registered at
- \p handle must define an unpacking operation (see
- starpu_data_interface_ops::unpack_data).
- */
- int starpu_data_unpack(starpu_data_handle_t handle, void *ptr, size_t count);
- /**
- Return the size of the data associated with \p handle.
- */
- size_t starpu_data_get_size(starpu_data_handle_t handle);
- /**
- Return the size of the allocated data associated with \p handle.
- */
- size_t starpu_data_get_alloc_size(starpu_data_handle_t handle);
- /**
- Return the maximum size that the \p handle data may need to increase to.
- */
- starpu_ssize_t starpu_data_get_max_size(starpu_data_handle_t handle);
- /**
- Return the handle corresponding to the data pointed to by the \p ptr host pointer.
- */
- starpu_data_handle_t starpu_data_lookup(const void *ptr);
- int starpu_data_get_home_node(starpu_data_handle_t handle); /**< NOTE(review): undocumented in this header; presumably returns the home node \p handle was registered with (see the \p home_node argument of starpu_data_register()) - TODO confirm. */
- /**
- Print basic information about \p handle on \p node to \p stream.
- */
- void starpu_data_print(starpu_data_handle_t handle, unsigned node, FILE *stream);
- /**
- Return the next available id for a newly created data interface
- (\ref DefiningANewDataInterface).
- */
- int starpu_data_interface_get_next_id(void);
- /**
- Copy \p size bytes from byte offset \p src_offset of \p src on \p src_node
- to byte offset \p dst_offset of \p dst on \p dst_node. This is to be used in
- the starpu_data_copy_methods::any_to_any copy method, which is provided with \p async_data to
- be passed to starpu_interface_copy(). This returns <c>-EAGAIN</c> if the
- transfer is still ongoing, or 0 if the transfer is already completed.
- */
- int starpu_interface_copy(uintptr_t src, size_t src_offset, unsigned src_node,
- uintptr_t dst, size_t dst_offset, unsigned dst_node,
- size_t size, void *async_data);
- /**
- Copy \p numblocks blocks of \p blocksize bytes from byte offset \p src_offset
- of \p src on \p src_node to byte offset \p dst_offset of \p dst on \p
- dst_node.
- The blocks start at addresses which are \p ld_src (resp. \p ld_dst) bytes apart in
- the source (resp. destination) interface.
- If \p blocksize == \p ld_src == \p ld_dst, the transfer is optimized into a single
- starpu_interface_copy() call.
- This is to be used in the starpu_data_copy_methods::any_to_any copy
- method for 2D data, which is provided with \p async_data to be passed to
- starpu_interface_copy(). This returns <c>-EAGAIN</c> if the transfer is still
- ongoing, or 0 if the transfer is already completed.
- */
- int starpu_interface_copy2d(uintptr_t src, size_t src_offset, unsigned src_node,
- uintptr_t dst, size_t dst_offset, unsigned dst_node,
- size_t blocksize,
- size_t numblocks, size_t ld_src, size_t ld_dst,
- void *async_data);
- /**
- Copy \p numblocks1 * \p numblocks2 blocks of \p blocksize bytes from byte
- offset \p src_offset of \p src on \p src_node to byte offset \p dst_offset of
- \p dst on \p dst_node.
- The blocks are grouped by \p numblocks1 blocks whose start addresses are
- \p ld1_src (resp. \p ld1_dst) bytes apart in the source (resp. destination)
- interface.
- Such groups are grouped by \p numblocks2 groups whose start addresses are
- \p ld2_src (resp. \p ld2_dst) bytes apart in the source (resp. destination)
- interface.
- If the blocks are contiguous, the transfers will be optimized.
- This is to be used in the starpu_data_copy_methods::any_to_any copy
- method for 3D data, which is provided with \p async_data to be passed to
- starpu_interface_copy(). This returns <c>-EAGAIN</c> if the transfer is still
- ongoing, or 0 if the transfer is already completed.
- */
- int starpu_interface_copy3d(uintptr_t src, size_t src_offset, unsigned src_node,
- uintptr_t dst, size_t dst_offset, unsigned dst_node,
- size_t blocksize,
- size_t numblocks1, size_t ld1_src, size_t ld1_dst,
- size_t numblocks2, size_t ld2_src, size_t ld2_dst,
- void *async_data);
- /**
- Copy \p numblocks1 * \p numblocks2 * \p numblocks3 blocks of \p blocksize
- bytes from byte offset \p src_offset of \p src on \p src_node to byte offset
- \p dst_offset of \p dst on \p dst_node.
- The blocks are grouped by \p numblocks1 blocks whose start addresses are
- \p ld1_src (resp. \p ld1_dst) bytes apart in the source (resp. destination)
- interface.
- Such groups are grouped by \p numblocks2 groups whose start addresses are
- \p ld2_src (resp. \p ld2_dst) bytes apart in the source (resp. destination)
- interface.
- Such groups are grouped by \p numblocks3 groups whose start addresses are
- \p ld3_src (resp. \p ld3_dst) bytes apart in the source (resp. destination)
- interface.
- If the blocks are contiguous, the transfers will be optimized.
- This is to be used in the starpu_data_copy_methods::any_to_any copy
- method for 4D data, which is provided with \p async_data to be passed to
- starpu_interface_copy(). This returns <c>-EAGAIN</c> if the transfer is still
- ongoing, or 0 if the transfer is already completed.
- */
- int starpu_interface_copy4d(uintptr_t src, size_t src_offset, unsigned src_node,
- uintptr_t dst, size_t dst_offset, unsigned dst_node,
- size_t blocksize,
- size_t numblocks1, size_t ld1_src, size_t ld1_dst,
- size_t numblocks2, size_t ld2_src, size_t ld2_dst,
- size_t numblocks3, size_t ld3_src, size_t ld3_dst,
- void *async_data);
- /**
- When an asynchronous implementation of the data transfer is implemented, the
- call to the underlying CUDA, OpenCL, etc. function should be surrounded
- by calls to starpu_interface_start_driver_copy_async() and
- starpu_interface_end_driver_copy_async(), so that it is recorded in offline
- execution traces, and the timing of the submission is checked. \p start must
- point to a variable whose value will be passed unchanged to
- starpu_interface_end_driver_copy_async().
- */
- void starpu_interface_start_driver_copy_async(unsigned src_node, unsigned dst_node, double *start);
- /**
- See starpu_interface_start_driver_copy_async().
- */
- void starpu_interface_end_driver_copy_async(unsigned src_node, unsigned dst_node, double start);
- /**
- Record in offline execution traces the copy of \p size bytes from
- node \p src_node to node \p dst_node
- */
- void starpu_interface_data_copy(unsigned src_node, unsigned dst_node, size_t size);
- /**
- Allocate \p size bytes on node \p dst_node with the given allocation \p flags. This returns 0 if
- allocation failed, the allocation method should then return <c>-ENOMEM</c> as
- allocated size. Deallocation must be done with starpu_free_on_node_flags().
- */
- uintptr_t starpu_malloc_on_node_flags(unsigned dst_node, size_t size, int flags);
- /**
- Allocate \p size bytes on node \p dst_node with the default allocation flags. This returns 0 if
- allocation failed, the allocation method should then return <c>-ENOMEM</c> as
- allocated size. Deallocation must be done with starpu_free_on_node().
- */
- uintptr_t starpu_malloc_on_node(unsigned dst_node, size_t size);
- /**
- Free \p addr of \p size bytes on node \p dst_node which was previously allocated
- with starpu_malloc_on_node_flags() with the given allocation \p flags.
- */
- void starpu_free_on_node_flags(unsigned dst_node, uintptr_t addr, size_t size, int flags);
- /**
- Free \p addr of \p size bytes on node \p dst_node which was previously allocated
- with starpu_malloc_on_node().
- */
- void starpu_free_on_node(unsigned dst_node, uintptr_t addr, size_t size);
- /**
- Define the default flags for allocations performed by starpu_malloc_on_node() and
- starpu_free_on_node(). The default is \ref STARPU_MALLOC_PINNED | \ref STARPU_MALLOC_COUNT.
- */
- void starpu_malloc_on_node_set_default_flags(unsigned node, int flags);
- /** @} */
- /**
- @name Accessing Matrix Data Interfaces
- @{
- */
- extern struct starpu_data_interface_ops starpu_interface_matrix_ops;
- /**
- Matrix interface for dense matrices
- */
- struct starpu_matrix_interface
- {
- enum starpu_data_interface_id id; /**< Identifier of the interface */
- uintptr_t ptr; /**< local pointer of the matrix */
- uintptr_t dev_handle; /**< device handle of the matrix */
- size_t offset; /**< offset in the matrix */
- uint32_t nx; /**< number of elements on the x-axis of the matrix */
- uint32_t ny; /**< number of elements on the y-axis of the matrix */
- uint32_t ld; /**< number of elements between each row of the
- matrix. May be equal to starpu_matrix_interface::nx
- when there is no padding.
- */
- size_t elemsize; /**< size of the elements of the matrix */
- size_t allocsize; /**< size actually currently allocated */
- };
- /**
- Register the \p nx x \p ny 2D matrix of \p elemsize-byte elements pointed
- by \p ptr and initialize \p handle to represent it. \p ld specifies the number
- of elements between rows. A value greater than \p nx adds padding, which
- can be useful for alignment purposes.
- Here is an example of how to use the function.
- \code{.c}
- float *matrix;
- starpu_data_handle_t matrix_handle;
- matrix = (float*)malloc(width * height * sizeof(float));
- starpu_matrix_data_register(&matrix_handle, STARPU_MAIN_RAM, (uintptr_t)matrix, width, width, height, sizeof(float));
- \endcode
- */
- void starpu_matrix_data_register(starpu_data_handle_t *handle, int home_node, uintptr_t ptr, uint32_t ld, uint32_t nx, uint32_t ny, size_t elemsize);
- /**
- Similar to starpu_matrix_data_register, but additionally specifies which
- allocation size should be used instead of the initial nx*ny*elemsize.
- */
- void starpu_matrix_data_register_allocsize(starpu_data_handle_t *handle, int home_node, uintptr_t ptr, uint32_t ld, uint32_t nx, uint32_t ny, size_t elemsize, size_t allocsize);
- /**
- Register into the \p handle that to store data on node \p node it should use the
- buffer located at \p ptr, or device handle \p dev_handle and offset \p offset
- (for OpenCL, notably), with \p ld elements between rows.
- */
- void starpu_matrix_ptr_register(starpu_data_handle_t handle, unsigned node, uintptr_t ptr, uintptr_t dev_handle, size_t offset, uint32_t ld);
- /**
- Return the number of elements on the x-axis of the matrix
- designated by \p handle.
- */
- uint32_t starpu_matrix_get_nx(starpu_data_handle_t handle);
- /**
- Return the number of elements on the y-axis of the matrix
- designated by \p handle.
- */
- uint32_t starpu_matrix_get_ny(starpu_data_handle_t handle);
- /**
- Return the number of elements between each row of the matrix
- designated by \p handle. May be equal to nx when there is no padding.
- */
- uint32_t starpu_matrix_get_local_ld(starpu_data_handle_t handle);
- /**
- Return the local pointer associated with \p handle.
- */
- uintptr_t starpu_matrix_get_local_ptr(starpu_data_handle_t handle);
- /**
- Return the size of the elements registered into the matrix
- designated by \p handle.
- */
- size_t starpu_matrix_get_elemsize(starpu_data_handle_t handle);
- /**
- Return the allocated size of the matrix designated by \p handle.
- */
- size_t starpu_matrix_get_allocsize(starpu_data_handle_t handle);
- #if defined(STARPU_HAVE_STATEMENT_EXPRESSIONS) && defined(STARPU_DEBUG)
- #define STARPU_MATRIX_CHECK(interface) STARPU_ASSERT_MSG((((struct starpu_matrix_interface *)(interface))->id) == STARPU_MATRIX_INTERFACE_ID, "Error. The given data is not a matrix.")
- #define STARPU_MATRIX_GET_PTR(interface) ({ STARPU_MATRIX_CHECK(interface); (((struct starpu_matrix_interface *)(interface))->ptr) ; })
- #define STARPU_MATRIX_GET_DEV_HANDLE(interface) ({ STARPU_MATRIX_CHECK(interface); (((struct starpu_matrix_interface *)(interface))->dev_handle) ; })
- #define STARPU_MATRIX_GET_OFFSET(interface) ({ STARPU_MATRIX_CHECK(interface); (((struct starpu_matrix_interface *)(interface))->offset) ; })
- #define STARPU_MATRIX_GET_NX(interface) ({ STARPU_MATRIX_CHECK(interface); (((struct starpu_matrix_interface *)(interface))->nx) ; })
- #define STARPU_MATRIX_GET_NY(interface) ({ STARPU_MATRIX_CHECK(interface); (((struct starpu_matrix_interface *)(interface))->ny) ; })
- #define STARPU_MATRIX_GET_LD(interface) ({ STARPU_MATRIX_CHECK(interface); (((struct starpu_matrix_interface *)(interface))->ld) ; })
- #define STARPU_MATRIX_GET_ELEMSIZE(interface) ({ STARPU_MATRIX_CHECK(interface); (((struct starpu_matrix_interface *)(interface))->elemsize) ; })
- #define STARPU_MATRIX_GET_ALLOCSIZE(interface) ({ STARPU_MATRIX_CHECK(interface); (((struct starpu_matrix_interface *)(interface))->allocsize) ; })
- #else
- /**
- Return a pointer to the matrix designated by \p interface, valid
- on CPUs and CUDA devices only. For OpenCL devices, the device handle
- and offset need to be used instead.
- */
- #define STARPU_MATRIX_GET_PTR(interface) (((struct starpu_matrix_interface *)(interface))->ptr)
- /**
- Return a device handle for the matrix designated by \p interface,
- to be used with OpenCL. The offset returned by
- ::STARPU_MATRIX_GET_OFFSET has to be used in
- addition to this.
- */
- #define STARPU_MATRIX_GET_DEV_HANDLE(interface) (((struct starpu_matrix_interface *)(interface))->dev_handle)
- /**
- Return the offset in the matrix designated by \p interface, to be
- used with the device handle.
- */
- #define STARPU_MATRIX_GET_OFFSET(interface) (((struct starpu_matrix_interface *)(interface))->offset)
- /**
- Return the number of elements on the x-axis of the matrix
- designated by \p interface.
- */
- #define STARPU_MATRIX_GET_NX(interface) (((struct starpu_matrix_interface *)(interface))->nx)
- /**
- Return the number of elements on the y-axis of the matrix
- designated by \p interface.
- */
- #define STARPU_MATRIX_GET_NY(interface) (((struct starpu_matrix_interface *)(interface))->ny)
- /**
- Return the number of elements between each row of the matrix
- designated by \p interface. May be equal to nx when there is no padding.
- */
- #define STARPU_MATRIX_GET_LD(interface) (((struct starpu_matrix_interface *)(interface))->ld)
- /**
- Return the size of the elements registered into the matrix
- designated by \p interface.
- */
- #define STARPU_MATRIX_GET_ELEMSIZE(interface) (((struct starpu_matrix_interface *)(interface))->elemsize)
- /**
- Return the allocated size of the matrix designated by \p interface.
- */
- #define STARPU_MATRIX_GET_ALLOCSIZE(interface) (((struct starpu_matrix_interface *)(interface))->allocsize)
- #endif
#ifndef STARPU_MATRIX_CHECK
/*
   STARPU_MATRIX_CHECK is only provided together with the checking variant of
   the getters (STARPU_HAVE_STATEMENT_EXPRESSIONS && STARPU_DEBUG). The setters
   below expand it unconditionally, so provide a no-op fallback for every other
   configuration; the getters perform no check there either.
*/
#define STARPU_MATRIX_CHECK(interface) ((void)0)
#endif

/**
   Set the number of elements on the x-axis of the matrix
   designated by \p interface to \p newnx.
*/
#define STARPU_MATRIX_SET_NX(interface, newnx) \
	do { \
		STARPU_MATRIX_CHECK(interface); \
		(((struct starpu_matrix_interface *)(interface))->nx) = (newnx); \
	} while (0)

/**
   Set the number of elements on the y-axis of the matrix
   designated by \p interface to \p newny.
*/
#define STARPU_MATRIX_SET_NY(interface, newny) \
	do { \
		STARPU_MATRIX_CHECK(interface); \
		(((struct starpu_matrix_interface *)(interface))->ny) = (newny); \
	} while (0)

/**
   Set the number of elements between each row of the matrix
   designated by \p interface to \p newld. May be set to the same value as nx
   when there is no padding.
*/
#define STARPU_MATRIX_SET_LD(interface, newld) \
	do { \
		STARPU_MATRIX_CHECK(interface); \
		(((struct starpu_matrix_interface *)(interface))->ld) = (newld); \
	} while (0)
- /** @} */
- /**
- @name Accessing COO Data Interfaces
- @{
- */
- extern struct starpu_data_interface_ops starpu_interface_coo_ops;
- /**
- COO Matrices
- */
- struct starpu_coo_interface
- {
- enum starpu_data_interface_id id; /**< identifier of the interface */
- uint32_t *columns; /**< column array of the matrix */
- uint32_t *rows; /**< row array of the matrix */
- uintptr_t values; /**< values of the matrix */
- uint32_t nx; /**< number of elements on the x-axis of the matrix */
- uint32_t ny; /**< number of elements on the y-axis of the matrix */
- uint32_t n_values; /**< number of values registered in the matrix */
- size_t elemsize; /**< size of the elements of the matrix */
- };
- /**
- Register the \p nx x \p ny 2D matrix given in the COO format, using the
- \p columns, \p rows, \p values arrays, which must have \p n_values elements of
- size \p elemsize. Initialize \p handleptr.
- */
- void starpu_coo_data_register(starpu_data_handle_t *handleptr, int home_node, uint32_t nx, uint32_t ny, uint32_t n_values, uint32_t *columns, uint32_t *rows, uintptr_t values, size_t elemsize);
- /**
- Return a pointer to the column array of the matrix designated
- by \p interface.
- */
- #define STARPU_COO_GET_COLUMNS(interface) (((struct starpu_coo_interface *)(interface))->columns)
- /**
- Return a device handle for the column array of the matrix
- designated by \p interface, to be used with OpenCL. The offset
- returned by ::STARPU_COO_GET_OFFSET has to be used in addition to
- this.
- */
- #define STARPU_COO_GET_COLUMNS_DEV_HANDLE(interface) (((struct starpu_coo_interface *)(interface))->columns)
- /**
- Return a pointer to the rows array of the matrix designated by
- \p interface.
- */
- #define STARPU_COO_GET_ROWS(interface) (((struct starpu_coo_interface *)(interface))->rows)
- /**
- Return a device handle for the row array of the matrix
- designated by \p interface, to be used on OpenCL. The offset returned
- by ::STARPU_COO_GET_OFFSET has to be used in addition to this.
- */
- #define STARPU_COO_GET_ROWS_DEV_HANDLE(interface) (((struct starpu_coo_interface *)(interface))->rows)
- /**
- Return a pointer to the values array of the matrix designated
- by \p interface.
- */
- #define STARPU_COO_GET_VALUES(interface) (((struct starpu_coo_interface *)(interface))->values)
- /**
- Return a device handle for the value array of the matrix
- designated by \p interface, to be used on OpenCL. The offset returned
- by ::STARPU_COO_GET_OFFSET has to be used in addition to this.
- */
- #define STARPU_COO_GET_VALUES_DEV_HANDLE(interface) (((struct starpu_coo_interface *)(interface))->values)
- /**
- Offset in the arrays of a COO matrix, to be used in addition to the
- device handles. This is the constant 0. Unlike the other COO accessors,
- this is an object-like macro: it must be used without an interface argument.
- */
- #define STARPU_COO_GET_OFFSET 0
- /**
- Return the number of elements on the x-axis of the matrix
- designated by \p interface.
- */
- #define STARPU_COO_GET_NX(interface) (((struct starpu_coo_interface *)(interface))->nx)
- /**
- Return the number of elements on the y-axis of the matrix
- designated by \p interface.
- */
- #define STARPU_COO_GET_NY(interface) (((struct starpu_coo_interface *)(interface))->ny)
- /**
- Return the number of values registered in the matrix designated
- by \p interface.
- */
- #define STARPU_COO_GET_NVALUES(interface) (((struct starpu_coo_interface *)(interface))->n_values)
- /**
- Return the size of the elements registered into the matrix
- designated by \p interface.
- */
- #define STARPU_COO_GET_ELEMSIZE(interface) (((struct starpu_coo_interface *)(interface))->elemsize)
- /** @} */
- /**
- @name Block Data Interface
- @{
- */
- extern struct starpu_data_interface_ops starpu_interface_block_ops;
- /* TODO: rename to 3dmatrix? */
- /* TODO: add allocsize support */
- /**
- Block interface for 3D dense blocks
- */
- struct starpu_block_interface
- {
- enum starpu_data_interface_id id; /**< identifier of the interface */
- uintptr_t ptr; /**< local pointer of the block */
- uintptr_t dev_handle; /**< device handle of the block. */
- size_t offset; /**< offset in the block. */
- uint32_t nx; /**< number of elements on the x-axis of the block. */
- uint32_t ny; /**< number of elements on the y-axis of the block. */
- uint32_t nz; /**< number of elements on the z-axis of the block. */
- uint32_t ldy; /**< number of elements between two lines */
- uint32_t ldz; /**< number of elements between two planes */
- size_t elemsize; /**< size of the elements of the block. */
- };
- /**
- Register the \p nx x \p ny x \p nz 3D matrix of \p elemsize byte elements
- pointed by \p ptr and initialize \p handle to represent it. Again, \p ldy and
- \p ldz specify the number of elements between rows and between z planes.
- Here is an example of how to use the function.
- \code{.c}
- float *block;
- starpu_data_handle_t block_handle;
- block = (float*)malloc(nx*ny*nz*sizeof(float));
- starpu_block_data_register(&block_handle, STARPU_MAIN_RAM, (uintptr_t)block, nx, nx*ny, nx, ny, nz, sizeof(float));
- \endcode
- */
- void starpu_block_data_register(starpu_data_handle_t *handle, int home_node, uintptr_t ptr, uint32_t ldy, uint32_t ldz, uint32_t nx, uint32_t ny, uint32_t nz, size_t elemsize);
- /**
- Register into the \p handle that to store data on node \p node it should use the
- buffer located at \p ptr, or device handle \p dev_handle and offset \p offset
- (for OpenCL, notably), with \p ldy elements between rows and \p ldz
- elements between z planes.
- */
- void starpu_block_ptr_register(starpu_data_handle_t handle, unsigned node, uintptr_t ptr, uintptr_t dev_handle, size_t offset, uint32_t ldy, uint32_t ldz);
- /**
- Return the number of elements on the x-axis of the block
- designated by \p handle.
- */
- uint32_t starpu_block_get_nx(starpu_data_handle_t handle);
- /**
- Return the number of elements on the y-axis of the block
- designated by \p handle.
- */
- uint32_t starpu_block_get_ny(starpu_data_handle_t handle);
- /**
- Return the number of elements on the z-axis of the block
- designated by \p handle.
- */
- uint32_t starpu_block_get_nz(starpu_data_handle_t handle);
- /**
- Return the number of elements between each row of the block
- designated by \p handle, in the format of the current memory node.
- */
- uint32_t starpu_block_get_local_ldy(starpu_data_handle_t handle);
- /**
- Return the number of elements between each z plane of the block
- designated by \p handle, in the format of the current memory node.
- */
- uint32_t starpu_block_get_local_ldz(starpu_data_handle_t handle);
- /**
- Return the local pointer associated with \p handle.
- */
- uintptr_t starpu_block_get_local_ptr(starpu_data_handle_t handle);
- /**
- Return the size of the elements of the block designated by
- \p handle.
- */
- size_t starpu_block_get_elemsize(starpu_data_handle_t handle);
- #if defined(STARPU_HAVE_STATEMENT_EXPRESSIONS) && defined(STARPU_DEBUG)
- #define STARPU_BLOCK_CHECK(interface) STARPU_ASSERT_MSG((((struct starpu_block_interface *)(interface))->id) == STARPU_BLOCK_INTERFACE_ID, "Error. The given data is not a block.")
- #define STARPU_BLOCK_GET_PTR(interface) ({ STARPU_BLOCK_CHECK(interface); (((struct starpu_block_interface *)(interface))->ptr) ; })
- #define STARPU_BLOCK_GET_DEV_HANDLE(interface) ({ STARPU_BLOCK_CHECK(interface); (((struct starpu_block_interface *)(interface))->dev_handle) ; })
- #define STARPU_BLOCK_GET_OFFSET(interface) ({ STARPU_BLOCK_CHECK(interface); (((struct starpu_block_interface *)(interface))->offset) ; })
- #define STARPU_BLOCK_GET_NX(interface) ({ STARPU_BLOCK_CHECK(interface); (((struct starpu_block_interface *)(interface))->nx) ; })
- #define STARPU_BLOCK_GET_NY(interface) ({ STARPU_BLOCK_CHECK(interface); (((struct starpu_block_interface *)(interface))->ny) ; })
- #define STARPU_BLOCK_GET_NZ(interface) ({ STARPU_BLOCK_CHECK(interface); (((struct starpu_block_interface *)(interface))->nz) ; })
- #define STARPU_BLOCK_GET_LDY(interface) ({ STARPU_BLOCK_CHECK(interface); (((struct starpu_block_interface *)(interface))->ldy) ; })
- #define STARPU_BLOCK_GET_LDZ(interface) ({ STARPU_BLOCK_CHECK(interface); (((struct starpu_block_interface *)(interface))->ldz) ; })
- #define STARPU_BLOCK_GET_ELEMSIZE(interface) ({ STARPU_BLOCK_CHECK(interface); (((struct starpu_block_interface *)(interface))->elemsize) ; })
- #else
- /**
- Return a pointer to the block designated by \p interface.
- */
- #define STARPU_BLOCK_GET_PTR(interface) (((struct starpu_block_interface *)(interface))->ptr)
- /**
- Return a device handle for the block designated by \p interface,
- to be used on OpenCL. The offset returned by
- ::STARPU_BLOCK_GET_OFFSET has to be used in
- addition to this.
- */
- #define STARPU_BLOCK_GET_DEV_HANDLE(interface) (((struct starpu_block_interface *)(interface))->dev_handle)
- /**
- Return the offset in the block designated by \p interface, to be
- used with the device handle.
- */
- #define STARPU_BLOCK_GET_OFFSET(interface) (((struct starpu_block_interface *)(interface))->offset)
- /**
- Return the number of elements on the x-axis of the block
- designated by \p interface.
- */
- #define STARPU_BLOCK_GET_NX(interface) (((struct starpu_block_interface *)(interface))->nx)
- /**
- Return the number of elements on the y-axis of the block
- designated by \p interface.
- */
- #define STARPU_BLOCK_GET_NY(interface) (((struct starpu_block_interface *)(interface))->ny)
- /**
- Return the number of elements on the z-axis of the block
- designated by \p interface.
- */
- #define STARPU_BLOCK_GET_NZ(interface) (((struct starpu_block_interface *)(interface))->nz)
- /**
- Return the number of elements between each row of the block
- designated by \p interface. May be equal to nx when there is no padding.
- */
- #define STARPU_BLOCK_GET_LDY(interface) (((struct starpu_block_interface *)(interface))->ldy)
- /**
- Return the number of elements between each z plane of the block
- designated by \p interface. May be equal to nx*ny when there is no
- padding.
- */
- #define STARPU_BLOCK_GET_LDZ(interface) (((struct starpu_block_interface *)(interface))->ldz)
- /**
- Return the size of the elements of the block designated by
- \p interface.
- */
- #define STARPU_BLOCK_GET_ELEMSIZE(interface) (((struct starpu_block_interface *)(interface))->elemsize)
- #endif
- /** @} */
- /**
- @name Tensor Data Interface
- @{
- */
- extern struct starpu_data_interface_ops starpu_interface_tensor_ops;
- /* TODO: rename to 4dtensor? */
- /* TODO: add allocsize support */
- /**
- Tensor interface for 4D dense tensors
- */
- struct starpu_tensor_interface
- {
- enum starpu_data_interface_id id; /**< identifier of the interface */
- uintptr_t ptr; /**< local pointer of the tensor */
- uintptr_t dev_handle; /**< device handle of the tensor. */
- size_t offset; /**< offset in the tensor. */
- uint32_t nx; /**< number of elements on the x-axis of the tensor. */
- uint32_t ny; /**< number of elements on the y-axis of the tensor. */
- uint32_t nz; /**< number of elements on the z-axis of the tensor. */
- uint32_t nt; /**< number of elements on the t-axis of the tensor. */
- uint32_t ldy; /**< number of elements between two lines */
- uint32_t ldz; /**< number of elements between two planes */
- uint32_t ldt; /**< number of elements between two cubes */
- size_t elemsize; /**< size of the elements of the tensor. */
- };
- /**
- Register the \p nx x \p ny x \p nz x \p nt 4D tensor of \p elemsize byte elements
- pointed by \p ptr and initialize \p handle to represent it. Again, \p ldy,
- \p ldz, and \p ldt specify the number of elements between rows, between z planes and between t cubes.
- Here is an example of how to use the function.
- \code{.c}
- float *tensor;
- starpu_data_handle_t tensor_handle;
- tensor = (float*)malloc(nx*ny*nz*nt*sizeof(float));
- starpu_tensor_data_register(&tensor_handle, STARPU_MAIN_RAM, (uintptr_t)tensor, nx, nx*ny, nx*ny*nz, nx, ny, nz, nt, sizeof(float));
- \endcode
- */
- void starpu_tensor_data_register(starpu_data_handle_t *handle, int home_node, uintptr_t ptr, uint32_t ldy, uint32_t ldz, uint32_t ldt, uint32_t nx, uint32_t ny, uint32_t nz, uint32_t nt, size_t elemsize);
- /**
- Register into the \p handle that to store data on node \p node it should use the
- buffer located at \p ptr, or device handle \p dev_handle and offset \p offset
- (for OpenCL, notably), with \p ldy elements between rows, and \p ldz
- elements between z planes, and \p ldt elements between t cubes.
- */
- void starpu_tensor_ptr_register(starpu_data_handle_t handle, unsigned node, uintptr_t ptr, uintptr_t dev_handle, size_t offset, uint32_t ldy, uint32_t ldz, uint32_t ldt);
- /**
- Return the number of elements on the x-axis of the tensor
- designated by \p handle.
- */
- uint32_t starpu_tensor_get_nx(starpu_data_handle_t handle);
- /**
- Return the number of elements on the y-axis of the tensor
- designated by \p handle.
- */
- uint32_t starpu_tensor_get_ny(starpu_data_handle_t handle);
- /**
- Return the number of elements on the z-axis of the tensor
- designated by \p handle.
- */
- uint32_t starpu_tensor_get_nz(starpu_data_handle_t handle);
- /**
- Return the number of elements on the t-axis of the tensor
- designated by \p handle.
- */
- uint32_t starpu_tensor_get_nt(starpu_data_handle_t handle);
- /**
- Return the number of elements between each row of the tensor
- designated by \p handle, in the format of the current memory node.
- */
- uint32_t starpu_tensor_get_local_ldy(starpu_data_handle_t handle);
- /**
- Return the number of elements between each z plane of the tensor
- designated by \p handle, in the format of the current memory node.
- */
- uint32_t starpu_tensor_get_local_ldz(starpu_data_handle_t handle);
- /**
- Return the number of elements between each t cube of the tensor
- designated by \p handle, in the format of the current memory node.
- */
- uint32_t starpu_tensor_get_local_ldt(starpu_data_handle_t handle);
- /**
- Return the local pointer associated with \p handle.
- */
- uintptr_t starpu_tensor_get_local_ptr(starpu_data_handle_t handle);
- /**
- Return the size of the elements of the tensor designated by
- \p handle.
- */
- size_t starpu_tensor_get_elemsize(starpu_data_handle_t handle);
- #if defined(STARPU_HAVE_STATEMENT_EXPRESSIONS) && defined(STARPU_DEBUG)
- #define STARPU_TENSOR_CHECK(interface) STARPU_ASSERT_MSG((((struct starpu_tensor_interface *)(interface))->id) == STARPU_TENSOR_INTERFACE_ID, "Error. The given data is not a tensor.")
- #define STARPU_TENSOR_GET_PTR(interface) ({ STARPU_TENSOR_CHECK(interface); (((struct starpu_tensor_interface *)(interface))->ptr) ; })
- #define STARPU_TENSOR_GET_DEV_HANDLE(interface) ({ STARPU_TENSOR_CHECK(interface); (((struct starpu_tensor_interface *)(interface))->dev_handle) ; })
- #define STARPU_TENSOR_GET_OFFSET(interface) ({ STARPU_TENSOR_CHECK(interface); (((struct starpu_tensor_interface *)(interface))->offset) ; })
- #define STARPU_TENSOR_GET_NX(interface) ({ STARPU_TENSOR_CHECK(interface); (((struct starpu_tensor_interface *)(interface))->nx) ; })
- #define STARPU_TENSOR_GET_NY(interface) ({ STARPU_TENSOR_CHECK(interface); (((struct starpu_tensor_interface *)(interface))->ny) ; })
- #define STARPU_TENSOR_GET_NZ(interface) ({ STARPU_TENSOR_CHECK(interface); (((struct starpu_tensor_interface *)(interface))->nz) ; })
- #define STARPU_TENSOR_GET_NT(interface) ({ STARPU_TENSOR_CHECK(interface); (((struct starpu_tensor_interface *)(interface))->nt) ; })
- #define STARPU_TENSOR_GET_LDY(interface) ({ STARPU_TENSOR_CHECK(interface); (((struct starpu_tensor_interface *)(interface))->ldy) ; })
- #define STARPU_TENSOR_GET_LDZ(interface) ({ STARPU_TENSOR_CHECK(interface); (((struct starpu_tensor_interface *)(interface))->ldz) ; })
- #define STARPU_TENSOR_GET_LDT(interface) ({ STARPU_TENSOR_CHECK(interface); (((struct starpu_tensor_interface *)(interface))->ldt) ; })
- #define STARPU_TENSOR_GET_ELEMSIZE(interface) ({ STARPU_TENSOR_CHECK(interface); (((struct starpu_tensor_interface *)(interface))->elemsize) ; })
- #else
- /**
- Return a pointer to the tensor designated by \p interface.
- */
- #define STARPU_TENSOR_GET_PTR(interface) (((struct starpu_tensor_interface *)(interface))->ptr)
- /**
- Return a device handle for the tensor designated by \p interface,
- to be used on OpenCL. The offset returned by
- ::STARPU_TENSOR_GET_OFFSET has to be used in
- addition to this.
- */
- #define STARPU_TENSOR_GET_DEV_HANDLE(interface) (((struct starpu_tensor_interface *)(interface))->dev_handle)
- /**
- Return the offset in the tensor designated by \p interface, to be
- used with the device handle.
- */
- #define STARPU_TENSOR_GET_OFFSET(interface) (((struct starpu_tensor_interface *)(interface))->offset)
- /**
- Return the number of elements on the x-axis of the tensor
- designated by \p interface.
- */
- #define STARPU_TENSOR_GET_NX(interface) (((struct starpu_tensor_interface *)(interface))->nx)
- /**
- Return the number of elements on the y-axis of the tensor
- designated by \p interface.
- */
- #define STARPU_TENSOR_GET_NY(interface) (((struct starpu_tensor_interface *)(interface))->ny)
- /**
- Return the number of elements on the z-axis of the tensor
- designated by \p interface.
- */
- #define STARPU_TENSOR_GET_NZ(interface) (((struct starpu_tensor_interface *)(interface))->nz)
- /**
- Return the number of elements on the t-axis of the tensor
- designated by \p interface.
- */
- #define STARPU_TENSOR_GET_NT(interface) (((struct starpu_tensor_interface *)(interface))->nt)
- /**
- Return the number of elements between each row of the tensor
- designated by \p interface. May be equal to nx when there is no padding.
- */
- #define STARPU_TENSOR_GET_LDY(interface) (((struct starpu_tensor_interface *)(interface))->ldy)
- /**
- Return the number of elements between each z plane of the tensor
- designated by \p interface. May be equal to nx*ny when there is no
- padding.
- */
- #define STARPU_TENSOR_GET_LDZ(interface) (((struct starpu_tensor_interface *)(interface))->ldz)
- /**
- Return the number of elements between each t cube of the tensor
- designated by \p interface. May be equal to nx*ny*nz when there is no
- padding.
- */
- #define STARPU_TENSOR_GET_LDT(interface) (((struct starpu_tensor_interface *)(interface))->ldt)
- /**
- Return the size of the elements of the tensor designated by
- \p interface.
- */
- #define STARPU_TENSOR_GET_ELEMSIZE(interface) (((struct starpu_tensor_interface *)(interface))->elemsize)
- #endif
- /** @} */
- /**
- @name Vector Data Interface
- @{
- */
- extern struct starpu_data_interface_ops starpu_interface_vector_ops;
- /**
- Vector interface: describes a one-dimensional array of \c nx elements of
- \c elemsize bytes each.
- */
- struct starpu_vector_interface
- {
- enum starpu_data_interface_id id; /**< Identifier of the interface */
- uintptr_t ptr; /**< local pointer of the vector */
- uintptr_t dev_handle; /**< device handle of the vector. */
- size_t offset; /**< offset in the vector */
- uint32_t nx; /**< number of elements on the x-axis of the vector */
- size_t elemsize; /**< size of the elements of the vector */
- uint32_t slice_base; /**< vector slice base, used by the StarPU OpenMP runtime support */
- size_t allocsize; /**< size actually currently allocated */
- };
- /**
- Register the \p nx \p elemsize-byte elements pointed to by \p ptr and initialize \p handle to represent it.
- Here is an example of how to use the function.
- \code{.c}
- float vector[NX];
- starpu_data_handle_t vector_handle;
- starpu_vector_data_register(&vector_handle, STARPU_MAIN_RAM, (uintptr_t)vector, NX, sizeof(vector[0]));
- \endcode
- */
- void starpu_vector_data_register(starpu_data_handle_t *handle, int home_node, uintptr_t ptr, uint32_t nx, size_t elemsize);
- /**
- Similar to starpu_vector_data_register(), but additionally specifies which
- allocation size should be used instead of the initial nx*elemsize.
- */
- void starpu_vector_data_register_allocsize(starpu_data_handle_t *handle, int home_node, uintptr_t ptr, uint32_t nx, size_t elemsize, size_t allocsize);
- /**
- Register into the \p handle that to store data on node \p node it should use the
- buffer located at \p ptr, or device handle \p dev_handle and offset \p offset
- (for OpenCL, notably)
- */
- void starpu_vector_ptr_register(starpu_data_handle_t handle, unsigned node, uintptr_t ptr, uintptr_t dev_handle, size_t offset);
- /**
- Return the number of elements registered into the array designated by \p handle.
- */
- uint32_t starpu_vector_get_nx(starpu_data_handle_t handle);
- /**
- Return the size of each element of the array designated by \p handle.
- */
- size_t starpu_vector_get_elemsize(starpu_data_handle_t handle);
- /**
- Return the allocated size of the array designated by \p handle.
- */
- size_t starpu_vector_get_allocsize(starpu_data_handle_t handle);
- /**
- Return the local pointer associated with \p handle.
- */
- uintptr_t starpu_vector_get_local_ptr(starpu_data_handle_t handle);
- #if defined(STARPU_HAVE_STATEMENT_EXPRESSIONS) && defined(STARPU_DEBUG)
- #define STARPU_VECTOR_CHECK(interface) STARPU_ASSERT_MSG((((struct starpu_vector_interface *)(interface))->id) == STARPU_VECTOR_INTERFACE_ID, "Error. The given data is not a vector.")
- #define STARPU_VECTOR_GET_PTR(interface) ({ STARPU_VECTOR_CHECK(interface); (((struct starpu_vector_interface *)(interface))->ptr); })
- #define STARPU_VECTOR_GET_DEV_HANDLE(interface) ({ STARPU_VECTOR_CHECK(interface); (((struct starpu_vector_interface *)(interface))->dev_handle); })
- #define STARPU_VECTOR_GET_OFFSET(interface) ({ STARPU_VECTOR_CHECK(interface); (((struct starpu_vector_interface *)(interface))->offset); })
- #define STARPU_VECTOR_GET_NX(interface) ({ STARPU_VECTOR_CHECK(interface); (((struct starpu_vector_interface *)(interface))->nx); })
- #define STARPU_VECTOR_GET_ELEMSIZE(interface) ({ STARPU_VECTOR_CHECK(interface); (((struct starpu_vector_interface *)(interface))->elemsize); })
- #define STARPU_VECTOR_GET_ALLOCSIZE(interface) ({ STARPU_VECTOR_CHECK(interface); (((struct starpu_vector_interface *)(interface))->allocsize); })
- #define STARPU_VECTOR_GET_SLICE_BASE(interface) ({ STARPU_VECTOR_CHECK(interface); (((struct starpu_vector_interface *)(interface))->slice_base); })
- #else
- /**
- Return a pointer to the array designated by \p interface, valid on
- CPUs and CUDA only. For OpenCL, the device handle and offset need to
- be used instead.
- */
- #define STARPU_VECTOR_GET_PTR(interface) (((struct starpu_vector_interface *)(interface))->ptr)
- /**
- Return a device handle for the array designated by \p interface,
- to be used with OpenCL. The offset returned by ::STARPU_VECTOR_GET_OFFSET has to be used in
- addition to this.
- */
- #define STARPU_VECTOR_GET_DEV_HANDLE(interface) (((struct starpu_vector_interface *)(interface))->dev_handle)
- /**
- Return the offset in the array designated by \p interface, to be
- used with the device handle.
- */
- #define STARPU_VECTOR_GET_OFFSET(interface) (((struct starpu_vector_interface *)(interface))->offset)
- /**
- Return the number of elements registered into the array
- designated by \p interface.
- */
- #define STARPU_VECTOR_GET_NX(interface) (((struct starpu_vector_interface *)(interface))->nx)
- /**
- Return the size of each element of the array designated by
- \p interface.
- */
- #define STARPU_VECTOR_GET_ELEMSIZE(interface) (((struct starpu_vector_interface *)(interface))->elemsize)
- /**
- Return the allocated size of the array designated by
- \p interface.
- */
- #define STARPU_VECTOR_GET_ALLOCSIZE(interface) (((struct starpu_vector_interface *)(interface))->allocsize)
- /**
- Return the OpenMP slice base annotation of each element of the array designated by
- \p interface.
- */
- #define STARPU_VECTOR_GET_SLICE_BASE(interface) (((struct starpu_vector_interface *)(interface))->slice_base)
- #endif
- #ifndef STARPU_VECTOR_CHECK
- /* STARPU_VECTOR_CHECK is only provided by the debug branch (statement
-    expressions + STARPU_DEBUG). Fall back to a no-op so that
-    STARPU_VECTOR_SET_NX also builds when that branch is not selected. */
- #define STARPU_VECTOR_CHECK(interface) ((void)0)
- #endif
- /**
- Set the number of elements registered into the array designated by \p
- interface to \p newnx. When the debug checks are enabled, the interface
- is first verified to be a vector.
- */
- #define STARPU_VECTOR_SET_NX(interface, newnx) do { \
- STARPU_VECTOR_CHECK(interface); \
- (((struct starpu_vector_interface *)(interface))->nx) = (newnx); \
- } while(0)
- /** @} */
- /**
- @name Variable Data Interface
- @{
- */
- extern struct starpu_data_interface_ops starpu_interface_variable_ops;
- /**
- Variable interface for a single data (not a vector, a matrix, a list,
- ...)
- */
- struct starpu_variable_interface
- {
- enum starpu_data_interface_id id; /**< Identifier of the interface */
- uintptr_t ptr; /**< local pointer of the variable */
- uintptr_t dev_handle; /**< device handle of the variable. */
- size_t offset; /**< offset in the variable */
- size_t elemsize; /**< size of the variable */
- };
- /**
- Register the \p size byte element pointed to by \p ptr, which is
- typically a scalar, and initialize \p handle to represent this data item.
- Here is an example of how to use the function.
- \code{.c}
- float var = 42.0;
- starpu_data_handle_t var_handle;
- starpu_variable_data_register(&var_handle, STARPU_MAIN_RAM, (uintptr_t)&var, sizeof(var));
- \endcode
- */
- void starpu_variable_data_register(starpu_data_handle_t *handle, int home_node, uintptr_t ptr, size_t size);
- /**
- Register into the \p handle that to store data on node \p node it should use the
- buffer located at \p ptr, or device handle \p dev_handle and offset \p offset
- (for OpenCL, notably)
- */
- void starpu_variable_ptr_register(starpu_data_handle_t handle, unsigned node, uintptr_t ptr, uintptr_t dev_handle, size_t offset);
- /**
- Return the size of the variable designated by \p handle.
- */
- size_t starpu_variable_get_elemsize(starpu_data_handle_t handle);
- /**
- Return a pointer to the variable designated by \p handle.
- */
- uintptr_t starpu_variable_get_local_ptr(starpu_data_handle_t handle);
- #if defined(STARPU_HAVE_STATEMENT_EXPRESSIONS) && defined(STARPU_DEBUG)
- #define STARPU_VARIABLE_CHECK(interface) STARPU_ASSERT_MSG((((struct starpu_variable_interface *)(interface))->id) == STARPU_VARIABLE_INTERFACE_ID, "Error. The given data is not a variable.")
- #define STARPU_VARIABLE_GET_PTR(interface) ({ STARPU_VARIABLE_CHECK(interface); (((struct starpu_variable_interface *)(interface))->ptr) ; })
- #define STARPU_VARIABLE_GET_OFFSET(interface) ({ STARPU_VARIABLE_CHECK(interface); (((struct starpu_variable_interface *)(interface))->offset) ; })
- #define STARPU_VARIABLE_GET_ELEMSIZE(interface) ({ STARPU_VARIABLE_CHECK(interface); (((struct starpu_variable_interface *)(interface))->elemsize) ; })
- #define STARPU_VARIABLE_GET_DEV_HANDLE(interface) ({ STARPU_VARIABLE_CHECK(interface); (((struct starpu_variable_interface *)(interface))->ptr) ; })
- #else
- /**
- Return a pointer to the variable designated by \p interface.
- */
- #define STARPU_VARIABLE_GET_PTR(interface) (((struct starpu_variable_interface *)(interface))->ptr)
- /**
- Return the offset in the variable designated by \p interface, to
- be used with the device handle.
- */
- #define STARPU_VARIABLE_GET_OFFSET(interface) (((struct starpu_variable_interface *)(interface))->offset)
- /**
- Return the size of the variable designated by \p interface.
- */
- #define STARPU_VARIABLE_GET_ELEMSIZE(interface) (((struct starpu_variable_interface *)(interface))->elemsize)
- /* NOTE(review): this accessor reads the ptr field, whereas
-    STARPU_VECTOR_GET_DEV_HANDLE and STARPU_TENSOR_GET_DEV_HANDLE read
-    dev_handle; confirm that returning ptr here is intended. */
- /**
- Return a device handle for the variable designated by
- \p interface, to be used with OpenCL. The offset returned by
- ::STARPU_VARIABLE_GET_OFFSET has to be
- used in addition to this.
- */
- #define STARPU_VARIABLE_GET_DEV_HANDLE(interface) (((struct starpu_variable_interface *)(interface))->ptr)
- #endif
- /** @} */
- /**
- @name Void Data Interface
- @{
- */
- extern struct starpu_data_interface_ops starpu_interface_void_ops;
- /**
- Register a void interface. There is no data really associated
- to that interface, but it may be used as a synchronization mechanism.
- It also permits to express an abstract piece of data that is managed
- by the application internally: this makes it possible to forbid the
- concurrent execution of different tasks accessing the same <c>void</c>
- data in read-write mode.
- */
- void starpu_void_data_register(starpu_data_handle_t *handle);
- /** @} */
- /**
- @name CSR Data Interface
- @{
- */
- extern struct starpu_data_interface_ops starpu_interface_csr_ops;
- /**
- CSR interface for sparse matrices (compressed sparse row
- representation)
- */
- struct starpu_csr_interface
- {
- enum starpu_data_interface_id id; /**< Identifier of the interface */
- uint32_t nnz; /**< number of non-zero entries */
- uint32_t nrow; /**< number of rows */
- uintptr_t nzval; /**< non-zero values */
- uint32_t *colind; /**< position of non-zero entries on the row */
- uint32_t *rowptr; /**< index (in nzval) of the first entry of the row */
- uint32_t firstentry; /**< k for k-based indexing (0 or 1 usually). Also useful when partitioning the matrix. */
- size_t elemsize; /**< size of the elements of the matrix */
- };
- /**
- Register a CSR (Compressed Sparse Row Representation) sparse matrix.
- */
- void starpu_csr_data_register(starpu_data_handle_t *handle, int home_node, uint32_t nnz, uint32_t nrow, uintptr_t nzval, uint32_t *colind, uint32_t *rowptr, uint32_t firstentry, size_t elemsize);
- /**
- Return the number of non-zero values in the matrix designated
- by \p handle.
- */
- uint32_t starpu_csr_get_nnz(starpu_data_handle_t handle);
- /**
- Return the size of the row pointer array of the matrix
- designated by \p handle.
- */
- uint32_t starpu_csr_get_nrow(starpu_data_handle_t handle);
- /**
- Return the index at which all arrays (the column indexes, the
- row pointers...) of the matrix designated by \p handle start.
- */
- uint32_t starpu_csr_get_firstentry(starpu_data_handle_t handle);
- /**
- Return a local pointer to the non-zero values of the matrix
- designated by \p handle.
- */
- uintptr_t starpu_csr_get_local_nzval(starpu_data_handle_t handle);
- /**
- Return a local pointer to the column index of the matrix
- designated by \p handle.
- */
- uint32_t *starpu_csr_get_local_colind(starpu_data_handle_t handle);
- /**
- Return a local pointer to the row pointer array of the matrix
- designated by \p handle.
- */
- uint32_t *starpu_csr_get_local_rowptr(starpu_data_handle_t handle);
- /**
- Return the size of the elements registered into the matrix
- designated by \p handle.
- */
- size_t starpu_csr_get_elemsize(starpu_data_handle_t handle);
- /**
- Return the number of non-zero values in the matrix designated
- by \p interface.
- */
- #define STARPU_CSR_GET_NNZ(interface) (((struct starpu_csr_interface *)(interface))->nnz)
- /**
- Return the size of the row pointer array of the matrix
- designated by \p interface.
- */
- #define STARPU_CSR_GET_NROW(interface) (((struct starpu_csr_interface *)(interface))->nrow)
- /**
- Return a pointer to the non-zero values of the matrix
- designated by \p interface.
- */
- #define STARPU_CSR_GET_NZVAL(interface) (((struct starpu_csr_interface *)(interface))->nzval)
- /**
- Return a device handle for the array of non-zero values in the
- matrix designated by \p interface. The offset returned by ::STARPU_CSR_GET_OFFSET
- has to be used in addition to this.
- */
- #define STARPU_CSR_GET_NZVAL_DEV_HANDLE(interface) (((struct starpu_csr_interface *)(interface))->nzval)
- /**
- Return a pointer to the column index of the matrix designated
- by \p interface.
- */
- #define STARPU_CSR_GET_COLIND(interface) (((struct starpu_csr_interface *)(interface))->colind)
- /**
- Return a device handle for the column index of the matrix
- designated by \p interface. The offset returned by ::STARPU_CSR_GET_OFFSET has to be used in
- addition to this.
- */
- #define STARPU_CSR_GET_COLIND_DEV_HANDLE(interface) (((struct starpu_csr_interface *)(interface))->colind)
- /**
- Return a pointer to the row pointer array of the matrix
- designated by \p interface.
- */
- #define STARPU_CSR_GET_ROWPTR(interface) (((struct starpu_csr_interface *)(interface))->rowptr)
- /**
- Return a device handle for the row pointer array of the matrix
- designated by \p interface. The offset returned by ::STARPU_CSR_GET_OFFSET has to be used in
- addition to this.
- */
- #define STARPU_CSR_GET_ROWPTR_DEV_HANDLE(interface) (((struct starpu_csr_interface *)(interface))->rowptr)
- /**
- Return the offset in the arrays (colind, rowptr, nzval) of the
- matrix designated by \p interface, to be used with the device handles.
- */
- #define STARPU_CSR_GET_OFFSET 0
- /**
- Return the index at which all arrays (the column indexes, the
- row pointers...) of the \p interface start.
- */
- #define STARPU_CSR_GET_FIRSTENTRY(interface) (((struct starpu_csr_interface *)(interface))->firstentry)
- /**
- Return the size of the elements registered into the matrix
- designated by \p interface.
- */
- #define STARPU_CSR_GET_ELEMSIZE(interface) (((struct starpu_csr_interface *)(interface))->elemsize)
- /** @} */
- /**
- @name BCSR Data Interface
- @{
- */
- extern struct starpu_data_interface_ops starpu_interface_bcsr_ops;
- /**
- BCSR interface for sparse matrices (blocked compressed sparse
- row representation)
- Note: when a BCSR matrix is partitioned, nzval, colind, and rowptr point into
- the corresponding father arrays. The rowptr content is thus the same as the
- father's. Firstentry is used to offset this so it becomes valid for the child
- arrays.
- */
- struct starpu_bcsr_interface
- {
- enum starpu_data_interface_id id; /**< Identifier of the interface */
- uint32_t nnz; /**< number of non-zero BLOCKS */
- uint32_t nrow; /**< number of rows (in terms of BLOCKS) */
- uintptr_t nzval; /**< non-zero values: nnz blocks of r*c elements */
- uint32_t *colind; /**< array of nnz elements, colind[i] is the block-column index for block i in nzval */
- uint32_t *rowptr; /**< array of nrow+1
- * elements, rowptr[i] is
- * the block-index (in
- * nzval) of the first block
- * of row i. By convention,
- * rowptr[nrow] is the
- * number of blocks, this
- * allows an easier access
- * of the matrix's elements
- * for the kernels. */
- uint32_t firstentry; /**< k for k-based indexing (0 or 1 usually). Also useful when partitioning the matrix. */
- uint32_t r; /**< height of the blocks */
- uint32_t c; /**< width of the blocks */
- size_t elemsize; /**< size of the elements of the matrix */
- };
- /**
- This variant of starpu_data_register() uses the BCSR (Blocked
- Compressed Sparse Row Representation) sparse matrix interface.
- Register the sparse matrix made of \p nnz non-zero blocks of elements of
- size \p elemsize stored in \p nzval and initializes \p handle to represent it.
- Blocks have size \p r * \p c. \p nrow is the number of rows (in terms of
- blocks), \p colind is an array of nnz elements, colind[i] is the block-column index for block i in \p nzval,
- \p rowptr is an array of nrow+1 elements, rowptr[i] is the block-index (in \p nzval) of the first block of row i. By convention, rowptr[nrow] is the number of blocks, this allows an easier access of the matrix's elements for the kernels.
- \p firstentry is the index of the first entry of the given arrays
- (usually 0 or 1).
- Here is an example with the following matrix:
- \code | 0 1 0 0 | \endcode
- \code | 2 3 0 0 | \endcode
- \code | 4 5 8 9 | \endcode
- \code | 6 7 10 11 | \endcode
- \code nzval = [0, 1, 2, 3] ++ [4, 5, 6, 7] ++ [8, 9, 10, 11] \endcode
- \code colind = [0, 0, 1] \endcode
- \code rowptr = [0, 1, 3] \endcode
- \code r = c = 2 \endcode
- which translates into the following code
- \code{.c}
- int R = 2; // Size of the blocks
- int C = 2;
- int NROWS = 2;
- int NNZ_BLOCKS = 3; // out of 4
- int NZVAL_SIZE = (R*C*NNZ_BLOCKS);
- int nzval[NZVAL_SIZE] =
- {
- 0, 1, 2, 3, // First block
- 4, 5, 6, 7, // Second block
- 8, 9, 10, 11 // Third block
- };
- uint32_t colind[NNZ_BLOCKS] =
- {
- 0, // block-column index for first block in nzval
- 0, // block-column index for second block in nzval
- 1 // block-column index for third block in nzval
- };
- uint32_t rowptr[NROWS+1] =
- {
- 0, // block-index in nzval of the first block of the first row.
- 1, // block-index in nzval of the first block of the second row.
- NNZ_BLOCKS // number of blocks, to allow an easier element's access for the kernels
- };
- starpu_data_handle_t bcsr_handle;
- starpu_bcsr_data_register(&bcsr_handle,
- STARPU_MAIN_RAM,
- NNZ_BLOCKS,
- NROWS,
- (uintptr_t) nzval,
- colind,
- rowptr,
- 0, // firstentry
- R,
- C,
- sizeof(nzval[0]));
- \endcode
- */
- void starpu_bcsr_data_register(starpu_data_handle_t *handle, int home_node, uint32_t nnz, uint32_t nrow, uintptr_t nzval, uint32_t *colind, uint32_t *rowptr, uint32_t firstentry, uint32_t r, uint32_t c, size_t elemsize);
- /**
- Return the number of non-zero elements in the matrix designated
- by \p handle.
- */
- uint32_t starpu_bcsr_get_nnz(starpu_data_handle_t handle);
- /**
- Return the number of rows (in terms of blocks of size r*c) in
- the matrix designated by \p handle.
- */
- uint32_t starpu_bcsr_get_nrow(starpu_data_handle_t handle);
- /**
- Return the index at which all arrays (the column indexes, the
- row pointers...) of the matrix designated by \p handle start.
- */
- uint32_t starpu_bcsr_get_firstentry(starpu_data_handle_t handle);
- /**
- Return a pointer to the non-zero values of the matrix
- designated by \p handle.
- */
- uintptr_t starpu_bcsr_get_local_nzval(starpu_data_handle_t handle);
- /**
- Return a pointer to the column index, which holds the positions
- of the non-zero entries in the matrix designated by \p handle.
- */
- uint32_t *starpu_bcsr_get_local_colind(starpu_data_handle_t handle);
- /**
- Return the row pointer array of the matrix designated by
- \p handle.
- */
- uint32_t *starpu_bcsr_get_local_rowptr(starpu_data_handle_t handle);
- /**
- Return the number of rows in a block.
- */
- uint32_t starpu_bcsr_get_r(starpu_data_handle_t handle);
- /**
- Return the number of columns in a block.
- */
- uint32_t starpu_bcsr_get_c(starpu_data_handle_t handle);
- /**
- Return the size of the elements in the matrix designated by
- \p handle.
- */
- size_t starpu_bcsr_get_elemsize(starpu_data_handle_t handle);
- /**
- Return the number of non-zero values in the matrix designated
- by \p interface.
- */
- #define STARPU_BCSR_GET_NNZ(interface) (((struct starpu_bcsr_interface *)(interface))->nnz)
- /**
- Return a pointer to the non-zero values of the matrix
- designated by \p interface.
- */
- #define STARPU_BCSR_GET_NZVAL(interface) (((struct starpu_bcsr_interface *)(interface))->nzval)
- /**
- Return a device handle for the array of non-zero values in the
- matrix designated by \p interface. The offset returned by ::STARPU_BCSR_GET_OFFSET has to be
- used in addition to this.
- */
- #define STARPU_BCSR_GET_NZVAL_DEV_HANDLE(interface) (((struct starpu_bcsr_interface *)(interface))->nzval)
- /**
- Return a pointer to the column index of the matrix designated
- by \p interface.
- */
- #define STARPU_BCSR_GET_COLIND(interface) (((struct starpu_bcsr_interface *)(interface))->colind)
- /**
- Return a device handle for the column index of the matrix
- designated by \p interface. The offset returned by ::STARPU_BCSR_GET_OFFSET has to be used in
- addition to this.
- */
- #define STARPU_BCSR_GET_COLIND_DEV_HANDLE(interface) (((struct starpu_bcsr_interface *)(interface))->colind)
- /**
- Return a pointer to the row pointer array of the matrix
- designated by \p interface.
- */
- #define STARPU_BCSR_GET_ROWPTR(interface) (((struct starpu_bcsr_interface *)(interface))->rowptr)
- /**
- Return a device handle for the row pointer array of the matrix
- designated by \p interface. The offset returned by ::STARPU_BCSR_GET_OFFSET has to be used in
- addition to this.
- */
- #define STARPU_BCSR_GET_ROWPTR_DEV_HANDLE(interface) (((struct starpu_bcsr_interface *)(interface))->rowptr)
- /**
- Return the offset in the arrays (colind, rowptr, nzval) of the
- matrix designated by \p interface, to be used with the device handles.
- */
- #define STARPU_BCSR_GET_OFFSET 0
- /** @} */
- /**
- @name Multiformat Data Interface
- @{
- */
- /**
- Multiformat operations
- */
- struct starpu_multiformat_data_interface_ops
- {
- size_t cpu_elemsize; /**< size of each element on CPUs */
- size_t opencl_elemsize; /**< size of each element on OpenCL devices */
- struct starpu_codelet *cpu_to_opencl_cl; /**< pointer to a codelet which converts from CPU to OpenCL */
- struct starpu_codelet *opencl_to_cpu_cl; /**< pointer to a codelet which converts from OpenCL to CPU */
- size_t cuda_elemsize; /**< size of each element on CUDA devices */
- struct starpu_codelet *cpu_to_cuda_cl; /**< pointer to a codelet which converts from CPU to CUDA */
- struct starpu_codelet *cuda_to_cpu_cl; /**< pointer to a codelet which converts from CUDA to CPU */
- size_t mic_elemsize; /**< size of each element on MIC devices */
- struct starpu_codelet *cpu_to_mic_cl; /**< pointer to a codelet which converts from CPU to MIC */
- struct starpu_codelet *mic_to_cpu_cl; /**< pointer to a codelet which converts from MIC to CPU */
- };
- /**
- Multiformat interface: keeps one data pointer per kind of processing
- unit, together with the number of elements and the format operations.
- */
- struct starpu_multiformat_interface
- {
- enum starpu_data_interface_id id; /**< Identifier of the interface */
- void *cpu_ptr; /**< local pointer to the data with CPU format */
- void *cuda_ptr; /**< local pointer to the data with CUDA format */
- void *opencl_ptr; /**< local pointer to the data with OpenCL format */
- void *mic_ptr; /**< local pointer to the data with MIC format */
- uint32_t nx; /**< number of elements in the data */
- struct starpu_multiformat_data_interface_ops *ops; /**< multiformat operations (element sizes and conversion codelets) */
- };
- /**
- Register a piece of data that can be represented in different
- ways, depending upon the processing unit that manipulates it. It
- allows the programmer, for instance, to use an array of structures
- when working on a CPU, and a structure of arrays when working on a
- GPU. \p nobjects is the number of elements in the data. \p format_ops
- describes the format.
- */
- void starpu_multiformat_data_register(starpu_data_handle_t *handle, int home_node, void *ptr, uint32_t nobjects, struct starpu_multiformat_data_interface_ops *format_ops);
- /**
- Return the local pointer to the data with CPU format.
- */
- #define STARPU_MULTIFORMAT_GET_CPU_PTR(interface) (((struct starpu_multiformat_interface *)(interface))->cpu_ptr)
- /**
- Return the local pointer to the data with CUDA format.
- */
- #define STARPU_MULTIFORMAT_GET_CUDA_PTR(interface) (((struct starpu_multiformat_interface *)(interface))->cuda_ptr)
- /**
- Return the local pointer to the data with OpenCL format.
- */
- #define STARPU_MULTIFORMAT_GET_OPENCL_PTR(interface) (((struct starpu_multiformat_interface *)(interface))->opencl_ptr)
- /**
- Return the local pointer to the data with MIC format.
- */
- #define STARPU_MULTIFORMAT_GET_MIC_PTR(interface) (((struct starpu_multiformat_interface *)(interface))->mic_ptr)
- /**
- Return the number of elements in the data.
- */
- #define STARPU_MULTIFORMAT_GET_NX(interface) (((struct starpu_multiformat_interface *)(interface))->nx)
- /** @} */
- /** @} */
- #ifdef __cplusplus
- }
- #endif
- #endif /* __STARPU_DATA_INTERFACES_H__ */
|