|
@@ -93,9 +93,9 @@ static struct starpu_perfmodel accumulate_variable_model =
|
|
struct starpu_codelet accumulate_variable_cl =
|
|
struct starpu_codelet accumulate_variable_cl =
|
|
{
|
|
{
|
|
.can_execute = can_execute,
|
|
.can_execute = can_execute,
|
|
- .cpu_funcs = {accumulate_variable_cpu, NULL},
|
|
|
|
|
|
+ .cpu_funcs = {accumulate_variable_cpu},
|
|
#ifdef STARPU_USE_CUDA
|
|
#ifdef STARPU_USE_CUDA
|
|
- .cuda_funcs = {accumulate_variable_cuda, NULL},
|
|
|
|
|
|
+ .cuda_funcs = {accumulate_variable_cuda},
|
|
.cuda_flags = {STARPU_CUDA_ASYNC},
|
|
.cuda_flags = {STARPU_CUDA_ASYNC},
|
|
#endif
|
|
#endif
|
|
.modes = {STARPU_RW, STARPU_R},
|
|
.modes = {STARPU_RW, STARPU_R},
|
|
@@ -132,9 +132,9 @@ static struct starpu_perfmodel accumulate_vector_model =
|
|
struct starpu_codelet accumulate_vector_cl =
|
|
struct starpu_codelet accumulate_vector_cl =
|
|
{
|
|
{
|
|
.can_execute = can_execute,
|
|
.can_execute = can_execute,
|
|
- .cpu_funcs = {accumulate_vector_cpu, NULL},
|
|
|
|
|
|
+ .cpu_funcs = {accumulate_vector_cpu},
|
|
#ifdef STARPU_USE_CUDA
|
|
#ifdef STARPU_USE_CUDA
|
|
- .cuda_funcs = {accumulate_vector_cuda, NULL},
|
|
|
|
|
|
+ .cuda_funcs = {accumulate_vector_cuda},
|
|
.cuda_flags = {STARPU_CUDA_ASYNC},
|
|
.cuda_flags = {STARPU_CUDA_ASYNC},
|
|
#endif
|
|
#endif
|
|
.modes = {STARPU_RW, STARPU_R},
|
|
.modes = {STARPU_RW, STARPU_R},
|
|
@@ -172,9 +172,9 @@ static struct starpu_perfmodel bzero_variable_model =
|
|
struct starpu_codelet bzero_variable_cl =
|
|
struct starpu_codelet bzero_variable_cl =
|
|
{
|
|
{
|
|
.can_execute = can_execute,
|
|
.can_execute = can_execute,
|
|
- .cpu_funcs = {bzero_variable_cpu, NULL},
|
|
|
|
|
|
+ .cpu_funcs = {bzero_variable_cpu},
|
|
#ifdef STARPU_USE_CUDA
|
|
#ifdef STARPU_USE_CUDA
|
|
- .cuda_funcs = {bzero_variable_cuda, NULL},
|
|
|
|
|
|
+ .cuda_funcs = {bzero_variable_cuda},
|
|
.cuda_flags = {STARPU_CUDA_ASYNC},
|
|
.cuda_flags = {STARPU_CUDA_ASYNC},
|
|
#endif
|
|
#endif
|
|
.modes = {STARPU_W},
|
|
.modes = {STARPU_W},
|
|
@@ -209,9 +209,9 @@ static struct starpu_perfmodel bzero_vector_model =
|
|
struct starpu_codelet bzero_vector_cl =
|
|
struct starpu_codelet bzero_vector_cl =
|
|
{
|
|
{
|
|
.can_execute = can_execute,
|
|
.can_execute = can_execute,
|
|
- .cpu_funcs = {bzero_vector_cpu, NULL},
|
|
|
|
|
|
+ .cpu_funcs = {bzero_vector_cpu},
|
|
#ifdef STARPU_USE_CUDA
|
|
#ifdef STARPU_USE_CUDA
|
|
- .cuda_funcs = {bzero_vector_cuda, NULL},
|
|
|
|
|
|
+ .cuda_funcs = {bzero_vector_cuda},
|
|
.cuda_flags = {STARPU_CUDA_ASYNC},
|
|
.cuda_flags = {STARPU_CUDA_ASYNC},
|
|
#endif
|
|
#endif
|
|
.modes = {STARPU_W},
|
|
.modes = {STARPU_W},
|
|
@@ -266,9 +266,9 @@ static struct starpu_perfmodel dot_kernel_model =
|
|
static struct starpu_codelet dot_kernel_cl =
|
|
static struct starpu_codelet dot_kernel_cl =
|
|
{
|
|
{
|
|
.can_execute = can_execute,
|
|
.can_execute = can_execute,
|
|
- .cpu_funcs = {dot_kernel_cpu, NULL},
|
|
|
|
|
|
+ .cpu_funcs = {dot_kernel_cpu},
|
|
#ifdef STARPU_USE_CUDA
|
|
#ifdef STARPU_USE_CUDA
|
|
- .cuda_funcs = {dot_kernel_cuda, NULL},
|
|
|
|
|
|
+ .cuda_funcs = {dot_kernel_cuda},
|
|
#endif
|
|
#endif
|
|
.nbuffers = 3,
|
|
.nbuffers = 3,
|
|
.model = &dot_kernel_model
|
|
.model = &dot_kernel_model
|
|
@@ -345,9 +345,9 @@ static struct starpu_perfmodel scal_kernel_model =
|
|
static struct starpu_codelet scal_kernel_cl =
|
|
static struct starpu_codelet scal_kernel_cl =
|
|
{
|
|
{
|
|
.can_execute = can_execute,
|
|
.can_execute = can_execute,
|
|
- .cpu_funcs = {scal_kernel_cpu, NULL},
|
|
|
|
|
|
+ .cpu_funcs = {scal_kernel_cpu},
|
|
#ifdef STARPU_USE_CUDA
|
|
#ifdef STARPU_USE_CUDA
|
|
- .cuda_funcs = {scal_kernel_cuda, NULL},
|
|
|
|
|
|
+ .cuda_funcs = {scal_kernel_cuda},
|
|
.cuda_flags = {STARPU_CUDA_ASYNC},
|
|
.cuda_flags = {STARPU_CUDA_ASYNC},
|
|
#endif
|
|
#endif
|
|
.nbuffers = 1,
|
|
.nbuffers = 1,
|
|
@@ -420,9 +420,9 @@ static struct starpu_codelet gemv_kernel_cl =
|
|
.can_execute = can_execute,
|
|
.can_execute = can_execute,
|
|
.type = STARPU_SPMD,
|
|
.type = STARPU_SPMD,
|
|
.max_parallelism = INT_MAX,
|
|
.max_parallelism = INT_MAX,
|
|
- .cpu_funcs = {gemv_kernel_cpu, NULL},
|
|
|
|
|
|
+ .cpu_funcs = {gemv_kernel_cpu},
|
|
#ifdef STARPU_USE_CUDA
|
|
#ifdef STARPU_USE_CUDA
|
|
- .cuda_funcs = {gemv_kernel_cuda, NULL},
|
|
|
|
|
|
+ .cuda_funcs = {gemv_kernel_cuda},
|
|
.cuda_flags = {STARPU_CUDA_ASYNC},
|
|
.cuda_flags = {STARPU_CUDA_ASYNC},
|
|
#endif
|
|
#endif
|
|
.nbuffers = 3,
|
|
.nbuffers = 3,
|
|
@@ -519,9 +519,9 @@ static struct starpu_perfmodel scal_axpy_kernel_model =
|
|
static struct starpu_codelet scal_axpy_kernel_cl =
|
|
static struct starpu_codelet scal_axpy_kernel_cl =
|
|
{
|
|
{
|
|
.can_execute = can_execute,
|
|
.can_execute = can_execute,
|
|
- .cpu_funcs = {scal_axpy_kernel_cpu, NULL},
|
|
|
|
|
|
+ .cpu_funcs = {scal_axpy_kernel_cpu},
|
|
#ifdef STARPU_USE_CUDA
|
|
#ifdef STARPU_USE_CUDA
|
|
- .cuda_funcs = {scal_axpy_kernel_cuda, NULL},
|
|
|
|
|
|
+ .cuda_funcs = {scal_axpy_kernel_cuda},
|
|
.cuda_flags = {STARPU_CUDA_ASYNC},
|
|
.cuda_flags = {STARPU_CUDA_ASYNC},
|
|
#endif
|
|
#endif
|
|
.nbuffers = 2,
|
|
.nbuffers = 2,
|
|
@@ -594,9 +594,9 @@ static struct starpu_perfmodel axpy_kernel_model =
|
|
static struct starpu_codelet axpy_kernel_cl =
|
|
static struct starpu_codelet axpy_kernel_cl =
|
|
{
|
|
{
|
|
.can_execute = can_execute,
|
|
.can_execute = can_execute,
|
|
- .cpu_funcs = {axpy_kernel_cpu, NULL},
|
|
|
|
|
|
+ .cpu_funcs = {axpy_kernel_cpu},
|
|
#ifdef STARPU_USE_CUDA
|
|
#ifdef STARPU_USE_CUDA
|
|
- .cuda_funcs = {axpy_kernel_cuda, NULL},
|
|
|
|
|
|
+ .cuda_funcs = {axpy_kernel_cuda},
|
|
.cuda_flags = {STARPU_CUDA_ASYNC},
|
|
.cuda_flags = {STARPU_CUDA_ASYNC},
|
|
#endif
|
|
#endif
|
|
.nbuffers = 2,
|
|
.nbuffers = 2,
|