multiformat_conversion_codelets.c 3.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128
  1. /* StarPU --- Runtime system for heterogeneous multicore architectures.
  2. *
  3. * Copyright (C) 2011 Institut National de Recherche en Informatique et Automatique
  4. *
  5. * StarPU is free software; you can redistribute it and/or modify
  6. * it under the terms of the GNU Lesser General Public License as published by
  7. * the Free Software Foundation; either version 2.1 of the License, or (at
  8. * your option) any later version.
  9. *
  10. * StarPU is distributed in the hope that it will be useful, but
  11. * WITHOUT ANY WARRANTY; without even the implied warranty of
  12. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
  13. *
  14. * See the GNU Lesser General Public License in COPYING.LGPL for more details.
  15. */
  16. #include <config.h>
  17. #include <starpu.h>
  18. #include "multiformat_types.h"
  19. #include "../../../helper.h"
  20. #ifdef STARPU_USE_CUDA
  21. void cuda_to_cpu(void *buffers[], void *arg)
  22. {
  23. STARPU_SKIP_IF_VALGRIND;
  24. FPRINTF(stderr, "Entering %s\n", __starpu_func__);
  25. struct struct_of_arrays *src = STARPU_MULTIFORMAT_GET_CUDA_PTR(buffers[0]);
  26. struct point *dst = STARPU_MULTIFORMAT_GET_CPU_PTR(buffers[0]);
  27. int n = STARPU_MULTIFORMAT_GET_NX(buffers[0]);
  28. int i;
  29. for (i = 0; i < n; i++)
  30. {
  31. dst[i].x = src->x[i];
  32. dst[i].y = src->y[i];
  33. }
  34. }
  35. extern void cpu_to_cuda_cuda_func(void *buffers[], void *args); struct starpu_codelet cpu_to_cuda_cl =
  36. {
  37. .cuda_funcs = {cpu_to_cuda_cuda_func, NULL},
  38. .nbuffers = 1
  39. };
  40. struct starpu_codelet cuda_to_cpu_cl =
  41. {
  42. .cpu_funcs = {cuda_to_cpu, NULL},
  43. .nbuffers = 1
  44. };
  45. #endif
  46. #ifdef STARPU_USE_OPENCL
  47. void opencl_to_cpu(void *buffers[], void *arg)
  48. {
  49. STARPU_SKIP_IF_VALGRIND;
  50. struct struct_of_arrays *src = STARPU_MULTIFORMAT_GET_OPENCL_PTR(buffers[0]);
  51. struct point *dst = STARPU_MULTIFORMAT_GET_CPU_PTR(buffers[0]);
  52. int n = STARPU_MULTIFORMAT_GET_NX(buffers[0]);
  53. int i;
  54. for (i = 0; i < n; i++)
  55. {
  56. dst[i].x = src->x[i];
  57. dst[i].y = src->y[i];
  58. }
  59. }
  60. extern void cpu_to_opencl_opencl_func(void *buffers[], void *args);
  61. struct starpu_codelet cpu_to_opencl_cl =
  62. {
  63. .opencl_funcs = {cpu_to_opencl_opencl_func, NULL},
  64. .nbuffers = 1
  65. };
  66. struct starpu_codelet opencl_to_cpu_cl =
  67. {
  68. .cpu_funcs = {opencl_to_cpu, NULL},
  69. .nbuffers = 1
  70. };
  71. #endif
  72. #ifdef STARPU_USE_MIC
  73. void mic_to_cpu(void *buffers[], void *arg)
  74. {
  75. STARPU_SKIP_IF_VALGRIND;
  76. FPRINTF(stderr, "Entering %s\n", __func__);
  77. struct struct_of_arrays *src = STARPU_MULTIFORMAT_GET_MIC_PTR(buffers[0]);
  78. struct point *dst = STARPU_MULTIFORMAT_GET_CPU_PTR(buffers[0]);
  79. int n = STARPU_MULTIFORMAT_GET_NX(buffers[0]);
  80. int i;
  81. for (i = 0; i < n; i++)
  82. {
  83. dst[i].x = src->x[i];
  84. dst[i].y = src->y[i];
  85. }
  86. }
  87. void cpu_to_mic(void *buffers[], void *args)
  88. {
  89. STARPU_SKIP_IF_VALGRIND;
  90. FPRINTF(stderr, "Entering %s\n", __func__);
  91. struct point *src = STARPU_MULTIFORMAT_GET_CPU_PTR(buffers[0]);
  92. struct struct_of_arrays *dst = STARPU_MULTIFORMAT_GET_MIC_PTR(buffers[0]);
  93. int n = STARPU_MULTIFORMAT_GET_NX(buffers[0]);
  94. int i;
  95. for (i = 0; i < n; i++)
  96. {
  97. dst->x[i] = src[i].x;
  98. dst->y[i] = src[i].y;
  99. }
  100. }
  101. struct starpu_codelet cpu_to_mic_cl =
  102. {
  103. .where = STARPU_MIC,
  104. .cpu_funcs_name = {"cpu_to_mic", NULL},
  105. .nbuffers = 1
  106. };
  107. struct starpu_codelet mic_to_cpu_cl =
  108. {
  109. .where = STARPU_CPU,
  110. .cpu_funcs = {mic_to_cpu, NULL},
  111. .nbuffers = 1
  112. };
  113. #endif