spmv_opencl.cl 1.4 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546
  1. /* StarPU --- Runtime system for heterogeneous multicore architectures.
  2. *
  3. * Copyright (C) 2010,2012,2015 CNRS
  4. * Copyright (C) 2011,2015 Université de Bordeaux
  5. *
  6. * StarPU is free software; you can redistribute it and/or modify
  7. * it under the terms of the GNU Lesser General Public License as published by
  8. * the Free Software Foundation; either version 2.1 of the License, or (at
  9. * your option) any later version.
  10. *
  11. * StarPU is distributed in the hope that it will be useful, but
  12. * WITHOUT ANY WARRANTY; without even the implied warranty of
  13. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
  14. *
  15. * See the GNU Lesser General Public License in COPYING.LGPL for more details.
  16. */
  17. /* OpenCL kernel for SPMV */
  18. __kernel void spmv(int nnz, int nrow,
  19. __global float* nzval, __global unsigned* colind,
  20. __global unsigned* rowptr, int firstentry,
  21. __global float *vecin, int nx_in,
  22. __global float *vecout, int nx_out)
  23. {
  24. const int row = get_global_id(0);
  25. if (row < nrow)
  26. {
  27. float tmp = 0.0f;
  28. unsigned index;
  29. unsigned firstindex = rowptr[row] - firstentry;
  30. unsigned lastindex = rowptr[row+1] - firstentry;
  31. for (index = firstindex; index < lastindex; index++)
  32. {
  33. unsigned col;
  34. col = colind[index];
  35. tmp += nzval[index]*vecin[col];
  36. }
  37. vecout[row] = tmp;
  38. }
  39. }