12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667 |
- #include "dw_block_spmv.h"
- static inline void common_block_spmv(void *descr[], int s, __attribute__((unused)) void *_args)
- {
-
- float *block = (float *)STARPU_MATRIX_GET_PTR(descr[0]);
- float *in = (float *)STARPU_VECTOR_GET_PTR(descr[1]);
- float *out = (float *)STARPU_VECTOR_GET_PTR(descr[2]);
- unsigned dx = STARPU_MATRIX_GET_NX(descr[0]);
- unsigned dy = STARPU_MATRIX_GET_NY(descr[0]);
- unsigned ld = STARPU_MATRIX_GET_LD(descr[0]);
- switch (s)
- {
- case 0:
- cblas_sgemv(CblasRowMajor, CblasNoTrans, dx, dy, 1.0f, block, ld, in, 1, 1.0f, out, 1);
- break;
- #ifdef STARPU_USE_CUDA
- case 1:
- cublasSgemv ('t', dx, dy, 1.0f, block, ld, in, 1, 1.0f, out, 1);
- break;
- #endif
- default:
- STARPU_ABORT();
- break;
- }
- }
/*
 * CPU entry point for the block SpMV kernel: forwards its arguments to
 * common_block_spmv() with backend selector 0 (the CBLAS branch).
 */
void cpu_block_spmv(void *descr[], void *_args)
{
	const int cpu_selector = 0;

	common_block_spmv(descr, cpu_selector, _args);
}
#ifdef STARPU_USE_CUDA
/*
 * CUDA entry point for the block SpMV kernel: forwards its arguments to
 * common_block_spmv() with backend selector 1 (the CUBLAS branch).
 * Only compiled when STARPU_USE_CUDA is defined.
 */
void cublas_block_spmv(void *descr[], void *_args)
{
	const int cublas_selector = 1;

	common_block_spmv(descr, cublas_selector, _args);
}
#endif
|