/* StarPU --- Runtime system for heterogeneous multicore architectures.
 *
 * Copyright (C) 2009, 2010  Université de Bordeaux 1
 * Copyright (C) 2010  Centre National de la Recherche Scientifique
 *
 * StarPU is free software; you can redistribute it and/or modify
 * it under the terms of the GNU Lesser General Public License as published by
 * the Free Software Foundation; either version 2.1 of the License, or (at
 * your option) any later version.
 *
 * StarPU is distributed in the hope that it will be useful, but
 * WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
 *
 * See the GNU Lesser General Public License in COPYING.LGPL for more details.
 */
  17. #define TYPE float
  18. #define CUBLAS_TYPE TYPE
  19. #define STARPU_LU(name) starpu_slu_##name
  20. #ifdef STARPU_HAVE_MAGMA
  21. #include <magmablas.h>
  22. #define CUBLAS_GEMM magmablas_sgemm
  23. #define CUBLAS_TRSM magmablas_strsm
  24. #else
  25. #define CUBLAS_GEMM cublasSgemm
  26. #define CUBLAS_TRSM cublasStrsm
  27. #endif
  28. #define CUBLAS_SCAL cublasSscal
  29. #define CUBLAS_GER cublasSger
  30. #define CUBLAS_SWAP cublasSswap
  31. #define CUBLAS_IAMAX cublasIsamax
  32. #define CPU_GEMM SGEMM
  33. #define CPU_TRSM STRSM
  34. #define CPU_SCAL SSCAL
  35. #define CPU_GER SGER
  36. #define CPU_SWAP SSWAP
  37. #define CPU_TRMM STRMM
  38. #define CPU_AXPY SAXPY
  39. #define CPU_ASUM SASUM
  40. #define CPU_IAMAX ISAMAX
  41. #define PIVOT_THRESHHOLD 10e-5
  42. #define CAN_EXECUTE