dw_sparse_cg.h 3.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137
  1. /*
  2. * StarPU
  3. * Copyright (C) INRIA 2008-2009 (see AUTHORS file)
  4. *
  5. * This program is free software; you can redistribute it and/or modify
  6. * it under the terms of the GNU Lesser General Public License as published by
  7. * the Free Software Foundation; either version 2.1 of the License, or (at
  8. * your option) any later version.
  9. *
  10. * This program is distributed in the hope that it will be useful, but
  11. * WITHOUT ANY WARRANTY; without even the implied warranty of
  12. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
  13. *
  14. * See the GNU Lesser General Public License in COPYING.LGPL for more details.
  15. */
  16. #ifndef __DW_SPARSE_CG_H__
  17. #define __DW_SPARSE_CG_H__
  18. #include <stdio.h>
  19. #include <stdint.h>
  20. #include <semaphore.h>
  21. #include <string.h>
  22. #include <stdint.h>
  23. #include <math.h>
  24. #include <sys/types.h>
  25. #include <pthread.h>
  26. #include <signal.h>
  27. #include <starpu_config.h>
  28. #include <starpu.h>
  29. #ifdef USE_CUDA
  30. #include <cublas.h>
  31. #endif
  32. #include "../common/blas.h"
  33. #define MAXITER 100000
  34. #define EPSILON 0.0000001f
  35. /* code parameters */
  36. static uint32_t size = 33554432;
  37. static unsigned usecpu = 0;
  38. static unsigned blocks = 512;
  39. static unsigned grids = 8;
  40. struct cg_problem {
  41. starpu_data_handle ds_matrixA;
  42. starpu_data_handle ds_vecx;
  43. starpu_data_handle ds_vecb;
  44. starpu_data_handle ds_vecr;
  45. starpu_data_handle ds_vecd;
  46. starpu_data_handle ds_vecq;
  47. sem_t *sem;
  48. float alpha;
  49. float beta;
  50. float delta_0;
  51. float delta_old;
  52. float delta_new;
  53. float epsilon;
  54. int i;
  55. unsigned size;
  56. };
  57. /* some useful functions */
  58. static void __attribute__((unused)) parse_args(int argc, char **argv)
  59. {
  60. int i;
  61. for (i = 1; i < argc; i++) {
  62. if (strcmp(argv[i], "-size") == 0) {
  63. char *argptr;
  64. size = strtol(argv[++i], &argptr, 10);
  65. }
  66. if (strcmp(argv[i], "-block") == 0) {
  67. char *argptr;
  68. blocks = strtol(argv[++i], &argptr, 10);
  69. }
  70. if (strcmp(argv[i], "-grid") == 0) {
  71. char *argptr;
  72. grids = strtol(argv[++i], &argptr, 10);
  73. }
  74. if (strcmp(argv[i], "-cpu") == 0) {
  75. usecpu = 1;
  76. }
  77. }
  78. }
  79. static void __attribute__ ((unused)) print_results(float *result, unsigned size)
  80. {
  81. printf("**** RESULTS **** \n");
  82. unsigned i;
  83. for (i = 0; i < STARPU_MIN(size, 16); i++)
  84. {
  85. printf("%d -> %f\n", i, result[i]);
  86. }
  87. }
  88. void core_codelet_func_1(starpu_data_interface_t *descr, void *arg);
  89. void core_codelet_func_2(starpu_data_interface_t *descr, void *arg);
  90. void cublas_codelet_func_3(starpu_data_interface_t *descr, void *arg);
  91. void core_codelet_func_3(starpu_data_interface_t *descr, void *arg);
  92. void core_codelet_func_4(starpu_data_interface_t *descr, void *arg);
  93. void core_codelet_func_5(starpu_data_interface_t *descr, void *arg);
  94. void cublas_codelet_func_5(starpu_data_interface_t *descr, void *arg);
  95. void cublas_codelet_func_6(starpu_data_interface_t *descr, void *arg);
  96. void core_codelet_func_6(starpu_data_interface_t *descr, void *arg);
  97. void cublas_codelet_func_7(starpu_data_interface_t *descr, void *arg);
  98. void core_codelet_func_7(starpu_data_interface_t *descr, void *arg);
  99. void cublas_codelet_func_8(starpu_data_interface_t *descr, void *arg);
  100. void core_codelet_func_8(starpu_data_interface_t *descr, void *arg);
  101. void cublas_codelet_func_9(starpu_data_interface_t *descr, void *arg);
  102. void core_codelet_func_9(starpu_data_interface_t *descr, void *arg);
  103. void iteration_cg(void *problem);
  104. void conjugate_gradient(float *nzvalA, float *vecb, float *vecx, uint32_t nnz,
  105. unsigned nrow, uint32_t *colind, uint32_t *rowptr);
  106. #endif // __DW_SPARSE_CG_H__