123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137 |
- /*
- * StarPU
- * Copyright (C) INRIA 2008-2009 (see AUTHORS file)
- *
- * This program is free software; you can redistribute it and/or modify
- * it under the terms of the GNU Lesser General Public License as published by
- * the Free Software Foundation; either version 2.1 of the License, or (at
- * your option) any later version.
- *
- * This program is distributed in the hope that it will be useful, but
- * WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
- *
- * See the GNU Lesser General Public License in COPYING.LGPL for more details.
- */
- #ifndef __DW_SPARSE_CG_H__
- #define __DW_SPARSE_CG_H__
- #include <stdio.h>
- #include <stdint.h>
- #include <stdlib.h>
- #include <semaphore.h>
- #include <string.h>
- #include <math.h>
- #include <sys/types.h>
- #include <pthread.h>
- #include <signal.h>
- #include <starpu_config.h>
- #include <starpu.h>
- #ifdef USE_CUDA
- #include <cublas.h>
- #endif
- #include "../common/blas.h"
- #define MAXITER 100000 /* NOTE(review): presumably the cap on solver iterations; not used in this header -- confirm in the .c file */
- #define EPSILON 0.0000001f /* single-precision 1e-7; NOTE(review): presumably the convergence tolerance -- confirm in the .c file */
- /* code parameters
-  *
-  * File-local defaults that parse_args() overrides from the command line.
-  * They are `static` inside a header, so every translation unit that
-  * includes this file gets its own private copy of each variable.
-  */
- static uint32_t size = 33554432; /* overridden by "-size <n>"; the default is 2^25 */
- static unsigned usecpu = 0; /* set to 1 by the "-cpu" flag */
- static unsigned blocks = 512; /* overridden by "-block <n>" */
- static unsigned grids = 8; /* overridden by "-grid <n>" */
- /* Bundle of state for one conjugate-gradient solve: six StarPU data
-  * handles, a semaphore pointer, and the scalar bookkeeping values.
-  * NOTE(review): the per-field meanings below are inferred from the field
-  * names only; the code that fills and reads them is not in this header --
-  * confirm against the implementation.
-  */ struct cg_problem {
- starpu_data_handle ds_matrixA; /* presumably the system matrix A */
- starpu_data_handle ds_vecx; /* presumably the solution vector x */
- starpu_data_handle ds_vecb; /* presumably the right-hand side b */
- starpu_data_handle ds_vecr; /* presumably the residual r */
- starpu_data_handle ds_vecd; /* presumably the search direction d */
- starpu_data_handle ds_vecq; /* presumably the product q = A*d */
- sem_t *sem; /* POSIX semaphore, held by pointer; presumably used to signal completion -- confirm */
-
- float alpha; /* presumably the step length along d */
- float beta; /* presumably the direction-update coefficient */
- float delta_0; /* presumably the initial squared residual norm */
- float delta_old; /* presumably the squared residual norm of the previous iteration */
- float delta_new; /* presumably the squared residual norm of the current iteration */
- float epsilon; /* presumably the relative tolerance (cf. EPSILON) */
- int i; /* presumably the current iteration count (cf. MAXITER) */
- unsigned size; /* presumably the length of the vectors */
- };
- /* some useful functions */
- /*
-  * Override the file-local defaults (size, blocks, grids, usecpu) from the
-  * command line.
-  *
-  * Recognised arguments:
-  *   -size <n>   sets `size`
-  *   -block <n>  sets `blocks`
-  *   -grid <n>   sets `grids`
-  *   -cpu        sets `usecpu` to 1
-  * Any other argument is silently ignored. Values are read with strtol()
-  * in base 10 and are not range-checked.
-  *
-  * An option that expects a value but is the last argument is reported on
-  * stderr and the corresponding default is kept.
-  *
-  * argc, argv: as received by main(); argv[0] is skipped.
-  */
- static void __attribute__((unused)) parse_args(int argc, char **argv)
- {
-     int i;
-     for (i = 1; i < argc; i++) {
-         const char *opt = argv[i];
-
-         if (strcmp(opt, "-cpu") == 0) {
-             usecpu = 1;
-             continue;
-         }
-
-         if (strcmp(opt, "-size") != 0 && strcmp(opt, "-block") != 0 &&
-             strcmp(opt, "-grid") != 0) {
-             continue;
-         }
-
-         /* argv[argc] is NULL: it must never reach strtol() or strcmp() */
-         if (i + 1 >= argc) {
-             fprintf(stderr, "%s: missing value, keeping the default\n", opt);
-             break;
-         }
-
-         /* The value is consumed here, so it is never re-tested as an
-          * option name on this or the next pass. */
-         long value = strtol(argv[++i], NULL, 10);
-         if (strcmp(opt, "-size") == 0) {
-             size = (uint32_t) value;
-         } else if (strcmp(opt, "-block") == 0) {
-             blocks = (unsigned) value;
-         } else {
-             grids = (unsigned) value;
-         }
-     }
- }
- /*
-  * Print a banner line followed by the leading entries of `result`, one
-  * "index -> value" line per entry.
-  *
-  * result: array holding at least min(size, 16) floats.
-  * size:   number of valid entries in `result`; at most 16 are printed.
-  */
- static void __attribute__ ((unused)) print_results(float *result, unsigned size)
- {
-     /* evaluate the bound once instead of on every loop test */
-     unsigned shown = STARPU_MIN(size, 16);
-     unsigned i;
-
-     printf("**** RESULTS **** \n");
-     for (i = 0; i < shown; i++) {
-         /* %u, not %d: the index is unsigned and the conversion must match */
-         printf("%u -> %f\n", i, result[i]);
-     }
- }
- /* Codelet entry points. All of them share the signature (descr, arg) and
-  * are only declared here; their bodies are defined elsewhere.
-  * Steps 1, 2 and 4 are declared in a core_ version only; steps 3 and 5-9
-  * are declared in both a core_ and a cublas_ version. The cublas_
-  * prototypes are declared even when USE_CUDA is not defined.
-  * NOTE(review): presumably core_ is the CPU implementation and cublas_ the
-  * CUDA/CUBLAS one -- confirm against the definitions.
-  */ void core_codelet_func_1(starpu_data_interface_t *descr, void *arg);
- void core_codelet_func_2(starpu_data_interface_t *descr, void *arg);
- void cublas_codelet_func_3(starpu_data_interface_t *descr, void *arg);
- void core_codelet_func_3(starpu_data_interface_t *descr, void *arg);
- void core_codelet_func_4(starpu_data_interface_t *descr, void *arg);
- void core_codelet_func_5(starpu_data_interface_t *descr, void *arg);
- void cublas_codelet_func_5(starpu_data_interface_t *descr, void *arg);
- void cublas_codelet_func_6(starpu_data_interface_t *descr, void *arg);
- void core_codelet_func_6(starpu_data_interface_t *descr, void *arg);
- void cublas_codelet_func_7(starpu_data_interface_t *descr, void *arg);
- void core_codelet_func_7(starpu_data_interface_t *descr, void *arg);
- void cublas_codelet_func_8(starpu_data_interface_t *descr, void *arg);
- void core_codelet_func_8(starpu_data_interface_t *descr, void *arg);
- void cublas_codelet_func_9(starpu_data_interface_t *descr, void *arg);
- void core_codelet_func_9(starpu_data_interface_t *descr, void *arg);
- /* Declared here, defined elsewhere.
-  * NOTE(review): `problem` is untyped in this prototype; presumably it is a
-  * struct cg_problem * -- confirm against the definition.
-  */ void iteration_cg(void *problem);
- /* Solver entry point; declared here, defined elsewhere.
-  * NOTE(review): the parameter names suggest a sparse matrix in CSR form --
-  * nzvalA (the nnz non-zero values), colind (their column indices), rowptr
-  * (per-row offsets), nrow (row count) -- with vecb as right-hand side and
-  * vecx as the solution. None of this is visible in the header; confirm
-  * against the definition, including which arrays are read and written.
-  */ void conjugate_gradient(float *nzvalA, float *vecb, float *vecx, uint32_t nnz,
- unsigned nrow, uint32_t *colind, uint32_t *rowptr);
- #endif // __DW_SPARSE_CG_H__
|