|
@@ -18,7 +18,6 @@
|
|
|
#ifndef __DW_CHOLESKY_H__
|
|
|
#define __DW_CHOLESKY_H__
|
|
|
|
|
|
-#include <semaphore.h>
|
|
|
#include <string.h>
|
|
|
#include <math.h>
|
|
|
#include <sys/time.h>
|
|
@@ -31,42 +30,8 @@
|
|
|
#include <common/blas.h>
|
|
|
#include <starpu.h>
|
|
|
|
|
|
-#define NMAXBLOCKS 32
|
|
|
-
|
|
|
-#define TAG11(k) ((starpu_tag_t)( (1ULL<<60) | (unsigned long long)(k)))
|
|
|
-#define TAG21(k,j) ((starpu_tag_t)(((3ULL<<60) | (((unsigned long long)(k))<<32) \
|
|
|
- | (unsigned long long)(j))))
|
|
|
-#define TAG22(k,i,j) ((starpu_tag_t)(((4ULL<<60) | ((unsigned long long)(k)<<32) \
|
|
|
- | ((unsigned long long)(i)<<16) \
|
|
|
- | (unsigned long long)(j))))
|
|
|
-
|
|
|
-
|
|
|
-
|
|
|
-#define TAG11_AUX(k, prefix) ((starpu_tag_t)( (((unsigned long long)(prefix))<<60) | (1ULL<<56) | (unsigned long long)(k)))
|
|
|
-#define TAG21_AUX(k,j, prefix) ((starpu_tag_t)( (((unsigned long long)(prefix))<<60) \
|
|
|
- | ((3ULL<<56) | (((unsigned long long)(k))<<32) \
|
|
|
- | (unsigned long long)(j))))
|
|
|
-#define TAG22_AUX(k,i,j, prefix) ((starpu_tag_t)( (((unsigned long long)(prefix))<<60) \
|
|
|
- | ((4ULL<<56) | ((unsigned long long)(k)<<32) \
|
|
|
- | ((unsigned long long)(i)<<16) \
|
|
|
- | (unsigned long long)(j))))
|
|
|
-
|
|
|
#define BLOCKSIZE (size/nblocks)
|
|
|
|
|
|
-
|
|
|
-#define BLAS3_FLOP(n1,n2,n3) \
|
|
|
- (2*((uint64_t)n1)*((uint64_t)n2)*((uint64_t)n3))
|
|
|
-
|
|
|
-typedef struct {
|
|
|
- starpu_data_handle dataA;
|
|
|
- unsigned i;
|
|
|
- unsigned j;
|
|
|
- unsigned k;
|
|
|
- unsigned nblocks;
|
|
|
- unsigned *remaining;
|
|
|
- sem_t *sem;
|
|
|
-} cl_args;
|
|
|
-
|
|
|
static unsigned size = 4*1024;
|
|
|
static unsigned nblocks = 16;
|
|
|
static unsigned nbigblocks = 8;
|
|
@@ -83,10 +48,6 @@ void chol_cublas_codelet_update_u21(void *descr[], void *_args);
|
|
|
void chol_cublas_codelet_update_u22(void *descr[], void *_args);
|
|
|
#endif
|
|
|
|
|
|
-extern struct starpu_perfmodel_t chol_model_11;
|
|
|
-extern struct starpu_perfmodel_t chol_model_21;
|
|
|
-extern struct starpu_perfmodel_t chol_model_22;
|
|
|
-
|
|
|
static void __attribute__((unused)) parse_args(int argc, char **argv)
|
|
|
{
|
|
|
int i;
|