|
@@ -371,12 +371,11 @@ int STARPU_LU(lu_decomposition_pivot)(TYPE *matA, unsigned *ipiv, unsigned size,
|
|
|
double timing=0.0;
|
|
|
int ret = dw_codelet_facto_pivot(&dataA, piv_description, nblocks, get_block_with_striding, &timing);
|
|
|
|
|
|
- FPRINTF(stderr, "Computation took (in ms)\n");
|
|
|
- FPRINTF(stderr, "%2.2f\n", timing/1000);
|
|
|
-
|
|
|
unsigned n = starpu_matrix_get_nx(dataA);
|
|
|
double flop = (2.0f*n*n*n)/3.0f;
|
|
|
- FPRINTF(stderr, "Synthetic GFlops : %2.2f\n", (flop/timing/1000.0f));
|
|
|
+
|
|
|
+ PRINTF("# size\tms\tGFlops\n");
|
|
|
+ PRINTF("%u\t%.0f\t%.1f\n", n, timing/1000, flop/timing/1000.0f);
|
|
|
|
|
|
/* gather all the data */
|
|
|
starpu_data_unpartition(dataA, STARPU_MAIN_RAM);
|
|
@@ -426,12 +425,11 @@ int STARPU_LU(lu_decomposition_pivot_no_stride)(TYPE **matA, unsigned *ipiv, uns
|
|
|
double timing=0.0;
|
|
|
int ret = dw_codelet_facto_pivot(dataAp, piv_description, nblocks, get_block_with_no_striding, &timing);
|
|
|
|
|
|
- FPRINTF(stderr, "Computation took (in ms)\n");
|
|
|
- FPRINTF(stderr, "%2.2f\n", timing/1000);
|
|
|
-
|
|
|
unsigned n = starpu_matrix_get_nx(dataAp[0])*nblocks;
|
|
|
double flop = (2.0f*n*n*n)/3.0f;
|
|
|
- FPRINTF(stderr, "Synthetic GFlops : %2.2f\n", (flop/timing/1000.0f));
|
|
|
+
|
|
|
+ PRINTF("# size\tms\tGFlops\n");
|
|
|
+ PRINTF("%u\t%.0f\t%.1f\n", n, timing/1000, flop/timing/1000.0f);
|
|
|
|
|
|
for (bj = 0; bj < nblocks; bj++)
|
|
|
for (bi = 0; bi < nblocks; bi++)
|