| 1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071 | /* StarPU --- Runtime system for heterogeneous multicore architectures. * * Copyright (C) 2010-2013,2015,2017,2020                 CNRS * Copyright (C) 2009-2011,2014,2015,2017,2018, 2020            Université de Bordeaux * Copyright (C) 2012                                     Inria * Copyright (C) 2010                                     Mehdi Juhoor * * StarPU is free software; you can redistribute it and/or modify * it under the terms of the GNU Lesser General Public License as published by * the Free Software Foundation; either version 2.1 of the License, or (at * your option) any later version. * * StarPU is distributed in the hope that it will be useful, but * WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. * * See the GNU Lesser General Public License in COPYING.LGPL for more details. */#include "mpi_cholesky.h"/* This is the same as matrix_decomposition, but the matrix is not allocated in * totality on all nodes, thus allowing much bigger matrices, but doesn't allow * trivial checks */int main(int argc, char **argv){	/* create a simple definite positive symetric matrix example	 *	 *	Hilbert matrix : h(i,j) = 1/(i+j+1)	 * */	float ***bmat;	int rank, nodes, ret;	double timing, flops;#ifndef STARPU_SIMGRID	int correctness=1;#endif	ret = starpu_mpi_init_conf(&argc, &argv, 1, MPI_COMM_WORLD, NULL);	STARPU_CHECK_RETURN_VALUE(ret, "starpu_mpi_init_conf");	starpu_mpi_comm_rank(MPI_COMM_WORLD, &rank);	starpu_mpi_comm_size(MPI_COMM_WORLD, &nodes);	starpu_cublas_init();	parse_args(argc, argv, nodes);	if (check)	{		fprintf(stderr,"can't check in distributed mode\n");		check = 0;	}	matrix_init(&bmat, rank, nodes, 0);	dw_cholesky(bmat, size/nblocks, rank, nodes, &timing, &flops);	starpu_cublas_shutdown();	starpu_mpi_shutdown();	matrix_free(&bmat, rank, nodes, 0);	if (rank == 0)	{		FPRINTF(stdout, "Computation time (in ms): %2.2f\n", timing/1000);		FPRINTF(stdout, "Synthetic GFlops : %2.2f\n", (flops/timing/1000.0f));	}	return 0;}
 |