starpu_mpi_stats.c 2.5 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394
  1. /* StarPU --- Runtime system for heterogeneous multicore architectures.
  2. *
  3. * Copyright (C) 2012 Centre National de la Recherche Scientifique
  4. *
  5. * StarPU is free software; you can redistribute it and/or modify
  6. * it under the terms of the GNU Lesser General Public License as published by
  7. * the Free Software Foundation; either version 2.1 of the License, or (at
  8. * your option) any later version.
  9. *
  10. * StarPU is distributed in the hope that it will be useful, but
  11. * WITHOUT ANY WARRANTY; without even the implied warranty of
  12. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
  13. *
  14. * See the GNU Lesser General Public License in COPYING.LGPL for more details.
  15. */
  16. #include <starpu_mpi_stats.h>
  17. #include <common/config.h>
  18. #include <stdio.h>
  19. //#define STARPU_MPI_VERBOSE 1
  20. #include <starpu_mpi_private.h>
  /*
   * File-local state of the MPI communication statistics.
   * These counters record how many bytes this process sends to each
   * destination rank.
   */

  /* Non-zero while statistics are being collected; zero (the default for a
   * static object) disables every entry point of this file. */
  static int stats_enabled;

  /* Number of ranks in the communicator passed to
   * _starpu_mpi_comm_amounts_init(), i.e. the length of comm_amount. */
  static int world_size;

  /* Byte counters, indexed by destination rank. */
  static size_t *comm_amount;
  25. void _starpu_mpi_comm_amounts_init(MPI_Comm comm)
  26. {
  27. #ifdef STARPU_COMM_STATS
  28. stats_enabled = 1;
  29. #else
  30. stats_enabled = starpu_get_env_number("STARPU_COMM_STATS");
  31. if (stats_enabled == -1)
  32. {
  33. stats_enabled = 0;
  34. }
  35. #endif /* STARPU_COMM_STATS */
  36. if (stats_enabled == 0) return;
  37. if (!getenv("STARPU_SILENT")) fprintf(stderr,"Warning: StarPU was configured with --enable-comm-stats or is executed with STARPU_COMM_STATS=1, which slows down a bit\n");
  38. MPI_Comm_size(comm, &world_size);
  39. _STARPU_MPI_DEBUG("allocating for %d nodes\n", world_size);
  40. comm_amount = (size_t *) calloc(world_size, sizeof(size_t));
  41. }
  42. void _starpu_mpi_comm_amounts_free()
  43. {
  44. if (stats_enabled == 0) return;
  45. free(comm_amount);
  46. }
  47. void _starpu_mpi_comm_amounts_inc(MPI_Comm comm, unsigned dst, MPI_Datatype datatype, int count)
  48. {
  49. int src, size;
  50. if (stats_enabled == 0) return;
  51. MPI_Comm_rank(comm, &src);
  52. MPI_Type_size(datatype, &size);
  53. _STARPU_MPI_DEBUG("[%d] adding %d to %d\n", src, count*size, dst);
  54. comm_amount[dst] += count*size;
  55. }
  56. void _starpu_mpi_comm_amounts_display(int node)
  57. {
  58. unsigned dst;
  59. size_t sum = 0;
  60. if (stats_enabled == 0) return;
  61. for (dst = 0; dst < world_size; dst++)
  62. {
  63. sum += comm_amount[dst];
  64. }
  65. fprintf(stderr, "\n[%d] Communication transfers stats:\nTOTAL transfers %f B\t%f MB\n", node, (float)sum, (float)sum/1024/1024);
  66. for (dst = 0; dst < world_size; dst++)
  67. {
  68. if (comm_amount[dst])
  69. {
  70. fprintf(stderr, "\t%d -> %d\t%f B\t%f MB\n",
  71. node, dst, (float)comm_amount[dst], ((float)comm_amount[dst])/(1024*1024));
  72. }
  73. }
  74. }