mpi_reduction_kernels.c 2.1 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677
  1. /* StarPU --- Runtime system for heterogeneous multicore architectures.
  2. *
  3. * Copyright (C) 2012 Centre National de la Recherche Scientifique
  4. *
  5. * StarPU is free software; you can redistribute it and/or modify
  6. * it under the terms of the GNU Lesser General Public License as published by
  7. * the Free Software Foundation; either version 2.1 of the License, or (at
  8. * your option) any later version.
  9. *
  10. * StarPU is distributed in the hope that it will be useful, but
  11. * WITHOUT ANY WARRANTY; without even the implied warranty of
  12. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
  13. *
  14. * See the GNU Lesser General Public License in COPYING.LGPL for more details.
  15. */
  16. #include <starpu.h>
  17. #include <mpi.h>
  18. #define _DISPLAY(fmt, args ...) do { \
  19. int _display_rank; MPI_Comm_rank(MPI_COMM_WORLD, &_display_rank); \
  20. fprintf(stderr, "[%d][%s] " fmt , _display_rank, __func__ ,##args); \
  21. fflush(stderr); } while(0)
  22. /*
  23. * Codelet to create a neutral element
  24. */
  25. void init_cpu_func(void *descr[], void *cl_arg)
  26. {
  27. long int *dot = (long int *)STARPU_VARIABLE_GET_PTR(descr[0]);
  28. *dot = 0;
  29. _DISPLAY("Init dot\n");
  30. }
  31. /*
  32. * Codelet to perform the reduction of two elements
  33. */
  34. void redux_cpu_func(void *descr[], void *cl_arg)
  35. {
  36. long int *dota = (long int *)STARPU_VARIABLE_GET_PTR(descr[0]);
  37. long int *dotb = (long int *)STARPU_VARIABLE_GET_PTR(descr[1]);
  38. *dota = *dota + *dotb;
  39. _DISPLAY("Calling redux %ld=%ld+%ld\n", *dota, *dota-*dotb, *dotb);
  40. }
  41. /*
  42. * Dot product codelet
  43. */
  44. void dot_cpu_func(void *descr[], void *cl_arg)
  45. {
  46. long int *local_x = (long int *)STARPU_VECTOR_GET_PTR(descr[0]);
  47. unsigned n = STARPU_VECTOR_GET_NX(descr[0]);
  48. long int *dot = (long int *)STARPU_VARIABLE_GET_PTR(descr[1]);
  49. // _DISPLAY("Before dot=%ld (adding %d elements...)\n", *dot, n);
  50. unsigned i;
  51. for (i = 0; i < n; i++)
  52. {
  53. // _DISPLAY("Adding %ld\n", local_x[i]);
  54. *dot += local_x[i];
  55. }
  56. // _DISPLAY("After dot=%ld\n", *dot);
  57. }
  58. /*
  59. * Display codelet
  60. */
  61. void display_cpu_func(void *descr[], void *cl_arg)
  62. {
  63. long int *local_x = (long int *)STARPU_VECTOR_GET_PTR(descr[0]);
  64. _DISPLAY("Local=%ld\n", *local_x);
  65. }