HPL_perm.c 5.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132
  1. /*
  2. * -- High Performance Computing Linpack Benchmark (HPL)
  3. * HPL - 2.0 - September 10, 2008
  4. * Antoine P. Petitet
  5. * University of Tennessee, Knoxville
  6. * Innovative Computing Laboratory
  7. * (C) Copyright 2000-2008 All Rights Reserved
  8. *
  9. * -- Copyright notice and Licensing terms:
  10. *
  11. * Redistribution and use in source and binary forms, with or without
  12. * modification, are permitted provided that the following conditions
  13. * are met:
  14. *
  15. * 1. Redistributions of source code must retain the above copyright
  16. * notice, this list of conditions and the following disclaimer.
  17. *
  18. * 2. Redistributions in binary form must reproduce the above copyright
  19. * notice, this list of conditions, and the following disclaimer in the
  20. * documentation and/or other materials provided with the distribution.
  21. *
  22. * 3. All advertising materials mentioning features or use of this
  23. * software must display the following acknowledgement:
  24. * This product includes software developed at the University of
  25. * Tennessee, Knoxville, Innovative Computing Laboratory.
  26. *
  27. * 4. The name of the University, the name of the Laboratory, or the
  28. * names of its contributors may not be used to endorse or promote
  29. * products derived from this software without specific written
  30. * permission.
  31. *
  32. * -- Disclaimer:
  33. *
  34. * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
  35. * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
  36. * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
  37. * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE UNIVERSITY
  38. * OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
  39. * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
  40. * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
  41. * DATA OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
  42. * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
  43. * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
  44. * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  45. * ---------------------------------------------------------------------
  46. */
  47. /*
  48. * Include files
  49. */
  50. #include "hpl.h"
  51. #ifdef STDC_HEADERS
  52. void HPL_perm
  53. (
  54. const int N,
  55. int * LINDXA,
  56. int * LINDXAU,
  57. int * IWORK
  58. )
  59. #else
  60. void HPL_perm
  61. ( N, LINDXA, LINDXAU, IWORK )
  62. const int N;
  63. int * LINDXA;
  64. int * LINDXAU;
  65. int * IWORK;
  66. #endif
  67. {
  68. /*
  69. * Purpose
  70. * =======
  71. *
  72. * HPL_perm combines two index arrays and generate the corresponding
  73. * permutation. First, this function computes the inverse of LINDXA, and
  74. * then combine it with LINDXAU. Second, in order to be able to perform
  75. * the permutation in place, LINDXAU is overwritten by the sequence of
  76. * permutation producing the same result. What we ultimately want to
  77. * achieve is: U[LINDXAU[i]] := U[LINDXA[i]] for i in [0..N). After the
  78. * call to this function, this in place permutation can be performed by
  79. * for i in [0..N) swap U[i] with U[LINDXAU[i]].
  80. *
  81. * Arguments
  82. * =========
  83. *
  84. * N (global input) const int
  85. * On entry, N specifies the length of the arrays LINDXA and
  86. * LINDXAU. N should be at least zero.
  87. *
  88. * LINDXA (global input/output) int *
  89. * On entry, LINDXA is an array of dimension N containing the
  90. * source indexes. On exit, LINDXA contains the combined index
  91. * array.
  92. *
  93. * LINDXAU (global input/output) int *
  94. * On entry, LINDXAU is an array of dimension N containing the
  95. * target indexes. On exit, LINDXAU contains the sequence of
  96. * permutation, that should be applied in increasing order to
  97. * permute the underlying array U in place.
  98. *
  99. * IWORK (workspace) int *
  100. * On entry, IWORK is a workarray of dimension N.
  101. *
  102. * ---------------------------------------------------------------------
  103. */
  104. /*
  105. * .. Local Variables ..
  106. */
  107. int i, j, k, fndd;
  108. /* ..
  109. * .. Executable Statements ..
  110. */
  111. /*
  112. * Inverse LINDXA - combine LINDXA and LINDXAU - Initialize IWORK
  113. */
  114. for( i = 0; i < N; i++ ) { IWORK[LINDXA[i]] = i; }
  115. for( i = 0; i < N; i++ ) { LINDXA[i] = LINDXAU[IWORK[i]]; IWORK[i] = i; }
  116. for( i = 0; i < N; i++ )
  117. {
  118. /* search LINDXA such that LINDXA[j] == i */
  119. j = 0; do { fndd = ( LINDXA[j] == i ); j++; } while( !fndd ); j--;
  120. /* search IWORK such that IWORK[k] == j */
  121. k = 0; do { fndd = ( IWORK[k] == j ); k++; } while( !fndd ); k--;
  122. /* swap IWORK[i] and IWORK[k]; LINDXAU[i] = k */
  123. j = IWORK[i]; IWORK[i] = IWORK[k]; IWORK[k] = j;
  124. LINDXAU[i] = k;
  125. }
  126. /*
  127. * End of HPL_perm
  128. */
  129. }