HPL_lmul.c 5.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132
  1. /*
  2. * -- High Performance Computing Linpack Benchmark (HPL)
  3. * HPL - 2.0 - September 10, 2008
  4. * Antoine P. Petitet
  5. * University of Tennessee, Knoxville
  6. * Innovative Computing Laboratory
  7. * (C) Copyright 2000-2008 All Rights Reserved
  8. *
  9. * -- Copyright notice and Licensing terms:
  10. *
  11. * Redistribution and use in source and binary forms, with or without
  12. * modification, are permitted provided that the following conditions
  13. * are met:
  14. *
  15. * 1. Redistributions of source code must retain the above copyright
  16. * notice, this list of conditions and the following disclaimer.
  17. *
  18. * 2. Redistributions in binary form must reproduce the above copyright
  19. * notice, this list of conditions, and the following disclaimer in the
  20. * documentation and/or other materials provided with the distribution.
  21. *
  22. * 3. All advertising materials mentioning features or use of this
  23. * software must display the following acknowledgement:
  24. * This product includes software developed at the University of
  25. * Tennessee, Knoxville, Innovative Computing Laboratory.
  26. *
  27. * 4. The name of the University, the name of the Laboratory, or the
  28. * names of its contributors may not be used to endorse or promote
  29. * products derived from this software without specific written
  30. * permission.
  31. *
  32. * -- Disclaimer:
  33. *
  34. * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
  35. * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
  36. * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
  37. * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE UNIVERSITY
  38. * OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
  39. * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
  40. * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
  41. * DATA OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
  42. * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
  43. * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
  44. * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  45. * ---------------------------------------------------------------------
  46. */
  47. /*
  48. * Include files
  49. */
  50. #include "hpl.h"
  51. #ifdef STDC_HEADERS
  52. void HPL_lmul
  53. (
  54. int * K,
  55. int * J,
  56. int * I
  57. )
  58. #else
  59. void HPL_lmul
  60. ( K, J, I )
  61. int * K;
  62. int * J;
  63. int * I;
  64. #endif
  65. {
  66. /*
  67. * Purpose
  68. * =======
  69. *
  70. * HPL_lmul multiplies without carry two long positive integers K and J
  71. * and puts the result into I. The long integers I, J, K are encoded on
  72. * 32 bits using an array of 2 integers. The 32-lower bits are stored in
  73. * the first entry of each array, the 32-higher bits in the second entry
  74. * of each array. For efficiency purposes, the intrisic modulo function
  75. * is inlined.
  76. *
  77. * Arguments
  78. * =========
  79. *
  80. * K (local input) int *
  81. * On entry, K is an integer array of dimension 2 containing the
  82. * encoded long integer K.
  83. *
  84. * J (local input) int *
  85. * On entry, J is an integer array of dimension 2 containing the
  86. * encoded long integer J.
  87. *
  88. * I (local output) int *
  89. * On entry, I is an integer array of dimension 2. On exit, this
  90. * array contains the encoded long integer result.
  91. *
  92. * ---------------------------------------------------------------------
  93. */
  94. /*
  95. * .. Local Variables ..
  96. */
  97. int r, c;
  98. unsigned int kk[4], jj[4], res[5];
  99. /* ..
  100. * .. Executable Statements ..
  101. */
  102. /*
  103. * Addition is done with 16 bits at a time. Multiplying two 16-bit
  104. * integers yields a 32-bit result. The lower 16-bits of the result
  105. * are kept in I, and the higher 16-bits are carried over to the
  106. * next multiplication.
  107. */
  108. for (c = 0; c < 2; ++c) {
  109. kk[2*c] = K[c] & 65535;
  110. kk[2*c+1] = ((unsigned)K[c] >> 16) & 65535;
  111. jj[2*c] = J[c] & 65535;
  112. jj[2*c+1] = ((unsigned)J[c] >> 16) & 65535;
  113. }
  114. res[0] = 0;
  115. for (c = 0; c < 4; ++c) {
  116. res[c+1] = (res[c] >> 16) & 65535;
  117. res[c] &= 65535;
  118. for (r = 0; r < c+1; ++r) {
  119. res[c] = kk[r] * jj[c-r] + (res[c] & 65535);
  120. res[c+1] += (res[c] >> 16) & 65535;
  121. }
  122. }
  123. for (c = 0; c < 2; ++c)
  124. I[c] = (int)(((res[2*c+1] & 65535) << 16) | (res[2*c] & 65535));
  125. /*
  126. * End of HPL_lmul
  127. */
  128. }