123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372 |
- /*
- * -- High Performance Computing Linpack Benchmark (HPL)
- * HPL - 2.0 - September 10, 2008
- * Antoine P. Petitet
- * University of Tennessee, Knoxville
- * Innovative Computing Laboratory
- * (C) Copyright 2000-2008 All Rights Reserved
- *
- * -- Copyright notice and Licensing terms:
- *
- * Redistribution and use in source and binary forms, with or without
- * modification, are permitted provided that the following conditions
- * are met:
- *
- * 1. Redistributions of source code must retain the above copyright
- * notice, this list of conditions and the following disclaimer.
- *
- * 2. Redistributions in binary form must reproduce the above copyright
- * notice, this list of conditions, and the following disclaimer in the
- * documentation and/or other materials provided with the distribution.
- *
- * 3. All advertising materials mentioning features or use of this
- * software must display the following acknowledgement:
- * This product includes software developed at the University of
- * Tennessee, Knoxville, Innovative Computing Laboratory.
- *
- * 4. The name of the University, the name of the Laboratory, or the
- * names of its contributors may not be used to endorse or promote
- * products derived from this software without specific written
- * permission.
- *
- * -- Disclaimer:
- *
- * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
- * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
- * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
- * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE UNIVERSITY
- * OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
- * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
- * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
- * DATA OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
- * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
- * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
- * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
- * ---------------------------------------------------------------------
- */
- /*
- * Include files
- */
- #include "hpl.h"
- #include "RCCE_lib.h"
- /*
- * ---------------------------------------------------------------------
- * Static variables
- * ---------------------------------------------------------------------
- */
- static int HPL_ptimer_disabled;
- static double HPL_ptimer_cpusec [HPL_NPTIMER],
- HPL_ptimer_cpustart [HPL_NPTIMER],
- HPL_ptimer_wallsec [HPL_NPTIMER],
- HPL_ptimer_wallstart[HPL_NPTIMER];
- #ifdef _OPENMP
- #pragma omp threadprivate(HPL_ptimer_disabled)
- #pragma omp threadprivate(HPL_ptimer_cpusec)
- #pragma omp threadprivate(HPL_ptimer_cpustart)
- #pragma omp threadprivate(HPL_ptimer_wallsec)
- #pragma omp threadprivate(HPL_ptimer_wallstart)
- #endif
- /*
- * ---------------------------------------------------------------------
- * User callable functions
- * ---------------------------------------------------------------------
- */
- #ifdef STDC_HEADERS
- void HPL_ptimer_boot( void )
- #else
- void HPL_ptimer_boot()
- #endif
- {
- /*
- * HPL_ptimer_boot (re)sets all timers to 0, and enables HPL_ptimer.
- */
- /*
- * .. Local Variables ..
- */
- int i;
- /* ..
- * .. Executable Statements ..
- */
- HPL_ptimer_disabled = 0;
- for( i = 0; i < HPL_NPTIMER; i++ )
- {
- HPL_ptimer_cpusec [i] = HPL_ptimer_wallsec [i] = HPL_rzero;
- HPL_ptimer_cpustart[i] = HPL_ptimer_wallstart[i] = HPL_PTIMER_STARTFLAG;
- }
- /*
- * End of HPL_ptimer_boot
- */
- }
- #ifdef STDC_HEADERS
- void HPL_ptimer( const int I )
- #else
- void HPL_ptimer( I )
- const int I;
- #endif
- {
- /*
- * Purpose
- * =======
- *
- * HPL_ptimer provides a "stopwatch" functionality cpu/wall timer in
- * seconds. Up to 64 separate timers can be functioning at once. The
- * first call starts the timer, and the second stops it. This routine
- * can be disenabled by calling HPL_ptimer_disable(), so that calls to
- * the timer are ignored. This feature can be used to make sure certain
- * sections of code do not affect timings, even if they call routines
- * which have HPL_ptimer calls in them. HPL_ptimer_enable() will enable
- * the timer functionality. One can retrieve the current value of a
- * timer by calling
- *
- * t0 = HPL_ptimer_inquire( HPL_WALL_TIME | HPL_CPU_TIME, I )
- *
- * where I is the timer index in [0..64). To inititialize the timer
- * functionality, one must have called HPL_ptimer_boot() prior to any of
- * the functions mentioned above.
- *
- * Arguments
- * =========
- *
- * I (global input) const int
- * On entry, I specifies the timer to stop/start.
- *
- * ---------------------------------------------------------------------
- */
- /* ..
- * .. Executable Statements ..
- */
- if( HPL_ptimer_disabled ) return;
- /*
- * If timer has not been started, start it. Otherwise, stop it and add
- * interval to count
- */
- if( HPL_ptimer_wallstart[I] == HPL_PTIMER_STARTFLAG )
- {
- HPL_ptimer_wallstart[I] = HPL_ptimer_walltime();
- HPL_ptimer_cpustart [I] = HPL_ptimer_cputime ();
- }
- else
- {
- HPL_ptimer_cpusec [I] += HPL_ptimer_cputime ()-HPL_ptimer_cpustart [I];
- HPL_ptimer_wallsec [I] += HPL_ptimer_walltime()-HPL_ptimer_wallstart[I];
- HPL_ptimer_wallstart[I] = HPL_PTIMER_STARTFLAG;
- }
- /*
- * End of HPL_ptimer
- */
- }
- #ifdef STDC_HEADERS
- void HPL_ptimer_enable( void )
- #else
- void HPL_ptimer_enable()
- #endif
- {
- /*
- * HPL_ptimer_enable sets it so calls to HPL_ptimer are not ignored.
- */
- /* ..
- * .. Executable Statements ..
- */
- HPL_ptimer_disabled = 0;
- return;
- /*
- * End of HPL_ptimer_enable
- */
- }
- #ifdef STDC_HEADERS
- void HPL_ptimer_disable( void )
- #else
- void HPL_ptimer_disable()
- #endif
- {
- /*
- * HPL_ptimer_disable sets it so calls to HPL_ptimer are ignored.
- */
- /* ..
- * .. Executable Statements ..
- */
- HPL_ptimer_disabled = 1;
- return;
- /*
- * End of HPL_ptimer_disable
- */
- }
- #ifdef STDC_HEADERS
- double HPL_ptimer_inquire
- (
- const HPL_T_PTIME TMTYPE,
- const int I
- )
- #else
- double HPL_ptimer_inquire( TMTYPE, I )
- const int I;
- const HPL_T_PTIME TMTYPE;
- #endif
- {
- /*
- * Purpose
- * =======
- *
- * HPL_ptimer_inquire returns wall- or cpu- time that has accumulated in
- * timer I.
- *
- * Arguments
- * =========
- *
- * TMTYPE (global input) const HPL_T_PTIME
- * On entry, TMTYPE specifies what time will be returned as fol-
- * lows
- * = HPL_WALL_PTIME : wall clock time is returned,
- * = HPL_CPU_PTIME : CPU time is returned (default).
- *
- * I (global input) const int
- * On entry, I specifies the timer to return.
- *
- * ---------------------------------------------------------------------
- */
- /*
- * .. Local Variables ..
- */
- double time;
- /* ..
- * .. Executable Statements ..
- */
- /*
- * If wall- or cpu-time are not available on this machine, return
- * HPL_PTIMER_ERROR
- */
- if( TMTYPE == HPL_WALL_PTIME )
- {
- if( HPL_ptimer_walltime() == HPL_PTIMER_ERROR )
- time = HPL_PTIMER_ERROR;
- else
- time = HPL_ptimer_wallsec[I];
- }
- else
- {
- if( HPL_ptimer_cputime() == HPL_PTIMER_ERROR )
- time = HPL_PTIMER_ERROR;
- else
- time = HPL_ptimer_cpusec [I];
- }
- return( time );
- /*
- * End of HPL_ptimer_inquire
- */
- }
- #ifdef STDC_HEADERS
- void HPL_ptimer_combine
- (
- MPI_Comm COMM,
- const HPL_T_PTIME_OP OPE,
- const HPL_T_PTIME TMTYPE,
- const int N,
- const int IBEG,
- double * TIMES
- )
- #else
- void HPL_ptimer_combine( COMM, OPE, TMTYPE, N, IBEG, TIMES )
- const int IBEG, N;
- const HPL_T_PTIME_OP OPE;
- const HPL_T_PTIME TMTYPE;
- MPI_Comm COMM;
- double * TIMES;
- #endif
- {
- /*
- * Purpose
- * =======
- *
- * HPL_ptimer_combine combines the timing information stored on a scope
- * of processes into the user TIMES array.
- *
- * Arguments
- * =========
- *
- * COMM (global/local input) MPI_Comm
- * The MPI communicator identifying the process collection on
- * which the timings are taken.
- *
- * OPE (global input) const HPL_T_PTIME_OP
- * On entry, OP specifies what combine operation should be done
- * as follows:
- * = HPL_AMAX_PTIME get max. time on any process (default),
- * = HPL_AMIN_PTIME get min. time on any process,
- * = HPL_SUM_PTIME get sum of times across processes.
- *
- * TMTYPE (global input) const HPL_T_PTIME
- * On entry, TMTYPE specifies what time will be returned as fol-
- * lows
- * = HPL_WALL_PTIME : wall clock time is returned,
- * = HPL_CPU_PTIME : CPU time is returned (default).
- *
- * N (global input) const int
- * On entry, N specifies the number of timers to combine.
- *
- * IBEG (global input) const int
- * On entry, IBEG specifies the first timer to be combined.
- *
- * TIMES (global output) double *
- * On entry, TIMES is an array of dimension at least N. On exit,
- * this array contains the requested timing information.
- *
- * ---------------------------------------------------------------------
- */
- /*
- * .. Local Variables ..
- */
- int i, tmpdis;
- /* ..
- * .. Executable Statements ..
- */
- tmpdis = HPL_ptimer_disabled; HPL_ptimer_disabled = 1;
- /*
- * Timer has been disabled for combine operation - copy timing informa-
- * tion into user times array. If wall- or cpu-time are not available
- * on this machine, fill in times with HPL_PTIMER_ERROR flag and return.
- */
- if( TMTYPE == HPL_WALL_PTIME )
- {
- if( HPL_ptimer_walltime() == HPL_PTIMER_ERROR )
- { for( i = 0; i < N; i++ ) TIMES[i] = HPL_PTIMER_ERROR; return; }
- else
- { for( i = 0; i < N; i++ ) TIMES[i] = HPL_ptimer_wallsec[IBEG+i]; }
- }
- else
- {
- if( HPL_ptimer_cputime() == HPL_PTIMER_ERROR )
- { for( i = 0; i < N; i++ ) TIMES[i] = HPL_PTIMER_ERROR; return; }
- else
- { for( i = 0; i < N; i++ ) TIMES[i] = HPL_ptimer_cpusec[IBEG+i]; }
- }
- /*
- * Combine all nodes information, restore HPL_ptimer_disabled, and return
- */
- for( i = 0; i < N; i++ ) {
- TIMES[i] = Mmax( HPL_rzero, TIMES[i] );
- }
- if( OPE == HPL_AMAX_PTIME )
- (void) HPL_all_reduce( (void *)(TIMES), N, HPL_DOUBLE, HPL_max, COMM );
- else if( OPE == HPL_AMIN_PTIME )
- (void) HPL_all_reduce( (void *)(TIMES), N, HPL_DOUBLE, HPL_min, COMM );
- else if( OPE == HPL_SUM_PTIME )
- (void) HPL_all_reduce( (void *)(TIMES), N, HPL_DOUBLE, HPL_sum, COMM );
- else
- (void) HPL_all_reduce( (void *)(TIMES), N, HPL_DOUBLE, HPL_max, COMM );
- HPL_ptimer_disabled = tmpdis;
- /*
- * End of HPL_ptimer_combine
- */
- }
|