| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219 | /* dlaneg.f -- translated by f2c (version 20061008).   You must link the resulting object file with libf2c:	on Microsoft Windows system, link with libf2c.lib;	on Linux or Unix systems, link with .../path/to/libf2c.a -lm	or, if you install libf2c.a in a standard place, with -lf2c -lm	-- in that order, at the end of the command line, as in		cc *.o -lf2c -lm	Source for libf2c is in /netlib/f2c/libf2c.zip, e.g.,		http://www.netlib.org/f2c/libf2c.zip*/#include "f2c.h"#include "blaswrap.h"integer _starpu_dlaneg_(integer *n, doublereal *d__, doublereal *lld, doublereal *	sigma, doublereal *pivmin, integer *r__){    /* System generated locals */    integer ret_val, i__1, i__2, i__3, i__4;    /* Local variables */    integer j;    doublereal p, t;    integer bj;    doublereal tmp;    integer neg1, neg2;    doublereal bsav, gamma, dplus;    extern logical _starpu_disnan_(doublereal *);    integer negcnt;    logical sawnan;    doublereal dminus;/*  -- LAPACK auxiliary routine (version 3.2) -- *//*     Univ. of Tennessee, Univ. of California Berkeley and NAG Ltd.. *//*     November 2006 *//*     .. Scalar Arguments .. *//*     .. *//*     .. Array Arguments .. *//*     .. *//*  Purpose *//*  ======= *//*  DLANEG computes the Sturm count, the number of negative pivots *//*  encountered while factoring tridiagonal T - sigma I = L D L^T. *//*  This implementation works directly on the factors without forming *//*  the tridiagonal matrix T.  The Sturm count is also the number of *//*  eigenvalues of T less than sigma. *//*  This routine is called from DLARRB. *//*  The current routine does not use the PIVMIN parameter but rather *//*  requires IEEE-754 propagation of Infinities and NaNs.  This *//*  routine also has no input range restrictions but does require *//*  default exception handling such that x/0 produces Inf when x is *//*  non-zero, and Inf/Inf produces NaN.  For more information, see: *//*    Marques, Riedy, and Voemel, "Benefits of IEEE-754 Features in *//*    Modern Symmetric Tridiagonal Eigensolvers," SIAM Journal on *//*    Scientific Computing, v28, n5, 2006.  DOI 10.1137/050641624 *//*    (Tech report version in LAWN 172 with the same title.) *//*  Arguments *//*  ========= *//*  N       (input) INTEGER *//*          The order of the matrix. *//*  D       (input) DOUBLE PRECISION array, dimension (N) *//*          The N diagonal elements of the diagonal matrix D. *//*  LLD     (input) DOUBLE PRECISION array, dimension (N-1) *//*          The (N-1) elements L(i)*L(i)*D(i). *//*  SIGMA   (input) DOUBLE PRECISION *//*          Shift amount in T - sigma I = L D L^T. *//*  PIVMIN  (input) DOUBLE PRECISION *//*          The minimum pivot in the Sturm sequence.  May be used *//*          when zero pivots are encountered on non-IEEE-754 *//*          architectures. *//*  R       (input) INTEGER *//*          The twist index for the twisted factorization that is used *//*          for the negcount. *//*  Further Details *//*  =============== *//*  Based on contributions by *//*     Osni Marques, LBNL/NERSC, USA *//*     Christof Voemel, University of California, Berkeley, USA *//*     Jason Riedy, University of California, Berkeley, USA *//*  ===================================================================== *//*     .. Parameters .. *//*     Some architectures propagate Infinities and NaNs very slowly, so *//*     the code computes counts in BLKLEN chunks.  Then a NaN can *//*     propagate at most BLKLEN columns before being detected.  This is *//*     not a general tuning parameter; it needs only to be just large *//*     enough that the overhead is tiny in common cases. *//*     .. *//*     .. Local Scalars .. *//*     .. *//*     .. Intrinsic Functions .. *//*     .. *//*     .. External Functions .. *//*     .. *//*     .. Executable Statements .. */    /* Parameter adjustments */    --lld;    --d__;    /* Function Body */    negcnt = 0;/*     I) upper part: L D L^T - SIGMA I = L+ D+ L+^T */    t = -(*sigma);    i__1 = *r__ - 1;    for (bj = 1; bj <= i__1; bj += 128) {	neg1 = 0;	bsav = t;/* Computing MIN */	i__3 = bj + 127, i__4 = *r__ - 1;	i__2 = min(i__3,i__4);	for (j = bj; j <= i__2; ++j) {	    dplus = d__[j] + t;	    if (dplus < 0.) {		++neg1;	    }	    tmp = t / dplus;	    t = tmp * lld[j] - *sigma;/* L21: */	}	sawnan = _starpu_disnan_(&t);/*     Run a slower version of the above loop if a NaN is detected. *//*     A NaN should occur only with a zero pivot after an infinite *//*     pivot.  In that case, substituting 1 for T/DPLUS is the *//*     correct limit. */	if (sawnan) {	    neg1 = 0;	    t = bsav;/* Computing MIN */	    i__3 = bj + 127, i__4 = *r__ - 1;	    i__2 = min(i__3,i__4);	    for (j = bj; j <= i__2; ++j) {		dplus = d__[j] + t;		if (dplus < 0.) {		    ++neg1;		}		tmp = t / dplus;		if (_starpu_disnan_(&tmp)) {		    tmp = 1.;		}		t = tmp * lld[j] - *sigma;/* L22: */	    }	}	negcnt += neg1;/* L210: */    }/*     II) lower part: L D L^T - SIGMA I = U- D- U-^T */    p = d__[*n] - *sigma;    i__1 = *r__;    for (bj = *n - 1; bj >= i__1; bj += -128) {	neg2 = 0;	bsav = p;/* Computing MAX */	i__3 = bj - 127;	i__2 = max(i__3,*r__);	for (j = bj; j >= i__2; --j) {	    dminus = lld[j] + p;	    if (dminus < 0.) {		++neg2;	    }	    tmp = p / dminus;	    p = tmp * d__[j] - *sigma;/* L23: */	}	sawnan = _starpu_disnan_(&p);/*     As above, run a slower version that substitutes 1 for Inf/Inf. */	if (sawnan) {	    neg2 = 0;	    p = bsav;/* Computing MAX */	    i__3 = bj - 127;	    i__2 = max(i__3,*r__);	    for (j = bj; j >= i__2; --j) {		dminus = lld[j] + p;		if (dminus < 0.) {		    ++neg2;		}		tmp = p / dminus;		if (_starpu_disnan_(&tmp)) {		    tmp = 1.;		}		p = tmp * d__[j] - *sigma;/* L24: */	    }	}	negcnt += neg2;/* L230: */    }/*     III) Twist index *//*       T was shifted by SIGMA initially. */    gamma = t + *sigma + p;    if (gamma < 0.) {	++negcnt;    }    ret_val = negcnt;    return ret_val;} /* _starpu_dlaneg_ */
 |