| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317 | 
							- /* _starpu_dla_gbamv.f -- translated by f2c (version 20061008).
 
-    You must link the resulting object file with libf2c:
 
- 	on Microsoft Windows system, link with libf2c.lib;
 
- 	on Linux or Unix systems, link with .../path/to/libf2c.a -lm
 
- 	or, if you install libf2c.a in a standard place, with -lf2c -lm
 
- 	-- in that order, at the end of the command line, as in
 
- 		cc *.o -lf2c -lm
 
- 	Source for libf2c is in /netlib/f2c/libf2c.zip, e.g.,
 
- 		http://www.netlib.org/f2c/libf2c.zip
 
- */
 
- #include "f2c.h"
 
- #include "blaswrap.h"
 
- /* Subroutine */ int _starpu_dla_gbamv__(integer *trans, integer *m, integer *n, 
 
- 	integer *kl, integer *ku, doublereal *alpha, doublereal *ab, integer *
 
- 	ldab, doublereal *x, integer *incx, doublereal *beta, doublereal *y, 
 
- 	integer *incy)
 
- {
 
-     /* System generated locals */
 
-     integer ab_dim1, ab_offset, i__1, i__2, i__3, i__4;
 
-     doublereal d__1;
 
-     /* Builtin functions */
 
-     double d_sign(doublereal *, doublereal *);
 
-     /* Local variables */
 
-     extern integer _starpu_ilatrans_(char *);
 
-     integer i__, j;
 
-     logical symb_zero__;
 
-     integer kd, iy, jx, kx, ky, info;
 
-     doublereal temp;
 
-     integer lenx, leny;
 
-     doublereal safe1;
 
-     extern doublereal _starpu_dlamch_(char *);
 
-     extern /* Subroutine */ int _starpu_xerbla_(char *, integer *);
 
- /*     -- LAPACK routine (version 3.2)                                 -- */
 
- /*     -- Contributed by James Demmel, Deaglan Halligan, Yozo Hida and -- */
 
- /*     -- Jason Riedy of Univ. of California Berkeley.                 -- */
 
- /*     -- November 2008                                                -- */
 
- /*     -- LAPACK is a software package provided by Univ. of Tennessee, -- */
 
- /*     -- Univ. of California Berkeley and NAG Ltd.                    -- */
 
- /*     .. */
 
- /*     .. Scalar Arguments .. */
 
- /*     .. */
 
- /*     .. Array Arguments .. */
 
- /*     .. */
 
- /*  Purpose */
 
- /*  ======= */
 
- /*  DLA_GEAMV  performs one of the matrix-vector operations */
 
- /*          y := alpha*abs(A)*abs(x) + beta*abs(y), */
 
- /*     or   y := alpha*abs(A)'*abs(x) + beta*abs(y), */
 
- /*  where alpha and beta are scalars, x and y are vectors and A is an */
 
- /*  m by n matrix. */
 
- /*  This function is primarily used in calculating error bounds. */
 
- /*  To protect against underflow during evaluation, components in */
 
- /*  the resulting vector are perturbed away from zero by (N+1) */
 
- /*  times the underflow threshold.  To prevent unnecessarily large */
 
- /*  errors for block-structure embedded in general matrices, */
 
- /*  "symbolically" zero components are not perturbed.  A zero */
 
- /*  entry is considered "symbolic" if all multiplications involved */
 
- /*  in computing that entry have at least one zero multiplicand. */
 
- /*  Parameters */
 
- /*  ========== */
 
- /*  TRANS  - INTEGER */
 
- /*           On entry, TRANS specifies the operation to be performed as */
 
- /*           follows: */
 
- /*             BLAS_NO_TRANS      y := alpha*abs(A)*abs(x) + beta*abs(y) */
 
- /*             BLAS_TRANS         y := alpha*abs(A')*abs(x) + beta*abs(y) */
 
- /*             BLAS_CONJ_TRANS    y := alpha*abs(A')*abs(x) + beta*abs(y) */
 
- /*           Unchanged on exit. */
 
- /*  M      - INTEGER */
 
- /*           On entry, M specifies the number of rows of the matrix A. */
 
- /*           M must be at least zero. */
 
- /*           Unchanged on exit. */
 
- /*  N      - INTEGER */
 
- /*           On entry, N specifies the number of columns of the matrix A. */
 
- /*           N must be at least zero. */
 
- /*           Unchanged on exit. */
 
- /*  KL     - INTEGER */
 
- /*           The number of subdiagonals within the band of A.  KL >= 0. */
 
- /*  KU     - INTEGER */
 
- /*           The number of superdiagonals within the band of A.  KU >= 0. */
 
- /*  ALPHA  - DOUBLE PRECISION */
 
- /*           On entry, ALPHA specifies the scalar alpha. */
 
- /*           Unchanged on exit. */
 
- /*  A      - DOUBLE PRECISION   array of DIMENSION ( LDA, n ) */
 
- /*           Before entry, the leading m by n part of the array A must */
 
- /*           contain the matrix of coefficients. */
 
- /*           Unchanged on exit. */
 
- /*  LDA    - INTEGER */
 
- /*           On entry, LDA specifies the first dimension of A as declared */
 
- /*           in the calling (sub) program. LDA must be at least */
 
- /*           max( 1, m ). */
 
- /*           Unchanged on exit. */
 
- /*  X      - DOUBLE PRECISION   array of DIMENSION at least */
 
- /*           ( 1 + ( n - 1 )*abs( INCX ) ) when TRANS = 'N' or 'n' */
 
- /*           and at least */
 
- /*           ( 1 + ( m - 1 )*abs( INCX ) ) otherwise. */
 
- /*           Before entry, the incremented array X must contain the */
 
- /*           vector x. */
 
- /*           Unchanged on exit. */
 
- /*  INCX   - INTEGER */
 
- /*           On entry, INCX specifies the increment for the elements of */
 
- /*           X. INCX must not be zero. */
 
- /*           Unchanged on exit. */
 
- /*  BETA   - DOUBLE PRECISION */
 
- /*           On entry, BETA specifies the scalar beta. When BETA is */
 
- /*           supplied as zero then Y need not be set on input. */
 
- /*           Unchanged on exit. */
 
- /*  Y      - DOUBLE PRECISION   array of DIMENSION at least */
 
- /*           ( 1 + ( m - 1 )*abs( INCY ) ) when TRANS = 'N' or 'n' */
 
- /*           and at least */
 
- /*           ( 1 + ( n - 1 )*abs( INCY ) ) otherwise. */
 
- /*           Before entry with BETA non-zero, the incremented array Y */
 
- /*           must contain the vector y. On exit, Y is overwritten by the */
 
- /*           updated vector y. */
 
- /*  INCY   - INTEGER */
 
- /*           On entry, INCY specifies the increment for the elements of */
 
- /*           Y. INCY must not be zero. */
 
- /*           Unchanged on exit. */
 
- /*  Level 2 Blas routine. */
 
- /*     .. */
 
- /*     .. Parameters .. */
 
- /*     .. */
 
- /*     .. Local Scalars .. */
 
- /*     .. */
 
- /*     .. External Subroutines .. */
 
- /*     .. */
 
- /*     .. External Functions .. */
 
- /*     .. */
 
- /*     .. Intrinsic Functions .. */
 
- /*     .. */
 
- /*     .. Executable Statements .. */
 
- /*     Test the input parameters. */
 
-     /* Parameter adjustments */
 
-     ab_dim1 = *ldab;
 
-     ab_offset = 1 + ab_dim1;
 
-     ab -= ab_offset;
 
-     --x;
 
-     --y;
 
-     /* Function Body */
 
-     info = 0;
 
-     if (! (*trans == _starpu_ilatrans_("N") || *trans == _starpu_ilatrans_("T") || *trans == _starpu_ilatrans_("C"))) {
 
- 	info = 1;
 
-     } else if (*m < 0) {
 
- 	info = 2;
 
-     } else if (*n < 0) {
 
- 	info = 3;
 
-     } else if (*kl < 0) {
 
- 	info = 4;
 
-     } else if (*ku < 0) {
 
- 	info = 5;
 
-     } else if (*ldab < *kl + *ku + 1) {
 
- 	info = 6;
 
-     } else if (*incx == 0) {
 
- 	info = 8;
 
-     } else if (*incy == 0) {
 
- 	info = 11;
 
-     }
 
-     if (info != 0) {
 
- 	_starpu_xerbla_("DLA_GBAMV ", &info);
 
- 	return 0;
 
-     }
 
- /*     Quick return if possible. */
 
-     if (*m == 0 || *n == 0 || *alpha == 0. && *beta == 1.) {
 
- 	return 0;
 
-     }
 
- /*     Set  LENX  and  LENY, the lengths of the vectors x and y, and set */
 
- /*     up the start points in  X  and  Y. */
 
-     if (*trans == _starpu_ilatrans_("N")) {
 
- 	lenx = *n;
 
- 	leny = *m;
 
-     } else {
 
- 	lenx = *m;
 
- 	leny = *n;
 
-     }
 
-     if (*incx > 0) {
 
- 	kx = 1;
 
-     } else {
 
- 	kx = 1 - (lenx - 1) * *incx;
 
-     }
 
-     if (*incy > 0) {
 
- 	ky = 1;
 
-     } else {
 
- 	ky = 1 - (leny - 1) * *incy;
 
-     }
 
- /*     Set SAFE1 essentially to be the underflow threshold times the */
 
- /*     number of additions in each row. */
 
-     safe1 = _starpu_dlamch_("Safe minimum");
 
-     safe1 = (*n + 1) * safe1;
 
- /*     Form  y := alpha*abs(A)*abs(x) + beta*abs(y). */
 
- /*     The O(M*N) SYMB_ZERO tests could be replaced by O(N) queries to */
 
- /*     the inexact flag.  Still doesn't help change the iteration order */
 
- /*     to per-column. */
 
-     kd = *ku + 1;
 
-     iy = ky;
 
-     if (*incx == 1) {
 
- 	i__1 = leny;
 
- 	for (i__ = 1; i__ <= i__1; ++i__) {
 
- 	    if (*beta == 0.) {
 
- 		symb_zero__ = TRUE_;
 
- 		y[iy] = 0.;
 
- 	    } else if (y[iy] == 0.) {
 
- 		symb_zero__ = TRUE_;
 
- 	    } else {
 
- 		symb_zero__ = FALSE_;
 
- 		y[iy] = *beta * (d__1 = y[iy], abs(d__1));
 
- 	    }
 
- 	    if (*alpha != 0.) {
 
- /* Computing MAX */
 
- 		i__2 = i__ - *ku;
 
- /* Computing MIN */
 
- 		i__4 = i__ + *kl;
 
- 		i__3 = min(i__4,lenx);
 
- 		for (j = max(i__2,1); j <= i__3; ++j) {
 
- 		    if (*trans == _starpu_ilatrans_("N")) {
 
- 			temp = (d__1 = ab[kd + i__ - j + j * ab_dim1], abs(
 
- 				d__1));
 
- 		    } else {
 
- 			temp = (d__1 = ab[j + (kd + i__ - j) * ab_dim1], abs(
 
- 				d__1));
 
- 		    }
 
- 		    symb_zero__ = symb_zero__ && (x[j] == 0. || temp == 0.);
 
- 		    y[iy] += *alpha * (d__1 = x[j], abs(d__1)) * temp;
 
- 		}
 
- 	    }
 
- 	    if (! symb_zero__) {
 
- 		y[iy] += d_sign(&safe1, &y[iy]);
 
- 	    }
 
- 	    iy += *incy;
 
- 	}
 
-     } else {
 
- 	i__1 = leny;
 
- 	for (i__ = 1; i__ <= i__1; ++i__) {
 
- 	    if (*beta == 0.) {
 
- 		symb_zero__ = TRUE_;
 
- 		y[iy] = 0.;
 
- 	    } else if (y[iy] == 0.) {
 
- 		symb_zero__ = TRUE_;
 
- 	    } else {
 
- 		symb_zero__ = FALSE_;
 
- 		y[iy] = *beta * (d__1 = y[iy], abs(d__1));
 
- 	    }
 
- 	    if (*alpha != 0.) {
 
- 		jx = kx;
 
- /* Computing MAX */
 
- 		i__3 = i__ - *ku;
 
- /* Computing MIN */
 
- 		i__4 = i__ + *kl;
 
- 		i__2 = min(i__4,lenx);
 
- 		for (j = max(i__3,1); j <= i__2; ++j) {
 
- 		    if (*trans == _starpu_ilatrans_("N")) {
 
- 			temp = (d__1 = ab[kd + i__ - j + j * ab_dim1], abs(
 
- 				d__1));
 
- 		    } else {
 
- 			temp = (d__1 = ab[j + (kd + i__ - j) * ab_dim1], abs(
 
- 				d__1));
 
- 		    }
 
- 		    symb_zero__ = symb_zero__ && (x[jx] == 0. || temp == 0.);
 
- 		    y[iy] += *alpha * (d__1 = x[jx], abs(d__1)) * temp;
 
- 		    jx += *incx;
 
- 		}
 
- 	    }
 
- 	    if (! symb_zero__) {
 
- 		y[iy] += d_sign(&safe1, &y[iy]);
 
- 	    }
 
- 	    iy += *incy;
 
- 	}
 
-     }
 
-     return 0;
 
- /*     End of DLA_GBAMV */
 
- } /* _starpu_dla_gbamv__ */
 
 
  |