/* Cheby.f -- translated by f2c (version of 20 August 1993  13:15:44).
   You must link the resulting object file with the libraries:
	-lf2c -lm   (in that order)
*/

#include "f2c.h"

/* Table of constant values */

static integer c__1 = 1;
static doublereal c_b5 = -1.;
static doublereal c_b6 = 1.;

/*  -- Iterative template routine --
*     Univ. of Tennessee and Oak Ridge National Laboratory
*     October 1, 1993
*     Details of this algorithm are described in "Templates for the
*     Solution of Linear Systems: Building Blocks for Iterative
*     Methods", Barrett, Berry, Chan, Demmel, Donato, Dongarra,
*     Eijkhout, Pozo, Romine, and van der Vorst, SIAM Publications,
*     1993. (ftp netlib2.cs.utk.edu; cd linalg; get templates.ps).
*
*  Purpose
*  =======
*
*  CHEBY solves the linear system Ax = b using the Chebyshev iterative
*  method with preconditioning. This version requires explicit
*  knowledge of the maximum and minimum eigenvalues. Note that these
*  eigenvalues must be real positive, which is the case for the
*  symmetric positive definite system.
*
*  Convergence test: ( norm( b - A*x ) / norm( b ) ) < TOL.
*  For other measures, see the above reference.
*
*  Arguments
*  =========
*
*  N       (input) INTEGER.
*          On entry, the dimension of the matrix.
*          Unchanged on exit.
*
*  B       (input) DOUBLE PRECISION array, dimension N.
*          On entry, right hand side vector B.
*          Unchanged on exit.
*
*  X       (input/output) DOUBLE PRECISION array, dimension N.
*          On input, the initial guess. This is commonly set to
*          the zero vector.
*          On exit, if INFO = 0, the iterated approximate solution.
*
*  WORK    (workspace) DOUBLE PRECISION array, dimension (LDW,3).
*          Workspace for residual, direction vector, etc.
*
*  LDW     (input) INTEGER
*          The leading dimension of the array WORK. LDW >= max(1,N).
*
*  ITER    (input/output) INTEGER
*          On input, the maximum iterations to be performed.
*          On output, actual number of iterations performed.
*
*  RESID   (input/output) DOUBLE PRECISION
*          On input, the allowable convergence measure for
*          norm( b - A*x ) / norm( b ).
*          On output, the final value of this measure.
*
*  MATVEC  (external subroutine)
*          The user must provide a subroutine to perform the
*          matrix-vector product
*
*               y := alpha*A*x + beta*y,
*
*          where alpha and beta are scalars, x and y are vectors,
*          and A is a matrix. Vector x must remain unchanged.
*          The solution is over-written on vector y.
*
*          The call is:
*
*             CALL MATVEC( ALPHA, X, BETA, Y )
*
*          The matrix is passed into the routine in a common block.
*
*  PSOLVE  (external subroutine)
*          The user must provide a subroutine to perform the
*          preconditioner solve routine for the linear system
*
*               M*x = b,
*
*          where x and b are vectors, and M a matrix. Vector b must
*          remain unchanged.
*          The solution is over-written on vector x.
*
*          The call is:
*
*             CALL PSOLVE( X, B )
*
*         The preconditioner is passed into the routine in a common block
*
*
*  INFO    (output) INTEGER
*
*          =  0: Successful exit. Iterated approximate solution returned.
*
*
*          >  0: Convergence to tolerance not achieved. This will be
*                set to the number of iterations performed.
*
*          <  0: Illegal input parameter.
*
*                   -1: matrix dimension N < 0
*                   -2: LDW < N
*                   -3: Maximum number of iterations ITER <= 0.
*
*  BLAS CALLS:   DAXPY, DCOPY, DDOT, DNRM2
*  ============================================================ */

int cheby_(n, b, x, work, ldw, iter, resid, matvec, psolve, info)

   integer *n, *ldw, *iter, *info;
   doublereal *b, *x, *work, *resid;
   int (*matvec) (), (*psolve) ();
{
    /* System generated locals */
    integer work_dim1, work_offset;
    doublereal d__1;

    /* Local variables */
    static doublereal beta, bnrm2;
    extern doublereal dnrm2_();
    static doublereal c, d;
    static integer p, r;
    static doublereal alpha;
    static integer z;
    extern /* Subroutine */ int dcopy_();
    static integer maxit;
    extern /* Subroutine */ int daxpy_(), geteig_();
    static doublereal eigmin, eigmax, tol;


    /* Parameter adjustments */
    work_dim1 = *ldw;
    work_offset = work_dim1 + 1;
    work -= work_offset;
    --x;
    --b;

/*  Executable Statements */

    *info = 0;

/*     Test the input parameters. */

    if (*n < 0) {
	*info = -1;
    } else if (*ldw < max(1,*n)) {
	*info = -2;
    } else if (*iter <= 0) {
	*info = -3;
    }
    if (*info != 0) {
	return 0;
    }

    maxit = *iter;
    tol = *resid;

/*     Get extremal eigenvalues. */

    geteig_(&work[work_offset], ldw, &eigmax, &eigmin);

/*     Alias workspace columns. */

    r = 1;
    p = 2;
    z = 3;

/*     Set initial residual. */

    dcopy_(n, &b[1], &c__1, &work[r * work_dim1 + 1], &c__1);
    if (dnrm2_(n, &x[1], &c__1) != 0.) {
	(*matvec)(&c_b5, &x[1], &c_b6, &work[r * work_dim1 + 1]);
	if (dnrm2_(n, &work[r * work_dim1 + 1], &c__1) < tol) {
	    goto L30;
	}
    }

    bnrm2 = dnrm2_(n, &b[1], &c__1);
    if (bnrm2 == 0.) {
	bnrm2 = 1.;
    }

/*     Initialize ellipse parameters. */

    c = (eigmax - eigmin) / 2.;
    d = (eigmax + eigmin) / 2.;

    *iter = 0;

L10:

/*     Perform Chebyshev iteration. */

    ++(*iter);

    (*psolve)(&work[z * work_dim1 + 1], &work[r * work_dim1 + 1]);
    if (*iter > 1) {
/* Computing 2nd power */
	d__1 = c * alpha / 2.;
	beta = d__1 * d__1;
	alpha = 1. / (d - beta);
	daxpy_(n, &beta, &work[p * work_dim1 + 1], &c__1, &work[z * work_dim1 
		+ 1], &c__1);
	dcopy_(n, &work[z * work_dim1 + 1], &c__1, &work[p * work_dim1 + 1], &
		c__1);
    } else {
	dcopy_(n, &work[z * work_dim1 + 1], &c__1, &work[p * work_dim1 + 1], &
		c__1);
	alpha = 2. / d;
    }

/*        Compute new approximation vector X; check accuracy. */

    daxpy_(n, &alpha, &work[p * work_dim1 + 1], &c__1, &x[1], &c__1);
    d__1 = -alpha;
    (*matvec)(&d__1, &work[p * work_dim1 + 1], &c_b6, &work[r * work_dim1 + 1]
	    );
    *resid = dnrm2_(n, &work[r * work_dim1 + 1], &c__1) / bnrm2;
    if (*resid <= tol) {
	goto L30;
    }
    if (*iter == maxit) {
	goto L20;
    }

    goto L10;

L20:

/*     Iteration fails. */

    *info = 1;
    return 0;

L30:

/*     Iteration successful; return. */

    return 0;

/*     End of CHEBY.f */

}