C     stellinstall/dutfx_8f_source.html

C**********************************************************************

C

C     Copyright (C) 1992  Roland W. Freund and Noel M. Nachtigal

C     All rights reserved.

C

C     This code is part of a copyrighted package.  For details, see the

C     file "cpyrit.doc" in the top-level directory.

C

C     *****************************************************************

C     ANY USE OF  THIS CODE CONSTITUTES ACCEPTANCE OF  THE TERMS OF THE

C                             COPYRIGHT NOTICE

C     *****************************************************************

C

C**********************************************************************

C

C     This file contains the routine for the TFQMR algorithm.

C

C**********************************************************************

C

      SUBROUTINE dutfx (NDIM,NLEN,NLIM,VECS,TOL,INFO)
      USE stel_kinds, ONLY: rprec
      IMPLICIT NONE
C
C     Purpose:
C     This subroutine uses the TFQMR (Transpose Free, QMR) algorithm to
C     solve linear systems.
C     It runs the  algorithm to convergence  or until  a user-specified
C     limit on the number of iterations is reached.
C
C     The  code is  set up  to solve  the system  A x = b  with initial
C     guess x_0 = 0.  Here  A x = b  denotes the preconditioned system,
C     and  it  is  connected with the  original system as follows.  Let
C     B y = c be the original unpreconditioned system to be solved, and
C     let y_0 be an arbitrary initial guess for its solution.  Then:
C          A x = b, where  A = M_1^{-1} B M_2^{-1},
C                          x = M_2 (y - y_0), b = M_1^{-1} (c - B y_0).
C     Here M = M_1 M_2 is the preconditioner.
C
C     To recover the final iterate y_n for the original system B y = c
C     from the final iterate x_n for the preconditioned system A x = b,
C     set
C               y_n = y_0 + M_2^{-1} x_n.
C
C     The algorithm was first described in the RIACS Technical Report
C     91.18, `A Transpose-Free  Quasi-Minimal  Residual Algorithm  for
C     Non-Hermitian Linear Systems`, by Roland Freund, September 1991,
C     which subsequently appeared in  SIAM J. Sci. Comput., 14 (1993),
C     pp. 470--482.
C
C     Parameters (summary derived from the code below; the file
C     "dutfx.doc" in the current directory is the full description):
C     NDIM    (in)     leading dimension of VECS; must be >= 1 and
C                      >= NLEN.
C     NLEN    (in)     length of the vectors; must be >= 1.
C     NLIM    (in/out) on entry the iteration limit (>= 1); on final
C                      exit it is overwritten with the value of the
C                      iteration counter N that was reached.
C     VECS    (in/out) NDIM x 9 work array.  Column 2 is read as the
C                      right-hand side b, column 1 is zeroed and then
C                      accumulates the iterate x, column 3 is the
C                      auxiliary starting vector (filled by DRANDN
C                      unless the INIT flag is set), columns 4-9 are
C                      work space.
C     TOL     (in/out) convergence tolerance for the relative residual
C                      norm.  A value <= 0 is replaced by
C                      SQRT(DLAMCH('E')).  If TOL >= 1 the routine
C                      returns at once with x = 0.
C     INFO(1) (in/out) on the first call, a packed decimal flag word
C                      (negative values are treated as 0):
C                         INFO(1)/100000      -> INIT
C                         next digit (10**4)  -> TRES
C                         next two digits     -> TF (output unit)
C                         last two digits     -> VF (output unit)
C                      On final exit, the status code:
C                         0  converged (or nothing to do),
C                         1  invalid reverse communication call,
C                         2  invalid NDIM, NLEN or NLIM,
C                         4  residual bound check failed, or the
C                            iteration limit was reached,
C                         8  breakdown (a required inner product is
C                            exactly zero).
C     INFO(2) (in/out) reverse communication flag.  On entry: 0 for a
C                      first call, 1 when returning a product.  On
C                      exit: 1 means the caller must compute
C                         VECS(:,INFO(4)) = A * VECS(:,INFO(3))
C                      and call again; 0 means the routine is done.
C     INFO(3), INFO(4) (out) column indices for the requested product.
C
C     The iteration state is kept in SAVEd local variables between
C     reverse communication calls, so interleaved solves would share
C     (and corrupt) that state.
C
C     External routines used:
C     double precision dlamch(ch)
C        LAPACK routine, computes machine-related constants.
C     double precision dnrm2(n,x,incx)
C        BLAS-1 routine, computes the 2-norm of x.
C     subroutine daxpby(n,z,a,x,b,y)
C        Library routine, computes z = a * x + b * y.
C     double precision ddot(n,x,incx,y,incy)
C        BLAS-1 routine, computes y^H * x.
C     subroutine drandn(n,x,seed)
C        Library routine, fills x with random numbers.
C
C     Noel M. Nachtigal
C     April 13, 1993
C
C**********************************************************************
C
      EXTERNAL dlamch, daxpby, drandn, dnrm2, ddot
      REAL(rprec)  :: DLAMCH, DNRM2, DDOT
C
      INTEGER,     INTENT(IN)    :: NDIM, NLEN
      INTEGER,     INTENT(INOUT) :: NLIM
      INTEGER,     INTENT(INOUT) :: INFO(4)
      REAL(rprec), INTENT(INOUT) :: VECS(NDIM,9)
      REAL(rprec), INTENT(INOUT) :: TOL
C
C     Miscellaneous parameters.
C
      REAL(rprec) DHUN, DONE, DTEN, DZERO
      parameter(dhun = 1.0d2,done = 1.0d0,dten = 1.0d1,dzero = 0.0d0)
C
C     Local variables, permanent.  These carry the iteration state
C     across the RETURNs used for reverse communication.  RETLBL is
C     the label to resume at; it is 0 whenever no solve is in progress.
C
      INTEGER     :: IERR, N, RETLBL=0, tf, tres, vf
      SAVE        :: ierr, n, retlbl, tf, tres, vf
      REAL(rprec) :: ALPHA, BETA, ETA, RHO
      SAVE        :: alpha, beta, eta, rho
      REAL(rprec) :: COS1, VAR, R0, RESN, TAU, UCHK, UNRM
      SAVE        :: cos1, var, r0, resn, tau, uchk, unrm
C
C     Local variables, transient.
C
      INTEGER INIT, REVCOM
      REAL(rprec) DTMP
C
C     Check the reverse communication flag to see where to branch.
C        REVCOM   RETLBL      Comment
C           0        0    first call, go to label 10
C           1       30    returning from AXB, go to label 30
C           1       40    returning from AXB, go to label 40
C           1       60    returning from AXB, go to label 60
C           1       70    returning from AXB, go to label 70
C     Any other combination is an invalid call (IERR = 1).
C
      revcom  = info(2)
      info(2) = 0
      IF (revcom.EQ.0) THEN
         n = 0
         IF (retlbl.EQ.0) GO TO 10
      ELSE IF (revcom.EQ.1) THEN
         IF (retlbl.EQ.30) THEN
            GO TO 30
         ELSE IF (retlbl.EQ.40) THEN
            GO TO 40
         ELSE IF (retlbl.EQ.60) THEN
            GO TO 60
         ELSE IF (retlbl.EQ.70) THEN
            GO TO 70
         END IF
      END IF
      ierr = 1
      GO TO 90
C
C     Check whether the inputs are valid.
C
 10   ierr = 0
      IF (ndim.LT.1)    ierr = 2
      IF (nlen.LT.1)    ierr = 2
      IF (nlim.LT.1)    ierr = 2
      IF (nlen.GT.ndim) ierr = 2
      IF (ierr.NE.0) GO TO 90
C
C     Extract from INFO the output units TF and VF, the true residual
C     flag TRES, and the left starting vector flag INIT.
C
      vf   = max(info(1),0)
      init = vf / 100000
      vf   = vf - init * 100000
      tres = vf / 10000
      vf   = vf - tres * 10000
      tf   = vf / 100
      vf   = vf - tf * 100
C
C     Check the convergence tolerance.
C
      IF (tol.LE.dzero) tol = sqrt(dlamch('E'))
C
C     Start the trace messages and convergence history.
C     Each stream gets its own header: the TF header goes to unit TF
C     (it used to be written to unit VF, which is wrong whenever the
C     two units differ and writes to unit 0 when VF is not requested).
C
      IF (vf.NE.0) THEN
         WRITE (vf, *) '      N    2N-1     UNRM       RESN'
         WRITE (vf,'(2I8,1P,2E11.4)') 0, 0, done, done
      ENDIF
      IF (tf.NE.0) THEN
         WRITE (tf, *) '      N    2N-1     UNRM       RESN'
         WRITE (tf,'(2I8,1P,2E11.4)') 0, 0, done, done
      ENDIF
C
C     Set x_0 = 0 and compute the norm of the initial residual.
C     Column 5 receives a copy of the right-hand side (column 2).
C
      CALL daxpby (nlen,vecs(1,5),done,vecs(1,2),dzero,vecs(1,5))
      CALL daxpby (nlen,vecs(1,1),dzero,vecs(1,1),dzero,vecs(1,1))
      r0 = dnrm2(nlen,vecs(1,5),1)
C
C     Nothing to do if the tolerance is already met by x_0 = 0 or the
C     right-hand side is zero; IERR is still 0 here.
C
      IF ((tol.GE.done).OR.(r0.EQ.dzero)) GO TO 90
C
C     Check whether the auxiliary vector must be supplied.
C
      IF (init.EQ.0) CALL drandn (nlen,vecs(1,3),1)
C
C     Initialize the variables.  TAU holds the square of the quantity
C     tau; the square root is taken when the bound UNRM is formed.
C
      n    = 1
      resn = done
      rho  = done
      var  = dzero
      eta  = dzero
      tau  = r0 * r0
      ierr = 8
      CALL daxpby (nlen,vecs(1,8),dzero,vecs(1,8),dzero,vecs(1,8))
      CALL daxpby (nlen,vecs(1,4),dzero,vecs(1,4),dzero,vecs(1,4))
      CALL daxpby (nlen,vecs(1,6),dzero,vecs(1,6),dzero,vecs(1,6))
C
C     This is one step of the TFQMR algorithm.
C     Compute \beta_{n-1} and \rho_{n-1}.
C
 20   dtmp = ddot(nlen,vecs(1,3),1,vecs(1,5),1)
      beta = dtmp / rho
      rho  = dtmp
C
C     Compute y_{2n-1}, v_{n-1}, and A y_{2n-1}.
C
      CALL daxpby (nlen,vecs(1,4),beta,vecs(1,4),done,vecs(1,8))
      CALL daxpby (nlen,vecs(1,6),done,vecs(1,5),beta,vecs(1,6))
C
C     Have the caller carry out AXB, then return here.
C        CALL AXB (VECS(1,6),VECS(1,9))
C
      info(2) = 1
      info(3) = 6
      info(4) = 9
      retlbl  = 30
      RETURN
 30   CALL daxpby (nlen,vecs(1,4),beta,vecs(1,4),done,vecs(1,9))
C
C     Compute \sigma{n-1} and check for breakdowns.
C     RHO is tested here, before the next pass divides by it.
C
      dtmp = ddot(nlen,vecs(1,3),1,vecs(1,4),1)
      IF ((dtmp.EQ.dzero).OR.(rho.EQ.dzero)) THEN
         ierr = 8
         GO TO 90
      END IF
C
C     Compute \alpha_{n-1}, d_{2n-1} and w_{2n}.
C
      alpha = rho / dtmp
      dtmp  = var * eta / alpha
      CALL daxpby (nlen,vecs(1,7),done,vecs(1,6),dtmp,vecs(1,7))
      CALL daxpby (nlen,vecs(1,5),done,vecs(1,5),-alpha,vecs(1,9))
C
C     Compute \varepsilon_{2n-1}^2, \eta_{2n-1}^2, c_{2n-1}^2, and
C     \tau_{2n-1}^2.
C
      dtmp = dnrm2(nlen,vecs(1,5),1)
      dtmp = dtmp * dtmp
      var  = dtmp / tau
      cos1  = done / ( done + var )
      tau  = dtmp * cos1
      eta  = alpha * cos1
C
C     Compute x_{2n-1} and the upper bound for its residual norm.
C
      CALL daxpby (nlen,vecs(1,1),done,vecs(1,1),eta,vecs(1,7))
C
C     Compute the residual norm upper bound.
C     If the scaled upper bound is within one order of magnitude of the
C     target convergence norm, compute the true residual norm.
C     When the true residual is skipped, UCHK = UNRM makes the bound
C     check below a no-op and RESN keeps its last computed value.
C
      unrm = sqrt((2*n) * tau) / r0
      uchk = unrm
      IF ((tres.EQ.0).AND.(unrm/tol.GT.dten)) GO TO 50
C
C     Have the caller carry out AXB, then return here.
C        CALL AXB (VECS(1,1),VECS(1,9))
C
      info(2) = 1
      info(3) = 1
      info(4) = 9
      retlbl  = 40
      RETURN
C
C     True residual b - A x, scaled by the initial residual norm.
C
 40   CALL daxpby (nlen,vecs(1,9),done,vecs(1,2),-done,vecs(1,9))
      resn = dnrm2(nlen,vecs(1,9),1) / r0
      uchk = resn
C
C     Output the trace messages and convergence history.
C
 50   IF (vf.NE.0) WRITE (vf,'(2I8,2E11.4)') n, 2*n-1, unrm, resn
      IF (tf.NE.0) WRITE (tf,'(2I8,2E11.4)') n, 2*n-1, unrm, resn
C
C     Check for convergence or termination.  Stop if:
C         1. algorithm converged;
C         2. the residual norm upper bound is smaller than the computed
C     residual norm by a factor of at least 100.
C
      IF (resn.LE.tol) THEN
         ierr = 0
         GO TO 90
      ELSE IF (unrm.LT.uchk/dhun) THEN
         ierr = 4
         GO TO 90
      END IF
C
C     Compute y_{2n}, A y_{2n}, d_{2n}, and w_{2n+1}.
C     VAR * COS1 equals VAR * ETA / ALPHA because ETA = ALPHA * COS1.
C
      CALL daxpby (nlen,vecs(1,6),done,vecs(1,6),-alpha,vecs(1,4))
      dtmp = var * cos1
      CALL daxpby (nlen,vecs(1,7),done,vecs(1,6),dtmp,vecs(1,7))
C
C     Have the caller carry out AXB, then return here.
C        CALL AXB (VECS(1,6),VECS(1,8))
C
      info(2) = 1
      info(3) = 6
      info(4) = 8
      retlbl  = 60
      RETURN
 60   CALL daxpby (nlen,vecs(1,5),done,vecs(1,5),-alpha,vecs(1,8))
C
C     Compute \varepsilon_{2n}^2, \eta_{2n}^2, c_{2n}^2, and
C     \tau_{2n}^2.
C
      dtmp = dnrm2(nlen,vecs(1,5),1)
      dtmp = dtmp * dtmp
      var  = dtmp / tau
      cos1 = done / ( done + var )
      tau  = dtmp * cos1
      eta  = alpha * cos1
C
C     Compute x_{2n}.
C
      CALL daxpby (nlen,vecs(1,1),done,vecs(1,1),eta,vecs(1,7))
C
C     Compute the residual norm upper bound.
C     If the scaled upper bound is within one order of magnitude of the
C     target convergence norm, compute the true residual norm.
C     The true residual is also forced on the last allowed iteration
C     (N >= NLIM) so that the final RESN is up to date.
C
      unrm = sqrt((2*n+1) * tau) / r0
      uchk = unrm
      IF ((tres.EQ.0).AND.(unrm/tol.GT.dten).AND.(n.LT.nlim)) GO TO 80
C
C     Have the caller carry out AXB, then return here.
C        CALL AXB (VECS(1,1),VECS(1,9))
C
      info(2) = 1
      info(3) = 1
      info(4) = 9
      retlbl  = 70
      RETURN
C
C     True residual b - A x, scaled by the initial residual norm.
C     UCHK must be the true residual here, as at label 40; with
C     UCHK = UNRM the bound check (criterion 2 below) could never
C     trigger in this half-step.
C
 70   CALL daxpby (nlen,vecs(1,9),done,vecs(1,2),-done,vecs(1,9))
      resn = dnrm2(nlen,vecs(1,9),1) / r0
      uchk = resn
C
C     Output the trace messages and convergence history.
C
 80   IF (vf.NE.0) WRITE (vf,'(2I8,2E11.4)') n, 2*n, unrm, resn
      IF (tf.NE.0) WRITE (tf,'(2I8,2E11.4)') n, 2*n, unrm, resn
C
C     Check for convergence or termination.  Stop if:
C         1. algorithm converged;
C         2. the residual norm upper bound is smaller than the computed
C     residual norm by a factor of at least 100;
C         3. algorithm exceeded the iterations limit.
C
      IF (resn.LE.tol) THEN
         ierr = 0
         GO TO 90
      ELSE IF (unrm.LT.uchk/dhun) THEN
         ierr = 4
         GO TO 90
      ELSE IF (n.GE.nlim) THEN
         ierr = 4
         GO TO 90
      END IF
C
C     Update the running counter.
C
      n = n + 1
      GO TO 20
C
C     Done.  Report the iteration count in NLIM and the status in
C     INFO(1), and clear RETLBL so the next call starts a new solve.
C
 90   nlim    = n
      retlbl  = 0
      info(1) = ierr
C
      RETURN
      END

C

C**********************************************************************