/[MITgcm]/MITgcm_contrib/torge/itd/code/seaice_fgmres.F

Diff of /MITgcm_contrib/torge/itd/code/seaice_fgmres.F

Parent Directory | Revision Log | View Revision Graph Revision Graph | View Patch Patch

-revision 1.1 by torge,
Wed Oct 24 21:48:53 2012 UTC
+revision 1.3 by torge,
Mon Dec 10 22:19:49 2012 UTC
 Line 15 
 C     !ROUTINE: SEAICE_FGMRES_DRIVER
  C     !INTERFACE:
        SUBROUTINE SEAICE_FGMRES_DRIVER(
       I     uIceRes, vIceRes,
       U     duIce, dvIce,
       U     iCode,
-      I     FGMRESeps,
+      I     FGMRESeps, iOutFGMRES,
       I     newtonIter, krylovIter, myTime, myIter, myThid )
  C     !DESCRIPTION: \bv
 Line 48 
 C     myIter :: Simulation timestep numb
  C     myThid :: my Thread Id. number
  C     newtonIter :: current iterate of Newton iteration
  C     krylovIter :: current iterate of Krylov iteration
- C     iCode  :: FGMRES parameter to determine next step
+ C     iCode      :: FGMRES parameter to determine next step
+ C     iOutFGMRES :: control output of fgmres
        _RL     myTime
        INTEGER myIter
        INTEGER myThid
        INTEGER newtonIter
        INTEGER krylovIter
+       INTEGER iOutFGMRES
        INTEGER iCode
  C     FGMRESeps :: tolerance for FGMRES
        _RL FGMRESeps
-Line 74 
 C     FGMRES parameters
+Line 76 
 C     FGMRES parameters
  C     n  :: size of the input vector(s)
  C     im :: size of Krylov space
  C     ifgmres :: iteration counter
- C     iout :: control output of fgmres
        INTEGER n
        PARAMETER ( n  = 2*sNx*sNy*nSx*nSy )
        INTEGER im
        PARAMETER ( im = 50 )
-       INTEGER ifgmres, iout
+       INTEGER ifgmres
  C     work arrays
        _RL rhs(n), sol(n)
        _RL vv(n,im+1), w(n,im)
-Line 90 
 C     they are not forgotten between Kry
+Line 91 
 C     they are not forgotten between Kry
        COMMON /FGMRES_RL/ sol, rhs, vv, w
  CEOP
- C     iout=1 give a little bit of output
-       iout=1
  C     For now, let only the master thread do all the work
  C     - copy from 2D arrays to 1D-vector
  C     - perform fgmres step (including global sums)
-Line 101 
 C     not sure if this works properly
+Line 99 
 C     not sure if this works properly
        _BEGIN_MASTER ( myThid )
        IF ( iCode .EQ. 0 ) THEN
- C     first guess is zero because it is a correction
+ C     The first guess is zero because it is a correction, but this
- C     wk2 needs to reset for iCode = 0, because it contains
+ C     is implemented by setting du/vIce=0 outside of this routine;
+ C     this makes it possible to restart FGMRES with a nonzero sol
+        CALL SEAICE_MAP2VEC(n,duIce,dvIce,sol,.TRUE.,myThid)
+ C     wk2 needs to be reset for iCode = 0, because it may contain
  C     remains of the previous Krylov iteration
         DO k=1,n
-         sol(k) = 0. _d 0
          wk2(k) = 0. _d 0
         ENDDO
        ELSEIF ( iCode .EQ. 3 ) THEN
         CALL SEAICE_MAP2VEC(n,uIceRes,vIceRes,rhs,.TRUE.,myThid)
- C     change sign because we are solving J*u = -F
+ C     change sign of rhs because we are solving J*u = -F
+ C     wk2 needs to be initialised for iCode = 3, because it may contain
+ C     garbage
         DO k=1,n
          rhs(k) = -rhs(k)
+         wk2(k) = 0. _d 0
         ENDDO
        ELSE
  C     map preconditioner results or Jacobian times vector,
  C     stored in du/vIce to wk2
         CALL SEAICE_MAP2VEC(n,duIce,dvIce,wk2,.TRUE.,myThid)
        ENDIF
  C
        CALL SEAICE_FGMRES (n,im,rhs,sol,ifgmres,vv,w,wk1,wk2,
       &     FGMRESeps,SEAICEkrylovIterMax,
-      &     iout,icode,krylovIter,myThid)
+      &     iOutFGMRES,iCode,krylovIter,myThid)
  C
        IF ( iCode .EQ. 0 ) THEN
  C     map sol(ution) vector to du/vIce
         CALL SEAICE_MAP2VEC(n,duIce,dvIce,sol,.FALSE.,myThid)
-Line 133 
 C     solution (wk1=rhs) or a Jacobian t
+Line 136 
 C     solution (wk1=rhs) or a Jacobian t
         CALL SEAICE_MAP2VEC(n,duIce,dvIce,wk1,.FALSE.,myThid)
        ENDIF
        _END_MASTER ( myThid )
  C     Fill overlaps in updated fields
        CALL EXCH_UV_XY_RL( duIce, dvIce,.TRUE.,myThid)
-Line 146 
 C     !ROUTINE: SEAICE_MAP2VEC
+Line 149 
 C     !ROUTINE: SEAICE_MAP2VEC
  C     !INTERFACE:
        SUBROUTINE SEAICE_MAP2VEC(
       I     n,
       O     xfld2d, yfld2d,
       U     vector,
       I     map2vec, myThid )
  C     !DESCRIPTION: \bv
-Line 177 
 C     === local variables ===
+Line 180 
 C     === local variables ===
        INTEGER I, J, bi, bj
        INTEGER ii, jj, ib, jb, m
  CEOP
        m = n/2
        IF ( map2vec ) THEN
         DO bj=myByLo(myThid),myByHi(myThid)
-Line 193 
 CEOP
+Line 196 
 CEOP
            ENDDO
           ENDDO
          ENDDO
         ENDDO
        ELSE
         DO bj=myByLo(myThid),myByHi(myThid)
          jb = nSx*sNy*sNx*(bj-1)
-Line 208 
 CEOP
+Line 211 
 CEOP
            ENDDO
           ENDDO
          ENDDO
         ENDDO
        ENDIF
        RETURN
-Line 219 
 CBOP
+Line 222 
 CBOP
  C     !ROUTINE: SEAICE_FGMRES
  C     !INTERFACE:
        SUBROUTINE SEAICE_FGMRES (n,im,rhs,sol,i,vv,w,wk1, wk2,
       &     eps,maxits,iout,icode,its,myThid)
  C-----------------------------------------------------------------------
  C mlosch Oct 2012: modified the routine further to be compliant with
-Line 229 
 C f90 -> F
+Line 232 
 C f90 -> F
  C !-comment -> C-comment
  C double precision -> _RL
  C implicit none
  C
  C jfl Dec 1st 2006. We modified the routine so that it is double precision.
  C Here are the modifications:
  C 1) implicit real (a-h,o-z) becomes implicit real*8 (a-h,o-z)
  C 2) real becomes real*8
  C 3) subroutine scopy.f has been changed for dcopy.f
  C 4) subroutine saxpy.f has been changed for daxpy.f
  C 5) function sdot.f has been changed for ddot.f
  C 6) 1e-08 becomes 1d-08
  C
  C Be careful with the dcopy, daxpy and ddot code...there is a slight
  C difference with the single precision versions (scopy, saxpy and sdot).
  C In the single precision versions, the arrays are declared slightly differently.
  C It is written for single precision:
-Line 254 
 CML   implicit double precision (a-h,o-z
+Line 257 
 CML   implicit double precision (a-h,o-z
        _RL rhs(*), sol(*), vv(n,im+1), w(n,im)
        _RL wk1(n), wk2(n), eps
  C-----------------------------------------------------------------------
  C flexible GMRES routine. This is a version of GMRES which allows a
  C variable preconditioner. Implemented with a reverse communication
  C protocol for flexibility -
  C DISTRIBUTED VERSION (USES DISTDOT FOR DDOT)
  C explicit (exact) residual norms for restarts
  C written by Y. Saad, modified by A. Malevsky, version February 1, 1995
  C-----------------------------------------------------------------------
  C This Is A Reverse Communication Implementation.
  C-------------------------------------------------
  C USAGE: (see also comments for icode below). FGMRES
  C should be put in a loop and the loop should be active for as
  C long as icode is not equal to 0. On return fgmres will
  C    1) either be requesting the new preconditioned vector applied
  C       to wk1 in case icode.eq.1 (result should be put in wk2)
  C    2) or be requesting the product of A applied to the vector wk1
  C       in case icode.eq.2 (result should be put in wk2)
  C    3) or be terminated in case icode .eq. 0.
  C on entry always set icode = 0. So icode should be set back to zero
  C upon convergence.
  C-----------------------------------------------------------------------
  C Here is a typical way of running fgmres:
  C
  C      icode = 0
  C 1    continue
-Line 284 
 C      if (icode .eq. 1) then
+Line 287 
 C      if (icode .eq. 1) then
  C         call  precon(n, wk1, wk2)    <--- user variable preconditioning
  C         goto 1
  C      else if (icode .ge. 2) then
  C         call  matvec (n,wk1, wk2)    <--- user matrix vector product.
  C         goto 1
  C      else
  C         ----- done ----
  C         .........
  C-----------------------------------------------------------------------
  C list of parameters
  C-------------------
  C
  C n     == integer. the dimension of the problem
  C im    == size of Krylov subspace:  should not exceed 50 in this
-Line 299 
 C          version (can be reset in code
+Line 302 
 C          version (can be reset in code
  C rhs   == vector of length n containing the right hand side
  C sol   == initial guess on input, approximate solution on output
  C vv    == work space of size n x (im+1)
  C w     == work space of length n x im
  C wk1,
  C wk2,  == two work vectors of length n each used for the reverse
  C          communication protocol. When on return (icode .eq. 1)
  C          the user should call fgmres again with wk2 = precon * wk1
  C          and icode untouched. When icode.eq.0 then it means that
  C          fgmres has finished (see the description of icode below).
  C
  C eps   == tolerance for stopping criterion. process is stopped
  C          as soon as ( ||.|| is the euclidean norm):
  C          || current residual||/||initial residual|| <= eps
-Line 315 
 C maxits== maximum number of iterations
+Line 318 
 C maxits== maximum number of iterations
  C
  C iout  == output unit number for printing intermediate results
  C          if (iout .le. 0) no statistics are printed.
  C
  C icode = integer. indicator for the reverse communication protocole.
  C         ON ENTRY : icode should be set to icode = 0.
  C         ON RETURN:
  C       * icode .eq. 1 value means that fgmres has not finished
  C         and that it is requesting a preconditioned vector before
  C         continuing. The user must compute M**(-1) wk1, where M is
  C         the preconditioning matrix (may vary at each call) and wk1 is
  C         the vector as provided by fgmres upon return, and put the
  C         result in wk2. Then fgmres must be called again without
  C         changing any other argument.
  C       * icode .eq. 2 value means that fgmres has not finished
  C         and that it is requesting a matrix vector product before
  C         continuing. The user must compute  A * wk1, where A is the
  C         coefficient  matrix and wk1 is the vector provided by fgmres
  C         upon return. The result of the operation is to be put in
  C         the vector wk2. Then fgmres must be called again without
  C         changing any other argument.
  C       * icode .eq. 0 means that fgmres has finished and sol contains
  C         the approximate solution.
  C         comment: typically fgmres must be implemented in a loop
  C         with fgmres being called as long as icode is returned with
  C         a value .ne. 0.
  C-----------------------------------------------------------------------
  C     local variables -- !jfl modif
        integer imax
        parameter ( imax = 50 )
        _RL hh(4*imax+1,4*imax),c(4*imax),s(4*imax)
        _RL rs(4*imax+1),t,ro
-Line 353 
 C---------------------------------------
+Line 356 
 C---------------------------------------
  CEOP
        save
        data epsmac/1.d-16/
  C
  C     computed goto
  C
        if ( im .gt. imax ) stop 'size of krylov space > 50'
        goto (100,200,300,11) icode +1
  continue
-Line 370 
 CML      call dcopy (n, sol, 1, wk1, 1)
+Line 373 
 CML      call dcopy (n, sol, 1, wk1, 1)
         wk1(k)=sol(k)
        enddo
        icode = 3
-       return
+       RETURN
   continue
        do j=1,n
           vv(j,1) = rhs(j) - wk2(j)
        enddo
  CML 20   ro = ddot(n, vv, 1, vv,1) !jfl modification
   call scalprod(n, vv, vv, ro, myThid)
        ro = sqrt(ro)
        if (ro .eq. 0.0d0) goto 999
        t = 1.0d0/ ro
        do j=1, n
           vv(j,1) = vv(j,1)*t
        enddo
        if (its .eq. 0) eps1=eps
        if (its .eq. 0) r0 = ro
        if (iout .gt. 0) write(*, 199) its, ro!&
  C           print *,'chau',its, ro !write(iout, 199) its, ro
  C
  C     initialize 1-st term  of rhs of hessenberg system..
  C
        rs(1) = ro
        i = 0
    i=i+1
        its = its + 1
        i1 = i + 1
        do k=1, n
           wk1(k) = vv(k,i)
        enddo
  C
  C     return
  C
        icode = 1
-       return
+       RETURN
  continue
        do k=1, n
           w(k,i) = wk2(k)
        enddo
  C
  C     call matvec operation
  C
        icode = 2
  CML      call dcopy(n, wk2, 1, wk1, 1) !jfl modification
        do k=1,n
-Line 418 
 CML      call dcopy(n, wk2, 1, wk1, 1) !
+Line 421 
 CML      call dcopy(n, wk2, 1, wk1, 1) !
        enddo
  C
  C     return
  C
-       return
+       RETURN
  continue
  C
  C     first call to ope corresponds to initialization; go back to 11.
  C
  C      if (icode .eq. 3) goto 11
  CML      call  dcopy (n, wk2, 1, vv(1,i1), 1) !jfl modification
        do k=1,n
         vv(k,i1)=wk2(k)
        enddo
  C
  C     modified gram - schmidt...
  C
        do j=1, i
  CML         t = ddot(n, vv(1,j), 1, vv(1,i1), 1) !jfl modification
           call scalprod(n, vv(1,j), vv(1,i1), t, myThid)
-Line 453 
 CML      t = sqrt(ddot(n, vv(1,i1), 1, v
+Line 456 
 CML      t = sqrt(ddot(n, vv(1,i1), 1, v
        do k=1,n
           vv(k,i1) = vv(k,i1)*t
        enddo
  C
  C     done with modified gram schmidt and arnoldi step.
  C     now  update factorization of hh
  C
   if (i .eq. 1) goto 121
  C
  C     perform previous transformations  on i-th column of h
  C
        do k=2,i
           k1 = k-1
           t = hh(k1,i)
-Line 474 
 C-----------#determine next plane rotati
+Line 477 
 C-----------#determine next plane rotati
        s(i) = hh(i1,i)/gam
        rs(i1) = -s(i)*rs(i)
        rs(i) =  c(i)*rs(i)
  C
  C     determine res. norm. and test for convergence-
  C
        hh(i,i) = c(i)*hh(i,i) + s(i)*hh(i1,i)
        ro = abs(rs(i1))
        if (iout .gt. 0) write(*, 199) its, ro
        if (i .lt. im .and. (ro .gt. eps1))  goto 4
  C
  C     now compute solution. first solve upper triangular system.
  C
        rs(i) = rs(i)/hh(i,i)
        do ii=2,i
           k=i-ii+1
-Line 494 
 C
+Line 497 
 C
           enddo
           rs(k) = t/hh(k,k)
        enddo
  C
  C     done with back substitution..
  C     now form linear combination to get solution
  C
        do j=1, i
         t = rs(j)
  C         call daxpy(n, t, w(1,j), 1, sol,1) !jfl modification
-Line 505 
 C         call daxpy(n, t, w(1,j), 1, so
+Line 508 
 C         call daxpy(n, t, w(1,j), 1, so
          sol(k) = sol(k) + t*w(k,j)
         enddo
        enddo
  C
  C     test for return
  C
-       print *, 'ml-fgmres: its, maxits: ', its, maxits, ro, '<', eps1
        if (ro .le. eps1 .or. its .ge. maxits) goto 999
  C
  C     else compute residual vector and continue..
  C
  C       goto 10
        do j=1,i
-Line 528 
 CML        call daxpy (n, t, vv(1,j), 1,
+Line 530 
 CML        call daxpy (n, t, vv(1,j), 1,
           vv(k,1) = vv(k,1) + t*vv(k,j)
          enddo
        enddo
  C
  C     restart outer loop.
  C
        goto 20
  icode = 0
  format('   -- fgmres its =', i4, ' res. norm =', d26.16)
  C
-       return
+       RETURN
  C-----end-of-fgmres-----------------------------------------------------
  C-----------------------------------------------------------------------
-       end
+       END
  C---+----1----+----2----+----3----+----4----+----5----+----6----+----7-|--+----|
  CBOP
-Line 548 
 C     !INTERFACE:
+Line 550 
 C     !INTERFACE:
        subroutine scalprod(n,dx,dy,t,myThid)
- C
  C     forms the dot product of two vectors.
  C     uses unrolled loops for increments equal to one.
  C     jack dongarra, linpack, 3/11/78.
  C     ML: code stolen from BLAS and adapted for parallel applications
- C
        implicit none
  #include "SIZE.h"
  #include "EEPARAMS.h"
  #include "EESUPPORT.h"
-       integer myThid
+       integer n
        _RL dx(n),dy(n)
-       real*8 dtemp
        real*8 t
-       integer i,m,mp1,n
+       integer myThid
+       real*8 dtemp
+       integer i,m,mp1
  #ifdef ALLOW_USE_MPI
        INTEGER mpiRC
  #endif   /* ALLOW_USE_MPI */
-Line 578 
 C
+Line 581 
 C
        if( n .lt. 5 ) go to 60
 mp1 = m + 1
        do i = mp1,n,5
         dtemp = dtemp + dx(i)*dy(i) + dx(i + 1)*dy(i + 1) +
       &      dx(i + 2)*dy(i + 2) + dx(i + 3)*dy(i + 3) +
       &      dx(i + 4)*dy(i + 4)
        enddo
 continue
-Line 592 
 C     sum over all processors
+Line 595 
 C     sum over all processors
        ENDIF
  #endif /* ALLOW_USE_MPI */
        t = dtemp
  CML      return
  CML      end
  CML
  CML      subroutine daxpy(n,da,dx,incx,dy,incy)
  CMLC
  CMLC     constant times a vector plus a vector.
  CMLC     uses unrolled loops for increments equal to one.
  CMLC     jack dongarra, linpack, 3/11/78.
  CMLC
  CML      _RL dx(n),dy(n),da
  CML      integer i,incx,incy,ix,iy,m,mp1,n
  CMLC
  CML      if(n.le.0)return
  CML      if (da .eq. 0.0d0) return
  CML      if(incx.eq.1.and.incy.eq.1)go to 20
  CMLC
  CMLC        code for unequal increments or equal increments
  CMLC          not equal to 1
  CMLC
  CML      ix = 1
  CML      iy = 1
  CML      if(incx.lt.0)ix = (-n+1)*incx + 1
-Line 622 
 CML        ix = ix + incx
+Line 625 
 CML        ix = ix + incx
  CML        iy = iy + incy
  CML   10 continue
  CML      return
  CMLC
  CMLC        code for both increments equal to 1
  CMLC
  CMLC
  CMLC        clean-up loop
  CMLC
  CML   20 m = mod(n,4)
  CML      if( m .eq. 0 ) go to 40
  CML      do 30 i = 1,m
-Line 645 
 CML      return
+Line 648 
 CML      return
  CML      end
  CML
  CML      subroutine  dcopy(n,dx,incx,dy,incy)
  CMLC
  CMLC     copies a vector, x, to a vector, y.
  CMLC     uses unrolled loops for increments equal to one.
  CMLC     jack dongarra, linpack, 3/11/78.
  CMLC
  CML      _RL dx(n),dy(n)
  CML      integer i,incx,incy,ix,iy,m,mp1,n
  CMLC
  CML      if(n.le.0)return
  CML      if(incx.eq.1.and.incy.eq.1)go to 20
  CMLC
  CMLC        code for unequal increments or equal increments
  CMLC          not equal to 1
  CMLC
  CML      ix = 1
  CML      iy = 1
  CML      if(incx.lt.0)ix = (-n+1)*incx + 1
-Line 669 
 CML        ix = ix + incx
+Line 672 
 CML        ix = ix + incx
  CML        iy = iy + incy
  CML   10 continue
  CML      return
  CMLC
  CMLC        code for both increments equal to 1
  CMLC
  CMLC
  CMLC        clean-up loop
  CMLC
  CML   20 m = mod(n,7)
  CML      if( m .eq. 0 ) go to 40
  CML      do 30 i = 1,m

 Legend:



Removed from v.1.1
 


changed lines


 
Added in v.1.3
 Legend:



Removed from v.1.1
 


changed lines


 
Added in v.1.3
-Removed from v.1.1
+Added in v.1.3

	ViewVC Help
Powered by ViewVC 1.1.22