/[MITgcm]/MITgcm/model/src/cg3d.F

Diff of /MITgcm/model/src/cg3d.F

Parent Directory | Revision Log | View Revision Graph Revision Graph | View Patch Patch

-revision 1.18 by jmc,
Wed Aug 23 15:22:32 2006 UTC
+revision 1.19 by jmc,
Tue Sep  4 14:54:58 2007 UTC
 Line 15 
 C     !INTERFACE:
       I                myThid )
  C     !DESCRIPTION: \bv
  C     *==========================================================*
  C     | SUBROUTINE CG3D
  C     | o Three-dimensional grid problem conjugate-gradient
  C     |   inverter (with preconditioner).
  C     *==========================================================*
  C     | Con. grad is an iterative procedure for solving Ax = b.
  C     | It requires that A be symmetric.
  C     | This implementation assumes A is a seven-diagonal
  C     | matrix of the form that arises in the discrete
  C     | representation of the del^2 operator in a
  C     | three-dimensional space.
  C     | Notes:
  C     | ======
  C     | This implementation can support shared-memory
  C     | multi-threaded execution. In order to do this COMMON
  C     | blocks are used for many of the arrays - even ones that
  C     | are only used for intermediate results. This design is
  C     | OK if you want all the threads to collaborate on
  C     | solving the same problem. On the other hand if you want
  C     | the threads to solve several different problems
  C     | concurrently this implementation will not work.
  C     *==========================================================*
  C     \ev
 Line 75 
 C     bj
  C     eta_qrN     - Used in computing search directions
  C     eta_qrNM1     suffix N and NM1 denote current and
  C     cgBeta        previous iterations respectively.
  C     alpha
  C     sumRHS      - Sum of right-hand-side. Sometimes this is a
  C                   useful debugging/troubleshooting diagnostic.
  C                   For Neumann problems sumRHS needs to be ~0.
 Line 84 
 C     err         - Measure of residual
  C     I, J, K, N  - Loop counters ( N counts CG iterations )
        INTEGER actualIts
        _RL    actualResidual
        INTEGER bi, bj
        INTEGER I, J, K, it3d
        INTEGER Km1, Kp1
        _RL    maskM1, maskP1
-       _RL    err, errTile
+       _RL    err,    errTile(nSx,nSy)
-       _RL    eta_qrN, eta_qrNtile
+       _RL    eta_qrN,eta_qrNtile(nSx,nSy)
        _RL    eta_qrNM1
        _RL    cgBeta
-       _RL    alpha , alphaTile
+       _RL    alpha , alphaTile(nSx,nSy)
-       _RL    sumRHS, sumRHStile
+       _RL    sumRHS, sumRHStile(nSx,nSy)
        _RL    rhsMax
        _RL    rhsNorm
  CEOP
 Line 142 
 C--   Initial residual calculation (with
        sumRHS = 0. _d 0
        DO bj=myByLo(myThid),myByHi(myThid)
         DO bi=myBxLo(myThid),myBxHi(myThid)
-         errTile    = 0. _d 0
+         errTile(bi,bj)    = 0. _d 0
-         sumRHStile = 0. _d 0
+         sumRHStile(bi,bj) = 0. _d 0
          DO K=1,Nr
           Km1 = MAX(K-1, 1 )
           Kp1 = MIN(K+1, Nr)
 Line 151 
 C--   Initial residual calculation (with
           maskP1 = 1. _d 0
           IF ( K .EQ. 1 ) maskM1 = 0. _d 0
           IF ( K .EQ. Nr) maskP1 = 0. _d 0
           DO J=1,sNy
            DO I=1,sNx
             cg3d_r(I,J,K,bi,bj) = cg3d_b(I,J,K,bi,bj) -( 0.
 Line 163 
 C--   Initial residual calculation (with
       &     +aV3d(I  ,J  ,Kp1,bi,bj)*cg3d_x(I  ,J  ,Kp1,bi,bj)*maskP1
       &     +aC3d(I  ,J  ,K  ,bi,bj)*cg3d_x(I  ,J  ,K  ,bi,bj)
       &     )
-            errTile = errTile
+            errTile(bi,bj) = errTile(bi,bj)
       &     +cg3d_r(I,J,K,bi,bj)*cg3d_r(I,J,K,bi,bj)
-            sumRHStile = sumRHStile
+            sumRHStile(bi,bj) = sumRHStile(bi,bj)
       &     +cg3d_b(I,J,K,bi,bj)
            ENDDO
           ENDDO
 Line 175 
 C--   Initial residual calculation (with
            ENDDO
           ENDDO
          ENDDO
-         err    = err    + errTile
+ c       err    = err    + errTile(bi,bj)
-         sumRHS = sumRHS + sumRHStile
+ c       sumRHS = sumRHS + sumRHStile(bi,bj)
         ENDDO
        ENDDO
         CALL EXCH_S3D_RL( cg3d_r, Nr, myThid )
  c      CALL EXCH_S3D_RL( cg3d_s, Nr, myThid )
-       _GLOBAL_SUM_R8( sumRHS, myThid )
+ c     _GLOBAL_SUM_R8( sumRHS, myThid )
-       _GLOBAL_SUM_R8( err   , myThid )
+ c     _GLOBAL_SUM_R8( err   , myThid )
+        CALL GLOBAL_SUM_TILE_RL( sumRHStile, sumRHS, myThid )
+        CALL GLOBAL_SUM_TILE_RL( errTile,    err,    myThid )
        IF ( debugLevel .GE. debLevZero ) THEN
          _BEGIN_MASTER( myThid )
-Line 212 
 CcnhDebugEnds
+Line 214 
 CcnhDebugEnds
  C--    Solve preconditioning equation and update
  C--    conjugate direction vector "s".
  C      Note. On the next two loops over all tiles the inner loop ranges
  C            in sNx and sNy are expanded by 1 to avoid a communication
  C            step. However this entails a bit of gymnastics because we only
  C            want eta_qrN for the interior points.
         eta_qrN = 0. _d 0
         DO bj=myByLo(myThid),myByHi(myThid)
          DO bi=myBxLo(myThid),myBxHi(myThid)
-          eta_qrNtile = 0. _d 0
+          eta_qrNtile(bi,bj) = 0. _d 0
           DO K=1,1
            DO J=1-1,sNy+1
             DO I=1-1,sNx+1
              cg3d_q(I,J,K,bi,bj) =
       &       zMC(I  ,J  ,K,bi,bj)*cg3d_r(I  ,J  ,K,bi,bj)
             ENDDO
            ENDDO
-Line 230 
 C            want eta_qrN for the interi
+Line 232 
 C            want eta_qrN for the interi
           DO K=2,Nr
            DO J=1-1,sNy+1
             DO I=1-1,sNx+1
              cg3d_q(I,J,K,bi,bj) =
       &       zMC(I,J,K,bi,bj)*(cg3d_r(I,J,K  ,bi,bj)
       &      -zML(I,J,K,bi,bj)*cg3d_q(I,J,K-1,bi,bj))
             ENDDO
-Line 240 
 C            want eta_qrN for the interi
+Line 242 
 C            want eta_qrN for the interi
  caja      IF (Nr .GT. 1) THEN
  caja       DO J=1-1,sNy+1
  caja        DO I=1-1,sNx+1
  caja         cg3d_q(I,J,K,bi,bj) =
  caja &        zMC(i,j,k,bi,bj)*(cg3d_r(i,j,k  ,bi,bj)
  caja &       -zML(i,j,k,bi,bj)*cg3d_q(i,j,k-1,bi,bj))
  caja        ENDDO
-Line 248 
 caja       ENDDO
+Line 250 
 caja       ENDDO
  caja      ENDIF
            DO J=1,sNy
             DO I=1,sNx
-             eta_qrNtile = eta_qrNtile
+             eta_qrNtile(bi,bj) = eta_qrNtile(bi,bj)
       &      +cg3d_q(I,J,K,bi,bj)*cg3d_r(I,J,K,bi,bj)
             ENDDO
            ENDDO
-Line 256 
 caja      ENDIF
+Line 258 
 caja      ENDIF
           DO K=Nr-1,1,-1
            DO J=1-1,sNy+1
             DO I=1-1,sNx+1
              cg3d_q(I,J,K,bi,bj) =
       &      cg3d_q(I,J,K,bi,bj)
       &      -zMU(I,J,K,bi,bj)*cg3d_q(I,J,K+1,bi,bj)
             ENDDO
            ENDDO
            DO J=1,sNy
             DO I=1,sNx
-             eta_qrNtile = eta_qrNtile
+             eta_qrNtile(bi,bj) = eta_qrNtile(bi,bj)
       &      +cg3d_q(I,J,K,bi,bj)*cg3d_r(I,J,K,bi,bj)
             ENDDO
            ENDDO
           ENDDO
-          eta_qrN = eta_qrN + eta_qrNtile
+ c        eta_qrN = eta_qrN + eta_qrNtile(bi,bj)
          ENDDO
         ENDDO
  caja
-Line 287 
 caja    ENDDO
+Line 289 
 caja    ENDDO
  caja   ENDDO
  caja
-        _GLOBAL_SUM_R8(eta_qrN, myThid)
+ c      _GLOBAL_SUM_R8(eta_qrN, myThid)
+        CALL GLOBAL_SUM_TILE_RL( eta_qrNtile,eta_qrN,myThid )
  CcnhDebugStarts
  C      WRITE(*,*) ' CG3D: Iteration ',it3d-1,' eta_qrN = ',eta_qrN
  CcnhDebugEnds
-Line 302 
 CcnhDebugEnds
+Line 305 
 CcnhDebugEnds
           DO K=1,Nr
            DO J=1-1,sNy+1
             DO I=1-1,sNx+1
              cg3d_s(I,J,K,bi,bj) = cg3d_q(I,J,K,bi,bj)
       &                          + cgBeta*cg3d_s(I,J,K,bi,bj)
             ENDDO
            ENDDO
-Line 315 
 C==    q = A.s
+Line 318 
 C==    q = A.s
         alpha = 0. _d 0
         DO bj=myByLo(myThid),myByHi(myThid)
          DO bi=myBxLo(myThid),myBxHi(myThid)
-          alphaTile = 0. _d 0
+          alphaTile(bi,bj) = 0. _d 0
           IF ( Nr .GT. 1 ) THEN
            DO K=1,1
             DO J=1,sNy
              DO I=1,sNx
               cg3d_q(I,J,K,bi,bj) =
       &       aW3d(I  ,J  ,K  ,bi,bj)*cg3d_s(I-1,J  ,K  ,bi,bj)
       &      +aW3d(I+1,J  ,K  ,bi,bj)*cg3d_s(I+1,J  ,K  ,bi,bj)
       &      +aS3d(I  ,J  ,K  ,bi,bj)*cg3d_s(I  ,J-1,K  ,bi,bj)
       &      +aS3d(I  ,J+1,K  ,bi,bj)*cg3d_s(I  ,J+1,K  ,bi,bj)
       &      +aV3d(I  ,J  ,K+1,bi,bj)*cg3d_s(I  ,J  ,K+1,bi,bj)
       &      +aC3d(I  ,J  ,K  ,bi,bj)*cg3d_s(I  ,J  ,K  ,bi,bj)
-              alphaTile = alphaTile
+              alphaTile(bi,bj) = alphaTile(bi,bj)
       &                 +cg3d_s(I,J,K,bi,bj)*cg3d_q(I,J,K,bi,bj)
              ENDDO
             ENDDO
-Line 336 
 C==    q = A.s
+Line 339 
 C==    q = A.s
            DO K=1,1
             DO J=1,sNy
              DO I=1,sNx
               cg3d_q(I,J,K,bi,bj) =
       &       aW3d(I  ,J  ,K  ,bi,bj)*cg3d_s(I-1,J  ,K  ,bi,bj)
       &      +aW3d(I+1,J  ,K  ,bi,bj)*cg3d_s(I+1,J  ,K  ,bi,bj)
       &      +aS3d(I  ,J  ,K  ,bi,bj)*cg3d_s(I  ,J-1,K  ,bi,bj)
       &      +aS3d(I  ,J+1,K  ,bi,bj)*cg3d_s(I  ,J+1,K  ,bi,bj)
       &      +aC3d(I  ,J  ,K  ,bi,bj)*cg3d_s(I  ,J  ,K  ,bi,bj)
-              alphaTile = alphaTile
+              alphaTile(bi,bj) = alphaTile(bi,bj)
       &                 +cg3d_s(I,J,K,bi,bj)*cg3d_q(I,J,K,bi,bj)
              ENDDO
             ENDDO
-Line 351 
 C==    q = A.s
+Line 354 
 C==    q = A.s
           DO K=2,Nr-1
            DO J=1,sNy
             DO I=1,sNx
              cg3d_q(I,J,K,bi,bj) =
       &      aW3d(I  ,J  ,K  ,bi,bj)*cg3d_s(I-1,J  ,K  ,bi,bj)
       &     +aW3d(I+1,J  ,K  ,bi,bj)*cg3d_s(I+1,J  ,K  ,bi,bj)
       &     +aS3d(I  ,J  ,K  ,bi,bj)*cg3d_s(I  ,J-1,K  ,bi,bj)
-Line 359 
 C==    q = A.s
+Line 362 
 C==    q = A.s
       &     +aV3d(I  ,J  ,K  ,bi,bj)*cg3d_s(I  ,J  ,K-1,bi,bj)
       &     +aV3d(I  ,J  ,K+1,bi,bj)*cg3d_s(I  ,J  ,K+1,bi,bj)
       &     +aC3d(I  ,J  ,K  ,bi,bj)*cg3d_s(I  ,J  ,K  ,bi,bj)
-             alphaTile = alphaTile
+             alphaTile(bi,bj) = alphaTile(bi,bj)
       &                +cg3d_s(I,J,K,bi,bj)*cg3d_q(I,J,K,bi,bj)
             ENDDO
            ENDDO
-Line 368 
 C==    q = A.s
+Line 371 
 C==    q = A.s
            DO K=Nr,Nr
             DO J=1,sNy
              DO I=1,sNx
               cg3d_q(I,J,K,bi,bj) =
       &       aW3d(I  ,J  ,K  ,bi,bj)*cg3d_s(I-1,J  ,K  ,bi,bj)
       &      +aW3d(I+1,J  ,K  ,bi,bj)*cg3d_s(I+1,J  ,K  ,bi,bj)
       &      +aS3d(I  ,J  ,K  ,bi,bj)*cg3d_s(I  ,J-1,K  ,bi,bj)
       &      +aS3d(I  ,J+1,K  ,bi,bj)*cg3d_s(I  ,J+1,K  ,bi,bj)
       &      +aV3d(I  ,J  ,K  ,bi,bj)*cg3d_s(I  ,J  ,K-1,bi,bj)
       &      +aC3d(I  ,J  ,K  ,bi,bj)*cg3d_s(I  ,J  ,K  ,bi,bj)
-              alphaTile = alphaTile
+              alphaTile(bi,bj) = alphaTile(bi,bj)
       &                 +cg3d_s(I,J,K,bi,bj)*cg3d_q(I,J,K,bi,bj)
              ENDDO
             ENDDO
            ENDDO
           ENDIF
-          alpha = alpha + alphaTile
+ c        alpha = alpha + alphaTile(bi,bj)
          ENDDO
         ENDDO
-        _GLOBAL_SUM_R8(alpha,myThid)
+ c      _GLOBAL_SUM_R8(alpha,myThid)
+        CALL GLOBAL_SUM_TILE_RL( alphaTile,  alpha,  myThid )
  CcnhDebugStarts
  C      WRITE(*,*) ' CG3D: Iteration ',it3d-1,' SUM(s*q)= ',alpha
  CcnhDebugEnds
-Line 392 
 CcnhDebugEnds
+Line 396 
 CcnhDebugEnds
  CcnhDebugStarts
  C      WRITE(*,*) ' CG3D: Iteration ',it3d-1,' alpha= ',alpha
  CcnhDebugEnds
  C==    Update solution and residual vectors
  C      Now compute "interior" points.
         err = 0. _d 0
         DO bj=myByLo(myThid),myByHi(myThid)
          DO bi=myBxLo(myThid),myBxHi(myThid)
-         errTile    = 0. _d 0
+         errTile(bi,bj)    = 0. _d 0
           DO K=1,Nr
            DO J=1,sNy
             DO I=1,sNx
-Line 406 
 C      Now compute "interior" points.
+Line 410 
 C      Now compute "interior" points.
       &            +alpha*cg3d_s(I,J,K,bi,bj)
              cg3d_r(I,J,K,bi,bj)=cg3d_r(I,J,K,bi,bj)
       &            -alpha*cg3d_q(I,J,K,bi,bj)
-             errTile = errTile
+             errTile(bi,bj) = errTile(bi,bj)
       &             +cg3d_r(I,J,K,bi,bj)*cg3d_r(I,J,K,bi,bj)
             ENDDO
            ENDDO
           ENDDO
-          err = err + errTile
+ c        err = err + errTile(bi,bj)
          ENDDO
         ENDDO
-        _GLOBAL_SUM_R8( err   , myThid )
+ c      _GLOBAL_SUM_R8( err   , myThid )
+        CALL GLOBAL_SUM_TILE_RL( errTile,    err,    myThid )
         err = SQRT(err)
         actualIts      = it3d
         actualResidual = err

 Legend:



Removed from v.1.18
 


changed lines


 
Added in v.1.19
 Legend:



Removed from v.1.18
 


changed lines


 
Added in v.1.19
-Removed from v.1.18
+Added in v.1.19

	ViewVC Help
Powered by ViewVC 1.1.22