eesupp/inc/CPP_EEMACROS.h

C $Header: /u/gcmpack/MITgcm/eesupp/inc/CPP_EEMACROS.h,v 1.25 2017/08/10 14:06:59 mlosch Exp $
C $Name:  $

CBOP
C     !ROUTINE: CPP_EEMACROS.h
C     !INTERFACE:
C     include "CPP_EEMACROS.h"
C     !DESCRIPTION:
C     *==========================================================*
C     | CPP_EEMACROS.h
C     *==========================================================*
C     | C preprocessor "execution environment" supporting
C     | macros. Use this file to define macros that deal with the
C     | execution environment in which a model runs - as opposed
C     | to the dynamical problem the model solves.
C     *==========================================================*
CEOP

#ifndef _CPP_EEMACROS_H_
#define _CPP_EEMACROS_H_

C     In general the following convention applies:
C     ALLOW  - indicates a feature will be included but it may
C     CAN      have a run-time flag to allow it to be switched
C              on and off.
C              If ALLOW or CAN directives are "undef'd" this generally
C              means that the feature will not be available i.e. it
C              will not be included in the compiled code and so no
C              run-time option to use the feature will be available.
C
C     ALWAYS - indicates the choice will be fixed at compile time
C              so no run-time option will be present

C     Flag used to indicate which flavour of multi-threading
C     compiler directives to use. Only set one of these.
C     USE_SOLARIS_THREADING  - Takes directives for SUN Workshop
C                              compiler.
C     USE_KAP_THREADING      - Takes directives for Kuck and
C                              Associates multi-threading compiler
C                              ( used on Digital platforms ).
C     USE_IRIX_THREADING     - Takes directives for SGI MIPS
C                              Pro Fortran compiler.
C     USE_EXEMPLAR_THREADING - Takes directives for HP SPP series
C                              compiler.
C     USE_C90_THREADING      - Takes directives for CRAY/SGI C90
C                              system F90 compiler.
C--   Pick the flavour of threading directives that goes with the
C     target platform the code is being built for.
#if (defined (TARGET_SUN))
#define USE_SOLARIS_THREADING
#endif
#if (defined (TARGET_DEC))
#define USE_KAP_THREADING
#endif
#if (defined (TARGET_SGI))
#define USE_IRIX_THREADING
#endif
#if (defined (TARGET_HP))
#define USE_EXEMPLAR_THREADING
#endif
#if (defined (TARGET_CRAY_VECTOR))
#define USE_C90_THREADING
#endif

C--   Flag a multi-threaded build for each of the platforms handled
C     above, and also when OpenMP threading is requested directly.
#if (defined (TARGET_SUN) || defined (TARGET_DEC) || defined (TARGET_SGI))
#define USING_THREADS
#endif
#if (defined (TARGET_HP) || defined (TARGET_CRAY_VECTOR))
#define USING_THREADS
#endif
#if (defined (USE_OMP_THREADING))
#define USING_THREADS
#endif

C--   Define the mapping for the _BARRIER macro.
C     It expands to a call of S/R BARRIER with the argument myThid, so
C     a variable of that name has to be in scope wherever it is used.
C     On some systems low-level hardware support can be accessed through
C     compiler directives here.
#define _BARRIER CALL BARRIER(myThid)

C--   Define the mapping for the BEGIN_CRIT() and END_CRIT() macros.
C     Here they simply forward to the master-section macros, i.e. the
C     enclosed code is executed by the master thread only and is not
C     really a critical section. We can do this because we do not use
C     critical sections in any critical sections of our code!
#define _BEGIN_CRIT(a) _BEGIN_MASTER(a)
#define _END_CRIT(a)   _END_MASTER(a)

C--   Define the mapping for the BEGIN_MASTER_SECTION() and
C     END_MASTER_SECTION() macros. These are generally implemented by
C     simply choosing a particular thread to be "the master" and having
C     it alone execute the BEGIN_MASTER..., END_MASTER.. sections.
C     Here the opening macro starts an IF block that is entered only
C     when its argument (presumably the thread number) equals 1; the
C     closing macro ignores its argument and just ends that IF block.

#define _BEGIN_MASTER(a) IF ( a .EQ. 1 ) THEN
#define _END_MASTER(a)   ENDIF
CcnhDebugStarts
C      Alternate form to the above macros that increments (decrements) a counter each
C      time a MASTER section is entered (exited). This counter can then be checked in barrier
C      to try and detect calls to BARRIER within single threaded sections.
C      Using these macros requires two changes to Makefile - these changes are written
C      below.
C      1 - add a filter to the CPP command to kill off commented _MASTER lines
C      2 - add a filter to the CPP output that converts the string N EWLINE to an actual newline.
C      The N EWLINE needs to be changed to have no space when this macro and Makefile changes
C      are used. Its in here with a space to stop it getting parsed by the CPP stage in these
C      comments.
C      #define _BEGIN_MASTER(a)  IF ( a .EQ. 1 ) THEN  N EWLINE      CALL BARRIER_MS(a)
C      #define _END_MASTER(a)    CALL BARRIER_MU(a) N EWLINE        ENDIF
C      'CPP = cat $< | $(TOOLSDIR)/set64bitConst.sh |  grep -v '^[cC].*_MASTER' | cpp  -traditional -P'
C      .F.f:
C      $(CPP) $(DEFINES) $(INCLUDES) |  sed 's/N EWLINE/\n/' > $@
CcnhDebugEnds

C--   Control storage of floating point operands
C     On many systems it improves performance only to use
C     8-byte precision for time stepped variables.
C     Constant in time terms ( geometric factors etc.. )
C     can use 4-byte precision, reducing memory utilisation and
C     boosting performance because of a smaller working
C     set size. However, on vector CRAY systems this degrades
C     performance.
C- Note: global_sum/max macros were used to switch to JAM routines (obsolete);
C  in addition, since only the R4 & R8 S/R are coded, the GLOBAL RS & RL
C  macros make it possible to call the corresponding R4 or R8 S/R.
C--   "RS" kind: 4-byte storage, MPI type and global sum/max routines
C     by default; everything is promoted to the 8-byte versions when
C     4-byte reals are flagged as slow.
#ifndef REAL4_IS_SLOW
#define RS_IS_REAL4
#define _RS Real*4
#define _MPI_TYPE_RS MPI_REAL
#define _GLOBAL_SUM_RS(a,b) CALL GLOBAL_SUM_R4 ( a, b )
#define _GLOBAL_MAX_RS(a,b) CALL GLOBAL_MAX_R4 ( a, b )
#else
#define RS_IS_REAL8
#define _RS Real*8
#define _MPI_TYPE_RS MPI_DOUBLE_PRECISION
#define _GLOBAL_SUM_RS(a,b) CALL GLOBAL_SUM_R8 ( a, b)
#define _GLOBAL_MAX_RS(a,b) CALL GLOBAL_MAX_R8 ( a, b )
#endif

C--   "RL" kind: always 8-byte storage and the 8-byte routines.
#define RL_IS_REAL8
#define _RL Real*8
#define _MPI_TYPE_RL MPI_DOUBLE_PRECISION
#define _GLOBAL_SUM_RL(a,b) CALL GLOBAL_SUM_R8 ( a, b )
#define _GLOBAL_MAX_RL(a,b) CALL GLOBAL_MAX_R8 ( a, b )

C--   Explicit 4-byte and 8-byte declarations and their MPI types.
C     The MPI type used for 8-byte reals depends on the target.
#define _R4 Real*4
#define _R8 Real*8
#define _MPI_TYPE_R4 MPI_REAL
#if (defined (TARGET_SGI) || defined (TARGET_AIX) || defined (TARGET_LAM))
#define _MPI_TYPE_R8 MPI_DOUBLE_PRECISION
#else
#define _MPI_TYPE_R8 MPI_REAL8
#endif

C--   Old-style R4 / R8 global sum and max macros.
C     Needed for some backward compatibility with broken packages.
C     The R4 versions follow the choice made for the "RS" kind above.
#ifdef USE_OLD_MACROS_R4R8toRSRL
#ifdef REAL4_IS_SLOW
#define _GLOBAL_SUM_R4(a,b) CALL GLOBAL_SUM_R8 ( a, b )
#define _GLOBAL_MAX_R4(a,b) CALL GLOBAL_MAX_R8 ( a, b )
#else
#define _GLOBAL_SUM_R4(a,b) CALL GLOBAL_SUM_R4 ( a, b )
#define _GLOBAL_MAX_R4(a,b) CALL GLOBAL_MAX_R4 ( a, b )
#endif
#define _GLOBAL_SUM_R8(a,b) CALL GLOBAL_SUM_R8 ( a, b )
#define _GLOBAL_MAX_R8(a,b) CALL GLOBAL_MAX_R8 ( a, b )
#endif

C- Note: a) exch macros were used to switch to  JAM routines (obsolete)
C        b) exch R4 & R8 macros are not practically used ; if needed,
C           call the corresponding S/R directly.
C--   Exchange macros for XY fields, one per storage kind; each one
C     simply calls the S/R of the same name.
#define _EXCH_XY_RL(a,b) CALL EXCH_XY_RL ( a, b )
#define _EXCH_XY_RS(a,b) CALL EXCH_XY_RS ( a, b )
C--   Same for XYZ fields.
#define _EXCH_XYZ_RL(a,b) CALL EXCH_XYZ_RL ( a, b )
#define _EXCH_XYZ_RS(a,b) CALL EXCH_XYZ_RS ( a, b )

C--   Old-style R4 / R8 exchange macros: R4 goes to the RS routine
C     and R8 goes to the RL routine.
C     Needed for some backward compatibility with broken packages.
#if (defined (USE_OLD_MACROS_R4R8toRSRL))
#define _EXCH_XY_R8(a,b) CALL EXCH_XY_RL ( a, b )
#define _EXCH_XY_R4(a,b) CALL EXCH_XY_RS ( a, b )
#define _EXCH_XYZ_R8(a,b) CALL EXCH_XYZ_RL ( a, b )
#define _EXCH_XYZ_R4(a,b) CALL EXCH_XYZ_RS ( a, b )
#endif

C--   Control use of JAM routines for Arctic network (no longer supported)
C     These invoke optimized versions of "exchange" and "sum" that
C     utilize the programmable aspect of Arctic cards.
CXXX No longer supported ; started to remove JAM routines.
CXXX #ifdef LETS_MAKE_JAM
CXXX #define _GLOBAL_SUM_RS(a,b) CALL GLOBAL_SUM_R8_JAM ( a, b)
CXXX #define _GLOBAL_SUM_RL(a,b) CALL GLOBAL_SUM_R8_JAM ( a, b )
CXXX #define _EXCH_XY_RS(a,b) CALL EXCH_XY_R8_JAM ( a, b )
CXXX #define _EXCH_XY_RL(a,b) CALL EXCH_XY_R8_JAM ( a, b )
CXXX #define _EXCH_XYZ_RS(a,b) CALL EXCH_XYZ_R8_JAM ( a, b )
CXXX #define _EXCH_XYZ_RL(a,b) CALL EXCH_XYZ_R8_JAM ( a, b )
CXXX #endif

C--   Control use of "double" precision constants and provide a
C     substitute for 1.D variables.
C     Use D0 where it means REAL*8 but not where it means REAL*16.
C     Sun compilers do not use 8-byte precision for literals
C     unless .Dnn is specified. CRAY vector machines use 16-byte
C     precision when they see .Dnn which runs very slowly!
C     So there are two alternatives: where the exponent marker would
C     give 16 bytes it is blanked out and the F64 wrapper hands its
C     argument through unchanged; everywhere else the wrapper applies
C     DFLOAT to its argument.
#ifndef REAL_D0_IS_16BYTES
#define _F64( a ) DFLOAT( a )
#else
#define D0
#define _F64( a ) a
#endif

C--   Set the format for writing processor IDs, e.g. in S/R eeset_parms
C     and S/R open_copy_data_file. The default of I9.9 (nine digits,
C     padded with leading zeros) should work for a long time (until
C     we use 10**9 processors or more).
#define FMT_PROC_ID 'I9.9'

#endif /* _CPP_EEMACROS_H_ */
1	jmc	1.26	C $Header: /u/gcmpack/MITgcm/eesupp/inc/CPP_EEMACROS.h,v 1.25 2017/08/10 14:06:59 mlosch Exp $
2	adcroft	1.4	C $Name: $
3
4	cnh	1.5	CBOP
5	jmc	1.17	C !ROUTINE: CPP_EEMACROS.h
6	cnh	1.5	C !INTERFACE:
7	jmc	1.26	C include "CPP_EEMACROS.h"
8	cnh	1.5	C !DESCRIPTION:
9			C ==========================================================
10	jmc	1.17	C \| CPP_EEMACROS.h
11	cnh	1.5	C ==========================================================
12	jmc	1.17	C \| C preprocessor "execution environment" supporting
13			C \| macros. Use this file to define macros for simplifying
14			C \| execution environment in which a model runs - as opposed
15			C \| to the dynamical problem the model solves.
16	cnh	1.5	C ==========================================================
17			CEOP
18	adcroft	1.1
19			#ifndef _CPP_EEMACROS_H_
20			#define _CPP_EEMACROS_H_
21
22			C In general the following convention applies:
23			C ALLOW - indicates an feature will be included but it may
24			C CAN have a run-time flag to allow it to be switched
25			C on and off.
26			C If ALLOW or CAN directives are "undef'd" this generally
27			C means that the feature will not be available i.e. it
28			C will not be included in the compiled code and so no
29			C run-time option to use the feature will be available.
30			C
31			C ALWAYS - indicates the choice will be fixed at compile time
32			C so no run-time option will be present
33
34			C Flag used to indicate which flavour of multi-threading
35			C compiler directives to use. Only set one of these.
36			C USE_SOLARIS_THREADING - Takes directives for SUN Workshop
37			C compiler.
38	jmc	1.17	C USE_KAP_THREADING - Takes directives for Kuck and
39	adcroft	1.1	C Associates multi-threading compiler
40			C ( used on Digital platforms ).
41			C USE_IRIX_THREADING - Takes directives for SGI MIPS
42			C Pro Fortran compiler.
43			C USE_EXEMPLAR_THREADING - Takes directives for HP SPP series
44			C compiler.
45			C USE_C90_THREADING - Takes directives for CRAY/SGI C90
46			C system F90 compiler.
47			#ifdef TARGET_SUN
48			#define USE_SOLARIS_THREADING
49	cnh	1.14	#define USING_THREADS
50	adcroft	1.1	#endif
51
52			#ifdef TARGET_DEC
53			#define USE_KAP_THREADING
54	cnh	1.14	#define USING_THREADS
55	adcroft	1.1	#endif
56
57			#ifdef TARGET_SGI
58			#define USE_IRIX_THREADING
59	cnh	1.14	#define USING_THREADS
60	adcroft	1.1	#endif
61
62			#ifdef TARGET_HP
63			#define USE_EXEMPLAR_THREADING
64	cnh	1.14	#define USING_THREADS
65	adcroft	1.1	#endif
66
67			#ifdef TARGET_CRAY_VECTOR
68			#define USE_C90_THREADING
69	cnh	1.14	#define USING_THREADS
70			#endif
71
72			#ifdef USE_OMP_THREADING
73			#define USING_THREADS
74	adcroft	1.1	#endif
75
76			C-- Define the mapping for the _BARRIER macro
77			C On some systems low-level hardware support can be accessed through
78			C compiler directives here.
79			#define _BARRIER CALL BARRIER(myThid)
80
81	jmc	1.17	C-- Define the mapping for the BEGIN_CRIT() and END_CRIT() macros.
82	adcroft	1.1	C On some systems we simply execute this section only using the
83			C master thread i.e. its not really a critical section. We can
84			C do this because we do not use critical sections in any critical
85			C sections of our code!
86			#define _BEGIN_CRIT(a) _BEGIN_MASTER(a)
87			#define _END_CRIT(a) _END_MASTER(a)
88
89			C-- Define the mapping for the BEGIN_MASTER_SECTION() and
90			C END_MASTER_SECTION() macros. These are generally implemented by
91			C simply choosing a particular thread to be "the master" and have
92			C it alone execute the BEGIN_MASTER..., END_MASTER.. sections.
93	cnh	1.13
94			#define _BEGIN_MASTER(a) IF ( a .EQ. 1 ) THEN
95			#define _END_MASTER(a) ENDIF
96			CcnhDebugStarts
97			C Alternate form to the above macros that increments (decrements) a counter each
98			C time a MASTER section is entered (exited). This counter can then be checked in barrier
99			C to try and detect calls to BARRIER within single threaded sections.
100			C Using these macros requires two changes to Makefile - these changes are written
101			C below.
102			C 1 - add a filter to the CPP command to kill off commented _MASTER lines
103			C 2 - add a filter to the CPP output the converts the string N EWLINE to an actual newline.
104			C The N EWLINE needs to be changes to have no space when this macro and Makefile changes
105			C are used. Its in here with a space to stop it getting parsed by the CPP stage in these
106			C comments.
107			C #define _BEGIN_MASTER(a) IF ( a .EQ. 1 ) THEN N EWLINE CALL BARRIER_MS(a)
108			C #define _END_MASTER(a) CALL BARRIER_MU(a) N EWLINE ENDIF
109			C 'CPP = cat $< \| $(TOOLSDIR)/set64bitConst.sh \| grep -v '^[cC].*_MASTER' \| cpp -traditional -P'
110			C .F.f:
111	jmc	1.23	C $(CPP) $(DEFINES) $(INCLUDES) \| sed 's/N EWLINE/\n/' > $@
112	cnh	1.13	CcnhDebugEnds
113	adcroft	1.1
114			C-- Control storage of floating point operands
115			C On many systems it improves performance only to use
116			C 8-byte precision for time stepped variables.
117			C Constant in time terms ( geometric factors etc.. )
118			C can use 4-byte precision, reducing memory utilisation and
119			C boosting performance because of a smaller working
120			C set size. However, on vector CRAY systems this degrades
121			C performance.
122	jmc	1.17	C- Note: global_sum/max macros were used to switch to JAM routines (obsolete);
123			C in addition, since only the R4 & R8 S/R are coded, GLOBAL RS & RL macros
124			C enable to call the corresponding R4 or R8 S/R.
125	adcroft	1.1	#ifdef REAL4_IS_SLOW
126			#define _RS Real*8
127			#define RS_IS_REAL8
128	jmc	1.17	#define _GLOBAL_SUM_RS(a,b) CALL GLOBAL_SUM_R8 ( a, b)
129			#define _GLOBAL_MAX_RS(a,b) CALL GLOBAL_MAX_R8 ( a, b )
130	dimitri	1.6	#define _MPI_TYPE_RS MPI_DOUBLE_PRECISION
131	heimbach	1.21	#ifdef USE_OLD_MACROS_R4R8toRSRL
132	jmc	1.26	#define _GLOBAL_SUM_R4(a,b) CALL GLOBAL_SUM_R8 ( a, b )
133	heimbach	1.21	#define _GLOBAL_MAX_R4(a,b) CALL GLOBAL_MAX_R8 ( a, b )
134			#endif
135	adcroft	1.1	#else
136			#define _RS Real*4
137			#define RS_IS_REAL4
138	jmc	1.17	#define _GLOBAL_SUM_RS(a,b) CALL GLOBAL_SUM_R4 ( a, b )
139			#define _GLOBAL_MAX_RS(a,b) CALL GLOBAL_MAX_R4 ( a, b )
140	dimitri	1.6	#define _MPI_TYPE_RS MPI_REAL
141	heimbach	1.20	#ifdef USE_OLD_MACROS_R4R8toRSRL
142			cph Needed for some backward compatibility with broken packages
143	jmc	1.26	#define _GLOBAL_SUM_R4(a,b) CALL GLOBAL_SUM_R4 ( a, b )
144	heimbach	1.20	#define _GLOBAL_MAX_R4(a,b) CALL GLOBAL_MAX_R4 ( a, b )
145			#endif
146	heimbach	1.21	#endif
147	adcroft	1.1
148			#define _RL Real*8
149	edhill	1.15	#define RL_IS_REAL8
150	jmc	1.17	#define _GLOBAL_SUM_RL(a,b) CALL GLOBAL_SUM_R8 ( a, b )
151			#define _GLOBAL_MAX_RL(a,b) CALL GLOBAL_MAX_R8 ( a, b )
152	heimbach	1.19	#ifdef USE_OLD_MACROS_R4R8toRSRL
153	heimbach	1.18	cph Needed for some backward compatibility with broken packages
154			#define _GLOBAL_SUM_R8(a,b) CALL GLOBAL_SUM_R8 ( a, b )
155			#define _GLOBAL_MAX_R8(a,b) CALL GLOBAL_MAX_R8 ( a, b )
156	heimbach	1.19	#endif
157	dimitri	1.6	#define _MPI_TYPE_RL MPI_DOUBLE_PRECISION
158	adcroft	1.4
159	dimitri	1.9	#define _MPI_TYPE_R4 MPI_REAL
160	ce107	1.12	#if (defined (TARGET_SGI) \|\| defined (TARGET_AIX) \|\| defined (TARGET_LAM))
161	dimitri	1.9	#define _MPI_TYPE_R8 MPI_DOUBLE_PRECISION
162			#else
163			#define _MPI_TYPE_R8 MPI_REAL8
164			#endif
165			#define _R4 Real*4
166			#define _R8 Real*8
167	adcroft	1.4
168	jmc	1.17	C- Note: a) exch macros were used to switch to JAM routines (obsolete)
169			C b) exch R4 & R8 macros are not practically used ; if needed,
170			C will directly call the corrresponding S/R.
171			#define _EXCH_XY_RS(a,b) CALL EXCH_XY_RS ( a, b )
172			#define _EXCH_XY_RL(a,b) CALL EXCH_XY_RL ( a, b )
173			#define _EXCH_XYZ_RS(a,b) CALL EXCH_XYZ_RS ( a, b )
174			#define _EXCH_XYZ_RL(a,b) CALL EXCH_XYZ_RL ( a, b )
175	heimbach	1.19	#ifdef USE_OLD_MACROS_R4R8toRSRL
176	heimbach	1.18	cph Needed for some backward compatibility with broken packages
177			#define _EXCH_XY_R4(a,b) CALL EXCH_XY_RS ( a, b )
178			#define _EXCH_XY_R8(a,b) CALL EXCH_XY_RL ( a, b )
179			#define _EXCH_XYZ_R4(a,b) CALL EXCH_XYZ_RS ( a, b )
180			#define _EXCH_XYZ_R8(a,b) CALL EXCH_XYZ_RL ( a, b )
181	heimbach	1.19	#endif
182	jmc	1.17
183			C-- Control use of JAM routines for Artic network (no longer supported)
184	adcroft	1.4	C These invoke optimized versions of "exchange" and "sum" that
185			C utilize the programmable aspect of Artic cards.
186	jmc	1.22	CXXX No longer supported ; started to remove JAM routines.
187			CXXX #ifdef LETS_MAKE_JAM
188			CXXX #define _GLOBAL_SUM_RS(a,b) CALL GLOBAL_SUM_R8_JAM ( a, b)
189			CXXX #define _GLOBAL_SUM_RL(a,b) CALL GLOBAL_SUM_R8_JAM ( a, b )
190			CXXX #define _EXCH_XY_RS(a,b) CALL EXCH_XY_R8_JAM ( a, b )
191			CXXX #define _EXCH_XY_RL(a,b) CALL EXCH_XY_R8_JAM ( a, b )
192			CXXX #define _EXCH_XYZ_RS(a,b) CALL EXCH_XYZ_R8_JAM ( a, b )
193			CXXX #define _EXCH_XYZ_RL(a,b) CALL EXCH_XYZ_R8_JAM ( a, b )
194			CXXX #endif
195	jmc	1.17
196	adcroft	1.1	C-- Control use of "double" precision constants.
197			C Use D0 where it means REAL8 but not where it means REAL16
198			#ifdef REAL_D0_IS_16BYTES
199			#define D0
200			#endif
201
202			C-- Substitue for 1.D variables
203			C Sun compilers do not use 8-byte precision for literals
204			C unless .Dnn is specified. CRAY vector machines use 16-byte
205			C precision when they see .Dnn which runs very slowly!
206			#ifdef REAL_D0_IS_16BYTES
207			#define _F64( a ) a
208			#endif
209			#ifndef REAL_D0_IS_16BYTES
210			#define _F64( a ) DFLOAT( a )
211			#endif
212
213	mlosch	1.25	C-- Set the format for writing processor IDs, e.g. in S/R eeset_parms
214			C and S/R open_copy_data_file. The default of I9.9 should work for
215			C a long time (until we will use 10e10 processors and more)
216			#define FMT_PROC_ID 'I9.9'
217
218	adcroft	1.1	#endif /* _CPP_EEMACROS_H_ */