1 |
C $Header: $ |
2 |
|
3 |
#include "CPP_EEOPTIONS.h" |
4 |
|
5 |
#ifndef JAM_WITH_TWO_PROCS_PER_NODE |
6 |
C Single processor JAM stuff |
7 |
|
8 |
#undef USE_MPI_EXCH |
9 |
#define USE_JAM_EXCH |
10 |
|
11 |
SUBROUTINE EXCH_XY_O1_R8_JAM( arr ) |
12 |
|
13 |
IMPLICIT NONE |
14 |
C Width 1. Single tile. No X-axis decomp. |
15 |
C No. corner update. Exchange. |
16 |
|
17 |
#define _OLx 1 |
18 |
#define _OLy 1 |
19 |
|
20 |
C == Global variables == |
21 |
#include "SIZE.h" |
22 |
#include "EEPARAMS.h" |
23 |
#include "EXCH_JAM.h" |
24 |
|
25 |
#include "MPI_INFO.h" |
26 |
#include "JAM_INFO.h" |
27 |
|
28 |
C == Compile time constants == |
29 |
|
30 |
C == Routine arguments == |
31 |
Real*8 arr(1-_OLx:sNx+_OLx,1-_OLy:sNy+_OLy) |
32 |
|
33 |
#ifdef LETS_MAKE_JAM |
34 |
|
35 |
C == Local variables == |
36 |
INTEGER I, J |
37 |
INTEGER northProc, southProc |
38 |
INTEGER farProc1, farProc2 |
39 |
INTEGER toPid, fromPid |
40 |
INTEGER rc |
41 |
|
42 |
#ifdef ALLOW_MPI |
43 |
INTEGER mpiStatus(MPI_STATUS_SIZE) |
44 |
#endif |
45 |
|
46 |
C East-west halo update (without corners) |
47 |
DO J=1,sNy |
48 |
DO I=1,_OLx |
49 |
arr(1-I ,J) = arr(sNx-I+1,J) |
50 |
arr(sNx+I,J) = arr(1+I-1 ,J) |
51 |
ENDDO |
52 |
ENDDO |
53 |
|
54 |
C Phase 1 pairing |
55 |
C | 0 | ---> | 1 | |
56 |
C | 0 | <--- | 1 | |
57 |
|
58 |
C | 2 | ---> | 3 | |
59 |
C | 2 | <--- | 3 | |
60 |
|
61 |
C | 4 | ---> | 5 | |
62 |
C | 4 | <--- | 5 | |
63 |
|
64 |
C etc ... |
65 |
C |
66 |
|
67 |
#ifdef USE_MPI_EXCH |
68 |
C North-south halo update (without corners) |
69 |
C Put my edges into a buffers |
70 |
IF ( MOD(myProcId,2) .EQ. 0 ) THEN |
71 |
DO I=1,sNx |
72 |
exchBuf1(I) = arr(I,sNy) |
73 |
exchBuf2(I) = arr(I,1 ) |
74 |
ENDDO |
75 |
ELSE |
76 |
DO I=1,sNx |
77 |
exchBuf1(I) = arr(I,1 ) |
78 |
exchBuf2(I) = arr(I,sNy) |
79 |
ENDDO |
80 |
ENDIF |
81 |
|
82 |
C Exchange the buffers |
83 |
northProc = mpi_northId |
84 |
southProc = mpi_southId |
85 |
IF ( MOD(myProcId,2) .EQ. 0 ) THEN |
86 |
farProc1 = northProc |
87 |
farProc2 = southProc |
88 |
ELSE |
89 |
farProc1 = southProc |
90 |
farProc2 = northProc |
91 |
ENDIF |
92 |
C Even-odd pairs |
93 |
IF ( farProc1 .NE. myProcId ) THEN |
94 |
CALL MPI_Sendrecv_replace(exchBuf1,sNx,MPI_REAL8, |
95 |
& farProc1,0, |
96 |
& farProc1,MPI_ANY_TAG, |
97 |
& MPI_COMM_WORLD,mpiStatus, |
98 |
& rc) |
99 |
ENDIF |
100 |
C Odd-even pairs |
101 |
IF ( farProc2 .NE. myProcId ) THEN |
102 |
CALL MPI_Sendrecv_replace(exchBuf2,sNx,MPI_REAL8, |
103 |
& farProc2,0, |
104 |
& farProc2,MPI_ANY_TAG, |
105 |
& MPI_COMM_WORLD,mpiStatus, |
106 |
& rc) |
107 |
ENDIF |
108 |
#endif |
109 |
|
110 |
#ifdef USE_JAM_EXCH |
111 |
northProc = jam_northId |
112 |
southProc = jam_southId |
113 |
IF ( MOD(myProcId,2) .EQ. 0 ) THEN |
114 |
C sendBuf1 = &arr(1,sNy ) |
115 |
C recvBuf1 = &arr(1,sNy+1) |
116 |
C sendBuf2 = &arr(1,1 ) |
117 |
C recvBuf2 = &arr(1,0 ) |
118 |
farProc1 = northProc |
119 |
farProc2 = southProc |
120 |
IF ( farProc1 .NE. myProcId ) THEN |
121 |
CALL JAM_EXCHANGE(farProc1,arr(1,sNy),arr(1,sNy+1), |
122 |
& sNx*8,jam_exchKey) |
123 |
jam_exchKey = jam_exchKey+1 |
124 |
ENDIF |
125 |
IF ( farProc2 .NE. myProcId ) THEN |
126 |
CALL JAM_EXCHANGE(farProc2,arr(1,1),arr(1,0), |
127 |
& sNx*8,jam_exchKey) |
128 |
jam_exchKey = jam_exchKey+1 |
129 |
ENDIF |
130 |
ELSE |
131 |
C sendBuf1 = &arr(1,1 ) |
132 |
C recvBuf1 = &arr(1,0 ) |
133 |
C sendBuf2 = &arr(1,sNy ) |
134 |
C recvBuf2 = &arr(1,sNy+1) |
135 |
farProc1 = southProc |
136 |
farProc2 = northProc |
137 |
IF ( farProc1 .NE. myProcId ) THEN |
138 |
CALL JAM_EXCHANGE(farProc1,arr(1,1),arr(1,0), |
139 |
& sNx*8,jam_exchKey) |
140 |
jam_exchKey = jam_exchKey+1 |
141 |
ENDIF |
142 |
IF ( farProc2 .NE. myProcId ) THEN |
143 |
CALL JAM_EXCHANGE(farProc2,arr(1,sNy),arr(1,sNy+1), |
144 |
& sNx*8,jam_exchKey) |
145 |
jam_exchKey = jam_exchKey+1 |
146 |
ENDIF |
147 |
ENDIF |
148 |
C IF ( farProc1 .NE. myProcId ) THEN |
149 |
C CALL JAM_EXCHANGE(farProc1,sendBuf1,recvBuf1,sNx*8,jam_exchKey) |
150 |
C jam_exchKey = jam_exchKey+1 |
151 |
C ENDIF |
152 |
C IF ( farProc2 .NE. myProcId ) THEN |
153 |
C CALL JAM_EXCHANGE(farProc2,sendBuf2,recvBuf2,sNx*8,jam_exchKey) |
154 |
C jam_exchKey = jam_exchKey+1 |
155 |
C ENDIF |
156 |
#endif |
157 |
|
158 |
#ifdef USE_MPI_EXCH |
159 |
C Fill overlap regions from the buffers |
160 |
IF ( MOD(myProcId,2) .EQ. 0 ) THEN |
161 |
DO I=1,sNx |
162 |
arr(I,sNy+1) = exchBuf1(I) |
163 |
arr(I,0 ) = exchBuf2(I) |
164 |
ENDDO |
165 |
ELSE |
166 |
DO I=1,sNx |
167 |
arr(I,sNy+1) = exchBuf2(I) |
168 |
arr(I,0 ) = exchBuf1(I) |
169 |
ENDDO |
170 |
ENDIF |
171 |
#endif |
172 |
|
173 |
IF ( numberOfProcs .EQ. 1 ) THEN |
174 |
DO I=1,sNx |
175 |
arr(I,sNy+1) = arr(I,1 ) |
176 |
arr(I,0 ) = arr(I,sNy) |
177 |
ENDDO |
178 |
ENDIF |
179 |
|
180 |
RETURN |
181 |
END |
182 |
|
183 |
SUBROUTINE EXCH_XY_R8_JAM( arr ) |
184 |
|
185 |
IMPLICIT NONE |
186 |
|
187 |
C Full width. Single tile. No X-axis decomp. |
188 |
C exchange. |
189 |
|
190 |
C == Global variables == |
191 |
#include "SIZE.h" |
192 |
#include "EEPARAMS.h" |
193 |
#include "EESUPPORT.h" |
194 |
#include "EXCH_JAM.h" |
195 |
|
196 |
#include "MPI_INFO.h" |
197 |
#include "JAM_INFO.h" |
198 |
|
199 |
C == Routine arguments == |
200 |
REAL*8 arr(1-OLx:sNx+OLx,1-OLy:sNy+OLy) |
201 |
|
202 |
C == Local variables == |
203 |
INTEGER I, J |
204 |
INTEGER iLo, iHi, I0 |
205 |
INTEGER northProc, southProc |
206 |
INTEGER farProc1, farProc2 |
207 |
INTEGER toPid, fromPid |
208 |
INTEGER rc |
209 |
|
210 |
#ifdef ALLOW_MPI |
211 |
INTEGER mpiStatus(MPI_STATUS_SIZE) |
212 |
#endif |
213 |
|
214 |
C East-west halo update |
215 |
DO J=1-OLy,sNy+OLy |
216 |
DO I=1,OLx |
217 |
arr(1-I ,J) = arr(sNx-I+1,J) |
218 |
arr(sNx+I,J) = arr(1+I-1 ,J) |
219 |
ENDDO |
220 |
ENDDO |
221 |
|
222 |
C Phase 1 pairing |
223 |
C | 0 | ---> | 1 | |
224 |
C | 0 | <--- | 1 | |
225 |
|
226 |
C | 2 | ---> | 3 | |
227 |
C | 2 | <--- | 3 | |
228 |
|
229 |
C | 4 | ---> | 5 | |
230 |
C | 4 | <--- | 5 | |
231 |
|
232 |
C etc ... |
233 |
C |
234 |
|
235 |
#ifdef USE_MPI_EXCH |
236 |
C North-south halo update (including corners) |
237 |
C Put my edges into a buffers |
238 |
IF ( MOD(myProcId,2) .EQ. 0 ) THEN |
239 |
DO J=1,OLy |
240 |
iLo= 1-OLx |
241 |
iHi= sNx+OLx |
242 |
I0 = (J-1)*(iHi-iLo)+1 |
243 |
DO I=iLo,iHi |
244 |
exchBuf1(I0+I-iLo) = arr(I,sNy-OLy+J) |
245 |
exchBuf2(I0+I-iLo) = arr(I,1+J-1 ) |
246 |
ENDDO |
247 |
ENDDO |
248 |
ELSE |
249 |
DO J=1,OLy |
250 |
iLo= 1-OLx |
251 |
iHi= sNx+OLx |
252 |
I0 = (J-1)*(iHi-iLo)+1 |
253 |
DO I=iLo,iHi |
254 |
exchBuf1(I0+I-iLo) = arr(I,1+J-1 ) |
255 |
exchBuf2(I0+I-iLo) = arr(I,sNy-OLy+J) |
256 |
ENDDO |
257 |
ENDDO |
258 |
ENDIF |
259 |
|
260 |
C Exchange the buffers |
261 |
northProc = mpi_northId |
262 |
southProc = mpi_southId |
263 |
IF ( MOD(myProcId,2) .EQ. 0 ) THEN |
264 |
farProc1 = northProc |
265 |
farProc2 = southProc |
266 |
ELSE |
267 |
farProc1 = southProc |
268 |
farProc2 = northProc |
269 |
ENDIF |
270 |
|
271 |
C Even-odd pairs |
272 |
IF ( farProc1 .NE. myProcId ) THEN |
273 |
CALL MPI_Sendrecv_replace(exchBuf1,OLy*(sNx+2*OLx),MPI_REAL8, |
274 |
& farProc1,0, |
275 |
& farProc1,MPI_ANY_TAG, |
276 |
& MPI_COMM_WORLD,mpiStatus, |
277 |
& rc) |
278 |
ENDIF |
279 |
C Odd-even pairs |
280 |
IF ( farProc2 .NE. myProcId ) THEN |
281 |
CALL MPI_Sendrecv_replace(exchBuf2,OLy*(sNx+2*OLx),MPI_REAL8, |
282 |
& farProc2,0, |
283 |
& farProc2,MPI_ANY_TAG, |
284 |
& MPI_COMM_WORLD,mpiStatus, |
285 |
& rc) |
286 |
ENDIF |
287 |
|
288 |
C Fill overlap regions from the buffers |
289 |
IF ( MOD(myProcId,2) .EQ. 0 ) THEN |
290 |
DO J=1,OLy |
291 |
iLo= 1-OLx |
292 |
iHi= sNx+OLx |
293 |
I0 = (J-1)*(iHi-iLo)+1 |
294 |
DO I=iLo,iHi |
295 |
arr(I,sNy+J ) = exchBuf1(I0+I-iLo) |
296 |
arr(I,1-OLy+J-1) = exchBuf2(I0+I-iLo) |
297 |
ENDDO |
298 |
ENDDO |
299 |
ELSE |
300 |
DO J=1,OLy |
301 |
iLo= 1-OLx |
302 |
iHi= sNx+OLx |
303 |
I0 = (J-1)*(iHi-iLo)+1 |
304 |
DO I=iLo,iHi |
305 |
arr(I,sNy+J ) = exchBuf2(I0+I-iLo) |
306 |
arr(I,1-OLy+J-1 ) = exchBuf1(I0+I-iLo) |
307 |
ENDDO |
308 |
ENDDO |
309 |
ENDIF |
310 |
#endif |
311 |
|
312 |
#ifdef USE_JAM_EXCH |
313 |
northProc = jam_northId |
314 |
southProc = jam_southId |
315 |
IF ( MOD(myProcId,2) .EQ. 0 ) THEN |
316 |
C sendBuf1 = &arr(1-OLx,sNy-OLy+1) |
317 |
C recvBuf1 = &arr(1-OLx,sNy+1 ) |
318 |
C sendBuf2 = &arr(1-OLx,1 ) |
319 |
C recvBuf2 = &arr(1-OLx,1-OLy ) |
320 |
farProc1 = northProc |
321 |
farProc2 = southProc |
322 |
IF ( farProc1 .NE. myProcId ) THEN |
323 |
CALL JAM_EXCHANGE(farProc1, |
324 |
& arr(1-OLx,sNy-OLy+1), |
325 |
& arr(1-OLx,sNy+1 ), |
326 |
& OLy*(sNx+2*OLx)*8, |
327 |
& jam_exchKey) |
328 |
jam_exchKey = jam_exchKey+1 |
329 |
ENDIF |
330 |
IF ( farProc2 .NE. myProcId ) THEN |
331 |
CALL JAM_EXCHANGE(farProc2, |
332 |
& arr(1-OLx,1 ), |
333 |
& arr(1-OLx,1-OLy ), |
334 |
& OLy*(sNx+2*OLx)*8, |
335 |
& jam_exchKey) |
336 |
jam_exchKey = jam_exchKey+1 |
337 |
ENDIF |
338 |
ELSE |
339 |
C sendBuf1 = &arr(1-OLx,1 ) |
340 |
C recvBuf1 = &arr(1-OLx,1-OLy ) |
341 |
C sendBuf2 = &arr(1-OLx,sNy-OLy+1) |
342 |
C recvBuf2 = &arr(1-OLx,sNy+1 ) |
343 |
farProc1 = southProc |
344 |
farProc2 = northProc |
345 |
IF ( farProc1 .NE. myProcId ) THEN |
346 |
CALL JAM_EXCHANGE(farProc1, |
347 |
& arr(1-OLx,1 ), |
348 |
& arr(1-OLx,1-OLy ), |
349 |
& OLy*(sNx+2*OLx)*8, |
350 |
& jam_exchKey) |
351 |
jam_exchKey = jam_exchKey+1 |
352 |
ENDIF |
353 |
IF ( farProc2 .NE. myProcId ) THEN |
354 |
CALL JAM_EXCHANGE(farProc2, |
355 |
& arr(1-OLx,sNy-OLy+1), |
356 |
& arr(1-OLx,sNy+1 ), |
357 |
& OLy*(sNx+2*OLx)*8, |
358 |
& jam_exchKey) |
359 |
jam_exchKey = jam_exchKey+1 |
360 |
ENDIF |
361 |
ENDIF |
362 |
#endif |
363 |
|
364 |
IF ( numberOfProcs .EQ. 1 ) THEN |
365 |
DO J=1,OLy |
366 |
iLo= 1-OLx |
367 |
iHi= sNx+OLx |
368 |
DO I=iLo,iHi |
369 |
arr(I,sNy+J ) = arr(I,1+J-1 ) |
370 |
arr(I,1-OLy+J-1) = arr(I,sNy-OLy+J) |
371 |
ENDDO |
372 |
ENDDO |
373 |
ENDIF |
374 |
|
375 |
RETURN |
376 |
END |
377 |
SUBROUTINE EXCH_XYZ_R8_JAM( arr ) |
378 |
IMPLICIT NONE |
379 |
|
380 |
C Full width, 3d. Single tile. No X-axis decomp. |
381 |
C exchange. |
382 |
|
383 |
C == Global variables == |
384 |
#include "SIZE.h" |
385 |
#include "EEPARAMS.h" |
386 |
#include "EESUPPORT.h" |
387 |
#include "EXCH_JAM.h" |
388 |
|
389 |
#include "MPI_INFO.h" |
390 |
#include "JAM_INFO.h" |
391 |
|
392 |
C == Routine arguments == |
393 |
REAL*8 arr(1-OLx:sNx+OLx,1-OLy:sNy+OLy,1:Nr) |
394 |
|
395 |
C == Local variables == |
396 |
INTEGER I, J, K |
397 |
INTEGER iLo, iHi, I0 |
398 |
INTEGER northProc, southProc |
399 |
INTEGER farProc1, farProc2 |
400 |
INTEGER toPid, fromPid |
401 |
INTEGER rc |
402 |
|
403 |
#ifdef ALLOW_MPI |
404 |
INTEGER mpiStatus(MPI_STATUS_SIZE) |
405 |
#endif |
406 |
|
407 |
C East-west halo update |
408 |
DO K=1,Nr |
409 |
DO J=1-OLy,sNy+OLy |
410 |
DO I=1,OLx |
411 |
arr(1-I ,J,K) = arr(sNx-I+1,J,K) |
412 |
arr(sNx+I,J,K) = arr(1+I-1 ,J,K) |
413 |
ENDDO |
414 |
ENDDO |
415 |
ENDDO |
416 |
|
417 |
C Phase 1 pairing |
418 |
C | 0 | ---> | 1 | |
419 |
C | 0 | <--- | 1 | |
420 |
|
421 |
C | 2 | ---> | 3 | |
422 |
C | 2 | <--- | 3 | |
423 |
|
424 |
C | 4 | ---> | 5 | |
425 |
C | 4 | <--- | 5 | |
426 |
|
427 |
C etc ... |
428 |
C |
429 |
|
430 |
#ifdef USE_MPI_EXCH |
431 |
C North-south halo update (including corners) |
432 |
DO K=1,Nr |
433 |
C Put my edges into a buffers |
434 |
IF ( MOD(myProcId,2) .EQ. 0 ) THEN |
435 |
DO J=1,OLy |
436 |
iLo= 1-OLx |
437 |
iHi= sNx+OLx |
438 |
I0 = (J-1)*(iHi-iLo)+1 |
439 |
DO I=iLo,iHi |
440 |
exchBuf1(I0+I-iLo) = arr(I,sNy-OLy+J,K) |
441 |
exchBuf2(I0+I-iLo) = arr(I,1+J-1 ,K) |
442 |
ENDDO |
443 |
ENDDO |
444 |
ELSE |
445 |
DO J=1,OLy |
446 |
iLo= 1-OLx |
447 |
iHi= sNx+OLx |
448 |
I0 = (J-1)*(iHi-iLo)+1 |
449 |
DO I=iLo,iHi |
450 |
exchBuf1(I0+I-iLo) = arr(I,1+J-1 ,K) |
451 |
exchBuf2(I0+I-iLo) = arr(I,sNy-OLy+J,K) |
452 |
ENDDO |
453 |
ENDDO |
454 |
ENDIF |
455 |
|
456 |
C Exchange the buffers |
457 |
northProc = mpi_northId |
458 |
southProc = mpi_southId |
459 |
IF ( MOD(myProcId,2) .EQ. 0 ) THEN |
460 |
farProc1 = northProc |
461 |
farProc2 = southProc |
462 |
ELSE |
463 |
farProc1 = southProc |
464 |
farProc2 = northProc |
465 |
ENDIF |
466 |
C Even-odd pairs |
467 |
IF ( farProc1 .NE. myProcId ) THEN |
468 |
CALL MPI_Sendrecv_replace(exchBuf1,OLy*(sNx+2*OLx),MPI_REAL8, |
469 |
& farProc1,0, |
470 |
& farProc1,MPI_ANY_TAG, |
471 |
& MPI_COMM_WORLD,mpiStatus, |
472 |
& rc) |
473 |
ENDIF |
474 |
C Odd-even pairs |
475 |
IF ( farProc2 .NE. myProcId ) THEN |
476 |
CALL MPI_Sendrecv_replace(exchBuf2,OLy*(sNx+2*OLx),MPI_REAL8, |
477 |
& farProc2,0, |
478 |
& farProc2,MPI_ANY_TAG, |
479 |
& MPI_COMM_WORLD,mpiStatus, |
480 |
& rc) |
481 |
ENDIF |
482 |
|
483 |
C Fill overlap regions from the buffers |
484 |
IF ( MOD(myProcId,2) .EQ. 0 ) THEN |
485 |
DO J=1,OLy |
486 |
iLo= 1-OLx |
487 |
iHi= sNx+OLx |
488 |
I0 = (J-1)*(iHi-iLo)+1 |
489 |
DO I=iLo,iHi |
490 |
arr(I,sNy+J ,K) = exchBuf1(I0+I-iLo) |
491 |
arr(I,1-OLy+J-1,K) = exchBuf2(I0+I-iLo) |
492 |
ENDDO |
493 |
ENDDO |
494 |
ELSE |
495 |
DO J=1,OLy |
496 |
iLo= 1-OLx |
497 |
iHi= sNx+OLx |
498 |
I0 = (J-1)*(iHi-iLo)+1 |
499 |
DO I=iLo,iHi |
500 |
arr(I,sNy+J ,K) = exchBuf2(I0+I-iLo) |
501 |
arr(I,1-OLy+J-1 ,K) = exchBuf1(I0+I-iLo) |
502 |
ENDDO |
503 |
ENDDO |
504 |
ENDIF |
505 |
ENDDO |
506 |
#endif |
507 |
|
508 |
#ifdef USE_JAM_EXCH |
509 |
northProc = jam_northId |
510 |
southProc = jam_southId |
511 |
DO K=1,Nr |
512 |
IF ( MOD(myProcId,2) .EQ. 0 ) THEN |
513 |
C sendBuf1 = &arr(1-OLx,sNy-OLy+1) |
514 |
C recvBuf1 = &arr(1-OLx,sNy+1 ) |
515 |
C sendBuf2 = &arr(1-OLx,1 ) |
516 |
C recvBuf2 = &arr(1-OLx,1-OLy ) |
517 |
farProc1 = northProc |
518 |
farProc2 = southProc |
519 |
IF ( farProc1 .NE. myProcId ) THEN |
520 |
CALL JAM_EXCHANGE(farProc1, |
521 |
& arr(1-OLx,sNy-OLy+1,K), |
522 |
& arr(1-OLx,sNy+1 ,K), |
523 |
& OLy*(sNx+2*OLx)*8, |
524 |
& jam_exchKey) |
525 |
jam_exchKey = jam_exchKey+1 |
526 |
ENDIF |
527 |
IF ( farProc2 .NE. myProcId ) THEN |
528 |
CALL JAM_EXCHANGE(farProc2, |
529 |
& arr(1-OLx,1 ,K), |
530 |
& arr(1-OLx,1-OLy ,K), |
531 |
& OLy*(sNx+2*OLx)*8, |
532 |
& jam_exchKey) |
533 |
jam_exchKey = jam_exchKey+1 |
534 |
ENDIF |
535 |
ELSE |
536 |
C sendBuf1 = &arr(1-OLx,1 ) |
537 |
C recvBuf1 = &arr(1-OLx,1-OLy ) |
538 |
C sendBuf2 = &arr(1-OLx,sNy-OLy+1) |
539 |
C recvBuf2 = &arr(1-OLx,sNy+1 ) |
540 |
farProc1 = southProc |
541 |
farProc2 = northProc |
542 |
IF ( farProc1 .NE. myProcId ) THEN |
543 |
CALL JAM_EXCHANGE(farProc1, |
544 |
& arr(1-OLx,1 ,K), |
545 |
& arr(1-OLx,1-OLy ,K), |
546 |
& OLy*(sNx+2*OLx)*8, |
547 |
& jam_exchKey) |
548 |
jam_exchKey = jam_exchKey+1 |
549 |
ENDIF |
550 |
IF ( farProc2 .NE. myProcId ) THEN |
551 |
CALL JAM_EXCHANGE(farProc2, |
552 |
& arr(1-OLx,sNy-OLy+1,K), |
553 |
& arr(1-OLx,sNy+1 ,K), |
554 |
& OLy*(sNx+2*OLx)*8, |
555 |
& jam_exchKey) |
556 |
jam_exchKey = jam_exchKey+1 |
557 |
ENDIF |
558 |
ENDIF |
559 |
ENDDO |
560 |
#endif |
561 |
|
562 |
IF ( numberOfProcs .EQ. 1 ) THEN |
563 |
DO K=1,Nr |
564 |
DO J=1,OLy |
565 |
iLo= 1-OLx |
566 |
iHi= sNx+OLx |
567 |
DO I=iLo,iHi |
568 |
arr(I,sNy+J ,K) = arr(I,1+J-1 ,K) |
569 |
arr(I,1-OLy+J-1,K) = arr(I,sNy-OLy+J,K) |
570 |
ENDDO |
571 |
ENDDO |
572 |
ENDDO |
573 |
ENDIF |
574 |
|
575 |
RETURN |
576 |
END |
577 |
|
578 |
#undef USE_MPI_EXCH |
579 |
#define USE_JAM_EXCH |
580 |
|
581 |
SUBROUTINE EXCH_XY_O1_R4_JAM( arr ) |
582 |
|
583 |
IMPLICIT NONE |
584 |
C Width 1. Single tile. No X-axis decomp. |
585 |
C No. corner update. Exchange. |
586 |
|
587 |
#define ALLOW_MPI |
588 |
#define _OLx 1 |
589 |
#define _OLy 1 |
590 |
|
591 |
C == Global variables == |
592 |
#include "SIZE.h" |
593 |
#include "EEPARAMS.h" |
594 |
#include "EESUPPORT.h" |
595 |
#include "EXCH_JAM.h" |
596 |
|
597 |
#include "MPI_INFO.h" |
598 |
#include "JAM_INFO.h" |
599 |
|
600 |
C == Compile time constants == |
601 |
|
602 |
C == Routine arguments == |
603 |
REAL*4 arr(1-_OLx:sNx+_OLx,1-_OLy:sNy+_OLy) |
604 |
|
605 |
C == Local variables == |
606 |
INTEGER I, J |
607 |
INTEGER northProc, southProc |
608 |
INTEGER farProc1, farProc2 |
609 |
INTEGER toPid, fromPid |
610 |
INTEGER rc |
611 |
|
612 |
#ifdef ALLOW_MPI |
613 |
INTEGER mpiStatus(MPI_STATUS_SIZE) |
614 |
#endif |
615 |
|
616 |
C East-west halo update (without corners) |
617 |
DO J=1,sNy |
618 |
DO I=1,_OLx |
619 |
arr(1-I ,J) = arr(sNx-I+1,J) |
620 |
arr(sNx+I,J) = arr(1+I-1 ,J) |
621 |
ENDDO |
622 |
ENDDO |
623 |
|
624 |
C Phase 1 pairing |
625 |
C | 0 | ---> | 1 | |
626 |
C | 0 | <--- | 1 | |
627 |
|
628 |
C | 2 | ---> | 3 | |
629 |
C | 2 | <--- | 3 | |
630 |
|
631 |
C | 4 | ---> | 5 | |
632 |
C | 4 | <--- | 5 | |
633 |
|
634 |
C etc ... |
635 |
C |
636 |
|
637 |
#ifdef USE_MPI_EXCH |
638 |
C North-south halo update (without corners) |
639 |
C Put my edges into a buffers |
640 |
IF ( MOD(myProcId,2) .EQ. 0 ) THEN |
641 |
DO I=1,sNx |
642 |
exchBuf1(I) = arr(I,sNy) |
643 |
exchBuf2(I) = arr(I,1 ) |
644 |
ENDDO |
645 |
ELSE |
646 |
DO I=1,sNx |
647 |
exchBuf1(I) = arr(I,1 ) |
648 |
exchBuf2(I) = arr(I,sNy) |
649 |
ENDDO |
650 |
ENDIF |
651 |
|
652 |
C Exchange the buffers |
653 |
northProc = mpi_northId |
654 |
southProc = mpi_southId |
655 |
IF ( MOD(myProcId,2) .EQ. 0 ) THEN |
656 |
farProc1 = northProc |
657 |
farProc2 = southProc |
658 |
ELSE |
659 |
farProc1 = southProc |
660 |
farProc2 = northProc |
661 |
ENDIF |
662 |
C Even-odd pairs |
663 |
IF ( farProc1 .NE. myProcId ) THEN |
664 |
CALL MPI_Sendrecv_replace(exchBuf1,sNx,MPI_REAL8, |
665 |
& farProc1,0, |
666 |
& farProc1,MPI_ANY_TAG, |
667 |
& MPI_COMM_WORLD,mpiStatus, |
668 |
& rc) |
669 |
ENDIF |
670 |
C Odd-even pairs |
671 |
IF ( farProc2 .NE. myProcId ) THEN |
672 |
CALL MPI_Sendrecv_replace(exchBuf2,sNx,MPI_REAL8, |
673 |
& farProc2,0, |
674 |
& farProc2,MPI_ANY_TAG, |
675 |
& MPI_COMM_WORLD,mpiStatus, |
676 |
& rc) |
677 |
ENDIF |
678 |
#endif |
679 |
|
680 |
#ifdef USE_JAM_EXCH |
681 |
northProc = jam_northId |
682 |
southProc = jam_southId |
683 |
IF ( MOD(myProcId,2) .EQ. 0 ) THEN |
684 |
C sendBuf1 = &arr(1,sNy ) |
685 |
C recvBuf1 = &arr(1,sNy+1) |
686 |
C sendBuf2 = &arr(1,1 ) |
687 |
C recvBuf2 = &arr(1,0 ) |
688 |
farProc1 = northProc |
689 |
farProc2 = southProc |
690 |
IF ( farProc1 .NE. myProcId ) THEN |
691 |
CALL JAM_EXCHANGE(farProc1,arr(1,sNy),arr(1,sNy+1), |
692 |
& sNx*4,jam_exchKey) |
693 |
jam_exchKey = jam_exchKey+1 |
694 |
ENDIF |
695 |
IF ( farProc2 .NE. myProcId ) THEN |
696 |
CALL JAM_EXCHANGE(farProc2,arr(1,1),arr(1,0), |
697 |
& sNx*4,jam_exchKey) |
698 |
jam_exchKey = jam_exchKey+1 |
699 |
ENDIF |
700 |
ELSE |
701 |
C sendBuf1 = &arr(1,1 ) |
702 |
C recvBuf1 = &arr(1,0 ) |
703 |
C sendBuf2 = &arr(1,sNy ) |
704 |
C recvBuf2 = &arr(1,sNy+1) |
705 |
farProc1 = southProc |
706 |
farProc2 = northProc |
707 |
IF ( farProc1 .NE. myProcId ) THEN |
708 |
CALL JAM_EXCHANGE(farProc1,arr(1,1),arr(1,0), |
709 |
& sNx*4,jam_exchKey) |
710 |
jam_exchKey = jam_exchKey+1 |
711 |
ENDIF |
712 |
IF ( farProc2 .NE. myProcId ) THEN |
713 |
CALL JAM_EXCHANGE(farProc2,arr(1,sNy),arr(1,sNy+1), |
714 |
& sNx*4,jam_exchKey) |
715 |
jam_exchKey = jam_exchKey+1 |
716 |
ENDIF |
717 |
ENDIF |
718 |
C IF ( farProc1 .NE. myProcId ) THEN |
719 |
C CALL JAM_EXCHANGE(farProc1,sendBuf1,recvBuf1,sNx*8,jam_exchKey) |
720 |
C jam_exchKey = jam_exchKey+1 |
721 |
C ENDIF |
722 |
C IF ( farProc2 .NE. myProcId ) THEN |
723 |
C CALL JAM_EXCHANGE(farProc2,sendBuf2,recvBuf2,sNx*8,jam_exchKey) |
724 |
C jam_exchKey = jam_exchKey+1 |
725 |
C ENDIF |
726 |
#endif |
727 |
|
728 |
#ifdef USE_MPI_EXCH |
729 |
C Fill overlap regions from the buffers |
730 |
IF ( MOD(myProcId,2) .EQ. 0 ) THEN |
731 |
DO I=1,sNx |
732 |
arr(I,sNy+1) = exchBuf1(I) |
733 |
arr(I,0 ) = exchBuf2(I) |
734 |
ENDDO |
735 |
ELSE |
736 |
DO I=1,sNx |
737 |
arr(I,sNy+1) = exchBuf2(I) |
738 |
arr(I,0 ) = exchBuf1(I) |
739 |
ENDDO |
740 |
ENDIF |
741 |
#endif |
742 |
|
743 |
IF ( numberOfProcs .EQ. 1 ) THEN |
744 |
DO I=1,sNx |
745 |
arr(I,sNy+1) = arr(I,1 ) |
746 |
arr(I,0 ) = arr(I,sNy) |
747 |
ENDDO |
748 |
ENDIF |
749 |
|
750 |
RETURN |
751 |
END |
752 |
|
753 |
SUBROUTINE EXCH_XY_R4_JAM( arr ) |
754 |
|
755 |
IMPLICIT NONE |
756 |
|
757 |
C Full width. Single tile. No X-axis decomp. |
758 |
C exchange. |
759 |
|
760 |
C == Global variables == |
761 |
#include "SIZE.h" |
762 |
#include "EEPARAMS.h" |
763 |
#include "EESUPPORT.h" |
764 |
#include "EXCH_JAM.h" |
765 |
|
766 |
#include "MPI_INFO.h" |
767 |
#include "JAM_INFO.h" |
768 |
|
769 |
C == Routine arguments == |
770 |
REAL*4 arr(1-OLx:sNx+OLx,1-OLy:sNy+OLy) |
771 |
|
772 |
C == Local variables == |
773 |
INTEGER I, J |
774 |
INTEGER iLo, iHi, I0 |
775 |
INTEGER northProc, southProc |
776 |
INTEGER farProc1, farProc2 |
777 |
INTEGER toPid, fromPid |
778 |
INTEGER rc |
779 |
|
780 |
#ifdef ALLOW_MPI |
781 |
INTEGER mpiStatus(MPI_STATUS_SIZE) |
782 |
#endif |
783 |
|
784 |
C East-west halo update |
785 |
DO J=1-OLy,sNy+OLy |
786 |
DO I=1,OLx |
787 |
arr(1-I ,J) = arr(sNx-I+1,J) |
788 |
arr(sNx+I,J) = arr(1+I-1 ,J) |
789 |
ENDDO |
790 |
ENDDO |
791 |
|
792 |
C Phase 1 pairing |
793 |
C | 0 | ---> | 1 | |
794 |
C | 0 | <--- | 1 | |
795 |
|
796 |
C | 2 | ---> | 3 | |
797 |
C | 2 | <--- | 3 | |
798 |
|
799 |
C | 4 | ---> | 5 | |
800 |
C | 4 | <--- | 5 | |
801 |
|
802 |
C etc ... |
803 |
C |
804 |
|
805 |
#ifdef USE_MPI_EXCH |
806 |
C North-south halo update (including corners) |
807 |
C Put my edges into a buffers |
808 |
IF ( MOD(myProcId,2) .EQ. 0 ) THEN |
809 |
DO J=1,OLy |
810 |
iLo= 1-OLx |
811 |
iHi= sNx+OLx |
812 |
I0 = (J-1)*(iHi-iLo)+1 |
813 |
DO I=iLo,iHi |
814 |
exchBuf1(I0+I-iLo) = arr(I,sNy-OLy+J) |
815 |
exchBuf2(I0+I-iLo) = arr(I,1+J-1 ) |
816 |
ENDDO |
817 |
ENDDO |
818 |
ELSE |
819 |
DO J=1,OLy |
820 |
iLo= 1-OLx |
821 |
iHi= sNx+OLx |
822 |
I0 = (J-1)*(iHi-iLo)+1 |
823 |
DO I=iLo,iHi |
824 |
exchBuf1(I0+I-iLo) = arr(I,1+J-1 ) |
825 |
exchBuf2(I0+I-iLo) = arr(I,sNy-OLy+J) |
826 |
ENDDO |
827 |
ENDDO |
828 |
ENDIF |
829 |
|
830 |
C Exchange the buffers |
831 |
northProc = mpi_northId |
832 |
southProc = mpi_southId |
833 |
IF ( MOD(myProcId,2) .EQ. 0 ) THEN |
834 |
farProc1 = northProc |
835 |
farProc2 = southProc |
836 |
ELSE |
837 |
farProc1 = southProc |
838 |
farProc2 = northProc |
839 |
ENDIF |
840 |
|
841 |
C Even-odd pairs |
842 |
IF ( farProc1 .NE. myProcId ) THEN |
843 |
CALL MPI_Sendrecv_replace(exchBuf1,OLy*(sNx+2*OLx),MPI_REAL8, |
844 |
& farProc1,0, |
845 |
& farProc1,MPI_ANY_TAG, |
846 |
& MPI_COMM_WORLD,mpiStatus, |
847 |
& rc) |
848 |
ENDIF |
849 |
C Odd-even pairs |
850 |
IF ( farProc2 .NE. myProcId ) THEN |
851 |
CALL MPI_Sendrecv_replace(exchBuf2,OLy*(sNx+2*OLx),MPI_REAL8, |
852 |
& farProc2,0, |
853 |
& farProc2,MPI_ANY_TAG, |
854 |
& MPI_COMM_WORLD,mpiStatus, |
855 |
& rc) |
856 |
ENDIF |
857 |
|
858 |
C Fill overlap regions from the buffers |
859 |
IF ( MOD(myProcId,2) .EQ. 0 ) THEN |
860 |
DO J=1,OLy |
861 |
iLo= 1-OLx |
862 |
iHi= sNx+OLx |
863 |
I0 = (J-1)*(iHi-iLo)+1 |
864 |
DO I=iLo,iHi |
865 |
arr(I,sNy+J ) = exchBuf1(I0+I-iLo) |
866 |
arr(I,1-OLy+J-1) = exchBuf2(I0+I-iLo) |
867 |
ENDDO |
868 |
ENDDO |
869 |
ELSE |
870 |
DO J=1,OLy |
871 |
iLo= 1-OLx |
872 |
iHi= sNx+OLx |
873 |
I0 = (J-1)*(iHi-iLo)+1 |
874 |
DO I=iLo,iHi |
875 |
arr(I,sNy+J ) = exchBuf2(I0+I-iLo) |
876 |
arr(I,1-OLy+J-1 ) = exchBuf1(I0+I-iLo) |
877 |
ENDDO |
878 |
ENDDO |
879 |
ENDIF |
880 |
#endif |
881 |
|
882 |
#ifdef USE_JAM_EXCH |
883 |
northProc = jam_northId |
884 |
southProc = jam_southId |
885 |
IF ( MOD(myProcId,2) .EQ. 0 ) THEN |
886 |
C sendBuf1 = &arr(1-OLx,sNy-OLy+1) |
887 |
C recvBuf1 = &arr(1-OLx,sNy+1 ) |
888 |
C sendBuf2 = &arr(1-OLx,1 ) |
889 |
C recvBuf2 = &arr(1-OLx,1-OLy ) |
890 |
farProc1 = northProc |
891 |
farProc2 = southProc |
892 |
IF ( farProc1 .NE. myProcId ) THEN |
893 |
CALL JAM_EXCHANGE(farProc1, |
894 |
& arr(1-OLx,sNy-OLy+1), |
895 |
& arr(1-OLx,sNy+1 ), |
896 |
& OLy*(sNx+2*OLx)*4, |
897 |
& jam_exchKey) |
898 |
jam_exchKey = jam_exchKey+1 |
899 |
ENDIF |
900 |
IF ( farProc2 .NE. myProcId ) THEN |
901 |
CALL JAM_EXCHANGE(farProc2, |
902 |
& arr(1-OLx,1 ), |
903 |
& arr(1-OLx,1-OLy ), |
904 |
& OLy*(sNx+2*OLx)*4, |
905 |
& jam_exchKey) |
906 |
jam_exchKey = jam_exchKey+1 |
907 |
ENDIF |
908 |
ELSE |
909 |
C sendBuf1 = &arr(1-OLx,1 ) |
910 |
C recvBuf1 = &arr(1-OLx,1-OLy ) |
911 |
C sendBuf2 = &arr(1-OLx,sNy-OLy+1) |
912 |
C recvBuf2 = &arr(1-OLx,sNy+1 ) |
913 |
farProc1 = southProc |
914 |
farProc2 = northProc |
915 |
IF ( farProc1 .NE. myProcId ) THEN |
916 |
CALL JAM_EXCHANGE(farProc1, |
917 |
& arr(1-OLx,1 ), |
918 |
& arr(1-OLx,1-OLy ), |
919 |
& OLy*(sNx+2*OLx)*4, |
920 |
& jam_exchKey) |
921 |
jam_exchKey = jam_exchKey+1 |
922 |
ENDIF |
923 |
IF ( farProc2 .NE. myProcId ) THEN |
924 |
CALL JAM_EXCHANGE(farProc2, |
925 |
& arr(1-OLx,sNy-OLy+1), |
926 |
& arr(1-OLx,sNy+1 ), |
927 |
& OLy*(sNx+2*OLx)*4, |
928 |
& jam_exchKey) |
929 |
jam_exchKey = jam_exchKey+1 |
930 |
ENDIF |
931 |
ENDIF |
932 |
#endif |
933 |
|
934 |
IF ( numberOfProcs .EQ. 1 ) THEN |
935 |
DO J=1,OLy |
936 |
iLo= 1-OLx |
937 |
iHi= sNx+OLx |
938 |
DO I=iLo,iHi |
939 |
arr(I,sNy+J ) = arr(I,1+J-1 ) |
940 |
arr(I,1-OLy+J-1) = arr(I,sNy-OLy+J) |
941 |
ENDDO |
942 |
ENDDO |
943 |
ENDIF |
944 |
|
945 |
RETURN |
946 |
END |
947 |
SUBROUTINE EXCH_XYZ_R4_JAM( arr ) |
948 |
IMPLICIT NONE |
949 |
|
950 |
C Full width, 3d. Single tile. No X-axis decomp. |
951 |
C exchange. |
952 |
|
953 |
C == Global variables == |
954 |
#include "SIZE.h" |
955 |
#include "EEPARAMS.h" |
956 |
#include "EESUPPORT.h" |
957 |
#include "EXCH_JAM.h" |
958 |
|
959 |
#include "MPI_INFO.h" |
960 |
#include "JAM_INFO.h" |
961 |
|
962 |
C == Routine arguments == |
963 |
REAL*4 arr(1-OLx:sNx+OLx,1-OLy:sNy+OLy,1:Nr) |
964 |
|
965 |
C == Local variables == |
966 |
INTEGER I, J, K |
967 |
INTEGER iLo, iHi, I0 |
968 |
INTEGER northProc, southProc |
969 |
INTEGER farProc1, farProc2 |
970 |
INTEGER toPid, fromPid |
971 |
INTEGER rc |
972 |
|
973 |
#ifdef ALLOW_MPI |
974 |
INTEGER mpiStatus(MPI_STATUS_SIZE) |
975 |
#endif |
976 |
|
977 |
C East-west halo update |
978 |
DO K=1,Nr |
979 |
DO J=1-OLy,sNy+OLy |
980 |
DO I=1,OLx |
981 |
arr(1-I ,J,K) = arr(sNx-I+1,J,K) |
982 |
arr(sNx+I,J,K) = arr(1+I-1 ,J,K) |
983 |
ENDDO |
984 |
ENDDO |
985 |
ENDDO |
986 |
|
987 |
C Phase 1 pairing |
988 |
C | 0 | ---> | 1 | |
989 |
C | 0 | <--- | 1 | |
990 |
|
991 |
C | 2 | ---> | 3 | |
992 |
C | 2 | <--- | 3 | |
993 |
|
994 |
C | 4 | ---> | 5 | |
995 |
C | 4 | <--- | 5 | |
996 |
|
997 |
C etc ... |
998 |
C |
999 |
|
1000 |
#ifdef USE_MPI_EXCH |
1001 |
C North-south halo update (including corners) |
1002 |
DO K=1,Nr |
1003 |
C Put my edges into a buffers |
1004 |
IF ( MOD(myProcId,2) .EQ. 0 ) THEN |
1005 |
DO J=1,OLy |
1006 |
iLo= 1-OLx |
1007 |
iHi= sNx+OLx |
1008 |
I0 = (J-1)*(iHi-iLo)+1 |
1009 |
DO I=iLo,iHi |
1010 |
exchBuf1(I0+I-iLo) = arr(I,sNy-OLy+J,K) |
1011 |
exchBuf2(I0+I-iLo) = arr(I,1+J-1 ,K) |
1012 |
ENDDO |
1013 |
ENDDO |
1014 |
ELSE |
1015 |
DO J=1,OLy |
1016 |
iLo= 1-OLx |
1017 |
iHi= sNx+OLx |
1018 |
I0 = (J-1)*(iHi-iLo)+1 |
1019 |
DO I=iLo,iHi |
1020 |
exchBuf1(I0+I-iLo) = arr(I,1+J-1 ,K) |
1021 |
exchBuf2(I0+I-iLo) = arr(I,sNy-OLy+J,K) |
1022 |
ENDDO |
1023 |
ENDDO |
1024 |
ENDIF |
1025 |
|
1026 |
C Exchange the buffers |
1027 |
northProc = mpi_northId |
1028 |
southProc = mpi_southId |
1029 |
IF ( MOD(myProcId,2) .EQ. 0 ) THEN |
1030 |
farProc1 = northProc |
1031 |
farProc2 = southProc |
1032 |
ELSE |
1033 |
farProc1 = southProc |
1034 |
farProc2 = northProc |
1035 |
ENDIF |
1036 |
C Even-odd pairs |
1037 |
IF ( farProc1 .NE. myProcId ) THEN |
1038 |
CALL MPI_Sendrecv_replace(exchBuf1,OLy*(sNx+2*OLx),MPI_REAL8, |
1039 |
& farProc1,0, |
1040 |
& farProc1,MPI_ANY_TAG, |
1041 |
& MPI_COMM_WORLD,mpiStatus, |
1042 |
& rc) |
1043 |
ENDIF |
1044 |
C Odd-even pairs |
1045 |
IF ( farProc2 .NE. myProcId ) THEN |
1046 |
CALL MPI_Sendrecv_replace(exchBuf2,OLy*(sNx+2*OLx),MPI_REAL8, |
1047 |
& farProc2,0, |
1048 |
& farProc2,MPI_ANY_TAG, |
1049 |
& MPI_COMM_WORLD,mpiStatus, |
1050 |
& rc) |
1051 |
ENDIF |
1052 |
|
1053 |
C Fill overlap regions from the buffers |
1054 |
IF ( MOD(myProcId,2) .EQ. 0 ) THEN |
1055 |
DO J=1,OLy |
1056 |
iLo= 1-OLx |
1057 |
iHi= sNx+OLx |
1058 |
I0 = (J-1)*(iHi-iLo)+1 |
1059 |
DO I=iLo,iHi |
1060 |
arr(I,sNy+J ,K) = exchBuf1(I0+I-iLo) |
1061 |
arr(I,1-OLy+J-1,K) = exchBuf2(I0+I-iLo) |
1062 |
ENDDO |
1063 |
ENDDO |
1064 |
ELSE |
1065 |
DO J=1,OLy |
1066 |
iLo= 1-OLx |
1067 |
iHi= sNx+OLx |
1068 |
I0 = (J-1)*(iHi-iLo)+1 |
1069 |
DO I=iLo,iHi |
1070 |
arr(I,sNy+J ,K) = exchBuf2(I0+I-iLo) |
1071 |
arr(I,1-OLy+J-1 ,K) = exchBuf1(I0+I-iLo) |
1072 |
ENDDO |
1073 |
ENDDO |
1074 |
ENDIF |
1075 |
ENDDO |
1076 |
#endif |
1077 |
|
1078 |
#ifdef USE_JAM_EXCH |
1079 |
northProc = jam_northId |
1080 |
southProc = jam_southId |
1081 |
DO K=1,Nr |
1082 |
IF ( MOD(myProcId,2) .EQ. 0 ) THEN |
1083 |
C sendBuf1 = &arr(1-OLx,sNy-OLy+1) |
1084 |
C recvBuf1 = &arr(1-OLx,sNy+1 ) |
1085 |
C sendBuf2 = &arr(1-OLx,1 ) |
1086 |
C recvBuf2 = &arr(1-OLx,1-OLy ) |
1087 |
farProc1 = northProc |
1088 |
farProc2 = southProc |
1089 |
IF ( farProc1 .NE. myProcId ) THEN |
1090 |
CALL JAM_EXCHANGE(farProc1, |
1091 |
& arr(1-OLx,sNy-OLy+1,K), |
1092 |
& arr(1-OLx,sNy+1 ,K), |
1093 |
& OLy*(sNx+2*OLx)*4, |
1094 |
& jam_exchKey) |
1095 |
jam_exchKey = jam_exchKey+1 |
1096 |
ENDIF |
1097 |
IF ( farProc2 .NE. myProcId ) THEN |
1098 |
CALL JAM_EXCHANGE(farProc2, |
1099 |
& arr(1-OLx,1 ,K), |
1100 |
& arr(1-OLx,1-OLy ,K), |
1101 |
& OLy*(sNx+2*OLx)*4, |
1102 |
& jam_exchKey) |
1103 |
jam_exchKey = jam_exchKey+1 |
1104 |
ENDIF |
1105 |
ELSE |
1106 |
C sendBuf1 = &arr(1-OLx,1 ) |
1107 |
C recvBuf1 = &arr(1-OLx,1-OLy ) |
1108 |
C sendBuf2 = &arr(1-OLx,sNy-OLy+1) |
1109 |
C recvBuf2 = &arr(1-OLx,sNy+1 ) |
1110 |
farProc1 = southProc |
1111 |
farProc2 = northProc |
1112 |
IF ( farProc1 .NE. myProcId ) THEN |
1113 |
CALL JAM_EXCHANGE(farProc1, |
1114 |
& arr(1-OLx,1 ,K), |
1115 |
& arr(1-OLx,1-OLy ,K), |
1116 |
& OLy*(sNx+2*OLx)*4, |
1117 |
& jam_exchKey) |
1118 |
jam_exchKey = jam_exchKey+1 |
1119 |
ENDIF |
1120 |
IF ( farProc2 .NE. myProcId ) THEN |
1121 |
CALL JAM_EXCHANGE(farProc2, |
1122 |
& arr(1-OLx,sNy-OLy+1,K), |
1123 |
& arr(1-OLx,sNy+1 ,K), |
1124 |
& OLy*(sNx+2*OLx)*4, |
1125 |
& jam_exchKey) |
1126 |
jam_exchKey = jam_exchKey+1 |
1127 |
ENDIF |
1128 |
ENDIF |
1129 |
ENDDO |
1130 |
#endif |
1131 |
|
1132 |
IF ( numberOfProcs .EQ. 1 ) THEN |
1133 |
DO K=1,Nr |
1134 |
DO J=1,OLy |
1135 |
iLo= 1-OLx |
1136 |
iHi= sNx+OLx |
1137 |
DO I=iLo,iHi |
1138 |
arr(I,sNy+J ,K) = arr(I,1+J-1 ,K) |
1139 |
arr(I,1-OLy+J-1,K) = arr(I,sNy-OLy+J,K) |
1140 |
ENDDO |
1141 |
ENDDO |
1142 |
ENDDO |
1143 |
ENDIF |
1144 |
|
1145 |
#endif /* LETS_MAKE_JAM */ |
1146 |
|
1147 |
RETURN |
1148 |
END |
1149 |
|
1150 |
#endif /* JAM_WITH_TWO_PROCS_PER_NODE */ |
1151 |
#ifdef JAM_WITH_TWO_PROCS_PER_NODE |
1152 |
C Dual processor JAM stuff |
1153 |
|
1154 |
#undef USE_MPI_EXCH |
1155 |
#define USE_JAM_EXCH |
1156 |
|
1157 |
SUBROUTINE EXCH_XY_O1_R8_JAM( arr ) |
1158 |
|
1159 |
IMPLICIT NONE |
1160 |
C Width 1. Single tile. No X-axis decomp. |
1161 |
C No. corner update. Exchange. |
1162 |
|
1163 |
#define ALLOW_MPI |
1164 |
#define _OLx 1 |
1165 |
#define _OLy 1 |
1166 |
|
1167 |
C == Global variables == |
1168 |
#include "SIZE.h" |
1169 |
#include "EEPARAMS.h" |
1170 |
#include "EXCH_JAM.h" |
1171 |
|
1172 |
#include "MPI_INFO.h" |
1173 |
#include "JAM_INFO.h" |
1174 |
|
1175 |
C == Compile time constants == |
1176 |
|
1177 |
C == Routine arguments == |
1178 |
Real*8 arr(1-_OLx:sNx+_OLx,1-_OLy:sNy+_OLy) |
1179 |
|
1180 |
C == Local variables == |
1181 |
INTEGER I, J |
1182 |
INTEGER northProc, southProc |
1183 |
INTEGER farProc1, farProc2 |
1184 |
INTEGER toPid, fromPid |
1185 |
INTEGER rc |
1186 |
INTEGER myFourWayRank |
1187 |
INTEGER exchangePhase |
1188 |
|
1189 |
C East-west halo update (without corners) |
1190 |
DO J=1,sNy |
1191 |
DO I=1,_OLx |
1192 |
arr(1-I ,J) = arr(sNx-I+1,J) |
1193 |
arr(sNx+I,J) = arr(1+I-1 ,J) |
1194 |
ENDDO |
1195 |
ENDDO |
1196 |
|
1197 |
C Phase 1 pairing |
1198 |
C | 0 | ---> | 1 | |
1199 |
C | 0 | <--- | 1 | |
1200 |
|
1201 |
C | 2 | ---> | 3 | |
1202 |
C | 2 | <--- | 3 | |
1203 |
|
1204 |
C | 4 | ---> | 5 | |
1205 |
C | 4 | <--- | 5 | |
1206 |
|
1207 |
C etc ... |
1208 |
C |
1209 |
|
1210 |
#ifdef USE_JAM_EXCH |
1211 |
northProc = jam_northId |
1212 |
southProc = jam_southId |
1213 |
myFourWayRank = MOD(myProcId,4) |
1214 |
|
1215 |
IF ( MOD(myProcId,2) .EQ. 0 ) THEN |
1216 |
farProc1 = northProc |
1217 |
farProc2 = southProc |
1218 |
IF ( farProc1 .NE. myProcId ) THEN |
1219 |
CALL JAM_EXCHANGE(farProc1,arr(1,sNy),arr(1,sNy+1),sNx*8,jam_exchKey) |
1220 |
jam_exchKey = jam_exchKey+1 |
1221 |
ENDIF |
1222 |
10 CONTINUE |
1223 |
CALL JAM_EXCHANGE_TEST( exchangePhase ) |
1224 |
IF ( myFourWayRank .EQ. 0 ) THEN |
1225 |
IF ( exchangePhase .EQ. 0 ) GOTO 11 |
1226 |
ELSE |
1227 |
IF ( exchangePhase .EQ. 1 ) GOTO 11 |
1228 |
ENDIF |
1229 |
GOTO 10 |
1230 |
11 CONTINUE |
1231 |
IF ( farProc2 .NE. myProcId ) THEN |
1232 |
CALL JAM_EXCHANGE(farProc2,arr(1,1),arr(1,0),sNx*8,jam_exchKey) |
1233 |
jam_exchKey = jam_exchKey+1 |
1234 |
ENDIF |
1235 |
CALL JAM_EXCHANGE_MARK |
1236 |
ELSE |
1237 |
farProc1 = southProc |
1238 |
farProc2 = northProc |
1239 |
IF ( farProc1 .NE. myProcId ) THEN |
1240 |
CALL JAM_EXCHANGE(farProc1,arr(1,1),arr(1,0),sNx*8,jam_exchKey) |
1241 |
jam_exchKey = jam_exchKey+1 |
1242 |
ENDIF |
1243 |
20 CONTINUE |
1244 |
CALL JAM_EXCHANGE_TEST( exchangePhase ) |
1245 |
IF ( myFourWayRank .EQ. 3 ) THEN |
1246 |
IF ( exchangePhase .EQ. 0 ) GOTO 21 |
1247 |
ELSE |
1248 |
IF ( exchangePhase .EQ. 1 ) GOTO 21 |
1249 |
ENDIF |
1250 |
GOTO 20 |
1251 |
21 CONTINUE |
1252 |
IF ( farProc2 .NE. myProcId ) THEN |
1253 |
CALL JAM_EXCHANGE(farProc2,arr(1,sNy),arr(1,sNy+1),sNx*8,jam_exchKey) |
1254 |
jam_exchKey = jam_exchKey+1 |
1255 |
ENDIF |
1256 |
CALL JAM_EXCHANGE_MARK |
1257 |
ENDIF |
1258 |
#endif |
1259 |
|
1260 |
RETURN |
1261 |
END |
1262 |
|
1263 |
SUBROUTINE EXCH_XY_R8_JAM( arr ) |
1264 |
|
1265 |
IMPLICIT NONE |
1266 |
|
1267 |
C Full width. Single tile. No X-axis decomp. |
1268 |
C exchange. |
1269 |
|
1270 |
C == Global variables == |
1271 |
#include "SIZE.h" |
1272 |
#include "EEPARAMS.h" |
1273 |
#include "EESUPPORT.h" |
1274 |
#include "EXCH_JAM.h" |
1275 |
|
1276 |
#include "MPI_INFO.h" |
1277 |
#include "JAM_INFO.h" |
1278 |
|
1279 |
C == Routine arguments == |
1280 |
Real*8 arr(1-OLx:sNx+OLx,1-OLy:sNy+OLy) |
1281 |
|
1282 |
C == Local variables == |
1283 |
INTEGER I, J |
1284 |
INTEGER iLo, iHi, I0 |
1285 |
INTEGER northProc, southProc |
1286 |
INTEGER farProc1, farProc2 |
1287 |
INTEGER toPid, fromPid |
1288 |
INTEGER rc |
1289 |
INTEGER myFourWayRank, exchangePhase |
1290 |
|
1291 |
#ifdef ALLOW_MPI |
1292 |
INTEGER mpiStatus(MPI_STATUS_SIZE) |
1293 |
#endif |
1294 |
|
1295 |
C East-west halo update |
1296 |
DO J=1-OLy,sNy+OLy |
1297 |
DO I=1,OLx |
1298 |
arr(1-I ,J) = arr(sNx-I+1,J) |
1299 |
arr(sNx+I,J) = arr(1+I-1 ,J) |
1300 |
ENDDO |
1301 |
ENDDO |
1302 |
|
1303 |
C Phase 1 pairing |
1304 |
C | 0 | ---> | 1 | |
1305 |
C | 0 | <--- | 1 | |
1306 |
|
1307 |
C | 2 | ---> | 3 | |
1308 |
C | 2 | <--- | 3 | |
1309 |
|
1310 |
C | 4 | ---> | 5 | |
1311 |
C | 4 | <--- | 5 | |
1312 |
|
1313 |
C etc ... |
1314 |
C |
1315 |
|
1316 |
#ifdef USE_JAM_EXCH |
1317 |
northProc = jam_northId |
1318 |
southProc = jam_southId |
1319 |
myFourWayRank = MOD(myProcId,4) |
1320 |
|
1321 |
IF ( MOD(myProcId,2) .EQ. 0 ) THEN |
1322 |
C sendBuf1 = &arr(1-OLx,sNy-OLy+1) |
1323 |
C recvBuf1 = &arr(1-OLx,sNy+1 ) |
1324 |
C sendBuf2 = &arr(1-OLx,1 ) |
1325 |
C recvBuf2 = &arr(1-OLx,1-OLy ) |
1326 |
farProc1 = northProc |
1327 |
farProc2 = southProc |
1328 |
IF ( farProc1 .NE. myProcId ) THEN |
1329 |
CALL JAM_EXCHANGE(farProc1, |
1330 |
& arr(1-OLx,sNy-OLy+1), |
1331 |
& arr(1-OLx,sNy+1 ), |
1332 |
& OLy*(sNx+2*OLx)*8, |
1333 |
& jam_exchKey) |
1334 |
jam_exchKey = jam_exchKey+1 |
1335 |
ENDIF |
1336 |
10 CONTINUE |
1337 |
CALL JAM_EXCHANGE_TEST( exchangePhase ) |
1338 |
IF ( myFourWayRank .EQ. 0 ) THEN |
1339 |
IF ( exchangePhase .EQ. 0 ) GOTO 11 |
1340 |
ELSE |
1341 |
IF ( exchangePhase .EQ. 1 ) GOTO 11 |
1342 |
ENDIF |
1343 |
GOTO 10 |
1344 |
11 CONTINUE |
1345 |
IF ( farProc2 .NE. myProcId ) THEN |
1346 |
CALL JAM_EXCHANGE(farProc2, |
1347 |
& arr(1-OLx,1 ), |
1348 |
& arr(1-OLx,1-OLy ), |
1349 |
& OLy*(sNx+2*OLx)*8, |
1350 |
& jam_exchKey) |
1351 |
jam_exchKey = jam_exchKey+1 |
1352 |
ENDIF |
1353 |
CALL JAM_EXCHANGE_MARK |
1354 |
ELSE |
1355 |
C sendBuf1 = &arr(1-OLx,1 ) |
1356 |
C recvBuf1 = &arr(1-OLx,1-OLy ) |
1357 |
C sendBuf2 = &arr(1-OLx,sNy-OLy+1) |
1358 |
C recvBuf2 = &arr(1-OLx,sNy+1 ) |
1359 |
farProc1 = southProc |
1360 |
farProc2 = northProc |
1361 |
IF ( farProc1 .NE. myProcId ) THEN |
1362 |
CALL JAM_EXCHANGE(farProc1, |
1363 |
& arr(1-OLx,1 ), |
1364 |
& arr(1-OLx,1-OLy ), |
1365 |
& OLy*(sNx+2*OLx)*8, |
1366 |
& jam_exchKey) |
1367 |
jam_exchKey = jam_exchKey+1 |
1368 |
ENDIF |
1369 |
20 CONTINUE |
1370 |
CALL JAM_EXCHANGE_TEST( exchangePhase ) |
1371 |
IF ( myFourWayRank .EQ. 3 ) THEN |
1372 |
IF ( exchangePhase .EQ. 0 ) GOTO 21 |
1373 |
ELSE |
1374 |
IF ( exchangePhase .EQ. 1 ) GOTO 21 |
1375 |
ENDIF |
1376 |
GOTO 20 |
1377 |
21 CONTINUE |
1378 |
IF ( farProc2 .NE. myProcId ) THEN |
1379 |
CALL JAM_EXCHANGE(farProc2, |
1380 |
& arr(1-OLx,sNy-OLy+1), |
1381 |
& arr(1-OLx,sNy+1 ), |
1382 |
& OLy*(sNx+2*OLx)*8, |
1383 |
& jam_exchKey) |
1384 |
jam_exchKey = jam_exchKey+1 |
1385 |
ENDIF |
1386 |
CALL JAM_EXCHANGE_MARK |
1387 |
ENDIF |
1388 |
#endif |
1389 |
|
1390 |
RETURN |
1391 |
END |
1392 |
SUBROUTINE EXCH_XYZ_R8_JAM( arr ) |
1393 |
IMPLICIT NONE |
1394 |
|
1395 |
C Full width, 3d. Single tile. No X-axis decomp. |
1396 |
C exchange. |
1397 |
|
1398 |
C == Global variables == |
1399 |
#include "SIZE.h" |
1400 |
#include "EEPARAMS.h" |
1401 |
#include "EESUPPORT.h" |
1402 |
#include "EXCH_JAM.h" |
1403 |
|
1404 |
#include "MPI_INFO.h" |
1405 |
#include "JAM_INFO.h" |
1406 |
|
1407 |
C == Routine arguments == |
1408 |
INTEGER myThid |
1409 |
Real*8 arr(1-OLx:sNx+OLx,1-OLy:sNy+OLy,1:Nr) |
1410 |
|
1411 |
C == Local variables == |
1412 |
INTEGER I, J, K |
1413 |
INTEGER iLo, iHi, I0 |
1414 |
INTEGER northProc, southProc |
1415 |
INTEGER farProc1, farProc2 |
1416 |
INTEGER toPid, fromPid |
1417 |
INTEGER rc |
1418 |
INTEGER myFourWayRank, exchangePhase |
1419 |
|
1420 |
#ifdef ALLOW_MPI |
1421 |
INTEGER mpiStatus(MPI_STATUS_SIZE) |
1422 |
#endif |
1423 |
|
1424 |
C East-west halo update |
1425 |
DO K=1,Nr |
1426 |
DO J=1-OLy,sNy+OLy |
1427 |
DO I=1,OLx |
1428 |
arr(1-I ,J,K) = arr(sNx-I+1,J,K) |
1429 |
arr(sNx+I,J,K) = arr(1+I-1 ,J,K) |
1430 |
ENDDO |
1431 |
ENDDO |
1432 |
ENDDO |
1433 |
|
1434 |
CcnhDebugStarts |
1435 |
C RETURN |
1436 |
CcnhDebugEnds |
1437 |
|
1438 |
C Phase 1 pairing |
1439 |
C | 0 | ---> | 1 | |
1440 |
C | 0 | <--- | 1 | |
1441 |
|
1442 |
C | 2 | ---> | 3 | |
1443 |
C | 2 | <--- | 3 | |
1444 |
|
1445 |
C | 4 | ---> | 5 | |
1446 |
C | 4 | <--- | 5 | |
1447 |
|
1448 |
C etc ... |
1449 |
C |
1450 |
|
1451 |
|
1452 |
#ifdef USE_JAM_EXCH |
1453 |
northProc = jam_northId |
1454 |
southProc = jam_southId |
1455 |
myFourWayRank = MOD(myProcId,4) |
1456 |
|
1457 |
DO K=1,Nr |
1458 |
IF ( MOD(myProcId,2) .EQ. 0 ) THEN |
1459 |
C sendBuf1 = &arr(1-OLx,sNy-OLy+1) |
1460 |
C recvBuf1 = &arr(1-OLx,sNy+1 ) |
1461 |
C sendBuf2 = &arr(1-OLx,1 ) |
1462 |
C recvBuf2 = &arr(1-OLx,1-OLy ) |
1463 |
farProc1 = northProc |
1464 |
farProc2 = southProc |
1465 |
IF ( farProc1 .NE. myProcId ) THEN |
1466 |
CALL JAM_EXCHANGE(farProc1, |
1467 |
& arr(1-OLx,sNy-OLy+1,K), |
1468 |
& arr(1-OLx,sNy+1 ,K), |
1469 |
& OLy*(sNx+2*OLx)*8, |
1470 |
& jam_exchKey) |
1471 |
jam_exchKey = jam_exchKey+1 |
1472 |
ENDIF |
1473 |
10 CONTINUE |
1474 |
CALL JAM_EXCHANGE_TEST( exchangePhase ) |
1475 |
IF ( myFourWayRank .EQ. 0 ) THEN |
1476 |
IF ( exchangePhase .EQ. 0 ) GOTO 11 |
1477 |
ELSE |
1478 |
IF ( exchangePhase .EQ. 1 ) GOTO 11 |
1479 |
ENDIF |
1480 |
GOTO 10 |
1481 |
11 CONTINUE |
1482 |
IF ( farProc2 .NE. myProcId ) THEN |
1483 |
CALL JAM_EXCHANGE(farProc2, |
1484 |
& arr(1-OLx,1 ,K), |
1485 |
& arr(1-OLx,1-OLy ,K), |
1486 |
& OLy*(sNx+2*OLx)*8, |
1487 |
& jam_exchKey) |
1488 |
jam_exchKey = jam_exchKey+1 |
1489 |
ENDIF |
1490 |
CALL JAM_EXCHANGE_MARK |
1491 |
ELSE |
1492 |
C sendBuf1 = &arr(1-OLx,1 ) |
1493 |
C recvBuf1 = &arr(1-OLx,1-OLy ) |
1494 |
C sendBuf2 = &arr(1-OLx,sNy-OLy+1) |
1495 |
C recvBuf2 = &arr(1-OLx,sNy+1 ) |
1496 |
farProc1 = southProc |
1497 |
farProc2 = northProc |
1498 |
IF ( farProc1 .NE. myProcId ) THEN |
1499 |
CALL JAM_EXCHANGE(farProc1, |
1500 |
& arr(1-OLx,1 ,K), |
1501 |
& arr(1-OLx,1-OLy ,K), |
1502 |
& OLy*(sNx+2*OLx)*8, |
1503 |
& jam_exchKey) |
1504 |
jam_exchKey = jam_exchKey+1 |
1505 |
ENDIF |
1506 |
20 CONTINUE |
1507 |
CALL JAM_EXCHANGE_TEST( exchangePhase ) |
1508 |
IF ( myFourWayRank .EQ. 3 ) THEN |
1509 |
IF ( exchangePhase .EQ. 0 ) GOTO 21 |
1510 |
ELSE |
1511 |
IF ( exchangePhase .EQ. 1 ) GOTO 21 |
1512 |
ENDIF |
1513 |
GOTO 20 |
1514 |
21 CONTINUE |
1515 |
IF ( farProc2 .NE. myProcId ) THEN |
1516 |
CALL JAM_EXCHANGE(farProc2, |
1517 |
& arr(1-OLx,sNy-OLy+1,K), |
1518 |
& arr(1-OLx,sNy+1 ,K), |
1519 |
& OLy*(sNx+2*OLx)*8, |
1520 |
& jam_exchKey) |
1521 |
jam_exchKey = jam_exchKey+1 |
1522 |
ENDIF |
1523 |
CALL JAM_EXCHANGE_MARK |
1524 |
ENDIF |
1525 |
ENDDO |
1526 |
#endif |
1527 |
|
1528 |
RETURN |
1529 |
END |
1530 |
|
1531 |
#endif /* JAM_WITH_TWO_PROCS_PER_NODE */ |