forked from altMITgcm/MITgcm
-
Notifications
You must be signed in to change notification settings - Fork 0
/
gather_2d_rx.template
243 lines (207 loc) · 6.38 KB
/
gather_2d_rx.template
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
C $Header: /u/gcmpack/MITgcm/eesupp/src/gather_2d_rx.template,v 1.7 2012/09/03 19:36:29 jmc Exp $
C $Name: $
#include "PACKAGES_CONFIG.h"
#include "CPP_EEOPTIONS.h"
CBOP
C     !ROUTINE: GATHER_2D_RX
C     !INTERFACE:
      SUBROUTINE GATHER_2D_RX(
     O                  gloBuff,
     I                  myField,
     I                  xSize, ySize,
     I                  useExch2GlobLayOut,
     I                  zeroBuff,
     I                  myThid )

C     !DESCRIPTION:
C     Gather the elements of a global 2-D array from all MPI
C     processes onto process 0.  Process 0 first copies its own
C     tiles into the global buffer; when MPI is in use it then polls
C     every other process in turn, receives the local array of that
C     process and copies it to its place in the global buffer.
C     gloBuff is only written on process 0.
C     Note: done by the Master-Thread; barrier calls might be needed
C           before and after calling this S/R.

C     !USES:
      IMPLICIT NONE
#include "SIZE.h"
#include "EEPARAMS.h"
#include "EESUPPORT.h"
#ifdef ALLOW_EXCH2
#include "W2_EXCH2_SIZE.h"
#include "W2_EXCH2_TOPOLOGY.h"
#endif /* ALLOW_EXCH2 */

C     !INPUT/OUTPUT PARAMETERS:
C     gloBuff   ( _RX )  :: full-domain 2D IO-buffer array (Output)
C     myField   ( _RX )  :: tiled, local (i.e. my Proc. tiles)
C                           2D array (Input)
C     xSize    (integer) :: global buffer first  dimension (x)
C     ySize    (integer) :: global buffer second dimension (y)
C     useExch2GlobLayOut :: =T: use Exch2 global-map layout
C                           (only with EXCH2)
C     zeroBuff (logical) :: =T: reset the buffer to zero before the
C                           copy; only acted upon when the Exch2
C                           global-map layout is used
C     myThid   (integer) :: my Thread Id number
      INTEGER xSize, ySize
      _RX     gloBuff(xSize,ySize)
      _RX     myField(1:sNx,1:sNy,nSx,nSy)
      LOGICAL useExch2GlobLayOut
      LOGICAL zeroBuff
      INTEGER myThid
CEOP

C     !LOCAL VARIABLES:
C     i, j         :: loop indices (within a tile, or over the buffer)
C     bi, bj       :: tile loop indices
C     iG, jG       :: global-buffer position of a tile row: local row
C                     j goes to gloBuff(iG+1:iG+sNx,jG)
C     iBase, jBase :: global-buffer offsets of a process
C                     (standard layout)
C     iGjLoc       :: shift of iG per local row j (Exch2 layout)
C     jGjLoc       :: shift of jG per local row j (Exch2 layout)
C     tN           :: tile number taken from the Exch2 tile lists
C     np           :: process number, counted from 1
C     pId          :: MPI rank of process np (= np-1)
C     temp         :: receive buffer, same shape as myField
C     istatus      :: MPI receive status
C     ierr         :: MPI return code (not checked)
C     lbuff        :: number of elements in one local array
C     idest        :: rank that collects the data (= 0)
C     itag         :: MPI message tag (= 0)
C     ready_to_receive :: content of the polling message
      INTEGER i, j, bi, bj
      INTEGER iG, jG
      INTEGER iBase, jBase
#ifdef ALLOW_EXCH2
      INTEGER iGjLoc, jGjLoc
      INTEGER tN
#endif /* ALLOW_EXCH2 */
#ifdef ALLOW_USE_MPI
      INTEGER np, pId
      _RX     temp(1:sNx,1:sNy,nSx,nSy)
      INTEGER istatus(MPI_STATUS_SIZE), ierr
      INTEGER lbuff, idest, itag, ready_to_receive
#endif /* ALLOW_USE_MPI */

      _BEGIN_MASTER( myThid )

C--   Part 1: process 0 fills-in its own local data
      IF ( myProcId .EQ. 0 ) THEN

#ifdef ALLOW_EXCH2
        IF ( useExch2GlobLayOut ) THEN
C-    Exch2 global-map layout.
C     If using blank-tiles, the buffer will not be completely filled;
C     safer to reset to zero to avoid unknown values in output file
          IF ( zeroBuff ) THEN
            DO j=1,ySize
              DO i=1,xSize
                gloBuff(i,j) = 0.
              ENDDO
            ENDDO
          ENDIF

          DO bj=1,nSy
            DO bi=1,nSx
              tN = W2_myTileList(bi,bj)
C-    default (face fits into the global-IO-array): one local row
C     maps to one buffer row
              iGjLoc = 0
              jGjLoc = 1
              IF ( exch2_mydNx(tN) .GT. xSize ) THEN
C-    face x-size larger than glob-size : fold it
                jGjLoc = exch2_mydNx(tN) / xSize
              ELSEIF ( exch2_tNy(tN) .GT. ySize ) THEN
C-    tile y-size larger than glob-size : make a long line
                iGjLoc = exch2_mydNx(tN)
                jGjLoc = 0
              ENDIF

              DO j=1,sNy
#ifdef TARGET_NEC_SX
!cdir novector
#endif
                iG = exch2_txGlobalo(tN) - 1 + iGjLoc*(j-1)
                jG = exch2_tyGlobalo(tN) + jGjLoc*(j-1)
                DO i=1,sNx
                  gloBuff(iG+i,jG) = myField(i,j,bi,bj)
                ENDDO
              ENDDO
            ENDDO
          ENDDO

        ELSE
#endif /* ALLOW_EXCH2 */
C-    Standard layout (the only one available without EXCH2):
C     tiles are placed according to the global offsets of this
C     process
          iBase = myXGlobalLo-1
          jBase = myYGlobalLo-1

          DO bj=1,nSy
            DO bi=1,nSx
              DO j=1,sNy
#ifdef TARGET_NEC_SX
!cdir novector
#endif
                iG = iBase + sNx*(bi-1)
                jG = jBase + sNy*(bj-1) + j
                DO i=1,sNx
                  gloBuff(iG+i,jG) = myField(i,j,bi,bj)
                ENDDO
              ENDDO
            ENDDO
          ENDDO

#ifdef ALLOW_EXCH2
C-    end if-else useExch2GlobLayOut
        ENDIF
#endif /* ALLOW_EXCH2 */

C-    end if myProcId = 0
      ENDIF

#ifdef ALLOW_USE_MPI
C--   Part 2: collect the local arrays of all other processes
      IF ( usingMPI ) THEN

        idest = 0
        itag  = 0
        ready_to_receive = 0
        lbuff = sNx*nSx*sNy*nSy

        IF ( mpiMyId .NE. 0 ) THEN
C--   All processes except 0 wait to be polled (unless polling is
C     disabled at compile time), then send their local array
#ifndef DISABLE_MPI_READY_TO_RECEIVE
          CALL MPI_RECV( ready_to_receive, 1, MPI_INTEGER,
     &                   idest, itag, MPI_COMM_MODEL, istatus, ierr )
#endif
          CALL MPI_SEND( myField, lbuff, _MPI_TYPE_RX,
     &                   idest, itag, MPI_COMM_MODEL, ierr )

        ELSE
C--   Process 0 polls and receives data from each process in turn
          DO np = 2, nPx*nPy
            pId = np - 1
#ifndef DISABLE_MPI_READY_TO_RECEIVE
            CALL MPI_SEND( ready_to_receive, 1, MPI_INTEGER,
     &                     pId, itag, MPI_COMM_MODEL, ierr )
#endif
            CALL MPI_RECV( temp, lbuff, _MPI_TYPE_RX,
     &                     pId, itag, MPI_COMM_MODEL, istatus, ierr )

C--   Process 0 copies the received local array into the global
C     buffer, using the same mapping as for its own tiles
#ifdef ALLOW_EXCH2
            IF ( useExch2GlobLayOut ) THEN

              DO bj=1,nSy
                DO bi=1,nSx
                  tN = W2_procTileList(bi,bj,np)
C-    default (face fits into the global-IO-array)
                  iGjLoc = 0
                  jGjLoc = 1
                  IF ( exch2_mydNx(tN) .GT. xSize ) THEN
C-    face x-size larger than glob-size : fold it
                    jGjLoc = exch2_mydNx(tN) / xSize
                  ELSEIF ( exch2_tNy(tN) .GT. ySize ) THEN
C-    tile y-size larger than glob-size : make a long line
                    iGjLoc = exch2_mydNx(tN)
                    jGjLoc = 0
                  ENDIF

                  DO j=1,sNy
#ifdef TARGET_NEC_SX
!cdir novector
#endif
                    iG = exch2_txGlobalo(tN) - 1 + iGjLoc*(j-1)
                    jG = exch2_tyGlobalo(tN) + jGjLoc*(j-1)
                    DO i=1,sNx
                      gloBuff(iG+i,jG) = temp(i,j,bi,bj)
                    ENDDO
                  ENDDO
                ENDDO
              ENDDO

            ELSE
#endif /* ALLOW_EXCH2 */
C-    Standard layout: use the global offsets of process np
              iBase = mpi_myXGlobalLo(np)-1
              jBase = mpi_myYGlobalLo(np)-1

              DO bj=1,nSy
                DO bi=1,nSx
                  DO j=1,sNy
#ifdef TARGET_NEC_SX
!cdir novector
#endif
                    iG = iBase + sNx*(bi-1)
                    jG = jBase + sNy*(bj-1) + j
                    DO i=1,sNx
                      gloBuff(iG+i,jG) = temp(i,j,bi,bj)
                    ENDDO
                  ENDDO
                ENDDO
              ENDDO

#ifdef ALLOW_EXCH2
C-    end if-else useExch2GlobLayOut
            ENDIF
#endif /* ALLOW_EXCH2 */

C-    end loop on np
          ENDDO

C-    end if-else mpiMyId not 0
        ENDIF

C-    end if usingMPI
      ENDIF
#endif /* ALLOW_USE_MPI */

      _END_MASTER( myThid )

      RETURN
      END