1 |
jmc |
1.1 |
#! /bin/sh |
2 |
|
|
|
3 |
jmc |
1.2 |
# $Header: /u/gcmpack/MITgcm/verification/cpl_aim+ocn/run_cpl_test,v 1.17 2010/12/06 02:52:40 jmc Exp $ |
4 |
jmc |
1.1 |
# $Name: $ |
5 |
|
|
|
6 |
|
|
#- default: |
7 |
|
|
#Npr=3 ; NpOc=1 ; |
8 |
|
|
Npr=25; NpOc=12; |
9 |
|
|
MTH= |
10 |
|
|
MTHo= |
11 |
|
|
MTHa= |
12 |
jmc |
1.2 |
#GMKopt='-devel' |
13 |
jmc |
1.1 |
GMKopt='-ieee' |
14 |
|
|
#GMKopt= |
15 |
|
|
rnkO=1 ; rnkA=`expr $rnkO + $NpOc` |
16 |
|
|
|
17 |
|
|
#- parse options: |
18 |
|
|
if [ $# -ge 1 ] ; then if test $1 = '-mth' ; then |
19 |
|
|
MTH='-omp' ; shift |
20 |
|
|
if test -f input_ocn/eedata.mth ; then MTHo=$MTH ; fi |
21 |
|
|
if test -f input_atm/eedata.mth ; then MTHa=$MTH ; fi |
22 |
|
|
fi ; fi |
23 |
|
|
if [ $# -ne 1 ] |
24 |
|
|
then |
25 |
|
|
echo 'Usage:'`basename $0`' [opt] step' |
26 |
|
|
echo ' => test coupled set-up on linux box (1.cpu)' |
27 |
|
|
echo 'opt = -mth : compile and run (if eedata.mth) 2-threads for ocn & atm' |
28 |
|
|
echo ' step = 0 : clean all directories' |
29 |
|
|
echo ' step = 1 : compile the 3 executables (cpl,ocn,atm)' |
30 |
|
|
echo ' step = 2 : copy input files and dir(s)' |
31 |
|
|
echo " step = 3 : run with $Npr mpi processes" |
32 |
|
|
echo ' step = 4 : check the results' |
33 |
|
|
echo ' step = 5 : remove output files in rank_0,1,2 dir.' |
34 |
|
|
exit |
35 |
|
|
fi |
36 |
|
|
kpr=$1 |
37 |
|
|
dir=`pwd` |
38 |
|
|
|
39 |
|
|
#============================================================================ |
40 |
|
|
|
41 |
|
|
if test $kpr = 0 |
42 |
|
|
then |
43 |
|
|
rm -f pr_group std_outp comp_res.{ocn,atm,land,sice} |
44 |
|
|
rm -f build_???/TTT.*make.* build_???/TTT.mkdepend.* |
45 |
|
|
/bin/rm -r -f rank_? rank_1? rank_2? |
46 |
|
|
if test -f build_cpl/Makefile ; then cd build_cpl ; make Clean ; cd .. ; fi |
47 |
|
|
if test -f build_ocn/Makefile ; then cd build_ocn ; make Clean ; cd .. ; fi |
48 |
|
|
if test -f build_atm/Makefile ; then cd build_atm ; make Clean ; cd .. ; fi |
49 |
|
|
fi |
50 |
|
|
if test $kpr = 5 |
51 |
|
|
then |
52 |
|
|
echo 'remove output files in rank_0,1,2 dir.' |
53 |
|
|
rm -f pr_group std_outp comp_res.{ocn,atm,land,sice} |
54 |
|
|
if test -d rank_0 ; then cd rank_0 ; rm -f Coupler.0000.clog ; cd .. ; fi |
55 |
|
|
if test -d rank_$rnkO |
56 |
|
|
then cd rank_$rnkO ; rm -f *.data *.meta STD???.0000 UV-*.0001.clog ; cd .. ; fi |
57 |
|
|
if test -d rank_$rnkA |
58 |
|
|
then cd rank_$rnkA ; rm -f *.data *.meta STD???.0000 UV-*.0001.clog ; cd .. ; fi |
59 |
|
|
fi |
60 |
|
|
|
61 |
|
|
if test $kpr = 1 |
62 |
|
|
then |
63 |
|
|
|
64 |
|
|
#- choice of the optfile: take a local one in dir verification with sufix '+mpi' |
65 |
|
|
nbOpF=`ls ../linux_* | grep '+mpi' 2> /dev/null | wc -l` |
66 |
|
|
if test $nbOpF = 1 ; then |
67 |
|
|
OPTFILE=`ls ../linux_* | grep '+mpi'` |
68 |
|
|
zz=`grep '^FC=' $OPTFILE` |
69 |
|
|
echo " Using optfile: $OPTFILE (compiler=$zz) $MTH" |
70 |
|
|
elif [ $nbOpF -ge 2 ] ; then |
71 |
|
|
echo "pick the 1rst of these ( $nbOpF ) optfiles:" |
72 |
|
|
ls ../linux_* | grep '+mpi' |
73 |
|
|
OPTFILE=`ls ../linux_* | grep '+mpi' | head -1` |
74 |
|
|
zz=`grep '^FC=' $OPTFILE` |
75 |
|
|
echo " Using optfile: $OPTFILE (compiler=$zz) $MTH" |
76 |
|
|
else |
77 |
|
|
echo "Pb in finding optfile: found $nbOpF :" |
78 |
|
|
ls ../linux_* | grep '+mpi' ; exit |
79 |
|
|
fi |
80 |
|
|
zz=`echo $OPTFILE | grep -c '^\/'` |
81 |
|
|
if test $zz = 0 ; then OPTFILE="../$OPTFILE" ; fi |
82 |
|
|
#--- |
83 |
|
|
echo '==== compile coupler:' |
84 |
|
|
cd build_cpl |
85 |
|
|
echo ' --- genmake2 (cpl):' |
86 |
|
|
../../../tools/genmake2 -of $OPTFILE -mpi $GMKopt > TTT.genmake.$$ |
87 |
|
|
tail -5 TTT.genmake.$$ |
88 |
|
|
echo ' --- make depend (cpl):' |
89 |
|
|
make depend > TTT.mkdepend.$$ |
90 |
|
|
tail -5 TTT.mkdepend.$$ |
91 |
|
|
echo ' --- make (cpl):' |
92 |
|
|
make > TTT.make.$$ 2>&1 |
93 |
|
|
tail -10 TTT.make.$$ |
94 |
|
|
echo ' ' ; cd $dir |
95 |
|
|
|
96 |
|
|
echo '==== compile OGCM:' |
97 |
|
|
cd build_ocn |
98 |
|
|
echo ' --- genmake2 (ocn):' |
99 |
|
|
../../../tools/genmake2 -of $OPTFILE -mpi $MTHo $GMKopt > TTT.genmake.$$ |
100 |
|
|
tail -5 TTT.genmake.$$ |
101 |
|
|
echo ' --- make depend (ocn):' |
102 |
|
|
make depend > TTT.mkdepend.$$ |
103 |
|
|
tail -10 TTT.mkdepend.$$ |
104 |
|
|
echo ' --- make (ocn):' |
105 |
|
|
make > TTT.make.$$ 2>&1 |
106 |
|
|
tail -10 TTT.make.$$ |
107 |
|
|
echo ' ' ; cd $dir |
108 |
|
|
|
109 |
|
|
echo '==== compile AGCM:' |
110 |
|
|
cd build_atm |
111 |
|
|
echo ' --- genmake2 (atm):' |
112 |
|
|
../../../tools/genmake2 -of $OPTFILE -mpi $MTHa $GMKopt > TTT.genmake.$$ |
113 |
|
|
tail -5 TTT.genmake.$$ |
114 |
|
|
echo ' --- make depend (atm):' |
115 |
|
|
make depend > TTT.mkdepend.$$ |
116 |
|
|
tail -10 TTT.mkdepend.$$ |
117 |
|
|
echo ' --- make (atm):' |
118 |
|
|
make > TTT.make.$$ 2>&1 |
119 |
|
|
tail -10 TTT.make.$$ |
120 |
|
|
echo ' ' ; cd $dir |
121 |
|
|
|
122 |
|
|
ls -l build_???/mitgcmuv |
123 |
|
|
|
124 |
|
|
fi |
125 |
|
|
|
126 |
|
|
if test $kpr = 2 |
127 |
|
|
then |
128 |
|
|
echo 'rm dir:' rank_? rank_1? rank_2? |
129 |
|
|
/bin/rm -r -f rank_? rank_1? rank_2? |
130 |
|
|
echo 'Link files from dir:' input_cpl '->' rank_0 |
131 |
|
|
mkdir rank_0 |
132 |
|
|
( cd rank_0 ; ln -s ../input_cpl/* . ) |
133 |
|
|
|
134 |
|
|
n=$rnkO |
135 |
|
|
echo 'Link files from dir:' input_ocn '->' rank_$n |
136 |
|
|
mkdir rank_$n |
137 |
|
|
cd rank_$n |
138 |
|
|
ln -s ../input_ocn/* . |
139 |
|
|
if test -x prepare_run ; then ./prepare_run ; fi |
140 |
|
|
if test "x$MTHo" != x ; then |
141 |
|
|
echo " MTH run: mv -f eedata.mth eedata" |
142 |
|
|
if test -h eedata ; then rm -f eedata ; fi |
143 |
|
|
mv -f eedata.mth eedata |
144 |
|
|
fi |
145 |
|
|
cd $dir |
146 |
|
|
n=`expr $n + 1` |
147 |
|
|
while [ $n -le $NpOc ] ; do |
148 |
|
|
ln -s rank_$rnkO rank_$n |
149 |
|
|
n=`expr $n + 1` |
150 |
|
|
done |
151 |
|
|
|
152 |
|
|
n=$rnkA |
153 |
|
|
echo 'Link files from dir:' input_atm '->' rank_$n |
154 |
|
|
mkdir rank_$n |
155 |
|
|
cd rank_$n |
156 |
|
|
ln -s ../input_atm/* . |
157 |
|
|
if test -x prepare_run ; then ./prepare_run ; fi |
158 |
|
|
if test "x$MTHa" != x ; then |
159 |
|
|
echo " MTH run: mv -f eedata.mth eedata" |
160 |
|
|
if test -h eedata ; then rm -f eedata ; fi |
161 |
|
|
mv -f eedata.mth eedata |
162 |
|
|
fi |
163 |
|
|
cd $dir |
164 |
|
|
n=`expr $n + 1` |
165 |
|
|
while [ $n -lt $Npr ] ; do |
166 |
|
|
ln -s rank_$rnkA rank_$n |
167 |
|
|
n=`expr $n + 1` |
168 |
|
|
done |
169 |
|
|
|
170 |
|
|
fi |
171 |
|
|
|
172 |
|
|
if test $kpr = 3 |
173 |
|
|
then |
174 |
|
|
ROOTDIR=$dir |
175 |
|
|
# rm -f rank_?/pickup*.ckptA.00?.00?.??ta |
176 |
|
|
echo $ROOTDIR |
177 |
|
|
tmpfil=TTT.$$ |
178 |
|
|
|
179 |
|
|
#--- running on the same node: |
180 |
|
|
list='' ; nc=0; xx=`hostname` |
181 |
|
|
while [ $nc -lt $Npr ] ; do list="$list $xx" ; nc=`expr $nc + 1` ; done |
182 |
|
|
#-- On darwin cluster node (from qrsh session): |
183 |
|
|
JOB_ID=`qstat | sed -n '3,$ p' | grep " $USER " | awk '{print $1}'` |
184 |
|
|
NODEFILE="/tmp/$JOB_ID.1.darwin/machines" |
185 |
|
|
echo " JOB_ID = '$JOB_ID' ; NODEFILE = '$NODEFILE'" |
186 |
|
|
#-- On ACES cluster (in PBS batch job): |
187 |
|
|
# NODEFILE=$PBS_NODEFILE |
188 |
|
|
#--- running on different nodes: |
189 |
|
|
ls -l $NODEFILE |
190 |
|
|
nprc=`cat $NODEFILE | uniq | wc -l` |
191 |
|
|
if [ $nprc -ge $Npr ] ; then |
192 |
|
|
list=`cat $NODEFILE | uniq | head -$Npr` |
193 |
|
|
else |
194 |
|
|
list=`cat $NODEFILE | head -$Npr` |
195 |
|
|
fi |
196 |
|
|
|
197 |
|
|
nc=0; nn=0; dd1=cpl ; |
198 |
|
|
rm -f pr_group ; touch pr_group |
199 |
|
|
for xx in $list |
200 |
|
|
do |
201 |
|
|
echo $xx $nn $dir/build_$dd1/mitgcmuv >> pr_group |
202 |
|
|
nc=`expr $nc + 1` |
203 |
|
|
if [ $nc -le $NpOc ] ; then dd1=ocn ; else dd1=atm ; fi |
204 |
|
|
nn=1 |
205 |
|
|
done |
206 |
jmc |
1.2 |
NpAt=`expr $Npr - 1 - $NpOc` |
207 |
|
|
RunOpt="-np 1 ./build_cpl/mitgcmuv" |
208 |
|
|
RunOpt="$RunOpt : -np $NpOc ./build_ocn/mitgcmuv" |
209 |
|
|
RunOpt="$RunOpt : -np $NpAt ./build_atm/mitgcmuv" |
210 |
jmc |
1.1 |
|
211 |
|
|
cd $ROOTDIR |
212 |
|
|
if test "x$MTH" != x ; then |
213 |
|
|
export OMP_NUM_THREADS=2 ; export KMP_STACKSIZE=400m |
214 |
|
|
if test "x$MTHo" != x ; then |
215 |
|
|
echo -n " run OCN ($MTHo) with $OMP_NUM_THREADS threads ;" |
216 |
|
|
fi |
217 |
|
|
if test "x$MTHa" != x ; then |
218 |
|
|
echo -n " run ATM ($MTHa) with $OMP_NUM_THREADS threads ;" |
219 |
|
|
fi |
220 |
|
|
echo "" |
221 |
|
|
fi |
222 |
jmc |
1.2 |
mpich=`which mpirun` |
223 |
|
|
echo $mpich | grep 'mpich-mx' > /dev/null 2>&1 |
224 |
|
|
mpichmx=$? |
225 |
|
|
echo $mpich | grep 'mpich2' > /dev/null 2>&1 |
226 |
|
|
mpich2=$? |
227 |
|
|
if test $mpich2 == 0 ; then |
228 |
|
|
#- with Hydra mpich2 (on baudelaire): |
229 |
|
|
echo "execute 'mpirun $RunOpt' :" |
230 |
|
|
mpirun $RunOpt > std_outp 2>&1 |
231 |
|
|
elif test $mpichmx == 0 ; then |
232 |
|
|
#- with mpich-mx (on beagle): |
233 |
|
|
echo "execute 'mpirun -pg pr_group -v ./build_cpl/mitgcmuv' :" |
234 |
|
|
mpirun -pg pr_group -v ./build_cpl/mitgcmuv > std_outp 2>&1 |
235 |
|
|
else |
236 |
|
|
# /usr/local/pkg/mpi/mpi-1.2.4..8a-gm-1.5/pgi/bin/mpirun.ch_gm -pg pr_group -wd $ROOTDIR --gm-kill 5 -v ./build_cpl/mitgcmuv > std_outp 2>&1 |
237 |
|
|
#- with mpich-1 (on danton, ACES): |
238 |
|
|
echo "execute 'mpirun -p4pg pr_group -v ./build_cpl/mitgcmuv' :" |
239 |
|
|
mpirun -p4pg pr_group -v ./build_cpl/mitgcmuv > std_outp 2>&1 |
240 |
|
|
fi |
241 |
jmc |
1.1 |
tail -20 std_outp |
242 |
|
|
ls -l rank_$rnkO/pickup*.ckptA.001.001.data |
243 |
|
|
ls -l rank_$rnkA/pickup*.ckptA.001.001.data |
244 |
|
|
|
245 |
|
|
fi |
246 |
|
|
|
247 |
|
|
if test $kpr = 4 |
248 |
|
|
then |
249 |
jmc |
1.2 |
CompRes="$HOME/bin/comp_res" |
250 |
jmc |
1.1 |
|
251 |
|
|
if test -f rank_$rnkO/STDOUT.0000 |
252 |
|
|
then echo '==> check Ocean output:' |
253 |
jmc |
1.2 |
$CompRes rank_$rnkO/STDOUT.0000 results/ocnSTDOUT.0000 |
254 |
jmc |
1.1 |
mv -f comp_res.log comp_res.ocn |
255 |
|
|
echo ' ' |
256 |
|
|
else echo "No Ocean output file in rank_$rnkO" ; fi |
257 |
|
|
|
258 |
|
|
if test -f rank_$rnkA/STDOUT.0000 |
259 |
|
|
then |
260 |
|
|
echo '==> check Atmos output:' |
261 |
jmc |
1.2 |
$CompRes rank_$rnkA/STDOUT.0000 results/atmSTDOUT.0000 |
262 |
jmc |
1.1 |
mv -f comp_res.log comp_res.atm |
263 |
|
|
echo '==> check Land output:' |
264 |
jmc |
1.2 |
$CompRes rank_$rnkA/STDOUT.0000 results/atmSTDOUT.0000 L |
265 |
jmc |
1.1 |
mv -f comp_res.log comp_res.land |
266 |
|
|
echo '==> check thSIce output:' |
267 |
jmc |
1.2 |
$CompRes rank_$rnkA/STDOUT.0000 results/atmSTDOUT.0000 I |
268 |
jmc |
1.1 |
mv -f comp_res.log comp_res.sice |
269 |
|
|
echo ' ' |
270 |
|
|
else echo "No Atmos output file in rank_$rnkA" ; fi |
271 |
|
|
|
272 |
|
|
fi |
273 |
|
|
|
274 |
|
|
exit 0 |