/[MITgcm]/MITgcm_contrib/test_scripts/engaging/test_engag_op64_adm
ViewVC logotype

Annotation of /MITgcm_contrib/test_scripts/engaging/test_engag_op64_adm

Parent Directory | Revision Log | View Revision Graph


Revision 1.28 - (hide annotations) (download)
Thu Oct 19 14:43:00 2023 UTC (20 months, 4 weeks ago) by jmc
Branch: MAIN
Changes since 1.27: +7 -1 lines
check testreport exit value before running restart test

1 jmc 1.1 #!/bin/bash
2 jmc 1.13 #SBATCH -J o64Adm_tst
3 jmc 1.1 #SBATCH -p sched_mit_hill
4 jmc 1.26 #SBATCH -t 06:00:00
5 jmc 1.1 #SBATCH --mem-per-cpu 4000
6     #SBATCH -n 6
7     #SBATCH -N 2
8 jmc 1.23 # #SBATCH -x node[360,365]
9 jmc 1.13 #SBATCH -e /home/jm_c/test_engaging/output/o64Adm_tst.stderr
10     #SBATCH -o /home/jm_c/test_engaging/output/o64Adm_tst.stdout
11 jmc 1.19 #SBATCH --no-requeue
12 jmc 1.1
13 jmc 1.28 # $Header: /u/gcmpack/MITgcm_contrib/test_scripts/engaging/test_engag_op64_adm,v 1.27 2023/02/19 15:02:22 jmc Exp $
14 jmc 1.1 # $Name: $
15    
#- Source the site's modules init file when it exists (presumably it defines
#  the "module" command used further down -- confirm on the target cluster):
if test -f /etc/profile.d/modules.sh ; then . /etc/profile.d/modules.sh ; fi
# Note: added "ulimit -s unlimited" in file "~/.bashrc"
#  to pass big test (the 2 fizhi-cs-* test & adjoint tests) with MPI

umask 0022
#- to get case insensitive "ls" (and order of tested experiments)
export LC_ALL="en_US.UTF-8"
echo " running on: $(hostname)"
#- host on which the "mpack" command of $SEND is run (through ssh):
headNode='eofe8'

dNam='engaging'
HERE="$HOME/test_${dNam}"
OUTP="$HERE/output"; SavD="$HERE/send"
#- command handed to testreport with option "-send":
SEND="ssh $headNode $SavD/mpack"
TST_DIR="/pool001/jm_c/test_$dNam"
#- scratch file receiving the stderr of "git clone". Created with mktemp so
#  that its name cannot be guessed in the shared /tmp, and removed on any
#  exit path by the trap below.
tmpFil=$(mktemp "/tmp/$(basename "$0").XXXXXX") || {
  echo "ERROR: cannot create a temporary file in /tmp"
  exit 1
}
trap 'rm -f "$tmpFil"' EXIT
#- CVS access command (not used in the part of the script visible here):
cmdCVS='cvs -d :pserver:cvsanon@mitgcm.org:/u/gcmpack -q'
#- which GitHub repository to use and how to access it:
git_repo='MITgcm'; git_code='MITgcm' ; git_other='verification_other'
#git_repo='altMITgcm'; #git_code='MITgcm66h'
#--
git_repo="https://github.com/$git_repo"
#git_repo="git://github.com/$git_repo"
#git_repo="git@github.com:$git_repo"
40 jmc 1.1
#- Defaults for the test selection:
dblTr=0
typ=''
addExp=''
skipExp=''
#- Settings of this particular test:
#   sfx   : suffix used in the clone dir name and the testreport output-dir
#   typ   : option passed to testreport (also used for "testreport -clean")
#   dblTr : 1 => call testreport twice (compile-only pass, then run pass)
sfx='o64Adm'
typ='-adm'
dblTr=1
#- currently, no NetCDF => no pkg/profiles
skipExp="$skipExp global_oce_biogeo_bling"
module add open64
module add mvapich2/open64/64/2.0b
export MPI_INC_DIR="$MPI_HOME/include"
OPTFILE="../tools/build_options/linux_amd64_open64"
#options="-j 2 -devel -gsl"
options="$typ -MPI 6"
#export OMP_NUM_THREADS=2
#export OMP_SLAVE_STACK_SIZE=400m
#export GSL_IEEE_MODE=double-precision,mask-underflow,mask-denormalized
ulimit -s unlimited
#- need this to get "staf":
export PATH="$PATH:$HOME/bin"

gcmDIR="MITgcm_$sfx"
#- day of the month modulo 3 selects the optimisation level: "-fast" one day
#  out of three, "-devel" otherwise. "expr" is used on purpose: it takes
#  "08" and "09" as decimal numbers.
dAlt=$(date +%d)
dAlt=$(expr $dAlt % 3)
case "$dAlt" in
  1) options="$options -fast" ;;
  *) options="$options -devel" ;;
esac
#- strip the leading blank(s) from the list of experiments to skip:
if test -n "$skipExp" ; then
  skipExp=$(echo $skipExp | sed 's/^ *//')
fi

#- checkOut=1 : update the existing clone ; reset to 2 (fresh clone) further
#  down if the clone is missing.
checkOut=1 ; #options="$options -do"
#options="$options -nc" ; checkOut=1
#options="$options -q"  ; checkOut=0 ; dblTr=0
67 jmc 1.1
#- Move to the test directory. It must already exist (it is not created
#  here); stop with a non-zero status if it is missing or cannot be entered,
#  since everything below uses paths relative to it (including "rm -rf").
if test ! -d "$TST_DIR" ; then
  #if test ! -d $TST_DIR ; then mkdir $TST_DIR ; fi
  #if test ! -d $TST_DIR ; then
  #  echo "ERROR: Can't create directory \"$TST_DIR\""
  #  exit 1
  #fi
  #echo "start in new dir TST_DIR='$TST_DIR' at: "`date`
  echo "ERROR: missing directory \"$TST_DIR\""
  exit 1
fi
echo "start from TST_DIR='$TST_DIR' at: "$(date)
if ! cd "$TST_DIR" ; then
  echo "ERROR: cannot change to directory \"$TST_DIR\""
  exit 1
fi
pwd
df .
83 jmc 1.11
#- Print a header describing the job: start date, number of tasks, node
#  list, OS release, SLURM environment variables and loaded modules.
NSLOTS=$SLURM_NTASKS
THEDATE=$(date)
printf '%s\n' '********************************************************************************'
echo 'Start job '$THEDATE
echo "NSLOTS = $NSLOTS"
printf '%s\n' '======= NODELIST ==============================================================='
echo $SLURM_NODELIST
cat /etc/redhat-release
printf '%s\n' '======= env ===================================================================='
env | grep SLURM
printf '%s\n' '======= modules ================================================================'
#- send stderr to stdout to get the list in the job output file:
module list 2>&1
printf '%s\n' '================================================================================'
97    
#- check for disk space: relative space (99%) or absolute (10.G):

# Check the disk that holds the current directory.
# Globals:  dsp (written) - 5th column of the last line of "df -P ." with
#           the trailing '%' removed
# Outputs:  a message (and the "df ." listing) on stdout when the disk is
#           full, or a warning when the "df" output cannot be interpreted
# Returns:  0 if testreport can be run (also when the usage could not be
#           determined: the check is best-effort), 1 if usage is above 99%
check_disk_space() {
  dsp=$(df -P . | tail -1 | awk '{print $5}' | sed 's/%$//')
  case "$dsp" in
    ''|*[!0-9]*)
      #- not a number: do not feed it to the numeric test below
      echo "WARNING: cannot get disk usage from 'df' (got '$dsp') => skip this check"
      return 0 ;;
  esac
  if [ "$dsp" -gt 99 ] ; then
    #dsp=`df -P . | tail -1 | awk '{print $4}'`
    #if [ $dsp -le 100000000 ] ; then
    echo 'Not enough space on this disk => do not run testreport.'
    df .
    return 1
  fi
  return 0
}

#- leave with a non-zero status so that the job is not reported as successful
check_disk_space || exit 1
#- An update (checkOut=1) needs an existing git clone of the code and, when
#  additional experiments are requested, of $git_other inside it; otherwise
#  switch to a fresh clone (checkOut=2).
if [ $checkOut -eq 1 ] ; then
  if [ ! -e "$gcmDIR/.git/config" ] ; then
    echo "no file: $gcmDIR/.git/config => try to download a fresh clone"
    checkOut=2
  fi
  if [ -n "$addExp" ] && [ ! -e "$gcmDIR/$git_other/.git/config" ] ; then
    echo "no file: $gcmDIR/$git_other/.git/config => try a fresh clone"
    checkOut=2
  fi
fi
#- checkOut=1 : re-use the existing clone. Archive and remove the previous
#  output, clean the testreport output, then update the code with "git pull".
#  A failing "git pull" stops the script with a non-zero status.
if [ $checkOut -eq 1 ] ; then
  echo "cleaning output from $gcmDIR/verification :"
  #- remove previous output tar files and tar & remove previous output-dir
  /bin/rm -f $gcmDIR/verification/??_${dNam}-${sfx}_????????_?.tar.gz
  ( cd "$gcmDIR/verification" || exit 1
    #- loop on the glob itself instead of parsing "ls" output; when nothing
    #  matches, the pattern is left as is and fails the "test -d" below.
    for dd in ??_${dNam}-${sfx}_????????_? ; do
      if test -d "$dd" ; then
        tar -cf "${dd}.tar" "$dd" > /dev/null 2>&1 \
          && gzip "${dd}.tar" && /bin/rm -rf "$dd"
        retVal=$?
        if test "x$retVal" != x0 ; then
          echo "ERROR in tar+gzip prev outp-dir: $dd"
          echo " on '$(hostname)' (return val=$retVal) but continue"
        fi
      fi
    done )
  echo "clean testreport output"
  # ( cd $gcmDIR/verification ; ../tools/do_tst_2+2 -clean )
  ( cd "$gcmDIR/verification" && ./testreport $typ -clean )
  if test "x$addExp" != x ; then
    #- remove the symbolic links found in the verification dir
    ( cd "$gcmDIR/verification" || exit 1
      listD=''
      for ff in * ; do
        if test -L "$ff" ; then
          listD="$listD $ff"
          /bin/rm -f -- "$ff"
        fi
      done
      echo " + remove local links:$listD"
    )
  fi
  echo "Update $git_code code in dir $gcmDIR :"
  ( cd "$gcmDIR" && git pull ) 2>&1
  retVal=$?
  if test "x$retVal" != x0 ; then
    echo "git pull on '$(hostname)' fail (return val=$retVal) => exit"
    exit 1
  fi
  echo "  and checkout master:"
  ( cd "$gcmDIR" && git checkout master -- . ) 2>&1
  if test "x$addExp" != x ; then
    echo "Update $git_other code in dir $gcmDIR/$git_other :"
    ( cd "$gcmDIR/$git_other" && git pull ) 2>&1
    retVal=$?
    if test "x$retVal" != x0 ; then
      echo "git pull on '$(hostname)' fail (return val=$retVal) => exit"
      exit 1
    fi
    echo "  and checkout master:"
    ( cd "$gcmDIR/$git_other" && git checkout master -- . ) 2>&1
  fi
fi
167 jmc 1.17
#- checkOut=2 : start from scratch. Remove any previous working copy, clone
#  the code (and $git_other when additional experiments are requested), then
#  open the group permissions on the new tree. The stderr of "git clone" is
#  kept in $tmpFil and only shown on failure, in which case the script stops
#  with a non-zero status.
if [ $checkOut -eq 2 ] ; then
  #- quoted, so that an empty $gcmDIR does not pass the test
  if test -e "$gcmDIR" ; then
    echo -n "Removing working copy: $gcmDIR ..."
    rm -rf "$gcmDIR"
    echo "  done"
  fi
  echo "Make a clone of $git_code from repo: $git_repo ..."
  git clone "$git_repo/${git_code}.git" "$gcmDIR" 2> "$tmpFil"
  retVal=$?
  if test $retVal = 0 ; then
    echo ' done' ; rm -f "$tmpFil"
  else
    echo " Error: 'git clone' returned: $retVal"
    cat "$tmpFil" ; rm -f "$tmpFil"
    exit 1
  fi
  if test "x$addExp" != x ; then
    echo "Make a clone of $git_other from repo: $git_repo ..."
    ( cd "$gcmDIR" && git clone "$git_repo/${git_other}.git" 2> "$tmpFil" )
    retVal=$?
    if test $retVal = 0 ; then
      echo ' done' ; rm -f "$tmpFil"
    else
      echo " Error: 'git clone' returned: $retVal"
      cat "$tmpFil" ; rm -f "$tmpFil"
      exit 1
    fi
  fi
  if test -d "$gcmDIR/verification" ; then
    #- "-exec ... +" passes the names straight to chmod (safe with any name)
    /usr/bin/find "$gcmDIR" -type d -exec chmod g+rxs {} +
    /usr/bin/find "$gcmDIR" -type f -exec chmod g+r {} +
  fi
fi
201    
#- change dir to $gcmDIR/verification + add link for additional experiments:
#  stop with a non-zero status if the directory is missing or cannot be
#  entered, since testreport is run from there.
if test ! -e "$gcmDIR/verification" ; then
  echo "no dir: $gcmDIR/verification => exit"
  exit 1
fi
if [ $checkOut -lt 2 ] ; then
  echo " dir $gcmDIR/verification exist"
fi
if ! cd "$gcmDIR/verification" ; then
  echo "cannot change to dir: $gcmDIR/verification => exit"
  exit 1
fi
#- $addExp is a blank-separated list: left unquoted on purpose
for exp2add in $addExp ; do
  #- replace any previous copy or link by a link to the dir in $git_other
  test -r "$exp2add" && /bin/rm -rf "$exp2add"
  if test -d "../$git_other/$exp2add" ; then
    echo " add $exp2add link from $git_other"
    ln -s "../$git_other/$exp2add" .
  else
    echo " missing dir: $git_other/$exp2add"
  fi
done
221    
#- Run testreport from the verification dir. Each command is echoed first,
#  to get it in the job output. $options is left unquoted on purpose: it
#  holds several options.
outDir="${dNam}-$sfx"
if [ $dblTr -eq 1 ] ; then
  echo
  #- 1) just compile ("-nr"), using "-j 2" to speed up
  echo ./testreport $options -of $OPTFILE -skd \'$skipExp\' \
       -j 2 -nr -odir $outDir
  ./testreport $options -of $OPTFILE -skd "$skipExp" \
       -j 2 -nr -odir $outDir
  #- option added for the second call, after the compile-only pass
  options="$options -q"
fi

echo
#- 2) run and report results ; also finish to compile those who failed with "-j"
echo ./testreport $options -of $OPTFILE -skd \'$skipExp\' \
     -odir $outDir -send \'$SEND\' -sd $SavD -a jm_c@mitgcm.org
./testreport $options -of $OPTFILE -skd "$skipExp" \
     -odir $outDir -send "$SEND" -sd $SavD -a jm_c@mitgcm.org
retVal=$?

#- only report a non-zero return value (the restart test is commented out):
if [ "x$retVal" != x0 ] ; then
  echo "<== testreport returned retVal=${retVal}, expecting 0"
# echo " -> skip restart test 'do_tst_2+2'"
#else
# echo ''
#- 3) test restart and report results
# echo ../tools/do_tst_2+2 -mpi \
#  -o ${dNam}-$sfx -send \'$SEND\' -sd $SavD -a jm_c@mitgcm.org
# ../tools/do_tst_2+2 -mpi \
#  -o ${dNam}-$sfx -send "$SEND" -sd $SavD -a jm_c@mitgcm.org
fi
251 jmc 1.1
# exit 0
#- Append to ${OUTP}/tracer_adj.log: the SLURM tasks-per-node setting, the
#  date, and the 'My Processor Name' lines found in the STDOUT.000? files of
#  the two run directories of tutorial_tracer_adjsens.
{
  printf '%s' "-- SLURM_TASKS_PER_NODE= $SLURM_TASKS_PER_NODE ; "
  date
  for rDir in run tr_run.som81 ; do
    grep 'My Processor Name' tutorial_tracer_adjsens/$rDir/STDOUT.000? \
      | sed 's/tutorial_tracer_adjsens\// /'
  done
} >> ${OUTP}/tracer_adj.log

  ViewVC Help
Powered by ViewVC 1.1.22