/[MITgcm]/MITgcm_contrib/test_scripts/engaging/test_engag_op64_mpi
ViewVC logotype

Annotation of /MITgcm_contrib/test_scripts/engaging/test_engag_op64_mpi

Parent Directory Parent Directory | Revision Log Revision Log | View Revision Graph Revision Graph


Revision 1.3 - (hide annotations) (download)
Sun Feb 19 15:02:22 2023 UTC (2 years, 4 months ago) by jmc
Branch: MAIN
Changes since 1.2: +16 -19 lines
- minor tweaks to get a more uniform set of scripts.
- also tweak "-j" options (added in: gfoAdm, gfoTlm, o64Adm, changed from 3
  to 2 in o64Mpi) for first compiling step (-nr).

1 jmc 1.1 #!/bin/bash
2     #SBATCH -J o64Mpi_tst
3     #SBATCH -p sched_mit_hill
4 jmc 1.2 #SBATCH -t 06:00:00
5 jmc 1.1 #SBATCH --mem-per-cpu 4000
6     #SBATCH -n 6
7     #SBATCH -N 2
8     # #SBATCH -x node[360,365]
9     #SBATCH -e /home/jm_c/test_engaging/output/o64Mpi_tst.stderr
10     #SBATCH -o /home/jm_c/test_engaging/output/o64Mpi_tst.stdout
11     #SBATCH --no-requeue
12    
13 jmc 1.3 # $Header: /u/gcmpack/MITgcm_contrib/test_scripts/engaging/test_engag_op64_mpi,v 1.2 2022/12/03 20:36:21 jmc Exp $
14 jmc 1.1 # $Name: $
15    
#- Source the environment-modules init script when it exists ; presumably
#- this is what defines the "module" command used further down (to confirm).
16 jmc 1.3 if test -f /etc/profile.d/modules.sh ; then . /etc/profile.d/modules.sh ; fi
17 jmc 1.1 # Note: added "ulimit -s unlimited" in file "~/.bashrc"
18     # to pass the big tests (the 2 fizhi-cs-* tests & adjoint tests) with MPI
19    
#- Site settings: file-creation mask, locale, host and directory names.
#- umask 0022: files created by this job are not writable by group and others
20     umask 0022
21     #- to get case insensitive "ls" (and order of tested experiments)
22     export LC_ALL="en_US.UTF-8"
23     echo " running on: "`hostname`
#- host on which the "$SEND" command is run through ssh
24 jmc 1.3 headNode='eofe8'
25 jmc 1.1
#- dNam tags the per-machine directories and the output-dir name ("-odir")
26     dNam='engaging'
27 jmc 1.3 HERE="$HOME/test_${dNam}"
#- OUTP is only referenced in the commented-out lines at the end of the script ;
#- SavD is the directory given to "-sd" and the one that holds "mpack"
28 jmc 1.1 OUTP="$HERE/output"; SavD="$HERE/send"
#- command given to "-send": runs $SavD/mpack on $headNode through ssh
29 jmc 1.3 SEND="ssh $headNode $SavD/mpack"
#- directory in which the code is cloned/updated and the tests are run
30 jmc 1.1 TST_DIR="/pool001/jm_c/test_$dNam"
#- scratch file that receives the stderr of "git clone" (script name + PID)
31     tmpFil="/tmp/"`basename $0`".$$"
#- NOTE(review): cmdCVS is not referenced anywhere else in this script
32     cmdCVS='cvs -d :pserver:cvsanon@mitgcm.org:/u/gcmpack -q'
33     #- which GitHub repository to use and how to access it:
#- git_repo : GitHub account name here, expanded to a full URL just below
#- git_code : repository cloned into $gcmDIR
#- git_other: repository cloned inside $gcmDIR, only when addExp is not empty
34     git_repo='MITgcm'; git_code='MITgcm' ; git_other='verification_other'
35     #git_repo='altMITgcm'; #git_code='MITgcm66h'
36     #--
#- access through https ; the two commented lines below are the alternatives
#- (git protocol, ssh)
37     git_repo="https://github.com/$git_repo"
38     #git_repo="git://github.com/$git_repo"
39     #git_repo="git@github.com:$git_repo"
40    
#- Compiler / MPI environment and base testreport options for this set-up.
#- dblTr  : when 1, testreport is run twice (compile-only pass, then run pass)
#- typ    : leading option(s) put in $options and passed to "testreport -clean"
#- addExp : list of additional experiments to link from $git_other
#- skipExp: list of experiments passed to testreport with "-skd"
41     dblTr=0 ; typ='' ; addExp='' ; skipExp=''
#- sfx is the suffix used in the clone directory and output-dir names
42     sfx='o64Mpi'; dblTr=1
43     #- currently, no NetCDF => no pkg/profiles
44     #skipExp="$skipExp global_oce_biogeo_bling"
45     module add open64
46     module add mvapich2/open64/64/2.0b
#- NOTE(review): MPI_HOME is presumably set by the mvapich2 module - to confirm
47     export MPI_INC_DIR="$MPI_HOME/include"
#- path relative to $gcmDIR/verification, from where testreport is run
48     OPTFILE="../tools/build_options/linux_amd64_open64"
49     #options="-j 2 -devel -gsl"
#- "-MPI 6": same number as the 6 tasks requested with "#SBATCH -n 6"
50     options="$typ -MPI 6"
51     #export OMP_NUM_THREADS=2
52     #export OMP_SLAVE_STACK_SIZE=400m
53     #export GSL_IEEE_MODE=double-precision,mask-underflow,mask-denormalized
54     ulimit -s unlimited
55     #- need this to get "staf":
56     #export PATH="$PATH:$HOME/bin"
57    
#- name of the local clone, relative to $TST_DIR
58     gcmDIR="MITgcm_$sfx"
#- alternate the optimisation level with the day of the month:
#- dAlt = day modulo 3 ; "expr" reads the zero-padded day (e.g. 08) as decimal
59     dAlt=`date +%d` ; dAlt=`expr $dAlt % 3`
#- remainder 1 => "-fast" ; remainder 0 or 2 => "-devel"
60     if [ $dAlt -eq 1 ] ; then options="$options -fast"
61     else options="$options -devel" ; fi
#- strip leading blanks from a non-empty skipExp list
62     if test "x$skipExp" != x ; then skipExp=`echo $skipExp | sed 's/^ *//'` ; fi
63    
#- checkOut selects how the code is obtained further down:
#-  1 = update the existing clone with "git pull" (switched to 2 if the clone
#-      is missing) ; 2 = remove the working copy and make a fresh clone ;
#-  any other value (e.g. 0) = use the code as it is, no update and no clone
64     checkOut=1 ; #options="$options -do"
65     #options="$options -nc" ; checkOut=1
66     #options="$options -q" ; checkOut=0 ; dblTr=0
67    
#- Make sure the working directory exists, then move into it.
#- The directory is never created here (that code is commented out below):
#- a missing TST_DIR is an error and stops the job with status 1.
68     if test -d $TST_DIR ; then
69     echo "start from TST_DIR='$TST_DIR' at: "`date`
70     else
71     #if test ! -d $TST_DIR ; then mkdir $TST_DIR ; fi
72     #if test ! -d $TST_DIR ; then
73     # echo "ERROR: Can't create directory \"$TST_DIR\""
74     # exit 1
75     #fi
76     #echo "start in new dir TST_DIR='$TST_DIR' at: "`date`
77     echo "ERROR: missing directory \"$TST_DIR\""
78     exit 1
79     fi
#- stop if "cd" fails: everything below ("rm -rf $gcmDIR", "git clone", ...)
#- uses paths relative to TST_DIR and must not run from another directory
80     cd $TST_DIR || { echo "ERROR: cannot cd to \"$TST_DIR\"" ; exit 1 ; }
#- log where the job runs and the disk usage of that file system
81     pwd
82     df .
83    
#- Write a header to the job output: start date, SLURM task count and node
#- list, OS release, SLURM environment variables and loaded modules.
#- NSLOTS and THEDATE are only used in the echo lines of this section.
84     NSLOTS=$SLURM_NTASKS
85     THEDATE=`date`
86     echo '********************************************************************************'
87     echo 'Start job '$THEDATE
88     echo 'NSLOTS = '$NSLOTS
89     echo '======= NODELIST ==============================================================='
90     echo $SLURM_NODELIST
91     cat /etc/redhat-release
92     echo '======= env ===================================================================='
93     env | grep SLURM
94     echo '======= modules ================================================================'
#- NOTE(review): 2>&1 presumably because "module list" writes to stderr - to confirm
95     module list 2>&1
96     echo '================================================================================'
97    
98     #- check for disk space: relative space (99%) or absolute (10.G):
#- dsp = 5th field of the last line of "df -P ." with the trailing % removed
#- (the use percentage of the file system holding the current directory)
99     dsp=`df -P . | tail -1 | awk '{print $5}' | sed 's/%$//'`
#- "-gt 99": only a file system reported as 100% full stops the job
100     if [ $dsp -gt 99 ] ; then
#- commented alternative: absolute test on the 4th field (available space)
101     #dsp=`df -P . | tail -1 | awk '{print $4}'`
102     #if [ $dsp -le 100000000 ] ; then
103     echo 'Not enough space on this disk => do not run testreport.'
104     df .
#- NOTE(review): bare "exit" returns the status of "df ." above, normally 0
105     exit
106     fi
#- An update (checkOut=1) needs an existing clone: when the git config file
#- of the main clone is missing, or that of the $git_other clone while
#- addExp is not empty, switch to a fresh clone (checkOut=2).
107     if [ $checkOut -eq 1 ] ; then
108     if test ! -e $gcmDIR/.git/config ; then
109     echo "no file: $gcmDIR/.git/config => try to download a fresh clone"
110     checkOut=2
111     fi
#- the second clone is only checked when additional experiments are requested
112     if test "x$addExp" != x ; then
113     if test ! -e $gcmDIR/$git_other/.git/config ; then
114     echo "no file: $gcmDIR/$git_other/.git/config => try a fresh clone"
115     checkOut=2
116     fi
117     fi
118     fi
#- Update an existing clone (checkOut=1): archive and clean the output of
#- the previous run, then bring the working copy up to date with git.
#- A failing "git pull" stops the job with exit status 1.
119     if [ $checkOut -eq 1 ] ; then
120     echo "cleaning output from $gcmDIR/verification :"
121     #- remove previous output tar files and tar & remove previous output-dir
122     /bin/rm -f $gcmDIR/verification/??_${dNam}-${sfx}_????????_?.tar.gz
#- the subshell keeps the "cd" local ; leave it if "cd" fails so that
#- tar and "rm -rf" never run from another directory
123     ( cd $gcmDIR/verification || exit 1
124     listD=`ls -1 -d ??_${dNam}-${sfx}_????????_? 2> /dev/null`
125     for dd in $listD
126     do
127     if test -d $dd ; then
#- tar, then gzip, then remove the directory: each step runs only if the
#- previous one succeeded ; retVal is the status of the last step that ran
128     tar -cf ${dd}".tar" $dd > /dev/null 2>&1 && gzip ${dd}".tar" && /bin/rm -rf $dd
129     retVal=$?
130     if test "x$retVal" != x0 ; then
131     echo "ERROR in tar+gzip prev outp-dir: $dd"
132     echo " on '"`hostname`"' (return val=$retVal) but continue"
133     fi
134     fi
135     done )
136 jmc 1.3 echo "clean tst_2+2 + testreport output"
137 jmc 1.1 ( cd $gcmDIR/verification ; ../tools/do_tst_2+2 -clean )
138     ( cd $gcmDIR/verification ; ./testreport $typ -clean )
139 jmc 1.3 if test "x$addExp" != x ; then
#- leave the subshell if "cd" fails so that no link is removed elsewhere
140     ( cd $gcmDIR/verification || exit 1
#- symbolic links are the "ls -o" lines starting with "l" ; field 8 is
#- taken as the link name
141     listD=`ls -o | grep '^l' | awk '{print $8}' 2> /dev/null`
142     echo " + remove local links: $listD"
143     /bin/rm -f $listD
144     )
145     fi
146 jmc 1.1 echo "Update $git_code code in dir $gcmDIR :"
147     ( cd $gcmDIR ; git pull ) 2>&1
#- retVal is the status of the subshell, i.e. of its last command (git pull)
148     retVal=$?
149     if test "x$retVal" != x0 ; then
150     echo "git pull on '"`hostname`"' fail (return val=$retVal) => exit"
#- explicit non-zero status: a bare "exit" would return the status of the
#- echo above (0) and the failed job would end as a success
151     exit 1
152     fi
153     echo " and checkout master:"
#- overwrite the files of the working tree with their version from branch
#- master ; the status of this command is not checked
154     ( cd $gcmDIR ; git checkout master -- . ) 2>&1
#- same update for the clone of additional experiments, when requested
155     if test "x$addExp" != x ; then
156     echo "Update $git_other code in dir $gcmDIR/$git_other :"
157     ( cd $gcmDIR/$git_other ; git pull ) 2>&1
158     retVal=$?
159     if test "x$retVal" != x0 ; then
160     echo "git pull on '"`hostname`"' fail (return val=$retVal) => exit"
#- explicit non-zero status, as for the main clone
161     exit 1
162     fi
163     echo " and checkout master:"
164     ( cd $gcmDIR/$git_other ; git checkout master -- . ) 2>&1
165     fi
166     fi
167    
#- Fresh clone (checkOut=2): remove any existing working copy, clone
#- $git_code into $gcmDIR and, when addExp is not empty, clone $git_other
#- inside it. A failing "git clone" stops the job with exit status 1.
168     if [ $checkOut -eq 2 ] ; then
169     if test -e $gcmDIR ; then
170     echo -n "Removing working copy: $gcmDIR ..."
171     rm -rf $gcmDIR
172     echo " done"
173     fi
174     echo "Make a clone of $git_code from repo: $git_repo ..."
#- stderr of git goes to $tmpFil and is only shown when the clone fails
175     git clone $git_repo/${git_code}.git $gcmDIR 2> $tmpFil
176     retVal=$?
177     if test $retVal = 0 ; then
178     echo ' done' ; rm -f $tmpFil
179     else
180     echo " Error: 'git clone' returned: $retVal"
181     cat $tmpFil ; rm -f $tmpFil
#- explicit non-zero status: a bare "exit" would return the status of the
#- "rm -f" above (0) and the failed job would end as a success
182     exit 1
183     fi
184     if test "x$addExp" != x ; then
185     echo "Make a clone of $git_other from repo: $git_repo ..."
#- cloned from inside $gcmDIR, so the result is $gcmDIR/$git_other
186     ( cd $gcmDIR ; git clone $git_repo/${git_other}.git 2> $tmpFil )
187     retVal=$?
188     if test $retVal = 0 ; then
189     echo ' done' ; rm -f $tmpFil
190     else
191     echo " Error: 'git clone' returned: $retVal"
192     cat $tmpFil ; rm -f $tmpFil
#- explicit non-zero status, as for the main clone
193     exit 1
194     fi
195     fi
#- give the group read access to the new clone: g+rxs on directories
#- (read, search, set-group-ID), g+r on regular files
196     if test -d $gcmDIR/verification ; then
197     /usr/bin/find $gcmDIR -type d | xargs chmod g+rxs
198     /usr/bin/find $gcmDIR -type f | xargs chmod g+r
199     fi
200     fi
201    
202     #- change dir to $gcmDIR/verification + add link for additional experiments:
#- The job stops with exit status 1 when the directory is missing or
#- cannot be entered.
203     if test -e $gcmDIR/verification ; then
#- message only printed when the clone was not made by this job
204     if [ $checkOut -lt 2 ] ; then
205     echo " dir $gcmDIR/verification exist" ; fi
#- stop if "cd" fails ("test -e" also accepts a non-directory): the
#- "rm -rf" below and the test scripts must not run from another directory
206     cd $gcmDIR/verification || { echo "ERROR: cannot cd to $gcmDIR/verification" ; exit 1 ; }
207     for exp2add in $addExp ; do
#- remove a previous copy or link before making the new link
208     test -r $exp2add && /bin/rm -rf $exp2add
209     if test -d ../$git_other/$exp2add ; then
210     echo " add $exp2add link from $git_other"
211     ln -s ../$git_other/$exp2add .
212     else
#- a missing additional experiment is reported but is not an error
213     echo " missing dir: $git_other/$exp2add"
214     continue
215     fi
216     done
217     else
218     echo "no dir: $gcmDIR/verification => exit"
#- explicit non-zero status: a bare "exit" would return the status of the
#- echo above (0)
219     exit 1
220     fi
221    
#- First of the two testreport passes, only done when dblTr=1.
222     if [ $dblTr -eq 1 ] ; then
223     echo ''
224 jmc 1.3 #- 1) just compile ("-nr"), using "-j 2" to speed up
#- the command is first echoed to the job output, then run ; $skipExp is
#- passed as one single argument to "-skd"
225 jmc 1.1 echo ./testreport $options -of $OPTFILE -skd \'$skipExp\' \
226 jmc 1.3 -j 2 -nr -odir ${dNam}-$sfx
227 jmc 1.1 ./testreport $options -of $OPTFILE -skd "$skipExp" \
228 jmc 1.3 -j 2 -nr -odir ${dNam}-$sfx
#- NOTE(review): "-q" is added for the next pass, presumably so that it
#- reuses what was built here - confirm against the testreport options
229 jmc 1.1 options="$options -q"
230     fi
231    
232     echo ''
233     #- 2) run and report results ; also finish compiling the experiments that failed to build with "-j"
#- the command is first echoed to the job output, then run ; results are
#- sent with the "$SEND" command, using $SavD ("-sd"), to the "-a" address
234     echo ./testreport $options -of $OPTFILE -skd \'$skipExp\' \
235     -odir ${dNam}-$sfx -send \'$SEND\' -sd $SavD -a jm_c@mitgcm.org
236     ./testreport $options -of $OPTFILE -skd "$skipExp" \
237     -odir ${dNam}-$sfx -send "$SEND" -sd $SavD -a jm_c@mitgcm.org
238    
239     echo ''
240     #- 3) test restart and report results
#- the command is first echoed to the job output, then run, with the same
#- output name and the same send / address settings as testreport above
241     echo ../tools/do_tst_2+2 -mpi \
242     -o ${dNam}-$sfx -send \'$SEND\' -sd $SavD -a jm_c@mitgcm.org
243     ../tools/do_tst_2+2 -mpi \
244     -o ${dNam}-$sfx -send "$SEND" -sd $SavD -a jm_c@mitgcm.org
245    
246     # exit 0
247     # echo -n "-- SLURM_TASKS_PER_NODE= $SLURM_TASKS_PER_NODE ; " >> ${OUTP}/tracer_adj.log
248     # date >> ${OUTP}/tracer_adj.log
249     # grep 'My Processor Name' tutorial_tracer_adjsens/run/STDOUT.000? \
250     # | sed 's/tutorial_tracer_adjsens\// /' >> ${OUTP}/tracer_adj.log
251     # grep 'My Processor Name' tutorial_tracer_adjsens/tr_run.som81/STDOUT.000? \
252     # | sed 's/tutorial_tracer_adjsens\// /' >> ${OUTP}/tracer_adj.log

  ViewVC Help
Powered by ViewVC 1.1.22