/[MITgcm]/MITgcm_contrib/test_scripts/engaging/test_engag_ifc_mpi
ViewVC logotype

Annotation of /MITgcm_contrib/test_scripts/engaging/test_engag_ifc_mpi

Parent Directory | Revision Log | View Revision Graph


Revision 1.5 - (hide annotations) (download)
Tue Sep 12 18:47:45 2017 UTC (7 years, 10 months ago) by jmc
Branch: MAIN
Changes since 1.4: +14 -2 lines
split compilation (using -j option) and run (without -j) in 2 steps

#!/bin/bash
#SBATCH -J tst_ifcMpi
#SBATCH -p sched_mit_hill
#SBATCH --mem-per-cpu 4000
#SBATCH -N 2
#SBATCH --tasks-per-node 4
#SBATCH -e /home/jm_c/test_engaging/output/tst_ifcMpi.stderr
#SBATCH -o /home/jm_c/test_engaging/output/tst_ifcMpi.stdout
#SBATCH --no-requeue --constraint=centos6

# $Header: /u/gcmpack/MITgcm_contrib/test_scripts/engaging/test_engag_ifc_mpi,v 1.4 2017/08/25 13:01:35 jmc Exp $
# $Name: $

#- source the environment-modules setup when it is present
#  (the "module" command is used further down in this script)
[ -f /etc/profile.d/modules.sh ] && . /etc/profile.d/modules.sh
# Note: "ulimit -s unlimited" was added in file "~/.bashrc"
#  to pass big test (the 2 fizhi-cs-* test & adjoint tests) with MPI

umask 0022
#- to get case insensitive "ls" (and order of tested experiments)
export LC_ALL="en_US.UTF-8"
echo " running on: $(hostname)"

#- locations used by the whole script
dNam='engaging'
HERE="$HOME/test_$dNam"
OUTP="$HERE/output"
SavD="$HERE/send"
SEND="ssh eofe4 $SavD/mpack"
TST_DIR="/pool001/jm_c/test_$dNam"

#- the test directory must already exist: this script does not create it
#  (the former "mkdir" logic, under /scratch/jm_c, is disabled)
if ! test -d $TST_DIR ; then
  echo "ERROR: missing directory \"$TST_DIR\""
  exit 1
fi
#- $(date) is left unquoted on purpose: its words are re-joined by echo
echo "start from TST_DIR='$TST_DIR' at: "$(date)

#- experiment selection and name suffix for this compiler/MPI combination
typ=''
skipExp=''
sfx='ifcMpi'
addExp='global_oce_cs32 global_oce_llc90'

#- load the scheduler, gcc and Intel compiler modules (in this order)
for mod in slurm gcc engaging/intel/2013.1.046 ; do
  module add $mod
done
#export MPI_INC_DIR="$MPI_HOME/include"
OPTFILE="../tools/build_options/linux_amd64_ifort+impi"
mpiCMD="mpirun -env I_MPI_DEBUG 2 -n TR_NPROC ./mitgcmuv" #- currently not used

#- base testreport options; "-j 4" is not put here but given explicitly
#  to the compile-only testreport call
options="$typ -MPI 8"
#options="-j 4 $options"
#export OMP_NUM_THREADS=2
#export KMP_SLAVE_STACK_SIZE=400m
#options="$options -gsl"
#export GSL_IEEE_MODE=double-precision,mask-underflow,mask-denormalized
ulimit -s unlimited
#- need this to get "staf" & "do_make_syntax.sh":
export PATH="$PATH:$HOME/bin"

#- every third day (day-of-month modulo 3 equal to 1) add "-ur4 -match 5";
#  "10#" forces base 10 so that days "08" and "09" are not read as octal
dAlt=$(date +%d)
dAlt=$(( 10#$dAlt % 3 ))
if [ $dAlt -eq 1 ] ; then
  options="$options -ur4 -match 5"
fi
options="$options -devel"

#- checkOut=1 : update the existing working copy before testing
checkOut=1 ; #options="$options -do"
#options="$options -nc" ; checkOut=1
#options="$options -q" ; checkOut=0

#- report when and where this job runs (goes to the job stdout file)
NSLOTS=$SLURM_NTASKS
THEDATE=$(date)
printf '%s\n' '********************************************************************************'
#- $THEDATE is left unquoted on purpose: its words are re-joined by echo
echo 'Start job '$THEDATE
echo "NSLOTS = $NSLOTS"
printf '%s\n' '======= NODELIST ==============================================================='
echo $SLURM_NODELIST
cat /etc/redhat-release
printf '%s\n' '======= env ===================================================================='
env | grep SLURM
printf '%s\n' '======= modules ================================================================'
module list 2>&1
printf '%s\n' '================================================================================'

#-
MPI_MFile="${OUTP}/mf_${sfx}" #- currently not used
#mpiCMD="mpirun -hostfile TR_MFILE -n TR_NPROC ./mitgcmuv"

#- list_job_nodes NODELIST
#  Print, one per line, the host names contained in a SLURM node list such
#  as "node[001-002]", "node[007,012]" or "nodeA,nodeB".
#  Returns 0 on success, 1 if the list cannot be expanded.
list_job_nodes() {
  local nodelist=$1 hosts prefix inside item lo hi n
  #- preferred: let SLURM expand its own compressed syntax
  if hosts=$(scontrol show hostnames "$nodelist" 2> /dev/null) \
     && test -n "$hosts" ; then
    printf '%s\n' "$hosts"
    return 0
  fi
  #- fallback (no usable scontrol): handle a single "prefix[...]" group
  #  or a plain comma-separated list of host names
  case "$nodelist" in
    *\[*\])
      prefix=${nodelist%%\[*}
      inside=${nodelist#*\[} ; inside=${inside%\]}
      case "$inside" in
        *\[*|*\]*)
          echo "list_job_nodes: cannot expand '$nodelist' without scontrol" >&2
          return 1 ;;
      esac
      for item in ${inside//,/ } ; do
        case "$item" in
          *-*)
            #- numeric range: keep the zero-padded width of the lower bound
            lo=${item%%-*} ; hi=${item#*-}
            for (( n = 10#$lo ; n <= 10#$hi ; n++ )) ; do
              printf '%s%0*d\n' "$prefix" "${#lo}" "$n"
            done ;;
          *)
            printf '%s%s\n' "$prefix" "$item" ;;
        esac
      done ;;
    *)
      for item in ${nodelist//,/ } ; do
        printf '%s\n' "$item"
      done ;;
  esac
}

#- make the testreport MPI_MFILE: the list of job nodes is written 4 times
#  (matches "--tasks-per-node 4"), i.e. 8 entries for the 2 requested nodes
if test -d "$OUTP" ; then
  /bin/rm -f "$MPI_MFile" ; touch "$MPI_MFile"
  for nc in 1 2 3 4 ; do
    list_job_nodes "$SLURM_NODELIST" >> "$MPI_MFile"
  done
else
  echo "WARNING: no dir '$OUTP' => skip writing machine file '$MPI_MFile'"
fi

#- cvs command (anonymous pserver access) and name of the working copy
cmdCVS='cvs -d :pserver:cvsanon@mitgcm.org:/u/gcmpack -q'
gcmDIR="MITgcm_$sfx"
#- everything below uses paths relative to TST_DIR (including "rm -rf" of
#  the working copy), so stop here if that directory cannot be entered
if ! cd "$TST_DIR" ; then
  echo "ERROR: cannot change to directory \"$TST_DIR\""
  exit 1
fi
#- check for disk space: relative space (99%) or absolute (10.G):
dsp=$(df -P . | tail -1 | awk '{print $5}' | sed 's/%$//')
#- guard against an unparsable "df" output: skip the check in that case
case "$dsp" in
  ''|*[!0-9]*)
    echo "WARNING: unable to get disk usage (got '$dsp') => skip disk-space check"
    dsp=0 ;;
esac
if [ "$dsp" -gt 99 ] ; then
#dsp=`df -P . | tail -1 | awk '{print $4}'`
#if [ $dsp -le 100000000 ] ; then
  echo 'Not enough space on this disk => do not run testreport.'
  df .
  #- non-zero status so that the scheduler records the job as failed
  exit 1
fi
#- checkOut=1 : clean and "cvs update" an existing working copy;
#  switch to a fresh check-out (checkOut=2) if there is none.
if [ "$checkOut" -eq 1 ] ; then
  if test -d "$gcmDIR/CVS" ; then
    echo "cleaning output from $gcmDIR/verification :"
    #- remove previous output tar files and tar & remove previous output-dir
    /bin/rm -f "$gcmDIR"/verification/??_${dNam}-${sfx}_????????_?.tar.gz
    ( cd "$gcmDIR/verification" || exit 1
      #- an unmatched pattern stays literal and is skipped by "test -d"
      for dd in ??_${dNam}-${sfx}_????????_? ; do
        if test -d "$dd" ; then
          tar -cf "${dd}.tar" "$dd" > /dev/null 2>&1 \
            && gzip "${dd}.tar" && /bin/rm -rf "$dd"
          RETVAL=$?
          if test "x$RETVAL" != x0 ; then
            echo "ERROR in tar+gzip prev outp-dir: $dd"
            echo " on '$(hostname)' (return val=$RETVAL) but continue"
          fi
        fi
      done )
    echo "clean tst_2+2 + testreport output (+ Makefile_syntax files)"
    #- do nothing at all if the directory cannot be entered, rather than
    #  running the clean-up commands (and "rm -f") somewhere else
    ( cd "$gcmDIR/verification" || exit 1
      ../tools/do_tst_2+2 -clean
      ./testreport $typ -clean
      rm -f */build/Makefile_syntax
      rm -f */build/port_rand.i */build/ptracers_set_iolabel.i )
    echo "cvs update of dir $gcmDIR :"
    #- $cmdCVS is left unquoted on purpose (command + its options)
    ( cd "$gcmDIR" && $cmdCVS update -P -d ) 2>&1
    RETVAL=$?
    if test "x$RETVAL" != x0 ; then
      echo "cvs update on '$(hostname)' fail (return val=$RETVAL) => exit"
      #- non-zero status so that the scheduler records the job as failed
      exit 1
    fi
  else
    echo "no dir: $gcmDIR/CVS => try a fresh check-out"
    checkOut=2
  fi
fi
#- checkOut=2 : remove any previous working copy and check out a new one
if [ "$checkOut" -eq 2 ] ; then
  if test -e "$gcmDIR" ; then
    echo -n "Removing working copy: $gcmDIR ..."
    rm -rf -- "$gcmDIR"
    echo " done"
  fi
  # cvs co MITgcm
  echo "Downloading using '$cmdCVS co -P -d $gcmDIR MITgcm' ..."
  #- $cmdCVS is left unquoted on purpose (command + its options)
  $cmdCVS co -P -d "$gcmDIR" MITgcm > /dev/null
  RETVAL=$?
  if test "x$RETVAL" != x0 ; then
    echo "cvs co on '$(hostname)' fail (return val=$RETVAL) => exit"
    #- non-zero status so that the scheduler records the job as failed
    exit 1
  else
    echo " done"
  fi
  if test -d "$gcmDIR/verification" ; then
    #- give the group read access (+ search & set-group-ID on directories);
    #  "-exec ... {} +" copes with any file name and with an empty result
    /usr/bin/find "$gcmDIR" -type d -exec chmod g+rxs {} +
    /usr/bin/find "$gcmDIR" -type f -exec chmod g+r {} +
  fi
fi

# -change dir to $gcmDIR/verification dir + add additional experiments:
if ! test -e "$gcmDIR/verification" ; then
  echo "no dir: $gcmDIR/verification => exit"
  #- non-zero status so that the scheduler records the job as failed
  exit 1
fi
if [ "$checkOut" -lt 2 ] ; then
  echo " dir $gcmDIR/verification exist"
fi
if ! cd "$gcmDIR/verification" ; then
  echo "ERROR: cannot change to dir $gcmDIR/verification => exit"
  exit 1
fi
#- $addExp is left unquoted on purpose: it is a blank-separated list
for exp2add in $addExp ; do
  if test -d "${exp2add}/CVS" ; then
    echo " assumes dir: $exp2add has been updated"
    continue
  fi
  test -r "$exp2add" && /bin/rm -rf "$exp2add"
  echo " add dir: $exp2add (from Contrib:verification_other)"
  if ! ( $cmdCVS co -P -d "$exp2add" \
           "MITgcm_contrib/verification_other/$exp2add" > /dev/null ) \
     || ! test -d "$exp2add" ; then
    #- without the experiment dir, the links below would be created in
    #  the wrong place: skip this experiment instead
    echo " ERROR: check-out of $exp2add failed => skip this experiment"
    continue
  fi
  #- link the input data that each experiment takes from "other_input"
  case "$exp2add" in
    global_oce_cs32)
      echo " link dir 'other_input/core2_cnyf' in here"
      ( cd "$exp2add" && ln -s ../../../other_input/core2_cnyf . )
      ;;
    global_oce_llc90)
      echo " link dir 'other_input/gael_oce_llc90_input' to 'input_fields'"
      ( cd "$exp2add" && ln -s ../../../other_input/gael_oce_llc90_input input_fields )
      echo " link dirs: 'core2_cnyf' & 'global_oce_input_fields/*' in input_verifs"
      ( test -e "$exp2add/input_verifs" || mkdir "$exp2add/input_verifs"
        cd "$exp2add/input_verifs" || exit 1
        ln -s ../../../../other_input/core2_cnyf .
        ln -s ../../../../other_input/global_oce_input_fields/* . )
      ;;
  esac
  #- give the group read access (+ search & set-group-ID on directories)
  /usr/bin/find "$exp2add" -type d -exec chmod g+rxs {} +
  /usr/bin/find "$exp2add" -type f -exec chmod g+r {} +
done

#- pieces shared by the commands below; $trBase is always expanded unquoted
#  so that it splits into the command and its individual options
trBase="./testreport $options -of $OPTFILE"
outDir="${dNam}-$sfx"
mailTo='jmc@dev.mitgcm.org'

echo ''
#- 0) just make all module header ( *__genmod.mod files) using modified Makefile
echo $trBase -nc -repl_mk do_make_syntax.sh -obj -dd
$trBase -nc -repl_mk do_make_syntax.sh -obj -dd

echo ''
#- 1) just compile ("-nr"), using "-j 4" to speed up
echo $trBase -j 4 -nr -q -odir $outDir
$trBase -j 4 -nr -q -odir $outDir
#- count the lines of tr_out.txt matching '^Y . N N '
nFc=$(grep -c '^Y . N N ' tr_out.txt)
echo " <= fail to compile $nFc experiments"

echo ''
#- 2) run and report results ; also finish to compile those who failed with "-j"
#echo ./testreport $options -of $OPTFILE -command \'$mpiCMD\' -mf $MPI_MFile \
#./testreport $options -of $OPTFILE -command "$mpiCMD" -mf $MPI_MFile \
echo $trBase -q -odir $outDir -send \'$SEND\' -sd $SavD -a $mailTo
$trBase -q -odir $outDir -send "$SEND" -sd $SavD -a $mailTo

echo ''
#- 3) test restart and report results
#echo ../tools/do_tst_2+2 -mpi -exe \'$mpiCMD\' -mf $MPI_MFile \
#../tools/do_tst_2+2 -mpi -exe "$mpiCMD" -mf $MPI_MFile \
echo ../tools/do_tst_2+2 -mpi -o $outDir -send \'$SEND\' -sd $SavD -a $mailTo
../tools/do_tst_2+2 -mpi -o $outDir -send "$SEND" -sd $SavD -a $mailTo


  ViewVC Help
Powered by ViewVC 1.1.22