/[MITgcm]/MITgcm/tools/example_scripts/ACESgrid/check_mp2
ViewVC logotype

Contents of /MITgcm/tools/example_scripts/ACESgrid/check_mp2

Parent Directory Parent Directory | Revision Log Revision Log | View Revision Graph Revision Graph


Revision 1.1 - (show annotations) (download)
Tue Dec 14 21:34:45 2010 UTC (13 years, 4 months ago) by jmc
Branch: MAIN
CVS Tags: checkpoint62z, checkpoint62t, checkpoint62s, checkpoint62r, checkpoint62q, checkpoint62p, checkpoint62w, checkpoint62v, checkpoint62u, checkpoint63, checkpoint63d, checkpoint63e, checkpoint62y, checkpoint62x, checkpoint63a, checkpoint63b, checkpoint63c
uses "df -P ." instead of just "df ." (to work on geo cluster)

1 #!/bin/bash
2
3 # $Header: /u/gcmpack/MITgcm/tools/example_scripts/ACESgrid/aces_test_mp2_mth,v 1.2 2010/01/24 18:17:35 jmc Exp $
4 # $Name: $
5
6
7 sfx='mp2'
8 #EXE="mpiexec -pernode -comm pmi -np $NCPU ./mitgcmuv"
9 longChk=600
10 longChk=300
11 shortChk=60
12 pNam='mpiexec'
13 uNam=$USER
14 HERE=`pwd`
15 pLog="kill_$sfx.log"
16
17 echo "start $0 from $HERE at:" `date` "by user: $uNam"
18 #uNam='jmc' ; HERE='/home/jmc/test_ACES/output' ; cd $HERE
19
20 while test ! -f stop_check_$sfx
21 do
22 sleep $longChk
23 # check for defunct proc
24 nZ=`ps wauxx | grep $uNam | grep $pNam | grep '<defunct>' | wc -l`
25 if [ $nZ -ge 1 ] ; then
26 echo "found $nZ $pNam zombie processes at:" `date`
27 listZ=`ps wauxx | grep $uNam | grep $pNam | grep '<defunct>' | awk '{print $2}'`
28 sleep $shortChk
29 for p1Z in $listZ ; do
30 p2Z=`ps -f -p $p1Z | grep $pNam | grep '<defunct>' | awk '{print $2}'`
31 if test "x$p2Z" = "x$p1Z" ; then
32 #-- report to permanent log file
33 echo '--------------------' >> $pLog
34 date >> $pLog ; uname -a >> $pLog
35 ps -f -p $p1Z >> $pLog
36 #--
37 ppZ=`ps -f -p $p1Z | grep $pNam | awk '{print $3}'`
38 echo " try to kill parent proc: $ppZ at:" `date` | tee -a $pLog
39 kill -9 $ppZ
40 out=$?
41 echo " return code: $out" | tee -a $pLog
42 ps wauxx | grep $uNam | grep $pNam | tee -a $pLog
43 echo '--------------------' >> $pLog
44 else
45 echo " proc: $p1Z no more Zombie at:" `date`
46 fi
47 done
48 nZ=`ps wauxx | grep $uNam | grep $pNam | grep '<defunct>' | wc -l`
49 echo " $nZ $pNam zombie process remain at:" `date`
50 fi
51 done
52 ls -l stop_check_$sfx
53 exit

  ViewVC Help
Powered by ViewVC 1.1.22