| 1 | 
dimitri | 
1.1 | 
For an interactive session on Ivy Bridge nodes: | 
| 2 | 
dimitri | 
1.4 | 
qsub -I -q devel -l select=300:ncpus=20:model=ivy,walltime=02:00:00 -m abe -M email | 
| 3 | 
  | 
  | 
qsub -I -q normal -l select=103:ncpus=20:model=ivy,walltime=8:00:00 -m abe -M email | 
| 4 | 
dimitri | 
1.8 | 
qsub -I -q long -l select=300:ncpus=20:model=ivy,walltime=120:00:00 -m abe -M menemenlis@me.com | 
| 5 | 
dimitri | 
1.4 | 
qsub -I -q long -l select=103:ncpus=20:model=ivy,min_walltime=30:00,max_walltime=120:00:00 -m abe -M email | 
| 6 | 
dimitri | 
1.1 | 
 | 
| 7 | 
dimitri | 
1.7 | 
############################# | 
| 8 | 
  | 
  | 
# 60x60x10882 configuration | 
| 9 | 
  | 
  | 
 | 
| 10 | 
  | 
  | 
qsub -I -q long -l select=600:ncpus=20:model=ivy,min_walltime=30:00,max_walltime=120:00:00 -m abe -M menemenlis@me.com | 
| 11 | 
  | 
  | 
module purge | 
| 12 | 
  | 
  | 
module load  comp-intel/2012.0.032 netcdf/4.0 | 
| 13 | 
  | 
  | 
module use -a ~kjtaylor/modulefiles | 
| 14 | 
  | 
  | 
module load sles11sp3/mpt-2.10-nasa201311271217 | 
| 15 | 
  | 
  | 
cd ~/llc_2160 | 
| 16 | 
  | 
  | 
cvs co MITgcm_code | 
| 17 | 
dimitri | 
1.8 | 
cvs co MITgcm_contrib/llc_hires/llc_2160 | 
| 18 | 
dimitri | 
1.7 | 
cd MITgcm | 
| 19 | 
  | 
  | 
mkdir build run | 
| 20 | 
  | 
  | 
lfs setstripe -c -1 run | 
| 21 | 
  | 
  | 
cd build | 
| 22 | 
  | 
  | 
cp ../../MITgcm_contrib/llc_hires/llc_2160/code/SIZE.h_60x60_10882 SIZE.h | 
| 23 | 
  | 
  | 
cp ../../MITgcm_contrib/llc_hires/llc_2160/code-async/readtile_mpiio.c . | 
| 24 | 
  | 
  | 
emacs readtile_mpiio.c | 
| 25 | 
  | 
  | 
    tileSizeX = 60; | 
| 26 | 
  | 
  | 
    tileSizeY = 60; | 
| 27 | 
  | 
  | 
../tools/genmake2 -of \ | 
| 28 | 
  | 
  | 
 ../../MITgcm_contrib/llc_hires/llc_2160/code-async/linux_amd64_ifort+mpi_ice_nas -mpi -mods \ | 
| 29 | 
  | 
  | 
 '../../MITgcm_contrib/llc_hires/llc_2160/code ../../MITgcm_contrib/llc_hires/llc_2160/code-async' | 
| 30 | 
  | 
  | 
make depend | 
| 31 | 
  | 
  | 
make -j 16 | 
| 32 | 
  | 
  | 
 | 
| 33 | 
dimitri | 
1.8 | 
cd ~/llc_2160/MITgcm/run_day49_on | 
| 34 | 
dimitri | 
1.7 | 
cp ../build/mitgcmuv mitgcmuv_60x60x10882 | 
| 35 | 
  | 
  | 
ln -sf /nobackup/dmenemen/tarballs/llc_2160/run_template/* . | 
| 36 | 
  | 
  | 
ln -sf /nobackup/dmenemen/forcing/ECMWF_operational/* . | 
| 37 | 
  | 
  | 
cp ../../MITgcm_contrib/llc_hires/llc_2160/input/* . | 
| 38 | 
  | 
  | 
mv ../../MITgcm_contrib/llc_hires/llc_2160/input/data.exch2_60x60x10882 data.exch2 | 
| 39 | 
  | 
  | 
emacs data | 
| 40 | 
  | 
  | 
 | 
| 41 | 
  | 
  | 
export MPI_BUFS_PER_PROC=1024 | 
| 42 | 
  | 
  | 
export MPI_REQUEST_MAX=65536 | 
| 43 | 
  | 
  | 
export MPI_GROUP_MAX=1024 | 
| 44 | 
  | 
  | 
export MPI_NUM_MEMORY_REGIONS=8 | 
| 45 | 
  | 
  | 
export MPI_UNBUFFERED_STDIO=1 | 
| 46 | 
  | 
  | 
export MPI_MEMMAP_OFF=1 | 
| 47 | 
dimitri | 
1.8 | 
export MPI_UD_TIMEOUT=100 | 
| 48 | 
dimitri | 
1.7 | 
mpiexec -n 12000 ./mitgcmuv_60x60x10882 | 
| 49 | 
  | 
  | 
 | 
| 50 | 
  | 
  | 
tail -f STDOUT.00000 | grep advcfl_W | 
| 51 | 
  | 
  | 
 | 
| 52 | 
dimitri | 
1.1 | 
============== | 
| 53 | 
  | 
  | 
 | 
| 54 | 
dimitri | 
1.2 | 
cd ~/llc_2160 | 
| 55 | 
dimitri | 
1.1 | 
cvs co MITgcm_code | 
| 56 | 
dimitri | 
1.2 | 
cvs co MITgcm_contrib/llc_hires/llc_2160 | 
| 57 | 
dimitri | 
1.1 | 
cd MITgcm | 
| 58 | 
  | 
  | 
module purge | 
| 59 | 
dimitri | 
1.4 | 
module load comp-intel/2012.0.032 mpi-sgi/mpt.2.08r7 netcdf/4.0 | 
| 60 | 
dimitri | 
1.1 | 
mkdir build run | 
| 61 | 
dimitri | 
1.2 | 
lfs setstripe -c -1 run | 
| 62 | 
dimitri | 
1.1 | 
cd build | 
| 63 | 
dimitri | 
1.3 | 
cp ../../MITgcm_contrib/llc_hires/llc_2160/code/SIZE.h_90x90_5004 SIZE.h | 
| 64 | 
dimitri | 
1.2 | 
../tools/genmake2 -of \ | 
| 65 | 
  | 
  | 
 ../../MITgcm_contrib/llc_hires/llc_2160/code-async/linux_amd64_ifort+mpi_ice_nas -mpi -mods \ | 
| 66 | 
  | 
  | 
 '../../MITgcm_contrib/llc_hires/llc_2160/code ../../MITgcm_contrib/llc_hires/llc_2160/code-async' | 
| 67 | 
dimitri | 
1.1 | 
make depend | 
| 68 | 
  | 
  | 
make -j 16 | 
| 69 | 
dimitri | 
1.4 | 
cd ~/llc_2160/MITgcm/run | 
| 70 | 
dimitri | 
1.1 | 
ln -sf ../build/mitgcmuv . | 
| 71 | 
  | 
  | 
ln -sf /nobackup/dmenemen/tarballs/llc_2160/run_template/* . | 
| 72 | 
dimitri | 
1.2 | 
ln -sf /nobackup/dmenemen/forcing/ECMWF_operational/* . | 
| 73 | 
  | 
  | 
cp ../../MITgcm_contrib/llc_hires/llc_2160/input/* . | 
| 74 | 
dimitri | 
1.3 | 
mv data.exch2_90x90x5004 data.exch2 | 
| 75 | 
dimitri | 
1.5 | 
export MPI_NUM_MEMORY_REGIONS=256 | 
| 76 | 
dimitri | 
1.6 | 
mpiexec -n 6000 ./mitgcmuv | 
| 77 | 
dimitri | 
1.1 | 
 | 
| 78 | 
  | 
  | 
============== | 
| 79 | 
  | 
  | 
 | 
| 80 | 
  | 
  | 
look at output (MATLAB): | 
| 81 | 
  | 
  | 
 | 
| 82 | 
  | 
  | 
for ts=[0 120 600:10:980 1080:120:2280] | 
| 83 | 
  | 
  | 
    fld=quikread_llc(['Eta.' myint2str(ts,10) '.data'],2160); | 
| 84 | 
  | 
  | 
    clf,quikplot_llc(fld),caxis([-2.5 2]),thincolorbar | 
| 85 | 
  | 
  | 
    title(ts) | 
| 86 | 
  | 
  | 
    pause(.1) | 
| 87 | 
  | 
  | 
end | 
| 88 | 
  | 
  | 
 | 
| 89 | 
  | 
  | 
============== | 
| 90 | 
  | 
  | 
 | 
| 91 | 
  | 
  | 
to determine empty tiles: | 
| 92 | 
  | 
  | 
grep Empty STDOUT.* | 
| 93 | 
  | 
  | 
 | 
| 94 | 
  | 
  | 
============== | 
| 95 | 
  | 
  | 
 | 
| 96 | 
  | 
  | 
memory requirements: | 
| 97 | 
  | 
  | 
nPx  sNx sNy nSx cpu node0        total           rank0 rankm | 
| 98 | 
  | 
  | 
936  180 180   2 san node ran out of memory and crashed with singlecpuio | 
| 99 | 
  | 
  | 
1053 240 240   1 san node ran out of memory and crashed with singlecpuio | 
| 100 | 
  | 
  | 
1300 216 216   1 san node ran out of memory and crashed with singlecpuio | 
| 101 | 
  | 
  | 
1872 180 180   1 wes node ran out of memory and crashed with singlecpuio | 
| 102 | 
  | 
  | 
1872 180 180   1 wes 21,377,644kb 3,294,676,080kb node ran out of memory with singlecpuio and bigmem=true:mem=90GB for node 0 | 
| 103 | 
  | 
  | 
1872 180 180   1 san node ran out of memory and crashed with singlecpuio | 
| 104 | 
  | 
  | 
1872 180 180   1 san 11,558,588kb 1,356,676,140kb singlecpuio=.FALSE. | 
| 105 | 
  | 
  | 
2925 144 144   1 san  8,374,668kb 1,538,454,112kb 886MB 892MB singlecpuio=.FALSE. | 
| 106 | 
  | 
  | 
2925 144 144   1 san 27,284,996kb 4,942,949,704kb node ran out of memory and crashed with singlecpuio | 
| 107 | 
  | 
  | 
3328 135 135   1 san rank 0 ran out of memory | 
| 108 | 
  | 
  | 
3328 135 135   1 san some random node ran out of memory (full node for rank 0) | 
| 109 | 
  | 
  | 
4212 120 120   1 san node ran out of memory | 
| 110 | 
  | 
  | 
5200 108 108   1 san node ran out of memory | 
| 111 | 
  | 
  | 
 | 
| 112 | 
  | 
  | 
============= | 
| 113 | 
  | 
  | 
 | 
| 114 | 
  | 
  | 
2             =    2 | 
| 115 | 
  | 
  | 
3             =    3 | 
| 116 | 
  | 
  | 
2*2           =    4 | 
| 117 | 
  | 
  | 
5             =    5 | 
| 118 | 
  | 
  | 
2*3           =    6 | 
| 119 | 
  | 
  | 
2*2*2         =    8 | 
| 120 | 
  | 
  | 
3*3           =    9 | 
| 121 | 
  | 
  | 
2*5           =   10 | 
| 122 | 
  | 
  | 
2*2*3         =   12 | 
| 123 | 
  | 
  | 
3*5           =   15 | 
| 124 | 
  | 
  | 
2*2*2*2       =   16 | 
| 125 | 
  | 
  | 
2*3*3         =   18 | 
| 126 | 
  | 
  | 
2*2*5         =   20 | 
| 127 | 
  | 
  | 
2*2*2*3       =   24 | 
| 128 | 
  | 
  | 
3*3*3         =   27 | 
| 129 | 
  | 
  | 
2*3*5         =   30 | 
| 130 | 
  | 
  | 
2*2*3*3       =   36 | 
| 131 | 
  | 
  | 
2*2*2*5       =   40 | 
| 132 | 
  | 
  | 
3*3*5         =   45 | 
| 133 | 
  | 
  | 
2*2*2*2*3     =   48 * 45 | 
| 134 | 
  | 
  | 
2*3*3*3       =   54 * 40 | 
| 135 | 
  | 
  | 
2*2*3*5       =   60 * 36 | 
| 136 | 
  | 
  | 
2*2*2*3*3     =   72 * 30 | 
| 137 | 
  | 
  | 
2*2*2*2*5     =   80 * 27 | 
| 138 | 
  | 
  | 
2*3*3*5       =   90 * 24 | 
| 139 | 
  | 
  | 
2*2*3*3*3     =  108 * 20 | 
| 140 | 
  | 
  | 
2*2*2*3*5     =  120 * 18 | 
| 141 | 
  | 
  | 
3*3*3*5       =  135 * 16 | 
| 142 | 
  | 
  | 
2*2*2*2*3*3   =  144 * 15 | 
| 143 | 
  | 
  | 
2*2*3*3*5     =  180 * 12 | 
| 144 | 
  | 
  | 
2*2*2*3*3*3   =  216 * 10 | 
| 145 | 
  | 
  | 
2*2*2*2*3*5   =  240 *  9 | 
| 146 | 
  | 
  | 
2*3*3*3*5     =  270 *  8 | 
| 147 | 
  | 
  | 
2*2*2*3*3*5   =  360 *  6 | 
| 148 | 
  | 
  | 
2*2*2*2*3*3*3 =  432 *  5 | 
| 149 | 
  | 
  | 
2*2*3*3*3*5   =  540 *  4 | 
| 150 | 
  | 
  | 
2*2*2*2*3*3*5 =  720 *  3 | 
| 151 | 
  | 
  | 
2*2*2*3*3*3*5 = 1080 *  2 |