s_ecco/text/optim.tex

\section{The line search optimisation algorithm
\label{sectionoptim}}

\subsection{General features}

The line search algorithm is based on a quasi-Newton
variable storage method which was implemented by
\cite{gil-mar:89}.

TO BE CONTINUED...

\subsection{The online vs. offline version}

\begin{itemize}
%
\item {\bf Online version} \\
Every call to {\it simul} refers to an execution of the 
forward and adjoint model.
Several iterations of optimization may thus be performed within
a single run of the main program (lsopt\_top).
The following cases may occur:
%
\begin{itemize}
\item
cold start only (no optimization)
\item
cold start, followed by one or several iterations of optimization
\item
warm start from previous cold start with one or several iterations
\item
warm start from previous warm start with one or several iterations
\end{itemize}
%
\item {\bf Offline version} \\
Every call to simul refers to a read procedure which
reads the result of a forward and adjoint run
Therefore, only one call to simul is allowed,
                     {\tt itmax = 0}, for cold start
                     {\tt itmax = 1}, for warm start
Also, at the end, {\bf x(i+1)} needs to be computed and saved
to be available for the offline model and adjoint run
\end{itemize}

In order to achieve minimum difference between the online and offline code
{\bf xdiff(i+1)} is stored to file at the end of an (offline) iteration,
but recomputed identically at the beginning of the next iteration.

\subsection{Number of iterations vs. number of simulations}

{\tt - itmax:} controls the max. number of iterations \\
{\tt - nfunc:} controls the max. number of simulations 
within one iteration

\paragraph{Summary} ~ \\
From one iteration to the next the descent direction changes.
Within one iteration more than one forward and adjoint 
run may be performed.
The updated control used as input for these simulations uses the same
descent direction, but different step sizes.

\paragraph{Description} ~ \\
From one iteration to the next the descent direction dd changes using
the result for the adjoint vector gg of the previous iteration.
In lsline the updated control
\[
\tt
xdiff(i,1) = xx(i-1) + tact(i-1,1)*dd(i-1)
\]
serves as input for
a forward and adjoint model run yielding a new {\tt gg(i,1)}.
In general, the new solution passes the 1st and 2nd Wolfe tests 
so {\tt xdiff(i,1)} represents the solution sought:
\[ 
{\tt xx(i) = xdiff(i,1)}
\]
If one of the two tests fails, 
an inter- or extrapolation is invoked to determine
a new step size {\tt tact(i-1,2)}.
If more than one function call is permitted, 
the new step size is used together
with the "old" descent direction {\tt dd(i-1)}
(i.e. dd is not updated using the new {\tt gg(i)}),
to compute a new 
\[
{\tt xdiff(i,2) = xx(i-1) + tact(i-1,2)*dd(i-1)} 
\]
that serves as input
in a new forward and adjoint run, yielding {\tt gg(i,2)}.
If now, both Wolfe tests are successfull, 
the updated solution is given by
\[
\tt
xx(i) = xdiff(i,2) = xx(i-1) + tact(i-1,2)*dd(i-1)
\]

In order to save memory both the fields dd and xdiff 
have a double usage.
%
\begin{itemize}
%
\item [{\tt xdiff}] ~\\
- in {\it lsopt\_top}: used as {\tt x(i) - x(i-1)} for Hessian update \\
- in {\it lsline}:    intermediate result for control update 
{\tt x = x + tact*dd}
%
\item [{\tt dd}] ~\\
- in {\it lsopt\_top, lsline}: descent vector, {\tt dd = -gg} 
and {\tt hessupd} \\
- in {\it dgscale}: intermediate result to compute new preconditioner
%
\end{itemize}

\paragraph{The parameter file lsopt.par}

%
\begin{itemize}
%
\item {\bf NUPDATE}
max. no. of update pairs {\tt (gg(i)-gg(i-1), xx(i)-xx(i-1))}
to be stored in {\tt OPWARMD} to estimate Hessian
[pair of current iter. is stored in 
{\tt (2*jmax+2, 2*jmax+3)}
jmax must be > 0 to access these entries]
Presently {\tt NUPDATE} must be > 0 
(i.e. iteration without reference to previous
 iterations through {\tt OPWARMD} has not been tested)
%
\item {\bf EPSX}
relative precision on xx bellow which xx should not be improved
%
\item {\bf EPSG}
relative precision on gg below which optimization is 
considered successful
%
\item {\bf IPRINT}
controls verbose (>=1) or non-verbose output
%
\item {\bf NUMITER}
max. number of iterations of optimisation;
NUMTER = 0: cold start only, no optimization
%
\item {\bf ITER\_NUM}
index of new restart file to be created (not necessarily = NUMITER!)
%
\item {\bf NFUNC}
max. no. of simulations per iteration
(must be > 0);
is used if step size {\tt tact} is inter-/extrapolated;
in this case, if NFUNC > 1, a new simulation is performed with
same gradient but "improved" step size
%
\item {\bf FMIN}
first guess cost function value
(only used as long as first iteration not completed,
i.e. for jmax <= 0)
%
\end{itemize}

\paragraph{OPWARMI, OPWARMD files}
Two files retain values of previous iterations which are
used in latest iteration to update Hessian:
\begin{itemize}
%
\item {\bf OPWARMI}: contains index settings and scalar variables

{\footnotesize
\begin{tabular}{ll}
{\tt n  = nn}      & no. of control variables \\
{\tt fc = ff}      & cost value of last iteration \\
{\tt isize}        & no. of bytes per record in OPWARMD \\
{\tt m = nupdate}  & max. no. of updates for Hessian \\
{\tt jmin, jmax}   & pointer indices for OPWARMD file (cf. below) \\
{\tt gnorm0}       & norm of first (cold start) gradient gg \\
{\tt iabsiter}     & total number of iterations with respect to cold start
\end{tabular}
}
%
\item {\bf OPWARMD}: contains vectors (control and gradient)

{\scriptsize
\begin{tabular}{cll}
entry & name & description \\
\hline
     1    & {\tt xx(i)}         & control vector of latest iteration \\
     2    & {\tt gg(i)}         & gradient of latest iteration \\
     3    & {\tt xdiff(i),diag} & preconditioning vector; (1,...,1)
for cold start \\
 2*jmax+2 & {\tt gold=g(i)-g(i-1)} & for last update (jmax) \\
 2*jmax+3 & {\tt xdiff=tact*d=xx(i)-xx(i-1)} & for last update (jmax)
\end{tabular}
}
%
\end{itemize}
%
\begin{figure}[b!]
{\footnotesize
\begin{verbatim}

Example 1: jmin = 1, jmax = 3, mupd = 5

  1   2   3   |   4   5     6   7     8   9     empty     empty
|___|___|___| | |___|___| |___|___| |___|___| |___|___| |___|___|
      0       |     1         2         3

Example 2: jmin = 3, jmax = 7, mupd = 5   ---> jmax = 2

  1   2   3   |  
|___|___|___| | |___|___| |___|___| |___|___| |___|___| |___|___|
              |     6         7         3         4         5

\end{verbatim}
}
\caption{Examples of OPWARM file handling}
\label{fig:opwarm}
\end{figure}

\paragraph{Error handling}


\newpage

\begin{figure}[b!]
\input{part8/lsopt_flow_1}
\caption{Flow chart (part 1 of 3)}
\label{fig:lsoptflow1}
\end{figure}

\begin{figure}[b!]
\input{part8/lsopt_flow_2}
\caption{Flow chart (part 2 of 3)}
\label{fig:lsoptflow2}
\end{figure}

\begin{figure}[b!]
\input{part8/lsopt_flow_3}
\caption{Flow chart (part 3 of 3)}
\label{fig:lsoptflow3}
\end{figure}

1	heimbach	1.1	\section{The line search optimisation algorithm
2			\label{sectionoptim}}
3
4			\subsection{General features}
5
6			The line search algorithm is based on a quasi-Newton
7			variable storage method which was implemented by
8			\cite{gil-mar:89}.
9
10			TO BE CONTINUED...
11
12			\subsection{The online vs. offline version}
13
14			\begin{itemize}
15			%
16			\item {\bf Online version} \\
17			Every call to {\it simul} refers to an execution of the
18			forward and adjoint model.
19			Several iterations of optimization may thus be performed within
20			a single run of the main program (lsopt\_top).
21			The following cases may occur:
22			%
23			\begin{itemize}
24			\item
25			cold start only (no optimization)
26			\item
27			cold start, followed by one or several iterations of optimization
28			\item
29			warm start from previous cold start with one or several iterations
30			\item
31			warm start from previous warm start with one or several iterations
32			\end{itemize}
33			%
34			\item {\bf Offline version} \\
35			Every call to simul refers to a read procedure which
36			reads the result of a forward and adjoint run
37			Therefore, only one call to simul is allowed,
38			{\tt itmax = 0}, for cold start
39			{\tt itmax = 1}, for warm start
40			Also, at the end, {\bf x(i+1)} needs to be computed and saved
41			to be available for the offline model and adjoint run
42			\end{itemize}
43
44			In order to achieve minimum difference between the online and offline code
45			{\bf xdiff(i+1)} is stored to file at the end of an (offline) iteration,
46			but recomputed identically at the beginning of the next iteration.
47
48			\subsection{Number of iterations vs. number of simulations}
49
50			{\tt - itmax:} controls the max. number of iterations \\
51			{\tt - nfunc:} controls the max. number of simulations
52			within one iteration
53
54			\paragraph{Summary} ~ \\
55			From one iteration to the next the descent direction changes.
56			Within one iteration more than one forward and adjoint
57			run may be performed.
58			The updated control used as input for these simulations uses the same
59			descent direction, but different step sizes.
60
61			\paragraph{Description} ~ \\
62			From one iteration to the next the descent direction dd changes using
63			the result for the adjoint vector gg of the previous iteration.
64			In lsline the updated control
65			\[
66			\tt
67			xdiff(i,1) = xx(i-1) + tact(i-1,1)*dd(i-1)
68			\]
69			serves as input for
70			a forward and adjoint model run yielding a new {\tt gg(i,1)}.
71			In general, the new solution passes the 1st and 2nd Wolfe tests
72			so {\tt xdiff(i,1)} represents the solution sought:
73			\[
74			{\tt xx(i) = xdiff(i,1)}
75			\]
76			If one of the two tests fails,
77			an inter- or extrapolation is invoked to determine
78			a new step size {\tt tact(i-1,2)}.
79			If more than one function call is permitted,
80			the new step size is used together
81			with the "old" descent direction {\tt dd(i-1)}
82			(i.e. dd is not updated using the new {\tt gg(i)}),
83			to compute a new
84			\[
85			{\tt xdiff(i,2) = xx(i-1) + tact(i-1,2)*dd(i-1)}
86			\]
87			that serves as input
88			in a new forward and adjoint run, yielding {\tt gg(i,2)}.
89			If now, both Wolfe tests are successfull,
90			the updated solution is given by
91			\[
92			\tt
93			xx(i) = xdiff(i,2) = xx(i-1) + tact(i-1,2)*dd(i-1)
94			\]
95
96			In order to save memory both the fields dd and xdiff
97			have a double usage.
98			%
99			\begin{itemize}
100			%
101			\item [{\tt xdiff}] ~\\
102			- in {\it lsopt\_top}: used as {\tt x(i) - x(i-1)} for Hessian update \\
103			- in {\it lsline}: intermediate result for control update
104			{\tt x = x + tact*dd}
105			%
106			\item [{\tt dd}] ~\\
107			- in {\it lsopt\_top, lsline}: descent vector, {\tt dd = -gg}
108			and {\tt hessupd} \\
109			- in {\it dgscale}: intermediate result to compute new preconditioner
110			%
111			\end{itemize}
112
113			\paragraph{The parameter file lsopt.par}
114
115			%
116			\begin{itemize}
117			%
118			\item {\bf NUPDATE}
119			max. no. of update pairs {\tt (gg(i)-gg(i-1), xx(i)-xx(i-1))}
120			to be stored in {\tt OPWARMD} to estimate Hessian
121			[pair of current iter. is stored in
122			{\tt (2jmax+2, 2jmax+3)}
123			jmax must be > 0 to access these entries]
124			Presently {\tt NUPDATE} must be > 0
125			(i.e. iteration without reference to previous
126			iterations through {\tt OPWARMD} has not been tested)
127			%
128			\item {\bf EPSX}
129			relative precision on xx bellow which xx should not be improved
130			%
131			\item {\bf EPSG}
132			relative precision on gg below which optimization is
133			considered successful
134			%
135			\item {\bf IPRINT}
136			controls verbose (>=1) or non-verbose output
137			%
138			\item {\bf NUMITER}
139			max. number of iterations of optimisation;
140			NUMTER = 0: cold start only, no optimization
141			%
142			\item {\bf ITER\_NUM}
143			index of new restart file to be created (not necessarily = NUMITER!)
144			%
145			\item {\bf NFUNC}
146			max. no. of simulations per iteration
147			(must be > 0);
148			is used if step size {\tt tact} is inter-/extrapolated;
149			in this case, if NFUNC > 1, a new simulation is performed with
150			same gradient but "improved" step size
151			%
152			\item {\bf FMIN}
153			first guess cost function value
154			(only used as long as first iteration not completed,
155			i.e. for jmax <= 0)
156			%
157			\end{itemize}
158
159			\paragraph{OPWARMI, OPWARMD files}
160			Two files retain values of previous iterations which are
161			used in latest iteration to update Hessian:
162			\begin{itemize}
163			%
164			\item {\bf OPWARMI}: contains index settings and scalar variables
165
166			{\footnotesize
167			\begin{tabular}{ll}
168			{\tt n = nn} & no. of control variables \\
169			{\tt fc = ff} & cost value of last iteration \\
170			{\tt isize} & no. of bytes per record in OPWARMD \\
171			{\tt m = nupdate} & max. no. of updates for Hessian \\
172			{\tt jmin, jmax} & pointer indices for OPWARMD file (cf. below) \\
173			{\tt gnorm0} & norm of first (cold start) gradient gg \\
174			{\tt iabsiter} & total number of iterations with respect to cold start
175			\end{tabular}
176			}
177			%
178			\item {\bf OPWARMD}: contains vectors (control and gradient)
179
180			{\scriptsize
181			\begin{tabular}{cll}
182			entry & name & description \\
183			\hline
184			1 & {\tt xx(i)} & control vector of latest iteration \\
185			2 & {\tt gg(i)} & gradient of latest iteration \\
186			3 & {\tt xdiff(i),diag} & preconditioning vector; (1,...,1)
187			for cold start \\
188			2*jmax+2 & {\tt gold=g(i)-g(i-1)} & for last update (jmax) \\
189			2jmax+3 & {\tt xdiff=tactd=xx(i)-xx(i-1)} & for last update (jmax)
190			\end{tabular}
191			}
192			%
193			\end{itemize}
194			%
195			\begin{figure}[b!]
196			{\footnotesize
197			\begin{verbatim}
198
199			Example 1: jmin = 1, jmax = 3, mupd = 5
200
201			1 2 3 \| 4 5 6 7 8 9 empty empty
202			\|___\|___\|___\| \| \|___\|___\| \|___\|___\| \|___\|___\| \|___\|___\| \|___\|___\|
203			0 \| 1 2 3
204
205			Example 2: jmin = 3, jmax = 7, mupd = 5 ---> jmax = 2
206
207			1 2 3 \|
208			\|___\|___\|___\| \| \|___\|___\| \|___\|___\| \|___\|___\| \|___\|___\| \|___\|___\|
209			\| 6 7 3 4 5
210
211			\end{verbatim}
212			}
213			\caption{Examples of OPWARM file handling}
214			\label{fig:opwarm}
215			\end{figure}
216
217			\paragraph{Error handling}
218
219
220
221			\newpage
222
223			\begin{figure}[b!]
224			\input{part8/lsopt_flow_1}
225			\caption{Flow chart (part 1 of 3)}
226			\label{fig:lsoptflow1}
227			\end{figure}
228
229			\begin{figure}[b!]
230			\input{part8/lsopt_flow_2}
231			\caption{Flow chart (part 2 of 3)}
232			\label{fig:lsoptflow2}
233			\end{figure}
234
235			\begin{figure}[b!]
236			\input{part8/lsopt_flow_3}
237			\caption{Flow chart (part 3 of 3)}
238			\label{fig:lsoptflow3}
239			\end{figure}
240