xref: /petsc/src/tao/unconstrained/impls/ntr/ntr.c (revision 3c9e27cfca911a7d7e3219758be42726e83c4ab2)
1f89ca46fSSatish Balay #include "../src/tao/matrix/lmvmmat.h"
2a7e14dcfSSatish Balay #include "ntr.h"
3a7e14dcfSSatish Balay 
4a7e14dcfSSatish Balay #include "petscksp.h"
5a7e14dcfSSatish Balay #include "petscpc.h"
6a7e14dcfSSatish Balay #include "petsc-private/kspimpl.h"
7a7e14dcfSSatish Balay #include "petsc-private/pcimpl.h"
8a7e14dcfSSatish Balay /* Values of tr->ksp_type: TaoSolve_NTR sets KSPNASH or KSPSTCG for the first two and KSPGLTR for anything else; NTR_KSP_TYPES equals the number of values listed */
9a7e14dcfSSatish Balay #define NTR_KSP_NASH    0
10a7e14dcfSSatish Balay #define NTR_KSP_STCG    1
11a7e14dcfSSatish Balay #define NTR_KSP_GLTR    2
12a7e14dcfSSatish Balay #define NTR_KSP_TYPES   3
13a7e14dcfSSatish Balay /* Values of tr->pc_type: NONE -> PCNONE, AHESS -> PCJACOBI with PCJacobiSetUseAbs, BFGS -> PCSHELL applying MatLMVMSolveShell, PETSC -> PC left as already configured */
14a7e14dcfSSatish Balay #define NTR_PC_NONE	0
15a7e14dcfSSatish Balay #define NTR_PC_AHESS    1
16a7e14dcfSSatish Balay #define NTR_PC_BFGS     2
17a7e14dcfSSatish Balay #define NTR_PC_PETSC    3
18a7e14dcfSSatish Balay #define NTR_PC_TYPES    4
19a7e14dcfSSatish Balay /* Values of tr->bfgs_scale_type: with AHESS the solver sets the LMVM scale from the reciprocal of the absolute Hessian diagonal each outer iteration; with BFGS no diagonal vector is created */
20a7e14dcfSSatish Balay #define BFGS_SCALE_AHESS   0
21a7e14dcfSSatish Balay #define BFGS_SCALE_BFGS    1
22a7e14dcfSSatish Balay #define BFGS_SCALE_TYPES   2
23a7e14dcfSSatish Balay /* Values of tr->init_type: CONSTANT keeps the clamped tao->trust0, INTERPOLATION probes along the negative gradient, any other value (DIRECTION) zeroes the radius so the norm of the first direction sets it */
24a7e14dcfSSatish Balay #define NTR_INIT_CONSTANT	  0
25a7e14dcfSSatish Balay #define NTR_INIT_DIRECTION	  1
26a7e14dcfSSatish Balay #define NTR_INIT_INTERPOLATION	  2
27a7e14dcfSSatish Balay #define NTR_INIT_TYPES		  3
28a7e14dcfSSatish Balay /* Values of tr->update_type: REDUCTION updates the radius from kappa = actred/prered against eta1..eta4; any other value (INTERPOLATION) uses the tau_1/tau_2 interpolation branch */
29a7e14dcfSSatish Balay #define NTR_UPDATE_REDUCTION      0
30a7e14dcfSSatish Balay #define NTR_UPDATE_INTERPOLATION  1
31a7e14dcfSSatish Balay #define NTR_UPDATE_TYPES          2
32a7e14dcfSSatish Balay /* Names for the NTR_KSP_* values, in the same order as the #define values; only the first 3 of 64 slots are initialized. NOTE(review): presumably used for option parsing - consumer not visible here */
33a7e14dcfSSatish Balay static const char *NTR_KSP[64] = {
34a7e14dcfSSatish Balay   "nash", "stcg", "gltr"
35a7e14dcfSSatish Balay };
36a7e14dcfSSatish Balay /* Names for the NTR_PC_* values, in the same order as the #define values */
37a7e14dcfSSatish Balay static const char *NTR_PC[64] = {
38a7e14dcfSSatish Balay   "none", "ahess", "bfgs", "petsc"
39a7e14dcfSSatish Balay };
40a7e14dcfSSatish Balay /* Names for the BFGS_SCALE_* values, in the same order as the #define values */
41a7e14dcfSSatish Balay static const char *BFGS_SCALE[64] = {
42a7e14dcfSSatish Balay   "ahess", "bfgs"
43a7e14dcfSSatish Balay };
44a7e14dcfSSatish Balay /* Names for the NTR_INIT_* values, in the same order as the #define values */
45a7e14dcfSSatish Balay static const char *NTR_INIT[64] = {
46a7e14dcfSSatish Balay   "constant", "direction", "interpolation"
47a7e14dcfSSatish Balay };
48a7e14dcfSSatish Balay /* Names for the NTR_UPDATE_* values, in the same order as the #define values */
49a7e14dcfSSatish Balay static const char *NTR_UPDATE[64] = {
50a7e14dcfSSatish Balay   "reduction", "interpolation"
51a7e14dcfSSatish Balay };
52a7e14dcfSSatish Balay 
53a7e14dcfSSatish Balay /*  Routine for BFGS preconditioner: TaoSolve_NTR installs it with PCShellSetApply() on a PCSHELL whose context is tr->M; the definition is not in this part of the file */
54a7e14dcfSSatish Balay static PetscErrorCode MatLMVMSolveShell(PC pc, Vec xin, Vec xout);
55a7e14dcfSSatish Balay 
56a7e14dcfSSatish Balay /*
57a7e14dcfSSatish Balay    TaoSolve_NTR - Implements Newton's Method with a trust region approach
58a7e14dcfSSatish Balay    for solving unconstrained minimization problems.
59a7e14dcfSSatish Balay 
60a7e14dcfSSatish Balay    The basic algorithm is taken from MINPACK-2 (dstrn).
61a7e14dcfSSatish Balay 
62a7e14dcfSSatish Balay    TaoSolve_NTR computes a local minimizer of a twice differentiable function
63a7e14dcfSSatish Balay    f by applying a trust region variant of Newton's method.  At each stage
64a7e14dcfSSatish Balay    of the algorithm, we use the preconditioned conjugate gradient method to
65a7e14dcfSSatish Balay    determine an approximate minimizer of the quadratic model
66a7e14dcfSSatish Balay 
67a7e14dcfSSatish Balay         q(s) = <g, s> + 0.5 * <s, Hs>
68a7e14dcfSSatish Balay 
69a7e14dcfSSatish Balay    subject to the trust region constraint
70a7e14dcfSSatish Balay 
71a7e14dcfSSatish Balay         || s ||_M <= radius,
72a7e14dcfSSatish Balay 
73a7e14dcfSSatish Balay    where radius is the trust region radius and M is a symmetric positive
74a7e14dcfSSatish Balay    definite matrix (the preconditioner).  Here g is the gradient and H
75a7e14dcfSSatish Balay    is the Hessian matrix.
76a7e14dcfSSatish Balay 
77a7e14dcfSSatish Balay    Note:  TaoSolve_NTR MUST use the iterative solver KSPNASH, KSPSTCG,
78a7e14dcfSSatish Balay           or KSPGLTR.  Thus, we set KSPNASH, KSPSTCG, or KSPGLTR in this
79a7e14dcfSSatish Balay           routine regardless of what the user may have previously specified.
80a7e14dcfSSatish Balay */
81a7e14dcfSSatish Balay #undef __FUNCT__
82a7e14dcfSSatish Balay #define __FUNCT__ "TaoSolve_NTR"
83a7e14dcfSSatish Balay static PetscErrorCode TaoSolve_NTR(TaoSolver tao)
84a7e14dcfSSatish Balay {
85a7e14dcfSSatish Balay   TAO_NTR *tr = (TAO_NTR *)tao->data;
86a7e14dcfSSatish Balay 
87a7e14dcfSSatish Balay   PC pc;
88a7e14dcfSSatish Balay 
89a7e14dcfSSatish Balay   KSPConvergedReason ksp_reason;
90a7e14dcfSSatish Balay   TaoSolverTerminationReason reason;
91a7e14dcfSSatish Balay 
92a7e14dcfSSatish Balay   MatStructure matflag;
93a7e14dcfSSatish Balay 
94a7e14dcfSSatish Balay   PetscReal fmin, ftrial, prered, actred, kappa, sigma, beta;
95a7e14dcfSSatish Balay   PetscReal tau, tau_1, tau_2, tau_max, tau_min, max_radius;
96a7e14dcfSSatish Balay   PetscReal f, gnorm;
97a7e14dcfSSatish Balay 
98a7e14dcfSSatish Balay   PetscReal delta;
99a7e14dcfSSatish Balay   PetscReal norm_d;
100a7e14dcfSSatish Balay   PetscErrorCode ierr;
101a7e14dcfSSatish Balay 
102a7e14dcfSSatish Balay   PetscInt iter = 0;
103a7e14dcfSSatish Balay   PetscInt bfgsUpdates = 0;
104a7e14dcfSSatish Balay   PetscInt needH;
105a7e14dcfSSatish Balay 
106a7e14dcfSSatish Balay   PetscInt i_max = 5;
107a7e14dcfSSatish Balay   PetscInt j_max = 1;
108a7e14dcfSSatish Balay   PetscInt i, j, N, n, its;
109a7e14dcfSSatish Balay 
110a7e14dcfSSatish Balay   PetscFunctionBegin;
111a7e14dcfSSatish Balay 
112a7e14dcfSSatish Balay   if (tao->XL || tao->XU || tao->ops->computebounds) {
113a7e14dcfSSatish Balay     ierr = PetscPrintf(((PetscObject)tao)->comm,"WARNING: Variable bounds have been set but will be ignored by ntr algorithm\n"); CHKERRQ(ierr);
114a7e14dcfSSatish Balay   }
115a7e14dcfSSatish Balay 
116a7e14dcfSSatish Balay   tao->trust = tao->trust0;
117a7e14dcfSSatish Balay 
118a7e14dcfSSatish Balay   /* Modify the radius if it is too large or small */
119a7e14dcfSSatish Balay   tao->trust = PetscMax(tao->trust, tr->min_radius);
120a7e14dcfSSatish Balay   tao->trust = PetscMin(tao->trust, tr->max_radius);
121a7e14dcfSSatish Balay 
122a7e14dcfSSatish Balay 
123a7e14dcfSSatish Balay   if (NTR_PC_BFGS == tr->pc_type && !tr->M) {
124a7e14dcfSSatish Balay     ierr = VecGetLocalSize(tao->solution,&n); CHKERRQ(ierr);
125a7e14dcfSSatish Balay     ierr = VecGetSize(tao->solution,&N); CHKERRQ(ierr);
126a7e14dcfSSatish Balay     ierr = MatCreateLMVM(((PetscObject)tao)->comm,n,N,&tr->M); CHKERRQ(ierr);
127a7e14dcfSSatish Balay     ierr = MatLMVMAllocateVectors(tr->M,tao->solution); CHKERRQ(ierr);
128a7e14dcfSSatish Balay   }
129a7e14dcfSSatish Balay 
130a7e14dcfSSatish Balay   /* Check convergence criteria */
131a7e14dcfSSatish Balay   ierr = TaoComputeObjectiveAndGradient(tao, tao->solution, &f, tao->gradient); CHKERRQ(ierr);
132a7e14dcfSSatish Balay   ierr = VecNorm(tao->gradient,NORM_2,&gnorm); CHKERRQ(ierr);
133a7e14dcfSSatish Balay   if (PetscIsInfOrNanReal(f) || PetscIsInfOrNanReal(gnorm)) {
134a7e14dcfSSatish Balay     SETERRQ(PETSC_COMM_SELF,1, "User provided compute function generated Inf or NaN");
135a7e14dcfSSatish Balay   }
136a7e14dcfSSatish Balay   needH = 1;
137a7e14dcfSSatish Balay 
138a7e14dcfSSatish Balay   ierr = TaoMonitor(tao, iter, f, gnorm, 0.0, 1.0, &reason); CHKERRQ(ierr);
139a7e14dcfSSatish Balay   if (reason != TAO_CONTINUE_ITERATING) {
140a7e14dcfSSatish Balay     PetscFunctionReturn(0);
141a7e14dcfSSatish Balay   }
142a7e14dcfSSatish Balay 
143a7e14dcfSSatish Balay   /* Create vectors for the limited memory preconditioner */
144a7e14dcfSSatish Balay   if ((NTR_PC_BFGS == tr->pc_type) &&
145a7e14dcfSSatish Balay       (BFGS_SCALE_BFGS != tr->bfgs_scale_type)) {
146a7e14dcfSSatish Balay     if (!tr->Diag) {
147a7e14dcfSSatish Balay 	ierr = VecDuplicate(tao->solution, &tr->Diag); CHKERRQ(ierr);
148a7e14dcfSSatish Balay     }
149a7e14dcfSSatish Balay   }
150a7e14dcfSSatish Balay 
151a7e14dcfSSatish Balay   switch(tr->ksp_type) {
152a7e14dcfSSatish Balay   case NTR_KSP_NASH:
153a7e14dcfSSatish Balay     ierr = KSPSetType(tao->ksp, KSPNASH); CHKERRQ(ierr);
154a7e14dcfSSatish Balay     if (tao->ksp->ops->setfromoptions) {
155a7e14dcfSSatish Balay       (*tao->ksp->ops->setfromoptions)(tao->ksp);
156a7e14dcfSSatish Balay     }
157a7e14dcfSSatish Balay     break;
158a7e14dcfSSatish Balay 
159a7e14dcfSSatish Balay   case NTR_KSP_STCG:
160a7e14dcfSSatish Balay     ierr = KSPSetType(tao->ksp, KSPSTCG); CHKERRQ(ierr);
161a7e14dcfSSatish Balay     if (tao->ksp->ops->setfromoptions) {
162a7e14dcfSSatish Balay       (*tao->ksp->ops->setfromoptions)(tao->ksp);
163a7e14dcfSSatish Balay     }
164a7e14dcfSSatish Balay     break;
165a7e14dcfSSatish Balay 
166a7e14dcfSSatish Balay   default:
167a7e14dcfSSatish Balay     ierr = KSPSetType(tao->ksp, KSPGLTR); CHKERRQ(ierr);
168a7e14dcfSSatish Balay     if (tao->ksp->ops->setfromoptions) {
169a7e14dcfSSatish Balay       (*tao->ksp->ops->setfromoptions)(tao->ksp);
170a7e14dcfSSatish Balay     }
171a7e14dcfSSatish Balay     break;
172a7e14dcfSSatish Balay   }
173a7e14dcfSSatish Balay 
174a7e14dcfSSatish Balay   /*  Modify the preconditioner to use the bfgs approximation */
175a7e14dcfSSatish Balay   ierr = KSPGetPC(tao->ksp, &pc); CHKERRQ(ierr);
176a7e14dcfSSatish Balay   switch(tr->pc_type) {
177a7e14dcfSSatish Balay   case NTR_PC_NONE:
178a7e14dcfSSatish Balay     ierr = PCSetType(pc, PCNONE); CHKERRQ(ierr);
179a7e14dcfSSatish Balay     if (pc->ops->setfromoptions) {
180a7e14dcfSSatish Balay       (*pc->ops->setfromoptions)(pc);
181a7e14dcfSSatish Balay     }
182a7e14dcfSSatish Balay     break;
183a7e14dcfSSatish Balay 
184a7e14dcfSSatish Balay   case NTR_PC_AHESS:
185a7e14dcfSSatish Balay     ierr = PCSetType(pc, PCJACOBI); CHKERRQ(ierr);
186a7e14dcfSSatish Balay     if (pc->ops->setfromoptions) {
187a7e14dcfSSatish Balay       (*pc->ops->setfromoptions)(pc);
188a7e14dcfSSatish Balay     }
189a7e14dcfSSatish Balay     ierr = PCJacobiSetUseAbs(pc); CHKERRQ(ierr);
190a7e14dcfSSatish Balay     break;
191a7e14dcfSSatish Balay 
192a7e14dcfSSatish Balay   case NTR_PC_BFGS:
193a7e14dcfSSatish Balay     ierr = PCSetType(pc, PCSHELL); CHKERRQ(ierr);
194a7e14dcfSSatish Balay     if (pc->ops->setfromoptions) {
195a7e14dcfSSatish Balay       (*pc->ops->setfromoptions)(pc);
196a7e14dcfSSatish Balay     }
197a7e14dcfSSatish Balay     ierr = PCShellSetName(pc, "bfgs"); CHKERRQ(ierr);
198a7e14dcfSSatish Balay     ierr = PCShellSetContext(pc, tr->M); CHKERRQ(ierr);
199a7e14dcfSSatish Balay     ierr = PCShellSetApply(pc, MatLMVMSolveShell); CHKERRQ(ierr);
200a7e14dcfSSatish Balay     break;
201a7e14dcfSSatish Balay 
202a7e14dcfSSatish Balay   default:
203a7e14dcfSSatish Balay     /*  Use the pc method set by pc_type */
204a7e14dcfSSatish Balay     break;
205a7e14dcfSSatish Balay   }
206a7e14dcfSSatish Balay 
207a7e14dcfSSatish Balay   /*  Initialize trust-region radius */
208a7e14dcfSSatish Balay   switch(tr->init_type) {
209a7e14dcfSSatish Balay   case NTR_INIT_CONSTANT:
210a7e14dcfSSatish Balay     /*  Use the initial radius specified */
211a7e14dcfSSatish Balay     break;
212a7e14dcfSSatish Balay 
213a7e14dcfSSatish Balay   case NTR_INIT_INTERPOLATION:
214a7e14dcfSSatish Balay     /*  Use the initial radius specified */
215a7e14dcfSSatish Balay     max_radius = 0.0;
216a7e14dcfSSatish Balay 
217a7e14dcfSSatish Balay     for (j = 0; j < j_max; ++j) {
218a7e14dcfSSatish Balay       fmin = f;
219a7e14dcfSSatish Balay       sigma = 0.0;
220a7e14dcfSSatish Balay 
221a7e14dcfSSatish Balay       if (needH) {
222a7e14dcfSSatish Balay 	  ierr = TaoComputeHessian(tao, tao->solution, &tao->hessian, &tao->hessian_pre, &matflag); CHKERRQ(ierr);
223a7e14dcfSSatish Balay         needH = 0;
224a7e14dcfSSatish Balay       }
225a7e14dcfSSatish Balay 
226a7e14dcfSSatish Balay       for (i = 0; i < i_max; ++i) {
227a7e14dcfSSatish Balay 
228a7e14dcfSSatish Balay         ierr = VecCopy(tao->solution, tr->W); CHKERRQ(ierr);
229a7e14dcfSSatish Balay 	ierr = VecAXPY(tr->W, -tao->trust/gnorm, tao->gradient); CHKERRQ(ierr);
230a7e14dcfSSatish Balay 	ierr = TaoComputeObjective(tao, tr->W, &ftrial); CHKERRQ(ierr);
231a7e14dcfSSatish Balay 
232a7e14dcfSSatish Balay         if (PetscIsInfOrNanReal(ftrial)) {
233a7e14dcfSSatish Balay 	  tau = tr->gamma1_i;
234a7e14dcfSSatish Balay         }
235a7e14dcfSSatish Balay         else {
236a7e14dcfSSatish Balay 	  if (ftrial < fmin) {
237a7e14dcfSSatish Balay             fmin = ftrial;
238a7e14dcfSSatish Balay             sigma = -tao->trust / gnorm;
239a7e14dcfSSatish Balay           }
240a7e14dcfSSatish Balay 
241a7e14dcfSSatish Balay 	  ierr = MatMult(tao->hessian, tao->gradient, tao->stepdirection); CHKERRQ(ierr);
242a7e14dcfSSatish Balay 	  ierr = VecDot(tao->gradient, tao->stepdirection, &prered); CHKERRQ(ierr);
243a7e14dcfSSatish Balay 
244a7e14dcfSSatish Balay           prered = tao->trust * (gnorm - 0.5 * tao->trust * prered / (gnorm * gnorm));
245a7e14dcfSSatish Balay           actred = f - ftrial;
246a7e14dcfSSatish Balay 	  if ((PetscAbsScalar(actred) <= tr->epsilon) &&
247a7e14dcfSSatish Balay               (PetscAbsScalar(prered) <= tr->epsilon)) {
248a7e14dcfSSatish Balay 	    kappa = 1.0;
249a7e14dcfSSatish Balay 	  }
250a7e14dcfSSatish Balay 	  else {
251a7e14dcfSSatish Balay 	    kappa = actred / prered;
252a7e14dcfSSatish Balay 	  }
253a7e14dcfSSatish Balay 
254a7e14dcfSSatish Balay 	  tau_1 = tr->theta_i * gnorm * tao->trust / (tr->theta_i * gnorm * tao->trust + (1.0 - tr->theta_i) * prered - actred);
255a7e14dcfSSatish Balay           tau_2 = tr->theta_i * gnorm * tao->trust / (tr->theta_i * gnorm * tao->trust - (1.0 + tr->theta_i) * prered + actred);
256a7e14dcfSSatish Balay 	  tau_min = PetscMin(tau_1, tau_2);
257a7e14dcfSSatish Balay 	  tau_max = PetscMax(tau_1, tau_2);
258a7e14dcfSSatish Balay 
259a7e14dcfSSatish Balay 	  if (PetscAbsScalar(kappa - 1.0) <= tr->mu1_i) {
260a7e14dcfSSatish Balay 	    /*  Great agreement */
261a7e14dcfSSatish Balay             max_radius = PetscMax(max_radius, tao->trust);
262a7e14dcfSSatish Balay 
263a7e14dcfSSatish Balay 	    if (tau_max < 1.0) {
264a7e14dcfSSatish Balay               tau = tr->gamma3_i;
265a7e14dcfSSatish Balay             }
266a7e14dcfSSatish Balay             else if (tau_max > tr->gamma4_i) {
267a7e14dcfSSatish Balay               tau = tr->gamma4_i;
268a7e14dcfSSatish Balay             }
269a7e14dcfSSatish Balay             else {
270a7e14dcfSSatish Balay               tau = tau_max;
271a7e14dcfSSatish Balay             }
272a7e14dcfSSatish Balay           }
273a7e14dcfSSatish Balay           else if (PetscAbsScalar(kappa - 1.0) <= tr->mu2_i) {
274a7e14dcfSSatish Balay 	    /*  Good agreement */
275a7e14dcfSSatish Balay             max_radius = PetscMax(max_radius, tao->trust);
276a7e14dcfSSatish Balay 
277a7e14dcfSSatish Balay 	    if (tau_max < tr->gamma2_i) {
278a7e14dcfSSatish Balay               tau = tr->gamma2_i;
279a7e14dcfSSatish Balay             }
280a7e14dcfSSatish Balay             else if (tau_max > tr->gamma3_i) {
281a7e14dcfSSatish Balay               tau = tr->gamma3_i;
282a7e14dcfSSatish Balay             }
283a7e14dcfSSatish Balay             else {
284a7e14dcfSSatish Balay               tau = tau_max;
285a7e14dcfSSatish Balay             }
286a7e14dcfSSatish Balay           }
287a7e14dcfSSatish Balay           else {
288a7e14dcfSSatish Balay 	    /*  Not good agreement */
289a7e14dcfSSatish Balay 	    if (tau_min > 1.0) {
290a7e14dcfSSatish Balay 	      tau = tr->gamma2_i;
291a7e14dcfSSatish Balay             }
292a7e14dcfSSatish Balay             else if (tau_max < tr->gamma1_i) {
293a7e14dcfSSatish Balay               tau = tr->gamma1_i;
294a7e14dcfSSatish Balay             }
295a7e14dcfSSatish Balay 	    else if ((tau_min < tr->gamma1_i) && (tau_max >= 1.0)) {
296a7e14dcfSSatish Balay 	      tau = tr->gamma1_i;
297a7e14dcfSSatish Balay             }
298a7e14dcfSSatish Balay 	    else if ((tau_1 >= tr->gamma1_i) && (tau_1 < 1.0) &&
299a7e14dcfSSatish Balay                      ((tau_2 < tr->gamma1_i) || (tau_2 >= 1.0))) {
300a7e14dcfSSatish Balay               tau = tau_1;
301a7e14dcfSSatish Balay             }
302a7e14dcfSSatish Balay 	    else if ((tau_2 >= tr->gamma1_i) && (tau_2 < 1.0) &&
303a7e14dcfSSatish Balay                      ((tau_1 < tr->gamma1_i) || (tau_2 >= 1.0))) {
304a7e14dcfSSatish Balay               tau = tau_2;
305a7e14dcfSSatish Balay             }
306a7e14dcfSSatish Balay             else {
307a7e14dcfSSatish Balay               tau = tau_max;
308a7e14dcfSSatish Balay             }
309a7e14dcfSSatish Balay           }
310a7e14dcfSSatish Balay         }
311a7e14dcfSSatish Balay         tao->trust = tau * tao->trust;
312a7e14dcfSSatish Balay       }
313a7e14dcfSSatish Balay 
314a7e14dcfSSatish Balay       if (fmin < f) {
315a7e14dcfSSatish Balay         f = fmin;
316a7e14dcfSSatish Balay 	ierr = VecAXPY(tao->solution, sigma, tao->gradient); CHKERRQ(ierr);
317a7e14dcfSSatish Balay 	ierr = TaoComputeGradient(tao,tao->solution, tao->gradient); CHKERRQ(ierr);
318a7e14dcfSSatish Balay 
319a7e14dcfSSatish Balay 	ierr = VecNorm(tao->gradient, NORM_2, &gnorm); CHKERRQ(ierr);
320a7e14dcfSSatish Balay 
321a7e14dcfSSatish Balay         if (PetscIsInfOrNanReal(f) || PetscIsInfOrNanReal(gnorm)) {
322a7e14dcfSSatish Balay           SETERRQ(PETSC_COMM_SELF,1, "User provided compute function generated Inf or NaN");
323a7e14dcfSSatish Balay         }
324a7e14dcfSSatish Balay         needH = 1;
325a7e14dcfSSatish Balay 
326a7e14dcfSSatish Balay         ierr = TaoMonitor(tao, iter, f, gnorm, 0.0, 1.0, &reason); CHKERRQ(ierr);
327a7e14dcfSSatish Balay         if (reason != TAO_CONTINUE_ITERATING) {
328a7e14dcfSSatish Balay           PetscFunctionReturn(0);
329a7e14dcfSSatish Balay         }
330a7e14dcfSSatish Balay       }
331a7e14dcfSSatish Balay     }
332a7e14dcfSSatish Balay     tao->trust = PetscMax(tao->trust, max_radius);
333a7e14dcfSSatish Balay 
334a7e14dcfSSatish Balay     /*  Modify the radius if it is too large or small */
335a7e14dcfSSatish Balay     tao->trust = PetscMax(tao->trust, tr->min_radius);
336a7e14dcfSSatish Balay     tao->trust = PetscMin(tao->trust, tr->max_radius);
337a7e14dcfSSatish Balay     break;
338a7e14dcfSSatish Balay 
339a7e14dcfSSatish Balay   default:
340a7e14dcfSSatish Balay     /*  Norm of the first direction will initialize radius */
341a7e14dcfSSatish Balay     tao->trust = 0.0;
342a7e14dcfSSatish Balay     break;
343a7e14dcfSSatish Balay   }
344a7e14dcfSSatish Balay 
345a7e14dcfSSatish Balay   /* Set initial scaling for the BFGS preconditioner
346a7e14dcfSSatish Balay      This step is done after computing the initial trust-region radius
347a7e14dcfSSatish Balay      since the function value may have decreased */
348a7e14dcfSSatish Balay   if (NTR_PC_BFGS == tr->pc_type) {
349a7e14dcfSSatish Balay     if (f != 0.0) {
350a7e14dcfSSatish Balay       delta = 2.0 * PetscAbsScalar(f) / (gnorm*gnorm);
351a7e14dcfSSatish Balay     }
352a7e14dcfSSatish Balay     else {
353a7e14dcfSSatish Balay       delta = 2.0 / (gnorm*gnorm);
354a7e14dcfSSatish Balay     }
355a7e14dcfSSatish Balay     ierr = MatLMVMSetDelta(tr->M,delta); CHKERRQ(ierr);
356a7e14dcfSSatish Balay   }
357a7e14dcfSSatish Balay 
358a7e14dcfSSatish Balay   /* Have not converged; continue with Newton method */
359a7e14dcfSSatish Balay   while (reason == TAO_CONTINUE_ITERATING) {
360a7e14dcfSSatish Balay     ++iter;
361a7e14dcfSSatish Balay 
362a7e14dcfSSatish Balay     /* Compute the Hessian */
363a7e14dcfSSatish Balay     if (needH) {
364a7e14dcfSSatish Balay       ierr = TaoComputeHessian(tao, tao->solution, &tao->hessian, &tao->hessian_pre, &matflag); CHKERRQ(ierr);
365a7e14dcfSSatish Balay       needH = 0;
366a7e14dcfSSatish Balay     }
367a7e14dcfSSatish Balay 
368a7e14dcfSSatish Balay     if (NTR_PC_BFGS == tr->pc_type) {
369a7e14dcfSSatish Balay       if (BFGS_SCALE_AHESS == tr->bfgs_scale_type) {
370a7e14dcfSSatish Balay         /* Obtain diagonal for the bfgs preconditioner */
371a7e14dcfSSatish Balay         ierr = MatGetDiagonal(tao->hessian, tr->Diag); CHKERRQ(ierr);
372a7e14dcfSSatish Balay 	ierr = VecAbs(tr->Diag); CHKERRQ(ierr);
373a7e14dcfSSatish Balay 	ierr = VecReciprocal(tr->Diag); CHKERRQ(ierr);
374a7e14dcfSSatish Balay 	ierr = MatLMVMSetScale(tr->M,tr->Diag); CHKERRQ(ierr);
375a7e14dcfSSatish Balay       }
376a7e14dcfSSatish Balay 
377a7e14dcfSSatish Balay       /* Update the limited memory preconditioner */
378a7e14dcfSSatish Balay       ierr = MatLMVMUpdate(tr->M, tao->solution, tao->gradient); CHKERRQ(ierr);
379a7e14dcfSSatish Balay       ++bfgsUpdates;
380a7e14dcfSSatish Balay     }
381a7e14dcfSSatish Balay 
382a7e14dcfSSatish Balay     while (reason == TAO_CONTINUE_ITERATING) {
383a7e14dcfSSatish Balay       ierr = KSPSetOperators(tao->ksp, tao->hessian, tao->hessian_pre, matflag); CHKERRQ(ierr);
384a7e14dcfSSatish Balay 
385a7e14dcfSSatish Balay       /* Solve the trust region subproblem */
386a7e14dcfSSatish Balay       if (NTR_KSP_NASH == tr->ksp_type) {
387a7e14dcfSSatish Balay 	ierr = KSPNASHSetRadius(tao->ksp,tao->trust); CHKERRQ(ierr);
388a7e14dcfSSatish Balay 	ierr = KSPSolve(tao->ksp, tao->gradient, tao->stepdirection); CHKERRQ(ierr);
389a7e14dcfSSatish Balay 	ierr = KSPGetIterationNumber(tao->ksp,&its); CHKERRQ(ierr);
390a7e14dcfSSatish Balay 	tao->ksp_its+=its;
391a7e14dcfSSatish Balay 	ierr = KSPNASHGetNormD(tao->ksp, &norm_d); CHKERRQ(ierr);
392a7e14dcfSSatish Balay       } else if (NTR_KSP_STCG == tr->ksp_type) {
393a7e14dcfSSatish Balay 	ierr = KSPSTCGSetRadius(tao->ksp,tao->trust); CHKERRQ(ierr);
394a7e14dcfSSatish Balay 	ierr = KSPSolve(tao->ksp, tao->gradient, tao->stepdirection); CHKERRQ(ierr);
395a7e14dcfSSatish Balay 	ierr = KSPGetIterationNumber(tao->ksp,&its); CHKERRQ(ierr);
396a7e14dcfSSatish Balay 	tao->ksp_its+=its;
397a7e14dcfSSatish Balay 	ierr = KSPSTCGGetNormD(tao->ksp, &norm_d); CHKERRQ(ierr);
398a7e14dcfSSatish Balay       } else { /* NTR_KSP_GLTR */
399a7e14dcfSSatish Balay 	ierr = KSPGLTRSetRadius(tao->ksp,tao->trust); CHKERRQ(ierr);
400a7e14dcfSSatish Balay 	ierr = KSPSolve(tao->ksp, tao->gradient, tao->stepdirection); CHKERRQ(ierr);
401a7e14dcfSSatish Balay 	ierr = KSPGetIterationNumber(tao->ksp,&its); CHKERRQ(ierr);
402a7e14dcfSSatish Balay 	tao->ksp_its+=its;
403a7e14dcfSSatish Balay 	ierr = KSPGLTRGetNormD(tao->ksp, &norm_d); CHKERRQ(ierr);
404a7e14dcfSSatish Balay       }
405a7e14dcfSSatish Balay 
406a7e14dcfSSatish Balay       if (0.0 == tao->trust) {
407a7e14dcfSSatish Balay         /* Radius was uninitialized; use the norm of the direction */
408a7e14dcfSSatish Balay         if (norm_d > 0.0) {
409a7e14dcfSSatish Balay           tao->trust = norm_d;
410a7e14dcfSSatish Balay 
411a7e14dcfSSatish Balay           /* Modify the radius if it is too large or small */
412a7e14dcfSSatish Balay           tao->trust = PetscMax(tao->trust, tr->min_radius);
413a7e14dcfSSatish Balay           tao->trust = PetscMin(tao->trust, tr->max_radius);
414a7e14dcfSSatish Balay         }
415a7e14dcfSSatish Balay         else {
416a7e14dcfSSatish Balay           /* The direction was bad; set radius to default value and re-solve
417a7e14dcfSSatish Balay 	     the trust-region subproblem to get a direction */
418a7e14dcfSSatish Balay 	  tao->trust = tao->trust0;
419a7e14dcfSSatish Balay 
420a7e14dcfSSatish Balay           /* Modify the radius if it is too large or small */
421a7e14dcfSSatish Balay           tao->trust = PetscMax(tao->trust, tr->min_radius);
422a7e14dcfSSatish Balay           tao->trust = PetscMin(tao->trust, tr->max_radius);
423a7e14dcfSSatish Balay 
424a7e14dcfSSatish Balay 	  if (NTR_KSP_NASH == tr->ksp_type) {
425a7e14dcfSSatish Balay 	    ierr = KSPNASHSetRadius(tao->ksp,tao->trust); CHKERRQ(ierr);
426a7e14dcfSSatish Balay 	    ierr = KSPSolve(tao->ksp, tao->gradient, tao->stepdirection); CHKERRQ(ierr);
427a7e14dcfSSatish Balay 	    ierr = KSPGetIterationNumber(tao->ksp,&its); CHKERRQ(ierr);
428a7e14dcfSSatish Balay 	    tao->ksp_its+=its;
429a7e14dcfSSatish Balay 	    ierr = KSPNASHGetNormD(tao->ksp, &norm_d); CHKERRQ(ierr);
430a7e14dcfSSatish Balay 	  } else if (NTR_KSP_STCG == tr->ksp_type) {
431a7e14dcfSSatish Balay 	    ierr = KSPSTCGSetRadius(tao->ksp,tao->trust); CHKERRQ(ierr);
432a7e14dcfSSatish Balay 	    ierr = KSPSolve(tao->ksp, tao->gradient, tao->stepdirection); CHKERRQ(ierr);
433a7e14dcfSSatish Balay 	    ierr = KSPGetIterationNumber(tao->ksp,&its); CHKERRQ(ierr);
434a7e14dcfSSatish Balay 	    tao->ksp_its+=its;
435a7e14dcfSSatish Balay 	    ierr = KSPSTCGGetNormD(tao->ksp, &norm_d); CHKERRQ(ierr);
436a7e14dcfSSatish Balay 	  } else { /* NTR_KSP_GLTR */
437a7e14dcfSSatish Balay 	    ierr = KSPGLTRSetRadius(tao->ksp,tao->trust); CHKERRQ(ierr);
438a7e14dcfSSatish Balay 	    ierr = KSPSolve(tao->ksp, tao->gradient, tao->stepdirection); CHKERRQ(ierr);
439a7e14dcfSSatish Balay 	    ierr = KSPGetIterationNumber(tao->ksp,&its); CHKERRQ(ierr);
440a7e14dcfSSatish Balay 	    tao->ksp_its+=its;
441a7e14dcfSSatish Balay 	    ierr = KSPGLTRGetNormD(tao->ksp, &norm_d); CHKERRQ(ierr);
442a7e14dcfSSatish Balay 	  }
443a7e14dcfSSatish Balay 
444a7e14dcfSSatish Balay 	  if (norm_d == 0.0) {
445a7e14dcfSSatish Balay             SETERRQ(PETSC_COMM_SELF,1, "Initial direction zero");
446a7e14dcfSSatish Balay           }
447a7e14dcfSSatish Balay         }
448a7e14dcfSSatish Balay       }
449a7e14dcfSSatish Balay       ierr = VecScale(tao->stepdirection, -1.0); CHKERRQ(ierr);
450a7e14dcfSSatish Balay       ierr = KSPGetConvergedReason(tao->ksp, &ksp_reason); CHKERRQ(ierr);
451a7e14dcfSSatish Balay       if ((KSP_DIVERGED_INDEFINITE_PC == ksp_reason) &&
452a7e14dcfSSatish Balay           (NTR_PC_BFGS == tr->pc_type) && (bfgsUpdates > 1)) {
453a7e14dcfSSatish Balay         /* Preconditioner is numerically indefinite; reset the
454a7e14dcfSSatish Balay 	   approximate if using BFGS preconditioning. */
455a7e14dcfSSatish Balay 
456a7e14dcfSSatish Balay         if (f != 0.0) {
457a7e14dcfSSatish Balay           delta = 2.0 * PetscAbsScalar(f) / (gnorm*gnorm);
458a7e14dcfSSatish Balay         }
459a7e14dcfSSatish Balay         else {
460a7e14dcfSSatish Balay           delta = 2.0 / (gnorm*gnorm);
461a7e14dcfSSatish Balay         }
462a7e14dcfSSatish Balay 	ierr = MatLMVMSetDelta(tr->M, delta); CHKERRQ(ierr);
463a7e14dcfSSatish Balay 	ierr = MatLMVMReset(tr->M); CHKERRQ(ierr);
464a7e14dcfSSatish Balay 	ierr = MatLMVMUpdate(tr->M, tao->solution, tao->gradient); CHKERRQ(ierr);
465a7e14dcfSSatish Balay         bfgsUpdates = 1;
466a7e14dcfSSatish Balay       }
467a7e14dcfSSatish Balay 
468a7e14dcfSSatish Balay       if (NTR_UPDATE_REDUCTION == tr->update_type) {
469a7e14dcfSSatish Balay 	/* Get predicted reduction */
470a7e14dcfSSatish Balay 	if (NTR_KSP_NASH == tr->ksp_type) {
471a7e14dcfSSatish Balay 	  ierr = KSPNASHGetObjFcn(tao->ksp,&prered); CHKERRQ(ierr);
472a7e14dcfSSatish Balay 	} else if (NTR_KSP_STCG == tr->ksp_type) {
473a7e14dcfSSatish Balay 	  ierr = KSPSTCGGetObjFcn(tao->ksp,&prered); CHKERRQ(ierr);
474a7e14dcfSSatish Balay 	} else { /* gltr */
475a7e14dcfSSatish Balay 	  ierr = KSPGLTRGetObjFcn(tao->ksp,&prered); CHKERRQ(ierr);
476a7e14dcfSSatish Balay 	}
477a7e14dcfSSatish Balay 
478a7e14dcfSSatish Balay 	if (prered >= 0.0) {
479a7e14dcfSSatish Balay 	  /* The predicted reduction has the wrong sign.  This cannot
480a7e14dcfSSatish Balay 	     happen in infinite precision arithmetic.  Step should
481a7e14dcfSSatish Balay 	     be rejected! */
482a7e14dcfSSatish Balay 	  tao->trust = tr->alpha1 * PetscMin(tao->trust, norm_d);
483a7e14dcfSSatish Balay 	}
484a7e14dcfSSatish Balay 	else {
485a7e14dcfSSatish Balay 	  /* Compute trial step and function value */
486a7e14dcfSSatish Balay 	  ierr = VecCopy(tao->solution,tr->W); CHKERRQ(ierr);
487a7e14dcfSSatish Balay 	  ierr = VecAXPY(tr->W, 1.0, tao->stepdirection); CHKERRQ(ierr);
488a7e14dcfSSatish Balay 	  ierr = TaoComputeObjective(tao, tr->W, &ftrial); CHKERRQ(ierr);
489a7e14dcfSSatish Balay 
490a7e14dcfSSatish Balay 	  if (PetscIsInfOrNanReal(ftrial)) {
491a7e14dcfSSatish Balay 	    tao->trust = tr->alpha1 * PetscMin(tao->trust, norm_d);
492a7e14dcfSSatish Balay 	  } else {
493a7e14dcfSSatish Balay 	    /* Compute and actual reduction */
494a7e14dcfSSatish Balay 	    actred = f - ftrial;
495a7e14dcfSSatish Balay 	    prered = -prered;
496a7e14dcfSSatish Balay 	    if ((PetscAbsScalar(actred) <= tr->epsilon) &&
497a7e14dcfSSatish Balay                 (PetscAbsScalar(prered) <= tr->epsilon)) {
498a7e14dcfSSatish Balay 	      kappa = 1.0;
499a7e14dcfSSatish Balay 	    }
500a7e14dcfSSatish Balay 	    else {
501a7e14dcfSSatish Balay 	      kappa = actred / prered;
502a7e14dcfSSatish Balay 	    }
503a7e14dcfSSatish Balay 
504a7e14dcfSSatish Balay 	    /* Accept or reject the step and update radius */
505a7e14dcfSSatish Balay 	    if (kappa < tr->eta1) {
506a7e14dcfSSatish Balay 	      /* Reject the step */
507a7e14dcfSSatish Balay 	      tao->trust = tr->alpha1 * PetscMin(tao->trust, norm_d);
508a7e14dcfSSatish Balay 	    }
509a7e14dcfSSatish Balay 	    else {
510a7e14dcfSSatish Balay 	      /* Accept the step */
511a7e14dcfSSatish Balay 	      if (kappa < tr->eta2) {
512a7e14dcfSSatish Balay 		/* Marginal bad step */
513a7e14dcfSSatish Balay 		tao->trust = tr->alpha2 * PetscMin(tao->trust, norm_d);
514a7e14dcfSSatish Balay 	      }
515a7e14dcfSSatish Balay 	      else if (kappa < tr->eta3) {
516a7e14dcfSSatish Balay 		/* Reasonable step */
517a7e14dcfSSatish Balay 		tao->trust = tr->alpha3 * tao->trust;
518a7e14dcfSSatish Balay 	      }
519a7e14dcfSSatish Balay 	      else if (kappa < tr->eta4) {
520a7e14dcfSSatish Balay 		/* Good step */
521a7e14dcfSSatish Balay 		tao->trust = PetscMax(tr->alpha4 * norm_d, tao->trust);
522a7e14dcfSSatish Balay 	      }
523a7e14dcfSSatish Balay 	      else {
524a7e14dcfSSatish Balay 		/* Very good step */
525a7e14dcfSSatish Balay 		tao->trust = PetscMax(tr->alpha5 * norm_d, tao->trust);
526a7e14dcfSSatish Balay 	      }
527a7e14dcfSSatish Balay 	      break;
528a7e14dcfSSatish Balay 	    }
529a7e14dcfSSatish Balay 	  }
530a7e14dcfSSatish Balay 	}
531a7e14dcfSSatish Balay       }
532a7e14dcfSSatish Balay       else {
533a7e14dcfSSatish Balay 	/* Get predicted reduction */
534a7e14dcfSSatish Balay 	if (NTR_KSP_NASH == tr->ksp_type) {
535a7e14dcfSSatish Balay 	  ierr = KSPNASHGetObjFcn(tao->ksp,&prered); CHKERRQ(ierr);
536a7e14dcfSSatish Balay 	} else if (NTR_KSP_STCG == tr->ksp_type) {
537a7e14dcfSSatish Balay 	  ierr = KSPSTCGGetObjFcn(tao->ksp,&prered); CHKERRQ(ierr);
538a7e14dcfSSatish Balay 	} else { /* gltr */
539a7e14dcfSSatish Balay 	  ierr = KSPGLTRGetObjFcn(tao->ksp,&prered); CHKERRQ(ierr);
540a7e14dcfSSatish Balay 	}
541a7e14dcfSSatish Balay 
542a7e14dcfSSatish Balay 	if (prered >= 0.0) {
543a7e14dcfSSatish Balay 	  /* The predicted reduction has the wrong sign.  This cannot
544a7e14dcfSSatish Balay 	     happen in infinite precision arithmetic.  Step should
545a7e14dcfSSatish Balay 	     be rejected! */
546a7e14dcfSSatish Balay 	  tao->trust = tr->gamma1 * PetscMin(tao->trust, norm_d);
547a7e14dcfSSatish Balay 	}
548a7e14dcfSSatish Balay 	else {
549a7e14dcfSSatish Balay 	  ierr = VecCopy(tao->solution, tr->W); CHKERRQ(ierr);
550a7e14dcfSSatish Balay 	  ierr = VecAXPY(tr->W, 1.0, tao->stepdirection); CHKERRQ(ierr);
551a7e14dcfSSatish Balay 	  ierr = TaoComputeObjective(tao, tr->W, &ftrial); CHKERRQ(ierr);
552a7e14dcfSSatish Balay 	  if (PetscIsInfOrNanReal(ftrial)) {
553a7e14dcfSSatish Balay 	    tao->trust = tr->gamma1 * PetscMin(tao->trust, norm_d);
554a7e14dcfSSatish Balay 	  }
555a7e14dcfSSatish Balay 	  else {
556a7e14dcfSSatish Balay 	    ierr = VecDot(tao->gradient, tao->stepdirection, &beta); CHKERRQ(ierr);
557a7e14dcfSSatish Balay 	    actred = f - ftrial;
558a7e14dcfSSatish Balay 	    prered = -prered;
559a7e14dcfSSatish Balay 	    if ((PetscAbsScalar(actred) <= tr->epsilon) &&
560a7e14dcfSSatish Balay                 (PetscAbsScalar(prered) <= tr->epsilon)) {
561a7e14dcfSSatish Balay 	      kappa = 1.0;
562a7e14dcfSSatish Balay 	    }
563a7e14dcfSSatish Balay 	    else {
564a7e14dcfSSatish Balay 	      kappa = actred / prered;
565a7e14dcfSSatish Balay 	    }
566a7e14dcfSSatish Balay 
567a7e14dcfSSatish Balay 	    tau_1 = tr->theta * beta / (tr->theta * beta - (1.0 - tr->theta) * prered + actred);
568a7e14dcfSSatish Balay 	    tau_2 = tr->theta * beta / (tr->theta * beta + (1.0 + tr->theta) * prered - actred);
569a7e14dcfSSatish Balay 	    tau_min = PetscMin(tau_1, tau_2);
570a7e14dcfSSatish Balay 	    tau_max = PetscMax(tau_1, tau_2);
571a7e14dcfSSatish Balay 
572a7e14dcfSSatish Balay 	    if (kappa >= 1.0 - tr->mu1) {
573a7e14dcfSSatish Balay 	      /* Great agreement; accept step and update radius */
574a7e14dcfSSatish Balay 	      if (tau_max < 1.0) {
575a7e14dcfSSatish Balay 		tao->trust = PetscMax(tao->trust, tr->gamma3 * norm_d);
576a7e14dcfSSatish Balay 	      }
577a7e14dcfSSatish Balay 	      else if (tau_max > tr->gamma4) {
578a7e14dcfSSatish Balay 		tao->trust = PetscMax(tao->trust, tr->gamma4 * norm_d);
579a7e14dcfSSatish Balay 	      }
580a7e14dcfSSatish Balay 	      else {
581a7e14dcfSSatish Balay 		tao->trust = PetscMax(tao->trust, tau_max * norm_d);
582a7e14dcfSSatish Balay 	      }
583a7e14dcfSSatish Balay 	      break;
584a7e14dcfSSatish Balay 	    }
585a7e14dcfSSatish Balay 	    else if (kappa >= 1.0 - tr->mu2) {
586a7e14dcfSSatish Balay 	      /* Good agreement */
587a7e14dcfSSatish Balay 
588a7e14dcfSSatish Balay 	      if (tau_max < tr->gamma2) {
589a7e14dcfSSatish Balay 		tao->trust = tr->gamma2 * PetscMin(tao->trust, norm_d);
590a7e14dcfSSatish Balay 	      }
591a7e14dcfSSatish Balay 	      else if (tau_max > tr->gamma3) {
592a7e14dcfSSatish Balay 		tao->trust = PetscMax(tao->trust, tr->gamma3 * norm_d);
593a7e14dcfSSatish Balay 	      }
594a7e14dcfSSatish Balay 	      else if (tau_max < 1.0) {
595a7e14dcfSSatish Balay 		tao->trust = tau_max * PetscMin(tao->trust, norm_d);
596a7e14dcfSSatish Balay 	      }
597a7e14dcfSSatish Balay 	      else {
598a7e14dcfSSatish Balay 		tao->trust = PetscMax(tao->trust, tau_max * norm_d);
599a7e14dcfSSatish Balay 	      }
600a7e14dcfSSatish Balay 	      break;
601a7e14dcfSSatish Balay 	    }
602a7e14dcfSSatish Balay 	    else {
603a7e14dcfSSatish Balay 	      /* Not good agreement */
604a7e14dcfSSatish Balay 	      if (tau_min > 1.0) {
605a7e14dcfSSatish Balay 		tao->trust = tr->gamma2 * PetscMin(tao->trust, norm_d);
606a7e14dcfSSatish Balay 	      }
607a7e14dcfSSatish Balay 	      else if (tau_max < tr->gamma1) {
608a7e14dcfSSatish Balay 		tao->trust = tr->gamma1 * PetscMin(tao->trust, norm_d);
609a7e14dcfSSatish Balay 	      }
610a7e14dcfSSatish Balay 	      else if ((tau_min < tr->gamma1) && (tau_max >= 1.0)) {
611a7e14dcfSSatish Balay 		tao->trust = tr->gamma1 * PetscMin(tao->trust, norm_d);
612a7e14dcfSSatish Balay 	      }
613a7e14dcfSSatish Balay 	      else if ((tau_1 >= tr->gamma1) && (tau_1 < 1.0) &&
614a7e14dcfSSatish Balay 		       ((tau_2 < tr->gamma1) || (tau_2 >= 1.0))) {
615a7e14dcfSSatish Balay 		tao->trust = tau_1 * PetscMin(tao->trust, norm_d);
616a7e14dcfSSatish Balay 	      }
617a7e14dcfSSatish Balay 	      else if ((tau_2 >= tr->gamma1) && (tau_2 < 1.0) &&
618a7e14dcfSSatish Balay 		       ((tau_1 < tr->gamma1) || (tau_2 >= 1.0))) {
619a7e14dcfSSatish Balay 		tao->trust = tau_2 * PetscMin(tao->trust, norm_d);
620a7e14dcfSSatish Balay 	      }
621a7e14dcfSSatish Balay 	      else {
622a7e14dcfSSatish Balay 		tao->trust = tau_max * PetscMin(tao->trust, norm_d);
623a7e14dcfSSatish Balay 	      }
624a7e14dcfSSatish Balay 	    }
625a7e14dcfSSatish Balay 	  }
626a7e14dcfSSatish Balay 	}
627a7e14dcfSSatish Balay       }
628a7e14dcfSSatish Balay 
629a7e14dcfSSatish Balay       /* The step computed was not good and the radius was decreased.
630a7e14dcfSSatish Balay 	 Monitor the radius to terminate. */
631a7e14dcfSSatish Balay       ierr = TaoMonitor(tao, iter, f, gnorm, 0.0, tao->trust, &reason); CHKERRQ(ierr);
632a7e14dcfSSatish Balay     }
633a7e14dcfSSatish Balay 
634a7e14dcfSSatish Balay     /* The radius may have been increased; modify if it is too large */
635a7e14dcfSSatish Balay     tao->trust = PetscMin(tao->trust, tr->max_radius);
636a7e14dcfSSatish Balay 
637a7e14dcfSSatish Balay     if (reason == TAO_CONTINUE_ITERATING) {
638a7e14dcfSSatish Balay       ierr = VecCopy(tr->W, tao->solution); CHKERRQ(ierr);
639a7e14dcfSSatish Balay       f = ftrial;
640a7e14dcfSSatish Balay       ierr = TaoComputeGradient(tao, tao->solution, tao->gradient);
641a7e14dcfSSatish Balay       ierr = VecNorm(tao->gradient, NORM_2, &gnorm); CHKERRQ(ierr);
642a7e14dcfSSatish Balay       if (PetscIsInfOrNanReal(f) || PetscIsInfOrNanReal(gnorm)) {
643a7e14dcfSSatish Balay 	SETERRQ(PETSC_COMM_SELF,1, "User provided compute function generated Inf or NaN");
644a7e14dcfSSatish Balay       }
645a7e14dcfSSatish Balay       needH = 1;
646a7e14dcfSSatish Balay       ierr = TaoMonitor(tao, iter, f, gnorm, 0.0, tao->trust, &reason); CHKERRQ(ierr);
647a7e14dcfSSatish Balay     }
648a7e14dcfSSatish Balay   }
649a7e14dcfSSatish Balay   PetscFunctionReturn(0);
650a7e14dcfSSatish Balay }
651a7e14dcfSSatish Balay 
652a7e14dcfSSatish Balay /*------------------------------------------------------------*/
653a7e14dcfSSatish Balay #undef __FUNCT__
654a7e14dcfSSatish Balay #define __FUNCT__ "TaoSetUp_NTR"
655a7e14dcfSSatish Balay static PetscErrorCode TaoSetUp_NTR(TaoSolver tao)
656a7e14dcfSSatish Balay {
657a7e14dcfSSatish Balay   TAO_NTR *tr = (TAO_NTR *)tao->data;
658a7e14dcfSSatish Balay   PetscErrorCode ierr;
659a7e14dcfSSatish Balay 
660a7e14dcfSSatish Balay   PetscFunctionBegin;
661a7e14dcfSSatish Balay 
662a7e14dcfSSatish Balay   if (!tao->gradient) {ierr = VecDuplicate(tao->solution, &tao->gradient); CHKERRQ(ierr);}
663a7e14dcfSSatish Balay   if (!tao->stepdirection) {ierr = VecDuplicate(tao->solution, &tao->stepdirection); CHKERRQ(ierr);}
664a7e14dcfSSatish Balay   if (!tr->W) {ierr = VecDuplicate(tao->solution, &tr->W); CHKERRQ(ierr);}
665a7e14dcfSSatish Balay 
666a7e14dcfSSatish Balay   tr->Diag = 0;
667a7e14dcfSSatish Balay   tr->M = 0;
668a7e14dcfSSatish Balay 
669a7e14dcfSSatish Balay 
670a7e14dcfSSatish Balay   PetscFunctionReturn(0);
671a7e14dcfSSatish Balay }
672a7e14dcfSSatish Balay 
673a7e14dcfSSatish Balay /*------------------------------------------------------------*/
674a7e14dcfSSatish Balay #undef __FUNCT__
675a7e14dcfSSatish Balay #define __FUNCT__ "TaoDestroy_NTR"
676a7e14dcfSSatish Balay static PetscErrorCode TaoDestroy_NTR(TaoSolver tao)
677a7e14dcfSSatish Balay {
678a7e14dcfSSatish Balay   TAO_NTR *tr = (TAO_NTR *)tao->data;
679a7e14dcfSSatish Balay   PetscErrorCode ierr;
680a7e14dcfSSatish Balay 
681a7e14dcfSSatish Balay   PetscFunctionBegin;
682a7e14dcfSSatish Balay   if (tao->setupcalled) {
683a7e14dcfSSatish Balay     ierr = VecDestroy(&tr->W); CHKERRQ(ierr);
684a7e14dcfSSatish Balay   }
685a7e14dcfSSatish Balay   if (tr->M) {
686a7e14dcfSSatish Balay     ierr = MatDestroy(&tr->M); CHKERRQ(ierr);
687a7e14dcfSSatish Balay     tr->M = PETSC_NULL;
688a7e14dcfSSatish Balay   }
689a7e14dcfSSatish Balay   if (tr->Diag) {
690a7e14dcfSSatish Balay     ierr = VecDestroy(&tr->Diag); CHKERRQ(ierr);
691a7e14dcfSSatish Balay     tr->Diag = PETSC_NULL;
692a7e14dcfSSatish Balay   }
693a7e14dcfSSatish Balay   ierr = PetscFree(tao->data); CHKERRQ(ierr);
694a7e14dcfSSatish Balay   tao->data = PETSC_NULL;
695a7e14dcfSSatish Balay 
696a7e14dcfSSatish Balay   PetscFunctionReturn(0);
697a7e14dcfSSatish Balay }
698a7e14dcfSSatish Balay 
699a7e14dcfSSatish Balay /*------------------------------------------------------------*/
700a7e14dcfSSatish Balay #undef __FUNCT__
701a7e14dcfSSatish Balay #define __FUNCT__ "TaoSetFromOptions_NTR"
702a7e14dcfSSatish Balay static PetscErrorCode TaoSetFromOptions_NTR(TaoSolver tao)
703a7e14dcfSSatish Balay {
704a7e14dcfSSatish Balay   TAO_NTR *tr = (TAO_NTR *)tao->data;
705a7e14dcfSSatish Balay   PetscErrorCode ierr;
706a7e14dcfSSatish Balay 
707a7e14dcfSSatish Balay   PetscFunctionBegin;
708a7e14dcfSSatish Balay   ierr = PetscOptionsHead("Newton trust region method for unconstrained optimization"); CHKERRQ(ierr);
709a7e14dcfSSatish Balay   ierr = PetscOptionsEList("-tao_ntr_ksp_type", "ksp type", "", NTR_KSP, NTR_KSP_TYPES, NTR_KSP[tr->ksp_type], &tr->ksp_type, 0); CHKERRQ(ierr);
710a7e14dcfSSatish Balay   ierr = PetscOptionsEList("-tao_ntr_pc_type", "pc type", "", NTR_PC, NTR_PC_TYPES, NTR_PC[tr->pc_type], &tr->pc_type, 0); CHKERRQ(ierr);
711a7e14dcfSSatish Balay   ierr = PetscOptionsEList("-tao_ntr_bfgs_scale_type", "bfgs scale type", "", BFGS_SCALE, BFGS_SCALE_TYPES, BFGS_SCALE[tr->bfgs_scale_type], &tr->bfgs_scale_type, 0); CHKERRQ(ierr);
712a7e14dcfSSatish Balay   ierr = PetscOptionsEList("-tao_ntr_init_type", "tao->trust initialization type", "", NTR_INIT, NTR_INIT_TYPES, NTR_INIT[tr->init_type], &tr->init_type, 0); CHKERRQ(ierr);
713a7e14dcfSSatish Balay   ierr = PetscOptionsEList("-tao_ntr_update_type", "radius update type", "", NTR_UPDATE, NTR_UPDATE_TYPES, NTR_UPDATE[tr->update_type], &tr->update_type, 0); CHKERRQ(ierr);
714a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntr_eta1", "step is unsuccessful if actual reduction < eta1 * predicted reduction", "", tr->eta1, &tr->eta1, 0); CHKERRQ(ierr);
715a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntr_eta2", "", "", tr->eta2, &tr->eta2, 0); CHKERRQ(ierr);
716a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntr_eta3", "", "", tr->eta3, &tr->eta3, 0); CHKERRQ(ierr);
717a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntr_eta4", "", "", tr->eta4, &tr->eta4, 0); CHKERRQ(ierr);
718a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntr_alpha1", "", "", tr->alpha1, &tr->alpha1, 0); CHKERRQ(ierr);
719a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntr_alpha2", "", "", tr->alpha2, &tr->alpha2, 0); CHKERRQ(ierr);
720a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntr_alpha3", "", "", tr->alpha3, &tr->alpha3, 0); CHKERRQ(ierr);
721a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntr_alpha4", "", "", tr->alpha4, &tr->alpha4, 0); CHKERRQ(ierr);
722a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntr_alpha5", "", "", tr->alpha5, &tr->alpha5, 0); CHKERRQ(ierr);
723a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntr_mu1", "", "", tr->mu1, &tr->mu1, 0); CHKERRQ(ierr);
724a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntr_mu2", "", "", tr->mu2, &tr->mu2, 0); CHKERRQ(ierr);
725a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntr_gamma1", "", "", tr->gamma1, &tr->gamma1, 0); CHKERRQ(ierr);
726a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntr_gamma2", "", "", tr->gamma2, &tr->gamma2, 0); CHKERRQ(ierr);
727a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntr_gamma3", "", "", tr->gamma3, &tr->gamma3, 0); CHKERRQ(ierr);
728a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntr_gamma4", "", "", tr->gamma4, &tr->gamma4, 0); CHKERRQ(ierr);
729a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntr_theta", "", "", tr->theta, &tr->theta, 0); CHKERRQ(ierr);
730a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntr_mu1_i", "", "", tr->mu1_i, &tr->mu1_i, 0); CHKERRQ(ierr);
731a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntr_mu2_i", "", "", tr->mu2_i, &tr->mu2_i, 0); CHKERRQ(ierr);
732a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntr_gamma1_i", "", "", tr->gamma1_i, &tr->gamma1_i, 0); CHKERRQ(ierr);
733a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntr_gamma2_i", "", "", tr->gamma2_i, &tr->gamma2_i, 0); CHKERRQ(ierr);
734a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntr_gamma3_i", "", "", tr->gamma3_i, &tr->gamma3_i, 0); CHKERRQ(ierr);
735a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntr_gamma4_i", "", "", tr->gamma4_i, &tr->gamma4_i, 0); CHKERRQ(ierr);
736a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntr_theta_i", "", "", tr->theta_i, &tr->theta_i, 0); CHKERRQ(ierr);
737a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntr_min_radius", "lower bound on initial trust-region radius", "", tr->min_radius, &tr->min_radius, 0); CHKERRQ(ierr);
738a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntr_max_radius", "upper bound on trust-region radius", "", tr->max_radius, &tr->max_radius, 0); CHKERRQ(ierr);
739a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntr_epsilon", "tolerance used when computing actual and predicted reduction", "", tr->epsilon, &tr->epsilon, 0); CHKERRQ(ierr);
740a7e14dcfSSatish Balay   ierr = PetscOptionsTail(); CHKERRQ(ierr);
741a7e14dcfSSatish Balay   ierr = KSPSetFromOptions(tao->ksp); CHKERRQ(ierr);
742a7e14dcfSSatish Balay   PetscFunctionReturn(0);
743a7e14dcfSSatish Balay }
744a7e14dcfSSatish Balay 
745a7e14dcfSSatish Balay /*------------------------------------------------------------*/
746a7e14dcfSSatish Balay #undef __FUNCT__
747a7e14dcfSSatish Balay #define __FUNCT__ "TaoView_NTR"
748a7e14dcfSSatish Balay static PetscErrorCode TaoView_NTR(TaoSolver tao, PetscViewer viewer)
749a7e14dcfSSatish Balay {
750a7e14dcfSSatish Balay   TAO_NTR *tr = (TAO_NTR *)tao->data;
751a7e14dcfSSatish Balay   PetscErrorCode ierr;
752a7e14dcfSSatish Balay   PetscInt nrejects;
753a7e14dcfSSatish Balay   PetscBool isascii;
754a7e14dcfSSatish Balay   PetscFunctionBegin;
755a7e14dcfSSatish Balay   ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&isascii);CHKERRQ(ierr);
756a7e14dcfSSatish Balay   if (isascii) {
757a7e14dcfSSatish Balay     ierr = PetscViewerASCIIPushTab(viewer); CHKERRQ(ierr);
758a7e14dcfSSatish Balay     if (NTR_PC_BFGS == tr->pc_type && tr->M) {
759a7e14dcfSSatish Balay       ierr = MatLMVMGetRejects(tr->M, &nrejects); CHKERRQ(ierr);
760a7e14dcfSSatish Balay       ierr = PetscViewerASCIIPrintf(viewer, "Rejected matrix updates: %D\n", nrejects); CHKERRQ(ierr);
761a7e14dcfSSatish Balay     }
762a7e14dcfSSatish Balay     ierr = PetscViewerASCIIPopTab(viewer); CHKERRQ(ierr);
763a7e14dcfSSatish Balay 
764a7e14dcfSSatish Balay   } else {
765a7e14dcfSSatish Balay     SETERRQ1(((PetscObject)tao)->comm,PETSC_ERR_SUP,"Viewer type %s not supported for TAO NTR",((PetscObject)viewer)->type_name);
766a7e14dcfSSatish Balay   }
767a7e14dcfSSatish Balay   PetscFunctionReturn(0);
768a7e14dcfSSatish Balay }
769a7e14dcfSSatish Balay 
770a7e14dcfSSatish Balay /*------------------------------------------------------------*/
771a7e14dcfSSatish Balay EXTERN_C_BEGIN
772a7e14dcfSSatish Balay #undef __FUNCT__
773a7e14dcfSSatish Balay #define __FUNCT__ "TaoCreate_NTR"
774a7e14dcfSSatish Balay PetscErrorCode TaoCreate_NTR(TaoSolver tao)
775a7e14dcfSSatish Balay {
776a7e14dcfSSatish Balay   TAO_NTR *tr;
777a7e14dcfSSatish Balay   PetscErrorCode ierr;
778a7e14dcfSSatish Balay 
779a7e14dcfSSatish Balay   PetscFunctionBegin;
780a7e14dcfSSatish Balay 
781*3c9e27cfSGeoffrey Irving   ierr = PetscNewLog(tao,&tr); CHKERRQ(ierr);
782a7e14dcfSSatish Balay 
783a7e14dcfSSatish Balay   tao->ops->setup = TaoSetUp_NTR;
784a7e14dcfSSatish Balay   tao->ops->solve = TaoSolve_NTR;
785a7e14dcfSSatish Balay   tao->ops->view = TaoView_NTR;
786a7e14dcfSSatish Balay   tao->ops->setfromoptions = TaoSetFromOptions_NTR;
787a7e14dcfSSatish Balay   tao->ops->destroy = TaoDestroy_NTR;
788a7e14dcfSSatish Balay 
789a7e14dcfSSatish Balay   tao->max_it = 50;
790a7e14dcfSSatish Balay   tao->fatol = 1e-10;
791a7e14dcfSSatish Balay   tao->frtol = 1e-10;
792a7e14dcfSSatish Balay   tao->data = (void*)tr;
793a7e14dcfSSatish Balay 
794a7e14dcfSSatish Balay   tao->trust0 = 100.0;
795a7e14dcfSSatish Balay 
796a7e14dcfSSatish Balay   /*  Standard trust region update parameters */
797a7e14dcfSSatish Balay   tr->eta1 = 1.0e-4;
798a7e14dcfSSatish Balay   tr->eta2 = 0.25;
799a7e14dcfSSatish Balay   tr->eta3 = 0.50;
800a7e14dcfSSatish Balay   tr->eta4 = 0.90;
801a7e14dcfSSatish Balay 
802a7e14dcfSSatish Balay   tr->alpha1 = 0.25;
803a7e14dcfSSatish Balay   tr->alpha2 = 0.50;
804a7e14dcfSSatish Balay   tr->alpha3 = 1.00;
805a7e14dcfSSatish Balay   tr->alpha4 = 2.00;
806a7e14dcfSSatish Balay   tr->alpha5 = 4.00;
807a7e14dcfSSatish Balay 
808a7e14dcfSSatish Balay   /*  Interpolation parameters */
809a7e14dcfSSatish Balay   tr->mu1_i = 0.35;
810a7e14dcfSSatish Balay   tr->mu2_i = 0.50;
811a7e14dcfSSatish Balay 
812a7e14dcfSSatish Balay   tr->gamma1_i = 0.0625;
813a7e14dcfSSatish Balay   tr->gamma2_i = 0.50;
814a7e14dcfSSatish Balay   tr->gamma3_i = 2.00;
815a7e14dcfSSatish Balay   tr->gamma4_i = 5.00;
816a7e14dcfSSatish Balay 
817a7e14dcfSSatish Balay   tr->theta_i = 0.25;
818a7e14dcfSSatish Balay 
819a7e14dcfSSatish Balay   /*  Interpolation trust region update parameters */
820a7e14dcfSSatish Balay   tr->mu1 = 0.10;
821a7e14dcfSSatish Balay   tr->mu2 = 0.50;
822a7e14dcfSSatish Balay 
823a7e14dcfSSatish Balay   tr->gamma1 = 0.25;
824a7e14dcfSSatish Balay   tr->gamma2 = 0.50;
825a7e14dcfSSatish Balay   tr->gamma3 = 2.00;
826a7e14dcfSSatish Balay   tr->gamma4 = 4.00;
827a7e14dcfSSatish Balay 
828a7e14dcfSSatish Balay   tr->theta = 0.05;
829a7e14dcfSSatish Balay 
830a7e14dcfSSatish Balay   tr->min_radius = 1.0e-10;
831a7e14dcfSSatish Balay   tr->max_radius = 1.0e10;
832a7e14dcfSSatish Balay   tr->epsilon = 1.0e-6;
833a7e14dcfSSatish Balay 
834a7e14dcfSSatish Balay   tr->ksp_type        = NTR_KSP_STCG;
835a7e14dcfSSatish Balay   tr->pc_type         = NTR_PC_BFGS;
836a7e14dcfSSatish Balay   tr->bfgs_scale_type = BFGS_SCALE_AHESS;
837a7e14dcfSSatish Balay   tr->init_type	      = NTR_INIT_INTERPOLATION;
838a7e14dcfSSatish Balay   tr->update_type     = NTR_UPDATE_REDUCTION;
839a7e14dcfSSatish Balay 
840a7e14dcfSSatish Balay 
841a7e14dcfSSatish Balay   /* Set linear solver to default for trust region */
842a7e14dcfSSatish Balay   ierr = KSPCreate(((PetscObject)tao)->comm, &tao->ksp); CHKERRQ(ierr);
843a7e14dcfSSatish Balay 
844a7e14dcfSSatish Balay   PetscFunctionReturn(0);
845a7e14dcfSSatish Balay 
846a7e14dcfSSatish Balay 
847a7e14dcfSSatish Balay }
848a7e14dcfSSatish Balay EXTERN_C_END
849a7e14dcfSSatish Balay 
850a7e14dcfSSatish Balay 
851a7e14dcfSSatish Balay #undef __FUNCT__
852a7e14dcfSSatish Balay #define __FUNCT__ "MatLMVMSolveShell"
853a7e14dcfSSatish Balay static PetscErrorCode MatLMVMSolveShell(PC pc, Vec b, Vec x)
854a7e14dcfSSatish Balay {
855a7e14dcfSSatish Balay     PetscErrorCode ierr;
856a7e14dcfSSatish Balay     Mat M;
857a7e14dcfSSatish Balay     PetscFunctionBegin;
858a7e14dcfSSatish Balay     PetscValidHeaderSpecific(pc,PC_CLASSID,1);
859a7e14dcfSSatish Balay     PetscValidHeaderSpecific(b,VEC_CLASSID,2);
860a7e14dcfSSatish Balay     PetscValidHeaderSpecific(x,VEC_CLASSID,3);
861a7e14dcfSSatish Balay     ierr = PCShellGetContext(pc,(void**)&M); CHKERRQ(ierr);
862a7e14dcfSSatish Balay     ierr = MatLMVMSolve(M, b, x); CHKERRQ(ierr);
863a7e14dcfSSatish Balay     PetscFunctionReturn(0);
864a7e14dcfSSatish Balay }
865