xref: /petsc/src/tao/unconstrained/impls/ntl/ntl.c (revision f89ca46fb01025fa5f21ef09d10cb4723982ea5b)
1*f89ca46fSSatish Balay #include "../src/tao/matrix/lmvmmat.h"
2a7e14dcfSSatish Balay #include "ntl.h"
3a7e14dcfSSatish Balay 
4a7e14dcfSSatish Balay #include "petscksp.h"
5a7e14dcfSSatish Balay #include "petscpc.h"
6a7e14dcfSSatish Balay #include "petsc-private/kspimpl.h"
7a7e14dcfSSatish Balay #include "petsc-private/pcimpl.h"
8a7e14dcfSSatish Balay 
/* Krylov trust-region solver selectors.  TaoSolve_NTL compares them with
   tl->ksp_type to pick KSPNASH, KSPSTCG or KSPGLTR (GLTR is also the
   fallback for any other value).  NTL_KSP_TYPES is the number of choices. */
9a7e14dcfSSatish Balay #define NTL_KSP_NASH	0
10a7e14dcfSSatish Balay #define NTL_KSP_STCG	1
11a7e14dcfSSatish Balay #define NTL_KSP_GLTR	2
12a7e14dcfSSatish Balay #define NTL_KSP_TYPES	3
13a7e14dcfSSatish Balay 
/* Preconditioner selectors.  TaoSolve_NTL compares them with tl->pc_type:
   NONE  -> PCNONE,
   AHESS -> PCJACOBI followed by PCJacobiSetUseAbs,
   BFGS  -> PCSHELL whose apply routine is MatLMVMSolveShell on tl->M,
   PETSC -> the PC type is left as already configured.
   NTL_PC_TYPES is the number of choices. */
14a7e14dcfSSatish Balay #define NTL_PC_NONE	0
15a7e14dcfSSatish Balay #define NTL_PC_AHESS	1
16a7e14dcfSSatish Balay #define NTL_PC_BFGS	2
17a7e14dcfSSatish Balay #define NTL_PC_PETSC	3
18a7e14dcfSSatish Balay #define NTL_PC_TYPES	4
19a7e14dcfSSatish Balay 
/* Scaling choices for the BFGS preconditioner (tl->bfgs_scale_type).  With
   AHESS, TaoSolve_NTL passes the reciprocal of the absolute Hessian diagonal
   to MatLMVMSetScale on every iteration; with BFGS that step is skipped and
   the tl->Diag work vector is not created.  BFGS_SCALE_TYPES is the number
   of choices. */
20a7e14dcfSSatish Balay #define BFGS_SCALE_AHESS	0
21a7e14dcfSSatish Balay #define BFGS_SCALE_BFGS		1
22a7e14dcfSSatish Balay #define BFGS_SCALE_TYPES	2
23a7e14dcfSSatish Balay 
/* Strategies for the initial trust-region radius (tl->init_type):
   CONSTANT keeps the radius already stored in tao->trust, INTERPOLATION
   adjusts it from trial steps along the negative gradient, and DIRECTION
   (handled by the default branch) zeroes it so that the norm of the first
   step direction is used instead.  NTL_INIT_TYPES is the number of choices. */
24a7e14dcfSSatish Balay #define NTL_INIT_CONSTANT         0
25a7e14dcfSSatish Balay #define NTL_INIT_DIRECTION        1
26a7e14dcfSSatish Balay #define NTL_INIT_INTERPOLATION    2
27a7e14dcfSSatish Balay #define NTL_INIT_TYPES            3
28a7e14dcfSSatish Balay 
/* Trust-region radius update rules (tl->update_type).  REDUCTION updates the
   radius from the ratio of actual to predicted reduction using the eta and
   alpha parameters; any other value takes the interpolation branch, which
   uses tau_1/tau_2 and the gamma parameters.  NTL_UPDATE_TYPES is the number
   of choices. */
29a7e14dcfSSatish Balay #define NTL_UPDATE_REDUCTION      0
30a7e14dcfSSatish Balay #define NTL_UPDATE_INTERPOLATION  1
31a7e14dcfSSatish Balay #define NTL_UPDATE_TYPES          2
32a7e14dcfSSatish Balay 
/* Name tables for the selector constants: entry i of each table is the
   textual name of the selector whose #define value is i.  Every table is
   declared with 64 slots but only the leading entries are initialized, so
   the remaining slots are NULL pointers.
   NOTE(review): presumably these are handed to the options-parsing code
   together with the matching *_TYPES count; the consumer is not visible in
   this part of the file -- confirm. */

/* Names for NTL_KSP_NASH, NTL_KSP_STCG, NTL_KSP_GLTR. */
33a7e14dcfSSatish Balay static const char *NTL_KSP[64] = {
34a7e14dcfSSatish Balay   "nash", "stcg", "gltr"
35a7e14dcfSSatish Balay };
36a7e14dcfSSatish Balay 
/* Names for NTL_PC_NONE, NTL_PC_AHESS, NTL_PC_BFGS, NTL_PC_PETSC. */
37a7e14dcfSSatish Balay static const char *NTL_PC[64] = {
38a7e14dcfSSatish Balay   "none", "ahess", "bfgs", "petsc"
39a7e14dcfSSatish Balay };
40a7e14dcfSSatish Balay 
/* Names for BFGS_SCALE_AHESS, BFGS_SCALE_BFGS. */
41a7e14dcfSSatish Balay static const char *BFGS_SCALE[64] = {
42a7e14dcfSSatish Balay   "ahess", "bfgs"
43a7e14dcfSSatish Balay };
44a7e14dcfSSatish Balay 
/* Names for NTL_INIT_CONSTANT, NTL_INIT_DIRECTION, NTL_INIT_INTERPOLATION. */
45a7e14dcfSSatish Balay static const char *NTL_INIT[64] = {
46a7e14dcfSSatish Balay   "constant", "direction", "interpolation"
47a7e14dcfSSatish Balay };
48a7e14dcfSSatish Balay 
/* Names for NTL_UPDATE_REDUCTION, NTL_UPDATE_INTERPOLATION. */
49a7e14dcfSSatish Balay static const char *NTL_UPDATE[64] = {
50a7e14dcfSSatish Balay   "reduction", "interpolation"
51a7e14dcfSSatish Balay };
52a7e14dcfSSatish Balay 
53a7e14dcfSSatish Balay /* Routine for BFGS preconditioner */
54a7e14dcfSSatish Balay 
/*
   MatLMVMSolveShell - Apply callback for the shell preconditioner that
   TaoSolve_NTL installs with PCShellSetApply when the BFGS preconditioner is
   selected.

   Input Parameters:
+  pc - shell preconditioner; its context must be the LMVM matrix that was
        registered with PCShellSetContext (tl->M in TaoSolve_NTL)
-  b  - vector the preconditioner is applied to

   Output Parameter:
.  x  - result written by MatLMVMSolve

   Returns 0 on success; any nonzero PETSc error code from the calls below is
   propagated to the caller by CHKERRQ.

   NOTE(review): MatLMVMSolve is declared in lmvmmat.h and is presumably the
   application of the limited-memory inverse-Hessian approximation to b --
   confirm against that header.
*/
55a7e14dcfSSatish Balay #undef __FUNCT__
56a7e14dcfSSatish Balay #define __FUNCT__ "MatLMVMSolveShell"
57a7e14dcfSSatish Balay static PetscErrorCode MatLMVMSolveShell(PC pc, Vec b, Vec x)
58a7e14dcfSSatish Balay {
59a7e14dcfSSatish Balay   PetscErrorCode ierr;
60a7e14dcfSSatish Balay   Mat M;
61a7e14dcfSSatish Balay 
62a7e14dcfSSatish Balay   PetscFunctionBegin;
  /* Check that each argument is a live PETSc object of the expected class;
     the last macro argument is the argument position used in the error text. */
63a7e14dcfSSatish Balay   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
64a7e14dcfSSatish Balay   PetscValidHeaderSpecific(b,VEC_CLASSID,2);
65a7e14dcfSSatish Balay   PetscValidHeaderSpecific(x,VEC_CLASSID,3);
  /* The shell context is the LMVM matrix itself, stored as an opaque pointer. */
66a7e14dcfSSatish Balay   ierr = PCShellGetContext(pc,(void**)&M); CHKERRQ(ierr);
67a7e14dcfSSatish Balay   ierr = MatLMVMSolve(M, b, x); CHKERRQ(ierr);
68a7e14dcfSSatish Balay   PetscFunctionReturn(0);
69a7e14dcfSSatish Balay }
70a7e14dcfSSatish Balay 
71a7e14dcfSSatish Balay /* Implements Newton's Method with a trust-region, line-search approach for
72a7e14dcfSSatish Balay    solving unconstrained minimization problems.  A More'-Thuente line search
73a7e14dcfSSatish Balay    is used to guarantee that the bfgs preconditioner remains positive
74a7e14dcfSSatish Balay    definite. */
75a7e14dcfSSatish Balay 
/* Identifiers for the kind of step direction being tried.
   NOTE(review): presumably these are the values stored in the stepType
   local of TaoSolve_NTL and tallied in the tl->newt, tl->bfgs, tl->sgrad and
   tl->grad counters; the code that assigns them is not visible in this part
   of the file -- confirm. */
76a7e14dcfSSatish Balay #define NTL_NEWTON 		0
77a7e14dcfSSatish Balay #define NTL_BFGS 		1
78a7e14dcfSSatish Balay #define NTL_SCALED_GRADIENT 	2
79a7e14dcfSSatish Balay #define NTL_GRADIENT 		3
80a7e14dcfSSatish Balay 
81a7e14dcfSSatish Balay #undef __FUNCT__
82a7e14dcfSSatish Balay #define __FUNCT__ "TaoSolve_NTL"
83a7e14dcfSSatish Balay static PetscErrorCode TaoSolve_NTL(TaoSolver tao)
84a7e14dcfSSatish Balay {
85a7e14dcfSSatish Balay   TAO_NTL *tl = (TAO_NTL *)tao->data;
86a7e14dcfSSatish Balay 
87a7e14dcfSSatish Balay   PC pc;
88a7e14dcfSSatish Balay   KSPConvergedReason ksp_reason;
89a7e14dcfSSatish Balay   TaoSolverTerminationReason reason;
90a7e14dcfSSatish Balay   TaoLineSearchTerminationReason ls_reason;
91a7e14dcfSSatish Balay 
92a7e14dcfSSatish Balay   PetscReal fmin, ftrial, prered, actred, kappa, sigma;
93a7e14dcfSSatish Balay   PetscReal tau, tau_1, tau_2, tau_max, tau_min, max_radius;
94a7e14dcfSSatish Balay   PetscReal f, fold, gdx, gnorm;
95a7e14dcfSSatish Balay   PetscReal step = 1.0;
96a7e14dcfSSatish Balay 
97a7e14dcfSSatish Balay   PetscReal delta;
98a7e14dcfSSatish Balay   PetscReal norm_d = 0.0;
99a7e14dcfSSatish Balay   MatStructure matflag;
100a7e14dcfSSatish Balay   PetscErrorCode ierr;
101a7e14dcfSSatish Balay   PetscInt stepType;
102a7e14dcfSSatish Balay   PetscInt iter = 0,its;
103a7e14dcfSSatish Balay 
104a7e14dcfSSatish Balay   PetscInt bfgsUpdates = 0;
105a7e14dcfSSatish Balay   PetscInt needH;
106a7e14dcfSSatish Balay 
107a7e14dcfSSatish Balay   PetscInt i_max = 5;
108a7e14dcfSSatish Balay   PetscInt j_max = 1;
109a7e14dcfSSatish Balay   PetscInt i, j, n, N;
110a7e14dcfSSatish Balay 
111a7e14dcfSSatish Balay   PetscInt tr_reject;
112a7e14dcfSSatish Balay 
113a7e14dcfSSatish Balay   PetscFunctionBegin;
114a7e14dcfSSatish Balay 
115a7e14dcfSSatish Balay   if (tao->XL || tao->XU || tao->ops->computebounds) {
116a7e14dcfSSatish Balay     ierr = PetscPrintf(((PetscObject)tao)->comm,"WARNING: Variable bounds have been set but will be ignored by ntl algorithm\n"); CHKERRQ(ierr);
117a7e14dcfSSatish Balay   }
118a7e14dcfSSatish Balay 
119a7e14dcfSSatish Balay   /* Initialize trust-region radius */
120a7e14dcfSSatish Balay   tao->trust = tao->trust0;
121a7e14dcfSSatish Balay 
122a7e14dcfSSatish Balay   /* Modify the radius if it is too large or small */
123a7e14dcfSSatish Balay   tao->trust = PetscMax(tao->trust, tl->min_radius);
124a7e14dcfSSatish Balay   tao->trust = PetscMin(tao->trust, tl->max_radius);
125a7e14dcfSSatish Balay 
126a7e14dcfSSatish Balay   if (NTL_PC_BFGS == tl->pc_type && !tl->M) {
127a7e14dcfSSatish Balay     ierr = VecGetLocalSize(tao->solution,&n); CHKERRQ(ierr);
128a7e14dcfSSatish Balay     ierr = VecGetSize(tao->solution,&N); CHKERRQ(ierr);
129a7e14dcfSSatish Balay     ierr = MatCreateLMVM(((PetscObject)tao)->comm,n,N,&tl->M); CHKERRQ(ierr);
130a7e14dcfSSatish Balay     ierr = MatLMVMAllocateVectors(tl->M,tao->solution); CHKERRQ(ierr);
131a7e14dcfSSatish Balay   }
132a7e14dcfSSatish Balay 
133a7e14dcfSSatish Balay   /* Check convergence criteria */
134a7e14dcfSSatish Balay   ierr = TaoComputeObjectiveAndGradient(tao, tao->solution, &f, tao->gradient); CHKERRQ(ierr);
135a7e14dcfSSatish Balay   ierr = VecNorm(tao->gradient, NORM_2, &gnorm); CHKERRQ(ierr);
136a7e14dcfSSatish Balay   if (PetscIsInfOrNanReal(f) || PetscIsInfOrNanReal(gnorm)) {
137a7e14dcfSSatish Balay     SETERRQ(PETSC_COMM_SELF,1, "User provided compute function generated Inf or NaN");
138a7e14dcfSSatish Balay   }
139a7e14dcfSSatish Balay   needH = 1;
140a7e14dcfSSatish Balay 
141a7e14dcfSSatish Balay   ierr = TaoMonitor(tao, iter, f, gnorm, 0.0, 1.0, &reason); CHKERRQ(ierr);
142a7e14dcfSSatish Balay   if (reason != TAO_CONTINUE_ITERATING) {
143a7e14dcfSSatish Balay     PetscFunctionReturn(0);
144a7e14dcfSSatish Balay   }
145a7e14dcfSSatish Balay 
146a7e14dcfSSatish Balay   /* Create vectors for the limited memory preconditioner */
147a7e14dcfSSatish Balay   if ((NTL_PC_BFGS == tl->pc_type) &&
148a7e14dcfSSatish Balay       (BFGS_SCALE_BFGS != tl->bfgs_scale_type)) {
149a7e14dcfSSatish Balay     if (!tl->Diag) {
150a7e14dcfSSatish Balay       ierr = VecDuplicate(tao->solution, &tl->Diag); CHKERRQ(ierr);
151a7e14dcfSSatish Balay     }
152a7e14dcfSSatish Balay   }
153a7e14dcfSSatish Balay 
154a7e14dcfSSatish Balay   /* Modify the linear solver to a conjugate gradient method */
155a7e14dcfSSatish Balay   switch(tl->ksp_type) {
156a7e14dcfSSatish Balay   case NTL_KSP_NASH:
157a7e14dcfSSatish Balay     ierr = KSPSetType(tao->ksp, KSPNASH); CHKERRQ(ierr);
158a7e14dcfSSatish Balay     if (tao->ksp->ops->setfromoptions) {
159a7e14dcfSSatish Balay       (*tao->ksp->ops->setfromoptions)(tao->ksp);
160a7e14dcfSSatish Balay     }
161a7e14dcfSSatish Balay     break;
162a7e14dcfSSatish Balay 
163a7e14dcfSSatish Balay   case NTL_KSP_STCG:
164a7e14dcfSSatish Balay     ierr = KSPSetType(tao->ksp, KSPSTCG); CHKERRQ(ierr);
165a7e14dcfSSatish Balay     if (tao->ksp->ops->setfromoptions) {
166a7e14dcfSSatish Balay       (*tao->ksp->ops->setfromoptions)(tao->ksp);
167a7e14dcfSSatish Balay     }
168a7e14dcfSSatish Balay     break;
169a7e14dcfSSatish Balay 
170a7e14dcfSSatish Balay   default:
171a7e14dcfSSatish Balay     ierr = KSPSetType(tao->ksp, KSPGLTR); CHKERRQ(ierr);
172a7e14dcfSSatish Balay     if (tao->ksp->ops->setfromoptions) {
173a7e14dcfSSatish Balay       (*tao->ksp->ops->setfromoptions)(tao->ksp);
174a7e14dcfSSatish Balay     }
175a7e14dcfSSatish Balay     break;
176a7e14dcfSSatish Balay   }
177a7e14dcfSSatish Balay 
178a7e14dcfSSatish Balay   /* Modify the preconditioner to use the bfgs approximation */
179a7e14dcfSSatish Balay   ierr = KSPGetPC(tao->ksp, &pc); CHKERRQ(ierr);
180a7e14dcfSSatish Balay   switch(tl->pc_type) {
181a7e14dcfSSatish Balay   case NTL_PC_NONE:
182a7e14dcfSSatish Balay     ierr = PCSetType(pc, PCNONE); CHKERRQ(ierr);
183a7e14dcfSSatish Balay     if (pc->ops->setfromoptions) {
184a7e14dcfSSatish Balay       (*pc->ops->setfromoptions)(pc);
185a7e14dcfSSatish Balay     }
186a7e14dcfSSatish Balay     break;
187a7e14dcfSSatish Balay 
188a7e14dcfSSatish Balay   case NTL_PC_AHESS:
189a7e14dcfSSatish Balay     ierr = PCSetType(pc, PCJACOBI); CHKERRQ(ierr);
190a7e14dcfSSatish Balay     if (pc->ops->setfromoptions) {
191a7e14dcfSSatish Balay       (*pc->ops->setfromoptions)(pc);
192a7e14dcfSSatish Balay     }
193a7e14dcfSSatish Balay     ierr = PCJacobiSetUseAbs(pc); CHKERRQ(ierr);
194a7e14dcfSSatish Balay     break;
195a7e14dcfSSatish Balay 
196a7e14dcfSSatish Balay   case NTL_PC_BFGS:
197a7e14dcfSSatish Balay     ierr = PCSetType(pc, PCSHELL); CHKERRQ(ierr);
198a7e14dcfSSatish Balay     if (pc->ops->setfromoptions) {
199a7e14dcfSSatish Balay       (*pc->ops->setfromoptions)(pc);
200a7e14dcfSSatish Balay     }
201a7e14dcfSSatish Balay     ierr = PCShellSetName(pc, "bfgs"); CHKERRQ(ierr);
202a7e14dcfSSatish Balay     ierr = PCShellSetContext(pc, tl->M); CHKERRQ(ierr);
203a7e14dcfSSatish Balay     ierr = PCShellSetApply(pc, MatLMVMSolveShell); CHKERRQ(ierr);
204a7e14dcfSSatish Balay     break;
205a7e14dcfSSatish Balay 
206a7e14dcfSSatish Balay   default:
207a7e14dcfSSatish Balay     /* Use the pc method set by pc_type */
208a7e14dcfSSatish Balay     break;
209a7e14dcfSSatish Balay   }
210a7e14dcfSSatish Balay 
211a7e14dcfSSatish Balay   /* Initialize trust-region radius.  The initialization is only performed
212a7e14dcfSSatish Balay      when we are using Steihaug-Toint or the Generalized Lanczos method. */
213a7e14dcfSSatish Balay   switch(tl->init_type) {
214a7e14dcfSSatish Balay   case NTL_INIT_CONSTANT:
215a7e14dcfSSatish Balay     /* Use the initial radius specified */
216a7e14dcfSSatish Balay     break;
217a7e14dcfSSatish Balay 
218a7e14dcfSSatish Balay   case NTL_INIT_INTERPOLATION:
219a7e14dcfSSatish Balay     /* Choose the radius by interpolation along the steepest descent direction */
220a7e14dcfSSatish Balay     max_radius = 0.0;
221a7e14dcfSSatish Balay 
222a7e14dcfSSatish Balay     for (j = 0; j < j_max; ++j) {
223a7e14dcfSSatish Balay       fmin = f;
224a7e14dcfSSatish Balay       sigma = 0.0;
225a7e14dcfSSatish Balay 
226a7e14dcfSSatish Balay       if (needH) {
227a7e14dcfSSatish Balay         ierr = TaoComputeHessian(tao, tao->solution, &tao->hessian, &tao->hessian_pre, &matflag); CHKERRQ(ierr);
228a7e14dcfSSatish Balay         needH = 0;
229a7e14dcfSSatish Balay       }
230a7e14dcfSSatish Balay 
231a7e14dcfSSatish Balay       for (i = 0; i < i_max; ++i) {
232a7e14dcfSSatish Balay 	ierr = VecCopy(tao->solution, tl->W); CHKERRQ(ierr);
233a7e14dcfSSatish Balay 	ierr = VecAXPY(tl->W, -tao->trust/gnorm, tao->gradient); CHKERRQ(ierr);
234a7e14dcfSSatish Balay 
235a7e14dcfSSatish Balay         ierr = TaoComputeObjective(tao, tl->W, &ftrial); CHKERRQ(ierr);
236a7e14dcfSSatish Balay         if (PetscIsInfOrNanReal(ftrial)) {
237a7e14dcfSSatish Balay           tau = tl->gamma1_i;
238a7e14dcfSSatish Balay         }
239a7e14dcfSSatish Balay         else {
240a7e14dcfSSatish Balay           if (ftrial < fmin) {
241a7e14dcfSSatish Balay             fmin = ftrial;
242a7e14dcfSSatish Balay             sigma = -tao->trust / gnorm;
243a7e14dcfSSatish Balay           }
244a7e14dcfSSatish Balay 
245a7e14dcfSSatish Balay 	  ierr = MatMult(tao->hessian, tao->gradient, tao->stepdirection); CHKERRQ(ierr);
246a7e14dcfSSatish Balay 	  ierr = VecDot(tao->gradient, tao->stepdirection, &prered); CHKERRQ(ierr);
247a7e14dcfSSatish Balay 
248a7e14dcfSSatish Balay           prered = tao->trust * (gnorm - 0.5 * tao->trust * prered / (gnorm * gnorm));
249a7e14dcfSSatish Balay           actred = f - ftrial;
250a7e14dcfSSatish Balay           if ((PetscAbsScalar(actred) <= tl->epsilon) &&
251a7e14dcfSSatish Balay               (PetscAbsScalar(prered) <= tl->epsilon)) {
252a7e14dcfSSatish Balay             kappa = 1.0;
253a7e14dcfSSatish Balay           }
254a7e14dcfSSatish Balay           else {
255a7e14dcfSSatish Balay             kappa = actred / prered;
256a7e14dcfSSatish Balay           }
257a7e14dcfSSatish Balay 
258a7e14dcfSSatish Balay           tau_1 = tl->theta_i * gnorm * tao->trust / (tl->theta_i * gnorm * tao->trust + (1.0 - tl->theta_i) * prered - actred);
259a7e14dcfSSatish Balay           tau_2 = tl->theta_i * gnorm * tao->trust / (tl->theta_i * gnorm * tao->trust - (1.0 + tl->theta_i) * prered + actred);
260a7e14dcfSSatish Balay           tau_min = PetscMin(tau_1, tau_2);
261a7e14dcfSSatish Balay           tau_max = PetscMax(tau_1, tau_2);
262a7e14dcfSSatish Balay 
263a7e14dcfSSatish Balay           if (PetscAbsScalar(kappa - 1.0) <= tl->mu1_i) {
264a7e14dcfSSatish Balay             /* Great agreement */
265a7e14dcfSSatish Balay             max_radius = PetscMax(max_radius, tao->trust);
266a7e14dcfSSatish Balay 
267a7e14dcfSSatish Balay             if (tau_max < 1.0) {
268a7e14dcfSSatish Balay               tau = tl->gamma3_i;
269a7e14dcfSSatish Balay             }
270a7e14dcfSSatish Balay             else if (tau_max > tl->gamma4_i) {
271a7e14dcfSSatish Balay               tau = tl->gamma4_i;
272a7e14dcfSSatish Balay             }
273a7e14dcfSSatish Balay             else if (tau_1 >= 1.0 && tau_1 <= tl->gamma4_i && tau_2 < 1.0) {
274a7e14dcfSSatish Balay               tau = tau_1;
275a7e14dcfSSatish Balay             }
276a7e14dcfSSatish Balay             else if (tau_2 >= 1.0 && tau_2 <= tl->gamma4_i && tau_1 < 1.0) {
277a7e14dcfSSatish Balay               tau = tau_2;
278a7e14dcfSSatish Balay             }
279a7e14dcfSSatish Balay             else {
280a7e14dcfSSatish Balay               tau = tau_max;
281a7e14dcfSSatish Balay             }
282a7e14dcfSSatish Balay           }
283a7e14dcfSSatish Balay           else if (PetscAbsScalar(kappa - 1.0) <= tl->mu2_i) {
284a7e14dcfSSatish Balay             /* Good agreement */
285a7e14dcfSSatish Balay             max_radius = PetscMax(max_radius, tao->trust);
286a7e14dcfSSatish Balay 
287a7e14dcfSSatish Balay             if (tau_max < tl->gamma2_i) {
288a7e14dcfSSatish Balay 	      tau = tl->gamma2_i;
289a7e14dcfSSatish Balay 	    }
290a7e14dcfSSatish Balay 	    else if (tau_max > tl->gamma3_i) {
291a7e14dcfSSatish Balay 	      tau = tl->gamma3_i;
292a7e14dcfSSatish Balay 	    }
293a7e14dcfSSatish Balay 	    else {
294a7e14dcfSSatish Balay 	      tau = tau_max;
295a7e14dcfSSatish Balay 	    }
296a7e14dcfSSatish Balay 	  }
297a7e14dcfSSatish Balay 	  else {
298a7e14dcfSSatish Balay 	    /* Not good agreement */
299a7e14dcfSSatish Balay 	    if (tau_min > 1.0) {
300a7e14dcfSSatish Balay 	      tau = tl->gamma2_i;
301a7e14dcfSSatish Balay 	    }
302a7e14dcfSSatish Balay 	    else if (tau_max < tl->gamma1_i) {
303a7e14dcfSSatish Balay 	      tau = tl->gamma1_i;
304a7e14dcfSSatish Balay 	    }
305a7e14dcfSSatish Balay 	    else if ((tau_min < tl->gamma1_i) && (tau_max >= 1.0)) {
306a7e14dcfSSatish Balay 	      tau = tl->gamma1_i;
307a7e14dcfSSatish Balay 	    }
308a7e14dcfSSatish Balay 	    else if ((tau_1 >= tl->gamma1_i) && (tau_1 < 1.0) &&
309a7e14dcfSSatish Balay 		     ((tau_2 < tl->gamma1_i) || (tau_2 >= 1.0))) {
310a7e14dcfSSatish Balay 	      tau = tau_1;
311a7e14dcfSSatish Balay 	    }
312a7e14dcfSSatish Balay 	    else if ((tau_2 >= tl->gamma1_i) && (tau_2 < 1.0) &&
313a7e14dcfSSatish Balay 		     ((tau_1 < tl->gamma1_i) || (tau_2 >= 1.0))) {
314a7e14dcfSSatish Balay 	      tau = tau_2;
315a7e14dcfSSatish Balay 	    }
316a7e14dcfSSatish Balay 	    else {
317a7e14dcfSSatish Balay 	      tau = tau_max;
318a7e14dcfSSatish Balay 	    }
319a7e14dcfSSatish Balay 	  }
320a7e14dcfSSatish Balay 	}
321a7e14dcfSSatish Balay 	tao->trust = tau * tao->trust;
322a7e14dcfSSatish Balay       }
323a7e14dcfSSatish Balay 
324a7e14dcfSSatish Balay       if (fmin < f) {
325a7e14dcfSSatish Balay 	f = fmin;
326a7e14dcfSSatish Balay 	ierr = VecAXPY(tao->solution, sigma, tao->gradient); CHKERRQ(ierr);
327a7e14dcfSSatish Balay 	ierr = TaoComputeGradient(tao, tao->solution, tao->gradient); CHKERRQ(ierr);
328a7e14dcfSSatish Balay 
329a7e14dcfSSatish Balay 	ierr = VecNorm(tao->gradient, NORM_2, &gnorm); CHKERRQ(ierr);
330a7e14dcfSSatish Balay 	if (PetscIsInfOrNanReal(f) || PetscIsInfOrNanReal(gnorm)) {
331a7e14dcfSSatish Balay 	  SETERRQ(PETSC_COMM_SELF,1, "User provided compute function generated Inf or NaN");
332a7e14dcfSSatish Balay 	}
333a7e14dcfSSatish Balay 	needH = 1;
334a7e14dcfSSatish Balay 
335a7e14dcfSSatish Balay 	ierr = TaoMonitor(tao, iter, f, gnorm, 0.0, 1.0, &reason); CHKERRQ(ierr);
336a7e14dcfSSatish Balay 	if (reason != TAO_CONTINUE_ITERATING) {
337a7e14dcfSSatish Balay 	  PetscFunctionReturn(0);
338a7e14dcfSSatish Balay 	}
339a7e14dcfSSatish Balay       }
340a7e14dcfSSatish Balay     }
341a7e14dcfSSatish Balay     tao->trust = PetscMax(tao->trust, max_radius);
342a7e14dcfSSatish Balay 
343a7e14dcfSSatish Balay     /* Modify the radius if it is too large or small */
344a7e14dcfSSatish Balay     tao->trust = PetscMax(tao->trust, tl->min_radius);
345a7e14dcfSSatish Balay     tao->trust = PetscMin(tao->trust, tl->max_radius);
346a7e14dcfSSatish Balay     break;
347a7e14dcfSSatish Balay 
348a7e14dcfSSatish Balay   default:
349a7e14dcfSSatish Balay     /* Norm of the first direction will initialize radius */
350a7e14dcfSSatish Balay     tao->trust = 0.0;
351a7e14dcfSSatish Balay     break;
352a7e14dcfSSatish Balay   }
353a7e14dcfSSatish Balay 
354a7e14dcfSSatish Balay   /* Set initial scaling for the BFGS preconditioner
355a7e14dcfSSatish Balay      This step is done after computing the initial trust-region radius
356a7e14dcfSSatish Balay      since the function value may have decreased */
357a7e14dcfSSatish Balay   if (NTL_PC_BFGS == tl->pc_type) {
358a7e14dcfSSatish Balay     if (f != 0.0) {
359a7e14dcfSSatish Balay       delta = 2.0 * PetscAbsScalar(f) / (gnorm*gnorm);
360a7e14dcfSSatish Balay     }
361a7e14dcfSSatish Balay     else {
362a7e14dcfSSatish Balay       delta = 2.0 / (gnorm*gnorm);
363a7e14dcfSSatish Balay     }
364a7e14dcfSSatish Balay     ierr = MatLMVMSetDelta(tl->M, delta); CHKERRQ(ierr);
365a7e14dcfSSatish Balay   }
366a7e14dcfSSatish Balay 
367a7e14dcfSSatish Balay   /* Set counter for gradient/reset steps */
368a7e14dcfSSatish Balay   tl->ntrust = 0;
369a7e14dcfSSatish Balay   tl->newt = 0;
370a7e14dcfSSatish Balay   tl->bfgs = 0;
371a7e14dcfSSatish Balay   tl->sgrad = 0;
372a7e14dcfSSatish Balay   tl->grad = 0;
373a7e14dcfSSatish Balay 
374a7e14dcfSSatish Balay   /* Have not converged; continue with Newton method */
375a7e14dcfSSatish Balay   while (reason == TAO_CONTINUE_ITERATING) {
376a7e14dcfSSatish Balay     ++iter;
377a7e14dcfSSatish Balay 
378a7e14dcfSSatish Balay     /* Compute the Hessian */
379a7e14dcfSSatish Balay     if (needH) {
380a7e14dcfSSatish Balay       ierr = TaoComputeHessian(tao, tao->solution, &tao->hessian, &tao->hessian_pre, &matflag); CHKERRQ(ierr);
381a7e14dcfSSatish Balay       needH = 0;
382a7e14dcfSSatish Balay     }
383a7e14dcfSSatish Balay 
384a7e14dcfSSatish Balay     if (NTL_PC_BFGS == tl->pc_type) {
385a7e14dcfSSatish Balay       if (BFGS_SCALE_AHESS == tl->bfgs_scale_type) {
386a7e14dcfSSatish Balay 	/* Obtain diagonal for the bfgs preconditioner */
387a7e14dcfSSatish Balay 	ierr = MatGetDiagonal(tao->hessian, tl->Diag); CHKERRQ(ierr);
388a7e14dcfSSatish Balay 	ierr = VecAbs(tl->Diag); CHKERRQ(ierr);
389a7e14dcfSSatish Balay 	ierr = VecReciprocal(tl->Diag); CHKERRQ(ierr);
390a7e14dcfSSatish Balay 	ierr = MatLMVMSetScale(tl->M, tl->Diag); CHKERRQ(ierr);
391a7e14dcfSSatish Balay       }
392a7e14dcfSSatish Balay 
393a7e14dcfSSatish Balay       /* Update the limited memory preconditioner */
394a7e14dcfSSatish Balay       ierr = MatLMVMUpdate(tl->M,tao->solution, tao->gradient); CHKERRQ(ierr);
395a7e14dcfSSatish Balay       ++bfgsUpdates;
396a7e14dcfSSatish Balay     }
397a7e14dcfSSatish Balay     ierr = KSPSetOperators(tao->ksp, tao->hessian, tao->hessian_pre, matflag); CHKERRQ(ierr);
398a7e14dcfSSatish Balay     /* Solve the Newton system of equations */
399a7e14dcfSSatish Balay     if (NTL_KSP_NASH == tl->ksp_type) {
400a7e14dcfSSatish Balay       ierr = KSPNASHSetRadius(tao->ksp,tl->max_radius); CHKERRQ(ierr);
401a7e14dcfSSatish Balay       ierr = KSPSolve(tao->ksp, tao->gradient, tao->stepdirection); CHKERRQ(ierr);
402a7e14dcfSSatish Balay       ierr = KSPGetIterationNumber(tao->ksp,&its); CHKERRQ(ierr);
403a7e14dcfSSatish Balay       tao->ksp_its+=its;
404a7e14dcfSSatish Balay       ierr = KSPNASHGetNormD(tao->ksp, &norm_d); CHKERRQ(ierr);
405a7e14dcfSSatish Balay     } else if (NTL_KSP_STCG == tl->ksp_type) {
406a7e14dcfSSatish Balay       ierr = KSPSTCGSetRadius(tao->ksp,tl->max_radius); CHKERRQ(ierr);
407a7e14dcfSSatish Balay       ierr = KSPSolve(tao->ksp, tao->gradient, tao->stepdirection); CHKERRQ(ierr);
408a7e14dcfSSatish Balay       ierr = KSPGetIterationNumber(tao->ksp,&its); CHKERRQ(ierr);
409a7e14dcfSSatish Balay       tao->ksp_its+=its;
410a7e14dcfSSatish Balay       ierr = KSPSTCGGetNormD(tao->ksp, &norm_d); CHKERRQ(ierr);
411a7e14dcfSSatish Balay     } else { /* NTL_KSP_GLTR */
412a7e14dcfSSatish Balay       ierr = KSPGLTRSetRadius(tao->ksp,tl->max_radius); CHKERRQ(ierr);
413a7e14dcfSSatish Balay       ierr = KSPSolve(tao->ksp, tao->gradient, tao->stepdirection); CHKERRQ(ierr);
414a7e14dcfSSatish Balay       ierr = KSPGetIterationNumber(tao->ksp,&its); CHKERRQ(ierr);
415a7e14dcfSSatish Balay       tao->ksp_its+=its;
416a7e14dcfSSatish Balay       ierr = KSPGLTRGetNormD(tao->ksp, &norm_d); CHKERRQ(ierr);
417a7e14dcfSSatish Balay     }
418a7e14dcfSSatish Balay 
419a7e14dcfSSatish Balay     if (0.0 == tao->trust) {
420a7e14dcfSSatish Balay       /* Radius was uninitialized; use the norm of the direction */
421a7e14dcfSSatish Balay       if (norm_d > 0.0) {
422a7e14dcfSSatish Balay 	tao->trust = norm_d;
423a7e14dcfSSatish Balay 
424a7e14dcfSSatish Balay 	/* Modify the radius if it is too large or small */
425a7e14dcfSSatish Balay 	tao->trust = PetscMax(tao->trust, tl->min_radius);
426a7e14dcfSSatish Balay 	tao->trust = PetscMin(tao->trust, tl->max_radius);
427a7e14dcfSSatish Balay       }
428a7e14dcfSSatish Balay       else {
429a7e14dcfSSatish Balay 	/* The direction was bad; set radius to default value and re-solve
430a7e14dcfSSatish Balay 	   the trust-region subproblem to get a direction */
431a7e14dcfSSatish Balay 	tao->trust = tao->trust0;
432a7e14dcfSSatish Balay 
433a7e14dcfSSatish Balay 	/* Modify the radius if it is too large or small */
434a7e14dcfSSatish Balay 	tao->trust = PetscMax(tao->trust, tl->min_radius);
435a7e14dcfSSatish Balay 	tao->trust = PetscMin(tao->trust, tl->max_radius);
436a7e14dcfSSatish Balay 
437a7e14dcfSSatish Balay 	if (NTL_KSP_NASH == tl->ksp_type) {
438a7e14dcfSSatish Balay 	  ierr = KSPNASHSetRadius(tao->ksp,tl->max_radius); CHKERRQ(ierr);
439a7e14dcfSSatish Balay 	  ierr = KSPSolve(tao->ksp, tao->gradient, tao->stepdirection); CHKERRQ(ierr);
440a7e14dcfSSatish Balay 	  ierr = KSPGetIterationNumber(tao->ksp,&its); CHKERRQ(ierr);
441a7e14dcfSSatish Balay 	  tao->ksp_its+=its;
442a7e14dcfSSatish Balay 	  ierr = KSPNASHGetNormD(tao->ksp, &norm_d); CHKERRQ(ierr);
443a7e14dcfSSatish Balay 	} else if (NTL_KSP_STCG == tl->ksp_type) {
444a7e14dcfSSatish Balay 	  ierr = KSPSTCGSetRadius(tao->ksp,tl->max_radius); CHKERRQ(ierr);
445a7e14dcfSSatish Balay 	  ierr = KSPSolve(tao->ksp, tao->gradient, tao->stepdirection); CHKERRQ(ierr);
446a7e14dcfSSatish Balay 	  ierr = KSPGetIterationNumber(tao->ksp,&its); CHKERRQ(ierr);
447a7e14dcfSSatish Balay 	  tao->ksp_its+=its;
448a7e14dcfSSatish Balay 	  ierr = KSPSTCGGetNormD(tao->ksp, &norm_d); CHKERRQ(ierr);
449a7e14dcfSSatish Balay 	} else { /* NTL_KSP_GLTR */
450a7e14dcfSSatish Balay 	  ierr = KSPGLTRSetRadius(tao->ksp,tl->max_radius); CHKERRQ(ierr);
451a7e14dcfSSatish Balay 	  ierr = KSPSolve(tao->ksp, tao->gradient, tao->stepdirection); CHKERRQ(ierr);
452a7e14dcfSSatish Balay 	  ierr = KSPGetIterationNumber(tao->ksp,&its); CHKERRQ(ierr);
453a7e14dcfSSatish Balay 	  tao->ksp_its+=its;
454a7e14dcfSSatish Balay 	  ierr = KSPGLTRGetNormD(tao->ksp, &norm_d); CHKERRQ(ierr);
455a7e14dcfSSatish Balay 	}
456a7e14dcfSSatish Balay 
457a7e14dcfSSatish Balay 
458a7e14dcfSSatish Balay 	if (norm_d == 0.0) {
459a7e14dcfSSatish Balay 	  SETERRQ(PETSC_COMM_SELF,1, "Initial direction zero");
460a7e14dcfSSatish Balay 	}
461a7e14dcfSSatish Balay       }
462a7e14dcfSSatish Balay     }
463a7e14dcfSSatish Balay 
464a7e14dcfSSatish Balay     ierr = VecScale(tao->stepdirection, -1.0); CHKERRQ(ierr);
465a7e14dcfSSatish Balay     ierr = KSPGetConvergedReason(tao->ksp, &ksp_reason); CHKERRQ(ierr);
466a7e14dcfSSatish Balay     if ((KSP_DIVERGED_INDEFINITE_PC == ksp_reason) &&
467a7e14dcfSSatish Balay         (NTL_PC_BFGS == tl->pc_type) && (bfgsUpdates > 1)) {
468a7e14dcfSSatish Balay       /* Preconditioner is numerically indefinite; reset the
469a7e14dcfSSatish Balay 	 approximate if using BFGS preconditioning. */
470a7e14dcfSSatish Balay 
471a7e14dcfSSatish Balay       if (f != 0.0) {
472a7e14dcfSSatish Balay         delta = 2.0 * PetscAbsScalar(f) / (gnorm*gnorm);
473a7e14dcfSSatish Balay       }
474a7e14dcfSSatish Balay       else {
475a7e14dcfSSatish Balay         delta = 2.0 / (gnorm*gnorm);
476a7e14dcfSSatish Balay       }
477a7e14dcfSSatish Balay       ierr = MatLMVMSetDelta(tl->M, delta); CHKERRQ(ierr);
478a7e14dcfSSatish Balay       ierr = MatLMVMReset(tl->M); CHKERRQ(ierr);
479a7e14dcfSSatish Balay       ierr = MatLMVMUpdate(tl->M, tao->solution, tao->gradient); CHKERRQ(ierr);
480a7e14dcfSSatish Balay       bfgsUpdates = 1;
481a7e14dcfSSatish Balay     }
482a7e14dcfSSatish Balay 
483a7e14dcfSSatish Balay     /* Check trust-region reduction conditions */
484a7e14dcfSSatish Balay     tr_reject = 0;
485a7e14dcfSSatish Balay     if (NTL_UPDATE_REDUCTION == tl->update_type) {
486a7e14dcfSSatish Balay       /* Get predicted reduction */
487a7e14dcfSSatish Balay       if (NTL_KSP_NASH == tl->ksp_type) {
488a7e14dcfSSatish Balay 	ierr = KSPNASHGetObjFcn(tao->ksp,&prered); CHKERRQ(ierr);
489a7e14dcfSSatish Balay       } else if (NTL_KSP_STCG == tl->ksp_type) {
490a7e14dcfSSatish Balay 	ierr = KSPSTCGGetObjFcn(tao->ksp,&prered); CHKERRQ(ierr);
491a7e14dcfSSatish Balay       } else { /* gltr */
492a7e14dcfSSatish Balay 	ierr = KSPGLTRGetObjFcn(tao->ksp,&prered); CHKERRQ(ierr);
493a7e14dcfSSatish Balay       }
494a7e14dcfSSatish Balay 
495a7e14dcfSSatish Balay       if (prered >= 0.0) {
496a7e14dcfSSatish Balay 	/* The predicted reduction has the wrong sign.  This cannot
497a7e14dcfSSatish Balay 	   happen in infinite precision arithmetic.  Step should
498a7e14dcfSSatish Balay 	   be rejected! */
499a7e14dcfSSatish Balay 	tao->trust = tl->alpha1 * PetscMin(tao->trust, norm_d);
500a7e14dcfSSatish Balay 	tr_reject = 1;
501a7e14dcfSSatish Balay       }
502a7e14dcfSSatish Balay       else {
503a7e14dcfSSatish Balay 	/* Compute trial step and function value */
504a7e14dcfSSatish Balay 	ierr = VecCopy(tao->solution, tl->W); CHKERRQ(ierr);
505a7e14dcfSSatish Balay 	ierr = VecAXPY(tl->W, 1.0, tao->stepdirection); CHKERRQ(ierr);
506a7e14dcfSSatish Balay 	ierr = TaoComputeObjective(tao, tl->W, &ftrial); CHKERRQ(ierr);
507a7e14dcfSSatish Balay 
508a7e14dcfSSatish Balay 	if (PetscIsInfOrNanReal(ftrial)) {
509a7e14dcfSSatish Balay 	  tao->trust = tl->alpha1 * PetscMin(tao->trust, norm_d);
510a7e14dcfSSatish Balay 	  tr_reject = 1;
511a7e14dcfSSatish Balay 	}
512a7e14dcfSSatish Balay 	else {
513a7e14dcfSSatish Balay 	  /* Compute actual and predicted reduction */
514a7e14dcfSSatish Balay 	  actred = f - ftrial;
515a7e14dcfSSatish Balay 	  prered = -prered;
516a7e14dcfSSatish Balay 	  if ((PetscAbsScalar(actred) <= tl->epsilon) &&
517a7e14dcfSSatish Balay 	      (PetscAbsScalar(prered) <= tl->epsilon)) {
518a7e14dcfSSatish Balay 	    kappa = 1.0;
519a7e14dcfSSatish Balay 	  }
520a7e14dcfSSatish Balay 	  else {
521a7e14dcfSSatish Balay 	    kappa = actred / prered;
522a7e14dcfSSatish Balay 	  }
523a7e14dcfSSatish Balay 
524a7e14dcfSSatish Balay 	  /* Accept or reject the step and update radius */
525a7e14dcfSSatish Balay 	  if (kappa < tl->eta1) {
526a7e14dcfSSatish Balay 	    /* Reject the step */
527a7e14dcfSSatish Balay 	    tao->trust = tl->alpha1 * PetscMin(tao->trust, norm_d);
528a7e14dcfSSatish Balay 	    tr_reject = 1;
529a7e14dcfSSatish Balay 	  }
530a7e14dcfSSatish Balay 	  else {
531a7e14dcfSSatish Balay 	    /* Accept the step */
532a7e14dcfSSatish Balay 	    if (kappa < tl->eta2) {
533a7e14dcfSSatish Balay 	      /* Marginal bad step */
534a7e14dcfSSatish Balay 	      tao->trust = tl->alpha2 * PetscMin(tao->trust, norm_d);
535a7e14dcfSSatish Balay 	    }
536a7e14dcfSSatish Balay 	    else if (kappa < tl->eta3) {
537a7e14dcfSSatish Balay 	      /* Reasonable step */
538a7e14dcfSSatish Balay 	      tao->trust = tl->alpha3 * tao->trust;
539a7e14dcfSSatish Balay 	    }
540a7e14dcfSSatish Balay 	    else if (kappa < tl->eta4) {
541a7e14dcfSSatish Balay 	      /* Good step */
542a7e14dcfSSatish Balay 	      tao->trust = PetscMax(tl->alpha4 * norm_d, tao->trust);
543a7e14dcfSSatish Balay 	    }
544a7e14dcfSSatish Balay 	    else {
545a7e14dcfSSatish Balay 	      /* Very good step */
546a7e14dcfSSatish Balay 	      tao->trust = PetscMax(tl->alpha5 * norm_d, tao->trust);
547a7e14dcfSSatish Balay 	    }
548a7e14dcfSSatish Balay 	  }
549a7e14dcfSSatish Balay 	}
550a7e14dcfSSatish Balay       }
551a7e14dcfSSatish Balay     }
552a7e14dcfSSatish Balay     else {
553a7e14dcfSSatish Balay       /* Get predicted reduction */
554a7e14dcfSSatish Balay       if (NTL_KSP_NASH == tl->ksp_type) {
555a7e14dcfSSatish Balay 	ierr = KSPNASHGetObjFcn(tao->ksp,&prered); CHKERRQ(ierr);
556a7e14dcfSSatish Balay       } else if (NTL_KSP_STCG == tl->ksp_type) {
557a7e14dcfSSatish Balay 	ierr = KSPSTCGGetObjFcn(tao->ksp,&prered); CHKERRQ(ierr);
558a7e14dcfSSatish Balay       } else { /* gltr */
559a7e14dcfSSatish Balay 	ierr = KSPGLTRGetObjFcn(tao->ksp,&prered); CHKERRQ(ierr);
560a7e14dcfSSatish Balay       }
561a7e14dcfSSatish Balay 
562a7e14dcfSSatish Balay       if (prered >= 0.0) {
563a7e14dcfSSatish Balay 	/* The predicted reduction has the wrong sign.  This cannot
564a7e14dcfSSatish Balay 	   happen in infinite precision arithmetic.  Step should
565a7e14dcfSSatish Balay 	   be rejected! */
566a7e14dcfSSatish Balay 	tao->trust = tl->gamma1 * PetscMin(tao->trust, norm_d);
567a7e14dcfSSatish Balay 	tr_reject = 1;
568a7e14dcfSSatish Balay       }
569a7e14dcfSSatish Balay       else {
570a7e14dcfSSatish Balay 	ierr = VecCopy(tao->solution, tl->W); CHKERRQ(ierr);
571a7e14dcfSSatish Balay 	ierr = VecAXPY(tl->W, 1.0, tao->stepdirection); CHKERRQ(ierr);
572a7e14dcfSSatish Balay 	ierr = TaoComputeObjective(tao, tl->W, &ftrial); CHKERRQ(ierr);
573a7e14dcfSSatish Balay 	if (PetscIsInfOrNanReal(ftrial)) {
574a7e14dcfSSatish Balay 	  tao->trust = tl->gamma1 * PetscMin(tao->trust, norm_d);
575a7e14dcfSSatish Balay 	  tr_reject = 1;
576a7e14dcfSSatish Balay 	}
577a7e14dcfSSatish Balay 	else {
578a7e14dcfSSatish Balay 	  ierr = VecDot(tao->gradient, tao->stepdirection, &gdx); CHKERRQ(ierr);
579a7e14dcfSSatish Balay 
580a7e14dcfSSatish Balay 	  actred = f - ftrial;
581a7e14dcfSSatish Balay 	  prered = -prered;
582a7e14dcfSSatish Balay 	  if ((PetscAbsScalar(actred) <= tl->epsilon) &&
583a7e14dcfSSatish Balay 	      (PetscAbsScalar(prered) <= tl->epsilon)) {
584a7e14dcfSSatish Balay 	    kappa = 1.0;
585a7e14dcfSSatish Balay 	  }
586a7e14dcfSSatish Balay 	  else {
587a7e14dcfSSatish Balay 	    kappa = actred / prered;
588a7e14dcfSSatish Balay 	  }
589a7e14dcfSSatish Balay 
590a7e14dcfSSatish Balay 	  tau_1 = tl->theta * gdx / (tl->theta * gdx - (1.0 - tl->theta) * prered + actred);
591a7e14dcfSSatish Balay 	  tau_2 = tl->theta * gdx / (tl->theta * gdx + (1.0 + tl->theta) * prered - actred);
592a7e14dcfSSatish Balay 	  tau_min = PetscMin(tau_1, tau_2);
593a7e14dcfSSatish Balay 	  tau_max = PetscMax(tau_1, tau_2);
594a7e14dcfSSatish Balay 
595a7e14dcfSSatish Balay 	  if (kappa >= 1.0 - tl->mu1) {
596a7e14dcfSSatish Balay 	    /* Great agreement; accept step and update radius */
597a7e14dcfSSatish Balay 	    if (tau_max < 1.0) {
598a7e14dcfSSatish Balay 	      tao->trust = PetscMax(tao->trust, tl->gamma3 * norm_d);
599a7e14dcfSSatish Balay 	    }
600a7e14dcfSSatish Balay 	    else if (tau_max > tl->gamma4) {
601a7e14dcfSSatish Balay 	      tao->trust = PetscMax(tao->trust, tl->gamma4 * norm_d);
602a7e14dcfSSatish Balay 	    }
603a7e14dcfSSatish Balay 	    else {
604a7e14dcfSSatish Balay 	      tao->trust = PetscMax(tao->trust, tau_max * norm_d);
605a7e14dcfSSatish Balay 	    }
606a7e14dcfSSatish Balay 	  }
607a7e14dcfSSatish Balay 	  else if (kappa >= 1.0 - tl->mu2) {
608a7e14dcfSSatish Balay 	    /* Good agreement */
609a7e14dcfSSatish Balay 
610a7e14dcfSSatish Balay 	    if (tau_max < tl->gamma2) {
611a7e14dcfSSatish Balay 	      tao->trust = tl->gamma2 * PetscMin(tao->trust, norm_d);
612a7e14dcfSSatish Balay 	    }
613a7e14dcfSSatish Balay 	    else if (tau_max > tl->gamma3) {
614a7e14dcfSSatish Balay 	      tao->trust = PetscMax(tao->trust, tl->gamma3 * norm_d);
615a7e14dcfSSatish Balay 	    }              else if (tau_max < 1.0) {
616a7e14dcfSSatish Balay 	      tao->trust = tau_max * PetscMin(tao->trust, norm_d);
617a7e14dcfSSatish Balay 	    }
618a7e14dcfSSatish Balay 	    else {
619a7e14dcfSSatish Balay 	      tao->trust = PetscMax(tao->trust, tau_max * norm_d);
620a7e14dcfSSatish Balay 	    }
621a7e14dcfSSatish Balay 	  }
622a7e14dcfSSatish Balay 	  else {
623a7e14dcfSSatish Balay 	    /* Not good agreement */
624a7e14dcfSSatish Balay 	    if (tau_min > 1.0) {
625a7e14dcfSSatish Balay 	      tao->trust = tl->gamma2 * PetscMin(tao->trust, norm_d);
626a7e14dcfSSatish Balay 	    }
627a7e14dcfSSatish Balay 	    else if (tau_max < tl->gamma1) {
628a7e14dcfSSatish Balay 	      tao->trust = tl->gamma1 * PetscMin(tao->trust, norm_d);
629a7e14dcfSSatish Balay 	    }
630a7e14dcfSSatish Balay 	    else if ((tau_min < tl->gamma1) && (tau_max >= 1.0)) {
631a7e14dcfSSatish Balay 	      tao->trust = tl->gamma1 * PetscMin(tao->trust, norm_d);
632a7e14dcfSSatish Balay 	    }
633a7e14dcfSSatish Balay 	    else if ((tau_1 >= tl->gamma1) && (tau_1 < 1.0) &&
634a7e14dcfSSatish Balay 		     ((tau_2 < tl->gamma1) || (tau_2 >= 1.0))) {
635a7e14dcfSSatish Balay 	      tao->trust = tau_1 * PetscMin(tao->trust, norm_d);
636a7e14dcfSSatish Balay 	    }
637a7e14dcfSSatish Balay 	    else if ((tau_2 >= tl->gamma1) && (tau_2 < 1.0) &&
638a7e14dcfSSatish Balay 		     ((tau_1 < tl->gamma1) || (tau_2 >= 1.0))) {
639a7e14dcfSSatish Balay 	      tao->trust = tau_2 * PetscMin(tao->trust, norm_d);
640a7e14dcfSSatish Balay 	    }
641a7e14dcfSSatish Balay 	    else {
642a7e14dcfSSatish Balay 	      tao->trust = tau_max * PetscMin(tao->trust, norm_d);
643a7e14dcfSSatish Balay 	    }
644a7e14dcfSSatish Balay 	    tr_reject = 1;
645a7e14dcfSSatish Balay 	  }
646a7e14dcfSSatish Balay 	}
647a7e14dcfSSatish Balay       }
648a7e14dcfSSatish Balay     }
649a7e14dcfSSatish Balay 
650a7e14dcfSSatish Balay     if (tr_reject) {
651a7e14dcfSSatish Balay       /* The trust-region constraints rejected the step.  Apply a linesearch.
652a7e14dcfSSatish Balay 	 Check for descent direction. */
653a7e14dcfSSatish Balay       ierr = VecDot(tao->stepdirection, tao->gradient, &gdx); CHKERRQ(ierr);
654a7e14dcfSSatish Balay       if ((gdx >= 0.0) || PetscIsInfOrNanReal(gdx)) {
655a7e14dcfSSatish Balay 	/* Newton step is not descent or direction produced Inf or NaN */
656a7e14dcfSSatish Balay 
657a7e14dcfSSatish Balay 	if (NTL_PC_BFGS != tl->pc_type) {
658a7e14dcfSSatish Balay 	  /* We don't have the bfgs matrix around and updated
659a7e14dcfSSatish Balay 	     Must use gradient direction in this case */
660a7e14dcfSSatish Balay 	  ierr = VecCopy(tao->gradient, tao->stepdirection); CHKERRQ(ierr);
661a7e14dcfSSatish Balay 	  ierr = VecScale(tao->stepdirection, -1.0); CHKERRQ(ierr);
662a7e14dcfSSatish Balay 	  ++tl->grad;
663a7e14dcfSSatish Balay 	  stepType = NTL_GRADIENT;
664a7e14dcfSSatish Balay 	}
665a7e14dcfSSatish Balay 	else {
666a7e14dcfSSatish Balay 	  /* Attempt to use the BFGS direction */
667a7e14dcfSSatish Balay 	  ierr = MatLMVMSolve(tl->M, tao->gradient, tao->stepdirection); CHKERRQ(ierr);
668a7e14dcfSSatish Balay 	  ierr = VecScale(tao->stepdirection, -1.0); CHKERRQ(ierr);
669a7e14dcfSSatish Balay 
670a7e14dcfSSatish Balay 	  /* Check for success (descent direction) */
671a7e14dcfSSatish Balay 	  ierr = VecDot(tao->stepdirection, tao->gradient, &gdx); CHKERRQ(ierr);
672a7e14dcfSSatish Balay 	  if ((gdx >= 0) || PetscIsInfOrNanReal(gdx)) {
673a7e14dcfSSatish Balay 	    /* BFGS direction is not descent or direction produced not a number
674a7e14dcfSSatish Balay 	       We can assert bfgsUpdates > 1 in this case because
675a7e14dcfSSatish Balay 	       the first solve produces the scaled gradient direction,
676a7e14dcfSSatish Balay 	       which is guaranteed to be descent */
677a7e14dcfSSatish Balay 
678a7e14dcfSSatish Balay 	    /* Use steepest descent direction (scaled) */
679a7e14dcfSSatish Balay 	    if (f != 0.0) {
680a7e14dcfSSatish Balay 	      delta = 2.0 * PetscAbsScalar(f) / (gnorm*gnorm);
681a7e14dcfSSatish Balay 	    }
682a7e14dcfSSatish Balay 	    else {
683a7e14dcfSSatish Balay 	      delta = 2.0 / (gnorm*gnorm);
684a7e14dcfSSatish Balay 	    }
685a7e14dcfSSatish Balay 	    ierr = MatLMVMSetDelta(tl->M, delta); CHKERRQ(ierr);
686a7e14dcfSSatish Balay 	    ierr = MatLMVMReset(tl->M); CHKERRQ(ierr);
687a7e14dcfSSatish Balay 	    ierr = MatLMVMUpdate(tl->M, tao->solution, tao->gradient); CHKERRQ(ierr);
688a7e14dcfSSatish Balay 	    ierr = MatLMVMSolve(tl->M, tao->gradient, tao->stepdirection); CHKERRQ(ierr);
689a7e14dcfSSatish Balay 	    ierr = VecScale(tao->stepdirection, -1.0); CHKERRQ(ierr);
690a7e14dcfSSatish Balay 
691a7e14dcfSSatish Balay 	    bfgsUpdates = 1;
692a7e14dcfSSatish Balay 	    ++tl->sgrad;
693a7e14dcfSSatish Balay 	    stepType = NTL_SCALED_GRADIENT;
694a7e14dcfSSatish Balay 	  }
695a7e14dcfSSatish Balay 	  else {
696a7e14dcfSSatish Balay 	    if (1 == bfgsUpdates) {
697a7e14dcfSSatish Balay 	      /* The first BFGS direction is always the scaled gradient */
698a7e14dcfSSatish Balay 	      ++tl->sgrad;
699a7e14dcfSSatish Balay 	      stepType = NTL_SCALED_GRADIENT;
700a7e14dcfSSatish Balay 	    }
701a7e14dcfSSatish Balay 	    else {
702a7e14dcfSSatish Balay 	      ++tl->bfgs;
703a7e14dcfSSatish Balay 	      stepType = NTL_BFGS;
704a7e14dcfSSatish Balay 	    }
705a7e14dcfSSatish Balay 	  }
706a7e14dcfSSatish Balay 	}
707a7e14dcfSSatish Balay       }
708a7e14dcfSSatish Balay       else {
709a7e14dcfSSatish Balay 	/* Computed Newton step is descent */
710a7e14dcfSSatish Balay 	++tl->newt;
711a7e14dcfSSatish Balay 	stepType = NTL_NEWTON;
712a7e14dcfSSatish Balay       }
713a7e14dcfSSatish Balay 
714a7e14dcfSSatish Balay       /* Perform the linesearch */
715a7e14dcfSSatish Balay       fold = f;
716a7e14dcfSSatish Balay       ierr = VecCopy(tao->solution, tl->Xold); CHKERRQ(ierr);
717a7e14dcfSSatish Balay       ierr = VecCopy(tao->gradient, tl->Gold); CHKERRQ(ierr);
718a7e14dcfSSatish Balay 
719a7e14dcfSSatish Balay       step = 1.0;
720a7e14dcfSSatish Balay       ierr = TaoLineSearchApply(tao->linesearch, tao->solution, &f, tao->gradient, tao->stepdirection, &step, &ls_reason); CHKERRQ(ierr);
721a7e14dcfSSatish Balay       ierr = TaoAddLineSearchCounts(tao); CHKERRQ(ierr);
722a7e14dcfSSatish Balay 
723a7e14dcfSSatish Balay 
724a7e14dcfSSatish Balay       while (ls_reason != TAOLINESEARCH_SUCCESS &&
725a7e14dcfSSatish Balay 	   ls_reason != TAOLINESEARCH_SUCCESS_USER &&
726a7e14dcfSSatish Balay 	   stepType != NTL_GRADIENT) {      /* Linesearch failed */
727a7e14dcfSSatish Balay 	/* Linesearch failed */
728a7e14dcfSSatish Balay 	f = fold;
729a7e14dcfSSatish Balay 	ierr = VecCopy(tl->Xold, tao->solution); CHKERRQ(ierr);
730a7e14dcfSSatish Balay 	ierr = VecCopy(tl->Gold, tao->gradient); CHKERRQ(ierr);
731a7e14dcfSSatish Balay 
732a7e14dcfSSatish Balay 	switch(stepType) {
733a7e14dcfSSatish Balay 	case NTL_NEWTON:
734a7e14dcfSSatish Balay 	  /* Failed to obtain acceptable iterate with Newton step */
735a7e14dcfSSatish Balay 
736a7e14dcfSSatish Balay 	  if (NTL_PC_BFGS != tl->pc_type) {
737a7e14dcfSSatish Balay 	    /* We don't have the bfgs matrix around and being updated
738a7e14dcfSSatish Balay 	       Must use gradient direction in this case */
739a7e14dcfSSatish Balay 	    ierr = VecCopy(tao->gradient, tao->stepdirection); CHKERRQ(ierr);
740a7e14dcfSSatish Balay 	    ++tl->grad;
741a7e14dcfSSatish Balay 	    stepType = NTL_GRADIENT;
742a7e14dcfSSatish Balay 	  }
743a7e14dcfSSatish Balay 	  else {
744a7e14dcfSSatish Balay 	    /* Attempt to use the BFGS direction */
745a7e14dcfSSatish Balay 	    ierr = MatLMVMSolve(tl->M, tao->gradient, tao->stepdirection); CHKERRQ(ierr);
746a7e14dcfSSatish Balay 
747a7e14dcfSSatish Balay 
748a7e14dcfSSatish Balay 	    /* Check for success (descent direction) */
749a7e14dcfSSatish Balay 	    ierr = VecDot(tao->stepdirection, tao->gradient, &gdx); CHKERRQ(ierr);
750a7e14dcfSSatish Balay 	    if ((gdx <= 0) || PetscIsInfOrNanReal(gdx)) {
751a7e14dcfSSatish Balay 	      /* BFGS direction is not descent or direction produced
752a7e14dcfSSatish Balay 		 not a number.  We can assert bfgsUpdates > 1 in this case
753a7e14dcfSSatish Balay 		 Use steepest descent direction (scaled) */
754a7e14dcfSSatish Balay 
755a7e14dcfSSatish Balay 	      if (f != 0.0) {
756a7e14dcfSSatish Balay 		delta = 2.0 * PetscAbsScalar(f) / (gnorm*gnorm);
757a7e14dcfSSatish Balay 	      }
758a7e14dcfSSatish Balay 	      else {
759a7e14dcfSSatish Balay 		delta = 2.0 / (gnorm*gnorm);
760a7e14dcfSSatish Balay 	      }
761a7e14dcfSSatish Balay 	      ierr = MatLMVMSetDelta(tl->M, delta); CHKERRQ(ierr);
762a7e14dcfSSatish Balay 	      ierr = MatLMVMReset(tl->M); CHKERRQ(ierr);
763a7e14dcfSSatish Balay 	      ierr = MatLMVMUpdate(tl->M, tao->solution, tao->gradient); CHKERRQ(ierr);
764a7e14dcfSSatish Balay 	      ierr = MatLMVMSolve(tl->M, tao->gradient, tao->stepdirection); CHKERRQ(ierr);
765a7e14dcfSSatish Balay 
766a7e14dcfSSatish Balay 	      bfgsUpdates = 1;
767a7e14dcfSSatish Balay 	      ++tl->sgrad;
768a7e14dcfSSatish Balay 	      stepType = NTL_SCALED_GRADIENT;
769a7e14dcfSSatish Balay 	    }
770a7e14dcfSSatish Balay 	    else {
771a7e14dcfSSatish Balay 	      if (1 == bfgsUpdates) {
772a7e14dcfSSatish Balay 		/* The first BFGS direction is always the scaled gradient */
773a7e14dcfSSatish Balay 		++tl->sgrad;
774a7e14dcfSSatish Balay 		stepType = NTL_SCALED_GRADIENT;
775a7e14dcfSSatish Balay 	      }
776a7e14dcfSSatish Balay 	      else {
777a7e14dcfSSatish Balay 		++tl->bfgs;
778a7e14dcfSSatish Balay 		stepType = NTL_BFGS;
779a7e14dcfSSatish Balay 	      }
780a7e14dcfSSatish Balay 	    }
781a7e14dcfSSatish Balay 	  }
782a7e14dcfSSatish Balay 	  break;
783a7e14dcfSSatish Balay 
784a7e14dcfSSatish Balay 	case NTL_BFGS:
785a7e14dcfSSatish Balay 	  /* Can only enter if pc_type == NTL_PC_BFGS
786a7e14dcfSSatish Balay 	     Failed to obtain acceptable iterate with BFGS step
787a7e14dcfSSatish Balay 	     Attempt to use the scaled gradient direction */
788a7e14dcfSSatish Balay 
789a7e14dcfSSatish Balay 	  if (f != 0.0) {
790a7e14dcfSSatish Balay 	    delta = 2.0 * PetscAbsScalar(f) / (gnorm*gnorm);
791a7e14dcfSSatish Balay 	  }
792a7e14dcfSSatish Balay 	  else {
793a7e14dcfSSatish Balay 	    delta = 2.0 / (gnorm*gnorm);
794a7e14dcfSSatish Balay 	  }
795a7e14dcfSSatish Balay 	  ierr = MatLMVMSetDelta(tl->M, delta); CHKERRQ(ierr);
796a7e14dcfSSatish Balay 	  ierr = MatLMVMReset(tl->M); CHKERRQ(ierr);
797a7e14dcfSSatish Balay 	  ierr = MatLMVMUpdate(tl->M, tao->solution, tao->gradient); CHKERRQ(ierr);
798a7e14dcfSSatish Balay 	  ierr = MatLMVMSolve(tl->M, tao->gradient, tao->stepdirection); CHKERRQ(ierr);
799a7e14dcfSSatish Balay 
800a7e14dcfSSatish Balay 	  bfgsUpdates = 1;
801a7e14dcfSSatish Balay 	  ++tl->sgrad;
802a7e14dcfSSatish Balay 	  stepType = NTL_SCALED_GRADIENT;
803a7e14dcfSSatish Balay 	  break;
804a7e14dcfSSatish Balay 
805a7e14dcfSSatish Balay 	case NTL_SCALED_GRADIENT:
806a7e14dcfSSatish Balay 	  /* Can only enter if pc_type == NTL_PC_BFGS
807a7e14dcfSSatish Balay 	     The scaled gradient step did not produce a new iterate;
808a7e14dcfSSatish Balay 	     attemp to use the gradient direction.
809a7e14dcfSSatish Balay 	     Need to make sure we are not using a different diagonal scaling */
810a7e14dcfSSatish Balay 	  ierr = MatLMVMSetScale(tl->M, tl->Diag); CHKERRQ(ierr);
811a7e14dcfSSatish Balay 	  ierr = MatLMVMSetDelta(tl->M, 1.0); CHKERRQ(ierr);
812a7e14dcfSSatish Balay 	  ierr = MatLMVMReset(tl->M); CHKERRQ(ierr);
813a7e14dcfSSatish Balay 	  ierr = MatLMVMUpdate(tl->M, tao->solution, tao->gradient); CHKERRQ(ierr);
814a7e14dcfSSatish Balay 	  ierr = MatLMVMSolve(tl->M, tao->gradient, tao->stepdirection); CHKERRQ(ierr);
815a7e14dcfSSatish Balay 
816a7e14dcfSSatish Balay 	  bfgsUpdates = 1;
817a7e14dcfSSatish Balay 	  ++tl->grad;
818a7e14dcfSSatish Balay 	  stepType = NTL_GRADIENT;
819a7e14dcfSSatish Balay 	  break;
820a7e14dcfSSatish Balay 	}
821a7e14dcfSSatish Balay 	ierr = VecScale(tao->stepdirection, -1.0); CHKERRQ(ierr);
822a7e14dcfSSatish Balay 
823a7e14dcfSSatish Balay 	/* This may be incorrect; linesearch has values for stepmax and stepmin
824a7e14dcfSSatish Balay 	   that should be reset. */
825a7e14dcfSSatish Balay 	step = 1.0;
826a7e14dcfSSatish Balay 	ierr = TaoLineSearchApply(tao->linesearch, tao->solution, &f, tao->gradient, tao->stepdirection, &step, &ls_reason); CHKERRQ(ierr);
827a7e14dcfSSatish Balay 	ierr = TaoAddLineSearchCounts(tao); CHKERRQ(ierr);
828a7e14dcfSSatish Balay       }
829a7e14dcfSSatish Balay 
830a7e14dcfSSatish Balay       if (ls_reason != TAOLINESEARCH_SUCCESS &&
831a7e14dcfSSatish Balay 	  ls_reason != TAOLINESEARCH_SUCCESS_USER) {
832a7e14dcfSSatish Balay 	/* Failed to find an improving point */
833a7e14dcfSSatish Balay 	f = fold;
834a7e14dcfSSatish Balay 	ierr = VecCopy(tl->Xold, tao->solution); CHKERRQ(ierr);
835a7e14dcfSSatish Balay 	ierr = VecCopy(tl->Gold, tao->gradient); CHKERRQ(ierr);
836a7e14dcfSSatish Balay 	tao->trust = 0.0;
837a7e14dcfSSatish Balay 	step = 0.0;
838a7e14dcfSSatish Balay 	reason = TAO_DIVERGED_LS_FAILURE;
839a7e14dcfSSatish Balay 	tao->reason = TAO_DIVERGED_LS_FAILURE;
840a7e14dcfSSatish Balay 	break;
841a7e14dcfSSatish Balay       }
842a7e14dcfSSatish Balay       else if (stepType == NTL_NEWTON) {
843a7e14dcfSSatish Balay 	if (step < tl->nu1) {
844a7e14dcfSSatish Balay 	  /* Very bad step taken; reduce radius */
845a7e14dcfSSatish Balay 	  tao->trust = tl->omega1 * PetscMin(norm_d, tao->trust);
846a7e14dcfSSatish Balay 	}
847a7e14dcfSSatish Balay 	else if (step < tl->nu2) {
848a7e14dcfSSatish Balay 	  /* Reasonably bad step taken; reduce radius */
849a7e14dcfSSatish Balay 	  tao->trust = tl->omega2 * PetscMin(norm_d, tao->trust);
850a7e14dcfSSatish Balay 	}
851a7e14dcfSSatish Balay 	else if (step < tl->nu3) {
852a7e14dcfSSatish Balay 	  /* Reasonable step was taken; leave radius alone */
853a7e14dcfSSatish Balay 	  if (tl->omega3 < 1.0) {
854a7e14dcfSSatish Balay 	    tao->trust = tl->omega3 * PetscMin(norm_d, tao->trust);
855a7e14dcfSSatish Balay 	  }
856a7e14dcfSSatish Balay 	  else if (tl->omega3 > 1.0) {
857a7e14dcfSSatish Balay 	    tao->trust = PetscMax(tl->omega3 * norm_d, tao->trust);
858a7e14dcfSSatish Balay 	  }
859a7e14dcfSSatish Balay 	}
860a7e14dcfSSatish Balay 	else if (step < tl->nu4) {
861a7e14dcfSSatish Balay 	  /* Full step taken; increase the radius */
862a7e14dcfSSatish Balay 	  tao->trust = PetscMax(tl->omega4 * norm_d, tao->trust);
863a7e14dcfSSatish Balay 	}
864a7e14dcfSSatish Balay 	else {
865a7e14dcfSSatish Balay 	  /* More than full step taken; increase the radius */
866a7e14dcfSSatish Balay 	  tao->trust = PetscMax(tl->omega5 * norm_d, tao->trust);
867a7e14dcfSSatish Balay 	}
868a7e14dcfSSatish Balay       }
869a7e14dcfSSatish Balay       else {
870a7e14dcfSSatish Balay 	/* Newton step was not good; reduce the radius */
871a7e14dcfSSatish Balay 	tao->trust = tl->omega1 * PetscMin(norm_d, tao->trust);
872a7e14dcfSSatish Balay       }
873a7e14dcfSSatish Balay     }
874a7e14dcfSSatish Balay     else {
875a7e14dcfSSatish Balay       /* Trust-region step is accepted */
876a7e14dcfSSatish Balay       ierr = VecCopy(tl->W, tao->solution); CHKERRQ(ierr);
877a7e14dcfSSatish Balay       f = ftrial;
878a7e14dcfSSatish Balay       ierr = TaoComputeGradient(tao, tao->solution, tao->gradient); CHKERRQ(ierr);
879a7e14dcfSSatish Balay       ++tl->ntrust;
880a7e14dcfSSatish Balay     }
881a7e14dcfSSatish Balay 
882a7e14dcfSSatish Balay     /* The radius may have been increased; modify if it is too large */
883a7e14dcfSSatish Balay     tao->trust = PetscMin(tao->trust, tl->max_radius);
884a7e14dcfSSatish Balay 
885a7e14dcfSSatish Balay     /* Check for termination */
886a7e14dcfSSatish Balay     ierr = VecNorm(tao->gradient, NORM_2, &gnorm); CHKERRQ(ierr);
887a7e14dcfSSatish Balay     if (PetscIsInfOrNanReal(f) || PetscIsInfOrNanReal(gnorm)) {
888a7e14dcfSSatish Balay       SETERRQ(PETSC_COMM_SELF,1,"User provided compute function generated Not-a-Number");
889a7e14dcfSSatish Balay     }
890a7e14dcfSSatish Balay     needH = 1;
891a7e14dcfSSatish Balay 
892a7e14dcfSSatish Balay     ierr = TaoMonitor(tao, iter, f, gnorm, 0.0, tao->trust, &reason); CHKERRQ(ierr);
893a7e14dcfSSatish Balay   }
894a7e14dcfSSatish Balay   PetscFunctionReturn(0);
895a7e14dcfSSatish Balay }
896a7e14dcfSSatish Balay 
897a7e14dcfSSatish Balay /* ---------------------------------------------------------- */
898a7e14dcfSSatish Balay #undef __FUNCT__
899a7e14dcfSSatish Balay #define __FUNCT__ "TaoSetUp_NTL"
900a7e14dcfSSatish Balay static PetscErrorCode TaoSetUp_NTL(TaoSolver tao)
901a7e14dcfSSatish Balay {
902a7e14dcfSSatish Balay   TAO_NTL *tl = (TAO_NTL *)tao->data;
903a7e14dcfSSatish Balay   PetscErrorCode ierr;
904a7e14dcfSSatish Balay 
905a7e14dcfSSatish Balay   PetscFunctionBegin;
906a7e14dcfSSatish Balay   if (!tao->gradient) {ierr = VecDuplicate(tao->solution, &tao->gradient); CHKERRQ(ierr); }
907a7e14dcfSSatish Balay   if (!tao->stepdirection) {ierr = VecDuplicate(tao->solution, &tao->stepdirection); CHKERRQ(ierr);}
908a7e14dcfSSatish Balay   if (!tl->W) { ierr = VecDuplicate(tao->solution, &tl->W); CHKERRQ(ierr);}
909a7e14dcfSSatish Balay   if (!tl->Xold) { ierr = VecDuplicate(tao->solution, &tl->Xold); CHKERRQ(ierr);}
910a7e14dcfSSatish Balay   if (!tl->Gold) { ierr = VecDuplicate(tao->solution, &tl->Gold); CHKERRQ(ierr);}
911a7e14dcfSSatish Balay 
912a7e14dcfSSatish Balay   tl->Diag = 0;
913a7e14dcfSSatish Balay   tl->M = 0;
914a7e14dcfSSatish Balay 
915a7e14dcfSSatish Balay 
916a7e14dcfSSatish Balay   PetscFunctionReturn(0);
917a7e14dcfSSatish Balay }
918a7e14dcfSSatish Balay 
919a7e14dcfSSatish Balay /*------------------------------------------------------------*/
920a7e14dcfSSatish Balay #undef __FUNCT__
921a7e14dcfSSatish Balay #define __FUNCT__ "TaoDestroy_NTL"
922a7e14dcfSSatish Balay static PetscErrorCode TaoDestroy_NTL(TaoSolver tao)
923a7e14dcfSSatish Balay {
924a7e14dcfSSatish Balay   TAO_NTL *tl = (TAO_NTL *)tao->data;
925a7e14dcfSSatish Balay   PetscErrorCode ierr;
926a7e14dcfSSatish Balay 
927a7e14dcfSSatish Balay   PetscFunctionBegin;
928a7e14dcfSSatish Balay   if (tao->setupcalled) {
929a7e14dcfSSatish Balay     ierr = VecDestroy(&tl->W); CHKERRQ(ierr);
930a7e14dcfSSatish Balay     ierr = VecDestroy(&tl->Xold); CHKERRQ(ierr);
931a7e14dcfSSatish Balay     ierr = VecDestroy(&tl->Gold); CHKERRQ(ierr);
932a7e14dcfSSatish Balay   }
933a7e14dcfSSatish Balay   if (tl->Diag) {
934a7e14dcfSSatish Balay     ierr = VecDestroy(&tl->Diag); CHKERRQ(ierr);
935a7e14dcfSSatish Balay     tl->Diag = PETSC_NULL;
936a7e14dcfSSatish Balay   }
937a7e14dcfSSatish Balay   if (tl->M) {
938a7e14dcfSSatish Balay     ierr = MatDestroy(&tl->M); CHKERRQ(ierr);
939a7e14dcfSSatish Balay     tl->M = PETSC_NULL;
940a7e14dcfSSatish Balay   }
941a7e14dcfSSatish Balay 
942a7e14dcfSSatish Balay   ierr = PetscFree(tao->data); CHKERRQ(ierr);
943a7e14dcfSSatish Balay   tao->data = PETSC_NULL;
944a7e14dcfSSatish Balay 
945a7e14dcfSSatish Balay   PetscFunctionReturn(0);
946a7e14dcfSSatish Balay }
947a7e14dcfSSatish Balay 
948a7e14dcfSSatish Balay /*------------------------------------------------------------*/
949a7e14dcfSSatish Balay #undef __FUNCT__
950a7e14dcfSSatish Balay #define __FUNCT__ "TaoSetFromOptions_NTL"
951a7e14dcfSSatish Balay static PetscErrorCode TaoSetFromOptions_NTL(TaoSolver tao)
952a7e14dcfSSatish Balay {
953a7e14dcfSSatish Balay   TAO_NTL *tl = (TAO_NTL *)tao->data;
954a7e14dcfSSatish Balay   PetscErrorCode ierr;
955a7e14dcfSSatish Balay 
956a7e14dcfSSatish Balay   PetscFunctionBegin;
957a7e14dcfSSatish Balay   ierr = PetscOptionsHead("Newton line search method for unconstrained optimization"); CHKERRQ(ierr);
958a7e14dcfSSatish Balay   ierr = PetscOptionsEList("-tao_ntl_ksp_type", "ksp type", "", NTL_KSP, NTL_KSP_TYPES, NTL_KSP[tl->ksp_type], &tl->ksp_type, 0); CHKERRQ(ierr);
959a7e14dcfSSatish Balay   ierr = PetscOptionsEList("-tao_ntl_pc_type", "pc type", "", NTL_PC, NTL_PC_TYPES, NTL_PC[tl->pc_type], &tl->pc_type, 0); CHKERRQ(ierr);
960a7e14dcfSSatish Balay   ierr = PetscOptionsEList("-tao_ntl_bfgs_scale_type", "bfgs scale type", "", BFGS_SCALE, BFGS_SCALE_TYPES, BFGS_SCALE[tl->bfgs_scale_type], &tl->bfgs_scale_type, 0); CHKERRQ(ierr);
961a7e14dcfSSatish Balay   ierr = PetscOptionsEList("-tao_ntl_init_type", "radius initialization type", "", NTL_INIT, NTL_INIT_TYPES, NTL_INIT[tl->init_type], &tl->init_type, 0); CHKERRQ(ierr);
962a7e14dcfSSatish Balay   ierr = PetscOptionsEList("-tao_ntl_update_type", "radius update type", "", NTL_UPDATE, NTL_UPDATE_TYPES, NTL_UPDATE[tl->update_type], &tl->update_type, 0); CHKERRQ(ierr);
963a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntl_eta1", "poor steplength; reduce radius", "", tl->eta1, &tl->eta1, 0); CHKERRQ(ierr);
964a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntl_eta2", "reasonable steplength; leave radius alone", "", tl->eta2, &tl->eta2, 0); CHKERRQ(ierr);
965a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntl_eta3", "good steplength; increase radius", "", tl->eta3, &tl->eta3, 0); CHKERRQ(ierr);
966a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntl_eta4", "excellent steplength; greatly increase radius", "", tl->eta4, &tl->eta4, 0); CHKERRQ(ierr);
967a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntl_alpha1", "", "", tl->alpha1, &tl->alpha1, 0); CHKERRQ(ierr);
968a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntl_alpha2", "", "", tl->alpha2, &tl->alpha2, 0); CHKERRQ(ierr);
969a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntl_alpha3", "", "", tl->alpha3, &tl->alpha3, 0); CHKERRQ(ierr);
970a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntl_alpha4", "", "", tl->alpha4, &tl->alpha4, 0); CHKERRQ(ierr);
971a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntl_alpha5", "", "", tl->alpha5, &tl->alpha5, 0); CHKERRQ(ierr);
972a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntl_nu1", "poor steplength; reduce radius", "", tl->nu1, &tl->nu1, 0); CHKERRQ(ierr);
973a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntl_nu2", "reasonable steplength; leave radius alone", "", tl->nu2, &tl->nu2, 0); CHKERRQ(ierr);
974a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntl_nu3", "good steplength; increase radius", "", tl->nu3, &tl->nu3, 0); CHKERRQ(ierr);
975a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntl_nu4", "excellent steplength; greatly increase radius", "", tl->nu4, &tl->nu4, 0); CHKERRQ(ierr);
976a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntl_omega1", "", "", tl->omega1, &tl->omega1, 0); CHKERRQ(ierr);
977a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntl_omega2", "", "", tl->omega2, &tl->omega2, 0); CHKERRQ(ierr);
978a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntl_omega3", "", "", tl->omega3, &tl->omega3, 0); CHKERRQ(ierr);
979a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntl_omega4", "", "", tl->omega4, &tl->omega4, 0); CHKERRQ(ierr);
980a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntl_omega5", "", "", tl->omega5, &tl->omega5, 0); CHKERRQ(ierr);
981a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntl_mu1_i", "", "", tl->mu1_i, &tl->mu1_i, 0); CHKERRQ(ierr);
982a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntl_mu2_i", "", "", tl->mu2_i, &tl->mu2_i, 0); CHKERRQ(ierr);
983a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntl_gamma1_i", "", "", tl->gamma1_i, &tl->gamma1_i, 0); CHKERRQ(ierr);
984a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntl_gamma2_i", "", "", tl->gamma2_i, &tl->gamma2_i, 0); CHKERRQ(ierr);
985a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntl_gamma3_i", "", "", tl->gamma3_i, &tl->gamma3_i, 0); CHKERRQ(ierr);
986a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntl_gamma4_i", "", "", tl->gamma4_i, &tl->gamma4_i, 0); CHKERRQ(ierr);
987a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntl_theta_i", "", "", tl->theta_i, &tl->theta_i, 0); CHKERRQ(ierr);
988a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntl_mu1", "", "", tl->mu1, &tl->mu1, 0); CHKERRQ(ierr);
989a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntl_mu2", "", "", tl->mu2, &tl->mu2, 0); CHKERRQ(ierr);
990a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntl_gamma1", "", "", tl->gamma1, &tl->gamma1, 0); CHKERRQ(ierr);
991a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntl_gamma2", "", "", tl->gamma2, &tl->gamma2, 0); CHKERRQ(ierr);
992a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntl_gamma3", "", "", tl->gamma3, &tl->gamma3, 0); CHKERRQ(ierr);
993a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntl_gamma4", "", "", tl->gamma4, &tl->gamma4, 0); CHKERRQ(ierr);
994a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntl_theta", "", "", tl->theta, &tl->theta, 0); CHKERRQ(ierr);
995a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntl_min_radius", "lower bound on initial radius", "", tl->min_radius, &tl->min_radius, 0); CHKERRQ(ierr);
996a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntl_max_radius", "upper bound on radius", "", tl->max_radius, &tl->max_radius, 0); CHKERRQ(ierr);
997a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_ntl_epsilon", "tolerance used when computing actual and predicted reduction", "", tl->epsilon, &tl->epsilon, 0); CHKERRQ(ierr);
998a7e14dcfSSatish Balay   ierr = PetscOptionsTail(); CHKERRQ(ierr);
999a7e14dcfSSatish Balay   ierr = TaoLineSearchSetFromOptions(tao->linesearch); CHKERRQ(ierr);
1000a7e14dcfSSatish Balay   ierr = KSPSetFromOptions(tao->ksp); CHKERRQ(ierr);
1001a7e14dcfSSatish Balay   PetscFunctionReturn(0);
1002a7e14dcfSSatish Balay }
1003a7e14dcfSSatish Balay 
1004a7e14dcfSSatish Balay 
1005a7e14dcfSSatish Balay /*------------------------------------------------------------*/
1006a7e14dcfSSatish Balay #undef __FUNCT__
1007a7e14dcfSSatish Balay #define __FUNCT__ "TaoView_NTL"
1008a7e14dcfSSatish Balay static PetscErrorCode TaoView_NTL(TaoSolver tao, PetscViewer viewer)
1009a7e14dcfSSatish Balay {
1010a7e14dcfSSatish Balay   TAO_NTL *tl = (TAO_NTL *)tao->data;
1011a7e14dcfSSatish Balay   PetscInt nrejects;
1012a7e14dcfSSatish Balay   PetscBool isascii;
1013a7e14dcfSSatish Balay   PetscErrorCode ierr;
1014a7e14dcfSSatish Balay 
1015a7e14dcfSSatish Balay   PetscFunctionBegin;
1016a7e14dcfSSatish Balay   ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&isascii);CHKERRQ(ierr);
1017a7e14dcfSSatish Balay   if (isascii) {
1018a7e14dcfSSatish Balay     ierr = PetscViewerASCIIPushTab(viewer); CHKERRQ(ierr);
1019a7e14dcfSSatish Balay     if (NTL_PC_BFGS == tl->pc_type && tl->M) {
1020a7e14dcfSSatish Balay       ierr = MatLMVMGetRejects(tl->M, &nrejects); CHKERRQ(ierr);
1021a7e14dcfSSatish Balay       ierr = PetscViewerASCIIPrintf(viewer, "Rejected matrix updates: %D\n", nrejects); CHKERRQ(ierr);
1022a7e14dcfSSatish Balay 
1023a7e14dcfSSatish Balay     }
1024a7e14dcfSSatish Balay 
1025a7e14dcfSSatish Balay     ierr = PetscViewerASCIIPrintf(viewer, "Trust-region steps: %D\n", tl->ntrust); CHKERRQ(ierr);
1026a7e14dcfSSatish Balay     ierr = PetscViewerASCIIPrintf(viewer, "Newton search steps: %D\n", tl->newt); CHKERRQ(ierr);
1027a7e14dcfSSatish Balay     ierr = PetscViewerASCIIPrintf(viewer, "BFGS search steps: %D\n", tl->bfgs); CHKERRQ(ierr);
1028a7e14dcfSSatish Balay     ierr = PetscViewerASCIIPrintf(viewer, "Scaled gradient search steps: %D\n", tl->sgrad); CHKERRQ(ierr);
1029a7e14dcfSSatish Balay     ierr = PetscViewerASCIIPrintf(viewer, "Gradient search steps: %D\n", tl->grad); CHKERRQ(ierr);
1030a7e14dcfSSatish Balay     ierr = PetscViewerASCIIPopTab(viewer); CHKERRQ(ierr);
1031a7e14dcfSSatish Balay   } else {
1032a7e14dcfSSatish Balay     SETERRQ1(((PetscObject)tao)->comm,PETSC_ERR_SUP,"Viewer type %s not supported for TAO NTL",((PetscObject)viewer)->type_name);
1033a7e14dcfSSatish Balay   }
1034a7e14dcfSSatish Balay   PetscFunctionReturn(0);
1035a7e14dcfSSatish Balay }
1036a7e14dcfSSatish Balay 
1037a7e14dcfSSatish Balay /* ---------------------------------------------------------- */
1038a7e14dcfSSatish Balay EXTERN_C_BEGIN
1039a7e14dcfSSatish Balay #undef __FUNCT__
1040a7e14dcfSSatish Balay #define __FUNCT__ "TaoCreate_NTL"
1041a7e14dcfSSatish Balay PetscErrorCode TaoCreate_NTL(TaoSolver tao)
1042a7e14dcfSSatish Balay {
1043a7e14dcfSSatish Balay   TAO_NTL *tl;
1044a7e14dcfSSatish Balay   PetscErrorCode ierr;
1045a7e14dcfSSatish Balay   const char *morethuente_type = TAOLINESEARCH_MT;
1046a7e14dcfSSatish Balay   PetscFunctionBegin;
1047a7e14dcfSSatish Balay   ierr = PetscNewLog(tao, TAO_NTL, &tl); CHKERRQ(ierr);
1048a7e14dcfSSatish Balay 
1049a7e14dcfSSatish Balay   tao->ops->setup = TaoSetUp_NTL;
1050a7e14dcfSSatish Balay   tao->ops->solve = TaoSolve_NTL;
1051a7e14dcfSSatish Balay   tao->ops->view = TaoView_NTL;
1052a7e14dcfSSatish Balay   tao->ops->setfromoptions = TaoSetFromOptions_NTL;
1053a7e14dcfSSatish Balay   tao->ops->destroy = TaoDestroy_NTL;
1054a7e14dcfSSatish Balay 
1055a7e14dcfSSatish Balay   tao->max_it = 50;
1056a7e14dcfSSatish Balay   tao->fatol = 1e-10;
1057a7e14dcfSSatish Balay   tao->frtol = 1e-10;
1058a7e14dcfSSatish Balay   tao->data = (void*)tl;
1059a7e14dcfSSatish Balay 
1060a7e14dcfSSatish Balay   tao->trust0 = 100.0;
1061a7e14dcfSSatish Balay 
1062a7e14dcfSSatish Balay 
1063a7e14dcfSSatish Balay   /* Default values for trust-region radius update based on steplength */
1064a7e14dcfSSatish Balay   tl->nu1 = 0.25;
1065a7e14dcfSSatish Balay   tl->nu2 = 0.50;
1066a7e14dcfSSatish Balay   tl->nu3 = 1.00;
1067a7e14dcfSSatish Balay   tl->nu4 = 1.25;
1068a7e14dcfSSatish Balay 
1069a7e14dcfSSatish Balay   tl->omega1 = 0.25;
1070a7e14dcfSSatish Balay   tl->omega2 = 0.50;
1071a7e14dcfSSatish Balay   tl->omega3 = 1.00;
1072a7e14dcfSSatish Balay   tl->omega4 = 2.00;
1073a7e14dcfSSatish Balay   tl->omega5 = 4.00;
1074a7e14dcfSSatish Balay 
1075a7e14dcfSSatish Balay   /* Default values for trust-region radius update based on reduction */
1076a7e14dcfSSatish Balay   tl->eta1 = 1.0e-4;
1077a7e14dcfSSatish Balay   tl->eta2 = 0.25;
1078a7e14dcfSSatish Balay   tl->eta3 = 0.50;
1079a7e14dcfSSatish Balay   tl->eta4 = 0.90;
1080a7e14dcfSSatish Balay 
1081a7e14dcfSSatish Balay   tl->alpha1 = 0.25;
1082a7e14dcfSSatish Balay   tl->alpha2 = 0.50;
1083a7e14dcfSSatish Balay   tl->alpha3 = 1.00;
1084a7e14dcfSSatish Balay   tl->alpha4 = 2.00;
1085a7e14dcfSSatish Balay   tl->alpha5 = 4.00;
1086a7e14dcfSSatish Balay 
1087a7e14dcfSSatish Balay   /* Default values for trust-region radius update based on interpolation */
1088a7e14dcfSSatish Balay   tl->mu1 = 0.10;
1089a7e14dcfSSatish Balay   tl->mu2 = 0.50;
1090a7e14dcfSSatish Balay 
1091a7e14dcfSSatish Balay   tl->gamma1 = 0.25;
1092a7e14dcfSSatish Balay   tl->gamma2 = 0.50;
1093a7e14dcfSSatish Balay   tl->gamma3 = 2.00;
1094a7e14dcfSSatish Balay   tl->gamma4 = 4.00;
1095a7e14dcfSSatish Balay 
1096a7e14dcfSSatish Balay   tl->theta = 0.05;
1097a7e14dcfSSatish Balay 
1098a7e14dcfSSatish Balay   /* Default values for trust region initialization based on interpolation */
1099a7e14dcfSSatish Balay   tl->mu1_i = 0.35;
1100a7e14dcfSSatish Balay   tl->mu2_i = 0.50;
1101a7e14dcfSSatish Balay 
1102a7e14dcfSSatish Balay   tl->gamma1_i = 0.0625;
1103a7e14dcfSSatish Balay   tl->gamma2_i = 0.5;
1104a7e14dcfSSatish Balay   tl->gamma3_i = 2.0;
1105a7e14dcfSSatish Balay   tl->gamma4_i = 5.0;
1106a7e14dcfSSatish Balay 
1107a7e14dcfSSatish Balay   tl->theta_i = 0.25;
1108a7e14dcfSSatish Balay 
1109a7e14dcfSSatish Balay   /* Remaining parameters */
1110a7e14dcfSSatish Balay   tl->min_radius = 1.0e-10;
1111a7e14dcfSSatish Balay   tl->max_radius = 1.0e10;
1112a7e14dcfSSatish Balay   tl->epsilon = 1.0e-6;
1113a7e14dcfSSatish Balay 
1114a7e14dcfSSatish Balay   tl->ksp_type        = NTL_KSP_STCG;
1115a7e14dcfSSatish Balay   tl->pc_type         = NTL_PC_BFGS;
1116a7e14dcfSSatish Balay   tl->bfgs_scale_type = BFGS_SCALE_AHESS;
1117a7e14dcfSSatish Balay   tl->init_type       = NTL_INIT_INTERPOLATION;
1118a7e14dcfSSatish Balay   tl->update_type     = NTL_UPDATE_REDUCTION;
1119a7e14dcfSSatish Balay 
1120a7e14dcfSSatish Balay   ierr = TaoLineSearchCreate(((PetscObject)tao)->comm, &tao->linesearch); CHKERRQ(ierr);
1121a7e14dcfSSatish Balay   ierr = TaoLineSearchSetType(tao->linesearch, morethuente_type); CHKERRQ(ierr);
1122a7e14dcfSSatish Balay   ierr = TaoLineSearchUseTaoSolverRoutines(tao->linesearch, tao); CHKERRQ(ierr);
1123a7e14dcfSSatish Balay 
1124a7e14dcfSSatish Balay   ierr = KSPCreate(((PetscObject)tao)->comm, &tao->ksp); CHKERRQ(ierr);
1125a7e14dcfSSatish Balay 
1126a7e14dcfSSatish Balay   PetscFunctionReturn(0);
1127a7e14dcfSSatish Balay }
1128a7e14dcfSSatish Balay EXTERN_C_END
1129a7e14dcfSSatish Balay 
1130a7e14dcfSSatish Balay 
1131a7e14dcfSSatish Balay 
1132