xref: /petsc/src/tao/unconstrained/impls/ntl/ntl.c (revision 3ba1676111f5c958fe6c2729b46ca4d523958bb3)
155119615STodd Munson #include <../src/tao/unconstrained/impls/ntl/ntlimpl.h>
2a7e14dcfSSatish Balay 
3aaa7dc30SBarry Smith #include <petscksp.h>
4a7e14dcfSSatish Balay 
/* Values of tl->init_type: how TaoSolve_NTL picks the starting trust-region radius.
     CONSTANT      - keep the initial radius already stored in tao->trust
     DIRECTION     - not cased explicitly; handled by the switch default, which
                     zeroes the radius so the norm of the first direction sets it
     INTERPOLATION - adjust the radius using trial steps along the gradient
     TYPES         - presumably the number of init types (TODO confirm at use site) */
5a7e14dcfSSatish Balay #define NTL_INIT_CONSTANT      0
6a7e14dcfSSatish Balay #define NTL_INIT_DIRECTION     1
7a7e14dcfSSatish Balay #define NTL_INIT_INTERPOLATION 2
8a7e14dcfSSatish Balay #define NTL_INIT_TYPES         3
9a7e14dcfSSatish Balay 
/* Values of tl->update_type: how TaoSolve_NTL updates the trust-region radius
   after each subproblem solve.
     REDUCTION     - compare kappa = actred / prered against the eta thresholds
                     and scale the radius with the alpha factors
     INTERPOLATION - every other value takes this path; uses the tau_1 / tau_2
                     estimates together with the gamma factors
     TYPES         - presumably the number of update types (TODO confirm at use site) */
10a7e14dcfSSatish Balay #define NTL_UPDATE_REDUCTION     0
11a7e14dcfSSatish Balay #define NTL_UPDATE_INTERPOLATION 1
12a7e14dcfSSatish Balay #define NTL_UPDATE_TYPES         2
13a7e14dcfSSatish Balay 
/* Names of the radius-initialization types, in the same order as the
   NTL_INIT_* values (index 0 = "constant", 1 = "direction", 2 = "interpolation").
   Only the first three of the 64 slots are set; the rest are null pointers.
   NOTE(review): presumably used for options parsing -- use site not visible here. */
1487f595a5SBarry Smith static const char *NTL_INIT[64] = {"constant", "direction", "interpolation"};
15a7e14dcfSSatish Balay 
/* Names of the radius-update types, in the same order as the NTL_UPDATE_*
   values (index 0 = "reduction", 1 = "interpolation").
   Only the first two of the 64 slots are set; the rest are null pointers.
   NOTE(review): presumably used for options parsing -- use site not visible here. */
1687f595a5SBarry Smith static const char *NTL_UPDATE[64] = {"reduction", "interpolation"};
17a7e14dcfSSatish Balay 
18a7e14dcfSSatish Balay /* Implements Newton's Method with a trust-region, line-search approach for
19a7e14dcfSSatish Balay    solving unconstrained minimization problems.  A More'-Thuente line search
20a7e14dcfSSatish Balay    is used to guarantee that the bfgs preconditioner remains positive
21a7e14dcfSSatish Balay    definite. */
22a7e14dcfSSatish Balay 
/* Step types stored in the local stepType of TaoSolve_NTL; they record which
   direction is handed to the line search when the trust-region step is rejected.
   NOTE(review): NTL_SCALED_GRADIENT is not referenced in the visible part of
   the solver -- confirm whether it is still used. */
23a7e14dcfSSatish Balay #define NTL_NEWTON          0
24a7e14dcfSSatish Balay #define NTL_BFGS            1
25a7e14dcfSSatish Balay #define NTL_SCALED_GRADIENT 2
26a7e14dcfSSatish Balay #define NTL_GRADIENT        3
27a7e14dcfSSatish Balay 
28d71ae5a4SJacob Faibussowitsch static PetscErrorCode TaoSolve_NTL(Tao tao)
29d71ae5a4SJacob Faibussowitsch {
30a7e14dcfSSatish Balay   TAO_NTL                     *tl = (TAO_NTL *)tao->data;
3155119615STodd Munson   KSPType                      ksp_type;
320ad3a497SAlp Dener   PetscBool                    is_nash, is_stcg, is_gltr, is_bfgs, is_jacobi, is_symmetric, sym_set;
33a7e14dcfSSatish Balay   KSPConvergedReason           ksp_reason;
3455119615STodd Munson   PC                           pc;
35e4cb33bbSBarry Smith   TaoLineSearchConvergedReason ls_reason;
36a7e14dcfSSatish Balay 
37a7e14dcfSSatish Balay   PetscReal fmin, ftrial, prered, actred, kappa, sigma;
38a7e14dcfSSatish Balay   PetscReal tau, tau_1, tau_2, tau_max, tau_min, max_radius;
39a7e14dcfSSatish Balay   PetscReal f, fold, gdx, gnorm;
40a7e14dcfSSatish Balay   PetscReal step = 1.0;
41a7e14dcfSSatish Balay 
42a7e14dcfSSatish Balay   PetscReal norm_d = 0.0;
43a7e14dcfSSatish Balay   PetscInt  stepType;
448931d482SJason Sarich   PetscInt  its;
45a7e14dcfSSatish Balay 
46a7e14dcfSSatish Balay   PetscInt bfgsUpdates = 0;
47a7e14dcfSSatish Balay   PetscInt needH;
48a7e14dcfSSatish Balay 
49a7e14dcfSSatish Balay   PetscInt i_max = 5;
50a7e14dcfSSatish Balay   PetscInt j_max = 1;
51a7e14dcfSSatish Balay   PetscInt i, j, n, N;
52a7e14dcfSSatish Balay 
53a7e14dcfSSatish Balay   PetscInt tr_reject;
54a7e14dcfSSatish Balay 
55a7e14dcfSSatish Balay   PetscFunctionBegin;
5648a46eb9SPierre Jolivet   if (tao->XL || tao->XU || tao->ops->computebounds) PetscCall(PetscInfo(tao, "WARNING: Variable bounds have been set but will be ignored by ntl algorithm\n"));
57a7e14dcfSSatish Balay 
589566063dSJacob Faibussowitsch   PetscCall(KSPGetType(tao->ksp, &ksp_type));
599566063dSJacob Faibussowitsch   PetscCall(PetscStrcmp(ksp_type, KSPNASH, &is_nash));
609566063dSJacob Faibussowitsch   PetscCall(PetscStrcmp(ksp_type, KSPSTCG, &is_stcg));
619566063dSJacob Faibussowitsch   PetscCall(PetscStrcmp(ksp_type, KSPGLTR, &is_gltr));
623c859ba3SBarry Smith   PetscCheck(is_nash || is_stcg || is_gltr, PetscObjectComm((PetscObject)tao), PETSC_ERR_SUP, "TAO_NTR requires nash, stcg, or gltr for the KSP");
63a7e14dcfSSatish Balay 
6455119615STodd Munson   /* Initialize the radius and modify if it is too large or small */
6555119615STodd Munson   tao->trust = tao->trust0;
66a7e14dcfSSatish Balay   tao->trust = PetscMax(tao->trust, tl->min_radius);
67a7e14dcfSSatish Balay   tao->trust = PetscMin(tao->trust, tl->max_radius);
68a7e14dcfSSatish Balay 
690c51296cSAlp Dener   /* Allocate the vectors needed for the BFGS approximation */
709566063dSJacob Faibussowitsch   PetscCall(KSPGetPC(tao->ksp, &pc));
719566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)pc, PCLMVM, &is_bfgs));
729566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)pc, PCJACOBI, &is_jacobi));
730c51296cSAlp Dener   if (is_bfgs) {
740c51296cSAlp Dener     tl->bfgs_pre = pc;
759566063dSJacob Faibussowitsch     PetscCall(PCLMVMGetMatLMVM(tl->bfgs_pre, &tl->M));
769566063dSJacob Faibussowitsch     PetscCall(VecGetLocalSize(tao->solution, &n));
779566063dSJacob Faibussowitsch     PetscCall(VecGetSize(tao->solution, &N));
789566063dSJacob Faibussowitsch     PetscCall(MatSetSizes(tl->M, n, n, N, N));
799566063dSJacob Faibussowitsch     PetscCall(MatLMVMAllocate(tl->M, tao->solution, tao->gradient));
809566063dSJacob Faibussowitsch     PetscCall(MatIsSymmetricKnown(tl->M, &sym_set, &is_symmetric));
813c859ba3SBarry Smith     PetscCheck(sym_set && is_symmetric, PetscObjectComm((PetscObject)tao), PETSC_ERR_ARG_INCOMP, "LMVM matrix in the LMVM preconditioner must be symmetric.");
821baa6e33SBarry Smith   } else if (is_jacobi) PetscCall(PCJacobiSetUseAbs(pc, PETSC_TRUE));
83a7e14dcfSSatish Balay 
84a7e14dcfSSatish Balay   /* Check convergence criteria */
859566063dSJacob Faibussowitsch   PetscCall(TaoComputeObjectiveAndGradient(tao, tao->solution, &f, tao->gradient));
869566063dSJacob Faibussowitsch   PetscCall(VecNorm(tao->gradient, NORM_2, &gnorm));
873c859ba3SBarry Smith   PetscCheck(!PetscIsInfOrNanReal(f) && !PetscIsInfOrNanReal(gnorm), PetscObjectComm((PetscObject)tao), PETSC_ERR_USER, "User provided compute function generated Inf or NaN");
88a7e14dcfSSatish Balay   needH = 1;
89a7e14dcfSSatish Balay 
903ecd9318SAlp Dener   tao->reason = TAO_CONTINUE_ITERATING;
919566063dSJacob Faibussowitsch   PetscCall(TaoLogConvergenceHistory(tao, f, gnorm, 0.0, tao->ksp_its));
929566063dSJacob Faibussowitsch   PetscCall(TaoMonitor(tao, tao->niter, f, gnorm, 0.0, step));
93dbbe0bcdSBarry Smith   PetscUseTypeMethod(tao, convergencetest, tao->cnvP);
94*3ba16761SJacob Faibussowitsch   if (tao->reason != TAO_CONTINUE_ITERATING) PetscFunctionReturn(PETSC_SUCCESS);
95a7e14dcfSSatish Balay 
9655119615STodd Munson   /* Initialize trust-region radius */
97a7e14dcfSSatish Balay   switch (tl->init_type) {
98a7e14dcfSSatish Balay   case NTL_INIT_CONSTANT:
99a7e14dcfSSatish Balay     /* Use the initial radius specified */
100a7e14dcfSSatish Balay     break;
101a7e14dcfSSatish Balay 
102a7e14dcfSSatish Balay   case NTL_INIT_INTERPOLATION:
103a7e14dcfSSatish Balay     /* Estimate the radius from trial steps along the negative gradient */
104a7e14dcfSSatish Balay     max_radius = 0.0;
105a7e14dcfSSatish Balay 
106a7e14dcfSSatish Balay     for (j = 0; j < j_max; ++j) {
107a7e14dcfSSatish Balay       fmin  = f;
108a7e14dcfSSatish Balay       sigma = 0.0;
109a7e14dcfSSatish Balay 
110a7e14dcfSSatish Balay       if (needH) {
1119566063dSJacob Faibussowitsch         PetscCall(TaoComputeHessian(tao, tao->solution, tao->hessian, tao->hessian_pre));
112a7e14dcfSSatish Balay         needH = 0;
113a7e14dcfSSatish Balay       }
114a7e14dcfSSatish Balay 
115a7e14dcfSSatish Balay       for (i = 0; i < i_max; ++i) {
1169566063dSJacob Faibussowitsch         PetscCall(VecCopy(tao->solution, tl->W));
1179566063dSJacob Faibussowitsch         PetscCall(VecAXPY(tl->W, -tao->trust / gnorm, tao->gradient));
118a7e14dcfSSatish Balay 
1199566063dSJacob Faibussowitsch         PetscCall(TaoComputeObjective(tao, tl->W, &ftrial));
120a7e14dcfSSatish Balay         if (PetscIsInfOrNanReal(ftrial)) {
121a7e14dcfSSatish Balay           tau = tl->gamma1_i;
12253506e15SBarry Smith         } else {
123a7e14dcfSSatish Balay           if (ftrial < fmin) {
124a7e14dcfSSatish Balay             fmin  = ftrial;
125a7e14dcfSSatish Balay             sigma = -tao->trust / gnorm;
126a7e14dcfSSatish Balay           }
127a7e14dcfSSatish Balay 
1289566063dSJacob Faibussowitsch           PetscCall(MatMult(tao->hessian, tao->gradient, tao->stepdirection));
1299566063dSJacob Faibussowitsch           PetscCall(VecDot(tao->gradient, tao->stepdirection, &prered));
130a7e14dcfSSatish Balay 
131a7e14dcfSSatish Balay           prered = tao->trust * (gnorm - 0.5 * tao->trust * prered / (gnorm * gnorm));
132a7e14dcfSSatish Balay           actred = f - ftrial;
13353506e15SBarry Smith           if ((PetscAbsScalar(actred) <= tl->epsilon) && (PetscAbsScalar(prered) <= tl->epsilon)) {
134a7e14dcfSSatish Balay             kappa = 1.0;
13553506e15SBarry Smith           } else {
136a7e14dcfSSatish Balay             kappa = actred / prered;
137a7e14dcfSSatish Balay           }
138a7e14dcfSSatish Balay 
139a7e14dcfSSatish Balay           tau_1   = tl->theta_i * gnorm * tao->trust / (tl->theta_i * gnorm * tao->trust + (1.0 - tl->theta_i) * prered - actred);
140a7e14dcfSSatish Balay           tau_2   = tl->theta_i * gnorm * tao->trust / (tl->theta_i * gnorm * tao->trust - (1.0 + tl->theta_i) * prered + actred);
141a7e14dcfSSatish Balay           tau_min = PetscMin(tau_1, tau_2);
142a7e14dcfSSatish Balay           tau_max = PetscMax(tau_1, tau_2);
143a7e14dcfSSatish Balay 
14418cfbf8eSSatish Balay           if (PetscAbsScalar(kappa - (PetscReal)1.0) <= tl->mu1_i) {
145a7e14dcfSSatish Balay             /* Great agreement */
146a7e14dcfSSatish Balay             max_radius = PetscMax(max_radius, tao->trust);
147a7e14dcfSSatish Balay 
148a7e14dcfSSatish Balay             if (tau_max < 1.0) {
149a7e14dcfSSatish Balay               tau = tl->gamma3_i;
15053506e15SBarry Smith             } else if (tau_max > tl->gamma4_i) {
151a7e14dcfSSatish Balay               tau = tl->gamma4_i;
15253506e15SBarry Smith             } else if (tau_1 >= 1.0 && tau_1 <= tl->gamma4_i && tau_2 < 1.0) {
153a7e14dcfSSatish Balay               tau = tau_1;
15453506e15SBarry Smith             } else if (tau_2 >= 1.0 && tau_2 <= tl->gamma4_i && tau_1 < 1.0) {
155a7e14dcfSSatish Balay               tau = tau_2;
15653506e15SBarry Smith             } else {
157a7e14dcfSSatish Balay               tau = tau_max;
158a7e14dcfSSatish Balay             }
15918cfbf8eSSatish Balay           } else if (PetscAbsScalar(kappa - (PetscReal)1.0) <= tl->mu2_i) {
160a7e14dcfSSatish Balay             /* Good agreement */
161a7e14dcfSSatish Balay             max_radius = PetscMax(max_radius, tao->trust);
162a7e14dcfSSatish Balay 
163a7e14dcfSSatish Balay             if (tau_max < tl->gamma2_i) {
164a7e14dcfSSatish Balay               tau = tl->gamma2_i;
16553506e15SBarry Smith             } else if (tau_max > tl->gamma3_i) {
166a7e14dcfSSatish Balay               tau = tl->gamma3_i;
16753506e15SBarry Smith             } else {
168a7e14dcfSSatish Balay               tau = tau_max;
169a7e14dcfSSatish Balay             }
17053506e15SBarry Smith           } else {
171a7e14dcfSSatish Balay             /* Not good agreement */
172a7e14dcfSSatish Balay             if (tau_min > 1.0) {
173a7e14dcfSSatish Balay               tau = tl->gamma2_i;
17453506e15SBarry Smith             } else if (tau_max < tl->gamma1_i) {
175a7e14dcfSSatish Balay               tau = tl->gamma1_i;
17653506e15SBarry Smith             } else if ((tau_min < tl->gamma1_i) && (tau_max >= 1.0)) {
177a7e14dcfSSatish Balay               tau = tl->gamma1_i;
17853506e15SBarry Smith             } else if ((tau_1 >= tl->gamma1_i) && (tau_1 < 1.0) && ((tau_2 < tl->gamma1_i) || (tau_2 >= 1.0))) {
179a7e14dcfSSatish Balay               tau = tau_1;
18053506e15SBarry Smith             } else if ((tau_2 >= tl->gamma1_i) && (tau_2 < 1.0) && ((tau_1 < tl->gamma1_i) || (tau_2 >= 1.0))) {
181a7e14dcfSSatish Balay               tau = tau_2;
18253506e15SBarry Smith             } else {
183a7e14dcfSSatish Balay               tau = tau_max;
184a7e14dcfSSatish Balay             }
185a7e14dcfSSatish Balay           }
186a7e14dcfSSatish Balay         }
187a7e14dcfSSatish Balay         tao->trust = tau * tao->trust;
188a7e14dcfSSatish Balay       }
189a7e14dcfSSatish Balay 
190a7e14dcfSSatish Balay       if (fmin < f) {
191a7e14dcfSSatish Balay         f = fmin;
1929566063dSJacob Faibussowitsch         PetscCall(VecAXPY(tao->solution, sigma, tao->gradient));
1939566063dSJacob Faibussowitsch         PetscCall(TaoComputeGradient(tao, tao->solution, tao->gradient));
194a7e14dcfSSatish Balay 
1959566063dSJacob Faibussowitsch         PetscCall(VecNorm(tao->gradient, NORM_2, &gnorm));
1963c859ba3SBarry Smith         PetscCheck(!PetscIsInfOrNanReal(f) && !PetscIsInfOrNanReal(gnorm), PetscObjectComm((PetscObject)tao), PETSC_ERR_USER, "User provided compute function generated Inf or NaN");
197a7e14dcfSSatish Balay         needH = 1;
198a7e14dcfSSatish Balay 
1999566063dSJacob Faibussowitsch         PetscCall(TaoLogConvergenceHistory(tao, f, gnorm, 0.0, tao->ksp_its));
2009566063dSJacob Faibussowitsch         PetscCall(TaoMonitor(tao, tao->niter, f, gnorm, 0.0, step));
201dbbe0bcdSBarry Smith         PetscUseTypeMethod(tao, convergencetest, tao->cnvP);
202*3ba16761SJacob Faibussowitsch         if (tao->reason != TAO_CONTINUE_ITERATING) PetscFunctionReturn(PETSC_SUCCESS);
203a7e14dcfSSatish Balay       }
204a7e14dcfSSatish Balay     }
205a7e14dcfSSatish Balay     tao->trust = PetscMax(tao->trust, max_radius);
206a7e14dcfSSatish Balay 
207a7e14dcfSSatish Balay     /* Modify the radius if it is too large or small */
208a7e14dcfSSatish Balay     tao->trust = PetscMax(tao->trust, tl->min_radius);
209a7e14dcfSSatish Balay     tao->trust = PetscMin(tao->trust, tl->max_radius);
210a7e14dcfSSatish Balay     break;
211a7e14dcfSSatish Balay 
212a7e14dcfSSatish Balay   default:
213a7e14dcfSSatish Balay     /* Norm of the first direction will initialize radius */
214a7e14dcfSSatish Balay     tao->trust = 0.0;
215a7e14dcfSSatish Balay     break;
216a7e14dcfSSatish Balay   }
217a7e14dcfSSatish Balay 
218a7e14dcfSSatish Balay   /* Set counter for gradient/reset steps */
219a7e14dcfSSatish Balay   tl->ntrust = 0;
220a7e14dcfSSatish Balay   tl->newt   = 0;
221a7e14dcfSSatish Balay   tl->bfgs   = 0;
222a7e14dcfSSatish Balay   tl->grad   = 0;
223a7e14dcfSSatish Balay 
224a7e14dcfSSatish Balay   /* Have not converged; continue with Newton method */
2253ecd9318SAlp Dener   while (tao->reason == TAO_CONTINUE_ITERATING) {
226e1e80dc8SAlp Dener     /* Call general purpose update function */
227dbbe0bcdSBarry Smith     PetscTryTypeMethod(tao, update, tao->niter, tao->user_update);
2288931d482SJason Sarich     ++tao->niter;
229ae93cb3cSJason Sarich     tao->ksp_its = 0;
230a7e14dcfSSatish Balay     /* Compute the Hessian */
2311baa6e33SBarry Smith     if (needH) PetscCall(TaoComputeHessian(tao, tao->solution, tao->hessian, tao->hessian_pre));
232a7e14dcfSSatish Balay 
2330c51296cSAlp Dener     if (tl->bfgs_pre) {
234a7e14dcfSSatish Balay       /* Update the limited memory preconditioner */
2359566063dSJacob Faibussowitsch       PetscCall(MatLMVMUpdate(tl->M, tao->solution, tao->gradient));
236a7e14dcfSSatish Balay       ++bfgsUpdates;
237a7e14dcfSSatish Balay     }
2389566063dSJacob Faibussowitsch     PetscCall(KSPSetOperators(tao->ksp, tao->hessian, tao->hessian_pre));
239a7e14dcfSSatish Balay     /* Solve the Newton system of equations */
2409566063dSJacob Faibussowitsch     PetscCall(KSPCGSetRadius(tao->ksp, tl->max_radius));
2419566063dSJacob Faibussowitsch     PetscCall(KSPSolve(tao->ksp, tao->gradient, tao->stepdirection));
2429566063dSJacob Faibussowitsch     PetscCall(KSPGetIterationNumber(tao->ksp, &its));
243a7e14dcfSSatish Balay     tao->ksp_its += its;
244ae93cb3cSJason Sarich     tao->ksp_tot_its += its;
2459566063dSJacob Faibussowitsch     PetscCall(KSPCGGetNormD(tao->ksp, &norm_d));
246a7e14dcfSSatish Balay 
247a7e14dcfSSatish Balay     if (0.0 == tao->trust) {
248a7e14dcfSSatish Balay       /* Radius was uninitialized; use the norm of the direction */
249a7e14dcfSSatish Balay       if (norm_d > 0.0) {
250a7e14dcfSSatish Balay         tao->trust = norm_d;
251a7e14dcfSSatish Balay 
252a7e14dcfSSatish Balay         /* Modify the radius if it is too large or small */
253a7e14dcfSSatish Balay         tao->trust = PetscMax(tao->trust, tl->min_radius);
254a7e14dcfSSatish Balay         tao->trust = PetscMin(tao->trust, tl->max_radius);
25553506e15SBarry Smith       } else {
256a7e14dcfSSatish Balay         /* The direction was bad; set radius to default value and re-solve
257a7e14dcfSSatish Balay            the trust-region subproblem to get a direction */
258a7e14dcfSSatish Balay         tao->trust = tao->trust0;
259a7e14dcfSSatish Balay 
260a7e14dcfSSatish Balay         /* Modify the radius if it is too large or small */
261a7e14dcfSSatish Balay         tao->trust = PetscMax(tao->trust, tl->min_radius);
262a7e14dcfSSatish Balay         tao->trust = PetscMin(tao->trust, tl->max_radius);
263a7e14dcfSSatish Balay 
2649566063dSJacob Faibussowitsch         PetscCall(KSPCGSetRadius(tao->ksp, tl->max_radius));
2659566063dSJacob Faibussowitsch         PetscCall(KSPSolve(tao->ksp, tao->gradient, tao->stepdirection));
2669566063dSJacob Faibussowitsch         PetscCall(KSPGetIterationNumber(tao->ksp, &its));
267a7e14dcfSSatish Balay         tao->ksp_its += its;
2682d9aa51bSJason Sarich         tao->ksp_tot_its += its;
2699566063dSJacob Faibussowitsch         PetscCall(KSPCGGetNormD(tao->ksp, &norm_d));
270a7e14dcfSSatish Balay 
2713c859ba3SBarry Smith         PetscCheck(norm_d != 0.0, PetscObjectComm((PetscObject)tao), PETSC_ERR_PLIB, "Initial direction zero");
272a7e14dcfSSatish Balay       }
273a7e14dcfSSatish Balay     }
274a7e14dcfSSatish Balay 
2759566063dSJacob Faibussowitsch     PetscCall(VecScale(tao->stepdirection, -1.0));
2769566063dSJacob Faibussowitsch     PetscCall(KSPGetConvergedReason(tao->ksp, &ksp_reason));
2770c51296cSAlp Dener     if ((KSP_DIVERGED_INDEFINITE_PC == ksp_reason) && (tl->bfgs_pre)) {
278a7e14dcfSSatish Balay       /* Preconditioner is numerically indefinite; reset the
279a7e14dcfSSatish Balay          approximate if using BFGS preconditioning. */
2809566063dSJacob Faibussowitsch       PetscCall(MatLMVMReset(tl->M, PETSC_FALSE));
2819566063dSJacob Faibussowitsch       PetscCall(MatLMVMUpdate(tl->M, tao->solution, tao->gradient));
282a7e14dcfSSatish Balay       bfgsUpdates = 1;
283a7e14dcfSSatish Balay     }
284a7e14dcfSSatish Balay 
285a7e14dcfSSatish Balay     /* Check trust-region reduction conditions */
286a7e14dcfSSatish Balay     tr_reject = 0;
287a7e14dcfSSatish Balay     if (NTL_UPDATE_REDUCTION == tl->update_type) {
288a7e14dcfSSatish Balay       /* Get predicted reduction */
2899566063dSJacob Faibussowitsch       PetscCall(KSPCGGetObjFcn(tao->ksp, &prered));
290a7e14dcfSSatish Balay       if (prered >= 0.0) {
291a7e14dcfSSatish Balay         /* The predicted reduction has the wrong sign.  This cannot
292a7e14dcfSSatish Balay            happen in infinite precision arithmetic.  Step should
293a7e14dcfSSatish Balay            be rejected! */
294a7e14dcfSSatish Balay         tao->trust = tl->alpha1 * PetscMin(tao->trust, norm_d);
295a7e14dcfSSatish Balay         tr_reject  = 1;
29653506e15SBarry Smith       } else {
297a7e14dcfSSatish Balay         /* Compute trial step and function value */
2989566063dSJacob Faibussowitsch         PetscCall(VecCopy(tao->solution, tl->W));
2999566063dSJacob Faibussowitsch         PetscCall(VecAXPY(tl->W, 1.0, tao->stepdirection));
3009566063dSJacob Faibussowitsch         PetscCall(TaoComputeObjective(tao, tl->W, &ftrial));
301a7e14dcfSSatish Balay 
302a7e14dcfSSatish Balay         if (PetscIsInfOrNanReal(ftrial)) {
303a7e14dcfSSatish Balay           tao->trust = tl->alpha1 * PetscMin(tao->trust, norm_d);
304a7e14dcfSSatish Balay           tr_reject  = 1;
30553506e15SBarry Smith         } else {
306a7e14dcfSSatish Balay           /* Compute the actual reduction */
307a7e14dcfSSatish Balay           actred = f - ftrial;
308a7e14dcfSSatish Balay           prered = -prered;
3099371c9d4SSatish Balay           if ((PetscAbsScalar(actred) <= tl->epsilon) && (PetscAbsScalar(prered) <= tl->epsilon)) {
310a7e14dcfSSatish Balay             kappa = 1.0;
31153506e15SBarry Smith           } else {
312a7e14dcfSSatish Balay             kappa = actred / prered;
313a7e14dcfSSatish Balay           }
314a7e14dcfSSatish Balay 
315a7e14dcfSSatish Balay           /* Accept or reject the step and update radius */
316a7e14dcfSSatish Balay           if (kappa < tl->eta1) {
317a7e14dcfSSatish Balay             /* Reject the step */
318a7e14dcfSSatish Balay             tao->trust = tl->alpha1 * PetscMin(tao->trust, norm_d);
319a7e14dcfSSatish Balay             tr_reject  = 1;
32053506e15SBarry Smith           } else {
321a7e14dcfSSatish Balay             /* Accept the step */
322a7e14dcfSSatish Balay             if (kappa < tl->eta2) {
323a7e14dcfSSatish Balay               /* Marginal bad step */
324a7e14dcfSSatish Balay               tao->trust = tl->alpha2 * PetscMin(tao->trust, norm_d);
32553506e15SBarry Smith             } else if (kappa < tl->eta3) {
326a7e14dcfSSatish Balay               /* Reasonable step */
327a7e14dcfSSatish Balay               tao->trust = tl->alpha3 * tao->trust;
32853506e15SBarry Smith             } else if (kappa < tl->eta4) {
329a7e14dcfSSatish Balay               /* Good step */
330a7e14dcfSSatish Balay               tao->trust = PetscMax(tl->alpha4 * norm_d, tao->trust);
33153506e15SBarry Smith             } else {
332a7e14dcfSSatish Balay               /* Very good step */
333a7e14dcfSSatish Balay               tao->trust = PetscMax(tl->alpha5 * norm_d, tao->trust);
334a7e14dcfSSatish Balay             }
335a7e14dcfSSatish Balay           }
336a7e14dcfSSatish Balay         }
337a7e14dcfSSatish Balay       }
33853506e15SBarry Smith     } else {
339a7e14dcfSSatish Balay       /* Get predicted reduction */
3409566063dSJacob Faibussowitsch       PetscCall(KSPCGGetObjFcn(tao->ksp, &prered));
341a7e14dcfSSatish Balay       if (prered >= 0.0) {
342a7e14dcfSSatish Balay         /* The predicted reduction has the wrong sign.  This cannot
343a7e14dcfSSatish Balay            happen in infinite precision arithmetic.  Step should
344a7e14dcfSSatish Balay            be rejected! */
345a7e14dcfSSatish Balay         tao->trust = tl->gamma1 * PetscMin(tao->trust, norm_d);
346a7e14dcfSSatish Balay         tr_reject  = 1;
34753506e15SBarry Smith       } else {
3489566063dSJacob Faibussowitsch         PetscCall(VecCopy(tao->solution, tl->W));
3499566063dSJacob Faibussowitsch         PetscCall(VecAXPY(tl->W, 1.0, tao->stepdirection));
3509566063dSJacob Faibussowitsch         PetscCall(TaoComputeObjective(tao, tl->W, &ftrial));
351a7e14dcfSSatish Balay         if (PetscIsInfOrNanReal(ftrial)) {
352a7e14dcfSSatish Balay           tao->trust = tl->gamma1 * PetscMin(tao->trust, norm_d);
353a7e14dcfSSatish Balay           tr_reject  = 1;
35453506e15SBarry Smith         } else {
3559566063dSJacob Faibussowitsch           PetscCall(VecDot(tao->gradient, tao->stepdirection, &gdx));
356a7e14dcfSSatish Balay 
357a7e14dcfSSatish Balay           actred = f - ftrial;
358a7e14dcfSSatish Balay           prered = -prered;
3599371c9d4SSatish Balay           if ((PetscAbsScalar(actred) <= tl->epsilon) && (PetscAbsScalar(prered) <= tl->epsilon)) {
360a7e14dcfSSatish Balay             kappa = 1.0;
36153506e15SBarry Smith           } else {
362a7e14dcfSSatish Balay             kappa = actred / prered;
363a7e14dcfSSatish Balay           }
364a7e14dcfSSatish Balay 
365a7e14dcfSSatish Balay           tau_1   = tl->theta * gdx / (tl->theta * gdx - (1.0 - tl->theta) * prered + actred);
366a7e14dcfSSatish Balay           tau_2   = tl->theta * gdx / (tl->theta * gdx + (1.0 + tl->theta) * prered - actred);
367a7e14dcfSSatish Balay           tau_min = PetscMin(tau_1, tau_2);
368a7e14dcfSSatish Balay           tau_max = PetscMax(tau_1, tau_2);
369a7e14dcfSSatish Balay 
370a7e14dcfSSatish Balay           if (kappa >= 1.0 - tl->mu1) {
371a7e14dcfSSatish Balay             /* Great agreement; accept step and update radius */
372a7e14dcfSSatish Balay             if (tau_max < 1.0) {
373a7e14dcfSSatish Balay               tao->trust = PetscMax(tao->trust, tl->gamma3 * norm_d);
37453506e15SBarry Smith             } else if (tau_max > tl->gamma4) {
375a7e14dcfSSatish Balay               tao->trust = PetscMax(tao->trust, tl->gamma4 * norm_d);
37653506e15SBarry Smith             } else {
377a7e14dcfSSatish Balay               tao->trust = PetscMax(tao->trust, tau_max * norm_d);
378a7e14dcfSSatish Balay             }
37953506e15SBarry Smith           } else if (kappa >= 1.0 - tl->mu2) {
380a7e14dcfSSatish Balay             /* Good agreement */
381a7e14dcfSSatish Balay 
382a7e14dcfSSatish Balay             if (tau_max < tl->gamma2) {
383a7e14dcfSSatish Balay               tao->trust = tl->gamma2 * PetscMin(tao->trust, norm_d);
38453506e15SBarry Smith             } else if (tau_max > tl->gamma3) {
385a7e14dcfSSatish Balay               tao->trust = PetscMax(tao->trust, tl->gamma3 * norm_d);
386a7e14dcfSSatish Balay             } else if (tau_max < 1.0) {
387a7e14dcfSSatish Balay               tao->trust = tau_max * PetscMin(tao->trust, norm_d);
38853506e15SBarry Smith             } else {
389a7e14dcfSSatish Balay               tao->trust = PetscMax(tao->trust, tau_max * norm_d);
390a7e14dcfSSatish Balay             }
39153506e15SBarry Smith           } else {
392a7e14dcfSSatish Balay             /* Not good agreement */
393a7e14dcfSSatish Balay             if (tau_min > 1.0) {
394a7e14dcfSSatish Balay               tao->trust = tl->gamma2 * PetscMin(tao->trust, norm_d);
39553506e15SBarry Smith             } else if (tau_max < tl->gamma1) {
396a7e14dcfSSatish Balay               tao->trust = tl->gamma1 * PetscMin(tao->trust, norm_d);
39753506e15SBarry Smith             } else if ((tau_min < tl->gamma1) && (tau_max >= 1.0)) {
398a7e14dcfSSatish Balay               tao->trust = tl->gamma1 * PetscMin(tao->trust, norm_d);
39953506e15SBarry Smith             } else if ((tau_1 >= tl->gamma1) && (tau_1 < 1.0) && ((tau_2 < tl->gamma1) || (tau_2 >= 1.0))) {
400a7e14dcfSSatish Balay               tao->trust = tau_1 * PetscMin(tao->trust, norm_d);
40153506e15SBarry Smith             } else if ((tau_2 >= tl->gamma1) && (tau_2 < 1.0) && ((tau_1 < tl->gamma1) || (tau_2 >= 1.0))) {
402a7e14dcfSSatish Balay               tao->trust = tau_2 * PetscMin(tao->trust, norm_d);
40353506e15SBarry Smith             } else {
404a7e14dcfSSatish Balay               tao->trust = tau_max * PetscMin(tao->trust, norm_d);
405a7e14dcfSSatish Balay             }
406a7e14dcfSSatish Balay             tr_reject = 1;
407a7e14dcfSSatish Balay           }
408a7e14dcfSSatish Balay         }
409a7e14dcfSSatish Balay       }
410a7e14dcfSSatish Balay     }
411a7e14dcfSSatish Balay 
412a7e14dcfSSatish Balay     if (tr_reject) {
413a7e14dcfSSatish Balay       /* The trust-region constraints rejected the step.  Apply a linesearch.
414a7e14dcfSSatish Balay          Check for descent direction. */
4159566063dSJacob Faibussowitsch       PetscCall(VecDot(tao->stepdirection, tao->gradient, &gdx));
416a7e14dcfSSatish Balay       if ((gdx >= 0.0) || PetscIsInfOrNanReal(gdx)) {
417a7e14dcfSSatish Balay         /* Newton step is not descent or direction produced Inf or NaN */
418a7e14dcfSSatish Balay 
4190c51296cSAlp Dener         if (!tl->bfgs_pre) {
420a7e14dcfSSatish Balay           /* We don't have the bfgs matrix around and updated
421a7e14dcfSSatish Balay              Must use gradient direction in this case */
4229566063dSJacob Faibussowitsch           PetscCall(VecCopy(tao->gradient, tao->stepdirection));
4239566063dSJacob Faibussowitsch           PetscCall(VecScale(tao->stepdirection, -1.0));
424a7e14dcfSSatish Balay           ++tl->grad;
425a7e14dcfSSatish Balay           stepType = NTL_GRADIENT;
42653506e15SBarry Smith         } else {
427a7e14dcfSSatish Balay           /* Attempt to use the BFGS direction */
4289566063dSJacob Faibussowitsch           PetscCall(MatSolve(tl->M, tao->gradient, tao->stepdirection));
4299566063dSJacob Faibussowitsch           PetscCall(VecScale(tao->stepdirection, -1.0));
430a7e14dcfSSatish Balay 
431a7e14dcfSSatish Balay           /* Check for success (descent direction) */
4329566063dSJacob Faibussowitsch           PetscCall(VecDot(tao->stepdirection, tao->gradient, &gdx));
433a7e14dcfSSatish Balay           if ((gdx >= 0) || PetscIsInfOrNanReal(gdx)) {
434a7e14dcfSSatish Balay             /* BFGS direction is not descent or direction produced not a number
435a7e14dcfSSatish Balay                We can assert bfgsUpdates > 1 in this case because
436a7e14dcfSSatish Balay                the first solve produces the scaled gradient direction,
437a7e14dcfSSatish Balay                which is guaranteed to be descent */
438a7e14dcfSSatish Balay 
439a7e14dcfSSatish Balay             /* Use steepest descent direction (scaled) */
4409566063dSJacob Faibussowitsch             PetscCall(MatLMVMReset(tl->M, PETSC_FALSE));
4419566063dSJacob Faibussowitsch             PetscCall(MatLMVMUpdate(tl->M, tao->solution, tao->gradient));
4429566063dSJacob Faibussowitsch             PetscCall(MatSolve(tl->M, tao->gradient, tao->stepdirection));
4439566063dSJacob Faibussowitsch             PetscCall(VecScale(tao->stepdirection, -1.0));
444a7e14dcfSSatish Balay 
445a7e14dcfSSatish Balay             bfgsUpdates = 1;
4460c51296cSAlp Dener             ++tl->grad;
4470c51296cSAlp Dener             stepType = NTL_GRADIENT;
44853506e15SBarry Smith           } else {
4499566063dSJacob Faibussowitsch             PetscCall(MatLMVMGetUpdateCount(tl->M, &bfgsUpdates));
450a7e14dcfSSatish Balay             if (1 == bfgsUpdates) {
451a7e14dcfSSatish Balay               /* The first BFGS direction is always the scaled gradient */
4520c51296cSAlp Dener               ++tl->grad;
4530c51296cSAlp Dener               stepType = NTL_GRADIENT;
45453506e15SBarry Smith             } else {
455a7e14dcfSSatish Balay               ++tl->bfgs;
456a7e14dcfSSatish Balay               stepType = NTL_BFGS;
457a7e14dcfSSatish Balay             }
458a7e14dcfSSatish Balay           }
459a7e14dcfSSatish Balay         }
46053506e15SBarry Smith       } else {
461a7e14dcfSSatish Balay         /* Computed Newton step is descent */
462a7e14dcfSSatish Balay         ++tl->newt;
463a7e14dcfSSatish Balay         stepType = NTL_NEWTON;
464a7e14dcfSSatish Balay       }
465a7e14dcfSSatish Balay 
466a7e14dcfSSatish Balay       /* Perform the linesearch */
467a7e14dcfSSatish Balay       fold = f;
4689566063dSJacob Faibussowitsch       PetscCall(VecCopy(tao->solution, tl->Xold));
4699566063dSJacob Faibussowitsch       PetscCall(VecCopy(tao->gradient, tl->Gold));
470a7e14dcfSSatish Balay 
471a7e14dcfSSatish Balay       step = 1.0;
4729566063dSJacob Faibussowitsch       PetscCall(TaoLineSearchApply(tao->linesearch, tao->solution, &f, tao->gradient, tao->stepdirection, &step, &ls_reason));
4739566063dSJacob Faibussowitsch       PetscCall(TaoAddLineSearchCounts(tao));
474a7e14dcfSSatish Balay 
47553506e15SBarry Smith       while (ls_reason != TAOLINESEARCH_SUCCESS && ls_reason != TAOLINESEARCH_SUCCESS_USER && stepType != NTL_GRADIENT) { /* Linesearch failed */
476a7e14dcfSSatish Balay         /* Linesearch failed */
477a7e14dcfSSatish Balay         f = fold;
4789566063dSJacob Faibussowitsch         PetscCall(VecCopy(tl->Xold, tao->solution));
4799566063dSJacob Faibussowitsch         PetscCall(VecCopy(tl->Gold, tao->gradient));
480a7e14dcfSSatish Balay 
481a7e14dcfSSatish Balay         switch (stepType) {
482a7e14dcfSSatish Balay         case NTL_NEWTON:
483a7e14dcfSSatish Balay           /* Failed to obtain acceptable iterate with Newton step */
484a7e14dcfSSatish Balay 
4850c51296cSAlp Dener           if (tl->bfgs_pre) {
486a7e14dcfSSatish Balay             /* We don't have the bfgs matrix around and being updated
487a7e14dcfSSatish Balay                Must use gradient direction in this case */
4889566063dSJacob Faibussowitsch             PetscCall(VecCopy(tao->gradient, tao->stepdirection));
489a7e14dcfSSatish Balay             ++tl->grad;
490a7e14dcfSSatish Balay             stepType = NTL_GRADIENT;
49153506e15SBarry Smith           } else {
492a7e14dcfSSatish Balay             /* Attempt to use the BFGS direction */
4939566063dSJacob Faibussowitsch             PetscCall(MatSolve(tl->M, tao->gradient, tao->stepdirection));
494a7e14dcfSSatish Balay 
495a7e14dcfSSatish Balay             /* Check for success (descent direction) */
4969566063dSJacob Faibussowitsch             PetscCall(VecDot(tao->stepdirection, tao->gradient, &gdx));
497a7e14dcfSSatish Balay             if ((gdx <= 0) || PetscIsInfOrNanReal(gdx)) {
498a7e14dcfSSatish Balay               /* BFGS direction is not descent or direction produced
499a7e14dcfSSatish Balay                  not a number.  We can assert bfgsUpdates > 1 in this case
500a7e14dcfSSatish Balay                  Use steepest descent direction (scaled) */
5019566063dSJacob Faibussowitsch               PetscCall(MatLMVMReset(tl->M, PETSC_FALSE));
5029566063dSJacob Faibussowitsch               PetscCall(MatLMVMUpdate(tl->M, tao->solution, tao->gradient));
5039566063dSJacob Faibussowitsch               PetscCall(MatSolve(tl->M, tao->gradient, tao->stepdirection));
504a7e14dcfSSatish Balay 
505a7e14dcfSSatish Balay               bfgsUpdates = 1;
5060c51296cSAlp Dener               ++tl->grad;
5070c51296cSAlp Dener               stepType = NTL_GRADIENT;
50853506e15SBarry Smith             } else {
5099566063dSJacob Faibussowitsch               PetscCall(MatLMVMGetUpdateCount(tl->M, &bfgsUpdates));
510a7e14dcfSSatish Balay               if (1 == bfgsUpdates) {
511a7e14dcfSSatish Balay                 /* The first BFGS direction is always the scaled gradient */
5120c51296cSAlp Dener                 ++tl->grad;
5130c51296cSAlp Dener                 stepType = NTL_GRADIENT;
51453506e15SBarry Smith               } else {
515a7e14dcfSSatish Balay                 ++tl->bfgs;
516a7e14dcfSSatish Balay                 stepType = NTL_BFGS;
517a7e14dcfSSatish Balay               }
518a7e14dcfSSatish Balay             }
519a7e14dcfSSatish Balay           }
520a7e14dcfSSatish Balay           break;
521a7e14dcfSSatish Balay 
522a7e14dcfSSatish Balay         case NTL_BFGS:
523a7e14dcfSSatish Balay           /* Can only enter if pc_type == NTL_PC_BFGS
524a7e14dcfSSatish Balay              Failed to obtain acceptable iterate with BFGS step
525a7e14dcfSSatish Balay              Attempt to use the scaled gradient direction */
5269566063dSJacob Faibussowitsch           PetscCall(MatLMVMReset(tl->M, PETSC_FALSE));
5279566063dSJacob Faibussowitsch           PetscCall(MatLMVMUpdate(tl->M, tao->solution, tao->gradient));
5289566063dSJacob Faibussowitsch           PetscCall(MatSolve(tl->M, tao->gradient, tao->stepdirection));
529a7e14dcfSSatish Balay 
530a7e14dcfSSatish Balay           bfgsUpdates = 1;
531a7e14dcfSSatish Balay           ++tl->grad;
532a7e14dcfSSatish Balay           stepType = NTL_GRADIENT;
533a7e14dcfSSatish Balay           break;
534a7e14dcfSSatish Balay         }
5359566063dSJacob Faibussowitsch         PetscCall(VecScale(tao->stepdirection, -1.0));
536a7e14dcfSSatish Balay 
537a7e14dcfSSatish Balay         /* This may be incorrect; linesearch has values for stepmax and stepmin
538a7e14dcfSSatish Balay            that should be reset. */
539a7e14dcfSSatish Balay         step = 1.0;
5409566063dSJacob Faibussowitsch         PetscCall(TaoLineSearchApply(tao->linesearch, tao->solution, &f, tao->gradient, tao->stepdirection, &step, &ls_reason));
5419566063dSJacob Faibussowitsch         PetscCall(TaoAddLineSearchCounts(tao));
542a7e14dcfSSatish Balay       }
543a7e14dcfSSatish Balay 
54453506e15SBarry Smith       if (ls_reason != TAOLINESEARCH_SUCCESS && ls_reason != TAOLINESEARCH_SUCCESS_USER) {
545a7e14dcfSSatish Balay         /* Failed to find an improving point */
546a7e14dcfSSatish Balay         f = fold;
5479566063dSJacob Faibussowitsch         PetscCall(VecCopy(tl->Xold, tao->solution));
5489566063dSJacob Faibussowitsch         PetscCall(VecCopy(tl->Gold, tao->gradient));
549a7e14dcfSSatish Balay         tao->trust  = 0.0;
550a7e14dcfSSatish Balay         step        = 0.0;
551a7e14dcfSSatish Balay         tao->reason = TAO_DIVERGED_LS_FAILURE;
552a7e14dcfSSatish Balay         break;
55353506e15SBarry Smith       } else if (stepType == NTL_NEWTON) {
554a7e14dcfSSatish Balay         if (step < tl->nu1) {
555a7e14dcfSSatish Balay           /* Very bad step taken; reduce radius */
556a7e14dcfSSatish Balay           tao->trust = tl->omega1 * PetscMin(norm_d, tao->trust);
55753506e15SBarry Smith         } else if (step < tl->nu2) {
558a7e14dcfSSatish Balay           /* Reasonably bad step taken; reduce radius */
559a7e14dcfSSatish Balay           tao->trust = tl->omega2 * PetscMin(norm_d, tao->trust);
56053506e15SBarry Smith         } else if (step < tl->nu3) {
561a7e14dcfSSatish Balay           /* Reasonable step was taken; leave radius alone */
562a7e14dcfSSatish Balay           if (tl->omega3 < 1.0) {
563a7e14dcfSSatish Balay             tao->trust = tl->omega3 * PetscMin(norm_d, tao->trust);
56453506e15SBarry Smith           } else if (tl->omega3 > 1.0) {
565a7e14dcfSSatish Balay             tao->trust = PetscMax(tl->omega3 * norm_d, tao->trust);
566a7e14dcfSSatish Balay           }
56753506e15SBarry Smith         } else if (step < tl->nu4) {
568a7e14dcfSSatish Balay           /* Full step taken; increase the radius */
569a7e14dcfSSatish Balay           tao->trust = PetscMax(tl->omega4 * norm_d, tao->trust);
57053506e15SBarry Smith         } else {
571a7e14dcfSSatish Balay           /* More than full step taken; increase the radius */
572a7e14dcfSSatish Balay           tao->trust = PetscMax(tl->omega5 * norm_d, tao->trust);
573a7e14dcfSSatish Balay         }
57453506e15SBarry Smith       } else {
575a7e14dcfSSatish Balay         /* Newton step was not good; reduce the radius */
576a7e14dcfSSatish Balay         tao->trust = tl->omega1 * PetscMin(norm_d, tao->trust);
577a7e14dcfSSatish Balay       }
57853506e15SBarry Smith     } else {
579a7e14dcfSSatish Balay       /* Trust-region step is accepted */
5809566063dSJacob Faibussowitsch       PetscCall(VecCopy(tl->W, tao->solution));
581a7e14dcfSSatish Balay       f = ftrial;
5829566063dSJacob Faibussowitsch       PetscCall(TaoComputeGradient(tao, tao->solution, tao->gradient));
583a7e14dcfSSatish Balay       ++tl->ntrust;
584a7e14dcfSSatish Balay     }
585a7e14dcfSSatish Balay 
586a7e14dcfSSatish Balay     /* The radius may have been increased; modify if it is too large */
587a7e14dcfSSatish Balay     tao->trust = PetscMin(tao->trust, tl->max_radius);
588a7e14dcfSSatish Balay 
589e4cb33bbSBarry Smith     /* Check for converged */
5909566063dSJacob Faibussowitsch     PetscCall(VecNorm(tao->gradient, NORM_2, &gnorm));
5913c859ba3SBarry Smith     PetscCheck(!PetscIsInfOrNanReal(f) && !PetscIsInfOrNanReal(gnorm), PetscObjectComm((PetscObject)tao), PETSC_ERR_USER, "User provided compute function generated Not-a-Number");
592a7e14dcfSSatish Balay     needH = 1;
593a7e14dcfSSatish Balay 
5949566063dSJacob Faibussowitsch     PetscCall(TaoLogConvergenceHistory(tao, f, gnorm, 0.0, tao->ksp_its));
5959566063dSJacob Faibussowitsch     PetscCall(TaoMonitor(tao, tao->niter, f, gnorm, 0.0, step));
596dbbe0bcdSBarry Smith     PetscUseTypeMethod(tao, convergencetest, tao->cnvP);
597a7e14dcfSSatish Balay   }
598*3ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
599a7e14dcfSSatish Balay }
600a7e14dcfSSatish Balay 
601a7e14dcfSSatish Balay /* ---------------------------------------------------------- */
602d71ae5a4SJacob Faibussowitsch static PetscErrorCode TaoSetUp_NTL(Tao tao)
603d71ae5a4SJacob Faibussowitsch {
604a7e14dcfSSatish Balay   TAO_NTL *tl = (TAO_NTL *)tao->data;
605a7e14dcfSSatish Balay 
606a7e14dcfSSatish Balay   PetscFunctionBegin;
6079566063dSJacob Faibussowitsch   if (!tao->gradient) PetscCall(VecDuplicate(tao->solution, &tao->gradient));
6089566063dSJacob Faibussowitsch   if (!tao->stepdirection) PetscCall(VecDuplicate(tao->solution, &tao->stepdirection));
6099566063dSJacob Faibussowitsch   if (!tl->W) PetscCall(VecDuplicate(tao->solution, &tl->W));
6109566063dSJacob Faibussowitsch   if (!tl->Xold) PetscCall(VecDuplicate(tao->solution, &tl->Xold));
6119566063dSJacob Faibussowitsch   if (!tl->Gold) PetscCall(VecDuplicate(tao->solution, &tl->Gold));
61283c8fe1dSLisandro Dalcin   tl->bfgs_pre = NULL;
61383c8fe1dSLisandro Dalcin   tl->M        = NULL;
614*3ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
615a7e14dcfSSatish Balay }
616a7e14dcfSSatish Balay 
617a7e14dcfSSatish Balay /*------------------------------------------------------------*/
618d71ae5a4SJacob Faibussowitsch static PetscErrorCode TaoDestroy_NTL(Tao tao)
619d71ae5a4SJacob Faibussowitsch {
620a7e14dcfSSatish Balay   TAO_NTL *tl = (TAO_NTL *)tao->data;
621a7e14dcfSSatish Balay 
622a7e14dcfSSatish Balay   PetscFunctionBegin;
623a7e14dcfSSatish Balay   if (tao->setupcalled) {
6249566063dSJacob Faibussowitsch     PetscCall(VecDestroy(&tl->W));
6259566063dSJacob Faibussowitsch     PetscCall(VecDestroy(&tl->Xold));
6269566063dSJacob Faibussowitsch     PetscCall(VecDestroy(&tl->Gold));
627a7e14dcfSSatish Balay   }
628a958fbfcSStefano Zampini   PetscCall(KSPDestroy(&tao->ksp));
6299566063dSJacob Faibussowitsch   PetscCall(PetscFree(tao->data));
630*3ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
631a7e14dcfSSatish Balay }
632a7e14dcfSSatish Balay 
633a7e14dcfSSatish Balay /*------------------------------------------------------------*/
634d71ae5a4SJacob Faibussowitsch static PetscErrorCode TaoSetFromOptions_NTL(Tao tao, PetscOptionItems *PetscOptionsObject)
635d71ae5a4SJacob Faibussowitsch {
636a7e14dcfSSatish Balay   TAO_NTL *tl = (TAO_NTL *)tao->data;
637a7e14dcfSSatish Balay 
638a7e14dcfSSatish Balay   PetscFunctionBegin;
639d0609cedSBarry Smith   PetscOptionsHeadBegin(PetscOptionsObject, "Newton trust region with line search method for unconstrained optimization");
6409566063dSJacob Faibussowitsch   PetscCall(PetscOptionsEList("-tao_ntl_init_type", "radius initialization type", "", NTL_INIT, NTL_INIT_TYPES, NTL_INIT[tl->init_type], &tl->init_type, NULL));
6419566063dSJacob Faibussowitsch   PetscCall(PetscOptionsEList("-tao_ntl_update_type", "radius update type", "", NTL_UPDATE, NTL_UPDATE_TYPES, NTL_UPDATE[tl->update_type], &tl->update_type, NULL));
6429566063dSJacob Faibussowitsch   PetscCall(PetscOptionsReal("-tao_ntl_eta1", "poor steplength; reduce radius", "", tl->eta1, &tl->eta1, NULL));
6439566063dSJacob Faibussowitsch   PetscCall(PetscOptionsReal("-tao_ntl_eta2", "reasonable steplength; leave radius alone", "", tl->eta2, &tl->eta2, NULL));
6449566063dSJacob Faibussowitsch   PetscCall(PetscOptionsReal("-tao_ntl_eta3", "good steplength; increase radius", "", tl->eta3, &tl->eta3, NULL));
6459566063dSJacob Faibussowitsch   PetscCall(PetscOptionsReal("-tao_ntl_eta4", "excellent steplength; greatly increase radius", "", tl->eta4, &tl->eta4, NULL));
6469566063dSJacob Faibussowitsch   PetscCall(PetscOptionsReal("-tao_ntl_alpha1", "", "", tl->alpha1, &tl->alpha1, NULL));
6479566063dSJacob Faibussowitsch   PetscCall(PetscOptionsReal("-tao_ntl_alpha2", "", "", tl->alpha2, &tl->alpha2, NULL));
6489566063dSJacob Faibussowitsch   PetscCall(PetscOptionsReal("-tao_ntl_alpha3", "", "", tl->alpha3, &tl->alpha3, NULL));
6499566063dSJacob Faibussowitsch   PetscCall(PetscOptionsReal("-tao_ntl_alpha4", "", "", tl->alpha4, &tl->alpha4, NULL));
6509566063dSJacob Faibussowitsch   PetscCall(PetscOptionsReal("-tao_ntl_alpha5", "", "", tl->alpha5, &tl->alpha5, NULL));
6519566063dSJacob Faibussowitsch   PetscCall(PetscOptionsReal("-tao_ntl_nu1", "poor steplength; reduce radius", "", tl->nu1, &tl->nu1, NULL));
6529566063dSJacob Faibussowitsch   PetscCall(PetscOptionsReal("-tao_ntl_nu2", "reasonable steplength; leave radius alone", "", tl->nu2, &tl->nu2, NULL));
6539566063dSJacob Faibussowitsch   PetscCall(PetscOptionsReal("-tao_ntl_nu3", "good steplength; increase radius", "", tl->nu3, &tl->nu3, NULL));
6549566063dSJacob Faibussowitsch   PetscCall(PetscOptionsReal("-tao_ntl_nu4", "excellent steplength; greatly increase radius", "", tl->nu4, &tl->nu4, NULL));
6559566063dSJacob Faibussowitsch   PetscCall(PetscOptionsReal("-tao_ntl_omega1", "", "", tl->omega1, &tl->omega1, NULL));
6569566063dSJacob Faibussowitsch   PetscCall(PetscOptionsReal("-tao_ntl_omega2", "", "", tl->omega2, &tl->omega2, NULL));
6579566063dSJacob Faibussowitsch   PetscCall(PetscOptionsReal("-tao_ntl_omega3", "", "", tl->omega3, &tl->omega3, NULL));
6589566063dSJacob Faibussowitsch   PetscCall(PetscOptionsReal("-tao_ntl_omega4", "", "", tl->omega4, &tl->omega4, NULL));
6599566063dSJacob Faibussowitsch   PetscCall(PetscOptionsReal("-tao_ntl_omega5", "", "", tl->omega5, &tl->omega5, NULL));
6609566063dSJacob Faibussowitsch   PetscCall(PetscOptionsReal("-tao_ntl_mu1_i", "", "", tl->mu1_i, &tl->mu1_i, NULL));
6619566063dSJacob Faibussowitsch   PetscCall(PetscOptionsReal("-tao_ntl_mu2_i", "", "", tl->mu2_i, &tl->mu2_i, NULL));
6629566063dSJacob Faibussowitsch   PetscCall(PetscOptionsReal("-tao_ntl_gamma1_i", "", "", tl->gamma1_i, &tl->gamma1_i, NULL));
6639566063dSJacob Faibussowitsch   PetscCall(PetscOptionsReal("-tao_ntl_gamma2_i", "", "", tl->gamma2_i, &tl->gamma2_i, NULL));
6649566063dSJacob Faibussowitsch   PetscCall(PetscOptionsReal("-tao_ntl_gamma3_i", "", "", tl->gamma3_i, &tl->gamma3_i, NULL));
6659566063dSJacob Faibussowitsch   PetscCall(PetscOptionsReal("-tao_ntl_gamma4_i", "", "", tl->gamma4_i, &tl->gamma4_i, NULL));
6669566063dSJacob Faibussowitsch   PetscCall(PetscOptionsReal("-tao_ntl_theta_i", "", "", tl->theta_i, &tl->theta_i, NULL));
6679566063dSJacob Faibussowitsch   PetscCall(PetscOptionsReal("-tao_ntl_mu1", "", "", tl->mu1, &tl->mu1, NULL));
6689566063dSJacob Faibussowitsch   PetscCall(PetscOptionsReal("-tao_ntl_mu2", "", "", tl->mu2, &tl->mu2, NULL));
6699566063dSJacob Faibussowitsch   PetscCall(PetscOptionsReal("-tao_ntl_gamma1", "", "", tl->gamma1, &tl->gamma1, NULL));
6709566063dSJacob Faibussowitsch   PetscCall(PetscOptionsReal("-tao_ntl_gamma2", "", "", tl->gamma2, &tl->gamma2, NULL));
6719566063dSJacob Faibussowitsch   PetscCall(PetscOptionsReal("-tao_ntl_gamma3", "", "", tl->gamma3, &tl->gamma3, NULL));
6729566063dSJacob Faibussowitsch   PetscCall(PetscOptionsReal("-tao_ntl_gamma4", "", "", tl->gamma4, &tl->gamma4, NULL));
6739566063dSJacob Faibussowitsch   PetscCall(PetscOptionsReal("-tao_ntl_theta", "", "", tl->theta, &tl->theta, NULL));
6749566063dSJacob Faibussowitsch   PetscCall(PetscOptionsReal("-tao_ntl_min_radius", "lower bound on initial radius", "", tl->min_radius, &tl->min_radius, NULL));
6759566063dSJacob Faibussowitsch   PetscCall(PetscOptionsReal("-tao_ntl_max_radius", "upper bound on radius", "", tl->max_radius, &tl->max_radius, NULL));
6769566063dSJacob Faibussowitsch   PetscCall(PetscOptionsReal("-tao_ntl_epsilon", "tolerance used when computing actual and predicted reduction", "", tl->epsilon, &tl->epsilon, NULL));
677d0609cedSBarry Smith   PetscOptionsHeadEnd();
6789566063dSJacob Faibussowitsch   PetscCall(TaoLineSearchSetFromOptions(tao->linesearch));
6799566063dSJacob Faibussowitsch   PetscCall(KSPSetFromOptions(tao->ksp));
680*3ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
681a7e14dcfSSatish Balay }
682a7e14dcfSSatish Balay 
683a7e14dcfSSatish Balay /*------------------------------------------------------------*/
684d71ae5a4SJacob Faibussowitsch static PetscErrorCode TaoView_NTL(Tao tao, PetscViewer viewer)
685d71ae5a4SJacob Faibussowitsch {
686a7e14dcfSSatish Balay   TAO_NTL  *tl = (TAO_NTL *)tao->data;
687a7e14dcfSSatish Balay   PetscBool isascii;
688a7e14dcfSSatish Balay 
689a7e14dcfSSatish Balay   PetscFunctionBegin;
6909566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &isascii));
691a7e14dcfSSatish Balay   if (isascii) {
6929566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPushTab(viewer));
69363a3b9bcSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "Trust-region steps: %" PetscInt_FMT "\n", tl->ntrust));
69463a3b9bcSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "Newton search steps: %" PetscInt_FMT "\n", tl->newt));
69563a3b9bcSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "BFGS search steps: %" PetscInt_FMT "\n", tl->bfgs));
69663a3b9bcSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPrintf(viewer, "Gradient search steps: %" PetscInt_FMT "\n", tl->grad));
6979566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPopTab(viewer));
698a7e14dcfSSatish Balay   }
699*3ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
700a7e14dcfSSatish Balay }
701a7e14dcfSSatish Balay 
702a7e14dcfSSatish Balay /* ---------------------------------------------------------- */
7031522df2eSJason Sarich /*MC
7043850be85SAlp Dener   TAONTL - Newton's method with trust region globalization and line search fallback.
7051522df2eSJason Sarich   At each iteration, the Newton trust region method solves the system for d
7061522df2eSJason Sarich   and performs a line search in the d direction:
7071522df2eSJason Sarich 
7081522df2eSJason Sarich             min_d  .5 dT Hk d + gkT d,  s.t.   ||d|| < Delta_k
7091522df2eSJason Sarich 
7101522df2eSJason Sarich   Options Database Keys:
7119d0a60b2SAlp Dener + -tao_ntl_init_type - "constant","direction","interpolation"
7121522df2eSJason Sarich . -tao_ntl_update_type - "reduction","interpolation"
7131522df2eSJason Sarich . -tao_ntl_min_radius - lower bound on trust region radius
7141522df2eSJason Sarich . -tao_ntl_max_radius - upper bound on trust region radius
7151522df2eSJason Sarich . -tao_ntl_epsilon - tolerance for accepting actual / predicted reduction
7161522df2eSJason Sarich . -tao_ntl_mu1_i - mu1 interpolation init factor
7171522df2eSJason Sarich . -tao_ntl_mu2_i - mu2 interpolation init factor
7181522df2eSJason Sarich . -tao_ntl_gamma1_i - gamma1 interpolation init factor
7191522df2eSJason Sarich . -tao_ntl_gamma2_i - gamma2 interpolation init factor
7201522df2eSJason Sarich . -tao_ntl_gamma3_i - gamma3 interpolation init factor
7211522df2eSJason Sarich . -tao_ntl_gamma4_i - gamma4 interpolation init factor
7228966356dSPierre Jolivet . -tao_ntl_theta_i - theta1 interpolation init factor
7231522df2eSJason Sarich . -tao_ntl_eta1 - eta1 reduction update factor
7241522df2eSJason Sarich . -tao_ntl_eta2 - eta2 reduction update factor
7251522df2eSJason Sarich . -tao_ntl_eta3 - eta3 reduction update factor
7261522df2eSJason Sarich . -tao_ntl_eta4 - eta4 reduction update factor
7271522df2eSJason Sarich . -tao_ntl_alpha1 - alpha1 reduction update factor
7281522df2eSJason Sarich . -tao_ntl_alpha2 - alpha2 reduction update factor
7291522df2eSJason Sarich . -tao_ntl_alpha3 - alpha3 reduction update factor
7301522df2eSJason Sarich . -tao_ntl_alpha4 - alpha4 reduction update factor
7311522df2eSJason Sarich . -tao_ntl_alpha5 - alpha5 reduction update factor
7321522df2eSJason Sarich . -tao_ntl_mu1 - mu1 interpolation update
7331522df2eSJason Sarich . -tao_ntl_mu2 - mu2 interpolation update
7341522df2eSJason Sarich . -tao_ntl_gamma1 - gamma1 interpolation update
7351522df2eSJason Sarich . -tao_ntl_gamma2 - gamma2 interpolation update
7361522df2eSJason Sarich . -tao_ntl_gamma3 - gamma3 interpolation update
7371522df2eSJason Sarich . -tao_ntl_gamma4 - gamma4 interpolation update
7381522df2eSJason Sarich - -tao_ntl_theta - theta1 interpolation update
7391522df2eSJason Sarich 
7401eb8069cSJason Sarich   Level: beginner
7411522df2eSJason Sarich M*/
742d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode TaoCreate_NTL(Tao tao)
743d71ae5a4SJacob Faibussowitsch {
744a7e14dcfSSatish Balay   TAO_NTL    *tl;
7458caf6e8cSBarry Smith   const char *morethuente_type = TAOLINESEARCHMT;
74653506e15SBarry Smith 
747a7e14dcfSSatish Balay   PetscFunctionBegin;
7484dfa11a4SJacob Faibussowitsch   PetscCall(PetscNew(&tl));
749a7e14dcfSSatish Balay   tao->ops->setup          = TaoSetUp_NTL;
750a7e14dcfSSatish Balay   tao->ops->solve          = TaoSolve_NTL;
751a7e14dcfSSatish Balay   tao->ops->view           = TaoView_NTL;
752a7e14dcfSSatish Balay   tao->ops->setfromoptions = TaoSetFromOptions_NTL;
753a7e14dcfSSatish Balay   tao->ops->destroy        = TaoDestroy_NTL;
754a7e14dcfSSatish Balay 
7556552cf8aSJason Sarich   /* Override default settings (unless already changed) */
7566552cf8aSJason Sarich   if (!tao->max_it_changed) tao->max_it = 50;
7576552cf8aSJason Sarich   if (!tao->trust0_changed) tao->trust0 = 100.0;
7586552cf8aSJason Sarich 
759a7e14dcfSSatish Balay   tao->data = (void *)tl;
760a7e14dcfSSatish Balay 
761a7e14dcfSSatish Balay   /* Default values for trust-region radius update based on steplength */
762a7e14dcfSSatish Balay   tl->nu1 = 0.25;
763a7e14dcfSSatish Balay   tl->nu2 = 0.50;
764a7e14dcfSSatish Balay   tl->nu3 = 1.00;
765a7e14dcfSSatish Balay   tl->nu4 = 1.25;
766a7e14dcfSSatish Balay 
767a7e14dcfSSatish Balay   tl->omega1 = 0.25;
768a7e14dcfSSatish Balay   tl->omega2 = 0.50;
769a7e14dcfSSatish Balay   tl->omega3 = 1.00;
770a7e14dcfSSatish Balay   tl->omega4 = 2.00;
771a7e14dcfSSatish Balay   tl->omega5 = 4.00;
772a7e14dcfSSatish Balay 
773a7e14dcfSSatish Balay   /* Default values for trust-region radius update based on reduction */
774a7e14dcfSSatish Balay   tl->eta1 = 1.0e-4;
775a7e14dcfSSatish Balay   tl->eta2 = 0.25;
776a7e14dcfSSatish Balay   tl->eta3 = 0.50;
777a7e14dcfSSatish Balay   tl->eta4 = 0.90;
778a7e14dcfSSatish Balay 
779a7e14dcfSSatish Balay   tl->alpha1 = 0.25;
780a7e14dcfSSatish Balay   tl->alpha2 = 0.50;
781a7e14dcfSSatish Balay   tl->alpha3 = 1.00;
782a7e14dcfSSatish Balay   tl->alpha4 = 2.00;
783a7e14dcfSSatish Balay   tl->alpha5 = 4.00;
784a7e14dcfSSatish Balay 
785a7e14dcfSSatish Balay   /* Default values for trust-region radius update based on interpolation */
786a7e14dcfSSatish Balay   tl->mu1 = 0.10;
787a7e14dcfSSatish Balay   tl->mu2 = 0.50;
788a7e14dcfSSatish Balay 
789a7e14dcfSSatish Balay   tl->gamma1 = 0.25;
790a7e14dcfSSatish Balay   tl->gamma2 = 0.50;
791a7e14dcfSSatish Balay   tl->gamma3 = 2.00;
792a7e14dcfSSatish Balay   tl->gamma4 = 4.00;
793a7e14dcfSSatish Balay 
794a7e14dcfSSatish Balay   tl->theta = 0.05;
795a7e14dcfSSatish Balay 
796a7e14dcfSSatish Balay   /* Default values for trust region initialization based on interpolation */
797a7e14dcfSSatish Balay   tl->mu1_i = 0.35;
798a7e14dcfSSatish Balay   tl->mu2_i = 0.50;
799a7e14dcfSSatish Balay 
800a7e14dcfSSatish Balay   tl->gamma1_i = 0.0625;
801a7e14dcfSSatish Balay   tl->gamma2_i = 0.5;
802a7e14dcfSSatish Balay   tl->gamma3_i = 2.0;
803a7e14dcfSSatish Balay   tl->gamma4_i = 5.0;
804a7e14dcfSSatish Balay 
805a7e14dcfSSatish Balay   tl->theta_i = 0.25;
806a7e14dcfSSatish Balay 
807a7e14dcfSSatish Balay   /* Remaining parameters */
808a7e14dcfSSatish Balay   tl->min_radius = 1.0e-10;
809a7e14dcfSSatish Balay   tl->max_radius = 1.0e10;
810a7e14dcfSSatish Balay   tl->epsilon    = 1.0e-6;
811a7e14dcfSSatish Balay 
812a7e14dcfSSatish Balay   tl->init_type   = NTL_INIT_INTERPOLATION;
813a7e14dcfSSatish Balay   tl->update_type = NTL_UPDATE_REDUCTION;
814a7e14dcfSSatish Balay 
8159566063dSJacob Faibussowitsch   PetscCall(TaoLineSearchCreate(((PetscObject)tao)->comm, &tao->linesearch));
8169566063dSJacob Faibussowitsch   PetscCall(PetscObjectIncrementTabLevel((PetscObject)tao->linesearch, (PetscObject)tao, 1));
8179566063dSJacob Faibussowitsch   PetscCall(TaoLineSearchSetType(tao->linesearch, morethuente_type));
8189566063dSJacob Faibussowitsch   PetscCall(TaoLineSearchUseTaoRoutines(tao->linesearch, tao));
8199566063dSJacob Faibussowitsch   PetscCall(TaoLineSearchSetOptionsPrefix(tao->linesearch, tao->hdr.prefix));
8209566063dSJacob Faibussowitsch   PetscCall(KSPCreate(((PetscObject)tao)->comm, &tao->ksp));
8219566063dSJacob Faibussowitsch   PetscCall(PetscObjectIncrementTabLevel((PetscObject)tao->ksp, (PetscObject)tao, 1));
8229566063dSJacob Faibussowitsch   PetscCall(KSPSetOptionsPrefix(tao->ksp, tao->hdr.prefix));
8239566063dSJacob Faibussowitsch   PetscCall(KSPAppendOptionsPrefix(tao->ksp, "tao_ntl_"));
8249566063dSJacob Faibussowitsch   PetscCall(KSPSetType(tao->ksp, KSPSTCG));
825*3ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
826a7e14dcfSSatish Balay }
827