xref: /petsc/src/tao/bound/impls/bnk/bnk.c (revision eb9107154965f6d42900b472f8cc894abc73f56d)
1*eb910715SAlp Dener #include <petsctaolinesearch.h>
2*eb910715SAlp Dener #include <../src/tao/bound/impls/bnk/bnk.h>
3*eb910715SAlp Dener 
4*eb910715SAlp Dener #include <petscksp.h>
5*eb910715SAlp Dener 
6*eb910715SAlp Dener /* Routine for BFGS preconditioner */
7*eb910715SAlp Dener 
8*eb910715SAlp Dener PetscErrorCode MatLMVMSolveShell(PC pc, Vec b, Vec x)
9*eb910715SAlp Dener {
10*eb910715SAlp Dener   PetscErrorCode ierr;
11*eb910715SAlp Dener   Mat            M;
12*eb910715SAlp Dener 
13*eb910715SAlp Dener   PetscFunctionBegin;
14*eb910715SAlp Dener   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
15*eb910715SAlp Dener   PetscValidHeaderSpecific(b,VEC_CLASSID,2);
16*eb910715SAlp Dener   PetscValidHeaderSpecific(x,VEC_CLASSID,3);
17*eb910715SAlp Dener   ierr = PCShellGetContext(pc,(void**)&M);CHKERRQ(ierr);
18*eb910715SAlp Dener   ierr = MatLMVMSolve(M, b, x);CHKERRQ(ierr);
19*eb910715SAlp Dener   PetscFunctionReturn(0);
20*eb910715SAlp Dener }
21*eb910715SAlp Dener 
22*eb910715SAlp Dener PetscErrorCode TaoBNKInitialize(Tao tao)
23*eb910715SAlp Dener {
24*eb910715SAlp Dener   PetscErrorCode               ierr;
25*eb910715SAlp Dener   TAO_BNK                      *bnk = (TAO_BNK *)tao->data;
26*eb910715SAlp Dener   KSPType                      ksp_type;
27*eb910715SAlp Dener   PC                           pc;
28*eb910715SAlp Dener 
29*eb910715SAlp Dener   PetscReal                    fmin, ftrial, prered, actred, kappa, sigma;
30*eb910715SAlp Dener   PetscReal                    tau, tau_1, tau_2, tau_max, tau_min, max_radius;
31*eb910715SAlp Dener   PetscReal                    delta, step = 1.0;
32*eb910715SAlp Dener 
33*eb910715SAlp Dener   PetscInt                     n,N,needH = 1;
34*eb910715SAlp Dener 
35*eb910715SAlp Dener   PetscInt                     i_max = 5;
36*eb910715SAlp Dener   PetscInt                     j_max = 1;
37*eb910715SAlp Dener   PetscInt                     i, j;
38*eb910715SAlp Dener 
39*eb910715SAlp Dener   PetscFunctionBegin;
40*eb910715SAlp Dener   /* Number of times ksp stopped because of these reasons */
41*eb910715SAlp Dener   bnk->ksp_atol = 0;
42*eb910715SAlp Dener   bnk->ksp_rtol = 0;
43*eb910715SAlp Dener   bnk->ksp_dtol = 0;
44*eb910715SAlp Dener   bnk->ksp_ctol = 0;
45*eb910715SAlp Dener   bnk->ksp_negc = 0;
46*eb910715SAlp Dener   bnk->ksp_iter = 0;
47*eb910715SAlp Dener   bnk->ksp_othr = 0;
48*eb910715SAlp Dener 
49*eb910715SAlp Dener   /* Initialize trust-region radius when using nash, stcg, or gltr
50*eb910715SAlp Dener      Command automatically ignored for other methods
51*eb910715SAlp Dener      Will be reset during the first iteration
52*eb910715SAlp Dener   */
53*eb910715SAlp Dener   ierr = KSPGetType(tao->ksp,&ksp_type);CHKERRQ(ierr);
54*eb910715SAlp Dener   ierr = PetscStrcmp(ksp_type,KSPCGNASH,&bnk->is_nash);CHKERRQ(ierr);
55*eb910715SAlp Dener   ierr = PetscStrcmp(ksp_type,KSPCGSTCG,&bnk->is_stcg);CHKERRQ(ierr);
56*eb910715SAlp Dener   ierr = PetscStrcmp(ksp_type,KSPCGGLTR,&bnk->is_gltr);CHKERRQ(ierr);
57*eb910715SAlp Dener 
58*eb910715SAlp Dener   ierr = KSPCGSetRadius(tao->ksp,bnk->max_radius);CHKERRQ(ierr);
59*eb910715SAlp Dener 
60*eb910715SAlp Dener   if (bnk->is_nash || bnk->is_stcg || bnk->is_gltr) {
61*eb910715SAlp Dener     if (tao->trust0 < 0.0) SETERRQ(PETSC_COMM_SELF,1,"Initial radius negative");
62*eb910715SAlp Dener     tao->trust = tao->trust0;
63*eb910715SAlp Dener     tao->trust = PetscMax(tao->trust, bnk->min_radius);
64*eb910715SAlp Dener     tao->trust = PetscMin(tao->trust, bnk->max_radius);
65*eb910715SAlp Dener   }
66*eb910715SAlp Dener 
67*eb910715SAlp Dener   /* Get vectors we will need */
68*eb910715SAlp Dener   if (BNK_PC_BFGS == bnk->pc_type && !bnk->M) {
69*eb910715SAlp Dener     ierr = VecGetLocalSize(tao->solution,&n);CHKERRQ(ierr);
70*eb910715SAlp Dener     ierr = VecGetSize(tao->solution,&N);CHKERRQ(ierr);
71*eb910715SAlp Dener     ierr = MatCreateLMVM(((PetscObject)tao)->comm,n,N,&bnk->M);CHKERRQ(ierr);
72*eb910715SAlp Dener     ierr = MatLMVMAllocateVectors(bnk->M,tao->solution);CHKERRQ(ierr);
73*eb910715SAlp Dener   }
74*eb910715SAlp Dener 
75*eb910715SAlp Dener   /* create vectors for the limited memory preconditioner */
76*eb910715SAlp Dener   if ((BNK_PC_BFGS == bnk->pc_type) && (BFGS_SCALE_BFGS != bnk->bfgs_scale_type)) {
77*eb910715SAlp Dener     if (!bnk->Diag) {
78*eb910715SAlp Dener       ierr = VecDuplicate(tao->solution,&bnk->Diag);CHKERRQ(ierr);
79*eb910715SAlp Dener     }
80*eb910715SAlp Dener   }
81*eb910715SAlp Dener 
82*eb910715SAlp Dener   /* Modify the preconditioner to use the bfgs approximation */
83*eb910715SAlp Dener   ierr = KSPGetPC(tao->ksp, &pc);CHKERRQ(ierr);
84*eb910715SAlp Dener   switch(bnk->pc_type) {
85*eb910715SAlp Dener   case BNK_PC_NONE:
86*eb910715SAlp Dener     ierr = PCSetType(pc, PCNONE);CHKERRQ(ierr);
87*eb910715SAlp Dener     ierr = PCSetFromOptions(pc);CHKERRQ(ierr);
88*eb910715SAlp Dener     break;
89*eb910715SAlp Dener 
90*eb910715SAlp Dener   case BNK_PC_AHESS:
91*eb910715SAlp Dener     ierr = PCSetType(pc, PCJACOBI);CHKERRQ(ierr);
92*eb910715SAlp Dener     ierr = PCSetFromOptions(pc);CHKERRQ(ierr);
93*eb910715SAlp Dener     ierr = PCJacobiSetUseAbs(pc,PETSC_TRUE);CHKERRQ(ierr);
94*eb910715SAlp Dener     break;
95*eb910715SAlp Dener 
96*eb910715SAlp Dener   case BNK_PC_BFGS:
97*eb910715SAlp Dener     ierr = PCSetType(pc, PCSHELL);CHKERRQ(ierr);
98*eb910715SAlp Dener     ierr = PCSetFromOptions(pc);CHKERRQ(ierr);
99*eb910715SAlp Dener     ierr = PCShellSetName(pc, "bfgs");CHKERRQ(ierr);
100*eb910715SAlp Dener     ierr = PCShellSetContext(pc, bnk->M);CHKERRQ(ierr);
101*eb910715SAlp Dener     ierr = PCShellSetApply(pc, MatLMVMSolveShell);CHKERRQ(ierr);
102*eb910715SAlp Dener     break;
103*eb910715SAlp Dener 
104*eb910715SAlp Dener   default:
105*eb910715SAlp Dener     /* Use the pc method set by pc_type */
106*eb910715SAlp Dener     break;
107*eb910715SAlp Dener   }
108*eb910715SAlp Dener 
109*eb910715SAlp Dener   /* Initialize trust-region radius.  The initialization is only performed
110*eb910715SAlp Dener      when we are using Nash, Steihaug-Toint or the Generalized Lanczos method. */
111*eb910715SAlp Dener   if (bnk->is_nash || bnk->is_stcg || bnk->is_gltr) {
112*eb910715SAlp Dener     switch(bnk->init_type) {
113*eb910715SAlp Dener     case BNK_INIT_CONSTANT:
114*eb910715SAlp Dener       /* Use the initial radius specified */
115*eb910715SAlp Dener       break;
116*eb910715SAlp Dener 
117*eb910715SAlp Dener     case BNK_INIT_INTERPOLATION:
118*eb910715SAlp Dener       /* Use the initial radius specified */
119*eb910715SAlp Dener       max_radius = 0.0;
120*eb910715SAlp Dener 
121*eb910715SAlp Dener       for (j = 0; j < j_max; ++j) {
122*eb910715SAlp Dener         fmin = bnk->f;
123*eb910715SAlp Dener         sigma = 0.0;
124*eb910715SAlp Dener 
125*eb910715SAlp Dener         if (needH) {
126*eb910715SAlp Dener           ierr  = TaoComputeHessian(tao, tao->solution,tao->hessian,tao->hessian_pre);CHKERRQ(ierr);
127*eb910715SAlp Dener           needH = 0;
128*eb910715SAlp Dener         }
129*eb910715SAlp Dener 
130*eb910715SAlp Dener         for (i = 0; i < i_max; ++i) {
131*eb910715SAlp Dener           ierr = VecCopy(tao->solution,bnk->W);CHKERRQ(ierr);
132*eb910715SAlp Dener           ierr = VecAXPY(bnk->W,-tao->trust/bnk->gnorm,tao->gradient);CHKERRQ(ierr);
133*eb910715SAlp Dener           ierr = TaoComputeObjective(tao, bnk->W, &ftrial);CHKERRQ(ierr);
134*eb910715SAlp Dener           if (PetscIsInfOrNanReal(ftrial)) {
135*eb910715SAlp Dener             tau = bnk->gamma1_i;
136*eb910715SAlp Dener           } else {
137*eb910715SAlp Dener             if (ftrial < fmin) {
138*eb910715SAlp Dener               fmin = ftrial;
139*eb910715SAlp Dener               sigma = -tao->trust / bnk->gnorm;
140*eb910715SAlp Dener             }
141*eb910715SAlp Dener 
142*eb910715SAlp Dener             ierr = MatMult(tao->hessian, tao->gradient, bnk->D);CHKERRQ(ierr);
143*eb910715SAlp Dener             ierr = VecDot(tao->gradient, bnk->D, &prered);CHKERRQ(ierr);
144*eb910715SAlp Dener 
145*eb910715SAlp Dener             prered = tao->trust * (bnk->gnorm - 0.5 * tao->trust * prered / (bnk->gnorm * bnk->gnorm));
146*eb910715SAlp Dener             actred = bnk->f - ftrial;
147*eb910715SAlp Dener             if ((PetscAbsScalar(actred) <= bnk->epsilon) && (PetscAbsScalar(prered) <= bnk->epsilon)) {
148*eb910715SAlp Dener               kappa = 1.0;
149*eb910715SAlp Dener             } else {
150*eb910715SAlp Dener               kappa = actred / prered;
151*eb910715SAlp Dener             }
152*eb910715SAlp Dener 
153*eb910715SAlp Dener             tau_1 = bnk->theta_i * bnk->gnorm * tao->trust / (bnk->theta_i * bnk->gnorm * tao->trust + (1.0 - bnk->theta_i) * prered - actred);
154*eb910715SAlp Dener             tau_2 = bnk->theta_i * bnk->gnorm * tao->trust / (bnk->theta_i * bnk->gnorm * tao->trust - (1.0 + bnk->theta_i) * prered + actred);
155*eb910715SAlp Dener             tau_min = PetscMin(tau_1, tau_2);
156*eb910715SAlp Dener             tau_max = PetscMax(tau_1, tau_2);
157*eb910715SAlp Dener 
158*eb910715SAlp Dener             if (PetscAbsScalar(kappa - 1.0) <= bnk->mu1_i) {
159*eb910715SAlp Dener               /* Great agreement */
160*eb910715SAlp Dener               max_radius = PetscMax(max_radius, tao->trust);
161*eb910715SAlp Dener 
162*eb910715SAlp Dener               if (tau_max < 1.0) {
163*eb910715SAlp Dener                 tau = bnk->gamma3_i;
164*eb910715SAlp Dener               } else if (tau_max > bnk->gamma4_i) {
165*eb910715SAlp Dener                 tau = bnk->gamma4_i;
166*eb910715SAlp Dener               } else if (tau_1 >= 1.0 && tau_1 <= bnk->gamma4_i && tau_2 < 1.0) {
167*eb910715SAlp Dener                 tau = tau_1;
168*eb910715SAlp Dener               } else if (tau_2 >= 1.0 && tau_2 <= bnk->gamma4_i && tau_1 < 1.0) {
169*eb910715SAlp Dener                 tau = tau_2;
170*eb910715SAlp Dener               } else {
171*eb910715SAlp Dener                 tau = tau_max;
172*eb910715SAlp Dener               }
173*eb910715SAlp Dener             } else if (PetscAbsScalar(kappa - 1.0) <= bnk->mu2_i) {
174*eb910715SAlp Dener               /* Good agreement */
175*eb910715SAlp Dener               max_radius = PetscMax(max_radius, tao->trust);
176*eb910715SAlp Dener 
177*eb910715SAlp Dener               if (tau_max < bnk->gamma2_i) {
178*eb910715SAlp Dener                 tau = bnk->gamma2_i;
179*eb910715SAlp Dener               } else if (tau_max > bnk->gamma3_i) {
180*eb910715SAlp Dener                 tau = bnk->gamma3_i;
181*eb910715SAlp Dener               } else {
182*eb910715SAlp Dener                 tau = tau_max;
183*eb910715SAlp Dener               }
184*eb910715SAlp Dener             } else {
185*eb910715SAlp Dener               /* Not good agreement */
186*eb910715SAlp Dener               if (tau_min > 1.0) {
187*eb910715SAlp Dener                 tau = bnk->gamma2_i;
188*eb910715SAlp Dener               } else if (tau_max < bnk->gamma1_i) {
189*eb910715SAlp Dener                 tau = bnk->gamma1_i;
190*eb910715SAlp Dener               } else if ((tau_min < bnk->gamma1_i) && (tau_max >= 1.0)) {
191*eb910715SAlp Dener                 tau = bnk->gamma1_i;
192*eb910715SAlp Dener               } else if ((tau_1 >= bnk->gamma1_i) && (tau_1 < 1.0) && ((tau_2 < bnk->gamma1_i) || (tau_2 >= 1.0))) {
193*eb910715SAlp Dener                 tau = tau_1;
194*eb910715SAlp Dener               } else if ((tau_2 >= bnk->gamma1_i) && (tau_2 < 1.0) && ((tau_1 < bnk->gamma1_i) || (tau_2 >= 1.0))) {
195*eb910715SAlp Dener                 tau = tau_2;
196*eb910715SAlp Dener               } else {
197*eb910715SAlp Dener                 tau = tau_max;
198*eb910715SAlp Dener               }
199*eb910715SAlp Dener             }
200*eb910715SAlp Dener           }
201*eb910715SAlp Dener           tao->trust = tau * tao->trust;
202*eb910715SAlp Dener         }
203*eb910715SAlp Dener 
204*eb910715SAlp Dener         if (fmin < bnk->f) {
205*eb910715SAlp Dener           bnk->f = fmin;
206*eb910715SAlp Dener           ierr = VecAXPY(tao->solution,sigma,tao->gradient);CHKERRQ(ierr);
207*eb910715SAlp Dener           ierr = TaoComputeGradient(tao,tao->solution,tao->gradient);CHKERRQ(ierr);
208*eb910715SAlp Dener 
209*eb910715SAlp Dener           ierr = TaoGradientNorm(tao, tao->gradient,NORM_2,&bnk->gnorm);CHKERRQ(ierr);
210*eb910715SAlp Dener           if (PetscIsInfOrNanReal(bnk->gnorm)) SETERRQ(PETSC_COMM_SELF,1, "User provided compute gradient generated Inf or NaN");
211*eb910715SAlp Dener           needH = 1;
212*eb910715SAlp Dener 
213*eb910715SAlp Dener           ierr = TaoLogConvergenceHistory(tao,bnk->f,bnk->gnorm,0.0,tao->ksp_its);CHKERRQ(ierr);
214*eb910715SAlp Dener           ierr = TaoMonitor(tao,tao->niter,bnk->f,bnk->gnorm,0.0,step);CHKERRQ(ierr);
215*eb910715SAlp Dener           ierr = (*tao->ops->convergencetest)(tao,tao->cnvP);CHKERRQ(ierr);
216*eb910715SAlp Dener           if (tao->reason != TAO_CONTINUE_ITERATING) PetscFunctionReturn(0);
217*eb910715SAlp Dener         }
218*eb910715SAlp Dener       }
219*eb910715SAlp Dener       tao->trust = PetscMax(tao->trust, max_radius);
220*eb910715SAlp Dener 
221*eb910715SAlp Dener       /* Modify the radius if it is too large or small */
222*eb910715SAlp Dener       tao->trust = PetscMax(tao->trust, bnk->min_radius);
223*eb910715SAlp Dener       tao->trust = PetscMin(tao->trust, bnk->max_radius);
224*eb910715SAlp Dener       break;
225*eb910715SAlp Dener 
226*eb910715SAlp Dener     default:
227*eb910715SAlp Dener       /* Norm of the first direction will initialize radius */
228*eb910715SAlp Dener       tao->trust = 0.0;
229*eb910715SAlp Dener       break;
230*eb910715SAlp Dener     }
231*eb910715SAlp Dener   }
232*eb910715SAlp Dener 
233*eb910715SAlp Dener   /* Set initial scaling for the BFGS preconditioner
234*eb910715SAlp Dener      This step is done after computing the initial trust-region radius
235*eb910715SAlp Dener      since the function value may have decreased */
236*eb910715SAlp Dener   if (BNK_PC_BFGS == bnk->pc_type) {
237*eb910715SAlp Dener     if (bnk->f != 0.0) {
238*eb910715SAlp Dener       delta = 2.0 * PetscAbsScalar(bnk->f) / (bnk->gnorm*bnk->gnorm);
239*eb910715SAlp Dener     } else {
240*eb910715SAlp Dener       delta = 2.0 / (bnk->gnorm*bnk->gnorm);
241*eb910715SAlp Dener     }
242*eb910715SAlp Dener     ierr = MatLMVMSetDelta(bnk->M,delta);CHKERRQ(ierr);
243*eb910715SAlp Dener   }
244*eb910715SAlp Dener 
245*eb910715SAlp Dener   /* Set counter for gradient/reset steps*/
246*eb910715SAlp Dener   bnk->newt = 0;
247*eb910715SAlp Dener   bnk->bfgs = 0;
248*eb910715SAlp Dener   bnk->sgrad = 0;
249*eb910715SAlp Dener   bnk->grad = 0;
250*eb910715SAlp Dener   PetscFunctionReturn(0);
251*eb910715SAlp Dener }
252*eb910715SAlp Dener 
253*eb910715SAlp Dener PetscErrorCode TaoBNKComputeStep(Tao tao, PetscInt *stepType)
254*eb910715SAlp Dener {
255*eb910715SAlp Dener   PetscErrorCode               ierr;
256*eb910715SAlp Dener   TAO_BNK                      *bnk = (TAO_BNK *)tao->data;
257*eb910715SAlp Dener   KSPConvergedReason           ksp_reason;
258*eb910715SAlp Dener 
259*eb910715SAlp Dener   PetscReal                    gdx, delta;
260*eb910715SAlp Dener   PetscReal                    norm_d = 0.0, e_min;
261*eb910715SAlp Dener 
262*eb910715SAlp Dener   PetscInt                     bfgsUpdates = 0;
263*eb910715SAlp Dener   PetscInt                     kspits;
264*eb910715SAlp Dener   PetscInt                     needH = 1;
265*eb910715SAlp Dener 
266*eb910715SAlp Dener   PetscFunctionBegin;
267*eb910715SAlp Dener   /* Compute the Hessian */
268*eb910715SAlp Dener   if (needH) {
269*eb910715SAlp Dener     ierr = TaoComputeHessian(tao,tao->solution,tao->hessian,tao->hessian_pre);CHKERRQ(ierr);
270*eb910715SAlp Dener   }
271*eb910715SAlp Dener 
272*eb910715SAlp Dener   if ((BNK_PC_BFGS == bnk->pc_type) && (BFGS_SCALE_AHESS == bnk->bfgs_scale_type)) {
273*eb910715SAlp Dener     /* Obtain diagonal for the bfgs preconditioner  */
274*eb910715SAlp Dener     ierr = MatGetDiagonal(tao->hessian, bnk->Diag);CHKERRQ(ierr);
275*eb910715SAlp Dener     ierr = VecAbs(bnk->Diag);CHKERRQ(ierr);
276*eb910715SAlp Dener     ierr = VecReciprocal(bnk->Diag);CHKERRQ(ierr);
277*eb910715SAlp Dener     ierr = MatLMVMSetScale(bnk->M,bnk->Diag);CHKERRQ(ierr);
278*eb910715SAlp Dener   }
279*eb910715SAlp Dener 
280*eb910715SAlp Dener   /* Shift the Hessian matrix */
281*eb910715SAlp Dener   bnk->pert = bnk->sval;
282*eb910715SAlp Dener   if (bnk->pert > 0) {
283*eb910715SAlp Dener     ierr = MatShift(tao->hessian, bnk->pert);CHKERRQ(ierr);
284*eb910715SAlp Dener     if (tao->hessian != tao->hessian_pre) {
285*eb910715SAlp Dener       ierr = MatShift(tao->hessian_pre, bnk->pert);CHKERRQ(ierr);
286*eb910715SAlp Dener     }
287*eb910715SAlp Dener   }
288*eb910715SAlp Dener 
289*eb910715SAlp Dener   if (BNK_PC_BFGS == bnk->pc_type) {
290*eb910715SAlp Dener     if (BFGS_SCALE_PHESS == bnk->bfgs_scale_type) {
291*eb910715SAlp Dener       /* Obtain diagonal for the bfgs preconditioner  */
292*eb910715SAlp Dener       ierr = MatGetDiagonal(tao->hessian, bnk->Diag);CHKERRQ(ierr);
293*eb910715SAlp Dener       ierr = VecAbs(bnk->Diag);CHKERRQ(ierr);
294*eb910715SAlp Dener       ierr = VecReciprocal(bnk->Diag);CHKERRQ(ierr);
295*eb910715SAlp Dener       ierr = MatLMVMSetScale(bnk->M,bnk->Diag);CHKERRQ(ierr);
296*eb910715SAlp Dener     }
297*eb910715SAlp Dener     /* Update the limited memory preconditioner and get existing # of updates */
298*eb910715SAlp Dener     ierr = MatLMVMUpdate(bnk->M, tao->solution, tao->gradient);CHKERRQ(ierr);
299*eb910715SAlp Dener     ierr = MatLMVMGetUpdates(bnk->M, &bfgsUpdates);CHKERRQ(ierr);
300*eb910715SAlp Dener   }
301*eb910715SAlp Dener 
302*eb910715SAlp Dener   /* Solve the Newton system of equations */
303*eb910715SAlp Dener   ierr = KSPSetOperators(tao->ksp,tao->hessian,tao->hessian_pre);CHKERRQ(ierr);
304*eb910715SAlp Dener   if (bnk->is_nash || bnk->is_stcg || bnk->is_gltr) {
305*eb910715SAlp Dener     ierr = KSPCGSetRadius(tao->ksp,bnk->max_radius);CHKERRQ(ierr);
306*eb910715SAlp Dener     ierr = KSPSolve(tao->ksp, tao->gradient, bnk->D);CHKERRQ(ierr);
307*eb910715SAlp Dener     ierr = KSPGetIterationNumber(tao->ksp,&kspits);CHKERRQ(ierr);
308*eb910715SAlp Dener     tao->ksp_its+=kspits;
309*eb910715SAlp Dener     tao->ksp_tot_its+=kspits;
310*eb910715SAlp Dener     ierr = KSPCGGetNormD(tao->ksp,&norm_d);CHKERRQ(ierr);
311*eb910715SAlp Dener 
312*eb910715SAlp Dener     if (0.0 == tao->trust) {
313*eb910715SAlp Dener       /* Radius was uninitialized; use the norm of the direction */
314*eb910715SAlp Dener       if (norm_d > 0.0) {
315*eb910715SAlp Dener         tao->trust = norm_d;
316*eb910715SAlp Dener 
317*eb910715SAlp Dener         /* Modify the radius if it is too large or small */
318*eb910715SAlp Dener         tao->trust = PetscMax(tao->trust, bnk->min_radius);
319*eb910715SAlp Dener         tao->trust = PetscMin(tao->trust, bnk->max_radius);
320*eb910715SAlp Dener       } else {
321*eb910715SAlp Dener         /* The direction was bad; set radius to default value and re-solve
322*eb910715SAlp Dener            the trust-region subproblem to get a direction */
323*eb910715SAlp Dener         tao->trust = tao->trust0;
324*eb910715SAlp Dener 
325*eb910715SAlp Dener         /* Modify the radius if it is too large or small */
326*eb910715SAlp Dener         tao->trust = PetscMax(tao->trust, bnk->min_radius);
327*eb910715SAlp Dener         tao->trust = PetscMin(tao->trust, bnk->max_radius);
328*eb910715SAlp Dener 
329*eb910715SAlp Dener         ierr = KSPCGSetRadius(tao->ksp,bnk->max_radius);CHKERRQ(ierr);
330*eb910715SAlp Dener         ierr = KSPSolve(tao->ksp, tao->gradient, bnk->D);CHKERRQ(ierr);
331*eb910715SAlp Dener         ierr = KSPGetIterationNumber(tao->ksp,&kspits);CHKERRQ(ierr);
332*eb910715SAlp Dener         tao->ksp_its+=kspits;
333*eb910715SAlp Dener         tao->ksp_tot_its+=kspits;
334*eb910715SAlp Dener         ierr = KSPCGGetNormD(tao->ksp,&norm_d);CHKERRQ(ierr);
335*eb910715SAlp Dener 
336*eb910715SAlp Dener         if (norm_d == 0.0) SETERRQ(PETSC_COMM_SELF,1, "Initial direction zero");
337*eb910715SAlp Dener       }
338*eb910715SAlp Dener     }
339*eb910715SAlp Dener   } else {
340*eb910715SAlp Dener     ierr = KSPSolve(tao->ksp, tao->gradient, bnk->D);CHKERRQ(ierr);
341*eb910715SAlp Dener     ierr = KSPGetIterationNumber(tao->ksp, &kspits);CHKERRQ(ierr);
342*eb910715SAlp Dener     tao->ksp_its += kspits;
343*eb910715SAlp Dener     tao->ksp_tot_its+=kspits;
344*eb910715SAlp Dener   }
345*eb910715SAlp Dener   ierr = VecScale(bnk->D, -1.0);CHKERRQ(ierr);
346*eb910715SAlp Dener   ierr = KSPGetConvergedReason(tao->ksp, &ksp_reason);CHKERRQ(ierr);
347*eb910715SAlp Dener   if ((KSP_DIVERGED_INDEFINITE_PC == ksp_reason) &&  (BNK_PC_BFGS == bnk->pc_type) && (bfgsUpdates > 1)) {
348*eb910715SAlp Dener     /* Preconditioner is numerically indefinite; reset the
349*eb910715SAlp Dener        approximate if using BFGS preconditioning. */
350*eb910715SAlp Dener 
351*eb910715SAlp Dener     if (bnk->f != 0.0) {
352*eb910715SAlp Dener       delta = 2.0 * PetscAbsScalar(bnk->f) / (bnk->gnorm*bnk->gnorm);
353*eb910715SAlp Dener     } else {
354*eb910715SAlp Dener       delta = 2.0 / (bnk->gnorm*bnk->gnorm);
355*eb910715SAlp Dener     }
356*eb910715SAlp Dener     ierr = MatLMVMSetDelta(bnk->M,delta);CHKERRQ(ierr);
357*eb910715SAlp Dener     ierr = MatLMVMReset(bnk->M);CHKERRQ(ierr);
358*eb910715SAlp Dener     ierr = MatLMVMUpdate(bnk->M, tao->solution, tao->gradient);CHKERRQ(ierr);
359*eb910715SAlp Dener     bfgsUpdates = 1;
360*eb910715SAlp Dener   }
361*eb910715SAlp Dener 
362*eb910715SAlp Dener   if (KSP_CONVERGED_ATOL == ksp_reason) {
363*eb910715SAlp Dener     ++bnk->ksp_atol;
364*eb910715SAlp Dener   } else if (KSP_CONVERGED_RTOL == ksp_reason) {
365*eb910715SAlp Dener     ++bnk->ksp_rtol;
366*eb910715SAlp Dener   } else if (KSP_CONVERGED_CG_CONSTRAINED == ksp_reason) {
367*eb910715SAlp Dener     ++bnk->ksp_ctol;
368*eb910715SAlp Dener   } else if (KSP_CONVERGED_CG_NEG_CURVE == ksp_reason) {
369*eb910715SAlp Dener     ++bnk->ksp_negc;
370*eb910715SAlp Dener   } else if (KSP_DIVERGED_DTOL == ksp_reason) {
371*eb910715SAlp Dener     ++bnk->ksp_dtol;
372*eb910715SAlp Dener   } else if (KSP_DIVERGED_ITS == ksp_reason) {
373*eb910715SAlp Dener     ++bnk->ksp_iter;
374*eb910715SAlp Dener   } else {
375*eb910715SAlp Dener     ++bnk->ksp_othr;
376*eb910715SAlp Dener   }
377*eb910715SAlp Dener 
378*eb910715SAlp Dener   /* Check for success (descent direction) */
379*eb910715SAlp Dener   ierr = VecDot(bnk->D, tao->gradient, &gdx);CHKERRQ(ierr);
380*eb910715SAlp Dener   if ((gdx >= 0.0) || PetscIsInfOrNanReal(gdx)) {
381*eb910715SAlp Dener     /* Newton step is not descent or direction produced Inf or NaN
382*eb910715SAlp Dener        Update the perturbation for next time */
383*eb910715SAlp Dener     if (bnk->pert <= 0.0) {
384*eb910715SAlp Dener       /* Initialize the perturbation */
385*eb910715SAlp Dener       bnk->pert = PetscMin(bnk->imax, PetscMax(bnk->imin, bnk->imfac * bnk->gnorm));
386*eb910715SAlp Dener       if (bnk->is_gltr) {
387*eb910715SAlp Dener         ierr = KSPCGGLTRGetMinEig(tao->ksp,&e_min);CHKERRQ(ierr);
388*eb910715SAlp Dener         bnk->pert = PetscMax(bnk->pert, -e_min);
389*eb910715SAlp Dener       }
390*eb910715SAlp Dener     } else {
391*eb910715SAlp Dener       /* Increase the perturbation */
392*eb910715SAlp Dener       bnk->pert = PetscMin(bnk->pmax, PetscMax(bnk->pgfac * bnk->pert, bnk->pmgfac * bnk->gnorm));
393*eb910715SAlp Dener     }
394*eb910715SAlp Dener 
395*eb910715SAlp Dener     if (BNK_PC_BFGS != bnk->pc_type) {
396*eb910715SAlp Dener       /* We don't have the bfgs matrix around and updated
397*eb910715SAlp Dener          Must use gradient direction in this case */
398*eb910715SAlp Dener       ierr = VecCopy(tao->gradient, bnk->D);CHKERRQ(ierr);
399*eb910715SAlp Dener       ierr = VecScale(bnk->D, -1.0);CHKERRQ(ierr);
400*eb910715SAlp Dener       ++bnk->grad;
401*eb910715SAlp Dener       *stepType = BNK_GRADIENT;
402*eb910715SAlp Dener     } else {
403*eb910715SAlp Dener       /* Attempt to use the BFGS direction */
404*eb910715SAlp Dener       ierr = MatLMVMSolve(bnk->M, tao->gradient, bnk->D);CHKERRQ(ierr);
405*eb910715SAlp Dener       ierr = VecScale(bnk->D, -1.0);CHKERRQ(ierr);
406*eb910715SAlp Dener 
407*eb910715SAlp Dener       /* Check for success (descent direction) */
408*eb910715SAlp Dener       ierr = VecDot(tao->gradient, bnk->D, &gdx);CHKERRQ(ierr);
409*eb910715SAlp Dener       if ((gdx >= 0) || PetscIsInfOrNanReal(gdx)) {
410*eb910715SAlp Dener         /* BFGS direction is not descent or direction produced not a number
411*eb910715SAlp Dener            We can assert bfgsUpdates > 1 in this case because
412*eb910715SAlp Dener            the first solve produces the scaled gradient direction,
413*eb910715SAlp Dener            which is guaranteed to be descent */
414*eb910715SAlp Dener 
415*eb910715SAlp Dener         /* Use steepest descent direction (scaled) */
416*eb910715SAlp Dener 
417*eb910715SAlp Dener         if (bnk->f != 0.0) {
418*eb910715SAlp Dener           delta = 2.0 * PetscAbsScalar(bnk->f) / (bnk->gnorm*bnk->gnorm);
419*eb910715SAlp Dener         } else {
420*eb910715SAlp Dener           delta = 2.0 / (bnk->gnorm*bnk->gnorm);
421*eb910715SAlp Dener         }
422*eb910715SAlp Dener         ierr = MatLMVMSetDelta(bnk->M, delta);CHKERRQ(ierr);
423*eb910715SAlp Dener         ierr = MatLMVMReset(bnk->M);CHKERRQ(ierr);
424*eb910715SAlp Dener         ierr = MatLMVMUpdate(bnk->M, tao->solution, tao->gradient);CHKERRQ(ierr);
425*eb910715SAlp Dener         ierr = MatLMVMSolve(bnk->M, tao->gradient, bnk->D);CHKERRQ(ierr);
426*eb910715SAlp Dener         ierr = VecScale(bnk->D, -1.0);CHKERRQ(ierr);
427*eb910715SAlp Dener 
428*eb910715SAlp Dener         bfgsUpdates = 1;
429*eb910715SAlp Dener         ++bnk->sgrad;
430*eb910715SAlp Dener         *stepType = BNK_SCALED_GRADIENT;
431*eb910715SAlp Dener       } else {
432*eb910715SAlp Dener         if (1 == bfgsUpdates) {
433*eb910715SAlp Dener           /* The first BFGS direction is always the scaled gradient */
434*eb910715SAlp Dener           ++bnk->sgrad;
435*eb910715SAlp Dener           *stepType = BNK_SCALED_GRADIENT;
436*eb910715SAlp Dener         } else {
437*eb910715SAlp Dener           ++bnk->bfgs;
438*eb910715SAlp Dener           *stepType = BNK_BFGS;
439*eb910715SAlp Dener         }
440*eb910715SAlp Dener       }
441*eb910715SAlp Dener     }
442*eb910715SAlp Dener   } else {
443*eb910715SAlp Dener     /* Computed Newton step is descent */
444*eb910715SAlp Dener     switch (ksp_reason) {
445*eb910715SAlp Dener     case KSP_DIVERGED_NANORINF:
446*eb910715SAlp Dener     case KSP_DIVERGED_BREAKDOWN:
447*eb910715SAlp Dener     case KSP_DIVERGED_INDEFINITE_MAT:
448*eb910715SAlp Dener     case KSP_DIVERGED_INDEFINITE_PC:
449*eb910715SAlp Dener     case KSP_CONVERGED_CG_NEG_CURVE:
450*eb910715SAlp Dener       /* Matrix or preconditioner is indefinite; increase perturbation */
451*eb910715SAlp Dener       if (bnk->pert <= 0.0) {
452*eb910715SAlp Dener         /* Initialize the perturbation */
453*eb910715SAlp Dener         bnk->pert = PetscMin(bnk->imax, PetscMax(bnk->imin, bnk->imfac * bnk->gnorm));
454*eb910715SAlp Dener         if (bnk->is_gltr) {
455*eb910715SAlp Dener           ierr = KSPCGGLTRGetMinEig(tao->ksp, &e_min);CHKERRQ(ierr);
456*eb910715SAlp Dener           bnk->pert = PetscMax(bnk->pert, -e_min);
457*eb910715SAlp Dener         }
458*eb910715SAlp Dener       } else {
459*eb910715SAlp Dener         /* Increase the perturbation */
460*eb910715SAlp Dener         bnk->pert = PetscMin(bnk->pmax, PetscMax(bnk->pgfac * bnk->pert, bnk->pmgfac * bnk->gnorm));
461*eb910715SAlp Dener       }
462*eb910715SAlp Dener       break;
463*eb910715SAlp Dener 
464*eb910715SAlp Dener     default:
465*eb910715SAlp Dener       /* Newton step computation is good; decrease perturbation */
466*eb910715SAlp Dener       bnk->pert = PetscMin(bnk->psfac * bnk->pert, bnk->pmsfac * bnk->gnorm);
467*eb910715SAlp Dener       if (bnk->pert < bnk->pmin) {
468*eb910715SAlp Dener         bnk->pert = 0.0;
469*eb910715SAlp Dener       }
470*eb910715SAlp Dener       break;
471*eb910715SAlp Dener     }
472*eb910715SAlp Dener 
473*eb910715SAlp Dener     ++bnk->newt;
474*eb910715SAlp Dener     stepType = BNK_NEWTON;
475*eb910715SAlp Dener   }
476*eb910715SAlp Dener   PetscFunctionReturn(0);
477*eb910715SAlp Dener }
478*eb910715SAlp Dener 
479*eb910715SAlp Dener /* ---------------------------------------------------------- */
480*eb910715SAlp Dener static PetscErrorCode TaoSetUp_BNK(Tao tao)
481*eb910715SAlp Dener {
482*eb910715SAlp Dener   TAO_BNK        *bnk = (TAO_BNK *)tao->data;
483*eb910715SAlp Dener   PetscErrorCode ierr;
484*eb910715SAlp Dener 
485*eb910715SAlp Dener   PetscFunctionBegin;
486*eb910715SAlp Dener   if (!tao->gradient) {ierr = VecDuplicate(tao->solution,&tao->gradient);CHKERRQ(ierr);}
487*eb910715SAlp Dener   if (!tao->stepdirection) {ierr = VecDuplicate(tao->solution,&tao->stepdirection);CHKERRQ(ierr);}
488*eb910715SAlp Dener   if (!bnk->W) {ierr = VecDuplicate(tao->solution,&bnk->W);CHKERRQ(ierr);}
489*eb910715SAlp Dener   if (!bnk->D) {ierr = VecDuplicate(tao->solution,&bnk->D);CHKERRQ(ierr);}
490*eb910715SAlp Dener   if (!bnk->Xold) {ierr = VecDuplicate(tao->solution,&bnk->Xold);CHKERRQ(ierr);}
491*eb910715SAlp Dener   if (!bnk->Gold) {ierr = VecDuplicate(tao->solution,&bnk->Gold);CHKERRQ(ierr);}
492*eb910715SAlp Dener   bnk->Diag = 0;
493*eb910715SAlp Dener   bnk->M = 0;
494*eb910715SAlp Dener   PetscFunctionReturn(0);
495*eb910715SAlp Dener }
496*eb910715SAlp Dener 
497*eb910715SAlp Dener /*------------------------------------------------------------*/
498*eb910715SAlp Dener static PetscErrorCode TaoDestroy_BNK(Tao tao)
499*eb910715SAlp Dener {
500*eb910715SAlp Dener   TAO_BNK        *bnk = (TAO_BNK *)tao->data;
501*eb910715SAlp Dener   PetscErrorCode ierr;
502*eb910715SAlp Dener 
503*eb910715SAlp Dener   PetscFunctionBegin;
504*eb910715SAlp Dener   if (tao->setupcalled) {
505*eb910715SAlp Dener     ierr = VecDestroy(&bnk->D);CHKERRQ(ierr);
506*eb910715SAlp Dener     ierr = VecDestroy(&bnk->W);CHKERRQ(ierr);
507*eb910715SAlp Dener     ierr = VecDestroy(&bnk->Xold);CHKERRQ(ierr);
508*eb910715SAlp Dener     ierr = VecDestroy(&bnk->Gold);CHKERRQ(ierr);
509*eb910715SAlp Dener   }
510*eb910715SAlp Dener   ierr = VecDestroy(&bnk->Diag);CHKERRQ(ierr);
511*eb910715SAlp Dener   ierr = MatDestroy(&bnk->M);CHKERRQ(ierr);
512*eb910715SAlp Dener   ierr = PetscFree(tao->data);CHKERRQ(ierr);
513*eb910715SAlp Dener   PetscFunctionReturn(0);
514*eb910715SAlp Dener }
515*eb910715SAlp Dener 
516*eb910715SAlp Dener /*------------------------------------------------------------*/
517*eb910715SAlp Dener static PetscErrorCode TaoSetFromOptions_BNK(PetscOptionItems *PetscOptionsObject,Tao tao)
518*eb910715SAlp Dener {
519*eb910715SAlp Dener   TAO_BNK        *bnk = (TAO_BNK *)tao->data;
520*eb910715SAlp Dener   PetscErrorCode ierr;
521*eb910715SAlp Dener 
522*eb910715SAlp Dener   PetscFunctionBegin;
523*eb910715SAlp Dener   ierr = PetscOptionsHead(PetscOptionsObject,"Newton line search method for unconstrained optimization");CHKERRQ(ierr);
524*eb910715SAlp Dener   ierr = PetscOptionsEList("-tao_BNK_pc_type", "pc type", "", BNK_PC, BNK_PC_TYPES, BNK_PC[bnk->pc_type], &bnk->pc_type, 0);CHKERRQ(ierr);
525*eb910715SAlp Dener   ierr = PetscOptionsEList("-tao_BNK_bfgs_scale_type", "bfgs scale type", "", BFGS_SCALE, BFGS_SCALE_TYPES, BFGS_SCALE[bnk->bfgs_scale_type], &bnk->bfgs_scale_type, 0);CHKERRQ(ierr);
526*eb910715SAlp Dener   ierr = PetscOptionsEList("-tao_BNK_init_type", "radius initialization type", "", BNK_INIT, BNK_INIT_TYPES, BNK_INIT[bnk->init_type], &bnk->init_type, 0);CHKERRQ(ierr);
527*eb910715SAlp Dener   ierr = PetscOptionsEList("-tao_BNK_update_type", "radius update type", "", BNK_UPDATE, BNK_UPDATE_TYPES, BNK_UPDATE[bnk->update_type], &bnk->update_type, 0);CHKERRQ(ierr);
528*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_sval", "perturbation starting value", "", bnk->sval, &bnk->sval,NULL);CHKERRQ(ierr);
529*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_imin", "minimum initial perturbation", "", bnk->imin, &bnk->imin,NULL);CHKERRQ(ierr);
530*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_imax", "maximum initial perturbation", "", bnk->imax, &bnk->imax,NULL);CHKERRQ(ierr);
531*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_imfac", "initial merit factor", "", bnk->imfac, &bnk->imfac,NULL);CHKERRQ(ierr);
532*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_pmin", "minimum perturbation", "", bnk->pmin, &bnk->pmin,NULL);CHKERRQ(ierr);
533*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_pmax", "maximum perturbation", "", bnk->pmax, &bnk->pmax,NULL);CHKERRQ(ierr);
534*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_pgfac", "growth factor", "", bnk->pgfac, &bnk->pgfac,NULL);CHKERRQ(ierr);
535*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_psfac", "shrink factor", "", bnk->psfac, &bnk->psfac,NULL);CHKERRQ(ierr);
536*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_pmgfac", "merit growth factor", "", bnk->pmgfac, &bnk->pmgfac,NULL);CHKERRQ(ierr);
537*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_pmsfac", "merit shrink factor", "", bnk->pmsfac, &bnk->pmsfac,NULL);CHKERRQ(ierr);
538*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_eta1", "poor steplength; reduce radius", "", bnk->eta1, &bnk->eta1,NULL);CHKERRQ(ierr);
539*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_eta2", "reasonable steplength; leave radius alone", "", bnk->eta2, &bnk->eta2,NULL);CHKERRQ(ierr);
540*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_eta3", "good steplength; increase radius", "", bnk->eta3, &bnk->eta3,NULL);CHKERRQ(ierr);
541*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_eta4", "excellent steplength; greatly increase radius", "", bnk->eta4, &bnk->eta4,NULL);CHKERRQ(ierr);
542*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_alpha1", "", "", bnk->alpha1, &bnk->alpha1,NULL);CHKERRQ(ierr);
543*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_alpha2", "", "", bnk->alpha2, &bnk->alpha2,NULL);CHKERRQ(ierr);
544*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_alpha3", "", "", bnk->alpha3, &bnk->alpha3,NULL);CHKERRQ(ierr);
545*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_alpha4", "", "", bnk->alpha4, &bnk->alpha4,NULL);CHKERRQ(ierr);
546*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_alpha5", "", "", bnk->alpha5, &bnk->alpha5,NULL);CHKERRQ(ierr);
547*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_nu1", "poor steplength; reduce radius", "", bnk->nu1, &bnk->nu1,NULL);CHKERRQ(ierr);
548*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_nu2", "reasonable steplength; leave radius alone", "", bnk->nu2, &bnk->nu2,NULL);CHKERRQ(ierr);
549*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_nu3", "good steplength; increase radius", "", bnk->nu3, &bnk->nu3,NULL);CHKERRQ(ierr);
550*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_nu4", "excellent steplength; greatly increase radius", "", bnk->nu4, &bnk->nu4,NULL);CHKERRQ(ierr);
551*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_omega1", "", "", bnk->omega1, &bnk->omega1,NULL);CHKERRQ(ierr);
552*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_omega2", "", "", bnk->omega2, &bnk->omega2,NULL);CHKERRQ(ierr);
553*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_omega3", "", "", bnk->omega3, &bnk->omega3,NULL);CHKERRQ(ierr);
554*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_omega4", "", "", bnk->omega4, &bnk->omega4,NULL);CHKERRQ(ierr);
555*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_omega5", "", "", bnk->omega5, &bnk->omega5,NULL);CHKERRQ(ierr);
556*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_mu1_i", "", "", bnk->mu1_i, &bnk->mu1_i,NULL);CHKERRQ(ierr);
557*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_mu2_i", "", "", bnk->mu2_i, &bnk->mu2_i,NULL);CHKERRQ(ierr);
558*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_gamma1_i", "", "", bnk->gamma1_i, &bnk->gamma1_i,NULL);CHKERRQ(ierr);
559*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_gamma2_i", "", "", bnk->gamma2_i, &bnk->gamma2_i,NULL);CHKERRQ(ierr);
560*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_gamma3_i", "", "", bnk->gamma3_i, &bnk->gamma3_i,NULL);CHKERRQ(ierr);
561*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_gamma4_i", "", "", bnk->gamma4_i, &bnk->gamma4_i,NULL);CHKERRQ(ierr);
562*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_theta_i", "", "", bnk->theta_i, &bnk->theta_i,NULL);CHKERRQ(ierr);
563*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_mu1", "", "", bnk->mu1, &bnk->mu1,NULL);CHKERRQ(ierr);
564*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_mu2", "", "", bnk->mu2, &bnk->mu2,NULL);CHKERRQ(ierr);
565*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_gamma1", "", "", bnk->gamma1, &bnk->gamma1,NULL);CHKERRQ(ierr);
566*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_gamma2", "", "", bnk->gamma2, &bnk->gamma2,NULL);CHKERRQ(ierr);
567*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_gamma3", "", "", bnk->gamma3, &bnk->gamma3,NULL);CHKERRQ(ierr);
568*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_gamma4", "", "", bnk->gamma4, &bnk->gamma4,NULL);CHKERRQ(ierr);
569*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_theta", "", "", bnk->theta, &bnk->theta,NULL);CHKERRQ(ierr);
570*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_min_radius", "lower bound on initial radius", "", bnk->min_radius, &bnk->min_radius,NULL);CHKERRQ(ierr);
571*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_max_radius", "upper bound on radius", "", bnk->max_radius, &bnk->max_radius,NULL);CHKERRQ(ierr);
572*eb910715SAlp Dener   ierr = PetscOptionsReal("-tao_BNK_epsilon", "tolerance used when computing actual and predicted reduction", "", bnk->epsilon, &bnk->epsilon,NULL);CHKERRQ(ierr);
573*eb910715SAlp Dener   ierr = PetscOptionsTail();CHKERRQ(ierr);
574*eb910715SAlp Dener   ierr = TaoLineSearchSetFromOptions(tao->linesearch);CHKERRQ(ierr);
575*eb910715SAlp Dener   ierr = KSPSetFromOptions(tao->ksp);CHKERRQ(ierr);
576*eb910715SAlp Dener   PetscFunctionReturn(0);
577*eb910715SAlp Dener }
578*eb910715SAlp Dener 
579*eb910715SAlp Dener 
580*eb910715SAlp Dener /*------------------------------------------------------------*/
581*eb910715SAlp Dener static PetscErrorCode TaoView_BNK(Tao tao, PetscViewer viewer)
582*eb910715SAlp Dener {
583*eb910715SAlp Dener   TAO_BNK        *bnk = (TAO_BNK *)tao->data;
584*eb910715SAlp Dener   PetscInt       nrejects;
585*eb910715SAlp Dener   PetscBool      isascii;
586*eb910715SAlp Dener   PetscErrorCode ierr;
587*eb910715SAlp Dener 
588*eb910715SAlp Dener   PetscFunctionBegin;
589*eb910715SAlp Dener   ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&isascii);CHKERRQ(ierr);
590*eb910715SAlp Dener   if (isascii) {
591*eb910715SAlp Dener     ierr = PetscViewerASCIIPushTab(viewer);CHKERRQ(ierr);
592*eb910715SAlp Dener     if (BNK_PC_BFGS == bnk->pc_type && bnk->M) {
593*eb910715SAlp Dener       ierr = MatLMVMGetRejects(bnk->M,&nrejects);CHKERRQ(ierr);
594*eb910715SAlp Dener       ierr = PetscViewerASCIIPrintf(viewer, "Rejected matrix updates: %D\n",nrejects);CHKERRQ(ierr);
595*eb910715SAlp Dener     }
596*eb910715SAlp Dener     ierr = PetscViewerASCIIPrintf(viewer, "Newton steps: %D\n", bnk->newt);CHKERRQ(ierr);
597*eb910715SAlp Dener     ierr = PetscViewerASCIIPrintf(viewer, "BFGS steps: %D\n", bnk->bfgs);CHKERRQ(ierr);
598*eb910715SAlp Dener     ierr = PetscViewerASCIIPrintf(viewer, "Scaled gradient steps: %D\n", bnk->sgrad);CHKERRQ(ierr);
599*eb910715SAlp Dener     ierr = PetscViewerASCIIPrintf(viewer, "Gradient steps: %D\n", bnk->grad);CHKERRQ(ierr);
600*eb910715SAlp Dener     ierr = PetscViewerASCIIPrintf(viewer, "KSP termination reasons:\n");CHKERRQ(ierr);
601*eb910715SAlp Dener     ierr = PetscViewerASCIIPrintf(viewer, "  atol: %D\n", bnk->ksp_atol);CHKERRQ(ierr);
602*eb910715SAlp Dener     ierr = PetscViewerASCIIPrintf(viewer, "  rtol: %D\n", bnk->ksp_rtol);CHKERRQ(ierr);
603*eb910715SAlp Dener     ierr = PetscViewerASCIIPrintf(viewer, "  ctol: %D\n", bnk->ksp_ctol);CHKERRQ(ierr);
604*eb910715SAlp Dener     ierr = PetscViewerASCIIPrintf(viewer, "  negc: %D\n", bnk->ksp_negc);CHKERRQ(ierr);
605*eb910715SAlp Dener     ierr = PetscViewerASCIIPrintf(viewer, "  dtol: %D\n", bnk->ksp_dtol);CHKERRQ(ierr);
606*eb910715SAlp Dener     ierr = PetscViewerASCIIPrintf(viewer, "  iter: %D\n", bnk->ksp_iter);CHKERRQ(ierr);
607*eb910715SAlp Dener     ierr = PetscViewerASCIIPrintf(viewer, "  othr: %D\n", bnk->ksp_othr);CHKERRQ(ierr);
608*eb910715SAlp Dener     ierr = PetscViewerASCIIPopTab(viewer);CHKERRQ(ierr);
609*eb910715SAlp Dener   }
610*eb910715SAlp Dener   PetscFunctionReturn(0);
611*eb910715SAlp Dener }
612*eb910715SAlp Dener 
613*eb910715SAlp Dener /* ---------------------------------------------------------- */
614*eb910715SAlp Dener /*MC
615*eb910715SAlp Dener   TAOBNK - Shared base-type for Bounded Newton-Krylov type algorithms.
616*eb910715SAlp Dener   At each iteration, the BNK method solves the symmetric
617*eb910715SAlp Dener   system of equations to obtain the step direction dk:
618*eb910715SAlp Dener               Hk dk = -gk
619*eb910715SAlp Dener   at which point the step can be globalized either through trust-region
620*eb910715SAlp Dener   methods, or a line search, or a heuristic mixture of both.
621*eb910715SAlp Dener 
622*eb910715SAlp Dener     Options Database Keys:
623*eb910715SAlp Dener + -tao_BNK_pc_type - "none","ahess","bfgs","petsc"
624*eb910715SAlp Dener . -tao_BNK_bfgs_scale_type - "ahess","phess","bfgs"
625*eb910715SAlp Dener . -tao_BNK_init_type - "constant","direction","interpolation"
626*eb910715SAlp Dener . -tao_BNK_update_type - "step","direction","interpolation"
627*eb910715SAlp Dener . -tao_BNK_sval - perturbation starting value
628*eb910715SAlp Dener . -tao_BNK_imin - minimum initial perturbation
629*eb910715SAlp Dener . -tao_BNK_imax - maximum initial perturbation
630*eb910715SAlp Dener . -tao_BNK_pmin - minimum perturbation
631*eb910715SAlp Dener . -tao_BNK_pmax - maximum perturbation
632*eb910715SAlp Dener . -tao_BNK_pgfac - growth factor
633*eb910715SAlp Dener . -tao_BNK_psfac - shrink factor
634*eb910715SAlp Dener . -tao_BNK_imfac - initial merit factor
635*eb910715SAlp Dener . -tao_BNK_pmgfac - merit growth factor
636*eb910715SAlp Dener . -tao_BNK_pmsfac - merit shrink factor
637*eb910715SAlp Dener . -tao_BNK_eta1 - poor steplength; reduce radius
638*eb910715SAlp Dener . -tao_BNK_eta2 - reasonable steplength; leave radius
639*eb910715SAlp Dener . -tao_BNK_eta3 - good steplength; increase radius
640*eb910715SAlp Dener . -tao_BNK_eta4 - excellent steplength; greatly increase radius
641*eb910715SAlp Dener . -tao_BNK_alpha1 - alpha1 reduction
642*eb910715SAlp Dener . -tao_BNK_alpha2 - alpha2 reduction
643*eb910715SAlp Dener . -tao_BNK_alpha3 - alpha3 reduction
644*eb910715SAlp Dener . -tao_BNK_alpha4 - alpha4 reduction
645*eb910715SAlp Dener . -tao_BNK_alpha5 - alpha5 reduction
646*eb910715SAlp Dener . -tao_BNK_mu1 - mu1 interpolation update
647*eb910715SAlp Dener . -tao_BNK_mu2 - mu2 interpolation update
648*eb910715SAlp Dener . -tao_BNK_gamma1 - gamma1 interpolation update
649*eb910715SAlp Dener . -tao_BNK_gamma2 - gamma2 interpolation update
650*eb910715SAlp Dener . -tao_BNK_gamma3 - gamma3 interpolation update
651*eb910715SAlp Dener . -tao_BNK_gamma4 - gamma4 interpolation update
652*eb910715SAlp Dener . -tao_BNK_theta - theta interpolation update
653*eb910715SAlp Dener . -tao_BNK_omega1 - omega1 step update
654*eb910715SAlp Dener . -tao_BNK_omega2 - omega2 step update
655*eb910715SAlp Dener . -tao_BNK_omega3 - omega3 step update
656*eb910715SAlp Dener . -tao_BNK_omega4 - omega4 step update
657*eb910715SAlp Dener . -tao_BNK_omega5 - omega5 step update
658*eb910715SAlp Dener . -tao_BNK_mu1_i -  mu1 interpolation init factor
659*eb910715SAlp Dener . -tao_BNK_mu2_i -  mu2 interpolation init factor
660*eb910715SAlp Dener . -tao_BNK_gamma1_i -  gamma1 interpolation init factor
661*eb910715SAlp Dener . -tao_BNK_gamma2_i -  gamma2 interpolation init factor
662*eb910715SAlp Dener . -tao_BNK_gamma3_i -  gamma3 interpolation init factor
663*eb910715SAlp Dener . -tao_BNK_gamma4_i -  gamma4 interpolation init factor
664*eb910715SAlp Dener - -tao_BNK_theta_i -  theta interpolation init factor
665*eb910715SAlp Dener 
666*eb910715SAlp Dener   Level: beginner
667*eb910715SAlp Dener M*/
668*eb910715SAlp Dener 
669*eb910715SAlp Dener PetscErrorCode TaoCreate_BNK(Tao tao)
670*eb910715SAlp Dener {
671*eb910715SAlp Dener   TAO_BNK        *bnk;
672*eb910715SAlp Dener   const char     *morethuente_type = TAOLINESEARCHMT;
673*eb910715SAlp Dener   PetscErrorCode ierr;
674*eb910715SAlp Dener 
675*eb910715SAlp Dener   PetscFunctionBegin;
676*eb910715SAlp Dener   ierr = PetscNewLog(tao,&bnk);CHKERRQ(ierr);
677*eb910715SAlp Dener 
678*eb910715SAlp Dener   tao->ops->setup = TaoSetUp_BNK;
679*eb910715SAlp Dener   tao->ops->view = TaoView_BNK;
680*eb910715SAlp Dener   tao->ops->setfromoptions = TaoSetFromOptions_BNK;
681*eb910715SAlp Dener   tao->ops->destroy = TaoDestroy_BNK;
682*eb910715SAlp Dener 
683*eb910715SAlp Dener   /* Override default settings (unless already changed) */
684*eb910715SAlp Dener   if (!tao->max_it_changed) tao->max_it = 50;
685*eb910715SAlp Dener   if (!tao->trust0_changed) tao->trust0 = 100.0;
686*eb910715SAlp Dener 
687*eb910715SAlp Dener   tao->data = (void*)bnk;
688*eb910715SAlp Dener 
689*eb910715SAlp Dener   bnk->sval   = 0.0;
690*eb910715SAlp Dener   bnk->imin   = 1.0e-4;
691*eb910715SAlp Dener   bnk->imax   = 1.0e+2;
692*eb910715SAlp Dener   bnk->imfac  = 1.0e-1;
693*eb910715SAlp Dener 
694*eb910715SAlp Dener   bnk->pmin   = 1.0e-12;
695*eb910715SAlp Dener   bnk->pmax   = 1.0e+2;
696*eb910715SAlp Dener   bnk->pgfac  = 1.0e+1;
697*eb910715SAlp Dener   bnk->psfac  = 4.0e-1;
698*eb910715SAlp Dener   bnk->pmgfac = 1.0e-1;
699*eb910715SAlp Dener   bnk->pmsfac = 1.0e-1;
700*eb910715SAlp Dener 
701*eb910715SAlp Dener   /*  Default values for trust-region radius update based on steplength */
702*eb910715SAlp Dener   bnk->nu1 = 0.25;
703*eb910715SAlp Dener   bnk->nu2 = 0.50;
704*eb910715SAlp Dener   bnk->nu3 = 1.00;
705*eb910715SAlp Dener   bnk->nu4 = 1.25;
706*eb910715SAlp Dener 
707*eb910715SAlp Dener   bnk->omega1 = 0.25;
708*eb910715SAlp Dener   bnk->omega2 = 0.50;
709*eb910715SAlp Dener   bnk->omega3 = 1.00;
710*eb910715SAlp Dener   bnk->omega4 = 2.00;
711*eb910715SAlp Dener   bnk->omega5 = 4.00;
712*eb910715SAlp Dener 
713*eb910715SAlp Dener   /*  Default values for trust-region radius update based on reduction */
714*eb910715SAlp Dener   bnk->eta1 = 1.0e-4;
715*eb910715SAlp Dener   bnk->eta2 = 0.25;
716*eb910715SAlp Dener   bnk->eta3 = 0.50;
717*eb910715SAlp Dener   bnk->eta4 = 0.90;
718*eb910715SAlp Dener 
719*eb910715SAlp Dener   bnk->alpha1 = 0.25;
720*eb910715SAlp Dener   bnk->alpha2 = 0.50;
721*eb910715SAlp Dener   bnk->alpha3 = 1.00;
722*eb910715SAlp Dener   bnk->alpha4 = 2.00;
723*eb910715SAlp Dener   bnk->alpha5 = 4.00;
724*eb910715SAlp Dener 
725*eb910715SAlp Dener   /*  Default values for trust-region radius update based on interpolation */
726*eb910715SAlp Dener   bnk->mu1 = 0.10;
727*eb910715SAlp Dener   bnk->mu2 = 0.50;
728*eb910715SAlp Dener 
729*eb910715SAlp Dener   bnk->gamma1 = 0.25;
730*eb910715SAlp Dener   bnk->gamma2 = 0.50;
731*eb910715SAlp Dener   bnk->gamma3 = 2.00;
732*eb910715SAlp Dener   bnk->gamma4 = 4.00;
733*eb910715SAlp Dener 
734*eb910715SAlp Dener   bnk->theta = 0.05;
735*eb910715SAlp Dener 
736*eb910715SAlp Dener   /*  Default values for trust region initialization based on interpolation */
737*eb910715SAlp Dener   bnk->mu1_i = 0.35;
738*eb910715SAlp Dener   bnk->mu2_i = 0.50;
739*eb910715SAlp Dener 
740*eb910715SAlp Dener   bnk->gamma1_i = 0.0625;
741*eb910715SAlp Dener   bnk->gamma2_i = 0.5;
742*eb910715SAlp Dener   bnk->gamma3_i = 2.0;
743*eb910715SAlp Dener   bnk->gamma4_i = 5.0;
744*eb910715SAlp Dener 
745*eb910715SAlp Dener   bnk->theta_i = 0.25;
746*eb910715SAlp Dener 
747*eb910715SAlp Dener   /*  Remaining parameters */
748*eb910715SAlp Dener   bnk->min_radius = 1.0e-10;
749*eb910715SAlp Dener   bnk->max_radius = 1.0e10;
750*eb910715SAlp Dener   bnk->epsilon = 1.0e-6;
751*eb910715SAlp Dener 
752*eb910715SAlp Dener   bnk->pc_type         = BNK_PC_BFGS;
753*eb910715SAlp Dener   bnk->bfgs_scale_type = BFGS_SCALE_PHESS;
754*eb910715SAlp Dener   bnk->init_type       = BNK_INIT_INTERPOLATION;
755*eb910715SAlp Dener   bnk->update_type     = BNK_UPDATE_STEP;
756*eb910715SAlp Dener 
757*eb910715SAlp Dener   ierr = TaoLineSearchCreate(((PetscObject)tao)->comm,&tao->linesearch);CHKERRQ(ierr);
758*eb910715SAlp Dener   ierr = PetscObjectIncrementTabLevel((PetscObject)tao->linesearch, (PetscObject)tao, 1);CHKERRQ(ierr);
759*eb910715SAlp Dener   ierr = TaoLineSearchSetType(tao->linesearch,morethuente_type);CHKERRQ(ierr);
760*eb910715SAlp Dener   ierr = TaoLineSearchUseTaoRoutines(tao->linesearch,tao);CHKERRQ(ierr);
761*eb910715SAlp Dener   ierr = TaoLineSearchSetOptionsPrefix(tao->linesearch,tao->hdr.prefix);CHKERRQ(ierr);
762*eb910715SAlp Dener 
763*eb910715SAlp Dener   /*  Set linear solver to default for symmetric matrices */
764*eb910715SAlp Dener   ierr = KSPCreate(((PetscObject)tao)->comm,&tao->ksp);CHKERRQ(ierr);
765*eb910715SAlp Dener   ierr = PetscObjectIncrementTabLevel((PetscObject)tao->ksp, (PetscObject)tao, 1);CHKERRQ(ierr);
766*eb910715SAlp Dener   ierr = KSPSetOptionsPrefix(tao->ksp,tao->hdr.prefix);CHKERRQ(ierr);
767*eb910715SAlp Dener   ierr = KSPSetType(tao->ksp,KSPCGSTCG);CHKERRQ(ierr);
768*eb910715SAlp Dener   PetscFunctionReturn(0);
769*eb910715SAlp Dener }
770