1*eb910715SAlp Dener #include <petsctaolinesearch.h> 2*eb910715SAlp Dener #include <../src/tao/bound/impls/bnk/bnk.h> 3*eb910715SAlp Dener 4*eb910715SAlp Dener #include <petscksp.h> 5*eb910715SAlp Dener 6*eb910715SAlp Dener /* Routine for BFGS preconditioner */ 7*eb910715SAlp Dener 8*eb910715SAlp Dener PetscErrorCode MatLMVMSolveShell(PC pc, Vec b, Vec x) 9*eb910715SAlp Dener { 10*eb910715SAlp Dener PetscErrorCode ierr; 11*eb910715SAlp Dener Mat M; 12*eb910715SAlp Dener 13*eb910715SAlp Dener PetscFunctionBegin; 14*eb910715SAlp Dener PetscValidHeaderSpecific(pc,PC_CLASSID,1); 15*eb910715SAlp Dener PetscValidHeaderSpecific(b,VEC_CLASSID,2); 16*eb910715SAlp Dener PetscValidHeaderSpecific(x,VEC_CLASSID,3); 17*eb910715SAlp Dener ierr = PCShellGetContext(pc,(void**)&M);CHKERRQ(ierr); 18*eb910715SAlp Dener ierr = MatLMVMSolve(M, b, x);CHKERRQ(ierr); 19*eb910715SAlp Dener PetscFunctionReturn(0); 20*eb910715SAlp Dener } 21*eb910715SAlp Dener 22*eb910715SAlp Dener PetscErrorCode TaoBNKInitialize(Tao tao) 23*eb910715SAlp Dener { 24*eb910715SAlp Dener PetscErrorCode ierr; 25*eb910715SAlp Dener TAO_BNK *bnk = (TAO_BNK *)tao->data; 26*eb910715SAlp Dener KSPType ksp_type; 27*eb910715SAlp Dener PC pc; 28*eb910715SAlp Dener 29*eb910715SAlp Dener PetscReal fmin, ftrial, prered, actred, kappa, sigma; 30*eb910715SAlp Dener PetscReal tau, tau_1, tau_2, tau_max, tau_min, max_radius; 31*eb910715SAlp Dener PetscReal delta, step = 1.0; 32*eb910715SAlp Dener 33*eb910715SAlp Dener PetscInt n,N,needH = 1; 34*eb910715SAlp Dener 35*eb910715SAlp Dener PetscInt i_max = 5; 36*eb910715SAlp Dener PetscInt j_max = 1; 37*eb910715SAlp Dener PetscInt i, j; 38*eb910715SAlp Dener 39*eb910715SAlp Dener PetscFunctionBegin; 40*eb910715SAlp Dener /* Number of times ksp stopped because of these reasons */ 41*eb910715SAlp Dener bnk->ksp_atol = 0; 42*eb910715SAlp Dener bnk->ksp_rtol = 0; 43*eb910715SAlp Dener bnk->ksp_dtol = 0; 44*eb910715SAlp Dener bnk->ksp_ctol = 0; 45*eb910715SAlp Dener bnk->ksp_negc = 0; 
46*eb910715SAlp Dener bnk->ksp_iter = 0; 47*eb910715SAlp Dener bnk->ksp_othr = 0; 48*eb910715SAlp Dener 49*eb910715SAlp Dener /* Initialize trust-region radius when using nash, stcg, or gltr 50*eb910715SAlp Dener Command automatically ignored for other methods 51*eb910715SAlp Dener Will be reset during the first iteration 52*eb910715SAlp Dener */ 53*eb910715SAlp Dener ierr = KSPGetType(tao->ksp,&ksp_type);CHKERRQ(ierr); 54*eb910715SAlp Dener ierr = PetscStrcmp(ksp_type,KSPCGNASH,&bnk->is_nash);CHKERRQ(ierr); 55*eb910715SAlp Dener ierr = PetscStrcmp(ksp_type,KSPCGSTCG,&bnk->is_stcg);CHKERRQ(ierr); 56*eb910715SAlp Dener ierr = PetscStrcmp(ksp_type,KSPCGGLTR,&bnk->is_gltr);CHKERRQ(ierr); 57*eb910715SAlp Dener 58*eb910715SAlp Dener ierr = KSPCGSetRadius(tao->ksp,bnk->max_radius);CHKERRQ(ierr); 59*eb910715SAlp Dener 60*eb910715SAlp Dener if (bnk->is_nash || bnk->is_stcg || bnk->is_gltr) { 61*eb910715SAlp Dener if (tao->trust0 < 0.0) SETERRQ(PETSC_COMM_SELF,1,"Initial radius negative"); 62*eb910715SAlp Dener tao->trust = tao->trust0; 63*eb910715SAlp Dener tao->trust = PetscMax(tao->trust, bnk->min_radius); 64*eb910715SAlp Dener tao->trust = PetscMin(tao->trust, bnk->max_radius); 65*eb910715SAlp Dener } 66*eb910715SAlp Dener 67*eb910715SAlp Dener /* Get vectors we will need */ 68*eb910715SAlp Dener if (BNK_PC_BFGS == bnk->pc_type && !bnk->M) { 69*eb910715SAlp Dener ierr = VecGetLocalSize(tao->solution,&n);CHKERRQ(ierr); 70*eb910715SAlp Dener ierr = VecGetSize(tao->solution,&N);CHKERRQ(ierr); 71*eb910715SAlp Dener ierr = MatCreateLMVM(((PetscObject)tao)->comm,n,N,&bnk->M);CHKERRQ(ierr); 72*eb910715SAlp Dener ierr = MatLMVMAllocateVectors(bnk->M,tao->solution);CHKERRQ(ierr); 73*eb910715SAlp Dener } 74*eb910715SAlp Dener 75*eb910715SAlp Dener /* create vectors for the limited memory preconditioner */ 76*eb910715SAlp Dener if ((BNK_PC_BFGS == bnk->pc_type) && (BFGS_SCALE_BFGS != bnk->bfgs_scale_type)) { 77*eb910715SAlp Dener if (!bnk->Diag) { 78*eb910715SAlp Dener ierr = 
VecDuplicate(tao->solution,&bnk->Diag);CHKERRQ(ierr); 79*eb910715SAlp Dener } 80*eb910715SAlp Dener } 81*eb910715SAlp Dener 82*eb910715SAlp Dener /* Modify the preconditioner to use the bfgs approximation */ 83*eb910715SAlp Dener ierr = KSPGetPC(tao->ksp, &pc);CHKERRQ(ierr); 84*eb910715SAlp Dener switch(bnk->pc_type) { 85*eb910715SAlp Dener case BNK_PC_NONE: 86*eb910715SAlp Dener ierr = PCSetType(pc, PCNONE);CHKERRQ(ierr); 87*eb910715SAlp Dener ierr = PCSetFromOptions(pc);CHKERRQ(ierr); 88*eb910715SAlp Dener break; 89*eb910715SAlp Dener 90*eb910715SAlp Dener case BNK_PC_AHESS: 91*eb910715SAlp Dener ierr = PCSetType(pc, PCJACOBI);CHKERRQ(ierr); 92*eb910715SAlp Dener ierr = PCSetFromOptions(pc);CHKERRQ(ierr); 93*eb910715SAlp Dener ierr = PCJacobiSetUseAbs(pc,PETSC_TRUE);CHKERRQ(ierr); 94*eb910715SAlp Dener break; 95*eb910715SAlp Dener 96*eb910715SAlp Dener case BNK_PC_BFGS: 97*eb910715SAlp Dener ierr = PCSetType(pc, PCSHELL);CHKERRQ(ierr); 98*eb910715SAlp Dener ierr = PCSetFromOptions(pc);CHKERRQ(ierr); 99*eb910715SAlp Dener ierr = PCShellSetName(pc, "bfgs");CHKERRQ(ierr); 100*eb910715SAlp Dener ierr = PCShellSetContext(pc, bnk->M);CHKERRQ(ierr); 101*eb910715SAlp Dener ierr = PCShellSetApply(pc, MatLMVMSolveShell);CHKERRQ(ierr); 102*eb910715SAlp Dener break; 103*eb910715SAlp Dener 104*eb910715SAlp Dener default: 105*eb910715SAlp Dener /* Use the pc method set by pc_type */ 106*eb910715SAlp Dener break; 107*eb910715SAlp Dener } 108*eb910715SAlp Dener 109*eb910715SAlp Dener /* Initialize trust-region radius. The initialization is only performed 110*eb910715SAlp Dener when we are using Nash, Steihaug-Toint or the Generalized Lanczos method. 
*/ 111*eb910715SAlp Dener if (bnk->is_nash || bnk->is_stcg || bnk->is_gltr) { 112*eb910715SAlp Dener switch(bnk->init_type) { 113*eb910715SAlp Dener case BNK_INIT_CONSTANT: 114*eb910715SAlp Dener /* Use the initial radius specified */ 115*eb910715SAlp Dener break; 116*eb910715SAlp Dener 117*eb910715SAlp Dener case BNK_INIT_INTERPOLATION: 118*eb910715SAlp Dener /* Use the initial radius specified */ 119*eb910715SAlp Dener max_radius = 0.0; 120*eb910715SAlp Dener 121*eb910715SAlp Dener for (j = 0; j < j_max; ++j) { 122*eb910715SAlp Dener fmin = bnk->f; 123*eb910715SAlp Dener sigma = 0.0; 124*eb910715SAlp Dener 125*eb910715SAlp Dener if (needH) { 126*eb910715SAlp Dener ierr = TaoComputeHessian(tao, tao->solution,tao->hessian,tao->hessian_pre);CHKERRQ(ierr); 127*eb910715SAlp Dener needH = 0; 128*eb910715SAlp Dener } 129*eb910715SAlp Dener 130*eb910715SAlp Dener for (i = 0; i < i_max; ++i) { 131*eb910715SAlp Dener ierr = VecCopy(tao->solution,bnk->W);CHKERRQ(ierr); 132*eb910715SAlp Dener ierr = VecAXPY(bnk->W,-tao->trust/bnk->gnorm,tao->gradient);CHKERRQ(ierr); 133*eb910715SAlp Dener ierr = TaoComputeObjective(tao, bnk->W, &ftrial);CHKERRQ(ierr); 134*eb910715SAlp Dener if (PetscIsInfOrNanReal(ftrial)) { 135*eb910715SAlp Dener tau = bnk->gamma1_i; 136*eb910715SAlp Dener } else { 137*eb910715SAlp Dener if (ftrial < fmin) { 138*eb910715SAlp Dener fmin = ftrial; 139*eb910715SAlp Dener sigma = -tao->trust / bnk->gnorm; 140*eb910715SAlp Dener } 141*eb910715SAlp Dener 142*eb910715SAlp Dener ierr = MatMult(tao->hessian, tao->gradient, bnk->D);CHKERRQ(ierr); 143*eb910715SAlp Dener ierr = VecDot(tao->gradient, bnk->D, &prered);CHKERRQ(ierr); 144*eb910715SAlp Dener 145*eb910715SAlp Dener prered = tao->trust * (bnk->gnorm - 0.5 * tao->trust * prered / (bnk->gnorm * bnk->gnorm)); 146*eb910715SAlp Dener actred = bnk->f - ftrial; 147*eb910715SAlp Dener if ((PetscAbsScalar(actred) <= bnk->epsilon) && (PetscAbsScalar(prered) <= bnk->epsilon)) { 148*eb910715SAlp Dener kappa = 1.0; 
149*eb910715SAlp Dener } else { 150*eb910715SAlp Dener kappa = actred / prered; 151*eb910715SAlp Dener } 152*eb910715SAlp Dener 153*eb910715SAlp Dener tau_1 = bnk->theta_i * bnk->gnorm * tao->trust / (bnk->theta_i * bnk->gnorm * tao->trust + (1.0 - bnk->theta_i) * prered - actred); 154*eb910715SAlp Dener tau_2 = bnk->theta_i * bnk->gnorm * tao->trust / (bnk->theta_i * bnk->gnorm * tao->trust - (1.0 + bnk->theta_i) * prered + actred); 155*eb910715SAlp Dener tau_min = PetscMin(tau_1, tau_2); 156*eb910715SAlp Dener tau_max = PetscMax(tau_1, tau_2); 157*eb910715SAlp Dener 158*eb910715SAlp Dener if (PetscAbsScalar(kappa - 1.0) <= bnk->mu1_i) { 159*eb910715SAlp Dener /* Great agreement */ 160*eb910715SAlp Dener max_radius = PetscMax(max_radius, tao->trust); 161*eb910715SAlp Dener 162*eb910715SAlp Dener if (tau_max < 1.0) { 163*eb910715SAlp Dener tau = bnk->gamma3_i; 164*eb910715SAlp Dener } else if (tau_max > bnk->gamma4_i) { 165*eb910715SAlp Dener tau = bnk->gamma4_i; 166*eb910715SAlp Dener } else if (tau_1 >= 1.0 && tau_1 <= bnk->gamma4_i && tau_2 < 1.0) { 167*eb910715SAlp Dener tau = tau_1; 168*eb910715SAlp Dener } else if (tau_2 >= 1.0 && tau_2 <= bnk->gamma4_i && tau_1 < 1.0) { 169*eb910715SAlp Dener tau = tau_2; 170*eb910715SAlp Dener } else { 171*eb910715SAlp Dener tau = tau_max; 172*eb910715SAlp Dener } 173*eb910715SAlp Dener } else if (PetscAbsScalar(kappa - 1.0) <= bnk->mu2_i) { 174*eb910715SAlp Dener /* Good agreement */ 175*eb910715SAlp Dener max_radius = PetscMax(max_radius, tao->trust); 176*eb910715SAlp Dener 177*eb910715SAlp Dener if (tau_max < bnk->gamma2_i) { 178*eb910715SAlp Dener tau = bnk->gamma2_i; 179*eb910715SAlp Dener } else if (tau_max > bnk->gamma3_i) { 180*eb910715SAlp Dener tau = bnk->gamma3_i; 181*eb910715SAlp Dener } else { 182*eb910715SAlp Dener tau = tau_max; 183*eb910715SAlp Dener } 184*eb910715SAlp Dener } else { 185*eb910715SAlp Dener /* Not good agreement */ 186*eb910715SAlp Dener if (tau_min > 1.0) { 187*eb910715SAlp Dener tau = 
bnk->gamma2_i; 188*eb910715SAlp Dener } else if (tau_max < bnk->gamma1_i) { 189*eb910715SAlp Dener tau = bnk->gamma1_i; 190*eb910715SAlp Dener } else if ((tau_min < bnk->gamma1_i) && (tau_max >= 1.0)) { 191*eb910715SAlp Dener tau = bnk->gamma1_i; 192*eb910715SAlp Dener } else if ((tau_1 >= bnk->gamma1_i) && (tau_1 < 1.0) && ((tau_2 < bnk->gamma1_i) || (tau_2 >= 1.0))) { 193*eb910715SAlp Dener tau = tau_1; 194*eb910715SAlp Dener } else if ((tau_2 >= bnk->gamma1_i) && (tau_2 < 1.0) && ((tau_1 < bnk->gamma1_i) || (tau_2 >= 1.0))) { 195*eb910715SAlp Dener tau = tau_2; 196*eb910715SAlp Dener } else { 197*eb910715SAlp Dener tau = tau_max; 198*eb910715SAlp Dener } 199*eb910715SAlp Dener } 200*eb910715SAlp Dener } 201*eb910715SAlp Dener tao->trust = tau * tao->trust; 202*eb910715SAlp Dener } 203*eb910715SAlp Dener 204*eb910715SAlp Dener if (fmin < bnk->f) { 205*eb910715SAlp Dener bnk->f = fmin; 206*eb910715SAlp Dener ierr = VecAXPY(tao->solution,sigma,tao->gradient);CHKERRQ(ierr); 207*eb910715SAlp Dener ierr = TaoComputeGradient(tao,tao->solution,tao->gradient);CHKERRQ(ierr); 208*eb910715SAlp Dener 209*eb910715SAlp Dener ierr = TaoGradientNorm(tao, tao->gradient,NORM_2,&bnk->gnorm);CHKERRQ(ierr); 210*eb910715SAlp Dener if (PetscIsInfOrNanReal(bnk->gnorm)) SETERRQ(PETSC_COMM_SELF,1, "User provided compute gradient generated Inf or NaN"); 211*eb910715SAlp Dener needH = 1; 212*eb910715SAlp Dener 213*eb910715SAlp Dener ierr = TaoLogConvergenceHistory(tao,bnk->f,bnk->gnorm,0.0,tao->ksp_its);CHKERRQ(ierr); 214*eb910715SAlp Dener ierr = TaoMonitor(tao,tao->niter,bnk->f,bnk->gnorm,0.0,step);CHKERRQ(ierr); 215*eb910715SAlp Dener ierr = (*tao->ops->convergencetest)(tao,tao->cnvP);CHKERRQ(ierr); 216*eb910715SAlp Dener if (tao->reason != TAO_CONTINUE_ITERATING) PetscFunctionReturn(0); 217*eb910715SAlp Dener } 218*eb910715SAlp Dener } 219*eb910715SAlp Dener tao->trust = PetscMax(tao->trust, max_radius); 220*eb910715SAlp Dener 221*eb910715SAlp Dener /* Modify the radius if it is too 
large or small */ 222*eb910715SAlp Dener tao->trust = PetscMax(tao->trust, bnk->min_radius); 223*eb910715SAlp Dener tao->trust = PetscMin(tao->trust, bnk->max_radius); 224*eb910715SAlp Dener break; 225*eb910715SAlp Dener 226*eb910715SAlp Dener default: 227*eb910715SAlp Dener /* Norm of the first direction will initialize radius */ 228*eb910715SAlp Dener tao->trust = 0.0; 229*eb910715SAlp Dener break; 230*eb910715SAlp Dener } 231*eb910715SAlp Dener } 232*eb910715SAlp Dener 233*eb910715SAlp Dener /* Set initial scaling for the BFGS preconditioner 234*eb910715SAlp Dener This step is done after computing the initial trust-region radius 235*eb910715SAlp Dener since the function value may have decreased */ 236*eb910715SAlp Dener if (BNK_PC_BFGS == bnk->pc_type) { 237*eb910715SAlp Dener if (bnk->f != 0.0) { 238*eb910715SAlp Dener delta = 2.0 * PetscAbsScalar(bnk->f) / (bnk->gnorm*bnk->gnorm); 239*eb910715SAlp Dener } else { 240*eb910715SAlp Dener delta = 2.0 / (bnk->gnorm*bnk->gnorm); 241*eb910715SAlp Dener } 242*eb910715SAlp Dener ierr = MatLMVMSetDelta(bnk->M,delta);CHKERRQ(ierr); 243*eb910715SAlp Dener } 244*eb910715SAlp Dener 245*eb910715SAlp Dener /* Set counter for gradient/reset steps*/ 246*eb910715SAlp Dener bnk->newt = 0; 247*eb910715SAlp Dener bnk->bfgs = 0; 248*eb910715SAlp Dener bnk->sgrad = 0; 249*eb910715SAlp Dener bnk->grad = 0; 250*eb910715SAlp Dener PetscFunctionReturn(0); 251*eb910715SAlp Dener } 252*eb910715SAlp Dener 253*eb910715SAlp Dener PetscErrorCode TaoBNKComputeStep(Tao tao, PetscInt *stepType) 254*eb910715SAlp Dener { 255*eb910715SAlp Dener PetscErrorCode ierr; 256*eb910715SAlp Dener TAO_BNK *bnk = (TAO_BNK *)tao->data; 257*eb910715SAlp Dener KSPConvergedReason ksp_reason; 258*eb910715SAlp Dener 259*eb910715SAlp Dener PetscReal gdx, delta; 260*eb910715SAlp Dener PetscReal norm_d = 0.0, e_min; 261*eb910715SAlp Dener 262*eb910715SAlp Dener PetscInt bfgsUpdates = 0; 263*eb910715SAlp Dener PetscInt kspits; 264*eb910715SAlp Dener PetscInt needH = 1; 
265*eb910715SAlp Dener 266*eb910715SAlp Dener PetscFunctionBegin; 267*eb910715SAlp Dener /* Compute the Hessian */ 268*eb910715SAlp Dener if (needH) { 269*eb910715SAlp Dener ierr = TaoComputeHessian(tao,tao->solution,tao->hessian,tao->hessian_pre);CHKERRQ(ierr); 270*eb910715SAlp Dener } 271*eb910715SAlp Dener 272*eb910715SAlp Dener if ((BNK_PC_BFGS == bnk->pc_type) && (BFGS_SCALE_AHESS == bnk->bfgs_scale_type)) { 273*eb910715SAlp Dener /* Obtain diagonal for the bfgs preconditioner */ 274*eb910715SAlp Dener ierr = MatGetDiagonal(tao->hessian, bnk->Diag);CHKERRQ(ierr); 275*eb910715SAlp Dener ierr = VecAbs(bnk->Diag);CHKERRQ(ierr); 276*eb910715SAlp Dener ierr = VecReciprocal(bnk->Diag);CHKERRQ(ierr); 277*eb910715SAlp Dener ierr = MatLMVMSetScale(bnk->M,bnk->Diag);CHKERRQ(ierr); 278*eb910715SAlp Dener } 279*eb910715SAlp Dener 280*eb910715SAlp Dener /* Shift the Hessian matrix */ 281*eb910715SAlp Dener bnk->pert = bnk->sval; 282*eb910715SAlp Dener if (bnk->pert > 0) { 283*eb910715SAlp Dener ierr = MatShift(tao->hessian, bnk->pert);CHKERRQ(ierr); 284*eb910715SAlp Dener if (tao->hessian != tao->hessian_pre) { 285*eb910715SAlp Dener ierr = MatShift(tao->hessian_pre, bnk->pert);CHKERRQ(ierr); 286*eb910715SAlp Dener } 287*eb910715SAlp Dener } 288*eb910715SAlp Dener 289*eb910715SAlp Dener if (BNK_PC_BFGS == bnk->pc_type) { 290*eb910715SAlp Dener if (BFGS_SCALE_PHESS == bnk->bfgs_scale_type) { 291*eb910715SAlp Dener /* Obtain diagonal for the bfgs preconditioner */ 292*eb910715SAlp Dener ierr = MatGetDiagonal(tao->hessian, bnk->Diag);CHKERRQ(ierr); 293*eb910715SAlp Dener ierr = VecAbs(bnk->Diag);CHKERRQ(ierr); 294*eb910715SAlp Dener ierr = VecReciprocal(bnk->Diag);CHKERRQ(ierr); 295*eb910715SAlp Dener ierr = MatLMVMSetScale(bnk->M,bnk->Diag);CHKERRQ(ierr); 296*eb910715SAlp Dener } 297*eb910715SAlp Dener /* Update the limited memory preconditioner and get existing # of updates */ 298*eb910715SAlp Dener ierr = MatLMVMUpdate(bnk->M, tao->solution, tao->gradient);CHKERRQ(ierr); 
299*eb910715SAlp Dener ierr = MatLMVMGetUpdates(bnk->M, &bfgsUpdates);CHKERRQ(ierr); 300*eb910715SAlp Dener } 301*eb910715SAlp Dener 302*eb910715SAlp Dener /* Solve the Newton system of equations */ 303*eb910715SAlp Dener ierr = KSPSetOperators(tao->ksp,tao->hessian,tao->hessian_pre);CHKERRQ(ierr); 304*eb910715SAlp Dener if (bnk->is_nash || bnk->is_stcg || bnk->is_gltr) { 305*eb910715SAlp Dener ierr = KSPCGSetRadius(tao->ksp,bnk->max_radius);CHKERRQ(ierr); 306*eb910715SAlp Dener ierr = KSPSolve(tao->ksp, tao->gradient, bnk->D);CHKERRQ(ierr); 307*eb910715SAlp Dener ierr = KSPGetIterationNumber(tao->ksp,&kspits);CHKERRQ(ierr); 308*eb910715SAlp Dener tao->ksp_its+=kspits; 309*eb910715SAlp Dener tao->ksp_tot_its+=kspits; 310*eb910715SAlp Dener ierr = KSPCGGetNormD(tao->ksp,&norm_d);CHKERRQ(ierr); 311*eb910715SAlp Dener 312*eb910715SAlp Dener if (0.0 == tao->trust) { 313*eb910715SAlp Dener /* Radius was uninitialized; use the norm of the direction */ 314*eb910715SAlp Dener if (norm_d > 0.0) { 315*eb910715SAlp Dener tao->trust = norm_d; 316*eb910715SAlp Dener 317*eb910715SAlp Dener /* Modify the radius if it is too large or small */ 318*eb910715SAlp Dener tao->trust = PetscMax(tao->trust, bnk->min_radius); 319*eb910715SAlp Dener tao->trust = PetscMin(tao->trust, bnk->max_radius); 320*eb910715SAlp Dener } else { 321*eb910715SAlp Dener /* The direction was bad; set radius to default value and re-solve 322*eb910715SAlp Dener the trust-region subproblem to get a direction */ 323*eb910715SAlp Dener tao->trust = tao->trust0; 324*eb910715SAlp Dener 325*eb910715SAlp Dener /* Modify the radius if it is too large or small */ 326*eb910715SAlp Dener tao->trust = PetscMax(tao->trust, bnk->min_radius); 327*eb910715SAlp Dener tao->trust = PetscMin(tao->trust, bnk->max_radius); 328*eb910715SAlp Dener 329*eb910715SAlp Dener ierr = KSPCGSetRadius(tao->ksp,bnk->max_radius);CHKERRQ(ierr); 330*eb910715SAlp Dener ierr = KSPSolve(tao->ksp, tao->gradient, bnk->D);CHKERRQ(ierr); 331*eb910715SAlp 
Dener ierr = KSPGetIterationNumber(tao->ksp,&kspits);CHKERRQ(ierr); 332*eb910715SAlp Dener tao->ksp_its+=kspits; 333*eb910715SAlp Dener tao->ksp_tot_its+=kspits; 334*eb910715SAlp Dener ierr = KSPCGGetNormD(tao->ksp,&norm_d);CHKERRQ(ierr); 335*eb910715SAlp Dener 336*eb910715SAlp Dener if (norm_d == 0.0) SETERRQ(PETSC_COMM_SELF,1, "Initial direction zero"); 337*eb910715SAlp Dener } 338*eb910715SAlp Dener } 339*eb910715SAlp Dener } else { 340*eb910715SAlp Dener ierr = KSPSolve(tao->ksp, tao->gradient, bnk->D);CHKERRQ(ierr); 341*eb910715SAlp Dener ierr = KSPGetIterationNumber(tao->ksp, &kspits);CHKERRQ(ierr); 342*eb910715SAlp Dener tao->ksp_its += kspits; 343*eb910715SAlp Dener tao->ksp_tot_its+=kspits; 344*eb910715SAlp Dener } 345*eb910715SAlp Dener ierr = VecScale(bnk->D, -1.0);CHKERRQ(ierr); 346*eb910715SAlp Dener ierr = KSPGetConvergedReason(tao->ksp, &ksp_reason);CHKERRQ(ierr); 347*eb910715SAlp Dener if ((KSP_DIVERGED_INDEFINITE_PC == ksp_reason) && (BNK_PC_BFGS == bnk->pc_type) && (bfgsUpdates > 1)) { 348*eb910715SAlp Dener /* Preconditioner is numerically indefinite; reset the 349*eb910715SAlp Dener approximate if using BFGS preconditioning. 
*/ 350*eb910715SAlp Dener 351*eb910715SAlp Dener if (bnk->f != 0.0) { 352*eb910715SAlp Dener delta = 2.0 * PetscAbsScalar(bnk->f) / (bnk->gnorm*bnk->gnorm); 353*eb910715SAlp Dener } else { 354*eb910715SAlp Dener delta = 2.0 / (bnk->gnorm*bnk->gnorm); 355*eb910715SAlp Dener } 356*eb910715SAlp Dener ierr = MatLMVMSetDelta(bnk->M,delta);CHKERRQ(ierr); 357*eb910715SAlp Dener ierr = MatLMVMReset(bnk->M);CHKERRQ(ierr); 358*eb910715SAlp Dener ierr = MatLMVMUpdate(bnk->M, tao->solution, tao->gradient);CHKERRQ(ierr); 359*eb910715SAlp Dener bfgsUpdates = 1; 360*eb910715SAlp Dener } 361*eb910715SAlp Dener 362*eb910715SAlp Dener if (KSP_CONVERGED_ATOL == ksp_reason) { 363*eb910715SAlp Dener ++bnk->ksp_atol; 364*eb910715SAlp Dener } else if (KSP_CONVERGED_RTOL == ksp_reason) { 365*eb910715SAlp Dener ++bnk->ksp_rtol; 366*eb910715SAlp Dener } else if (KSP_CONVERGED_CG_CONSTRAINED == ksp_reason) { 367*eb910715SAlp Dener ++bnk->ksp_ctol; 368*eb910715SAlp Dener } else if (KSP_CONVERGED_CG_NEG_CURVE == ksp_reason) { 369*eb910715SAlp Dener ++bnk->ksp_negc; 370*eb910715SAlp Dener } else if (KSP_DIVERGED_DTOL == ksp_reason) { 371*eb910715SAlp Dener ++bnk->ksp_dtol; 372*eb910715SAlp Dener } else if (KSP_DIVERGED_ITS == ksp_reason) { 373*eb910715SAlp Dener ++bnk->ksp_iter; 374*eb910715SAlp Dener } else { 375*eb910715SAlp Dener ++bnk->ksp_othr; 376*eb910715SAlp Dener } 377*eb910715SAlp Dener 378*eb910715SAlp Dener /* Check for success (descent direction) */ 379*eb910715SAlp Dener ierr = VecDot(bnk->D, tao->gradient, &gdx);CHKERRQ(ierr); 380*eb910715SAlp Dener if ((gdx >= 0.0) || PetscIsInfOrNanReal(gdx)) { 381*eb910715SAlp Dener /* Newton step is not descent or direction produced Inf or NaN 382*eb910715SAlp Dener Update the perturbation for next time */ 383*eb910715SAlp Dener if (bnk->pert <= 0.0) { 384*eb910715SAlp Dener /* Initialize the perturbation */ 385*eb910715SAlp Dener bnk->pert = PetscMin(bnk->imax, PetscMax(bnk->imin, bnk->imfac * bnk->gnorm)); 386*eb910715SAlp Dener if 
(bnk->is_gltr) { 387*eb910715SAlp Dener ierr = KSPCGGLTRGetMinEig(tao->ksp,&e_min);CHKERRQ(ierr); 388*eb910715SAlp Dener bnk->pert = PetscMax(bnk->pert, -e_min); 389*eb910715SAlp Dener } 390*eb910715SAlp Dener } else { 391*eb910715SAlp Dener /* Increase the perturbation */ 392*eb910715SAlp Dener bnk->pert = PetscMin(bnk->pmax, PetscMax(bnk->pgfac * bnk->pert, bnk->pmgfac * bnk->gnorm)); 393*eb910715SAlp Dener } 394*eb910715SAlp Dener 395*eb910715SAlp Dener if (BNK_PC_BFGS != bnk->pc_type) { 396*eb910715SAlp Dener /* We don't have the bfgs matrix around and updated 397*eb910715SAlp Dener Must use gradient direction in this case */ 398*eb910715SAlp Dener ierr = VecCopy(tao->gradient, bnk->D);CHKERRQ(ierr); 399*eb910715SAlp Dener ierr = VecScale(bnk->D, -1.0);CHKERRQ(ierr); 400*eb910715SAlp Dener ++bnk->grad; 401*eb910715SAlp Dener *stepType = BNK_GRADIENT; 402*eb910715SAlp Dener } else { 403*eb910715SAlp Dener /* Attempt to use the BFGS direction */ 404*eb910715SAlp Dener ierr = MatLMVMSolve(bnk->M, tao->gradient, bnk->D);CHKERRQ(ierr); 405*eb910715SAlp Dener ierr = VecScale(bnk->D, -1.0);CHKERRQ(ierr); 406*eb910715SAlp Dener 407*eb910715SAlp Dener /* Check for success (descent direction) */ 408*eb910715SAlp Dener ierr = VecDot(tao->gradient, bnk->D, &gdx);CHKERRQ(ierr); 409*eb910715SAlp Dener if ((gdx >= 0) || PetscIsInfOrNanReal(gdx)) { 410*eb910715SAlp Dener /* BFGS direction is not descent or direction produced not a number 411*eb910715SAlp Dener We can assert bfgsUpdates > 1 in this case because 412*eb910715SAlp Dener the first solve produces the scaled gradient direction, 413*eb910715SAlp Dener which is guaranteed to be descent */ 414*eb910715SAlp Dener 415*eb910715SAlp Dener /* Use steepest descent direction (scaled) */ 416*eb910715SAlp Dener 417*eb910715SAlp Dener if (bnk->f != 0.0) { 418*eb910715SAlp Dener delta = 2.0 * PetscAbsScalar(bnk->f) / (bnk->gnorm*bnk->gnorm); 419*eb910715SAlp Dener } else { 420*eb910715SAlp Dener delta = 2.0 / 
(bnk->gnorm*bnk->gnorm); 421*eb910715SAlp Dener } 422*eb910715SAlp Dener ierr = MatLMVMSetDelta(bnk->M, delta);CHKERRQ(ierr); 423*eb910715SAlp Dener ierr = MatLMVMReset(bnk->M);CHKERRQ(ierr); 424*eb910715SAlp Dener ierr = MatLMVMUpdate(bnk->M, tao->solution, tao->gradient);CHKERRQ(ierr); 425*eb910715SAlp Dener ierr = MatLMVMSolve(bnk->M, tao->gradient, bnk->D);CHKERRQ(ierr); 426*eb910715SAlp Dener ierr = VecScale(bnk->D, -1.0);CHKERRQ(ierr); 427*eb910715SAlp Dener 428*eb910715SAlp Dener bfgsUpdates = 1; 429*eb910715SAlp Dener ++bnk->sgrad; 430*eb910715SAlp Dener *stepType = BNK_SCALED_GRADIENT; 431*eb910715SAlp Dener } else { 432*eb910715SAlp Dener if (1 == bfgsUpdates) { 433*eb910715SAlp Dener /* The first BFGS direction is always the scaled gradient */ 434*eb910715SAlp Dener ++bnk->sgrad; 435*eb910715SAlp Dener *stepType = BNK_SCALED_GRADIENT; 436*eb910715SAlp Dener } else { 437*eb910715SAlp Dener ++bnk->bfgs; 438*eb910715SAlp Dener *stepType = BNK_BFGS; 439*eb910715SAlp Dener } 440*eb910715SAlp Dener } 441*eb910715SAlp Dener } 442*eb910715SAlp Dener } else { 443*eb910715SAlp Dener /* Computed Newton step is descent */ 444*eb910715SAlp Dener switch (ksp_reason) { 445*eb910715SAlp Dener case KSP_DIVERGED_NANORINF: 446*eb910715SAlp Dener case KSP_DIVERGED_BREAKDOWN: 447*eb910715SAlp Dener case KSP_DIVERGED_INDEFINITE_MAT: 448*eb910715SAlp Dener case KSP_DIVERGED_INDEFINITE_PC: 449*eb910715SAlp Dener case KSP_CONVERGED_CG_NEG_CURVE: 450*eb910715SAlp Dener /* Matrix or preconditioner is indefinite; increase perturbation */ 451*eb910715SAlp Dener if (bnk->pert <= 0.0) { 452*eb910715SAlp Dener /* Initialize the perturbation */ 453*eb910715SAlp Dener bnk->pert = PetscMin(bnk->imax, PetscMax(bnk->imin, bnk->imfac * bnk->gnorm)); 454*eb910715SAlp Dener if (bnk->is_gltr) { 455*eb910715SAlp Dener ierr = KSPCGGLTRGetMinEig(tao->ksp, &e_min);CHKERRQ(ierr); 456*eb910715SAlp Dener bnk->pert = PetscMax(bnk->pert, -e_min); 457*eb910715SAlp Dener } 458*eb910715SAlp Dener } else { 
459*eb910715SAlp Dener /* Increase the perturbation */ 460*eb910715SAlp Dener bnk->pert = PetscMin(bnk->pmax, PetscMax(bnk->pgfac * bnk->pert, bnk->pmgfac * bnk->gnorm)); 461*eb910715SAlp Dener } 462*eb910715SAlp Dener break; 463*eb910715SAlp Dener 464*eb910715SAlp Dener default: 465*eb910715SAlp Dener /* Newton step computation is good; decrease perturbation */ 466*eb910715SAlp Dener bnk->pert = PetscMin(bnk->psfac * bnk->pert, bnk->pmsfac * bnk->gnorm); 467*eb910715SAlp Dener if (bnk->pert < bnk->pmin) { 468*eb910715SAlp Dener bnk->pert = 0.0; 469*eb910715SAlp Dener } 470*eb910715SAlp Dener break; 471*eb910715SAlp Dener } 472*eb910715SAlp Dener 473*eb910715SAlp Dener ++bnk->newt; 474*eb910715SAlp Dener stepType = BNK_NEWTON; 475*eb910715SAlp Dener } 476*eb910715SAlp Dener PetscFunctionReturn(0); 477*eb910715SAlp Dener } 478*eb910715SAlp Dener 479*eb910715SAlp Dener /* ---------------------------------------------------------- */ 480*eb910715SAlp Dener static PetscErrorCode TaoSetUp_BNK(Tao tao) 481*eb910715SAlp Dener { 482*eb910715SAlp Dener TAO_BNK *bnk = (TAO_BNK *)tao->data; 483*eb910715SAlp Dener PetscErrorCode ierr; 484*eb910715SAlp Dener 485*eb910715SAlp Dener PetscFunctionBegin; 486*eb910715SAlp Dener if (!tao->gradient) {ierr = VecDuplicate(tao->solution,&tao->gradient);CHKERRQ(ierr);} 487*eb910715SAlp Dener if (!tao->stepdirection) {ierr = VecDuplicate(tao->solution,&tao->stepdirection);CHKERRQ(ierr);} 488*eb910715SAlp Dener if (!bnk->W) {ierr = VecDuplicate(tao->solution,&bnk->W);CHKERRQ(ierr);} 489*eb910715SAlp Dener if (!bnk->D) {ierr = VecDuplicate(tao->solution,&bnk->D);CHKERRQ(ierr);} 490*eb910715SAlp Dener if (!bnk->Xold) {ierr = VecDuplicate(tao->solution,&bnk->Xold);CHKERRQ(ierr);} 491*eb910715SAlp Dener if (!bnk->Gold) {ierr = VecDuplicate(tao->solution,&bnk->Gold);CHKERRQ(ierr);} 492*eb910715SAlp Dener bnk->Diag = 0; 493*eb910715SAlp Dener bnk->M = 0; 494*eb910715SAlp Dener PetscFunctionReturn(0); 495*eb910715SAlp Dener } 496*eb910715SAlp 
Dener 497*eb910715SAlp Dener /*------------------------------------------------------------*/ 498*eb910715SAlp Dener static PetscErrorCode TaoDestroy_BNK(Tao tao) 499*eb910715SAlp Dener { 500*eb910715SAlp Dener TAO_BNK *bnk = (TAO_BNK *)tao->data; 501*eb910715SAlp Dener PetscErrorCode ierr; 502*eb910715SAlp Dener 503*eb910715SAlp Dener PetscFunctionBegin; 504*eb910715SAlp Dener if (tao->setupcalled) { 505*eb910715SAlp Dener ierr = VecDestroy(&bnk->D);CHKERRQ(ierr); 506*eb910715SAlp Dener ierr = VecDestroy(&bnk->W);CHKERRQ(ierr); 507*eb910715SAlp Dener ierr = VecDestroy(&bnk->Xold);CHKERRQ(ierr); 508*eb910715SAlp Dener ierr = VecDestroy(&bnk->Gold);CHKERRQ(ierr); 509*eb910715SAlp Dener } 510*eb910715SAlp Dener ierr = VecDestroy(&bnk->Diag);CHKERRQ(ierr); 511*eb910715SAlp Dener ierr = MatDestroy(&bnk->M);CHKERRQ(ierr); 512*eb910715SAlp Dener ierr = PetscFree(tao->data);CHKERRQ(ierr); 513*eb910715SAlp Dener PetscFunctionReturn(0); 514*eb910715SAlp Dener } 515*eb910715SAlp Dener 516*eb910715SAlp Dener /*------------------------------------------------------------*/ 517*eb910715SAlp Dener static PetscErrorCode TaoSetFromOptions_BNK(PetscOptionItems *PetscOptionsObject,Tao tao) 518*eb910715SAlp Dener { 519*eb910715SAlp Dener TAO_BNK *bnk = (TAO_BNK *)tao->data; 520*eb910715SAlp Dener PetscErrorCode ierr; 521*eb910715SAlp Dener 522*eb910715SAlp Dener PetscFunctionBegin; 523*eb910715SAlp Dener ierr = PetscOptionsHead(PetscOptionsObject,"Newton line search method for unconstrained optimization");CHKERRQ(ierr); 524*eb910715SAlp Dener ierr = PetscOptionsEList("-tao_BNK_pc_type", "pc type", "", BNK_PC, BNK_PC_TYPES, BNK_PC[bnk->pc_type], &bnk->pc_type, 0);CHKERRQ(ierr); 525*eb910715SAlp Dener ierr = PetscOptionsEList("-tao_BNK_bfgs_scale_type", "bfgs scale type", "", BFGS_SCALE, BFGS_SCALE_TYPES, BFGS_SCALE[bnk->bfgs_scale_type], &bnk->bfgs_scale_type, 0);CHKERRQ(ierr); 526*eb910715SAlp Dener ierr = PetscOptionsEList("-tao_BNK_init_type", "radius initialization type", "", 
BNK_INIT, BNK_INIT_TYPES, BNK_INIT[bnk->init_type], &bnk->init_type, 0);CHKERRQ(ierr); 527*eb910715SAlp Dener ierr = PetscOptionsEList("-tao_BNK_update_type", "radius update type", "", BNK_UPDATE, BNK_UPDATE_TYPES, BNK_UPDATE[bnk->update_type], &bnk->update_type, 0);CHKERRQ(ierr); 528*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_sval", "perturbation starting value", "", bnk->sval, &bnk->sval,NULL);CHKERRQ(ierr); 529*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_imin", "minimum initial perturbation", "", bnk->imin, &bnk->imin,NULL);CHKERRQ(ierr); 530*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_imax", "maximum initial perturbation", "", bnk->imax, &bnk->imax,NULL);CHKERRQ(ierr); 531*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_imfac", "initial merit factor", "", bnk->imfac, &bnk->imfac,NULL);CHKERRQ(ierr); 532*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_pmin", "minimum perturbation", "", bnk->pmin, &bnk->pmin,NULL);CHKERRQ(ierr); 533*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_pmax", "maximum perturbation", "", bnk->pmax, &bnk->pmax,NULL);CHKERRQ(ierr); 534*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_pgfac", "growth factor", "", bnk->pgfac, &bnk->pgfac,NULL);CHKERRQ(ierr); 535*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_psfac", "shrink factor", "", bnk->psfac, &bnk->psfac,NULL);CHKERRQ(ierr); 536*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_pmgfac", "merit growth factor", "", bnk->pmgfac, &bnk->pmgfac,NULL);CHKERRQ(ierr); 537*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_pmsfac", "merit shrink factor", "", bnk->pmsfac, &bnk->pmsfac,NULL);CHKERRQ(ierr); 538*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_eta1", "poor steplength; reduce radius", "", bnk->eta1, &bnk->eta1,NULL);CHKERRQ(ierr); 539*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_eta2", "reasonable steplength; leave radius alone", "", bnk->eta2, &bnk->eta2,NULL);CHKERRQ(ierr); 540*eb910715SAlp Dener ierr = 
PetscOptionsReal("-tao_BNK_eta3", "good steplength; increase radius", "", bnk->eta3, &bnk->eta3,NULL);CHKERRQ(ierr); 541*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_eta4", "excellent steplength; greatly increase radius", "", bnk->eta4, &bnk->eta4,NULL);CHKERRQ(ierr); 542*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_alpha1", "", "", bnk->alpha1, &bnk->alpha1,NULL);CHKERRQ(ierr); 543*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_alpha2", "", "", bnk->alpha2, &bnk->alpha2,NULL);CHKERRQ(ierr); 544*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_alpha3", "", "", bnk->alpha3, &bnk->alpha3,NULL);CHKERRQ(ierr); 545*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_alpha4", "", "", bnk->alpha4, &bnk->alpha4,NULL);CHKERRQ(ierr); 546*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_alpha5", "", "", bnk->alpha5, &bnk->alpha5,NULL);CHKERRQ(ierr); 547*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_nu1", "poor steplength; reduce radius", "", bnk->nu1, &bnk->nu1,NULL);CHKERRQ(ierr); 548*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_nu2", "reasonable steplength; leave radius alone", "", bnk->nu2, &bnk->nu2,NULL);CHKERRQ(ierr); 549*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_nu3", "good steplength; increase radius", "", bnk->nu3, &bnk->nu3,NULL);CHKERRQ(ierr); 550*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_nu4", "excellent steplength; greatly increase radius", "", bnk->nu4, &bnk->nu4,NULL);CHKERRQ(ierr); 551*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_omega1", "", "", bnk->omega1, &bnk->omega1,NULL);CHKERRQ(ierr); 552*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_omega2", "", "", bnk->omega2, &bnk->omega2,NULL);CHKERRQ(ierr); 553*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_omega3", "", "", bnk->omega3, &bnk->omega3,NULL);CHKERRQ(ierr); 554*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_omega4", "", "", bnk->omega4, &bnk->omega4,NULL);CHKERRQ(ierr); 555*eb910715SAlp Dener ierr = 
PetscOptionsReal("-tao_BNK_omega5", "", "", bnk->omega5, &bnk->omega5,NULL);CHKERRQ(ierr); 556*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_mu1_i", "", "", bnk->mu1_i, &bnk->mu1_i,NULL);CHKERRQ(ierr); 557*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_mu2_i", "", "", bnk->mu2_i, &bnk->mu2_i,NULL);CHKERRQ(ierr); 558*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_gamma1_i", "", "", bnk->gamma1_i, &bnk->gamma1_i,NULL);CHKERRQ(ierr); 559*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_gamma2_i", "", "", bnk->gamma2_i, &bnk->gamma2_i,NULL);CHKERRQ(ierr); 560*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_gamma3_i", "", "", bnk->gamma3_i, &bnk->gamma3_i,NULL);CHKERRQ(ierr); 561*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_gamma4_i", "", "", bnk->gamma4_i, &bnk->gamma4_i,NULL);CHKERRQ(ierr); 562*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_theta_i", "", "", bnk->theta_i, &bnk->theta_i,NULL);CHKERRQ(ierr); 563*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_mu1", "", "", bnk->mu1, &bnk->mu1,NULL);CHKERRQ(ierr); 564*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_mu2", "", "", bnk->mu2, &bnk->mu2,NULL);CHKERRQ(ierr); 565*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_gamma1", "", "", bnk->gamma1, &bnk->gamma1,NULL);CHKERRQ(ierr); 566*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_gamma2", "", "", bnk->gamma2, &bnk->gamma2,NULL);CHKERRQ(ierr); 567*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_gamma3", "", "", bnk->gamma3, &bnk->gamma3,NULL);CHKERRQ(ierr); 568*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_gamma4", "", "", bnk->gamma4, &bnk->gamma4,NULL);CHKERRQ(ierr); 569*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_theta", "", "", bnk->theta, &bnk->theta,NULL);CHKERRQ(ierr); 570*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_min_radius", "lower bound on initial radius", "", bnk->min_radius, &bnk->min_radius,NULL);CHKERRQ(ierr); 571*eb910715SAlp Dener ierr = 
PetscOptionsReal("-tao_BNK_max_radius", "upper bound on radius", "", bnk->max_radius, &bnk->max_radius,NULL);CHKERRQ(ierr); 572*eb910715SAlp Dener ierr = PetscOptionsReal("-tao_BNK_epsilon", "tolerance used when computing actual and predicted reduction", "", bnk->epsilon, &bnk->epsilon,NULL);CHKERRQ(ierr); 573*eb910715SAlp Dener ierr = PetscOptionsTail();CHKERRQ(ierr); 574*eb910715SAlp Dener ierr = TaoLineSearchSetFromOptions(tao->linesearch);CHKERRQ(ierr); 575*eb910715SAlp Dener ierr = KSPSetFromOptions(tao->ksp);CHKERRQ(ierr); 576*eb910715SAlp Dener PetscFunctionReturn(0); 577*eb910715SAlp Dener } 578*eb910715SAlp Dener 579*eb910715SAlp Dener 580*eb910715SAlp Dener /*------------------------------------------------------------*/ 581*eb910715SAlp Dener static PetscErrorCode TaoView_BNK(Tao tao, PetscViewer viewer) 582*eb910715SAlp Dener { 583*eb910715SAlp Dener TAO_BNK *bnk = (TAO_BNK *)tao->data; 584*eb910715SAlp Dener PetscInt nrejects; 585*eb910715SAlp Dener PetscBool isascii; 586*eb910715SAlp Dener PetscErrorCode ierr; 587*eb910715SAlp Dener 588*eb910715SAlp Dener PetscFunctionBegin; 589*eb910715SAlp Dener ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&isascii);CHKERRQ(ierr); 590*eb910715SAlp Dener if (isascii) { 591*eb910715SAlp Dener ierr = PetscViewerASCIIPushTab(viewer);CHKERRQ(ierr); 592*eb910715SAlp Dener if (BNK_PC_BFGS == bnk->pc_type && bnk->M) { 593*eb910715SAlp Dener ierr = MatLMVMGetRejects(bnk->M,&nrejects);CHKERRQ(ierr); 594*eb910715SAlp Dener ierr = PetscViewerASCIIPrintf(viewer, "Rejected matrix updates: %D\n",nrejects);CHKERRQ(ierr); 595*eb910715SAlp Dener } 596*eb910715SAlp Dener ierr = PetscViewerASCIIPrintf(viewer, "Newton steps: %D\n", bnk->newt);CHKERRQ(ierr); 597*eb910715SAlp Dener ierr = PetscViewerASCIIPrintf(viewer, "BFGS steps: %D\n", bnk->bfgs);CHKERRQ(ierr); 598*eb910715SAlp Dener ierr = PetscViewerASCIIPrintf(viewer, "Scaled gradient steps: %D\n", bnk->sgrad);CHKERRQ(ierr); 599*eb910715SAlp Dener ierr = 
PetscViewerASCIIPrintf(viewer, "Gradient steps: %D\n", bnk->grad);CHKERRQ(ierr); 600*eb910715SAlp Dener ierr = PetscViewerASCIIPrintf(viewer, "KSP termination reasons:\n");CHKERRQ(ierr); 601*eb910715SAlp Dener ierr = PetscViewerASCIIPrintf(viewer, " atol: %D\n", bnk->ksp_atol);CHKERRQ(ierr); 602*eb910715SAlp Dener ierr = PetscViewerASCIIPrintf(viewer, " rtol: %D\n", bnk->ksp_rtol);CHKERRQ(ierr); 603*eb910715SAlp Dener ierr = PetscViewerASCIIPrintf(viewer, " ctol: %D\n", bnk->ksp_ctol);CHKERRQ(ierr); 604*eb910715SAlp Dener ierr = PetscViewerASCIIPrintf(viewer, " negc: %D\n", bnk->ksp_negc);CHKERRQ(ierr); 605*eb910715SAlp Dener ierr = PetscViewerASCIIPrintf(viewer, " dtol: %D\n", bnk->ksp_dtol);CHKERRQ(ierr); 606*eb910715SAlp Dener ierr = PetscViewerASCIIPrintf(viewer, " iter: %D\n", bnk->ksp_iter);CHKERRQ(ierr); 607*eb910715SAlp Dener ierr = PetscViewerASCIIPrintf(viewer, " othr: %D\n", bnk->ksp_othr);CHKERRQ(ierr); 608*eb910715SAlp Dener ierr = PetscViewerASCIIPopTab(viewer);CHKERRQ(ierr); 609*eb910715SAlp Dener } 610*eb910715SAlp Dener PetscFunctionReturn(0); 611*eb910715SAlp Dener } 612*eb910715SAlp Dener 613*eb910715SAlp Dener /* ---------------------------------------------------------- */ 614*eb910715SAlp Dener /*MC 615*eb910715SAlp Dener TAOBNK - Shared base-type for Bounded Newton-Krylov type algorithms. 616*eb910715SAlp Dener At each iteration, the BNK method solves the symmetric 617*eb910715SAlp Dener system of equations to obtain the step diretion dk: 618*eb910715SAlp Dener Hk dk = -gk 619*eb910715SAlp Dener at which point the step can be globalized either through trust-region 620*eb910715SAlp Dener methods, or a line search, or a heuristic mixture of both. 621*eb910715SAlp Dener 622*eb910715SAlp Dener Options Database Keys: 623*eb910715SAlp Dener + -tao_BNK_pc_type - "none","ahess","bfgs","petsc" 624*eb910715SAlp Dener . -tao_BNK_bfgs_scale_type - "ahess","phess","bfgs" 625*eb910715SAlp Dener . 
-tao_BNK_init_type - "constant","direction","interpolation"
. -tao_BNK_update_type - "step","direction","interpolation"
. -tao_BNK_sval - perturbation starting value
. -tao_BNK_imin - minimum initial perturbation
. -tao_BNK_imax - maximum initial perturbation
. -tao_BNK_pmin - minimum perturbation
. -tao_BNK_pmax - maximum perturbation
. -tao_BNK_pgfac - growth factor
. -tao_BNK_psfac - shrink factor
. -tao_BNK_imfac - initial merit factor
. -tao_BNK_pmgfac - merit growth factor
. -tao_BNK_pmsfac - merit shrink factor
. -tao_BNK_eta1 - poor steplength; reduce radius
. -tao_BNK_eta2 - reasonable steplength; leave radius alone
. -tao_BNK_eta3 - good steplength; increase radius
. -tao_BNK_eta4 - excellent steplength; greatly increase radius
. -tao_BNK_alpha1 - alpha1 reduction
. -tao_BNK_alpha2 - alpha2 reduction
. -tao_BNK_alpha3 - alpha3 reduction
. -tao_BNK_alpha4 - alpha4 reduction
. -tao_BNK_alpha5 - alpha5 reduction
. -tao_BNK_mu1 - mu1 interpolation update
. -tao_BNK_mu2 - mu2 interpolation update
. -tao_BNK_gamma1 - gamma1 interpolation update
. -tao_BNK_gamma2 - gamma2 interpolation update
. -tao_BNK_gamma3 - gamma3 interpolation update
. -tao_BNK_gamma4 - gamma4 interpolation update
. -tao_BNK_theta - theta interpolation update
. -tao_BNK_omega1 - omega1 step update
.
-tao_BNK_omega2 - omega2 step update 655*eb910715SAlp Dener . -tao_BNK_omega3 - omega3 step update 656*eb910715SAlp Dener . -tao_BNK_omega4 - omega4 step update 657*eb910715SAlp Dener . -tao_BNK_omega5 - omega5 step update 658*eb910715SAlp Dener . -tao_BNK_mu1_i - mu1 interpolation init factor 659*eb910715SAlp Dener . -tao_BNK_mu2_i - mu2 interpolation init factor 660*eb910715SAlp Dener . -tao_BNK_gamma1_i - gamma1 interpolation init factor 661*eb910715SAlp Dener . -tao_BNK_gamma2_i - gamma2 interpolation init factor 662*eb910715SAlp Dener . -tao_BNK_gamma3_i - gamma3 interpolation init factor 663*eb910715SAlp Dener . -tao_BNK_gamma4_i - gamma4 interpolation init factor 664*eb910715SAlp Dener - -tao_BNK_theta_i - theta interpolation init factor 665*eb910715SAlp Dener 666*eb910715SAlp Dener Level: beginner 667*eb910715SAlp Dener M*/ 668*eb910715SAlp Dener 669*eb910715SAlp Dener PetscErrorCode TaoCreate_BNK(Tao tao) 670*eb910715SAlp Dener { 671*eb910715SAlp Dener TAO_BNK *bnk; 672*eb910715SAlp Dener const char *morethuente_type = TAOLINESEARCHMT; 673*eb910715SAlp Dener PetscErrorCode ierr; 674*eb910715SAlp Dener 675*eb910715SAlp Dener PetscFunctionBegin; 676*eb910715SAlp Dener ierr = PetscNewLog(tao,&bnk);CHKERRQ(ierr); 677*eb910715SAlp Dener 678*eb910715SAlp Dener tao->ops->setup = TaoSetUp_BNK; 679*eb910715SAlp Dener tao->ops->view = TaoView_BNK; 680*eb910715SAlp Dener tao->ops->setfromoptions = TaoSetFromOptions_BNK; 681*eb910715SAlp Dener tao->ops->destroy = TaoDestroy_BNK; 682*eb910715SAlp Dener 683*eb910715SAlp Dener /* Override default settings (unless already changed) */ 684*eb910715SAlp Dener if (!tao->max_it_changed) tao->max_it = 50; 685*eb910715SAlp Dener if (!tao->trust0_changed) tao->trust0 = 100.0; 686*eb910715SAlp Dener 687*eb910715SAlp Dener tao->data = (void*)bnk; 688*eb910715SAlp Dener 689*eb910715SAlp Dener bnk->sval = 0.0; 690*eb910715SAlp Dener bnk->imin = 1.0e-4; 691*eb910715SAlp Dener bnk->imax = 1.0e+2; 692*eb910715SAlp Dener bnk->imfac = 
1.0e-1; 693*eb910715SAlp Dener 694*eb910715SAlp Dener bnk->pmin = 1.0e-12; 695*eb910715SAlp Dener bnk->pmax = 1.0e+2; 696*eb910715SAlp Dener bnk->pgfac = 1.0e+1; 697*eb910715SAlp Dener bnk->psfac = 4.0e-1; 698*eb910715SAlp Dener bnk->pmgfac = 1.0e-1; 699*eb910715SAlp Dener bnk->pmsfac = 1.0e-1; 700*eb910715SAlp Dener 701*eb910715SAlp Dener /* Default values for trust-region radius update based on steplength */ 702*eb910715SAlp Dener bnk->nu1 = 0.25; 703*eb910715SAlp Dener bnk->nu2 = 0.50; 704*eb910715SAlp Dener bnk->nu3 = 1.00; 705*eb910715SAlp Dener bnk->nu4 = 1.25; 706*eb910715SAlp Dener 707*eb910715SAlp Dener bnk->omega1 = 0.25; 708*eb910715SAlp Dener bnk->omega2 = 0.50; 709*eb910715SAlp Dener bnk->omega3 = 1.00; 710*eb910715SAlp Dener bnk->omega4 = 2.00; 711*eb910715SAlp Dener bnk->omega5 = 4.00; 712*eb910715SAlp Dener 713*eb910715SAlp Dener /* Default values for trust-region radius update based on reduction */ 714*eb910715SAlp Dener bnk->eta1 = 1.0e-4; 715*eb910715SAlp Dener bnk->eta2 = 0.25; 716*eb910715SAlp Dener bnk->eta3 = 0.50; 717*eb910715SAlp Dener bnk->eta4 = 0.90; 718*eb910715SAlp Dener 719*eb910715SAlp Dener bnk->alpha1 = 0.25; 720*eb910715SAlp Dener bnk->alpha2 = 0.50; 721*eb910715SAlp Dener bnk->alpha3 = 1.00; 722*eb910715SAlp Dener bnk->alpha4 = 2.00; 723*eb910715SAlp Dener bnk->alpha5 = 4.00; 724*eb910715SAlp Dener 725*eb910715SAlp Dener /* Default values for trust-region radius update based on interpolation */ 726*eb910715SAlp Dener bnk->mu1 = 0.10; 727*eb910715SAlp Dener bnk->mu2 = 0.50; 728*eb910715SAlp Dener 729*eb910715SAlp Dener bnk->gamma1 = 0.25; 730*eb910715SAlp Dener bnk->gamma2 = 0.50; 731*eb910715SAlp Dener bnk->gamma3 = 2.00; 732*eb910715SAlp Dener bnk->gamma4 = 4.00; 733*eb910715SAlp Dener 734*eb910715SAlp Dener bnk->theta = 0.05; 735*eb910715SAlp Dener 736*eb910715SAlp Dener /* Default values for trust region initialization based on interpolation */ 737*eb910715SAlp Dener bnk->mu1_i = 0.35; 738*eb910715SAlp Dener bnk->mu2_i = 0.50; 
739*eb910715SAlp Dener 740*eb910715SAlp Dener bnk->gamma1_i = 0.0625; 741*eb910715SAlp Dener bnk->gamma2_i = 0.5; 742*eb910715SAlp Dener bnk->gamma3_i = 2.0; 743*eb910715SAlp Dener bnk->gamma4_i = 5.0; 744*eb910715SAlp Dener 745*eb910715SAlp Dener bnk->theta_i = 0.25; 746*eb910715SAlp Dener 747*eb910715SAlp Dener /* Remaining parameters */ 748*eb910715SAlp Dener bnk->min_radius = 1.0e-10; 749*eb910715SAlp Dener bnk->max_radius = 1.0e10; 750*eb910715SAlp Dener bnk->epsilon = 1.0e-6; 751*eb910715SAlp Dener 752*eb910715SAlp Dener bnk->pc_type = BNK_PC_BFGS; 753*eb910715SAlp Dener bnk->bfgs_scale_type = BFGS_SCALE_PHESS; 754*eb910715SAlp Dener bnk->init_type = BNK_INIT_INTERPOLATION; 755*eb910715SAlp Dener bnk->update_type = BNK_UPDATE_STEP; 756*eb910715SAlp Dener 757*eb910715SAlp Dener ierr = TaoLineSearchCreate(((PetscObject)tao)->comm,&tao->linesearch);CHKERRQ(ierr); 758*eb910715SAlp Dener ierr = PetscObjectIncrementTabLevel((PetscObject)tao->linesearch, (PetscObject)tao, 1);CHKERRQ(ierr); 759*eb910715SAlp Dener ierr = TaoLineSearchSetType(tao->linesearch,morethuente_type);CHKERRQ(ierr); 760*eb910715SAlp Dener ierr = TaoLineSearchUseTaoRoutines(tao->linesearch,tao);CHKERRQ(ierr); 761*eb910715SAlp Dener ierr = TaoLineSearchSetOptionsPrefix(tao->linesearch,tao->hdr.prefix);CHKERRQ(ierr); 762*eb910715SAlp Dener 763*eb910715SAlp Dener /* Set linear solver to default for symmetric matrices */ 764*eb910715SAlp Dener ierr = KSPCreate(((PetscObject)tao)->comm,&tao->ksp);CHKERRQ(ierr); 765*eb910715SAlp Dener ierr = PetscObjectIncrementTabLevel((PetscObject)tao->ksp, (PetscObject)tao, 1);CHKERRQ(ierr); 766*eb910715SAlp Dener ierr = KSPSetOptionsPrefix(tao->ksp,tao->hdr.prefix);CHKERRQ(ierr); 767*eb910715SAlp Dener ierr = KSPSetType(tao->ksp,KSPCGSTCG);CHKERRQ(ierr); 768*eb910715SAlp Dener PetscFunctionReturn(0); 769*eb910715SAlp Dener } 770