1eb910715SAlp Dener /* 2eb910715SAlp Dener Context for bounded Newton-Krylov type optimization algorithms 3eb910715SAlp Dener */ 4eb910715SAlp Dener 5eb910715SAlp Dener #if !defined(__TAO_BNK_H) 6eb910715SAlp Dener #define __TAO_BNK_H 7eb910715SAlp Dener #include <petsc/private/taoimpl.h> 8c0f10754SAlp Dener #include <../src/tao/bound/impls/bncg/bncg.h> 9eb910715SAlp Dener 10eb910715SAlp Dener typedef struct { 11e0ed867bSAlp Dener /* Function pointer for hessian evaluation 12e0ed867bSAlp Dener NOTE: This is necessary so that quasi-Newton-Krylov methods can "evaluate" 13e0ed867bSAlp Dener a quasi-Newton approximation while full Newton-Krylov methods call-back to 14e0ed867bSAlp Dener the application's Hessian */ 15e0ed867bSAlp Dener PetscErrorCode (*computehessian)(Tao); 166b591159SAlp Dener PetscErrorCode (*computestep)(Tao, PetscBool, KSPConvergedReason*, PetscInt*); 17e0ed867bSAlp Dener 18c0f10754SAlp Dener /* Embedded TAOBNCG */ 19c0f10754SAlp Dener Tao bncg; 20c0f10754SAlp Dener TAO_BNCG *bncg_ctx; 21e031d6f5SAlp Dener PetscInt max_cg_its, tot_cg_its; 22c0f10754SAlp Dener Vec bncg_sol; 23c0f10754SAlp Dener 24c0f10754SAlp Dener /* Allocated vectors */ 25c0f10754SAlp Dener Vec W, Xwork, Gwork, Xold, Gold; 2609164190SAlp Dener Vec unprojected_gradient, unprojected_gradient_old; 27c0f10754SAlp Dener 28c0f10754SAlp Dener /* Unallocated matrices and vectors */ 29b9ac7092SAlp Dener Mat H_inactive, Hpre_inactive; 30b9ac7092SAlp Dener Vec X_inactive, G_inactive, inactive_work, active_work; 312f75a4aaSAlp Dener IS inactive_idx, active_idx, active_lower, active_upper, active_fixed; 32eb910715SAlp Dener 33080d2917SAlp Dener /* Scalar values for the solution and step */ 34080d2917SAlp Dener PetscReal fold, f, gnorm, dnorm; 35eb910715SAlp Dener 362f75a4aaSAlp Dener /* Parameters for active set estimation */ 370a4511e9SAlp Dener PetscReal as_tol; 380a4511e9SAlp Dener PetscReal as_step; 392f75a4aaSAlp Dener 40b9ac7092SAlp Dener /* BFGS preconditioner data */ 41b9ac7092SAlp Dener PC bfgs_pre; 42b9ac7092SAlp Dener Mat M; 43b9ac7092SAlp Dener Vec Diag_min, Diag_max; 44b9ac7092SAlp Dener 45eb910715SAlp Dener /* Parameters when updating the perturbation added to the Hessian matrix 46eb910715SAlp Dener according to the following scheme: 47eb910715SAlp Dener 48eb910715SAlp Dener pert = sval; 49eb910715SAlp Dener 50eb910715SAlp Dener do until convergence 51eb910715SAlp Dener shift Hessian by pert 52eb910715SAlp Dener solve Newton system 53eb910715SAlp Dener 54eb910715SAlp Dener if (linear solver failed or did not compute a descent direction) 55eb910715SAlp Dener use steepest descent direction and increase perturbation 56eb910715SAlp Dener 57eb910715SAlp Dener if (0 == pert) 58eb910715SAlp Dener initialize perturbation 59eb910715SAlp Dener pert = min(imax, max(imin, imfac * norm(G))) 60eb910715SAlp Dener else 61eb910715SAlp Dener increase perturbation 62eb910715SAlp Dener pert = min(pmax, max(pgfac * pert, pmgfac * norm(G))) 63eb910715SAlp Dener fi 64eb910715SAlp Dener else 65eb910715SAlp Dener use linear solver direction and decrease perturbation 66eb910715SAlp Dener 67eb910715SAlp Dener pert = min(psfac * pert, pmsfac * norm(G)) 68eb910715SAlp Dener if (pert < pmin) 69eb910715SAlp Dener pert = 0 70eb910715SAlp Dener fi 71eb910715SAlp Dener fi 72eb910715SAlp Dener 73eb910715SAlp Dener perform line search 74eb910715SAlp Dener function and gradient evaluation 75eb910715SAlp Dener check convergence 76eb910715SAlp Dener od 77eb910715SAlp Dener */ 78eb910715SAlp Dener PetscReal sval; /* Starting perturbation value, default zero */ 79eb910715SAlp Dener 80eb910715SAlp Dener PetscReal imin; /* Minimum perturbation added during initialization */ 81eb910715SAlp Dener PetscReal imax; /* Maximum perturbation added during initialization */ 82eb910715SAlp Dener PetscReal imfac; /* Merit function factor during initialization */ 83eb910715SAlp Dener 84eb910715SAlp Dener PetscReal pert; /* Current perturbation value */ 85eb910715SAlp Dener PetscReal pmin; /* Minimim perturbation value */ 86eb910715SAlp Dener PetscReal pmax; /* Maximum perturbation value */ 87eb910715SAlp Dener PetscReal pgfac; /* Perturbation growth factor */ 88eb910715SAlp Dener PetscReal psfac; /* Perturbation shrink factor */ 89eb910715SAlp Dener PetscReal pmgfac; /* Merit function growth factor */ 90eb910715SAlp Dener PetscReal pmsfac; /* Merit function shrink factor */ 91eb910715SAlp Dener 92eb910715SAlp Dener /* Parameters when updating the trust-region radius based on steplength 93eb910715SAlp Dener if step < nu1 (very bad step) 94eb910715SAlp Dener radius = omega1 * min(norm(d), radius) 95eb910715SAlp Dener elif step < nu2 (bad step) 96eb910715SAlp Dener radius = omega2 * min(norm(d), radius) 97eb910715SAlp Dener elif step < nu3 (okay step) 98eb910715SAlp Dener radius = omega3 * radius; 99eb910715SAlp Dener elif step < nu4 (good step) 100eb910715SAlp Dener radius = max(omega4 * norm(d), radius) 101eb910715SAlp Dener else (very good step) 102eb910715SAlp Dener radius = max(omega5 * norm(d), radius) 103eb910715SAlp Dener fi 104eb910715SAlp Dener */ 105eb910715SAlp Dener PetscReal nu1; /* used to compute trust-region radius */ 106eb910715SAlp Dener PetscReal nu2; /* used to compute trust-region radius */ 107eb910715SAlp Dener PetscReal nu3; /* used to compute trust-region radius */ 108eb910715SAlp Dener PetscReal nu4; /* used to compute trust-region radius */ 109eb910715SAlp Dener 110eb910715SAlp Dener PetscReal omega1; /* factor used for trust-region update */ 111eb910715SAlp Dener PetscReal omega2; /* factor used for trust-region update */ 112eb910715SAlp Dener PetscReal omega3; /* factor used for trust-region update */ 113eb910715SAlp Dener PetscReal omega4; /* factor used for trust-region update */ 114eb910715SAlp Dener PetscReal omega5; /* factor used for trust-region update */ 115eb910715SAlp Dener 116eb910715SAlp Dener /* Parameters when updating the trust-region radius based on reduction 117eb910715SAlp Dener 118eb910715SAlp Dener kappa = ared / pred 119eb910715SAlp Dener if kappa < eta1 (very bad step) 120eb910715SAlp Dener radius = alpha1 * min(norm(d), radius) 121eb910715SAlp Dener elif kappa < eta2 (bad step) 122eb910715SAlp Dener radius = alpha2 * min(norm(d), radius) 123eb910715SAlp Dener elif kappa < eta3 (okay step) 124eb910715SAlp Dener radius = alpha3 * radius; 125eb910715SAlp Dener elif kappa < eta4 (good step) 126eb910715SAlp Dener radius = max(alpha4 * norm(d), radius) 127eb910715SAlp Dener else (very good step) 128eb910715SAlp Dener radius = max(alpha5 * norm(d), radius) 129eb910715SAlp Dener fi 130eb910715SAlp Dener */ 131eb910715SAlp Dener PetscReal eta1; /* used to compute trust-region radius */ 132eb910715SAlp Dener PetscReal eta2; /* used to compute trust-region radius */ 133eb910715SAlp Dener PetscReal eta3; /* used to compute trust-region radius */ 134eb910715SAlp Dener PetscReal eta4; /* used to compute trust-region radius */ 135eb910715SAlp Dener 136eb910715SAlp Dener PetscReal alpha1; /* factor used for trust-region update */ 137eb910715SAlp Dener PetscReal alpha2; /* factor used for trust-region update */ 138eb910715SAlp Dener PetscReal alpha3; /* factor used for trust-region update */ 139eb910715SAlp Dener PetscReal alpha4; /* factor used for trust-region update */ 140eb910715SAlp Dener PetscReal alpha5; /* factor used for trust-region update */ 141eb910715SAlp Dener 142eb910715SAlp Dener /* Parameters when updating the trust-region radius based on interpolation 143eb910715SAlp Dener 144eb910715SAlp Dener kappa = ared / pred 145eb910715SAlp Dener if kappa >= 1.0 - mu1 (very good step) 146eb910715SAlp Dener choose tau in [gamma3, gamma4] 147eb910715SAlp Dener radius = max(tau * norm(d), radius) 148eb910715SAlp Dener elif kappa >= 1.0 - mu2 (good step) 149eb910715SAlp Dener choose tau in [gamma2, gamma3] 150eb910715SAlp Dener if (tau >= 1.0) 151eb910715SAlp Dener radius = max(tau * norm(d), radius) 152eb910715SAlp Dener else 153eb910715SAlp Dener radius = tau * min(norm(d), radius) 154eb910715SAlp Dener fi 155eb910715SAlp Dener else (bad step) 156eb910715SAlp Dener choose tau in [gamma1, 1.0] 157eb910715SAlp Dener radius = tau * min(norm(d), radius) 158eb910715SAlp Dener fi 159eb910715SAlp Dener */ 160eb910715SAlp Dener PetscReal mu1; /* used for model agreement in interpolation */ 161eb910715SAlp Dener PetscReal mu2; /* used for model agreement in interpolation */ 162eb910715SAlp Dener 163eb910715SAlp Dener PetscReal gamma1; /* factor used for interpolation */ 164eb910715SAlp Dener PetscReal gamma2; /* factor used for interpolation */ 165eb910715SAlp Dener PetscReal gamma3; /* factor used for interpolation */ 166eb910715SAlp Dener PetscReal gamma4; /* factor used for interpolation */ 167eb910715SAlp Dener 168eb910715SAlp Dener PetscReal theta; /* factor used for interpolation */ 169eb910715SAlp Dener 170eb910715SAlp Dener /* Parameters when initializing trust-region radius based on interpolation */ 171eb910715SAlp Dener PetscReal mu1_i; /* used for model agreement in interpolation */ 172eb910715SAlp Dener PetscReal mu2_i; /* used for model agreement in interpolation */ 173eb910715SAlp Dener 174eb910715SAlp Dener PetscReal gamma1_i; /* factor used for interpolation */ 175eb910715SAlp Dener PetscReal gamma2_i; /* factor used for interpolation */ 176eb910715SAlp Dener PetscReal gamma3_i; /* factor used for interpolation */ 177eb910715SAlp Dener PetscReal gamma4_i; /* factor used for interpolation */ 178eb910715SAlp Dener 179eb910715SAlp Dener PetscReal theta_i; /* factor used for interpolation */ 180eb910715SAlp Dener 181eb910715SAlp Dener /* Other parameters */ 182eb910715SAlp Dener PetscReal min_radius; /* lower bound on initial radius value */ 183eb910715SAlp Dener PetscReal max_radius; /* upper bound on trust region radius */ 184eb910715SAlp Dener PetscReal epsilon; /* tolerance used when computing ared/pred */ 18562675beeSAlp Dener PetscReal dmin, dmax; /* upper and lower bounds for the Hessian diagonal vector */ 186eb910715SAlp Dener 187eb910715SAlp Dener PetscInt newt; /* Newton directions attempted */ 188eb910715SAlp Dener PetscInt bfgs; /* BFGS directions attempted */ 189eb910715SAlp Dener PetscInt sgrad; /* Scaled gradient directions attempted */ 190eb910715SAlp Dener PetscInt grad; /* Gradient directions attempted */ 191eb910715SAlp Dener 19262675beeSAlp Dener PetscInt as_type; /* Active set estimation method */ 193eb910715SAlp Dener PetscInt bfgs_scale_type; /* Scaling matrix to used for the bfgs preconditioner */ 194eb910715SAlp Dener PetscInt init_type; /* Trust-region initialization method */ 195eb910715SAlp Dener PetscInt update_type; /* Trust-region update method */ 196eb910715SAlp Dener 1972f75a4aaSAlp Dener /* Trackers for KSP solution type and convergence reasons */ 198eb910715SAlp Dener PetscInt ksp_atol; 199eb910715SAlp Dener PetscInt ksp_rtol; 200eb910715SAlp Dener PetscInt ksp_ctol; 201eb910715SAlp Dener PetscInt ksp_negc; 202eb910715SAlp Dener PetscInt ksp_dtol; 203eb910715SAlp Dener PetscInt ksp_iter; 204eb910715SAlp Dener PetscInt ksp_othr; 205*f4db9bf7SStefano Zampini PetscBool resetksp; 206e0ed867bSAlp Dener 207e0ed867bSAlp Dener /* Implementation specific context */ 208e0ed867bSAlp Dener void* ctx; 209eb910715SAlp Dener } TAO_BNK; 210eb910715SAlp Dener 211eb910715SAlp Dener #define BNK_NEWTON 0 212eb910715SAlp Dener #define BNK_BFGS 1 213eb910715SAlp Dener #define BNK_SCALED_GRADIENT 2 214eb910715SAlp Dener #define BNK_GRADIENT 3 215eb910715SAlp Dener 216eb910715SAlp Dener #define BNK_INIT_CONSTANT 0 217eb910715SAlp Dener #define BNK_INIT_DIRECTION 1 218eb910715SAlp Dener #define BNK_INIT_INTERPOLATION 2 219eb910715SAlp Dener #define BNK_INIT_TYPES 3 220eb910715SAlp Dener 221eb910715SAlp Dener #define BNK_UPDATE_STEP 0 222eb910715SAlp Dener #define BNK_UPDATE_REDUCTION 1 223eb910715SAlp Dener #define BNK_UPDATE_INTERPOLATION 2 224eb910715SAlp Dener #define BNK_UPDATE_TYPES 3 225eb910715SAlp Dener 2262f75a4aaSAlp Dener #define BNK_AS_NONE 0 2272f75a4aaSAlp Dener #define BNK_AS_BERTSEKAS 1 2282f75a4aaSAlp Dener #define BNK_AS_TYPES 2 2292f75a4aaSAlp Dener 230eb910715SAlp Dener PETSC_INTERN PetscErrorCode TaoCreate_BNK(Tao); 2319b6ef848SAlp Dener PETSC_INTERN PetscErrorCode TaoSetUp_BNK(Tao); 232e0ed867bSAlp Dener PETSC_INTERN PetscErrorCode TaoSetFromOptions_BNK(PetscOptionItems*, Tao); 233e0ed867bSAlp Dener PETSC_INTERN PetscErrorCode TaoDestroy_BNK(Tao); 234e0ed867bSAlp Dener PETSC_INTERN PetscErrorCode TaoView_BNK(Tao, PetscViewer); 235e0ed867bSAlp Dener 236e0ed867bSAlp Dener PETSC_INTERN PetscErrorCode TaoSolve_BNLS(Tao); 237e0ed867bSAlp Dener PETSC_INTERN PetscErrorCode TaoSolve_BNTR(Tao); 238e0ed867bSAlp Dener PETSC_INTERN PetscErrorCode TaoSolve_BNTL(Tao); 239eb910715SAlp Dener 240cd929ea3SAlp Dener PETSC_INTERN PetscErrorCode TaoBNKPreconBFGS(PC, Vec, Vec); 241c0f10754SAlp Dener PETSC_INTERN PetscErrorCode TaoBNKInitialize(Tao, PetscInt, PetscBool*); 24208752603SAlp Dener PETSC_INTERN PetscErrorCode TaoBNKEstimateActiveSet(Tao, PetscInt); 24362675beeSAlp Dener PETSC_INTERN PetscErrorCode TaoBNKComputeHessian(Tao); 244a1318120SAlp Dener PETSC_INTERN PetscErrorCode TaoBNKBoundStep(Tao, PetscInt, Vec); 245c0f10754SAlp Dener PETSC_INTERN PetscErrorCode TaoBNKTakeCGSteps(Tao, PetscBool*); 2466b591159SAlp Dener PETSC_INTERN PetscErrorCode TaoBNKComputeStep(Tao, PetscBool, KSPConvergedReason*, PetscInt*); 2475e9b73cbSAlp Dener PETSC_INTERN PetscErrorCode TaoBNKRecomputePred(Tao, Vec, PetscReal*); 248e465cd6fSAlp Dener PETSC_INTERN PetscErrorCode TaoBNKSafeguardStep(Tao, KSPConvergedReason, PetscInt*); 249937a31a1SAlp Dener PETSC_INTERN PetscErrorCode TaoBNKPerformLineSearch(Tao, PetscInt*, PetscReal*, TaoLineSearchConvergedReason*); 25028017e9fSAlp Dener PETSC_INTERN PetscErrorCode TaoBNKUpdateTrustRadius(Tao, PetscReal, PetscReal, PetscInt, PetscInt, PetscBool*); 25162675beeSAlp Dener PETSC_INTERN PetscErrorCode TaoBNKAddStepCounts(Tao, PetscInt); 252b9ac7092SAlp Dener 253b9ac7092SAlp Dener #endif /* if !defined(__TAO_BNK_H) */ 254