1eb910715SAlp Dener /* 2eb910715SAlp Dener Context for bounded Newton-Krylov type optimization algorithms 3eb910715SAlp Dener */ 4eb910715SAlp Dener 5eb910715SAlp Dener #if !defined(__TAO_BNK_H) 6eb910715SAlp Dener #define __TAO_BNK_H 7eb910715SAlp Dener #include <petsc/private/taoimpl.h> 8eb910715SAlp Dener #include <../src/tao/matrix/lmvmmat.h> 9eb910715SAlp Dener 10eb910715SAlp Dener typedef struct { 1109164190SAlp Dener Mat H_inactive, Hpre_inactive, M; 122f75a4aaSAlp Dener Vec W, Xwork, Gwork, inactive_work, active_work; 13*5e9b73cbSAlp Dener Vec Xold, Gold, Diag, Diag_red, Diag_min, Diag_max; 14*5e9b73cbSAlp Dener Vec X_inactive, G_inactive; 1509164190SAlp Dener Vec unprojected_gradient, unprojected_gradient_old; 162f75a4aaSAlp Dener IS inactive_idx, active_idx, active_lower, active_upper, active_fixed; 17eb910715SAlp Dener 18080d2917SAlp Dener /* Scalar values for the solution and step */ 19080d2917SAlp Dener PetscReal fold, f, gnorm, dnorm; 20eb910715SAlp Dener 212f75a4aaSAlp Dener /* Parameters for active set estimation */ 220a4511e9SAlp Dener PetscReal as_tol; 230a4511e9SAlp Dener PetscReal as_step; 242f75a4aaSAlp Dener 25eb910715SAlp Dener /* Parameters when updating the perturbation added to the Hessian matrix 26eb910715SAlp Dener according to the following scheme: 27eb910715SAlp Dener 28eb910715SAlp Dener pert = sval; 29eb910715SAlp Dener 30eb910715SAlp Dener do until convergence 31eb910715SAlp Dener shift Hessian by pert 32eb910715SAlp Dener solve Newton system 33eb910715SAlp Dener 34eb910715SAlp Dener if (linear solver failed or did not compute a descent direction) 35eb910715SAlp Dener use steepest descent direction and increase perturbation 36eb910715SAlp Dener 37eb910715SAlp Dener if (0 == pert) 38eb910715SAlp Dener initialize perturbation 39eb910715SAlp Dener pert = min(imax, max(imin, imfac * norm(G))) 40eb910715SAlp Dener else 41eb910715SAlp Dener increase perturbation 42eb910715SAlp Dener pert = min(pmax, max(pgfac * pert, pmgfac * norm(G))) 43eb910715SAlp Dener fi 44eb910715SAlp Dener else 45eb910715SAlp Dener use linear solver direction and decrease perturbation 46eb910715SAlp Dener 47eb910715SAlp Dener pert = min(psfac * pert, pmsfac * norm(G)) 48eb910715SAlp Dener if (pert < pmin) 49eb910715SAlp Dener pert = 0 50eb910715SAlp Dener fi 51eb910715SAlp Dener fi 52eb910715SAlp Dener 53eb910715SAlp Dener perform line search 54eb910715SAlp Dener function and gradient evaluation 55eb910715SAlp Dener check convergence 56eb910715SAlp Dener od 57eb910715SAlp Dener */ 58eb910715SAlp Dener PetscReal sval; /* Starting perturbation value, default zero */ 59eb910715SAlp Dener 60eb910715SAlp Dener PetscReal imin; /* Minimum perturbation added during initialization */ 61eb910715SAlp Dener PetscReal imax; /* Maximum perturbation added during initialization */ 62eb910715SAlp Dener PetscReal imfac; /* Merit function factor during initialization */ 63eb910715SAlp Dener 64eb910715SAlp Dener PetscReal pert; /* Current perturbation value */ 65eb910715SAlp Dener PetscReal pmin; /* Minimim perturbation value */ 66eb910715SAlp Dener PetscReal pmax; /* Maximum perturbation value */ 67eb910715SAlp Dener PetscReal pgfac; /* Perturbation growth factor */ 68eb910715SAlp Dener PetscReal psfac; /* Perturbation shrink factor */ 69eb910715SAlp Dener PetscReal pmgfac; /* Merit function growth factor */ 70eb910715SAlp Dener PetscReal pmsfac; /* Merit function shrink factor */ 71eb910715SAlp Dener 72eb910715SAlp Dener /* Parameters when updating the trust-region radius based on steplength 73eb910715SAlp Dener if step < nu1 (very bad step) 74eb910715SAlp Dener radius = omega1 * min(norm(d), radius) 75eb910715SAlp Dener elif step < nu2 (bad step) 76eb910715SAlp Dener radius = omega2 * min(norm(d), radius) 77eb910715SAlp Dener elif step < nu3 (okay step) 78eb910715SAlp Dener radius = omega3 * radius; 79eb910715SAlp Dener elif step < nu4 (good step) 80eb910715SAlp Dener radius = max(omega4 * norm(d), radius) 81eb910715SAlp Dener else (very good step) 82eb910715SAlp Dener radius = max(omega5 * norm(d), radius) 83eb910715SAlp Dener fi 84eb910715SAlp Dener */ 85eb910715SAlp Dener PetscReal nu1; /* used to compute trust-region radius */ 86eb910715SAlp Dener PetscReal nu2; /* used to compute trust-region radius */ 87eb910715SAlp Dener PetscReal nu3; /* used to compute trust-region radius */ 88eb910715SAlp Dener PetscReal nu4; /* used to compute trust-region radius */ 89eb910715SAlp Dener 90eb910715SAlp Dener PetscReal omega1; /* factor used for trust-region update */ 91eb910715SAlp Dener PetscReal omega2; /* factor used for trust-region update */ 92eb910715SAlp Dener PetscReal omega3; /* factor used for trust-region update */ 93eb910715SAlp Dener PetscReal omega4; /* factor used for trust-region update */ 94eb910715SAlp Dener PetscReal omega5; /* factor used for trust-region update */ 95eb910715SAlp Dener 96eb910715SAlp Dener /* Parameters when updating the trust-region radius based on reduction 97eb910715SAlp Dener 98eb910715SAlp Dener kappa = ared / pred 99eb910715SAlp Dener if kappa < eta1 (very bad step) 100eb910715SAlp Dener radius = alpha1 * min(norm(d), radius) 101eb910715SAlp Dener elif kappa < eta2 (bad step) 102eb910715SAlp Dener radius = alpha2 * min(norm(d), radius) 103eb910715SAlp Dener elif kappa < eta3 (okay step) 104eb910715SAlp Dener radius = alpha3 * radius; 105eb910715SAlp Dener elif kappa < eta4 (good step) 106eb910715SAlp Dener radius = max(alpha4 * norm(d), radius) 107eb910715SAlp Dener else (very good step) 108eb910715SAlp Dener radius = max(alpha5 * norm(d), radius) 109eb910715SAlp Dener fi 110eb910715SAlp Dener */ 111eb910715SAlp Dener PetscReal eta1; /* used to compute trust-region radius */ 112eb910715SAlp Dener PetscReal eta2; /* used to compute trust-region radius */ 113eb910715SAlp Dener PetscReal eta3; /* used to compute trust-region radius */ 114eb910715SAlp Dener PetscReal eta4; /* used to compute trust-region radius */ 115eb910715SAlp Dener 116eb910715SAlp Dener PetscReal alpha1; /* factor used for trust-region update */ 117eb910715SAlp Dener PetscReal alpha2; /* factor used for trust-region update */ 118eb910715SAlp Dener PetscReal alpha3; /* factor used for trust-region update */ 119eb910715SAlp Dener PetscReal alpha4; /* factor used for trust-region update */ 120eb910715SAlp Dener PetscReal alpha5; /* factor used for trust-region update */ 121eb910715SAlp Dener 122eb910715SAlp Dener /* Parameters when updating the trust-region radius based on interpolation 123eb910715SAlp Dener 124eb910715SAlp Dener kappa = ared / pred 125eb910715SAlp Dener if kappa >= 1.0 - mu1 (very good step) 126eb910715SAlp Dener choose tau in [gamma3, gamma4] 127eb910715SAlp Dener radius = max(tau * norm(d), radius) 128eb910715SAlp Dener elif kappa >= 1.0 - mu2 (good step) 129eb910715SAlp Dener choose tau in [gamma2, gamma3] 130eb910715SAlp Dener if (tau >= 1.0) 131eb910715SAlp Dener radius = max(tau * norm(d), radius) 132eb910715SAlp Dener else 133eb910715SAlp Dener radius = tau * min(norm(d), radius) 134eb910715SAlp Dener fi 135eb910715SAlp Dener else (bad step) 136eb910715SAlp Dener choose tau in [gamma1, 1.0] 137eb910715SAlp Dener radius = tau * min(norm(d), radius) 138eb910715SAlp Dener fi 139eb910715SAlp Dener */ 140eb910715SAlp Dener PetscReal mu1; /* used for model agreement in interpolation */ 141eb910715SAlp Dener PetscReal mu2; /* used for model agreement in interpolation */ 142eb910715SAlp Dener 143eb910715SAlp Dener PetscReal gamma1; /* factor used for interpolation */ 144eb910715SAlp Dener PetscReal gamma2; /* factor used for interpolation */ 145eb910715SAlp Dener PetscReal gamma3; /* factor used for interpolation */ 146eb910715SAlp Dener PetscReal gamma4; /* factor used for interpolation */ 147eb910715SAlp Dener 148eb910715SAlp Dener PetscReal theta; /* factor used for interpolation */ 149eb910715SAlp Dener 150eb910715SAlp Dener /* Parameters when initializing trust-region radius based on interpolation */ 151eb910715SAlp Dener PetscReal mu1_i; /* used for model agreement in interpolation */ 152eb910715SAlp Dener PetscReal mu2_i; /* used for model agreement in interpolation */ 153eb910715SAlp Dener 154eb910715SAlp Dener PetscReal gamma1_i; /* factor used for interpolation */ 155eb910715SAlp Dener PetscReal gamma2_i; /* factor used for interpolation */ 156eb910715SAlp Dener PetscReal gamma3_i; /* factor used for interpolation */ 157eb910715SAlp Dener PetscReal gamma4_i; /* factor used for interpolation */ 158eb910715SAlp Dener 159eb910715SAlp Dener PetscReal theta_i; /* factor used for interpolation */ 160eb910715SAlp Dener 161eb910715SAlp Dener /* Other parameters */ 162eb910715SAlp Dener PetscReal min_radius; /* lower bound on initial radius value */ 163eb910715SAlp Dener PetscReal max_radius; /* upper bound on trust region radius */ 164eb910715SAlp Dener PetscReal epsilon; /* tolerance used when computing ared/pred */ 16562675beeSAlp Dener PetscReal dmin, dmax; /* upper and lower bounds for the Hessian diagonal vector */ 166eb910715SAlp Dener 167eb910715SAlp Dener PetscInt newt; /* Newton directions attempted */ 168eb910715SAlp Dener PetscInt bfgs; /* BFGS directions attempted */ 169eb910715SAlp Dener PetscInt sgrad; /* Scaled gradient directions attempted */ 170eb910715SAlp Dener PetscInt grad; /* Gradient directions attempted */ 171eb910715SAlp Dener 17262675beeSAlp Dener PetscInt as_type; /* Active set estimation method */ 173eb910715SAlp Dener PetscInt pc_type; /* Preconditioner for the code */ 174eb910715SAlp Dener PetscInt bfgs_scale_type; /* Scaling matrix to used for the bfgs preconditioner */ 175eb910715SAlp Dener PetscInt init_type; /* Trust-region initialization method */ 176eb910715SAlp Dener PetscInt update_type; /* Trust-region update method */ 177eb910715SAlp Dener 1782f75a4aaSAlp Dener /* Trackers for KSP solution type and convergence reasons */ 179eb910715SAlp Dener PetscInt ksp_atol; 180eb910715SAlp Dener PetscInt ksp_rtol; 181eb910715SAlp Dener PetscInt ksp_ctol; 182eb910715SAlp Dener PetscInt ksp_negc; 183eb910715SAlp Dener PetscInt ksp_dtol; 184eb910715SAlp Dener PetscInt ksp_iter; 185eb910715SAlp Dener PetscInt ksp_othr; 186eb910715SAlp Dener PetscBool is_nash, is_stcg, is_gltr; 187eb910715SAlp Dener } TAO_BNK; 188eb910715SAlp Dener 189eb910715SAlp Dener #endif /* if !defined(__TAO_BNK_H) */ 190eb910715SAlp Dener 191eb910715SAlp Dener #define BNK_NEWTON 0 192eb910715SAlp Dener #define BNK_BFGS 1 193eb910715SAlp Dener #define BNK_SCALED_GRADIENT 2 194eb910715SAlp Dener #define BNK_GRADIENT 3 195eb910715SAlp Dener 196eb910715SAlp Dener #define BNK_PC_NONE 0 197eb910715SAlp Dener #define BNK_PC_AHESS 1 198eb910715SAlp Dener #define BNK_PC_BFGS 2 199eb910715SAlp Dener #define BNK_PC_PETSC 3 200eb910715SAlp Dener #define BNK_PC_TYPES 4 201eb910715SAlp Dener 202eb910715SAlp Dener #define BFGS_SCALE_AHESS 0 203eb910715SAlp Dener #define BFGS_SCALE_PHESS 1 204eb910715SAlp Dener #define BFGS_SCALE_BFGS 2 205eb910715SAlp Dener #define BFGS_SCALE_TYPES 3 206eb910715SAlp Dener 207eb910715SAlp Dener #define BNK_INIT_CONSTANT 0 208eb910715SAlp Dener #define BNK_INIT_DIRECTION 1 209eb910715SAlp Dener #define BNK_INIT_INTERPOLATION 2 210eb910715SAlp Dener #define BNK_INIT_TYPES 3 211eb910715SAlp Dener 212eb910715SAlp Dener #define BNK_UPDATE_STEP 0 213eb910715SAlp Dener #define BNK_UPDATE_REDUCTION 1 214eb910715SAlp Dener #define BNK_UPDATE_INTERPOLATION 2 215eb910715SAlp Dener #define BNK_UPDATE_TYPES 3 216eb910715SAlp Dener 2172f75a4aaSAlp Dener #define BNK_AS_NONE 0 2182f75a4aaSAlp Dener #define BNK_AS_BERTSEKAS 1 2192f75a4aaSAlp Dener #define BNK_AS_TYPES 2 2202f75a4aaSAlp Dener 221eb910715SAlp Dener static const char *BNK_PC[64] = {"none", "ahess", "bfgs", "petsc"}; 222eb910715SAlp Dener 223eb910715SAlp Dener static const char *BFGS_SCALE[64] = {"ahess", "phess", "bfgs"}; 224eb910715SAlp Dener 225eb910715SAlp Dener static const char *BNK_INIT[64] = {"constant", "direction", "interpolation"}; 226eb910715SAlp Dener 227eb910715SAlp Dener static const char *BNK_UPDATE[64] = {"step", "reduction", "interpolation"}; 228eb910715SAlp Dener 2292f75a4aaSAlp Dener static const char *BNK_AS[64] = {"none", "bertsekas"}; 2302f75a4aaSAlp Dener 231eb910715SAlp Dener PETSC_INTERN PetscErrorCode TaoCreate_BNK(Tao); 2329b6ef848SAlp Dener PETSC_INTERN PetscErrorCode TaoSetUp_BNK(Tao); 233eb910715SAlp Dener 234eb910715SAlp Dener PETSC_INTERN PetscErrorCode MatLMVMSolveShell(PC, Vec, Vec); 23562675beeSAlp Dener PETSC_INTERN PetscErrorCode TaoBNKInitialize(Tao, PetscInt); 2362f75a4aaSAlp Dener PETSC_INTERN PetscErrorCode TaoBNKEstimateActiveSet(Tao); 23762675beeSAlp Dener PETSC_INTERN PetscErrorCode TaoBNKComputeHessian(Tao); 2382f75a4aaSAlp Dener PETSC_INTERN PetscErrorCode TaoBNKBoundStep(Tao, Vec); 23962675beeSAlp Dener PETSC_INTERN PetscErrorCode TaoBNKComputeStep(Tao, PetscBool, KSPConvergedReason*); 240*5e9b73cbSAlp Dener PETSC_INTERN PetscErrorCode TaoBNKRecomputePred(Tao, Vec, PetscReal*); 241e465cd6fSAlp Dener PETSC_INTERN PetscErrorCode TaoBNKSafeguardStep(Tao, KSPConvergedReason, PetscInt*); 242c14b763aSAlp Dener PETSC_INTERN PetscErrorCode TaoBNKPerformLineSearch(Tao, PetscInt, PetscReal*, TaoLineSearchConvergedReason*); 24328017e9fSAlp Dener PETSC_INTERN PetscErrorCode TaoBNKUpdateTrustRadius(Tao, PetscReal, PetscReal, PetscInt, PetscInt, PetscBool*); 24462675beeSAlp Dener PETSC_INTERN PetscErrorCode TaoBNKAddStepCounts(Tao, PetscInt); 245