1eb910715SAlp Dener /* 2eb910715SAlp Dener Context for bounded Newton-Krylov type optimization algorithms 3eb910715SAlp Dener */ 4eb910715SAlp Dener 5eb910715SAlp Dener #if !defined(__TAO_BNK_H) 6eb910715SAlp Dener #define __TAO_BNK_H 7eb910715SAlp Dener #include <petsc/private/taoimpl.h> 8eb910715SAlp Dener #include <../src/tao/matrix/lmvmmat.h> 9eb910715SAlp Dener 10eb910715SAlp Dener typedef struct { 1109164190SAlp Dener Mat H_inactive, Hpre_inactive, M; 122f75a4aaSAlp Dener Vec W, Xwork, Gwork, inactive_work, active_work; 13*62675beeSAlp Dener Vec Xold, Gold, Diag, Diag_min, Diag_max; 1409164190SAlp Dener Vec unprojected_gradient, unprojected_gradient_old; 152f75a4aaSAlp Dener IS inactive_idx, active_idx, active_lower, active_upper, active_fixed; 16eb910715SAlp Dener 17080d2917SAlp Dener /* Scalar values for the solution and step */ 18080d2917SAlp Dener PetscReal fold, f, gnorm, dnorm; 19eb910715SAlp Dener 202f75a4aaSAlp Dener /* Parameters for active set estimation */ 210a4511e9SAlp Dener PetscReal as_tol; 220a4511e9SAlp Dener PetscReal as_step; 232f75a4aaSAlp Dener 24eb910715SAlp Dener /* Parameters when updating the perturbation added to the Hessian matrix 25eb910715SAlp Dener according to the following scheme: 26eb910715SAlp Dener 27eb910715SAlp Dener pert = sval; 28eb910715SAlp Dener 29eb910715SAlp Dener do until convergence 30eb910715SAlp Dener shift Hessian by pert 31eb910715SAlp Dener solve Newton system 32eb910715SAlp Dener 33eb910715SAlp Dener if (linear solver failed or did not compute a descent direction) 34eb910715SAlp Dener use steepest descent direction and increase perturbation 35eb910715SAlp Dener 36eb910715SAlp Dener if (0 == pert) 37eb910715SAlp Dener initialize perturbation 38eb910715SAlp Dener pert = min(imax, max(imin, imfac * norm(G))) 39eb910715SAlp Dener else 40eb910715SAlp Dener increase perturbation 41eb910715SAlp Dener pert = min(pmax, max(pgfac * pert, pmgfac * norm(G))) 42eb910715SAlp Dener fi 43eb910715SAlp Dener else 44eb910715SAlp Dener use linear solver direction and decrease perturbation 45eb910715SAlp Dener 46eb910715SAlp Dener pert = min(psfac * pert, pmsfac * norm(G)) 47eb910715SAlp Dener if (pert < pmin) 48eb910715SAlp Dener pert = 0 49eb910715SAlp Dener fi 50eb910715SAlp Dener fi 51eb910715SAlp Dener 52eb910715SAlp Dener perform line search 53eb910715SAlp Dener function and gradient evaluation 54eb910715SAlp Dener check convergence 55eb910715SAlp Dener od 56eb910715SAlp Dener */ 57eb910715SAlp Dener PetscReal sval; /* Starting perturbation value, default zero */ 58eb910715SAlp Dener 59eb910715SAlp Dener PetscReal imin; /* Minimum perturbation added during initialization */ 60eb910715SAlp Dener PetscReal imax; /* Maximum perturbation added during initialization */ 61eb910715SAlp Dener PetscReal imfac; /* Merit function factor during initialization */ 62eb910715SAlp Dener 63eb910715SAlp Dener PetscReal pert; /* Current perturbation value */ 64eb910715SAlp Dener PetscReal pmin; /* Minimim perturbation value */ 65eb910715SAlp Dener PetscReal pmax; /* Maximum perturbation value */ 66eb910715SAlp Dener PetscReal pgfac; /* Perturbation growth factor */ 67eb910715SAlp Dener PetscReal psfac; /* Perturbation shrink factor */ 68eb910715SAlp Dener PetscReal pmgfac; /* Merit function growth factor */ 69eb910715SAlp Dener PetscReal pmsfac; /* Merit function shrink factor */ 70eb910715SAlp Dener 71eb910715SAlp Dener /* Parameters when updating the trust-region radius based on steplength 72eb910715SAlp Dener if step < nu1 (very bad step) 73eb910715SAlp Dener radius = omega1 * min(norm(d), radius) 74eb910715SAlp Dener elif step < nu2 (bad step) 75eb910715SAlp Dener radius = omega2 * min(norm(d), radius) 76eb910715SAlp Dener elif step < nu3 (okay step) 77eb910715SAlp Dener radius = omega3 * radius; 78eb910715SAlp Dener elif step < nu4 (good step) 79eb910715SAlp Dener radius = max(omega4 * norm(d), radius) 80eb910715SAlp Dener else (very good step) 81eb910715SAlp Dener radius = max(omega5 * norm(d), radius) 82eb910715SAlp Dener fi 83eb910715SAlp Dener */ 84eb910715SAlp Dener PetscReal nu1; /* used to compute trust-region radius */ 85eb910715SAlp Dener PetscReal nu2; /* used to compute trust-region radius */ 86eb910715SAlp Dener PetscReal nu3; /* used to compute trust-region radius */ 87eb910715SAlp Dener PetscReal nu4; /* used to compute trust-region radius */ 88eb910715SAlp Dener 89eb910715SAlp Dener PetscReal omega1; /* factor used for trust-region update */ 90eb910715SAlp Dener PetscReal omega2; /* factor used for trust-region update */ 91eb910715SAlp Dener PetscReal omega3; /* factor used for trust-region update */ 92eb910715SAlp Dener PetscReal omega4; /* factor used for trust-region update */ 93eb910715SAlp Dener PetscReal omega5; /* factor used for trust-region update */ 94eb910715SAlp Dener 95eb910715SAlp Dener /* Parameters when updating the trust-region radius based on reduction 96eb910715SAlp Dener 97eb910715SAlp Dener kappa = ared / pred 98eb910715SAlp Dener if kappa < eta1 (very bad step) 99eb910715SAlp Dener radius = alpha1 * min(norm(d), radius) 100eb910715SAlp Dener elif kappa < eta2 (bad step) 101eb910715SAlp Dener radius = alpha2 * min(norm(d), radius) 102eb910715SAlp Dener elif kappa < eta3 (okay step) 103eb910715SAlp Dener radius = alpha3 * radius; 104eb910715SAlp Dener elif kappa < eta4 (good step) 105eb910715SAlp Dener radius = max(alpha4 * norm(d), radius) 106eb910715SAlp Dener else (very good step) 107eb910715SAlp Dener radius = max(alpha5 * norm(d), radius) 108eb910715SAlp Dener fi 109eb910715SAlp Dener */ 110eb910715SAlp Dener PetscReal eta1; /* used to compute trust-region radius */ 111eb910715SAlp Dener PetscReal eta2; /* used to compute trust-region radius */ 112eb910715SAlp Dener PetscReal eta3; /* used to compute trust-region radius */ 113eb910715SAlp Dener PetscReal eta4; /* used to compute trust-region radius */ 114eb910715SAlp Dener 115eb910715SAlp Dener PetscReal alpha1; /* factor used for trust-region update */ 116eb910715SAlp Dener PetscReal alpha2; /* factor used for trust-region update */ 117eb910715SAlp Dener PetscReal alpha3; /* factor used for trust-region update */ 118eb910715SAlp Dener PetscReal alpha4; /* factor used for trust-region update */ 119eb910715SAlp Dener PetscReal alpha5; /* factor used for trust-region update */ 120eb910715SAlp Dener 121eb910715SAlp Dener /* Parameters when updating the trust-region radius based on interpolation 122eb910715SAlp Dener 123eb910715SAlp Dener kappa = ared / pred 124eb910715SAlp Dener if kappa >= 1.0 - mu1 (very good step) 125eb910715SAlp Dener choose tau in [gamma3, gamma4] 126eb910715SAlp Dener radius = max(tau * norm(d), radius) 127eb910715SAlp Dener elif kappa >= 1.0 - mu2 (good step) 128eb910715SAlp Dener choose tau in [gamma2, gamma3] 129eb910715SAlp Dener if (tau >= 1.0) 130eb910715SAlp Dener radius = max(tau * norm(d), radius) 131eb910715SAlp Dener else 132eb910715SAlp Dener radius = tau * min(norm(d), radius) 133eb910715SAlp Dener fi 134eb910715SAlp Dener else (bad step) 135eb910715SAlp Dener choose tau in [gamma1, 1.0] 136eb910715SAlp Dener radius = tau * min(norm(d), radius) 137eb910715SAlp Dener fi 138eb910715SAlp Dener */ 139eb910715SAlp Dener PetscReal mu1; /* used for model agreement in interpolation */ 140eb910715SAlp Dener PetscReal mu2; /* used for model agreement in interpolation */ 141eb910715SAlp Dener 142eb910715SAlp Dener PetscReal gamma1; /* factor used for interpolation */ 143eb910715SAlp Dener PetscReal gamma2; /* factor used for interpolation */ 144eb910715SAlp Dener PetscReal gamma3; /* factor used for interpolation */ 145eb910715SAlp Dener PetscReal gamma4; /* factor used for interpolation */ 146eb910715SAlp Dener 147eb910715SAlp Dener PetscReal theta; /* factor used for interpolation */ 148eb910715SAlp Dener 149eb910715SAlp Dener /* Parameters when initializing trust-region radius based on interpolation */ 150eb910715SAlp Dener PetscReal mu1_i; /* used for model agreement in interpolation */ 151eb910715SAlp Dener PetscReal mu2_i; /* used for model agreement in interpolation */ 152eb910715SAlp Dener 153eb910715SAlp Dener PetscReal gamma1_i; /* factor used for interpolation */ 154eb910715SAlp Dener PetscReal gamma2_i; /* factor used for interpolation */ 155eb910715SAlp Dener PetscReal gamma3_i; /* factor used for interpolation */ 156eb910715SAlp Dener PetscReal gamma4_i; /* factor used for interpolation */ 157eb910715SAlp Dener 158eb910715SAlp Dener PetscReal theta_i; /* factor used for interpolation */ 159eb910715SAlp Dener 160eb910715SAlp Dener /* Other parameters */ 161eb910715SAlp Dener PetscReal min_radius; /* lower bound on initial radius value */ 162eb910715SAlp Dener PetscReal max_radius; /* upper bound on trust region radius */ 163eb910715SAlp Dener PetscReal epsilon; /* tolerance used when computing ared/pred */ 164*62675beeSAlp Dener PetscReal dmin, dmax; /* upper and lower bounds for the Hessian diagonal vector */ 165eb910715SAlp Dener 166eb910715SAlp Dener PetscInt newt; /* Newton directions attempted */ 167eb910715SAlp Dener PetscInt bfgs; /* BFGS directions attempted */ 168eb910715SAlp Dener PetscInt sgrad; /* Scaled gradient directions attempted */ 169eb910715SAlp Dener PetscInt grad; /* Gradient directions attempted */ 170eb910715SAlp Dener 171*62675beeSAlp Dener PetscInt as_type; /* Active set estimation method */ 172eb910715SAlp Dener PetscInt pc_type; /* Preconditioner for the code */ 173eb910715SAlp Dener PetscInt bfgs_scale_type; /* Scaling matrix to used for the bfgs preconditioner */ 174eb910715SAlp Dener PetscInt init_type; /* Trust-region initialization method */ 175eb910715SAlp Dener PetscInt update_type; /* Trust-region update method */ 176eb910715SAlp Dener 1772f75a4aaSAlp Dener /* Trackers for KSP solution type and convergence reasons */ 178eb910715SAlp Dener PetscInt ksp_atol; 179eb910715SAlp Dener PetscInt ksp_rtol; 180eb910715SAlp Dener PetscInt ksp_ctol; 181eb910715SAlp Dener PetscInt ksp_negc; 182eb910715SAlp Dener PetscInt ksp_dtol; 183eb910715SAlp Dener PetscInt ksp_iter; 184eb910715SAlp Dener PetscInt ksp_othr; 185eb910715SAlp Dener PetscBool is_nash, is_stcg, is_gltr; 186eb910715SAlp Dener } TAO_BNK; 187eb910715SAlp Dener 188eb910715SAlp Dener #endif /* if !defined(__TAO_BNK_H) */ 189eb910715SAlp Dener 190eb910715SAlp Dener #define BNK_NEWTON 0 191eb910715SAlp Dener #define BNK_BFGS 1 192eb910715SAlp Dener #define BNK_SCALED_GRADIENT 2 193eb910715SAlp Dener #define BNK_GRADIENT 3 194eb910715SAlp Dener 195eb910715SAlp Dener #define BNK_PC_NONE 0 196eb910715SAlp Dener #define BNK_PC_AHESS 1 197eb910715SAlp Dener #define BNK_PC_BFGS 2 198eb910715SAlp Dener #define BNK_PC_PETSC 3 199eb910715SAlp Dener #define BNK_PC_TYPES 4 200eb910715SAlp Dener 201eb910715SAlp Dener #define BFGS_SCALE_AHESS 0 202eb910715SAlp Dener #define BFGS_SCALE_PHESS 1 203eb910715SAlp Dener #define BFGS_SCALE_BFGS 2 204eb910715SAlp Dener #define BFGS_SCALE_TYPES 3 205eb910715SAlp Dener 206eb910715SAlp Dener #define BNK_INIT_CONSTANT 0 207eb910715SAlp Dener #define BNK_INIT_DIRECTION 1 208eb910715SAlp Dener #define BNK_INIT_INTERPOLATION 2 209eb910715SAlp Dener #define BNK_INIT_TYPES 3 210eb910715SAlp Dener 211eb910715SAlp Dener #define BNK_UPDATE_STEP 0 212eb910715SAlp Dener #define BNK_UPDATE_REDUCTION 1 213eb910715SAlp Dener #define BNK_UPDATE_INTERPOLATION 2 214eb910715SAlp Dener #define BNK_UPDATE_TYPES 3 215eb910715SAlp Dener 2162f75a4aaSAlp Dener #define BNK_AS_NONE 0 2172f75a4aaSAlp Dener #define BNK_AS_BERTSEKAS 1 2182f75a4aaSAlp Dener #define BNK_AS_TYPES 2 2192f75a4aaSAlp Dener 220eb910715SAlp Dener static const char *BNK_PC[64] = {"none", "ahess", "bfgs", "petsc"}; 221eb910715SAlp Dener 222eb910715SAlp Dener static const char *BFGS_SCALE[64] = {"ahess", "phess", "bfgs"}; 223eb910715SAlp Dener 224eb910715SAlp Dener static const char *BNK_INIT[64] = {"constant", "direction", "interpolation"}; 225eb910715SAlp Dener 226eb910715SAlp Dener static const char *BNK_UPDATE[64] = {"step", "reduction", "interpolation"}; 227eb910715SAlp Dener 2282f75a4aaSAlp Dener static const char *BNK_AS[64] = {"none", "bertsekas"}; 2292f75a4aaSAlp Dener 230eb910715SAlp Dener PETSC_INTERN PetscErrorCode TaoCreate_BNK(Tao); 231eb910715SAlp Dener 232eb910715SAlp Dener PETSC_INTERN PetscErrorCode MatLMVMSolveShell(PC, Vec, Vec); 233*62675beeSAlp Dener PETSC_INTERN PetscErrorCode TaoBNKInitialize(Tao, PetscInt); 2342f75a4aaSAlp Dener PETSC_INTERN PetscErrorCode TaoBNKEstimateActiveSet(Tao); 235*62675beeSAlp Dener PETSC_INTERN PetscErrorCode TaoBNKComputeHessian(Tao); 2362f75a4aaSAlp Dener PETSC_INTERN PetscErrorCode TaoBNKBoundStep(Tao, Vec); 237*62675beeSAlp Dener PETSC_INTERN PetscErrorCode TaoBNKComputeStep(Tao, PetscBool, KSPConvergedReason*); 238e465cd6fSAlp Dener PETSC_INTERN PetscErrorCode TaoBNKSafeguardStep(Tao, KSPConvergedReason, PetscInt*); 239c14b763aSAlp Dener PETSC_INTERN PetscErrorCode TaoBNKPerformLineSearch(Tao, PetscInt, PetscReal*, TaoLineSearchConvergedReason*); 24028017e9fSAlp Dener PETSC_INTERN PetscErrorCode TaoBNKUpdateTrustRadius(Tao, PetscReal, PetscReal, PetscInt, PetscInt, PetscBool*); 241*62675beeSAlp Dener PETSC_INTERN PetscErrorCode TaoBNKAddStepCounts(Tao, PetscInt); 242