xref: /petsc/src/tao/bound/impls/bnk/bnk.h (revision f4db9bf761fa2b8a53a11d1c2fa5aeb4622be051)
/*
Context for bounded Newton-Krylov type optimization algorithms
*/
4eb910715SAlp Dener 
5eb910715SAlp Dener #if !defined(__TAO_BNK_H)
6eb910715SAlp Dener #define __TAO_BNK_H
7eb910715SAlp Dener #include <petsc/private/taoimpl.h>
8c0f10754SAlp Dener #include <../src/tao/bound/impls/bncg/bncg.h>
9eb910715SAlp Dener 
10eb910715SAlp Dener typedef struct {
11e0ed867bSAlp Dener   /* Function pointer for hessian evaluation
12e0ed867bSAlp Dener      NOTE: This is necessary so that quasi-Newton-Krylov methods can "evaluate"
13e0ed867bSAlp Dener      a quasi-Newton approximation while full Newton-Krylov methods call-back to
14e0ed867bSAlp Dener      the application's Hessian */
15e0ed867bSAlp Dener   PetscErrorCode (*computehessian)(Tao);
166b591159SAlp Dener   PetscErrorCode (*computestep)(Tao, PetscBool, KSPConvergedReason*, PetscInt*);
17e0ed867bSAlp Dener 
18c0f10754SAlp Dener   /* Embedded TAOBNCG */
19c0f10754SAlp Dener   Tao bncg;
20c0f10754SAlp Dener   TAO_BNCG *bncg_ctx;
21e031d6f5SAlp Dener   PetscInt max_cg_its, tot_cg_its;
22c0f10754SAlp Dener   Vec bncg_sol;
23c0f10754SAlp Dener 
24c0f10754SAlp Dener   /* Allocated vectors */
25c0f10754SAlp Dener   Vec W, Xwork, Gwork, Xold, Gold;
2609164190SAlp Dener   Vec unprojected_gradient, unprojected_gradient_old;
27c0f10754SAlp Dener 
28c0f10754SAlp Dener   /* Unallocated matrices and vectors */
29b9ac7092SAlp Dener   Mat H_inactive, Hpre_inactive;
30b9ac7092SAlp Dener   Vec X_inactive, G_inactive, inactive_work, active_work;
312f75a4aaSAlp Dener   IS  inactive_idx, active_idx, active_lower, active_upper, active_fixed;
32eb910715SAlp Dener 
33080d2917SAlp Dener   /* Scalar values for the solution and step */
34080d2917SAlp Dener   PetscReal fold, f, gnorm, dnorm;
35eb910715SAlp Dener 
362f75a4aaSAlp Dener   /* Parameters for active set estimation */
370a4511e9SAlp Dener   PetscReal as_tol;
380a4511e9SAlp Dener   PetscReal as_step;
392f75a4aaSAlp Dener 
40b9ac7092SAlp Dener   /* BFGS preconditioner data */
41b9ac7092SAlp Dener   PC bfgs_pre;
42b9ac7092SAlp Dener   Mat M;
43b9ac7092SAlp Dener   Vec Diag_min, Diag_max;
44b9ac7092SAlp Dener 
45eb910715SAlp Dener   /* Parameters when updating the perturbation added to the Hessian matrix
46eb910715SAlp Dener      according to the following scheme:
47eb910715SAlp Dener 
48eb910715SAlp Dener      pert = sval;
49eb910715SAlp Dener 
50eb910715SAlp Dener      do until convergence
51eb910715SAlp Dener        shift Hessian by pert
52eb910715SAlp Dener        solve Newton system
53eb910715SAlp Dener 
54eb910715SAlp Dener        if (linear solver failed or did not compute a descent direction)
55eb910715SAlp Dener          use steepest descent direction and increase perturbation
56eb910715SAlp Dener 
57eb910715SAlp Dener          if (0 == pert)
58eb910715SAlp Dener            initialize perturbation
59eb910715SAlp Dener            pert = min(imax, max(imin, imfac * norm(G)))
60eb910715SAlp Dener          else
61eb910715SAlp Dener            increase perturbation
62eb910715SAlp Dener            pert = min(pmax, max(pgfac * pert, pmgfac * norm(G)))
63eb910715SAlp Dener          fi
64eb910715SAlp Dener        else
65eb910715SAlp Dener          use linear solver direction and decrease perturbation
66eb910715SAlp Dener 
67eb910715SAlp Dener          pert = min(psfac * pert, pmsfac * norm(G))
68eb910715SAlp Dener          if (pert < pmin)
69eb910715SAlp Dener            pert = 0
70eb910715SAlp Dener          fi
71eb910715SAlp Dener        fi
72eb910715SAlp Dener 
73eb910715SAlp Dener        perform line search
74eb910715SAlp Dener        function and gradient evaluation
75eb910715SAlp Dener        check convergence
76eb910715SAlp Dener      od
77eb910715SAlp Dener   */
78eb910715SAlp Dener   PetscReal sval;               /*  Starting perturbation value, default zero */
79eb910715SAlp Dener 
80eb910715SAlp Dener   PetscReal imin;               /*  Minimum perturbation added during initialization  */
81eb910715SAlp Dener   PetscReal imax;               /*  Maximum perturbation added during initialization */
82eb910715SAlp Dener   PetscReal imfac;              /*  Merit function factor during initialization */
83eb910715SAlp Dener 
84eb910715SAlp Dener   PetscReal pert;               /*  Current perturbation value */
85eb910715SAlp Dener   PetscReal pmin;               /*  Minimim perturbation value */
86eb910715SAlp Dener   PetscReal pmax;               /*  Maximum perturbation value */
87eb910715SAlp Dener   PetscReal pgfac;              /*  Perturbation growth factor */
88eb910715SAlp Dener   PetscReal psfac;              /*  Perturbation shrink factor */
89eb910715SAlp Dener   PetscReal pmgfac;             /*  Merit function growth factor */
90eb910715SAlp Dener   PetscReal pmsfac;             /*  Merit function shrink factor */
91eb910715SAlp Dener 
92eb910715SAlp Dener   /* Parameters when updating the trust-region radius based on steplength
93eb910715SAlp Dener      if   step < nu1            (very bad step)
94eb910715SAlp Dener        radius = omega1 * min(norm(d), radius)
95eb910715SAlp Dener      elif step < nu2            (bad step)
96eb910715SAlp Dener        radius = omega2 * min(norm(d), radius)
97eb910715SAlp Dener      elif step < nu3            (okay step)
98eb910715SAlp Dener        radius = omega3 * radius;
99eb910715SAlp Dener      elif step < nu4            (good step)
100eb910715SAlp Dener        radius = max(omega4 * norm(d), radius)
101eb910715SAlp Dener      else                       (very good step)
102eb910715SAlp Dener        radius = max(omega5 * norm(d), radius)
103eb910715SAlp Dener      fi
104eb910715SAlp Dener   */
105eb910715SAlp Dener   PetscReal nu1;                /*  used to compute trust-region radius */
106eb910715SAlp Dener   PetscReal nu2;                /*  used to compute trust-region radius */
107eb910715SAlp Dener   PetscReal nu3;                /*  used to compute trust-region radius */
108eb910715SAlp Dener   PetscReal nu4;                /*  used to compute trust-region radius */
109eb910715SAlp Dener 
110eb910715SAlp Dener   PetscReal omega1;             /*  factor used for trust-region update */
111eb910715SAlp Dener   PetscReal omega2;             /*  factor used for trust-region update */
112eb910715SAlp Dener   PetscReal omega3;             /*  factor used for trust-region update */
113eb910715SAlp Dener   PetscReal omega4;             /*  factor used for trust-region update */
114eb910715SAlp Dener   PetscReal omega5;             /*  factor used for trust-region update */
115eb910715SAlp Dener 
116eb910715SAlp Dener   /* Parameters when updating the trust-region radius based on reduction
117eb910715SAlp Dener 
118eb910715SAlp Dener      kappa = ared / pred
119eb910715SAlp Dener      if   kappa < eta1          (very bad step)
120eb910715SAlp Dener        radius = alpha1 * min(norm(d), radius)
121eb910715SAlp Dener      elif kappa < eta2          (bad step)
122eb910715SAlp Dener        radius = alpha2 * min(norm(d), radius)
123eb910715SAlp Dener      elif kappa < eta3          (okay step)
124eb910715SAlp Dener        radius = alpha3 * radius;
125eb910715SAlp Dener      elif kappa < eta4          (good step)
126eb910715SAlp Dener        radius = max(alpha4 * norm(d), radius)
127eb910715SAlp Dener      else                       (very good step)
128eb910715SAlp Dener        radius = max(alpha5 * norm(d), radius)
129eb910715SAlp Dener      fi
130eb910715SAlp Dener   */
131eb910715SAlp Dener   PetscReal eta1;               /*  used to compute trust-region radius */
132eb910715SAlp Dener   PetscReal eta2;               /*  used to compute trust-region radius */
133eb910715SAlp Dener   PetscReal eta3;               /*  used to compute trust-region radius */
134eb910715SAlp Dener   PetscReal eta4;               /*  used to compute trust-region radius */
135eb910715SAlp Dener 
136eb910715SAlp Dener   PetscReal alpha1;             /*  factor used for trust-region update */
137eb910715SAlp Dener   PetscReal alpha2;             /*  factor used for trust-region update */
138eb910715SAlp Dener   PetscReal alpha3;             /*  factor used for trust-region update */
139eb910715SAlp Dener   PetscReal alpha4;             /*  factor used for trust-region update */
140eb910715SAlp Dener   PetscReal alpha5;             /*  factor used for trust-region update */
141eb910715SAlp Dener 
142eb910715SAlp Dener   /* Parameters when updating the trust-region radius based on interpolation
143eb910715SAlp Dener 
144eb910715SAlp Dener      kappa = ared / pred
145eb910715SAlp Dener      if   kappa >= 1.0 - mu1    (very good step)
146eb910715SAlp Dener        choose tau in [gamma3, gamma4]
147eb910715SAlp Dener        radius = max(tau * norm(d), radius)
148eb910715SAlp Dener      elif kappa >= 1.0 - mu2    (good step)
149eb910715SAlp Dener        choose tau in [gamma2, gamma3]
150eb910715SAlp Dener        if (tau >= 1.0)
151eb910715SAlp Dener          radius = max(tau * norm(d), radius)
152eb910715SAlp Dener        else
153eb910715SAlp Dener          radius = tau * min(norm(d), radius)
154eb910715SAlp Dener        fi
155eb910715SAlp Dener      else                       (bad step)
156eb910715SAlp Dener        choose tau in [gamma1, 1.0]
157eb910715SAlp Dener        radius = tau * min(norm(d), radius)
158eb910715SAlp Dener      fi
159eb910715SAlp Dener   */
160eb910715SAlp Dener   PetscReal mu1;                /*  used for model agreement in interpolation */
161eb910715SAlp Dener   PetscReal mu2;                /*  used for model agreement in interpolation */
162eb910715SAlp Dener 
163eb910715SAlp Dener   PetscReal gamma1;             /*  factor used for interpolation */
164eb910715SAlp Dener   PetscReal gamma2;             /*  factor used for interpolation */
165eb910715SAlp Dener   PetscReal gamma3;             /*  factor used for interpolation */
166eb910715SAlp Dener   PetscReal gamma4;             /*  factor used for interpolation */
167eb910715SAlp Dener 
168eb910715SAlp Dener   PetscReal theta;              /*  factor used for interpolation */
169eb910715SAlp Dener 
170eb910715SAlp Dener   /*  Parameters when initializing trust-region radius based on interpolation */
171eb910715SAlp Dener   PetscReal mu1_i;              /*  used for model agreement in interpolation */
172eb910715SAlp Dener   PetscReal mu2_i;              /*  used for model agreement in interpolation */
173eb910715SAlp Dener 
174eb910715SAlp Dener   PetscReal gamma1_i;           /*  factor used for interpolation */
175eb910715SAlp Dener   PetscReal gamma2_i;           /*  factor used for interpolation */
176eb910715SAlp Dener   PetscReal gamma3_i;           /*  factor used for interpolation */
177eb910715SAlp Dener   PetscReal gamma4_i;           /*  factor used for interpolation */
178eb910715SAlp Dener 
179eb910715SAlp Dener   PetscReal theta_i;            /*  factor used for interpolation */
180eb910715SAlp Dener 
181eb910715SAlp Dener   /*  Other parameters */
182eb910715SAlp Dener   PetscReal min_radius;         /*  lower bound on initial radius value */
183eb910715SAlp Dener   PetscReal max_radius;         /*  upper bound on trust region radius */
184eb910715SAlp Dener   PetscReal epsilon;            /*  tolerance used when computing ared/pred */
18562675beeSAlp Dener   PetscReal dmin, dmax;         /*  upper and lower bounds for the Hessian diagonal vector */
186eb910715SAlp Dener 
187eb910715SAlp Dener   PetscInt newt;                /*  Newton directions attempted */
188eb910715SAlp Dener   PetscInt bfgs;                /*  BFGS directions attempted */
189eb910715SAlp Dener   PetscInt sgrad;               /*  Scaled gradient directions attempted */
190eb910715SAlp Dener   PetscInt grad;                /*  Gradient directions attempted */
191eb910715SAlp Dener 
19262675beeSAlp Dener   PetscInt as_type;             /*  Active set estimation method */
193eb910715SAlp Dener   PetscInt bfgs_scale_type;     /*  Scaling matrix to used for the bfgs preconditioner */
194eb910715SAlp Dener   PetscInt init_type;           /*  Trust-region initialization method */
195eb910715SAlp Dener   PetscInt update_type;         /*  Trust-region update method */
196eb910715SAlp Dener 
1972f75a4aaSAlp Dener   /* Trackers for KSP solution type and convergence reasons */
198eb910715SAlp Dener   PetscInt ksp_atol;
199eb910715SAlp Dener   PetscInt ksp_rtol;
200eb910715SAlp Dener   PetscInt ksp_ctol;
201eb910715SAlp Dener   PetscInt ksp_negc;
202eb910715SAlp Dener   PetscInt ksp_dtol;
203eb910715SAlp Dener   PetscInt ksp_iter;
204eb910715SAlp Dener   PetscInt ksp_othr;
205*f4db9bf7SStefano Zampini   PetscBool resetksp;
206e0ed867bSAlp Dener 
207e0ed867bSAlp Dener   /* Implementation specific context */
208e0ed867bSAlp Dener   void* ctx;
209eb910715SAlp Dener } TAO_BNK;
210eb910715SAlp Dener 
/* Step direction types. The names parallel the newt/bfgs/sgrad/grad
   "directions attempted" counters in TAO_BNK. */
#define BNK_NEWTON              0
#define BNK_BFGS                1
#define BNK_SCALED_GRADIENT     2
#define BNK_GRADIENT            3
215eb910715SAlp Dener 
/* Trust-region initialization methods (presumably the values stored in
   TAO_BNK's init_type -- confirm). BNK_INIT_TYPES equals the number of
   methods listed before it. */
#define BNK_INIT_CONSTANT         0
#define BNK_INIT_DIRECTION        1
#define BNK_INIT_INTERPOLATION    2
#define BNK_INIT_TYPES            3
220eb910715SAlp Dener 
/* Trust-region update methods (presumably the values stored in TAO_BNK's
   update_type -- confirm). BNK_UPDATE_TYPES equals the number of methods
   listed before it. */
#define BNK_UPDATE_STEP           0
#define BNK_UPDATE_REDUCTION      1
#define BNK_UPDATE_INTERPOLATION  2
#define BNK_UPDATE_TYPES          3
225eb910715SAlp Dener 
/* Active set estimation methods (presumably the values stored in TAO_BNK's
   as_type -- confirm). BNK_AS_TYPES equals the number of methods listed
   before it. */
#define BNK_AS_NONE        0
#define BNK_AS_BERTSEKAS   1
#define BNK_AS_TYPES       2
2292f75a4aaSAlp Dener 
230eb910715SAlp Dener PETSC_INTERN PetscErrorCode TaoCreate_BNK(Tao);
2319b6ef848SAlp Dener PETSC_INTERN PetscErrorCode TaoSetUp_BNK(Tao);
232e0ed867bSAlp Dener PETSC_INTERN PetscErrorCode TaoSetFromOptions_BNK(PetscOptionItems*, Tao);
233e0ed867bSAlp Dener PETSC_INTERN PetscErrorCode TaoDestroy_BNK(Tao);
234e0ed867bSAlp Dener PETSC_INTERN PetscErrorCode TaoView_BNK(Tao, PetscViewer);
235e0ed867bSAlp Dener 
236e0ed867bSAlp Dener PETSC_INTERN PetscErrorCode TaoSolve_BNLS(Tao);
237e0ed867bSAlp Dener PETSC_INTERN PetscErrorCode TaoSolve_BNTR(Tao);
238e0ed867bSAlp Dener PETSC_INTERN PetscErrorCode TaoSolve_BNTL(Tao);
239eb910715SAlp Dener 
240cd929ea3SAlp Dener PETSC_INTERN PetscErrorCode TaoBNKPreconBFGS(PC, Vec, Vec);
241c0f10754SAlp Dener PETSC_INTERN PetscErrorCode TaoBNKInitialize(Tao, PetscInt, PetscBool*);
24208752603SAlp Dener PETSC_INTERN PetscErrorCode TaoBNKEstimateActiveSet(Tao, PetscInt);
24362675beeSAlp Dener PETSC_INTERN PetscErrorCode TaoBNKComputeHessian(Tao);
244a1318120SAlp Dener PETSC_INTERN PetscErrorCode TaoBNKBoundStep(Tao, PetscInt, Vec);
245c0f10754SAlp Dener PETSC_INTERN PetscErrorCode TaoBNKTakeCGSteps(Tao, PetscBool*);
2466b591159SAlp Dener PETSC_INTERN PetscErrorCode TaoBNKComputeStep(Tao, PetscBool, KSPConvergedReason*, PetscInt*);
2475e9b73cbSAlp Dener PETSC_INTERN PetscErrorCode TaoBNKRecomputePred(Tao, Vec, PetscReal*);
248e465cd6fSAlp Dener PETSC_INTERN PetscErrorCode TaoBNKSafeguardStep(Tao, KSPConvergedReason, PetscInt*);
249937a31a1SAlp Dener PETSC_INTERN PetscErrorCode TaoBNKPerformLineSearch(Tao, PetscInt*, PetscReal*, TaoLineSearchConvergedReason*);
25028017e9fSAlp Dener PETSC_INTERN PetscErrorCode TaoBNKUpdateTrustRadius(Tao, PetscReal, PetscReal, PetscInt, PetscInt, PetscBool*);
25162675beeSAlp Dener PETSC_INTERN PetscErrorCode TaoBNKAddStepCounts(Tao, PetscInt);
252b9ac7092SAlp Dener 
253b9ac7092SAlp Dener #endif /* if !defined(__TAO_BNK_H) */
254