xref: /petsc/src/tao/unconstrained/impls/bmrm/bmrm.c (revision ad349883cef1a8c54c33e0d5808df6b9a80db1b2)
1aaa7dc30SBarry Smith #include <../src/tao/unconstrained/impls/bmrm/bmrm.h>
2a7e14dcfSSatish Balay 
3a7e14dcfSSatish Balay static PetscErrorCode init_df_solver(TAO_DF *);
4a7e14dcfSSatish Balay static PetscErrorCode ensure_df_space(PetscInt, TAO_DF *);
5a7e14dcfSSatish Balay static PetscErrorCode destroy_df_solver(TAO_DF *);
60e660641SBarry Smith static PetscReal      phi(PetscReal *, PetscInt, PetscReal, PetscReal *, PetscReal, PetscReal *, PetscReal *, PetscReal *);
70e660641SBarry Smith static PetscInt       project(PetscInt, PetscReal *, PetscReal, PetscReal *, PetscReal *, PetscReal *, PetscReal *, PetscReal *, TAO_DF *);
8a7e14dcfSSatish Balay 
9*ad349883SBarry Smith static PetscErrorCode solve(TAO_DF *df)
10*ad349883SBarry Smith {
11*ad349883SBarry Smith   PetscInt    i, j, innerIter, it, it2, luv, info;
12*ad349883SBarry Smith   PetscReal   gd, max, ak, bk, akold, bkold, lamnew, alpha, kktlam = 0.0, lam_ext;
13*ad349883SBarry Smith   PetscReal   DELTAsv, ProdDELTAsv;
14*ad349883SBarry Smith   PetscReal   c, *tempQ;
15*ad349883SBarry Smith   PetscReal  *x = df->x, *a = df->a, b = df->b, *l = df->l, *u = df->u, tol = df->tol;
16*ad349883SBarry Smith   PetscReal  *tempv = df->tempv, *y = df->y, *g = df->g, *d = df->d, *Qd = df->Qd;
17*ad349883SBarry Smith   PetscReal  *xplus = df->xplus, *tplus = df->tplus, *sk = df->sk, *yk = df->yk;
18*ad349883SBarry Smith   PetscReal **Q = df->Q, *f = df->f, *t = df->t;
19*ad349883SBarry Smith   PetscInt    dim = df->dim, *ipt = df->ipt, *ipt2 = df->ipt2, *uv = df->uv;
20*ad349883SBarry Smith 
21*ad349883SBarry Smith   /* variables for the adaptive nonmonotone linesearch */
22*ad349883SBarry Smith   PetscInt  L, llast;
23*ad349883SBarry Smith   PetscReal fr, fbest, fv, fc, fv0;
24*ad349883SBarry Smith 
25*ad349883SBarry Smith   c = BMRM_INFTY;
26*ad349883SBarry Smith 
27*ad349883SBarry Smith   DELTAsv = EPS_SV;
28*ad349883SBarry Smith   if (tol <= 1.0e-5 || dim <= 20) ProdDELTAsv = 0.0F;
29*ad349883SBarry Smith   else ProdDELTAsv = EPS_SV;
30*ad349883SBarry Smith 
31*ad349883SBarry Smith   for (i = 0; i < dim; i++) tempv[i] = -x[i];
32*ad349883SBarry Smith 
33*ad349883SBarry Smith   lam_ext = 0.0;
34*ad349883SBarry Smith 
35*ad349883SBarry Smith   /* Project the initial solution */
36*ad349883SBarry Smith   project(dim, a, b, tempv, l, u, x, &lam_ext, df);
37*ad349883SBarry Smith 
38*ad349883SBarry Smith   /* Compute gradient
39*ad349883SBarry Smith      g = Q*x + f; */
40*ad349883SBarry Smith 
41*ad349883SBarry Smith   it = 0;
42*ad349883SBarry Smith   for (i = 0; i < dim; i++) {
43*ad349883SBarry Smith     if (PetscAbsReal(x[i]) > ProdDELTAsv) ipt[it++] = i;
44*ad349883SBarry Smith   }
45*ad349883SBarry Smith 
46*ad349883SBarry Smith   PetscCall(PetscArrayzero(t, dim));
47*ad349883SBarry Smith   for (i = 0; i < it; i++) {
48*ad349883SBarry Smith     tempQ = Q[ipt[i]];
49*ad349883SBarry Smith     for (j = 0; j < dim; j++) t[j] += (tempQ[j] * x[ipt[i]]);
50*ad349883SBarry Smith   }
51*ad349883SBarry Smith   for (i = 0; i < dim; i++) g[i] = t[i] + f[i];
52*ad349883SBarry Smith 
53*ad349883SBarry Smith   /* y = -(x_{k} - g_{k}) */
54*ad349883SBarry Smith   for (i = 0; i < dim; i++) y[i] = g[i] - x[i];
55*ad349883SBarry Smith 
56*ad349883SBarry Smith   /* Project x_{k} - g_{k} */
57*ad349883SBarry Smith   project(dim, a, b, y, l, u, tempv, &lam_ext, df);
58*ad349883SBarry Smith 
59*ad349883SBarry Smith   /* y = P(x_{k} - g_{k}) - x_{k} */
60*ad349883SBarry Smith   max = ALPHA_MIN;
61*ad349883SBarry Smith   for (i = 0; i < dim; i++) {
62*ad349883SBarry Smith     y[i] = tempv[i] - x[i];
63*ad349883SBarry Smith     if (PetscAbsReal(y[i]) > max) max = PetscAbsReal(y[i]);
64*ad349883SBarry Smith   }
65*ad349883SBarry Smith 
66*ad349883SBarry Smith   if (max < tol * 1e-3) return PETSC_SUCCESS;
67*ad349883SBarry Smith 
68*ad349883SBarry Smith   alpha = 1.0 / max;
69*ad349883SBarry Smith 
70*ad349883SBarry Smith   /* fv0 = f(x_{0}). Recall t = Q x_{k}  */
71*ad349883SBarry Smith   fv0 = 0.0;
72*ad349883SBarry Smith   for (i = 0; i < dim; i++) fv0 += x[i] * (0.5 * t[i] + f[i]);
73*ad349883SBarry Smith 
74*ad349883SBarry Smith   /* adaptive nonmonotone linesearch */
75*ad349883SBarry Smith   L     = 2;
76*ad349883SBarry Smith   fr    = ALPHA_MAX;
77*ad349883SBarry Smith   fbest = fv0;
78*ad349883SBarry Smith   fc    = fv0;
79*ad349883SBarry Smith   llast = 0;
80*ad349883SBarry Smith   akold = bkold = 0.0;
81*ad349883SBarry Smith 
82*ad349883SBarry Smith   /*     Iterator begins     */
83*ad349883SBarry Smith   for (innerIter = 1; innerIter <= df->maxPGMIter; innerIter++) {
84*ad349883SBarry Smith     /* tempv = -(x_{k} - alpha*g_{k}) */
85*ad349883SBarry Smith     for (i = 0; i < dim; i++) tempv[i] = alpha * g[i] - x[i];
86*ad349883SBarry Smith 
87*ad349883SBarry Smith     /* Project x_{k} - alpha*g_{k} */
88*ad349883SBarry Smith     project(dim, a, b, tempv, l, u, y, &lam_ext, df);
89*ad349883SBarry Smith 
90*ad349883SBarry Smith     /* gd = \inner{d_{k}}{g_{k}}
91*ad349883SBarry Smith         d = P(x_{k} - alpha*g_{k}) - x_{k}
92*ad349883SBarry Smith     */
93*ad349883SBarry Smith     gd = 0.0;
94*ad349883SBarry Smith     for (i = 0; i < dim; i++) {
95*ad349883SBarry Smith       d[i] = y[i] - x[i];
96*ad349883SBarry Smith       gd += d[i] * g[i];
97*ad349883SBarry Smith     }
98*ad349883SBarry Smith 
99*ad349883SBarry Smith     /* Gradient computation  */
100*ad349883SBarry Smith 
101*ad349883SBarry Smith     /* compute Qd = Q*d  or  Qd = Q*y - t depending on their sparsity */
102*ad349883SBarry Smith 
103*ad349883SBarry Smith     it = it2 = 0;
104*ad349883SBarry Smith     for (i = 0; i < dim; i++) {
105*ad349883SBarry Smith       if (PetscAbsReal(d[i]) > (ProdDELTAsv * 1.0e-2)) ipt[it++] = i;
106*ad349883SBarry Smith     }
107*ad349883SBarry Smith     for (i = 0; i < dim; i++) {
108*ad349883SBarry Smith       if (PetscAbsReal(y[i]) > ProdDELTAsv) ipt2[it2++] = i;
109*ad349883SBarry Smith     }
110*ad349883SBarry Smith 
111*ad349883SBarry Smith     PetscCall(PetscArrayzero(Qd, dim));
112*ad349883SBarry Smith     /* compute Qd = Q*d */
113*ad349883SBarry Smith     if (it < it2) {
114*ad349883SBarry Smith       for (i = 0; i < it; i++) {
115*ad349883SBarry Smith         tempQ = Q[ipt[i]];
116*ad349883SBarry Smith         for (j = 0; j < dim; j++) Qd[j] += (tempQ[j] * d[ipt[i]]);
117*ad349883SBarry Smith       }
118*ad349883SBarry Smith     } else { /* compute Qd = Q*y-t */
119*ad349883SBarry Smith       for (i = 0; i < it2; i++) {
120*ad349883SBarry Smith         tempQ = Q[ipt2[i]];
121*ad349883SBarry Smith         for (j = 0; j < dim; j++) Qd[j] += (tempQ[j] * y[ipt2[i]]);
122*ad349883SBarry Smith       }
123*ad349883SBarry Smith       for (j = 0; j < dim; j++) Qd[j] -= t[j];
124*ad349883SBarry Smith     }
125*ad349883SBarry Smith 
126*ad349883SBarry Smith     /* ak = inner{d_{k}}{d_{k}} */
127*ad349883SBarry Smith     ak = 0.0;
128*ad349883SBarry Smith     for (i = 0; i < dim; i++) ak += d[i] * d[i];
129*ad349883SBarry Smith 
130*ad349883SBarry Smith     bk = 0.0;
131*ad349883SBarry Smith     for (i = 0; i < dim; i++) bk += d[i] * Qd[i];
132*ad349883SBarry Smith 
133*ad349883SBarry Smith     if (bk > EPS * ak && gd < 0.0) lamnew = -gd / bk;
134*ad349883SBarry Smith     else lamnew = 1.0;
135*ad349883SBarry Smith 
136*ad349883SBarry Smith     /* fv is computing f(x_{k} + d_{k}) */
137*ad349883SBarry Smith     fv = 0.0;
138*ad349883SBarry Smith     for (i = 0; i < dim; i++) {
139*ad349883SBarry Smith       xplus[i] = x[i] + d[i];
140*ad349883SBarry Smith       tplus[i] = t[i] + Qd[i];
141*ad349883SBarry Smith       fv += xplus[i] * (0.5 * tplus[i] + f[i]);
142*ad349883SBarry Smith     }
143*ad349883SBarry Smith 
144*ad349883SBarry Smith     /* fr is fref */
145*ad349883SBarry Smith     if ((innerIter == 1 && fv >= fv0) || (innerIter > 1 && fv >= fr)) {
146*ad349883SBarry Smith       fv = 0.0;
147*ad349883SBarry Smith       for (i = 0; i < dim; i++) {
148*ad349883SBarry Smith         xplus[i] = x[i] + lamnew * d[i];
149*ad349883SBarry Smith         tplus[i] = t[i] + lamnew * Qd[i];
150*ad349883SBarry Smith         fv += xplus[i] * (0.5 * tplus[i] + f[i]);
151*ad349883SBarry Smith       }
152*ad349883SBarry Smith     }
153*ad349883SBarry Smith 
154*ad349883SBarry Smith     for (i = 0; i < dim; i++) {
155*ad349883SBarry Smith       sk[i] = xplus[i] - x[i];
156*ad349883SBarry Smith       yk[i] = tplus[i] - t[i];
157*ad349883SBarry Smith       x[i]  = xplus[i];
158*ad349883SBarry Smith       t[i]  = tplus[i];
159*ad349883SBarry Smith       g[i]  = t[i] + f[i];
160*ad349883SBarry Smith     }
161*ad349883SBarry Smith 
162*ad349883SBarry Smith     /* update the line search control parameters */
163*ad349883SBarry Smith     if (fv < fbest) {
164*ad349883SBarry Smith       fbest = fv;
165*ad349883SBarry Smith       fc    = fv;
166*ad349883SBarry Smith       llast = 0;
167*ad349883SBarry Smith     } else {
168*ad349883SBarry Smith       fc = (fc > fv ? fc : fv);
169*ad349883SBarry Smith       llast++;
170*ad349883SBarry Smith       if (llast == L) {
171*ad349883SBarry Smith         fr    = fc;
172*ad349883SBarry Smith         fc    = fv;
173*ad349883SBarry Smith         llast = 0;
174*ad349883SBarry Smith       }
175*ad349883SBarry Smith     }
176*ad349883SBarry Smith 
177*ad349883SBarry Smith     ak = bk = 0.0;
178*ad349883SBarry Smith     for (i = 0; i < dim; i++) {
179*ad349883SBarry Smith       ak += sk[i] * sk[i];
180*ad349883SBarry Smith       bk += sk[i] * yk[i];
181*ad349883SBarry Smith     }
182*ad349883SBarry Smith 
183*ad349883SBarry Smith     if (bk <= EPS * ak) alpha = ALPHA_MAX;
184*ad349883SBarry Smith     else {
185*ad349883SBarry Smith       if (bkold < EPS * akold) alpha = ak / bk;
186*ad349883SBarry Smith       else alpha = (akold + ak) / (bkold + bk);
187*ad349883SBarry Smith 
188*ad349883SBarry Smith       if (alpha > ALPHA_MAX) alpha = ALPHA_MAX;
189*ad349883SBarry Smith       else if (alpha < ALPHA_MIN) alpha = ALPHA_MIN;
190*ad349883SBarry Smith     }
191*ad349883SBarry Smith 
192*ad349883SBarry Smith     akold = ak;
193*ad349883SBarry Smith     bkold = bk;
194*ad349883SBarry Smith 
195*ad349883SBarry Smith     /* stopping criterion based on KKT conditions */
196*ad349883SBarry Smith     /* at optimal, gradient of lagrangian w.r.t. x is zero */
197*ad349883SBarry Smith 
198*ad349883SBarry Smith     bk = 0.0;
199*ad349883SBarry Smith     for (i = 0; i < dim; i++) bk += x[i] * x[i];
200*ad349883SBarry Smith 
201*ad349883SBarry Smith     if (PetscSqrtReal(ak) < tol * 10 * PetscSqrtReal(bk)) {
202*ad349883SBarry Smith       it     = 0;
203*ad349883SBarry Smith       luv    = 0;
204*ad349883SBarry Smith       kktlam = 0.0;
205*ad349883SBarry Smith       for (i = 0; i < dim; i++) {
206*ad349883SBarry Smith         /* x[i] is active hence lagrange multipliers for box constraints
207*ad349883SBarry Smith                 are zero. The lagrange multiplier for ineq. const. is then
208*ad349883SBarry Smith                 defined as below
209*ad349883SBarry Smith         */
210*ad349883SBarry Smith         if ((x[i] > DELTAsv) && (x[i] < c - DELTAsv)) {
211*ad349883SBarry Smith           ipt[it++] = i;
212*ad349883SBarry Smith           kktlam    = kktlam - a[i] * g[i];
213*ad349883SBarry Smith         } else uv[luv++] = i;
214*ad349883SBarry Smith       }
215*ad349883SBarry Smith 
216*ad349883SBarry Smith       if (it == 0 && PetscSqrtReal(ak) < tol * 0.5 * PetscSqrtReal(bk)) return PETSC_SUCCESS;
217*ad349883SBarry Smith       else {
218*ad349883SBarry Smith         kktlam = kktlam / it;
219*ad349883SBarry Smith         info   = 1;
220*ad349883SBarry Smith         for (i = 0; i < it; i++) {
221*ad349883SBarry Smith           if (PetscAbsReal(a[ipt[i]] * g[ipt[i]] + kktlam) > tol) {
222*ad349883SBarry Smith             info = 0;
223*ad349883SBarry Smith             break;
224*ad349883SBarry Smith           }
225*ad349883SBarry Smith         }
226*ad349883SBarry Smith         if (info == 1) {
227*ad349883SBarry Smith           for (i = 0; i < luv; i++) {
228*ad349883SBarry Smith             if (x[uv[i]] <= DELTAsv) {
229*ad349883SBarry Smith               /* x[i] == lower bound, hence, lagrange multiplier (say, beta) for lower bound may
230*ad349883SBarry Smith                      not be zero. So, the gradient without beta is > 0
231*ad349883SBarry Smith               */
232*ad349883SBarry Smith               if (g[uv[i]] + kktlam * a[uv[i]] < -tol) {
233*ad349883SBarry Smith                 info = 0;
234*ad349883SBarry Smith                 break;
235*ad349883SBarry Smith               }
236*ad349883SBarry Smith             } else {
237*ad349883SBarry Smith               /* x[i] == upper bound, hence, lagrange multiplier (say, eta) for upper bound may
238*ad349883SBarry Smith                      not be zero. So, the gradient without eta is < 0
239*ad349883SBarry Smith               */
240*ad349883SBarry Smith               if (g[uv[i]] + kktlam * a[uv[i]] > tol) {
241*ad349883SBarry Smith                 info = 0;
242*ad349883SBarry Smith                 break;
243*ad349883SBarry Smith               }
244*ad349883SBarry Smith             }
245*ad349883SBarry Smith           }
246*ad349883SBarry Smith         }
247*ad349883SBarry Smith 
248*ad349883SBarry Smith         if (info == 1) return PETSC_SUCCESS;
249*ad349883SBarry Smith       }
250*ad349883SBarry Smith     }
251*ad349883SBarry Smith   }
252*ad349883SBarry Smith   return PETSC_SUCCESS;
253*ad349883SBarry Smith }
254*ad349883SBarry Smith 
255a7e14dcfSSatish Balay /* The main solver function
256a7e14dcfSSatish Balay 
257a7e14dcfSSatish Balay    f = Remp(W)          This is what the user provides us from the application layer
258a7e14dcfSSatish Balay    So the ComputeGradient function for instance should get us back the subgradient of Remp(W)
259a7e14dcfSSatish Balay 
260a7e14dcfSSatish Balay    Regularizer assumed to be L2 norm = lambda*0.5*W'W ()
261a7e14dcfSSatish Balay */
262a7e14dcfSSatish Balay 
263d71ae5a4SJacob Faibussowitsch static PetscErrorCode make_grad_node(Vec X, Vec_Chain **p)
264d71ae5a4SJacob Faibussowitsch {
265a7e14dcfSSatish Balay   PetscFunctionBegin;
2669566063dSJacob Faibussowitsch   PetscCall(PetscNew(p));
2679566063dSJacob Faibussowitsch   PetscCall(VecDuplicate(X, &(*p)->V));
2689566063dSJacob Faibussowitsch   PetscCall(VecCopy(X, (*p)->V));
2696c23d075SBarry Smith   (*p)->next = NULL;
2703ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
271a7e14dcfSSatish Balay }
272a7e14dcfSSatish Balay 
273d71ae5a4SJacob Faibussowitsch static PetscErrorCode destroy_grad_list(Vec_Chain *head)
274d71ae5a4SJacob Faibussowitsch {
275a7e14dcfSSatish Balay   Vec_Chain *p = head->next, *q;
276a7e14dcfSSatish Balay 
277a7e14dcfSSatish Balay   PetscFunctionBegin;
278a7e14dcfSSatish Balay   while (p) {
279a7e14dcfSSatish Balay     q = p->next;
2809566063dSJacob Faibussowitsch     PetscCall(VecDestroy(&p->V));
2819566063dSJacob Faibussowitsch     PetscCall(PetscFree(p));
282a7e14dcfSSatish Balay     p = q;
283a7e14dcfSSatish Balay   }
2846c23d075SBarry Smith   head->next = NULL;
2853ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
286a7e14dcfSSatish Balay }
287a7e14dcfSSatish Balay 
288d71ae5a4SJacob Faibussowitsch static PetscErrorCode TaoSolve_BMRM(Tao tao)
289d71ae5a4SJacob Faibussowitsch {
290a7e14dcfSSatish Balay   TAO_DF    df;
291a7e14dcfSSatish Balay   TAO_BMRM *bmrm = (TAO_BMRM *)tao->data;
292a7e14dcfSSatish Balay 
293a7e14dcfSSatish Balay   /* Values and pointers to parts of the optimization problem */
294a7e14dcfSSatish Balay   PetscReal   f = 0.0;
295a7e14dcfSSatish Balay   Vec         W = tao->solution;
296a7e14dcfSSatish Balay   Vec         G = tao->gradient;
297a7e14dcfSSatish Balay   PetscReal   lambda;
298a7e14dcfSSatish Balay   PetscReal   bt;
299a7e14dcfSSatish Balay   Vec_Chain   grad_list, *tail_glist, *pgrad;
300a7e14dcfSSatish Balay   PetscInt    i;
301a7e14dcfSSatish Balay   PetscMPIInt rank;
302a7e14dcfSSatish Balay 
303e4cb33bbSBarry Smith   /* Used in converged criteria check */
304a7e14dcfSSatish Balay   PetscReal reg;
3057fb8a5e4SKarl Rupp   PetscReal jtwt = 0.0, max_jtwt, pre_epsilon, epsilon, jw, min_jw;
306a7e14dcfSSatish Balay   PetscReal innerSolverTol;
307ba4b436cSBarry Smith   MPI_Comm  comm;
308a7e14dcfSSatish Balay 
309a7e14dcfSSatish Balay   PetscFunctionBegin;
3109566063dSJacob Faibussowitsch   PetscCall(PetscObjectGetComm((PetscObject)tao, &comm));
3119566063dSJacob Faibussowitsch   PetscCallMPI(MPI_Comm_rank(comm, &rank));
312a7e14dcfSSatish Balay   lambda = bmrm->lambda;
313a7e14dcfSSatish Balay 
314a7e14dcfSSatish Balay   /* Check Stopping Condition */
315a7e14dcfSSatish Balay   tao->step      = 1.0;
316a7e14dcfSSatish Balay   max_jtwt       = -BMRM_INFTY;
317a7e14dcfSSatish Balay   min_jw         = BMRM_INFTY;
318a7e14dcfSSatish Balay   innerSolverTol = 1.0;
319a7e14dcfSSatish Balay   epsilon        = 0.0;
320a7e14dcfSSatish Balay 
321dd400576SPatrick Sanan   if (rank == 0) {
3229566063dSJacob Faibussowitsch     PetscCall(init_df_solver(&df));
323a7e14dcfSSatish Balay     grad_list.next = NULL;
324a7e14dcfSSatish Balay     tail_glist     = &grad_list;
325a7e14dcfSSatish Balay   }
326a7e14dcfSSatish Balay 
327a7e14dcfSSatish Balay   df.tol      = 1e-6;
3283ecd9318SAlp Dener   tao->reason = TAO_CONTINUE_ITERATING;
329a7e14dcfSSatish Balay 
330a7e14dcfSSatish Balay   /*-----------------Algorithm Begins------------------------*/
331a7e14dcfSSatish Balay   /* make the scatter */
3329566063dSJacob Faibussowitsch   PetscCall(VecScatterCreateToZero(W, &bmrm->scatter, &bmrm->local_w));
3339566063dSJacob Faibussowitsch   PetscCall(VecAssemblyBegin(bmrm->local_w));
3349566063dSJacob Faibussowitsch   PetscCall(VecAssemblyEnd(bmrm->local_w));
335a7e14dcfSSatish Balay 
336a7e14dcfSSatish Balay   /* NOTE: In application pass the sub-gradient of Remp(W) */
3379566063dSJacob Faibussowitsch   PetscCall(TaoComputeObjectiveAndGradient(tao, W, &f, G));
3389566063dSJacob Faibussowitsch   PetscCall(TaoLogConvergenceHistory(tao, f, 1.0, 0.0, tao->ksp_its));
3399566063dSJacob Faibussowitsch   PetscCall(TaoMonitor(tao, tao->niter, f, 1.0, 0.0, tao->step));
340dbbe0bcdSBarry Smith   PetscUseTypeMethod(tao, convergencetest, tao->cnvP);
3413ecd9318SAlp Dener 
3423ecd9318SAlp Dener   while (tao->reason == TAO_CONTINUE_ITERATING) {
343e1e80dc8SAlp Dener     /* Call general purpose update function */
344dbbe0bcdSBarry Smith     PetscTryTypeMethod(tao, update, tao->niter, tao->user_update);
345e1e80dc8SAlp Dener 
346a7e14dcfSSatish Balay     /* compute bt = Remp(Wt-1) - <Wt-1, At> */
3479566063dSJacob Faibussowitsch     PetscCall(VecDot(W, G, &bt));
348a7e14dcfSSatish Balay     bt = f - bt;
349a7e14dcfSSatish Balay 
3509dddd249SSatish Balay     /* First gather the gradient to the rank-0 node */
3519566063dSJacob Faibussowitsch     PetscCall(VecScatterBegin(bmrm->scatter, G, bmrm->local_w, INSERT_VALUES, SCATTER_FORWARD));
3529566063dSJacob Faibussowitsch     PetscCall(VecScatterEnd(bmrm->scatter, G, bmrm->local_w, INSERT_VALUES, SCATTER_FORWARD));
353a7e14dcfSSatish Balay 
354a7e14dcfSSatish Balay     /* Bring up the inner solver */
355dd400576SPatrick Sanan     if (rank == 0) {
3569566063dSJacob Faibussowitsch       PetscCall(ensure_df_space(tao->niter + 1, &df));
3579566063dSJacob Faibussowitsch       PetscCall(make_grad_node(bmrm->local_w, &pgrad));
358a7e14dcfSSatish Balay       tail_glist->next = pgrad;
359a7e14dcfSSatish Balay       tail_glist       = pgrad;
360a7e14dcfSSatish Balay 
3618931d482SJason Sarich       df.a[tao->niter] = 1.0;
3628931d482SJason Sarich       df.f[tao->niter] = -bt;
3638931d482SJason Sarich       df.u[tao->niter] = 1.0;
3648931d482SJason Sarich       df.l[tao->niter] = 0.0;
365a7e14dcfSSatish Balay 
366a7e14dcfSSatish Balay       /* set up the Q */
367a7e14dcfSSatish Balay       pgrad = grad_list.next;
3688931d482SJason Sarich       for (i = 0; i <= tao->niter; i++) {
3693c859ba3SBarry Smith         PetscCheck(pgrad, PETSC_COMM_SELF, PETSC_ERR_PLIB, "Assert that there are at least tao->niter+1 pgrad available");
3709566063dSJacob Faibussowitsch         PetscCall(VecDot(pgrad->V, bmrm->local_w, &reg));
3718931d482SJason Sarich         df.Q[i][tao->niter] = df.Q[tao->niter][i] = reg / lambda;
372a7e14dcfSSatish Balay         pgrad                                     = pgrad->next;
373a7e14dcfSSatish Balay       }
374a7e14dcfSSatish Balay 
3758931d482SJason Sarich       if (tao->niter > 0) {
3768931d482SJason Sarich         df.x[tao->niter] = 0.0;
3779566063dSJacob Faibussowitsch         PetscCall(solve(&df));
3789371c9d4SSatish Balay       } else df.x[0] = 1.0;
379a7e14dcfSSatish Balay 
380a7e14dcfSSatish Balay       /* now computing Jt*(alpha_t) which should be = Jt(wt) to check convergence */
381a7e14dcfSSatish Balay       jtwt = 0.0;
3829566063dSJacob Faibussowitsch       PetscCall(VecSet(bmrm->local_w, 0.0));
383a7e14dcfSSatish Balay       pgrad = grad_list.next;
3848931d482SJason Sarich       for (i = 0; i <= tao->niter; i++) {
385a7e14dcfSSatish Balay         jtwt -= df.x[i] * df.f[i];
3869566063dSJacob Faibussowitsch         PetscCall(VecAXPY(bmrm->local_w, -df.x[i] / lambda, pgrad->V));
387a7e14dcfSSatish Balay         pgrad = pgrad->next;
388a7e14dcfSSatish Balay       }
389a7e14dcfSSatish Balay 
3909566063dSJacob Faibussowitsch       PetscCall(VecNorm(bmrm->local_w, NORM_2, &reg));
391a7e14dcfSSatish Balay       reg = 0.5 * lambda * reg * reg;
392a7e14dcfSSatish Balay       jtwt -= reg;
393a7e14dcfSSatish Balay     } /* end if rank == 0 */
394a7e14dcfSSatish Balay 
395a7e14dcfSSatish Balay     /* scatter the new W to all nodes */
3969566063dSJacob Faibussowitsch     PetscCall(VecScatterBegin(bmrm->scatter, bmrm->local_w, W, INSERT_VALUES, SCATTER_REVERSE));
3979566063dSJacob Faibussowitsch     PetscCall(VecScatterEnd(bmrm->scatter, bmrm->local_w, W, INSERT_VALUES, SCATTER_REVERSE));
398a7e14dcfSSatish Balay 
3999566063dSJacob Faibussowitsch     PetscCall(TaoComputeObjectiveAndGradient(tao, W, &f, G));
400a7e14dcfSSatish Balay 
4019566063dSJacob Faibussowitsch     PetscCallMPI(MPI_Bcast(&jtwt, 1, MPIU_REAL, 0, comm));
4029566063dSJacob Faibussowitsch     PetscCallMPI(MPI_Bcast(&reg, 1, MPIU_REAL, 0, comm));
403a7e14dcfSSatish Balay 
404a7e14dcfSSatish Balay     jw = reg + f; /* J(w) = regularizer + Remp(w) */
4050e660641SBarry Smith     if (jw < min_jw) min_jw = jw;
4060e660641SBarry Smith     if (jtwt > max_jtwt) max_jtwt = jtwt;
407a7e14dcfSSatish Balay 
408a7e14dcfSSatish Balay     pre_epsilon = epsilon;
409a7e14dcfSSatish Balay     epsilon     = min_jw - jtwt;
410a7e14dcfSSatish Balay 
411dd400576SPatrick Sanan     if (rank == 0) {
4120e660641SBarry Smith       if (innerSolverTol > epsilon) innerSolverTol = epsilon;
4130e660641SBarry Smith       else if (innerSolverTol < 1e-7) innerSolverTol = 1e-7;
414a7e14dcfSSatish Balay 
415a7e14dcfSSatish Balay       /* if the annealing doesn't work well, lower the inner solver tolerance */
4160e660641SBarry Smith       if (pre_epsilon < epsilon) innerSolverTol *= 0.2;
417a7e14dcfSSatish Balay 
418a7e14dcfSSatish Balay       df.tol = innerSolverTol * 0.5;
419a7e14dcfSSatish Balay     }
420a7e14dcfSSatish Balay 
4218931d482SJason Sarich     tao->niter++;
4229566063dSJacob Faibussowitsch     PetscCall(TaoLogConvergenceHistory(tao, min_jw, epsilon, 0.0, tao->ksp_its));
4239566063dSJacob Faibussowitsch     PetscCall(TaoMonitor(tao, tao->niter, min_jw, epsilon, 0.0, tao->step));
424dbbe0bcdSBarry Smith     PetscUseTypeMethod(tao, convergencetest, tao->cnvP);
425a7e14dcfSSatish Balay   }
426a7e14dcfSSatish Balay 
427a7e14dcfSSatish Balay   /* free all the memory */
428dd400576SPatrick Sanan   if (rank == 0) {
4299566063dSJacob Faibussowitsch     PetscCall(destroy_grad_list(&grad_list));
4309566063dSJacob Faibussowitsch     PetscCall(destroy_df_solver(&df));
431a7e14dcfSSatish Balay   }
432a7e14dcfSSatish Balay 
4339566063dSJacob Faibussowitsch   PetscCall(VecDestroy(&bmrm->local_w));
4349566063dSJacob Faibussowitsch   PetscCall(VecScatterDestroy(&bmrm->scatter));
4353ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
436a7e14dcfSSatish Balay }
437a7e14dcfSSatish Balay 
438a7e14dcfSSatish Balay /* ---------------------------------------------------------- */
439a7e14dcfSSatish Balay 
440d71ae5a4SJacob Faibussowitsch static PetscErrorCode TaoSetup_BMRM(Tao tao)
441d71ae5a4SJacob Faibussowitsch {
442a7e14dcfSSatish Balay   PetscFunctionBegin;
443a7e14dcfSSatish Balay   /* Allocate some arrays */
4449566063dSJacob Faibussowitsch   if (!tao->gradient) PetscCall(VecDuplicate(tao->solution, &tao->gradient));
4453ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
446a7e14dcfSSatish Balay }
447a7e14dcfSSatish Balay 
448a7e14dcfSSatish Balay /*------------------------------------------------------------*/
449d71ae5a4SJacob Faibussowitsch static PetscErrorCode TaoDestroy_BMRM(Tao tao)
450d71ae5a4SJacob Faibussowitsch {
451a7e14dcfSSatish Balay   PetscFunctionBegin;
4529566063dSJacob Faibussowitsch   PetscCall(PetscFree(tao->data));
4533ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
454a7e14dcfSSatish Balay }
455a7e14dcfSSatish Balay 
456d71ae5a4SJacob Faibussowitsch static PetscErrorCode TaoSetFromOptions_BMRM(Tao tao, PetscOptionItems *PetscOptionsObject)
457d71ae5a4SJacob Faibussowitsch {
458a7e14dcfSSatish Balay   TAO_BMRM *bmrm = (TAO_BMRM *)tao->data;
459a7e14dcfSSatish Balay 
460a7e14dcfSSatish Balay   PetscFunctionBegin;
461d0609cedSBarry Smith   PetscOptionsHeadBegin(PetscOptionsObject, "BMRM for regularized risk minimization");
4629566063dSJacob Faibussowitsch   PetscCall(PetscOptionsReal("-tao_bmrm_lambda", "regulariser weight", "", 100, &bmrm->lambda, NULL));
463d0609cedSBarry Smith   PetscOptionsHeadEnd();
4643ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
465a7e14dcfSSatish Balay }
466a7e14dcfSSatish Balay 
467a7e14dcfSSatish Balay /*------------------------------------------------------------*/
468d71ae5a4SJacob Faibussowitsch static PetscErrorCode TaoView_BMRM(Tao tao, PetscViewer viewer)
469d71ae5a4SJacob Faibussowitsch {
470a7e14dcfSSatish Balay   PetscBool isascii;
471a7e14dcfSSatish Balay 
472a7e14dcfSSatish Balay   PetscFunctionBegin;
4739566063dSJacob Faibussowitsch   PetscCall(PetscObjectTypeCompare((PetscObject)viewer, PETSCVIEWERASCII, &isascii));
474a7e14dcfSSatish Balay   if (isascii) {
4759566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPushTab(viewer));
4769566063dSJacob Faibussowitsch     PetscCall(PetscViewerASCIIPopTab(viewer));
477a7e14dcfSSatish Balay   }
4783ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
479a7e14dcfSSatish Balay }
480a7e14dcfSSatish Balay 
481a7e14dcfSSatish Balay /*------------------------------------------------------------*/
4821522df2eSJason Sarich /*MC
4831522df2eSJason Sarich   TAOBMRM - bundle method for regularized risk minimization
4841522df2eSJason Sarich 
4851522df2eSJason Sarich   Options Database Keys:
4861522df2eSJason Sarich . - tao_bmrm_lambda - regulariser weight
4871522df2eSJason Sarich 
4881eb8069cSJason Sarich   Level: beginner
4891522df2eSJason Sarich M*/
4901522df2eSJason Sarich 
491d71ae5a4SJacob Faibussowitsch PETSC_EXTERN PetscErrorCode TaoCreate_BMRM(Tao tao)
492d71ae5a4SJacob Faibussowitsch {
493a7e14dcfSSatish Balay   TAO_BMRM *bmrm;
494a7e14dcfSSatish Balay 
495a7e14dcfSSatish Balay   PetscFunctionBegin;
496a7e14dcfSSatish Balay   tao->ops->setup          = TaoSetup_BMRM;
497a7e14dcfSSatish Balay   tao->ops->solve          = TaoSolve_BMRM;
498a7e14dcfSSatish Balay   tao->ops->view           = TaoView_BMRM;
499a7e14dcfSSatish Balay   tao->ops->setfromoptions = TaoSetFromOptions_BMRM;
500a7e14dcfSSatish Balay   tao->ops->destroy        = TaoDestroy_BMRM;
501a7e14dcfSSatish Balay 
5024dfa11a4SJacob Faibussowitsch   PetscCall(PetscNew(&bmrm));
503a7e14dcfSSatish Balay   bmrm->lambda = 1.0;
504a7e14dcfSSatish Balay   tao->data    = (void *)bmrm;
505a7e14dcfSSatish Balay 
5066552cf8aSJason Sarich   /* Override default settings (unless already changed) */
5076552cf8aSJason Sarich   if (!tao->max_it_changed) tao->max_it = 2000;
5086552cf8aSJason Sarich   if (!tao->max_funcs_changed) tao->max_funcs = 4000;
5096552cf8aSJason Sarich   if (!tao->gatol_changed) tao->gatol = 1.0e-12;
5106552cf8aSJason Sarich   if (!tao->grtol_changed) tao->grtol = 1.0e-12;
511a7e14dcfSSatish Balay 
5123ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
513a7e14dcfSSatish Balay }
514a7e14dcfSSatish Balay 
51566976f2fSJacob Faibussowitsch static PetscErrorCode init_df_solver(TAO_DF *df)
516d71ae5a4SJacob Faibussowitsch {
517a7e14dcfSSatish Balay   PetscInt i, n = INCRE_DIM;
518a7e14dcfSSatish Balay 
519a7e14dcfSSatish Balay   PetscFunctionBegin;
520a7e14dcfSSatish Balay   /* default values */
521a7e14dcfSSatish Balay   df->maxProjIter = 200;
522a7e14dcfSSatish Balay   df->maxPGMIter  = 300000;
523a7e14dcfSSatish Balay   df->b           = 1.0;
524a7e14dcfSSatish Balay 
525a7e14dcfSSatish Balay   /* memory space required by Dai-Fletcher */
526a7e14dcfSSatish Balay   df->cur_num_cp = n;
5279566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &df->f));
5289566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &df->a));
5299566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &df->l));
5309566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &df->u));
5319566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &df->x));
5329566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &df->Q));
533a7e14dcfSSatish Balay 
53448a46eb9SPierre Jolivet   for (i = 0; i < n; i++) PetscCall(PetscMalloc1(n, &df->Q[i]));
535a7e14dcfSSatish Balay 
5369566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &df->g));
5379566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &df->y));
5389566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &df->tempv));
5399566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &df->d));
5409566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &df->Qd));
5419566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &df->t));
5429566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &df->xplus));
5439566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &df->tplus));
5449566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &df->sk));
5459566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &df->yk));
546a7e14dcfSSatish Balay 
5479566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &df->ipt));
5489566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &df->ipt2));
5499566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &df->uv));
5503ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
551a7e14dcfSSatish Balay }
552a7e14dcfSSatish Balay 
55366976f2fSJacob Faibussowitsch static PetscErrorCode ensure_df_space(PetscInt dim, TAO_DF *df)
554d71ae5a4SJacob Faibussowitsch {
555a7e14dcfSSatish Balay   PetscReal *tmp, **tmp_Q;
556a7e14dcfSSatish Balay   PetscInt   i, n, old_n;
557a7e14dcfSSatish Balay 
558a7e14dcfSSatish Balay   PetscFunctionBegin;
55953506e15SBarry Smith   df->dim = dim;
5603ba16761SJacob Faibussowitsch   if (dim <= df->cur_num_cp) PetscFunctionReturn(PETSC_SUCCESS);
561a7e14dcfSSatish Balay 
562a7e14dcfSSatish Balay   old_n = df->cur_num_cp;
563a7e14dcfSSatish Balay   df->cur_num_cp += INCRE_DIM;
564a7e14dcfSSatish Balay   n = df->cur_num_cp;
565a7e14dcfSSatish Balay 
566a7e14dcfSSatish Balay   /* memory space required by dai-fletcher */
5679566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &tmp));
5689566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(tmp, df->f, old_n));
5699566063dSJacob Faibussowitsch   PetscCall(PetscFree(df->f));
570a7e14dcfSSatish Balay   df->f = tmp;
571a7e14dcfSSatish Balay 
5729566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &tmp));
5739566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(tmp, df->a, old_n));
5749566063dSJacob Faibussowitsch   PetscCall(PetscFree(df->a));
575a7e14dcfSSatish Balay   df->a = tmp;
576a7e14dcfSSatish Balay 
5779566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &tmp));
5789566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(tmp, df->l, old_n));
5799566063dSJacob Faibussowitsch   PetscCall(PetscFree(df->l));
580a7e14dcfSSatish Balay   df->l = tmp;
581a7e14dcfSSatish Balay 
5829566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &tmp));
5839566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(tmp, df->u, old_n));
5849566063dSJacob Faibussowitsch   PetscCall(PetscFree(df->u));
585a7e14dcfSSatish Balay   df->u = tmp;
586a7e14dcfSSatish Balay 
5879566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &tmp));
5889566063dSJacob Faibussowitsch   PetscCall(PetscArraycpy(tmp, df->x, old_n));
5899566063dSJacob Faibussowitsch   PetscCall(PetscFree(df->x));
590a7e14dcfSSatish Balay   df->x = tmp;
591a7e14dcfSSatish Balay 
5929566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &tmp_Q));
59353506e15SBarry Smith   for (i = 0; i < n; i++) {
5949566063dSJacob Faibussowitsch     PetscCall(PetscMalloc1(n, &tmp_Q[i]));
59553506e15SBarry Smith     if (i < old_n) {
5969566063dSJacob Faibussowitsch       PetscCall(PetscArraycpy(tmp_Q[i], df->Q[i], old_n));
5979566063dSJacob Faibussowitsch       PetscCall(PetscFree(df->Q[i]));
598a7e14dcfSSatish Balay     }
599a7e14dcfSSatish Balay   }
600a7e14dcfSSatish Balay 
6019566063dSJacob Faibussowitsch   PetscCall(PetscFree(df->Q));
602a7e14dcfSSatish Balay   df->Q = tmp_Q;
603a7e14dcfSSatish Balay 
6049566063dSJacob Faibussowitsch   PetscCall(PetscFree(df->g));
6059566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &df->g));
606a7e14dcfSSatish Balay 
6079566063dSJacob Faibussowitsch   PetscCall(PetscFree(df->y));
6089566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &df->y));
609a7e14dcfSSatish Balay 
6109566063dSJacob Faibussowitsch   PetscCall(PetscFree(df->tempv));
6119566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &df->tempv));
612a7e14dcfSSatish Balay 
6139566063dSJacob Faibussowitsch   PetscCall(PetscFree(df->d));
6149566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &df->d));
615a7e14dcfSSatish Balay 
6169566063dSJacob Faibussowitsch   PetscCall(PetscFree(df->Qd));
6179566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &df->Qd));
618a7e14dcfSSatish Balay 
6199566063dSJacob Faibussowitsch   PetscCall(PetscFree(df->t));
6209566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &df->t));
621a7e14dcfSSatish Balay 
6229566063dSJacob Faibussowitsch   PetscCall(PetscFree(df->xplus));
6239566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &df->xplus));
624a7e14dcfSSatish Balay 
6259566063dSJacob Faibussowitsch   PetscCall(PetscFree(df->tplus));
6269566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &df->tplus));
627a7e14dcfSSatish Balay 
6289566063dSJacob Faibussowitsch   PetscCall(PetscFree(df->sk));
6299566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &df->sk));
630a7e14dcfSSatish Balay 
6319566063dSJacob Faibussowitsch   PetscCall(PetscFree(df->yk));
6329566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &df->yk));
633a7e14dcfSSatish Balay 
6349566063dSJacob Faibussowitsch   PetscCall(PetscFree(df->ipt));
6359566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &df->ipt));
636a7e14dcfSSatish Balay 
6379566063dSJacob Faibussowitsch   PetscCall(PetscFree(df->ipt2));
6389566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &df->ipt2));
639a7e14dcfSSatish Balay 
6409566063dSJacob Faibussowitsch   PetscCall(PetscFree(df->uv));
6419566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(n, &df->uv));
6423ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
643a7e14dcfSSatish Balay }
644a7e14dcfSSatish Balay 
64566976f2fSJacob Faibussowitsch static PetscErrorCode destroy_df_solver(TAO_DF *df)
646d71ae5a4SJacob Faibussowitsch {
647a7e14dcfSSatish Balay   PetscInt i;
6486c23d075SBarry Smith 
649a7e14dcfSSatish Balay   PetscFunctionBegin;
6509566063dSJacob Faibussowitsch   PetscCall(PetscFree(df->f));
6519566063dSJacob Faibussowitsch   PetscCall(PetscFree(df->a));
6529566063dSJacob Faibussowitsch   PetscCall(PetscFree(df->l));
6539566063dSJacob Faibussowitsch   PetscCall(PetscFree(df->u));
6549566063dSJacob Faibussowitsch   PetscCall(PetscFree(df->x));
655a7e14dcfSSatish Balay 
65648a46eb9SPierre Jolivet   for (i = 0; i < df->cur_num_cp; i++) PetscCall(PetscFree(df->Q[i]));
6579566063dSJacob Faibussowitsch   PetscCall(PetscFree(df->Q));
6589566063dSJacob Faibussowitsch   PetscCall(PetscFree(df->ipt));
6599566063dSJacob Faibussowitsch   PetscCall(PetscFree(df->ipt2));
6609566063dSJacob Faibussowitsch   PetscCall(PetscFree(df->uv));
6619566063dSJacob Faibussowitsch   PetscCall(PetscFree(df->g));
6629566063dSJacob Faibussowitsch   PetscCall(PetscFree(df->y));
6639566063dSJacob Faibussowitsch   PetscCall(PetscFree(df->tempv));
6649566063dSJacob Faibussowitsch   PetscCall(PetscFree(df->d));
6659566063dSJacob Faibussowitsch   PetscCall(PetscFree(df->Qd));
6669566063dSJacob Faibussowitsch   PetscCall(PetscFree(df->t));
6679566063dSJacob Faibussowitsch   PetscCall(PetscFree(df->xplus));
6689566063dSJacob Faibussowitsch   PetscCall(PetscFree(df->tplus));
6699566063dSJacob Faibussowitsch   PetscCall(PetscFree(df->sk));
6709566063dSJacob Faibussowitsch   PetscCall(PetscFree(df->yk));
6713ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
672a7e14dcfSSatish Balay }
673a7e14dcfSSatish Balay 
674a7e14dcfSSatish Balay /* Piecewise linear monotone target function for the Dai-Fletcher projector */
67566976f2fSJacob Faibussowitsch static PetscReal phi(PetscReal *x, PetscInt n, PetscReal lambda, PetscReal *a, PetscReal b, PetscReal *c, PetscReal *l, PetscReal *u)
676d71ae5a4SJacob Faibussowitsch {
677a7e14dcfSSatish Balay   PetscReal r = 0.0;
678a7e14dcfSSatish Balay   PetscInt  i;
679a7e14dcfSSatish Balay 
680a7e14dcfSSatish Balay   for (i = 0; i < n; i++) {
681a7e14dcfSSatish Balay     x[i] = -c[i] + lambda * a[i];
6826c23d075SBarry Smith     if (x[i] > u[i]) x[i] = u[i];
6836c23d075SBarry Smith     else if (x[i] < l[i]) x[i] = l[i];
684a7e14dcfSSatish Balay     r += a[i] * x[i];
685a7e14dcfSSatish Balay   }
686a7e14dcfSSatish Balay   return r - b;
687a7e14dcfSSatish Balay }
688a7e14dcfSSatish Balay 
689a7e14dcfSSatish Balay /** Modified Dai-Fletcher QP projector solves the problem:
690a7e14dcfSSatish Balay  *
691a7e14dcfSSatish Balay  *      minimise  0.5*x'*x - c'*x
692a7e14dcfSSatish Balay  *      subj to   a'*x = b
693a7e14dcfSSatish Balay  *                l \leq x \leq u
694a7e14dcfSSatish Balay  *
695a7e14dcfSSatish Balay  *  \param c The point to be projected onto feasible set
696a7e14dcfSSatish Balay  */
69766976f2fSJacob Faibussowitsch static PetscInt project(PetscInt n, PetscReal *a, PetscReal b, PetscReal *c, PetscReal *l, PetscReal *u, PetscReal *x, PetscReal *lam_ext, TAO_DF *df)
698d71ae5a4SJacob Faibussowitsch {
699a7e14dcfSSatish Balay   PetscReal lambda, lambdal, lambdau, dlambda, lambda_new;
700a7e14dcfSSatish Balay   PetscReal r, rl, ru, s;
701a7e14dcfSSatish Balay   PetscInt  innerIter;
702a7e14dcfSSatish Balay   PetscBool nonNegativeSlack = PETSC_FALSE;
703a7e14dcfSSatish Balay 
704a7e14dcfSSatish Balay   *lam_ext  = 0;
705a7e14dcfSSatish Balay   lambda    = 0;
706a7e14dcfSSatish Balay   dlambda   = 0.5;
707a7e14dcfSSatish Balay   innerIter = 1;
708a7e14dcfSSatish Balay 
709a7e14dcfSSatish Balay   /*  \phi(x;lambda) := 0.5*x'*x + c'*x - lambda*(a'*x-b)
710a7e14dcfSSatish Balay    *
711a7e14dcfSSatish Balay    *  Optimality conditions for \phi:
712a7e14dcfSSatish Balay    *
713a7e14dcfSSatish Balay    *  1. lambda   <= 0
714a7e14dcfSSatish Balay    *  2. r        <= 0
715a7e14dcfSSatish Balay    *  3. r*lambda == 0
716a7e14dcfSSatish Balay    */
717a7e14dcfSSatish Balay 
718a7e14dcfSSatish Balay   /* Bracketing Phase */
719a7e14dcfSSatish Balay   r = phi(x, n, lambda, a, b, c, l, u);
720a7e14dcfSSatish Balay 
7216c23d075SBarry Smith   if (nonNegativeSlack) {
722a7e14dcfSSatish Balay     /* inequality constraint, i.e., with \xi >= 0 constraint */
7233ba16761SJacob Faibussowitsch     if (r < TOL_R) return PETSC_SUCCESS;
7246c23d075SBarry Smith   } else {
725a7e14dcfSSatish Balay     /* equality constraint ,i.e., without \xi >= 0 constraint */
7263ba16761SJacob Faibussowitsch     if (PetscAbsReal(r) < TOL_R) return PETSC_SUCCESS;
727a7e14dcfSSatish Balay   }
728a7e14dcfSSatish Balay 
729a7e14dcfSSatish Balay   if (r < 0.0) {
730a7e14dcfSSatish Balay     lambdal = lambda;
731a7e14dcfSSatish Balay     rl      = r;
732a7e14dcfSSatish Balay     lambda  = lambda + dlambda;
733a7e14dcfSSatish Balay     r       = phi(x, n, lambda, a, b, c, l, u);
734a7e14dcfSSatish Balay     while (r < 0.0 && dlambda < BMRM_INFTY) {
735a7e14dcfSSatish Balay       lambdal = lambda;
736a7e14dcfSSatish Balay       s       = rl / r - 1.0;
737a7e14dcfSSatish Balay       if (s < 0.1) s = 0.1;
738a7e14dcfSSatish Balay       dlambda = dlambda + dlambda / s;
739a7e14dcfSSatish Balay       lambda  = lambda + dlambda;
740a7e14dcfSSatish Balay       rl      = r;
741a7e14dcfSSatish Balay       r       = phi(x, n, lambda, a, b, c, l, u);
742a7e14dcfSSatish Balay     }
743a7e14dcfSSatish Balay     lambdau = lambda;
744a7e14dcfSSatish Balay     ru      = r;
7456c23d075SBarry Smith   } else {
746a7e14dcfSSatish Balay     lambdau = lambda;
747a7e14dcfSSatish Balay     ru      = r;
748a7e14dcfSSatish Balay     lambda  = lambda - dlambda;
749a7e14dcfSSatish Balay     r       = phi(x, n, lambda, a, b, c, l, u);
750a7e14dcfSSatish Balay     while (r > 0.0 && dlambda > -BMRM_INFTY) {
751a7e14dcfSSatish Balay       lambdau = lambda;
752a7e14dcfSSatish Balay       s       = ru / r - 1.0;
753a7e14dcfSSatish Balay       if (s < 0.1) s = 0.1;
754a7e14dcfSSatish Balay       dlambda = dlambda + dlambda / s;
755a7e14dcfSSatish Balay       lambda  = lambda - dlambda;
756a7e14dcfSSatish Balay       ru      = r;
757a7e14dcfSSatish Balay       r       = phi(x, n, lambda, a, b, c, l, u);
758a7e14dcfSSatish Balay     }
759a7e14dcfSSatish Balay     lambdal = lambda;
760a7e14dcfSSatish Balay     rl      = r;
761a7e14dcfSSatish Balay   }
762a7e14dcfSSatish Balay 
7633c859ba3SBarry Smith   PetscCheck(PetscAbsReal(dlambda) <= BMRM_INFTY, PETSC_COMM_SELF, PETSC_ERR_PLIB, "L2N2_DaiFletcherPGM detected Infeasible QP problem!");
764a7e14dcfSSatish Balay 
765ad540459SPierre Jolivet   if (ru == 0) return innerIter;
766a7e14dcfSSatish Balay 
767a7e14dcfSSatish Balay   /* Secant Phase */
768a7e14dcfSSatish Balay   s       = 1.0 - rl / ru;
769a7e14dcfSSatish Balay   dlambda = dlambda / s;
770a7e14dcfSSatish Balay   lambda  = lambdau - dlambda;
771a7e14dcfSSatish Balay   r       = phi(x, n, lambda, a, b, c, l, u);
772a7e14dcfSSatish Balay 
7739371c9d4SSatish Balay   while (PetscAbsReal(r) > TOL_R && dlambda > TOL_LAM * (1.0 + PetscAbsReal(lambda)) && innerIter < df->maxProjIter) {
774a7e14dcfSSatish Balay     innerIter++;
775a7e14dcfSSatish Balay     if (r > 0.0) {
776a7e14dcfSSatish Balay       if (s <= 2.0) {
777a7e14dcfSSatish Balay         lambdau = lambda;
778a7e14dcfSSatish Balay         ru      = r;
779a7e14dcfSSatish Balay         s       = 1.0 - rl / ru;
780a7e14dcfSSatish Balay         dlambda = (lambdau - lambdal) / s;
781a7e14dcfSSatish Balay         lambda  = lambdau - dlambda;
78253506e15SBarry Smith       } else {
783a7e14dcfSSatish Balay         s = ru / r - 1.0;
784a7e14dcfSSatish Balay         if (s < 0.1) s = 0.1;
785a7e14dcfSSatish Balay         dlambda    = (lambdau - lambda) / s;
786a7e14dcfSSatish Balay         lambda_new = 0.75 * lambdal + 0.25 * lambda;
7879371c9d4SSatish Balay         if (lambda_new < (lambda - dlambda)) lambda_new = lambda - dlambda;
788a7e14dcfSSatish Balay         lambdau = lambda;
789a7e14dcfSSatish Balay         ru      = r;
790a7e14dcfSSatish Balay         lambda  = lambda_new;
791a7e14dcfSSatish Balay         s       = (lambdau - lambdal) / (lambdau - lambda);
792a7e14dcfSSatish Balay       }
79353506e15SBarry Smith     } else {
794a7e14dcfSSatish Balay       if (s >= 2.0) {
795a7e14dcfSSatish Balay         lambdal = lambda;
796a7e14dcfSSatish Balay         rl      = r;
797a7e14dcfSSatish Balay         s       = 1.0 - rl / ru;
798a7e14dcfSSatish Balay         dlambda = (lambdau - lambdal) / s;
799a7e14dcfSSatish Balay         lambda  = lambdau - dlambda;
80053506e15SBarry Smith       } else {
801a7e14dcfSSatish Balay         s = rl / r - 1.0;
802a7e14dcfSSatish Balay         if (s < 0.1) s = 0.1;
803a7e14dcfSSatish Balay         dlambda    = (lambda - lambdal) / s;
804a7e14dcfSSatish Balay         lambda_new = 0.75 * lambdau + 0.25 * lambda;
8059371c9d4SSatish Balay         if (lambda_new > (lambda + dlambda)) lambda_new = lambda + dlambda;
806a7e14dcfSSatish Balay         lambdal = lambda;
807a7e14dcfSSatish Balay         rl      = r;
808a7e14dcfSSatish Balay         lambda  = lambda_new;
809a7e14dcfSSatish Balay         s       = (lambdau - lambdal) / (lambdau - lambda);
810a7e14dcfSSatish Balay       }
811a7e14dcfSSatish Balay     }
812a7e14dcfSSatish Balay     r = phi(x, n, lambda, a, b, c, l, u);
813a7e14dcfSSatish Balay   }
814a7e14dcfSSatish Balay 
815a7e14dcfSSatish Balay   *lam_ext = lambda;
81648a46eb9SPierre Jolivet   if (innerIter >= df->maxProjIter) PetscCall(PetscInfo(NULL, "WARNING: DaiFletcher max iterations\n"));
817a7e14dcfSSatish Balay   return innerIter;
818a7e14dcfSSatish Balay }
819