xref: /petsc/src/tao/unconstrained/impls/bmrm/bmrm.c (revision 3ecd93180ca3e0505f53284726a9519041077843)
1aaa7dc30SBarry Smith #include <../src/tao/unconstrained/impls/bmrm/bmrm.h>
2a7e14dcfSSatish Balay 
3a7e14dcfSSatish Balay static PetscErrorCode init_df_solver(TAO_DF*);
4a7e14dcfSSatish Balay static PetscErrorCode ensure_df_space(PetscInt, TAO_DF*);
5a7e14dcfSSatish Balay static PetscErrorCode destroy_df_solver(TAO_DF*);
60e660641SBarry Smith static PetscReal phi(PetscReal*,PetscInt,PetscReal,PetscReal*,PetscReal,PetscReal*,PetscReal*,PetscReal*);
70e660641SBarry Smith static PetscInt project(PetscInt,PetscReal*,PetscReal,PetscReal*,PetscReal*,PetscReal*,PetscReal*,PetscReal*,TAO_DF*);
8a7e14dcfSSatish Balay static PetscErrorCode solve(TAO_DF*);
9a7e14dcfSSatish Balay 
10a7e14dcfSSatish Balay 
11a7e14dcfSSatish Balay /*------------------------------------------------------------*/
/* The main solver function

   f = Remp(W)          This is what the user provides from the application layer.
   The ComputeGradient function, for instance, should therefore return a subgradient of Remp(W).

   The regularizer is assumed to be the squared L2 norm: lambda*0.5*W'W
*/
19a7e14dcfSSatish Balay 
20a7e14dcfSSatish Balay static PetscErrorCode make_grad_node(Vec X, Vec_Chain **p)
21a7e14dcfSSatish Balay {
22a7e14dcfSSatish Balay   PetscErrorCode ierr;
23a7e14dcfSSatish Balay 
24a7e14dcfSSatish Balay   PetscFunctionBegin;
250e660641SBarry Smith   ierr = PetscNew(p);CHKERRQ(ierr);
26a7e14dcfSSatish Balay   ierr = VecDuplicate(X, &(*p)->V);CHKERRQ(ierr);
27a7e14dcfSSatish Balay   ierr = VecCopy(X, (*p)->V);CHKERRQ(ierr);
286c23d075SBarry Smith   (*p)->next = NULL;
29a7e14dcfSSatish Balay   PetscFunctionReturn(0);
30a7e14dcfSSatish Balay }
31a7e14dcfSSatish Balay 
32a7e14dcfSSatish Balay static PetscErrorCode destroy_grad_list(Vec_Chain *head)
33a7e14dcfSSatish Balay {
34a7e14dcfSSatish Balay   PetscErrorCode ierr;
35a7e14dcfSSatish Balay   Vec_Chain      *p = head->next, *q;
36a7e14dcfSSatish Balay 
37a7e14dcfSSatish Balay   PetscFunctionBegin;
38a7e14dcfSSatish Balay   while(p) {
39a7e14dcfSSatish Balay     q = p->next;
40a7e14dcfSSatish Balay     ierr = VecDestroy(&p->V);CHKERRQ(ierr);
41a7e14dcfSSatish Balay     ierr = PetscFree(p);CHKERRQ(ierr);
42a7e14dcfSSatish Balay     p = q;
43a7e14dcfSSatish Balay   }
446c23d075SBarry Smith   head->next = NULL;
45a7e14dcfSSatish Balay   PetscFunctionReturn(0);
46a7e14dcfSSatish Balay }
47a7e14dcfSSatish Balay 
48a7e14dcfSSatish Balay 
49441846f8SBarry Smith static PetscErrorCode TaoSolve_BMRM(Tao tao)
50a7e14dcfSSatish Balay {
51a7e14dcfSSatish Balay   PetscErrorCode     ierr;
52a7e14dcfSSatish Balay   TAO_DF             df;
53a7e14dcfSSatish Balay   TAO_BMRM           *bmrm = (TAO_BMRM*)tao->data;
54a7e14dcfSSatish Balay 
55a7e14dcfSSatish Balay   /* Values and pointers to parts of the optimization problem */
56a7e14dcfSSatish Balay   PetscReal          f = 0.0;
57a7e14dcfSSatish Balay   Vec                W = tao->solution;
58a7e14dcfSSatish Balay   Vec                G = tao->gradient;
59a7e14dcfSSatish Balay   PetscReal          lambda;
60a7e14dcfSSatish Balay   PetscReal          bt;
61a7e14dcfSSatish Balay   Vec_Chain          grad_list, *tail_glist, *pgrad;
62a7e14dcfSSatish Balay   PetscInt           i;
63a7e14dcfSSatish Balay   PetscMPIInt        rank;
64a7e14dcfSSatish Balay 
65e4cb33bbSBarry Smith   /* Used in converged criteria check */
66a7e14dcfSSatish Balay   PetscReal          reg;
677fb8a5e4SKarl Rupp   PetscReal          jtwt = 0.0, max_jtwt, pre_epsilon, epsilon, jw, min_jw;
68a7e14dcfSSatish Balay   PetscReal          innerSolverTol;
69ba4b436cSBarry Smith   MPI_Comm           comm;
70a7e14dcfSSatish Balay 
71a7e14dcfSSatish Balay   PetscFunctionBegin;
72ba4b436cSBarry Smith   ierr = PetscObjectGetComm((PetscObject)tao,&comm);CHKERRQ(ierr);
73ba4b436cSBarry Smith   ierr = MPI_Comm_rank(comm, &rank);CHKERRQ(ierr);
74a7e14dcfSSatish Balay   lambda = bmrm->lambda;
75a7e14dcfSSatish Balay 
76a7e14dcfSSatish Balay   /* Check Stopping Condition */
77a7e14dcfSSatish Balay   tao->step = 1.0;
78a7e14dcfSSatish Balay   max_jtwt = -BMRM_INFTY;
79a7e14dcfSSatish Balay   min_jw = BMRM_INFTY;
80a7e14dcfSSatish Balay   innerSolverTol = 1.0;
81a7e14dcfSSatish Balay   epsilon = 0.0;
82a7e14dcfSSatish Balay 
830e660641SBarry Smith   if (!rank) {
84a7e14dcfSSatish Balay     ierr = init_df_solver(&df);CHKERRQ(ierr);
85a7e14dcfSSatish Balay     grad_list.next = NULL;
86a7e14dcfSSatish Balay     tail_glist = &grad_list;
87a7e14dcfSSatish Balay   }
88a7e14dcfSSatish Balay 
89a7e14dcfSSatish Balay   df.tol = 1e-6;
90*3ecd9318SAlp Dener   tao->reason = TAO_CONTINUE_ITERATING;
91a7e14dcfSSatish Balay 
92a7e14dcfSSatish Balay   /*-----------------Algorithm Begins------------------------*/
93a7e14dcfSSatish Balay   /* make the scatter */
94a7e14dcfSSatish Balay   ierr = VecScatterCreateToZero(W, &bmrm->scatter, &bmrm->local_w);CHKERRQ(ierr);
95a7e14dcfSSatish Balay   ierr = VecAssemblyBegin(bmrm->local_w);CHKERRQ(ierr);
96a7e14dcfSSatish Balay   ierr = VecAssemblyEnd(bmrm->local_w);CHKERRQ(ierr);
97a7e14dcfSSatish Balay 
98a7e14dcfSSatish Balay   /* NOTE: In application pass the sub-gradient of Remp(W) */
99a7e14dcfSSatish Balay   ierr = TaoComputeObjectiveAndGradient(tao, W, &f, G);CHKERRQ(ierr);
100*3ecd9318SAlp Dener   ierr = TaoLogConvergenceHistory(tao,f,1.0,0.0,tao->ksp_its);CHKERRQ(ierr);
101*3ecd9318SAlp Dener   ierr = TaoMonitor(tao,tao->niter,f,1.0,0.0,tao->step);CHKERRQ(ierr);
102*3ecd9318SAlp Dener   ierr = (*tao->ops->convergencetest)(tao,tao->cnvP);CHKERRQ(ierr);
103*3ecd9318SAlp Dener 
104*3ecd9318SAlp Dener   while (tao->reason == TAO_CONTINUE_ITERATING) {
105a7e14dcfSSatish Balay     /* compute bt = Remp(Wt-1) - <Wt-1, At> */
106a7e14dcfSSatish Balay     ierr = VecDot(W, G, &bt);CHKERRQ(ierr);
107a7e14dcfSSatish Balay     bt = f - bt;
108a7e14dcfSSatish Balay 
109a7e14dcfSSatish Balay     /* First gather the gradient to the master node */
110a7e14dcfSSatish Balay     ierr = VecScatterBegin(bmrm->scatter, G, bmrm->local_w, INSERT_VALUES, SCATTER_FORWARD);CHKERRQ(ierr);
111a7e14dcfSSatish Balay     ierr = VecScatterEnd(bmrm->scatter, G, bmrm->local_w, INSERT_VALUES, SCATTER_FORWARD);CHKERRQ(ierr);
112a7e14dcfSSatish Balay 
113a7e14dcfSSatish Balay     /* Bring up the inner solver */
1140e660641SBarry Smith     if (!rank) {
1158931d482SJason Sarich       ierr = ensure_df_space(tao->niter+1, &df);CHKERRQ(ierr);
116a7e14dcfSSatish Balay       ierr = make_grad_node(bmrm->local_w, &pgrad);CHKERRQ(ierr);
117a7e14dcfSSatish Balay       tail_glist->next = pgrad;
118a7e14dcfSSatish Balay       tail_glist = pgrad;
119a7e14dcfSSatish Balay 
1208931d482SJason Sarich       df.a[tao->niter] = 1.0;
1218931d482SJason Sarich       df.f[tao->niter] = -bt;
1228931d482SJason Sarich       df.u[tao->niter] = 1.0;
1238931d482SJason Sarich       df.l[tao->niter] = 0.0;
124a7e14dcfSSatish Balay 
125a7e14dcfSSatish Balay       /* set up the Q */
126a7e14dcfSSatish Balay       pgrad = grad_list.next;
1278931d482SJason Sarich       for (i=0; i<=tao->niter; i++) {
1282a808120SBarry Smith         if (!pgrad) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Assert that there are at least tao->niter+1 pgrad available");
129a7e14dcfSSatish Balay         ierr = VecDot(pgrad->V, bmrm->local_w, &reg);CHKERRQ(ierr);
1308931d482SJason Sarich         df.Q[i][tao->niter] = df.Q[tao->niter][i] = reg / lambda;
131a7e14dcfSSatish Balay         pgrad = pgrad->next;
132a7e14dcfSSatish Balay       }
133a7e14dcfSSatish Balay 
1348931d482SJason Sarich       if (tao->niter > 0) {
1358931d482SJason Sarich         df.x[tao->niter] = 0.0;
136a7e14dcfSSatish Balay         ierr = solve(&df);CHKERRQ(ierr);
1370e660641SBarry Smith       } else
138a7e14dcfSSatish Balay         df.x[0] = 1.0;
139a7e14dcfSSatish Balay 
140a7e14dcfSSatish Balay       /* now computing Jt*(alpha_t) which should be = Jt(wt) to check convergence */
141a7e14dcfSSatish Balay       jtwt = 0.0;
142a7e14dcfSSatish Balay       ierr = VecSet(bmrm->local_w, 0.0);CHKERRQ(ierr);
143a7e14dcfSSatish Balay       pgrad = grad_list.next;
1448931d482SJason Sarich       for (i=0; i<=tao->niter; i++) {
145a7e14dcfSSatish Balay         jtwt -= df.x[i] * df.f[i];
146a7e14dcfSSatish Balay         ierr = VecAXPY(bmrm->local_w, -df.x[i] / lambda, pgrad->V);CHKERRQ(ierr);
147a7e14dcfSSatish Balay         pgrad = pgrad->next;
148a7e14dcfSSatish Balay       }
149a7e14dcfSSatish Balay 
150a7e14dcfSSatish Balay       ierr = VecNorm(bmrm->local_w, NORM_2, &reg);CHKERRQ(ierr);
151a7e14dcfSSatish Balay       reg = 0.5*lambda*reg*reg;
152a7e14dcfSSatish Balay       jtwt -= reg;
153a7e14dcfSSatish Balay     } /* end if rank == 0 */
154a7e14dcfSSatish Balay 
155a7e14dcfSSatish Balay     /* scatter the new W to all nodes */
156a7e14dcfSSatish Balay     ierr = VecScatterBegin(bmrm->scatter,bmrm->local_w,W,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
157a7e14dcfSSatish Balay     ierr = VecScatterEnd(bmrm->scatter,bmrm->local_w,W,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
158a7e14dcfSSatish Balay 
159a7e14dcfSSatish Balay     ierr = TaoComputeObjectiveAndGradient(tao, W, &f, G);CHKERRQ(ierr);
160a7e14dcfSSatish Balay 
161ba4b436cSBarry Smith     ierr = MPI_Bcast(&jtwt,1,MPIU_REAL,0,comm);CHKERRQ(ierr);
162ba4b436cSBarry Smith     ierr = MPI_Bcast(&reg,1,MPIU_REAL,0,comm);CHKERRQ(ierr);
163a7e14dcfSSatish Balay 
164a7e14dcfSSatish Balay     jw = reg + f;                                       /* J(w) = regularizer + Remp(w) */
1650e660641SBarry Smith     if (jw < min_jw) min_jw = jw;
1660e660641SBarry Smith     if (jtwt > max_jtwt) max_jtwt = jtwt;
167a7e14dcfSSatish Balay 
168a7e14dcfSSatish Balay     pre_epsilon = epsilon;
169a7e14dcfSSatish Balay     epsilon = min_jw - jtwt;
170a7e14dcfSSatish Balay 
1710e660641SBarry Smith     if (!rank) {
1720e660641SBarry Smith       if (innerSolverTol > epsilon) innerSolverTol = epsilon;
1730e660641SBarry Smith       else if (innerSolverTol < 1e-7) innerSolverTol = 1e-7;
174a7e14dcfSSatish Balay 
175a7e14dcfSSatish Balay       /* if the annealing doesn't work well, lower the inner solver tolerance */
1760e660641SBarry Smith       if(pre_epsilon < epsilon) innerSolverTol *= 0.2;
177a7e14dcfSSatish Balay 
178a7e14dcfSSatish Balay       df.tol = innerSolverTol*0.5;
179a7e14dcfSSatish Balay     }
180a7e14dcfSSatish Balay 
1818931d482SJason Sarich     tao->niter++;
182*3ecd9318SAlp Dener     ierr = TaoLogConvergenceHistory(tao,min_jw,epsilon,0.0,tao->ksp_its);CHKERRQ(ierr);
183*3ecd9318SAlp Dener     ierr = TaoMonitor(tao,tao->niter,min_jw,epsilon,0.0,tao->step);CHKERRQ(ierr);
184*3ecd9318SAlp Dener     ierr = (*tao->ops->convergencetest)(tao,tao->cnvP);CHKERRQ(ierr);
185a7e14dcfSSatish Balay   }
186a7e14dcfSSatish Balay 
187a7e14dcfSSatish Balay   /* free all the memory */
1880e660641SBarry Smith   if (!rank) {
189a7e14dcfSSatish Balay     ierr = destroy_grad_list(&grad_list);CHKERRQ(ierr);
190a7e14dcfSSatish Balay     ierr = destroy_df_solver(&df);CHKERRQ(ierr);
191a7e14dcfSSatish Balay   }
192a7e14dcfSSatish Balay 
193a7e14dcfSSatish Balay   ierr = VecDestroy(&bmrm->local_w);CHKERRQ(ierr);
194a7e14dcfSSatish Balay   ierr = VecScatterDestroy(&bmrm->scatter);CHKERRQ(ierr);
195a7e14dcfSSatish Balay   PetscFunctionReturn(0);
196a7e14dcfSSatish Balay }
197a7e14dcfSSatish Balay 
198a7e14dcfSSatish Balay 
199a7e14dcfSSatish Balay /* ---------------------------------------------------------- */
200a7e14dcfSSatish Balay 
201441846f8SBarry Smith static PetscErrorCode TaoSetup_BMRM(Tao tao)
2020e660641SBarry Smith {
203a7e14dcfSSatish Balay 
204a7e14dcfSSatish Balay   PetscErrorCode ierr;
205a7e14dcfSSatish Balay 
206a7e14dcfSSatish Balay   PetscFunctionBegin;
207a7e14dcfSSatish Balay   /* Allocate some arrays */
208a7e14dcfSSatish Balay   if (!tao->gradient) {
209a7e14dcfSSatish Balay     ierr = VecDuplicate(tao->solution, &tao->gradient);CHKERRQ(ierr);
210a7e14dcfSSatish Balay   }
211a7e14dcfSSatish Balay   PetscFunctionReturn(0);
212a7e14dcfSSatish Balay }
213a7e14dcfSSatish Balay 
214a7e14dcfSSatish Balay /*------------------------------------------------------------*/
215441846f8SBarry Smith static PetscErrorCode TaoDestroy_BMRM(Tao tao)
216a7e14dcfSSatish Balay {
217a7e14dcfSSatish Balay   PetscErrorCode ierr;
218a7e14dcfSSatish Balay 
219a7e14dcfSSatish Balay   PetscFunctionBegin;
220a7e14dcfSSatish Balay   ierr = PetscFree(tao->data);CHKERRQ(ierr);
221a7e14dcfSSatish Balay   PetscFunctionReturn(0);
222a7e14dcfSSatish Balay }
223a7e14dcfSSatish Balay 
2244416b707SBarry Smith static PetscErrorCode TaoSetFromOptions_BMRM(PetscOptionItems *PetscOptionsObject,Tao tao)
225a7e14dcfSSatish Balay {
226a7e14dcfSSatish Balay   PetscErrorCode ierr;
227a7e14dcfSSatish Balay   TAO_BMRM*      bmrm = (TAO_BMRM*)tao->data;
228a7e14dcfSSatish Balay 
229a7e14dcfSSatish Balay   PetscFunctionBegin;
2301a1499c8SBarry Smith   ierr = PetscOptionsHead(PetscOptionsObject,"BMRM for regularized risk minimization");CHKERRQ(ierr);
23194ae4db5SBarry Smith   ierr = PetscOptionsReal("-tao_bmrm_lambda", "regulariser weight","", 100,&bmrm->lambda,NULL);CHKERRQ(ierr);
232a7e14dcfSSatish Balay   ierr = PetscOptionsTail();CHKERRQ(ierr);
233a7e14dcfSSatish Balay   PetscFunctionReturn(0);
234a7e14dcfSSatish Balay }
235a7e14dcfSSatish Balay 
236a7e14dcfSSatish Balay /*------------------------------------------------------------*/
237441846f8SBarry Smith static PetscErrorCode TaoView_BMRM(Tao tao, PetscViewer viewer)
238a7e14dcfSSatish Balay {
239a7e14dcfSSatish Balay   PetscBool      isascii;
240a7e14dcfSSatish Balay   PetscErrorCode ierr;
241a7e14dcfSSatish Balay 
242a7e14dcfSSatish Balay   PetscFunctionBegin;
243a7e14dcfSSatish Balay   ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&isascii);CHKERRQ(ierr);
244a7e14dcfSSatish Balay   if (isascii) {
245a7e14dcfSSatish Balay     ierr = PetscViewerASCIIPushTab(viewer);CHKERRQ(ierr);
246a7e14dcfSSatish Balay     ierr = PetscViewerASCIIPopTab(viewer);CHKERRQ(ierr);
247a7e14dcfSSatish Balay   }
248a7e14dcfSSatish Balay   PetscFunctionReturn(0);
249a7e14dcfSSatish Balay }
250a7e14dcfSSatish Balay 
251a7e14dcfSSatish Balay /*------------------------------------------------------------*/
2521522df2eSJason Sarich /*MC
2531522df2eSJason Sarich   TAOBMRM - bundle method for regularized risk minimization
2541522df2eSJason Sarich 
2551522df2eSJason Sarich   Options Database Keys:
. -tao_bmrm_lambda - regulariser weight
2571522df2eSJason Sarich 
2581eb8069cSJason Sarich   Level: beginner
2591522df2eSJason Sarich M*/
2601522df2eSJason Sarich 
261728e0ed0SBarry Smith PETSC_EXTERN PetscErrorCode TaoCreate_BMRM(Tao tao)
262a7e14dcfSSatish Balay {
263a7e14dcfSSatish Balay   TAO_BMRM       *bmrm;
264a7e14dcfSSatish Balay   PetscErrorCode ierr;
265a7e14dcfSSatish Balay 
266a7e14dcfSSatish Balay   PetscFunctionBegin;
267a7e14dcfSSatish Balay   tao->ops->setup = TaoSetup_BMRM;
268a7e14dcfSSatish Balay   tao->ops->solve = TaoSolve_BMRM;
269a7e14dcfSSatish Balay   tao->ops->view  = TaoView_BMRM;
270a7e14dcfSSatish Balay   tao->ops->setfromoptions = TaoSetFromOptions_BMRM;
271a7e14dcfSSatish Balay   tao->ops->destroy = TaoDestroy_BMRM;
272a7e14dcfSSatish Balay 
2733c9e27cfSGeoffrey Irving   ierr = PetscNewLog(tao,&bmrm);CHKERRQ(ierr);
274a7e14dcfSSatish Balay   bmrm->lambda = 1.0;
275a7e14dcfSSatish Balay   tao->data = (void*)bmrm;
276a7e14dcfSSatish Balay 
2776552cf8aSJason Sarich   /* Override default settings (unless already changed) */
2786552cf8aSJason Sarich   if (!tao->max_it_changed) tao->max_it = 2000;
2796552cf8aSJason Sarich   if (!tao->max_funcs_changed) tao->max_funcs = 4000;
2806552cf8aSJason Sarich   if (!tao->gatol_changed) tao->gatol = 1.0e-12;
2816552cf8aSJason Sarich   if (!tao->grtol_changed) tao->grtol = 1.0e-12;
282a7e14dcfSSatish Balay 
283a7e14dcfSSatish Balay   PetscFunctionReturn(0);
284a7e14dcfSSatish Balay }
285a7e14dcfSSatish Balay 
286a7e14dcfSSatish Balay PetscErrorCode init_df_solver(TAO_DF *df)
287a7e14dcfSSatish Balay {
288a7e14dcfSSatish Balay   PetscInt       i, n = INCRE_DIM;
289a7e14dcfSSatish Balay   PetscErrorCode ierr;
290a7e14dcfSSatish Balay 
291a7e14dcfSSatish Balay   PetscFunctionBegin;
292a7e14dcfSSatish Balay   /* default values */
293a7e14dcfSSatish Balay   df->maxProjIter = 200;
294a7e14dcfSSatish Balay   df->maxPGMIter = 300000;
295a7e14dcfSSatish Balay   df->b = 1.0;
296a7e14dcfSSatish Balay 
297a7e14dcfSSatish Balay   /* memory space required by Dai-Fletcher */
298a7e14dcfSSatish Balay   df->cur_num_cp = n;
2990e660641SBarry Smith   ierr = PetscMalloc1(n, &df->f);CHKERRQ(ierr);
3000e660641SBarry Smith   ierr = PetscMalloc1(n, &df->a);CHKERRQ(ierr);
3010e660641SBarry Smith   ierr = PetscMalloc1(n, &df->l);CHKERRQ(ierr);
3020e660641SBarry Smith   ierr = PetscMalloc1(n, &df->u);CHKERRQ(ierr);
3030e660641SBarry Smith   ierr = PetscMalloc1(n, &df->x);CHKERRQ(ierr);
304e1cc520bSBarry Smith   ierr = PetscMalloc1(n, &df->Q);CHKERRQ(ierr);
305a7e14dcfSSatish Balay 
306a7e14dcfSSatish Balay   for (i = 0; i < n; i ++) {
3070e660641SBarry Smith     ierr = PetscMalloc1(n, &df->Q[i]);CHKERRQ(ierr);
308a7e14dcfSSatish Balay   }
309a7e14dcfSSatish Balay 
3100e660641SBarry Smith   ierr = PetscMalloc1(n, &df->g);CHKERRQ(ierr);
3110e660641SBarry Smith   ierr = PetscMalloc1(n, &df->y);CHKERRQ(ierr);
3120e660641SBarry Smith   ierr = PetscMalloc1(n, &df->tempv);CHKERRQ(ierr);
3130e660641SBarry Smith   ierr = PetscMalloc1(n, &df->d);CHKERRQ(ierr);
3140e660641SBarry Smith   ierr = PetscMalloc1(n, &df->Qd);CHKERRQ(ierr);
3150e660641SBarry Smith   ierr = PetscMalloc1(n, &df->t);CHKERRQ(ierr);
3160e660641SBarry Smith   ierr = PetscMalloc1(n, &df->xplus);CHKERRQ(ierr);
3170e660641SBarry Smith   ierr = PetscMalloc1(n, &df->tplus);CHKERRQ(ierr);
3180e660641SBarry Smith   ierr = PetscMalloc1(n, &df->sk);CHKERRQ(ierr);
3190e660641SBarry Smith   ierr = PetscMalloc1(n, &df->yk);CHKERRQ(ierr);
320a7e14dcfSSatish Balay 
321e1cc520bSBarry Smith   ierr = PetscMalloc1(n, &df->ipt);CHKERRQ(ierr);
322e1cc520bSBarry Smith   ierr = PetscMalloc1(n, &df->ipt2);CHKERRQ(ierr);
323e1cc520bSBarry Smith   ierr = PetscMalloc1(n, &df->uv);CHKERRQ(ierr);
324a7e14dcfSSatish Balay   PetscFunctionReturn(0);
325a7e14dcfSSatish Balay }
326a7e14dcfSSatish Balay 
327a7e14dcfSSatish Balay PetscErrorCode ensure_df_space(PetscInt dim, TAO_DF *df)
328a7e14dcfSSatish Balay {
329a7e14dcfSSatish Balay   PetscErrorCode ierr;
330a7e14dcfSSatish Balay   PetscReal      *tmp, **tmp_Q;
331a7e14dcfSSatish Balay   PetscInt       i, n, old_n;
332a7e14dcfSSatish Balay 
333a7e14dcfSSatish Balay   PetscFunctionBegin;
33453506e15SBarry Smith   df->dim = dim;
33553506e15SBarry Smith   if (dim <= df->cur_num_cp) PetscFunctionReturn(0);
336a7e14dcfSSatish Balay 
337a7e14dcfSSatish Balay   old_n = df->cur_num_cp;
338a7e14dcfSSatish Balay   df->cur_num_cp += INCRE_DIM;
339a7e14dcfSSatish Balay   n = df->cur_num_cp;
340a7e14dcfSSatish Balay 
341a7e14dcfSSatish Balay   /* memory space required by dai-fletcher */
3420e660641SBarry Smith   ierr = PetscMalloc1(n, &tmp);CHKERRQ(ierr);
343a7e14dcfSSatish Balay   ierr = PetscMemcpy(tmp, df->f, sizeof(PetscReal)*old_n);CHKERRQ(ierr);
344a7e14dcfSSatish Balay   ierr = PetscFree(df->f);CHKERRQ(ierr);
345a7e14dcfSSatish Balay   df->f = tmp;
346a7e14dcfSSatish Balay 
3470e660641SBarry Smith   ierr = PetscMalloc1(n, &tmp);CHKERRQ(ierr);
348a7e14dcfSSatish Balay   ierr = PetscMemcpy(tmp, df->a, sizeof(PetscReal)*old_n);CHKERRQ(ierr);
349a7e14dcfSSatish Balay   ierr = PetscFree(df->a);CHKERRQ(ierr);
350a7e14dcfSSatish Balay   df->a = tmp;
351a7e14dcfSSatish Balay 
3520e660641SBarry Smith   ierr = PetscMalloc1(n, &tmp);CHKERRQ(ierr);
353a7e14dcfSSatish Balay   ierr = PetscMemcpy(tmp, df->l, sizeof(PetscReal)*old_n);CHKERRQ(ierr);
354a7e14dcfSSatish Balay   ierr = PetscFree(df->l);CHKERRQ(ierr);
355a7e14dcfSSatish Balay   df->l = tmp;
356a7e14dcfSSatish Balay 
3570e660641SBarry Smith   ierr = PetscMalloc1(n, &tmp);CHKERRQ(ierr);
358a7e14dcfSSatish Balay   ierr = PetscMemcpy(tmp, df->u, sizeof(PetscReal)*old_n);CHKERRQ(ierr);
359a7e14dcfSSatish Balay   ierr = PetscFree(df->u);CHKERRQ(ierr);
360a7e14dcfSSatish Balay   df->u = tmp;
361a7e14dcfSSatish Balay 
3620e660641SBarry Smith   ierr = PetscMalloc1(n, &tmp);CHKERRQ(ierr);
363a7e14dcfSSatish Balay   ierr = PetscMemcpy(tmp, df->x, sizeof(PetscReal)*old_n);CHKERRQ(ierr);
364a7e14dcfSSatish Balay   ierr = PetscFree(df->x);CHKERRQ(ierr);
365a7e14dcfSSatish Balay   df->x = tmp;
366a7e14dcfSSatish Balay 
367e1cc520bSBarry Smith   ierr = PetscMalloc1(n, &tmp_Q);CHKERRQ(ierr);
36853506e15SBarry Smith   for (i = 0; i < n; i ++) {
3690e660641SBarry Smith     ierr = PetscMalloc1(n, &tmp_Q[i]);CHKERRQ(ierr);
37053506e15SBarry Smith     if (i < old_n) {
371a7e14dcfSSatish Balay       ierr = PetscMemcpy(tmp_Q[i], df->Q[i], sizeof(PetscReal)*old_n);CHKERRQ(ierr);
372a7e14dcfSSatish Balay       ierr = PetscFree(df->Q[i]);CHKERRQ(ierr);
373a7e14dcfSSatish Balay     }
374a7e14dcfSSatish Balay   }
375a7e14dcfSSatish Balay 
376a7e14dcfSSatish Balay   ierr = PetscFree(df->Q);CHKERRQ(ierr);
377a7e14dcfSSatish Balay   df->Q = tmp_Q;
378a7e14dcfSSatish Balay 
379a7e14dcfSSatish Balay   ierr = PetscFree(df->g);CHKERRQ(ierr);
3800e660641SBarry Smith   ierr = PetscMalloc1(n, &df->g);CHKERRQ(ierr);
381a7e14dcfSSatish Balay 
382a7e14dcfSSatish Balay   ierr = PetscFree(df->y);CHKERRQ(ierr);
3830e660641SBarry Smith   ierr = PetscMalloc1(n, &df->y);CHKERRQ(ierr);
384a7e14dcfSSatish Balay 
385a7e14dcfSSatish Balay   ierr = PetscFree(df->tempv);CHKERRQ(ierr);
3860e660641SBarry Smith   ierr = PetscMalloc1(n, &df->tempv);CHKERRQ(ierr);
387a7e14dcfSSatish Balay 
388a7e14dcfSSatish Balay   ierr = PetscFree(df->d);CHKERRQ(ierr);
3890e660641SBarry Smith   ierr = PetscMalloc1(n, &df->d);CHKERRQ(ierr);
390a7e14dcfSSatish Balay 
391a7e14dcfSSatish Balay   ierr = PetscFree(df->Qd);CHKERRQ(ierr);
3920e660641SBarry Smith   ierr = PetscMalloc1(n, &df->Qd);CHKERRQ(ierr);
393a7e14dcfSSatish Balay 
394a7e14dcfSSatish Balay   ierr = PetscFree(df->t);CHKERRQ(ierr);
3950e660641SBarry Smith   ierr = PetscMalloc1(n, &df->t);CHKERRQ(ierr);
396a7e14dcfSSatish Balay 
397a7e14dcfSSatish Balay   ierr = PetscFree(df->xplus);CHKERRQ(ierr);
3980e660641SBarry Smith   ierr = PetscMalloc1(n, &df->xplus);CHKERRQ(ierr);
399a7e14dcfSSatish Balay 
400a7e14dcfSSatish Balay   ierr = PetscFree(df->tplus);CHKERRQ(ierr);
4010e660641SBarry Smith   ierr = PetscMalloc1(n, &df->tplus);CHKERRQ(ierr);
402a7e14dcfSSatish Balay 
403a7e14dcfSSatish Balay   ierr = PetscFree(df->sk);CHKERRQ(ierr);
4040e660641SBarry Smith   ierr = PetscMalloc1(n, &df->sk);CHKERRQ(ierr);
405a7e14dcfSSatish Balay 
406a7e14dcfSSatish Balay   ierr = PetscFree(df->yk);CHKERRQ(ierr);
4070e660641SBarry Smith   ierr = PetscMalloc1(n, &df->yk);CHKERRQ(ierr);
408a7e14dcfSSatish Balay 
409a7e14dcfSSatish Balay   ierr = PetscFree(df->ipt);CHKERRQ(ierr);
410e1cc520bSBarry Smith   ierr = PetscMalloc1(n, &df->ipt);CHKERRQ(ierr);
411a7e14dcfSSatish Balay 
412a7e14dcfSSatish Balay   ierr = PetscFree(df->ipt2);CHKERRQ(ierr);
4130e660641SBarry Smith   ierr = PetscMalloc1(n, &df->ipt2);CHKERRQ(ierr);
414a7e14dcfSSatish Balay 
415a7e14dcfSSatish Balay   ierr = PetscFree(df->uv);CHKERRQ(ierr);
4160e660641SBarry Smith   ierr = PetscMalloc1(n, &df->uv);CHKERRQ(ierr);
417a7e14dcfSSatish Balay   PetscFunctionReturn(0);
418a7e14dcfSSatish Balay }
419a7e14dcfSSatish Balay 
420a7e14dcfSSatish Balay PetscErrorCode destroy_df_solver(TAO_DF *df)
421a7e14dcfSSatish Balay {
422a7e14dcfSSatish Balay   PetscErrorCode ierr;
423a7e14dcfSSatish Balay   PetscInt       i;
4246c23d075SBarry Smith 
425a7e14dcfSSatish Balay   PetscFunctionBegin;
4266c23d075SBarry Smith   ierr = PetscFree(df->f);CHKERRQ(ierr);
4276c23d075SBarry Smith   ierr = PetscFree(df->a);CHKERRQ(ierr);
4286c23d075SBarry Smith   ierr = PetscFree(df->l);CHKERRQ(ierr);
4296c23d075SBarry Smith   ierr = PetscFree(df->u);CHKERRQ(ierr);
4306c23d075SBarry Smith   ierr = PetscFree(df->x);CHKERRQ(ierr);
431a7e14dcfSSatish Balay 
4326c23d075SBarry Smith   for (i = 0; i < df->cur_num_cp; i ++) {
433a7e14dcfSSatish Balay     ierr = PetscFree(df->Q[i]);CHKERRQ(ierr);
434a7e14dcfSSatish Balay   }
435a7e14dcfSSatish Balay   ierr = PetscFree(df->Q);CHKERRQ(ierr);
4366c23d075SBarry Smith   ierr = PetscFree(df->ipt);CHKERRQ(ierr);
4376c23d075SBarry Smith   ierr = PetscFree(df->ipt2);CHKERRQ(ierr);
4386c23d075SBarry Smith   ierr = PetscFree(df->uv);CHKERRQ(ierr);
4396c23d075SBarry Smith   ierr = PetscFree(df->g);CHKERRQ(ierr);
4406c23d075SBarry Smith   ierr = PetscFree(df->y);CHKERRQ(ierr);
4416c23d075SBarry Smith   ierr = PetscFree(df->tempv);CHKERRQ(ierr);
4426c23d075SBarry Smith   ierr = PetscFree(df->d);CHKERRQ(ierr);
4436c23d075SBarry Smith   ierr = PetscFree(df->Qd);CHKERRQ(ierr);
4446c23d075SBarry Smith   ierr = PetscFree(df->t);CHKERRQ(ierr);
4456c23d075SBarry Smith   ierr = PetscFree(df->xplus);CHKERRQ(ierr);
4466c23d075SBarry Smith   ierr = PetscFree(df->tplus);CHKERRQ(ierr);
4476c23d075SBarry Smith   ierr = PetscFree(df->sk);CHKERRQ(ierr);
4486c23d075SBarry Smith   ierr = PetscFree(df->yk);CHKERRQ(ierr);
449a7e14dcfSSatish Balay   PetscFunctionReturn(0);
450a7e14dcfSSatish Balay }
451a7e14dcfSSatish Balay 
452a7e14dcfSSatish Balay /* Piecewise linear monotone target function for the Dai-Fletcher projector */
4536c23d075SBarry Smith PetscReal phi(PetscReal *x,PetscInt n,PetscReal lambda,PetscReal *a,PetscReal b,PetscReal *c,PetscReal *l,PetscReal *u)
454a7e14dcfSSatish Balay {
455a7e14dcfSSatish Balay   PetscReal r = 0.0;
456a7e14dcfSSatish Balay   PetscInt  i;
457a7e14dcfSSatish Balay 
458a7e14dcfSSatish Balay   for (i = 0; i < n; i++){
459a7e14dcfSSatish Balay     x[i] = -c[i] + lambda*a[i];
4606c23d075SBarry Smith     if (x[i] > u[i])     x[i] = u[i];
4616c23d075SBarry Smith     else if(x[i] < l[i]) x[i] = l[i];
462a7e14dcfSSatish Balay     r += a[i]*x[i];
463a7e14dcfSSatish Balay   }
464a7e14dcfSSatish Balay   return r - b;
465a7e14dcfSSatish Balay }
466a7e14dcfSSatish Balay 
467a7e14dcfSSatish Balay /** Modified Dai-Fletcher QP projector solves the problem:
468a7e14dcfSSatish Balay  *
469a7e14dcfSSatish Balay  *      minimise  0.5*x'*x - c'*x
470a7e14dcfSSatish Balay  *      subj to   a'*x = b
471a7e14dcfSSatish Balay  *                l \leq x \leq u
472a7e14dcfSSatish Balay  *
473a7e14dcfSSatish Balay  *  \param c The point to be projected onto feasible set
474a7e14dcfSSatish Balay  */
4756c23d075SBarry Smith PetscInt project(PetscInt n,PetscReal *a,PetscReal b,PetscReal *c,PetscReal *l,PetscReal *u,PetscReal *x,PetscReal *lam_ext,TAO_DF *df)
476a7e14dcfSSatish Balay {
477a7e14dcfSSatish Balay   PetscReal      lambda, lambdal, lambdau, dlambda, lambda_new;
478a7e14dcfSSatish Balay   PetscReal      r, rl, ru, s;
479a7e14dcfSSatish Balay   PetscInt       innerIter;
480a7e14dcfSSatish Balay   PetscBool      nonNegativeSlack = PETSC_FALSE;
48153506e15SBarry Smith   PetscErrorCode ierr;
482a7e14dcfSSatish Balay 
483a7e14dcfSSatish Balay   *lam_ext = 0;
484a7e14dcfSSatish Balay   lambda  = 0;
485a7e14dcfSSatish Balay   dlambda = 0.5;
486a7e14dcfSSatish Balay   innerIter = 1;
487a7e14dcfSSatish Balay 
488a7e14dcfSSatish Balay   /*  \phi(x;lambda) := 0.5*x'*x + c'*x - lambda*(a'*x-b)
489a7e14dcfSSatish Balay    *
490a7e14dcfSSatish Balay    *  Optimality conditions for \phi:
491a7e14dcfSSatish Balay    *
492a7e14dcfSSatish Balay    *  1. lambda   <= 0
493a7e14dcfSSatish Balay    *  2. r        <= 0
494a7e14dcfSSatish Balay    *  3. r*lambda == 0
495a7e14dcfSSatish Balay    */
496a7e14dcfSSatish Balay 
497a7e14dcfSSatish Balay   /* Bracketing Phase */
498a7e14dcfSSatish Balay   r = phi(x, n, lambda, a, b, c, l, u);
499a7e14dcfSSatish Balay 
5006c23d075SBarry Smith   if(nonNegativeSlack) {
501a7e14dcfSSatish Balay     /* inequality constraint, i.e., with \xi >= 0 constraint */
50253506e15SBarry Smith     if (r < TOL_R) return 0;
5036c23d075SBarry Smith   } else  {
504a7e14dcfSSatish Balay     /* equality constraint ,i.e., without \xi >= 0 constraint */
5051118d4bcSLisandro Dalcin     if (PetscAbsReal(r) < TOL_R) return 0;
506a7e14dcfSSatish Balay   }
507a7e14dcfSSatish Balay 
508a7e14dcfSSatish Balay   if (r < 0.0){
509a7e14dcfSSatish Balay     lambdal = lambda;
510a7e14dcfSSatish Balay     rl      = r;
511a7e14dcfSSatish Balay     lambda  = lambda + dlambda;
512a7e14dcfSSatish Balay     r       = phi(x, n, lambda, a, b, c, l, u);
513a7e14dcfSSatish Balay     while (r < 0.0 && dlambda < BMRM_INFTY)  {
514a7e14dcfSSatish Balay       lambdal = lambda;
515a7e14dcfSSatish Balay       s       = rl/r - 1.0;
516a7e14dcfSSatish Balay       if (s < 0.1) s = 0.1;
517a7e14dcfSSatish Balay       dlambda = dlambda + dlambda/s;
518a7e14dcfSSatish Balay       lambda  = lambda + dlambda;
519a7e14dcfSSatish Balay       rl      = r;
520a7e14dcfSSatish Balay       r       = phi(x, n, lambda, a, b, c, l, u);
521a7e14dcfSSatish Balay     }
522a7e14dcfSSatish Balay     lambdau = lambda;
523a7e14dcfSSatish Balay     ru      = r;
5246c23d075SBarry Smith   } else {
525a7e14dcfSSatish Balay     lambdau = lambda;
526a7e14dcfSSatish Balay     ru      = r;
527a7e14dcfSSatish Balay     lambda  = lambda - dlambda;
528a7e14dcfSSatish Balay     r       = phi(x, n, lambda, a, b, c, l, u);
529a7e14dcfSSatish Balay     while (r > 0.0 && dlambda > -BMRM_INFTY) {
530a7e14dcfSSatish Balay       lambdau = lambda;
531a7e14dcfSSatish Balay       s       = ru/r - 1.0;
532a7e14dcfSSatish Balay       if (s < 0.1) s = 0.1;
533a7e14dcfSSatish Balay       dlambda = dlambda + dlambda/s;
534a7e14dcfSSatish Balay       lambda  = lambda - dlambda;
535a7e14dcfSSatish Balay       ru      = r;
536a7e14dcfSSatish Balay       r       = phi(x, n, lambda, a, b, c, l, u);
537a7e14dcfSSatish Balay     }
538a7e14dcfSSatish Balay     lambdal = lambda;
539a7e14dcfSSatish Balay     rl      = r;
540a7e14dcfSSatish Balay   }
541a7e14dcfSSatish Balay 
5421118d4bcSLisandro Dalcin   if(PetscAbsReal(dlambda) > BMRM_INFTY) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"L2N2_DaiFletcherPGM detected Infeasible QP problem!");
543a7e14dcfSSatish Balay 
544a7e14dcfSSatish Balay   if(ru == 0){
545a7e14dcfSSatish Balay     return innerIter;
546a7e14dcfSSatish Balay   }
547a7e14dcfSSatish Balay 
548a7e14dcfSSatish Balay   /* Secant Phase */
549a7e14dcfSSatish Balay   s       = 1.0 - rl/ru;
550a7e14dcfSSatish Balay   dlambda = dlambda/s;
551a7e14dcfSSatish Balay   lambda  = lambdau - dlambda;
552a7e14dcfSSatish Balay   r       = phi(x, n, lambda, a, b, c, l, u);
553a7e14dcfSSatish Balay 
5541118d4bcSLisandro Dalcin   while (PetscAbsReal(r) > TOL_R
5551118d4bcSLisandro Dalcin          && dlambda > TOL_LAM * (1.0 + PetscAbsReal(lambda))
556a7e14dcfSSatish Balay          && innerIter < df->maxProjIter){
557a7e14dcfSSatish Balay     innerIter++;
558a7e14dcfSSatish Balay     if (r > 0.0){
559a7e14dcfSSatish Balay       if (s <= 2.0){
560a7e14dcfSSatish Balay         lambdau = lambda;
561a7e14dcfSSatish Balay         ru      = r;
562a7e14dcfSSatish Balay         s       = 1.0 - rl/ru;
563a7e14dcfSSatish Balay         dlambda = (lambdau - lambdal) / s;
564a7e14dcfSSatish Balay         lambda  = lambdau - dlambda;
56553506e15SBarry Smith       } else {
566a7e14dcfSSatish Balay         s          = ru/r-1.0;
567a7e14dcfSSatish Balay         if (s < 0.1) s = 0.1;
568a7e14dcfSSatish Balay         dlambda    = (lambdau - lambda) / s;
569a7e14dcfSSatish Balay         lambda_new = 0.75*lambdal + 0.25*lambda;
570a7e14dcfSSatish Balay         if (lambda_new < (lambda - dlambda))
571a7e14dcfSSatish Balay           lambda_new = lambda - dlambda;
572a7e14dcfSSatish Balay         lambdau    = lambda;
573a7e14dcfSSatish Balay         ru         = r;
574a7e14dcfSSatish Balay         lambda     = lambda_new;
575a7e14dcfSSatish Balay         s          = (lambdau - lambdal) / (lambdau - lambda);
576a7e14dcfSSatish Balay       }
57753506e15SBarry Smith     } else {
578a7e14dcfSSatish Balay       if (s >= 2.0){
579a7e14dcfSSatish Balay         lambdal = lambda;
580a7e14dcfSSatish Balay         rl      = r;
581a7e14dcfSSatish Balay         s       = 1.0 - rl/ru;
582a7e14dcfSSatish Balay         dlambda = (lambdau - lambdal) / s;
583a7e14dcfSSatish Balay         lambda  = lambdau - dlambda;
58453506e15SBarry Smith       } else {
585a7e14dcfSSatish Balay         s          = rl/r - 1.0;
586a7e14dcfSSatish Balay         if (s < 0.1) s = 0.1;
587a7e14dcfSSatish Balay         dlambda    = (lambda-lambdal) / s;
588a7e14dcfSSatish Balay         lambda_new = 0.75*lambdau + 0.25*lambda;
589a7e14dcfSSatish Balay         if (lambda_new > (lambda + dlambda))
590a7e14dcfSSatish Balay           lambda_new = lambda + dlambda;
591a7e14dcfSSatish Balay         lambdal    = lambda;
592a7e14dcfSSatish Balay         rl         = r;
593a7e14dcfSSatish Balay         lambda     = lambda_new;
594a7e14dcfSSatish Balay         s          = (lambdau - lambdal) / (lambdau-lambda);
595a7e14dcfSSatish Balay       }
596a7e14dcfSSatish Balay     }
597a7e14dcfSSatish Balay     r = phi(x, n, lambda, a, b, c, l, u);
598a7e14dcfSSatish Balay   }
599a7e14dcfSSatish Balay 
600a7e14dcfSSatish Balay   *lam_ext = lambda;
60153506e15SBarry Smith   if(innerIter >= df->maxProjIter) {
60253506e15SBarry Smith     ierr = PetscPrintf(PETSC_COMM_SELF, "WARNING: DaiFletcher max iterations\n");CHKERRQ(ierr);
60353506e15SBarry Smith   }
604a7e14dcfSSatish Balay   return innerIter;
605a7e14dcfSSatish Balay }
606a7e14dcfSSatish Balay 
607a7e14dcfSSatish Balay 
608a7e14dcfSSatish Balay PetscErrorCode solve(TAO_DF *df)
609a7e14dcfSSatish Balay {
610a7e14dcfSSatish Balay   PetscErrorCode ierr;
611a7e14dcfSSatish Balay   PetscInt       i, j, innerIter, it, it2, luv, info, lscount = 0, projcount = 0;
612a7e14dcfSSatish Balay   PetscReal      gd, max, ak, bk, akold, bkold, lamnew, alpha, kktlam=0.0, lam_ext;
613a7e14dcfSSatish Balay   PetscReal      DELTAsv, ProdDELTAsv;
614a7e14dcfSSatish Balay   PetscReal      c, *tempQ;
615a7e14dcfSSatish Balay   PetscReal      *x = df->x, *a = df->a, b = df->b, *l = df->l, *u = df->u, tol = df->tol;
616a7e14dcfSSatish Balay   PetscReal      *tempv = df->tempv, *y = df->y, *g = df->g, *d = df->d, *Qd = df->Qd;
617a7e14dcfSSatish Balay   PetscReal      *xplus = df->xplus, *tplus = df->tplus, *sk = df->sk, *yk = df->yk;
618a7e14dcfSSatish Balay   PetscReal      **Q = df->Q, *f = df->f, *t = df->t;
619a7e14dcfSSatish Balay   PetscInt       dim = df->dim, *ipt = df->ipt, *ipt2 = df->ipt2, *uv = df->uv;
620a7e14dcfSSatish Balay 
621a7e14dcfSSatish Balay   /*** variables for the adaptive nonmonotone linesearch ***/
622a7e14dcfSSatish Balay   PetscInt    L, llast;
623a7e14dcfSSatish Balay   PetscReal   fr, fbest, fv, fc, fv0;
62453506e15SBarry Smith 
625a7e14dcfSSatish Balay   c = BMRM_INFTY;
626a7e14dcfSSatish Balay 
627a7e14dcfSSatish Balay   DELTAsv = EPS_SV;
62853506e15SBarry Smith   if (tol <= 1.0e-5 || dim <= 20) ProdDELTAsv = 0.0F;
62953506e15SBarry Smith   else  ProdDELTAsv = EPS_SV;
630a7e14dcfSSatish Balay 
63153506e15SBarry Smith   for (i = 0; i < dim; i++)  tempv[i] = -x[i];
632a7e14dcfSSatish Balay 
633a7e14dcfSSatish Balay   lam_ext = 0.0;
634a7e14dcfSSatish Balay 
635a7e14dcfSSatish Balay   /* Project the initial solution */
636a7e14dcfSSatish Balay   projcount += project(dim, a, b, tempv, l, u, x, &lam_ext, df);
637a7e14dcfSSatish Balay 
638a7e14dcfSSatish Balay   /* Compute gradient
639a7e14dcfSSatish Balay      g = Q*x + f; */
640a7e14dcfSSatish Balay 
641a7e14dcfSSatish Balay   it = 0;
64253506e15SBarry Smith   for (i = 0; i < dim; i++) {
6431118d4bcSLisandro Dalcin     if (PetscAbsReal(x[i]) > ProdDELTAsv) ipt[it++] = i;
64453506e15SBarry Smith   }
645a7e14dcfSSatish Balay 
646a7e14dcfSSatish Balay   ierr = PetscMemzero(t, dim*sizeof(PetscReal));CHKERRQ(ierr);
647a7e14dcfSSatish Balay   for (i = 0; i < it; i++){
648a7e14dcfSSatish Balay     tempQ = Q[ipt[i]];
64953506e15SBarry Smith     for (j = 0; j < dim; j++) t[j] += (tempQ[j]*x[ipt[i]]);
650a7e14dcfSSatish Balay   }
651a7e14dcfSSatish Balay   for (i = 0; i < dim; i++){
652a7e14dcfSSatish Balay     g[i] = t[i] + f[i];
653a7e14dcfSSatish Balay   }
654a7e14dcfSSatish Balay 
655a7e14dcfSSatish Balay 
656a7e14dcfSSatish Balay   /* y = -(x_{k} - g_{k}) */
657a7e14dcfSSatish Balay   for (i = 0; i < dim; i++){
658a7e14dcfSSatish Balay     y[i] = g[i] - x[i];
659a7e14dcfSSatish Balay   }
660a7e14dcfSSatish Balay 
661a7e14dcfSSatish Balay   /* Project x_{k} - g_{k} */
662a7e14dcfSSatish Balay   projcount += project(dim, a, b, y, l, u, tempv, &lam_ext, df);
663a7e14dcfSSatish Balay 
664a7e14dcfSSatish Balay   /* y = P(x_{k} - g_{k}) - x_{k} */
665a7e14dcfSSatish Balay   max = ALPHA_MIN;
666a7e14dcfSSatish Balay   for (i = 0; i < dim; i++){
667a7e14dcfSSatish Balay     y[i] = tempv[i] - x[i];
6681118d4bcSLisandro Dalcin     if (PetscAbsReal(y[i]) > max) max = PetscAbsReal(y[i]);
669a7e14dcfSSatish Balay   }
670a7e14dcfSSatish Balay 
671a7e14dcfSSatish Balay   if (max < tol*1e-3){
672a7e14dcfSSatish Balay     return 0;
673a7e14dcfSSatish Balay   }
674a7e14dcfSSatish Balay 
675a7e14dcfSSatish Balay   alpha = 1.0 / max;
676a7e14dcfSSatish Balay 
677a7e14dcfSSatish Balay   /* fv0 = f(x_{0}). Recall t = Q x_{k}  */
678a7e14dcfSSatish Balay   fv0   = 0.0;
67953506e15SBarry Smith   for (i = 0; i < dim; i++) fv0 += x[i] * (0.5*t[i] + f[i]);
680a7e14dcfSSatish Balay 
681a7e14dcfSSatish Balay   /*** adaptive nonmonotone linesearch ***/
682a7e14dcfSSatish Balay   L     = 2;
683a7e14dcfSSatish Balay   fr    = ALPHA_MAX;
684a7e14dcfSSatish Balay   fbest = fv0;
685a7e14dcfSSatish Balay   fc    = fv0;
686a7e14dcfSSatish Balay   llast = 0;
687a7e14dcfSSatish Balay   akold = bkold = 0.0;
688a7e14dcfSSatish Balay 
689a7e14dcfSSatish Balay   /***      Iterator begins     ***/
690a7e14dcfSSatish Balay   for (innerIter = 1; innerIter <= df->maxPGMIter; innerIter++) {
691a7e14dcfSSatish Balay 
692a7e14dcfSSatish Balay     /* tempv = -(x_{k} - alpha*g_{k}) */
69353506e15SBarry Smith     for (i = 0; i < dim; i++)  tempv[i] = alpha*g[i] - x[i];
694a7e14dcfSSatish Balay 
695a7e14dcfSSatish Balay     /* Project x_{k} - alpha*g_{k} */
696a7e14dcfSSatish Balay     projcount += project(dim, a, b, tempv, l, u, y, &lam_ext, df);
697a7e14dcfSSatish Balay 
698a7e14dcfSSatish Balay 
699a7e14dcfSSatish Balay     /* gd = \inner{d_{k}}{g_{k}}
700a7e14dcfSSatish Balay         d = P(x_{k} - alpha*g_{k}) - x_{k}
701a7e14dcfSSatish Balay     */
702a7e14dcfSSatish Balay     gd = 0.0;
703a7e14dcfSSatish Balay     for (i = 0; i < dim; i++){
704a7e14dcfSSatish Balay       d[i] = y[i] - x[i];
705a7e14dcfSSatish Balay       gd  += d[i] * g[i];
706a7e14dcfSSatish Balay     }
707a7e14dcfSSatish Balay 
708a7e14dcfSSatish Balay     /* Gradient computation  */
709a7e14dcfSSatish Balay 
710a7e14dcfSSatish Balay     /* compute Qd = Q*d  or  Qd = Q*y - t depending on their sparsity */
711a7e14dcfSSatish Balay 
712a7e14dcfSSatish Balay     it = it2 = 0;
71353506e15SBarry Smith     for (i = 0; i < dim; i++){
7141118d4bcSLisandro Dalcin       if (PetscAbsReal(d[i]) > (ProdDELTAsv*1.0e-2)) ipt[it++]   = i;
71553506e15SBarry Smith     }
71653506e15SBarry Smith     for (i = 0; i < dim; i++) {
7171118d4bcSLisandro Dalcin       if (PetscAbsReal(y[i]) > ProdDELTAsv) ipt2[it2++] = i;
71853506e15SBarry Smith     }
719a7e14dcfSSatish Balay 
720a7e14dcfSSatish Balay     ierr = PetscMemzero(Qd, dim*sizeof(PetscReal));CHKERRQ(ierr);
721a7e14dcfSSatish Balay     /* compute Qd = Q*d */
722a7e14dcfSSatish Balay     if (it < it2){
723a7e14dcfSSatish Balay       for (i = 0; i < it; i++){
724a7e14dcfSSatish Balay         tempQ = Q[ipt[i]];
72553506e15SBarry Smith         for (j = 0; j < dim; j++) Qd[j] += (tempQ[j] * d[ipt[i]]);
726a7e14dcfSSatish Balay       }
72753506e15SBarry Smith     } else { /* compute Qd = Q*y-t */
728a7e14dcfSSatish Balay       for (i = 0; i < it2; i++){
729a7e14dcfSSatish Balay         tempQ = Q[ipt2[i]];
73053506e15SBarry Smith         for (j = 0; j < dim; j++) Qd[j] += (tempQ[j] * y[ipt2[i]]);
731a7e14dcfSSatish Balay       }
73253506e15SBarry Smith       for (j = 0; j < dim; j++) Qd[j] -= t[j];
733a7e14dcfSSatish Balay     }
734a7e14dcfSSatish Balay 
735a7e14dcfSSatish Balay     /* ak = inner{d_{k}}{d_{k}} */
736a7e14dcfSSatish Balay     ak = 0.0;
73753506e15SBarry Smith     for (i = 0; i < dim; i++) ak += d[i] * d[i];
738a7e14dcfSSatish Balay 
739a7e14dcfSSatish Balay     bk = 0.0;
74053506e15SBarry Smith     for (i = 0; i < dim; i++) bk += d[i]*Qd[i];
741a7e14dcfSSatish Balay 
74253506e15SBarry Smith     if (bk > EPS*ak && gd < 0.0)  lamnew = -gd/bk;
74353506e15SBarry Smith     else lamnew = 1.0;
744a7e14dcfSSatish Balay 
745a7e14dcfSSatish Balay     /* fv is computing f(x_{k} + d_{k}) */
746a7e14dcfSSatish Balay     fv = 0.0;
747a7e14dcfSSatish Balay     for (i = 0; i < dim; i++){
748a7e14dcfSSatish Balay       xplus[i] = x[i] + d[i];
749a7e14dcfSSatish Balay       tplus[i] = t[i] + Qd[i];
750a7e14dcfSSatish Balay       fv      += xplus[i] * (0.5*tplus[i] + f[i]);
751a7e14dcfSSatish Balay     }
752a7e14dcfSSatish Balay 
753a7e14dcfSSatish Balay     /* fr is fref */
754a7e14dcfSSatish Balay     if ((innerIter == 1 && fv >= fv0) || (innerIter > 1 && fv >= fr)){
755a7e14dcfSSatish Balay       lscount++;
756a7e14dcfSSatish Balay       fv = 0.0;
757a7e14dcfSSatish Balay       for (i = 0; i < dim; i++){
758a7e14dcfSSatish Balay         xplus[i] = x[i] + lamnew*d[i];
759a7e14dcfSSatish Balay         tplus[i] = t[i] + lamnew*Qd[i];
760a7e14dcfSSatish Balay         fv      += xplus[i] * (0.5*tplus[i] + f[i]);
761a7e14dcfSSatish Balay       }
762a7e14dcfSSatish Balay     }
763a7e14dcfSSatish Balay 
764a7e14dcfSSatish Balay     for (i = 0; i < dim; i++){
765a7e14dcfSSatish Balay       sk[i] = xplus[i] - x[i];
766a7e14dcfSSatish Balay       yk[i] = tplus[i] - t[i];
767a7e14dcfSSatish Balay       x[i]  = xplus[i];
768a7e14dcfSSatish Balay       t[i]  = tplus[i];
769a7e14dcfSSatish Balay       g[i]  = t[i] + f[i];
770a7e14dcfSSatish Balay     }
771a7e14dcfSSatish Balay 
772a7e14dcfSSatish Balay     /* update the line search control parameters */
773a7e14dcfSSatish Balay     if (fv < fbest){
774a7e14dcfSSatish Balay       fbest = fv;
775a7e14dcfSSatish Balay       fc    = fv;
776a7e14dcfSSatish Balay       llast = 0;
77753506e15SBarry Smith     } else {
778a7e14dcfSSatish Balay       fc = (fc > fv ? fc : fv);
779a7e14dcfSSatish Balay       llast++;
780a7e14dcfSSatish Balay       if (llast == L){
781a7e14dcfSSatish Balay         fr    = fc;
782a7e14dcfSSatish Balay         fc    = fv;
783a7e14dcfSSatish Balay         llast = 0;
784a7e14dcfSSatish Balay       }
785a7e14dcfSSatish Balay     }
786a7e14dcfSSatish Balay 
787a7e14dcfSSatish Balay     ak = bk = 0.0;
788a7e14dcfSSatish Balay     for (i = 0; i < dim; i++){
789a7e14dcfSSatish Balay       ak += sk[i] * sk[i];
790a7e14dcfSSatish Balay       bk += sk[i] * yk[i];
791a7e14dcfSSatish Balay     }
792a7e14dcfSSatish Balay 
79353506e15SBarry Smith     if (bk <= EPS*ak) alpha = ALPHA_MAX;
794a7e14dcfSSatish Balay     else {
79553506e15SBarry Smith       if (bkold < EPS*akold) alpha = ak/bk;
79653506e15SBarry Smith       else alpha = (akold+ak)/(bkold+bk);
797a7e14dcfSSatish Balay 
79853506e15SBarry Smith       if (alpha > ALPHA_MAX) alpha = ALPHA_MAX;
79953506e15SBarry Smith       else if (alpha < ALPHA_MIN) alpha = ALPHA_MIN;
800a7e14dcfSSatish Balay     }
801a7e14dcfSSatish Balay 
802a7e14dcfSSatish Balay     akold = ak;
803a7e14dcfSSatish Balay     bkold = bk;
804a7e14dcfSSatish Balay 
805a7e14dcfSSatish Balay     /*** stopping criterion based on KKT conditions ***/
806a7e14dcfSSatish Balay     /* at optimal, gradient of lagrangian w.r.t. x is zero */
807a7e14dcfSSatish Balay 
808a7e14dcfSSatish Balay     bk = 0.0;
80953506e15SBarry Smith     for (i = 0; i < dim; i++) bk +=  x[i] * x[i];
810a7e14dcfSSatish Balay 
81153506e15SBarry Smith     if (PetscSqrtReal(ak) < tol*10 * PetscSqrtReal(bk)){
812a7e14dcfSSatish Balay       it     = 0;
813a7e14dcfSSatish Balay       luv    = 0;
814a7e14dcfSSatish Balay       kktlam = 0.0;
815a7e14dcfSSatish Balay       for (i = 0; i < dim; i++){
816a7e14dcfSSatish Balay         /* x[i] is active hence lagrange multipliers for box constraints
817a7e14dcfSSatish Balay                 are zero. The lagrange multiplier for ineq. const. is then
818a7e14dcfSSatish Balay                 defined as below
819a7e14dcfSSatish Balay         */
820a7e14dcfSSatish Balay         if ((x[i] > DELTAsv) && (x[i] < c-DELTAsv)){
821a7e14dcfSSatish Balay           ipt[it++] = i;
822a7e14dcfSSatish Balay           kktlam    = kktlam - a[i]*g[i];
82353506e15SBarry Smith         } else  uv[luv++] = i;
824a7e14dcfSSatish Balay       }
825a7e14dcfSSatish Balay 
82653506e15SBarry Smith       if (it == 0 && PetscSqrtReal(ak) < tol*0.5 * PetscSqrtReal(bk)) return 0;
827a7e14dcfSSatish Balay       else {
828a7e14dcfSSatish Balay         kktlam = kktlam/it;
829a7e14dcfSSatish Balay         info   = 1;
830a7e14dcfSSatish Balay         for (i = 0; i < it; i++) {
8311118d4bcSLisandro Dalcin           if (PetscAbsReal(a[ipt[i]] * g[ipt[i]] + kktlam) > tol) {
832a7e14dcfSSatish Balay             info = 0;
833a7e14dcfSSatish Balay             break;
834a7e14dcfSSatish Balay           }
835a7e14dcfSSatish Balay         }
836a7e14dcfSSatish Balay         if (info == 1)  {
837a7e14dcfSSatish Balay           for (i = 0; i < luv; i++)  {
838a7e14dcfSSatish Balay             if (x[uv[i]] <= DELTAsv){
839a7e14dcfSSatish Balay               /* x[i] == lower bound, hence, lagrange multiplier (say, beta) for lower bound may
840a7e14dcfSSatish Balay                      not be zero. So, the gradient without beta is > 0
841a7e14dcfSSatish Balay               */
842a7e14dcfSSatish Balay               if (g[uv[i]] + kktlam*a[uv[i]] < -tol){
843a7e14dcfSSatish Balay                 info = 0;
844a7e14dcfSSatish Balay                 break;
845a7e14dcfSSatish Balay               }
84653506e15SBarry Smith             } else {
847a7e14dcfSSatish Balay               /* x[i] == upper bound, hence, lagrange multiplier (say, eta) for upper bound may
848a7e14dcfSSatish Balay                      not be zero. So, the gradient without eta is < 0
849a7e14dcfSSatish Balay               */
850a7e14dcfSSatish Balay               if (g[uv[i]] + kktlam*a[uv[i]] > tol) {
851a7e14dcfSSatish Balay                 info = 0;
852a7e14dcfSSatish Balay                 break;
853a7e14dcfSSatish Balay               }
854a7e14dcfSSatish Balay             }
855a7e14dcfSSatish Balay           }
856a7e14dcfSSatish Balay         }
857a7e14dcfSSatish Balay 
85853506e15SBarry Smith         if (info == 1) return 0;
859a7e14dcfSSatish Balay       }
860a7e14dcfSSatish Balay     }
861a7e14dcfSSatish Balay   }
862a7e14dcfSSatish Balay   return 0;
863a7e14dcfSSatish Balay }
864a7e14dcfSSatish Balay 
865a7e14dcfSSatish Balay 
866