xref: /petsc/src/tao/unconstrained/impls/bmrm/bmrm.c (revision aaa7dc30da3270cff6cb10b1db605b2ca746f216)
1*aaa7dc30SBarry Smith #include <../src/tao/unconstrained/impls/bmrm/bmrm.h>
2a7e14dcfSSatish Balay 
3a7e14dcfSSatish Balay static PetscErrorCode init_df_solver(TAO_DF*);
4a7e14dcfSSatish Balay static PetscErrorCode ensure_df_space(PetscInt, TAO_DF*);
5a7e14dcfSSatish Balay static PetscErrorCode destroy_df_solver(TAO_DF*);
60e660641SBarry Smith static PetscReal phi(PetscReal*,PetscInt,PetscReal,PetscReal*,PetscReal,PetscReal*,PetscReal*,PetscReal*);
70e660641SBarry Smith static PetscInt project(PetscInt,PetscReal*,PetscReal,PetscReal*,PetscReal*,PetscReal*,PetscReal*,PetscReal*,TAO_DF*);
8a7e14dcfSSatish Balay static PetscErrorCode solve(TAO_DF*);
9a7e14dcfSSatish Balay 
10a7e14dcfSSatish Balay 
11a7e14dcfSSatish Balay /*------------------------------------------------------------*/
12a7e14dcfSSatish Balay /* The main solver function
13a7e14dcfSSatish Balay 
14a7e14dcfSSatish Balay    f = Remp(W)          This is what the user provides us from the application layer
15a7e14dcfSSatish Balay    So the ComputeGradient function for instance should get us back the subgradient of Remp(W)
16a7e14dcfSSatish Balay 
17a7e14dcfSSatish Balay    Regularizer assumed to be L2 norm = lambda*0.5*W'W ()
18a7e14dcfSSatish Balay */
19a7e14dcfSSatish Balay 
20a7e14dcfSSatish Balay #undef __FUNCT__
21a7e14dcfSSatish Balay #define __FUNCT__ "make_grad_node"
22a7e14dcfSSatish Balay static PetscErrorCode make_grad_node(Vec X, Vec_Chain **p)
23a7e14dcfSSatish Balay {
24a7e14dcfSSatish Balay   PetscErrorCode ierr;
25a7e14dcfSSatish Balay 
26a7e14dcfSSatish Balay   PetscFunctionBegin;
270e660641SBarry Smith   ierr = PetscNew(p);CHKERRQ(ierr);
28a7e14dcfSSatish Balay   ierr = VecDuplicate(X, &(*p)->V);CHKERRQ(ierr);
29a7e14dcfSSatish Balay   ierr = VecCopy(X, (*p)->V);CHKERRQ(ierr);
306c23d075SBarry Smith   (*p)->next = NULL;
31a7e14dcfSSatish Balay   PetscFunctionReturn(0);
32a7e14dcfSSatish Balay }
33a7e14dcfSSatish Balay 
34a7e14dcfSSatish Balay #undef __FUNCT__
35a7e14dcfSSatish Balay #define __FUNCT__ "destroy_grad_list"
36a7e14dcfSSatish Balay static PetscErrorCode destroy_grad_list(Vec_Chain *head)
37a7e14dcfSSatish Balay {
38a7e14dcfSSatish Balay   PetscErrorCode ierr;
39a7e14dcfSSatish Balay   Vec_Chain      *p = head->next, *q;
40a7e14dcfSSatish Balay 
41a7e14dcfSSatish Balay   PetscFunctionBegin;
42a7e14dcfSSatish Balay   while(p) {
43a7e14dcfSSatish Balay     q = p->next;
44a7e14dcfSSatish Balay     ierr = VecDestroy(&p->V);CHKERRQ(ierr);
45a7e14dcfSSatish Balay     ierr = PetscFree(p);CHKERRQ(ierr);
46a7e14dcfSSatish Balay     p = q;
47a7e14dcfSSatish Balay   }
486c23d075SBarry Smith   head->next = NULL;
49a7e14dcfSSatish Balay   PetscFunctionReturn(0);
50a7e14dcfSSatish Balay }
51a7e14dcfSSatish Balay 
52a7e14dcfSSatish Balay 
53a7e14dcfSSatish Balay #undef __FUNCT__
54a7e14dcfSSatish Balay #define __FUNCT__ "TaoSolve_BMRM"
55a7e14dcfSSatish Balay static PetscErrorCode TaoSolve_BMRM(TaoSolver tao)
56a7e14dcfSSatish Balay {
57a7e14dcfSSatish Balay   PetscErrorCode             ierr;
58a7e14dcfSSatish Balay   TaoSolverTerminationReason reason;
59a7e14dcfSSatish Balay   TAO_DF                     df;
60a7e14dcfSSatish Balay   TAO_BMRM                   *bmrm = (TAO_BMRM*)tao->data;
61a7e14dcfSSatish Balay 
62a7e14dcfSSatish Balay   /* Values and pointers to parts of the optimization problem */
63a7e14dcfSSatish Balay   PetscReal                  f = 0.0;
64a7e14dcfSSatish Balay   Vec                        W = tao->solution;
65a7e14dcfSSatish Balay   Vec                        G = tao->gradient;
66a7e14dcfSSatish Balay   PetscReal                  lambda;
67a7e14dcfSSatish Balay   PetscReal                  bt;
68a7e14dcfSSatish Balay   Vec_Chain                  grad_list, *tail_glist, *pgrad;
69a7e14dcfSSatish Balay   PetscInt                   iter = 0;
70a7e14dcfSSatish Balay   PetscInt                   i;
71a7e14dcfSSatish Balay   PetscMPIInt                rank;
72a7e14dcfSSatish Balay 
73a7e14dcfSSatish Balay   /* Used in termination criteria check */
74a7e14dcfSSatish Balay   PetscReal                  reg;
75a7e14dcfSSatish Balay   PetscReal                  jtwt, max_jtwt, pre_epsilon, epsilon, jw, min_jw;
76a7e14dcfSSatish Balay   PetscReal                  innerSolverTol;
77a7e14dcfSSatish Balay 
78a7e14dcfSSatish Balay   PetscFunctionBegin;
79a7e14dcfSSatish Balay   ierr = MPI_Comm_rank(PETSC_COMM_WORLD, &rank);CHKERRQ(ierr);
80a7e14dcfSSatish Balay   lambda = bmrm->lambda;
81a7e14dcfSSatish Balay 
82a7e14dcfSSatish Balay   /* Check Stopping Condition */
83a7e14dcfSSatish Balay   tao->step = 1.0;
84a7e14dcfSSatish Balay   max_jtwt = -BMRM_INFTY;
85a7e14dcfSSatish Balay   min_jw = BMRM_INFTY;
86a7e14dcfSSatish Balay   innerSolverTol = 1.0;
87a7e14dcfSSatish Balay   epsilon = 0.0;
88a7e14dcfSSatish Balay 
890e660641SBarry Smith   if (!rank) {
90a7e14dcfSSatish Balay     ierr = init_df_solver(&df);CHKERRQ(ierr);
91a7e14dcfSSatish Balay     grad_list.next = NULL;
92a7e14dcfSSatish Balay     tail_glist = &grad_list;
93a7e14dcfSSatish Balay   }
94a7e14dcfSSatish Balay 
95a7e14dcfSSatish Balay   df.tol = 1e-6;
96a7e14dcfSSatish Balay   reason = TAO_CONTINUE_ITERATING;
97a7e14dcfSSatish Balay 
98a7e14dcfSSatish Balay   /*-----------------Algorithm Begins------------------------*/
99a7e14dcfSSatish Balay   /* make the scatter */
100a7e14dcfSSatish Balay   ierr = VecScatterCreateToZero(W, &bmrm->scatter, &bmrm->local_w);CHKERRQ(ierr);
101a7e14dcfSSatish Balay   ierr = VecAssemblyBegin(bmrm->local_w);CHKERRQ(ierr);
102a7e14dcfSSatish Balay   ierr = VecAssemblyEnd(bmrm->local_w);CHKERRQ(ierr);
103a7e14dcfSSatish Balay 
104a7e14dcfSSatish Balay   /* NOTE: In application pass the sub-gradient of Remp(W) */
105a7e14dcfSSatish Balay   ierr = TaoComputeObjectiveAndGradient(tao, W, &f, G);CHKERRQ(ierr);
106a7e14dcfSSatish Balay   ierr = TaoMonitor(tao,iter,f,1.0,0.0,tao->step,&reason);CHKERRQ(ierr);
107a7e14dcfSSatish Balay   while (reason == TAO_CONTINUE_ITERATING) {
108a7e14dcfSSatish Balay     /* compute bt = Remp(Wt-1) - <Wt-1, At> */
109a7e14dcfSSatish Balay     ierr = VecDot(W, G, &bt);CHKERRQ(ierr);
110a7e14dcfSSatish Balay     bt = f - bt;
111a7e14dcfSSatish Balay 
112a7e14dcfSSatish Balay     /* First gather the gradient to the master node */
113a7e14dcfSSatish Balay     ierr = VecScatterBegin(bmrm->scatter, G, bmrm->local_w, INSERT_VALUES, SCATTER_FORWARD);CHKERRQ(ierr);
114a7e14dcfSSatish Balay     ierr = VecScatterEnd(bmrm->scatter, G, bmrm->local_w, INSERT_VALUES, SCATTER_FORWARD);CHKERRQ(ierr);
115a7e14dcfSSatish Balay 
116a7e14dcfSSatish Balay     /* Bring up the inner solver */
1170e660641SBarry Smith     if (!rank) {
118a7e14dcfSSatish Balay       ierr = ensure_df_space(iter+1, &df); CHKERRQ(ierr);
119a7e14dcfSSatish Balay       ierr = make_grad_node(bmrm->local_w, &pgrad);CHKERRQ(ierr);
120a7e14dcfSSatish Balay       tail_glist->next = pgrad;
121a7e14dcfSSatish Balay       tail_glist = pgrad;
122a7e14dcfSSatish Balay 
123a7e14dcfSSatish Balay       df.a[iter] = 1.0;
124a7e14dcfSSatish Balay       df.f[iter] = -bt;
125a7e14dcfSSatish Balay       df.u[iter] = 1.0;
126a7e14dcfSSatish Balay       df.l[iter] = 0.0;
127a7e14dcfSSatish Balay 
128a7e14dcfSSatish Balay       /* set up the Q */
129a7e14dcfSSatish Balay       pgrad = grad_list.next;
130a7e14dcfSSatish Balay       for (i=0; i<=iter; i++) {
131a7e14dcfSSatish Balay         ierr = VecDot(pgrad->V, bmrm->local_w, &reg);CHKERRQ(ierr);
132a7e14dcfSSatish Balay         df.Q[i][iter] = df.Q[iter][i] = reg / lambda;
133a7e14dcfSSatish Balay         pgrad = pgrad->next;
134a7e14dcfSSatish Balay       }
135a7e14dcfSSatish Balay 
136a7e14dcfSSatish Balay       if (iter > 0) {
137a7e14dcfSSatish Balay         df.x[iter] = 0.0;
138a7e14dcfSSatish Balay         ierr = solve(&df); CHKERRQ(ierr);
1390e660641SBarry Smith       } else
140a7e14dcfSSatish Balay         df.x[0] = 1.0;
141a7e14dcfSSatish Balay 
142a7e14dcfSSatish Balay       /* now computing Jt*(alpha_t) which should be = Jt(wt) to check convergence */
143a7e14dcfSSatish Balay       jtwt = 0.0;
144a7e14dcfSSatish Balay       ierr = VecSet(bmrm->local_w, 0.0); CHKERRQ(ierr);
145a7e14dcfSSatish Balay       pgrad = grad_list.next;
146a7e14dcfSSatish Balay       for (i=0; i<=iter; i++) {
147a7e14dcfSSatish Balay         jtwt -= df.x[i] * df.f[i];
148a7e14dcfSSatish Balay         ierr = VecAXPY(bmrm->local_w, -df.x[i] / lambda, pgrad->V); CHKERRQ(ierr);
149a7e14dcfSSatish Balay         pgrad = pgrad->next;
150a7e14dcfSSatish Balay       }
151a7e14dcfSSatish Balay 
152a7e14dcfSSatish Balay       ierr = VecNorm(bmrm->local_w, NORM_2, &reg); CHKERRQ(ierr);
153a7e14dcfSSatish Balay       reg = 0.5*lambda*reg*reg;
154a7e14dcfSSatish Balay       jtwt -= reg;
155a7e14dcfSSatish Balay     } /* end if rank == 0 */
156a7e14dcfSSatish Balay 
157a7e14dcfSSatish Balay     /* scatter the new W to all nodes */
158a7e14dcfSSatish Balay     ierr = VecScatterBegin(bmrm->scatter,bmrm->local_w,W,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
159a7e14dcfSSatish Balay     ierr = VecScatterEnd(bmrm->scatter,bmrm->local_w,W,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
160a7e14dcfSSatish Balay 
161a7e14dcfSSatish Balay     ierr = TaoComputeObjectiveAndGradient(tao, W, &f, G);CHKERRQ(ierr);
162a7e14dcfSSatish Balay 
163a7e14dcfSSatish Balay     MPI_Bcast(&jtwt,1,MPI_DOUBLE,0,PETSC_COMM_WORLD);
164a7e14dcfSSatish Balay     MPI_Bcast(&reg,1,MPI_DOUBLE,0,PETSC_COMM_WORLD);
165a7e14dcfSSatish Balay 
166a7e14dcfSSatish Balay     jw = reg + f;                                       /* J(w) = regularizer + Remp(w) */
1670e660641SBarry Smith     if (jw < min_jw) min_jw = jw;
1680e660641SBarry Smith     if (jtwt > max_jtwt) max_jtwt = jtwt;
169a7e14dcfSSatish Balay 
170a7e14dcfSSatish Balay     pre_epsilon = epsilon;
171a7e14dcfSSatish Balay     epsilon = min_jw - jtwt;
172a7e14dcfSSatish Balay 
1730e660641SBarry Smith     if (!rank) {
1740e660641SBarry Smith       if (innerSolverTol > epsilon) innerSolverTol = epsilon;
1750e660641SBarry Smith       else if (innerSolverTol < 1e-7) innerSolverTol = 1e-7;
176a7e14dcfSSatish Balay 
177a7e14dcfSSatish Balay       /* if the annealing doesn't work well, lower the inner solver tolerance */
1780e660641SBarry Smith       if(pre_epsilon < epsilon) innerSolverTol *= 0.2;
179a7e14dcfSSatish Balay 
180a7e14dcfSSatish Balay       df.tol = innerSolverTol*0.5;
181a7e14dcfSSatish Balay     }
182a7e14dcfSSatish Balay 
183a7e14dcfSSatish Balay     iter++;
184a7e14dcfSSatish Balay     ierr = TaoMonitor(tao,iter,min_jw,epsilon,0.0,tao->step,&reason);CHKERRQ(ierr);
185a7e14dcfSSatish Balay   }
186a7e14dcfSSatish Balay 
187a7e14dcfSSatish Balay   /* free all the memory */
1880e660641SBarry Smith   if (!rank) {
189a7e14dcfSSatish Balay     ierr = destroy_grad_list(&grad_list);CHKERRQ(ierr);
190a7e14dcfSSatish Balay     ierr = destroy_df_solver(&df);CHKERRQ(ierr);
191a7e14dcfSSatish Balay   }
192a7e14dcfSSatish Balay 
193a7e14dcfSSatish Balay   ierr = VecDestroy(&bmrm->local_w);CHKERRQ(ierr);
194a7e14dcfSSatish Balay   ierr = VecScatterDestroy(&bmrm->scatter);CHKERRQ(ierr);
195a7e14dcfSSatish Balay   PetscFunctionReturn(0);
196a7e14dcfSSatish Balay }
197a7e14dcfSSatish Balay 
198a7e14dcfSSatish Balay 
199a7e14dcfSSatish Balay /* ---------------------------------------------------------- */
200a7e14dcfSSatish Balay 
201a7e14dcfSSatish Balay #undef __FUNCT__
202a7e14dcfSSatish Balay #define __FUNCT__ "TaoSetup_BMRM"
2030e660641SBarry Smith static PetscErrorCode TaoSetup_BMRM(TaoSolver tao)
2040e660641SBarry Smith {
205a7e14dcfSSatish Balay 
206a7e14dcfSSatish Balay   PetscErrorCode ierr;
207a7e14dcfSSatish Balay 
208a7e14dcfSSatish Balay   PetscFunctionBegin;
209a7e14dcfSSatish Balay   /* Allocate some arrays */
210a7e14dcfSSatish Balay   if (!tao->gradient) {
211a7e14dcfSSatish Balay     ierr = VecDuplicate(tao->solution, &tao->gradient);   CHKERRQ(ierr);
212a7e14dcfSSatish Balay   }
213a7e14dcfSSatish Balay   PetscFunctionReturn(0);
214a7e14dcfSSatish Balay }
215a7e14dcfSSatish Balay 
216a7e14dcfSSatish Balay /*------------------------------------------------------------*/
217a7e14dcfSSatish Balay #undef __FUNCT__
218a7e14dcfSSatish Balay #define __FUNCT__ "TaoDestroy_BMRM"
219a7e14dcfSSatish Balay static PetscErrorCode TaoDestroy_BMRM(TaoSolver tao)
220a7e14dcfSSatish Balay {
221a7e14dcfSSatish Balay   PetscErrorCode ierr;
222a7e14dcfSSatish Balay 
223a7e14dcfSSatish Balay   PetscFunctionBegin;
224a7e14dcfSSatish Balay   ierr = PetscFree(tao->data);CHKERRQ(ierr);
225a7e14dcfSSatish Balay   PetscFunctionReturn(0);
226a7e14dcfSSatish Balay }
227a7e14dcfSSatish Balay 
228a7e14dcfSSatish Balay #undef __FUNCT__
229a7e14dcfSSatish Balay #define __FUNCT__ "TaoSetFromOptions_BMRM"
230a7e14dcfSSatish Balay static PetscErrorCode TaoSetFromOptions_BMRM(TaoSolver tao)
231a7e14dcfSSatish Balay {
232a7e14dcfSSatish Balay   PetscErrorCode ierr;
233a7e14dcfSSatish Balay   TAO_BMRM*      bmrm = (TAO_BMRM*)tao->data;
234a7e14dcfSSatish Balay   PetscBool      flg;
235a7e14dcfSSatish Balay 
236a7e14dcfSSatish Balay   PetscFunctionBegin;
237a7e14dcfSSatish Balay   ierr = PetscOptionsHead("BMRM for regularized risk minimization");CHKERRQ(ierr);
238a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_bmrm_lambda", "regulariser weight","", 100,&bmrm->lambda,&flg); CHKERRQ(ierr);
239a7e14dcfSSatish Balay   ierr = PetscOptionsTail();CHKERRQ(ierr);
240a7e14dcfSSatish Balay   PetscFunctionReturn(0);
241a7e14dcfSSatish Balay }
242a7e14dcfSSatish Balay 
243a7e14dcfSSatish Balay /*------------------------------------------------------------*/
244a7e14dcfSSatish Balay #undef __FUNCT__
245a7e14dcfSSatish Balay #define __FUNCT__ "TaoView_BMRM"
246a7e14dcfSSatish Balay static PetscErrorCode TaoView_BMRM(TaoSolver tao, PetscViewer viewer)
247a7e14dcfSSatish Balay {
248a7e14dcfSSatish Balay   PetscBool      isascii;
249a7e14dcfSSatish Balay   PetscErrorCode ierr;
250a7e14dcfSSatish Balay 
251a7e14dcfSSatish Balay   PetscFunctionBegin;
252a7e14dcfSSatish Balay   ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&isascii);CHKERRQ(ierr);
253a7e14dcfSSatish Balay   if (isascii) {
254a7e14dcfSSatish Balay     ierr = PetscViewerASCIIPushTab(viewer);CHKERRQ(ierr);
255a7e14dcfSSatish Balay     ierr = PetscViewerASCIIPopTab(viewer);CHKERRQ(ierr);
256a7e14dcfSSatish Balay   }
257a7e14dcfSSatish Balay   PetscFunctionReturn(0);
258a7e14dcfSSatish Balay }
259a7e14dcfSSatish Balay 
260a7e14dcfSSatish Balay /*------------------------------------------------------------*/
261a7e14dcfSSatish Balay EXTERN_C_BEGIN
262a7e14dcfSSatish Balay #undef __FUNCT__
263a7e14dcfSSatish Balay #define __FUNCT__ "TaoCreate_BMRM"
264a7e14dcfSSatish Balay PetscErrorCode TaoCreate_BMRM(TaoSolver tao)
265a7e14dcfSSatish Balay {
266a7e14dcfSSatish Balay   TAO_BMRM       *bmrm;
267a7e14dcfSSatish Balay   PetscErrorCode ierr;
268a7e14dcfSSatish Balay 
269a7e14dcfSSatish Balay   PetscFunctionBegin;
270a7e14dcfSSatish Balay   tao->ops->setup = TaoSetup_BMRM;
271a7e14dcfSSatish Balay   tao->ops->solve = TaoSolve_BMRM;
272a7e14dcfSSatish Balay   tao->ops->view  = TaoView_BMRM;
273a7e14dcfSSatish Balay   tao->ops->setfromoptions = TaoSetFromOptions_BMRM;
274a7e14dcfSSatish Balay   tao->ops->destroy = TaoDestroy_BMRM;
275a7e14dcfSSatish Balay 
2763c9e27cfSGeoffrey Irving   ierr = PetscNewLog(tao,&bmrm);CHKERRQ(ierr);
277a7e14dcfSSatish Balay   bmrm->lambda = 1.0;
278a7e14dcfSSatish Balay   tao->data = (void*)bmrm;
279a7e14dcfSSatish Balay 
280a7e14dcfSSatish Balay   /* Note: May need to be tuned! */
281a7e14dcfSSatish Balay   tao->max_it = 2048;
282a7e14dcfSSatish Balay   tao->max_funcs = 300000;
283a7e14dcfSSatish Balay   tao->fatol = 1e-20;
284a7e14dcfSSatish Balay   tao->frtol = 1e-25;
285a7e14dcfSSatish Balay   tao->gatol = 1e-25;
286a7e14dcfSSatish Balay   tao->grtol = 1e-25;
287a7e14dcfSSatish Balay 
288a7e14dcfSSatish Balay   PetscFunctionReturn(0);
289a7e14dcfSSatish Balay }
290a7e14dcfSSatish Balay EXTERN_C_END
291a7e14dcfSSatish Balay 
292a7e14dcfSSatish Balay #undef __FUNCT__
293a7e14dcfSSatish Balay #define __FUNCT__ "init_df_solver"
294a7e14dcfSSatish Balay PetscErrorCode init_df_solver(TAO_DF *df)
295a7e14dcfSSatish Balay {
296a7e14dcfSSatish Balay   PetscInt       i, n = INCRE_DIM;
297a7e14dcfSSatish Balay   PetscErrorCode ierr;
298a7e14dcfSSatish Balay 
299a7e14dcfSSatish Balay   PetscFunctionBegin;
300a7e14dcfSSatish Balay   /* default values */
301a7e14dcfSSatish Balay   df->maxProjIter = 200;
302a7e14dcfSSatish Balay   df->maxPGMIter = 300000;
303a7e14dcfSSatish Balay   df->b = 1.0;
304a7e14dcfSSatish Balay 
305a7e14dcfSSatish Balay   /* memory space required by Dai-Fletcher */
306a7e14dcfSSatish Balay   df->cur_num_cp = n;
3070e660641SBarry Smith   ierr = PetscMalloc1(n, &df->f); CHKERRQ(ierr);
3080e660641SBarry Smith   ierr = PetscMalloc1(n, &df->a); CHKERRQ(ierr);
3090e660641SBarry Smith   ierr = PetscMalloc1(n, &df->l); CHKERRQ(ierr);
3100e660641SBarry Smith   ierr = PetscMalloc1(n, &df->u); CHKERRQ(ierr);
3110e660641SBarry Smith   ierr = PetscMalloc1(n, &df->x); CHKERRQ(ierr);
312e1cc520bSBarry Smith   ierr = PetscMalloc1(n, &df->Q); CHKERRQ(ierr);
313a7e14dcfSSatish Balay 
314a7e14dcfSSatish Balay   for (i = 0; i < n; i ++) {
3150e660641SBarry Smith     ierr = PetscMalloc1(n, &df->Q[i]); CHKERRQ(ierr);
316a7e14dcfSSatish Balay   }
317a7e14dcfSSatish Balay 
3180e660641SBarry Smith   ierr = PetscMalloc1(n, &df->g); CHKERRQ(ierr);
3190e660641SBarry Smith   ierr = PetscMalloc1(n, &df->y); CHKERRQ(ierr);
3200e660641SBarry Smith   ierr = PetscMalloc1(n, &df->tempv); CHKERRQ(ierr);
3210e660641SBarry Smith   ierr = PetscMalloc1(n, &df->d); CHKERRQ(ierr);
3220e660641SBarry Smith   ierr = PetscMalloc1(n, &df->Qd); CHKERRQ(ierr);
3230e660641SBarry Smith   ierr = PetscMalloc1(n, &df->t); CHKERRQ(ierr);
3240e660641SBarry Smith   ierr = PetscMalloc1(n, &df->xplus); CHKERRQ(ierr);
3250e660641SBarry Smith   ierr = PetscMalloc1(n, &df->tplus); CHKERRQ(ierr);
3260e660641SBarry Smith   ierr = PetscMalloc1(n, &df->sk); CHKERRQ(ierr);
3270e660641SBarry Smith   ierr = PetscMalloc1(n, &df->yk); CHKERRQ(ierr);
328a7e14dcfSSatish Balay 
329e1cc520bSBarry Smith   ierr = PetscMalloc1(n, &df->ipt); CHKERRQ(ierr);
330e1cc520bSBarry Smith   ierr = PetscMalloc1(n, &df->ipt2); CHKERRQ(ierr);
331e1cc520bSBarry Smith   ierr = PetscMalloc1(n, &df->uv); CHKERRQ(ierr);
332a7e14dcfSSatish Balay   PetscFunctionReturn(0);
333a7e14dcfSSatish Balay }
334a7e14dcfSSatish Balay 
335a7e14dcfSSatish Balay #undef __FUNCT__
336a7e14dcfSSatish Balay #define __FUNCT__ "ensure_df_space"
337a7e14dcfSSatish Balay PetscErrorCode ensure_df_space(PetscInt dim, TAO_DF *df)
338a7e14dcfSSatish Balay {
339a7e14dcfSSatish Balay   PetscErrorCode ierr;
340a7e14dcfSSatish Balay   PetscReal      *tmp, **tmp_Q;
341a7e14dcfSSatish Balay   PetscInt       i, n, old_n;
342a7e14dcfSSatish Balay 
343a7e14dcfSSatish Balay   PetscFunctionBegin;
34453506e15SBarry Smith   df->dim = dim;
34553506e15SBarry Smith   if (dim <= df->cur_num_cp) PetscFunctionReturn(0);
346a7e14dcfSSatish Balay 
347a7e14dcfSSatish Balay   old_n = df->cur_num_cp;
348a7e14dcfSSatish Balay   df->cur_num_cp += INCRE_DIM;
349a7e14dcfSSatish Balay   n = df->cur_num_cp;
350a7e14dcfSSatish Balay 
351a7e14dcfSSatish Balay   /* memory space required by dai-fletcher */
3520e660641SBarry Smith   ierr = PetscMalloc1(n, &tmp); CHKERRQ(ierr);
353a7e14dcfSSatish Balay   ierr = PetscMemcpy(tmp, df->f, sizeof(PetscReal)*old_n); CHKERRQ(ierr);
354a7e14dcfSSatish Balay   ierr = PetscFree(df->f); CHKERRQ(ierr);
355a7e14dcfSSatish Balay   df->f = tmp;
356a7e14dcfSSatish Balay 
3570e660641SBarry Smith   ierr = PetscMalloc1(n, &tmp); CHKERRQ(ierr);
358a7e14dcfSSatish Balay   ierr = PetscMemcpy(tmp, df->a, sizeof(PetscReal)*old_n); CHKERRQ(ierr);
359a7e14dcfSSatish Balay   ierr = PetscFree(df->a); CHKERRQ(ierr);
360a7e14dcfSSatish Balay   df->a = tmp;
361a7e14dcfSSatish Balay 
3620e660641SBarry Smith   ierr = PetscMalloc1(n, &tmp); CHKERRQ(ierr);
363a7e14dcfSSatish Balay   ierr = PetscMemcpy(tmp, df->l, sizeof(PetscReal)*old_n); CHKERRQ(ierr);
364a7e14dcfSSatish Balay   ierr = PetscFree(df->l); CHKERRQ(ierr);
365a7e14dcfSSatish Balay   df->l = tmp;
366a7e14dcfSSatish Balay 
3670e660641SBarry Smith   ierr = PetscMalloc1(n, &tmp); CHKERRQ(ierr);
368a7e14dcfSSatish Balay   ierr = PetscMemcpy(tmp, df->u, sizeof(PetscReal)*old_n); CHKERRQ(ierr);
369a7e14dcfSSatish Balay   ierr = PetscFree(df->u); CHKERRQ(ierr);
370a7e14dcfSSatish Balay   df->u = tmp;
371a7e14dcfSSatish Balay 
3720e660641SBarry Smith   ierr = PetscMalloc1(n, &tmp); CHKERRQ(ierr);
373a7e14dcfSSatish Balay   ierr = PetscMemcpy(tmp, df->x, sizeof(PetscReal)*old_n); CHKERRQ(ierr);
374a7e14dcfSSatish Balay   ierr = PetscFree(df->x); CHKERRQ(ierr);
375a7e14dcfSSatish Balay   df->x = tmp;
376a7e14dcfSSatish Balay 
377e1cc520bSBarry Smith   ierr = PetscMalloc1(n, &tmp_Q); CHKERRQ(ierr);
37853506e15SBarry Smith   for (i = 0; i < n; i ++) {
3790e660641SBarry Smith     ierr = PetscMalloc1(n, &tmp_Q[i]); CHKERRQ(ierr);
38053506e15SBarry Smith     if (i < old_n) {
381a7e14dcfSSatish Balay       ierr = PetscMemcpy(tmp_Q[i], df->Q[i], sizeof(PetscReal)*old_n); CHKERRQ(ierr);
382a7e14dcfSSatish Balay       ierr = PetscFree(df->Q[i]); CHKERRQ(ierr);
383a7e14dcfSSatish Balay     }
384a7e14dcfSSatish Balay   }
385a7e14dcfSSatish Balay 
386a7e14dcfSSatish Balay   ierr = PetscFree(df->Q); CHKERRQ(ierr);
387a7e14dcfSSatish Balay   df->Q = tmp_Q;
388a7e14dcfSSatish Balay 
389a7e14dcfSSatish Balay   ierr = PetscFree(df->g); CHKERRQ(ierr);
3900e660641SBarry Smith   ierr = PetscMalloc1(n, &df->g); CHKERRQ(ierr);
391a7e14dcfSSatish Balay 
392a7e14dcfSSatish Balay   ierr = PetscFree(df->y); CHKERRQ(ierr);
3930e660641SBarry Smith   ierr = PetscMalloc1(n, &df->y); CHKERRQ(ierr);
394a7e14dcfSSatish Balay 
395a7e14dcfSSatish Balay   ierr = PetscFree(df->tempv); CHKERRQ(ierr);
3960e660641SBarry Smith   ierr = PetscMalloc1(n, &df->tempv); CHKERRQ(ierr);
397a7e14dcfSSatish Balay 
398a7e14dcfSSatish Balay   ierr = PetscFree(df->d); CHKERRQ(ierr);
3990e660641SBarry Smith   ierr = PetscMalloc1(n, &df->d); CHKERRQ(ierr);
400a7e14dcfSSatish Balay 
401a7e14dcfSSatish Balay   ierr = PetscFree(df->Qd); CHKERRQ(ierr);
4020e660641SBarry Smith   ierr = PetscMalloc1(n, &df->Qd); CHKERRQ(ierr);
403a7e14dcfSSatish Balay 
404a7e14dcfSSatish Balay   ierr = PetscFree(df->t); CHKERRQ(ierr);
4050e660641SBarry Smith   ierr = PetscMalloc1(n, &df->t); CHKERRQ(ierr);
406a7e14dcfSSatish Balay 
407a7e14dcfSSatish Balay   ierr = PetscFree(df->xplus); CHKERRQ(ierr);
4080e660641SBarry Smith   ierr = PetscMalloc1(n, &df->xplus); CHKERRQ(ierr);
409a7e14dcfSSatish Balay 
410a7e14dcfSSatish Balay   ierr = PetscFree(df->tplus); CHKERRQ(ierr);
4110e660641SBarry Smith   ierr = PetscMalloc1(n, &df->tplus); CHKERRQ(ierr);
412a7e14dcfSSatish Balay 
413a7e14dcfSSatish Balay   ierr = PetscFree(df->sk); CHKERRQ(ierr);
4140e660641SBarry Smith   ierr = PetscMalloc1(n, &df->sk); CHKERRQ(ierr);
415a7e14dcfSSatish Balay 
416a7e14dcfSSatish Balay   ierr = PetscFree(df->yk); CHKERRQ(ierr);
4170e660641SBarry Smith   ierr = PetscMalloc1(n, &df->yk); CHKERRQ(ierr);
418a7e14dcfSSatish Balay 
419a7e14dcfSSatish Balay   ierr = PetscFree(df->ipt); CHKERRQ(ierr);
420e1cc520bSBarry Smith   ierr = PetscMalloc1(n, &df->ipt); CHKERRQ(ierr);
421a7e14dcfSSatish Balay 
422a7e14dcfSSatish Balay   ierr = PetscFree(df->ipt2); CHKERRQ(ierr);
4230e660641SBarry Smith   ierr = PetscMalloc1(n, &df->ipt2); CHKERRQ(ierr);
424a7e14dcfSSatish Balay 
425a7e14dcfSSatish Balay   ierr = PetscFree(df->uv); CHKERRQ(ierr);
4260e660641SBarry Smith   ierr = PetscMalloc1(n, &df->uv); CHKERRQ(ierr);
427a7e14dcfSSatish Balay   PetscFunctionReturn(0);
428a7e14dcfSSatish Balay }
429a7e14dcfSSatish Balay 
430a7e14dcfSSatish Balay #undef __FUNCT__
431a7e14dcfSSatish Balay #define __FUNCT__ "destroy_df_solver"
432a7e14dcfSSatish Balay PetscErrorCode destroy_df_solver(TAO_DF *df)
433a7e14dcfSSatish Balay {
434a7e14dcfSSatish Balay   PetscErrorCode ierr;
435a7e14dcfSSatish Balay   PetscInt       i;
4366c23d075SBarry Smith 
437a7e14dcfSSatish Balay   PetscFunctionBegin;
4386c23d075SBarry Smith   ierr = PetscFree(df->f); CHKERRQ(ierr);
4396c23d075SBarry Smith   ierr = PetscFree(df->a); CHKERRQ(ierr);
4406c23d075SBarry Smith   ierr = PetscFree(df->l); CHKERRQ(ierr);
4416c23d075SBarry Smith   ierr = PetscFree(df->u); CHKERRQ(ierr);
4426c23d075SBarry Smith   ierr = PetscFree(df->x); CHKERRQ(ierr);
443a7e14dcfSSatish Balay 
4446c23d075SBarry Smith   for (i = 0; i < df->cur_num_cp; i ++) {
445a7e14dcfSSatish Balay     ierr = PetscFree(df->Q[i]); CHKERRQ(ierr);
446a7e14dcfSSatish Balay   }
447a7e14dcfSSatish Balay   ierr = PetscFree(df->Q); CHKERRQ(ierr);
4486c23d075SBarry Smith   ierr = PetscFree(df->ipt); CHKERRQ(ierr);
4496c23d075SBarry Smith   ierr = PetscFree(df->ipt2); CHKERRQ(ierr);
4506c23d075SBarry Smith   ierr = PetscFree(df->uv); CHKERRQ(ierr);
4516c23d075SBarry Smith   ierr = PetscFree(df->g); CHKERRQ(ierr);
4526c23d075SBarry Smith   ierr = PetscFree(df->y); CHKERRQ(ierr);
4536c23d075SBarry Smith   ierr = PetscFree(df->tempv); CHKERRQ(ierr);
4546c23d075SBarry Smith   ierr = PetscFree(df->d); CHKERRQ(ierr);
4556c23d075SBarry Smith   ierr = PetscFree(df->Qd); CHKERRQ(ierr);
4566c23d075SBarry Smith   ierr = PetscFree(df->t); CHKERRQ(ierr);
4576c23d075SBarry Smith   ierr = PetscFree(df->xplus); CHKERRQ(ierr);
4586c23d075SBarry Smith   ierr = PetscFree(df->tplus); CHKERRQ(ierr);
4596c23d075SBarry Smith   ierr = PetscFree(df->sk); CHKERRQ(ierr);
4606c23d075SBarry Smith   ierr = PetscFree(df->yk); CHKERRQ(ierr);
461a7e14dcfSSatish Balay   PetscFunctionReturn(0);
462a7e14dcfSSatish Balay }
463a7e14dcfSSatish Balay 
464a7e14dcfSSatish Balay /* Piecewise linear monotone target function for the Dai-Fletcher projector */
465a7e14dcfSSatish Balay #undef __FUNCT__
466a7e14dcfSSatish Balay #define __FUNCT__ "phi"
4676c23d075SBarry Smith PetscReal phi(PetscReal *x,PetscInt n,PetscReal lambda,PetscReal *a,PetscReal b,PetscReal *c,PetscReal *l,PetscReal *u)
468a7e14dcfSSatish Balay {
469a7e14dcfSSatish Balay   PetscReal r = 0.0;
470a7e14dcfSSatish Balay   PetscInt  i;
471a7e14dcfSSatish Balay 
472a7e14dcfSSatish Balay   for (i = 0; i < n; i++){
473a7e14dcfSSatish Balay     x[i] = -c[i] + lambda*a[i];
4746c23d075SBarry Smith     if (x[i] > u[i])     x[i] = u[i];
4756c23d075SBarry Smith     else if(x[i] < l[i]) x[i] = l[i];
476a7e14dcfSSatish Balay     r += a[i]*x[i];
477a7e14dcfSSatish Balay   }
478a7e14dcfSSatish Balay   return r - b;
479a7e14dcfSSatish Balay }
480a7e14dcfSSatish Balay 
481a7e14dcfSSatish Balay /** Modified Dai-Fletcher QP projector solves the problem:
482a7e14dcfSSatish Balay  *
483a7e14dcfSSatish Balay  *      minimise  0.5*x'*x - c'*x
484a7e14dcfSSatish Balay  *      subj to   a'*x = b
485a7e14dcfSSatish Balay  *                l \leq x \leq u
486a7e14dcfSSatish Balay  *
487a7e14dcfSSatish Balay  *  \param c The point to be projected onto feasible set
488a7e14dcfSSatish Balay  */
489a7e14dcfSSatish Balay #undef __FUNCT__
490a7e14dcfSSatish Balay #define __FUNCT__ "project"
4916c23d075SBarry Smith PetscInt project(PetscInt n,PetscReal *a,PetscReal b,PetscReal *c,PetscReal *l,PetscReal *u,PetscReal *x,PetscReal *lam_ext,TAO_DF *df)
492a7e14dcfSSatish Balay {
493a7e14dcfSSatish Balay   PetscReal      lambda, lambdal, lambdau, dlambda, lambda_new;
494a7e14dcfSSatish Balay   PetscReal      r, rl, ru, s;
495a7e14dcfSSatish Balay   PetscInt       innerIter;
496a7e14dcfSSatish Balay   PetscBool      nonNegativeSlack = PETSC_FALSE;
49753506e15SBarry Smith   PetscErrorCode ierr;
498a7e14dcfSSatish Balay 
499a7e14dcfSSatish Balay   *lam_ext = 0;
500a7e14dcfSSatish Balay   lambda  = 0;
501a7e14dcfSSatish Balay   dlambda = 0.5;
502a7e14dcfSSatish Balay   innerIter = 1;
503a7e14dcfSSatish Balay 
504a7e14dcfSSatish Balay   /*  \phi(x;lambda) := 0.5*x'*x + c'*x - lambda*(a'*x-b)
505a7e14dcfSSatish Balay    *
506a7e14dcfSSatish Balay    *  Optimality conditions for \phi:
507a7e14dcfSSatish Balay    *
508a7e14dcfSSatish Balay    *  1. lambda   <= 0
509a7e14dcfSSatish Balay    *  2. r        <= 0
510a7e14dcfSSatish Balay    *  3. r*lambda == 0
511a7e14dcfSSatish Balay    */
512a7e14dcfSSatish Balay 
513a7e14dcfSSatish Balay   /* Bracketing Phase */
514a7e14dcfSSatish Balay   r = phi(x, n, lambda, a, b, c, l, u);
515a7e14dcfSSatish Balay 
5166c23d075SBarry Smith   if(nonNegativeSlack) {
517a7e14dcfSSatish Balay     /* inequality constraint, i.e., with \xi >= 0 constraint */
51853506e15SBarry Smith     if (r < TOL_R) return 0;
5196c23d075SBarry Smith   } else  {
520a7e14dcfSSatish Balay     /* equality constraint ,i.e., without \xi >= 0 constraint */
52153506e15SBarry Smith     if (fabs(r) < TOL_R) return 0;
522a7e14dcfSSatish Balay   }
523a7e14dcfSSatish Balay 
524a7e14dcfSSatish Balay   if (r < 0.0){
525a7e14dcfSSatish Balay     lambdal = lambda;
526a7e14dcfSSatish Balay     rl      = r;
527a7e14dcfSSatish Balay     lambda  = lambda + dlambda;
528a7e14dcfSSatish Balay     r       = phi(x, n, lambda, a, b, c, l, u);
529a7e14dcfSSatish Balay     while (r < 0.0 && dlambda < BMRM_INFTY)  {
530a7e14dcfSSatish Balay       lambdal = lambda;
531a7e14dcfSSatish Balay       s       = rl/r - 1.0;
532a7e14dcfSSatish Balay       if (s < 0.1) s = 0.1;
533a7e14dcfSSatish Balay       dlambda = dlambda + dlambda/s;
534a7e14dcfSSatish Balay       lambda  = lambda + dlambda;
535a7e14dcfSSatish Balay       rl      = r;
536a7e14dcfSSatish Balay       r       = phi(x, n, lambda, a, b, c, l, u);
537a7e14dcfSSatish Balay     }
538a7e14dcfSSatish Balay     lambdau = lambda;
539a7e14dcfSSatish Balay     ru      = r;
5406c23d075SBarry Smith   } else {
541a7e14dcfSSatish Balay     lambdau = lambda;
542a7e14dcfSSatish Balay     ru      = r;
543a7e14dcfSSatish Balay     lambda  = lambda - dlambda;
544a7e14dcfSSatish Balay     r       = phi(x, n, lambda, a, b, c, l, u);
545a7e14dcfSSatish Balay     while (r > 0.0 && dlambda > -BMRM_INFTY) {
546a7e14dcfSSatish Balay       lambdau = lambda;
547a7e14dcfSSatish Balay       s       = ru/r - 1.0;
548a7e14dcfSSatish Balay       if (s < 0.1) s = 0.1;
549a7e14dcfSSatish Balay       dlambda = dlambda + dlambda/s;
550a7e14dcfSSatish Balay       lambda  = lambda - dlambda;
551a7e14dcfSSatish Balay       ru      = r;
552a7e14dcfSSatish Balay       r       = phi(x, n, lambda, a, b, c, l, u);
553a7e14dcfSSatish Balay     }
554a7e14dcfSSatish Balay     lambdal = lambda;
555a7e14dcfSSatish Balay     rl      = r;
556a7e14dcfSSatish Balay   }
557a7e14dcfSSatish Balay 
5586c23d075SBarry Smith   if(fabs(dlambda) > BMRM_INFTY) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"L2N2_DaiFletcherPGM detected Infeasible QP problem!");
559a7e14dcfSSatish Balay 
560a7e14dcfSSatish Balay   if(ru == 0){
561a7e14dcfSSatish Balay     lambda = lambdau;
562a7e14dcfSSatish Balay     r = phi(x, n, lambda, a, b, c, l, u);
563a7e14dcfSSatish Balay     return innerIter;
564a7e14dcfSSatish Balay   }
565a7e14dcfSSatish Balay 
566a7e14dcfSSatish Balay   /* Secant Phase */
567a7e14dcfSSatish Balay   s       = 1.0 - rl/ru;
568a7e14dcfSSatish Balay   dlambda = dlambda/s;
569a7e14dcfSSatish Balay   lambda  = lambdau - dlambda;
570a7e14dcfSSatish Balay   r       = phi(x, n, lambda, a, b, c, l, u);
571a7e14dcfSSatish Balay 
572a7e14dcfSSatish Balay   while (fabs(r) > TOL_R
573a7e14dcfSSatish Balay          && dlambda > TOL_LAM * (1.0 + fabs(lambda))
574a7e14dcfSSatish Balay          && innerIter < df->maxProjIter){
575a7e14dcfSSatish Balay     innerIter++;
576a7e14dcfSSatish Balay     if (r > 0.0){
577a7e14dcfSSatish Balay       if (s <= 2.0){
578a7e14dcfSSatish Balay         lambdau = lambda;
579a7e14dcfSSatish Balay         ru      = r;
580a7e14dcfSSatish Balay         s       = 1.0 - rl/ru;
581a7e14dcfSSatish Balay         dlambda = (lambdau - lambdal) / s;
582a7e14dcfSSatish Balay         lambda  = lambdau - dlambda;
58353506e15SBarry Smith       } else {
584a7e14dcfSSatish Balay         s          = ru/r-1.0;
585a7e14dcfSSatish Balay         if (s < 0.1) s = 0.1;
586a7e14dcfSSatish Balay         dlambda    = (lambdau - lambda) / s;
587a7e14dcfSSatish Balay         lambda_new = 0.75*lambdal + 0.25*lambda;
588a7e14dcfSSatish Balay         if (lambda_new < (lambda - dlambda))
589a7e14dcfSSatish Balay           lambda_new = lambda - dlambda;
590a7e14dcfSSatish Balay         lambdau    = lambda;
591a7e14dcfSSatish Balay         ru         = r;
592a7e14dcfSSatish Balay         lambda     = lambda_new;
593a7e14dcfSSatish Balay         s          = (lambdau - lambdal) / (lambdau - lambda);
594a7e14dcfSSatish Balay       }
59553506e15SBarry Smith     } else {
596a7e14dcfSSatish Balay       if (s >= 2.0){
597a7e14dcfSSatish Balay         lambdal = lambda;
598a7e14dcfSSatish Balay         rl      = r;
599a7e14dcfSSatish Balay         s       = 1.0 - rl/ru;
600a7e14dcfSSatish Balay         dlambda = (lambdau - lambdal) / s;
601a7e14dcfSSatish Balay         lambda  = lambdau - dlambda;
60253506e15SBarry Smith       } else {
603a7e14dcfSSatish Balay         s          = rl/r - 1.0;
604a7e14dcfSSatish Balay         if (s < 0.1) s = 0.1;
605a7e14dcfSSatish Balay         dlambda    = (lambda-lambdal) / s;
606a7e14dcfSSatish Balay         lambda_new = 0.75*lambdau + 0.25*lambda;
607a7e14dcfSSatish Balay         if (lambda_new > (lambda + dlambda))
608a7e14dcfSSatish Balay           lambda_new = lambda + dlambda;
609a7e14dcfSSatish Balay         lambdal    = lambda;
610a7e14dcfSSatish Balay         rl         = r;
611a7e14dcfSSatish Balay         lambda     = lambda_new;
612a7e14dcfSSatish Balay         s          = (lambdau - lambdal) / (lambdau-lambda);
613a7e14dcfSSatish Balay       }
614a7e14dcfSSatish Balay     }
615a7e14dcfSSatish Balay     r = phi(x, n, lambda, a, b, c, l, u);
616a7e14dcfSSatish Balay   }
617a7e14dcfSSatish Balay 
618a7e14dcfSSatish Balay   *lam_ext = lambda;
61953506e15SBarry Smith   if(innerIter >= df->maxProjIter) {
62053506e15SBarry Smith     ierr = PetscPrintf(PETSC_COMM_SELF, "WARNING: DaiFletcher max iterations\n");CHKERRQ(ierr);
62153506e15SBarry Smith   }
622a7e14dcfSSatish Balay   return innerIter;
623a7e14dcfSSatish Balay }
624a7e14dcfSSatish Balay 
625a7e14dcfSSatish Balay 
626a7e14dcfSSatish Balay #undef __FUNCT__
627a7e14dcfSSatish Balay #define __FUNCT__ "solve"
628a7e14dcfSSatish Balay PetscErrorCode solve(TAO_DF *df)
629a7e14dcfSSatish Balay {
630a7e14dcfSSatish Balay   PetscErrorCode ierr;
631a7e14dcfSSatish Balay   PetscInt       i, j, innerIter, it, it2, luv, info, lscount = 0, projcount = 0;
632a7e14dcfSSatish Balay   PetscReal      gd, max, ak, bk, akold, bkold, lamnew, alpha, kktlam=0.0, lam_ext;
633a7e14dcfSSatish Balay   PetscReal      DELTAsv, ProdDELTAsv;
634a7e14dcfSSatish Balay   PetscReal      c, *tempQ;
635a7e14dcfSSatish Balay   PetscReal      *x = df->x, *a = df->a, b = df->b, *l = df->l, *u = df->u, tol = df->tol;
636a7e14dcfSSatish Balay   PetscReal      *tempv = df->tempv, *y = df->y, *g = df->g, *d = df->d, *Qd = df->Qd;
637a7e14dcfSSatish Balay   PetscReal      *xplus = df->xplus, *tplus = df->tplus, *sk = df->sk, *yk = df->yk;
638a7e14dcfSSatish Balay   PetscReal      **Q = df->Q, *f = df->f, *t = df->t;
639a7e14dcfSSatish Balay   PetscInt       dim = df->dim, *ipt = df->ipt, *ipt2 = df->ipt2, *uv = df->uv;
640a7e14dcfSSatish Balay 
641a7e14dcfSSatish Balay   /*** variables for the adaptive nonmonotone linesearch ***/
642a7e14dcfSSatish Balay   PetscInt    L, llast;
643a7e14dcfSSatish Balay   PetscReal   fr, fbest, fv, fc, fv0;
64453506e15SBarry Smith 
645a7e14dcfSSatish Balay   c = BMRM_INFTY;
646a7e14dcfSSatish Balay 
647a7e14dcfSSatish Balay   DELTAsv = EPS_SV;
64853506e15SBarry Smith   if (tol <= 1.0e-5 || dim <= 20) ProdDELTAsv = 0.0F;
64953506e15SBarry Smith   else  ProdDELTAsv = EPS_SV;
650a7e14dcfSSatish Balay 
65153506e15SBarry Smith   for (i = 0; i < dim; i++)  tempv[i] = -x[i];
652a7e14dcfSSatish Balay 
653a7e14dcfSSatish Balay   lam_ext = 0.0;
654a7e14dcfSSatish Balay 
655a7e14dcfSSatish Balay   /* Project the initial solution */
656a7e14dcfSSatish Balay   projcount += project(dim, a, b, tempv, l, u, x, &lam_ext, df);
657a7e14dcfSSatish Balay 
658a7e14dcfSSatish Balay   /* Compute gradient
659a7e14dcfSSatish Balay      g = Q*x + f; */
660a7e14dcfSSatish Balay 
661a7e14dcfSSatish Balay   it = 0;
66253506e15SBarry Smith   for (i = 0; i < dim; i++) {
66353506e15SBarry Smith     if (fabs(x[i]) > ProdDELTAsv) ipt[it++] = i;
66453506e15SBarry Smith   }
665a7e14dcfSSatish Balay 
666a7e14dcfSSatish Balay   ierr = PetscMemzero(t, dim*sizeof(PetscReal)); CHKERRQ(ierr);
667a7e14dcfSSatish Balay   for (i = 0; i < it; i++){
668a7e14dcfSSatish Balay     tempQ = Q[ipt[i]];
66953506e15SBarry Smith     for (j = 0; j < dim; j++) t[j] += (tempQ[j]*x[ipt[i]]);
670a7e14dcfSSatish Balay   }
671a7e14dcfSSatish Balay   for (i = 0; i < dim; i++){
672a7e14dcfSSatish Balay     g[i] = t[i] + f[i];
673a7e14dcfSSatish Balay   }
674a7e14dcfSSatish Balay 
675a7e14dcfSSatish Balay 
676a7e14dcfSSatish Balay   /* y = -(x_{k} - g_{k}) */
677a7e14dcfSSatish Balay   for (i = 0; i < dim; i++){
678a7e14dcfSSatish Balay     y[i] = g[i] - x[i];
679a7e14dcfSSatish Balay   }
680a7e14dcfSSatish Balay 
681a7e14dcfSSatish Balay   /* Project x_{k} - g_{k} */
682a7e14dcfSSatish Balay   projcount += project(dim, a, b, y, l, u, tempv, &lam_ext, df);
683a7e14dcfSSatish Balay 
684a7e14dcfSSatish Balay   /* y = P(x_{k} - g_{k}) - x_{k} */
685a7e14dcfSSatish Balay   max = ALPHA_MIN;
686a7e14dcfSSatish Balay   for (i = 0; i < dim; i++){
687a7e14dcfSSatish Balay     y[i] = tempv[i] - x[i];
68853506e15SBarry Smith     if (fabs(y[i]) > max) max = fabs(y[i]);
689a7e14dcfSSatish Balay   }
690a7e14dcfSSatish Balay 
691a7e14dcfSSatish Balay   if (max < tol*1e-3){
692a7e14dcfSSatish Balay     lscount = 0;
693a7e14dcfSSatish Balay     innerIter    = 0;
694a7e14dcfSSatish Balay     return 0;
695a7e14dcfSSatish Balay   }
696a7e14dcfSSatish Balay 
697a7e14dcfSSatish Balay   alpha = 1.0 / max;
698a7e14dcfSSatish Balay 
699a7e14dcfSSatish Balay   /* fv0 = f(x_{0}). Recall t = Q x_{k}  */
700a7e14dcfSSatish Balay   fv0   = 0.0;
70153506e15SBarry Smith   for (i = 0; i < dim; i++) fv0 += x[i] * (0.5*t[i] + f[i]);
702a7e14dcfSSatish Balay 
703a7e14dcfSSatish Balay   /*** adaptive nonmonotone linesearch ***/
704a7e14dcfSSatish Balay   L     = 2;
705a7e14dcfSSatish Balay   fr    = ALPHA_MAX;
706a7e14dcfSSatish Balay   fbest = fv0;
707a7e14dcfSSatish Balay   fc    = fv0;
708a7e14dcfSSatish Balay   llast = 0;
709a7e14dcfSSatish Balay   akold = bkold = 0.0;
710a7e14dcfSSatish Balay 
711a7e14dcfSSatish Balay   /***      Iterator begins     ***/
712a7e14dcfSSatish Balay   for (innerIter = 1; innerIter <= df->maxPGMIter; innerIter++) {
713a7e14dcfSSatish Balay 
714a7e14dcfSSatish Balay     /* tempv = -(x_{k} - alpha*g_{k}) */
71553506e15SBarry Smith     for (i = 0; i < dim; i++)  tempv[i] = alpha*g[i] - x[i];
716a7e14dcfSSatish Balay 
717a7e14dcfSSatish Balay     /* Project x_{k} - alpha*g_{k} */
718a7e14dcfSSatish Balay     projcount += project(dim, a, b, tempv, l, u, y, &lam_ext, df);
719a7e14dcfSSatish Balay 
720a7e14dcfSSatish Balay 
721a7e14dcfSSatish Balay     /* gd = \inner{d_{k}}{g_{k}}
722a7e14dcfSSatish Balay         d = P(x_{k} - alpha*g_{k}) - x_{k}
723a7e14dcfSSatish Balay     */
724a7e14dcfSSatish Balay     gd = 0.0;
725a7e14dcfSSatish Balay     for (i = 0; i < dim; i++){
726a7e14dcfSSatish Balay       d[i] = y[i] - x[i];
727a7e14dcfSSatish Balay       gd  += d[i] * g[i];
728a7e14dcfSSatish Balay     }
729a7e14dcfSSatish Balay 
730a7e14dcfSSatish Balay     /* Gradient computation  */
731a7e14dcfSSatish Balay 
732a7e14dcfSSatish Balay     /* compute Qd = Q*d  or  Qd = Q*y - t depending on their sparsity */
733a7e14dcfSSatish Balay 
734a7e14dcfSSatish Balay     it = it2 = 0;
73553506e15SBarry Smith     for (i = 0; i < dim; i++){
73653506e15SBarry Smith       if (fabs(d[i]) > (ProdDELTAsv*1.0e-2)) ipt[it++]   = i;
73753506e15SBarry Smith     }
73853506e15SBarry Smith     for (i = 0; i < dim; i++) {
73953506e15SBarry Smith       if (fabs(y[i]) > ProdDELTAsv) ipt2[it2++] = i;
74053506e15SBarry Smith     }
741a7e14dcfSSatish Balay 
742a7e14dcfSSatish Balay     ierr = PetscMemzero(Qd, dim*sizeof(PetscReal)); CHKERRQ(ierr);
743a7e14dcfSSatish Balay     /* compute Qd = Q*d */
744a7e14dcfSSatish Balay     if (it < it2){
745a7e14dcfSSatish Balay       for (i = 0; i < it; i++){
746a7e14dcfSSatish Balay         tempQ = Q[ipt[i]];
74753506e15SBarry Smith         for (j = 0; j < dim; j++) Qd[j] += (tempQ[j] * d[ipt[i]]);
748a7e14dcfSSatish Balay       }
74953506e15SBarry Smith     } else { /* compute Qd = Q*y-t */
750a7e14dcfSSatish Balay       for (i = 0; i < it2; i++){
751a7e14dcfSSatish Balay         tempQ = Q[ipt2[i]];
75253506e15SBarry Smith         for (j = 0; j < dim; j++) Qd[j] += (tempQ[j] * y[ipt2[i]]);
753a7e14dcfSSatish Balay       }
75453506e15SBarry Smith       for (j = 0; j < dim; j++) Qd[j] -= t[j];
755a7e14dcfSSatish Balay     }
756a7e14dcfSSatish Balay 
757a7e14dcfSSatish Balay     /* ak = inner{d_{k}}{d_{k}} */
758a7e14dcfSSatish Balay     ak = 0.0;
75953506e15SBarry Smith     for (i = 0; i < dim; i++) ak += d[i] * d[i];
760a7e14dcfSSatish Balay 
761a7e14dcfSSatish Balay     bk = 0.0;
76253506e15SBarry Smith     for (i = 0; i < dim; i++) bk += d[i]*Qd[i];
763a7e14dcfSSatish Balay 
76453506e15SBarry Smith     if (bk > EPS*ak && gd < 0.0)  lamnew = -gd/bk;
76553506e15SBarry Smith     else lamnew = 1.0;
766a7e14dcfSSatish Balay 
767a7e14dcfSSatish Balay     /* fv is computing f(x_{k} + d_{k}) */
768a7e14dcfSSatish Balay     fv = 0.0;
769a7e14dcfSSatish Balay     for (i = 0; i < dim; i++){
770a7e14dcfSSatish Balay       xplus[i] = x[i] + d[i];
771a7e14dcfSSatish Balay       tplus[i] = t[i] + Qd[i];
772a7e14dcfSSatish Balay       fv      += xplus[i] * (0.5*tplus[i] + f[i]);
773a7e14dcfSSatish Balay     }
774a7e14dcfSSatish Balay 
775a7e14dcfSSatish Balay     /* fr is fref */
776a7e14dcfSSatish Balay     if ((innerIter == 1 && fv >= fv0) || (innerIter > 1 && fv >= fr)){
777a7e14dcfSSatish Balay       lscount++;
778a7e14dcfSSatish Balay       fv = 0.0;
779a7e14dcfSSatish Balay       for (i = 0; i < dim; i++){
780a7e14dcfSSatish Balay         xplus[i] = x[i] + lamnew*d[i];
781a7e14dcfSSatish Balay         tplus[i] = t[i] + lamnew*Qd[i];
782a7e14dcfSSatish Balay         fv      += xplus[i] * (0.5*tplus[i] + f[i]);
783a7e14dcfSSatish Balay       }
784a7e14dcfSSatish Balay     }
785a7e14dcfSSatish Balay 
786a7e14dcfSSatish Balay     for (i = 0; i < dim; i++){
787a7e14dcfSSatish Balay       sk[i] = xplus[i] - x[i];
788a7e14dcfSSatish Balay       yk[i] = tplus[i] - t[i];
789a7e14dcfSSatish Balay       x[i]  = xplus[i];
790a7e14dcfSSatish Balay       t[i]  = tplus[i];
791a7e14dcfSSatish Balay       g[i]  = t[i] + f[i];
792a7e14dcfSSatish Balay     }
793a7e14dcfSSatish Balay 
794a7e14dcfSSatish Balay     /* update the line search control parameters */
795a7e14dcfSSatish Balay     if (fv < fbest){
796a7e14dcfSSatish Balay       fbest = fv;
797a7e14dcfSSatish Balay       fc    = fv;
798a7e14dcfSSatish Balay       llast = 0;
79953506e15SBarry Smith     } else {
800a7e14dcfSSatish Balay       fc = (fc > fv ? fc : fv);
801a7e14dcfSSatish Balay       llast++;
802a7e14dcfSSatish Balay       if (llast == L){
803a7e14dcfSSatish Balay         fr    = fc;
804a7e14dcfSSatish Balay         fc    = fv;
805a7e14dcfSSatish Balay         llast = 0;
806a7e14dcfSSatish Balay       }
807a7e14dcfSSatish Balay     }
808a7e14dcfSSatish Balay 
809a7e14dcfSSatish Balay     ak = bk = 0.0;
810a7e14dcfSSatish Balay     for (i = 0; i < dim; i++){
811a7e14dcfSSatish Balay       ak += sk[i] * sk[i];
812a7e14dcfSSatish Balay       bk += sk[i] * yk[i];
813a7e14dcfSSatish Balay     }
814a7e14dcfSSatish Balay 
81553506e15SBarry Smith     if (bk <= EPS*ak) alpha = ALPHA_MAX;
816a7e14dcfSSatish Balay     else {
81753506e15SBarry Smith       if (bkold < EPS*akold) alpha = ak/bk;
81853506e15SBarry Smith       else alpha = (akold+ak)/(bkold+bk);
819a7e14dcfSSatish Balay 
82053506e15SBarry Smith       if (alpha > ALPHA_MAX) alpha = ALPHA_MAX;
82153506e15SBarry Smith       else if (alpha < ALPHA_MIN) alpha = ALPHA_MIN;
822a7e14dcfSSatish Balay     }
823a7e14dcfSSatish Balay 
824a7e14dcfSSatish Balay     akold = ak;
825a7e14dcfSSatish Balay     bkold = bk;
826a7e14dcfSSatish Balay 
827a7e14dcfSSatish Balay     /*** stopping criterion based on KKT conditions ***/
828a7e14dcfSSatish Balay     /* at optimal, gradient of lagrangian w.r.t. x is zero */
829a7e14dcfSSatish Balay 
830a7e14dcfSSatish Balay     bk = 0.0;
83153506e15SBarry Smith     for (i = 0; i < dim; i++) bk +=  x[i] * x[i];
832a7e14dcfSSatish Balay 
83353506e15SBarry Smith     if (PetscSqrtReal(ak) < tol*10 * PetscSqrtReal(bk)){
834a7e14dcfSSatish Balay       it     = 0;
835a7e14dcfSSatish Balay       luv    = 0;
836a7e14dcfSSatish Balay       kktlam = 0.0;
837a7e14dcfSSatish Balay       for (i = 0; i < dim; i++){
838a7e14dcfSSatish Balay         /* x[i] is active hence lagrange multipliers for box constraints
839a7e14dcfSSatish Balay                 are zero. The lagrange multiplier for ineq. const. is then
840a7e14dcfSSatish Balay                 defined as below
841a7e14dcfSSatish Balay         */
842a7e14dcfSSatish Balay         if ((x[i] > DELTAsv) && (x[i] < c-DELTAsv)){
843a7e14dcfSSatish Balay           ipt[it++] = i;
844a7e14dcfSSatish Balay           kktlam    = kktlam - a[i]*g[i];
84553506e15SBarry Smith         } else  uv[luv++] = i;
846a7e14dcfSSatish Balay       }
847a7e14dcfSSatish Balay 
84853506e15SBarry Smith       if (it == 0 && PetscSqrtReal(ak) < tol*0.5 * PetscSqrtReal(bk)) return 0;
849a7e14dcfSSatish Balay       else {
850a7e14dcfSSatish Balay         kktlam = kktlam/it;
851a7e14dcfSSatish Balay         info   = 1;
852a7e14dcfSSatish Balay         for (i = 0; i < it; i++) {
853a7e14dcfSSatish Balay           if (fabs(a[ipt[i]] * g[ipt[i]] + kktlam) > tol) {
854a7e14dcfSSatish Balay             info = 0;
855a7e14dcfSSatish Balay             break;
856a7e14dcfSSatish Balay           }
857a7e14dcfSSatish Balay         }
858a7e14dcfSSatish Balay         if (info == 1)  {
859a7e14dcfSSatish Balay           for (i = 0; i < luv; i++)  {
860a7e14dcfSSatish Balay             if (x[uv[i]] <= DELTAsv){
861a7e14dcfSSatish Balay               /* x[i] == lower bound, hence, lagrange multiplier (say, beta) for lower bound may
862a7e14dcfSSatish Balay                      not be zero. So, the gradient without beta is > 0
863a7e14dcfSSatish Balay               */
864a7e14dcfSSatish Balay               if (g[uv[i]] + kktlam*a[uv[i]] < -tol){
865a7e14dcfSSatish Balay                 info = 0;
866a7e14dcfSSatish Balay                 break;
867a7e14dcfSSatish Balay               }
86853506e15SBarry Smith             } else {
869a7e14dcfSSatish Balay               /* x[i] == upper bound, hence, lagrange multiplier (say, eta) for upper bound may
870a7e14dcfSSatish Balay                      not be zero. So, the gradient without eta is < 0
871a7e14dcfSSatish Balay               */
872a7e14dcfSSatish Balay               if (g[uv[i]] + kktlam*a[uv[i]] > tol) {
873a7e14dcfSSatish Balay                 info = 0;
874a7e14dcfSSatish Balay                 break;
875a7e14dcfSSatish Balay               }
876a7e14dcfSSatish Balay             }
877a7e14dcfSSatish Balay           }
878a7e14dcfSSatish Balay         }
879a7e14dcfSSatish Balay 
88053506e15SBarry Smith         if (info == 1) return 0;
881a7e14dcfSSatish Balay       }
882a7e14dcfSSatish Balay     }
883a7e14dcfSSatish Balay   }
884a7e14dcfSSatish Balay   return 0;
885a7e14dcfSSatish Balay }
886a7e14dcfSSatish Balay 
887a7e14dcfSSatish Balay 
888