xref: /petsc/src/tao/unconstrained/impls/bmrm/bmrm.c (revision 8931d48269a3fd1175e58f4f026fe4afbe678bc2)
1aaa7dc30SBarry Smith #include <../src/tao/unconstrained/impls/bmrm/bmrm.h>
2a7e14dcfSSatish Balay 
3a7e14dcfSSatish Balay static PetscErrorCode init_df_solver(TAO_DF*);
4a7e14dcfSSatish Balay static PetscErrorCode ensure_df_space(PetscInt, TAO_DF*);
5a7e14dcfSSatish Balay static PetscErrorCode destroy_df_solver(TAO_DF*);
60e660641SBarry Smith static PetscReal phi(PetscReal*,PetscInt,PetscReal,PetscReal*,PetscReal,PetscReal*,PetscReal*,PetscReal*);
70e660641SBarry Smith static PetscInt project(PetscInt,PetscReal*,PetscReal,PetscReal*,PetscReal*,PetscReal*,PetscReal*,PetscReal*,TAO_DF*);
8a7e14dcfSSatish Balay static PetscErrorCode solve(TAO_DF*);
9a7e14dcfSSatish Balay 
10a7e14dcfSSatish Balay 
11a7e14dcfSSatish Balay /*------------------------------------------------------------*/
12a7e14dcfSSatish Balay /* The main solver function
13a7e14dcfSSatish Balay 
14a7e14dcfSSatish Balay    f = Remp(W)          This is what the user provides us from the application layer
15a7e14dcfSSatish Balay    So the ComputeGradient function for instance should get us back the subgradient of Remp(W)
16a7e14dcfSSatish Balay 
17a7e14dcfSSatish Balay    Regularizer assumed to be L2 norm = lambda*0.5*W'W ()
18a7e14dcfSSatish Balay */
19a7e14dcfSSatish Balay 
20a7e14dcfSSatish Balay #undef __FUNCT__
21a7e14dcfSSatish Balay #define __FUNCT__ "make_grad_node"
22a7e14dcfSSatish Balay static PetscErrorCode make_grad_node(Vec X, Vec_Chain **p)
23a7e14dcfSSatish Balay {
24a7e14dcfSSatish Balay   PetscErrorCode ierr;
25a7e14dcfSSatish Balay 
26a7e14dcfSSatish Balay   PetscFunctionBegin;
270e660641SBarry Smith   ierr = PetscNew(p);CHKERRQ(ierr);
28a7e14dcfSSatish Balay   ierr = VecDuplicate(X, &(*p)->V);CHKERRQ(ierr);
29a7e14dcfSSatish Balay   ierr = VecCopy(X, (*p)->V);CHKERRQ(ierr);
306c23d075SBarry Smith   (*p)->next = NULL;
31a7e14dcfSSatish Balay   PetscFunctionReturn(0);
32a7e14dcfSSatish Balay }
33a7e14dcfSSatish Balay 
34a7e14dcfSSatish Balay #undef __FUNCT__
35a7e14dcfSSatish Balay #define __FUNCT__ "destroy_grad_list"
36a7e14dcfSSatish Balay static PetscErrorCode destroy_grad_list(Vec_Chain *head)
37a7e14dcfSSatish Balay {
38a7e14dcfSSatish Balay   PetscErrorCode ierr;
39a7e14dcfSSatish Balay   Vec_Chain      *p = head->next, *q;
40a7e14dcfSSatish Balay 
41a7e14dcfSSatish Balay   PetscFunctionBegin;
42a7e14dcfSSatish Balay   while(p) {
43a7e14dcfSSatish Balay     q = p->next;
44a7e14dcfSSatish Balay     ierr = VecDestroy(&p->V);CHKERRQ(ierr);
45a7e14dcfSSatish Balay     ierr = PetscFree(p);CHKERRQ(ierr);
46a7e14dcfSSatish Balay     p = q;
47a7e14dcfSSatish Balay   }
486c23d075SBarry Smith   head->next = NULL;
49a7e14dcfSSatish Balay   PetscFunctionReturn(0);
50a7e14dcfSSatish Balay }
51a7e14dcfSSatish Balay 
52a7e14dcfSSatish Balay 
53a7e14dcfSSatish Balay #undef __FUNCT__
54a7e14dcfSSatish Balay #define __FUNCT__ "TaoSolve_BMRM"
55441846f8SBarry Smith static PetscErrorCode TaoSolve_BMRM(Tao tao)
56a7e14dcfSSatish Balay {
57a7e14dcfSSatish Balay   PetscErrorCode     ierr;
58e4cb33bbSBarry Smith   TaoConvergedReason reason;
59a7e14dcfSSatish Balay   TAO_DF             df;
60a7e14dcfSSatish Balay   TAO_BMRM           *bmrm = (TAO_BMRM*)tao->data;
61a7e14dcfSSatish Balay 
62a7e14dcfSSatish Balay   /* Values and pointers to parts of the optimization problem */
63a7e14dcfSSatish Balay   PetscReal          f = 0.0;
64a7e14dcfSSatish Balay   Vec                W = tao->solution;
65a7e14dcfSSatish Balay   Vec                G = tao->gradient;
66a7e14dcfSSatish Balay   PetscReal          lambda;
67a7e14dcfSSatish Balay   PetscReal          bt;
68a7e14dcfSSatish Balay   Vec_Chain          grad_list, *tail_glist, *pgrad;
69a7e14dcfSSatish Balay   PetscInt           i;
70a7e14dcfSSatish Balay   PetscMPIInt        rank;
71a7e14dcfSSatish Balay 
72e4cb33bbSBarry Smith   /* Used in converged criteria check */
73a7e14dcfSSatish Balay   PetscReal          reg;
74a7e14dcfSSatish Balay   PetscReal          jtwt, max_jtwt, pre_epsilon, epsilon, jw, min_jw;
75a7e14dcfSSatish Balay   PetscReal          innerSolverTol;
76ba4b436cSBarry Smith   MPI_Comm           comm;
77a7e14dcfSSatish Balay 
78a7e14dcfSSatish Balay   PetscFunctionBegin;
79ba4b436cSBarry Smith   ierr = PetscObjectGetComm((PetscObject)tao,&comm);CHKERRQ(ierr);
80ba4b436cSBarry Smith   ierr = MPI_Comm_rank(comm, &rank);CHKERRQ(ierr);
81a7e14dcfSSatish Balay   lambda = bmrm->lambda;
82a7e14dcfSSatish Balay 
83a7e14dcfSSatish Balay   /* Check Stopping Condition */
84a7e14dcfSSatish Balay   tao->step = 1.0;
85a7e14dcfSSatish Balay   max_jtwt = -BMRM_INFTY;
86a7e14dcfSSatish Balay   min_jw = BMRM_INFTY;
87a7e14dcfSSatish Balay   innerSolverTol = 1.0;
88a7e14dcfSSatish Balay   epsilon = 0.0;
89a7e14dcfSSatish Balay 
900e660641SBarry Smith   if (!rank) {
91a7e14dcfSSatish Balay     ierr = init_df_solver(&df);CHKERRQ(ierr);
92a7e14dcfSSatish Balay     grad_list.next = NULL;
93a7e14dcfSSatish Balay     tail_glist = &grad_list;
94a7e14dcfSSatish Balay   }
95a7e14dcfSSatish Balay 
96a7e14dcfSSatish Balay   df.tol = 1e-6;
97a7e14dcfSSatish Balay   reason = TAO_CONTINUE_ITERATING;
98a7e14dcfSSatish Balay 
99a7e14dcfSSatish Balay   /*-----------------Algorithm Begins------------------------*/
100a7e14dcfSSatish Balay   /* make the scatter */
101a7e14dcfSSatish Balay   ierr = VecScatterCreateToZero(W, &bmrm->scatter, &bmrm->local_w);CHKERRQ(ierr);
102a7e14dcfSSatish Balay   ierr = VecAssemblyBegin(bmrm->local_w);CHKERRQ(ierr);
103a7e14dcfSSatish Balay   ierr = VecAssemblyEnd(bmrm->local_w);CHKERRQ(ierr);
104a7e14dcfSSatish Balay 
105a7e14dcfSSatish Balay   /* NOTE: In application pass the sub-gradient of Remp(W) */
106a7e14dcfSSatish Balay   ierr = TaoComputeObjectiveAndGradient(tao, W, &f, G);CHKERRQ(ierr);
107*8931d482SJason Sarich   ierr = TaoMonitor(tao,tao->niter,f,1.0,0.0,tao->step,&reason);CHKERRQ(ierr);
108a7e14dcfSSatish Balay   while (reason == TAO_CONTINUE_ITERATING) {
109a7e14dcfSSatish Balay     /* compute bt = Remp(Wt-1) - <Wt-1, At> */
110a7e14dcfSSatish Balay     ierr = VecDot(W, G, &bt);CHKERRQ(ierr);
111a7e14dcfSSatish Balay     bt = f - bt;
112a7e14dcfSSatish Balay 
113a7e14dcfSSatish Balay     /* First gather the gradient to the master node */
114a7e14dcfSSatish Balay     ierr = VecScatterBegin(bmrm->scatter, G, bmrm->local_w, INSERT_VALUES, SCATTER_FORWARD);CHKERRQ(ierr);
115a7e14dcfSSatish Balay     ierr = VecScatterEnd(bmrm->scatter, G, bmrm->local_w, INSERT_VALUES, SCATTER_FORWARD);CHKERRQ(ierr);
116a7e14dcfSSatish Balay 
117a7e14dcfSSatish Balay     /* Bring up the inner solver */
1180e660641SBarry Smith     if (!rank) {
119*8931d482SJason Sarich       ierr = ensure_df_space(tao->niter+1, &df); CHKERRQ(ierr);
120a7e14dcfSSatish Balay       ierr = make_grad_node(bmrm->local_w, &pgrad);CHKERRQ(ierr);
121a7e14dcfSSatish Balay       tail_glist->next = pgrad;
122a7e14dcfSSatish Balay       tail_glist = pgrad;
123a7e14dcfSSatish Balay 
124*8931d482SJason Sarich       df.a[tao->niter] = 1.0;
125*8931d482SJason Sarich       df.f[tao->niter] = -bt;
126*8931d482SJason Sarich       df.u[tao->niter] = 1.0;
127*8931d482SJason Sarich       df.l[tao->niter] = 0.0;
128a7e14dcfSSatish Balay 
129a7e14dcfSSatish Balay       /* set up the Q */
130a7e14dcfSSatish Balay       pgrad = grad_list.next;
131*8931d482SJason Sarich       for (i=0; i<=tao->niter; i++) {
132a7e14dcfSSatish Balay         ierr = VecDot(pgrad->V, bmrm->local_w, &reg);CHKERRQ(ierr);
133*8931d482SJason Sarich         df.Q[i][tao->niter] = df.Q[tao->niter][i] = reg / lambda;
134a7e14dcfSSatish Balay         pgrad = pgrad->next;
135a7e14dcfSSatish Balay       }
136a7e14dcfSSatish Balay 
137*8931d482SJason Sarich       if (tao->niter > 0) {
138*8931d482SJason Sarich         df.x[tao->niter] = 0.0;
139a7e14dcfSSatish Balay         ierr = solve(&df); CHKERRQ(ierr);
1400e660641SBarry Smith       } else
141a7e14dcfSSatish Balay         df.x[0] = 1.0;
142a7e14dcfSSatish Balay 
143a7e14dcfSSatish Balay       /* now computing Jt*(alpha_t) which should be = Jt(wt) to check convergence */
144a7e14dcfSSatish Balay       jtwt = 0.0;
145a7e14dcfSSatish Balay       ierr = VecSet(bmrm->local_w, 0.0); CHKERRQ(ierr);
146a7e14dcfSSatish Balay       pgrad = grad_list.next;
147*8931d482SJason Sarich       for (i=0; i<=tao->niter; i++) {
148a7e14dcfSSatish Balay         jtwt -= df.x[i] * df.f[i];
149a7e14dcfSSatish Balay         ierr = VecAXPY(bmrm->local_w, -df.x[i] / lambda, pgrad->V); CHKERRQ(ierr);
150a7e14dcfSSatish Balay         pgrad = pgrad->next;
151a7e14dcfSSatish Balay       }
152a7e14dcfSSatish Balay 
153a7e14dcfSSatish Balay       ierr = VecNorm(bmrm->local_w, NORM_2, &reg); CHKERRQ(ierr);
154a7e14dcfSSatish Balay       reg = 0.5*lambda*reg*reg;
155a7e14dcfSSatish Balay       jtwt -= reg;
156a7e14dcfSSatish Balay     } /* end if rank == 0 */
157a7e14dcfSSatish Balay 
158a7e14dcfSSatish Balay     /* scatter the new W to all nodes */
159a7e14dcfSSatish Balay     ierr = VecScatterBegin(bmrm->scatter,bmrm->local_w,W,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
160a7e14dcfSSatish Balay     ierr = VecScatterEnd(bmrm->scatter,bmrm->local_w,W,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
161a7e14dcfSSatish Balay 
162a7e14dcfSSatish Balay     ierr = TaoComputeObjectiveAndGradient(tao, W, &f, G);CHKERRQ(ierr);
163a7e14dcfSSatish Balay 
164ba4b436cSBarry Smith     ierr = MPI_Bcast(&jtwt,1,MPIU_REAL,0,comm);CHKERRQ(ierr);
165ba4b436cSBarry Smith     ierr = MPI_Bcast(&reg,1,MPIU_REAL,0,comm);CHKERRQ(ierr);
166a7e14dcfSSatish Balay 
167a7e14dcfSSatish Balay     jw = reg + f;                                       /* J(w) = regularizer + Remp(w) */
1680e660641SBarry Smith     if (jw < min_jw) min_jw = jw;
1690e660641SBarry Smith     if (jtwt > max_jtwt) max_jtwt = jtwt;
170a7e14dcfSSatish Balay 
171a7e14dcfSSatish Balay     pre_epsilon = epsilon;
172a7e14dcfSSatish Balay     epsilon = min_jw - jtwt;
173a7e14dcfSSatish Balay 
1740e660641SBarry Smith     if (!rank) {
1750e660641SBarry Smith       if (innerSolverTol > epsilon) innerSolverTol = epsilon;
1760e660641SBarry Smith       else if (innerSolverTol < 1e-7) innerSolverTol = 1e-7;
177a7e14dcfSSatish Balay 
178a7e14dcfSSatish Balay       /* if the annealing doesn't work well, lower the inner solver tolerance */
1790e660641SBarry Smith       if(pre_epsilon < epsilon) innerSolverTol *= 0.2;
180a7e14dcfSSatish Balay 
181a7e14dcfSSatish Balay       df.tol = innerSolverTol*0.5;
182a7e14dcfSSatish Balay     }
183a7e14dcfSSatish Balay 
184*8931d482SJason Sarich     tao->niter++;
185*8931d482SJason Sarich     ierr = TaoMonitor(tao,tao->niter,min_jw,epsilon,0.0,tao->step,&reason);CHKERRQ(ierr);
186a7e14dcfSSatish Balay   }
187a7e14dcfSSatish Balay 
188a7e14dcfSSatish Balay   /* free all the memory */
1890e660641SBarry Smith   if (!rank) {
190a7e14dcfSSatish Balay     ierr = destroy_grad_list(&grad_list);CHKERRQ(ierr);
191a7e14dcfSSatish Balay     ierr = destroy_df_solver(&df);CHKERRQ(ierr);
192a7e14dcfSSatish Balay   }
193a7e14dcfSSatish Balay 
194a7e14dcfSSatish Balay   ierr = VecDestroy(&bmrm->local_w);CHKERRQ(ierr);
195a7e14dcfSSatish Balay   ierr = VecScatterDestroy(&bmrm->scatter);CHKERRQ(ierr);
196a7e14dcfSSatish Balay   PetscFunctionReturn(0);
197a7e14dcfSSatish Balay }
198a7e14dcfSSatish Balay 
199a7e14dcfSSatish Balay 
200a7e14dcfSSatish Balay /* ---------------------------------------------------------- */
201a7e14dcfSSatish Balay 
202a7e14dcfSSatish Balay #undef __FUNCT__
203a7e14dcfSSatish Balay #define __FUNCT__ "TaoSetup_BMRM"
204441846f8SBarry Smith static PetscErrorCode TaoSetup_BMRM(Tao tao)
2050e660641SBarry Smith {
206a7e14dcfSSatish Balay 
207a7e14dcfSSatish Balay   PetscErrorCode ierr;
208a7e14dcfSSatish Balay 
209a7e14dcfSSatish Balay   PetscFunctionBegin;
210a7e14dcfSSatish Balay   /* Allocate some arrays */
211a7e14dcfSSatish Balay   if (!tao->gradient) {
212a7e14dcfSSatish Balay     ierr = VecDuplicate(tao->solution, &tao->gradient);   CHKERRQ(ierr);
213a7e14dcfSSatish Balay   }
214a7e14dcfSSatish Balay   PetscFunctionReturn(0);
215a7e14dcfSSatish Balay }
216a7e14dcfSSatish Balay 
217a7e14dcfSSatish Balay /*------------------------------------------------------------*/
218a7e14dcfSSatish Balay #undef __FUNCT__
219a7e14dcfSSatish Balay #define __FUNCT__ "TaoDestroy_BMRM"
220441846f8SBarry Smith static PetscErrorCode TaoDestroy_BMRM(Tao tao)
221a7e14dcfSSatish Balay {
222a7e14dcfSSatish Balay   PetscErrorCode ierr;
223a7e14dcfSSatish Balay 
224a7e14dcfSSatish Balay   PetscFunctionBegin;
225a7e14dcfSSatish Balay   ierr = PetscFree(tao->data);CHKERRQ(ierr);
226a7e14dcfSSatish Balay   PetscFunctionReturn(0);
227a7e14dcfSSatish Balay }
228a7e14dcfSSatish Balay 
229a7e14dcfSSatish Balay #undef __FUNCT__
230a7e14dcfSSatish Balay #define __FUNCT__ "TaoSetFromOptions_BMRM"
2318c34d3f5SBarry Smith static PetscErrorCode TaoSetFromOptions_BMRM(PetscOptions *PetscOptionsObject,Tao tao)
232a7e14dcfSSatish Balay {
233a7e14dcfSSatish Balay   PetscErrorCode ierr;
234a7e14dcfSSatish Balay   TAO_BMRM*      bmrm = (TAO_BMRM*)tao->data;
235a7e14dcfSSatish Balay 
236a7e14dcfSSatish Balay   PetscFunctionBegin;
2371a1499c8SBarry Smith   ierr = PetscOptionsHead(PetscOptionsObject,"BMRM for regularized risk minimization");CHKERRQ(ierr);
23894ae4db5SBarry Smith   ierr = PetscOptionsReal("-tao_bmrm_lambda", "regulariser weight","", 100,&bmrm->lambda,NULL); CHKERRQ(ierr);
239a7e14dcfSSatish Balay   ierr = PetscOptionsTail();CHKERRQ(ierr);
240a7e14dcfSSatish Balay   PetscFunctionReturn(0);
241a7e14dcfSSatish Balay }
242a7e14dcfSSatish Balay 
243a7e14dcfSSatish Balay /*------------------------------------------------------------*/
244a7e14dcfSSatish Balay #undef __FUNCT__
245a7e14dcfSSatish Balay #define __FUNCT__ "TaoView_BMRM"
246441846f8SBarry Smith static PetscErrorCode TaoView_BMRM(Tao tao, PetscViewer viewer)
247a7e14dcfSSatish Balay {
248a7e14dcfSSatish Balay   PetscBool      isascii;
249a7e14dcfSSatish Balay   PetscErrorCode ierr;
250a7e14dcfSSatish Balay 
251a7e14dcfSSatish Balay   PetscFunctionBegin;
252a7e14dcfSSatish Balay   ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&isascii);CHKERRQ(ierr);
253a7e14dcfSSatish Balay   if (isascii) {
254a7e14dcfSSatish Balay     ierr = PetscViewerASCIIPushTab(viewer);CHKERRQ(ierr);
255a7e14dcfSSatish Balay     ierr = PetscViewerASCIIPopTab(viewer);CHKERRQ(ierr);
256a7e14dcfSSatish Balay   }
257a7e14dcfSSatish Balay   PetscFunctionReturn(0);
258a7e14dcfSSatish Balay }
259a7e14dcfSSatish Balay 
260a7e14dcfSSatish Balay /*------------------------------------------------------------*/
2611522df2eSJason Sarich /*MC
2621522df2eSJason Sarich   TAOBMRM - bundle method for regularized risk minimization
2631522df2eSJason Sarich 
2641522df2eSJason Sarich   Options Database Keys:
2651522df2eSJason Sarich . - tao_bmrm_lambda - regulariser weight
2661522df2eSJason Sarich 
2671eb8069cSJason Sarich   Level: beginner
2681522df2eSJason Sarich M*/
2691522df2eSJason Sarich 
270a7e14dcfSSatish Balay #undef __FUNCT__
271a7e14dcfSSatish Balay #define __FUNCT__ "TaoCreate_BMRM"
272728e0ed0SBarry Smith PETSC_EXTERN PetscErrorCode TaoCreate_BMRM(Tao tao)
273a7e14dcfSSatish Balay {
274a7e14dcfSSatish Balay   TAO_BMRM       *bmrm;
275a7e14dcfSSatish Balay   PetscErrorCode ierr;
276a7e14dcfSSatish Balay 
277a7e14dcfSSatish Balay   PetscFunctionBegin;
278a7e14dcfSSatish Balay   tao->ops->setup = TaoSetup_BMRM;
279a7e14dcfSSatish Balay   tao->ops->solve = TaoSolve_BMRM;
280a7e14dcfSSatish Balay   tao->ops->view  = TaoView_BMRM;
281a7e14dcfSSatish Balay   tao->ops->setfromoptions = TaoSetFromOptions_BMRM;
282a7e14dcfSSatish Balay   tao->ops->destroy = TaoDestroy_BMRM;
283a7e14dcfSSatish Balay 
2843c9e27cfSGeoffrey Irving   ierr = PetscNewLog(tao,&bmrm);CHKERRQ(ierr);
285a7e14dcfSSatish Balay   bmrm->lambda = 1.0;
286a7e14dcfSSatish Balay   tao->data = (void*)bmrm;
287a7e14dcfSSatish Balay 
288a7e14dcfSSatish Balay   /* Note: May need to be tuned! */
289a7e14dcfSSatish Balay   tao->max_it = 2048;
290a7e14dcfSSatish Balay   tao->max_funcs = 300000;
291a7e14dcfSSatish Balay   tao->fatol = 1e-20;
292a7e14dcfSSatish Balay   tao->frtol = 1e-25;
293a7e14dcfSSatish Balay   tao->gatol = 1e-25;
294a7e14dcfSSatish Balay   tao->grtol = 1e-25;
295a7e14dcfSSatish Balay 
296a7e14dcfSSatish Balay   PetscFunctionReturn(0);
297a7e14dcfSSatish Balay }
298a7e14dcfSSatish Balay 
299a7e14dcfSSatish Balay #undef __FUNCT__
300a7e14dcfSSatish Balay #define __FUNCT__ "init_df_solver"
301a7e14dcfSSatish Balay PetscErrorCode init_df_solver(TAO_DF *df)
302a7e14dcfSSatish Balay {
303a7e14dcfSSatish Balay   PetscInt       i, n = INCRE_DIM;
304a7e14dcfSSatish Balay   PetscErrorCode ierr;
305a7e14dcfSSatish Balay 
306a7e14dcfSSatish Balay   PetscFunctionBegin;
307a7e14dcfSSatish Balay   /* default values */
308a7e14dcfSSatish Balay   df->maxProjIter = 200;
309a7e14dcfSSatish Balay   df->maxPGMIter = 300000;
310a7e14dcfSSatish Balay   df->b = 1.0;
311a7e14dcfSSatish Balay 
312a7e14dcfSSatish Balay   /* memory space required by Dai-Fletcher */
313a7e14dcfSSatish Balay   df->cur_num_cp = n;
3140e660641SBarry Smith   ierr = PetscMalloc1(n, &df->f); CHKERRQ(ierr);
3150e660641SBarry Smith   ierr = PetscMalloc1(n, &df->a); CHKERRQ(ierr);
3160e660641SBarry Smith   ierr = PetscMalloc1(n, &df->l); CHKERRQ(ierr);
3170e660641SBarry Smith   ierr = PetscMalloc1(n, &df->u); CHKERRQ(ierr);
3180e660641SBarry Smith   ierr = PetscMalloc1(n, &df->x); CHKERRQ(ierr);
319e1cc520bSBarry Smith   ierr = PetscMalloc1(n, &df->Q); CHKERRQ(ierr);
320a7e14dcfSSatish Balay 
321a7e14dcfSSatish Balay   for (i = 0; i < n; i ++) {
3220e660641SBarry Smith     ierr = PetscMalloc1(n, &df->Q[i]); CHKERRQ(ierr);
323a7e14dcfSSatish Balay   }
324a7e14dcfSSatish Balay 
3250e660641SBarry Smith   ierr = PetscMalloc1(n, &df->g); CHKERRQ(ierr);
3260e660641SBarry Smith   ierr = PetscMalloc1(n, &df->y); CHKERRQ(ierr);
3270e660641SBarry Smith   ierr = PetscMalloc1(n, &df->tempv); CHKERRQ(ierr);
3280e660641SBarry Smith   ierr = PetscMalloc1(n, &df->d); CHKERRQ(ierr);
3290e660641SBarry Smith   ierr = PetscMalloc1(n, &df->Qd); CHKERRQ(ierr);
3300e660641SBarry Smith   ierr = PetscMalloc1(n, &df->t); CHKERRQ(ierr);
3310e660641SBarry Smith   ierr = PetscMalloc1(n, &df->xplus); CHKERRQ(ierr);
3320e660641SBarry Smith   ierr = PetscMalloc1(n, &df->tplus); CHKERRQ(ierr);
3330e660641SBarry Smith   ierr = PetscMalloc1(n, &df->sk); CHKERRQ(ierr);
3340e660641SBarry Smith   ierr = PetscMalloc1(n, &df->yk); CHKERRQ(ierr);
335a7e14dcfSSatish Balay 
336e1cc520bSBarry Smith   ierr = PetscMalloc1(n, &df->ipt); CHKERRQ(ierr);
337e1cc520bSBarry Smith   ierr = PetscMalloc1(n, &df->ipt2); CHKERRQ(ierr);
338e1cc520bSBarry Smith   ierr = PetscMalloc1(n, &df->uv); CHKERRQ(ierr);
339a7e14dcfSSatish Balay   PetscFunctionReturn(0);
340a7e14dcfSSatish Balay }
341a7e14dcfSSatish Balay 
342a7e14dcfSSatish Balay #undef __FUNCT__
343a7e14dcfSSatish Balay #define __FUNCT__ "ensure_df_space"
344a7e14dcfSSatish Balay PetscErrorCode ensure_df_space(PetscInt dim, TAO_DF *df)
345a7e14dcfSSatish Balay {
346a7e14dcfSSatish Balay   PetscErrorCode ierr;
347a7e14dcfSSatish Balay   PetscReal      *tmp, **tmp_Q;
348a7e14dcfSSatish Balay   PetscInt       i, n, old_n;
349a7e14dcfSSatish Balay 
350a7e14dcfSSatish Balay   PetscFunctionBegin;
35153506e15SBarry Smith   df->dim = dim;
35253506e15SBarry Smith   if (dim <= df->cur_num_cp) PetscFunctionReturn(0);
353a7e14dcfSSatish Balay 
354a7e14dcfSSatish Balay   old_n = df->cur_num_cp;
355a7e14dcfSSatish Balay   df->cur_num_cp += INCRE_DIM;
356a7e14dcfSSatish Balay   n = df->cur_num_cp;
357a7e14dcfSSatish Balay 
358a7e14dcfSSatish Balay   /* memory space required by dai-fletcher */
3590e660641SBarry Smith   ierr = PetscMalloc1(n, &tmp); CHKERRQ(ierr);
360a7e14dcfSSatish Balay   ierr = PetscMemcpy(tmp, df->f, sizeof(PetscReal)*old_n); CHKERRQ(ierr);
361a7e14dcfSSatish Balay   ierr = PetscFree(df->f); CHKERRQ(ierr);
362a7e14dcfSSatish Balay   df->f = tmp;
363a7e14dcfSSatish Balay 
3640e660641SBarry Smith   ierr = PetscMalloc1(n, &tmp); CHKERRQ(ierr);
365a7e14dcfSSatish Balay   ierr = PetscMemcpy(tmp, df->a, sizeof(PetscReal)*old_n); CHKERRQ(ierr);
366a7e14dcfSSatish Balay   ierr = PetscFree(df->a); CHKERRQ(ierr);
367a7e14dcfSSatish Balay   df->a = tmp;
368a7e14dcfSSatish Balay 
3690e660641SBarry Smith   ierr = PetscMalloc1(n, &tmp); CHKERRQ(ierr);
370a7e14dcfSSatish Balay   ierr = PetscMemcpy(tmp, df->l, sizeof(PetscReal)*old_n); CHKERRQ(ierr);
371a7e14dcfSSatish Balay   ierr = PetscFree(df->l); CHKERRQ(ierr);
372a7e14dcfSSatish Balay   df->l = tmp;
373a7e14dcfSSatish Balay 
3740e660641SBarry Smith   ierr = PetscMalloc1(n, &tmp); CHKERRQ(ierr);
375a7e14dcfSSatish Balay   ierr = PetscMemcpy(tmp, df->u, sizeof(PetscReal)*old_n); CHKERRQ(ierr);
376a7e14dcfSSatish Balay   ierr = PetscFree(df->u); CHKERRQ(ierr);
377a7e14dcfSSatish Balay   df->u = tmp;
378a7e14dcfSSatish Balay 
3790e660641SBarry Smith   ierr = PetscMalloc1(n, &tmp); CHKERRQ(ierr);
380a7e14dcfSSatish Balay   ierr = PetscMemcpy(tmp, df->x, sizeof(PetscReal)*old_n); CHKERRQ(ierr);
381a7e14dcfSSatish Balay   ierr = PetscFree(df->x); CHKERRQ(ierr);
382a7e14dcfSSatish Balay   df->x = tmp;
383a7e14dcfSSatish Balay 
384e1cc520bSBarry Smith   ierr = PetscMalloc1(n, &tmp_Q); CHKERRQ(ierr);
38553506e15SBarry Smith   for (i = 0; i < n; i ++) {
3860e660641SBarry Smith     ierr = PetscMalloc1(n, &tmp_Q[i]); CHKERRQ(ierr);
38753506e15SBarry Smith     if (i < old_n) {
388a7e14dcfSSatish Balay       ierr = PetscMemcpy(tmp_Q[i], df->Q[i], sizeof(PetscReal)*old_n); CHKERRQ(ierr);
389a7e14dcfSSatish Balay       ierr = PetscFree(df->Q[i]); CHKERRQ(ierr);
390a7e14dcfSSatish Balay     }
391a7e14dcfSSatish Balay   }
392a7e14dcfSSatish Balay 
393a7e14dcfSSatish Balay   ierr = PetscFree(df->Q); CHKERRQ(ierr);
394a7e14dcfSSatish Balay   df->Q = tmp_Q;
395a7e14dcfSSatish Balay 
396a7e14dcfSSatish Balay   ierr = PetscFree(df->g); CHKERRQ(ierr);
3970e660641SBarry Smith   ierr = PetscMalloc1(n, &df->g); CHKERRQ(ierr);
398a7e14dcfSSatish Balay 
399a7e14dcfSSatish Balay   ierr = PetscFree(df->y); CHKERRQ(ierr);
4000e660641SBarry Smith   ierr = PetscMalloc1(n, &df->y); CHKERRQ(ierr);
401a7e14dcfSSatish Balay 
402a7e14dcfSSatish Balay   ierr = PetscFree(df->tempv); CHKERRQ(ierr);
4030e660641SBarry Smith   ierr = PetscMalloc1(n, &df->tempv); CHKERRQ(ierr);
404a7e14dcfSSatish Balay 
405a7e14dcfSSatish Balay   ierr = PetscFree(df->d); CHKERRQ(ierr);
4060e660641SBarry Smith   ierr = PetscMalloc1(n, &df->d); CHKERRQ(ierr);
407a7e14dcfSSatish Balay 
408a7e14dcfSSatish Balay   ierr = PetscFree(df->Qd); CHKERRQ(ierr);
4090e660641SBarry Smith   ierr = PetscMalloc1(n, &df->Qd); CHKERRQ(ierr);
410a7e14dcfSSatish Balay 
411a7e14dcfSSatish Balay   ierr = PetscFree(df->t); CHKERRQ(ierr);
4120e660641SBarry Smith   ierr = PetscMalloc1(n, &df->t); CHKERRQ(ierr);
413a7e14dcfSSatish Balay 
414a7e14dcfSSatish Balay   ierr = PetscFree(df->xplus); CHKERRQ(ierr);
4150e660641SBarry Smith   ierr = PetscMalloc1(n, &df->xplus); CHKERRQ(ierr);
416a7e14dcfSSatish Balay 
417a7e14dcfSSatish Balay   ierr = PetscFree(df->tplus); CHKERRQ(ierr);
4180e660641SBarry Smith   ierr = PetscMalloc1(n, &df->tplus); CHKERRQ(ierr);
419a7e14dcfSSatish Balay 
420a7e14dcfSSatish Balay   ierr = PetscFree(df->sk); CHKERRQ(ierr);
4210e660641SBarry Smith   ierr = PetscMalloc1(n, &df->sk); CHKERRQ(ierr);
422a7e14dcfSSatish Balay 
423a7e14dcfSSatish Balay   ierr = PetscFree(df->yk); CHKERRQ(ierr);
4240e660641SBarry Smith   ierr = PetscMalloc1(n, &df->yk); CHKERRQ(ierr);
425a7e14dcfSSatish Balay 
426a7e14dcfSSatish Balay   ierr = PetscFree(df->ipt); CHKERRQ(ierr);
427e1cc520bSBarry Smith   ierr = PetscMalloc1(n, &df->ipt); CHKERRQ(ierr);
428a7e14dcfSSatish Balay 
429a7e14dcfSSatish Balay   ierr = PetscFree(df->ipt2); CHKERRQ(ierr);
4300e660641SBarry Smith   ierr = PetscMalloc1(n, &df->ipt2); CHKERRQ(ierr);
431a7e14dcfSSatish Balay 
432a7e14dcfSSatish Balay   ierr = PetscFree(df->uv); CHKERRQ(ierr);
4330e660641SBarry Smith   ierr = PetscMalloc1(n, &df->uv); CHKERRQ(ierr);
434a7e14dcfSSatish Balay   PetscFunctionReturn(0);
435a7e14dcfSSatish Balay }
436a7e14dcfSSatish Balay 
437a7e14dcfSSatish Balay #undef __FUNCT__
438a7e14dcfSSatish Balay #define __FUNCT__ "destroy_df_solver"
439a7e14dcfSSatish Balay PetscErrorCode destroy_df_solver(TAO_DF *df)
440a7e14dcfSSatish Balay {
441a7e14dcfSSatish Balay   PetscErrorCode ierr;
442a7e14dcfSSatish Balay   PetscInt       i;
4436c23d075SBarry Smith 
444a7e14dcfSSatish Balay   PetscFunctionBegin;
4456c23d075SBarry Smith   ierr = PetscFree(df->f); CHKERRQ(ierr);
4466c23d075SBarry Smith   ierr = PetscFree(df->a); CHKERRQ(ierr);
4476c23d075SBarry Smith   ierr = PetscFree(df->l); CHKERRQ(ierr);
4486c23d075SBarry Smith   ierr = PetscFree(df->u); CHKERRQ(ierr);
4496c23d075SBarry Smith   ierr = PetscFree(df->x); CHKERRQ(ierr);
450a7e14dcfSSatish Balay 
4516c23d075SBarry Smith   for (i = 0; i < df->cur_num_cp; i ++) {
452a7e14dcfSSatish Balay     ierr = PetscFree(df->Q[i]); CHKERRQ(ierr);
453a7e14dcfSSatish Balay   }
454a7e14dcfSSatish Balay   ierr = PetscFree(df->Q); CHKERRQ(ierr);
4556c23d075SBarry Smith   ierr = PetscFree(df->ipt); CHKERRQ(ierr);
4566c23d075SBarry Smith   ierr = PetscFree(df->ipt2); CHKERRQ(ierr);
4576c23d075SBarry Smith   ierr = PetscFree(df->uv); CHKERRQ(ierr);
4586c23d075SBarry Smith   ierr = PetscFree(df->g); CHKERRQ(ierr);
4596c23d075SBarry Smith   ierr = PetscFree(df->y); CHKERRQ(ierr);
4606c23d075SBarry Smith   ierr = PetscFree(df->tempv); CHKERRQ(ierr);
4616c23d075SBarry Smith   ierr = PetscFree(df->d); CHKERRQ(ierr);
4626c23d075SBarry Smith   ierr = PetscFree(df->Qd); CHKERRQ(ierr);
4636c23d075SBarry Smith   ierr = PetscFree(df->t); CHKERRQ(ierr);
4646c23d075SBarry Smith   ierr = PetscFree(df->xplus); CHKERRQ(ierr);
4656c23d075SBarry Smith   ierr = PetscFree(df->tplus); CHKERRQ(ierr);
4666c23d075SBarry Smith   ierr = PetscFree(df->sk); CHKERRQ(ierr);
4676c23d075SBarry Smith   ierr = PetscFree(df->yk); CHKERRQ(ierr);
468a7e14dcfSSatish Balay   PetscFunctionReturn(0);
469a7e14dcfSSatish Balay }
470a7e14dcfSSatish Balay 
471a7e14dcfSSatish Balay /* Piecewise linear monotone target function for the Dai-Fletcher projector */
472a7e14dcfSSatish Balay #undef __FUNCT__
473a7e14dcfSSatish Balay #define __FUNCT__ "phi"
4746c23d075SBarry Smith PetscReal phi(PetscReal *x,PetscInt n,PetscReal lambda,PetscReal *a,PetscReal b,PetscReal *c,PetscReal *l,PetscReal *u)
475a7e14dcfSSatish Balay {
476a7e14dcfSSatish Balay   PetscReal r = 0.0;
477a7e14dcfSSatish Balay   PetscInt  i;
478a7e14dcfSSatish Balay 
479a7e14dcfSSatish Balay   for (i = 0; i < n; i++){
480a7e14dcfSSatish Balay     x[i] = -c[i] + lambda*a[i];
4816c23d075SBarry Smith     if (x[i] > u[i])     x[i] = u[i];
4826c23d075SBarry Smith     else if(x[i] < l[i]) x[i] = l[i];
483a7e14dcfSSatish Balay     r += a[i]*x[i];
484a7e14dcfSSatish Balay   }
485a7e14dcfSSatish Balay   return r - b;
486a7e14dcfSSatish Balay }
487a7e14dcfSSatish Balay 
488a7e14dcfSSatish Balay /** Modified Dai-Fletcher QP projector solves the problem:
489a7e14dcfSSatish Balay  *
490a7e14dcfSSatish Balay  *      minimise  0.5*x'*x - c'*x
491a7e14dcfSSatish Balay  *      subj to   a'*x = b
492a7e14dcfSSatish Balay  *                l \leq x \leq u
493a7e14dcfSSatish Balay  *
494a7e14dcfSSatish Balay  *  \param c The point to be projected onto feasible set
495a7e14dcfSSatish Balay  */
496a7e14dcfSSatish Balay #undef __FUNCT__
497a7e14dcfSSatish Balay #define __FUNCT__ "project"
4986c23d075SBarry Smith PetscInt project(PetscInt n,PetscReal *a,PetscReal b,PetscReal *c,PetscReal *l,PetscReal *u,PetscReal *x,PetscReal *lam_ext,TAO_DF *df)
499a7e14dcfSSatish Balay {
500a7e14dcfSSatish Balay   PetscReal      lambda, lambdal, lambdau, dlambda, lambda_new;
501a7e14dcfSSatish Balay   PetscReal      r, rl, ru, s;
502a7e14dcfSSatish Balay   PetscInt       innerIter;
503a7e14dcfSSatish Balay   PetscBool      nonNegativeSlack = PETSC_FALSE;
50453506e15SBarry Smith   PetscErrorCode ierr;
505a7e14dcfSSatish Balay 
506a7e14dcfSSatish Balay   *lam_ext = 0;
507a7e14dcfSSatish Balay   lambda  = 0;
508a7e14dcfSSatish Balay   dlambda = 0.5;
509a7e14dcfSSatish Balay   innerIter = 1;
510a7e14dcfSSatish Balay 
511a7e14dcfSSatish Balay   /*  \phi(x;lambda) := 0.5*x'*x + c'*x - lambda*(a'*x-b)
512a7e14dcfSSatish Balay    *
513a7e14dcfSSatish Balay    *  Optimality conditions for \phi:
514a7e14dcfSSatish Balay    *
515a7e14dcfSSatish Balay    *  1. lambda   <= 0
516a7e14dcfSSatish Balay    *  2. r        <= 0
517a7e14dcfSSatish Balay    *  3. r*lambda == 0
518a7e14dcfSSatish Balay    */
519a7e14dcfSSatish Balay 
520a7e14dcfSSatish Balay   /* Bracketing Phase */
521a7e14dcfSSatish Balay   r = phi(x, n, lambda, a, b, c, l, u);
522a7e14dcfSSatish Balay 
5236c23d075SBarry Smith   if(nonNegativeSlack) {
524a7e14dcfSSatish Balay     /* inequality constraint, i.e., with \xi >= 0 constraint */
52553506e15SBarry Smith     if (r < TOL_R) return 0;
5266c23d075SBarry Smith   } else  {
527a7e14dcfSSatish Balay     /* equality constraint ,i.e., without \xi >= 0 constraint */
52853506e15SBarry Smith     if (fabs(r) < TOL_R) return 0;
529a7e14dcfSSatish Balay   }
530a7e14dcfSSatish Balay 
531a7e14dcfSSatish Balay   if (r < 0.0){
532a7e14dcfSSatish Balay     lambdal = lambda;
533a7e14dcfSSatish Balay     rl      = r;
534a7e14dcfSSatish Balay     lambda  = lambda + dlambda;
535a7e14dcfSSatish Balay     r       = phi(x, n, lambda, a, b, c, l, u);
536a7e14dcfSSatish Balay     while (r < 0.0 && dlambda < BMRM_INFTY)  {
537a7e14dcfSSatish Balay       lambdal = lambda;
538a7e14dcfSSatish Balay       s       = rl/r - 1.0;
539a7e14dcfSSatish Balay       if (s < 0.1) s = 0.1;
540a7e14dcfSSatish Balay       dlambda = dlambda + dlambda/s;
541a7e14dcfSSatish Balay       lambda  = lambda + dlambda;
542a7e14dcfSSatish Balay       rl      = r;
543a7e14dcfSSatish Balay       r       = phi(x, n, lambda, a, b, c, l, u);
544a7e14dcfSSatish Balay     }
545a7e14dcfSSatish Balay     lambdau = lambda;
546a7e14dcfSSatish Balay     ru      = r;
5476c23d075SBarry Smith   } else {
548a7e14dcfSSatish Balay     lambdau = lambda;
549a7e14dcfSSatish Balay     ru      = r;
550a7e14dcfSSatish Balay     lambda  = lambda - dlambda;
551a7e14dcfSSatish Balay     r       = phi(x, n, lambda, a, b, c, l, u);
552a7e14dcfSSatish Balay     while (r > 0.0 && dlambda > -BMRM_INFTY) {
553a7e14dcfSSatish Balay       lambdau = lambda;
554a7e14dcfSSatish Balay       s       = ru/r - 1.0;
555a7e14dcfSSatish Balay       if (s < 0.1) s = 0.1;
556a7e14dcfSSatish Balay       dlambda = dlambda + dlambda/s;
557a7e14dcfSSatish Balay       lambda  = lambda - dlambda;
558a7e14dcfSSatish Balay       ru      = r;
559a7e14dcfSSatish Balay       r       = phi(x, n, lambda, a, b, c, l, u);
560a7e14dcfSSatish Balay     }
561a7e14dcfSSatish Balay     lambdal = lambda;
562a7e14dcfSSatish Balay     rl      = r;
563a7e14dcfSSatish Balay   }
564a7e14dcfSSatish Balay 
5656c23d075SBarry Smith   if(fabs(dlambda) > BMRM_INFTY) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"L2N2_DaiFletcherPGM detected Infeasible QP problem!");
566a7e14dcfSSatish Balay 
567a7e14dcfSSatish Balay   if(ru == 0){
568a7e14dcfSSatish Balay     lambda = lambdau;
569a7e14dcfSSatish Balay     r = phi(x, n, lambda, a, b, c, l, u);
570a7e14dcfSSatish Balay     return innerIter;
571a7e14dcfSSatish Balay   }
572a7e14dcfSSatish Balay 
573a7e14dcfSSatish Balay   /* Secant Phase */
574a7e14dcfSSatish Balay   s       = 1.0 - rl/ru;
575a7e14dcfSSatish Balay   dlambda = dlambda/s;
576a7e14dcfSSatish Balay   lambda  = lambdau - dlambda;
577a7e14dcfSSatish Balay   r       = phi(x, n, lambda, a, b, c, l, u);
578a7e14dcfSSatish Balay 
579a7e14dcfSSatish Balay   while (fabs(r) > TOL_R
580a7e14dcfSSatish Balay          && dlambda > TOL_LAM * (1.0 + fabs(lambda))
581a7e14dcfSSatish Balay          && innerIter < df->maxProjIter){
582a7e14dcfSSatish Balay     innerIter++;
583a7e14dcfSSatish Balay     if (r > 0.0){
584a7e14dcfSSatish Balay       if (s <= 2.0){
585a7e14dcfSSatish Balay         lambdau = lambda;
586a7e14dcfSSatish Balay         ru      = r;
587a7e14dcfSSatish Balay         s       = 1.0 - rl/ru;
588a7e14dcfSSatish Balay         dlambda = (lambdau - lambdal) / s;
589a7e14dcfSSatish Balay         lambda  = lambdau - dlambda;
59053506e15SBarry Smith       } else {
591a7e14dcfSSatish Balay         s          = ru/r-1.0;
592a7e14dcfSSatish Balay         if (s < 0.1) s = 0.1;
593a7e14dcfSSatish Balay         dlambda    = (lambdau - lambda) / s;
594a7e14dcfSSatish Balay         lambda_new = 0.75*lambdal + 0.25*lambda;
595a7e14dcfSSatish Balay         if (lambda_new < (lambda - dlambda))
596a7e14dcfSSatish Balay           lambda_new = lambda - dlambda;
597a7e14dcfSSatish Balay         lambdau    = lambda;
598a7e14dcfSSatish Balay         ru         = r;
599a7e14dcfSSatish Balay         lambda     = lambda_new;
600a7e14dcfSSatish Balay         s          = (lambdau - lambdal) / (lambdau - lambda);
601a7e14dcfSSatish Balay       }
60253506e15SBarry Smith     } else {
603a7e14dcfSSatish Balay       if (s >= 2.0){
604a7e14dcfSSatish Balay         lambdal = lambda;
605a7e14dcfSSatish Balay         rl      = r;
606a7e14dcfSSatish Balay         s       = 1.0 - rl/ru;
607a7e14dcfSSatish Balay         dlambda = (lambdau - lambdal) / s;
608a7e14dcfSSatish Balay         lambda  = lambdau - dlambda;
60953506e15SBarry Smith       } else {
610a7e14dcfSSatish Balay         s          = rl/r - 1.0;
611a7e14dcfSSatish Balay         if (s < 0.1) s = 0.1;
612a7e14dcfSSatish Balay         dlambda    = (lambda-lambdal) / s;
613a7e14dcfSSatish Balay         lambda_new = 0.75*lambdau + 0.25*lambda;
614a7e14dcfSSatish Balay         if (lambda_new > (lambda + dlambda))
615a7e14dcfSSatish Balay           lambda_new = lambda + dlambda;
616a7e14dcfSSatish Balay         lambdal    = lambda;
617a7e14dcfSSatish Balay         rl         = r;
618a7e14dcfSSatish Balay         lambda     = lambda_new;
619a7e14dcfSSatish Balay         s          = (lambdau - lambdal) / (lambdau-lambda);
620a7e14dcfSSatish Balay       }
621a7e14dcfSSatish Balay     }
622a7e14dcfSSatish Balay     r = phi(x, n, lambda, a, b, c, l, u);
623a7e14dcfSSatish Balay   }
624a7e14dcfSSatish Balay 
625a7e14dcfSSatish Balay   *lam_ext = lambda;
62653506e15SBarry Smith   if(innerIter >= df->maxProjIter) {
62753506e15SBarry Smith     ierr = PetscPrintf(PETSC_COMM_SELF, "WARNING: DaiFletcher max iterations\n");CHKERRQ(ierr);
62853506e15SBarry Smith   }
629a7e14dcfSSatish Balay   return innerIter;
630a7e14dcfSSatish Balay }
631a7e14dcfSSatish Balay 
632a7e14dcfSSatish Balay 
633a7e14dcfSSatish Balay #undef __FUNCT__
634a7e14dcfSSatish Balay #define __FUNCT__ "solve"
635a7e14dcfSSatish Balay PetscErrorCode solve(TAO_DF *df)
636a7e14dcfSSatish Balay {
637a7e14dcfSSatish Balay   PetscErrorCode ierr;
638a7e14dcfSSatish Balay   PetscInt       i, j, innerIter, it, it2, luv, info, lscount = 0, projcount = 0;
639a7e14dcfSSatish Balay   PetscReal      gd, max, ak, bk, akold, bkold, lamnew, alpha, kktlam=0.0, lam_ext;
640a7e14dcfSSatish Balay   PetscReal      DELTAsv, ProdDELTAsv;
641a7e14dcfSSatish Balay   PetscReal      c, *tempQ;
642a7e14dcfSSatish Balay   PetscReal      *x = df->x, *a = df->a, b = df->b, *l = df->l, *u = df->u, tol = df->tol;
643a7e14dcfSSatish Balay   PetscReal      *tempv = df->tempv, *y = df->y, *g = df->g, *d = df->d, *Qd = df->Qd;
644a7e14dcfSSatish Balay   PetscReal      *xplus = df->xplus, *tplus = df->tplus, *sk = df->sk, *yk = df->yk;
645a7e14dcfSSatish Balay   PetscReal      **Q = df->Q, *f = df->f, *t = df->t;
646a7e14dcfSSatish Balay   PetscInt       dim = df->dim, *ipt = df->ipt, *ipt2 = df->ipt2, *uv = df->uv;
647a7e14dcfSSatish Balay 
648a7e14dcfSSatish Balay   /*** variables for the adaptive nonmonotone linesearch ***/
649a7e14dcfSSatish Balay   PetscInt    L, llast;
650a7e14dcfSSatish Balay   PetscReal   fr, fbest, fv, fc, fv0;
65153506e15SBarry Smith 
652a7e14dcfSSatish Balay   c = BMRM_INFTY;
653a7e14dcfSSatish Balay 
654a7e14dcfSSatish Balay   DELTAsv = EPS_SV;
65553506e15SBarry Smith   if (tol <= 1.0e-5 || dim <= 20) ProdDELTAsv = 0.0F;
65653506e15SBarry Smith   else  ProdDELTAsv = EPS_SV;
657a7e14dcfSSatish Balay 
65853506e15SBarry Smith   for (i = 0; i < dim; i++)  tempv[i] = -x[i];
659a7e14dcfSSatish Balay 
660a7e14dcfSSatish Balay   lam_ext = 0.0;
661a7e14dcfSSatish Balay 
662a7e14dcfSSatish Balay   /* Project the initial solution */
663a7e14dcfSSatish Balay   projcount += project(dim, a, b, tempv, l, u, x, &lam_ext, df);
664a7e14dcfSSatish Balay 
665a7e14dcfSSatish Balay   /* Compute gradient
666a7e14dcfSSatish Balay      g = Q*x + f; */
667a7e14dcfSSatish Balay 
668a7e14dcfSSatish Balay   it = 0;
66953506e15SBarry Smith   for (i = 0; i < dim; i++) {
67053506e15SBarry Smith     if (fabs(x[i]) > ProdDELTAsv) ipt[it++] = i;
67153506e15SBarry Smith   }
672a7e14dcfSSatish Balay 
673a7e14dcfSSatish Balay   ierr = PetscMemzero(t, dim*sizeof(PetscReal)); CHKERRQ(ierr);
674a7e14dcfSSatish Balay   for (i = 0; i < it; i++){
675a7e14dcfSSatish Balay     tempQ = Q[ipt[i]];
67653506e15SBarry Smith     for (j = 0; j < dim; j++) t[j] += (tempQ[j]*x[ipt[i]]);
677a7e14dcfSSatish Balay   }
678a7e14dcfSSatish Balay   for (i = 0; i < dim; i++){
679a7e14dcfSSatish Balay     g[i] = t[i] + f[i];
680a7e14dcfSSatish Balay   }
681a7e14dcfSSatish Balay 
682a7e14dcfSSatish Balay 
683a7e14dcfSSatish Balay   /* y = -(x_{k} - g_{k}) */
684a7e14dcfSSatish Balay   for (i = 0; i < dim; i++){
685a7e14dcfSSatish Balay     y[i] = g[i] - x[i];
686a7e14dcfSSatish Balay   }
687a7e14dcfSSatish Balay 
688a7e14dcfSSatish Balay   /* Project x_{k} - g_{k} */
689a7e14dcfSSatish Balay   projcount += project(dim, a, b, y, l, u, tempv, &lam_ext, df);
690a7e14dcfSSatish Balay 
691a7e14dcfSSatish Balay   /* y = P(x_{k} - g_{k}) - x_{k} */
692a7e14dcfSSatish Balay   max = ALPHA_MIN;
693a7e14dcfSSatish Balay   for (i = 0; i < dim; i++){
694a7e14dcfSSatish Balay     y[i] = tempv[i] - x[i];
69553506e15SBarry Smith     if (fabs(y[i]) > max) max = fabs(y[i]);
696a7e14dcfSSatish Balay   }
697a7e14dcfSSatish Balay 
698a7e14dcfSSatish Balay   if (max < tol*1e-3){
699a7e14dcfSSatish Balay     lscount = 0;
700a7e14dcfSSatish Balay     innerIter    = 0;
701a7e14dcfSSatish Balay     return 0;
702a7e14dcfSSatish Balay   }
703a7e14dcfSSatish Balay 
704a7e14dcfSSatish Balay   alpha = 1.0 / max;
705a7e14dcfSSatish Balay 
706a7e14dcfSSatish Balay   /* fv0 = f(x_{0}). Recall t = Q x_{k}  */
707a7e14dcfSSatish Balay   fv0   = 0.0;
70853506e15SBarry Smith   for (i = 0; i < dim; i++) fv0 += x[i] * (0.5*t[i] + f[i]);
709a7e14dcfSSatish Balay 
710a7e14dcfSSatish Balay   /*** adaptive nonmonotone linesearch ***/
711a7e14dcfSSatish Balay   L     = 2;
712a7e14dcfSSatish Balay   fr    = ALPHA_MAX;
713a7e14dcfSSatish Balay   fbest = fv0;
714a7e14dcfSSatish Balay   fc    = fv0;
715a7e14dcfSSatish Balay   llast = 0;
716a7e14dcfSSatish Balay   akold = bkold = 0.0;
717a7e14dcfSSatish Balay 
718a7e14dcfSSatish Balay   /***      Iterator begins     ***/
719a7e14dcfSSatish Balay   for (innerIter = 1; innerIter <= df->maxPGMIter; innerIter++) {
720a7e14dcfSSatish Balay 
721a7e14dcfSSatish Balay     /* tempv = -(x_{k} - alpha*g_{k}) */
72253506e15SBarry Smith     for (i = 0; i < dim; i++)  tempv[i] = alpha*g[i] - x[i];
723a7e14dcfSSatish Balay 
724a7e14dcfSSatish Balay     /* Project x_{k} - alpha*g_{k} */
725a7e14dcfSSatish Balay     projcount += project(dim, a, b, tempv, l, u, y, &lam_ext, df);
726a7e14dcfSSatish Balay 
727a7e14dcfSSatish Balay 
728a7e14dcfSSatish Balay     /* gd = \inner{d_{k}}{g_{k}}
729a7e14dcfSSatish Balay         d = P(x_{k} - alpha*g_{k}) - x_{k}
730a7e14dcfSSatish Balay     */
731a7e14dcfSSatish Balay     gd = 0.0;
732a7e14dcfSSatish Balay     for (i = 0; i < dim; i++){
733a7e14dcfSSatish Balay       d[i] = y[i] - x[i];
734a7e14dcfSSatish Balay       gd  += d[i] * g[i];
735a7e14dcfSSatish Balay     }
736a7e14dcfSSatish Balay 
737a7e14dcfSSatish Balay     /* Gradient computation  */
738a7e14dcfSSatish Balay 
739a7e14dcfSSatish Balay     /* compute Qd = Q*d  or  Qd = Q*y - t depending on their sparsity */
740a7e14dcfSSatish Balay 
741a7e14dcfSSatish Balay     it = it2 = 0;
74253506e15SBarry Smith     for (i = 0; i < dim; i++){
74353506e15SBarry Smith       if (fabs(d[i]) > (ProdDELTAsv*1.0e-2)) ipt[it++]   = i;
74453506e15SBarry Smith     }
74553506e15SBarry Smith     for (i = 0; i < dim; i++) {
74653506e15SBarry Smith       if (fabs(y[i]) > ProdDELTAsv) ipt2[it2++] = i;
74753506e15SBarry Smith     }
748a7e14dcfSSatish Balay 
749a7e14dcfSSatish Balay     ierr = PetscMemzero(Qd, dim*sizeof(PetscReal)); CHKERRQ(ierr);
750a7e14dcfSSatish Balay     /* compute Qd = Q*d */
751a7e14dcfSSatish Balay     if (it < it2){
752a7e14dcfSSatish Balay       for (i = 0; i < it; i++){
753a7e14dcfSSatish Balay         tempQ = Q[ipt[i]];
75453506e15SBarry Smith         for (j = 0; j < dim; j++) Qd[j] += (tempQ[j] * d[ipt[i]]);
755a7e14dcfSSatish Balay       }
75653506e15SBarry Smith     } else { /* compute Qd = Q*y-t */
757a7e14dcfSSatish Balay       for (i = 0; i < it2; i++){
758a7e14dcfSSatish Balay         tempQ = Q[ipt2[i]];
75953506e15SBarry Smith         for (j = 0; j < dim; j++) Qd[j] += (tempQ[j] * y[ipt2[i]]);
760a7e14dcfSSatish Balay       }
76153506e15SBarry Smith       for (j = 0; j < dim; j++) Qd[j] -= t[j];
762a7e14dcfSSatish Balay     }
763a7e14dcfSSatish Balay 
764a7e14dcfSSatish Balay     /* ak = inner{d_{k}}{d_{k}} */
765a7e14dcfSSatish Balay     ak = 0.0;
76653506e15SBarry Smith     for (i = 0; i < dim; i++) ak += d[i] * d[i];
767a7e14dcfSSatish Balay 
768a7e14dcfSSatish Balay     bk = 0.0;
76953506e15SBarry Smith     for (i = 0; i < dim; i++) bk += d[i]*Qd[i];
770a7e14dcfSSatish Balay 
77153506e15SBarry Smith     if (bk > EPS*ak && gd < 0.0)  lamnew = -gd/bk;
77253506e15SBarry Smith     else lamnew = 1.0;
773a7e14dcfSSatish Balay 
774a7e14dcfSSatish Balay     /* fv is computing f(x_{k} + d_{k}) */
775a7e14dcfSSatish Balay     fv = 0.0;
776a7e14dcfSSatish Balay     for (i = 0; i < dim; i++){
777a7e14dcfSSatish Balay       xplus[i] = x[i] + d[i];
778a7e14dcfSSatish Balay       tplus[i] = t[i] + Qd[i];
779a7e14dcfSSatish Balay       fv      += xplus[i] * (0.5*tplus[i] + f[i]);
780a7e14dcfSSatish Balay     }
781a7e14dcfSSatish Balay 
782a7e14dcfSSatish Balay     /* fr is fref */
783a7e14dcfSSatish Balay     if ((innerIter == 1 && fv >= fv0) || (innerIter > 1 && fv >= fr)){
784a7e14dcfSSatish Balay       lscount++;
785a7e14dcfSSatish Balay       fv = 0.0;
786a7e14dcfSSatish Balay       for (i = 0; i < dim; i++){
787a7e14dcfSSatish Balay         xplus[i] = x[i] + lamnew*d[i];
788a7e14dcfSSatish Balay         tplus[i] = t[i] + lamnew*Qd[i];
789a7e14dcfSSatish Balay         fv      += xplus[i] * (0.5*tplus[i] + f[i]);
790a7e14dcfSSatish Balay       }
791a7e14dcfSSatish Balay     }
792a7e14dcfSSatish Balay 
793a7e14dcfSSatish Balay     for (i = 0; i < dim; i++){
794a7e14dcfSSatish Balay       sk[i] = xplus[i] - x[i];
795a7e14dcfSSatish Balay       yk[i] = tplus[i] - t[i];
796a7e14dcfSSatish Balay       x[i]  = xplus[i];
797a7e14dcfSSatish Balay       t[i]  = tplus[i];
798a7e14dcfSSatish Balay       g[i]  = t[i] + f[i];
799a7e14dcfSSatish Balay     }
800a7e14dcfSSatish Balay 
801a7e14dcfSSatish Balay     /* update the line search control parameters */
802a7e14dcfSSatish Balay     if (fv < fbest){
803a7e14dcfSSatish Balay       fbest = fv;
804a7e14dcfSSatish Balay       fc    = fv;
805a7e14dcfSSatish Balay       llast = 0;
80653506e15SBarry Smith     } else {
807a7e14dcfSSatish Balay       fc = (fc > fv ? fc : fv);
808a7e14dcfSSatish Balay       llast++;
809a7e14dcfSSatish Balay       if (llast == L){
810a7e14dcfSSatish Balay         fr    = fc;
811a7e14dcfSSatish Balay         fc    = fv;
812a7e14dcfSSatish Balay         llast = 0;
813a7e14dcfSSatish Balay       }
814a7e14dcfSSatish Balay     }
815a7e14dcfSSatish Balay 
816a7e14dcfSSatish Balay     ak = bk = 0.0;
817a7e14dcfSSatish Balay     for (i = 0; i < dim; i++){
818a7e14dcfSSatish Balay       ak += sk[i] * sk[i];
819a7e14dcfSSatish Balay       bk += sk[i] * yk[i];
820a7e14dcfSSatish Balay     }
821a7e14dcfSSatish Balay 
82253506e15SBarry Smith     if (bk <= EPS*ak) alpha = ALPHA_MAX;
823a7e14dcfSSatish Balay     else {
82453506e15SBarry Smith       if (bkold < EPS*akold) alpha = ak/bk;
82553506e15SBarry Smith       else alpha = (akold+ak)/(bkold+bk);
826a7e14dcfSSatish Balay 
82753506e15SBarry Smith       if (alpha > ALPHA_MAX) alpha = ALPHA_MAX;
82853506e15SBarry Smith       else if (alpha < ALPHA_MIN) alpha = ALPHA_MIN;
829a7e14dcfSSatish Balay     }
830a7e14dcfSSatish Balay 
831a7e14dcfSSatish Balay     akold = ak;
832a7e14dcfSSatish Balay     bkold = bk;
833a7e14dcfSSatish Balay 
834a7e14dcfSSatish Balay     /*** stopping criterion based on KKT conditions ***/
835a7e14dcfSSatish Balay     /* at optimal, gradient of lagrangian w.r.t. x is zero */
836a7e14dcfSSatish Balay 
837a7e14dcfSSatish Balay     bk = 0.0;
83853506e15SBarry Smith     for (i = 0; i < dim; i++) bk +=  x[i] * x[i];
839a7e14dcfSSatish Balay 
84053506e15SBarry Smith     if (PetscSqrtReal(ak) < tol*10 * PetscSqrtReal(bk)){
841a7e14dcfSSatish Balay       it     = 0;
842a7e14dcfSSatish Balay       luv    = 0;
843a7e14dcfSSatish Balay       kktlam = 0.0;
844a7e14dcfSSatish Balay       for (i = 0; i < dim; i++){
845a7e14dcfSSatish Balay         /* x[i] is active hence lagrange multipliers for box constraints
846a7e14dcfSSatish Balay                 are zero. The lagrange multiplier for ineq. const. is then
847a7e14dcfSSatish Balay                 defined as below
848a7e14dcfSSatish Balay         */
849a7e14dcfSSatish Balay         if ((x[i] > DELTAsv) && (x[i] < c-DELTAsv)){
850a7e14dcfSSatish Balay           ipt[it++] = i;
851a7e14dcfSSatish Balay           kktlam    = kktlam - a[i]*g[i];
85253506e15SBarry Smith         } else  uv[luv++] = i;
853a7e14dcfSSatish Balay       }
854a7e14dcfSSatish Balay 
85553506e15SBarry Smith       if (it == 0 && PetscSqrtReal(ak) < tol*0.5 * PetscSqrtReal(bk)) return 0;
856a7e14dcfSSatish Balay       else {
857a7e14dcfSSatish Balay         kktlam = kktlam/it;
858a7e14dcfSSatish Balay         info   = 1;
859a7e14dcfSSatish Balay         for (i = 0; i < it; i++) {
860a7e14dcfSSatish Balay           if (fabs(a[ipt[i]] * g[ipt[i]] + kktlam) > tol) {
861a7e14dcfSSatish Balay             info = 0;
862a7e14dcfSSatish Balay             break;
863a7e14dcfSSatish Balay           }
864a7e14dcfSSatish Balay         }
865a7e14dcfSSatish Balay         if (info == 1)  {
866a7e14dcfSSatish Balay           for (i = 0; i < luv; i++)  {
867a7e14dcfSSatish Balay             if (x[uv[i]] <= DELTAsv){
868a7e14dcfSSatish Balay               /* x[i] == lower bound, hence, lagrange multiplier (say, beta) for lower bound may
869a7e14dcfSSatish Balay                      not be zero. So, the gradient without beta is > 0
870a7e14dcfSSatish Balay               */
871a7e14dcfSSatish Balay               if (g[uv[i]] + kktlam*a[uv[i]] < -tol){
872a7e14dcfSSatish Balay                 info = 0;
873a7e14dcfSSatish Balay                 break;
874a7e14dcfSSatish Balay               }
87553506e15SBarry Smith             } else {
876a7e14dcfSSatish Balay               /* x[i] == upper bound, hence, lagrange multiplier (say, eta) for upper bound may
877a7e14dcfSSatish Balay                      not be zero. So, the gradient without eta is < 0
878a7e14dcfSSatish Balay               */
879a7e14dcfSSatish Balay               if (g[uv[i]] + kktlam*a[uv[i]] > tol) {
880a7e14dcfSSatish Balay                 info = 0;
881a7e14dcfSSatish Balay                 break;
882a7e14dcfSSatish Balay               }
883a7e14dcfSSatish Balay             }
884a7e14dcfSSatish Balay           }
885a7e14dcfSSatish Balay         }
886a7e14dcfSSatish Balay 
88753506e15SBarry Smith         if (info == 1) return 0;
888a7e14dcfSSatish Balay       }
889a7e14dcfSSatish Balay     }
890a7e14dcfSSatish Balay   }
891a7e14dcfSSatish Balay   return 0;
892a7e14dcfSSatish Balay }
893a7e14dcfSSatish Balay 
894a7e14dcfSSatish Balay 
895