xref: /petsc/src/tao/unconstrained/impls/bmrm/bmrm.c (revision 2a80812038b9881e71d725c7f5a502aeff50e549)
1aaa7dc30SBarry Smith #include <../src/tao/unconstrained/impls/bmrm/bmrm.h>
2a7e14dcfSSatish Balay 
3a7e14dcfSSatish Balay static PetscErrorCode init_df_solver(TAO_DF*);
4a7e14dcfSSatish Balay static PetscErrorCode ensure_df_space(PetscInt, TAO_DF*);
5a7e14dcfSSatish Balay static PetscErrorCode destroy_df_solver(TAO_DF*);
60e660641SBarry Smith static PetscReal phi(PetscReal*,PetscInt,PetscReal,PetscReal*,PetscReal,PetscReal*,PetscReal*,PetscReal*);
70e660641SBarry Smith static PetscInt project(PetscInt,PetscReal*,PetscReal,PetscReal*,PetscReal*,PetscReal*,PetscReal*,PetscReal*,TAO_DF*);
8a7e14dcfSSatish Balay static PetscErrorCode solve(TAO_DF*);
9a7e14dcfSSatish Balay 
10a7e14dcfSSatish Balay 
11a7e14dcfSSatish Balay /*------------------------------------------------------------*/
/* The main solver function

   f = Remp(W) is what the user provides from the application layer, so the
   ComputeGradient function, for instance, should return a subgradient of Remp(W).

   The regularizer is assumed to be the squared L2 norm: lambda*0.5*W'W
*/
19a7e14dcfSSatish Balay 
20a7e14dcfSSatish Balay #undef __FUNCT__
21a7e14dcfSSatish Balay #define __FUNCT__ "make_grad_node"
22a7e14dcfSSatish Balay static PetscErrorCode make_grad_node(Vec X, Vec_Chain **p)
23a7e14dcfSSatish Balay {
24a7e14dcfSSatish Balay   PetscErrorCode ierr;
25a7e14dcfSSatish Balay 
26a7e14dcfSSatish Balay   PetscFunctionBegin;
270e660641SBarry Smith   ierr = PetscNew(p);CHKERRQ(ierr);
28a7e14dcfSSatish Balay   ierr = VecDuplicate(X, &(*p)->V);CHKERRQ(ierr);
29a7e14dcfSSatish Balay   ierr = VecCopy(X, (*p)->V);CHKERRQ(ierr);
306c23d075SBarry Smith   (*p)->next = NULL;
31a7e14dcfSSatish Balay   PetscFunctionReturn(0);
32a7e14dcfSSatish Balay }
33a7e14dcfSSatish Balay 
34a7e14dcfSSatish Balay #undef __FUNCT__
35a7e14dcfSSatish Balay #define __FUNCT__ "destroy_grad_list"
36a7e14dcfSSatish Balay static PetscErrorCode destroy_grad_list(Vec_Chain *head)
37a7e14dcfSSatish Balay {
38a7e14dcfSSatish Balay   PetscErrorCode ierr;
39a7e14dcfSSatish Balay   Vec_Chain      *p = head->next, *q;
40a7e14dcfSSatish Balay 
41a7e14dcfSSatish Balay   PetscFunctionBegin;
42a7e14dcfSSatish Balay   while(p) {
43a7e14dcfSSatish Balay     q = p->next;
44a7e14dcfSSatish Balay     ierr = VecDestroy(&p->V);CHKERRQ(ierr);
45a7e14dcfSSatish Balay     ierr = PetscFree(p);CHKERRQ(ierr);
46a7e14dcfSSatish Balay     p = q;
47a7e14dcfSSatish Balay   }
486c23d075SBarry Smith   head->next = NULL;
49a7e14dcfSSatish Balay   PetscFunctionReturn(0);
50a7e14dcfSSatish Balay }
51a7e14dcfSSatish Balay 
52a7e14dcfSSatish Balay 
53a7e14dcfSSatish Balay #undef __FUNCT__
54a7e14dcfSSatish Balay #define __FUNCT__ "TaoSolve_BMRM"
55441846f8SBarry Smith static PetscErrorCode TaoSolve_BMRM(Tao tao)
56a7e14dcfSSatish Balay {
57a7e14dcfSSatish Balay   PetscErrorCode     ierr;
58e4cb33bbSBarry Smith   TaoConvergedReason reason;
59a7e14dcfSSatish Balay   TAO_DF             df;
60a7e14dcfSSatish Balay   TAO_BMRM           *bmrm = (TAO_BMRM*)tao->data;
61a7e14dcfSSatish Balay 
62a7e14dcfSSatish Balay   /* Values and pointers to parts of the optimization problem */
63a7e14dcfSSatish Balay   PetscReal          f = 0.0;
64a7e14dcfSSatish Balay   Vec                W = tao->solution;
65a7e14dcfSSatish Balay   Vec                G = tao->gradient;
66a7e14dcfSSatish Balay   PetscReal          lambda;
67a7e14dcfSSatish Balay   PetscReal          bt;
68a7e14dcfSSatish Balay   Vec_Chain          grad_list, *tail_glist, *pgrad;
69a7e14dcfSSatish Balay   PetscInt           i;
70a7e14dcfSSatish Balay   PetscMPIInt        rank;
71a7e14dcfSSatish Balay 
72e4cb33bbSBarry Smith   /* Used in converged criteria check */
73a7e14dcfSSatish Balay   PetscReal          reg;
74a7e14dcfSSatish Balay   PetscReal          jtwt, max_jtwt, pre_epsilon, epsilon, jw, min_jw;
75a7e14dcfSSatish Balay   PetscReal          innerSolverTol;
76ba4b436cSBarry Smith   MPI_Comm           comm;
77a7e14dcfSSatish Balay 
78a7e14dcfSSatish Balay   PetscFunctionBegin;
79ba4b436cSBarry Smith   ierr = PetscObjectGetComm((PetscObject)tao,&comm);CHKERRQ(ierr);
80ba4b436cSBarry Smith   ierr = MPI_Comm_rank(comm, &rank);CHKERRQ(ierr);
81a7e14dcfSSatish Balay   lambda = bmrm->lambda;
82a7e14dcfSSatish Balay 
83a7e14dcfSSatish Balay   /* Check Stopping Condition */
84a7e14dcfSSatish Balay   tao->step = 1.0;
85a7e14dcfSSatish Balay   max_jtwt = -BMRM_INFTY;
86a7e14dcfSSatish Balay   min_jw = BMRM_INFTY;
87a7e14dcfSSatish Balay   innerSolverTol = 1.0;
88a7e14dcfSSatish Balay   epsilon = 0.0;
89a7e14dcfSSatish Balay 
900e660641SBarry Smith   if (!rank) {
91a7e14dcfSSatish Balay     ierr = init_df_solver(&df);CHKERRQ(ierr);
92a7e14dcfSSatish Balay     grad_list.next = NULL;
93a7e14dcfSSatish Balay     tail_glist = &grad_list;
94a7e14dcfSSatish Balay   }
95a7e14dcfSSatish Balay 
96a7e14dcfSSatish Balay   df.tol = 1e-6;
97a7e14dcfSSatish Balay   reason = TAO_CONTINUE_ITERATING;
98a7e14dcfSSatish Balay 
99a7e14dcfSSatish Balay   /*-----------------Algorithm Begins------------------------*/
100a7e14dcfSSatish Balay   /* make the scatter */
101a7e14dcfSSatish Balay   ierr = VecScatterCreateToZero(W, &bmrm->scatter, &bmrm->local_w);CHKERRQ(ierr);
102a7e14dcfSSatish Balay   ierr = VecAssemblyBegin(bmrm->local_w);CHKERRQ(ierr);
103a7e14dcfSSatish Balay   ierr = VecAssemblyEnd(bmrm->local_w);CHKERRQ(ierr);
104a7e14dcfSSatish Balay 
105a7e14dcfSSatish Balay   /* NOTE: In application pass the sub-gradient of Remp(W) */
106a7e14dcfSSatish Balay   ierr = TaoComputeObjectiveAndGradient(tao, W, &f, G);CHKERRQ(ierr);
1078931d482SJason Sarich   ierr = TaoMonitor(tao,tao->niter,f,1.0,0.0,tao->step,&reason);CHKERRQ(ierr);
108a7e14dcfSSatish Balay   while (reason == TAO_CONTINUE_ITERATING) {
109a7e14dcfSSatish Balay     /* compute bt = Remp(Wt-1) - <Wt-1, At> */
110a7e14dcfSSatish Balay     ierr = VecDot(W, G, &bt);CHKERRQ(ierr);
111a7e14dcfSSatish Balay     bt = f - bt;
112a7e14dcfSSatish Balay 
113a7e14dcfSSatish Balay     /* First gather the gradient to the master node */
114a7e14dcfSSatish Balay     ierr = VecScatterBegin(bmrm->scatter, G, bmrm->local_w, INSERT_VALUES, SCATTER_FORWARD);CHKERRQ(ierr);
115a7e14dcfSSatish Balay     ierr = VecScatterEnd(bmrm->scatter, G, bmrm->local_w, INSERT_VALUES, SCATTER_FORWARD);CHKERRQ(ierr);
116a7e14dcfSSatish Balay 
117a7e14dcfSSatish Balay     /* Bring up the inner solver */
1180e660641SBarry Smith     if (!rank) {
1198931d482SJason Sarich       ierr = ensure_df_space(tao->niter+1, &df);CHKERRQ(ierr);
120a7e14dcfSSatish Balay       ierr = make_grad_node(bmrm->local_w, &pgrad);CHKERRQ(ierr);
121a7e14dcfSSatish Balay       tail_glist->next = pgrad;
122a7e14dcfSSatish Balay       tail_glist = pgrad;
123a7e14dcfSSatish Balay 
1248931d482SJason Sarich       df.a[tao->niter] = 1.0;
1258931d482SJason Sarich       df.f[tao->niter] = -bt;
1268931d482SJason Sarich       df.u[tao->niter] = 1.0;
1278931d482SJason Sarich       df.l[tao->niter] = 0.0;
128a7e14dcfSSatish Balay 
129a7e14dcfSSatish Balay       /* set up the Q */
130a7e14dcfSSatish Balay       pgrad = grad_list.next;
1318931d482SJason Sarich       for (i=0; i<=tao->niter; i++) {
132*2a808120SBarry Smith         if (!pgrad) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Assert that there are at least tao->niter+1 pgrad available");
133a7e14dcfSSatish Balay         ierr = VecDot(pgrad->V, bmrm->local_w, &reg);CHKERRQ(ierr);
1348931d482SJason Sarich         df.Q[i][tao->niter] = df.Q[tao->niter][i] = reg / lambda;
135a7e14dcfSSatish Balay         pgrad = pgrad->next;
136a7e14dcfSSatish Balay       }
137a7e14dcfSSatish Balay 
1388931d482SJason Sarich       if (tao->niter > 0) {
1398931d482SJason Sarich         df.x[tao->niter] = 0.0;
140a7e14dcfSSatish Balay         ierr = solve(&df);CHKERRQ(ierr);
1410e660641SBarry Smith       } else
142a7e14dcfSSatish Balay         df.x[0] = 1.0;
143a7e14dcfSSatish Balay 
144a7e14dcfSSatish Balay       /* now computing Jt*(alpha_t) which should be = Jt(wt) to check convergence */
145a7e14dcfSSatish Balay       jtwt = 0.0;
146a7e14dcfSSatish Balay       ierr = VecSet(bmrm->local_w, 0.0);CHKERRQ(ierr);
147a7e14dcfSSatish Balay       pgrad = grad_list.next;
1488931d482SJason Sarich       for (i=0; i<=tao->niter; i++) {
149a7e14dcfSSatish Balay         jtwt -= df.x[i] * df.f[i];
150a7e14dcfSSatish Balay         ierr = VecAXPY(bmrm->local_w, -df.x[i] / lambda, pgrad->V);CHKERRQ(ierr);
151a7e14dcfSSatish Balay         pgrad = pgrad->next;
152a7e14dcfSSatish Balay       }
153a7e14dcfSSatish Balay 
154a7e14dcfSSatish Balay       ierr = VecNorm(bmrm->local_w, NORM_2, &reg);CHKERRQ(ierr);
155a7e14dcfSSatish Balay       reg = 0.5*lambda*reg*reg;
156a7e14dcfSSatish Balay       jtwt -= reg;
157a7e14dcfSSatish Balay     } /* end if rank == 0 */
158a7e14dcfSSatish Balay 
159a7e14dcfSSatish Balay     /* scatter the new W to all nodes */
160a7e14dcfSSatish Balay     ierr = VecScatterBegin(bmrm->scatter,bmrm->local_w,W,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
161a7e14dcfSSatish Balay     ierr = VecScatterEnd(bmrm->scatter,bmrm->local_w,W,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
162a7e14dcfSSatish Balay 
163a7e14dcfSSatish Balay     ierr = TaoComputeObjectiveAndGradient(tao, W, &f, G);CHKERRQ(ierr);
164a7e14dcfSSatish Balay 
165ba4b436cSBarry Smith     ierr = MPI_Bcast(&jtwt,1,MPIU_REAL,0,comm);CHKERRQ(ierr);
166ba4b436cSBarry Smith     ierr = MPI_Bcast(&reg,1,MPIU_REAL,0,comm);CHKERRQ(ierr);
167a7e14dcfSSatish Balay 
168a7e14dcfSSatish Balay     jw = reg + f;                                       /* J(w) = regularizer + Remp(w) */
1690e660641SBarry Smith     if (jw < min_jw) min_jw = jw;
1700e660641SBarry Smith     if (jtwt > max_jtwt) max_jtwt = jtwt;
171a7e14dcfSSatish Balay 
172a7e14dcfSSatish Balay     pre_epsilon = epsilon;
173a7e14dcfSSatish Balay     epsilon = min_jw - jtwt;
174a7e14dcfSSatish Balay 
1750e660641SBarry Smith     if (!rank) {
1760e660641SBarry Smith       if (innerSolverTol > epsilon) innerSolverTol = epsilon;
1770e660641SBarry Smith       else if (innerSolverTol < 1e-7) innerSolverTol = 1e-7;
178a7e14dcfSSatish Balay 
179a7e14dcfSSatish Balay       /* if the annealing doesn't work well, lower the inner solver tolerance */
1800e660641SBarry Smith       if(pre_epsilon < epsilon) innerSolverTol *= 0.2;
181a7e14dcfSSatish Balay 
182a7e14dcfSSatish Balay       df.tol = innerSolverTol*0.5;
183a7e14dcfSSatish Balay     }
184a7e14dcfSSatish Balay 
1858931d482SJason Sarich     tao->niter++;
1868931d482SJason Sarich     ierr = TaoMonitor(tao,tao->niter,min_jw,epsilon,0.0,tao->step,&reason);CHKERRQ(ierr);
187a7e14dcfSSatish Balay   }
188a7e14dcfSSatish Balay 
189a7e14dcfSSatish Balay   /* free all the memory */
1900e660641SBarry Smith   if (!rank) {
191a7e14dcfSSatish Balay     ierr = destroy_grad_list(&grad_list);CHKERRQ(ierr);
192a7e14dcfSSatish Balay     ierr = destroy_df_solver(&df);CHKERRQ(ierr);
193a7e14dcfSSatish Balay   }
194a7e14dcfSSatish Balay 
195a7e14dcfSSatish Balay   ierr = VecDestroy(&bmrm->local_w);CHKERRQ(ierr);
196a7e14dcfSSatish Balay   ierr = VecScatterDestroy(&bmrm->scatter);CHKERRQ(ierr);
197a7e14dcfSSatish Balay   PetscFunctionReturn(0);
198a7e14dcfSSatish Balay }
199a7e14dcfSSatish Balay 
200a7e14dcfSSatish Balay 
201a7e14dcfSSatish Balay /* ---------------------------------------------------------- */
202a7e14dcfSSatish Balay 
203a7e14dcfSSatish Balay #undef __FUNCT__
204a7e14dcfSSatish Balay #define __FUNCT__ "TaoSetup_BMRM"
205441846f8SBarry Smith static PetscErrorCode TaoSetup_BMRM(Tao tao)
2060e660641SBarry Smith {
207a7e14dcfSSatish Balay 
208a7e14dcfSSatish Balay   PetscErrorCode ierr;
209a7e14dcfSSatish Balay 
210a7e14dcfSSatish Balay   PetscFunctionBegin;
211a7e14dcfSSatish Balay   /* Allocate some arrays */
212a7e14dcfSSatish Balay   if (!tao->gradient) {
213a7e14dcfSSatish Balay     ierr = VecDuplicate(tao->solution, &tao->gradient);CHKERRQ(ierr);
214a7e14dcfSSatish Balay   }
215a7e14dcfSSatish Balay   PetscFunctionReturn(0);
216a7e14dcfSSatish Balay }
217a7e14dcfSSatish Balay 
218a7e14dcfSSatish Balay /*------------------------------------------------------------*/
219a7e14dcfSSatish Balay #undef __FUNCT__
220a7e14dcfSSatish Balay #define __FUNCT__ "TaoDestroy_BMRM"
221441846f8SBarry Smith static PetscErrorCode TaoDestroy_BMRM(Tao tao)
222a7e14dcfSSatish Balay {
223a7e14dcfSSatish Balay   PetscErrorCode ierr;
224a7e14dcfSSatish Balay 
225a7e14dcfSSatish Balay   PetscFunctionBegin;
226a7e14dcfSSatish Balay   ierr = PetscFree(tao->data);CHKERRQ(ierr);
227a7e14dcfSSatish Balay   PetscFunctionReturn(0);
228a7e14dcfSSatish Balay }
229a7e14dcfSSatish Balay 
230a7e14dcfSSatish Balay #undef __FUNCT__
231a7e14dcfSSatish Balay #define __FUNCT__ "TaoSetFromOptions_BMRM"
2324416b707SBarry Smith static PetscErrorCode TaoSetFromOptions_BMRM(PetscOptionItems *PetscOptionsObject,Tao tao)
233a7e14dcfSSatish Balay {
234a7e14dcfSSatish Balay   PetscErrorCode ierr;
235a7e14dcfSSatish Balay   TAO_BMRM*      bmrm = (TAO_BMRM*)tao->data;
236a7e14dcfSSatish Balay 
237a7e14dcfSSatish Balay   PetscFunctionBegin;
2381a1499c8SBarry Smith   ierr = PetscOptionsHead(PetscOptionsObject,"BMRM for regularized risk minimization");CHKERRQ(ierr);
23994ae4db5SBarry Smith   ierr = PetscOptionsReal("-tao_bmrm_lambda", "regulariser weight","", 100,&bmrm->lambda,NULL);CHKERRQ(ierr);
240a7e14dcfSSatish Balay   ierr = PetscOptionsTail();CHKERRQ(ierr);
241a7e14dcfSSatish Balay   PetscFunctionReturn(0);
242a7e14dcfSSatish Balay }
243a7e14dcfSSatish Balay 
244a7e14dcfSSatish Balay /*------------------------------------------------------------*/
245a7e14dcfSSatish Balay #undef __FUNCT__
246a7e14dcfSSatish Balay #define __FUNCT__ "TaoView_BMRM"
247441846f8SBarry Smith static PetscErrorCode TaoView_BMRM(Tao tao, PetscViewer viewer)
248a7e14dcfSSatish Balay {
249a7e14dcfSSatish Balay   PetscBool      isascii;
250a7e14dcfSSatish Balay   PetscErrorCode ierr;
251a7e14dcfSSatish Balay 
252a7e14dcfSSatish Balay   PetscFunctionBegin;
253a7e14dcfSSatish Balay   ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&isascii);CHKERRQ(ierr);
254a7e14dcfSSatish Balay   if (isascii) {
255a7e14dcfSSatish Balay     ierr = PetscViewerASCIIPushTab(viewer);CHKERRQ(ierr);
256a7e14dcfSSatish Balay     ierr = PetscViewerASCIIPopTab(viewer);CHKERRQ(ierr);
257a7e14dcfSSatish Balay   }
258a7e14dcfSSatish Balay   PetscFunctionReturn(0);
259a7e14dcfSSatish Balay }
260a7e14dcfSSatish Balay 
261a7e14dcfSSatish Balay /*------------------------------------------------------------*/
/*MC
  TAOBMRM - bundle method for regularized risk minimization

  Options Database Keys:
. -tao_bmrm_lambda - regulariser weight

  Level: beginner
M*/
2701522df2eSJason Sarich 
271a7e14dcfSSatish Balay #undef __FUNCT__
272a7e14dcfSSatish Balay #define __FUNCT__ "TaoCreate_BMRM"
273728e0ed0SBarry Smith PETSC_EXTERN PetscErrorCode TaoCreate_BMRM(Tao tao)
274a7e14dcfSSatish Balay {
275a7e14dcfSSatish Balay   TAO_BMRM       *bmrm;
276a7e14dcfSSatish Balay   PetscErrorCode ierr;
277a7e14dcfSSatish Balay 
278a7e14dcfSSatish Balay   PetscFunctionBegin;
279a7e14dcfSSatish Balay   tao->ops->setup = TaoSetup_BMRM;
280a7e14dcfSSatish Balay   tao->ops->solve = TaoSolve_BMRM;
281a7e14dcfSSatish Balay   tao->ops->view  = TaoView_BMRM;
282a7e14dcfSSatish Balay   tao->ops->setfromoptions = TaoSetFromOptions_BMRM;
283a7e14dcfSSatish Balay   tao->ops->destroy = TaoDestroy_BMRM;
284a7e14dcfSSatish Balay 
2853c9e27cfSGeoffrey Irving   ierr = PetscNewLog(tao,&bmrm);CHKERRQ(ierr);
286a7e14dcfSSatish Balay   bmrm->lambda = 1.0;
287a7e14dcfSSatish Balay   tao->data = (void*)bmrm;
288a7e14dcfSSatish Balay 
2896552cf8aSJason Sarich   /* Override default settings (unless already changed) */
2906552cf8aSJason Sarich   if (!tao->max_it_changed) tao->max_it = 2000;
2916552cf8aSJason Sarich   if (!tao->max_funcs_changed) tao->max_funcs = 4000;
2926552cf8aSJason Sarich   if (!tao->gatol_changed) tao->gatol = 1.0e-12;
2936552cf8aSJason Sarich   if (!tao->grtol_changed) tao->grtol = 1.0e-12;
294a7e14dcfSSatish Balay 
295a7e14dcfSSatish Balay   PetscFunctionReturn(0);
296a7e14dcfSSatish Balay }
297a7e14dcfSSatish Balay 
298a7e14dcfSSatish Balay #undef __FUNCT__
299a7e14dcfSSatish Balay #define __FUNCT__ "init_df_solver"
300a7e14dcfSSatish Balay PetscErrorCode init_df_solver(TAO_DF *df)
301a7e14dcfSSatish Balay {
302a7e14dcfSSatish Balay   PetscInt       i, n = INCRE_DIM;
303a7e14dcfSSatish Balay   PetscErrorCode ierr;
304a7e14dcfSSatish Balay 
305a7e14dcfSSatish Balay   PetscFunctionBegin;
306a7e14dcfSSatish Balay   /* default values */
307a7e14dcfSSatish Balay   df->maxProjIter = 200;
308a7e14dcfSSatish Balay   df->maxPGMIter = 300000;
309a7e14dcfSSatish Balay   df->b = 1.0;
310a7e14dcfSSatish Balay 
311a7e14dcfSSatish Balay   /* memory space required by Dai-Fletcher */
312a7e14dcfSSatish Balay   df->cur_num_cp = n;
3130e660641SBarry Smith   ierr = PetscMalloc1(n, &df->f);CHKERRQ(ierr);
3140e660641SBarry Smith   ierr = PetscMalloc1(n, &df->a);CHKERRQ(ierr);
3150e660641SBarry Smith   ierr = PetscMalloc1(n, &df->l);CHKERRQ(ierr);
3160e660641SBarry Smith   ierr = PetscMalloc1(n, &df->u);CHKERRQ(ierr);
3170e660641SBarry Smith   ierr = PetscMalloc1(n, &df->x);CHKERRQ(ierr);
318e1cc520bSBarry Smith   ierr = PetscMalloc1(n, &df->Q);CHKERRQ(ierr);
319a7e14dcfSSatish Balay 
320a7e14dcfSSatish Balay   for (i = 0; i < n; i ++) {
3210e660641SBarry Smith     ierr = PetscMalloc1(n, &df->Q[i]);CHKERRQ(ierr);
322a7e14dcfSSatish Balay   }
323a7e14dcfSSatish Balay 
3240e660641SBarry Smith   ierr = PetscMalloc1(n, &df->g);CHKERRQ(ierr);
3250e660641SBarry Smith   ierr = PetscMalloc1(n, &df->y);CHKERRQ(ierr);
3260e660641SBarry Smith   ierr = PetscMalloc1(n, &df->tempv);CHKERRQ(ierr);
3270e660641SBarry Smith   ierr = PetscMalloc1(n, &df->d);CHKERRQ(ierr);
3280e660641SBarry Smith   ierr = PetscMalloc1(n, &df->Qd);CHKERRQ(ierr);
3290e660641SBarry Smith   ierr = PetscMalloc1(n, &df->t);CHKERRQ(ierr);
3300e660641SBarry Smith   ierr = PetscMalloc1(n, &df->xplus);CHKERRQ(ierr);
3310e660641SBarry Smith   ierr = PetscMalloc1(n, &df->tplus);CHKERRQ(ierr);
3320e660641SBarry Smith   ierr = PetscMalloc1(n, &df->sk);CHKERRQ(ierr);
3330e660641SBarry Smith   ierr = PetscMalloc1(n, &df->yk);CHKERRQ(ierr);
334a7e14dcfSSatish Balay 
335e1cc520bSBarry Smith   ierr = PetscMalloc1(n, &df->ipt);CHKERRQ(ierr);
336e1cc520bSBarry Smith   ierr = PetscMalloc1(n, &df->ipt2);CHKERRQ(ierr);
337e1cc520bSBarry Smith   ierr = PetscMalloc1(n, &df->uv);CHKERRQ(ierr);
338a7e14dcfSSatish Balay   PetscFunctionReturn(0);
339a7e14dcfSSatish Balay }
340a7e14dcfSSatish Balay 
341a7e14dcfSSatish Balay #undef __FUNCT__
342a7e14dcfSSatish Balay #define __FUNCT__ "ensure_df_space"
343a7e14dcfSSatish Balay PetscErrorCode ensure_df_space(PetscInt dim, TAO_DF *df)
344a7e14dcfSSatish Balay {
345a7e14dcfSSatish Balay   PetscErrorCode ierr;
346a7e14dcfSSatish Balay   PetscReal      *tmp, **tmp_Q;
347a7e14dcfSSatish Balay   PetscInt       i, n, old_n;
348a7e14dcfSSatish Balay 
349a7e14dcfSSatish Balay   PetscFunctionBegin;
35053506e15SBarry Smith   df->dim = dim;
35153506e15SBarry Smith   if (dim <= df->cur_num_cp) PetscFunctionReturn(0);
352a7e14dcfSSatish Balay 
353a7e14dcfSSatish Balay   old_n = df->cur_num_cp;
354a7e14dcfSSatish Balay   df->cur_num_cp += INCRE_DIM;
355a7e14dcfSSatish Balay   n = df->cur_num_cp;
356a7e14dcfSSatish Balay 
357a7e14dcfSSatish Balay   /* memory space required by dai-fletcher */
3580e660641SBarry Smith   ierr = PetscMalloc1(n, &tmp);CHKERRQ(ierr);
359a7e14dcfSSatish Balay   ierr = PetscMemcpy(tmp, df->f, sizeof(PetscReal)*old_n);CHKERRQ(ierr);
360a7e14dcfSSatish Balay   ierr = PetscFree(df->f);CHKERRQ(ierr);
361a7e14dcfSSatish Balay   df->f = tmp;
362a7e14dcfSSatish Balay 
3630e660641SBarry Smith   ierr = PetscMalloc1(n, &tmp);CHKERRQ(ierr);
364a7e14dcfSSatish Balay   ierr = PetscMemcpy(tmp, df->a, sizeof(PetscReal)*old_n);CHKERRQ(ierr);
365a7e14dcfSSatish Balay   ierr = PetscFree(df->a);CHKERRQ(ierr);
366a7e14dcfSSatish Balay   df->a = tmp;
367a7e14dcfSSatish Balay 
3680e660641SBarry Smith   ierr = PetscMalloc1(n, &tmp);CHKERRQ(ierr);
369a7e14dcfSSatish Balay   ierr = PetscMemcpy(tmp, df->l, sizeof(PetscReal)*old_n);CHKERRQ(ierr);
370a7e14dcfSSatish Balay   ierr = PetscFree(df->l);CHKERRQ(ierr);
371a7e14dcfSSatish Balay   df->l = tmp;
372a7e14dcfSSatish Balay 
3730e660641SBarry Smith   ierr = PetscMalloc1(n, &tmp);CHKERRQ(ierr);
374a7e14dcfSSatish Balay   ierr = PetscMemcpy(tmp, df->u, sizeof(PetscReal)*old_n);CHKERRQ(ierr);
375a7e14dcfSSatish Balay   ierr = PetscFree(df->u);CHKERRQ(ierr);
376a7e14dcfSSatish Balay   df->u = tmp;
377a7e14dcfSSatish Balay 
3780e660641SBarry Smith   ierr = PetscMalloc1(n, &tmp);CHKERRQ(ierr);
379a7e14dcfSSatish Balay   ierr = PetscMemcpy(tmp, df->x, sizeof(PetscReal)*old_n);CHKERRQ(ierr);
380a7e14dcfSSatish Balay   ierr = PetscFree(df->x);CHKERRQ(ierr);
381a7e14dcfSSatish Balay   df->x = tmp;
382a7e14dcfSSatish Balay 
383e1cc520bSBarry Smith   ierr = PetscMalloc1(n, &tmp_Q);CHKERRQ(ierr);
38453506e15SBarry Smith   for (i = 0; i < n; i ++) {
3850e660641SBarry Smith     ierr = PetscMalloc1(n, &tmp_Q[i]);CHKERRQ(ierr);
38653506e15SBarry Smith     if (i < old_n) {
387a7e14dcfSSatish Balay       ierr = PetscMemcpy(tmp_Q[i], df->Q[i], sizeof(PetscReal)*old_n);CHKERRQ(ierr);
388a7e14dcfSSatish Balay       ierr = PetscFree(df->Q[i]);CHKERRQ(ierr);
389a7e14dcfSSatish Balay     }
390a7e14dcfSSatish Balay   }
391a7e14dcfSSatish Balay 
392a7e14dcfSSatish Balay   ierr = PetscFree(df->Q);CHKERRQ(ierr);
393a7e14dcfSSatish Balay   df->Q = tmp_Q;
394a7e14dcfSSatish Balay 
395a7e14dcfSSatish Balay   ierr = PetscFree(df->g);CHKERRQ(ierr);
3960e660641SBarry Smith   ierr = PetscMalloc1(n, &df->g);CHKERRQ(ierr);
397a7e14dcfSSatish Balay 
398a7e14dcfSSatish Balay   ierr = PetscFree(df->y);CHKERRQ(ierr);
3990e660641SBarry Smith   ierr = PetscMalloc1(n, &df->y);CHKERRQ(ierr);
400a7e14dcfSSatish Balay 
401a7e14dcfSSatish Balay   ierr = PetscFree(df->tempv);CHKERRQ(ierr);
4020e660641SBarry Smith   ierr = PetscMalloc1(n, &df->tempv);CHKERRQ(ierr);
403a7e14dcfSSatish Balay 
404a7e14dcfSSatish Balay   ierr = PetscFree(df->d);CHKERRQ(ierr);
4050e660641SBarry Smith   ierr = PetscMalloc1(n, &df->d);CHKERRQ(ierr);
406a7e14dcfSSatish Balay 
407a7e14dcfSSatish Balay   ierr = PetscFree(df->Qd);CHKERRQ(ierr);
4080e660641SBarry Smith   ierr = PetscMalloc1(n, &df->Qd);CHKERRQ(ierr);
409a7e14dcfSSatish Balay 
410a7e14dcfSSatish Balay   ierr = PetscFree(df->t);CHKERRQ(ierr);
4110e660641SBarry Smith   ierr = PetscMalloc1(n, &df->t);CHKERRQ(ierr);
412a7e14dcfSSatish Balay 
413a7e14dcfSSatish Balay   ierr = PetscFree(df->xplus);CHKERRQ(ierr);
4140e660641SBarry Smith   ierr = PetscMalloc1(n, &df->xplus);CHKERRQ(ierr);
415a7e14dcfSSatish Balay 
416a7e14dcfSSatish Balay   ierr = PetscFree(df->tplus);CHKERRQ(ierr);
4170e660641SBarry Smith   ierr = PetscMalloc1(n, &df->tplus);CHKERRQ(ierr);
418a7e14dcfSSatish Balay 
419a7e14dcfSSatish Balay   ierr = PetscFree(df->sk);CHKERRQ(ierr);
4200e660641SBarry Smith   ierr = PetscMalloc1(n, &df->sk);CHKERRQ(ierr);
421a7e14dcfSSatish Balay 
422a7e14dcfSSatish Balay   ierr = PetscFree(df->yk);CHKERRQ(ierr);
4230e660641SBarry Smith   ierr = PetscMalloc1(n, &df->yk);CHKERRQ(ierr);
424a7e14dcfSSatish Balay 
425a7e14dcfSSatish Balay   ierr = PetscFree(df->ipt);CHKERRQ(ierr);
426e1cc520bSBarry Smith   ierr = PetscMalloc1(n, &df->ipt);CHKERRQ(ierr);
427a7e14dcfSSatish Balay 
428a7e14dcfSSatish Balay   ierr = PetscFree(df->ipt2);CHKERRQ(ierr);
4290e660641SBarry Smith   ierr = PetscMalloc1(n, &df->ipt2);CHKERRQ(ierr);
430a7e14dcfSSatish Balay 
431a7e14dcfSSatish Balay   ierr = PetscFree(df->uv);CHKERRQ(ierr);
4320e660641SBarry Smith   ierr = PetscMalloc1(n, &df->uv);CHKERRQ(ierr);
433a7e14dcfSSatish Balay   PetscFunctionReturn(0);
434a7e14dcfSSatish Balay }
435a7e14dcfSSatish Balay 
436a7e14dcfSSatish Balay #undef __FUNCT__
437a7e14dcfSSatish Balay #define __FUNCT__ "destroy_df_solver"
438a7e14dcfSSatish Balay PetscErrorCode destroy_df_solver(TAO_DF *df)
439a7e14dcfSSatish Balay {
440a7e14dcfSSatish Balay   PetscErrorCode ierr;
441a7e14dcfSSatish Balay   PetscInt       i;
4426c23d075SBarry Smith 
443a7e14dcfSSatish Balay   PetscFunctionBegin;
4446c23d075SBarry Smith   ierr = PetscFree(df->f);CHKERRQ(ierr);
4456c23d075SBarry Smith   ierr = PetscFree(df->a);CHKERRQ(ierr);
4466c23d075SBarry Smith   ierr = PetscFree(df->l);CHKERRQ(ierr);
4476c23d075SBarry Smith   ierr = PetscFree(df->u);CHKERRQ(ierr);
4486c23d075SBarry Smith   ierr = PetscFree(df->x);CHKERRQ(ierr);
449a7e14dcfSSatish Balay 
4506c23d075SBarry Smith   for (i = 0; i < df->cur_num_cp; i ++) {
451a7e14dcfSSatish Balay     ierr = PetscFree(df->Q[i]);CHKERRQ(ierr);
452a7e14dcfSSatish Balay   }
453a7e14dcfSSatish Balay   ierr = PetscFree(df->Q);CHKERRQ(ierr);
4546c23d075SBarry Smith   ierr = PetscFree(df->ipt);CHKERRQ(ierr);
4556c23d075SBarry Smith   ierr = PetscFree(df->ipt2);CHKERRQ(ierr);
4566c23d075SBarry Smith   ierr = PetscFree(df->uv);CHKERRQ(ierr);
4576c23d075SBarry Smith   ierr = PetscFree(df->g);CHKERRQ(ierr);
4586c23d075SBarry Smith   ierr = PetscFree(df->y);CHKERRQ(ierr);
4596c23d075SBarry Smith   ierr = PetscFree(df->tempv);CHKERRQ(ierr);
4606c23d075SBarry Smith   ierr = PetscFree(df->d);CHKERRQ(ierr);
4616c23d075SBarry Smith   ierr = PetscFree(df->Qd);CHKERRQ(ierr);
4626c23d075SBarry Smith   ierr = PetscFree(df->t);CHKERRQ(ierr);
4636c23d075SBarry Smith   ierr = PetscFree(df->xplus);CHKERRQ(ierr);
4646c23d075SBarry Smith   ierr = PetscFree(df->tplus);CHKERRQ(ierr);
4656c23d075SBarry Smith   ierr = PetscFree(df->sk);CHKERRQ(ierr);
4666c23d075SBarry Smith   ierr = PetscFree(df->yk);CHKERRQ(ierr);
467a7e14dcfSSatish Balay   PetscFunctionReturn(0);
468a7e14dcfSSatish Balay }
469a7e14dcfSSatish Balay 
470a7e14dcfSSatish Balay /* Piecewise linear monotone target function for the Dai-Fletcher projector */
471a7e14dcfSSatish Balay #undef __FUNCT__
472a7e14dcfSSatish Balay #define __FUNCT__ "phi"
4736c23d075SBarry Smith PetscReal phi(PetscReal *x,PetscInt n,PetscReal lambda,PetscReal *a,PetscReal b,PetscReal *c,PetscReal *l,PetscReal *u)
474a7e14dcfSSatish Balay {
475a7e14dcfSSatish Balay   PetscReal r = 0.0;
476a7e14dcfSSatish Balay   PetscInt  i;
477a7e14dcfSSatish Balay 
478a7e14dcfSSatish Balay   for (i = 0; i < n; i++){
479a7e14dcfSSatish Balay     x[i] = -c[i] + lambda*a[i];
4806c23d075SBarry Smith     if (x[i] > u[i])     x[i] = u[i];
4816c23d075SBarry Smith     else if(x[i] < l[i]) x[i] = l[i];
482a7e14dcfSSatish Balay     r += a[i]*x[i];
483a7e14dcfSSatish Balay   }
484a7e14dcfSSatish Balay   return r - b;
485a7e14dcfSSatish Balay }
486a7e14dcfSSatish Balay 
/** Modified Dai-Fletcher QP projector solves the problem:
 *
 *      minimise  0.5*x'*x + c'*x
 *      subj to   a'*x = b
 *                l \leq x \leq u
 *
 *  \param c The negative of the point to be projected onto the feasible set
 *           (the unconstrained minimiser of the objective above is x = -c)
 */
495a7e14dcfSSatish Balay #undef __FUNCT__
496a7e14dcfSSatish Balay #define __FUNCT__ "project"
4976c23d075SBarry Smith PetscInt project(PetscInt n,PetscReal *a,PetscReal b,PetscReal *c,PetscReal *l,PetscReal *u,PetscReal *x,PetscReal *lam_ext,TAO_DF *df)
498a7e14dcfSSatish Balay {
499a7e14dcfSSatish Balay   PetscReal      lambda, lambdal, lambdau, dlambda, lambda_new;
500a7e14dcfSSatish Balay   PetscReal      r, rl, ru, s;
501a7e14dcfSSatish Balay   PetscInt       innerIter;
502a7e14dcfSSatish Balay   PetscBool      nonNegativeSlack = PETSC_FALSE;
50353506e15SBarry Smith   PetscErrorCode ierr;
504a7e14dcfSSatish Balay 
505a7e14dcfSSatish Balay   *lam_ext = 0;
506a7e14dcfSSatish Balay   lambda  = 0;
507a7e14dcfSSatish Balay   dlambda = 0.5;
508a7e14dcfSSatish Balay   innerIter = 1;
509a7e14dcfSSatish Balay 
510a7e14dcfSSatish Balay   /*  \phi(x;lambda) := 0.5*x'*x + c'*x - lambda*(a'*x-b)
511a7e14dcfSSatish Balay    *
512a7e14dcfSSatish Balay    *  Optimality conditions for \phi:
513a7e14dcfSSatish Balay    *
514a7e14dcfSSatish Balay    *  1. lambda   <= 0
515a7e14dcfSSatish Balay    *  2. r        <= 0
516a7e14dcfSSatish Balay    *  3. r*lambda == 0
517a7e14dcfSSatish Balay    */
518a7e14dcfSSatish Balay 
519a7e14dcfSSatish Balay   /* Bracketing Phase */
520a7e14dcfSSatish Balay   r = phi(x, n, lambda, a, b, c, l, u);
521a7e14dcfSSatish Balay 
5226c23d075SBarry Smith   if(nonNegativeSlack) {
523a7e14dcfSSatish Balay     /* inequality constraint, i.e., with \xi >= 0 constraint */
52453506e15SBarry Smith     if (r < TOL_R) return 0;
5256c23d075SBarry Smith   } else  {
526a7e14dcfSSatish Balay     /* equality constraint ,i.e., without \xi >= 0 constraint */
52753506e15SBarry Smith     if (fabs(r) < TOL_R) return 0;
528a7e14dcfSSatish Balay   }
529a7e14dcfSSatish Balay 
530a7e14dcfSSatish Balay   if (r < 0.0){
531a7e14dcfSSatish Balay     lambdal = lambda;
532a7e14dcfSSatish Balay     rl      = r;
533a7e14dcfSSatish Balay     lambda  = lambda + dlambda;
534a7e14dcfSSatish Balay     r       = phi(x, n, lambda, a, b, c, l, u);
535a7e14dcfSSatish Balay     while (r < 0.0 && dlambda < BMRM_INFTY)  {
536a7e14dcfSSatish Balay       lambdal = lambda;
537a7e14dcfSSatish Balay       s       = rl/r - 1.0;
538a7e14dcfSSatish Balay       if (s < 0.1) s = 0.1;
539a7e14dcfSSatish Balay       dlambda = dlambda + dlambda/s;
540a7e14dcfSSatish Balay       lambda  = lambda + dlambda;
541a7e14dcfSSatish Balay       rl      = r;
542a7e14dcfSSatish Balay       r       = phi(x, n, lambda, a, b, c, l, u);
543a7e14dcfSSatish Balay     }
544a7e14dcfSSatish Balay     lambdau = lambda;
545a7e14dcfSSatish Balay     ru      = r;
5466c23d075SBarry Smith   } else {
547a7e14dcfSSatish Balay     lambdau = lambda;
548a7e14dcfSSatish Balay     ru      = r;
549a7e14dcfSSatish Balay     lambda  = lambda - dlambda;
550a7e14dcfSSatish Balay     r       = phi(x, n, lambda, a, b, c, l, u);
551a7e14dcfSSatish Balay     while (r > 0.0 && dlambda > -BMRM_INFTY) {
552a7e14dcfSSatish Balay       lambdau = lambda;
553a7e14dcfSSatish Balay       s       = ru/r - 1.0;
554a7e14dcfSSatish Balay       if (s < 0.1) s = 0.1;
555a7e14dcfSSatish Balay       dlambda = dlambda + dlambda/s;
556a7e14dcfSSatish Balay       lambda  = lambda - dlambda;
557a7e14dcfSSatish Balay       ru      = r;
558a7e14dcfSSatish Balay       r       = phi(x, n, lambda, a, b, c, l, u);
559a7e14dcfSSatish Balay     }
560a7e14dcfSSatish Balay     lambdal = lambda;
561a7e14dcfSSatish Balay     rl      = r;
562a7e14dcfSSatish Balay   }
563a7e14dcfSSatish Balay 
5646c23d075SBarry Smith   if(fabs(dlambda) > BMRM_INFTY) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"L2N2_DaiFletcherPGM detected Infeasible QP problem!");
565a7e14dcfSSatish Balay 
566a7e14dcfSSatish Balay   if(ru == 0){
567a7e14dcfSSatish Balay     return innerIter;
568a7e14dcfSSatish Balay   }
569a7e14dcfSSatish Balay 
570a7e14dcfSSatish Balay   /* Secant Phase */
571a7e14dcfSSatish Balay   s       = 1.0 - rl/ru;
572a7e14dcfSSatish Balay   dlambda = dlambda/s;
573a7e14dcfSSatish Balay   lambda  = lambdau - dlambda;
574a7e14dcfSSatish Balay   r       = phi(x, n, lambda, a, b, c, l, u);
575a7e14dcfSSatish Balay 
576a7e14dcfSSatish Balay   while (fabs(r) > TOL_R
577a7e14dcfSSatish Balay          && dlambda > TOL_LAM * (1.0 + fabs(lambda))
578a7e14dcfSSatish Balay          && innerIter < df->maxProjIter){
579a7e14dcfSSatish Balay     innerIter++;
580a7e14dcfSSatish Balay     if (r > 0.0){
581a7e14dcfSSatish Balay       if (s <= 2.0){
582a7e14dcfSSatish Balay         lambdau = lambda;
583a7e14dcfSSatish Balay         ru      = r;
584a7e14dcfSSatish Balay         s       = 1.0 - rl/ru;
585a7e14dcfSSatish Balay         dlambda = (lambdau - lambdal) / s;
586a7e14dcfSSatish Balay         lambda  = lambdau - dlambda;
58753506e15SBarry Smith       } else {
588a7e14dcfSSatish Balay         s          = ru/r-1.0;
589a7e14dcfSSatish Balay         if (s < 0.1) s = 0.1;
590a7e14dcfSSatish Balay         dlambda    = (lambdau - lambda) / s;
591a7e14dcfSSatish Balay         lambda_new = 0.75*lambdal + 0.25*lambda;
592a7e14dcfSSatish Balay         if (lambda_new < (lambda - dlambda))
593a7e14dcfSSatish Balay           lambda_new = lambda - dlambda;
594a7e14dcfSSatish Balay         lambdau    = lambda;
595a7e14dcfSSatish Balay         ru         = r;
596a7e14dcfSSatish Balay         lambda     = lambda_new;
597a7e14dcfSSatish Balay         s          = (lambdau - lambdal) / (lambdau - lambda);
598a7e14dcfSSatish Balay       }
59953506e15SBarry Smith     } else {
600a7e14dcfSSatish Balay       if (s >= 2.0){
601a7e14dcfSSatish Balay         lambdal = lambda;
602a7e14dcfSSatish Balay         rl      = r;
603a7e14dcfSSatish Balay         s       = 1.0 - rl/ru;
604a7e14dcfSSatish Balay         dlambda = (lambdau - lambdal) / s;
605a7e14dcfSSatish Balay         lambda  = lambdau - dlambda;
60653506e15SBarry Smith       } else {
607a7e14dcfSSatish Balay         s          = rl/r - 1.0;
608a7e14dcfSSatish Balay         if (s < 0.1) s = 0.1;
609a7e14dcfSSatish Balay         dlambda    = (lambda-lambdal) / s;
610a7e14dcfSSatish Balay         lambda_new = 0.75*lambdau + 0.25*lambda;
611a7e14dcfSSatish Balay         if (lambda_new > (lambda + dlambda))
612a7e14dcfSSatish Balay           lambda_new = lambda + dlambda;
613a7e14dcfSSatish Balay         lambdal    = lambda;
614a7e14dcfSSatish Balay         rl         = r;
615a7e14dcfSSatish Balay         lambda     = lambda_new;
616a7e14dcfSSatish Balay         s          = (lambdau - lambdal) / (lambdau-lambda);
617a7e14dcfSSatish Balay       }
618a7e14dcfSSatish Balay     }
619a7e14dcfSSatish Balay     r = phi(x, n, lambda, a, b, c, l, u);
620a7e14dcfSSatish Balay   }
621a7e14dcfSSatish Balay 
622a7e14dcfSSatish Balay   *lam_ext = lambda;
62353506e15SBarry Smith   if(innerIter >= df->maxProjIter) {
62453506e15SBarry Smith     ierr = PetscPrintf(PETSC_COMM_SELF, "WARNING: DaiFletcher max iterations\n");CHKERRQ(ierr);
62553506e15SBarry Smith   }
626a7e14dcfSSatish Balay   return innerIter;
627a7e14dcfSSatish Balay }
628a7e14dcfSSatish Balay 
629a7e14dcfSSatish Balay 
630a7e14dcfSSatish Balay #undef __FUNCT__
631a7e14dcfSSatish Balay #define __FUNCT__ "solve"
632a7e14dcfSSatish Balay PetscErrorCode solve(TAO_DF *df)
633a7e14dcfSSatish Balay {
634a7e14dcfSSatish Balay   PetscErrorCode ierr;
635a7e14dcfSSatish Balay   PetscInt       i, j, innerIter, it, it2, luv, info, lscount = 0, projcount = 0;
636a7e14dcfSSatish Balay   PetscReal      gd, max, ak, bk, akold, bkold, lamnew, alpha, kktlam=0.0, lam_ext;
637a7e14dcfSSatish Balay   PetscReal      DELTAsv, ProdDELTAsv;
638a7e14dcfSSatish Balay   PetscReal      c, *tempQ;
639a7e14dcfSSatish Balay   PetscReal      *x = df->x, *a = df->a, b = df->b, *l = df->l, *u = df->u, tol = df->tol;
640a7e14dcfSSatish Balay   PetscReal      *tempv = df->tempv, *y = df->y, *g = df->g, *d = df->d, *Qd = df->Qd;
641a7e14dcfSSatish Balay   PetscReal      *xplus = df->xplus, *tplus = df->tplus, *sk = df->sk, *yk = df->yk;
642a7e14dcfSSatish Balay   PetscReal      **Q = df->Q, *f = df->f, *t = df->t;
643a7e14dcfSSatish Balay   PetscInt       dim = df->dim, *ipt = df->ipt, *ipt2 = df->ipt2, *uv = df->uv;
644a7e14dcfSSatish Balay 
645a7e14dcfSSatish Balay   /*** variables for the adaptive nonmonotone linesearch ***/
646a7e14dcfSSatish Balay   PetscInt    L, llast;
647a7e14dcfSSatish Balay   PetscReal   fr, fbest, fv, fc, fv0;
64853506e15SBarry Smith 
649a7e14dcfSSatish Balay   c = BMRM_INFTY;
650a7e14dcfSSatish Balay 
651a7e14dcfSSatish Balay   DELTAsv = EPS_SV;
65253506e15SBarry Smith   if (tol <= 1.0e-5 || dim <= 20) ProdDELTAsv = 0.0F;
65353506e15SBarry Smith   else  ProdDELTAsv = EPS_SV;
654a7e14dcfSSatish Balay 
65553506e15SBarry Smith   for (i = 0; i < dim; i++)  tempv[i] = -x[i];
656a7e14dcfSSatish Balay 
657a7e14dcfSSatish Balay   lam_ext = 0.0;
658a7e14dcfSSatish Balay 
659a7e14dcfSSatish Balay   /* Project the initial solution */
660a7e14dcfSSatish Balay   projcount += project(dim, a, b, tempv, l, u, x, &lam_ext, df);
661a7e14dcfSSatish Balay 
662a7e14dcfSSatish Balay   /* Compute gradient
663a7e14dcfSSatish Balay      g = Q*x + f; */
664a7e14dcfSSatish Balay 
665a7e14dcfSSatish Balay   it = 0;
66653506e15SBarry Smith   for (i = 0; i < dim; i++) {
66753506e15SBarry Smith     if (fabs(x[i]) > ProdDELTAsv) ipt[it++] = i;
66853506e15SBarry Smith   }
669a7e14dcfSSatish Balay 
670a7e14dcfSSatish Balay   ierr = PetscMemzero(t, dim*sizeof(PetscReal));CHKERRQ(ierr);
671a7e14dcfSSatish Balay   for (i = 0; i < it; i++){
672a7e14dcfSSatish Balay     tempQ = Q[ipt[i]];
67353506e15SBarry Smith     for (j = 0; j < dim; j++) t[j] += (tempQ[j]*x[ipt[i]]);
674a7e14dcfSSatish Balay   }
675a7e14dcfSSatish Balay   for (i = 0; i < dim; i++){
676a7e14dcfSSatish Balay     g[i] = t[i] + f[i];
677a7e14dcfSSatish Balay   }
678a7e14dcfSSatish Balay 
679a7e14dcfSSatish Balay 
680a7e14dcfSSatish Balay   /* y = -(x_{k} - g_{k}) */
681a7e14dcfSSatish Balay   for (i = 0; i < dim; i++){
682a7e14dcfSSatish Balay     y[i] = g[i] - x[i];
683a7e14dcfSSatish Balay   }
684a7e14dcfSSatish Balay 
685a7e14dcfSSatish Balay   /* Project x_{k} - g_{k} */
686a7e14dcfSSatish Balay   projcount += project(dim, a, b, y, l, u, tempv, &lam_ext, df);
687a7e14dcfSSatish Balay 
688a7e14dcfSSatish Balay   /* y = P(x_{k} - g_{k}) - x_{k} */
689a7e14dcfSSatish Balay   max = ALPHA_MIN;
690a7e14dcfSSatish Balay   for (i = 0; i < dim; i++){
691a7e14dcfSSatish Balay     y[i] = tempv[i] - x[i];
69253506e15SBarry Smith     if (fabs(y[i]) > max) max = fabs(y[i]);
693a7e14dcfSSatish Balay   }
694a7e14dcfSSatish Balay 
695a7e14dcfSSatish Balay   if (max < tol*1e-3){
696a7e14dcfSSatish Balay     return 0;
697a7e14dcfSSatish Balay   }
698a7e14dcfSSatish Balay 
699a7e14dcfSSatish Balay   alpha = 1.0 / max;
700a7e14dcfSSatish Balay 
701a7e14dcfSSatish Balay   /* fv0 = f(x_{0}). Recall t = Q x_{k}  */
702a7e14dcfSSatish Balay   fv0   = 0.0;
70353506e15SBarry Smith   for (i = 0; i < dim; i++) fv0 += x[i] * (0.5*t[i] + f[i]);
704a7e14dcfSSatish Balay 
705a7e14dcfSSatish Balay   /*** adaptive nonmonotone linesearch ***/
706a7e14dcfSSatish Balay   L     = 2;
707a7e14dcfSSatish Balay   fr    = ALPHA_MAX;
708a7e14dcfSSatish Balay   fbest = fv0;
709a7e14dcfSSatish Balay   fc    = fv0;
710a7e14dcfSSatish Balay   llast = 0;
711a7e14dcfSSatish Balay   akold = bkold = 0.0;
712a7e14dcfSSatish Balay 
713a7e14dcfSSatish Balay   /***      Iterator begins     ***/
714a7e14dcfSSatish Balay   for (innerIter = 1; innerIter <= df->maxPGMIter; innerIter++) {
715a7e14dcfSSatish Balay 
716a7e14dcfSSatish Balay     /* tempv = -(x_{k} - alpha*g_{k}) */
71753506e15SBarry Smith     for (i = 0; i < dim; i++)  tempv[i] = alpha*g[i] - x[i];
718a7e14dcfSSatish Balay 
719a7e14dcfSSatish Balay     /* Project x_{k} - alpha*g_{k} */
720a7e14dcfSSatish Balay     projcount += project(dim, a, b, tempv, l, u, y, &lam_ext, df);
721a7e14dcfSSatish Balay 
722a7e14dcfSSatish Balay 
723a7e14dcfSSatish Balay     /* gd = \inner{d_{k}}{g_{k}}
724a7e14dcfSSatish Balay         d = P(x_{k} - alpha*g_{k}) - x_{k}
725a7e14dcfSSatish Balay     */
726a7e14dcfSSatish Balay     gd = 0.0;
727a7e14dcfSSatish Balay     for (i = 0; i < dim; i++){
728a7e14dcfSSatish Balay       d[i] = y[i] - x[i];
729a7e14dcfSSatish Balay       gd  += d[i] * g[i];
730a7e14dcfSSatish Balay     }
731a7e14dcfSSatish Balay 
732a7e14dcfSSatish Balay     /* Gradient computation  */
733a7e14dcfSSatish Balay 
734a7e14dcfSSatish Balay     /* compute Qd = Q*d  or  Qd = Q*y - t depending on their sparsity */
735a7e14dcfSSatish Balay 
736a7e14dcfSSatish Balay     it = it2 = 0;
73753506e15SBarry Smith     for (i = 0; i < dim; i++){
73853506e15SBarry Smith       if (fabs(d[i]) > (ProdDELTAsv*1.0e-2)) ipt[it++]   = i;
73953506e15SBarry Smith     }
74053506e15SBarry Smith     for (i = 0; i < dim; i++) {
74153506e15SBarry Smith       if (fabs(y[i]) > ProdDELTAsv) ipt2[it2++] = i;
74253506e15SBarry Smith     }
743a7e14dcfSSatish Balay 
744a7e14dcfSSatish Balay     ierr = PetscMemzero(Qd, dim*sizeof(PetscReal));CHKERRQ(ierr);
745a7e14dcfSSatish Balay     /* compute Qd = Q*d */
746a7e14dcfSSatish Balay     if (it < it2){
747a7e14dcfSSatish Balay       for (i = 0; i < it; i++){
748a7e14dcfSSatish Balay         tempQ = Q[ipt[i]];
74953506e15SBarry Smith         for (j = 0; j < dim; j++) Qd[j] += (tempQ[j] * d[ipt[i]]);
750a7e14dcfSSatish Balay       }
75153506e15SBarry Smith     } else { /* compute Qd = Q*y-t */
752a7e14dcfSSatish Balay       for (i = 0; i < it2; i++){
753a7e14dcfSSatish Balay         tempQ = Q[ipt2[i]];
75453506e15SBarry Smith         for (j = 0; j < dim; j++) Qd[j] += (tempQ[j] * y[ipt2[i]]);
755a7e14dcfSSatish Balay       }
75653506e15SBarry Smith       for (j = 0; j < dim; j++) Qd[j] -= t[j];
757a7e14dcfSSatish Balay     }
758a7e14dcfSSatish Balay 
759a7e14dcfSSatish Balay     /* ak = inner{d_{k}}{d_{k}} */
760a7e14dcfSSatish Balay     ak = 0.0;
76153506e15SBarry Smith     for (i = 0; i < dim; i++) ak += d[i] * d[i];
762a7e14dcfSSatish Balay 
763a7e14dcfSSatish Balay     bk = 0.0;
76453506e15SBarry Smith     for (i = 0; i < dim; i++) bk += d[i]*Qd[i];
765a7e14dcfSSatish Balay 
76653506e15SBarry Smith     if (bk > EPS*ak && gd < 0.0)  lamnew = -gd/bk;
76753506e15SBarry Smith     else lamnew = 1.0;
768a7e14dcfSSatish Balay 
769a7e14dcfSSatish Balay     /* fv is computing f(x_{k} + d_{k}) */
770a7e14dcfSSatish Balay     fv = 0.0;
771a7e14dcfSSatish Balay     for (i = 0; i < dim; i++){
772a7e14dcfSSatish Balay       xplus[i] = x[i] + d[i];
773a7e14dcfSSatish Balay       tplus[i] = t[i] + Qd[i];
774a7e14dcfSSatish Balay       fv      += xplus[i] * (0.5*tplus[i] + f[i]);
775a7e14dcfSSatish Balay     }
776a7e14dcfSSatish Balay 
777a7e14dcfSSatish Balay     /* fr is fref */
778a7e14dcfSSatish Balay     if ((innerIter == 1 && fv >= fv0) || (innerIter > 1 && fv >= fr)){
779a7e14dcfSSatish Balay       lscount++;
780a7e14dcfSSatish Balay       fv = 0.0;
781a7e14dcfSSatish Balay       for (i = 0; i < dim; i++){
782a7e14dcfSSatish Balay         xplus[i] = x[i] + lamnew*d[i];
783a7e14dcfSSatish Balay         tplus[i] = t[i] + lamnew*Qd[i];
784a7e14dcfSSatish Balay         fv      += xplus[i] * (0.5*tplus[i] + f[i]);
785a7e14dcfSSatish Balay       }
786a7e14dcfSSatish Balay     }
787a7e14dcfSSatish Balay 
788a7e14dcfSSatish Balay     for (i = 0; i < dim; i++){
789a7e14dcfSSatish Balay       sk[i] = xplus[i] - x[i];
790a7e14dcfSSatish Balay       yk[i] = tplus[i] - t[i];
791a7e14dcfSSatish Balay       x[i]  = xplus[i];
792a7e14dcfSSatish Balay       t[i]  = tplus[i];
793a7e14dcfSSatish Balay       g[i]  = t[i] + f[i];
794a7e14dcfSSatish Balay     }
795a7e14dcfSSatish Balay 
796a7e14dcfSSatish Balay     /* update the line search control parameters */
797a7e14dcfSSatish Balay     if (fv < fbest){
798a7e14dcfSSatish Balay       fbest = fv;
799a7e14dcfSSatish Balay       fc    = fv;
800a7e14dcfSSatish Balay       llast = 0;
80153506e15SBarry Smith     } else {
802a7e14dcfSSatish Balay       fc = (fc > fv ? fc : fv);
803a7e14dcfSSatish Balay       llast++;
804a7e14dcfSSatish Balay       if (llast == L){
805a7e14dcfSSatish Balay         fr    = fc;
806a7e14dcfSSatish Balay         fc    = fv;
807a7e14dcfSSatish Balay         llast = 0;
808a7e14dcfSSatish Balay       }
809a7e14dcfSSatish Balay     }
810a7e14dcfSSatish Balay 
811a7e14dcfSSatish Balay     ak = bk = 0.0;
812a7e14dcfSSatish Balay     for (i = 0; i < dim; i++){
813a7e14dcfSSatish Balay       ak += sk[i] * sk[i];
814a7e14dcfSSatish Balay       bk += sk[i] * yk[i];
815a7e14dcfSSatish Balay     }
816a7e14dcfSSatish Balay 
81753506e15SBarry Smith     if (bk <= EPS*ak) alpha = ALPHA_MAX;
818a7e14dcfSSatish Balay     else {
81953506e15SBarry Smith       if (bkold < EPS*akold) alpha = ak/bk;
82053506e15SBarry Smith       else alpha = (akold+ak)/(bkold+bk);
821a7e14dcfSSatish Balay 
82253506e15SBarry Smith       if (alpha > ALPHA_MAX) alpha = ALPHA_MAX;
82353506e15SBarry Smith       else if (alpha < ALPHA_MIN) alpha = ALPHA_MIN;
824a7e14dcfSSatish Balay     }
825a7e14dcfSSatish Balay 
826a7e14dcfSSatish Balay     akold = ak;
827a7e14dcfSSatish Balay     bkold = bk;
828a7e14dcfSSatish Balay 
829a7e14dcfSSatish Balay     /*** stopping criterion based on KKT conditions ***/
830a7e14dcfSSatish Balay     /* at optimal, gradient of lagrangian w.r.t. x is zero */
831a7e14dcfSSatish Balay 
832a7e14dcfSSatish Balay     bk = 0.0;
83353506e15SBarry Smith     for (i = 0; i < dim; i++) bk +=  x[i] * x[i];
834a7e14dcfSSatish Balay 
83553506e15SBarry Smith     if (PetscSqrtReal(ak) < tol*10 * PetscSqrtReal(bk)){
836a7e14dcfSSatish Balay       it     = 0;
837a7e14dcfSSatish Balay       luv    = 0;
838a7e14dcfSSatish Balay       kktlam = 0.0;
839a7e14dcfSSatish Balay       for (i = 0; i < dim; i++){
840a7e14dcfSSatish Balay         /* x[i] is active hence lagrange multipliers for box constraints
841a7e14dcfSSatish Balay                 are zero. The lagrange multiplier for ineq. const. is then
842a7e14dcfSSatish Balay                 defined as below
843a7e14dcfSSatish Balay         */
844a7e14dcfSSatish Balay         if ((x[i] > DELTAsv) && (x[i] < c-DELTAsv)){
845a7e14dcfSSatish Balay           ipt[it++] = i;
846a7e14dcfSSatish Balay           kktlam    = kktlam - a[i]*g[i];
84753506e15SBarry Smith         } else  uv[luv++] = i;
848a7e14dcfSSatish Balay       }
849a7e14dcfSSatish Balay 
85053506e15SBarry Smith       if (it == 0 && PetscSqrtReal(ak) < tol*0.5 * PetscSqrtReal(bk)) return 0;
851a7e14dcfSSatish Balay       else {
852a7e14dcfSSatish Balay         kktlam = kktlam/it;
853a7e14dcfSSatish Balay         info   = 1;
854a7e14dcfSSatish Balay         for (i = 0; i < it; i++) {
855a7e14dcfSSatish Balay           if (fabs(a[ipt[i]] * g[ipt[i]] + kktlam) > tol) {
856a7e14dcfSSatish Balay             info = 0;
857a7e14dcfSSatish Balay             break;
858a7e14dcfSSatish Balay           }
859a7e14dcfSSatish Balay         }
860a7e14dcfSSatish Balay         if (info == 1)  {
861a7e14dcfSSatish Balay           for (i = 0; i < luv; i++)  {
862a7e14dcfSSatish Balay             if (x[uv[i]] <= DELTAsv){
863a7e14dcfSSatish Balay               /* x[i] == lower bound, hence, lagrange multiplier (say, beta) for lower bound may
864a7e14dcfSSatish Balay                      not be zero. So, the gradient without beta is > 0
865a7e14dcfSSatish Balay               */
866a7e14dcfSSatish Balay               if (g[uv[i]] + kktlam*a[uv[i]] < -tol){
867a7e14dcfSSatish Balay                 info = 0;
868a7e14dcfSSatish Balay                 break;
869a7e14dcfSSatish Balay               }
87053506e15SBarry Smith             } else {
871a7e14dcfSSatish Balay               /* x[i] == upper bound, hence, lagrange multiplier (say, eta) for upper bound may
872a7e14dcfSSatish Balay                      not be zero. So, the gradient without eta is < 0
873a7e14dcfSSatish Balay               */
874a7e14dcfSSatish Balay               if (g[uv[i]] + kktlam*a[uv[i]] > tol) {
875a7e14dcfSSatish Balay                 info = 0;
876a7e14dcfSSatish Balay                 break;
877a7e14dcfSSatish Balay               }
878a7e14dcfSSatish Balay             }
879a7e14dcfSSatish Balay           }
880a7e14dcfSSatish Balay         }
881a7e14dcfSSatish Balay 
88253506e15SBarry Smith         if (info == 1) return 0;
883a7e14dcfSSatish Balay       }
884a7e14dcfSSatish Balay     }
885a7e14dcfSSatish Balay   }
886a7e14dcfSSatish Balay   return 0;
887a7e14dcfSSatish Balay }
888a7e14dcfSSatish Balay 
889a7e14dcfSSatish Balay 
890