xref: /petsc/src/tao/unconstrained/impls/bmrm/bmrm.c (revision 6c23d07575f07c9a033c9cb13c1a90726fd2593a)
1a7e14dcfSSatish Balay #include "bmrm.h"
2a7e14dcfSSatish Balay 
3a7e14dcfSSatish Balay static PetscErrorCode init_df_solver(TAO_DF*);
4a7e14dcfSSatish Balay static PetscErrorCode ensure_df_space(PetscInt, TAO_DF*);
5a7e14dcfSSatish Balay static PetscErrorCode destroy_df_solver(TAO_DF*);
6a7e14dcfSSatish Balay static PetscReal phi(PetscReal*,PetscInt,PetscReal,PetscReal*,
7a7e14dcfSSatish Balay 		     PetscReal,PetscReal*,PetscReal*,PetscReal*);
8a7e14dcfSSatish Balay static PetscInt project(PetscInt,PetscReal*,PetscReal,PetscReal*,
9a7e14dcfSSatish Balay 			PetscReal*,PetscReal*,PetscReal*,PetscReal*,TAO_DF*);
10a7e14dcfSSatish Balay 
11a7e14dcfSSatish Balay static PetscErrorCode solve(TAO_DF*);
12a7e14dcfSSatish Balay 
13a7e14dcfSSatish Balay 
14a7e14dcfSSatish Balay /*------------------------------------------------------------*/
15a7e14dcfSSatish Balay /* The main solver function
16a7e14dcfSSatish Balay 
17a7e14dcfSSatish Balay    f = Remp(W)		This is what the user provides us from the application layer
18a7e14dcfSSatish Balay    So the ComputeGradient function for instance should get us back the subgradient of Remp(W)
19a7e14dcfSSatish Balay 
20a7e14dcfSSatish Balay    Regularizer assumed to be L2 norm = lambda*0.5*W'W ()
21a7e14dcfSSatish Balay */
22a7e14dcfSSatish Balay 
23a7e14dcfSSatish Balay #undef __FUNCT__
24a7e14dcfSSatish Balay #define __FUNCT__ "make_grad_node"
25a7e14dcfSSatish Balay static PetscErrorCode make_grad_node(Vec X, Vec_Chain **p)
26a7e14dcfSSatish Balay {
27a7e14dcfSSatish Balay   PetscErrorCode ierr;
28a7e14dcfSSatish Balay 
29a7e14dcfSSatish Balay   PetscFunctionBegin;
30a7e14dcfSSatish Balay 
31a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(Vec_Chain), p); CHKERRQ(ierr);
32a7e14dcfSSatish Balay   ierr = VecDuplicate(X, &(*p)->V); CHKERRQ(ierr);
33a7e14dcfSSatish Balay   ierr = VecCopy(X, (*p)->V); CHKERRQ(ierr);
34*6c23d075SBarry Smith   (*p)->next = NULL;
35a7e14dcfSSatish Balay 
36a7e14dcfSSatish Balay   PetscFunctionReturn(0);
37a7e14dcfSSatish Balay }
38a7e14dcfSSatish Balay 
39a7e14dcfSSatish Balay 
40a7e14dcfSSatish Balay #undef __FUNCT__
41a7e14dcfSSatish Balay #define __FUNCT__ "destroy_grad_list"
42a7e14dcfSSatish Balay static PetscErrorCode destroy_grad_list(Vec_Chain *head)
43a7e14dcfSSatish Balay {
44a7e14dcfSSatish Balay   PetscErrorCode ierr;
45a7e14dcfSSatish Balay   Vec_Chain *p = head->next, *q;
46a7e14dcfSSatish Balay 
47a7e14dcfSSatish Balay   PetscFunctionBegin;
48a7e14dcfSSatish Balay   while(p) {
49a7e14dcfSSatish Balay     q = p->next;
50a7e14dcfSSatish Balay     ierr = VecDestroy(&p->V); CHKERRQ(ierr);
51a7e14dcfSSatish Balay     ierr = PetscFree(p); CHKERRQ(ierr);
52a7e14dcfSSatish Balay     p = q;
53a7e14dcfSSatish Balay   }
54*6c23d075SBarry Smith   head->next = NULL;
55a7e14dcfSSatish Balay 
56a7e14dcfSSatish Balay   PetscFunctionReturn(0);
57a7e14dcfSSatish Balay }
58a7e14dcfSSatish Balay 
59a7e14dcfSSatish Balay 
60a7e14dcfSSatish Balay #undef __FUNCT__
61a7e14dcfSSatish Balay #define __FUNCT__ "TaoSolve_BMRM"
62a7e14dcfSSatish Balay static PetscErrorCode TaoSolve_BMRM(TaoSolver tao)
63a7e14dcfSSatish Balay {
64a7e14dcfSSatish Balay   PetscErrorCode ierr;
65a7e14dcfSSatish Balay   TaoSolverTerminationReason reason;
66a7e14dcfSSatish Balay   TAO_DF df;
67a7e14dcfSSatish Balay   TAO_BMRM *bmrm = (TAO_BMRM*)tao->data;
68a7e14dcfSSatish Balay 
69a7e14dcfSSatish Balay   /* Values and pointers to parts of the optimization problem */
70a7e14dcfSSatish Balay   PetscReal f = 0.0;
71a7e14dcfSSatish Balay   Vec W = tao->solution;
72a7e14dcfSSatish Balay   Vec G = tao->gradient;
73a7e14dcfSSatish Balay   PetscReal lambda;
74a7e14dcfSSatish Balay 
75a7e14dcfSSatish Balay   PetscReal bt;
76a7e14dcfSSatish Balay   Vec_Chain grad_list, *tail_glist, *pgrad;
77a7e14dcfSSatish Balay 
78a7e14dcfSSatish Balay   PetscInt iter = 0;
79a7e14dcfSSatish Balay   PetscInt i;
80a7e14dcfSSatish Balay   PetscMPIInt rank;
81a7e14dcfSSatish Balay 
82a7e14dcfSSatish Balay   /* Used in termination criteria check */
83a7e14dcfSSatish Balay   PetscReal reg;
84a7e14dcfSSatish Balay   PetscReal jtwt, max_jtwt, pre_epsilon, epsilon, jw, min_jw;
85a7e14dcfSSatish Balay   PetscReal innerSolverTol;
86a7e14dcfSSatish Balay 
87a7e14dcfSSatish Balay   PetscFunctionBegin;
88a7e14dcfSSatish Balay 
89a7e14dcfSSatish Balay   ierr = MPI_Comm_rank(PETSC_COMM_WORLD, &rank); CHKERRQ(ierr);
90a7e14dcfSSatish Balay   lambda = bmrm->lambda;
91a7e14dcfSSatish Balay 
92a7e14dcfSSatish Balay   /* Check Stopping Condition */
93a7e14dcfSSatish Balay   tao->step = 1.0;
94a7e14dcfSSatish Balay   max_jtwt = -BMRM_INFTY;
95a7e14dcfSSatish Balay   min_jw = BMRM_INFTY;
96a7e14dcfSSatish Balay   innerSolverTol = 1.0;
97a7e14dcfSSatish Balay   epsilon = 0.0;
98a7e14dcfSSatish Balay 
99a7e14dcfSSatish Balay   if (rank == 0) {
100a7e14dcfSSatish Balay     ierr = init_df_solver(&df); CHKERRQ(ierr);
101a7e14dcfSSatish Balay     grad_list.next = NULL;
102a7e14dcfSSatish Balay     tail_glist = &grad_list;
103a7e14dcfSSatish Balay   }
104a7e14dcfSSatish Balay 
105a7e14dcfSSatish Balay   df.tol = 1e-6;
106a7e14dcfSSatish Balay   reason = TAO_CONTINUE_ITERATING;
107a7e14dcfSSatish Balay 
108a7e14dcfSSatish Balay   /*-----------------Algorithm Begins------------------------*/
109a7e14dcfSSatish Balay   /* make the scatter */
110a7e14dcfSSatish Balay   ierr = VecScatterCreateToZero(W, &bmrm->scatter, &bmrm->local_w); CHKERRQ(ierr);
111a7e14dcfSSatish Balay   ierr = VecAssemblyBegin(bmrm->local_w); CHKERRQ(ierr);
112a7e14dcfSSatish Balay   ierr = VecAssemblyEnd(bmrm->local_w); CHKERRQ(ierr);
113a7e14dcfSSatish Balay 
114a7e14dcfSSatish Balay 	/* NOTE: In application pass the sub-gradient of Remp(W) */
115a7e14dcfSSatish Balay   ierr = TaoComputeObjectiveAndGradient(tao, W, &f, G); CHKERRQ(ierr);
116a7e14dcfSSatish Balay   ierr = TaoMonitor(tao,iter,f,1.0,0.0,tao->step,&reason); CHKERRQ(ierr);
117a7e14dcfSSatish Balay   while (reason == TAO_CONTINUE_ITERATING) {
118a7e14dcfSSatish Balay     /* compute bt = Remp(Wt-1) - <Wt-1, At> */
119a7e14dcfSSatish Balay     ierr = VecDot(W, G, &bt); CHKERRQ(ierr);
120a7e14dcfSSatish Balay     bt = f - bt;
121a7e14dcfSSatish Balay 
122a7e14dcfSSatish Balay     /* First gather the gradient to the master node */
123a7e14dcfSSatish Balay     ierr = VecScatterBegin(bmrm->scatter, G, bmrm->local_w, INSERT_VALUES, SCATTER_FORWARD); CHKERRQ(ierr);
124a7e14dcfSSatish Balay     ierr = VecScatterEnd(bmrm->scatter, G, bmrm->local_w, INSERT_VALUES, SCATTER_FORWARD); CHKERRQ(ierr);
125a7e14dcfSSatish Balay 
126a7e14dcfSSatish Balay     /* Bring up the inner solver */
127a7e14dcfSSatish Balay     if (rank == 0) {
128a7e14dcfSSatish Balay       ierr = ensure_df_space(iter+1, &df);  CHKERRQ(ierr);
129a7e14dcfSSatish Balay       ierr = make_grad_node(bmrm->local_w, &pgrad); CHKERRQ(ierr);
130a7e14dcfSSatish Balay       tail_glist->next = pgrad;
131a7e14dcfSSatish Balay       tail_glist = pgrad;
132a7e14dcfSSatish Balay 
133a7e14dcfSSatish Balay       df.a[iter] = 1.0;
134a7e14dcfSSatish Balay       df.f[iter] = -bt;
135a7e14dcfSSatish Balay       df.u[iter] = 1.0;
136a7e14dcfSSatish Balay       df.l[iter] = 0.0;
137a7e14dcfSSatish Balay 
138a7e14dcfSSatish Balay       /* set up the Q */
139a7e14dcfSSatish Balay       pgrad = grad_list.next;
140a7e14dcfSSatish Balay       for (i=0; i<=iter; i++) {
141a7e14dcfSSatish Balay         ierr = VecDot(pgrad->V, bmrm->local_w, &reg); CHKERRQ(ierr);
142a7e14dcfSSatish Balay         df.Q[i][iter] = df.Q[iter][i] = reg / lambda;
143a7e14dcfSSatish Balay         pgrad = pgrad->next;
144a7e14dcfSSatish Balay       }
145a7e14dcfSSatish Balay 
146a7e14dcfSSatish Balay       if (iter > 0) {
147a7e14dcfSSatish Balay         df.x[iter] = 0.0;
148a7e14dcfSSatish Balay         ierr = solve(&df);  CHKERRQ(ierr);
149a7e14dcfSSatish Balay       }
150a7e14dcfSSatish Balay       else
151a7e14dcfSSatish Balay 	df.x[0] = 1.0;
152a7e14dcfSSatish Balay 
153a7e14dcfSSatish Balay       /* now computing Jt*(alpha_t) which should be = Jt(wt) to check convergence */
154a7e14dcfSSatish Balay       jtwt = 0.0;
155a7e14dcfSSatish Balay       ierr = VecSet(bmrm->local_w, 0.0);  CHKERRQ(ierr);
156a7e14dcfSSatish Balay       pgrad = grad_list.next;
157a7e14dcfSSatish Balay       for (i=0; i<=iter; i++) {
158a7e14dcfSSatish Balay         jtwt -= df.x[i] * df.f[i];
159a7e14dcfSSatish Balay         ierr = VecAXPY(bmrm->local_w, -df.x[i] / lambda, pgrad->V);  CHKERRQ(ierr);
160a7e14dcfSSatish Balay         pgrad = pgrad->next;
161a7e14dcfSSatish Balay       }
162a7e14dcfSSatish Balay 
163a7e14dcfSSatish Balay       ierr = VecNorm(bmrm->local_w, NORM_2, &reg);  CHKERRQ(ierr);
164a7e14dcfSSatish Balay       reg = 0.5*lambda*reg*reg;
165a7e14dcfSSatish Balay       jtwt -= reg;
166a7e14dcfSSatish Balay     } /* end if rank == 0 */
167a7e14dcfSSatish Balay 
168a7e14dcfSSatish Balay     /* scatter the new W to all nodes */
169a7e14dcfSSatish Balay     ierr = VecScatterBegin(bmrm->scatter,bmrm->local_w,W,INSERT_VALUES,SCATTER_REVERSE); CHKERRQ(ierr);
170a7e14dcfSSatish Balay     ierr = VecScatterEnd(bmrm->scatter,bmrm->local_w,W,INSERT_VALUES,SCATTER_REVERSE); CHKERRQ(ierr);
171a7e14dcfSSatish Balay 
172a7e14dcfSSatish Balay     ierr = TaoComputeObjectiveAndGradient(tao, W, &f, G); CHKERRQ(ierr);
173a7e14dcfSSatish Balay 
174a7e14dcfSSatish Balay     MPI_Bcast(&jtwt,1,MPI_DOUBLE,0,PETSC_COMM_WORLD);
175a7e14dcfSSatish Balay     MPI_Bcast(&reg,1,MPI_DOUBLE,0,PETSC_COMM_WORLD);
176a7e14dcfSSatish Balay 
177a7e14dcfSSatish Balay     jw = reg + f;					/* J(w) = regularizer + Remp(w) */
178a7e14dcfSSatish Balay     if (jw < min_jw)
179a7e14dcfSSatish Balay       min_jw = jw;
180a7e14dcfSSatish Balay     if (jtwt > max_jtwt)
181a7e14dcfSSatish Balay       max_jtwt = jtwt;
182a7e14dcfSSatish Balay 
183a7e14dcfSSatish Balay     pre_epsilon = epsilon;
184a7e14dcfSSatish Balay     epsilon = min_jw - jtwt;
185a7e14dcfSSatish Balay 
186a7e14dcfSSatish Balay     if (rank == 0) {
187a7e14dcfSSatish Balay       if (innerSolverTol > epsilon)
188a7e14dcfSSatish Balay         innerSolverTol = epsilon;
189a7e14dcfSSatish Balay       else if (innerSolverTol < 1e-7)
190a7e14dcfSSatish Balay         innerSolverTol = 1e-7;
191a7e14dcfSSatish Balay 
192a7e14dcfSSatish Balay       /* if the annealing doesn't work well, lower the inner solver tolerance */
193a7e14dcfSSatish Balay       if(pre_epsilon < epsilon)
194a7e14dcfSSatish Balay         innerSolverTol *= 0.2;
195a7e14dcfSSatish Balay 
196a7e14dcfSSatish Balay       df.tol = innerSolverTol*0.5;
197a7e14dcfSSatish Balay     }
198a7e14dcfSSatish Balay 
199a7e14dcfSSatish Balay     iter++;
200a7e14dcfSSatish Balay     ierr = TaoMonitor(tao,iter,min_jw,epsilon,0.0,tao->step,&reason); CHKERRQ(ierr);
201a7e14dcfSSatish Balay   }
202a7e14dcfSSatish Balay 
203a7e14dcfSSatish Balay   /* free all the memory */
204a7e14dcfSSatish Balay   if (rank == 0) {
205a7e14dcfSSatish Balay     ierr = destroy_grad_list(&grad_list); 	CHKERRQ(ierr);
206a7e14dcfSSatish Balay     ierr = destroy_df_solver(&df); CHKERRQ(ierr);
207a7e14dcfSSatish Balay   }
208a7e14dcfSSatish Balay 
209a7e14dcfSSatish Balay   ierr = VecDestroy(&bmrm->local_w); CHKERRQ(ierr);
210a7e14dcfSSatish Balay   ierr = VecScatterDestroy(&bmrm->scatter); CHKERRQ(ierr);
211a7e14dcfSSatish Balay 
212a7e14dcfSSatish Balay   PetscFunctionReturn(0);
213a7e14dcfSSatish Balay }
214a7e14dcfSSatish Balay 
215a7e14dcfSSatish Balay 
216a7e14dcfSSatish Balay /* ---------------------------------------------------------- */
217a7e14dcfSSatish Balay 
218a7e14dcfSSatish Balay #undef __FUNCT__
219a7e14dcfSSatish Balay #define __FUNCT__ "TaoSetup_BMRM"
220a7e14dcfSSatish Balay static PetscErrorCode TaoSetup_BMRM(TaoSolver tao) {
221a7e14dcfSSatish Balay 
222a7e14dcfSSatish Balay   PetscErrorCode      ierr;
223a7e14dcfSSatish Balay 
224a7e14dcfSSatish Balay   PetscFunctionBegin;
225a7e14dcfSSatish Balay 
226a7e14dcfSSatish Balay   /* Allocate some arrays */
227a7e14dcfSSatish Balay   if (!tao->gradient) {
228a7e14dcfSSatish Balay     ierr = VecDuplicate(tao->solution, &tao->gradient);    CHKERRQ(ierr);
229a7e14dcfSSatish Balay   }
230a7e14dcfSSatish Balay 
231a7e14dcfSSatish Balay   PetscFunctionReturn(0);
232a7e14dcfSSatish Balay }
233a7e14dcfSSatish Balay 
234a7e14dcfSSatish Balay 
235a7e14dcfSSatish Balay /*------------------------------------------------------------*/
236a7e14dcfSSatish Balay 
237a7e14dcfSSatish Balay #undef __FUNCT__
238a7e14dcfSSatish Balay #define __FUNCT__ "TaoDestroy_BMRM"
239a7e14dcfSSatish Balay static PetscErrorCode TaoDestroy_BMRM(TaoSolver tao)
240a7e14dcfSSatish Balay {
241a7e14dcfSSatish Balay   PetscErrorCode ierr;
242a7e14dcfSSatish Balay 
243a7e14dcfSSatish Balay   PetscFunctionBegin;
244a7e14dcfSSatish Balay   ierr = PetscFree(tao->data); CHKERRQ(ierr);
245a7e14dcfSSatish Balay   PetscFunctionReturn(0);
246a7e14dcfSSatish Balay }
247a7e14dcfSSatish Balay 
248a7e14dcfSSatish Balay 
249a7e14dcfSSatish Balay #undef __FUNCT__
250a7e14dcfSSatish Balay #define __FUNCT__ "TaoSetFromOptions_BMRM"
251a7e14dcfSSatish Balay static PetscErrorCode TaoSetFromOptions_BMRM(TaoSolver tao)
252a7e14dcfSSatish Balay {
253a7e14dcfSSatish Balay   PetscErrorCode ierr;
254a7e14dcfSSatish Balay   TAO_BMRM*      bmrm = (TAO_BMRM*)tao->data;
255a7e14dcfSSatish Balay   PetscBool      flg;
256a7e14dcfSSatish Balay 
257a7e14dcfSSatish Balay   PetscFunctionBegin;
258a7e14dcfSSatish Balay   ierr = PetscOptionsHead("BMRM for regularized risk minimization");CHKERRQ(ierr);
259a7e14dcfSSatish Balay   ierr = PetscOptionsReal("-tao_bmrm_lambda", "regulariser weight","", 100,&bmrm->lambda,&flg);  CHKERRQ(ierr);
260a7e14dcfSSatish Balay   ierr = PetscOptionsTail();CHKERRQ(ierr);
261a7e14dcfSSatish Balay   PetscFunctionReturn(0);
262a7e14dcfSSatish Balay }
263a7e14dcfSSatish Balay 
264a7e14dcfSSatish Balay 
265a7e14dcfSSatish Balay /*------------------------------------------------------------*/
266a7e14dcfSSatish Balay #undef __FUNCT__
267a7e14dcfSSatish Balay #define __FUNCT__ "TaoView_BMRM"
268a7e14dcfSSatish Balay static PetscErrorCode TaoView_BMRM(TaoSolver tao, PetscViewer viewer)
269a7e14dcfSSatish Balay {
270a7e14dcfSSatish Balay   PetscBool           isascii;
271a7e14dcfSSatish Balay   PetscErrorCode      ierr;
272a7e14dcfSSatish Balay 
273a7e14dcfSSatish Balay   PetscFunctionBegin;
274a7e14dcfSSatish Balay   ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&isascii);CHKERRQ(ierr);
275a7e14dcfSSatish Balay   if (isascii) {
276a7e14dcfSSatish Balay     ierr = PetscViewerASCIIPushTab(viewer); CHKERRQ(ierr);
277a7e14dcfSSatish Balay     ierr = PetscViewerASCIIPopTab(viewer); CHKERRQ(ierr);
278a7e14dcfSSatish Balay   }
279a7e14dcfSSatish Balay   else{
280a7e14dcfSSatish Balay     SETERRQ1(((PetscObject)tao)->comm,PETSC_ERR_SUP,"Viewer type %s not supported for TAO BMRM",((PetscObject)viewer)->type_name);
281a7e14dcfSSatish Balay   }
282a7e14dcfSSatish Balay 
283a7e14dcfSSatish Balay   PetscFunctionReturn(0);
284a7e14dcfSSatish Balay }
285a7e14dcfSSatish Balay 
286a7e14dcfSSatish Balay 
287a7e14dcfSSatish Balay /*------------------------------------------------------------*/
288a7e14dcfSSatish Balay EXTERN_C_BEGIN
289a7e14dcfSSatish Balay #undef __FUNCT__
290a7e14dcfSSatish Balay #define __FUNCT__ "TaoCreate_BMRM"
291a7e14dcfSSatish Balay PetscErrorCode TaoCreate_BMRM(TaoSolver tao)
292a7e14dcfSSatish Balay {
293a7e14dcfSSatish Balay   TAO_BMRM *bmrm;
294a7e14dcfSSatish Balay   PetscErrorCode      ierr;
295a7e14dcfSSatish Balay 
296a7e14dcfSSatish Balay   PetscFunctionBegin;
297a7e14dcfSSatish Balay   tao->ops->setup = TaoSetup_BMRM;
298a7e14dcfSSatish Balay   tao->ops->solve = TaoSolve_BMRM;
299a7e14dcfSSatish Balay   tao->ops->view  = TaoView_BMRM;
300a7e14dcfSSatish Balay   tao->ops->setfromoptions = TaoSetFromOptions_BMRM;
301a7e14dcfSSatish Balay   tao->ops->destroy = TaoDestroy_BMRM;
302a7e14dcfSSatish Balay 
3033c9e27cfSGeoffrey Irving   ierr = PetscNewLog(tao,&bmrm); CHKERRQ(ierr);
304a7e14dcfSSatish Balay   bmrm->lambda = 1.0;
305a7e14dcfSSatish Balay   tao->data = (void*)bmrm;
306a7e14dcfSSatish Balay 
307a7e14dcfSSatish Balay   /* Note: May need to be tuned! */
308a7e14dcfSSatish Balay   tao->max_it = 2048;
309a7e14dcfSSatish Balay   tao->max_funcs = 300000;
310a7e14dcfSSatish Balay   tao->fatol = 1e-20;
311a7e14dcfSSatish Balay   tao->frtol = 1e-25;
312a7e14dcfSSatish Balay   tao->gatol = 1e-25;
313a7e14dcfSSatish Balay   tao->grtol = 1e-25;
314a7e14dcfSSatish Balay 
315a7e14dcfSSatish Balay   PetscFunctionReturn(0);
316a7e14dcfSSatish Balay }
317a7e14dcfSSatish Balay EXTERN_C_END
318a7e14dcfSSatish Balay 
319a7e14dcfSSatish Balay 
320a7e14dcfSSatish Balay 
321a7e14dcfSSatish Balay #undef __FUNCT__
322a7e14dcfSSatish Balay #define __FUNCT__ "init_df_solver"
323a7e14dcfSSatish Balay PetscErrorCode init_df_solver(TAO_DF *df)
324a7e14dcfSSatish Balay {
325a7e14dcfSSatish Balay   PetscInt i, n = INCRE_DIM;
326a7e14dcfSSatish Balay   PetscErrorCode ierr;
327a7e14dcfSSatish Balay 
328a7e14dcfSSatish Balay   PetscFunctionBegin;
329a7e14dcfSSatish Balay 
330a7e14dcfSSatish Balay   /* default values */
331a7e14dcfSSatish Balay   df->maxProjIter = 200;
332a7e14dcfSSatish Balay   df->maxPGMIter = 300000;
333a7e14dcfSSatish Balay   df->b = 1.0;
334a7e14dcfSSatish Balay 
335a7e14dcfSSatish Balay   /* memory space required by Dai-Fletcher */
336a7e14dcfSSatish Balay   df->cur_num_cp = n;
337a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(PetscReal)*n, &df->f);  CHKERRQ(ierr);
338a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(PetscReal)*n, &df->a);  CHKERRQ(ierr);
339a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(PetscReal)*n, &df->l);  CHKERRQ(ierr);
340a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(PetscReal)*n, &df->u);  CHKERRQ(ierr);
341a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(PetscReal)*n, &df->x);  CHKERRQ(ierr);
342a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(PetscReal*)*n, &df->Q);  CHKERRQ(ierr);
343a7e14dcfSSatish Balay 
344a7e14dcfSSatish Balay   for (i = 0; i < n; i ++) {
345a7e14dcfSSatish Balay     ierr = PetscMalloc(sizeof(PetscReal)*n, &df->Q[i]);  CHKERRQ(ierr);
346a7e14dcfSSatish Balay   }
347a7e14dcfSSatish Balay 
348a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(PetscReal)*n, &df->g);  CHKERRQ(ierr);
349a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(PetscReal)*n, &df->y);  CHKERRQ(ierr);
350a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(PetscReal)*n, &df->tempv);  CHKERRQ(ierr);
351a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(PetscReal)*n, &df->d);  CHKERRQ(ierr);
352a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(PetscReal)*n, &df->Qd);  CHKERRQ(ierr);
353a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(PetscReal)*n, &df->t);  CHKERRQ(ierr);
354a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(PetscReal)*n, &df->xplus);  CHKERRQ(ierr);
355a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(PetscReal)*n, &df->tplus);  CHKERRQ(ierr);
356a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(PetscReal)*n, &df->sk);  CHKERRQ(ierr);
357a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(PetscReal)*n, &df->yk);  CHKERRQ(ierr);
358a7e14dcfSSatish Balay 
359a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(PetscInt)*n, &df->ipt);  CHKERRQ(ierr);
360a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(PetscInt)*n, &df->ipt2);  CHKERRQ(ierr);
361a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(PetscInt)*n, &df->uv);  CHKERRQ(ierr);
362a7e14dcfSSatish Balay 
363a7e14dcfSSatish Balay   PetscFunctionReturn(0);
364a7e14dcfSSatish Balay }
365a7e14dcfSSatish Balay 
366a7e14dcfSSatish Balay 
367a7e14dcfSSatish Balay #undef __FUNCT__
368a7e14dcfSSatish Balay #define __FUNCT__ "ensure_df_space"
369a7e14dcfSSatish Balay PetscErrorCode ensure_df_space(PetscInt dim, TAO_DF *df)
370a7e14dcfSSatish Balay {
371a7e14dcfSSatish Balay   PetscErrorCode ierr;
372a7e14dcfSSatish Balay   PetscReal *tmp, **tmp_Q;
373a7e14dcfSSatish Balay   PetscInt i, n, old_n;
374a7e14dcfSSatish Balay 
375a7e14dcfSSatish Balay   df->dim = dim;
376a7e14dcfSSatish Balay   if (dim <= df->cur_num_cp)
377a7e14dcfSSatish Balay     return 0;
378a7e14dcfSSatish Balay 
379a7e14dcfSSatish Balay   PetscFunctionBegin;
380a7e14dcfSSatish Balay 
381a7e14dcfSSatish Balay   old_n = df->cur_num_cp;
382a7e14dcfSSatish Balay   df->cur_num_cp += INCRE_DIM;
383a7e14dcfSSatish Balay   n = df->cur_num_cp;
384a7e14dcfSSatish Balay 
385a7e14dcfSSatish Balay   /* memory space required by dai-fletcher */
386a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(PetscReal)*n, &tmp);  CHKERRQ(ierr);
387a7e14dcfSSatish Balay   ierr = PetscMemcpy(tmp, df->f, sizeof(PetscReal)*old_n);  CHKERRQ(ierr);
388a7e14dcfSSatish Balay   ierr = PetscFree(df->f);  CHKERRQ(ierr);
389a7e14dcfSSatish Balay   df->f = tmp;
390a7e14dcfSSatish Balay 
391a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(PetscReal)*n, &tmp);  CHKERRQ(ierr);
392a7e14dcfSSatish Balay   ierr = PetscMemcpy(tmp, df->a, sizeof(PetscReal)*old_n);  CHKERRQ(ierr);
393a7e14dcfSSatish Balay   ierr = PetscFree(df->a);  CHKERRQ(ierr);
394a7e14dcfSSatish Balay   df->a = tmp;
395a7e14dcfSSatish Balay 
396a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(PetscReal)*n, &tmp);  CHKERRQ(ierr);
397a7e14dcfSSatish Balay   ierr = PetscMemcpy(tmp, df->l, sizeof(PetscReal)*old_n);  CHKERRQ(ierr);
398a7e14dcfSSatish Balay   ierr = PetscFree(df->l);  CHKERRQ(ierr);
399a7e14dcfSSatish Balay   df->l = tmp;
400a7e14dcfSSatish Balay 
401a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(PetscReal)*n, &tmp);  CHKERRQ(ierr);
402a7e14dcfSSatish Balay   ierr = PetscMemcpy(tmp, df->u, sizeof(PetscReal)*old_n);  CHKERRQ(ierr);
403a7e14dcfSSatish Balay   ierr = PetscFree(df->u);  CHKERRQ(ierr);
404a7e14dcfSSatish Balay   df->u = tmp;
405a7e14dcfSSatish Balay 
406a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(PetscReal)*n, &tmp);  CHKERRQ(ierr);
407a7e14dcfSSatish Balay   ierr = PetscMemcpy(tmp, df->x, sizeof(PetscReal)*old_n);  CHKERRQ(ierr);
408a7e14dcfSSatish Balay   ierr = PetscFree(df->x);  CHKERRQ(ierr);
409a7e14dcfSSatish Balay   df->x = tmp;
410a7e14dcfSSatish Balay 
411a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(PetscReal*)*n, &tmp_Q);  CHKERRQ(ierr);
412a7e14dcfSSatish Balay   for (i = 0; i < n; i ++)
413a7e14dcfSSatish Balay   {
414a7e14dcfSSatish Balay     ierr = PetscMalloc(sizeof(PetscReal)*n, &tmp_Q[i]);  CHKERRQ(ierr);
415a7e14dcfSSatish Balay     if (i < old_n)
416a7e14dcfSSatish Balay     {
417a7e14dcfSSatish Balay       ierr = PetscMemcpy(tmp_Q[i], df->Q[i], sizeof(PetscReal)*old_n);  CHKERRQ(ierr);
418a7e14dcfSSatish Balay       ierr = PetscFree(df->Q[i]);  CHKERRQ(ierr);
419a7e14dcfSSatish Balay     }
420a7e14dcfSSatish Balay   }
421a7e14dcfSSatish Balay 
422a7e14dcfSSatish Balay   ierr = PetscFree(df->Q);  CHKERRQ(ierr);
423a7e14dcfSSatish Balay   df->Q = tmp_Q;
424a7e14dcfSSatish Balay 
425a7e14dcfSSatish Balay   ierr = PetscFree(df->g);  CHKERRQ(ierr);
426a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(PetscReal)*n, &df->g);  CHKERRQ(ierr);
427a7e14dcfSSatish Balay 
428a7e14dcfSSatish Balay   ierr = PetscFree(df->y);  CHKERRQ(ierr);
429a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(PetscReal)*n, &df->y);  CHKERRQ(ierr);
430a7e14dcfSSatish Balay 
431a7e14dcfSSatish Balay   ierr = PetscFree(df->tempv);  CHKERRQ(ierr);
432a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(PetscReal)*n, &df->tempv);  CHKERRQ(ierr);
433a7e14dcfSSatish Balay 
434a7e14dcfSSatish Balay   ierr = PetscFree(df->d);  CHKERRQ(ierr);
435a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(PetscReal)*n, &df->d);  CHKERRQ(ierr);
436a7e14dcfSSatish Balay 
437a7e14dcfSSatish Balay   ierr = PetscFree(df->Qd);  CHKERRQ(ierr);
438a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(PetscReal)*n, &df->Qd);  CHKERRQ(ierr);
439a7e14dcfSSatish Balay 
440a7e14dcfSSatish Balay   ierr = PetscFree(df->t);  CHKERRQ(ierr);
441a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(PetscReal)*n, &df->t);  CHKERRQ(ierr);
442a7e14dcfSSatish Balay 
443a7e14dcfSSatish Balay   ierr = PetscFree(df->xplus);  CHKERRQ(ierr);
444a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(PetscReal)*n, &df->xplus);  CHKERRQ(ierr);
445a7e14dcfSSatish Balay 
446a7e14dcfSSatish Balay   ierr = PetscFree(df->tplus);  CHKERRQ(ierr);
447a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(PetscReal)*n, &df->tplus);  CHKERRQ(ierr);
448a7e14dcfSSatish Balay 
449a7e14dcfSSatish Balay   ierr = PetscFree(df->sk);  CHKERRQ(ierr);
450a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(PetscReal)*n, &df->sk);  CHKERRQ(ierr);
451a7e14dcfSSatish Balay 
452a7e14dcfSSatish Balay   ierr = PetscFree(df->yk);  CHKERRQ(ierr);
453a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(PetscReal)*n, &df->yk);  CHKERRQ(ierr);
454a7e14dcfSSatish Balay 
455a7e14dcfSSatish Balay   ierr = PetscFree(df->ipt);  CHKERRQ(ierr);
456a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(PetscInt)*n, &df->ipt);  CHKERRQ(ierr);
457a7e14dcfSSatish Balay 
458a7e14dcfSSatish Balay   ierr = PetscFree(df->ipt2);  CHKERRQ(ierr);
459a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(PetscInt)*n, &df->ipt2);  CHKERRQ(ierr);
460a7e14dcfSSatish Balay 
461a7e14dcfSSatish Balay   ierr = PetscFree(df->uv);  CHKERRQ(ierr);
462a7e14dcfSSatish Balay   ierr = PetscMalloc(sizeof(PetscInt)*n, &df->uv);  CHKERRQ(ierr);
463a7e14dcfSSatish Balay 
464a7e14dcfSSatish Balay   PetscFunctionReturn(0);
465a7e14dcfSSatish Balay }
466a7e14dcfSSatish Balay 
467a7e14dcfSSatish Balay 
468a7e14dcfSSatish Balay #undef __FUNCT__
469a7e14dcfSSatish Balay #define __FUNCT__ "destroy_df_solver"
470a7e14dcfSSatish Balay PetscErrorCode destroy_df_solver(TAO_DF *df)
471a7e14dcfSSatish Balay {
472a7e14dcfSSatish Balay   PetscErrorCode ierr;
473a7e14dcfSSatish Balay   PetscInt       i;
474*6c23d075SBarry Smith 
475a7e14dcfSSatish Balay   PetscFunctionBegin;
476*6c23d075SBarry Smith   ierr = PetscFree(df->f);  CHKERRQ(ierr);
477*6c23d075SBarry Smith   ierr = PetscFree(df->a);  CHKERRQ(ierr);
478*6c23d075SBarry Smith   ierr = PetscFree(df->l);  CHKERRQ(ierr);
479*6c23d075SBarry Smith   ierr = PetscFree(df->u);  CHKERRQ(ierr);
480*6c23d075SBarry Smith   ierr = PetscFree(df->x);  CHKERRQ(ierr);
481a7e14dcfSSatish Balay 
482*6c23d075SBarry Smith   for (i = 0; i < df->cur_num_cp; i ++) {
483a7e14dcfSSatish Balay     ierr = PetscFree(df->Q[i]);  CHKERRQ(ierr);
484a7e14dcfSSatish Balay   }
485a7e14dcfSSatish Balay   ierr = PetscFree(df->Q);  CHKERRQ(ierr);
486*6c23d075SBarry Smith   ierr = PetscFree(df->ipt);  CHKERRQ(ierr);
487*6c23d075SBarry Smith   ierr = PetscFree(df->ipt2);  CHKERRQ(ierr);
488*6c23d075SBarry Smith   ierr = PetscFree(df->uv);  CHKERRQ(ierr);
489*6c23d075SBarry Smith   ierr = PetscFree(df->g);  CHKERRQ(ierr);
490*6c23d075SBarry Smith   ierr = PetscFree(df->y);  CHKERRQ(ierr);
491*6c23d075SBarry Smith   ierr = PetscFree(df->tempv);  CHKERRQ(ierr);
492*6c23d075SBarry Smith   ierr = PetscFree(df->d);  CHKERRQ(ierr);
493*6c23d075SBarry Smith   ierr = PetscFree(df->Qd);  CHKERRQ(ierr);
494*6c23d075SBarry Smith   ierr = PetscFree(df->t);  CHKERRQ(ierr);
495*6c23d075SBarry Smith   ierr = PetscFree(df->xplus);  CHKERRQ(ierr);
496*6c23d075SBarry Smith   ierr = PetscFree(df->tplus);  CHKERRQ(ierr);
497*6c23d075SBarry Smith   ierr = PetscFree(df->sk);  CHKERRQ(ierr);
498*6c23d075SBarry Smith   ierr = PetscFree(df->yk);  CHKERRQ(ierr);
499a7e14dcfSSatish Balay   PetscFunctionReturn(0);
500a7e14dcfSSatish Balay }
501a7e14dcfSSatish Balay 
502a7e14dcfSSatish Balay 
503a7e14dcfSSatish Balay /* Piecewise linear monotone target function for the Dai-Fletcher projector */
504a7e14dcfSSatish Balay #undef __FUNCT__
505a7e14dcfSSatish Balay #define __FUNCT__ "phi"
506*6c23d075SBarry Smith PetscReal phi(PetscReal *x,PetscInt n,PetscReal lambda,PetscReal *a,PetscReal b,PetscReal *c,PetscReal *l,PetscReal *u)
507a7e14dcfSSatish Balay {
508a7e14dcfSSatish Balay   PetscReal r = 0.0;
509a7e14dcfSSatish Balay   PetscInt  i;
510a7e14dcfSSatish Balay 
511a7e14dcfSSatish Balay   for (i = 0; i < n; i++){
512a7e14dcfSSatish Balay     x[i] = -c[i] + lambda*a[i];
513*6c23d075SBarry Smith     if (x[i] > u[i])     x[i] = u[i];
514*6c23d075SBarry Smith     else if(x[i] < l[i]) x[i] = l[i];
515a7e14dcfSSatish Balay     r += a[i]*x[i];
516a7e14dcfSSatish Balay   }
517a7e14dcfSSatish Balay   return r - b;
518a7e14dcfSSatish Balay }
519a7e14dcfSSatish Balay 
520a7e14dcfSSatish Balay /** Modified Dai-Fletcher QP projector solves the problem:
521a7e14dcfSSatish Balay  *
522a7e14dcfSSatish Balay  *      minimise  0.5*x'*x - c'*x
523a7e14dcfSSatish Balay  *      subj to   a'*x = b
524a7e14dcfSSatish Balay  *                l \leq x \leq u
525a7e14dcfSSatish Balay  *
526a7e14dcfSSatish Balay  *  \param c The point to be projected onto feasible set
527a7e14dcfSSatish Balay  */
528a7e14dcfSSatish Balay #undef __FUNCT__
529a7e14dcfSSatish Balay #define __FUNCT__ "project"
530*6c23d075SBarry Smith PetscInt project(PetscInt n,PetscReal *a,PetscReal b,PetscReal *c,PetscReal *l,PetscReal *u,PetscReal *x,PetscReal *lam_ext,TAO_DF *df)
531a7e14dcfSSatish Balay {
532a7e14dcfSSatish Balay   PetscReal lambda, lambdal, lambdau, dlambda, lambda_new;
533a7e14dcfSSatish Balay   PetscReal r, rl, ru, s;
534a7e14dcfSSatish Balay   PetscInt  innerIter;
535a7e14dcfSSatish Balay   PetscBool nonNegativeSlack = PETSC_FALSE;
536a7e14dcfSSatish Balay 
537a7e14dcfSSatish Balay   *lam_ext = 0;
538a7e14dcfSSatish Balay   lambda  = 0;
539a7e14dcfSSatish Balay   dlambda = 0.5;
540a7e14dcfSSatish Balay   innerIter = 1;
541a7e14dcfSSatish Balay 
542a7e14dcfSSatish Balay   /*  \phi(x;lambda) := 0.5*x'*x + c'*x - lambda*(a'*x-b)
543a7e14dcfSSatish Balay    *
544a7e14dcfSSatish Balay    *  Optimality conditions for \phi:
545a7e14dcfSSatish Balay    *
546a7e14dcfSSatish Balay    *  1. lambda   <= 0
547a7e14dcfSSatish Balay    *  2. r        <= 0
548a7e14dcfSSatish Balay    *  3. r*lambda == 0
549a7e14dcfSSatish Balay    */
550a7e14dcfSSatish Balay 
551a7e14dcfSSatish Balay   /* Bracketing Phase */
552a7e14dcfSSatish Balay   r = phi(x, n, lambda, a, b, c, l, u);
553a7e14dcfSSatish Balay 
554*6c23d075SBarry Smith   if(nonNegativeSlack) {
555a7e14dcfSSatish Balay     /* inequality constraint, i.e., with \xi >= 0 constraint */
556a7e14dcfSSatish Balay     if (r < TOL_R)
557a7e14dcfSSatish Balay       return 0;
558*6c23d075SBarry Smith   } else  {
559a7e14dcfSSatish Balay     /* equality constraint ,i.e., without \xi >= 0 constraint */
560a7e14dcfSSatish Balay     if (fabs(r) < TOL_R)
561a7e14dcfSSatish Balay       return 0;
562a7e14dcfSSatish Balay   }
563a7e14dcfSSatish Balay 
564a7e14dcfSSatish Balay   if (r < 0.0){
565a7e14dcfSSatish Balay     lambdal = lambda;
566a7e14dcfSSatish Balay     rl      = r;
567a7e14dcfSSatish Balay     lambda  = lambda + dlambda;
568a7e14dcfSSatish Balay     r       = phi(x, n, lambda, a, b, c, l, u);
569a7e14dcfSSatish Balay     while (r < 0.0 && dlambda < BMRM_INFTY)  {
570a7e14dcfSSatish Balay       lambdal = lambda;
571a7e14dcfSSatish Balay       s       = rl/r - 1.0;
572a7e14dcfSSatish Balay       if (s < 0.1) s = 0.1;
573a7e14dcfSSatish Balay       dlambda = dlambda + dlambda/s;
574a7e14dcfSSatish Balay       lambda  = lambda + dlambda;
575a7e14dcfSSatish Balay       rl      = r;
576a7e14dcfSSatish Balay       r       = phi(x, n, lambda, a, b, c, l, u);
577a7e14dcfSSatish Balay     }
578a7e14dcfSSatish Balay     lambdau = lambda;
579a7e14dcfSSatish Balay     ru      = r;
580*6c23d075SBarry Smith   } else {
581a7e14dcfSSatish Balay     lambdau = lambda;
582a7e14dcfSSatish Balay     ru      = r;
583a7e14dcfSSatish Balay     lambda  = lambda - dlambda;
584a7e14dcfSSatish Balay     r       = phi(x, n, lambda, a, b, c, l, u);
585a7e14dcfSSatish Balay     while (r > 0.0 && dlambda > -BMRM_INFTY) {
586a7e14dcfSSatish Balay       lambdau = lambda;
587a7e14dcfSSatish Balay       s       = ru/r - 1.0;
588a7e14dcfSSatish Balay       if (s < 0.1) s = 0.1;
589a7e14dcfSSatish Balay       dlambda = dlambda + dlambda/s;
590a7e14dcfSSatish Balay       lambda  = lambda - dlambda;
591a7e14dcfSSatish Balay       ru      = r;
592a7e14dcfSSatish Balay       r       = phi(x, n, lambda, a, b, c, l, u);
593a7e14dcfSSatish Balay     }
594a7e14dcfSSatish Balay     lambdal = lambda;
595a7e14dcfSSatish Balay     rl      = r;
596a7e14dcfSSatish Balay   }
597a7e14dcfSSatish Balay 
598*6c23d075SBarry Smith   if(fabs(dlambda) > BMRM_INFTY) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"L2N2_DaiFletcherPGM detected Infeasible QP problem!");
599a7e14dcfSSatish Balay 
600a7e14dcfSSatish Balay   if(ru == 0){
601a7e14dcfSSatish Balay     lambda = lambdau;
602a7e14dcfSSatish Balay     r = phi(x, n, lambda, a, b, c, l, u);
603a7e14dcfSSatish Balay     return innerIter;
604a7e14dcfSSatish Balay   }
605a7e14dcfSSatish Balay 
606a7e14dcfSSatish Balay   /* Secant Phase */
607a7e14dcfSSatish Balay   s       = 1.0 - rl/ru;
608a7e14dcfSSatish Balay   dlambda = dlambda/s;
609a7e14dcfSSatish Balay   lambda  = lambdau - dlambda;
610a7e14dcfSSatish Balay   r       = phi(x, n, lambda, a, b, c, l, u);
611a7e14dcfSSatish Balay 
612a7e14dcfSSatish Balay   while (fabs(r) > TOL_R
613a7e14dcfSSatish Balay          && dlambda > TOL_LAM * (1.0 + fabs(lambda))
614a7e14dcfSSatish Balay          && innerIter < df->maxProjIter){
615a7e14dcfSSatish Balay     innerIter++;
616a7e14dcfSSatish Balay     if (r > 0.0){
617a7e14dcfSSatish Balay       if (s <= 2.0){
618a7e14dcfSSatish Balay         lambdau = lambda;
619a7e14dcfSSatish Balay         ru      = r;
620a7e14dcfSSatish Balay         s       = 1.0 - rl/ru;
621a7e14dcfSSatish Balay         dlambda = (lambdau - lambdal) / s;
622a7e14dcfSSatish Balay         lambda  = lambdau - dlambda;
623a7e14dcfSSatish Balay       }
624a7e14dcfSSatish Balay       else {
625a7e14dcfSSatish Balay         s          = ru/r-1.0;
626a7e14dcfSSatish Balay         if (s < 0.1) s = 0.1;
627a7e14dcfSSatish Balay         dlambda    = (lambdau - lambda) / s;
628a7e14dcfSSatish Balay         lambda_new = 0.75*lambdal + 0.25*lambda;
629a7e14dcfSSatish Balay         if (lambda_new < (lambda - dlambda))
630a7e14dcfSSatish Balay           lambda_new = lambda - dlambda;
631a7e14dcfSSatish Balay         lambdau    = lambda;
632a7e14dcfSSatish Balay         ru         = r;
633a7e14dcfSSatish Balay         lambda     = lambda_new;
634a7e14dcfSSatish Balay         s          = (lambdau - lambdal) / (lambdau - lambda);
635a7e14dcfSSatish Balay       }
636a7e14dcfSSatish Balay     }
637a7e14dcfSSatish Balay     else {
638a7e14dcfSSatish Balay       if (s >= 2.0){
639a7e14dcfSSatish Balay         lambdal = lambda;
640a7e14dcfSSatish Balay         rl      = r;
641a7e14dcfSSatish Balay         s       = 1.0 - rl/ru;
642a7e14dcfSSatish Balay         dlambda = (lambdau - lambdal) / s;
643a7e14dcfSSatish Balay         lambda  = lambdau - dlambda;
644a7e14dcfSSatish Balay       }
645a7e14dcfSSatish Balay       else {
646a7e14dcfSSatish Balay         s          = rl/r - 1.0;
647a7e14dcfSSatish Balay         if (s < 0.1) s = 0.1;
648a7e14dcfSSatish Balay         dlambda    = (lambda-lambdal) / s;
649a7e14dcfSSatish Balay         lambda_new = 0.75*lambdau + 0.25*lambda;
650a7e14dcfSSatish Balay         if (lambda_new > (lambda + dlambda))
651a7e14dcfSSatish Balay           lambda_new = lambda + dlambda;
652a7e14dcfSSatish Balay         lambdal    = lambda;
653a7e14dcfSSatish Balay         rl         = r;
654a7e14dcfSSatish Balay         lambda     = lambda_new;
655a7e14dcfSSatish Balay         s          = (lambdau - lambdal) / (lambdau-lambda);
656a7e14dcfSSatish Balay       }
657a7e14dcfSSatish Balay     }
658a7e14dcfSSatish Balay     r = phi(x, n, lambda, a, b, c, l, u);
659a7e14dcfSSatish Balay   }
660a7e14dcfSSatish Balay 
661a7e14dcfSSatish Balay   *lam_ext = lambda;
662a7e14dcfSSatish Balay   if(innerIter >= df->maxProjIter)
663a7e14dcfSSatish Balay     PetscPrintf(PETSC_COMM_SELF, "WARNING: DaiFletcher max iterations\n");
664a7e14dcfSSatish Balay 
665a7e14dcfSSatish Balay   return innerIter;
666a7e14dcfSSatish Balay }
667a7e14dcfSSatish Balay 
668a7e14dcfSSatish Balay 
669a7e14dcfSSatish Balay #undef __FUNCT__
670a7e14dcfSSatish Balay #define __FUNCT__ "solve"
671a7e14dcfSSatish Balay PetscErrorCode solve(TAO_DF *df)
672a7e14dcfSSatish Balay {
673a7e14dcfSSatish Balay   PetscErrorCode ierr;
674a7e14dcfSSatish Balay   PetscInt    i, j, innerIter, it, it2, luv, info, lscount = 0, projcount = 0;
675a7e14dcfSSatish Balay   PetscReal gd, max, ak, bk, akold, bkold, lamnew, alpha, kktlam=0.0, lam_ext;
676a7e14dcfSSatish Balay   PetscReal DELTAsv, ProdDELTAsv;
677a7e14dcfSSatish Balay   PetscReal c, *tempQ;
678a7e14dcfSSatish Balay   PetscReal *x = df->x, *a = df->a, b = df->b, *l = df->l, *u = df->u, tol = df->tol;
679a7e14dcfSSatish Balay   PetscReal *tempv = df->tempv, *y = df->y, *g = df->g, *d = df->d, *Qd = df->Qd;
680a7e14dcfSSatish Balay   PetscReal *xplus = df->xplus, *tplus = df->tplus, *sk = df->sk, *yk = df->yk;
681a7e14dcfSSatish Balay   PetscReal **Q = df->Q, *f = df->f, *t = df->t;
682a7e14dcfSSatish Balay   PetscInt dim = df->dim, *ipt = df->ipt, *ipt2 = df->ipt2, *uv = df->uv;
683a7e14dcfSSatish Balay 
684a7e14dcfSSatish Balay   /*** variables for the adaptive nonmonotone linesearch ***/
685a7e14dcfSSatish Balay   PetscInt    L, llast;
686a7e14dcfSSatish Balay   PetscReal fr, fbest, fv, fc, fv0;
687a7e14dcfSSatish Balay   c = BMRM_INFTY;
688a7e14dcfSSatish Balay 
689a7e14dcfSSatish Balay   DELTAsv = EPS_SV;
690a7e14dcfSSatish Balay   if (tol <= 1.0e-5 || dim <= 20)
691a7e14dcfSSatish Balay     ProdDELTAsv = 0.0F;
692a7e14dcfSSatish Balay   else
693a7e14dcfSSatish Balay     ProdDELTAsv = EPS_SV;
694a7e14dcfSSatish Balay 
695a7e14dcfSSatish Balay   for (i = 0; i < dim; i++)
696a7e14dcfSSatish Balay     tempv[i] = -x[i];
697a7e14dcfSSatish Balay 
698a7e14dcfSSatish Balay   lam_ext = 0.0;
699a7e14dcfSSatish Balay 
700a7e14dcfSSatish Balay   /* Project the initial solution */
701a7e14dcfSSatish Balay   projcount += project(dim, a, b, tempv, l, u, x, &lam_ext, df);
702a7e14dcfSSatish Balay 
703a7e14dcfSSatish Balay   /* Compute gradient
704a7e14dcfSSatish Balay      g = Q*x + f; */
705a7e14dcfSSatish Balay 
706a7e14dcfSSatish Balay   it = 0;
707a7e14dcfSSatish Balay   for (i = 0; i < dim; i++)
708a7e14dcfSSatish Balay     if (fabs(x[i]) > ProdDELTAsv)
709a7e14dcfSSatish Balay       ipt[it++] = i;
710a7e14dcfSSatish Balay 
711a7e14dcfSSatish Balay   ierr = PetscMemzero(t, dim*sizeof(PetscReal));  CHKERRQ(ierr);
712a7e14dcfSSatish Balay   for (i = 0; i < it; i++){
713a7e14dcfSSatish Balay     tempQ = Q[ipt[i]];
714a7e14dcfSSatish Balay     for (j = 0; j < dim; j++)
715a7e14dcfSSatish Balay       t[j] += (tempQ[j]*x[ipt[i]]);
716a7e14dcfSSatish Balay   }
717a7e14dcfSSatish Balay   for (i = 0; i < dim; i++){
718a7e14dcfSSatish Balay     g[i] = t[i] + f[i];
719a7e14dcfSSatish Balay   }
720a7e14dcfSSatish Balay 
721a7e14dcfSSatish Balay 
722a7e14dcfSSatish Balay   /* y = -(x_{k} - g_{k}) */
723a7e14dcfSSatish Balay   for (i = 0; i < dim; i++){
724a7e14dcfSSatish Balay     y[i] = g[i] - x[i];
725a7e14dcfSSatish Balay   }
726a7e14dcfSSatish Balay 
727a7e14dcfSSatish Balay   /* Project x_{k} - g_{k} */
728a7e14dcfSSatish Balay   projcount += project(dim, a, b, y, l, u, tempv, &lam_ext, df);
729a7e14dcfSSatish Balay 
730a7e14dcfSSatish Balay   /* y = P(x_{k} - g_{k}) - x_{k} */
731a7e14dcfSSatish Balay   max = ALPHA_MIN;
732a7e14dcfSSatish Balay   for (i = 0; i < dim; i++){
733a7e14dcfSSatish Balay     y[i] = tempv[i] - x[i];
734a7e14dcfSSatish Balay     if (fabs(y[i]) > max)
735a7e14dcfSSatish Balay       max = fabs(y[i]);
736a7e14dcfSSatish Balay   }
737a7e14dcfSSatish Balay 
738a7e14dcfSSatish Balay   if (max < tol*1e-3){
739a7e14dcfSSatish Balay     lscount = 0;
740a7e14dcfSSatish Balay     innerIter    = 0;
741a7e14dcfSSatish Balay     return 0;
742a7e14dcfSSatish Balay   }
743a7e14dcfSSatish Balay 
744a7e14dcfSSatish Balay   alpha = 1.0 / max;
745a7e14dcfSSatish Balay 
746a7e14dcfSSatish Balay   /* fv0 = f(x_{0}). Recall t = Q x_{k}  */
747a7e14dcfSSatish Balay   fv0   = 0.0;
748a7e14dcfSSatish Balay   for (i = 0; i < dim; i++)
749a7e14dcfSSatish Balay     fv0 += x[i] * (0.5*t[i] + f[i]);
750a7e14dcfSSatish Balay 
751a7e14dcfSSatish Balay   /*** adaptive nonmonotone linesearch ***/
752a7e14dcfSSatish Balay   L     = 2;
753a7e14dcfSSatish Balay   fr    = ALPHA_MAX;
754a7e14dcfSSatish Balay   fbest = fv0;
755a7e14dcfSSatish Balay   fc    = fv0;
756a7e14dcfSSatish Balay   llast = 0;
757a7e14dcfSSatish Balay   akold = bkold = 0.0;
758a7e14dcfSSatish Balay 
759a7e14dcfSSatish Balay   /***      Iterator begins     ***/
760a7e14dcfSSatish Balay   for (innerIter = 1; innerIter <= df->maxPGMIter; innerIter++) {
761a7e14dcfSSatish Balay 
762a7e14dcfSSatish Balay     /* tempv = -(x_{k} - alpha*g_{k}) */
763a7e14dcfSSatish Balay     for (i = 0; i < dim; i++)
764a7e14dcfSSatish Balay       tempv[i] = alpha*g[i] - x[i];
765a7e14dcfSSatish Balay 
766a7e14dcfSSatish Balay     /* Project x_{k} - alpha*g_{k} */
767a7e14dcfSSatish Balay     projcount += project(dim, a, b, tempv, l, u, y, &lam_ext, df);
768a7e14dcfSSatish Balay 
769a7e14dcfSSatish Balay 
770a7e14dcfSSatish Balay     /* gd = \inner{d_{k}}{g_{k}}
771a7e14dcfSSatish Balay         d = P(x_{k} - alpha*g_{k}) - x_{k}
772a7e14dcfSSatish Balay     */
773a7e14dcfSSatish Balay     gd = 0.0;
774a7e14dcfSSatish Balay     for (i = 0; i < dim; i++){
775a7e14dcfSSatish Balay       d[i] = y[i] - x[i];
776a7e14dcfSSatish Balay       gd  += d[i] * g[i];
777a7e14dcfSSatish Balay     }
778a7e14dcfSSatish Balay 
779a7e14dcfSSatish Balay     /* Gradient computation  */
780a7e14dcfSSatish Balay 
781a7e14dcfSSatish Balay     /* compute Qd = Q*d  or  Qd = Q*y - t depending on their sparsity */
782a7e14dcfSSatish Balay 
783a7e14dcfSSatish Balay     it = it2 = 0;
784a7e14dcfSSatish Balay     for (i = 0; i < dim; i++)
785a7e14dcfSSatish Balay       if (fabs(d[i]) > (ProdDELTAsv*1.0e-2))
786a7e14dcfSSatish Balay         ipt[it++]   = i;
787a7e14dcfSSatish Balay     for (i = 0; i < dim; i++)
788a7e14dcfSSatish Balay       if (fabs(y[i]) > ProdDELTAsv)
789a7e14dcfSSatish Balay         ipt2[it2++] = i;
790a7e14dcfSSatish Balay 
791a7e14dcfSSatish Balay     ierr = PetscMemzero(Qd, dim*sizeof(PetscReal));  CHKERRQ(ierr);
792a7e14dcfSSatish Balay     /* compute Qd = Q*d */
793a7e14dcfSSatish Balay     if (it < it2){
794a7e14dcfSSatish Balay       for (i = 0; i < it; i++){
795a7e14dcfSSatish Balay         tempQ = Q[ipt[i]];
796a7e14dcfSSatish Balay         for (j = 0; j < dim; j++)
797a7e14dcfSSatish Balay           Qd[j] += (tempQ[j] * d[ipt[i]]);
798a7e14dcfSSatish Balay       }
799a7e14dcfSSatish Balay     }
800a7e14dcfSSatish Balay     else { /* compute Qd = Q*y-t */
801a7e14dcfSSatish Balay       for (i = 0; i < it2; i++){
802a7e14dcfSSatish Balay         tempQ = Q[ipt2[i]];
803a7e14dcfSSatish Balay         for (j = 0; j < dim; j++)
804a7e14dcfSSatish Balay           Qd[j] += (tempQ[j] * y[ipt2[i]]);
805a7e14dcfSSatish Balay       }
806a7e14dcfSSatish Balay       for (j = 0; j < dim; j++)
807a7e14dcfSSatish Balay         Qd[j] -= t[j];
808a7e14dcfSSatish Balay     }
809a7e14dcfSSatish Balay 
810a7e14dcfSSatish Balay 
811a7e14dcfSSatish Balay     /* ak = inner{d_{k}}{d_{k}} */
812a7e14dcfSSatish Balay     ak = 0.0;
813a7e14dcfSSatish Balay     for (i = 0; i < dim; i++)
814a7e14dcfSSatish Balay       ak += d[i] * d[i];
815a7e14dcfSSatish Balay 
816a7e14dcfSSatish Balay     bk = 0.0;
817a7e14dcfSSatish Balay     for (i = 0; i < dim; i++)
818a7e14dcfSSatish Balay       bk += d[i]*Qd[i];
819a7e14dcfSSatish Balay 
820a7e14dcfSSatish Balay     if (bk > EPS*ak && gd < 0.0)    /* ak is normd */
821a7e14dcfSSatish Balay       lamnew = -gd/bk;
822a7e14dcfSSatish Balay     else
823a7e14dcfSSatish Balay       lamnew = 1.0;
824a7e14dcfSSatish Balay 
825a7e14dcfSSatish Balay     /* fv is computing f(x_{k} + d_{k}) */
826a7e14dcfSSatish Balay     fv = 0.0;
827a7e14dcfSSatish Balay     for (i = 0; i < dim; i++){
828a7e14dcfSSatish Balay       xplus[i] = x[i] + d[i];
829a7e14dcfSSatish Balay       tplus[i] = t[i] + Qd[i];
830a7e14dcfSSatish Balay       fv      += xplus[i] * (0.5*tplus[i] + f[i]);
831a7e14dcfSSatish Balay     }
832a7e14dcfSSatish Balay 
833a7e14dcfSSatish Balay     /* fr is fref */
834a7e14dcfSSatish Balay     if ((innerIter == 1 && fv >= fv0) || (innerIter > 1 && fv >= fr)){
835a7e14dcfSSatish Balay       lscount++;
836a7e14dcfSSatish Balay       fv = 0.0;
837a7e14dcfSSatish Balay       for (i = 0; i < dim; i++){
838a7e14dcfSSatish Balay         xplus[i] = x[i] + lamnew*d[i];
839a7e14dcfSSatish Balay         tplus[i] = t[i] + lamnew*Qd[i];
840a7e14dcfSSatish Balay         fv      += xplus[i] * (0.5*tplus[i] + f[i]);
841a7e14dcfSSatish Balay       }
842a7e14dcfSSatish Balay     }
843a7e14dcfSSatish Balay 
844a7e14dcfSSatish Balay     for (i = 0; i < dim; i++){
845a7e14dcfSSatish Balay       sk[i] = xplus[i] - x[i];
846a7e14dcfSSatish Balay       yk[i] = tplus[i] - t[i];
847a7e14dcfSSatish Balay       x[i]  = xplus[i];
848a7e14dcfSSatish Balay       t[i]  = tplus[i];
849a7e14dcfSSatish Balay       g[i]  = t[i] + f[i];
850a7e14dcfSSatish Balay     }
851a7e14dcfSSatish Balay 
852a7e14dcfSSatish Balay 
853a7e14dcfSSatish Balay     /* update the line search control parameters */
854a7e14dcfSSatish Balay 
855a7e14dcfSSatish Balay     if (fv < fbest){
856a7e14dcfSSatish Balay       fbest = fv;
857a7e14dcfSSatish Balay       fc    = fv;
858a7e14dcfSSatish Balay       llast = 0;
859a7e14dcfSSatish Balay     }
860a7e14dcfSSatish Balay     else {
861a7e14dcfSSatish Balay       fc = (fc > fv ? fc : fv);
862a7e14dcfSSatish Balay       llast++;
863a7e14dcfSSatish Balay       if (llast == L){
864a7e14dcfSSatish Balay         fr    = fc;
865a7e14dcfSSatish Balay         fc    = fv;
866a7e14dcfSSatish Balay         llast = 0;
867a7e14dcfSSatish Balay       }
868a7e14dcfSSatish Balay     }
869a7e14dcfSSatish Balay 
870a7e14dcfSSatish Balay     ak = bk = 0.0;
871a7e14dcfSSatish Balay     for (i = 0; i < dim; i++){
872a7e14dcfSSatish Balay       ak += sk[i] * sk[i];
873a7e14dcfSSatish Balay       bk += sk[i] * yk[i];
874a7e14dcfSSatish Balay     }
875a7e14dcfSSatish Balay 
876a7e14dcfSSatish Balay     if (bk <= EPS*ak)
877a7e14dcfSSatish Balay       alpha = ALPHA_MAX;
878a7e14dcfSSatish Balay     else{
879a7e14dcfSSatish Balay       if (bkold < EPS*akold)
880a7e14dcfSSatish Balay         alpha = ak/bk;
881a7e14dcfSSatish Balay       else
882a7e14dcfSSatish Balay         alpha = (akold+ak)/(bkold+bk);
883a7e14dcfSSatish Balay 
884a7e14dcfSSatish Balay       if (alpha > ALPHA_MAX)
885a7e14dcfSSatish Balay         alpha = ALPHA_MAX;
886a7e14dcfSSatish Balay       else if (alpha < ALPHA_MIN)
887a7e14dcfSSatish Balay         alpha = ALPHA_MIN;
888a7e14dcfSSatish Balay     }
889a7e14dcfSSatish Balay 
890a7e14dcfSSatish Balay     akold = ak;
891a7e14dcfSSatish Balay     bkold = bk;
892a7e14dcfSSatish Balay 
893a7e14dcfSSatish Balay 
894a7e14dcfSSatish Balay     /*** stopping criterion based on KKT conditions ***/
895a7e14dcfSSatish Balay     /* at optimal, gradient of lagrangian w.r.t. x is zero */
896a7e14dcfSSatish Balay 
897a7e14dcfSSatish Balay     bk = 0.0;
898a7e14dcfSSatish Balay     for (i = 0; i < dim; i++)
899a7e14dcfSSatish Balay       bk +=  x[i] * x[i];
900a7e14dcfSSatish Balay 
901a7e14dcfSSatish Balay     if (sqrt(ak) < tol*10 * sqrt(bk)){
902a7e14dcfSSatish Balay       it     = 0;
903a7e14dcfSSatish Balay       luv    = 0;
904a7e14dcfSSatish Balay       kktlam = 0.0;
905a7e14dcfSSatish Balay       for (i = 0; i < dim; i++){
906a7e14dcfSSatish Balay         /* x[i] is active hence lagrange multipliers for box constraints
907a7e14dcfSSatish Balay                 are zero. The lagrange multiplier for ineq. const. is then
908a7e14dcfSSatish Balay                 defined as below
909a7e14dcfSSatish Balay         */
910a7e14dcfSSatish Balay         if ((x[i] > DELTAsv) && (x[i] < c-DELTAsv)){
911a7e14dcfSSatish Balay           ipt[it++] = i;
912a7e14dcfSSatish Balay           kktlam    = kktlam - a[i]*g[i];
913a7e14dcfSSatish Balay         }
914a7e14dcfSSatish Balay         else
915a7e14dcfSSatish Balay           uv[luv++] = i;
916a7e14dcfSSatish Balay       }
917a7e14dcfSSatish Balay 
918a7e14dcfSSatish Balay       if (it == 0 && sqrt(ak) < tol*0.5 * sqrt(bk))
919a7e14dcfSSatish Balay         return 0;
920a7e14dcfSSatish Balay       else {
921a7e14dcfSSatish Balay         kktlam = kktlam/it;
922a7e14dcfSSatish Balay         info   = 1;
923a7e14dcfSSatish Balay         for (i = 0; i < it; i++) {
924a7e14dcfSSatish Balay           if (fabs(a[ipt[i]] * g[ipt[i]] + kktlam) > tol) {
925a7e14dcfSSatish Balay             info = 0;
926a7e14dcfSSatish Balay             break;
927a7e14dcfSSatish Balay           }
928a7e14dcfSSatish Balay         }
929a7e14dcfSSatish Balay         if (info == 1)  {
930a7e14dcfSSatish Balay           for (i = 0; i < luv; i++)  {
931a7e14dcfSSatish Balay             if (x[uv[i]] <= DELTAsv){
932a7e14dcfSSatish Balay               /* x[i] == lower bound, hence, lagrange multiplier (say, beta) for lower bound may
933a7e14dcfSSatish Balay                      not be zero. So, the gradient without beta is > 0
934a7e14dcfSSatish Balay               */
935a7e14dcfSSatish Balay               if (g[uv[i]] + kktlam*a[uv[i]] < -tol){
936a7e14dcfSSatish Balay                 info = 0;
937a7e14dcfSSatish Balay                 break;
938a7e14dcfSSatish Balay               }
939a7e14dcfSSatish Balay             }
940a7e14dcfSSatish Balay             else {
941a7e14dcfSSatish Balay               /* x[i] == upper bound, hence, lagrange multiplier (say, eta) for upper bound may
942a7e14dcfSSatish Balay                      not be zero. So, the gradient without eta is < 0
943a7e14dcfSSatish Balay               */
944a7e14dcfSSatish Balay               if (g[uv[i]] + kktlam*a[uv[i]] > tol) {
945a7e14dcfSSatish Balay                 info = 0;
946a7e14dcfSSatish Balay                 break;
947a7e14dcfSSatish Balay               }
948a7e14dcfSSatish Balay             }
949a7e14dcfSSatish Balay           }
950a7e14dcfSSatish Balay         }
951a7e14dcfSSatish Balay 
952a7e14dcfSSatish Balay         if (info == 1)
953a7e14dcfSSatish Balay           return 0;
954a7e14dcfSSatish Balay       }
955a7e14dcfSSatish Balay     }
956a7e14dcfSSatish Balay   }
957a7e14dcfSSatish Balay   return 0;
958a7e14dcfSSatish Balay }
959a7e14dcfSSatish Balay 
960a7e14dcfSSatish Balay 
961