1aaa7dc30SBarry Smith #include <../src/tao/unconstrained/impls/bmrm/bmrm.h> 2a7e14dcfSSatish Balay 3a7e14dcfSSatish Balay static PetscErrorCode init_df_solver(TAO_DF*); 4a7e14dcfSSatish Balay static PetscErrorCode ensure_df_space(PetscInt, TAO_DF*); 5a7e14dcfSSatish Balay static PetscErrorCode destroy_df_solver(TAO_DF*); 60e660641SBarry Smith static PetscReal phi(PetscReal*,PetscInt,PetscReal,PetscReal*,PetscReal,PetscReal*,PetscReal*,PetscReal*); 70e660641SBarry Smith static PetscInt project(PetscInt,PetscReal*,PetscReal,PetscReal*,PetscReal*,PetscReal*,PetscReal*,PetscReal*,TAO_DF*); 8a7e14dcfSSatish Balay static PetscErrorCode solve(TAO_DF*); 9a7e14dcfSSatish Balay 10a7e14dcfSSatish Balay 11a7e14dcfSSatish Balay /*------------------------------------------------------------*/ 12a7e14dcfSSatish Balay /* The main solver function 13a7e14dcfSSatish Balay 14a7e14dcfSSatish Balay f = Remp(W) This is what the user provides us from the application layer 15a7e14dcfSSatish Balay So the ComputeGradient function for instance should get us back the subgradient of Remp(W) 16a7e14dcfSSatish Balay 17a7e14dcfSSatish Balay Regularizer assumed to be L2 norm = lambda*0.5*W'W () 18a7e14dcfSSatish Balay */ 19a7e14dcfSSatish Balay 20a7e14dcfSSatish Balay #undef __FUNCT__ 21a7e14dcfSSatish Balay #define __FUNCT__ "make_grad_node" 22a7e14dcfSSatish Balay static PetscErrorCode make_grad_node(Vec X, Vec_Chain **p) 23a7e14dcfSSatish Balay { 24a7e14dcfSSatish Balay PetscErrorCode ierr; 25a7e14dcfSSatish Balay 26a7e14dcfSSatish Balay PetscFunctionBegin; 270e660641SBarry Smith ierr = PetscNew(p);CHKERRQ(ierr); 28a7e14dcfSSatish Balay ierr = VecDuplicate(X, &(*p)->V);CHKERRQ(ierr); 29a7e14dcfSSatish Balay ierr = VecCopy(X, (*p)->V);CHKERRQ(ierr); 306c23d075SBarry Smith (*p)->next = NULL; 31a7e14dcfSSatish Balay PetscFunctionReturn(0); 32a7e14dcfSSatish Balay } 33a7e14dcfSSatish Balay 34a7e14dcfSSatish Balay #undef __FUNCT__ 35a7e14dcfSSatish Balay #define __FUNCT__ "destroy_grad_list" 36a7e14dcfSSatish Balay static PetscErrorCode destroy_grad_list(Vec_Chain *head) 37a7e14dcfSSatish Balay { 38a7e14dcfSSatish Balay PetscErrorCode ierr; 39a7e14dcfSSatish Balay Vec_Chain *p = head->next, *q; 40a7e14dcfSSatish Balay 41a7e14dcfSSatish Balay PetscFunctionBegin; 42a7e14dcfSSatish Balay while(p) { 43a7e14dcfSSatish Balay q = p->next; 44a7e14dcfSSatish Balay ierr = VecDestroy(&p->V);CHKERRQ(ierr); 45a7e14dcfSSatish Balay ierr = PetscFree(p);CHKERRQ(ierr); 46a7e14dcfSSatish Balay p = q; 47a7e14dcfSSatish Balay } 486c23d075SBarry Smith head->next = NULL; 49a7e14dcfSSatish Balay PetscFunctionReturn(0); 50a7e14dcfSSatish Balay } 51a7e14dcfSSatish Balay 52a7e14dcfSSatish Balay 53a7e14dcfSSatish Balay #undef __FUNCT__ 54a7e14dcfSSatish Balay #define __FUNCT__ "TaoSolve_BMRM" 55441846f8SBarry Smith static PetscErrorCode TaoSolve_BMRM(Tao tao) 56a7e14dcfSSatish Balay { 57a7e14dcfSSatish Balay PetscErrorCode ierr; 58e4cb33bbSBarry Smith TaoConvergedReason reason; 59a7e14dcfSSatish Balay TAO_DF df; 60a7e14dcfSSatish Balay TAO_BMRM *bmrm = (TAO_BMRM*)tao->data; 61a7e14dcfSSatish Balay 62a7e14dcfSSatish Balay /* Values and pointers to parts of the optimization problem */ 63a7e14dcfSSatish Balay PetscReal f = 0.0; 64a7e14dcfSSatish Balay Vec W = tao->solution; 65a7e14dcfSSatish Balay Vec G = tao->gradient; 66a7e14dcfSSatish Balay PetscReal lambda; 67a7e14dcfSSatish Balay PetscReal bt; 68a7e14dcfSSatish Balay Vec_Chain grad_list, *tail_glist, *pgrad; 69a7e14dcfSSatish Balay PetscInt iter = 0; 70a7e14dcfSSatish Balay PetscInt i; 71a7e14dcfSSatish Balay PetscMPIInt rank; 72a7e14dcfSSatish Balay 73e4cb33bbSBarry Smith /* Used in converged criteria check */ 74a7e14dcfSSatish Balay PetscReal reg; 75a7e14dcfSSatish Balay PetscReal jtwt, max_jtwt, pre_epsilon, epsilon, jw, min_jw; 76a7e14dcfSSatish Balay PetscReal innerSolverTol; 77ba4b436cSBarry Smith MPI_Comm comm; 78a7e14dcfSSatish Balay 79a7e14dcfSSatish Balay PetscFunctionBegin; 80ba4b436cSBarry Smith ierr = PetscObjectGetComm((PetscObject)tao,&comm);CHKERRQ(ierr); 81ba4b436cSBarry Smith ierr = MPI_Comm_rank(comm, &rank);CHKERRQ(ierr); 82a7e14dcfSSatish Balay lambda = bmrm->lambda; 83a7e14dcfSSatish Balay 84a7e14dcfSSatish Balay /* Check Stopping Condition */ 85a7e14dcfSSatish Balay tao->step = 1.0; 86a7e14dcfSSatish Balay max_jtwt = -BMRM_INFTY; 87a7e14dcfSSatish Balay min_jw = BMRM_INFTY; 88a7e14dcfSSatish Balay innerSolverTol = 1.0; 89a7e14dcfSSatish Balay epsilon = 0.0; 90a7e14dcfSSatish Balay 910e660641SBarry Smith if (!rank) { 92a7e14dcfSSatish Balay ierr = init_df_solver(&df);CHKERRQ(ierr); 93a7e14dcfSSatish Balay grad_list.next = NULL; 94a7e14dcfSSatish Balay tail_glist = &grad_list; 95a7e14dcfSSatish Balay } 96a7e14dcfSSatish Balay 97a7e14dcfSSatish Balay df.tol = 1e-6; 98a7e14dcfSSatish Balay reason = TAO_CONTINUE_ITERATING; 99a7e14dcfSSatish Balay 100a7e14dcfSSatish Balay /*-----------------Algorithm Begins------------------------*/ 101a7e14dcfSSatish Balay /* make the scatter */ 102a7e14dcfSSatish Balay ierr = VecScatterCreateToZero(W, &bmrm->scatter, &bmrm->local_w);CHKERRQ(ierr); 103a7e14dcfSSatish Balay ierr = VecAssemblyBegin(bmrm->local_w);CHKERRQ(ierr); 104a7e14dcfSSatish Balay ierr = VecAssemblyEnd(bmrm->local_w);CHKERRQ(ierr); 105a7e14dcfSSatish Balay 106a7e14dcfSSatish Balay /* NOTE: In application pass the sub-gradient of Remp(W) */ 107a7e14dcfSSatish Balay ierr = TaoComputeObjectiveAndGradient(tao, W, &f, G);CHKERRQ(ierr); 108a7e14dcfSSatish Balay ierr = TaoMonitor(tao,iter,f,1.0,0.0,tao->step,&reason);CHKERRQ(ierr); 109a7e14dcfSSatish Balay while (reason == TAO_CONTINUE_ITERATING) { 110a7e14dcfSSatish Balay /* compute bt = Remp(Wt-1) - <Wt-1, At> */ 111a7e14dcfSSatish Balay ierr = VecDot(W, G, &bt);CHKERRQ(ierr); 112a7e14dcfSSatish Balay bt = f - bt; 113a7e14dcfSSatish Balay 114a7e14dcfSSatish Balay /* First gather the gradient to the master node */ 115a7e14dcfSSatish Balay ierr = VecScatterBegin(bmrm->scatter, G, bmrm->local_w, INSERT_VALUES, SCATTER_FORWARD);CHKERRQ(ierr); 116a7e14dcfSSatish Balay ierr = VecScatterEnd(bmrm->scatter, G, bmrm->local_w, INSERT_VALUES, SCATTER_FORWARD);CHKERRQ(ierr); 117a7e14dcfSSatish Balay 118a7e14dcfSSatish Balay /* Bring up the inner solver */ 1190e660641SBarry Smith if (!rank) { 120a7e14dcfSSatish Balay ierr = ensure_df_space(iter+1, &df); CHKERRQ(ierr); 121a7e14dcfSSatish Balay ierr = make_grad_node(bmrm->local_w, &pgrad);CHKERRQ(ierr); 122a7e14dcfSSatish Balay tail_glist->next = pgrad; 123a7e14dcfSSatish Balay tail_glist = pgrad; 124a7e14dcfSSatish Balay 125a7e14dcfSSatish Balay df.a[iter] = 1.0; 126a7e14dcfSSatish Balay df.f[iter] = -bt; 127a7e14dcfSSatish Balay df.u[iter] = 1.0; 128a7e14dcfSSatish Balay df.l[iter] = 0.0; 129a7e14dcfSSatish Balay 130a7e14dcfSSatish Balay /* set up the Q */ 131a7e14dcfSSatish Balay pgrad = grad_list.next; 132a7e14dcfSSatish Balay for (i=0; i<=iter; i++) { 133a7e14dcfSSatish Balay ierr = VecDot(pgrad->V, bmrm->local_w, ®);CHKERRQ(ierr); 134a7e14dcfSSatish Balay df.Q[i][iter] = df.Q[iter][i] = reg / lambda; 135a7e14dcfSSatish Balay pgrad = pgrad->next; 136a7e14dcfSSatish Balay } 137a7e14dcfSSatish Balay 138a7e14dcfSSatish Balay if (iter > 0) { 139a7e14dcfSSatish Balay df.x[iter] = 0.0; 140a7e14dcfSSatish Balay ierr = solve(&df); CHKERRQ(ierr); 1410e660641SBarry Smith } else 142a7e14dcfSSatish Balay df.x[0] = 1.0; 143a7e14dcfSSatish Balay 144a7e14dcfSSatish Balay /* now computing Jt*(alpha_t) which should be = Jt(wt) to check convergence */ 145a7e14dcfSSatish Balay jtwt = 0.0; 146a7e14dcfSSatish Balay ierr = VecSet(bmrm->local_w, 0.0); CHKERRQ(ierr); 147a7e14dcfSSatish Balay pgrad = grad_list.next; 148a7e14dcfSSatish Balay for (i=0; i<=iter; i++) { 149a7e14dcfSSatish Balay jtwt -= df.x[i] * df.f[i]; 150a7e14dcfSSatish Balay ierr = VecAXPY(bmrm->local_w, -df.x[i] / lambda, pgrad->V); CHKERRQ(ierr); 151a7e14dcfSSatish Balay pgrad = pgrad->next; 152a7e14dcfSSatish Balay } 153a7e14dcfSSatish Balay 154a7e14dcfSSatish Balay ierr = VecNorm(bmrm->local_w, NORM_2, ®); CHKERRQ(ierr); 155a7e14dcfSSatish Balay reg = 0.5*lambda*reg*reg; 156a7e14dcfSSatish Balay jtwt -= reg; 157a7e14dcfSSatish Balay } /* end if rank == 0 */ 158a7e14dcfSSatish Balay 159a7e14dcfSSatish Balay /* scatter the new W to all nodes */ 160a7e14dcfSSatish Balay ierr = VecScatterBegin(bmrm->scatter,bmrm->local_w,W,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 161a7e14dcfSSatish Balay ierr = VecScatterEnd(bmrm->scatter,bmrm->local_w,W,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 162a7e14dcfSSatish Balay 163a7e14dcfSSatish Balay ierr = TaoComputeObjectiveAndGradient(tao, W, &f, G);CHKERRQ(ierr); 164a7e14dcfSSatish Balay 165ba4b436cSBarry Smith ierr = MPI_Bcast(&jtwt,1,MPIU_REAL,0,comm);CHKERRQ(ierr); 166ba4b436cSBarry Smith ierr = MPI_Bcast(®,1,MPIU_REAL,0,comm);CHKERRQ(ierr); 167a7e14dcfSSatish Balay 168a7e14dcfSSatish Balay jw = reg + f; /* J(w) = regularizer + Remp(w) */ 1690e660641SBarry Smith if (jw < min_jw) min_jw = jw; 1700e660641SBarry Smith if (jtwt > max_jtwt) max_jtwt = jtwt; 171a7e14dcfSSatish Balay 172a7e14dcfSSatish Balay pre_epsilon = epsilon; 173a7e14dcfSSatish Balay epsilon = min_jw - jtwt; 174a7e14dcfSSatish Balay 1750e660641SBarry Smith if (!rank) { 1760e660641SBarry Smith if (innerSolverTol > epsilon) innerSolverTol = epsilon; 1770e660641SBarry Smith else if (innerSolverTol < 1e-7) innerSolverTol = 1e-7; 178a7e14dcfSSatish Balay 179a7e14dcfSSatish Balay /* if the annealing doesn't work well, lower the inner solver tolerance */ 1800e660641SBarry Smith if(pre_epsilon < epsilon) innerSolverTol *= 0.2; 181a7e14dcfSSatish Balay 182a7e14dcfSSatish Balay df.tol = innerSolverTol*0.5; 183a7e14dcfSSatish Balay } 184a7e14dcfSSatish Balay 185a7e14dcfSSatish Balay iter++; 186a7e14dcfSSatish Balay ierr = TaoMonitor(tao,iter,min_jw,epsilon,0.0,tao->step,&reason);CHKERRQ(ierr); 187a7e14dcfSSatish Balay } 188a7e14dcfSSatish Balay 189a7e14dcfSSatish Balay /* free all the memory */ 1900e660641SBarry Smith if (!rank) { 191a7e14dcfSSatish Balay ierr = destroy_grad_list(&grad_list);CHKERRQ(ierr); 192a7e14dcfSSatish Balay ierr = destroy_df_solver(&df);CHKERRQ(ierr); 193a7e14dcfSSatish Balay } 194a7e14dcfSSatish Balay 195a7e14dcfSSatish Balay ierr = VecDestroy(&bmrm->local_w);CHKERRQ(ierr); 196a7e14dcfSSatish Balay ierr = VecScatterDestroy(&bmrm->scatter);CHKERRQ(ierr); 197a7e14dcfSSatish Balay PetscFunctionReturn(0); 198a7e14dcfSSatish Balay } 199a7e14dcfSSatish Balay 200a7e14dcfSSatish Balay 201a7e14dcfSSatish Balay /* ---------------------------------------------------------- */ 202a7e14dcfSSatish Balay 203a7e14dcfSSatish Balay #undef __FUNCT__ 204a7e14dcfSSatish Balay #define __FUNCT__ "TaoSetup_BMRM" 205441846f8SBarry Smith static PetscErrorCode TaoSetup_BMRM(Tao tao) 2060e660641SBarry Smith { 207a7e14dcfSSatish Balay 208a7e14dcfSSatish Balay PetscErrorCode ierr; 209a7e14dcfSSatish Balay 210a7e14dcfSSatish Balay PetscFunctionBegin; 211a7e14dcfSSatish Balay /* Allocate some arrays */ 212a7e14dcfSSatish Balay if (!tao->gradient) { 213a7e14dcfSSatish Balay ierr = VecDuplicate(tao->solution, &tao->gradient); CHKERRQ(ierr); 214a7e14dcfSSatish Balay } 215a7e14dcfSSatish Balay PetscFunctionReturn(0); 216a7e14dcfSSatish Balay } 217a7e14dcfSSatish Balay 218a7e14dcfSSatish Balay /*------------------------------------------------------------*/ 219a7e14dcfSSatish Balay #undef __FUNCT__ 220a7e14dcfSSatish Balay #define __FUNCT__ "TaoDestroy_BMRM" 221441846f8SBarry Smith static PetscErrorCode TaoDestroy_BMRM(Tao tao) 222a7e14dcfSSatish Balay { 223a7e14dcfSSatish Balay PetscErrorCode ierr; 224a7e14dcfSSatish Balay 225a7e14dcfSSatish Balay PetscFunctionBegin; 226a7e14dcfSSatish Balay ierr = PetscFree(tao->data);CHKERRQ(ierr); 227a7e14dcfSSatish Balay PetscFunctionReturn(0); 228a7e14dcfSSatish Balay } 229a7e14dcfSSatish Balay 230a7e14dcfSSatish Balay #undef __FUNCT__ 231a7e14dcfSSatish Balay #define __FUNCT__ "TaoSetFromOptions_BMRM" 232441846f8SBarry Smith static PetscErrorCode TaoSetFromOptions_BMRM(Tao tao) 233a7e14dcfSSatish Balay { 234a7e14dcfSSatish Balay PetscErrorCode ierr; 235a7e14dcfSSatish Balay TAO_BMRM* bmrm = (TAO_BMRM*)tao->data; 236a7e14dcfSSatish Balay 237a7e14dcfSSatish Balay PetscFunctionBegin; 238a7e14dcfSSatish Balay ierr = PetscOptionsHead("BMRM for regularized risk minimization");CHKERRQ(ierr); 239*94ae4db5SBarry Smith ierr = PetscOptionsReal("-tao_bmrm_lambda", "regulariser weight","", 100,&bmrm->lambda,NULL); CHKERRQ(ierr); 240a7e14dcfSSatish Balay ierr = PetscOptionsTail();CHKERRQ(ierr); 241a7e14dcfSSatish Balay PetscFunctionReturn(0); 242a7e14dcfSSatish Balay } 243a7e14dcfSSatish Balay 244a7e14dcfSSatish Balay /*------------------------------------------------------------*/ 245a7e14dcfSSatish Balay #undef __FUNCT__ 246a7e14dcfSSatish Balay #define __FUNCT__ "TaoView_BMRM" 247441846f8SBarry Smith static PetscErrorCode TaoView_BMRM(Tao tao, PetscViewer viewer) 248a7e14dcfSSatish Balay { 249a7e14dcfSSatish Balay PetscBool isascii; 250a7e14dcfSSatish Balay PetscErrorCode ierr; 251a7e14dcfSSatish Balay 252a7e14dcfSSatish Balay PetscFunctionBegin; 253a7e14dcfSSatish Balay ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&isascii);CHKERRQ(ierr); 254a7e14dcfSSatish Balay if (isascii) { 255a7e14dcfSSatish Balay ierr = PetscViewerASCIIPushTab(viewer);CHKERRQ(ierr); 256a7e14dcfSSatish Balay ierr = PetscViewerASCIIPopTab(viewer);CHKERRQ(ierr); 257a7e14dcfSSatish Balay } 258a7e14dcfSSatish Balay PetscFunctionReturn(0); 259a7e14dcfSSatish Balay } 260a7e14dcfSSatish Balay 261a7e14dcfSSatish Balay /*------------------------------------------------------------*/ 2621522df2eSJason Sarich /*MC 2631522df2eSJason Sarich TAOBMRM - bundle method for regularized risk minimization 2641522df2eSJason Sarich 2651522df2eSJason Sarich Options Database Keys: 2661522df2eSJason Sarich . - tao_bmrm_lambda - regulariser weight 2671522df2eSJason Sarich 2681eb8069cSJason Sarich Level: beginner 2691522df2eSJason Sarich M*/ 2701522df2eSJason Sarich 271a7e14dcfSSatish Balay EXTERN_C_BEGIN 272a7e14dcfSSatish Balay #undef __FUNCT__ 273a7e14dcfSSatish Balay #define __FUNCT__ "TaoCreate_BMRM" 274441846f8SBarry Smith PetscErrorCode TaoCreate_BMRM(Tao tao) 275a7e14dcfSSatish Balay { 276a7e14dcfSSatish Balay TAO_BMRM *bmrm; 277a7e14dcfSSatish Balay PetscErrorCode ierr; 278a7e14dcfSSatish Balay 279a7e14dcfSSatish Balay PetscFunctionBegin; 280a7e14dcfSSatish Balay tao->ops->setup = TaoSetup_BMRM; 281a7e14dcfSSatish Balay tao->ops->solve = TaoSolve_BMRM; 282a7e14dcfSSatish Balay tao->ops->view = TaoView_BMRM; 283a7e14dcfSSatish Balay tao->ops->setfromoptions = TaoSetFromOptions_BMRM; 284a7e14dcfSSatish Balay tao->ops->destroy = TaoDestroy_BMRM; 285a7e14dcfSSatish Balay 2863c9e27cfSGeoffrey Irving ierr = PetscNewLog(tao,&bmrm);CHKERRQ(ierr); 287a7e14dcfSSatish Balay bmrm->lambda = 1.0; 288a7e14dcfSSatish Balay tao->data = (void*)bmrm; 289a7e14dcfSSatish Balay 290a7e14dcfSSatish Balay /* Note: May need to be tuned! */ 291a7e14dcfSSatish Balay tao->max_it = 2048; 292a7e14dcfSSatish Balay tao->max_funcs = 300000; 293a7e14dcfSSatish Balay tao->fatol = 1e-20; 294a7e14dcfSSatish Balay tao->frtol = 1e-25; 295a7e14dcfSSatish Balay tao->gatol = 1e-25; 296a7e14dcfSSatish Balay tao->grtol = 1e-25; 297a7e14dcfSSatish Balay 298a7e14dcfSSatish Balay PetscFunctionReturn(0); 299a7e14dcfSSatish Balay } 300a7e14dcfSSatish Balay EXTERN_C_END 301a7e14dcfSSatish Balay 302a7e14dcfSSatish Balay #undef __FUNCT__ 303a7e14dcfSSatish Balay #define __FUNCT__ "init_df_solver" 304a7e14dcfSSatish Balay PetscErrorCode init_df_solver(TAO_DF *df) 305a7e14dcfSSatish Balay { 306a7e14dcfSSatish Balay PetscInt i, n = INCRE_DIM; 307a7e14dcfSSatish Balay PetscErrorCode ierr; 308a7e14dcfSSatish Balay 309a7e14dcfSSatish Balay PetscFunctionBegin; 310a7e14dcfSSatish Balay /* default values */ 311a7e14dcfSSatish Balay df->maxProjIter = 200; 312a7e14dcfSSatish Balay df->maxPGMIter = 300000; 313a7e14dcfSSatish Balay df->b = 1.0; 314a7e14dcfSSatish Balay 315a7e14dcfSSatish Balay /* memory space required by Dai-Fletcher */ 316a7e14dcfSSatish Balay df->cur_num_cp = n; 3170e660641SBarry Smith ierr = PetscMalloc1(n, &df->f); CHKERRQ(ierr); 3180e660641SBarry Smith ierr = PetscMalloc1(n, &df->a); CHKERRQ(ierr); 3190e660641SBarry Smith ierr = PetscMalloc1(n, &df->l); CHKERRQ(ierr); 3200e660641SBarry Smith ierr = PetscMalloc1(n, &df->u); CHKERRQ(ierr); 3210e660641SBarry Smith ierr = PetscMalloc1(n, &df->x); CHKERRQ(ierr); 322e1cc520bSBarry Smith ierr = PetscMalloc1(n, &df->Q); CHKERRQ(ierr); 323a7e14dcfSSatish Balay 324a7e14dcfSSatish Balay for (i = 0; i < n; i ++) { 3250e660641SBarry Smith ierr = PetscMalloc1(n, &df->Q[i]); CHKERRQ(ierr); 326a7e14dcfSSatish Balay } 327a7e14dcfSSatish Balay 3280e660641SBarry Smith ierr = PetscMalloc1(n, &df->g); CHKERRQ(ierr); 3290e660641SBarry Smith ierr = PetscMalloc1(n, &df->y); CHKERRQ(ierr); 3300e660641SBarry Smith ierr = PetscMalloc1(n, &df->tempv); CHKERRQ(ierr); 3310e660641SBarry Smith ierr = PetscMalloc1(n, &df->d); CHKERRQ(ierr); 3320e660641SBarry Smith ierr = PetscMalloc1(n, &df->Qd); CHKERRQ(ierr); 3330e660641SBarry Smith ierr = PetscMalloc1(n, &df->t); CHKERRQ(ierr); 3340e660641SBarry Smith ierr = PetscMalloc1(n, &df->xplus); CHKERRQ(ierr); 3350e660641SBarry Smith ierr = PetscMalloc1(n, &df->tplus); CHKERRQ(ierr); 3360e660641SBarry Smith ierr = PetscMalloc1(n, &df->sk); CHKERRQ(ierr); 3370e660641SBarry Smith ierr = PetscMalloc1(n, &df->yk); CHKERRQ(ierr); 338a7e14dcfSSatish Balay 339e1cc520bSBarry Smith ierr = PetscMalloc1(n, &df->ipt); CHKERRQ(ierr); 340e1cc520bSBarry Smith ierr = PetscMalloc1(n, &df->ipt2); CHKERRQ(ierr); 341e1cc520bSBarry Smith ierr = PetscMalloc1(n, &df->uv); CHKERRQ(ierr); 342a7e14dcfSSatish Balay PetscFunctionReturn(0); 343a7e14dcfSSatish Balay } 344a7e14dcfSSatish Balay 345a7e14dcfSSatish Balay #undef __FUNCT__ 346a7e14dcfSSatish Balay #define __FUNCT__ "ensure_df_space" 347a7e14dcfSSatish Balay PetscErrorCode ensure_df_space(PetscInt dim, TAO_DF *df) 348a7e14dcfSSatish Balay { 349a7e14dcfSSatish Balay PetscErrorCode ierr; 350a7e14dcfSSatish Balay PetscReal *tmp, **tmp_Q; 351a7e14dcfSSatish Balay PetscInt i, n, old_n; 352a7e14dcfSSatish Balay 353a7e14dcfSSatish Balay PetscFunctionBegin; 35453506e15SBarry Smith df->dim = dim; 35553506e15SBarry Smith if (dim <= df->cur_num_cp) PetscFunctionReturn(0); 356a7e14dcfSSatish Balay 357a7e14dcfSSatish Balay old_n = df->cur_num_cp; 358a7e14dcfSSatish Balay df->cur_num_cp += INCRE_DIM; 359a7e14dcfSSatish Balay n = df->cur_num_cp; 360a7e14dcfSSatish Balay 361a7e14dcfSSatish Balay /* memory space required by dai-fletcher */ 3620e660641SBarry Smith ierr = PetscMalloc1(n, &tmp); CHKERRQ(ierr); 363a7e14dcfSSatish Balay ierr = PetscMemcpy(tmp, df->f, sizeof(PetscReal)*old_n); CHKERRQ(ierr); 364a7e14dcfSSatish Balay ierr = PetscFree(df->f); CHKERRQ(ierr); 365a7e14dcfSSatish Balay df->f = tmp; 366a7e14dcfSSatish Balay 3670e660641SBarry Smith ierr = PetscMalloc1(n, &tmp); CHKERRQ(ierr); 368a7e14dcfSSatish Balay ierr = PetscMemcpy(tmp, df->a, sizeof(PetscReal)*old_n); CHKERRQ(ierr); 369a7e14dcfSSatish Balay ierr = PetscFree(df->a); CHKERRQ(ierr); 370a7e14dcfSSatish Balay df->a = tmp; 371a7e14dcfSSatish Balay 3720e660641SBarry Smith ierr = PetscMalloc1(n, &tmp); CHKERRQ(ierr); 373a7e14dcfSSatish Balay ierr = PetscMemcpy(tmp, df->l, sizeof(PetscReal)*old_n); CHKERRQ(ierr); 374a7e14dcfSSatish Balay ierr = PetscFree(df->l); CHKERRQ(ierr); 375a7e14dcfSSatish Balay df->l = tmp; 376a7e14dcfSSatish Balay 3770e660641SBarry Smith ierr = PetscMalloc1(n, &tmp); CHKERRQ(ierr); 378a7e14dcfSSatish Balay ierr = PetscMemcpy(tmp, df->u, sizeof(PetscReal)*old_n); CHKERRQ(ierr); 379a7e14dcfSSatish Balay ierr = PetscFree(df->u); CHKERRQ(ierr); 380a7e14dcfSSatish Balay df->u = tmp; 381a7e14dcfSSatish Balay 3820e660641SBarry Smith ierr = PetscMalloc1(n, &tmp); CHKERRQ(ierr); 383a7e14dcfSSatish Balay ierr = PetscMemcpy(tmp, df->x, sizeof(PetscReal)*old_n); CHKERRQ(ierr); 384a7e14dcfSSatish Balay ierr = PetscFree(df->x); CHKERRQ(ierr); 385a7e14dcfSSatish Balay df->x = tmp; 386a7e14dcfSSatish Balay 387e1cc520bSBarry Smith ierr = PetscMalloc1(n, &tmp_Q); CHKERRQ(ierr); 38853506e15SBarry Smith for (i = 0; i < n; i ++) { 3890e660641SBarry Smith ierr = PetscMalloc1(n, &tmp_Q[i]); CHKERRQ(ierr); 39053506e15SBarry Smith if (i < old_n) { 391a7e14dcfSSatish Balay ierr = PetscMemcpy(tmp_Q[i], df->Q[i], sizeof(PetscReal)*old_n); CHKERRQ(ierr); 392a7e14dcfSSatish Balay ierr = PetscFree(df->Q[i]); CHKERRQ(ierr); 393a7e14dcfSSatish Balay } 394a7e14dcfSSatish Balay } 395a7e14dcfSSatish Balay 396a7e14dcfSSatish Balay ierr = PetscFree(df->Q); CHKERRQ(ierr); 397a7e14dcfSSatish Balay df->Q = tmp_Q; 398a7e14dcfSSatish Balay 399a7e14dcfSSatish Balay ierr = PetscFree(df->g); CHKERRQ(ierr); 4000e660641SBarry Smith ierr = PetscMalloc1(n, &df->g); CHKERRQ(ierr); 401a7e14dcfSSatish Balay 402a7e14dcfSSatish Balay ierr = PetscFree(df->y); CHKERRQ(ierr); 4030e660641SBarry Smith ierr = PetscMalloc1(n, &df->y); CHKERRQ(ierr); 404a7e14dcfSSatish Balay 405a7e14dcfSSatish Balay ierr = PetscFree(df->tempv); CHKERRQ(ierr); 4060e660641SBarry Smith ierr = PetscMalloc1(n, &df->tempv); CHKERRQ(ierr); 407a7e14dcfSSatish Balay 408a7e14dcfSSatish Balay ierr = PetscFree(df->d); CHKERRQ(ierr); 4090e660641SBarry Smith ierr = PetscMalloc1(n, &df->d); CHKERRQ(ierr); 410a7e14dcfSSatish Balay 411a7e14dcfSSatish Balay ierr = PetscFree(df->Qd); CHKERRQ(ierr); 4120e660641SBarry Smith ierr = PetscMalloc1(n, &df->Qd); CHKERRQ(ierr); 413a7e14dcfSSatish Balay 414a7e14dcfSSatish Balay ierr = PetscFree(df->t); CHKERRQ(ierr); 4150e660641SBarry Smith ierr = PetscMalloc1(n, &df->t); CHKERRQ(ierr); 416a7e14dcfSSatish Balay 417a7e14dcfSSatish Balay ierr = PetscFree(df->xplus); CHKERRQ(ierr); 4180e660641SBarry Smith ierr = PetscMalloc1(n, &df->xplus); CHKERRQ(ierr); 419a7e14dcfSSatish Balay 420a7e14dcfSSatish Balay ierr = PetscFree(df->tplus); CHKERRQ(ierr); 4210e660641SBarry Smith ierr = PetscMalloc1(n, &df->tplus); CHKERRQ(ierr); 422a7e14dcfSSatish Balay 423a7e14dcfSSatish Balay ierr = PetscFree(df->sk); CHKERRQ(ierr); 4240e660641SBarry Smith ierr = PetscMalloc1(n, &df->sk); CHKERRQ(ierr); 425a7e14dcfSSatish Balay 426a7e14dcfSSatish Balay ierr = PetscFree(df->yk); CHKERRQ(ierr); 4270e660641SBarry Smith ierr = PetscMalloc1(n, &df->yk); CHKERRQ(ierr); 428a7e14dcfSSatish Balay 429a7e14dcfSSatish Balay ierr = PetscFree(df->ipt); CHKERRQ(ierr); 430e1cc520bSBarry Smith ierr = PetscMalloc1(n, &df->ipt); CHKERRQ(ierr); 431a7e14dcfSSatish Balay 432a7e14dcfSSatish Balay ierr = PetscFree(df->ipt2); CHKERRQ(ierr); 4330e660641SBarry Smith ierr = PetscMalloc1(n, &df->ipt2); CHKERRQ(ierr); 434a7e14dcfSSatish Balay 435a7e14dcfSSatish Balay ierr = PetscFree(df->uv); CHKERRQ(ierr); 4360e660641SBarry Smith ierr = PetscMalloc1(n, &df->uv); CHKERRQ(ierr); 437a7e14dcfSSatish Balay PetscFunctionReturn(0); 438a7e14dcfSSatish Balay } 439a7e14dcfSSatish Balay 440a7e14dcfSSatish Balay #undef __FUNCT__ 441a7e14dcfSSatish Balay #define __FUNCT__ "destroy_df_solver" 442a7e14dcfSSatish Balay PetscErrorCode destroy_df_solver(TAO_DF *df) 443a7e14dcfSSatish Balay { 444a7e14dcfSSatish Balay PetscErrorCode ierr; 445a7e14dcfSSatish Balay PetscInt i; 4466c23d075SBarry Smith 447a7e14dcfSSatish Balay PetscFunctionBegin; 4486c23d075SBarry Smith ierr = PetscFree(df->f); CHKERRQ(ierr); 4496c23d075SBarry Smith ierr = PetscFree(df->a); CHKERRQ(ierr); 4506c23d075SBarry Smith ierr = PetscFree(df->l); CHKERRQ(ierr); 4516c23d075SBarry Smith ierr = PetscFree(df->u); CHKERRQ(ierr); 4526c23d075SBarry Smith ierr = PetscFree(df->x); CHKERRQ(ierr); 453a7e14dcfSSatish Balay 4546c23d075SBarry Smith for (i = 0; i < df->cur_num_cp; i ++) { 455a7e14dcfSSatish Balay ierr = PetscFree(df->Q[i]); CHKERRQ(ierr); 456a7e14dcfSSatish Balay } 457a7e14dcfSSatish Balay ierr = PetscFree(df->Q); CHKERRQ(ierr); 4586c23d075SBarry Smith ierr = PetscFree(df->ipt); CHKERRQ(ierr); 4596c23d075SBarry Smith ierr = PetscFree(df->ipt2); CHKERRQ(ierr); 4606c23d075SBarry Smith ierr = PetscFree(df->uv); CHKERRQ(ierr); 4616c23d075SBarry Smith ierr = PetscFree(df->g); CHKERRQ(ierr); 4626c23d075SBarry Smith ierr = PetscFree(df->y); CHKERRQ(ierr); 4636c23d075SBarry Smith ierr = PetscFree(df->tempv); CHKERRQ(ierr); 4646c23d075SBarry Smith ierr = PetscFree(df->d); CHKERRQ(ierr); 4656c23d075SBarry Smith ierr = PetscFree(df->Qd); CHKERRQ(ierr); 4666c23d075SBarry Smith ierr = PetscFree(df->t); CHKERRQ(ierr); 4676c23d075SBarry Smith ierr = PetscFree(df->xplus); CHKERRQ(ierr); 4686c23d075SBarry Smith ierr = PetscFree(df->tplus); CHKERRQ(ierr); 4696c23d075SBarry Smith ierr = PetscFree(df->sk); CHKERRQ(ierr); 4706c23d075SBarry Smith ierr = PetscFree(df->yk); CHKERRQ(ierr); 471a7e14dcfSSatish Balay PetscFunctionReturn(0); 472a7e14dcfSSatish Balay } 473a7e14dcfSSatish Balay 474a7e14dcfSSatish Balay /* Piecewise linear monotone target function for the Dai-Fletcher projector */ 475a7e14dcfSSatish Balay #undef __FUNCT__ 476a7e14dcfSSatish Balay #define __FUNCT__ "phi" 4776c23d075SBarry Smith PetscReal phi(PetscReal *x,PetscInt n,PetscReal lambda,PetscReal *a,PetscReal b,PetscReal *c,PetscReal *l,PetscReal *u) 478a7e14dcfSSatish Balay { 479a7e14dcfSSatish Balay PetscReal r = 0.0; 480a7e14dcfSSatish Balay PetscInt i; 481a7e14dcfSSatish Balay 482a7e14dcfSSatish Balay for (i = 0; i < n; i++){ 483a7e14dcfSSatish Balay x[i] = -c[i] + lambda*a[i]; 4846c23d075SBarry Smith if (x[i] > u[i]) x[i] = u[i]; 4856c23d075SBarry Smith else if(x[i] < l[i]) x[i] = l[i]; 486a7e14dcfSSatish Balay r += a[i]*x[i]; 487a7e14dcfSSatish Balay } 488a7e14dcfSSatish Balay return r - b; 489a7e14dcfSSatish Balay } 490a7e14dcfSSatish Balay 491a7e14dcfSSatish Balay /** Modified Dai-Fletcher QP projector solves the problem: 492a7e14dcfSSatish Balay * 493a7e14dcfSSatish Balay * minimise 0.5*x'*x - c'*x 494a7e14dcfSSatish Balay * subj to a'*x = b 495a7e14dcfSSatish Balay * l \leq x \leq u 496a7e14dcfSSatish Balay * 497a7e14dcfSSatish Balay * \param c The point to be projected onto feasible set 498a7e14dcfSSatish Balay */ 499a7e14dcfSSatish Balay #undef __FUNCT__ 500a7e14dcfSSatish Balay #define __FUNCT__ "project" 5016c23d075SBarry Smith PetscInt project(PetscInt n,PetscReal *a,PetscReal b,PetscReal *c,PetscReal *l,PetscReal *u,PetscReal *x,PetscReal *lam_ext,TAO_DF *df) 502a7e14dcfSSatish Balay { 503a7e14dcfSSatish Balay PetscReal lambda, lambdal, lambdau, dlambda, lambda_new; 504a7e14dcfSSatish Balay PetscReal r, rl, ru, s; 505a7e14dcfSSatish Balay PetscInt innerIter; 506a7e14dcfSSatish Balay PetscBool nonNegativeSlack = PETSC_FALSE; 50753506e15SBarry Smith PetscErrorCode ierr; 508a7e14dcfSSatish Balay 509a7e14dcfSSatish Balay *lam_ext = 0; 510a7e14dcfSSatish Balay lambda = 0; 511a7e14dcfSSatish Balay dlambda = 0.5; 512a7e14dcfSSatish Balay innerIter = 1; 513a7e14dcfSSatish Balay 514a7e14dcfSSatish Balay /* \phi(x;lambda) := 0.5*x'*x + c'*x - lambda*(a'*x-b) 515a7e14dcfSSatish Balay * 516a7e14dcfSSatish Balay * Optimality conditions for \phi: 517a7e14dcfSSatish Balay * 518a7e14dcfSSatish Balay * 1. lambda <= 0 519a7e14dcfSSatish Balay * 2. r <= 0 520a7e14dcfSSatish Balay * 3. r*lambda == 0 521a7e14dcfSSatish Balay */ 522a7e14dcfSSatish Balay 523a7e14dcfSSatish Balay /* Bracketing Phase */ 524a7e14dcfSSatish Balay r = phi(x, n, lambda, a, b, c, l, u); 525a7e14dcfSSatish Balay 5266c23d075SBarry Smith if(nonNegativeSlack) { 527a7e14dcfSSatish Balay /* inequality constraint, i.e., with \xi >= 0 constraint */ 52853506e15SBarry Smith if (r < TOL_R) return 0; 5296c23d075SBarry Smith } else { 530a7e14dcfSSatish Balay /* equality constraint ,i.e., without \xi >= 0 constraint */ 53153506e15SBarry Smith if (fabs(r) < TOL_R) return 0; 532a7e14dcfSSatish Balay } 533a7e14dcfSSatish Balay 534a7e14dcfSSatish Balay if (r < 0.0){ 535a7e14dcfSSatish Balay lambdal = lambda; 536a7e14dcfSSatish Balay rl = r; 537a7e14dcfSSatish Balay lambda = lambda + dlambda; 538a7e14dcfSSatish Balay r = phi(x, n, lambda, a, b, c, l, u); 539a7e14dcfSSatish Balay while (r < 0.0 && dlambda < BMRM_INFTY) { 540a7e14dcfSSatish Balay lambdal = lambda; 541a7e14dcfSSatish Balay s = rl/r - 1.0; 542a7e14dcfSSatish Balay if (s < 0.1) s = 0.1; 543a7e14dcfSSatish Balay dlambda = dlambda + dlambda/s; 544a7e14dcfSSatish Balay lambda = lambda + dlambda; 545a7e14dcfSSatish Balay rl = r; 546a7e14dcfSSatish Balay r = phi(x, n, lambda, a, b, c, l, u); 547a7e14dcfSSatish Balay } 548a7e14dcfSSatish Balay lambdau = lambda; 549a7e14dcfSSatish Balay ru = r; 5506c23d075SBarry Smith } else { 551a7e14dcfSSatish Balay lambdau = lambda; 552a7e14dcfSSatish Balay ru = r; 553a7e14dcfSSatish Balay lambda = lambda - dlambda; 554a7e14dcfSSatish Balay r = phi(x, n, lambda, a, b, c, l, u); 555a7e14dcfSSatish Balay while (r > 0.0 && dlambda > -BMRM_INFTY) { 556a7e14dcfSSatish Balay lambdau = lambda; 557a7e14dcfSSatish Balay s = ru/r - 1.0; 558a7e14dcfSSatish Balay if (s < 0.1) s = 0.1; 559a7e14dcfSSatish Balay dlambda = dlambda + dlambda/s; 560a7e14dcfSSatish Balay lambda = lambda - dlambda; 561a7e14dcfSSatish Balay ru = r; 562a7e14dcfSSatish Balay r = phi(x, n, lambda, a, b, c, l, u); 563a7e14dcfSSatish Balay } 564a7e14dcfSSatish Balay lambdal = lambda; 565a7e14dcfSSatish Balay rl = r; 566a7e14dcfSSatish Balay } 567a7e14dcfSSatish Balay 5686c23d075SBarry Smith if(fabs(dlambda) > BMRM_INFTY) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"L2N2_DaiFletcherPGM detected Infeasible QP problem!"); 569a7e14dcfSSatish Balay 570a7e14dcfSSatish Balay if(ru == 0){ 571a7e14dcfSSatish Balay lambda = lambdau; 572a7e14dcfSSatish Balay r = phi(x, n, lambda, a, b, c, l, u); 573a7e14dcfSSatish Balay return innerIter; 574a7e14dcfSSatish Balay } 575a7e14dcfSSatish Balay 576a7e14dcfSSatish Balay /* Secant Phase */ 577a7e14dcfSSatish Balay s = 1.0 - rl/ru; 578a7e14dcfSSatish Balay dlambda = dlambda/s; 579a7e14dcfSSatish Balay lambda = lambdau - dlambda; 580a7e14dcfSSatish Balay r = phi(x, n, lambda, a, b, c, l, u); 581a7e14dcfSSatish Balay 582a7e14dcfSSatish Balay while (fabs(r) > TOL_R 583a7e14dcfSSatish Balay && dlambda > TOL_LAM * (1.0 + fabs(lambda)) 584a7e14dcfSSatish Balay && innerIter < df->maxProjIter){ 585a7e14dcfSSatish Balay innerIter++; 586a7e14dcfSSatish Balay if (r > 0.0){ 587a7e14dcfSSatish Balay if (s <= 2.0){ 588a7e14dcfSSatish Balay lambdau = lambda; 589a7e14dcfSSatish Balay ru = r; 590a7e14dcfSSatish Balay s = 1.0 - rl/ru; 591a7e14dcfSSatish Balay dlambda = (lambdau - lambdal) / s; 592a7e14dcfSSatish Balay lambda = lambdau - dlambda; 59353506e15SBarry Smith } else { 594a7e14dcfSSatish Balay s = ru/r-1.0; 595a7e14dcfSSatish Balay if (s < 0.1) s = 0.1; 596a7e14dcfSSatish Balay dlambda = (lambdau - lambda) / s; 597a7e14dcfSSatish Balay lambda_new = 0.75*lambdal + 0.25*lambda; 598a7e14dcfSSatish Balay if (lambda_new < (lambda - dlambda)) 599a7e14dcfSSatish Balay lambda_new = lambda - dlambda; 600a7e14dcfSSatish Balay lambdau = lambda; 601a7e14dcfSSatish Balay ru = r; 602a7e14dcfSSatish Balay lambda = lambda_new; 603a7e14dcfSSatish Balay s = (lambdau - lambdal) / (lambdau - lambda); 604a7e14dcfSSatish Balay } 60553506e15SBarry Smith } else { 606a7e14dcfSSatish Balay if (s >= 2.0){ 607a7e14dcfSSatish Balay lambdal = lambda; 608a7e14dcfSSatish Balay rl = r; 609a7e14dcfSSatish Balay s = 1.0 - rl/ru; 610a7e14dcfSSatish Balay dlambda = (lambdau - lambdal) / s; 611a7e14dcfSSatish Balay lambda = lambdau - dlambda; 61253506e15SBarry Smith } else { 613a7e14dcfSSatish Balay s = rl/r - 1.0; 614a7e14dcfSSatish Balay if (s < 0.1) s = 0.1; 615a7e14dcfSSatish Balay dlambda = (lambda-lambdal) / s; 616a7e14dcfSSatish Balay lambda_new = 0.75*lambdau + 0.25*lambda; 617a7e14dcfSSatish Balay if (lambda_new > (lambda + dlambda)) 618a7e14dcfSSatish Balay lambda_new = lambda + dlambda; 619a7e14dcfSSatish Balay lambdal = lambda; 620a7e14dcfSSatish Balay rl = r; 621a7e14dcfSSatish Balay lambda = lambda_new; 622a7e14dcfSSatish Balay s = (lambdau - lambdal) / (lambdau-lambda); 623a7e14dcfSSatish Balay } 624a7e14dcfSSatish Balay } 625a7e14dcfSSatish Balay r = phi(x, n, lambda, a, b, c, l, u); 626a7e14dcfSSatish Balay } 627a7e14dcfSSatish Balay 628a7e14dcfSSatish Balay *lam_ext = lambda; 62953506e15SBarry Smith if(innerIter >= df->maxProjIter) { 63053506e15SBarry Smith ierr = PetscPrintf(PETSC_COMM_SELF, "WARNING: DaiFletcher max iterations\n");CHKERRQ(ierr); 63153506e15SBarry Smith } 632a7e14dcfSSatish Balay return innerIter; 633a7e14dcfSSatish Balay } 634a7e14dcfSSatish Balay 635a7e14dcfSSatish Balay 636a7e14dcfSSatish Balay #undef __FUNCT__ 637a7e14dcfSSatish Balay #define __FUNCT__ "solve" 638a7e14dcfSSatish Balay PetscErrorCode solve(TAO_DF *df) 639a7e14dcfSSatish Balay { 640a7e14dcfSSatish Balay PetscErrorCode ierr; 641a7e14dcfSSatish Balay PetscInt i, j, innerIter, it, it2, luv, info, lscount = 0, projcount = 0; 642a7e14dcfSSatish Balay PetscReal gd, max, ak, bk, akold, bkold, lamnew, alpha, kktlam=0.0, lam_ext; 643a7e14dcfSSatish Balay PetscReal DELTAsv, ProdDELTAsv; 644a7e14dcfSSatish Balay PetscReal c, *tempQ; 645a7e14dcfSSatish Balay PetscReal *x = df->x, *a = df->a, b = df->b, *l = df->l, *u = df->u, tol = df->tol; 646a7e14dcfSSatish Balay PetscReal *tempv = df->tempv, *y = df->y, *g = df->g, *d = df->d, *Qd = df->Qd; 647a7e14dcfSSatish Balay PetscReal *xplus = df->xplus, *tplus = df->tplus, *sk = df->sk, *yk = df->yk; 648a7e14dcfSSatish Balay PetscReal **Q = df->Q, *f = df->f, *t = df->t; 649a7e14dcfSSatish Balay PetscInt dim = df->dim, *ipt = df->ipt, *ipt2 = df->ipt2, *uv = df->uv; 650a7e14dcfSSatish Balay 651a7e14dcfSSatish Balay /*** variables for the adaptive nonmonotone linesearch ***/ 652a7e14dcfSSatish Balay PetscInt L, llast; 653a7e14dcfSSatish Balay PetscReal fr, fbest, fv, fc, fv0; 65453506e15SBarry Smith 655a7e14dcfSSatish Balay c = BMRM_INFTY; 656a7e14dcfSSatish Balay 657a7e14dcfSSatish Balay DELTAsv = EPS_SV; 65853506e15SBarry Smith if (tol <= 1.0e-5 || dim <= 20) ProdDELTAsv = 0.0F; 65953506e15SBarry Smith else ProdDELTAsv = EPS_SV; 660a7e14dcfSSatish Balay 66153506e15SBarry Smith for (i = 0; i < dim; i++) tempv[i] = -x[i]; 662a7e14dcfSSatish Balay 663a7e14dcfSSatish Balay lam_ext = 0.0; 664a7e14dcfSSatish Balay 665a7e14dcfSSatish Balay /* Project the initial solution */ 666a7e14dcfSSatish Balay projcount += project(dim, a, b, tempv, l, u, x, &lam_ext, df); 667a7e14dcfSSatish Balay 668a7e14dcfSSatish Balay /* Compute gradient 669a7e14dcfSSatish Balay g = Q*x + f; */ 670a7e14dcfSSatish Balay 671a7e14dcfSSatish Balay it = 0; 67253506e15SBarry Smith for (i = 0; i < dim; i++) { 67353506e15SBarry Smith if (fabs(x[i]) > ProdDELTAsv) ipt[it++] = i; 67453506e15SBarry Smith } 675a7e14dcfSSatish Balay 676a7e14dcfSSatish Balay ierr = PetscMemzero(t, dim*sizeof(PetscReal)); CHKERRQ(ierr); 677a7e14dcfSSatish Balay for (i = 0; i < it; i++){ 678a7e14dcfSSatish Balay tempQ = Q[ipt[i]]; 67953506e15SBarry Smith for (j = 0; j < dim; j++) t[j] += (tempQ[j]*x[ipt[i]]); 680a7e14dcfSSatish Balay } 681a7e14dcfSSatish Balay for (i = 0; i < dim; i++){ 682a7e14dcfSSatish Balay g[i] = t[i] + f[i]; 683a7e14dcfSSatish Balay } 684a7e14dcfSSatish Balay 685a7e14dcfSSatish Balay 686a7e14dcfSSatish Balay /* y = -(x_{k} - g_{k}) */ 687a7e14dcfSSatish Balay for (i = 0; i < dim; i++){ 688a7e14dcfSSatish Balay y[i] = g[i] - x[i]; 689a7e14dcfSSatish Balay } 690a7e14dcfSSatish Balay 691a7e14dcfSSatish Balay /* Project x_{k} - g_{k} */ 692a7e14dcfSSatish Balay projcount += project(dim, a, b, y, l, u, tempv, &lam_ext, df); 693a7e14dcfSSatish Balay 694a7e14dcfSSatish Balay /* y = P(x_{k} - g_{k}) - x_{k} */ 695a7e14dcfSSatish Balay max = ALPHA_MIN; 696a7e14dcfSSatish Balay for (i = 0; i < dim; i++){ 697a7e14dcfSSatish Balay y[i] = tempv[i] - x[i]; 69853506e15SBarry Smith if (fabs(y[i]) > max) max = fabs(y[i]); 699a7e14dcfSSatish Balay } 700a7e14dcfSSatish Balay 701a7e14dcfSSatish Balay if (max < tol*1e-3){ 702a7e14dcfSSatish Balay lscount = 0; 703a7e14dcfSSatish Balay innerIter = 0; 704a7e14dcfSSatish Balay return 0; 705a7e14dcfSSatish Balay } 706a7e14dcfSSatish Balay 707a7e14dcfSSatish Balay alpha = 1.0 / max; 708a7e14dcfSSatish Balay 709a7e14dcfSSatish Balay /* fv0 = f(x_{0}). Recall t = Q x_{k} */ 710a7e14dcfSSatish Balay fv0 = 0.0; 71153506e15SBarry Smith for (i = 0; i < dim; i++) fv0 += x[i] * (0.5*t[i] + f[i]); 712a7e14dcfSSatish Balay 713a7e14dcfSSatish Balay /*** adaptive nonmonotone linesearch ***/ 714a7e14dcfSSatish Balay L = 2; 715a7e14dcfSSatish Balay fr = ALPHA_MAX; 716a7e14dcfSSatish Balay fbest = fv0; 717a7e14dcfSSatish Balay fc = fv0; 718a7e14dcfSSatish Balay llast = 0; 719a7e14dcfSSatish Balay akold = bkold = 0.0; 720a7e14dcfSSatish Balay 721a7e14dcfSSatish Balay /*** Iterator begins ***/ 722a7e14dcfSSatish Balay for (innerIter = 1; innerIter <= df->maxPGMIter; innerIter++) { 723a7e14dcfSSatish Balay 724a7e14dcfSSatish Balay /* tempv = -(x_{k} - alpha*g_{k}) */ 72553506e15SBarry Smith for (i = 0; i < dim; i++) tempv[i] = alpha*g[i] - x[i]; 726a7e14dcfSSatish Balay 727a7e14dcfSSatish Balay /* Project x_{k} - alpha*g_{k} */ 728a7e14dcfSSatish Balay projcount += project(dim, a, b, tempv, l, u, y, &lam_ext, df); 729a7e14dcfSSatish Balay 730a7e14dcfSSatish Balay 731a7e14dcfSSatish Balay /* gd = \inner{d_{k}}{g_{k}} 732a7e14dcfSSatish Balay d = P(x_{k} - alpha*g_{k}) - x_{k} 733a7e14dcfSSatish Balay */ 734a7e14dcfSSatish Balay gd = 0.0; 735a7e14dcfSSatish Balay for (i = 0; i < dim; i++){ 736a7e14dcfSSatish Balay d[i] = y[i] - x[i]; 737a7e14dcfSSatish Balay gd += d[i] * g[i]; 738a7e14dcfSSatish Balay } 739a7e14dcfSSatish Balay 740a7e14dcfSSatish Balay /* Gradient computation */ 741a7e14dcfSSatish Balay 742a7e14dcfSSatish Balay /* compute Qd = Q*d or Qd = Q*y - t depending on their sparsity */ 743a7e14dcfSSatish Balay 744a7e14dcfSSatish Balay it = it2 = 0; 74553506e15SBarry Smith for (i = 0; i < dim; i++){ 74653506e15SBarry Smith if (fabs(d[i]) > (ProdDELTAsv*1.0e-2)) ipt[it++] = i; 74753506e15SBarry Smith } 74853506e15SBarry Smith for (i = 0; i < dim; i++) { 74953506e15SBarry Smith if (fabs(y[i]) > ProdDELTAsv) ipt2[it2++] = i; 75053506e15SBarry Smith } 751a7e14dcfSSatish Balay 752a7e14dcfSSatish Balay ierr = PetscMemzero(Qd, dim*sizeof(PetscReal)); CHKERRQ(ierr); 753a7e14dcfSSatish Balay /* compute Qd = Q*d */ 754a7e14dcfSSatish Balay if (it < it2){ 755a7e14dcfSSatish Balay for (i = 0; i < it; i++){ 756a7e14dcfSSatish Balay tempQ = Q[ipt[i]]; 75753506e15SBarry Smith for (j = 0; j < dim; j++) Qd[j] += (tempQ[j] * d[ipt[i]]); 758a7e14dcfSSatish Balay } 75953506e15SBarry Smith } else { /* compute Qd = Q*y-t */ 760a7e14dcfSSatish Balay for (i = 0; i < it2; i++){ 761a7e14dcfSSatish Balay tempQ = Q[ipt2[i]]; 76253506e15SBarry Smith for (j = 0; j < dim; j++) Qd[j] += (tempQ[j] * y[ipt2[i]]); 763a7e14dcfSSatish Balay } 76453506e15SBarry Smith for (j = 0; j < dim; j++) Qd[j] -= t[j]; 765a7e14dcfSSatish Balay } 766a7e14dcfSSatish Balay 767a7e14dcfSSatish Balay /* ak = inner{d_{k}}{d_{k}} */ 768a7e14dcfSSatish Balay ak = 0.0; 76953506e15SBarry Smith for (i = 0; i < dim; i++) ak += d[i] * d[i]; 770a7e14dcfSSatish Balay 771a7e14dcfSSatish Balay bk = 0.0; 77253506e15SBarry Smith for (i = 0; i < dim; i++) bk += d[i]*Qd[i]; 773a7e14dcfSSatish Balay 77453506e15SBarry Smith if (bk > EPS*ak && gd < 0.0) lamnew = -gd/bk; 77553506e15SBarry Smith else lamnew = 1.0; 776a7e14dcfSSatish Balay 777a7e14dcfSSatish Balay /* fv is computing f(x_{k} + d_{k}) */ 778a7e14dcfSSatish Balay fv = 0.0; 779a7e14dcfSSatish Balay for (i = 0; i < dim; i++){ 780a7e14dcfSSatish Balay xplus[i] = x[i] + d[i]; 781a7e14dcfSSatish Balay tplus[i] = t[i] + Qd[i]; 782a7e14dcfSSatish Balay fv += xplus[i] * (0.5*tplus[i] + f[i]); 783a7e14dcfSSatish Balay } 784a7e14dcfSSatish Balay 785a7e14dcfSSatish Balay /* fr is fref */ 786a7e14dcfSSatish Balay if ((innerIter == 1 && fv >= fv0) || (innerIter > 1 && fv >= fr)){ 787a7e14dcfSSatish Balay lscount++; 788a7e14dcfSSatish Balay fv = 0.0; 789a7e14dcfSSatish Balay for (i = 0; i < dim; i++){ 790a7e14dcfSSatish Balay xplus[i] = x[i] + lamnew*d[i]; 791a7e14dcfSSatish Balay tplus[i] = t[i] + lamnew*Qd[i]; 792a7e14dcfSSatish Balay fv += xplus[i] * (0.5*tplus[i] + f[i]); 793a7e14dcfSSatish Balay } 794a7e14dcfSSatish Balay } 795a7e14dcfSSatish Balay 796a7e14dcfSSatish Balay for (i = 0; i < dim; i++){ 797a7e14dcfSSatish Balay sk[i] = xplus[i] - x[i]; 798a7e14dcfSSatish Balay yk[i] = tplus[i] - t[i]; 799a7e14dcfSSatish Balay x[i] = xplus[i]; 800a7e14dcfSSatish Balay t[i] = tplus[i]; 801a7e14dcfSSatish Balay g[i] = t[i] + f[i]; 802a7e14dcfSSatish Balay } 803a7e14dcfSSatish Balay 804a7e14dcfSSatish Balay /* update the line search control parameters */ 805a7e14dcfSSatish Balay if (fv < fbest){ 806a7e14dcfSSatish Balay fbest = fv; 807a7e14dcfSSatish Balay fc = fv; 808a7e14dcfSSatish Balay llast = 0; 80953506e15SBarry Smith } else { 810a7e14dcfSSatish Balay fc = (fc > fv ? fc : fv); 811a7e14dcfSSatish Balay llast++; 812a7e14dcfSSatish Balay if (llast == L){ 813a7e14dcfSSatish Balay fr = fc; 814a7e14dcfSSatish Balay fc = fv; 815a7e14dcfSSatish Balay llast = 0; 816a7e14dcfSSatish Balay } 817a7e14dcfSSatish Balay } 818a7e14dcfSSatish Balay 819a7e14dcfSSatish Balay ak = bk = 0.0; 820a7e14dcfSSatish Balay for (i = 0; i < dim; i++){ 821a7e14dcfSSatish Balay ak += sk[i] * sk[i]; 822a7e14dcfSSatish Balay bk += sk[i] * yk[i]; 823a7e14dcfSSatish Balay } 824a7e14dcfSSatish Balay 82553506e15SBarry Smith if (bk <= EPS*ak) alpha = ALPHA_MAX; 826a7e14dcfSSatish Balay else { 82753506e15SBarry Smith if (bkold < EPS*akold) alpha = ak/bk; 82853506e15SBarry Smith else alpha = (akold+ak)/(bkold+bk); 829a7e14dcfSSatish Balay 83053506e15SBarry Smith if (alpha > ALPHA_MAX) alpha = ALPHA_MAX; 83153506e15SBarry Smith else if (alpha < ALPHA_MIN) alpha = ALPHA_MIN; 832a7e14dcfSSatish Balay } 833a7e14dcfSSatish Balay 834a7e14dcfSSatish Balay akold = ak; 835a7e14dcfSSatish Balay bkold = bk; 836a7e14dcfSSatish Balay 837a7e14dcfSSatish Balay /*** stopping criterion based on KKT conditions ***/ 838a7e14dcfSSatish Balay /* at optimal, gradient of lagrangian w.r.t. x is zero */ 839a7e14dcfSSatish Balay 840a7e14dcfSSatish Balay bk = 0.0; 84153506e15SBarry Smith for (i = 0; i < dim; i++) bk += x[i] * x[i]; 842a7e14dcfSSatish Balay 84353506e15SBarry Smith if (PetscSqrtReal(ak) < tol*10 * PetscSqrtReal(bk)){ 844a7e14dcfSSatish Balay it = 0; 845a7e14dcfSSatish Balay luv = 0; 846a7e14dcfSSatish Balay kktlam = 0.0; 847a7e14dcfSSatish Balay for (i = 0; i < dim; i++){ 848a7e14dcfSSatish Balay /* x[i] is active hence lagrange multipliers for box constraints 849a7e14dcfSSatish Balay are zero. The lagrange multiplier for ineq. const. is then 850a7e14dcfSSatish Balay defined as below 851a7e14dcfSSatish Balay */ 852a7e14dcfSSatish Balay if ((x[i] > DELTAsv) && (x[i] < c-DELTAsv)){ 853a7e14dcfSSatish Balay ipt[it++] = i; 854a7e14dcfSSatish Balay kktlam = kktlam - a[i]*g[i]; 85553506e15SBarry Smith } else uv[luv++] = i; 856a7e14dcfSSatish Balay } 857a7e14dcfSSatish Balay 85853506e15SBarry Smith if (it == 0 && PetscSqrtReal(ak) < tol*0.5 * PetscSqrtReal(bk)) return 0; 859a7e14dcfSSatish Balay else { 860a7e14dcfSSatish Balay kktlam = kktlam/it; 861a7e14dcfSSatish Balay info = 1; 862a7e14dcfSSatish Balay for (i = 0; i < it; i++) { 863a7e14dcfSSatish Balay if (fabs(a[ipt[i]] * g[ipt[i]] + kktlam) > tol) { 864a7e14dcfSSatish Balay info = 0; 865a7e14dcfSSatish Balay break; 866a7e14dcfSSatish Balay } 867a7e14dcfSSatish Balay } 868a7e14dcfSSatish Balay if (info == 1) { 869a7e14dcfSSatish Balay for (i = 0; i < luv; i++) { 870a7e14dcfSSatish Balay if (x[uv[i]] <= DELTAsv){ 871a7e14dcfSSatish Balay /* x[i] == lower bound, hence, lagrange multiplier (say, beta) for lower bound may 872a7e14dcfSSatish Balay not be zero. So, the gradient without beta is > 0 873a7e14dcfSSatish Balay */ 874a7e14dcfSSatish Balay if (g[uv[i]] + kktlam*a[uv[i]] < -tol){ 875a7e14dcfSSatish Balay info = 0; 876a7e14dcfSSatish Balay break; 877a7e14dcfSSatish Balay } 87853506e15SBarry Smith } else { 879a7e14dcfSSatish Balay /* x[i] == upper bound, hence, lagrange multiplier (say, eta) for upper bound may 880a7e14dcfSSatish Balay not be zero. So, the gradient without eta is < 0 881a7e14dcfSSatish Balay */ 882a7e14dcfSSatish Balay if (g[uv[i]] + kktlam*a[uv[i]] > tol) { 883a7e14dcfSSatish Balay info = 0; 884a7e14dcfSSatish Balay break; 885a7e14dcfSSatish Balay } 886a7e14dcfSSatish Balay } 887a7e14dcfSSatish Balay } 888a7e14dcfSSatish Balay } 889a7e14dcfSSatish Balay 89053506e15SBarry Smith if (info == 1) return 0; 891a7e14dcfSSatish Balay } 892a7e14dcfSSatish Balay } 893a7e14dcfSSatish Balay } 894a7e14dcfSSatish Balay return 0; 895a7e14dcfSSatish Balay } 896a7e14dcfSSatish Balay 897a7e14dcfSSatish Balay 898