1a7e14dcfSSatish Balay #include "bmrm.h" 2a7e14dcfSSatish Balay 3a7e14dcfSSatish Balay static PetscErrorCode init_df_solver(TAO_DF*); 4a7e14dcfSSatish Balay static PetscErrorCode ensure_df_space(PetscInt, TAO_DF*); 5a7e14dcfSSatish Balay static PetscErrorCode destroy_df_solver(TAO_DF*); 6a7e14dcfSSatish Balay static PetscReal phi(PetscReal*,PetscInt,PetscReal,PetscReal*, 7a7e14dcfSSatish Balay PetscReal,PetscReal*,PetscReal*,PetscReal*); 8a7e14dcfSSatish Balay static PetscInt project(PetscInt,PetscReal*,PetscReal,PetscReal*, 9a7e14dcfSSatish Balay PetscReal*,PetscReal*,PetscReal*,PetscReal*,TAO_DF*); 10a7e14dcfSSatish Balay 11a7e14dcfSSatish Balay static PetscErrorCode solve(TAO_DF*); 12a7e14dcfSSatish Balay 13a7e14dcfSSatish Balay 14a7e14dcfSSatish Balay /*------------------------------------------------------------*/ 15a7e14dcfSSatish Balay /* The main solver function 16a7e14dcfSSatish Balay 17a7e14dcfSSatish Balay f = Remp(W) This is what the user provides us from the application layer 18a7e14dcfSSatish Balay So the ComputeGradient function for instance should get us back the subgradient of Remp(W) 19a7e14dcfSSatish Balay 20a7e14dcfSSatish Balay Regularizer assumed to be L2 norm = lambda*0.5*W'W () 21a7e14dcfSSatish Balay */ 22a7e14dcfSSatish Balay 23a7e14dcfSSatish Balay #undef __FUNCT__ 24a7e14dcfSSatish Balay #define __FUNCT__ "make_grad_node" 25a7e14dcfSSatish Balay static PetscErrorCode make_grad_node(Vec X, Vec_Chain **p) 26a7e14dcfSSatish Balay { 27a7e14dcfSSatish Balay PetscErrorCode ierr; 28a7e14dcfSSatish Balay 29a7e14dcfSSatish Balay PetscFunctionBegin; 30a7e14dcfSSatish Balay 31a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(Vec_Chain), p);CHKERRQ(ierr); 32a7e14dcfSSatish Balay ierr = VecDuplicate(X, &(*p)->V);CHKERRQ(ierr); 33a7e14dcfSSatish Balay ierr = VecCopy(X, (*p)->V);CHKERRQ(ierr); 346c23d075SBarry Smith (*p)->next = NULL; 35a7e14dcfSSatish Balay 36a7e14dcfSSatish Balay PetscFunctionReturn(0); 37a7e14dcfSSatish Balay } 38a7e14dcfSSatish Balay 39a7e14dcfSSatish Balay 40a7e14dcfSSatish Balay #undef __FUNCT__ 41a7e14dcfSSatish Balay #define __FUNCT__ "destroy_grad_list" 42a7e14dcfSSatish Balay static PetscErrorCode destroy_grad_list(Vec_Chain *head) 43a7e14dcfSSatish Balay { 44a7e14dcfSSatish Balay PetscErrorCode ierr; 45a7e14dcfSSatish Balay Vec_Chain *p = head->next, *q; 46a7e14dcfSSatish Balay 47a7e14dcfSSatish Balay PetscFunctionBegin; 48a7e14dcfSSatish Balay while(p) { 49a7e14dcfSSatish Balay q = p->next; 50a7e14dcfSSatish Balay ierr = VecDestroy(&p->V);CHKERRQ(ierr); 51a7e14dcfSSatish Balay ierr = PetscFree(p);CHKERRQ(ierr); 52a7e14dcfSSatish Balay p = q; 53a7e14dcfSSatish Balay } 546c23d075SBarry Smith head->next = NULL; 55a7e14dcfSSatish Balay 56a7e14dcfSSatish Balay PetscFunctionReturn(0); 57a7e14dcfSSatish Balay } 58a7e14dcfSSatish Balay 59a7e14dcfSSatish Balay 60a7e14dcfSSatish Balay #undef __FUNCT__ 61a7e14dcfSSatish Balay #define __FUNCT__ "TaoSolve_BMRM" 62a7e14dcfSSatish Balay static PetscErrorCode TaoSolve_BMRM(TaoSolver tao) 63a7e14dcfSSatish Balay { 64a7e14dcfSSatish Balay PetscErrorCode ierr; 65a7e14dcfSSatish Balay TaoSolverTerminationReason reason; 66a7e14dcfSSatish Balay TAO_DF df; 67a7e14dcfSSatish Balay TAO_BMRM *bmrm = (TAO_BMRM*)tao->data; 68a7e14dcfSSatish Balay 69a7e14dcfSSatish Balay /* Values and pointers to parts of the optimization problem */ 70a7e14dcfSSatish Balay PetscReal f = 0.0; 71a7e14dcfSSatish Balay Vec W = tao->solution; 72a7e14dcfSSatish Balay Vec G = tao->gradient; 73a7e14dcfSSatish Balay PetscReal lambda; 74a7e14dcfSSatish Balay 75a7e14dcfSSatish Balay PetscReal bt; 76a7e14dcfSSatish Balay Vec_Chain grad_list, *tail_glist, *pgrad; 77a7e14dcfSSatish Balay 78a7e14dcfSSatish Balay PetscInt iter = 0; 79a7e14dcfSSatish Balay PetscInt i; 80a7e14dcfSSatish Balay PetscMPIInt rank; 81a7e14dcfSSatish Balay 82a7e14dcfSSatish Balay /* Used in termination criteria check */ 83a7e14dcfSSatish Balay PetscReal reg; 84a7e14dcfSSatish Balay PetscReal jtwt, max_jtwt, pre_epsilon, epsilon, jw, min_jw; 85a7e14dcfSSatish Balay PetscReal innerSolverTol; 86a7e14dcfSSatish Balay 87a7e14dcfSSatish Balay PetscFunctionBegin; 88a7e14dcfSSatish Balay 89a7e14dcfSSatish Balay ierr = MPI_Comm_rank(PETSC_COMM_WORLD, &rank);CHKERRQ(ierr); 90a7e14dcfSSatish Balay lambda = bmrm->lambda; 91a7e14dcfSSatish Balay 92a7e14dcfSSatish Balay /* Check Stopping Condition */ 93a7e14dcfSSatish Balay tao->step = 1.0; 94a7e14dcfSSatish Balay max_jtwt = -BMRM_INFTY; 95a7e14dcfSSatish Balay min_jw = BMRM_INFTY; 96a7e14dcfSSatish Balay innerSolverTol = 1.0; 97a7e14dcfSSatish Balay epsilon = 0.0; 98a7e14dcfSSatish Balay 99a7e14dcfSSatish Balay if (rank == 0) { 100a7e14dcfSSatish Balay ierr = init_df_solver(&df);CHKERRQ(ierr); 101a7e14dcfSSatish Balay grad_list.next = NULL; 102a7e14dcfSSatish Balay tail_glist = &grad_list; 103a7e14dcfSSatish Balay } 104a7e14dcfSSatish Balay 105a7e14dcfSSatish Balay df.tol = 1e-6; 106a7e14dcfSSatish Balay reason = TAO_CONTINUE_ITERATING; 107a7e14dcfSSatish Balay 108a7e14dcfSSatish Balay /*-----------------Algorithm Begins------------------------*/ 109a7e14dcfSSatish Balay /* make the scatter */ 110a7e14dcfSSatish Balay ierr = VecScatterCreateToZero(W, &bmrm->scatter, &bmrm->local_w);CHKERRQ(ierr); 111a7e14dcfSSatish Balay ierr = VecAssemblyBegin(bmrm->local_w);CHKERRQ(ierr); 112a7e14dcfSSatish Balay ierr = VecAssemblyEnd(bmrm->local_w);CHKERRQ(ierr); 113a7e14dcfSSatish Balay 114a7e14dcfSSatish Balay /* NOTE: In application pass the sub-gradient of Remp(W) */ 115a7e14dcfSSatish Balay ierr = TaoComputeObjectiveAndGradient(tao, W, &f, G);CHKERRQ(ierr); 116a7e14dcfSSatish Balay ierr = TaoMonitor(tao,iter,f,1.0,0.0,tao->step,&reason);CHKERRQ(ierr); 117a7e14dcfSSatish Balay while (reason == TAO_CONTINUE_ITERATING) { 118a7e14dcfSSatish Balay /* compute bt = Remp(Wt-1) - <Wt-1, At> */ 119a7e14dcfSSatish Balay ierr = VecDot(W, G, &bt);CHKERRQ(ierr); 120a7e14dcfSSatish Balay bt = f - bt; 121a7e14dcfSSatish Balay 122a7e14dcfSSatish Balay /* First gather the gradient to the master node */ 123a7e14dcfSSatish Balay ierr = VecScatterBegin(bmrm->scatter, G, bmrm->local_w, INSERT_VALUES, SCATTER_FORWARD);CHKERRQ(ierr); 124a7e14dcfSSatish Balay ierr = VecScatterEnd(bmrm->scatter, G, bmrm->local_w, INSERT_VALUES, SCATTER_FORWARD);CHKERRQ(ierr); 125a7e14dcfSSatish Balay 126a7e14dcfSSatish Balay /* Bring up the inner solver */ 127a7e14dcfSSatish Balay if (rank == 0) { 128a7e14dcfSSatish Balay ierr = ensure_df_space(iter+1, &df); CHKERRQ(ierr); 129a7e14dcfSSatish Balay ierr = make_grad_node(bmrm->local_w, &pgrad);CHKERRQ(ierr); 130a7e14dcfSSatish Balay tail_glist->next = pgrad; 131a7e14dcfSSatish Balay tail_glist = pgrad; 132a7e14dcfSSatish Balay 133a7e14dcfSSatish Balay df.a[iter] = 1.0; 134a7e14dcfSSatish Balay df.f[iter] = -bt; 135a7e14dcfSSatish Balay df.u[iter] = 1.0; 136a7e14dcfSSatish Balay df.l[iter] = 0.0; 137a7e14dcfSSatish Balay 138a7e14dcfSSatish Balay /* set up the Q */ 139a7e14dcfSSatish Balay pgrad = grad_list.next; 140a7e14dcfSSatish Balay for (i=0; i<=iter; i++) { 141a7e14dcfSSatish Balay ierr = VecDot(pgrad->V, bmrm->local_w, ®);CHKERRQ(ierr); 142a7e14dcfSSatish Balay df.Q[i][iter] = df.Q[iter][i] = reg / lambda; 143a7e14dcfSSatish Balay pgrad = pgrad->next; 144a7e14dcfSSatish Balay } 145a7e14dcfSSatish Balay 146a7e14dcfSSatish Balay if (iter > 0) { 147a7e14dcfSSatish Balay df.x[iter] = 0.0; 148a7e14dcfSSatish Balay ierr = solve(&df); CHKERRQ(ierr); 149a7e14dcfSSatish Balay } 150a7e14dcfSSatish Balay else 151a7e14dcfSSatish Balay df.x[0] = 1.0; 152a7e14dcfSSatish Balay 153a7e14dcfSSatish Balay /* now computing Jt*(alpha_t) which should be = Jt(wt) to check convergence */ 154a7e14dcfSSatish Balay jtwt = 0.0; 155a7e14dcfSSatish Balay ierr = VecSet(bmrm->local_w, 0.0); CHKERRQ(ierr); 156a7e14dcfSSatish Balay pgrad = grad_list.next; 157a7e14dcfSSatish Balay for (i=0; i<=iter; i++) { 158a7e14dcfSSatish Balay jtwt -= df.x[i] * df.f[i]; 159a7e14dcfSSatish Balay ierr = VecAXPY(bmrm->local_w, -df.x[i] / lambda, pgrad->V); CHKERRQ(ierr); 160a7e14dcfSSatish Balay pgrad = pgrad->next; 161a7e14dcfSSatish Balay } 162a7e14dcfSSatish Balay 163a7e14dcfSSatish Balay ierr = VecNorm(bmrm->local_w, NORM_2, ®); CHKERRQ(ierr); 164a7e14dcfSSatish Balay reg = 0.5*lambda*reg*reg; 165a7e14dcfSSatish Balay jtwt -= reg; 166a7e14dcfSSatish Balay } /* end if rank == 0 */ 167a7e14dcfSSatish Balay 168a7e14dcfSSatish Balay /* scatter the new W to all nodes */ 169a7e14dcfSSatish Balay ierr = VecScatterBegin(bmrm->scatter,bmrm->local_w,W,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 170a7e14dcfSSatish Balay ierr = VecScatterEnd(bmrm->scatter,bmrm->local_w,W,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 171a7e14dcfSSatish Balay 172a7e14dcfSSatish Balay ierr = TaoComputeObjectiveAndGradient(tao, W, &f, G);CHKERRQ(ierr); 173a7e14dcfSSatish Balay 174a7e14dcfSSatish Balay MPI_Bcast(&jtwt,1,MPI_DOUBLE,0,PETSC_COMM_WORLD); 175a7e14dcfSSatish Balay MPI_Bcast(®,1,MPI_DOUBLE,0,PETSC_COMM_WORLD); 176a7e14dcfSSatish Balay 177a7e14dcfSSatish Balay jw = reg + f; /* J(w) = regularizer + Remp(w) */ 178a7e14dcfSSatish Balay if (jw < min_jw) 179a7e14dcfSSatish Balay min_jw = jw; 180a7e14dcfSSatish Balay if (jtwt > max_jtwt) 181a7e14dcfSSatish Balay max_jtwt = jtwt; 182a7e14dcfSSatish Balay 183a7e14dcfSSatish Balay pre_epsilon = epsilon; 184a7e14dcfSSatish Balay epsilon = min_jw - jtwt; 185a7e14dcfSSatish Balay 186a7e14dcfSSatish Balay if (rank == 0) { 187a7e14dcfSSatish Balay if (innerSolverTol > epsilon) 188a7e14dcfSSatish Balay innerSolverTol = epsilon; 189a7e14dcfSSatish Balay else if (innerSolverTol < 1e-7) 190a7e14dcfSSatish Balay innerSolverTol = 1e-7; 191a7e14dcfSSatish Balay 192a7e14dcfSSatish Balay /* if the annealing doesn't work well, lower the inner solver tolerance */ 193a7e14dcfSSatish Balay if(pre_epsilon < epsilon) 194a7e14dcfSSatish Balay innerSolverTol *= 0.2; 195a7e14dcfSSatish Balay 196a7e14dcfSSatish Balay df.tol = innerSolverTol*0.5; 197a7e14dcfSSatish Balay } 198a7e14dcfSSatish Balay 199a7e14dcfSSatish Balay iter++; 200a7e14dcfSSatish Balay ierr = TaoMonitor(tao,iter,min_jw,epsilon,0.0,tao->step,&reason);CHKERRQ(ierr); 201a7e14dcfSSatish Balay } 202a7e14dcfSSatish Balay 203a7e14dcfSSatish Balay /* free all the memory */ 204a7e14dcfSSatish Balay if (rank == 0) { 205a7e14dcfSSatish Balay ierr = destroy_grad_list(&grad_list); CHKERRQ(ierr); 206a7e14dcfSSatish Balay ierr = destroy_df_solver(&df);CHKERRQ(ierr); 207a7e14dcfSSatish Balay } 208a7e14dcfSSatish Balay 209a7e14dcfSSatish Balay ierr = VecDestroy(&bmrm->local_w);CHKERRQ(ierr); 210a7e14dcfSSatish Balay ierr = VecScatterDestroy(&bmrm->scatter);CHKERRQ(ierr); 211a7e14dcfSSatish Balay 212a7e14dcfSSatish Balay PetscFunctionReturn(0); 213a7e14dcfSSatish Balay } 214a7e14dcfSSatish Balay 215a7e14dcfSSatish Balay 216a7e14dcfSSatish Balay /* ---------------------------------------------------------- */ 217a7e14dcfSSatish Balay 218a7e14dcfSSatish Balay #undef __FUNCT__ 219a7e14dcfSSatish Balay #define __FUNCT__ "TaoSetup_BMRM" 220a7e14dcfSSatish Balay static PetscErrorCode TaoSetup_BMRM(TaoSolver tao) { 221a7e14dcfSSatish Balay 222a7e14dcfSSatish Balay PetscErrorCode ierr; 223a7e14dcfSSatish Balay 224a7e14dcfSSatish Balay PetscFunctionBegin; 225a7e14dcfSSatish Balay 226a7e14dcfSSatish Balay /* Allocate some arrays */ 227a7e14dcfSSatish Balay if (!tao->gradient) { 228a7e14dcfSSatish Balay ierr = VecDuplicate(tao->solution, &tao->gradient); CHKERRQ(ierr); 229a7e14dcfSSatish Balay } 230a7e14dcfSSatish Balay 231a7e14dcfSSatish Balay PetscFunctionReturn(0); 232a7e14dcfSSatish Balay } 233a7e14dcfSSatish Balay 234a7e14dcfSSatish Balay 235a7e14dcfSSatish Balay /*------------------------------------------------------------*/ 236a7e14dcfSSatish Balay 237a7e14dcfSSatish Balay #undef __FUNCT__ 238a7e14dcfSSatish Balay #define __FUNCT__ "TaoDestroy_BMRM" 239a7e14dcfSSatish Balay static PetscErrorCode TaoDestroy_BMRM(TaoSolver tao) 240a7e14dcfSSatish Balay { 241a7e14dcfSSatish Balay PetscErrorCode ierr; 242a7e14dcfSSatish Balay 243a7e14dcfSSatish Balay PetscFunctionBegin; 244a7e14dcfSSatish Balay ierr = PetscFree(tao->data);CHKERRQ(ierr); 245a7e14dcfSSatish Balay PetscFunctionReturn(0); 246a7e14dcfSSatish Balay } 247a7e14dcfSSatish Balay 248a7e14dcfSSatish Balay 249a7e14dcfSSatish Balay #undef __FUNCT__ 250a7e14dcfSSatish Balay #define __FUNCT__ "TaoSetFromOptions_BMRM" 251a7e14dcfSSatish Balay static PetscErrorCode TaoSetFromOptions_BMRM(TaoSolver tao) 252a7e14dcfSSatish Balay { 253a7e14dcfSSatish Balay PetscErrorCode ierr; 254a7e14dcfSSatish Balay TAO_BMRM* bmrm = (TAO_BMRM*)tao->data; 255a7e14dcfSSatish Balay PetscBool flg; 256a7e14dcfSSatish Balay 257a7e14dcfSSatish Balay PetscFunctionBegin; 258a7e14dcfSSatish Balay ierr = PetscOptionsHead("BMRM for regularized risk minimization");CHKERRQ(ierr); 259a7e14dcfSSatish Balay ierr = PetscOptionsReal("-tao_bmrm_lambda", "regulariser weight","", 100,&bmrm->lambda,&flg); CHKERRQ(ierr); 260a7e14dcfSSatish Balay ierr = PetscOptionsTail();CHKERRQ(ierr); 261a7e14dcfSSatish Balay PetscFunctionReturn(0); 262a7e14dcfSSatish Balay } 263a7e14dcfSSatish Balay 264a7e14dcfSSatish Balay 265a7e14dcfSSatish Balay /*------------------------------------------------------------*/ 266a7e14dcfSSatish Balay #undef __FUNCT__ 267a7e14dcfSSatish Balay #define __FUNCT__ "TaoView_BMRM" 268a7e14dcfSSatish Balay static PetscErrorCode TaoView_BMRM(TaoSolver tao, PetscViewer viewer) 269a7e14dcfSSatish Balay { 270a7e14dcfSSatish Balay PetscBool isascii; 271a7e14dcfSSatish Balay PetscErrorCode ierr; 272a7e14dcfSSatish Balay 273a7e14dcfSSatish Balay PetscFunctionBegin; 274a7e14dcfSSatish Balay ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&isascii);CHKERRQ(ierr); 275a7e14dcfSSatish Balay if (isascii) { 276a7e14dcfSSatish Balay ierr = PetscViewerASCIIPushTab(viewer);CHKERRQ(ierr); 277a7e14dcfSSatish Balay ierr = PetscViewerASCIIPopTab(viewer);CHKERRQ(ierr); 278a7e14dcfSSatish Balay } 279a7e14dcfSSatish Balay PetscFunctionReturn(0); 280a7e14dcfSSatish Balay } 281a7e14dcfSSatish Balay 282a7e14dcfSSatish Balay 283a7e14dcfSSatish Balay /*------------------------------------------------------------*/ 284a7e14dcfSSatish Balay EXTERN_C_BEGIN 285a7e14dcfSSatish Balay #undef __FUNCT__ 286a7e14dcfSSatish Balay #define __FUNCT__ "TaoCreate_BMRM" 287a7e14dcfSSatish Balay PetscErrorCode TaoCreate_BMRM(TaoSolver tao) 288a7e14dcfSSatish Balay { 289a7e14dcfSSatish Balay TAO_BMRM *bmrm; 290a7e14dcfSSatish Balay PetscErrorCode ierr; 291a7e14dcfSSatish Balay 292a7e14dcfSSatish Balay PetscFunctionBegin; 293a7e14dcfSSatish Balay tao->ops->setup = TaoSetup_BMRM; 294a7e14dcfSSatish Balay tao->ops->solve = TaoSolve_BMRM; 295a7e14dcfSSatish Balay tao->ops->view = TaoView_BMRM; 296a7e14dcfSSatish Balay tao->ops->setfromoptions = TaoSetFromOptions_BMRM; 297a7e14dcfSSatish Balay tao->ops->destroy = TaoDestroy_BMRM; 298a7e14dcfSSatish Balay 2993c9e27cfSGeoffrey Irving ierr = PetscNewLog(tao,&bmrm);CHKERRQ(ierr); 300a7e14dcfSSatish Balay bmrm->lambda = 1.0; 301a7e14dcfSSatish Balay tao->data = (void*)bmrm; 302a7e14dcfSSatish Balay 303a7e14dcfSSatish Balay /* Note: May need to be tuned! */ 304a7e14dcfSSatish Balay tao->max_it = 2048; 305a7e14dcfSSatish Balay tao->max_funcs = 300000; 306a7e14dcfSSatish Balay tao->fatol = 1e-20; 307a7e14dcfSSatish Balay tao->frtol = 1e-25; 308a7e14dcfSSatish Balay tao->gatol = 1e-25; 309a7e14dcfSSatish Balay tao->grtol = 1e-25; 310a7e14dcfSSatish Balay 311a7e14dcfSSatish Balay PetscFunctionReturn(0); 312a7e14dcfSSatish Balay } 313a7e14dcfSSatish Balay EXTERN_C_END 314a7e14dcfSSatish Balay 315a7e14dcfSSatish Balay #undef __FUNCT__ 316a7e14dcfSSatish Balay #define __FUNCT__ "init_df_solver" 317a7e14dcfSSatish Balay PetscErrorCode init_df_solver(TAO_DF *df) 318a7e14dcfSSatish Balay { 319a7e14dcfSSatish Balay PetscInt i, n = INCRE_DIM; 320a7e14dcfSSatish Balay PetscErrorCode ierr; 321a7e14dcfSSatish Balay 322a7e14dcfSSatish Balay PetscFunctionBegin; 323a7e14dcfSSatish Balay /* default values */ 324a7e14dcfSSatish Balay df->maxProjIter = 200; 325a7e14dcfSSatish Balay df->maxPGMIter = 300000; 326a7e14dcfSSatish Balay df->b = 1.0; 327a7e14dcfSSatish Balay 328a7e14dcfSSatish Balay /* memory space required by Dai-Fletcher */ 329a7e14dcfSSatish Balay df->cur_num_cp = n; 330a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscReal)*n, &df->f); CHKERRQ(ierr); 331a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscReal)*n, &df->a); CHKERRQ(ierr); 332a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscReal)*n, &df->l); CHKERRQ(ierr); 333a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscReal)*n, &df->u); CHKERRQ(ierr); 334a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscReal)*n, &df->x); CHKERRQ(ierr); 335a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscReal*)*n, &df->Q); CHKERRQ(ierr); 336a7e14dcfSSatish Balay 337a7e14dcfSSatish Balay for (i = 0; i < n; i ++) { 338a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscReal)*n, &df->Q[i]); CHKERRQ(ierr); 339a7e14dcfSSatish Balay } 340a7e14dcfSSatish Balay 341a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscReal)*n, &df->g); CHKERRQ(ierr); 342a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscReal)*n, &df->y); CHKERRQ(ierr); 343a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscReal)*n, &df->tempv); CHKERRQ(ierr); 344a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscReal)*n, &df->d); CHKERRQ(ierr); 345a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscReal)*n, &df->Qd); CHKERRQ(ierr); 346a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscReal)*n, &df->t); CHKERRQ(ierr); 347a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscReal)*n, &df->xplus); CHKERRQ(ierr); 348a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscReal)*n, &df->tplus); CHKERRQ(ierr); 349a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscReal)*n, &df->sk); CHKERRQ(ierr); 350a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscReal)*n, &df->yk); CHKERRQ(ierr); 351a7e14dcfSSatish Balay 352a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscInt)*n, &df->ipt); CHKERRQ(ierr); 353a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscInt)*n, &df->ipt2); CHKERRQ(ierr); 354a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscInt)*n, &df->uv); CHKERRQ(ierr); 355a7e14dcfSSatish Balay PetscFunctionReturn(0); 356a7e14dcfSSatish Balay } 357a7e14dcfSSatish Balay 358a7e14dcfSSatish Balay #undef __FUNCT__ 359a7e14dcfSSatish Balay #define __FUNCT__ "ensure_df_space" 360a7e14dcfSSatish Balay PetscErrorCode ensure_df_space(PetscInt dim, TAO_DF *df) 361a7e14dcfSSatish Balay { 362a7e14dcfSSatish Balay PetscErrorCode ierr; 363a7e14dcfSSatish Balay PetscReal *tmp, **tmp_Q; 364a7e14dcfSSatish Balay PetscInt i, n, old_n; 365a7e14dcfSSatish Balay 366a7e14dcfSSatish Balay PetscFunctionBegin; 367*53506e15SBarry Smith df->dim = dim; 368*53506e15SBarry Smith if (dim <= df->cur_num_cp) PetscFunctionReturn(0); 369a7e14dcfSSatish Balay 370a7e14dcfSSatish Balay old_n = df->cur_num_cp; 371a7e14dcfSSatish Balay df->cur_num_cp += INCRE_DIM; 372a7e14dcfSSatish Balay n = df->cur_num_cp; 373a7e14dcfSSatish Balay 374a7e14dcfSSatish Balay /* memory space required by dai-fletcher */ 375a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscReal)*n, &tmp); CHKERRQ(ierr); 376a7e14dcfSSatish Balay ierr = PetscMemcpy(tmp, df->f, sizeof(PetscReal)*old_n); CHKERRQ(ierr); 377a7e14dcfSSatish Balay ierr = PetscFree(df->f); CHKERRQ(ierr); 378a7e14dcfSSatish Balay df->f = tmp; 379a7e14dcfSSatish Balay 380a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscReal)*n, &tmp); CHKERRQ(ierr); 381a7e14dcfSSatish Balay ierr = PetscMemcpy(tmp, df->a, sizeof(PetscReal)*old_n); CHKERRQ(ierr); 382a7e14dcfSSatish Balay ierr = PetscFree(df->a); CHKERRQ(ierr); 383a7e14dcfSSatish Balay df->a = tmp; 384a7e14dcfSSatish Balay 385a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscReal)*n, &tmp); CHKERRQ(ierr); 386a7e14dcfSSatish Balay ierr = PetscMemcpy(tmp, df->l, sizeof(PetscReal)*old_n); CHKERRQ(ierr); 387a7e14dcfSSatish Balay ierr = PetscFree(df->l); CHKERRQ(ierr); 388a7e14dcfSSatish Balay df->l = tmp; 389a7e14dcfSSatish Balay 390a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscReal)*n, &tmp); CHKERRQ(ierr); 391a7e14dcfSSatish Balay ierr = PetscMemcpy(tmp, df->u, sizeof(PetscReal)*old_n); CHKERRQ(ierr); 392a7e14dcfSSatish Balay ierr = PetscFree(df->u); CHKERRQ(ierr); 393a7e14dcfSSatish Balay df->u = tmp; 394a7e14dcfSSatish Balay 395a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscReal)*n, &tmp); CHKERRQ(ierr); 396a7e14dcfSSatish Balay ierr = PetscMemcpy(tmp, df->x, sizeof(PetscReal)*old_n); CHKERRQ(ierr); 397a7e14dcfSSatish Balay ierr = PetscFree(df->x); CHKERRQ(ierr); 398a7e14dcfSSatish Balay df->x = tmp; 399a7e14dcfSSatish Balay 400a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscReal*)*n, &tmp_Q); CHKERRQ(ierr); 401*53506e15SBarry Smith for (i = 0; i < n; i ++) { 402a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscReal)*n, &tmp_Q[i]); CHKERRQ(ierr); 403*53506e15SBarry Smith if (i < old_n) { 404a7e14dcfSSatish Balay ierr = PetscMemcpy(tmp_Q[i], df->Q[i], sizeof(PetscReal)*old_n); CHKERRQ(ierr); 405a7e14dcfSSatish Balay ierr = PetscFree(df->Q[i]); CHKERRQ(ierr); 406a7e14dcfSSatish Balay } 407a7e14dcfSSatish Balay } 408a7e14dcfSSatish Balay 409a7e14dcfSSatish Balay ierr = PetscFree(df->Q); CHKERRQ(ierr); 410a7e14dcfSSatish Balay df->Q = tmp_Q; 411a7e14dcfSSatish Balay 412a7e14dcfSSatish Balay ierr = PetscFree(df->g); CHKERRQ(ierr); 413a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscReal)*n, &df->g); CHKERRQ(ierr); 414a7e14dcfSSatish Balay 415a7e14dcfSSatish Balay ierr = PetscFree(df->y); CHKERRQ(ierr); 416a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscReal)*n, &df->y); CHKERRQ(ierr); 417a7e14dcfSSatish Balay 418a7e14dcfSSatish Balay ierr = PetscFree(df->tempv); CHKERRQ(ierr); 419a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscReal)*n, &df->tempv); CHKERRQ(ierr); 420a7e14dcfSSatish Balay 421a7e14dcfSSatish Balay ierr = PetscFree(df->d); CHKERRQ(ierr); 422a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscReal)*n, &df->d); CHKERRQ(ierr); 423a7e14dcfSSatish Balay 424a7e14dcfSSatish Balay ierr = PetscFree(df->Qd); CHKERRQ(ierr); 425a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscReal)*n, &df->Qd); CHKERRQ(ierr); 426a7e14dcfSSatish Balay 427a7e14dcfSSatish Balay ierr = PetscFree(df->t); CHKERRQ(ierr); 428a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscReal)*n, &df->t); CHKERRQ(ierr); 429a7e14dcfSSatish Balay 430a7e14dcfSSatish Balay ierr = PetscFree(df->xplus); CHKERRQ(ierr); 431a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscReal)*n, &df->xplus); CHKERRQ(ierr); 432a7e14dcfSSatish Balay 433a7e14dcfSSatish Balay ierr = PetscFree(df->tplus); CHKERRQ(ierr); 434a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscReal)*n, &df->tplus); CHKERRQ(ierr); 435a7e14dcfSSatish Balay 436a7e14dcfSSatish Balay ierr = PetscFree(df->sk); CHKERRQ(ierr); 437a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscReal)*n, &df->sk); CHKERRQ(ierr); 438a7e14dcfSSatish Balay 439a7e14dcfSSatish Balay ierr = PetscFree(df->yk); CHKERRQ(ierr); 440a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscReal)*n, &df->yk); CHKERRQ(ierr); 441a7e14dcfSSatish Balay 442a7e14dcfSSatish Balay ierr = PetscFree(df->ipt); CHKERRQ(ierr); 443a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscInt)*n, &df->ipt); CHKERRQ(ierr); 444a7e14dcfSSatish Balay 445a7e14dcfSSatish Balay ierr = PetscFree(df->ipt2); CHKERRQ(ierr); 446a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscInt)*n, &df->ipt2); CHKERRQ(ierr); 447a7e14dcfSSatish Balay 448a7e14dcfSSatish Balay ierr = PetscFree(df->uv); CHKERRQ(ierr); 449a7e14dcfSSatish Balay ierr = PetscMalloc(sizeof(PetscInt)*n, &df->uv); CHKERRQ(ierr); 450a7e14dcfSSatish Balay PetscFunctionReturn(0); 451a7e14dcfSSatish Balay } 452a7e14dcfSSatish Balay 453a7e14dcfSSatish Balay 454a7e14dcfSSatish Balay #undef __FUNCT__ 455a7e14dcfSSatish Balay #define __FUNCT__ "destroy_df_solver" 456a7e14dcfSSatish Balay PetscErrorCode destroy_df_solver(TAO_DF *df) 457a7e14dcfSSatish Balay { 458a7e14dcfSSatish Balay PetscErrorCode ierr; 459a7e14dcfSSatish Balay PetscInt i; 4606c23d075SBarry Smith 461a7e14dcfSSatish Balay PetscFunctionBegin; 4626c23d075SBarry Smith ierr = PetscFree(df->f); CHKERRQ(ierr); 4636c23d075SBarry Smith ierr = PetscFree(df->a); CHKERRQ(ierr); 4646c23d075SBarry Smith ierr = PetscFree(df->l); CHKERRQ(ierr); 4656c23d075SBarry Smith ierr = PetscFree(df->u); CHKERRQ(ierr); 4666c23d075SBarry Smith ierr = PetscFree(df->x); CHKERRQ(ierr); 467a7e14dcfSSatish Balay 4686c23d075SBarry Smith for (i = 0; i < df->cur_num_cp; i ++) { 469a7e14dcfSSatish Balay ierr = PetscFree(df->Q[i]); CHKERRQ(ierr); 470a7e14dcfSSatish Balay } 471a7e14dcfSSatish Balay ierr = PetscFree(df->Q); CHKERRQ(ierr); 4726c23d075SBarry Smith ierr = PetscFree(df->ipt); CHKERRQ(ierr); 4736c23d075SBarry Smith ierr = PetscFree(df->ipt2); CHKERRQ(ierr); 4746c23d075SBarry Smith ierr = PetscFree(df->uv); CHKERRQ(ierr); 4756c23d075SBarry Smith ierr = PetscFree(df->g); CHKERRQ(ierr); 4766c23d075SBarry Smith ierr = PetscFree(df->y); CHKERRQ(ierr); 4776c23d075SBarry Smith ierr = PetscFree(df->tempv); CHKERRQ(ierr); 4786c23d075SBarry Smith ierr = PetscFree(df->d); CHKERRQ(ierr); 4796c23d075SBarry Smith ierr = PetscFree(df->Qd); CHKERRQ(ierr); 4806c23d075SBarry Smith ierr = PetscFree(df->t); CHKERRQ(ierr); 4816c23d075SBarry Smith ierr = PetscFree(df->xplus); CHKERRQ(ierr); 4826c23d075SBarry Smith ierr = PetscFree(df->tplus); CHKERRQ(ierr); 4836c23d075SBarry Smith ierr = PetscFree(df->sk); CHKERRQ(ierr); 4846c23d075SBarry Smith ierr = PetscFree(df->yk); CHKERRQ(ierr); 485a7e14dcfSSatish Balay PetscFunctionReturn(0); 486a7e14dcfSSatish Balay } 487a7e14dcfSSatish Balay 488a7e14dcfSSatish Balay 489a7e14dcfSSatish Balay /* Piecewise linear monotone target function for the Dai-Fletcher projector */ 490a7e14dcfSSatish Balay #undef __FUNCT__ 491a7e14dcfSSatish Balay #define __FUNCT__ "phi" 4926c23d075SBarry Smith PetscReal phi(PetscReal *x,PetscInt n,PetscReal lambda,PetscReal *a,PetscReal b,PetscReal *c,PetscReal *l,PetscReal *u) 493a7e14dcfSSatish Balay { 494a7e14dcfSSatish Balay PetscReal r = 0.0; 495a7e14dcfSSatish Balay PetscInt i; 496a7e14dcfSSatish Balay 497a7e14dcfSSatish Balay for (i = 0; i < n; i++){ 498a7e14dcfSSatish Balay x[i] = -c[i] + lambda*a[i]; 4996c23d075SBarry Smith if (x[i] > u[i]) x[i] = u[i]; 5006c23d075SBarry Smith else if(x[i] < l[i]) x[i] = l[i]; 501a7e14dcfSSatish Balay r += a[i]*x[i]; 502a7e14dcfSSatish Balay } 503a7e14dcfSSatish Balay return r - b; 504a7e14dcfSSatish Balay } 505a7e14dcfSSatish Balay 506a7e14dcfSSatish Balay /** Modified Dai-Fletcher QP projector solves the problem: 507a7e14dcfSSatish Balay * 508a7e14dcfSSatish Balay * minimise 0.5*x'*x - c'*x 509a7e14dcfSSatish Balay * subj to a'*x = b 510a7e14dcfSSatish Balay * l \leq x \leq u 511a7e14dcfSSatish Balay * 512a7e14dcfSSatish Balay * \param c The point to be projected onto feasible set 513a7e14dcfSSatish Balay */ 514a7e14dcfSSatish Balay #undef __FUNCT__ 515a7e14dcfSSatish Balay #define __FUNCT__ "project" 5166c23d075SBarry Smith PetscInt project(PetscInt n,PetscReal *a,PetscReal b,PetscReal *c,PetscReal *l,PetscReal *u,PetscReal *x,PetscReal *lam_ext,TAO_DF *df) 517a7e14dcfSSatish Balay { 518a7e14dcfSSatish Balay PetscReal lambda, lambdal, lambdau, dlambda, lambda_new; 519a7e14dcfSSatish Balay PetscReal r, rl, ru, s; 520a7e14dcfSSatish Balay PetscInt innerIter; 521a7e14dcfSSatish Balay PetscBool nonNegativeSlack = PETSC_FALSE; 522*53506e15SBarry Smith PetscErrorCode ierr; 523a7e14dcfSSatish Balay 524a7e14dcfSSatish Balay *lam_ext = 0; 525a7e14dcfSSatish Balay lambda = 0; 526a7e14dcfSSatish Balay dlambda = 0.5; 527a7e14dcfSSatish Balay innerIter = 1; 528a7e14dcfSSatish Balay 529a7e14dcfSSatish Balay /* \phi(x;lambda) := 0.5*x'*x + c'*x - lambda*(a'*x-b) 530a7e14dcfSSatish Balay * 531a7e14dcfSSatish Balay * Optimality conditions for \phi: 532a7e14dcfSSatish Balay * 533a7e14dcfSSatish Balay * 1. lambda <= 0 534a7e14dcfSSatish Balay * 2. r <= 0 535a7e14dcfSSatish Balay * 3. r*lambda == 0 536a7e14dcfSSatish Balay */ 537a7e14dcfSSatish Balay 538a7e14dcfSSatish Balay /* Bracketing Phase */ 539a7e14dcfSSatish Balay r = phi(x, n, lambda, a, b, c, l, u); 540a7e14dcfSSatish Balay 5416c23d075SBarry Smith if(nonNegativeSlack) { 542a7e14dcfSSatish Balay /* inequality constraint, i.e., with \xi >= 0 constraint */ 543*53506e15SBarry Smith if (r < TOL_R) return 0; 5446c23d075SBarry Smith } else { 545a7e14dcfSSatish Balay /* equality constraint ,i.e., without \xi >= 0 constraint */ 546*53506e15SBarry Smith if (fabs(r) < TOL_R) return 0; 547a7e14dcfSSatish Balay } 548a7e14dcfSSatish Balay 549a7e14dcfSSatish Balay if (r < 0.0){ 550a7e14dcfSSatish Balay lambdal = lambda; 551a7e14dcfSSatish Balay rl = r; 552a7e14dcfSSatish Balay lambda = lambda + dlambda; 553a7e14dcfSSatish Balay r = phi(x, n, lambda, a, b, c, l, u); 554a7e14dcfSSatish Balay while (r < 0.0 && dlambda < BMRM_INFTY) { 555a7e14dcfSSatish Balay lambdal = lambda; 556a7e14dcfSSatish Balay s = rl/r - 1.0; 557a7e14dcfSSatish Balay if (s < 0.1) s = 0.1; 558a7e14dcfSSatish Balay dlambda = dlambda + dlambda/s; 559a7e14dcfSSatish Balay lambda = lambda + dlambda; 560a7e14dcfSSatish Balay rl = r; 561a7e14dcfSSatish Balay r = phi(x, n, lambda, a, b, c, l, u); 562a7e14dcfSSatish Balay } 563a7e14dcfSSatish Balay lambdau = lambda; 564a7e14dcfSSatish Balay ru = r; 5656c23d075SBarry Smith } else { 566a7e14dcfSSatish Balay lambdau = lambda; 567a7e14dcfSSatish Balay ru = r; 568a7e14dcfSSatish Balay lambda = lambda - dlambda; 569a7e14dcfSSatish Balay r = phi(x, n, lambda, a, b, c, l, u); 570a7e14dcfSSatish Balay while (r > 0.0 && dlambda > -BMRM_INFTY) { 571a7e14dcfSSatish Balay lambdau = lambda; 572a7e14dcfSSatish Balay s = ru/r - 1.0; 573a7e14dcfSSatish Balay if (s < 0.1) s = 0.1; 574a7e14dcfSSatish Balay dlambda = dlambda + dlambda/s; 575a7e14dcfSSatish Balay lambda = lambda - dlambda; 576a7e14dcfSSatish Balay ru = r; 577a7e14dcfSSatish Balay r = phi(x, n, lambda, a, b, c, l, u); 578a7e14dcfSSatish Balay } 579a7e14dcfSSatish Balay lambdal = lambda; 580a7e14dcfSSatish Balay rl = r; 581a7e14dcfSSatish Balay } 582a7e14dcfSSatish Balay 5836c23d075SBarry Smith if(fabs(dlambda) > BMRM_INFTY) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"L2N2_DaiFletcherPGM detected Infeasible QP problem!"); 584a7e14dcfSSatish Balay 585a7e14dcfSSatish Balay if(ru == 0){ 586a7e14dcfSSatish Balay lambda = lambdau; 587a7e14dcfSSatish Balay r = phi(x, n, lambda, a, b, c, l, u); 588a7e14dcfSSatish Balay return innerIter; 589a7e14dcfSSatish Balay } 590a7e14dcfSSatish Balay 591a7e14dcfSSatish Balay /* Secant Phase */ 592a7e14dcfSSatish Balay s = 1.0 - rl/ru; 593a7e14dcfSSatish Balay dlambda = dlambda/s; 594a7e14dcfSSatish Balay lambda = lambdau - dlambda; 595a7e14dcfSSatish Balay r = phi(x, n, lambda, a, b, c, l, u); 596a7e14dcfSSatish Balay 597a7e14dcfSSatish Balay while (fabs(r) > TOL_R 598a7e14dcfSSatish Balay && dlambda > TOL_LAM * (1.0 + fabs(lambda)) 599a7e14dcfSSatish Balay && innerIter < df->maxProjIter){ 600a7e14dcfSSatish Balay innerIter++; 601a7e14dcfSSatish Balay if (r > 0.0){ 602a7e14dcfSSatish Balay if (s <= 2.0){ 603a7e14dcfSSatish Balay lambdau = lambda; 604a7e14dcfSSatish Balay ru = r; 605a7e14dcfSSatish Balay s = 1.0 - rl/ru; 606a7e14dcfSSatish Balay dlambda = (lambdau - lambdal) / s; 607a7e14dcfSSatish Balay lambda = lambdau - dlambda; 608*53506e15SBarry Smith } else { 609a7e14dcfSSatish Balay s = ru/r-1.0; 610a7e14dcfSSatish Balay if (s < 0.1) s = 0.1; 611a7e14dcfSSatish Balay dlambda = (lambdau - lambda) / s; 612a7e14dcfSSatish Balay lambda_new = 0.75*lambdal + 0.25*lambda; 613a7e14dcfSSatish Balay if (lambda_new < (lambda - dlambda)) 614a7e14dcfSSatish Balay lambda_new = lambda - dlambda; 615a7e14dcfSSatish Balay lambdau = lambda; 616a7e14dcfSSatish Balay ru = r; 617a7e14dcfSSatish Balay lambda = lambda_new; 618a7e14dcfSSatish Balay s = (lambdau - lambdal) / (lambdau - lambda); 619a7e14dcfSSatish Balay } 620*53506e15SBarry Smith } else { 621a7e14dcfSSatish Balay if (s >= 2.0){ 622a7e14dcfSSatish Balay lambdal = lambda; 623a7e14dcfSSatish Balay rl = r; 624a7e14dcfSSatish Balay s = 1.0 - rl/ru; 625a7e14dcfSSatish Balay dlambda = (lambdau - lambdal) / s; 626a7e14dcfSSatish Balay lambda = lambdau - dlambda; 627*53506e15SBarry Smith } else { 628a7e14dcfSSatish Balay s = rl/r - 1.0; 629a7e14dcfSSatish Balay if (s < 0.1) s = 0.1; 630a7e14dcfSSatish Balay dlambda = (lambda-lambdal) / s; 631a7e14dcfSSatish Balay lambda_new = 0.75*lambdau + 0.25*lambda; 632a7e14dcfSSatish Balay if (lambda_new > (lambda + dlambda)) 633a7e14dcfSSatish Balay lambda_new = lambda + dlambda; 634a7e14dcfSSatish Balay lambdal = lambda; 635a7e14dcfSSatish Balay rl = r; 636a7e14dcfSSatish Balay lambda = lambda_new; 637a7e14dcfSSatish Balay s = (lambdau - lambdal) / (lambdau-lambda); 638a7e14dcfSSatish Balay } 639a7e14dcfSSatish Balay } 640a7e14dcfSSatish Balay r = phi(x, n, lambda, a, b, c, l, u); 641a7e14dcfSSatish Balay } 642a7e14dcfSSatish Balay 643a7e14dcfSSatish Balay *lam_ext = lambda; 644*53506e15SBarry Smith if(innerIter >= df->maxProjIter) { 645*53506e15SBarry Smith ierr = PetscPrintf(PETSC_COMM_SELF, "WARNING: DaiFletcher max iterations\n");CHKERRQ(ierr); 646*53506e15SBarry Smith } 647a7e14dcfSSatish Balay return innerIter; 648a7e14dcfSSatish Balay } 649a7e14dcfSSatish Balay 650a7e14dcfSSatish Balay 651a7e14dcfSSatish Balay #undef __FUNCT__ 652a7e14dcfSSatish Balay #define __FUNCT__ "solve" 653a7e14dcfSSatish Balay PetscErrorCode solve(TAO_DF *df) 654a7e14dcfSSatish Balay { 655a7e14dcfSSatish Balay PetscErrorCode ierr; 656a7e14dcfSSatish Balay PetscInt i, j, innerIter, it, it2, luv, info, lscount = 0, projcount = 0; 657a7e14dcfSSatish Balay PetscReal gd, max, ak, bk, akold, bkold, lamnew, alpha, kktlam=0.0, lam_ext; 658a7e14dcfSSatish Balay PetscReal DELTAsv, ProdDELTAsv; 659a7e14dcfSSatish Balay PetscReal c, *tempQ; 660a7e14dcfSSatish Balay PetscReal *x = df->x, *a = df->a, b = df->b, *l = df->l, *u = df->u, tol = df->tol; 661a7e14dcfSSatish Balay PetscReal *tempv = df->tempv, *y = df->y, *g = df->g, *d = df->d, *Qd = df->Qd; 662a7e14dcfSSatish Balay PetscReal *xplus = df->xplus, *tplus = df->tplus, *sk = df->sk, *yk = df->yk; 663a7e14dcfSSatish Balay PetscReal **Q = df->Q, *f = df->f, *t = df->t; 664a7e14dcfSSatish Balay PetscInt dim = df->dim, *ipt = df->ipt, *ipt2 = df->ipt2, *uv = df->uv; 665a7e14dcfSSatish Balay 666a7e14dcfSSatish Balay /*** variables for the adaptive nonmonotone linesearch ***/ 667a7e14dcfSSatish Balay PetscInt L, llast; 668a7e14dcfSSatish Balay PetscReal fr, fbest, fv, fc, fv0; 669*53506e15SBarry Smith 670a7e14dcfSSatish Balay c = BMRM_INFTY; 671a7e14dcfSSatish Balay 672a7e14dcfSSatish Balay DELTAsv = EPS_SV; 673*53506e15SBarry Smith if (tol <= 1.0e-5 || dim <= 20) ProdDELTAsv = 0.0F; 674*53506e15SBarry Smith else ProdDELTAsv = EPS_SV; 675a7e14dcfSSatish Balay 676*53506e15SBarry Smith for (i = 0; i < dim; i++) tempv[i] = -x[i]; 677a7e14dcfSSatish Balay 678a7e14dcfSSatish Balay lam_ext = 0.0; 679a7e14dcfSSatish Balay 680a7e14dcfSSatish Balay /* Project the initial solution */ 681a7e14dcfSSatish Balay projcount += project(dim, a, b, tempv, l, u, x, &lam_ext, df); 682a7e14dcfSSatish Balay 683a7e14dcfSSatish Balay /* Compute gradient 684a7e14dcfSSatish Balay g = Q*x + f; */ 685a7e14dcfSSatish Balay 686a7e14dcfSSatish Balay it = 0; 687*53506e15SBarry Smith for (i = 0; i < dim; i++) { 688*53506e15SBarry Smith if (fabs(x[i]) > ProdDELTAsv) ipt[it++] = i; 689*53506e15SBarry Smith } 690a7e14dcfSSatish Balay 691a7e14dcfSSatish Balay ierr = PetscMemzero(t, dim*sizeof(PetscReal)); CHKERRQ(ierr); 692a7e14dcfSSatish Balay for (i = 0; i < it; i++){ 693a7e14dcfSSatish Balay tempQ = Q[ipt[i]]; 694*53506e15SBarry Smith for (j = 0; j < dim; j++) t[j] += (tempQ[j]*x[ipt[i]]); 695a7e14dcfSSatish Balay } 696a7e14dcfSSatish Balay for (i = 0; i < dim; i++){ 697a7e14dcfSSatish Balay g[i] = t[i] + f[i]; 698a7e14dcfSSatish Balay } 699a7e14dcfSSatish Balay 700a7e14dcfSSatish Balay 701a7e14dcfSSatish Balay /* y = -(x_{k} - g_{k}) */ 702a7e14dcfSSatish Balay for (i = 0; i < dim; i++){ 703a7e14dcfSSatish Balay y[i] = g[i] - x[i]; 704a7e14dcfSSatish Balay } 705a7e14dcfSSatish Balay 706a7e14dcfSSatish Balay /* Project x_{k} - g_{k} */ 707a7e14dcfSSatish Balay projcount += project(dim, a, b, y, l, u, tempv, &lam_ext, df); 708a7e14dcfSSatish Balay 709a7e14dcfSSatish Balay /* y = P(x_{k} - g_{k}) - x_{k} */ 710a7e14dcfSSatish Balay max = ALPHA_MIN; 711a7e14dcfSSatish Balay for (i = 0; i < dim; i++){ 712a7e14dcfSSatish Balay y[i] = tempv[i] - x[i]; 713*53506e15SBarry Smith if (fabs(y[i]) > max) max = fabs(y[i]); 714a7e14dcfSSatish Balay } 715a7e14dcfSSatish Balay 716a7e14dcfSSatish Balay if (max < tol*1e-3){ 717a7e14dcfSSatish Balay lscount = 0; 718a7e14dcfSSatish Balay innerIter = 0; 719a7e14dcfSSatish Balay return 0; 720a7e14dcfSSatish Balay } 721a7e14dcfSSatish Balay 722a7e14dcfSSatish Balay alpha = 1.0 / max; 723a7e14dcfSSatish Balay 724a7e14dcfSSatish Balay /* fv0 = f(x_{0}). Recall t = Q x_{k} */ 725a7e14dcfSSatish Balay fv0 = 0.0; 726*53506e15SBarry Smith for (i = 0; i < dim; i++) fv0 += x[i] * (0.5*t[i] + f[i]); 727a7e14dcfSSatish Balay 728a7e14dcfSSatish Balay /*** adaptive nonmonotone linesearch ***/ 729a7e14dcfSSatish Balay L = 2; 730a7e14dcfSSatish Balay fr = ALPHA_MAX; 731a7e14dcfSSatish Balay fbest = fv0; 732a7e14dcfSSatish Balay fc = fv0; 733a7e14dcfSSatish Balay llast = 0; 734a7e14dcfSSatish Balay akold = bkold = 0.0; 735a7e14dcfSSatish Balay 736a7e14dcfSSatish Balay /*** Iterator begins ***/ 737a7e14dcfSSatish Balay for (innerIter = 1; innerIter <= df->maxPGMIter; innerIter++) { 738a7e14dcfSSatish Balay 739a7e14dcfSSatish Balay /* tempv = -(x_{k} - alpha*g_{k}) */ 740*53506e15SBarry Smith for (i = 0; i < dim; i++) tempv[i] = alpha*g[i] - x[i]; 741a7e14dcfSSatish Balay 742a7e14dcfSSatish Balay /* Project x_{k} - alpha*g_{k} */ 743a7e14dcfSSatish Balay projcount += project(dim, a, b, tempv, l, u, y, &lam_ext, df); 744a7e14dcfSSatish Balay 745a7e14dcfSSatish Balay 746a7e14dcfSSatish Balay /* gd = \inner{d_{k}}{g_{k}} 747a7e14dcfSSatish Balay d = P(x_{k} - alpha*g_{k}) - x_{k} 748a7e14dcfSSatish Balay */ 749a7e14dcfSSatish Balay gd = 0.0; 750a7e14dcfSSatish Balay for (i = 0; i < dim; i++){ 751a7e14dcfSSatish Balay d[i] = y[i] - x[i]; 752a7e14dcfSSatish Balay gd += d[i] * g[i]; 753a7e14dcfSSatish Balay } 754a7e14dcfSSatish Balay 755a7e14dcfSSatish Balay /* Gradient computation */ 756a7e14dcfSSatish Balay 757a7e14dcfSSatish Balay /* compute Qd = Q*d or Qd = Q*y - t depending on their sparsity */ 758a7e14dcfSSatish Balay 759a7e14dcfSSatish Balay it = it2 = 0; 760*53506e15SBarry Smith for (i = 0; i < dim; i++){ 761*53506e15SBarry Smith if (fabs(d[i]) > (ProdDELTAsv*1.0e-2)) ipt[it++] = i; 762*53506e15SBarry Smith } 763*53506e15SBarry Smith for (i = 0; i < dim; i++) { 764*53506e15SBarry Smith if (fabs(y[i]) > ProdDELTAsv) ipt2[it2++] = i; 765*53506e15SBarry Smith } 766a7e14dcfSSatish Balay 767a7e14dcfSSatish Balay ierr = PetscMemzero(Qd, dim*sizeof(PetscReal)); CHKERRQ(ierr); 768a7e14dcfSSatish Balay /* compute Qd = Q*d */ 769a7e14dcfSSatish Balay if (it < it2){ 770a7e14dcfSSatish Balay for (i = 0; i < it; i++){ 771a7e14dcfSSatish Balay tempQ = Q[ipt[i]]; 772*53506e15SBarry Smith for (j = 0; j < dim; j++) Qd[j] += (tempQ[j] * d[ipt[i]]); 773a7e14dcfSSatish Balay } 774*53506e15SBarry Smith } else { /* compute Qd = Q*y-t */ 775a7e14dcfSSatish Balay for (i = 0; i < it2; i++){ 776a7e14dcfSSatish Balay tempQ = Q[ipt2[i]]; 777*53506e15SBarry Smith for (j = 0; j < dim; j++) Qd[j] += (tempQ[j] * y[ipt2[i]]); 778a7e14dcfSSatish Balay } 779*53506e15SBarry Smith for (j = 0; j < dim; j++) Qd[j] -= t[j]; 780a7e14dcfSSatish Balay } 781a7e14dcfSSatish Balay 782a7e14dcfSSatish Balay /* ak = inner{d_{k}}{d_{k}} */ 783a7e14dcfSSatish Balay ak = 0.0; 784*53506e15SBarry Smith for (i = 0; i < dim; i++) ak += d[i] * d[i]; 785a7e14dcfSSatish Balay 786a7e14dcfSSatish Balay bk = 0.0; 787*53506e15SBarry Smith for (i = 0; i < dim; i++) bk += d[i]*Qd[i]; 788a7e14dcfSSatish Balay 789*53506e15SBarry Smith if (bk > EPS*ak && gd < 0.0) lamnew = -gd/bk; 790*53506e15SBarry Smith else lamnew = 1.0; 791a7e14dcfSSatish Balay 792a7e14dcfSSatish Balay /* fv is computing f(x_{k} + d_{k}) */ 793a7e14dcfSSatish Balay fv = 0.0; 794a7e14dcfSSatish Balay for (i = 0; i < dim; i++){ 795a7e14dcfSSatish Balay xplus[i] = x[i] + d[i]; 796a7e14dcfSSatish Balay tplus[i] = t[i] + Qd[i]; 797a7e14dcfSSatish Balay fv += xplus[i] * (0.5*tplus[i] + f[i]); 798a7e14dcfSSatish Balay } 799a7e14dcfSSatish Balay 800a7e14dcfSSatish Balay /* fr is fref */ 801a7e14dcfSSatish Balay if ((innerIter == 1 && fv >= fv0) || (innerIter > 1 && fv >= fr)){ 802a7e14dcfSSatish Balay lscount++; 803a7e14dcfSSatish Balay fv = 0.0; 804a7e14dcfSSatish Balay for (i = 0; i < dim; i++){ 805a7e14dcfSSatish Balay xplus[i] = x[i] + lamnew*d[i]; 806a7e14dcfSSatish Balay tplus[i] = t[i] + lamnew*Qd[i]; 807a7e14dcfSSatish Balay fv += xplus[i] * (0.5*tplus[i] + f[i]); 808a7e14dcfSSatish Balay } 809a7e14dcfSSatish Balay } 810a7e14dcfSSatish Balay 811a7e14dcfSSatish Balay for (i = 0; i < dim; i++){ 812a7e14dcfSSatish Balay sk[i] = xplus[i] - x[i]; 813a7e14dcfSSatish Balay yk[i] = tplus[i] - t[i]; 814a7e14dcfSSatish Balay x[i] = xplus[i]; 815a7e14dcfSSatish Balay t[i] = tplus[i]; 816a7e14dcfSSatish Balay g[i] = t[i] + f[i]; 817a7e14dcfSSatish Balay } 818a7e14dcfSSatish Balay 819a7e14dcfSSatish Balay /* update the line search control parameters */ 820a7e14dcfSSatish Balay if (fv < fbest){ 821a7e14dcfSSatish Balay fbest = fv; 822a7e14dcfSSatish Balay fc = fv; 823a7e14dcfSSatish Balay llast = 0; 824*53506e15SBarry Smith } else { 825a7e14dcfSSatish Balay fc = (fc > fv ? fc : fv); 826a7e14dcfSSatish Balay llast++; 827a7e14dcfSSatish Balay if (llast == L){ 828a7e14dcfSSatish Balay fr = fc; 829a7e14dcfSSatish Balay fc = fv; 830a7e14dcfSSatish Balay llast = 0; 831a7e14dcfSSatish Balay } 832a7e14dcfSSatish Balay } 833a7e14dcfSSatish Balay 834a7e14dcfSSatish Balay ak = bk = 0.0; 835a7e14dcfSSatish Balay for (i = 0; i < dim; i++){ 836a7e14dcfSSatish Balay ak += sk[i] * sk[i]; 837a7e14dcfSSatish Balay bk += sk[i] * yk[i]; 838a7e14dcfSSatish Balay } 839a7e14dcfSSatish Balay 840*53506e15SBarry Smith if (bk <= EPS*ak) alpha = ALPHA_MAX; 841a7e14dcfSSatish Balay else { 842*53506e15SBarry Smith if (bkold < EPS*akold) alpha = ak/bk; 843*53506e15SBarry Smith else alpha = (akold+ak)/(bkold+bk); 844a7e14dcfSSatish Balay 845*53506e15SBarry Smith if (alpha > ALPHA_MAX) alpha = ALPHA_MAX; 846*53506e15SBarry Smith else if (alpha < ALPHA_MIN) alpha = ALPHA_MIN; 847a7e14dcfSSatish Balay } 848a7e14dcfSSatish Balay 849a7e14dcfSSatish Balay akold = ak; 850a7e14dcfSSatish Balay bkold = bk; 851a7e14dcfSSatish Balay 852a7e14dcfSSatish Balay /*** stopping criterion based on KKT conditions ***/ 853a7e14dcfSSatish Balay /* at optimal, gradient of lagrangian w.r.t. x is zero */ 854a7e14dcfSSatish Balay 855a7e14dcfSSatish Balay bk = 0.0; 856*53506e15SBarry Smith for (i = 0; i < dim; i++) bk += x[i] * x[i]; 857a7e14dcfSSatish Balay 858*53506e15SBarry Smith if (PetscSqrtReal(ak) < tol*10 * PetscSqrtReal(bk)){ 859a7e14dcfSSatish Balay it = 0; 860a7e14dcfSSatish Balay luv = 0; 861a7e14dcfSSatish Balay kktlam = 0.0; 862a7e14dcfSSatish Balay for (i = 0; i < dim; i++){ 863a7e14dcfSSatish Balay /* x[i] is active hence lagrange multipliers for box constraints 864a7e14dcfSSatish Balay are zero. The lagrange multiplier for ineq. const. is then 865a7e14dcfSSatish Balay defined as below 866a7e14dcfSSatish Balay */ 867a7e14dcfSSatish Balay if ((x[i] > DELTAsv) && (x[i] < c-DELTAsv)){ 868a7e14dcfSSatish Balay ipt[it++] = i; 869a7e14dcfSSatish Balay kktlam = kktlam - a[i]*g[i]; 870*53506e15SBarry Smith } else uv[luv++] = i; 871a7e14dcfSSatish Balay } 872a7e14dcfSSatish Balay 873*53506e15SBarry Smith if (it == 0 && PetscSqrtReal(ak) < tol*0.5 * PetscSqrtReal(bk)) return 0; 874a7e14dcfSSatish Balay else { 875a7e14dcfSSatish Balay kktlam = kktlam/it; 876a7e14dcfSSatish Balay info = 1; 877a7e14dcfSSatish Balay for (i = 0; i < it; i++) { 878a7e14dcfSSatish Balay if (fabs(a[ipt[i]] * g[ipt[i]] + kktlam) > tol) { 879a7e14dcfSSatish Balay info = 0; 880a7e14dcfSSatish Balay break; 881a7e14dcfSSatish Balay } 882a7e14dcfSSatish Balay } 883a7e14dcfSSatish Balay if (info == 1) { 884a7e14dcfSSatish Balay for (i = 0; i < luv; i++) { 885a7e14dcfSSatish Balay if (x[uv[i]] <= DELTAsv){ 886a7e14dcfSSatish Balay /* x[i] == lower bound, hence, lagrange multiplier (say, beta) for lower bound may 887a7e14dcfSSatish Balay not be zero. So, the gradient without beta is > 0 888a7e14dcfSSatish Balay */ 889a7e14dcfSSatish Balay if (g[uv[i]] + kktlam*a[uv[i]] < -tol){ 890a7e14dcfSSatish Balay info = 0; 891a7e14dcfSSatish Balay break; 892a7e14dcfSSatish Balay } 893*53506e15SBarry Smith } else { 894a7e14dcfSSatish Balay /* x[i] == upper bound, hence, lagrange multiplier (say, eta) for upper bound may 895a7e14dcfSSatish Balay not be zero. So, the gradient without eta is < 0 896a7e14dcfSSatish Balay */ 897a7e14dcfSSatish Balay if (g[uv[i]] + kktlam*a[uv[i]] > tol) { 898a7e14dcfSSatish Balay info = 0; 899a7e14dcfSSatish Balay break; 900a7e14dcfSSatish Balay } 901a7e14dcfSSatish Balay } 902a7e14dcfSSatish Balay } 903a7e14dcfSSatish Balay } 904a7e14dcfSSatish Balay 905*53506e15SBarry Smith if (info == 1) return 0; 906a7e14dcfSSatish Balay } 907a7e14dcfSSatish Balay } 908a7e14dcfSSatish Balay } 909a7e14dcfSSatish Balay return 0; 910a7e14dcfSSatish Balay } 911a7e14dcfSSatish Balay 912a7e14dcfSSatish Balay 913