1c4762a1bSJed Brown /* 2c4762a1bSJed Brown Include "petsctao.h" so that we can use TAO solvers. Note that this 3c4762a1bSJed Brown file automatically includes libraries such as: 4c4762a1bSJed Brown petsc.h - base PETSc routines petscvec.h - vectors 5a5b23f4aSJose E. Roman petscsys.h - system routines petscmat.h - matrices 6c4762a1bSJed Brown petscis.h - index sets petscksp.h - Krylov subspace methods 7c4762a1bSJed Brown petscviewer.h - viewers petscpc.h - preconditioners 8c4762a1bSJed Brown 9c4762a1bSJed Brown */ 10c4762a1bSJed Brown 11c4762a1bSJed Brown #include <petsctao.h> 12c4762a1bSJed Brown 13c4762a1bSJed Brown /* 14c4762a1bSJed Brown Description: These data are the result of a NIST study involving 15c4762a1bSJed Brown ultrasonic calibration. The response variable is 16c4762a1bSJed Brown ultrasonic response, and the predictor variable is 17c4762a1bSJed Brown metal distance. 18c4762a1bSJed Brown 19c4762a1bSJed Brown Reference: Chwirut, D., NIST (197?). 20c4762a1bSJed Brown Ultrasonic Reference Block Study. 21c4762a1bSJed Brown */ 22c4762a1bSJed Brown 23c4762a1bSJed Brown static char help[]="Finds the nonlinear least-squares solution to the model \n\ 24c4762a1bSJed Brown y = exp[-b1*x]/(b2+b3*x) + e \n"; 25c4762a1bSJed Brown 26c4762a1bSJed Brown /* T 27c4762a1bSJed Brown Concepts: TAO^Solving a system of nonlinear equations, nonlinear least squares 28c4762a1bSJed Brown Routines: TaoCreate(); 29c4762a1bSJed Brown Routines: TaoSetType(); 30c4762a1bSJed Brown Routines: TaoSetResidualRoutine(); 31c4762a1bSJed Brown Routines: TaoSetMonitor(); 32c4762a1bSJed Brown Routines: TaoSetInitialVector(); 33c4762a1bSJed Brown Routines: TaoSetFromOptions(); 34c4762a1bSJed Brown Routines: TaoSolve(); 35c4762a1bSJed Brown Routines: TaoDestroy(); 36c4762a1bSJed Brown Processors: n 37c4762a1bSJed Brown T*/ 38c4762a1bSJed Brown 39c4762a1bSJed Brown #define NOBSERVATIONS 214 40c4762a1bSJed Brown #define NPARAMETERS 3 41c4762a1bSJed Brown 42c4762a1bSJed Brown #define DIE_TAG 2000 43c4762a1bSJed Brown #define IDLE_TAG 1000 44c4762a1bSJed Brown 45c4762a1bSJed Brown /* User-defined application context */ 46c4762a1bSJed Brown typedef struct { 47c4762a1bSJed Brown /* Working space */ 48c4762a1bSJed Brown PetscReal t[NOBSERVATIONS]; /* array of independent variables of observation */ 49c4762a1bSJed Brown PetscReal y[NOBSERVATIONS]; /* array of dependent variables */ 50c4762a1bSJed Brown PetscMPIInt size,rank; 51c4762a1bSJed Brown } AppCtx; 52c4762a1bSJed Brown 53c4762a1bSJed Brown /* User provided Routines */ 54c4762a1bSJed Brown PetscErrorCode InitializeData(AppCtx *user); 55c4762a1bSJed Brown PetscErrorCode FormStartingPoint(Vec); 56c4762a1bSJed Brown PetscErrorCode EvaluateFunction(Tao, Vec, Vec, void *); 57c4762a1bSJed Brown PetscErrorCode TaskWorker(AppCtx *user); 58c4762a1bSJed Brown PetscErrorCode StopWorkers(AppCtx *user); 59c4762a1bSJed Brown PetscErrorCode RunSimulation(PetscReal *x, PetscInt i, PetscReal*f, AppCtx *user); 60c4762a1bSJed Brown 61c4762a1bSJed Brown /*--------------------------------------------------------------------*/ 62c4762a1bSJed Brown int main(int argc,char **argv) 63c4762a1bSJed Brown { 64c4762a1bSJed Brown PetscErrorCode ierr; /* used to check for functions returning nonzeros */ 65c4762a1bSJed Brown Vec x, f; /* solution, function */ 66c4762a1bSJed Brown Tao tao; /* Tao solver context */ 67c4762a1bSJed Brown AppCtx user; /* user-defined work context */ 68c4762a1bSJed Brown 69c4762a1bSJed Brown /* Initialize TAO and PETSc */ 70c4762a1bSJed Brown ierr = PetscInitialize(&argc,&argv,(char *)0,help);if (ierr) return ierr; 71c4762a1bSJed Brown MPI_Comm_size(MPI_COMM_WORLD,&user.size); 72c4762a1bSJed Brown MPI_Comm_rank(MPI_COMM_WORLD,&user.rank); 73c4762a1bSJed Brown ierr = InitializeData(&user);CHKERRQ(ierr); 74c4762a1bSJed Brown 75c4762a1bSJed Brown /* Run optimization on rank 0 */ 76c4762a1bSJed Brown if (user.rank == 0) { 77c4762a1bSJed Brown /* Allocate vectors */ 78c4762a1bSJed Brown ierr = VecCreateSeq(PETSC_COMM_SELF,NPARAMETERS,&x);CHKERRQ(ierr); 79c4762a1bSJed Brown ierr = VecCreateSeq(PETSC_COMM_SELF,NOBSERVATIONS,&f);CHKERRQ(ierr); 80c4762a1bSJed Brown 81c4762a1bSJed Brown /* TAO code begins here */ 82c4762a1bSJed Brown 83c4762a1bSJed Brown /* Create TAO solver and set desired solution method */ 84c4762a1bSJed Brown ierr = TaoCreate(PETSC_COMM_SELF,&tao);CHKERRQ(ierr); 85c4762a1bSJed Brown ierr = TaoSetType(tao,TAOPOUNDERS);CHKERRQ(ierr); 86c4762a1bSJed Brown 87c4762a1bSJed Brown /* Set the function and Jacobian routines. */ 88c4762a1bSJed Brown ierr = FormStartingPoint(x);CHKERRQ(ierr); 89c4762a1bSJed Brown ierr = TaoSetInitialVector(tao,x);CHKERRQ(ierr); 90c4762a1bSJed Brown ierr = TaoSetResidualRoutine(tao,f,EvaluateFunction,(void*)&user);CHKERRQ(ierr); 91c4762a1bSJed Brown 92c4762a1bSJed Brown /* Check for any TAO command line arguments */ 93c4762a1bSJed Brown ierr = TaoSetFromOptions(tao);CHKERRQ(ierr); 94c4762a1bSJed Brown 95c4762a1bSJed Brown /* Perform the Solve */ 96c4762a1bSJed Brown ierr = TaoSolve(tao);CHKERRQ(ierr); 97c4762a1bSJed Brown 98c4762a1bSJed Brown /* Free TAO data structures */ 99c4762a1bSJed Brown ierr = TaoDestroy(&tao);CHKERRQ(ierr); 100c4762a1bSJed Brown 101c4762a1bSJed Brown /* Free PETSc data structures */ 102c4762a1bSJed Brown ierr = VecDestroy(&x);CHKERRQ(ierr); 103c4762a1bSJed Brown ierr = VecDestroy(&f);CHKERRQ(ierr); 104c4762a1bSJed Brown StopWorkers(&user); 105c4762a1bSJed Brown } else { 106c4762a1bSJed Brown TaskWorker(&user); 107c4762a1bSJed Brown } 108c4762a1bSJed Brown ierr = PetscFinalize(); 109c4762a1bSJed Brown return ierr; 110c4762a1bSJed Brown } 111c4762a1bSJed Brown 112c4762a1bSJed Brown /*--------------------------------------------------------------------*/ 113c4762a1bSJed Brown PetscErrorCode EvaluateFunction(Tao tao, Vec X, Vec F, void *ptr) 114c4762a1bSJed Brown { 115c4762a1bSJed Brown AppCtx *user = (AppCtx *)ptr; 116c4762a1bSJed Brown PetscInt i; 117c4762a1bSJed Brown PetscReal *x,*f; 118c4762a1bSJed Brown PetscErrorCode ierr; 119c4762a1bSJed Brown 120c4762a1bSJed Brown PetscFunctionBegin; 121c4762a1bSJed Brown ierr = VecGetArray(X,&x);CHKERRQ(ierr); 122c4762a1bSJed Brown ierr = VecGetArray(F,&f);CHKERRQ(ierr); 123c4762a1bSJed Brown if (user->size == 1) { 124c4762a1bSJed Brown /* Single processor */ 125c4762a1bSJed Brown for (i=0;i<NOBSERVATIONS;i++) { 126c4762a1bSJed Brown ierr = RunSimulation(x,i,&f[i],user);CHKERRQ(ierr); 127c4762a1bSJed Brown } 128c4762a1bSJed Brown } else { 1299dddd249SSatish Balay /* Multiprocessor main */ 130c4762a1bSJed Brown PetscMPIInt tag; 131c4762a1bSJed Brown PetscInt finishedtasks,next_task,checkedin; 132c4762a1bSJed Brown PetscReal f_i=0.0; 133c4762a1bSJed Brown MPI_Status status; 134c4762a1bSJed Brown 135c4762a1bSJed Brown next_task=0; 136c4762a1bSJed Brown finishedtasks=0; 137c4762a1bSJed Brown checkedin=0; 138c4762a1bSJed Brown 139c4762a1bSJed Brown while (finishedtasks < NOBSERVATIONS || checkedin < user->size-1) { 140ffc4695bSBarry Smith ierr = MPI_Recv(&f_i,1,MPIU_REAL,MPI_ANY_SOURCE,MPI_ANY_TAG,PETSC_COMM_WORLD,&status);CHKERRMPI(ierr); 141c4762a1bSJed Brown if (status.MPI_TAG == IDLE_TAG) { 142c4762a1bSJed Brown checkedin++; 143c4762a1bSJed Brown } else { 144c4762a1bSJed Brown 145c4762a1bSJed Brown tag = status.MPI_TAG; 146c4762a1bSJed Brown f[tag] = (PetscReal)f_i; 147c4762a1bSJed Brown finishedtasks++; 148c4762a1bSJed Brown } 149c4762a1bSJed Brown 150c4762a1bSJed Brown if (next_task<NOBSERVATIONS) { 151ffc4695bSBarry Smith ierr = MPI_Send(x,NPARAMETERS,MPIU_REAL,status.MPI_SOURCE,next_task,PETSC_COMM_WORLD);CHKERRMPI(ierr); 152c4762a1bSJed Brown next_task++; 153c4762a1bSJed Brown 154c4762a1bSJed Brown } else { 155c4762a1bSJed Brown /* Send idle message */ 156ffc4695bSBarry Smith ierr = MPI_Send(x,NPARAMETERS,MPIU_REAL,status.MPI_SOURCE,IDLE_TAG,PETSC_COMM_WORLD);CHKERRMPI(ierr); 157c4762a1bSJed Brown } 158c4762a1bSJed Brown } 159c4762a1bSJed Brown } 160c4762a1bSJed Brown ierr = VecRestoreArray(X,&x);CHKERRQ(ierr); 161c4762a1bSJed Brown ierr = VecRestoreArray(F,&f);CHKERRQ(ierr); 162c4762a1bSJed Brown PetscLogFlops(6*NOBSERVATIONS); 163c4762a1bSJed Brown PetscFunctionReturn(0); 164c4762a1bSJed Brown } 165c4762a1bSJed Brown 166c4762a1bSJed Brown /* ------------------------------------------------------------ */ 167c4762a1bSJed Brown PetscErrorCode FormStartingPoint(Vec X) 168c4762a1bSJed Brown { 169c4762a1bSJed Brown PetscReal *x; 170c4762a1bSJed Brown PetscErrorCode ierr; 171c4762a1bSJed Brown 172c4762a1bSJed Brown PetscFunctionBegin; 173c4762a1bSJed Brown ierr = VecGetArray(X,&x);CHKERRQ(ierr); 174c4762a1bSJed Brown x[0] = 0.15; 175c4762a1bSJed Brown x[1] = 0.008; 176c4762a1bSJed Brown x[2] = 0.010; 177c4762a1bSJed Brown VecRestoreArray(X,&x);CHKERRQ(ierr); 178c4762a1bSJed Brown PetscFunctionReturn(0); 179c4762a1bSJed Brown } 180c4762a1bSJed Brown 181c4762a1bSJed Brown /* ---------------------------------------------------------------------- */ 182c4762a1bSJed Brown PetscErrorCode InitializeData(AppCtx *user) 183c4762a1bSJed Brown { 184c4762a1bSJed Brown PetscReal *t=user->t,*y=user->y; 185c4762a1bSJed Brown PetscInt i=0; 186c4762a1bSJed Brown 187c4762a1bSJed Brown PetscFunctionBegin; 188c4762a1bSJed Brown y[i] = 92.9000; t[i++] = 0.5000; 189c4762a1bSJed Brown y[i] = 78.7000; t[i++] = 0.6250; 190c4762a1bSJed Brown y[i] = 64.2000; t[i++] = 0.7500; 191c4762a1bSJed Brown y[i] = 64.9000; t[i++] = 0.8750; 192c4762a1bSJed Brown y[i] = 57.1000; t[i++] = 1.0000; 193c4762a1bSJed Brown y[i] = 43.3000; t[i++] = 1.2500; 194c4762a1bSJed Brown y[i] = 31.1000; t[i++] = 1.7500; 195c4762a1bSJed Brown y[i] = 23.6000; t[i++] = 2.2500; 196c4762a1bSJed Brown y[i] = 31.0500; t[i++] = 1.7500; 197c4762a1bSJed Brown y[i] = 23.7750; t[i++] = 2.2500; 198c4762a1bSJed Brown y[i] = 17.7375; t[i++] = 2.7500; 199c4762a1bSJed Brown y[i] = 13.8000; t[i++] = 3.2500; 200c4762a1bSJed Brown y[i] = 11.5875; t[i++] = 3.7500; 201c4762a1bSJed Brown y[i] = 9.4125; t[i++] = 4.2500; 202c4762a1bSJed Brown y[i] = 7.7250; t[i++] = 4.7500; 203c4762a1bSJed Brown y[i] = 7.3500; t[i++] = 5.2500; 204c4762a1bSJed Brown y[i] = 8.0250; t[i++] = 5.7500; 205c4762a1bSJed Brown y[i] = 90.6000; t[i++] = 0.5000; 206c4762a1bSJed Brown y[i] = 76.9000; t[i++] = 0.6250; 207c4762a1bSJed Brown y[i] = 71.6000; t[i++] = 0.7500; 208c4762a1bSJed Brown y[i] = 63.6000; t[i++] = 0.8750; 209c4762a1bSJed Brown y[i] = 54.0000; t[i++] = 1.0000; 210c4762a1bSJed Brown y[i] = 39.2000; t[i++] = 1.2500; 211c4762a1bSJed Brown y[i] = 29.3000; t[i++] = 1.7500; 212c4762a1bSJed Brown y[i] = 21.4000; t[i++] = 2.2500; 213c4762a1bSJed Brown y[i] = 29.1750; t[i++] = 1.7500; 214c4762a1bSJed Brown y[i] = 22.1250; t[i++] = 2.2500; 215c4762a1bSJed Brown y[i] = 17.5125; t[i++] = 2.7500; 216c4762a1bSJed Brown y[i] = 14.2500; t[i++] = 3.2500; 217c4762a1bSJed Brown y[i] = 9.4500; t[i++] = 3.7500; 218c4762a1bSJed Brown y[i] = 9.1500; t[i++] = 4.2500; 219c4762a1bSJed Brown y[i] = 7.9125; t[i++] = 4.7500; 220c4762a1bSJed Brown y[i] = 8.4750; t[i++] = 5.2500; 221c4762a1bSJed Brown y[i] = 6.1125; t[i++] = 5.7500; 222c4762a1bSJed Brown y[i] = 80.0000; t[i++] = 0.5000; 223c4762a1bSJed Brown y[i] = 79.0000; t[i++] = 0.6250; 224c4762a1bSJed Brown y[i] = 63.8000; t[i++] = 0.7500; 225c4762a1bSJed Brown y[i] = 57.2000; t[i++] = 0.8750; 226c4762a1bSJed Brown y[i] = 53.2000; t[i++] = 1.0000; 227c4762a1bSJed Brown y[i] = 42.5000; t[i++] = 1.2500; 228c4762a1bSJed Brown y[i] = 26.8000; t[i++] = 1.7500; 229c4762a1bSJed Brown y[i] = 20.4000; t[i++] = 2.2500; 230c4762a1bSJed Brown y[i] = 26.8500; t[i++] = 1.7500; 231c4762a1bSJed Brown y[i] = 21.0000; t[i++] = 2.2500; 232c4762a1bSJed Brown y[i] = 16.4625; t[i++] = 2.7500; 233c4762a1bSJed Brown y[i] = 12.5250; t[i++] = 3.2500; 234c4762a1bSJed Brown y[i] = 10.5375; t[i++] = 3.7500; 235c4762a1bSJed Brown y[i] = 8.5875; t[i++] = 4.2500; 236c4762a1bSJed Brown y[i] = 7.1250; t[i++] = 4.7500; 237c4762a1bSJed Brown y[i] = 6.1125; t[i++] = 5.2500; 238c4762a1bSJed Brown y[i] = 5.9625; t[i++] = 5.7500; 239c4762a1bSJed Brown y[i] = 74.1000; t[i++] = 0.5000; 240c4762a1bSJed Brown y[i] = 67.3000; t[i++] = 0.6250; 241c4762a1bSJed Brown y[i] = 60.8000; t[i++] = 0.7500; 242c4762a1bSJed Brown y[i] = 55.5000; t[i++] = 0.8750; 243c4762a1bSJed Brown y[i] = 50.3000; t[i++] = 1.0000; 244c4762a1bSJed Brown y[i] = 41.0000; t[i++] = 1.2500; 245c4762a1bSJed Brown y[i] = 29.4000; t[i++] = 1.7500; 246c4762a1bSJed Brown y[i] = 20.4000; t[i++] = 2.2500; 247c4762a1bSJed Brown y[i] = 29.3625; t[i++] = 1.7500; 248c4762a1bSJed Brown y[i] = 21.1500; t[i++] = 2.2500; 249c4762a1bSJed Brown y[i] = 16.7625; t[i++] = 2.7500; 250c4762a1bSJed Brown y[i] = 13.2000; t[i++] = 3.2500; 251c4762a1bSJed Brown y[i] = 10.8750; t[i++] = 3.7500; 252c4762a1bSJed Brown y[i] = 8.1750; t[i++] = 4.2500; 253c4762a1bSJed Brown y[i] = 7.3500; t[i++] = 4.7500; 254c4762a1bSJed Brown y[i] = 5.9625; t[i++] = 5.2500; 255c4762a1bSJed Brown y[i] = 5.6250; t[i++] = 5.7500; 256c4762a1bSJed Brown y[i] = 81.5000; t[i++] = .5000; 257c4762a1bSJed Brown y[i] = 62.4000; t[i++] = .7500; 258c4762a1bSJed Brown y[i] = 32.5000; t[i++] = 1.5000; 259c4762a1bSJed Brown y[i] = 12.4100; t[i++] = 3.0000; 260c4762a1bSJed Brown y[i] = 13.1200; t[i++] = 3.0000; 261c4762a1bSJed Brown y[i] = 15.5600; t[i++] = 3.0000; 262c4762a1bSJed Brown y[i] = 5.6300; t[i++] = 6.0000; 263c4762a1bSJed Brown y[i] = 78.0000; t[i++] = .5000; 264c4762a1bSJed Brown y[i] = 59.9000; t[i++] = .7500; 265c4762a1bSJed Brown y[i] = 33.2000; t[i++] = 1.5000; 266c4762a1bSJed Brown y[i] = 13.8400; t[i++] = 3.0000; 267c4762a1bSJed Brown y[i] = 12.7500; t[i++] = 3.0000; 268c4762a1bSJed Brown y[i] = 14.6200; t[i++] = 3.0000; 269c4762a1bSJed Brown y[i] = 3.9400; t[i++] = 6.0000; 270c4762a1bSJed Brown y[i] = 76.8000; t[i++] = .5000; 271c4762a1bSJed Brown y[i] = 61.0000; t[i++] = .7500; 272c4762a1bSJed Brown y[i] = 32.9000; t[i++] = 1.5000; 273c4762a1bSJed Brown y[i] = 13.8700; t[i++] = 3.0000; 274c4762a1bSJed Brown y[i] = 11.8100; t[i++] = 3.0000; 275c4762a1bSJed Brown y[i] = 13.3100; t[i++] = 3.0000; 276c4762a1bSJed Brown y[i] = 5.4400; t[i++] = 6.0000; 277c4762a1bSJed Brown y[i] = 78.0000; t[i++] = .5000; 278c4762a1bSJed Brown y[i] = 63.5000; t[i++] = .7500; 279c4762a1bSJed Brown y[i] = 33.8000; t[i++] = 1.5000; 280c4762a1bSJed Brown y[i] = 12.5600; t[i++] = 3.0000; 281c4762a1bSJed Brown y[i] = 5.6300; t[i++] = 6.0000; 282c4762a1bSJed Brown y[i] = 12.7500; t[i++] = 3.0000; 283c4762a1bSJed Brown y[i] = 13.1200; t[i++] = 3.0000; 284c4762a1bSJed Brown y[i] = 5.4400; t[i++] = 6.0000; 285c4762a1bSJed Brown y[i] = 76.8000; t[i++] = .5000; 286c4762a1bSJed Brown y[i] = 60.0000; t[i++] = .7500; 287c4762a1bSJed Brown y[i] = 47.8000; t[i++] = 1.0000; 288c4762a1bSJed Brown y[i] = 32.0000; t[i++] = 1.5000; 289c4762a1bSJed Brown y[i] = 22.2000; t[i++] = 2.0000; 290c4762a1bSJed Brown y[i] = 22.5700; t[i++] = 2.0000; 291c4762a1bSJed Brown y[i] = 18.8200; t[i++] = 2.5000; 292c4762a1bSJed Brown y[i] = 13.9500; t[i++] = 3.0000; 293c4762a1bSJed Brown y[i] = 11.2500; t[i++] = 4.0000; 294c4762a1bSJed Brown y[i] = 9.0000; t[i++] = 5.0000; 295c4762a1bSJed Brown y[i] = 6.6700; t[i++] = 6.0000; 296c4762a1bSJed Brown y[i] = 75.8000; t[i++] = .5000; 297c4762a1bSJed Brown y[i] = 62.0000; t[i++] = .7500; 298c4762a1bSJed Brown y[i] = 48.8000; t[i++] = 1.0000; 299c4762a1bSJed Brown y[i] = 35.2000; t[i++] = 1.5000; 300c4762a1bSJed Brown y[i] = 20.0000; t[i++] = 2.0000; 301c4762a1bSJed Brown y[i] = 20.3200; t[i++] = 2.0000; 302c4762a1bSJed Brown y[i] = 19.3100; t[i++] = 2.5000; 303c4762a1bSJed Brown y[i] = 12.7500; t[i++] = 3.0000; 304c4762a1bSJed Brown y[i] = 10.4200; t[i++] = 4.0000; 305c4762a1bSJed Brown y[i] = 7.3100; t[i++] = 5.0000; 306c4762a1bSJed Brown y[i] = 7.4200; t[i++] = 6.0000; 307c4762a1bSJed Brown y[i] = 70.5000; t[i++] = .5000; 308c4762a1bSJed Brown y[i] = 59.5000; t[i++] = .7500; 309c4762a1bSJed Brown y[i] = 48.5000; t[i++] = 1.0000; 310c4762a1bSJed Brown y[i] = 35.8000; t[i++] = 1.5000; 311c4762a1bSJed Brown y[i] = 21.0000; t[i++] = 2.0000; 312c4762a1bSJed Brown y[i] = 21.6700; t[i++] = 2.0000; 313c4762a1bSJed Brown y[i] = 21.0000; t[i++] = 2.5000; 314c4762a1bSJed Brown y[i] = 15.6400; t[i++] = 3.0000; 315c4762a1bSJed Brown y[i] = 8.1700; t[i++] = 4.0000; 316c4762a1bSJed Brown y[i] = 8.5500; t[i++] = 5.0000; 317c4762a1bSJed Brown y[i] = 10.1200; t[i++] = 6.0000; 318c4762a1bSJed Brown y[i] = 78.0000; t[i++] = .5000; 319c4762a1bSJed Brown y[i] = 66.0000; t[i++] = .6250; 320c4762a1bSJed Brown y[i] = 62.0000; t[i++] = .7500; 321c4762a1bSJed Brown y[i] = 58.0000; t[i++] = .8750; 322c4762a1bSJed Brown y[i] = 47.7000; t[i++] = 1.0000; 323c4762a1bSJed Brown y[i] = 37.8000; t[i++] = 1.2500; 324c4762a1bSJed Brown y[i] = 20.2000; t[i++] = 2.2500; 325c4762a1bSJed Brown y[i] = 21.0700; t[i++] = 2.2500; 326c4762a1bSJed Brown y[i] = 13.8700; t[i++] = 2.7500; 327c4762a1bSJed Brown y[i] = 9.6700; t[i++] = 3.2500; 328c4762a1bSJed Brown y[i] = 7.7600; t[i++] = 3.7500; 329c4762a1bSJed Brown y[i] = 5.4400; t[i++] = 4.2500; 330c4762a1bSJed Brown y[i] = 4.8700; t[i++] = 4.7500; 331c4762a1bSJed Brown y[i] = 4.0100; t[i++] = 5.2500; 332c4762a1bSJed Brown y[i] = 3.7500; t[i++] = 5.7500; 333c4762a1bSJed Brown y[i] = 24.1900; t[i++] = 3.0000; 334c4762a1bSJed Brown y[i] = 25.7600; t[i++] = 3.0000; 335c4762a1bSJed Brown y[i] = 18.0700; t[i++] = 3.0000; 336c4762a1bSJed Brown y[i] = 11.8100; t[i++] = 3.0000; 337c4762a1bSJed Brown y[i] = 12.0700; t[i++] = 3.0000; 338c4762a1bSJed Brown y[i] = 16.1200; t[i++] = 3.0000; 339c4762a1bSJed Brown y[i] = 70.8000; t[i++] = .5000; 340c4762a1bSJed Brown y[i] = 54.7000; t[i++] = .7500; 341c4762a1bSJed Brown y[i] = 48.0000; t[i++] = 1.0000; 342c4762a1bSJed Brown y[i] = 39.8000; t[i++] = 1.5000; 343c4762a1bSJed Brown y[i] = 29.8000; t[i++] = 2.0000; 344c4762a1bSJed Brown y[i] = 23.7000; t[i++] = 2.5000; 345c4762a1bSJed Brown y[i] = 29.6200; t[i++] = 2.0000; 346c4762a1bSJed Brown y[i] = 23.8100; t[i++] = 2.5000; 347c4762a1bSJed Brown y[i] = 17.7000; t[i++] = 3.0000; 348c4762a1bSJed Brown y[i] = 11.5500; t[i++] = 4.0000; 349c4762a1bSJed Brown y[i] = 12.0700; t[i++] = 5.0000; 350c4762a1bSJed Brown y[i] = 8.7400; t[i++] = 6.0000; 351c4762a1bSJed Brown y[i] = 80.7000; t[i++] = .5000; 352c4762a1bSJed Brown y[i] = 61.3000; t[i++] = .7500; 353c4762a1bSJed Brown y[i] = 47.5000; t[i++] = 1.0000; 354c4762a1bSJed Brown y[i] = 29.0000; t[i++] = 1.5000; 355c4762a1bSJed Brown y[i] = 24.0000; t[i++] = 2.0000; 356c4762a1bSJed Brown y[i] = 17.7000; t[i++] = 2.5000; 357c4762a1bSJed Brown y[i] = 24.5600; t[i++] = 2.0000; 358c4762a1bSJed Brown y[i] = 18.6700; t[i++] = 2.5000; 359c4762a1bSJed Brown y[i] = 16.2400; t[i++] = 3.0000; 360c4762a1bSJed Brown y[i] = 8.7400; t[i++] = 4.0000; 361c4762a1bSJed Brown y[i] = 7.8700; t[i++] = 5.0000; 362c4762a1bSJed Brown y[i] = 8.5100; t[i++] = 6.0000; 363c4762a1bSJed Brown y[i] = 66.7000; t[i++] = .5000; 364c4762a1bSJed Brown y[i] = 59.2000; t[i++] = .7500; 365c4762a1bSJed Brown y[i] = 40.8000; t[i++] = 1.0000; 366c4762a1bSJed Brown y[i] = 30.7000; t[i++] = 1.5000; 367c4762a1bSJed Brown y[i] = 25.7000; t[i++] = 2.0000; 368c4762a1bSJed Brown y[i] = 16.3000; t[i++] = 2.5000; 369c4762a1bSJed Brown y[i] = 25.9900; t[i++] = 2.0000; 370c4762a1bSJed Brown y[i] = 16.9500; t[i++] = 2.5000; 371c4762a1bSJed Brown y[i] = 13.3500; t[i++] = 3.0000; 372c4762a1bSJed Brown y[i] = 8.6200; t[i++] = 4.0000; 373c4762a1bSJed Brown y[i] = 7.2000; t[i++] = 5.0000; 374c4762a1bSJed Brown y[i] = 6.6400; t[i++] = 6.0000; 375c4762a1bSJed Brown y[i] = 13.6900; t[i++] = 3.0000; 376c4762a1bSJed Brown y[i] = 81.0000; t[i++] = .5000; 377c4762a1bSJed Brown y[i] = 64.5000; t[i++] = .7500; 378c4762a1bSJed Brown y[i] = 35.5000; t[i++] = 1.5000; 379c4762a1bSJed Brown y[i] = 13.3100; t[i++] = 3.0000; 380c4762a1bSJed Brown y[i] = 4.8700; t[i++] = 6.0000; 381c4762a1bSJed Brown y[i] = 12.9400; t[i++] = 3.0000; 382c4762a1bSJed Brown y[i] = 5.0600; t[i++] = 6.0000; 383c4762a1bSJed Brown y[i] = 15.1900; t[i++] = 3.0000; 384c4762a1bSJed Brown y[i] = 14.6200; t[i++] = 3.0000; 385c4762a1bSJed Brown y[i] = 15.6400; t[i++] = 3.0000; 386c4762a1bSJed Brown y[i] = 25.5000; t[i++] = 1.7500; 387c4762a1bSJed Brown y[i] = 25.9500; t[i++] = 1.7500; 388c4762a1bSJed Brown y[i] = 81.7000; t[i++] = .5000; 389c4762a1bSJed Brown y[i] = 61.6000; t[i++] = .7500; 390c4762a1bSJed Brown y[i] = 29.8000; t[i++] = 1.7500; 391c4762a1bSJed Brown y[i] = 29.8100; t[i++] = 1.7500; 392c4762a1bSJed Brown y[i] = 17.1700; t[i++] = 2.7500; 393c4762a1bSJed Brown y[i] = 10.3900; t[i++] = 3.7500; 394c4762a1bSJed Brown y[i] = 28.4000; t[i++] = 1.7500; 395c4762a1bSJed Brown y[i] = 28.6900; t[i++] = 1.7500; 396c4762a1bSJed Brown y[i] = 81.3000; t[i++] = .5000; 397c4762a1bSJed Brown y[i] = 60.9000; t[i++] = .7500; 398c4762a1bSJed Brown y[i] = 16.6500; t[i++] = 2.7500; 399c4762a1bSJed Brown y[i] = 10.0500; t[i++] = 3.7500; 400c4762a1bSJed Brown y[i] = 28.9000; t[i++] = 1.7500; 401c4762a1bSJed Brown y[i] = 28.9500; t[i++] = 1.7500; 402c4762a1bSJed Brown PetscFunctionReturn(0); 403c4762a1bSJed Brown } 404c4762a1bSJed Brown 405c4762a1bSJed Brown PetscErrorCode TaskWorker(AppCtx *user) 406c4762a1bSJed Brown { 407c4762a1bSJed Brown PetscReal x[NPARAMETERS],f = 0.0; 408c4762a1bSJed Brown PetscMPIInt tag=IDLE_TAG; 409c4762a1bSJed Brown PetscInt index; 410c4762a1bSJed Brown MPI_Status status; 411c4762a1bSJed Brown PetscErrorCode ierr; 412c4762a1bSJed Brown 413c4762a1bSJed Brown PetscFunctionBegin; 4149dddd249SSatish Balay /* Send check-in message to rank-0 */ 415c4762a1bSJed Brown 416ffc4695bSBarry Smith ierr = MPI_Send(&f,1,MPIU_REAL,0,IDLE_TAG,PETSC_COMM_WORLD);CHKERRMPI(ierr); 417c4762a1bSJed Brown while (tag != DIE_TAG) { 418ffc4695bSBarry Smith ierr = MPI_Recv(x,NPARAMETERS,MPIU_REAL,0,MPI_ANY_TAG,PETSC_COMM_WORLD,&status);CHKERRMPI(ierr); 419c4762a1bSJed Brown tag = status.MPI_TAG; 420c4762a1bSJed Brown if (tag == IDLE_TAG) { 421ffc4695bSBarry Smith ierr = MPI_Send(&f,1,MPIU_REAL,0,IDLE_TAG,PETSC_COMM_WORLD);CHKERRMPI(ierr); 422c4762a1bSJed Brown } else if (tag != DIE_TAG) { 423c4762a1bSJed Brown index = (PetscInt)tag; 424c4762a1bSJed Brown ierr = RunSimulation(x,index,&f,user);CHKERRQ(ierr); 42555b25c41SPierre Jolivet ierr = MPI_Send(&f,1,MPIU_REAL,0,tag,PETSC_COMM_WORLD);CHKERRMPI(ierr); 426c4762a1bSJed Brown } 427c4762a1bSJed Brown } 428c4762a1bSJed Brown PetscFunctionReturn(0); 429c4762a1bSJed Brown } 430c4762a1bSJed Brown 431c4762a1bSJed Brown PetscErrorCode RunSimulation(PetscReal *x, PetscInt i, PetscReal*f, AppCtx *user) 432c4762a1bSJed Brown { 433c4762a1bSJed Brown PetscReal *t = user->t; 434c4762a1bSJed Brown PetscReal *y = user->y; 435c4762a1bSJed Brown #if defined(PETSC_USE_REAL_SINGLE) 436*e1dfdf8eSBarry Smith *f = y[i] - exp(-x[0]*t[i])/(x[1] + x[2]*t[i]); /* expf() for single-precision breaks this example on Freebsd, Valgrind errors on Linux */ 437c4762a1bSJed Brown #else 438c4762a1bSJed Brown *f = y[i] - PetscExpScalar(-x[0]*t[i])/(x[1] + x[2]*t[i]); 439c4762a1bSJed Brown #endif 440c4762a1bSJed Brown return(0); 441c4762a1bSJed Brown } 442c4762a1bSJed Brown 443c4762a1bSJed Brown PetscErrorCode StopWorkers(AppCtx *user) 444c4762a1bSJed Brown { 445c4762a1bSJed Brown PetscInt checkedin; 446c4762a1bSJed Brown MPI_Status status; 447c4762a1bSJed Brown PetscReal f,x[NPARAMETERS]; 448c4762a1bSJed Brown PetscErrorCode ierr; 449c4762a1bSJed Brown 450c4762a1bSJed Brown PetscFunctionBegin; 451c4762a1bSJed Brown checkedin=0; 452c4762a1bSJed Brown while (checkedin < user->size-1) { 453ffc4695bSBarry Smith ierr = MPI_Recv(&f,1,MPIU_REAL,MPI_ANY_SOURCE,MPI_ANY_TAG,PETSC_COMM_WORLD,&status);CHKERRMPI(ierr); 454c4762a1bSJed Brown checkedin++; 455c4762a1bSJed Brown ierr = PetscArrayzero(x,NPARAMETERS);CHKERRQ(ierr); 456ffc4695bSBarry Smith ierr = MPI_Send(x,NPARAMETERS,MPIU_REAL,status.MPI_SOURCE,DIE_TAG,PETSC_COMM_WORLD);CHKERRMPI(ierr); 457c4762a1bSJed Brown } 458c4762a1bSJed Brown PetscFunctionReturn(0); 459c4762a1bSJed Brown } 460c4762a1bSJed Brown 461c4762a1bSJed Brown /*TEST 462c4762a1bSJed Brown 463c4762a1bSJed Brown build: 464c4762a1bSJed Brown requires: !complex 465c4762a1bSJed Brown 466c4762a1bSJed Brown test: 467c4762a1bSJed Brown nsize: 3 468c4762a1bSJed Brown requires: !single 469c4762a1bSJed Brown args: -tao_smonitor -tao_max_it 100 -tao_type pounders -tao_gatol 1.e-5 470c4762a1bSJed Brown 471c4762a1bSJed Brown TEST*/ 472