1*c4762a1bSJed Brown /* 2*c4762a1bSJed Brown Include "petsctao.h" so that we can use TAO solvers. Note that this 3*c4762a1bSJed Brown file automatically includes libraries such as: 4*c4762a1bSJed Brown petsc.h - base PETSc routines petscvec.h - vectors 5*c4762a1bSJed Brown petscsys.h - sysem routines petscmat.h - matrices 6*c4762a1bSJed Brown petscis.h - index sets petscksp.h - Krylov subspace methods 7*c4762a1bSJed Brown petscviewer.h - viewers petscpc.h - preconditioners 8*c4762a1bSJed Brown 9*c4762a1bSJed Brown */ 10*c4762a1bSJed Brown 11*c4762a1bSJed Brown #include <petsctao.h> 12*c4762a1bSJed Brown 13*c4762a1bSJed Brown /* 14*c4762a1bSJed Brown Description: These data are the result of a NIST study involving 15*c4762a1bSJed Brown ultrasonic calibration. The response variable is 16*c4762a1bSJed Brown ultrasonic response, and the predictor variable is 17*c4762a1bSJed Brown metal distance. 18*c4762a1bSJed Brown 19*c4762a1bSJed Brown Reference: Chwirut, D., NIST (197?). 20*c4762a1bSJed Brown Ultrasonic Reference Block Study. 21*c4762a1bSJed Brown */ 22*c4762a1bSJed Brown 23*c4762a1bSJed Brown static char help[]="Finds the nonlinear least-squares solution to the model \n\ 24*c4762a1bSJed Brown y = exp[-b1*x]/(b2+b3*x) + e \n"; 25*c4762a1bSJed Brown 26*c4762a1bSJed Brown /* T 27*c4762a1bSJed Brown Concepts: TAO^Solving a system of nonlinear equations, nonlinear least squares 28*c4762a1bSJed Brown Routines: TaoCreate(); 29*c4762a1bSJed Brown Routines: TaoSetType(); 30*c4762a1bSJed Brown Routines: TaoSetResidualRoutine(); 31*c4762a1bSJed Brown Routines: TaoSetMonitor(); 32*c4762a1bSJed Brown Routines: TaoSetInitialVector(); 33*c4762a1bSJed Brown Routines: TaoSetFromOptions(); 34*c4762a1bSJed Brown Routines: TaoSolve(); 35*c4762a1bSJed Brown Routines: TaoDestroy(); 36*c4762a1bSJed Brown Processors: n 37*c4762a1bSJed Brown T*/ 38*c4762a1bSJed Brown 39*c4762a1bSJed Brown #define NOBSERVATIONS 214 40*c4762a1bSJed Brown #define NPARAMETERS 3 41*c4762a1bSJed Brown 42*c4762a1bSJed Brown #define DIE_TAG 2000 43*c4762a1bSJed Brown #define IDLE_TAG 1000 44*c4762a1bSJed Brown 45*c4762a1bSJed Brown /* User-defined application context */ 46*c4762a1bSJed Brown typedef struct { 47*c4762a1bSJed Brown /* Working space */ 48*c4762a1bSJed Brown PetscReal t[NOBSERVATIONS]; /* array of independent variables of observation */ 49*c4762a1bSJed Brown PetscReal y[NOBSERVATIONS]; /* array of dependent variables */ 50*c4762a1bSJed Brown PetscMPIInt size,rank; 51*c4762a1bSJed Brown } AppCtx; 52*c4762a1bSJed Brown 53*c4762a1bSJed Brown /* User provided Routines */ 54*c4762a1bSJed Brown PetscErrorCode InitializeData(AppCtx *user); 55*c4762a1bSJed Brown PetscErrorCode FormStartingPoint(Vec); 56*c4762a1bSJed Brown PetscErrorCode EvaluateFunction(Tao, Vec, Vec, void *); 57*c4762a1bSJed Brown PetscErrorCode TaskWorker(AppCtx *user); 58*c4762a1bSJed Brown PetscErrorCode StopWorkers(AppCtx *user); 59*c4762a1bSJed Brown PetscErrorCode RunSimulation(PetscReal *x, PetscInt i, PetscReal*f, AppCtx *user); 60*c4762a1bSJed Brown 61*c4762a1bSJed Brown /*--------------------------------------------------------------------*/ 62*c4762a1bSJed Brown int main(int argc,char **argv) 63*c4762a1bSJed Brown { 64*c4762a1bSJed Brown PetscErrorCode ierr; /* used to check for functions returning nonzeros */ 65*c4762a1bSJed Brown Vec x, f; /* solution, function */ 66*c4762a1bSJed Brown Tao tao; /* Tao solver context */ 67*c4762a1bSJed Brown AppCtx user; /* user-defined work context */ 68*c4762a1bSJed Brown 69*c4762a1bSJed Brown /* Initialize TAO and PETSc */ 70*c4762a1bSJed Brown ierr = PetscInitialize(&argc,&argv,(char *)0,help);if (ierr) return ierr; 71*c4762a1bSJed Brown MPI_Comm_size(MPI_COMM_WORLD,&user.size); 72*c4762a1bSJed Brown MPI_Comm_rank(MPI_COMM_WORLD,&user.rank); 73*c4762a1bSJed Brown ierr = InitializeData(&user);CHKERRQ(ierr); 74*c4762a1bSJed Brown 75*c4762a1bSJed Brown /* Run optimization on rank 0 */ 76*c4762a1bSJed Brown if (user.rank == 0) { 77*c4762a1bSJed Brown /* Allocate vectors */ 78*c4762a1bSJed Brown ierr = VecCreateSeq(PETSC_COMM_SELF,NPARAMETERS,&x);CHKERRQ(ierr); 79*c4762a1bSJed Brown ierr = VecCreateSeq(PETSC_COMM_SELF,NOBSERVATIONS,&f);CHKERRQ(ierr); 80*c4762a1bSJed Brown 81*c4762a1bSJed Brown /* TAO code begins here */ 82*c4762a1bSJed Brown 83*c4762a1bSJed Brown /* Create TAO solver and set desired solution method */ 84*c4762a1bSJed Brown ierr = TaoCreate(PETSC_COMM_SELF,&tao);CHKERRQ(ierr); 85*c4762a1bSJed Brown ierr = TaoSetType(tao,TAOPOUNDERS);CHKERRQ(ierr); 86*c4762a1bSJed Brown 87*c4762a1bSJed Brown /* Set the function and Jacobian routines. */ 88*c4762a1bSJed Brown ierr = FormStartingPoint(x);CHKERRQ(ierr); 89*c4762a1bSJed Brown ierr = TaoSetInitialVector(tao,x);CHKERRQ(ierr); 90*c4762a1bSJed Brown ierr = TaoSetResidualRoutine(tao,f,EvaluateFunction,(void*)&user);CHKERRQ(ierr); 91*c4762a1bSJed Brown 92*c4762a1bSJed Brown /* Check for any TAO command line arguments */ 93*c4762a1bSJed Brown ierr = TaoSetFromOptions(tao);CHKERRQ(ierr); 94*c4762a1bSJed Brown 95*c4762a1bSJed Brown /* Perform the Solve */ 96*c4762a1bSJed Brown ierr = TaoSolve(tao);CHKERRQ(ierr); 97*c4762a1bSJed Brown 98*c4762a1bSJed Brown /* Free TAO data structures */ 99*c4762a1bSJed Brown ierr = TaoDestroy(&tao);CHKERRQ(ierr); 100*c4762a1bSJed Brown 101*c4762a1bSJed Brown /* Free PETSc data structures */ 102*c4762a1bSJed Brown ierr = VecDestroy(&x);CHKERRQ(ierr); 103*c4762a1bSJed Brown ierr = VecDestroy(&f);CHKERRQ(ierr); 104*c4762a1bSJed Brown StopWorkers(&user); 105*c4762a1bSJed Brown } else { 106*c4762a1bSJed Brown TaskWorker(&user); 107*c4762a1bSJed Brown } 108*c4762a1bSJed Brown ierr = PetscFinalize(); 109*c4762a1bSJed Brown return ierr; 110*c4762a1bSJed Brown } 111*c4762a1bSJed Brown 112*c4762a1bSJed Brown /*--------------------------------------------------------------------*/ 113*c4762a1bSJed Brown PetscErrorCode EvaluateFunction(Tao tao, Vec X, Vec F, void *ptr) 114*c4762a1bSJed Brown { 115*c4762a1bSJed Brown AppCtx *user = (AppCtx *)ptr; 116*c4762a1bSJed Brown PetscInt i; 117*c4762a1bSJed Brown PetscReal *x,*f; 118*c4762a1bSJed Brown PetscErrorCode ierr; 119*c4762a1bSJed Brown 120*c4762a1bSJed Brown PetscFunctionBegin; 121*c4762a1bSJed Brown ierr = VecGetArray(X,&x);CHKERRQ(ierr); 122*c4762a1bSJed Brown ierr = VecGetArray(F,&f);CHKERRQ(ierr); 123*c4762a1bSJed Brown if (user->size == 1) { 124*c4762a1bSJed Brown /* Single processor */ 125*c4762a1bSJed Brown for (i=0;i<NOBSERVATIONS;i++) { 126*c4762a1bSJed Brown ierr = RunSimulation(x,i,&f[i],user);CHKERRQ(ierr); 127*c4762a1bSJed Brown } 128*c4762a1bSJed Brown } else { 129*c4762a1bSJed Brown /* Multiprocessor master */ 130*c4762a1bSJed Brown PetscMPIInt tag; 131*c4762a1bSJed Brown PetscInt finishedtasks,next_task,checkedin; 132*c4762a1bSJed Brown PetscReal f_i=0.0; 133*c4762a1bSJed Brown MPI_Status status; 134*c4762a1bSJed Brown 135*c4762a1bSJed Brown next_task=0; 136*c4762a1bSJed Brown finishedtasks=0; 137*c4762a1bSJed Brown checkedin=0; 138*c4762a1bSJed Brown 139*c4762a1bSJed Brown while(finishedtasks < NOBSERVATIONS || checkedin < user->size-1) { 140*c4762a1bSJed Brown ierr = MPI_Recv(&f_i,1,MPIU_REAL,MPI_ANY_SOURCE,MPI_ANY_TAG,PETSC_COMM_WORLD,&status);CHKERRQ(ierr); 141*c4762a1bSJed Brown if (status.MPI_TAG == IDLE_TAG) { 142*c4762a1bSJed Brown checkedin++; 143*c4762a1bSJed Brown } else { 144*c4762a1bSJed Brown 145*c4762a1bSJed Brown tag = status.MPI_TAG; 146*c4762a1bSJed Brown f[tag] = (PetscReal)f_i; 147*c4762a1bSJed Brown finishedtasks++; 148*c4762a1bSJed Brown } 149*c4762a1bSJed Brown 150*c4762a1bSJed Brown if (next_task<NOBSERVATIONS) { 151*c4762a1bSJed Brown ierr = MPI_Send(x,NPARAMETERS,MPIU_REAL,status.MPI_SOURCE,next_task,PETSC_COMM_WORLD);CHKERRQ(ierr); 152*c4762a1bSJed Brown next_task++; 153*c4762a1bSJed Brown 154*c4762a1bSJed Brown } else { 155*c4762a1bSJed Brown /* Send idle message */ 156*c4762a1bSJed Brown ierr = MPI_Send(x,NPARAMETERS,MPIU_REAL,status.MPI_SOURCE,IDLE_TAG,PETSC_COMM_WORLD);CHKERRQ(ierr); 157*c4762a1bSJed Brown } 158*c4762a1bSJed Brown } 159*c4762a1bSJed Brown } 160*c4762a1bSJed Brown ierr = VecRestoreArray(X,&x);CHKERRQ(ierr); 161*c4762a1bSJed Brown ierr = VecRestoreArray(F,&f);CHKERRQ(ierr); 162*c4762a1bSJed Brown PetscLogFlops(6*NOBSERVATIONS); 163*c4762a1bSJed Brown PetscFunctionReturn(0); 164*c4762a1bSJed Brown } 165*c4762a1bSJed Brown 166*c4762a1bSJed Brown /* ------------------------------------------------------------ */ 167*c4762a1bSJed Brown PetscErrorCode FormStartingPoint(Vec X) 168*c4762a1bSJed Brown { 169*c4762a1bSJed Brown PetscReal *x; 170*c4762a1bSJed Brown PetscErrorCode ierr; 171*c4762a1bSJed Brown 172*c4762a1bSJed Brown PetscFunctionBegin; 173*c4762a1bSJed Brown ierr = VecGetArray(X,&x);CHKERRQ(ierr); 174*c4762a1bSJed Brown x[0] = 0.15; 175*c4762a1bSJed Brown x[1] = 0.008; 176*c4762a1bSJed Brown x[2] = 0.010; 177*c4762a1bSJed Brown VecRestoreArray(X,&x);CHKERRQ(ierr); 178*c4762a1bSJed Brown PetscFunctionReturn(0); 179*c4762a1bSJed Brown } 180*c4762a1bSJed Brown 181*c4762a1bSJed Brown /* ---------------------------------------------------------------------- */ 182*c4762a1bSJed Brown PetscErrorCode InitializeData(AppCtx *user) 183*c4762a1bSJed Brown { 184*c4762a1bSJed Brown PetscReal *t=user->t,*y=user->y; 185*c4762a1bSJed Brown PetscInt i=0; 186*c4762a1bSJed Brown 187*c4762a1bSJed Brown PetscFunctionBegin; 188*c4762a1bSJed Brown y[i] = 92.9000; t[i++] = 0.5000; 189*c4762a1bSJed Brown y[i] = 78.7000; t[i++] = 0.6250; 190*c4762a1bSJed Brown y[i] = 64.2000; t[i++] = 0.7500; 191*c4762a1bSJed Brown y[i] = 64.9000; t[i++] = 0.8750; 192*c4762a1bSJed Brown y[i] = 57.1000; t[i++] = 1.0000; 193*c4762a1bSJed Brown y[i] = 43.3000; t[i++] = 1.2500; 194*c4762a1bSJed Brown y[i] = 31.1000; t[i++] = 1.7500; 195*c4762a1bSJed Brown y[i] = 23.6000; t[i++] = 2.2500; 196*c4762a1bSJed Brown y[i] = 31.0500; t[i++] = 1.7500; 197*c4762a1bSJed Brown y[i] = 23.7750; t[i++] = 2.2500; 198*c4762a1bSJed Brown y[i] = 17.7375; t[i++] = 2.7500; 199*c4762a1bSJed Brown y[i] = 13.8000; t[i++] = 3.2500; 200*c4762a1bSJed Brown y[i] = 11.5875; t[i++] = 3.7500; 201*c4762a1bSJed Brown y[i] = 9.4125; t[i++] = 4.2500; 202*c4762a1bSJed Brown y[i] = 7.7250; t[i++] = 4.7500; 203*c4762a1bSJed Brown y[i] = 7.3500; t[i++] = 5.2500; 204*c4762a1bSJed Brown y[i] = 8.0250; t[i++] = 5.7500; 205*c4762a1bSJed Brown y[i] = 90.6000; t[i++] = 0.5000; 206*c4762a1bSJed Brown y[i] = 76.9000; t[i++] = 0.6250; 207*c4762a1bSJed Brown y[i] = 71.6000; t[i++] = 0.7500; 208*c4762a1bSJed Brown y[i] = 63.6000; t[i++] = 0.8750; 209*c4762a1bSJed Brown y[i] = 54.0000; t[i++] = 1.0000; 210*c4762a1bSJed Brown y[i] = 39.2000; t[i++] = 1.2500; 211*c4762a1bSJed Brown y[i] = 29.3000; t[i++] = 1.7500; 212*c4762a1bSJed Brown y[i] = 21.4000; t[i++] = 2.2500; 213*c4762a1bSJed Brown y[i] = 29.1750; t[i++] = 1.7500; 214*c4762a1bSJed Brown y[i] = 22.1250; t[i++] = 2.2500; 215*c4762a1bSJed Brown y[i] = 17.5125; t[i++] = 2.7500; 216*c4762a1bSJed Brown y[i] = 14.2500; t[i++] = 3.2500; 217*c4762a1bSJed Brown y[i] = 9.4500; t[i++] = 3.7500; 218*c4762a1bSJed Brown y[i] = 9.1500; t[i++] = 4.2500; 219*c4762a1bSJed Brown y[i] = 7.9125; t[i++] = 4.7500; 220*c4762a1bSJed Brown y[i] = 8.4750; t[i++] = 5.2500; 221*c4762a1bSJed Brown y[i] = 6.1125; t[i++] = 5.7500; 222*c4762a1bSJed Brown y[i] = 80.0000; t[i++] = 0.5000; 223*c4762a1bSJed Brown y[i] = 79.0000; t[i++] = 0.6250; 224*c4762a1bSJed Brown y[i] = 63.8000; t[i++] = 0.7500; 225*c4762a1bSJed Brown y[i] = 57.2000; t[i++] = 0.8750; 226*c4762a1bSJed Brown y[i] = 53.2000; t[i++] = 1.0000; 227*c4762a1bSJed Brown y[i] = 42.5000; t[i++] = 1.2500; 228*c4762a1bSJed Brown y[i] = 26.8000; t[i++] = 1.7500; 229*c4762a1bSJed Brown y[i] = 20.4000; t[i++] = 2.2500; 230*c4762a1bSJed Brown y[i] = 26.8500; t[i++] = 1.7500; 231*c4762a1bSJed Brown y[i] = 21.0000; t[i++] = 2.2500; 232*c4762a1bSJed Brown y[i] = 16.4625; t[i++] = 2.7500; 233*c4762a1bSJed Brown y[i] = 12.5250; t[i++] = 3.2500; 234*c4762a1bSJed Brown y[i] = 10.5375; t[i++] = 3.7500; 235*c4762a1bSJed Brown y[i] = 8.5875; t[i++] = 4.2500; 236*c4762a1bSJed Brown y[i] = 7.1250; t[i++] = 4.7500; 237*c4762a1bSJed Brown y[i] = 6.1125; t[i++] = 5.2500; 238*c4762a1bSJed Brown y[i] = 5.9625; t[i++] = 5.7500; 239*c4762a1bSJed Brown y[i] = 74.1000; t[i++] = 0.5000; 240*c4762a1bSJed Brown y[i] = 67.3000; t[i++] = 0.6250; 241*c4762a1bSJed Brown y[i] = 60.8000; t[i++] = 0.7500; 242*c4762a1bSJed Brown y[i] = 55.5000; t[i++] = 0.8750; 243*c4762a1bSJed Brown y[i] = 50.3000; t[i++] = 1.0000; 244*c4762a1bSJed Brown y[i] = 41.0000; t[i++] = 1.2500; 245*c4762a1bSJed Brown y[i] = 29.4000; t[i++] = 1.7500; 246*c4762a1bSJed Brown y[i] = 20.4000; t[i++] = 2.2500; 247*c4762a1bSJed Brown y[i] = 29.3625; t[i++] = 1.7500; 248*c4762a1bSJed Brown y[i] = 21.1500; t[i++] = 2.2500; 249*c4762a1bSJed Brown y[i] = 16.7625; t[i++] = 2.7500; 250*c4762a1bSJed Brown y[i] = 13.2000; t[i++] = 3.2500; 251*c4762a1bSJed Brown y[i] = 10.8750; t[i++] = 3.7500; 252*c4762a1bSJed Brown y[i] = 8.1750; t[i++] = 4.2500; 253*c4762a1bSJed Brown y[i] = 7.3500; t[i++] = 4.7500; 254*c4762a1bSJed Brown y[i] = 5.9625; t[i++] = 5.2500; 255*c4762a1bSJed Brown y[i] = 5.6250; t[i++] = 5.7500; 256*c4762a1bSJed Brown y[i] = 81.5000; t[i++] = .5000; 257*c4762a1bSJed Brown y[i] = 62.4000; t[i++] = .7500; 258*c4762a1bSJed Brown y[i] = 32.5000; t[i++] = 1.5000; 259*c4762a1bSJed Brown y[i] = 12.4100; t[i++] = 3.0000; 260*c4762a1bSJed Brown y[i] = 13.1200; t[i++] = 3.0000; 261*c4762a1bSJed Brown y[i] = 15.5600; t[i++] = 3.0000; 262*c4762a1bSJed Brown y[i] = 5.6300; t[i++] = 6.0000; 263*c4762a1bSJed Brown y[i] = 78.0000; t[i++] = .5000; 264*c4762a1bSJed Brown y[i] = 59.9000; t[i++] = .7500; 265*c4762a1bSJed Brown y[i] = 33.2000; t[i++] = 1.5000; 266*c4762a1bSJed Brown y[i] = 13.8400; t[i++] = 3.0000; 267*c4762a1bSJed Brown y[i] = 12.7500; t[i++] = 3.0000; 268*c4762a1bSJed Brown y[i] = 14.6200; t[i++] = 3.0000; 269*c4762a1bSJed Brown y[i] = 3.9400; t[i++] = 6.0000; 270*c4762a1bSJed Brown y[i] = 76.8000; t[i++] = .5000; 271*c4762a1bSJed Brown y[i] = 61.0000; t[i++] = .7500; 272*c4762a1bSJed Brown y[i] = 32.9000; t[i++] = 1.5000; 273*c4762a1bSJed Brown y[i] = 13.8700; t[i++] = 3.0000; 274*c4762a1bSJed Brown y[i] = 11.8100; t[i++] = 3.0000; 275*c4762a1bSJed Brown y[i] = 13.3100; t[i++] = 3.0000; 276*c4762a1bSJed Brown y[i] = 5.4400; t[i++] = 6.0000; 277*c4762a1bSJed Brown y[i] = 78.0000; t[i++] = .5000; 278*c4762a1bSJed Brown y[i] = 63.5000; t[i++] = .7500; 279*c4762a1bSJed Brown y[i] = 33.8000; t[i++] = 1.5000; 280*c4762a1bSJed Brown y[i] = 12.5600; t[i++] = 3.0000; 281*c4762a1bSJed Brown y[i] = 5.6300; t[i++] = 6.0000; 282*c4762a1bSJed Brown y[i] = 12.7500; t[i++] = 3.0000; 283*c4762a1bSJed Brown y[i] = 13.1200; t[i++] = 3.0000; 284*c4762a1bSJed Brown y[i] = 5.4400; t[i++] = 6.0000; 285*c4762a1bSJed Brown y[i] = 76.8000; t[i++] = .5000; 286*c4762a1bSJed Brown y[i] = 60.0000; t[i++] = .7500; 287*c4762a1bSJed Brown y[i] = 47.8000; t[i++] = 1.0000; 288*c4762a1bSJed Brown y[i] = 32.0000; t[i++] = 1.5000; 289*c4762a1bSJed Brown y[i] = 22.2000; t[i++] = 2.0000; 290*c4762a1bSJed Brown y[i] = 22.5700; t[i++] = 2.0000; 291*c4762a1bSJed Brown y[i] = 18.8200; t[i++] = 2.5000; 292*c4762a1bSJed Brown y[i] = 13.9500; t[i++] = 3.0000; 293*c4762a1bSJed Brown y[i] = 11.2500; t[i++] = 4.0000; 294*c4762a1bSJed Brown y[i] = 9.0000; t[i++] = 5.0000; 295*c4762a1bSJed Brown y[i] = 6.6700; t[i++] = 6.0000; 296*c4762a1bSJed Brown y[i] = 75.8000; t[i++] = .5000; 297*c4762a1bSJed Brown y[i] = 62.0000; t[i++] = .7500; 298*c4762a1bSJed Brown y[i] = 48.8000; t[i++] = 1.0000; 299*c4762a1bSJed Brown y[i] = 35.2000; t[i++] = 1.5000; 300*c4762a1bSJed Brown y[i] = 20.0000; t[i++] = 2.0000; 301*c4762a1bSJed Brown y[i] = 20.3200; t[i++] = 2.0000; 302*c4762a1bSJed Brown y[i] = 19.3100; t[i++] = 2.5000; 303*c4762a1bSJed Brown y[i] = 12.7500; t[i++] = 3.0000; 304*c4762a1bSJed Brown y[i] = 10.4200; t[i++] = 4.0000; 305*c4762a1bSJed Brown y[i] = 7.3100; t[i++] = 5.0000; 306*c4762a1bSJed Brown y[i] = 7.4200; t[i++] = 6.0000; 307*c4762a1bSJed Brown y[i] = 70.5000; t[i++] = .5000; 308*c4762a1bSJed Brown y[i] = 59.5000; t[i++] = .7500; 309*c4762a1bSJed Brown y[i] = 48.5000; t[i++] = 1.0000; 310*c4762a1bSJed Brown y[i] = 35.8000; t[i++] = 1.5000; 311*c4762a1bSJed Brown y[i] = 21.0000; t[i++] = 2.0000; 312*c4762a1bSJed Brown y[i] = 21.6700; t[i++] = 2.0000; 313*c4762a1bSJed Brown y[i] = 21.0000; t[i++] = 2.5000; 314*c4762a1bSJed Brown y[i] = 15.6400; t[i++] = 3.0000; 315*c4762a1bSJed Brown y[i] = 8.1700; t[i++] = 4.0000; 316*c4762a1bSJed Brown y[i] = 8.5500; t[i++] = 5.0000; 317*c4762a1bSJed Brown y[i] = 10.1200; t[i++] = 6.0000; 318*c4762a1bSJed Brown y[i] = 78.0000; t[i++] = .5000; 319*c4762a1bSJed Brown y[i] = 66.0000; t[i++] = .6250; 320*c4762a1bSJed Brown y[i] = 62.0000; t[i++] = .7500; 321*c4762a1bSJed Brown y[i] = 58.0000; t[i++] = .8750; 322*c4762a1bSJed Brown y[i] = 47.7000; t[i++] = 1.0000; 323*c4762a1bSJed Brown y[i] = 37.8000; t[i++] = 1.2500; 324*c4762a1bSJed Brown y[i] = 20.2000; t[i++] = 2.2500; 325*c4762a1bSJed Brown y[i] = 21.0700; t[i++] = 2.2500; 326*c4762a1bSJed Brown y[i] = 13.8700; t[i++] = 2.7500; 327*c4762a1bSJed Brown y[i] = 9.6700; t[i++] = 3.2500; 328*c4762a1bSJed Brown y[i] = 7.7600; t[i++] = 3.7500; 329*c4762a1bSJed Brown y[i] = 5.4400; t[i++] = 4.2500; 330*c4762a1bSJed Brown y[i] = 4.8700; t[i++] = 4.7500; 331*c4762a1bSJed Brown y[i] = 4.0100; t[i++] = 5.2500; 332*c4762a1bSJed Brown y[i] = 3.7500; t[i++] = 5.7500; 333*c4762a1bSJed Brown y[i] = 24.1900; t[i++] = 3.0000; 334*c4762a1bSJed Brown y[i] = 25.7600; t[i++] = 3.0000; 335*c4762a1bSJed Brown y[i] = 18.0700; t[i++] = 3.0000; 336*c4762a1bSJed Brown y[i] = 11.8100; t[i++] = 3.0000; 337*c4762a1bSJed Brown y[i] = 12.0700; t[i++] = 3.0000; 338*c4762a1bSJed Brown y[i] = 16.1200; t[i++] = 3.0000; 339*c4762a1bSJed Brown y[i] = 70.8000; t[i++] = .5000; 340*c4762a1bSJed Brown y[i] = 54.7000; t[i++] = .7500; 341*c4762a1bSJed Brown y[i] = 48.0000; t[i++] = 1.0000; 342*c4762a1bSJed Brown y[i] = 39.8000; t[i++] = 1.5000; 343*c4762a1bSJed Brown y[i] = 29.8000; t[i++] = 2.0000; 344*c4762a1bSJed Brown y[i] = 23.7000; t[i++] = 2.5000; 345*c4762a1bSJed Brown y[i] = 29.6200; t[i++] = 2.0000; 346*c4762a1bSJed Brown y[i] = 23.8100; t[i++] = 2.5000; 347*c4762a1bSJed Brown y[i] = 17.7000; t[i++] = 3.0000; 348*c4762a1bSJed Brown y[i] = 11.5500; t[i++] = 4.0000; 349*c4762a1bSJed Brown y[i] = 12.0700; t[i++] = 5.0000; 350*c4762a1bSJed Brown y[i] = 8.7400; t[i++] = 6.0000; 351*c4762a1bSJed Brown y[i] = 80.7000; t[i++] = .5000; 352*c4762a1bSJed Brown y[i] = 61.3000; t[i++] = .7500; 353*c4762a1bSJed Brown y[i] = 47.5000; t[i++] = 1.0000; 354*c4762a1bSJed Brown y[i] = 29.0000; t[i++] = 1.5000; 355*c4762a1bSJed Brown y[i] = 24.0000; t[i++] = 2.0000; 356*c4762a1bSJed Brown y[i] = 17.7000; t[i++] = 2.5000; 357*c4762a1bSJed Brown y[i] = 24.5600; t[i++] = 2.0000; 358*c4762a1bSJed Brown y[i] = 18.6700; t[i++] = 2.5000; 359*c4762a1bSJed Brown y[i] = 16.2400; t[i++] = 3.0000; 360*c4762a1bSJed Brown y[i] = 8.7400; t[i++] = 4.0000; 361*c4762a1bSJed Brown y[i] = 7.8700; t[i++] = 5.0000; 362*c4762a1bSJed Brown y[i] = 8.5100; t[i++] = 6.0000; 363*c4762a1bSJed Brown y[i] = 66.7000; t[i++] = .5000; 364*c4762a1bSJed Brown y[i] = 59.2000; t[i++] = .7500; 365*c4762a1bSJed Brown y[i] = 40.8000; t[i++] = 1.0000; 366*c4762a1bSJed Brown y[i] = 30.7000; t[i++] = 1.5000; 367*c4762a1bSJed Brown y[i] = 25.7000; t[i++] = 2.0000; 368*c4762a1bSJed Brown y[i] = 16.3000; t[i++] = 2.5000; 369*c4762a1bSJed Brown y[i] = 25.9900; t[i++] = 2.0000; 370*c4762a1bSJed Brown y[i] = 16.9500; t[i++] = 2.5000; 371*c4762a1bSJed Brown y[i] = 13.3500; t[i++] = 3.0000; 372*c4762a1bSJed Brown y[i] = 8.6200; t[i++] = 4.0000; 373*c4762a1bSJed Brown y[i] = 7.2000; t[i++] = 5.0000; 374*c4762a1bSJed Brown y[i] = 6.6400; t[i++] = 6.0000; 375*c4762a1bSJed Brown y[i] = 13.6900; t[i++] = 3.0000; 376*c4762a1bSJed Brown y[i] = 81.0000; t[i++] = .5000; 377*c4762a1bSJed Brown y[i] = 64.5000; t[i++] = .7500; 378*c4762a1bSJed Brown y[i] = 35.5000; t[i++] = 1.5000; 379*c4762a1bSJed Brown y[i] = 13.3100; t[i++] = 3.0000; 380*c4762a1bSJed Brown y[i] = 4.8700; t[i++] = 6.0000; 381*c4762a1bSJed Brown y[i] = 12.9400; t[i++] = 3.0000; 382*c4762a1bSJed Brown y[i] = 5.0600; t[i++] = 6.0000; 383*c4762a1bSJed Brown y[i] = 15.1900; t[i++] = 3.0000; 384*c4762a1bSJed Brown y[i] = 14.6200; t[i++] = 3.0000; 385*c4762a1bSJed Brown y[i] = 15.6400; t[i++] = 3.0000; 386*c4762a1bSJed Brown y[i] = 25.5000; t[i++] = 1.7500; 387*c4762a1bSJed Brown y[i] = 25.9500; t[i++] = 1.7500; 388*c4762a1bSJed Brown y[i] = 81.7000; t[i++] = .5000; 389*c4762a1bSJed Brown y[i] = 61.6000; t[i++] = .7500; 390*c4762a1bSJed Brown y[i] = 29.8000; t[i++] = 1.7500; 391*c4762a1bSJed Brown y[i] = 29.8100; t[i++] = 1.7500; 392*c4762a1bSJed Brown y[i] = 17.1700; t[i++] = 2.7500; 393*c4762a1bSJed Brown y[i] = 10.3900; t[i++] = 3.7500; 394*c4762a1bSJed Brown y[i] = 28.4000; t[i++] = 1.7500; 395*c4762a1bSJed Brown y[i] = 28.6900; t[i++] = 1.7500; 396*c4762a1bSJed Brown y[i] = 81.3000; t[i++] = .5000; 397*c4762a1bSJed Brown y[i] = 60.9000; t[i++] = .7500; 398*c4762a1bSJed Brown y[i] = 16.6500; t[i++] = 2.7500; 399*c4762a1bSJed Brown y[i] = 10.0500; t[i++] = 3.7500; 400*c4762a1bSJed Brown y[i] = 28.9000; t[i++] = 1.7500; 401*c4762a1bSJed Brown y[i] = 28.9500; t[i++] = 1.7500; 402*c4762a1bSJed Brown PetscFunctionReturn(0); 403*c4762a1bSJed Brown } 404*c4762a1bSJed Brown 405*c4762a1bSJed Brown PetscErrorCode TaskWorker(AppCtx *user) 406*c4762a1bSJed Brown { 407*c4762a1bSJed Brown PetscReal x[NPARAMETERS],f = 0.0; 408*c4762a1bSJed Brown PetscMPIInt tag=IDLE_TAG; 409*c4762a1bSJed Brown PetscInt index; 410*c4762a1bSJed Brown MPI_Status status; 411*c4762a1bSJed Brown PetscErrorCode ierr; 412*c4762a1bSJed Brown 413*c4762a1bSJed Brown PetscFunctionBegin; 414*c4762a1bSJed Brown /* Send check-in message to master */ 415*c4762a1bSJed Brown 416*c4762a1bSJed Brown ierr = MPI_Send(&f,1,MPIU_REAL,0,IDLE_TAG,PETSC_COMM_WORLD);CHKERRQ(ierr); 417*c4762a1bSJed Brown while (tag != DIE_TAG) { 418*c4762a1bSJed Brown ierr = MPI_Recv(x,NPARAMETERS,MPIU_REAL,0,MPI_ANY_TAG,PETSC_COMM_WORLD,&status);CHKERRQ(ierr); 419*c4762a1bSJed Brown tag = status.MPI_TAG; 420*c4762a1bSJed Brown if (tag == IDLE_TAG) { 421*c4762a1bSJed Brown ierr = MPI_Send(&f,1,MPIU_REAL,0,IDLE_TAG,PETSC_COMM_WORLD);CHKERRQ(ierr); 422*c4762a1bSJed Brown } else if (tag != DIE_TAG) { 423*c4762a1bSJed Brown index = (PetscInt)tag; 424*c4762a1bSJed Brown ierr=RunSimulation(x,index,&f,user);CHKERRQ(ierr); 425*c4762a1bSJed Brown ierr=MPI_Send(&f,1,MPIU_REAL,0,tag,PETSC_COMM_WORLD);CHKERRQ(ierr); 426*c4762a1bSJed Brown } 427*c4762a1bSJed Brown } 428*c4762a1bSJed Brown PetscFunctionReturn(0); 429*c4762a1bSJed Brown } 430*c4762a1bSJed Brown 431*c4762a1bSJed Brown PetscErrorCode RunSimulation(PetscReal *x, PetscInt i, PetscReal*f, AppCtx *user) 432*c4762a1bSJed Brown { 433*c4762a1bSJed Brown PetscReal *t = user->t; 434*c4762a1bSJed Brown PetscReal *y = user->y; 435*c4762a1bSJed Brown #if defined(PETSC_USE_REAL_SINGLE) 436*c4762a1bSJed Brown *f = y[i] - exp(-x[0]*t[i])/(x[1] + x[2]*t[i]); /* expf() for single-precision breaks this example on freebsd, valgrind errors on linux */ 437*c4762a1bSJed Brown #else 438*c4762a1bSJed Brown *f = y[i] - PetscExpScalar(-x[0]*t[i])/(x[1] + x[2]*t[i]); 439*c4762a1bSJed Brown #endif 440*c4762a1bSJed Brown return(0); 441*c4762a1bSJed Brown } 442*c4762a1bSJed Brown 443*c4762a1bSJed Brown PetscErrorCode StopWorkers(AppCtx *user) 444*c4762a1bSJed Brown { 445*c4762a1bSJed Brown PetscInt checkedin; 446*c4762a1bSJed Brown MPI_Status status; 447*c4762a1bSJed Brown PetscReal f,x[NPARAMETERS]; 448*c4762a1bSJed Brown PetscErrorCode ierr; 449*c4762a1bSJed Brown 450*c4762a1bSJed Brown PetscFunctionBegin; 451*c4762a1bSJed Brown checkedin=0; 452*c4762a1bSJed Brown while(checkedin < user->size-1) { 453*c4762a1bSJed Brown ierr = MPI_Recv(&f,1,MPIU_REAL,MPI_ANY_SOURCE,MPI_ANY_TAG,PETSC_COMM_WORLD,&status);CHKERRQ(ierr); 454*c4762a1bSJed Brown checkedin++; 455*c4762a1bSJed Brown ierr = PetscArrayzero(x,NPARAMETERS);CHKERRQ(ierr); 456*c4762a1bSJed Brown ierr = MPI_Send(x,NPARAMETERS,MPIU_REAL,status.MPI_SOURCE,DIE_TAG,PETSC_COMM_WORLD);CHKERRQ(ierr); 457*c4762a1bSJed Brown } 458*c4762a1bSJed Brown PetscFunctionReturn(0); 459*c4762a1bSJed Brown } 460*c4762a1bSJed Brown 461*c4762a1bSJed Brown /*TEST 462*c4762a1bSJed Brown 463*c4762a1bSJed Brown build: 464*c4762a1bSJed Brown requires: !complex 465*c4762a1bSJed Brown 466*c4762a1bSJed Brown test: 467*c4762a1bSJed Brown nsize: 3 468*c4762a1bSJed Brown requires: !single 469*c4762a1bSJed Brown args: -tao_smonitor -tao_max_it 100 -tao_type pounders -tao_gatol 1.e-5 470*c4762a1bSJed Brown 471*c4762a1bSJed Brown TEST*/ 472