xref: /petsc/src/tao/leastsquares/tutorials/chwirut2.c (revision e1dfdf8ee4c7821fb66aa2bc5b82c246b72b1bc1)
1c4762a1bSJed Brown /*
2c4762a1bSJed Brown    Include "petsctao.h" so that we can use TAO solvers.  Note that this
3c4762a1bSJed Brown    file automatically includes libraries such as:
4c4762a1bSJed Brown      petsc.h       - base PETSc routines   petscvec.h - vectors
5a5b23f4aSJose E. Roman      petscsys.h    - system routines        petscmat.h - matrices
6c4762a1bSJed Brown      petscis.h     - index sets            petscksp.h - Krylov subspace methods
7c4762a1bSJed Brown      petscviewer.h - viewers               petscpc.h  - preconditioners
8c4762a1bSJed Brown 
9c4762a1bSJed Brown */
10c4762a1bSJed Brown 
11c4762a1bSJed Brown #include <petsctao.h>
12c4762a1bSJed Brown 
13c4762a1bSJed Brown /*
14c4762a1bSJed Brown Description:   These data are the result of a NIST study involving
15c4762a1bSJed Brown                ultrasonic calibration.  The response variable is
16c4762a1bSJed Brown                ultrasonic response, and the predictor variable is
17c4762a1bSJed Brown                metal distance.
18c4762a1bSJed Brown 
19c4762a1bSJed Brown Reference:     Chwirut, D., NIST (197?).
20c4762a1bSJed Brown                Ultrasonic Reference Block Study.
21c4762a1bSJed Brown */
22c4762a1bSJed Brown 
/* Help text passed to PetscInitialize(); states the model being fitted. */
static char help[] = "Finds the nonlinear least-squares solution to the model \n"
                     "            y = exp[-b1*x]/(b2+b3*x)  +  e \n";
25c4762a1bSJed Brown 
26c4762a1bSJed Brown /* T
27c4762a1bSJed Brown    Concepts: TAO^Solving a system of nonlinear equations, nonlinear least squares
28c4762a1bSJed Brown    Routines: TaoCreate();
29c4762a1bSJed Brown    Routines: TaoSetType();
30c4762a1bSJed Brown    Routines: TaoSetResidualRoutine();
31c4762a1bSJed Brown    Routines: TaoSetMonitor();
32c4762a1bSJed Brown    Routines: TaoSetInitialVector();
33c4762a1bSJed Brown    Routines: TaoSetFromOptions();
34c4762a1bSJed Brown    Routines: TaoSolve();
35c4762a1bSJed Brown    Routines: TaoDestroy();
36c4762a1bSJed Brown    Processors: n
37c4762a1bSJed Brown T*/
38c4762a1bSJed Brown 
/* Problem size: number of model parameters and number of data points. */
#define NPARAMETERS   3
#define NOBSERVATIONS 214

/*
   MPI message tags used between rank 0 and the worker ranks.  Observation
   indices 0..NOBSERVATIONS-1 are themselves sent as tags, so these two
   control tags have to lie outside that range.
*/
#define IDLE_TAG 1000
#define DIE_TAG  2000
44c4762a1bSJed Brown 
45c4762a1bSJed Brown /* User-defined application context */
46c4762a1bSJed Brown typedef struct {
47c4762a1bSJed Brown   /* Working space */
48c4762a1bSJed Brown   PetscReal   t[NOBSERVATIONS];   /* array of independent variables of observation */
49c4762a1bSJed Brown   PetscReal   y[NOBSERVATIONS];   /* array of dependent variables */
50c4762a1bSJed Brown   PetscMPIInt size,rank;
51c4762a1bSJed Brown } AppCtx;
52c4762a1bSJed Brown 
53c4762a1bSJed Brown /* User provided Routines */
54c4762a1bSJed Brown PetscErrorCode InitializeData(AppCtx *user);
55c4762a1bSJed Brown PetscErrorCode FormStartingPoint(Vec);
56c4762a1bSJed Brown PetscErrorCode EvaluateFunction(Tao, Vec, Vec, void *);
57c4762a1bSJed Brown PetscErrorCode TaskWorker(AppCtx *user);
58c4762a1bSJed Brown PetscErrorCode StopWorkers(AppCtx *user);
59c4762a1bSJed Brown PetscErrorCode RunSimulation(PetscReal *x, PetscInt i, PetscReal*f, AppCtx *user);
60c4762a1bSJed Brown 
61c4762a1bSJed Brown /*--------------------------------------------------------------------*/
62c4762a1bSJed Brown int main(int argc,char **argv)
63c4762a1bSJed Brown {
64c4762a1bSJed Brown   PetscErrorCode ierr;           /* used to check for functions returning nonzeros */
65c4762a1bSJed Brown   Vec            x, f;               /* solution, function */
66c4762a1bSJed Brown   Tao            tao;                /* Tao solver context */
67c4762a1bSJed Brown   AppCtx         user;               /* user-defined work context */
68c4762a1bSJed Brown 
69c4762a1bSJed Brown    /* Initialize TAO and PETSc */
70c4762a1bSJed Brown   ierr = PetscInitialize(&argc,&argv,(char *)0,help);if (ierr) return ierr;
71c4762a1bSJed Brown   MPI_Comm_size(MPI_COMM_WORLD,&user.size);
72c4762a1bSJed Brown   MPI_Comm_rank(MPI_COMM_WORLD,&user.rank);
73c4762a1bSJed Brown   ierr = InitializeData(&user);CHKERRQ(ierr);
74c4762a1bSJed Brown 
75c4762a1bSJed Brown   /* Run optimization on rank 0 */
76c4762a1bSJed Brown   if (user.rank == 0) {
77c4762a1bSJed Brown     /* Allocate vectors */
78c4762a1bSJed Brown     ierr = VecCreateSeq(PETSC_COMM_SELF,NPARAMETERS,&x);CHKERRQ(ierr);
79c4762a1bSJed Brown     ierr = VecCreateSeq(PETSC_COMM_SELF,NOBSERVATIONS,&f);CHKERRQ(ierr);
80c4762a1bSJed Brown 
81c4762a1bSJed Brown     /* TAO code begins here */
82c4762a1bSJed Brown 
83c4762a1bSJed Brown     /* Create TAO solver and set desired solution method */
84c4762a1bSJed Brown     ierr = TaoCreate(PETSC_COMM_SELF,&tao);CHKERRQ(ierr);
85c4762a1bSJed Brown     ierr = TaoSetType(tao,TAOPOUNDERS);CHKERRQ(ierr);
86c4762a1bSJed Brown 
87c4762a1bSJed Brown     /* Set the function and Jacobian routines. */
88c4762a1bSJed Brown     ierr = FormStartingPoint(x);CHKERRQ(ierr);
89c4762a1bSJed Brown     ierr = TaoSetInitialVector(tao,x);CHKERRQ(ierr);
90c4762a1bSJed Brown     ierr = TaoSetResidualRoutine(tao,f,EvaluateFunction,(void*)&user);CHKERRQ(ierr);
91c4762a1bSJed Brown 
92c4762a1bSJed Brown     /* Check for any TAO command line arguments */
93c4762a1bSJed Brown     ierr = TaoSetFromOptions(tao);CHKERRQ(ierr);
94c4762a1bSJed Brown 
95c4762a1bSJed Brown     /* Perform the Solve */
96c4762a1bSJed Brown     ierr = TaoSolve(tao);CHKERRQ(ierr);
97c4762a1bSJed Brown 
98c4762a1bSJed Brown     /* Free TAO data structures */
99c4762a1bSJed Brown     ierr = TaoDestroy(&tao);CHKERRQ(ierr);
100c4762a1bSJed Brown 
101c4762a1bSJed Brown     /* Free PETSc data structures */
102c4762a1bSJed Brown     ierr = VecDestroy(&x);CHKERRQ(ierr);
103c4762a1bSJed Brown     ierr = VecDestroy(&f);CHKERRQ(ierr);
104c4762a1bSJed Brown     StopWorkers(&user);
105c4762a1bSJed Brown   } else {
106c4762a1bSJed Brown     TaskWorker(&user);
107c4762a1bSJed Brown   }
108c4762a1bSJed Brown   ierr = PetscFinalize();
109c4762a1bSJed Brown   return ierr;
110c4762a1bSJed Brown }
111c4762a1bSJed Brown 
112c4762a1bSJed Brown /*--------------------------------------------------------------------*/
113c4762a1bSJed Brown PetscErrorCode EvaluateFunction(Tao tao, Vec X, Vec F, void *ptr)
114c4762a1bSJed Brown {
115c4762a1bSJed Brown   AppCtx         *user = (AppCtx *)ptr;
116c4762a1bSJed Brown   PetscInt       i;
117c4762a1bSJed Brown   PetscReal      *x,*f;
118c4762a1bSJed Brown   PetscErrorCode ierr;
119c4762a1bSJed Brown 
120c4762a1bSJed Brown   PetscFunctionBegin;
121c4762a1bSJed Brown   ierr = VecGetArray(X,&x);CHKERRQ(ierr);
122c4762a1bSJed Brown   ierr = VecGetArray(F,&f);CHKERRQ(ierr);
123c4762a1bSJed Brown   if (user->size == 1) {
124c4762a1bSJed Brown     /* Single processor */
125c4762a1bSJed Brown     for (i=0;i<NOBSERVATIONS;i++) {
126c4762a1bSJed Brown       ierr = RunSimulation(x,i,&f[i],user);CHKERRQ(ierr);
127c4762a1bSJed Brown     }
128c4762a1bSJed Brown   } else {
1299dddd249SSatish Balay     /* Multiprocessor main */
130c4762a1bSJed Brown     PetscMPIInt tag;
131c4762a1bSJed Brown     PetscInt    finishedtasks,next_task,checkedin;
132c4762a1bSJed Brown     PetscReal   f_i=0.0;
133c4762a1bSJed Brown     MPI_Status  status;
134c4762a1bSJed Brown 
135c4762a1bSJed Brown     next_task=0;
136c4762a1bSJed Brown     finishedtasks=0;
137c4762a1bSJed Brown     checkedin=0;
138c4762a1bSJed Brown 
139c4762a1bSJed Brown     while (finishedtasks < NOBSERVATIONS || checkedin < user->size-1) {
140ffc4695bSBarry Smith       ierr = MPI_Recv(&f_i,1,MPIU_REAL,MPI_ANY_SOURCE,MPI_ANY_TAG,PETSC_COMM_WORLD,&status);CHKERRMPI(ierr);
141c4762a1bSJed Brown       if (status.MPI_TAG == IDLE_TAG) {
142c4762a1bSJed Brown         checkedin++;
143c4762a1bSJed Brown       } else {
144c4762a1bSJed Brown 
145c4762a1bSJed Brown         tag = status.MPI_TAG;
146c4762a1bSJed Brown         f[tag] = (PetscReal)f_i;
147c4762a1bSJed Brown         finishedtasks++;
148c4762a1bSJed Brown       }
149c4762a1bSJed Brown 
150c4762a1bSJed Brown       if (next_task<NOBSERVATIONS) {
151ffc4695bSBarry Smith         ierr = MPI_Send(x,NPARAMETERS,MPIU_REAL,status.MPI_SOURCE,next_task,PETSC_COMM_WORLD);CHKERRMPI(ierr);
152c4762a1bSJed Brown         next_task++;
153c4762a1bSJed Brown 
154c4762a1bSJed Brown       } else {
155c4762a1bSJed Brown         /* Send idle message */
156ffc4695bSBarry Smith         ierr = MPI_Send(x,NPARAMETERS,MPIU_REAL,status.MPI_SOURCE,IDLE_TAG,PETSC_COMM_WORLD);CHKERRMPI(ierr);
157c4762a1bSJed Brown       }
158c4762a1bSJed Brown     }
159c4762a1bSJed Brown   }
160c4762a1bSJed Brown   ierr = VecRestoreArray(X,&x);CHKERRQ(ierr);
161c4762a1bSJed Brown   ierr = VecRestoreArray(F,&f);CHKERRQ(ierr);
162c4762a1bSJed Brown   PetscLogFlops(6*NOBSERVATIONS);
163c4762a1bSJed Brown   PetscFunctionReturn(0);
164c4762a1bSJed Brown }
165c4762a1bSJed Brown 
166c4762a1bSJed Brown /* ------------------------------------------------------------ */
167c4762a1bSJed Brown PetscErrorCode FormStartingPoint(Vec X)
168c4762a1bSJed Brown {
169c4762a1bSJed Brown   PetscReal      *x;
170c4762a1bSJed Brown   PetscErrorCode ierr;
171c4762a1bSJed Brown 
172c4762a1bSJed Brown   PetscFunctionBegin;
173c4762a1bSJed Brown   ierr = VecGetArray(X,&x);CHKERRQ(ierr);
174c4762a1bSJed Brown   x[0] = 0.15;
175c4762a1bSJed Brown   x[1] = 0.008;
176c4762a1bSJed Brown   x[2] = 0.010;
177c4762a1bSJed Brown   VecRestoreArray(X,&x);CHKERRQ(ierr);
178c4762a1bSJed Brown   PetscFunctionReturn(0);
179c4762a1bSJed Brown }
180c4762a1bSJed Brown 
181c4762a1bSJed Brown /* ---------------------------------------------------------------------- */
182c4762a1bSJed Brown PetscErrorCode InitializeData(AppCtx *user)
183c4762a1bSJed Brown {
184c4762a1bSJed Brown   PetscReal *t=user->t,*y=user->y;
185c4762a1bSJed Brown   PetscInt  i=0;
186c4762a1bSJed Brown 
187c4762a1bSJed Brown   PetscFunctionBegin;
188c4762a1bSJed Brown   y[i] =   92.9000;   t[i++] =  0.5000;
189c4762a1bSJed Brown   y[i] =    78.7000;  t[i++] =   0.6250;
190c4762a1bSJed Brown   y[i] =    64.2000;  t[i++] =   0.7500;
191c4762a1bSJed Brown   y[i] =    64.9000;  t[i++] =   0.8750;
192c4762a1bSJed Brown   y[i] =    57.1000;  t[i++] =   1.0000;
193c4762a1bSJed Brown   y[i] =    43.3000;  t[i++] =   1.2500;
194c4762a1bSJed Brown   y[i] =    31.1000;   t[i++] =  1.7500;
195c4762a1bSJed Brown   y[i] =    23.6000;   t[i++] =  2.2500;
196c4762a1bSJed Brown   y[i] =    31.0500;   t[i++] =  1.7500;
197c4762a1bSJed Brown   y[i] =    23.7750;   t[i++] =  2.2500;
198c4762a1bSJed Brown   y[i] =    17.7375;   t[i++] =  2.7500;
199c4762a1bSJed Brown   y[i] =    13.8000;   t[i++] =  3.2500;
200c4762a1bSJed Brown   y[i] =    11.5875;   t[i++] =  3.7500;
201c4762a1bSJed Brown   y[i] =     9.4125;   t[i++] =  4.2500;
202c4762a1bSJed Brown   y[i] =     7.7250;   t[i++] =  4.7500;
203c4762a1bSJed Brown   y[i] =     7.3500;   t[i++] =  5.2500;
204c4762a1bSJed Brown   y[i] =     8.0250;   t[i++] =  5.7500;
205c4762a1bSJed Brown   y[i] =    90.6000;   t[i++] =  0.5000;
206c4762a1bSJed Brown   y[i] =    76.9000;   t[i++] =  0.6250;
207c4762a1bSJed Brown   y[i] =    71.6000;   t[i++] = 0.7500;
208c4762a1bSJed Brown   y[i] =    63.6000;   t[i++] =  0.8750;
209c4762a1bSJed Brown   y[i] =    54.0000;   t[i++] =  1.0000;
210c4762a1bSJed Brown   y[i] =    39.2000;   t[i++] =  1.2500;
211c4762a1bSJed Brown   y[i] =    29.3000;   t[i++] = 1.7500;
212c4762a1bSJed Brown   y[i] =    21.4000;   t[i++] =  2.2500;
213c4762a1bSJed Brown   y[i] =    29.1750;   t[i++] =  1.7500;
214c4762a1bSJed Brown   y[i] =    22.1250;   t[i++] =  2.2500;
215c4762a1bSJed Brown   y[i] =    17.5125;   t[i++] =  2.7500;
216c4762a1bSJed Brown   y[i] =    14.2500;   t[i++] =  3.2500;
217c4762a1bSJed Brown   y[i] =     9.4500;   t[i++] =  3.7500;
218c4762a1bSJed Brown   y[i] =     9.1500;   t[i++] =  4.2500;
219c4762a1bSJed Brown   y[i] =     7.9125;   t[i++] =  4.7500;
220c4762a1bSJed Brown   y[i] =     8.4750;   t[i++] =  5.2500;
221c4762a1bSJed Brown   y[i] =     6.1125;   t[i++] =  5.7500;
222c4762a1bSJed Brown   y[i] =    80.0000;   t[i++] =  0.5000;
223c4762a1bSJed Brown   y[i] =    79.0000;   t[i++] =  0.6250;
224c4762a1bSJed Brown   y[i] =    63.8000;   t[i++] =  0.7500;
225c4762a1bSJed Brown   y[i] =    57.2000;   t[i++] =  0.8750;
226c4762a1bSJed Brown   y[i] =    53.2000;   t[i++] =  1.0000;
227c4762a1bSJed Brown   y[i] =   42.5000;   t[i++] =  1.2500;
228c4762a1bSJed Brown   y[i] =   26.8000;   t[i++] =  1.7500;
229c4762a1bSJed Brown   y[i] =    20.4000;   t[i++] =  2.2500;
230c4762a1bSJed Brown   y[i] =    26.8500;  t[i++] =   1.7500;
231c4762a1bSJed Brown   y[i] =    21.0000;  t[i++] =   2.2500;
232c4762a1bSJed Brown   y[i] =    16.4625;  t[i++] =   2.7500;
233c4762a1bSJed Brown   y[i] =    12.5250;  t[i++] =   3.2500;
234c4762a1bSJed Brown   y[i] =    10.5375;  t[i++] =   3.7500;
235c4762a1bSJed Brown   y[i] =     8.5875;  t[i++] =   4.2500;
236c4762a1bSJed Brown   y[i] =     7.1250;  t[i++] =   4.7500;
237c4762a1bSJed Brown   y[i] =     6.1125;  t[i++] =   5.2500;
238c4762a1bSJed Brown   y[i] =     5.9625;  t[i++] =   5.7500;
239c4762a1bSJed Brown   y[i] =    74.1000;  t[i++] =   0.5000;
240c4762a1bSJed Brown   y[i] =    67.3000;  t[i++] =   0.6250;
241c4762a1bSJed Brown   y[i] =    60.8000;  t[i++] =   0.7500;
242c4762a1bSJed Brown   y[i] =    55.5000;  t[i++] =   0.8750;
243c4762a1bSJed Brown   y[i] =    50.3000;  t[i++] =   1.0000;
244c4762a1bSJed Brown   y[i] =    41.0000;  t[i++] =   1.2500;
245c4762a1bSJed Brown   y[i] =    29.4000;  t[i++] =   1.7500;
246c4762a1bSJed Brown   y[i] =    20.4000;  t[i++] =   2.2500;
247c4762a1bSJed Brown   y[i] =    29.3625;  t[i++] =   1.7500;
248c4762a1bSJed Brown   y[i] =    21.1500;  t[i++] =   2.2500;
249c4762a1bSJed Brown   y[i] =    16.7625;  t[i++] =   2.7500;
250c4762a1bSJed Brown   y[i] =    13.2000;  t[i++] =   3.2500;
251c4762a1bSJed Brown   y[i] =    10.8750;  t[i++] =   3.7500;
252c4762a1bSJed Brown   y[i] =     8.1750;  t[i++] =   4.2500;
253c4762a1bSJed Brown   y[i] =     7.3500;  t[i++] =   4.7500;
254c4762a1bSJed Brown   y[i] =     5.9625;  t[i++] =  5.2500;
255c4762a1bSJed Brown   y[i] =     5.6250;  t[i++] =   5.7500;
256c4762a1bSJed Brown   y[i] =    81.5000;  t[i++] =    .5000;
257c4762a1bSJed Brown   y[i] =    62.4000;  t[i++] =    .7500;
258c4762a1bSJed Brown   y[i] =    32.5000;  t[i++] =   1.5000;
259c4762a1bSJed Brown   y[i] =    12.4100;  t[i++] =   3.0000;
260c4762a1bSJed Brown   y[i] =    13.1200;  t[i++] =   3.0000;
261c4762a1bSJed Brown   y[i] =    15.5600;  t[i++] =   3.0000;
262c4762a1bSJed Brown   y[i] =     5.6300;  t[i++] =   6.0000;
263c4762a1bSJed Brown   y[i] =    78.0000;   t[i++] =   .5000;
264c4762a1bSJed Brown   y[i] =    59.9000;  t[i++] =    .7500;
265c4762a1bSJed Brown   y[i] =    33.2000;  t[i++] =   1.5000;
266c4762a1bSJed Brown   y[i] =    13.8400;  t[i++] =   3.0000;
267c4762a1bSJed Brown   y[i] =    12.7500;  t[i++] =   3.0000;
268c4762a1bSJed Brown   y[i] =    14.6200;  t[i++] =   3.0000;
269c4762a1bSJed Brown   y[i] =     3.9400;  t[i++] =   6.0000;
270c4762a1bSJed Brown   y[i] =    76.8000;  t[i++] =    .5000;
271c4762a1bSJed Brown   y[i] =    61.0000;  t[i++] =    .7500;
272c4762a1bSJed Brown   y[i] =    32.9000;  t[i++] =   1.5000;
273c4762a1bSJed Brown   y[i] =   13.8700;   t[i++] = 3.0000;
274c4762a1bSJed Brown   y[i] =    11.8100;  t[i++] =   3.0000;
275c4762a1bSJed Brown   y[i] =    13.3100;  t[i++] =   3.0000;
276c4762a1bSJed Brown   y[i] =     5.4400;  t[i++] =   6.0000;
277c4762a1bSJed Brown   y[i] =    78.0000;  t[i++] =    .5000;
278c4762a1bSJed Brown   y[i] =    63.5000;  t[i++] =    .7500;
279c4762a1bSJed Brown   y[i] =    33.8000;  t[i++] =   1.5000;
280c4762a1bSJed Brown   y[i] =    12.5600;  t[i++] =   3.0000;
281c4762a1bSJed Brown   y[i] =     5.6300;  t[i++] =   6.0000;
282c4762a1bSJed Brown   y[i] =    12.7500;  t[i++] =   3.0000;
283c4762a1bSJed Brown   y[i] =    13.1200;  t[i++] =   3.0000;
284c4762a1bSJed Brown   y[i] =     5.4400;  t[i++] =   6.0000;
285c4762a1bSJed Brown   y[i] =    76.8000;  t[i++] =    .5000;
286c4762a1bSJed Brown   y[i] =    60.0000;  t[i++] =    .7500;
287c4762a1bSJed Brown   y[i] =    47.8000;  t[i++] =   1.0000;
288c4762a1bSJed Brown   y[i] =    32.0000;  t[i++] =   1.5000;
289c4762a1bSJed Brown   y[i] =    22.2000;  t[i++] =   2.0000;
290c4762a1bSJed Brown   y[i] =    22.5700;  t[i++] =   2.0000;
291c4762a1bSJed Brown   y[i] =    18.8200;  t[i++] =   2.5000;
292c4762a1bSJed Brown   y[i] =    13.9500;  t[i++] =   3.0000;
293c4762a1bSJed Brown   y[i] =    11.2500;  t[i++] =   4.0000;
294c4762a1bSJed Brown   y[i] =     9.0000;  t[i++] =   5.0000;
295c4762a1bSJed Brown   y[i] =     6.6700;  t[i++] =   6.0000;
296c4762a1bSJed Brown   y[i] =    75.8000;  t[i++] =    .5000;
297c4762a1bSJed Brown   y[i] =    62.0000;  t[i++] =    .7500;
298c4762a1bSJed Brown   y[i] =    48.8000;  t[i++] =   1.0000;
299c4762a1bSJed Brown   y[i] =    35.2000;  t[i++] =   1.5000;
300c4762a1bSJed Brown   y[i] =    20.0000;  t[i++] =   2.0000;
301c4762a1bSJed Brown   y[i] =    20.3200;  t[i++] =   2.0000;
302c4762a1bSJed Brown   y[i] =    19.3100;  t[i++] =   2.5000;
303c4762a1bSJed Brown   y[i] =    12.7500;  t[i++] =   3.0000;
304c4762a1bSJed Brown   y[i] =    10.4200;  t[i++] =   4.0000;
305c4762a1bSJed Brown   y[i] =     7.3100;  t[i++] =   5.0000;
306c4762a1bSJed Brown   y[i] =     7.4200;  t[i++] =   6.0000;
307c4762a1bSJed Brown   y[i] =    70.5000;  t[i++] =    .5000;
308c4762a1bSJed Brown   y[i] =    59.5000;  t[i++] =    .7500;
309c4762a1bSJed Brown   y[i] =    48.5000;  t[i++] =   1.0000;
310c4762a1bSJed Brown   y[i] =    35.8000;  t[i++] =   1.5000;
311c4762a1bSJed Brown   y[i] =    21.0000;  t[i++] =   2.0000;
312c4762a1bSJed Brown   y[i] =    21.6700;  t[i++] =   2.0000;
313c4762a1bSJed Brown   y[i] =    21.0000;  t[i++] =   2.5000;
314c4762a1bSJed Brown   y[i] =    15.6400;  t[i++] =   3.0000;
315c4762a1bSJed Brown   y[i] =     8.1700;  t[i++] =   4.0000;
316c4762a1bSJed Brown   y[i] =     8.5500;  t[i++] =   5.0000;
317c4762a1bSJed Brown   y[i] =    10.1200;  t[i++] =   6.0000;
318c4762a1bSJed Brown   y[i] =    78.0000;  t[i++] =    .5000;
319c4762a1bSJed Brown   y[i] =    66.0000;  t[i++] =    .6250;
320c4762a1bSJed Brown   y[i] =    62.0000;  t[i++] =    .7500;
321c4762a1bSJed Brown   y[i] =    58.0000;  t[i++] =    .8750;
322c4762a1bSJed Brown   y[i] =    47.7000;  t[i++] =   1.0000;
323c4762a1bSJed Brown   y[i] =    37.8000;  t[i++] =   1.2500;
324c4762a1bSJed Brown   y[i] =    20.2000;  t[i++] =   2.2500;
325c4762a1bSJed Brown   y[i] =    21.0700;  t[i++] =   2.2500;
326c4762a1bSJed Brown   y[i] =    13.8700;  t[i++] =   2.7500;
327c4762a1bSJed Brown   y[i] =     9.6700;  t[i++] =   3.2500;
328c4762a1bSJed Brown   y[i] =     7.7600;  t[i++] =   3.7500;
329c4762a1bSJed Brown   y[i] =    5.4400;   t[i++] =  4.2500;
330c4762a1bSJed Brown   y[i] =    4.8700;   t[i++] =  4.7500;
331c4762a1bSJed Brown   y[i] =     4.0100;  t[i++] =   5.2500;
332c4762a1bSJed Brown   y[i] =     3.7500;  t[i++] =   5.7500;
333c4762a1bSJed Brown   y[i] =    24.1900;  t[i++] =   3.0000;
334c4762a1bSJed Brown   y[i] =    25.7600;  t[i++] =   3.0000;
335c4762a1bSJed Brown   y[i] =    18.0700;  t[i++] =   3.0000;
336c4762a1bSJed Brown   y[i] =    11.8100;  t[i++] =   3.0000;
337c4762a1bSJed Brown   y[i] =    12.0700;  t[i++] =   3.0000;
338c4762a1bSJed Brown   y[i] =    16.1200;  t[i++] =   3.0000;
339c4762a1bSJed Brown   y[i] =    70.8000;  t[i++] =    .5000;
340c4762a1bSJed Brown   y[i] =    54.7000;  t[i++] =    .7500;
341c4762a1bSJed Brown   y[i] =    48.0000;  t[i++] =   1.0000;
342c4762a1bSJed Brown   y[i] =    39.8000;  t[i++] =   1.5000;
343c4762a1bSJed Brown   y[i] =    29.8000;  t[i++] =   2.0000;
344c4762a1bSJed Brown   y[i] =    23.7000;  t[i++] =   2.5000;
345c4762a1bSJed Brown   y[i] =    29.6200;  t[i++] =   2.0000;
346c4762a1bSJed Brown   y[i] =    23.8100;  t[i++] =   2.5000;
347c4762a1bSJed Brown   y[i] =    17.7000;  t[i++] =   3.0000;
348c4762a1bSJed Brown   y[i] =    11.5500;  t[i++] =   4.0000;
349c4762a1bSJed Brown   y[i] =    12.0700;  t[i++] =   5.0000;
350c4762a1bSJed Brown   y[i] =     8.7400;  t[i++] =   6.0000;
351c4762a1bSJed Brown   y[i] =    80.7000;  t[i++] =    .5000;
352c4762a1bSJed Brown   y[i] =    61.3000;  t[i++] =    .7500;
353c4762a1bSJed Brown   y[i] =    47.5000;  t[i++] =   1.0000;
354c4762a1bSJed Brown    y[i] =   29.0000;  t[i++] =   1.5000;
355c4762a1bSJed Brown    y[i] =   24.0000;  t[i++] =   2.0000;
356c4762a1bSJed Brown   y[i] =    17.7000;  t[i++] =   2.5000;
357c4762a1bSJed Brown   y[i] =    24.5600;  t[i++] =   2.0000;
358c4762a1bSJed Brown   y[i] =    18.6700;  t[i++] =   2.5000;
359c4762a1bSJed Brown    y[i] =   16.2400;  t[i++] =   3.0000;
360c4762a1bSJed Brown   y[i] =     8.7400;  t[i++] =   4.0000;
361c4762a1bSJed Brown   y[i] =     7.8700;  t[i++] =   5.0000;
362c4762a1bSJed Brown   y[i] =     8.5100;  t[i++] =   6.0000;
363c4762a1bSJed Brown   y[i] =    66.7000;  t[i++] =    .5000;
364c4762a1bSJed Brown   y[i] =    59.2000;  t[i++] =    .7500;
365c4762a1bSJed Brown   y[i] =    40.8000;  t[i++] =   1.0000;
366c4762a1bSJed Brown   y[i] =    30.7000;  t[i++] =   1.5000;
367c4762a1bSJed Brown   y[i] =    25.7000;  t[i++] =   2.0000;
368c4762a1bSJed Brown   y[i] =    16.3000;  t[i++] =   2.5000;
369c4762a1bSJed Brown   y[i] =    25.9900;  t[i++] =   2.0000;
370c4762a1bSJed Brown   y[i] =    16.9500;  t[i++] =   2.5000;
371c4762a1bSJed Brown   y[i] =    13.3500;  t[i++] =   3.0000;
372c4762a1bSJed Brown   y[i] =     8.6200;  t[i++] =   4.0000;
373c4762a1bSJed Brown   y[i] =     7.2000;  t[i++] =   5.0000;
374c4762a1bSJed Brown   y[i] =     6.6400;  t[i++] =   6.0000;
375c4762a1bSJed Brown   y[i] =    13.6900;  t[i++] =   3.0000;
376c4762a1bSJed Brown   y[i] =    81.0000;  t[i++] =    .5000;
377c4762a1bSJed Brown   y[i] =    64.5000;  t[i++] =    .7500;
378c4762a1bSJed Brown   y[i] =    35.5000;  t[i++] =   1.5000;
379c4762a1bSJed Brown    y[i] =   13.3100;  t[i++] =   3.0000;
380c4762a1bSJed Brown   y[i] =     4.8700;  t[i++] =   6.0000;
381c4762a1bSJed Brown   y[i] =    12.9400;  t[i++] =   3.0000;
382c4762a1bSJed Brown   y[i] =     5.0600;  t[i++] =   6.0000;
383c4762a1bSJed Brown   y[i] =    15.1900;  t[i++] =   3.0000;
384c4762a1bSJed Brown   y[i] =    14.6200;  t[i++] =   3.0000;
385c4762a1bSJed Brown   y[i] =    15.6400;  t[i++] =   3.0000;
386c4762a1bSJed Brown   y[i] =    25.5000;  t[i++] =   1.7500;
387c4762a1bSJed Brown   y[i] =    25.9500;  t[i++] =   1.7500;
388c4762a1bSJed Brown   y[i] =    81.7000;  t[i++] =    .5000;
389c4762a1bSJed Brown   y[i] =    61.6000;  t[i++] =    .7500;
390c4762a1bSJed Brown   y[i] =    29.8000;  t[i++] =   1.7500;
391c4762a1bSJed Brown   y[i] =    29.8100;  t[i++] =   1.7500;
392c4762a1bSJed Brown   y[i] =    17.1700;  t[i++] =   2.7500;
393c4762a1bSJed Brown   y[i] =    10.3900;  t[i++] =   3.7500;
394c4762a1bSJed Brown   y[i] =    28.4000;  t[i++] =   1.7500;
395c4762a1bSJed Brown   y[i] =    28.6900;  t[i++] =   1.7500;
396c4762a1bSJed Brown   y[i] =    81.3000;  t[i++] =    .5000;
397c4762a1bSJed Brown   y[i] =    60.9000;  t[i++] =    .7500;
398c4762a1bSJed Brown   y[i] =    16.6500;  t[i++] =   2.7500;
399c4762a1bSJed Brown   y[i] =    10.0500;  t[i++] =   3.7500;
400c4762a1bSJed Brown   y[i] =    28.9000;  t[i++] =   1.7500;
401c4762a1bSJed Brown   y[i] =    28.9500;  t[i++] =   1.7500;
402c4762a1bSJed Brown   PetscFunctionReturn(0);
403c4762a1bSJed Brown }
404c4762a1bSJed Brown 
405c4762a1bSJed Brown PetscErrorCode TaskWorker(AppCtx *user)
406c4762a1bSJed Brown {
407c4762a1bSJed Brown   PetscReal      x[NPARAMETERS],f = 0.0;
408c4762a1bSJed Brown   PetscMPIInt    tag=IDLE_TAG;
409c4762a1bSJed Brown   PetscInt       index;
410c4762a1bSJed Brown   MPI_Status     status;
411c4762a1bSJed Brown   PetscErrorCode ierr;
412c4762a1bSJed Brown 
413c4762a1bSJed Brown   PetscFunctionBegin;
4149dddd249SSatish Balay   /* Send check-in message to rank-0 */
415c4762a1bSJed Brown 
416ffc4695bSBarry Smith   ierr = MPI_Send(&f,1,MPIU_REAL,0,IDLE_TAG,PETSC_COMM_WORLD);CHKERRMPI(ierr);
417c4762a1bSJed Brown   while (tag != DIE_TAG) {
418ffc4695bSBarry Smith     ierr = MPI_Recv(x,NPARAMETERS,MPIU_REAL,0,MPI_ANY_TAG,PETSC_COMM_WORLD,&status);CHKERRMPI(ierr);
419c4762a1bSJed Brown     tag = status.MPI_TAG;
420c4762a1bSJed Brown     if (tag == IDLE_TAG) {
421ffc4695bSBarry Smith       ierr = MPI_Send(&f,1,MPIU_REAL,0,IDLE_TAG,PETSC_COMM_WORLD);CHKERRMPI(ierr);
422c4762a1bSJed Brown     } else if (tag != DIE_TAG) {
423c4762a1bSJed Brown       index = (PetscInt)tag;
424c4762a1bSJed Brown       ierr = RunSimulation(x,index,&f,user);CHKERRQ(ierr);
42555b25c41SPierre Jolivet       ierr = MPI_Send(&f,1,MPIU_REAL,0,tag,PETSC_COMM_WORLD);CHKERRMPI(ierr);
426c4762a1bSJed Brown     }
427c4762a1bSJed Brown   }
428c4762a1bSJed Brown   PetscFunctionReturn(0);
429c4762a1bSJed Brown }
430c4762a1bSJed Brown 
431c4762a1bSJed Brown PetscErrorCode RunSimulation(PetscReal *x, PetscInt i, PetscReal*f, AppCtx *user)
432c4762a1bSJed Brown {
433c4762a1bSJed Brown   PetscReal *t = user->t;
434c4762a1bSJed Brown   PetscReal *y = user->y;
435c4762a1bSJed Brown #if defined(PETSC_USE_REAL_SINGLE)
436*e1dfdf8eSBarry Smith   *f = y[i] - exp(-x[0]*t[i])/(x[1] + x[2]*t[i]); /* expf() for single-precision breaks this example on Freebsd, Valgrind errors on Linux */
437c4762a1bSJed Brown #else
438c4762a1bSJed Brown   *f = y[i] - PetscExpScalar(-x[0]*t[i])/(x[1] + x[2]*t[i]);
439c4762a1bSJed Brown #endif
440c4762a1bSJed Brown   return(0);
441c4762a1bSJed Brown }
442c4762a1bSJed Brown 
443c4762a1bSJed Brown PetscErrorCode StopWorkers(AppCtx *user)
444c4762a1bSJed Brown {
445c4762a1bSJed Brown   PetscInt       checkedin;
446c4762a1bSJed Brown   MPI_Status     status;
447c4762a1bSJed Brown   PetscReal      f,x[NPARAMETERS];
448c4762a1bSJed Brown   PetscErrorCode ierr;
449c4762a1bSJed Brown 
450c4762a1bSJed Brown   PetscFunctionBegin;
451c4762a1bSJed Brown   checkedin=0;
452c4762a1bSJed Brown   while (checkedin < user->size-1) {
453ffc4695bSBarry Smith     ierr = MPI_Recv(&f,1,MPIU_REAL,MPI_ANY_SOURCE,MPI_ANY_TAG,PETSC_COMM_WORLD,&status);CHKERRMPI(ierr);
454c4762a1bSJed Brown     checkedin++;
455c4762a1bSJed Brown     ierr = PetscArrayzero(x,NPARAMETERS);CHKERRQ(ierr);
456ffc4695bSBarry Smith     ierr = MPI_Send(x,NPARAMETERS,MPIU_REAL,status.MPI_SOURCE,DIE_TAG,PETSC_COMM_WORLD);CHKERRMPI(ierr);
457c4762a1bSJed Brown   }
458c4762a1bSJed Brown   PetscFunctionReturn(0);
459c4762a1bSJed Brown }
460c4762a1bSJed Brown 
461c4762a1bSJed Brown /*TEST
462c4762a1bSJed Brown 
463c4762a1bSJed Brown    build:
464c4762a1bSJed Brown       requires: !complex
465c4762a1bSJed Brown 
466c4762a1bSJed Brown    test:
467c4762a1bSJed Brown       nsize: 3
468c4762a1bSJed Brown       requires: !single
469c4762a1bSJed Brown       args: -tao_smonitor -tao_max_it 100 -tao_type pounders -tao_gatol 1.e-5
470c4762a1bSJed Brown 
471c4762a1bSJed Brown TEST*/
472