1c4762a1bSJed Brown static char help[] = "Demonstrates automatic, matrix-free Jacobian generation using ADOL-C for a time-dependent PDE in 2d, solved using implicit timestepping.\n"; 2c4762a1bSJed Brown 3c4762a1bSJed Brown /* 4c4762a1bSJed Brown Concepts: TS^time-dependent nonlinear problems 5c4762a1bSJed Brown Concepts: Automatic differentiation using ADOL-C 6c4762a1bSJed Brown Concepts: Matrix-free methods 7c4762a1bSJed Brown */ 8c4762a1bSJed Brown /* 9c4762a1bSJed Brown REQUIRES configuration of PETSc with option --download-adolc. 10c4762a1bSJed Brown 11c4762a1bSJed Brown For documentation on ADOL-C, see 12c4762a1bSJed Brown $PETSC_ARCH/externalpackages/ADOL-C-2.6.0/ADOL-C/doc/adolc-manual.pdf 13c4762a1bSJed Brown */ 14c4762a1bSJed Brown /* ------------------------------------------------------------------------ 15c4762a1bSJed Brown See ../advection-diffusion-reaction/ex5 for a description of the problem 16c4762a1bSJed Brown ------------------------------------------------------------------------- */ 17c4762a1bSJed Brown 18c4762a1bSJed Brown #include <petscdmda.h> 19c4762a1bSJed Brown #include <petscts.h> 20c4762a1bSJed Brown #include "adolc-utils/init.cxx" 21c4762a1bSJed Brown #include "adolc-utils/matfree.cxx" 22c4762a1bSJed Brown #include <adolc/adolc.h> 23c4762a1bSJed Brown 24c4762a1bSJed Brown /* (Passive) field for the two variables */ 25c4762a1bSJed Brown typedef struct { 26c4762a1bSJed Brown PetscScalar u,v; 27c4762a1bSJed Brown } Field; 28c4762a1bSJed Brown 29c4762a1bSJed Brown /* Active field for the two variables */ 30c4762a1bSJed Brown typedef struct { 31c4762a1bSJed Brown adouble u,v; 32c4762a1bSJed Brown } AField; 33c4762a1bSJed Brown 34c4762a1bSJed Brown /* Application context */ 35c4762a1bSJed Brown typedef struct { 36c4762a1bSJed Brown PetscReal D1,D2,gamma,kappa; 37c4762a1bSJed Brown AField **u_a,**f_a; 38c4762a1bSJed Brown AdolcCtx *adctx; /* Automatic differentation support */ 39c4762a1bSJed Brown } AppCtx; 40c4762a1bSJed Brown 41c4762a1bSJed Brown extern PetscErrorCode InitialConditions(DM da,Vec U); 42c4762a1bSJed Brown extern PetscErrorCode InitializeLambda(DM da,Vec lambda,PetscReal x,PetscReal y); 43c4762a1bSJed Brown extern PetscErrorCode IFunctionLocalPassive(DMDALocalInfo *info,PetscReal t,Field**u,Field**udot,Field**f,void *ptr); 44c4762a1bSJed Brown extern PetscErrorCode IFunctionActive(TS ts,PetscReal ftime,Vec U,Vec Udot,Vec F,void *ptr); 45c4762a1bSJed Brown extern PetscErrorCode IJacobianMatFree(TS ts,PetscReal t,Vec X,Vec Xdot,PetscReal a,Mat A_shell,Mat B,void *ctx); 46c4762a1bSJed Brown 47c4762a1bSJed Brown int main(int argc,char **argv) 48c4762a1bSJed Brown { 49c4762a1bSJed Brown TS ts; /* ODE integrator */ 50c4762a1bSJed Brown Vec x,r; /* solution, residual */ 51c4762a1bSJed Brown PetscErrorCode ierr; 52c4762a1bSJed Brown DM da; 53c4762a1bSJed Brown AppCtx appctx; /* Application context */ 54c4762a1bSJed Brown AdolcMatCtx matctx; /* Matrix (free) context */ 55c4762a1bSJed Brown Vec lambda[1]; 56c4762a1bSJed Brown PetscBool forwardonly=PETSC_FALSE; 57c4762a1bSJed Brown Mat A; /* (Matrix free) Jacobian matrix */ 58c4762a1bSJed Brown PetscInt gxm,gym; 59c4762a1bSJed Brown 60c4762a1bSJed Brown /* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - 61c4762a1bSJed Brown Initialize program 62c4762a1bSJed Brown - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */ 63c4762a1bSJed Brown ierr = PetscInitialize(&argc,&argv,NULL,help);if (ierr) return ierr; 64c4762a1bSJed Brown ierr = PetscOptionsGetBool(NULL,NULL,"-forwardonly",&forwardonly,NULL);CHKERRQ(ierr); 65c4762a1bSJed Brown PetscFunctionBeginUser; 66c4762a1bSJed Brown appctx.D1 = 8.0e-5; 67c4762a1bSJed Brown appctx.D2 = 4.0e-5; 68c4762a1bSJed Brown appctx.gamma = .024; 69c4762a1bSJed Brown appctx.kappa = .06; 70c4762a1bSJed Brown ierr = PetscLogEventRegister("df/dx forward",MAT_CLASSID,&matctx.event1);CHKERRQ(ierr); 71c4762a1bSJed Brown ierr = PetscLogEventRegister("df/d(xdot) forward",MAT_CLASSID,&matctx.event2);CHKERRQ(ierr); 72c4762a1bSJed Brown ierr = PetscLogEventRegister("df/dx reverse",MAT_CLASSID,&matctx.event3);CHKERRQ(ierr); 73c4762a1bSJed Brown ierr = PetscLogEventRegister("df/d(xdot) reverse",MAT_CLASSID,&matctx.event4);CHKERRQ(ierr); 74c4762a1bSJed Brown 75c4762a1bSJed Brown /* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - 76c4762a1bSJed Brown Create distributed array (DMDA) to manage parallel grid and vectors 77c4762a1bSJed Brown - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */ 78c4762a1bSJed Brown ierr = DMDACreate2d(PETSC_COMM_WORLD,DM_BOUNDARY_PERIODIC,DM_BOUNDARY_PERIODIC,DMDA_STENCIL_STAR,65,65,PETSC_DECIDE,PETSC_DECIDE,2,1,NULL,NULL,&da);CHKERRQ(ierr); 79c4762a1bSJed Brown ierr = DMSetFromOptions(da);CHKERRQ(ierr); 80c4762a1bSJed Brown ierr = DMSetUp(da);CHKERRQ(ierr); 81c4762a1bSJed Brown ierr = DMDASetFieldName(da,0,"u");CHKERRQ(ierr); 82c4762a1bSJed Brown ierr = DMDASetFieldName(da,1,"v");CHKERRQ(ierr); 83c4762a1bSJed Brown 84c4762a1bSJed Brown /* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - 85c4762a1bSJed Brown Extract global vectors from DMDA; then duplicate for remaining 86c4762a1bSJed Brown vectors that are the same types 87c4762a1bSJed Brown - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */ 88c4762a1bSJed Brown ierr = DMCreateGlobalVector(da,&x);CHKERRQ(ierr); 89c4762a1bSJed Brown ierr = VecDuplicate(x,&r);CHKERRQ(ierr); 90c4762a1bSJed Brown 91c4762a1bSJed Brown /* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - 92c4762a1bSJed Brown Create matrix free context and specify usage of PETSc-ADOL-C drivers 93c4762a1bSJed Brown - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */ 94c4762a1bSJed Brown ierr = DMSetMatType(da,MATSHELL);CHKERRQ(ierr); 95c4762a1bSJed Brown ierr = DMCreateMatrix(da,&A);CHKERRQ(ierr); 96c4762a1bSJed Brown ierr = MatShellSetContext(A,&matctx);CHKERRQ(ierr); 97c4762a1bSJed Brown ierr = MatShellSetOperation(A,MATOP_MULT,(void (*)(void))PetscAdolcIJacobianVectorProductIDMass);CHKERRQ(ierr); 98c4762a1bSJed Brown ierr = MatShellSetOperation(A,MATOP_MULT_TRANSPOSE,(void (*)(void))PetscAdolcIJacobianTransposeVectorProductIDMass);CHKERRQ(ierr); 99c4762a1bSJed Brown ierr = VecDuplicate(x,&matctx.X);CHKERRQ(ierr); 100c4762a1bSJed Brown ierr = VecDuplicate(x,&matctx.Xdot);CHKERRQ(ierr); 101c4762a1bSJed Brown ierr = DMGetLocalVector(da,&matctx.localX0);CHKERRQ(ierr); 102c4762a1bSJed Brown 103c4762a1bSJed Brown /* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - 104c4762a1bSJed Brown Create timestepping solver context 105c4762a1bSJed Brown - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */ 106c4762a1bSJed Brown ierr = TSCreate(PETSC_COMM_WORLD,&ts);CHKERRQ(ierr); 107c4762a1bSJed Brown ierr = TSSetType(ts,TSCN);CHKERRQ(ierr); 108c4762a1bSJed Brown ierr = TSSetDM(ts,da);CHKERRQ(ierr); 109c4762a1bSJed Brown ierr = TSSetProblemType(ts,TS_NONLINEAR);CHKERRQ(ierr); 110c4762a1bSJed Brown ierr = DMDATSSetIFunctionLocal(da,INSERT_VALUES,(DMDATSIFunctionLocal)IFunctionLocalPassive,&appctx);CHKERRQ(ierr); 111c4762a1bSJed Brown 112c4762a1bSJed Brown /* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - 113c4762a1bSJed Brown Some data required for matrix-free context 114c4762a1bSJed Brown - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */ 115c4762a1bSJed Brown ierr = DMDAGetGhostCorners(da,NULL,NULL,NULL,&gxm,&gym,NULL);CHKERRQ(ierr); 116c4762a1bSJed Brown matctx.m = 2*gxm*gym;matctx.n = 2*gxm*gym; /* Number of dependent and independent variables */ 117c4762a1bSJed Brown matctx.flg = PETSC_FALSE; /* Flag for reverse mode */ 118c4762a1bSJed Brown matctx.tag1 = 1; /* Tape identifier */ 119c4762a1bSJed Brown 120c4762a1bSJed Brown /* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - 121c4762a1bSJed Brown Trace function just once 122c4762a1bSJed Brown - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */ 123c4762a1bSJed Brown ierr = PetscNew(&appctx.adctx);CHKERRQ(ierr); 124c4762a1bSJed Brown ierr = IFunctionActive(ts,1.,x,matctx.Xdot,r,&appctx);CHKERRQ(ierr); 125c4762a1bSJed Brown ierr = PetscFree(appctx.adctx);CHKERRQ(ierr); 126c4762a1bSJed Brown 127c4762a1bSJed Brown /* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - 128c4762a1bSJed Brown Set Jacobian. In this case, IJacobian simply acts to pass context 129c4762a1bSJed Brown information to the matrix-free Jacobian vector product. 130c4762a1bSJed Brown - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */ 131c4762a1bSJed Brown ierr = TSSetIJacobian(ts,A,A,IJacobianMatFree,&appctx);CHKERRQ(ierr); 132c4762a1bSJed Brown 133c4762a1bSJed Brown /* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - 134c4762a1bSJed Brown Set initial conditions 135c4762a1bSJed Brown - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */ 136c4762a1bSJed Brown ierr = InitialConditions(da,x);CHKERRQ(ierr); 137c4762a1bSJed Brown ierr = TSSetSolution(ts,x);CHKERRQ(ierr); 138c4762a1bSJed Brown 139c4762a1bSJed Brown /* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - 140c4762a1bSJed Brown Have the TS save its trajectory so that TSAdjointSolve() may be used 141c4762a1bSJed Brown and set solver options 142c4762a1bSJed Brown - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */ 143c4762a1bSJed Brown if (!forwardonly) { 144c4762a1bSJed Brown ierr = TSSetSaveTrajectory(ts);CHKERRQ(ierr); 145c4762a1bSJed Brown ierr = TSSetMaxTime(ts,200.0);CHKERRQ(ierr); 146c4762a1bSJed Brown ierr = TSSetTimeStep(ts,0.5);CHKERRQ(ierr); 147c4762a1bSJed Brown } else { 148c4762a1bSJed Brown ierr = TSSetMaxTime(ts,2000.0);CHKERRQ(ierr); 149c4762a1bSJed Brown ierr = TSSetTimeStep(ts,10);CHKERRQ(ierr); 150c4762a1bSJed Brown } 151c4762a1bSJed Brown ierr = TSSetExactFinalTime(ts,TS_EXACTFINALTIME_STEPOVER);CHKERRQ(ierr); 152c4762a1bSJed Brown ierr = TSSetFromOptions(ts);CHKERRQ(ierr); 153c4762a1bSJed Brown 154c4762a1bSJed Brown /* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - 155c4762a1bSJed Brown Solve ODE system 156c4762a1bSJed Brown - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */ 157c4762a1bSJed Brown ierr = TSSolve(ts,x);CHKERRQ(ierr); 158c4762a1bSJed Brown if (!forwardonly) { 159c4762a1bSJed Brown /* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - 160c4762a1bSJed Brown Start the Adjoint model 161c4762a1bSJed Brown - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */ 162c4762a1bSJed Brown ierr = VecDuplicate(x,&lambda[0]);CHKERRQ(ierr); 163c4762a1bSJed Brown /* Reset initial conditions for the adjoint integration */ 164c4762a1bSJed Brown ierr = InitializeLambda(da,lambda[0],0.5,0.5);CHKERRQ(ierr); 165c4762a1bSJed Brown ierr = TSSetCostGradients(ts,1,lambda,NULL);CHKERRQ(ierr); 166c4762a1bSJed Brown ierr = TSAdjointSolve(ts);CHKERRQ(ierr); 167c4762a1bSJed Brown ierr = VecDestroy(&lambda[0]);CHKERRQ(ierr); 168c4762a1bSJed Brown } 169c4762a1bSJed Brown 170c4762a1bSJed Brown /* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - 171c4762a1bSJed Brown Free work space. All PETSc objects should be destroyed when they 172c4762a1bSJed Brown are no longer needed. 173c4762a1bSJed Brown - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - */ 174c4762a1bSJed Brown ierr = DMRestoreLocalVector(da,&matctx.localX0);CHKERRQ(ierr); 175c4762a1bSJed Brown ierr = VecDestroy(&r);CHKERRQ(ierr); 176c4762a1bSJed Brown ierr = VecDestroy(&matctx.X);CHKERRQ(ierr); 177c4762a1bSJed Brown ierr = VecDestroy(&matctx.Xdot);CHKERRQ(ierr); 178c4762a1bSJed Brown ierr = MatDestroy(&A);CHKERRQ(ierr); 179c4762a1bSJed Brown ierr = VecDestroy(&x);CHKERRQ(ierr); 180c4762a1bSJed Brown ierr = TSDestroy(&ts);CHKERRQ(ierr); 181c4762a1bSJed Brown ierr = DMDestroy(&da);CHKERRQ(ierr); 182c4762a1bSJed Brown 183c4762a1bSJed Brown ierr = PetscFinalize(); 184c4762a1bSJed Brown return ierr; 185c4762a1bSJed Brown } 186c4762a1bSJed Brown 187c4762a1bSJed Brown PetscErrorCode InitialConditions(DM da,Vec U) 188c4762a1bSJed Brown { 189c4762a1bSJed Brown PetscErrorCode ierr; 190c4762a1bSJed Brown PetscInt i,j,xs,ys,xm,ym,Mx,My; 191c4762a1bSJed Brown Field **u; 192c4762a1bSJed Brown PetscReal hx,hy,x,y; 193c4762a1bSJed Brown 194c4762a1bSJed Brown PetscFunctionBegin; 195c4762a1bSJed Brown ierr = DMDAGetInfo(da,PETSC_IGNORE,&Mx,&My,PETSC_IGNORE,PETSC_IGNORE,PETSC_IGNORE,PETSC_IGNORE,PETSC_IGNORE,PETSC_IGNORE,PETSC_IGNORE,PETSC_IGNORE,PETSC_IGNORE,PETSC_IGNORE);CHKERRQ(ierr); 196c4762a1bSJed Brown 197c4762a1bSJed Brown hx = 2.5/(PetscReal)Mx; 198c4762a1bSJed Brown hy = 2.5/(PetscReal)My; 199c4762a1bSJed Brown 200c4762a1bSJed Brown /* 201c4762a1bSJed Brown Get pointers to vector data 202c4762a1bSJed Brown */ 203c4762a1bSJed Brown ierr = DMDAVecGetArray(da,U,&u);CHKERRQ(ierr); 204c4762a1bSJed Brown 205c4762a1bSJed Brown /* 206c4762a1bSJed Brown Get local grid boundaries 207c4762a1bSJed Brown */ 208c4762a1bSJed Brown ierr = DMDAGetCorners(da,&xs,&ys,NULL,&xm,&ym,NULL);CHKERRQ(ierr); 209c4762a1bSJed Brown 210c4762a1bSJed Brown /* 211c4762a1bSJed Brown Compute function over the locally owned part of the grid 212c4762a1bSJed Brown */ 213c4762a1bSJed Brown for (j=ys; j<ys+ym; j++) { 214c4762a1bSJed Brown y = j*hy; 215c4762a1bSJed Brown for (i=xs; i<xs+xm; i++) { 216c4762a1bSJed Brown x = i*hx; 217*66baab88SBarry Smith if (PetscApproximateGTE(x,1.0) && PetscApproximateLTE(x,1.5) && PetscApproximateGTE(y,1.0) && PetscApproximateLTE(y,1.5)) u[j][i].v = PetscPowReal(PetscSinReal(4.0*PETSC_PI*x),2.0)*PetscPowReal(PetscSinReal(4.0*PETSC_PI*y),2.0)/4.0; 218c4762a1bSJed Brown else u[j][i].v = 0.0; 219c4762a1bSJed Brown 220c4762a1bSJed Brown u[j][i].u = 1.0 - 2.0*u[j][i].v; 221c4762a1bSJed Brown } 222c4762a1bSJed Brown } 223c4762a1bSJed Brown 224c4762a1bSJed Brown /* 225c4762a1bSJed Brown Restore vectors 226c4762a1bSJed Brown */ 227c4762a1bSJed Brown ierr = DMDAVecRestoreArray(da,U,&u);CHKERRQ(ierr); 228c4762a1bSJed Brown PetscFunctionReturn(0); 229c4762a1bSJed Brown } 230c4762a1bSJed Brown 231c4762a1bSJed Brown PetscErrorCode InitializeLambda(DM da,Vec lambda,PetscReal x,PetscReal y) 232c4762a1bSJed Brown { 233c4762a1bSJed Brown PetscInt i,j,Mx,My,xs,ys,xm,ym; 234c4762a1bSJed Brown PetscErrorCode ierr; 235c4762a1bSJed Brown Field **l; 236c4762a1bSJed Brown 237410585f6SHong Zhang PetscFunctionBegin; 238c4762a1bSJed Brown ierr = DMDAGetInfo(da,PETSC_IGNORE,&Mx,&My,PETSC_IGNORE,PETSC_IGNORE,PETSC_IGNORE,PETSC_IGNORE,PETSC_IGNORE,PETSC_IGNORE,PETSC_IGNORE,PETSC_IGNORE,PETSC_IGNORE,PETSC_IGNORE);CHKERRQ(ierr); 239c4762a1bSJed Brown /* locate the global i index for x and j index for y */ 240c4762a1bSJed Brown i = (PetscInt)(x*(Mx-1)); 241c4762a1bSJed Brown j = (PetscInt)(y*(My-1)); 242c4762a1bSJed Brown ierr = DMDAGetCorners(da,&xs,&ys,NULL,&xm,&ym,NULL);CHKERRQ(ierr); 243c4762a1bSJed Brown 244c4762a1bSJed Brown if (xs <= i && i < xs+xm && ys <= j && j < ys+ym) { 245c4762a1bSJed Brown /* the i,j vertex is on this process */ 246c4762a1bSJed Brown ierr = DMDAVecGetArray(da,lambda,&l);CHKERRQ(ierr); 247c4762a1bSJed Brown l[j][i].u = 1.0; 248c4762a1bSJed Brown l[j][i].v = 1.0; 249c4762a1bSJed Brown ierr = DMDAVecRestoreArray(da,lambda,&l);CHKERRQ(ierr); 250c4762a1bSJed Brown } 251c4762a1bSJed Brown PetscFunctionReturn(0); 252c4762a1bSJed Brown } 253c4762a1bSJed Brown 254c4762a1bSJed Brown PetscErrorCode IFunctionLocalPassive(DMDALocalInfo *info,PetscReal t,Field**u,Field**udot,Field**f,void *ptr) 255c4762a1bSJed Brown { 256c4762a1bSJed Brown AppCtx *appctx = (AppCtx*)ptr; 257c4762a1bSJed Brown PetscInt i,j,xs,ys,xm,ym; 258c4762a1bSJed Brown PetscReal hx,hy,sx,sy; 259c4762a1bSJed Brown PetscScalar uc,uxx,uyy,vc,vxx,vyy; 260c4762a1bSJed Brown PetscErrorCode ierr; 261c4762a1bSJed Brown 262c4762a1bSJed Brown PetscFunctionBegin; 263c4762a1bSJed Brown hx = 2.50/(PetscReal)(info->mx); sx = 1.0/(hx*hx); 264c4762a1bSJed Brown hy = 2.50/(PetscReal)(info->my); sy = 1.0/(hy*hy); 265c4762a1bSJed Brown 266c4762a1bSJed Brown /* Get local grid boundaries */ 267c4762a1bSJed Brown xs = info->xs; xm = info->xm; ys = info->ys; ym = info->ym; 268c4762a1bSJed Brown 269c4762a1bSJed Brown /* Compute function over the locally owned part of the grid */ 270c4762a1bSJed Brown for (j=ys; j<ys+ym; j++) { 271c4762a1bSJed Brown for (i=xs; i<xs+xm; i++) { 272c4762a1bSJed Brown uc = u[j][i].u; 273c4762a1bSJed Brown uxx = (-2.0*uc + u[j][i-1].u + u[j][i+1].u)*sx; 274c4762a1bSJed Brown uyy = (-2.0*uc + u[j-1][i].u + u[j+1][i].u)*sy; 275c4762a1bSJed Brown vc = u[j][i].v; 276c4762a1bSJed Brown vxx = (-2.0*vc + u[j][i-1].v + u[j][i+1].v)*sx; 277c4762a1bSJed Brown vyy = (-2.0*vc + u[j-1][i].v + u[j+1][i].v)*sy; 278c4762a1bSJed Brown f[j][i].u = udot[j][i].u - appctx->D1*(uxx + uyy) + uc*vc*vc - appctx->gamma*(1.0 - uc); 279c4762a1bSJed Brown f[j][i].v = udot[j][i].v - appctx->D2*(vxx + vyy) - uc*vc*vc + (appctx->gamma + appctx->kappa)*vc; 280c4762a1bSJed Brown } 281c4762a1bSJed Brown } 282ca0c957dSBarry Smith ierr = PetscLogFlops(16.0*xm*ym);CHKERRQ(ierr); 283c4762a1bSJed Brown PetscFunctionReturn(0); 284c4762a1bSJed Brown } 285c4762a1bSJed Brown 286c4762a1bSJed Brown PetscErrorCode IFunctionActive(TS ts,PetscReal ftime,Vec U,Vec Udot,Vec F,void *ptr) 287c4762a1bSJed Brown { 288c4762a1bSJed Brown PetscErrorCode ierr; 289c4762a1bSJed Brown AppCtx *appctx = (AppCtx*)ptr; 290c4762a1bSJed Brown DM da; 291c4762a1bSJed Brown DMDALocalInfo info; 292c4762a1bSJed Brown Field **u,**f,**udot; 293c4762a1bSJed Brown Vec localU; 294c4762a1bSJed Brown PetscInt i,j,xs,ys,xm,ym,gxs,gys,gxm,gym; 295c4762a1bSJed Brown PetscReal hx,hy,sx,sy; 296c4762a1bSJed Brown adouble uc,uxx,uyy,vc,vxx,vyy; 297c4762a1bSJed Brown AField **f_a,*f_c,**u_a,*u_c; 298c4762a1bSJed Brown PetscScalar dummy; 299c4762a1bSJed Brown 300c4762a1bSJed Brown PetscFunctionBegin; 301c4762a1bSJed Brown ierr = TSGetDM(ts,&da);CHKERRQ(ierr); 302c4762a1bSJed Brown ierr = DMDAGetLocalInfo(da,&info);CHKERRQ(ierr); 303c4762a1bSJed Brown ierr = DMGetLocalVector(da,&localU);CHKERRQ(ierr); 304c4762a1bSJed Brown hx = 2.50/(PetscReal)(info.mx); sx = 1.0/(hx*hx); 305c4762a1bSJed Brown hy = 2.50/(PetscReal)(info.my); sy = 1.0/(hy*hy); 306c4762a1bSJed Brown xs = info.xs; xm = info.xm; gxs = info.gxs; gxm = info.gxm; 307c4762a1bSJed Brown ys = info.ys; ym = info.ym; gys = info.gys; gym = info.gym; 308c4762a1bSJed Brown 309c4762a1bSJed Brown /* 310c4762a1bSJed Brown Scatter ghost points to local vector,using the 2-step process 311c4762a1bSJed Brown DMGlobalToLocalBegin(),DMGlobalToLocalEnd(). 312c4762a1bSJed Brown By placing code between these two statements, computations can be 313c4762a1bSJed Brown done while messages are in transition. 314c4762a1bSJed Brown */ 315c4762a1bSJed Brown ierr = DMGlobalToLocalBegin(da,U,INSERT_VALUES,localU);CHKERRQ(ierr); 316c4762a1bSJed Brown ierr = DMGlobalToLocalEnd(da,U,INSERT_VALUES,localU);CHKERRQ(ierr); 317c4762a1bSJed Brown 318c4762a1bSJed Brown /* 319c4762a1bSJed Brown Get pointers to vector data 320c4762a1bSJed Brown */ 321c4762a1bSJed Brown ierr = DMDAVecGetArrayRead(da,localU,&u);CHKERRQ(ierr); 322c4762a1bSJed Brown ierr = DMDAVecGetArray(da,F,&f);CHKERRQ(ierr); 323c4762a1bSJed Brown ierr = DMDAVecGetArrayRead(da,Udot,&udot);CHKERRQ(ierr); 324c4762a1bSJed Brown 325c4762a1bSJed Brown /* 326c4762a1bSJed Brown Create contiguous 1-arrays of AFields 327c4762a1bSJed Brown 328c4762a1bSJed Brown NOTE: Memory for ADOL-C active variables (such as adouble and AField) 329c4762a1bSJed Brown cannot be allocated using PetscMalloc, as this does not call the 330c4762a1bSJed Brown relevant class constructor. Instead, we use the C++ keyword `new`. 331c4762a1bSJed Brown */ 332c4762a1bSJed Brown u_c = new AField[info.gxm*info.gym]; 333c4762a1bSJed Brown f_c = new AField[info.gxm*info.gym]; 334c4762a1bSJed Brown 335c4762a1bSJed Brown /* Create corresponding 2-arrays of AFields */ 336c4762a1bSJed Brown u_a = new AField*[info.gym]; 337c4762a1bSJed Brown f_a = new AField*[info.gym]; 338c4762a1bSJed Brown 339c4762a1bSJed Brown /* Align indices between array types to endow 2d array with ghost points */ 340c4762a1bSJed Brown ierr = GiveGhostPoints(da,u_c,&u_a);CHKERRQ(ierr); 341c4762a1bSJed Brown ierr = GiveGhostPoints(da,f_c,&f_a);CHKERRQ(ierr); 342c4762a1bSJed Brown 343c4762a1bSJed Brown trace_on(1); /* Start of active section on tape 1 */ 344c4762a1bSJed Brown 345c4762a1bSJed Brown /* 346c4762a1bSJed Brown Mark independence 347c4762a1bSJed Brown 348c4762a1bSJed Brown NOTE: Ghost points are marked as independent, in place of the points they represent on 349c4762a1bSJed Brown other processors / on other boundaries. 350c4762a1bSJed Brown */ 351c4762a1bSJed Brown for (j=gys; j<gys+gym; j++) { 352c4762a1bSJed Brown for (i=gxs; i<gxs+gxm; i++) { 353c4762a1bSJed Brown u_a[j][i].u <<= u[j][i].u; 354c4762a1bSJed Brown u_a[j][i].v <<= u[j][i].v; 355c4762a1bSJed Brown } 356c4762a1bSJed Brown } 357c4762a1bSJed Brown 358c4762a1bSJed Brown /* Compute function over the locally owned part of the grid */ 359c4762a1bSJed Brown for (j=ys; j<ys+ym; j++) { 360c4762a1bSJed Brown for (i=xs; i<xs+xm; i++) { 361c4762a1bSJed Brown uc = u_a[j][i].u; 362c4762a1bSJed Brown uxx = (-2.0*uc + u_a[j][i-1].u + u_a[j][i+1].u)*sx; 363c4762a1bSJed Brown uyy = (-2.0*uc + u_a[j-1][i].u + u_a[j+1][i].u)*sy; 364c4762a1bSJed Brown vc = u_a[j][i].v; 365c4762a1bSJed Brown vxx = (-2.0*vc + u_a[j][i-1].v + u_a[j][i+1].v)*sx; 366c4762a1bSJed Brown vyy = (-2.0*vc + u_a[j-1][i].v + u_a[j+1][i].v)*sy; 367c4762a1bSJed Brown f_a[j][i].u = udot[j][i].u - appctx->D1*(uxx + uyy) + uc*vc*vc - appctx->gamma*(1.0 - uc); 368c4762a1bSJed Brown f_a[j][i].v = udot[j][i].v - appctx->D2*(vxx + vyy) - uc*vc*vc + (appctx->gamma + appctx->kappa)*vc; 369c4762a1bSJed Brown } 370c4762a1bSJed Brown } 371c4762a1bSJed Brown 372c4762a1bSJed Brown /* 373c4762a1bSJed Brown Mark dependence 374c4762a1bSJed Brown 375c4762a1bSJed Brown NOTE: Marking dependence of dummy variables makes the index notation much simpler when forming 376c4762a1bSJed Brown the Jacobian later. 377c4762a1bSJed Brown */ 378c4762a1bSJed Brown for (j=gys; j<gys+gym; j++) { 379c4762a1bSJed Brown for (i=gxs; i<gxs+gxm; i++) { 380c4762a1bSJed Brown if ((i < xs) || (i >= xs+xm) || (j < ys) || (j >= ys+ym)) { 381c4762a1bSJed Brown f_a[j][i].u >>= dummy; 382c4762a1bSJed Brown f_a[j][i].v >>= dummy; 383c4762a1bSJed Brown } else { 384c4762a1bSJed Brown f_a[j][i].u >>= f[j][i].u; 385c4762a1bSJed Brown f_a[j][i].v >>= f[j][i].v; 386c4762a1bSJed Brown } 387c4762a1bSJed Brown } 388c4762a1bSJed Brown } 389c4762a1bSJed Brown trace_off(); /* End of active section */ 390ca0c957dSBarry Smith ierr = PetscLogFlops(16.0*xm*ym);CHKERRQ(ierr); 391c4762a1bSJed Brown 392c4762a1bSJed Brown /* Restore vectors */ 393c4762a1bSJed Brown ierr = DMDAVecRestoreArray(da,F,&f);CHKERRQ(ierr); 394c4762a1bSJed Brown ierr = DMDAVecRestoreArrayRead(da,localU,&u);CHKERRQ(ierr); 395c4762a1bSJed Brown ierr = DMDAVecRestoreArrayRead(da,Udot,&udot);CHKERRQ(ierr); 396c4762a1bSJed Brown 397410585f6SHong Zhang ierr = DMRestoreLocalVector(da,&localU);CHKERRQ(ierr); 398410585f6SHong Zhang 399c4762a1bSJed Brown /* Destroy AFields appropriately */ 400c4762a1bSJed Brown f_a += info.gys; 401c4762a1bSJed Brown u_a += info.gys; 402c4762a1bSJed Brown delete[] f_a; 403c4762a1bSJed Brown delete[] u_a; 404c4762a1bSJed Brown delete[] f_c; 405c4762a1bSJed Brown delete[] u_c; 406c4762a1bSJed Brown PetscFunctionReturn(0); 407c4762a1bSJed Brown } 408c4762a1bSJed Brown 409c4762a1bSJed Brown /* 410c4762a1bSJed Brown Simply acts to pass TS information to the AdolcMatCtx 411c4762a1bSJed Brown */ 412c4762a1bSJed Brown PetscErrorCode IJacobianMatFree(TS ts,PetscReal t,Vec X,Vec Xdot,PetscReal a,Mat A_shell,Mat B,void *ctx) 413c4762a1bSJed Brown { 414c4762a1bSJed Brown AdolcMatCtx *mctx; 415c4762a1bSJed Brown PetscErrorCode ierr; 416c4762a1bSJed Brown DM da; 417c4762a1bSJed Brown 418c4762a1bSJed Brown PetscFunctionBeginUser; 4193ec1f749SStefano Zampini ierr = MatShellGetContext(A_shell,&mctx);CHKERRQ(ierr); 420c4762a1bSJed Brown 421c4762a1bSJed Brown mctx->time = t; 422c4762a1bSJed Brown mctx->shift = a; 423c4762a1bSJed Brown if (mctx->ts != ts) mctx->ts = ts; 424c4762a1bSJed Brown ierr = VecCopy(X,mctx->X);CHKERRQ(ierr); 425c4762a1bSJed Brown ierr = VecCopy(Xdot,mctx->Xdot);CHKERRQ(ierr); 426c4762a1bSJed Brown ierr = TSGetDM(ts,&da);CHKERRQ(ierr); 427c4762a1bSJed Brown ierr = DMGlobalToLocalBegin(da,mctx->X,INSERT_VALUES,mctx->localX0);CHKERRQ(ierr); 428c4762a1bSJed Brown ierr = DMGlobalToLocalEnd(da,mctx->X,INSERT_VALUES,mctx->localX0);CHKERRQ(ierr); 429c4762a1bSJed Brown PetscFunctionReturn(0); 430c4762a1bSJed Brown } 431c4762a1bSJed Brown 432c4762a1bSJed Brown /*TEST 433c4762a1bSJed Brown 434c4762a1bSJed Brown build: 435c4762a1bSJed Brown requires: double !complex adolc 436c4762a1bSJed Brown 437c4762a1bSJed Brown test: 438c4762a1bSJed Brown suffix: 1 439c4762a1bSJed Brown args: -ts_max_steps 1 -da_grid_x 12 -da_grid_y 12 -snes_test_jacobian 440c4762a1bSJed Brown output_file: output/adr_ex5adj_mf_1.out 441c4762a1bSJed Brown 442c4762a1bSJed Brown test: 443c4762a1bSJed Brown suffix: 2 444c4762a1bSJed Brown nsize: 4 445c4762a1bSJed Brown args: -ts_max_steps 10 -da_grid_x 12 -da_grid_y 12 -ts_monitor -ts_adjoint_monitor 446c4762a1bSJed Brown output_file: output/adr_ex5adj_mf_2.out 447c4762a1bSJed Brown 448c4762a1bSJed Brown TEST*/ 449