xref: /petsc/src/dm/impls/da/da2.c (revision 76a8abe0e2b3324ea6e141c3dc7c9c387c682989)
19a42bb27SBarry Smith 
2af0996ceSBarry Smith #include <petsc/private/dmdaimpl.h>    /*I   "petscdmda.h"   I*/
39804daf3SBarry Smith #include <petscdraw.h>
447c6ae99SBarry Smith 
5e0877f53SBarry Smith static PetscErrorCode DMView_DA_2d(DM da,PetscViewer viewer)
647c6ae99SBarry Smith {
747c6ae99SBarry Smith   PetscErrorCode ierr;
847c6ae99SBarry Smith   PetscMPIInt    rank;
9c9493c35SStefano Zampini   PetscBool      iascii,isdraw,isglvis,isbinary;
1047c6ae99SBarry Smith   DM_DA          *dd = (DM_DA*)da->data;
119a42bb27SBarry Smith #if defined(PETSC_HAVE_MATLAB_ENGINE)
129a42bb27SBarry Smith   PetscBool ismatlab;
139a42bb27SBarry Smith #endif
1447c6ae99SBarry Smith 
1547c6ae99SBarry Smith   PetscFunctionBegin;
16ce94432eSBarry Smith   ierr = MPI_Comm_rank(PetscObjectComm((PetscObject)da),&rank);CHKERRQ(ierr);
1747c6ae99SBarry Smith 
18251f4c67SDmitry Karpeev   ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii);CHKERRQ(ierr);
19251f4c67SDmitry Karpeev   ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERDRAW,&isdraw);CHKERRQ(ierr);
20c9493c35SStefano Zampini   ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERGLVIS,&isglvis);CHKERRQ(ierr);
21251f4c67SDmitry Karpeev   ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERBINARY,&isbinary);CHKERRQ(ierr);
229a42bb27SBarry Smith #if defined(PETSC_HAVE_MATLAB_ENGINE)
23251f4c67SDmitry Karpeev   ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERMATLAB,&ismatlab);CHKERRQ(ierr);
249a42bb27SBarry Smith #endif
2547c6ae99SBarry Smith   if (iascii) {
2647c6ae99SBarry Smith     PetscViewerFormat format;
2747c6ae99SBarry Smith 
2847c6ae99SBarry Smith     ierr = PetscViewerGetFormat(viewer, &format);CHKERRQ(ierr);
29*76a8abe0SBarry Smith     if (format == PETSC_VIEWER_LOAD_BALANCE) {
30*76a8abe0SBarry Smith       PetscInt      i,nmax = 0,nmin = PETSC_MAX_INT,navg = 0,*nz,nzlocal;
31*76a8abe0SBarry Smith       DMDALocalInfo info;
32*76a8abe0SBarry Smith       PetscMPIInt   size;
33*76a8abe0SBarry Smith       ierr = MPI_Comm_size(PetscObjectComm((PetscObject)da),&size);CHKERRQ(ierr);
34*76a8abe0SBarry Smith       ierr = DMDAGetLocalInfo(da,&info);CHKERRQ(ierr);
35*76a8abe0SBarry Smith       nzlocal = info.xm*info.ym;
36*76a8abe0SBarry Smith       ierr = PetscMalloc1(size,&nz);CHKERRQ(ierr);
37*76a8abe0SBarry Smith       ierr = MPI_Allgather(&nzlocal,1,MPIU_INT,nz,1,MPIU_INT,PetscObjectComm((PetscObject)da));CHKERRQ(ierr);
38*76a8abe0SBarry Smith       for (i=0; i<(PetscInt)size; i++) {
39*76a8abe0SBarry Smith         nmax = PetscMax(nmax,nz[i]);
40*76a8abe0SBarry Smith         nmin = PetscMin(nmin,nz[i]);
41*76a8abe0SBarry Smith         navg += nz[i];
42*76a8abe0SBarry Smith       }
43*76a8abe0SBarry Smith       ierr = PetscFree(nz);CHKERRQ(ierr);
44*76a8abe0SBarry Smith       navg = navg/size;
45*76a8abe0SBarry Smith       ierr = PetscViewerASCIIPrintf(viewer,"  Load Balance - Grid Points: Min %D  avg %D  max %D\n",nmin,navg,nmax);CHKERRQ(ierr);
46*76a8abe0SBarry Smith       PetscFunctionReturn(0);
47*76a8abe0SBarry Smith     }
488135c375SStefano Zampini     if (format != PETSC_VIEWER_ASCII_VTK && format != PETSC_VIEWER_ASCII_VTK_CELL && format != PETSC_VIEWER_ASCII_GLVIS) {
49aa219208SBarry Smith       DMDALocalInfo info;
50aa219208SBarry Smith       ierr = DMDAGetLocalInfo(da,&info);CHKERRQ(ierr);
511575c14dSBarry Smith       ierr = PetscViewerASCIIPushSynchronized(viewer);CHKERRQ(ierr);
5247c6ae99SBarry Smith       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Processor [%d] M %D N %D m %D n %D w %D s %D\n",rank,dd->M,dd->N,dd->m,dd->n,dd->w,dd->s);CHKERRQ(ierr);
5347c6ae99SBarry Smith       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"X range of indices: %D %D, Y range of indices: %D %D\n",info.xs,info.xs+info.xm,info.ys,info.ys+info.ym);CHKERRQ(ierr);
5447c6ae99SBarry Smith       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
551575c14dSBarry Smith       ierr = PetscViewerASCIIPopSynchronized(viewer);CHKERRQ(ierr);
568135c375SStefano Zampini     } else if (format == PETSC_VIEWER_ASCII_GLVIS) {
578135c375SStefano Zampini       ierr = DMView_DA_GLVis(da,viewer);CHKERRQ(ierr);
583da9ae13SJed Brown     } else {
593da9ae13SJed Brown       ierr = DMView_DA_VTK(da,viewer);CHKERRQ(ierr);
6047c6ae99SBarry Smith     }
6147c6ae99SBarry Smith   } else if (isdraw) {
6247c6ae99SBarry Smith     PetscDraw      draw;
6347c6ae99SBarry Smith     double         ymin = -1*dd->s-1,ymax = dd->N+dd->s;
6447c6ae99SBarry Smith     double         xmin = -1*dd->s-1,xmax = dd->M+dd->s;
6547c6ae99SBarry Smith     double         x,y;
668ea3bf28SBarry Smith     PetscInt       base;
678ea3bf28SBarry Smith     const PetscInt *idx;
6847c6ae99SBarry Smith     char           node[10];
6947c6ae99SBarry Smith     PetscBool      isnull;
7047c6ae99SBarry Smith 
7147c6ae99SBarry Smith     ierr = PetscViewerDrawGetDraw(viewer,0,&draw);CHKERRQ(ierr);
725b399a63SLisandro Dalcin     ierr = PetscDrawIsNull(draw,&isnull);CHKERRQ(ierr);
735b399a63SLisandro Dalcin     if (isnull) PetscFunctionReturn(0);
7447c6ae99SBarry Smith 
755b399a63SLisandro Dalcin     ierr = PetscDrawCheckResizedWindow(draw);CHKERRQ(ierr);
765b399a63SLisandro Dalcin     ierr = PetscDrawClear(draw);CHKERRQ(ierr);
775b399a63SLisandro Dalcin     ierr = PetscDrawSetCoordinates(draw,xmin,ymin,xmax,ymax);CHKERRQ(ierr);
785b399a63SLisandro Dalcin 
795b399a63SLisandro Dalcin     ierr = PetscDrawCollectiveBegin(draw);CHKERRQ(ierr);
8047c6ae99SBarry Smith     /* first processor draw all node lines */
8147c6ae99SBarry Smith     if (!rank) {
8247c6ae99SBarry Smith       ymin = 0.0; ymax = dd->N - 1;
8347c6ae99SBarry Smith       for (xmin=0; xmin<dd->M; xmin++) {
8447c6ae99SBarry Smith         ierr = PetscDrawLine(draw,xmin,ymin,xmin,ymax,PETSC_DRAW_BLACK);CHKERRQ(ierr);
8547c6ae99SBarry Smith       }
8647c6ae99SBarry Smith       xmin = 0.0; xmax = dd->M - 1;
8747c6ae99SBarry Smith       for (ymin=0; ymin<dd->N; ymin++) {
8847c6ae99SBarry Smith         ierr = PetscDrawLine(draw,xmin,ymin,xmax,ymin,PETSC_DRAW_BLACK);CHKERRQ(ierr);
8947c6ae99SBarry Smith       }
9047c6ae99SBarry Smith     }
915b399a63SLisandro Dalcin     ierr = PetscDrawCollectiveEnd(draw);CHKERRQ(ierr);
925b399a63SLisandro Dalcin     ierr = PetscDrawFlush(draw);CHKERRQ(ierr);
9347c6ae99SBarry Smith     ierr = PetscDrawPause(draw);CHKERRQ(ierr);
9447c6ae99SBarry Smith 
955b399a63SLisandro Dalcin     ierr = PetscDrawCollectiveBegin(draw);CHKERRQ(ierr);
9647c6ae99SBarry Smith     /* draw my box */
975b399a63SLisandro Dalcin     xmin = dd->xs/dd->w; xmax =(dd->xe-1)/dd->w; ymin = dd->ys; ymax = dd->ye - 1;
9847c6ae99SBarry Smith     ierr = PetscDrawLine(draw,xmin,ymin,xmax,ymin,PETSC_DRAW_RED);CHKERRQ(ierr);
9947c6ae99SBarry Smith     ierr = PetscDrawLine(draw,xmin,ymin,xmin,ymax,PETSC_DRAW_RED);CHKERRQ(ierr);
10047c6ae99SBarry Smith     ierr = PetscDrawLine(draw,xmin,ymax,xmax,ymax,PETSC_DRAW_RED);CHKERRQ(ierr);
10147c6ae99SBarry Smith     ierr = PetscDrawLine(draw,xmax,ymin,xmax,ymax,PETSC_DRAW_RED);CHKERRQ(ierr);
10247c6ae99SBarry Smith     /* put in numbers */
10347c6ae99SBarry Smith     base = (dd->base)/dd->w;
10447c6ae99SBarry Smith     for (y=ymin; y<=ymax; y++) {
10547c6ae99SBarry Smith       for (x=xmin; x<=xmax; x++) {
1065b399a63SLisandro Dalcin         ierr = PetscSNPrintf(node,sizeof(node),"%d",(int)base++);CHKERRQ(ierr);
10747c6ae99SBarry Smith         ierr = PetscDrawString(draw,x,y,PETSC_DRAW_BLACK,node);CHKERRQ(ierr);
10847c6ae99SBarry Smith       }
10947c6ae99SBarry Smith     }
1105b399a63SLisandro Dalcin     ierr = PetscDrawCollectiveEnd(draw);CHKERRQ(ierr);
1115b399a63SLisandro Dalcin     ierr = PetscDrawFlush(draw);CHKERRQ(ierr);
11247c6ae99SBarry Smith     ierr = PetscDrawPause(draw);CHKERRQ(ierr);
11347c6ae99SBarry Smith 
1145b399a63SLisandro Dalcin     ierr = PetscDrawCollectiveBegin(draw);CHKERRQ(ierr);
1155b399a63SLisandro Dalcin     /* overlay ghost numbers, useful for error checking */
11645b6f7e9SBarry Smith     ierr = ISLocalToGlobalMappingGetBlockIndices(da->ltogmap,&idx);CHKERRQ(ierr);
1175b399a63SLisandro Dalcin     base = 0; xmin = dd->Xs; xmax = dd->Xe; ymin = dd->Ys; ymax = dd->Ye;
11847c6ae99SBarry Smith     for (y=ymin; y<ymax; y++) {
11947c6ae99SBarry Smith       for (x=xmin; x<xmax; x++) {
12047c6ae99SBarry Smith         if ((base % dd->w) == 0) {
1215b399a63SLisandro Dalcin           ierr = PetscSNPrintf(node,sizeof(node),"%d",(int)(idx[base/dd->w]));CHKERRQ(ierr);
12247c6ae99SBarry Smith           ierr = PetscDrawString(draw,x/dd->w,y,PETSC_DRAW_BLUE,node);CHKERRQ(ierr);
12347c6ae99SBarry Smith         }
12447c6ae99SBarry Smith         base++;
12547c6ae99SBarry Smith       }
12647c6ae99SBarry Smith     }
127302440fdSBarry Smith     ierr = ISLocalToGlobalMappingRestoreBlockIndices(da->ltogmap,&idx);CHKERRQ(ierr);
1285b399a63SLisandro Dalcin     ierr = PetscDrawCollectiveEnd(draw);CHKERRQ(ierr);
1295b399a63SLisandro Dalcin     ierr = PetscDrawFlush(draw);CHKERRQ(ierr);
13047c6ae99SBarry Smith     ierr = PetscDrawPause(draw);CHKERRQ(ierr);
131832b7cebSLisandro Dalcin     ierr = PetscDrawSave(draw);CHKERRQ(ierr);
132c9493c35SStefano Zampini   } else if (isglvis) {
133c9493c35SStefano Zampini     ierr = DMView_DA_GLVis(da,viewer);CHKERRQ(ierr);
1349a42bb27SBarry Smith   } else if (isbinary) {
1359a42bb27SBarry Smith     ierr = DMView_DA_Binary(da,viewer);CHKERRQ(ierr);
1369a42bb27SBarry Smith #if defined(PETSC_HAVE_MATLAB_ENGINE)
1379a42bb27SBarry Smith   } else if (ismatlab) {
1389a42bb27SBarry Smith     ierr = DMView_DA_Matlab(da,viewer);CHKERRQ(ierr);
1399a42bb27SBarry Smith #endif
14011aeaf0aSBarry Smith   }
14147c6ae99SBarry Smith   PetscFunctionReturn(0);
14247c6ae99SBarry Smith }
14347c6ae99SBarry Smith 
14447c6ae99SBarry Smith /*
14547c6ae99SBarry Smith       M is number of grid points
14647c6ae99SBarry Smith       m is number of processors
14747c6ae99SBarry Smith 
14847c6ae99SBarry Smith */
1497087cfbeSBarry Smith PetscErrorCode  DMDASplitComm2d(MPI_Comm comm,PetscInt M,PetscInt N,PetscInt sw,MPI_Comm *outcomm)
15047c6ae99SBarry Smith {
15147c6ae99SBarry Smith   PetscErrorCode ierr;
15247c6ae99SBarry Smith   PetscInt       m,n = 0,x = 0,y = 0;
15347c6ae99SBarry Smith   PetscMPIInt    size,csize,rank;
15447c6ae99SBarry Smith 
15547c6ae99SBarry Smith   PetscFunctionBegin;
15647c6ae99SBarry Smith   ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr);
15747c6ae99SBarry Smith   ierr = MPI_Comm_rank(comm,&rank);CHKERRQ(ierr);
15847c6ae99SBarry Smith 
15947c6ae99SBarry Smith   csize = 4*size;
16047c6ae99SBarry Smith   do {
16147c6ae99SBarry Smith     if (csize % 4) SETERRQ4(PETSC_COMM_SELF,PETSC_ERR_ARG_INCOMP,"Cannot split communicator of size %d tried %d %D %D",size,csize,x,y);
16247c6ae99SBarry Smith     csize = csize/4;
16347c6ae99SBarry Smith 
164369cc0aeSBarry Smith     m = (PetscInt)(0.5 + PetscSqrtReal(((PetscReal)M)*((PetscReal)csize)/((PetscReal)N)));
16547c6ae99SBarry Smith     if (!m) m = 1;
16647c6ae99SBarry Smith     while (m > 0) {
16747c6ae99SBarry Smith       n = csize/m;
16847c6ae99SBarry Smith       if (m*n == csize) break;
16947c6ae99SBarry Smith       m--;
17047c6ae99SBarry Smith     }
17147c6ae99SBarry Smith     if (M > N && m < n) {PetscInt _m = m; m = n; n = _m;}
17247c6ae99SBarry Smith 
17347c6ae99SBarry Smith     x = M/m + ((M % m) > ((csize-1) % m));
17447c6ae99SBarry Smith     y = (N + (csize-1)/m)/n;
17547c6ae99SBarry Smith   } while ((x < 4 || y < 4) && csize > 1);
17647c6ae99SBarry Smith   if (size != csize) {
17747c6ae99SBarry Smith     MPI_Group   entire_group,sub_group;
17847c6ae99SBarry Smith     PetscMPIInt i,*groupies;
17947c6ae99SBarry Smith 
18047c6ae99SBarry Smith     ierr = MPI_Comm_group(comm,&entire_group);CHKERRQ(ierr);
181785e854fSJed Brown     ierr = PetscMalloc1(csize,&groupies);CHKERRQ(ierr);
18247c6ae99SBarry Smith     for (i=0; i<csize; i++) {
18347c6ae99SBarry Smith       groupies[i] = (rank/csize)*csize + i;
18447c6ae99SBarry Smith     }
18547c6ae99SBarry Smith     ierr = MPI_Group_incl(entire_group,csize,groupies,&sub_group);CHKERRQ(ierr);
18647c6ae99SBarry Smith     ierr = PetscFree(groupies);CHKERRQ(ierr);
18747c6ae99SBarry Smith     ierr = MPI_Comm_create(comm,sub_group,outcomm);CHKERRQ(ierr);
18847c6ae99SBarry Smith     ierr = MPI_Group_free(&entire_group);CHKERRQ(ierr);
18947c6ae99SBarry Smith     ierr = MPI_Group_free(&sub_group);CHKERRQ(ierr);
190aa219208SBarry Smith     ierr = PetscInfo1(0,"DMDASplitComm2d:Creating redundant coarse problems of size %d\n",csize);CHKERRQ(ierr);
19147c6ae99SBarry Smith   } else {
19247c6ae99SBarry Smith     *outcomm = comm;
19347c6ae99SBarry Smith   }
19447c6ae99SBarry Smith   PetscFunctionReturn(0);
19547c6ae99SBarry Smith }
19647c6ae99SBarry Smith 
#if defined(new)
/*
  DMDAGetDiagonal_MFFD - Gets the diagonal for a matrix free matrix where local
    function lives on a DMDA

        y ~= (F(u + ha) - F(u))/h,
  where F = nonlinear function, as set by SNESSetFunction()
        u = current iterate
        h = difference interval

  NOTE(review): this routine is compiled only when the macro `new` is defined. As written it
  uses ctx, i and w, none of which are declared in this function, and it reads gI before any
  value is assigned to it; stencil and info are declared but never used. It looks like an
  unfinished sketch -- confirm before enabling it.
*/
PetscErrorCode DMDAGetDiagonal_MFFD(DM da,Vec U,Vec a)
{
  PetscErrorCode ierr;
  MatStencil     stencil;
  DMDALocalInfo  info;
  PetscReal      epsilon = PETSC_SQRT_MACHINE_EPSILON;
  PetscReal      umin    = 100.0*PETSC_SQRT_MACHINE_EPSILON;
  PetscScalar    *ww,*aa;
  PetscScalar    h,v;
  PetscInt       gI,nI = 0;

  PetscFunctionBegin;
  /* evaluate the base function into a and register U as the base point */
  ierr = (*ctx->func)(0,U,a,ctx->funcctx);CHKERRQ(ierr);
  ierr = (*ctx->funcisetbase)(U,ctx->funcctx);CHKERRQ(ierr);

  ierr = VecGetArray(U,&ww);CHKERRQ(ierr);
  ierr = VecGetArray(a,&aa);CHKERRQ(ierr);

  /* pick the differencing step from the current entry, keeping its magnitude at least umin */
  h = ww[gI];
  if (h == 0.0) h = 1.0;
  if (PetscAbsScalar(h) < umin && PetscRealPart(h) >= 0.0) {
    h = umin;
  } else if (PetscRealPart(h) < 0.0 && PetscAbsScalar(h) < umin) {
    h = -umin;
  }
  h *= epsilon;

  /* perturb one entry, evaluate that component, form the difference quotient, then undo the perturbation */
  ww[gI] += h;
  ierr    = (*ctx->funci)(i,w,&v,ctx->funcctx);CHKERRQ(ierr);
  aa[nI]  = (v - aa[nI])/h;
  ww[gI] -= h;
  nI++;

  ierr = VecRestoreArray(U,&ww);CHKERRQ(ierr);
  ierr = VecRestoreArray(a,&aa);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}
#endif
24147c6ae99SBarry Smith 
2427087cfbeSBarry Smith PetscErrorCode  DMSetUp_DA_2D(DM da)
24347c6ae99SBarry Smith {
24447c6ae99SBarry Smith   DM_DA            *dd = (DM_DA*)da->data;
24547c6ae99SBarry Smith   const PetscInt   M            = dd->M;
24647c6ae99SBarry Smith   const PetscInt   N            = dd->N;
24747c6ae99SBarry Smith   PetscInt         m            = dd->m;
24847c6ae99SBarry Smith   PetscInt         n            = dd->n;
24947c6ae99SBarry Smith   const PetscInt   dof          = dd->w;
25047c6ae99SBarry Smith   const PetscInt   s            = dd->s;
251bff4a2f0SMatthew G. Knepley   DMBoundaryType   bx           = dd->bx;
252bff4a2f0SMatthew G. Knepley   DMBoundaryType   by           = dd->by;
25319fd82e9SBarry Smith   DMDAStencilType  stencil_type = dd->stencil_type;
25447c6ae99SBarry Smith   PetscInt         *lx          = dd->lx;
25547c6ae99SBarry Smith   PetscInt         *ly          = dd->ly;
25647c6ae99SBarry Smith   MPI_Comm         comm;
25747c6ae99SBarry Smith   PetscMPIInt      rank,size;
258bd1fc5aeSBarry Smith   PetscInt         xs,xe,ys,ye,x,y,Xs,Xe,Ys,Ye,IXs,IXe,IYs,IYe;
2598ea3bf28SBarry Smith   PetscInt         up,down,left,right,i,n0,n1,n2,n3,n5,n6,n7,n8,*idx,nn;
260db87c5ecSEthan Coon   PetscInt         xbase,*bases,*ldims,j,x_t,y_t,s_t,base,count;
26147c6ae99SBarry Smith   PetscInt         s_x,s_y; /* s proportionalized to w */
26247c6ae99SBarry Smith   PetscInt         sn0 = 0,sn2 = 0,sn6 = 0,sn8 = 0;
26347c6ae99SBarry Smith   Vec              local,global;
264bd1fc5aeSBarry Smith   VecScatter       gtol;
26545b6f7e9SBarry Smith   IS               to,from;
26647c6ae99SBarry Smith   PetscErrorCode   ierr;
26747c6ae99SBarry Smith 
26847c6ae99SBarry Smith   PetscFunctionBegin;
269bff4a2f0SMatthew G. Knepley   if (stencil_type == DMDA_STENCIL_BOX && (bx == DM_BOUNDARY_MIRROR || by == DM_BOUNDARY_MIRROR)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"Mirror boundary and box stencil");
27047c6ae99SBarry Smith   ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr);
2713855c12bSBarry Smith #if !defined(PETSC_USE_64BIT_INDICES)
272bafee8b4SSatish Balay   if (((PetscInt64) M)*((PetscInt64) N)*((PetscInt64) dof) > (PetscInt64) PETSC_MPI_INT_MAX) SETERRQ3(comm,PETSC_ERR_INT_OVERFLOW,"Mesh of %D by %D by %D (dof) is too large for 32 bit indices",M,N,dof);
2733855c12bSBarry Smith #endif
27447c6ae99SBarry Smith 
27547c6ae99SBarry Smith   if (dof < 1) SETERRQ1(comm,PETSC_ERR_ARG_OUTOFRANGE,"Must have 1 or more degrees of freedom per node: %D",dof);
27647c6ae99SBarry Smith   if (s < 0) SETERRQ1(comm,PETSC_ERR_ARG_OUTOFRANGE,"Stencil width cannot be negative: %D",s);
27747c6ae99SBarry Smith 
27847c6ae99SBarry Smith   ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr);
27947c6ae99SBarry Smith   ierr = MPI_Comm_rank(comm,&rank);CHKERRQ(ierr);
28047c6ae99SBarry Smith 
2817d310018SBarry Smith   dd->p = 1;
28247c6ae99SBarry Smith   if (m != PETSC_DECIDE) {
28347c6ae99SBarry Smith     if (m < 1) SETERRQ1(comm,PETSC_ERR_ARG_OUTOFRANGE,"Non-positive number of processors in X direction: %D",m);
28447c6ae99SBarry Smith     else if (m > size) SETERRQ2(comm,PETSC_ERR_ARG_OUTOFRANGE,"Too many processors in X direction: %D %d",m,size);
28547c6ae99SBarry Smith   }
28647c6ae99SBarry Smith   if (n != PETSC_DECIDE) {
28747c6ae99SBarry Smith     if (n < 1) SETERRQ1(comm,PETSC_ERR_ARG_OUTOFRANGE,"Non-positive number of processors in Y direction: %D",n);
28847c6ae99SBarry Smith     else if (n > size) SETERRQ2(comm,PETSC_ERR_ARG_OUTOFRANGE,"Too many processors in Y direction: %D %d",n,size);
28947c6ae99SBarry Smith   }
29047c6ae99SBarry Smith 
29147c6ae99SBarry Smith   if (m == PETSC_DECIDE || n == PETSC_DECIDE) {
29247c6ae99SBarry Smith     if (n != PETSC_DECIDE) {
29347c6ae99SBarry Smith       m = size/n;
29447c6ae99SBarry Smith     } else if (m != PETSC_DECIDE) {
29547c6ae99SBarry Smith       n = size/m;
29647c6ae99SBarry Smith     } else {
29747c6ae99SBarry Smith       /* try for squarish distribution */
298369cc0aeSBarry Smith       m = (PetscInt)(0.5 + PetscSqrtReal(((PetscReal)M)*((PetscReal)size)/((PetscReal)N)));
29947c6ae99SBarry Smith       if (!m) m = 1;
30047c6ae99SBarry Smith       while (m > 0) {
30147c6ae99SBarry Smith         n = size/m;
30247c6ae99SBarry Smith         if (m*n == size) break;
30347c6ae99SBarry Smith         m--;
30447c6ae99SBarry Smith       }
30547c6ae99SBarry Smith       if (M > N && m < n) {PetscInt _m = m; m = n; n = _m;}
30647c6ae99SBarry Smith     }
30747c6ae99SBarry Smith     if (m*n != size) SETERRQ(comm,PETSC_ERR_PLIB,"Unable to create partition, check the size of the communicator and input m and n ");
30847c6ae99SBarry Smith   } else if (m*n != size) SETERRQ(comm,PETSC_ERR_ARG_OUTOFRANGE,"Given Bad partition");
30947c6ae99SBarry Smith 
31047c6ae99SBarry Smith   if (M < m) SETERRQ2(comm,PETSC_ERR_ARG_OUTOFRANGE,"Partition in x direction is too fine! %D %D",M,m);
31147c6ae99SBarry Smith   if (N < n) SETERRQ2(comm,PETSC_ERR_ARG_OUTOFRANGE,"Partition in y direction is too fine! %D %D",N,n);
31247c6ae99SBarry Smith 
31347c6ae99SBarry Smith   /*
31447c6ae99SBarry Smith      Determine locally owned region
31547c6ae99SBarry Smith      xs is the first local node number, x is the number of local nodes
31647c6ae99SBarry Smith   */
31747c6ae99SBarry Smith   if (!lx) {
318785e854fSJed Brown     ierr = PetscMalloc1(m, &dd->lx);CHKERRQ(ierr);
31947c6ae99SBarry Smith     lx   = dd->lx;
32047c6ae99SBarry Smith     for (i=0; i<m; i++) {
32147c6ae99SBarry Smith       lx[i] = M/m + ((M % m) > i);
32247c6ae99SBarry Smith     }
32347c6ae99SBarry Smith   }
32447c6ae99SBarry Smith   x  = lx[rank % m];
32547c6ae99SBarry Smith   xs = 0;
32647c6ae99SBarry Smith   for (i=0; i<(rank % m); i++) {
32747c6ae99SBarry Smith     xs += lx[i];
32847c6ae99SBarry Smith   }
32947c6ae99SBarry Smith #if defined(PETSC_USE_DEBUG)
33047c6ae99SBarry Smith   left = xs;
33147c6ae99SBarry Smith   for (i=(rank % m); i<m; i++) {
33247c6ae99SBarry Smith     left += lx[i];
33347c6ae99SBarry Smith   }
33447c6ae99SBarry Smith   if (left != M) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Sum of lx across processors not equal to M: %D %D",left,M);
33547c6ae99SBarry Smith #endif
33647c6ae99SBarry Smith 
33747c6ae99SBarry Smith   /*
33847c6ae99SBarry Smith      Determine locally owned region
33947c6ae99SBarry Smith      ys is the first local node number, y is the number of local nodes
34047c6ae99SBarry Smith   */
34147c6ae99SBarry Smith   if (!ly) {
342785e854fSJed Brown     ierr = PetscMalloc1(n, &dd->ly);CHKERRQ(ierr);
34347c6ae99SBarry Smith     ly   = dd->ly;
34447c6ae99SBarry Smith     for (i=0; i<n; i++) {
34547c6ae99SBarry Smith       ly[i] = N/n + ((N % n) > i);
34647c6ae99SBarry Smith     }
34747c6ae99SBarry Smith   }
34847c6ae99SBarry Smith   y  = ly[rank/m];
34947c6ae99SBarry Smith   ys = 0;
35047c6ae99SBarry Smith   for (i=0; i<(rank/m); i++) {
35147c6ae99SBarry Smith     ys += ly[i];
35247c6ae99SBarry Smith   }
35347c6ae99SBarry Smith #if defined(PETSC_USE_DEBUG)
35447c6ae99SBarry Smith   left = ys;
35547c6ae99SBarry Smith   for (i=(rank/m); i<n; i++) {
35647c6ae99SBarry Smith     left += ly[i];
35747c6ae99SBarry Smith   }
35847c6ae99SBarry Smith   if (left != N) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Sum of ly across processors not equal to N: %D %D",left,N);
35947c6ae99SBarry Smith #endif
36047c6ae99SBarry Smith 
361bcea557cSEthan Coon   /*
362bcea557cSEthan Coon    check if the scatter requires more than one process neighbor or wraps around
363bcea557cSEthan Coon    the domain more than once
364bcea557cSEthan Coon   */
365bff4a2f0SMatthew G. Knepley   if ((x < s) && ((m > 1) || (bx == DM_BOUNDARY_PERIODIC))) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Local x-width of domain x %D is smaller than stencil width s %D",x,s);
366bff4a2f0SMatthew G. Knepley   if ((y < s) && ((n > 1) || (by == DM_BOUNDARY_PERIODIC))) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Local y-width of domain y %D is smaller than stencil width s %D",y,s);
36747c6ae99SBarry Smith   xe = xs + x;
36847c6ae99SBarry Smith   ye = ys + y;
36947c6ae99SBarry Smith 
370ce00eea3SSatish Balay   /* determine ghost region (Xs) and region scattered into (IXs)  */
371d9c9ebe5SPeter Brune   if (xs-s > 0) {
372d9c9ebe5SPeter Brune     Xs = xs - s; IXs = xs - s;
37388661749SPeter Brune   } else {
37488661749SPeter Brune     if (bx) {
37588661749SPeter Brune       Xs = xs - s;
37688661749SPeter Brune     } else {
37788661749SPeter Brune       Xs = 0;
37888661749SPeter Brune     }
37988661749SPeter Brune     IXs = 0;
38088661749SPeter Brune   }
381d9c9ebe5SPeter Brune   if (xe+s <= M) {
382d9c9ebe5SPeter Brune     Xe = xe + s; IXe = xe + s;
38388661749SPeter Brune   } else {
38488661749SPeter Brune     if (bx) {
385d9c9ebe5SPeter Brune       Xs = xs - s; Xe = xe + s;
38688661749SPeter Brune     } else {
38788661749SPeter Brune       Xe = M;
38888661749SPeter Brune     }
38988661749SPeter Brune     IXe = M;
39088661749SPeter Brune   }
39147c6ae99SBarry Smith 
392bff4a2f0SMatthew G. Knepley   if (bx == DM_BOUNDARY_PERIODIC || bx == DM_BOUNDARY_MIRROR) {
393d9c9ebe5SPeter Brune     IXs = xs - s;
394d9c9ebe5SPeter Brune     IXe = xe + s;
395d9c9ebe5SPeter Brune     Xs  = xs - s;
396d9c9ebe5SPeter Brune     Xe  = xe + s;
39788661749SPeter Brune   }
39847c6ae99SBarry Smith 
399d9c9ebe5SPeter Brune   if (ys-s > 0) {
400d9c9ebe5SPeter Brune     Ys = ys - s; IYs = ys - s;
40188661749SPeter Brune   } else {
40288661749SPeter Brune     if (by) {
40388661749SPeter Brune       Ys = ys - s;
40488661749SPeter Brune     } else {
40588661749SPeter Brune       Ys = 0;
40688661749SPeter Brune     }
40788661749SPeter Brune     IYs = 0;
40888661749SPeter Brune   }
409d9c9ebe5SPeter Brune   if (ye+s <= N) {
410d9c9ebe5SPeter Brune     Ye = ye + s; IYe = ye + s;
41188661749SPeter Brune   } else {
41288661749SPeter Brune     if (by) {
41388661749SPeter Brune       Ye = ye + s;
41488661749SPeter Brune     } else {
41588661749SPeter Brune       Ye = N;
41688661749SPeter Brune     }
41788661749SPeter Brune     IYe = N;
41888661749SPeter Brune   }
41988661749SPeter Brune 
420bff4a2f0SMatthew G. Knepley   if (by == DM_BOUNDARY_PERIODIC || by == DM_BOUNDARY_MIRROR) {
421d9c9ebe5SPeter Brune     IYs = ys - s;
422d9c9ebe5SPeter Brune     IYe = ye + s;
423d9c9ebe5SPeter Brune     Ys  = ys - s;
424d9c9ebe5SPeter Brune     Ye  = ye + s;
42588661749SPeter Brune   }
42688661749SPeter Brune 
42788661749SPeter Brune   /* stencil length in each direction */
428d9c9ebe5SPeter Brune   s_x = s;
429d9c9ebe5SPeter Brune   s_y = s;
43047c6ae99SBarry Smith 
43147c6ae99SBarry Smith   /* determine starting point of each processor */
43247c6ae99SBarry Smith   nn       = x*y;
433dcca6d9dSJed Brown   ierr     = PetscMalloc2(size+1,&bases,size,&ldims);CHKERRQ(ierr);
43447c6ae99SBarry Smith   ierr     = MPI_Allgather(&nn,1,MPIU_INT,ldims,1,MPIU_INT,comm);CHKERRQ(ierr);
43547c6ae99SBarry Smith   bases[0] = 0;
43647c6ae99SBarry Smith   for (i=1; i<=size; i++) {
43747c6ae99SBarry Smith     bases[i] = ldims[i-1];
43847c6ae99SBarry Smith   }
43947c6ae99SBarry Smith   for (i=1; i<=size; i++) {
44047c6ae99SBarry Smith     bases[i] += bases[i-1];
44147c6ae99SBarry Smith   }
442ce00eea3SSatish Balay   base = bases[rank]*dof;
44347c6ae99SBarry Smith 
44447c6ae99SBarry Smith   /* allocate the base parallel and sequential vectors */
445ce00eea3SSatish Balay   dd->Nlocal = x*y*dof;
446b1fb7eb7SBarry Smith   ierr       = VecCreateMPIWithArray(comm,dof,dd->Nlocal,PETSC_DECIDE,NULL,&global);CHKERRQ(ierr);
447ce00eea3SSatish Balay   dd->nlocal = (Xe-Xs)*(Ye-Ys)*dof;
448b1fb7eb7SBarry Smith   ierr       = VecCreateSeqWithArray(PETSC_COMM_SELF,dof,dd->nlocal,NULL,&local);CHKERRQ(ierr);
44947c6ae99SBarry Smith 
45047c6ae99SBarry Smith   /* generate appropriate vector scatters */
45147c6ae99SBarry Smith   /* local to global inserts non-ghost point region into global */
45202fe608eSBarry Smith   ierr  = PetscMalloc1((IXe-IXs)*(IYe-IYs),&idx);CHKERRQ(ierr);
453ce00eea3SSatish Balay   left  = xs - Xs; right = left + x;
454ce00eea3SSatish Balay   down  = ys - Ys; up = down + y;
45547c6ae99SBarry Smith   count = 0;
45647c6ae99SBarry Smith   for (i=down; i<up; i++) {
457ce00eea3SSatish Balay     for (j=left; j<right; j++) {
458ce00eea3SSatish Balay       idx[count++] = i*(Xe-Xs) + j;
45947c6ae99SBarry Smith     }
46047c6ae99SBarry Smith   }
46147c6ae99SBarry Smith 
462ce00eea3SSatish Balay   /* global to local must include ghost points within the domain,
463ce00eea3SSatish Balay      but not ghost points outside the domain that aren't periodic */
464d9c9ebe5SPeter Brune   if (stencil_type == DMDA_STENCIL_BOX) {
465ce00eea3SSatish Balay     left  = IXs - Xs; right = left + (IXe-IXs);
466ce00eea3SSatish Balay     down  = IYs - Ys; up = down + (IYe-IYs);
467ce00eea3SSatish Balay     count = 0;
468ce00eea3SSatish Balay     for (i=down; i<up; i++) {
469ce00eea3SSatish Balay       for (j=left; j<right; j++) {
470ce00eea3SSatish Balay         idx[count++] = j + i*(Xe-Xs);
471ce00eea3SSatish Balay       }
472ce00eea3SSatish Balay     }
473ce00eea3SSatish Balay     ierr = ISCreateBlock(comm,dof,count,idx,PETSC_OWN_POINTER,&to);CHKERRQ(ierr);
474ce00eea3SSatish Balay 
47547c6ae99SBarry Smith   } else {
47647c6ae99SBarry Smith     /* must drop into cross shape region */
47747c6ae99SBarry Smith     /*       ---------|
47847c6ae99SBarry Smith             |  top    |
479ce00eea3SSatish Balay          |---         ---| up
48047c6ae99SBarry Smith          |   middle      |
48147c6ae99SBarry Smith          |               |
482ce00eea3SSatish Balay          ----         ---- down
48347c6ae99SBarry Smith             | bottom  |
48447c6ae99SBarry Smith             -----------
48547c6ae99SBarry Smith          Xs xs        xe Xe */
486ce00eea3SSatish Balay     left  = xs - Xs; right = left + x;
487ce00eea3SSatish Balay     down  = ys - Ys; up = down + y;
48847c6ae99SBarry Smith     count = 0;
489ce00eea3SSatish Balay     /* bottom */
490ce00eea3SSatish Balay     for (i=(IYs-Ys); i<down; i++) {
491ce00eea3SSatish Balay       for (j=left; j<right; j++) {
492ce00eea3SSatish Balay         idx[count++] = j + i*(Xe-Xs);
49347c6ae99SBarry Smith       }
49447c6ae99SBarry Smith     }
49547c6ae99SBarry Smith     /* middle */
49647c6ae99SBarry Smith     for (i=down; i<up; i++) {
497ce00eea3SSatish Balay       for (j=(IXs-Xs); j<(IXe-Xs); j++) {
498ce00eea3SSatish Balay         idx[count++] = j + i*(Xe-Xs);
49947c6ae99SBarry Smith       }
50047c6ae99SBarry Smith     }
50147c6ae99SBarry Smith     /* top */
502ce00eea3SSatish Balay     for (i=up; i<up+IYe-ye; i++) {
503ce00eea3SSatish Balay       for (j=left; j<right; j++) {
504ce00eea3SSatish Balay         idx[count++] = j + i*(Xe-Xs);
50547c6ae99SBarry Smith       }
50647c6ae99SBarry Smith     }
50747c6ae99SBarry Smith     ierr = ISCreateBlock(comm,dof,count,idx,PETSC_OWN_POINTER,&to);CHKERRQ(ierr);
50847c6ae99SBarry Smith   }
50947c6ae99SBarry Smith 
51047c6ae99SBarry Smith 
51147c6ae99SBarry Smith   /* determine who lies on each side of us stored in    n6 n7 n8
51247c6ae99SBarry Smith                                                         n3    n5
51347c6ae99SBarry Smith                                                         n0 n1 n2
51447c6ae99SBarry Smith   */
51547c6ae99SBarry Smith 
51647c6ae99SBarry Smith   /* Assume the Non-Periodic Case */
51747c6ae99SBarry Smith   n1 = rank - m;
51847c6ae99SBarry Smith   if (rank % m) {
51947c6ae99SBarry Smith     n0 = n1 - 1;
52047c6ae99SBarry Smith   } else {
52147c6ae99SBarry Smith     n0 = -1;
52247c6ae99SBarry Smith   }
52347c6ae99SBarry Smith   if ((rank+1) % m) {
52447c6ae99SBarry Smith     n2 = n1 + 1;
52547c6ae99SBarry Smith     n5 = rank + 1;
52647c6ae99SBarry Smith     n8 = rank + m + 1; if (n8 >= m*n) n8 = -1;
52747c6ae99SBarry Smith   } else {
52847c6ae99SBarry Smith     n2 = -1; n5 = -1; n8 = -1;
52947c6ae99SBarry Smith   }
53047c6ae99SBarry Smith   if (rank % m) {
53147c6ae99SBarry Smith     n3 = rank - 1;
53247c6ae99SBarry Smith     n6 = n3 + m; if (n6 >= m*n) n6 = -1;
53347c6ae99SBarry Smith   } else {
53447c6ae99SBarry Smith     n3 = -1; n6 = -1;
53547c6ae99SBarry Smith   }
53647c6ae99SBarry Smith   n7 = rank + m; if (n7 >= m*n) n7 = -1;
53747c6ae99SBarry Smith 
538bff4a2f0SMatthew G. Knepley   if (bx == DM_BOUNDARY_PERIODIC && by == DM_BOUNDARY_PERIODIC) {
53947c6ae99SBarry Smith     /* Modify for Periodic Cases */
54047c6ae99SBarry Smith     /* Handle all four corners */
54147c6ae99SBarry Smith     if ((n6 < 0) && (n7 < 0) && (n3 < 0)) n6 = m-1;
54247c6ae99SBarry Smith     if ((n8 < 0) && (n7 < 0) && (n5 < 0)) n8 = 0;
54347c6ae99SBarry Smith     if ((n2 < 0) && (n5 < 0) && (n1 < 0)) n2 = size-m;
54447c6ae99SBarry Smith     if ((n0 < 0) && (n3 < 0) && (n1 < 0)) n0 = size-1;
54547c6ae99SBarry Smith 
54647c6ae99SBarry Smith     /* Handle Top and Bottom Sides */
54747c6ae99SBarry Smith     if (n1 < 0) n1 = rank + m * (n-1);
54847c6ae99SBarry Smith     if (n7 < 0) n7 = rank - m * (n-1);
54947c6ae99SBarry Smith     if ((n3 >= 0) && (n0 < 0)) n0 = size - m + rank - 1;
55047c6ae99SBarry Smith     if ((n3 >= 0) && (n6 < 0)) n6 = (rank%m)-1;
55147c6ae99SBarry Smith     if ((n5 >= 0) && (n2 < 0)) n2 = size - m + rank + 1;
55247c6ae99SBarry Smith     if ((n5 >= 0) && (n8 < 0)) n8 = (rank%m)+1;
55347c6ae99SBarry Smith 
55447c6ae99SBarry Smith     /* Handle Left and Right Sides */
55547c6ae99SBarry Smith     if (n3 < 0) n3 = rank + (m-1);
55647c6ae99SBarry Smith     if (n5 < 0) n5 = rank - (m-1);
55747c6ae99SBarry Smith     if ((n1 >= 0) && (n0 < 0)) n0 = rank-1;
55847c6ae99SBarry Smith     if ((n1 >= 0) && (n2 < 0)) n2 = rank-2*m+1;
55947c6ae99SBarry Smith     if ((n7 >= 0) && (n6 < 0)) n6 = rank+2*m-1;
56047c6ae99SBarry Smith     if ((n7 >= 0) && (n8 < 0)) n8 = rank+1;
561bff4a2f0SMatthew G. Knepley   } else if (by == DM_BOUNDARY_PERIODIC) {  /* Handle Top and Bottom Sides */
562ce00eea3SSatish Balay     if (n1 < 0) n1 = rank + m * (n-1);
563ce00eea3SSatish Balay     if (n7 < 0) n7 = rank - m * (n-1);
564ce00eea3SSatish Balay     if ((n3 >= 0) && (n0 < 0)) n0 = size - m + rank - 1;
565ce00eea3SSatish Balay     if ((n3 >= 0) && (n6 < 0)) n6 = (rank%m)-1;
566ce00eea3SSatish Balay     if ((n5 >= 0) && (n2 < 0)) n2 = size - m + rank + 1;
567ce00eea3SSatish Balay     if ((n5 >= 0) && (n8 < 0)) n8 = (rank%m)+1;
568bff4a2f0SMatthew G. Knepley   } else if (bx == DM_BOUNDARY_PERIODIC) { /* Handle Left and Right Sides */
569ce00eea3SSatish Balay     if (n3 < 0) n3 = rank + (m-1);
570ce00eea3SSatish Balay     if (n5 < 0) n5 = rank - (m-1);
571ce00eea3SSatish Balay     if ((n1 >= 0) && (n0 < 0)) n0 = rank-1;
572ce00eea3SSatish Balay     if ((n1 >= 0) && (n2 < 0)) n2 = rank-2*m+1;
573ce00eea3SSatish Balay     if ((n7 >= 0) && (n6 < 0)) n6 = rank+2*m-1;
574ce00eea3SSatish Balay     if ((n7 >= 0) && (n8 < 0)) n8 = rank+1;
57547c6ae99SBarry Smith   }
576ce00eea3SSatish Balay 
577785e854fSJed Brown   ierr = PetscMalloc1(9,&dd->neighbors);CHKERRQ(ierr);
5788865f1eaSKarl Rupp 
57947c6ae99SBarry Smith   dd->neighbors[0] = n0;
58047c6ae99SBarry Smith   dd->neighbors[1] = n1;
58147c6ae99SBarry Smith   dd->neighbors[2] = n2;
58247c6ae99SBarry Smith   dd->neighbors[3] = n3;
58347c6ae99SBarry Smith   dd->neighbors[4] = rank;
58447c6ae99SBarry Smith   dd->neighbors[5] = n5;
58547c6ae99SBarry Smith   dd->neighbors[6] = n6;
58647c6ae99SBarry Smith   dd->neighbors[7] = n7;
58747c6ae99SBarry Smith   dd->neighbors[8] = n8;
58847c6ae99SBarry Smith 
589d9c9ebe5SPeter Brune   if (stencil_type == DMDA_STENCIL_STAR) {
59047c6ae99SBarry Smith     /* save corner processor numbers */
59147c6ae99SBarry Smith     sn0 = n0; sn2 = n2; sn6 = n6; sn8 = n8;
59247c6ae99SBarry Smith     n0  = n2 = n6 = n8 = -1;
59347c6ae99SBarry Smith   }
59447c6ae99SBarry Smith 
595785e854fSJed Brown   ierr = PetscMalloc1((Xe-Xs)*(Ye-Ys),&idx);CHKERRQ(ierr);
59647c6ae99SBarry Smith 
597ce00eea3SSatish Balay   nn = 0;
59847c6ae99SBarry Smith   xbase = bases[rank];
59947c6ae99SBarry Smith   for (i=1; i<=s_y; i++) {
60047c6ae99SBarry Smith     if (n0 >= 0) { /* left below */
601ce00eea3SSatish Balay       x_t = lx[n0 % m];
60247c6ae99SBarry Smith       y_t = ly[(n0/m)];
60347c6ae99SBarry Smith       s_t = bases[n0] + x_t*y_t - (s_y-i)*x_t - s_x;
6048865f1eaSKarl Rupp       for (j=0; j<s_x; j++) idx[nn++] = s_t++;
60547c6ae99SBarry Smith     }
606ac119b13SBarry Smith 
60747c6ae99SBarry Smith     if (n1 >= 0) { /* directly below */
60847c6ae99SBarry Smith       x_t = x;
60947c6ae99SBarry Smith       y_t = ly[(n1/m)];
61047c6ae99SBarry Smith       s_t = bases[n1] + x_t*y_t - (s_y+1-i)*x_t;
6118865f1eaSKarl Rupp       for (j=0; j<x_t; j++) idx[nn++] = s_t++;
612bff4a2f0SMatthew G. Knepley     } else if (by == DM_BOUNDARY_MIRROR) {
6138865f1eaSKarl Rupp       for (j=0; j<x; j++) idx[nn++] = bases[rank] + x*(s_y - i + 1)  + j;
61447c6ae99SBarry Smith     }
615ac119b13SBarry Smith 
61647c6ae99SBarry Smith     if (n2 >= 0) { /* right below */
617ce00eea3SSatish Balay       x_t = lx[n2 % m];
61847c6ae99SBarry Smith       y_t = ly[(n2/m)];
61947c6ae99SBarry Smith       s_t = bases[n2] + x_t*y_t - (s_y+1-i)*x_t;
6208865f1eaSKarl Rupp       for (j=0; j<s_x; j++) idx[nn++] = s_t++;
62147c6ae99SBarry Smith     }
62247c6ae99SBarry Smith   }
62347c6ae99SBarry Smith 
62447c6ae99SBarry Smith   for (i=0; i<y; i++) {
62547c6ae99SBarry Smith     if (n3 >= 0) { /* directly left */
626ce00eea3SSatish Balay       x_t = lx[n3 % m];
62747c6ae99SBarry Smith       /* y_t = y; */
62847c6ae99SBarry Smith       s_t = bases[n3] + (i+1)*x_t - s_x;
6298865f1eaSKarl Rupp       for (j=0; j<s_x; j++) idx[nn++] = s_t++;
630bff4a2f0SMatthew G. Knepley     } else if (bx == DM_BOUNDARY_MIRROR) {
6318865f1eaSKarl Rupp       for (j=0; j<s_x; j++) idx[nn++] = bases[rank] + x*i + s_x - j;
63247c6ae99SBarry Smith     }
63347c6ae99SBarry Smith 
6348865f1eaSKarl Rupp     for (j=0; j<x; j++) idx[nn++] = xbase++; /* interior */
63547c6ae99SBarry Smith 
63647c6ae99SBarry Smith     if (n5 >= 0) { /* directly right */
637ce00eea3SSatish Balay       x_t = lx[n5 % m];
63847c6ae99SBarry Smith       /* y_t = y; */
63947c6ae99SBarry Smith       s_t = bases[n5] + (i)*x_t;
6408865f1eaSKarl Rupp       for (j=0; j<s_x; j++) idx[nn++] = s_t++;
641bff4a2f0SMatthew G. Knepley     } else if (bx == DM_BOUNDARY_MIRROR) {
6428865f1eaSKarl Rupp       for (j=0; j<s_x; j++) idx[nn++] = bases[rank] + x*(i + 1) - 2 - j;
64347c6ae99SBarry Smith     }
64447c6ae99SBarry Smith   }
64547c6ae99SBarry Smith 
64647c6ae99SBarry Smith   for (i=1; i<=s_y; i++) {
64747c6ae99SBarry Smith     if (n6 >= 0) { /* left above */
648ce00eea3SSatish Balay       x_t = lx[n6 % m];
64947c6ae99SBarry Smith       /* y_t = ly[(n6/m)]; */
65047c6ae99SBarry Smith       s_t = bases[n6] + (i)*x_t - s_x;
6518865f1eaSKarl Rupp       for (j=0; j<s_x; j++) idx[nn++] = s_t++;
65247c6ae99SBarry Smith     }
653ac119b13SBarry Smith 
65447c6ae99SBarry Smith     if (n7 >= 0) { /* directly above */
65547c6ae99SBarry Smith       x_t = x;
65647c6ae99SBarry Smith       /* y_t = ly[(n7/m)]; */
65747c6ae99SBarry Smith       s_t = bases[n7] + (i-1)*x_t;
6588865f1eaSKarl Rupp       for (j=0; j<x_t; j++) idx[nn++] = s_t++;
659bff4a2f0SMatthew G. Knepley     } else if (by == DM_BOUNDARY_MIRROR) {
6608865f1eaSKarl Rupp       for (j=0; j<x; j++) idx[nn++] = bases[rank] + x*(y - i - 1)  + j;
66147c6ae99SBarry Smith     }
662ac119b13SBarry Smith 
66347c6ae99SBarry Smith     if (n8 >= 0) { /* right above */
664ce00eea3SSatish Balay       x_t = lx[n8 % m];
66547c6ae99SBarry Smith       /* y_t = ly[(n8/m)]; */
66647c6ae99SBarry Smith       s_t = bases[n8] + (i-1)*x_t;
6678865f1eaSKarl Rupp       for (j=0; j<s_x; j++) idx[nn++] = s_t++;
66847c6ae99SBarry Smith     }
66947c6ae99SBarry Smith   }
67047c6ae99SBarry Smith 
671b1fb7eb7SBarry Smith   ierr = ISCreateBlock(comm,dof,nn,idx,PETSC_USE_POINTER,&from);CHKERRQ(ierr);
67247c6ae99SBarry Smith   ierr = VecScatterCreate(global,from,local,to,&gtol);CHKERRQ(ierr);
6733bb1ff40SBarry Smith   ierr = PetscLogObjectParent((PetscObject)da,(PetscObject)gtol);CHKERRQ(ierr);
674fcfd50ebSBarry Smith   ierr = ISDestroy(&to);CHKERRQ(ierr);
675fcfd50ebSBarry Smith   ierr = ISDestroy(&from);CHKERRQ(ierr);
67647c6ae99SBarry Smith 
677d9c9ebe5SPeter Brune   if (stencil_type == DMDA_STENCIL_STAR) {
678ce00eea3SSatish Balay     n0 = sn0; n2 = sn2; n6 = sn6; n8 = sn8;
679ce00eea3SSatish Balay   }
680ce00eea3SSatish Balay 
681288e7d53SBarry Smith   if (((stencil_type == DMDA_STENCIL_STAR)  || (bx && bx != DM_BOUNDARY_PERIODIC) || (by && by != DM_BOUNDARY_PERIODIC))) {
68247c6ae99SBarry Smith     /*
68347c6ae99SBarry Smith         Recompute the local to global mappings, this time keeping the
684ce00eea3SSatish Balay       information about the cross corner processor numbers and any ghosted
685ce00eea3SSatish Balay       but not periodic indices.
68647c6ae99SBarry Smith     */
68747c6ae99SBarry Smith     nn    = 0;
68847c6ae99SBarry Smith     xbase = bases[rank];
68947c6ae99SBarry Smith     for (i=1; i<=s_y; i++) {
69047c6ae99SBarry Smith       if (n0 >= 0) { /* left below */
691ce00eea3SSatish Balay         x_t = lx[n0 % m];
69247c6ae99SBarry Smith         y_t = ly[(n0/m)];
69347c6ae99SBarry Smith         s_t = bases[n0] + x_t*y_t - (s_y-i)*x_t - s_x;
6948865f1eaSKarl Rupp         for (j=0; j<s_x; j++) idx[nn++] = s_t++;
695ce00eea3SSatish Balay       } else if (xs-Xs > 0 && ys-Ys > 0) {
6968865f1eaSKarl Rupp         for (j=0; j<s_x; j++) idx[nn++] = -1;
69747c6ae99SBarry Smith       }
69847c6ae99SBarry Smith       if (n1 >= 0) { /* directly below */
69947c6ae99SBarry Smith         x_t = x;
70047c6ae99SBarry Smith         y_t = ly[(n1/m)];
70147c6ae99SBarry Smith         s_t = bases[n1] + x_t*y_t - (s_y+1-i)*x_t;
7028865f1eaSKarl Rupp         for (j=0; j<x_t; j++) idx[nn++] = s_t++;
703ce00eea3SSatish Balay       } else if (ys-Ys > 0) {
704bff4a2f0SMatthew G. Knepley         if (by == DM_BOUNDARY_MIRROR) {
7058865f1eaSKarl Rupp           for (j=0; j<x; j++) idx[nn++] = bases[rank] + x*(s_y - i + 1)  + j;
706624904c4SBarry Smith         } else {
7078865f1eaSKarl Rupp           for (j=0; j<x; j++) idx[nn++] = -1;
70847c6ae99SBarry Smith         }
709624904c4SBarry Smith       }
71047c6ae99SBarry Smith       if (n2 >= 0) { /* right below */
711ce00eea3SSatish Balay         x_t = lx[n2 % m];
71247c6ae99SBarry Smith         y_t = ly[(n2/m)];
71347c6ae99SBarry Smith         s_t = bases[n2] + x_t*y_t - (s_y+1-i)*x_t;
7148865f1eaSKarl Rupp         for (j=0; j<s_x; j++) idx[nn++] = s_t++;
715ce00eea3SSatish Balay       } else if (Xe-xe> 0 && ys-Ys > 0) {
7168865f1eaSKarl Rupp         for (j=0; j<s_x; j++) idx[nn++] = -1;
71747c6ae99SBarry Smith       }
71847c6ae99SBarry Smith     }
71947c6ae99SBarry Smith 
72047c6ae99SBarry Smith     for (i=0; i<y; i++) {
72147c6ae99SBarry Smith       if (n3 >= 0) { /* directly left */
722ce00eea3SSatish Balay         x_t = lx[n3 % m];
72347c6ae99SBarry Smith         /* y_t = y; */
72447c6ae99SBarry Smith         s_t = bases[n3] + (i+1)*x_t - s_x;
7258865f1eaSKarl Rupp         for (j=0; j<s_x; j++) idx[nn++] = s_t++;
726ce00eea3SSatish Balay       } else if (xs-Xs > 0) {
727bff4a2f0SMatthew G. Knepley         if (bx == DM_BOUNDARY_MIRROR) {
7288865f1eaSKarl Rupp           for (j=0; j<s_x; j++) idx[nn++] = bases[rank] + x*i + s_x - j;
729624904c4SBarry Smith         } else {
7308865f1eaSKarl Rupp           for (j=0; j<s_x; j++) idx[nn++] = -1;
73147c6ae99SBarry Smith         }
732624904c4SBarry Smith       }
73347c6ae99SBarry Smith 
7348865f1eaSKarl Rupp       for (j=0; j<x; j++) idx[nn++] = xbase++; /* interior */
73547c6ae99SBarry Smith 
73647c6ae99SBarry Smith       if (n5 >= 0) { /* directly right */
737ce00eea3SSatish Balay         x_t = lx[n5 % m];
73847c6ae99SBarry Smith         /* y_t = y; */
73947c6ae99SBarry Smith         s_t = bases[n5] + (i)*x_t;
7408865f1eaSKarl Rupp         for (j=0; j<s_x; j++) idx[nn++] = s_t++;
741ce00eea3SSatish Balay       } else if (Xe-xe > 0) {
742bff4a2f0SMatthew G. Knepley         if (bx == DM_BOUNDARY_MIRROR) {
7438865f1eaSKarl Rupp           for (j=0; j<s_x; j++) idx[nn++] = bases[rank] + x*(i + 1) - 2 - j;
744624904c4SBarry Smith         } else {
7458865f1eaSKarl Rupp           for (j=0; j<s_x; j++) idx[nn++] = -1;
74647c6ae99SBarry Smith         }
74747c6ae99SBarry Smith       }
748624904c4SBarry Smith     }
74947c6ae99SBarry Smith 
75047c6ae99SBarry Smith     for (i=1; i<=s_y; i++) {
75147c6ae99SBarry Smith       if (n6 >= 0) { /* left above */
752ce00eea3SSatish Balay         x_t = lx[n6 % m];
75347c6ae99SBarry Smith         /* y_t = ly[(n6/m)]; */
75447c6ae99SBarry Smith         s_t = bases[n6] + (i)*x_t - s_x;
7558865f1eaSKarl Rupp         for (j=0; j<s_x; j++) idx[nn++] = s_t++;
756ce00eea3SSatish Balay       } else if (xs-Xs > 0 && Ye-ye > 0) {
7578865f1eaSKarl Rupp         for (j=0; j<s_x; j++) idx[nn++] = -1;
75847c6ae99SBarry Smith       }
75947c6ae99SBarry Smith       if (n7 >= 0) { /* directly above */
76047c6ae99SBarry Smith         x_t = x;
76147c6ae99SBarry Smith         /* y_t = ly[(n7/m)]; */
76247c6ae99SBarry Smith         s_t = bases[n7] + (i-1)*x_t;
7638865f1eaSKarl Rupp         for (j=0; j<x_t; j++) idx[nn++] = s_t++;
764ce00eea3SSatish Balay       } else if (Ye-ye > 0) {
765bff4a2f0SMatthew G. Knepley         if (by == DM_BOUNDARY_MIRROR) {
7668865f1eaSKarl Rupp           for (j=0; j<x; j++) idx[nn++] = bases[rank] + x*(y - i - 1)  + j;
767624904c4SBarry Smith         } else {
7688865f1eaSKarl Rupp           for (j=0; j<x; j++) idx[nn++] = -1;
76947c6ae99SBarry Smith         }
770624904c4SBarry Smith       }
77147c6ae99SBarry Smith       if (n8 >= 0) { /* right above */
772ce00eea3SSatish Balay         x_t = lx[n8 % m];
77347c6ae99SBarry Smith         /* y_t = ly[(n8/m)]; */
77447c6ae99SBarry Smith         s_t = bases[n8] + (i-1)*x_t;
7758865f1eaSKarl Rupp         for (j=0; j<s_x; j++) idx[nn++] = s_t++;
776ce00eea3SSatish Balay       } else if (Xe-xe > 0 && Ye-ye > 0) {
7778865f1eaSKarl Rupp         for (j=0; j<s_x; j++) idx[nn++] = -1;
77847c6ae99SBarry Smith       }
77947c6ae99SBarry Smith     }
78047c6ae99SBarry Smith   }
781ce00eea3SSatish Balay   /*
782ce00eea3SSatish Balay      Set the local to global ordering in the global vector, this allows use
783ce00eea3SSatish Balay      of VecSetValuesLocal().
784ce00eea3SSatish Balay   */
78545b6f7e9SBarry Smith   ierr = ISLocalToGlobalMappingCreate(comm,dof,nn,idx,PETSC_OWN_POINTER,&da->ltogmap);CHKERRQ(ierr);
7863bb1ff40SBarry Smith   ierr = PetscLogObjectParent((PetscObject)da,(PetscObject)da->ltogmap);CHKERRQ(ierr);
78747c6ae99SBarry Smith 
788ce00eea3SSatish Balay   ierr  = PetscFree2(bases,ldims);CHKERRQ(ierr);
78947c6ae99SBarry Smith   dd->m = m;  dd->n  = n;
790ce00eea3SSatish Balay   /* note petsc expects xs/xe/Xs/Xe to be multiplied by #dofs in many places */
791ce00eea3SSatish Balay   dd->xs = xs*dof; dd->xe = xe*dof; dd->ys = ys; dd->ye = ye; dd->zs = 0; dd->ze = 1;
792ce00eea3SSatish Balay   dd->Xs = Xs*dof; dd->Xe = Xe*dof; dd->Ys = Ys; dd->Ye = Ye; dd->Zs = 0; dd->Ze = 1;
79347c6ae99SBarry Smith 
794fcfd50ebSBarry Smith   ierr = VecDestroy(&local);CHKERRQ(ierr);
795fcfd50ebSBarry Smith   ierr = VecDestroy(&global);CHKERRQ(ierr);
79647c6ae99SBarry Smith 
79747c6ae99SBarry Smith   dd->gtol      = gtol;
79847c6ae99SBarry Smith   dd->base      = base;
7999a42bb27SBarry Smith   da->ops->view = DMView_DA_2d;
8000298fd71SBarry Smith   dd->ltol      = NULL;
8010298fd71SBarry Smith   dd->ao        = NULL;
80247c6ae99SBarry Smith   PetscFunctionReturn(0);
80347c6ae99SBarry Smith }
80447c6ae99SBarry Smith 
80547c6ae99SBarry Smith /*@C
806aa219208SBarry Smith    DMDACreate2d -  Creates an object that will manage the communication of  two-dimensional
80747c6ae99SBarry Smith    regular array data that is distributed across some processors.
80847c6ae99SBarry Smith 
80947c6ae99SBarry Smith    Collective on MPI_Comm
81047c6ae99SBarry Smith 
81147c6ae99SBarry Smith    Input Parameters:
81247c6ae99SBarry Smith +  comm - MPI communicator
8131321219cSEthan Coon .  bx,by - type of ghost nodes the array have.
814bff4a2f0SMatthew G. Knepley          Use one of DM_BOUNDARY_NONE, DM_BOUNDARY_GHOSTED, DM_BOUNDARY_PERIODIC.
815aa219208SBarry Smith .  stencil_type - stencil type.  Use either DMDA_STENCIL_BOX or DMDA_STENCIL_STAR.
816897f7067SBarry Smith .  M,N - global dimension in each direction of the array
81747c6ae99SBarry Smith .  m,n - corresponding number of processors in each dimension
81847c6ae99SBarry Smith          (or PETSC_DECIDE to have calculated)
81947c6ae99SBarry Smith .  dof - number of degrees of freedom per node
82047c6ae99SBarry Smith .  s - stencil width
82147c6ae99SBarry Smith -  lx, ly - arrays containing the number of nodes in each cell along
8220298fd71SBarry Smith            the x and y coordinates, or NULL. If non-null, these
82347c6ae99SBarry Smith            must be of length as m and n, and the corresponding
82447c6ae99SBarry Smith            m and n cannot be PETSC_DECIDE. The sum of the lx[] entries
82547c6ae99SBarry Smith            must be M, and the sum of the ly[] entries must be N.
82647c6ae99SBarry Smith 
82747c6ae99SBarry Smith    Output Parameter:
82847c6ae99SBarry Smith .  da - the resulting distributed array object
82947c6ae99SBarry Smith 
83047c6ae99SBarry Smith    Options Database Key:
831706a11cbSBarry Smith +  -dm_view - Calls DMView() at the conclusion of DMDACreate2d()
83247c6ae99SBarry Smith .  -da_grid_x <nx> - number of grid points in x direction, if M < 0
83347c6ae99SBarry Smith .  -da_grid_y <ny> - number of grid points in y direction, if N < 0
83447c6ae99SBarry Smith .  -da_processors_x <nx> - number of processors in x direction
83547c6ae99SBarry Smith .  -da_processors_y <ny> - number of processors in y direction
836e0f5d30fSBarry Smith .  -da_refine_x <rx> - refinement ratio in x direction
837e0f5d30fSBarry Smith .  -da_refine_y <ry> - refinement ratio in y direction
838e0f5d30fSBarry Smith -  -da_refine <n> - refine the DMDA n times before creating, if M or N < 0
839e0f5d30fSBarry Smith 
84047c6ae99SBarry Smith 
84147c6ae99SBarry Smith    Level: beginner
84247c6ae99SBarry Smith 
84347c6ae99SBarry Smith    Notes:
844aa219208SBarry Smith    The stencil type DMDA_STENCIL_STAR with width 1 corresponds to the
845aa219208SBarry Smith    standard 5-pt stencil, while DMDA_STENCIL_BOX with width 1 denotes
84647c6ae99SBarry Smith    the standard 9-pt stencil.
84747c6ae99SBarry Smith 
848aa219208SBarry Smith    The array data itself is NOT stored in the DMDA, it is stored in Vec objects;
849564755cdSBarry Smith    The appropriate vector objects can be obtained with calls to DMCreateGlobalVector()
850564755cdSBarry Smith    and DMCreateLocalVector() and calls to VecDuplicate() if more are needed.
85147c6ae99SBarry Smith 
852897f7067SBarry Smith    You must call DMSetUp() after this call before using this DM.
853897f7067SBarry Smith 
854897f7067SBarry Smith    If you wish to use the options database to change values in the DMDA call DMSetFromOptions() after this call
855897f7067SBarry Smith    but before DMSetUp().
856897f7067SBarry Smith 
85747c6ae99SBarry Smith .keywords: distributed array, create, two-dimensional
85847c6ae99SBarry Smith 
859aa219208SBarry Smith .seealso: DMDestroy(), DMView(), DMDACreate1d(), DMDACreate3d(), DMGlobalToLocalBegin(), DMDAGetRefinementFactor(),
86099f0b487SRichard Tran Mills           DMGlobalToLocalEnd(), DMLocalToGlobalBegin(), DMLocalToLocalBegin(), DMLocalToLocalEnd(), DMDASetRefinementFactor(),
861d461ba97SBarry Smith           DMDAGetInfo(), DMCreateGlobalVector(), DMCreateLocalVector(), DMDACreateNaturalVector(), DMLoad(), DMDAGetOwnershipRanges()
86247c6ae99SBarry Smith 
86347c6ae99SBarry Smith @*/
864fe16a2e9SBarry Smith 
865bff4a2f0SMatthew G. Knepley PetscErrorCode  DMDACreate2d(MPI_Comm comm,DMBoundaryType bx,DMBoundaryType by,DMDAStencilType stencil_type,
8669a42bb27SBarry Smith                           PetscInt M,PetscInt N,PetscInt m,PetscInt n,PetscInt dof,PetscInt s,const PetscInt lx[],const PetscInt ly[],DM *da)
86747c6ae99SBarry Smith {
86847c6ae99SBarry Smith   PetscErrorCode ierr;
86947c6ae99SBarry Smith 
87047c6ae99SBarry Smith   PetscFunctionBegin;
871aa219208SBarry Smith   ierr = DMDACreate(comm, da);CHKERRQ(ierr);
872c73cfb54SMatthew G. Knepley   ierr = DMSetDimension(*da, 2);CHKERRQ(ierr);
873aa219208SBarry Smith   ierr = DMDASetSizes(*da, M, N, 1);CHKERRQ(ierr);
874aa219208SBarry Smith   ierr = DMDASetNumProcs(*da, m, n, PETSC_DECIDE);CHKERRQ(ierr);
875bff4a2f0SMatthew G. Knepley   ierr = DMDASetBoundaryType(*da, bx, by, DM_BOUNDARY_NONE);CHKERRQ(ierr);
876aa219208SBarry Smith   ierr = DMDASetDof(*da, dof);CHKERRQ(ierr);
877aa219208SBarry Smith   ierr = DMDASetStencilType(*da, stencil_type);CHKERRQ(ierr);
878aa219208SBarry Smith   ierr = DMDASetStencilWidth(*da, s);CHKERRQ(ierr);
8790298fd71SBarry Smith   ierr = DMDASetOwnershipRanges(*da, lx, ly, NULL);CHKERRQ(ierr);
88047c6ae99SBarry Smith   PetscFunctionReturn(0);
88147c6ae99SBarry Smith }
882