xref: /petsc/src/dm/impls/da/fdda.c (revision 5e26d47bee92f501842428e6c4c2289ae309a7be)
147c6ae99SBarry Smith 
2af0996ceSBarry Smith #include <petsc/private/dmdaimpl.h> /*I      "petscdmda.h"     I*/
307475bc1SBarry Smith #include <petscmat.h>
447c6ae99SBarry Smith 
5e727c939SJed Brown extern PetscErrorCode DMCreateColoring_DA_1d_MPIAIJ(DM,ISColoringType,ISColoring*);
6e727c939SJed Brown extern PetscErrorCode DMCreateColoring_DA_2d_MPIAIJ(DM,ISColoringType,ISColoring*);
7e727c939SJed Brown extern PetscErrorCode DMCreateColoring_DA_2d_5pt_MPIAIJ(DM,ISColoringType,ISColoring*);
8e727c939SJed Brown extern PetscErrorCode DMCreateColoring_DA_3d_MPIAIJ(DM,ISColoringType,ISColoring*);
947c6ae99SBarry Smith 
/*
   For a ghost index i that may be negative or greater than or equal to the upper bound m,
  this maps it into the 0:m-1 range using periodicity.

   Only a single wrap is applied (m is added or subtracted once). Every argument is fully
  parenthesized so that expressions such as SetInRange(i-1,nx+ny) expand correctly; the
  arguments are still evaluated more than once, so they must not have side effects.
*/
#define SetInRange(i,m) (((i) < 0) ? (m)+(i) : (((i) >= (m)) ? (i)-(m) : (i)))
1547c6ae99SBarry Smith 
16ce308e1dSBarry Smith static PetscErrorCode DMDASetBlockFills_Private(const PetscInt *dfill,PetscInt w,PetscInt **rfill)
1747c6ae99SBarry Smith {
1847c6ae99SBarry Smith   PetscErrorCode ierr;
1947c6ae99SBarry Smith   PetscInt       i,j,nz,*fill;
2047c6ae99SBarry Smith 
2147c6ae99SBarry Smith   PetscFunctionBegin;
2247c6ae99SBarry Smith   if (!dfill) PetscFunctionReturn(0);
2347c6ae99SBarry Smith 
2447c6ae99SBarry Smith   /* count number nonzeros */
2547c6ae99SBarry Smith   nz = 0;
2647c6ae99SBarry Smith   for (i=0; i<w; i++) {
2747c6ae99SBarry Smith     for (j=0; j<w; j++) {
2847c6ae99SBarry Smith       if (dfill[w*i+j]) nz++;
2947c6ae99SBarry Smith     }
3047c6ae99SBarry Smith   }
31854ce69bSBarry Smith   ierr = PetscMalloc1(nz + w + 1,&fill);CHKERRQ(ierr);
3247c6ae99SBarry Smith   /* construct modified CSR storage of nonzero structure */
33ce308e1dSBarry Smith   /*  fill[0 -- w] marks starts of each row of column indices (and end of last row)
34ce308e1dSBarry Smith    so fill[1] - fill[0] gives number of nonzeros in first row etc */
3547c6ae99SBarry Smith   nz = w + 1;
3647c6ae99SBarry Smith   for (i=0; i<w; i++) {
3747c6ae99SBarry Smith     fill[i] = nz;
3847c6ae99SBarry Smith     for (j=0; j<w; j++) {
3947c6ae99SBarry Smith       if (dfill[w*i+j]) {
4047c6ae99SBarry Smith         fill[nz] = j;
4147c6ae99SBarry Smith         nz++;
4247c6ae99SBarry Smith       }
4347c6ae99SBarry Smith     }
4447c6ae99SBarry Smith   }
4547c6ae99SBarry Smith   fill[w] = nz;
4647c6ae99SBarry Smith 
4747c6ae99SBarry Smith   *rfill = fill;
4847c6ae99SBarry Smith   PetscFunctionReturn(0);
4947c6ae99SBarry Smith }
5047c6ae99SBarry Smith 
5147c6ae99SBarry Smith /*@
52aa219208SBarry Smith     DMDASetBlockFills - Sets the fill pattern in each block for a multi-component problem
53950540a4SJed Brown     of the matrix returned by DMCreateMatrix().
5447c6ae99SBarry Smith 
55aa219208SBarry Smith     Logically Collective on DMDA
5647c6ae99SBarry Smith 
5747c6ae99SBarry Smith     Input Parameter:
5847c6ae99SBarry Smith +   da - the distributed array
590298fd71SBarry Smith .   dfill - the fill pattern in the diagonal block (may be NULL, means use dense block)
6047c6ae99SBarry Smith -   ofill - the fill pattern in the off-diagonal blocks
6147c6ae99SBarry Smith 
6247c6ae99SBarry Smith 
6347c6ae99SBarry Smith     Level: developer
6447c6ae99SBarry Smith 
6547c6ae99SBarry Smith     Notes: This only makes sense when you are doing multicomponent problems but using the
6647c6ae99SBarry Smith        MPIAIJ matrix format
6747c6ae99SBarry Smith 
6847c6ae99SBarry Smith            The format for dfill and ofill is a 2 dimensional dof by dof matrix with 1 entries
6947c6ae99SBarry Smith        representing coupling and 0 entries for missing coupling. For example
7047c6ae99SBarry Smith $             dfill[9] = {1, 0, 0,
7147c6ae99SBarry Smith $                         1, 1, 0,
7247c6ae99SBarry Smith $                         0, 1, 1}
7347c6ae99SBarry Smith        means that row 0 is coupled with only itself in the diagonal block, row 1 is coupled with
7447c6ae99SBarry Smith        itself and row 0 (in the diagonal block) and row 2 is coupled with itself and row 1 (in the
7547c6ae99SBarry Smith        diagonal block).
7647c6ae99SBarry Smith 
77aa219208SBarry Smith      DMDASetGetMatrix() allows you to provide general code for those more complicated nonzero patterns then
7847c6ae99SBarry Smith      can be represented in the dfill, ofill format
7947c6ae99SBarry Smith 
8047c6ae99SBarry Smith    Contributed by Glenn Hammond
8147c6ae99SBarry Smith 
828ddb5d8bSBarry Smith .seealso DMCreateMatrix(), DMDASetGetMatrix(), DMSetMatrixPreallocateOnly()
8347c6ae99SBarry Smith 
8447c6ae99SBarry Smith @*/
85ce308e1dSBarry Smith PetscErrorCode  DMDASetBlockFills(DM da,const PetscInt *dfill,const PetscInt *ofill)
8647c6ae99SBarry Smith {
8747c6ae99SBarry Smith   DM_DA          *dd = (DM_DA*)da->data;
8847c6ae99SBarry Smith   PetscErrorCode ierr;
89ae4f298aSBarry Smith   PetscInt       i,k,cnt = 1;
9047c6ae99SBarry Smith 
9147c6ae99SBarry Smith   PetscFunctionBegin;
92aa219208SBarry Smith   ierr = DMDASetBlockFills_Private(dfill,dd->w,&dd->dfill);CHKERRQ(ierr);
93aa219208SBarry Smith   ierr = DMDASetBlockFills_Private(ofill,dd->w,&dd->ofill);CHKERRQ(ierr);
94ae4f298aSBarry Smith 
95ae4f298aSBarry Smith   /* ofillcount tracks the columns of ofill that have any nonzero in thems; the value in each location is the number of
96ae4f298aSBarry Smith    columns to the left with any nonzeros in them plus 1 */
971795a4d1SJed Brown   ierr = PetscCalloc1(dd->w,&dd->ofillcols);CHKERRQ(ierr);
98ae4f298aSBarry Smith   for (i=0; i<dd->w; i++) {
99ae4f298aSBarry Smith     for (k=dd->ofill[i]; k<dd->ofill[i+1]; k++) dd->ofillcols[dd->ofill[k]] = 1;
100ae4f298aSBarry Smith   }
101ae4f298aSBarry Smith   for (i=0; i<dd->w; i++) {
102ae4f298aSBarry Smith     if (dd->ofillcols[i]) {
103ae4f298aSBarry Smith       dd->ofillcols[i] = cnt++;
104ae4f298aSBarry Smith     }
105ae4f298aSBarry Smith   }
10647c6ae99SBarry Smith   PetscFunctionReturn(0);
10747c6ae99SBarry Smith }
10847c6ae99SBarry Smith 
10947c6ae99SBarry Smith 
110b412c318SBarry Smith PetscErrorCode  DMCreateColoring_DA(DM da,ISColoringType ctype,ISColoring *coloring)
11147c6ae99SBarry Smith {
11247c6ae99SBarry Smith   PetscErrorCode   ierr;
11347c6ae99SBarry Smith   PetscInt         dim,m,n,p,nc;
114bff4a2f0SMatthew G. Knepley   DMBoundaryType bx,by,bz;
11547c6ae99SBarry Smith   MPI_Comm         comm;
11647c6ae99SBarry Smith   PetscMPIInt      size;
11747c6ae99SBarry Smith   PetscBool        isBAIJ;
11847c6ae99SBarry Smith   DM_DA            *dd = (DM_DA*)da->data;
11947c6ae99SBarry Smith 
12047c6ae99SBarry Smith   PetscFunctionBegin;
12147c6ae99SBarry Smith   /*
12247c6ae99SBarry Smith                                   m
12347c6ae99SBarry Smith           ------------------------------------------------------
12447c6ae99SBarry Smith          |                                                     |
12547c6ae99SBarry Smith          |                                                     |
12647c6ae99SBarry Smith          |               ----------------------                |
12747c6ae99SBarry Smith          |               |                    |                |
12847c6ae99SBarry Smith       n  |           yn  |                    |                |
12947c6ae99SBarry Smith          |               |                    |                |
13047c6ae99SBarry Smith          |               .---------------------                |
13147c6ae99SBarry Smith          |             (xs,ys)     xn                          |
13247c6ae99SBarry Smith          |            .                                        |
13347c6ae99SBarry Smith          |         (gxs,gys)                                   |
13447c6ae99SBarry Smith          |                                                     |
13547c6ae99SBarry Smith           -----------------------------------------------------
13647c6ae99SBarry Smith   */
13747c6ae99SBarry Smith 
13847c6ae99SBarry Smith   /*
13947c6ae99SBarry Smith          nc - number of components per grid point
14047c6ae99SBarry Smith          col - number of colors needed in one direction for single component problem
14147c6ae99SBarry Smith 
14247c6ae99SBarry Smith   */
1431321219cSEthan Coon   ierr = DMDAGetInfo(da,&dim,0,0,0,&m,&n,&p,&nc,0,&bx,&by,&bz,0);CHKERRQ(ierr);
14447c6ae99SBarry Smith 
14547c6ae99SBarry Smith   ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr);
14647c6ae99SBarry Smith   ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr);
1475bdb020cSBarry Smith   if (ctype == IS_COLORING_LOCAL) {
14847c6ae99SBarry Smith     if (size == 1) {
14947c6ae99SBarry Smith       ctype = IS_COLORING_GLOBAL;
15047c6ae99SBarry Smith     } else if (dim > 1) {
151bff4a2f0SMatthew G. Knepley       if ((m==1 && bx == DM_BOUNDARY_PERIODIC) || (n==1 && by == DM_BOUNDARY_PERIODIC) || (p==1 && bz == DM_BOUNDARY_PERIODIC)) {
1525bdb020cSBarry Smith         SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"IS_COLORING_LOCAL cannot be used for periodic boundary condition having both ends of the domain  on the same process");
15347c6ae99SBarry Smith       }
15447c6ae99SBarry Smith     }
15547c6ae99SBarry Smith   }
15647c6ae99SBarry Smith 
157aa219208SBarry Smith   /* Tell the DMDA it has 1 degree of freedom per grid point so that the coloring for BAIJ
15847c6ae99SBarry Smith      matrices is for the blocks, not the individual matrix elements  */
159b412c318SBarry Smith   ierr = PetscStrcmp(da->mattype,MATBAIJ,&isBAIJ);CHKERRQ(ierr);
160b412c318SBarry Smith   if (!isBAIJ) {ierr = PetscStrcmp(da->mattype,MATMPIBAIJ,&isBAIJ);CHKERRQ(ierr);}
161b412c318SBarry Smith   if (!isBAIJ) {ierr = PetscStrcmp(da->mattype,MATSEQBAIJ,&isBAIJ);CHKERRQ(ierr);}
16247c6ae99SBarry Smith   if (isBAIJ) {
16347c6ae99SBarry Smith     dd->w  = 1;
16447c6ae99SBarry Smith     dd->xs = dd->xs/nc;
16547c6ae99SBarry Smith     dd->xe = dd->xe/nc;
16647c6ae99SBarry Smith     dd->Xs = dd->Xs/nc;
16747c6ae99SBarry Smith     dd->Xe = dd->Xe/nc;
16847c6ae99SBarry Smith   }
16947c6ae99SBarry Smith 
17047c6ae99SBarry Smith   /*
171aa219208SBarry Smith      We do not provide a getcoloring function in the DMDA operations because
172aa219208SBarry Smith    the basic DMDA does not know about matrices. We think of DMDA as being more
17347c6ae99SBarry Smith    more low-level then matrices.
17447c6ae99SBarry Smith   */
17547c6ae99SBarry Smith   if (dim == 1) {
176e727c939SJed Brown     ierr = DMCreateColoring_DA_1d_MPIAIJ(da,ctype,coloring);CHKERRQ(ierr);
17747c6ae99SBarry Smith   } else if (dim == 2) {
178e727c939SJed Brown     ierr =  DMCreateColoring_DA_2d_MPIAIJ(da,ctype,coloring);CHKERRQ(ierr);
17947c6ae99SBarry Smith   } else if (dim == 3) {
180e727c939SJed Brown     ierr =  DMCreateColoring_DA_3d_MPIAIJ(da,ctype,coloring);CHKERRQ(ierr);
181ce94432eSBarry Smith   } else SETERRQ1(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"Not done for %D dimension, send us mail petsc-maint@mcs.anl.gov for code",dim);
18247c6ae99SBarry Smith   if (isBAIJ) {
18347c6ae99SBarry Smith     dd->w  = nc;
18447c6ae99SBarry Smith     dd->xs = dd->xs*nc;
18547c6ae99SBarry Smith     dd->xe = dd->xe*nc;
18647c6ae99SBarry Smith     dd->Xs = dd->Xs*nc;
18747c6ae99SBarry Smith     dd->Xe = dd->Xe*nc;
18847c6ae99SBarry Smith   }
18947c6ae99SBarry Smith   PetscFunctionReturn(0);
19047c6ae99SBarry Smith }
19147c6ae99SBarry Smith 
19247c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/
19347c6ae99SBarry Smith 
194e727c939SJed Brown PetscErrorCode DMCreateColoring_DA_2d_MPIAIJ(DM da,ISColoringType ctype,ISColoring *coloring)
19547c6ae99SBarry Smith {
19647c6ae99SBarry Smith   PetscErrorCode   ierr;
19747c6ae99SBarry Smith   PetscInt         xs,ys,nx,ny,i,j,ii,gxs,gys,gnx,gny,m,n,M,N,dim,s,k,nc,col;
19847c6ae99SBarry Smith   PetscInt         ncolors;
19947c6ae99SBarry Smith   MPI_Comm         comm;
200bff4a2f0SMatthew G. Knepley   DMBoundaryType bx,by;
201aa219208SBarry Smith   DMDAStencilType  st;
20247c6ae99SBarry Smith   ISColoringValue  *colors;
20347c6ae99SBarry Smith   DM_DA            *dd = (DM_DA*)da->data;
20447c6ae99SBarry Smith 
20547c6ae99SBarry Smith   PetscFunctionBegin;
20647c6ae99SBarry Smith   /*
20747c6ae99SBarry Smith          nc - number of components per grid point
20847c6ae99SBarry Smith          col - number of colors needed in one direction for single component problem
20947c6ae99SBarry Smith 
21047c6ae99SBarry Smith   */
2111321219cSEthan Coon   ierr = DMDAGetInfo(da,&dim,&m,&n,0,&M,&N,0,&nc,&s,&bx,&by,0,&st);CHKERRQ(ierr);
21247c6ae99SBarry Smith   col  = 2*s + 1;
213aa219208SBarry Smith   ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr);
214aa219208SBarry Smith   ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr);
21547c6ae99SBarry Smith   ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr);
21647c6ae99SBarry Smith 
21747c6ae99SBarry Smith   /* special case as taught to us by Paul Hovland */
218aa219208SBarry Smith   if (st == DMDA_STENCIL_STAR && s == 1) {
219e727c939SJed Brown     ierr = DMCreateColoring_DA_2d_5pt_MPIAIJ(da,ctype,coloring);CHKERRQ(ierr);
22047c6ae99SBarry Smith   } else {
22147c6ae99SBarry Smith 
222bff4a2f0SMatthew G. Knepley     if (bx == DM_BOUNDARY_PERIODIC && (m % col)) SETERRQ2(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in X (%d) is divisible\n\
22347c6ae99SBarry Smith                                                             by 2*stencil_width + 1 (%d)\n", m, col);
224bff4a2f0SMatthew G. Knepley     if (by == DM_BOUNDARY_PERIODIC && (n % col)) SETERRQ2(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Y (%d) is divisible\n\
22547c6ae99SBarry Smith                                                             by 2*stencil_width + 1 (%d)\n", n, col);
22647c6ae99SBarry Smith     if (ctype == IS_COLORING_GLOBAL) {
22747c6ae99SBarry Smith       if (!dd->localcoloring) {
228785e854fSJed Brown         ierr = PetscMalloc1(nc*nx*ny,&colors);CHKERRQ(ierr);
22947c6ae99SBarry Smith         ii   = 0;
23047c6ae99SBarry Smith         for (j=ys; j<ys+ny; j++) {
23147c6ae99SBarry Smith           for (i=xs; i<xs+nx; i++) {
23247c6ae99SBarry Smith             for (k=0; k<nc; k++) {
23347c6ae99SBarry Smith               colors[ii++] = k + nc*((i % col) + col*(j % col));
23447c6ae99SBarry Smith             }
23547c6ae99SBarry Smith           }
23647c6ae99SBarry Smith         }
23747c6ae99SBarry Smith         ncolors = nc + nc*(col-1 + col*(col-1));
238aaf3ff59SMatthew G. Knepley         ierr    = ISColoringCreate(comm,ncolors,nc*nx*ny,colors,PETSC_OWN_POINTER,&dd->localcoloring);CHKERRQ(ierr);
23947c6ae99SBarry Smith       }
24047c6ae99SBarry Smith       *coloring = dd->localcoloring;
2415bdb020cSBarry Smith     } else if (ctype == IS_COLORING_LOCAL) {
24247c6ae99SBarry Smith       if (!dd->ghostedcoloring) {
243785e854fSJed Brown         ierr = PetscMalloc1(nc*gnx*gny,&colors);CHKERRQ(ierr);
24447c6ae99SBarry Smith         ii   = 0;
24547c6ae99SBarry Smith         for (j=gys; j<gys+gny; j++) {
24647c6ae99SBarry Smith           for (i=gxs; i<gxs+gnx; i++) {
24747c6ae99SBarry Smith             for (k=0; k<nc; k++) {
24847c6ae99SBarry Smith               /* the complicated stuff is to handle periodic boundaries */
24947c6ae99SBarry Smith               colors[ii++] = k + nc*((SetInRange(i,m) % col) + col*(SetInRange(j,n) % col));
25047c6ae99SBarry Smith             }
25147c6ae99SBarry Smith           }
25247c6ae99SBarry Smith         }
25347c6ae99SBarry Smith         ncolors = nc + nc*(col - 1 + col*(col-1));
254aaf3ff59SMatthew G. Knepley         ierr    = ISColoringCreate(comm,ncolors,nc*gnx*gny,colors,PETSC_OWN_POINTER,&dd->ghostedcoloring);CHKERRQ(ierr);
25547c6ae99SBarry Smith         /* PetscIntView(ncolors,(PetscInt*)colors,0); */
25647c6ae99SBarry Smith 
2575bdb020cSBarry Smith         ierr = ISColoringSetType(dd->ghostedcoloring,IS_COLORING_LOCAL);CHKERRQ(ierr);
25847c6ae99SBarry Smith       }
25947c6ae99SBarry Smith       *coloring = dd->ghostedcoloring;
260ce94432eSBarry Smith     } else SETERRQ1(PetscObjectComm((PetscObject)da),PETSC_ERR_ARG_WRONG,"Unknown ISColoringType %d",(int)ctype);
26147c6ae99SBarry Smith   }
26247c6ae99SBarry Smith   ierr = ISColoringReference(*coloring);CHKERRQ(ierr);
26347c6ae99SBarry Smith   PetscFunctionReturn(0);
26447c6ae99SBarry Smith }
26547c6ae99SBarry Smith 
26647c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/
26747c6ae99SBarry Smith 
268e727c939SJed Brown PetscErrorCode DMCreateColoring_DA_3d_MPIAIJ(DM da,ISColoringType ctype,ISColoring *coloring)
26947c6ae99SBarry Smith {
27047c6ae99SBarry Smith   PetscErrorCode   ierr;
27147c6ae99SBarry Smith   PetscInt         xs,ys,nx,ny,i,j,gxs,gys,gnx,gny,m,n,p,dim,s,k,nc,col,zs,gzs,ii,l,nz,gnz,M,N,P;
27247c6ae99SBarry Smith   PetscInt         ncolors;
27347c6ae99SBarry Smith   MPI_Comm         comm;
274bff4a2f0SMatthew G. Knepley   DMBoundaryType bx,by,bz;
275aa219208SBarry Smith   DMDAStencilType  st;
27647c6ae99SBarry Smith   ISColoringValue  *colors;
27747c6ae99SBarry Smith   DM_DA            *dd = (DM_DA*)da->data;
27847c6ae99SBarry Smith 
27947c6ae99SBarry Smith   PetscFunctionBegin;
28047c6ae99SBarry Smith   /*
28147c6ae99SBarry Smith          nc - number of components per grid point
28247c6ae99SBarry Smith          col - number of colors needed in one direction for single component problem
28347c6ae99SBarry Smith 
28447c6ae99SBarry Smith   */
2851321219cSEthan Coon   ierr = DMDAGetInfo(da,&dim,&m,&n,&p,&M,&N,&P,&nc,&s,&bx,&by,&bz,&st);CHKERRQ(ierr);
28647c6ae99SBarry Smith   col  = 2*s + 1;
287bff4a2f0SMatthew G. Knepley   if (bx == DM_BOUNDARY_PERIODIC && (m % col)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in X is divisible\n\
28847c6ae99SBarry Smith                                                          by 2*stencil_width + 1\n");
289bff4a2f0SMatthew G. Knepley   if (by == DM_BOUNDARY_PERIODIC && (n % col)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Y is divisible\n\
29047c6ae99SBarry Smith                                                          by 2*stencil_width + 1\n");
291bff4a2f0SMatthew G. Knepley   if (bz == DM_BOUNDARY_PERIODIC && (p % col)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Z is divisible\n\
29247c6ae99SBarry Smith                                                          by 2*stencil_width + 1\n");
29347c6ae99SBarry Smith 
294aa219208SBarry Smith   ierr = DMDAGetCorners(da,&xs,&ys,&zs,&nx,&ny,&nz);CHKERRQ(ierr);
295aa219208SBarry Smith   ierr = DMDAGetGhostCorners(da,&gxs,&gys,&gzs,&gnx,&gny,&gnz);CHKERRQ(ierr);
29647c6ae99SBarry Smith   ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr);
29747c6ae99SBarry Smith 
29847c6ae99SBarry Smith   /* create the coloring */
29947c6ae99SBarry Smith   if (ctype == IS_COLORING_GLOBAL) {
30047c6ae99SBarry Smith     if (!dd->localcoloring) {
301785e854fSJed Brown       ierr = PetscMalloc1(nc*nx*ny*nz,&colors);CHKERRQ(ierr);
30247c6ae99SBarry Smith       ii   = 0;
30347c6ae99SBarry Smith       for (k=zs; k<zs+nz; k++) {
30447c6ae99SBarry Smith         for (j=ys; j<ys+ny; j++) {
30547c6ae99SBarry Smith           for (i=xs; i<xs+nx; i++) {
30647c6ae99SBarry Smith             for (l=0; l<nc; l++) {
30747c6ae99SBarry Smith               colors[ii++] = l + nc*((i % col) + col*(j % col) + col*col*(k % col));
30847c6ae99SBarry Smith             }
30947c6ae99SBarry Smith           }
31047c6ae99SBarry Smith         }
31147c6ae99SBarry Smith       }
31247c6ae99SBarry Smith       ncolors = nc + nc*(col-1 + col*(col-1)+ col*col*(col-1));
313aaf3ff59SMatthew G. Knepley       ierr    = ISColoringCreate(comm,ncolors,nc*nx*ny*nz,colors,PETSC_OWN_POINTER,&dd->localcoloring);CHKERRQ(ierr);
31447c6ae99SBarry Smith     }
31547c6ae99SBarry Smith     *coloring = dd->localcoloring;
3165bdb020cSBarry Smith   } else if (ctype == IS_COLORING_LOCAL) {
31747c6ae99SBarry Smith     if (!dd->ghostedcoloring) {
318785e854fSJed Brown       ierr = PetscMalloc1(nc*gnx*gny*gnz,&colors);CHKERRQ(ierr);
31947c6ae99SBarry Smith       ii   = 0;
32047c6ae99SBarry Smith       for (k=gzs; k<gzs+gnz; k++) {
32147c6ae99SBarry Smith         for (j=gys; j<gys+gny; j++) {
32247c6ae99SBarry Smith           for (i=gxs; i<gxs+gnx; i++) {
32347c6ae99SBarry Smith             for (l=0; l<nc; l++) {
32447c6ae99SBarry Smith               /* the complicated stuff is to handle periodic boundaries */
32547c6ae99SBarry Smith               colors[ii++] = l + nc*((SetInRange(i,m) % col) + col*(SetInRange(j,n) % col) + col*col*(SetInRange(k,p) % col));
32647c6ae99SBarry Smith             }
32747c6ae99SBarry Smith           }
32847c6ae99SBarry Smith         }
32947c6ae99SBarry Smith       }
33047c6ae99SBarry Smith       ncolors = nc + nc*(col-1 + col*(col-1)+ col*col*(col-1));
331aaf3ff59SMatthew G. Knepley       ierr    = ISColoringCreate(comm,ncolors,nc*gnx*gny*gnz,colors,PETSC_OWN_POINTER,&dd->ghostedcoloring);CHKERRQ(ierr);
3325bdb020cSBarry Smith       ierr    = ISColoringSetType(dd->ghostedcoloring,IS_COLORING_LOCAL);CHKERRQ(ierr);
33347c6ae99SBarry Smith     }
33447c6ae99SBarry Smith     *coloring = dd->ghostedcoloring;
335ce94432eSBarry Smith   } else SETERRQ1(PetscObjectComm((PetscObject)da),PETSC_ERR_ARG_WRONG,"Unknown ISColoringType %d",(int)ctype);
33647c6ae99SBarry Smith   ierr = ISColoringReference(*coloring);CHKERRQ(ierr);
33747c6ae99SBarry Smith   PetscFunctionReturn(0);
33847c6ae99SBarry Smith }
33947c6ae99SBarry Smith 
34047c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/
34147c6ae99SBarry Smith 
342e727c939SJed Brown PetscErrorCode DMCreateColoring_DA_1d_MPIAIJ(DM da,ISColoringType ctype,ISColoring *coloring)
34347c6ae99SBarry Smith {
34447c6ae99SBarry Smith   PetscErrorCode   ierr;
34547c6ae99SBarry Smith   PetscInt         xs,nx,i,i1,gxs,gnx,l,m,M,dim,s,nc,col;
34647c6ae99SBarry Smith   PetscInt         ncolors;
34747c6ae99SBarry Smith   MPI_Comm         comm;
348bff4a2f0SMatthew G. Knepley   DMBoundaryType bx;
34947c6ae99SBarry Smith   ISColoringValue  *colors;
35047c6ae99SBarry Smith   DM_DA            *dd = (DM_DA*)da->data;
35147c6ae99SBarry Smith 
35247c6ae99SBarry Smith   PetscFunctionBegin;
35347c6ae99SBarry Smith   /*
35447c6ae99SBarry Smith          nc - number of components per grid point
35547c6ae99SBarry Smith          col - number of colors needed in one direction for single component problem
35647c6ae99SBarry Smith 
35747c6ae99SBarry Smith   */
3581321219cSEthan Coon   ierr = DMDAGetInfo(da,&dim,&m,0,0,&M,0,0,&nc,&s,&bx,0,0,0);CHKERRQ(ierr);
35947c6ae99SBarry Smith   col  = 2*s + 1;
36047c6ae99SBarry Smith 
361bff4a2f0SMatthew G. Knepley   if (bx == DM_BOUNDARY_PERIODIC && (m % col)) SETERRQ2(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points %d is divisible\n\
36231e6f798SBarry Smith                                                           by 2*stencil_width + 1 %d\n",(int)m,(int)col);
36347c6ae99SBarry Smith 
364aa219208SBarry Smith   ierr = DMDAGetCorners(da,&xs,0,0,&nx,0,0);CHKERRQ(ierr);
365aa219208SBarry Smith   ierr = DMDAGetGhostCorners(da,&gxs,0,0,&gnx,0,0);CHKERRQ(ierr);
36647c6ae99SBarry Smith   ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr);
36747c6ae99SBarry Smith 
36847c6ae99SBarry Smith   /* create the coloring */
36947c6ae99SBarry Smith   if (ctype == IS_COLORING_GLOBAL) {
37047c6ae99SBarry Smith     if (!dd->localcoloring) {
371785e854fSJed Brown       ierr = PetscMalloc1(nc*nx,&colors);CHKERRQ(ierr);
372ae4f298aSBarry Smith       if (dd->ofillcols) {
373ae4f298aSBarry Smith         PetscInt tc = 0;
374ae4f298aSBarry Smith         for (i=0; i<nc; i++) tc += (PetscInt) (dd->ofillcols[i] > 0);
375ae4f298aSBarry Smith         i1 = 0;
376ae4f298aSBarry Smith         for (i=xs; i<xs+nx; i++) {
377ae4f298aSBarry Smith           for (l=0; l<nc; l++) {
378ae4f298aSBarry Smith             if (dd->ofillcols[l] && (i % col)) {
379ae4f298aSBarry Smith               colors[i1++] =  nc - 1 + tc*((i % col) - 1) + dd->ofillcols[l];
380ae4f298aSBarry Smith             } else {
381ae4f298aSBarry Smith               colors[i1++] = l;
382ae4f298aSBarry Smith             }
383ae4f298aSBarry Smith           }
384ae4f298aSBarry Smith         }
385ae4f298aSBarry Smith         ncolors = nc + 2*s*tc;
386ae4f298aSBarry Smith       } else {
38747c6ae99SBarry Smith         i1 = 0;
38847c6ae99SBarry Smith         for (i=xs; i<xs+nx; i++) {
38947c6ae99SBarry Smith           for (l=0; l<nc; l++) {
39047c6ae99SBarry Smith             colors[i1++] = l + nc*(i % col);
39147c6ae99SBarry Smith           }
39247c6ae99SBarry Smith         }
39347c6ae99SBarry Smith         ncolors = nc + nc*(col-1);
394ae4f298aSBarry Smith       }
395aaf3ff59SMatthew G. Knepley       ierr = ISColoringCreate(comm,ncolors,nc*nx,colors,PETSC_OWN_POINTER,&dd->localcoloring);CHKERRQ(ierr);
39647c6ae99SBarry Smith     }
39747c6ae99SBarry Smith     *coloring = dd->localcoloring;
3985bdb020cSBarry Smith   } else if (ctype == IS_COLORING_LOCAL) {
39947c6ae99SBarry Smith     if (!dd->ghostedcoloring) {
400785e854fSJed Brown       ierr = PetscMalloc1(nc*gnx,&colors);CHKERRQ(ierr);
40147c6ae99SBarry Smith       i1   = 0;
40247c6ae99SBarry Smith       for (i=gxs; i<gxs+gnx; i++) {
40347c6ae99SBarry Smith         for (l=0; l<nc; l++) {
40447c6ae99SBarry Smith           /* the complicated stuff is to handle periodic boundaries */
40547c6ae99SBarry Smith           colors[i1++] = l + nc*(SetInRange(i,m) % col);
40647c6ae99SBarry Smith         }
40747c6ae99SBarry Smith       }
40847c6ae99SBarry Smith       ncolors = nc + nc*(col-1);
409aaf3ff59SMatthew G. Knepley       ierr    = ISColoringCreate(comm,ncolors,nc*gnx,colors,PETSC_OWN_POINTER,&dd->ghostedcoloring);CHKERRQ(ierr);
4105bdb020cSBarry Smith       ierr    = ISColoringSetType(dd->ghostedcoloring,IS_COLORING_LOCAL);CHKERRQ(ierr);
41147c6ae99SBarry Smith     }
41247c6ae99SBarry Smith     *coloring = dd->ghostedcoloring;
413ce94432eSBarry Smith   } else SETERRQ1(PetscObjectComm((PetscObject)da),PETSC_ERR_ARG_WRONG,"Unknown ISColoringType %d",(int)ctype);
41447c6ae99SBarry Smith   ierr = ISColoringReference(*coloring);CHKERRQ(ierr);
41547c6ae99SBarry Smith   PetscFunctionReturn(0);
41647c6ae99SBarry Smith }
41747c6ae99SBarry Smith 
418e727c939SJed Brown PetscErrorCode DMCreateColoring_DA_2d_5pt_MPIAIJ(DM da,ISColoringType ctype,ISColoring *coloring)
41947c6ae99SBarry Smith {
42047c6ae99SBarry Smith   PetscErrorCode   ierr;
42147c6ae99SBarry Smith   PetscInt         xs,ys,nx,ny,i,j,ii,gxs,gys,gnx,gny,m,n,dim,s,k,nc;
42247c6ae99SBarry Smith   PetscInt         ncolors;
42347c6ae99SBarry Smith   MPI_Comm         comm;
424bff4a2f0SMatthew G. Knepley   DMBoundaryType bx,by;
42547c6ae99SBarry Smith   ISColoringValue  *colors;
42647c6ae99SBarry Smith   DM_DA            *dd = (DM_DA*)da->data;
42747c6ae99SBarry Smith 
42847c6ae99SBarry Smith   PetscFunctionBegin;
42947c6ae99SBarry Smith   /*
43047c6ae99SBarry Smith          nc - number of components per grid point
43147c6ae99SBarry Smith          col - number of colors needed in one direction for single component problem
43247c6ae99SBarry Smith 
43347c6ae99SBarry Smith   */
4341321219cSEthan Coon   ierr = DMDAGetInfo(da,&dim,&m,&n,0,0,0,0,&nc,&s,&bx,&by,0,0);CHKERRQ(ierr);
435aa219208SBarry Smith   ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr);
436aa219208SBarry Smith   ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr);
43747c6ae99SBarry Smith   ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr);
43847c6ae99SBarry Smith 
439bff4a2f0SMatthew G. Knepley   if (bx == DM_BOUNDARY_PERIODIC && (m % 5)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in X is divisible by 5\n");
440bff4a2f0SMatthew G. Knepley   if (by == DM_BOUNDARY_PERIODIC && (n % 5)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Y is divisible by 5\n");
44147c6ae99SBarry Smith 
44247c6ae99SBarry Smith   /* create the coloring */
44347c6ae99SBarry Smith   if (ctype == IS_COLORING_GLOBAL) {
44447c6ae99SBarry Smith     if (!dd->localcoloring) {
445785e854fSJed Brown       ierr = PetscMalloc1(nc*nx*ny,&colors);CHKERRQ(ierr);
44647c6ae99SBarry Smith       ii   = 0;
44747c6ae99SBarry Smith       for (j=ys; j<ys+ny; j++) {
44847c6ae99SBarry Smith         for (i=xs; i<xs+nx; i++) {
44947c6ae99SBarry Smith           for (k=0; k<nc; k++) {
45047c6ae99SBarry Smith             colors[ii++] = k + nc*((3*j+i) % 5);
45147c6ae99SBarry Smith           }
45247c6ae99SBarry Smith         }
45347c6ae99SBarry Smith       }
45447c6ae99SBarry Smith       ncolors = 5*nc;
455aaf3ff59SMatthew G. Knepley       ierr    = ISColoringCreate(comm,ncolors,nc*nx*ny,colors,PETSC_OWN_POINTER,&dd->localcoloring);CHKERRQ(ierr);
45647c6ae99SBarry Smith     }
45747c6ae99SBarry Smith     *coloring = dd->localcoloring;
4585bdb020cSBarry Smith   } else if (ctype == IS_COLORING_LOCAL) {
45947c6ae99SBarry Smith     if (!dd->ghostedcoloring) {
460785e854fSJed Brown       ierr = PetscMalloc1(nc*gnx*gny,&colors);CHKERRQ(ierr);
46147c6ae99SBarry Smith       ii = 0;
46247c6ae99SBarry Smith       for (j=gys; j<gys+gny; j++) {
46347c6ae99SBarry Smith         for (i=gxs; i<gxs+gnx; i++) {
46447c6ae99SBarry Smith           for (k=0; k<nc; k++) {
46547c6ae99SBarry Smith             colors[ii++] = k + nc*((3*SetInRange(j,n) + SetInRange(i,m)) % 5);
46647c6ae99SBarry Smith           }
46747c6ae99SBarry Smith         }
46847c6ae99SBarry Smith       }
46947c6ae99SBarry Smith       ncolors = 5*nc;
470aaf3ff59SMatthew G. Knepley       ierr    = ISColoringCreate(comm,ncolors,nc*gnx*gny,colors,PETSC_OWN_POINTER,&dd->ghostedcoloring);CHKERRQ(ierr);
4715bdb020cSBarry Smith       ierr    = ISColoringSetType(dd->ghostedcoloring,IS_COLORING_LOCAL);CHKERRQ(ierr);
47247c6ae99SBarry Smith     }
47347c6ae99SBarry Smith     *coloring = dd->ghostedcoloring;
474ce94432eSBarry Smith   } else SETERRQ1(PetscObjectComm((PetscObject)da),PETSC_ERR_ARG_WRONG,"Unknown ISColoringType %d",(int)ctype);
47547c6ae99SBarry Smith   PetscFunctionReturn(0);
47647c6ae99SBarry Smith }
47747c6ae99SBarry Smith 
47847c6ae99SBarry Smith /* =========================================================================== */
479950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_1d_MPIAIJ(DM,Mat);
480ce308e1dSBarry Smith extern PetscErrorCode DMCreateMatrix_DA_1d_MPIAIJ_Fill(DM,Mat);
481950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_2d_MPIAIJ(DM,Mat);
482950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_2d_MPIAIJ_Fill(DM,Mat);
483950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_3d_MPIAIJ(DM,Mat);
484950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_3d_MPIAIJ_Fill(DM,Mat);
485950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_2d_MPIBAIJ(DM,Mat);
486950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_3d_MPIBAIJ(DM,Mat);
487950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_2d_MPISBAIJ(DM,Mat);
488950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_3d_MPISBAIJ(DM,Mat);
489*5e26d47bSHong Zhang extern PetscErrorCode DMCreateMatrix_DA_2d_MPIELL(DM,Mat);
49047c6ae99SBarry Smith 
4918bbdbebaSMatthew G Knepley /*@C
492c688c046SMatthew G Knepley    MatSetupDM - Sets the DMDA that is to be used by the HYPRE_StructMatrix PETSc matrix
49347c6ae99SBarry Smith 
49447c6ae99SBarry Smith    Logically Collective on Mat
49547c6ae99SBarry Smith 
49647c6ae99SBarry Smith    Input Parameters:
49747c6ae99SBarry Smith +  mat - the matrix
49847c6ae99SBarry Smith -  da - the da
49947c6ae99SBarry Smith 
50047c6ae99SBarry Smith    Level: intermediate
50147c6ae99SBarry Smith 
50247c6ae99SBarry Smith @*/
503c688c046SMatthew G Knepley PetscErrorCode MatSetupDM(Mat mat,DM da)
50447c6ae99SBarry Smith {
50547c6ae99SBarry Smith   PetscErrorCode ierr;
50647c6ae99SBarry Smith 
50747c6ae99SBarry Smith   PetscFunctionBegin;
50847c6ae99SBarry Smith   PetscValidHeaderSpecific(mat,MAT_CLASSID,1);
50947c6ae99SBarry Smith   PetscValidHeaderSpecific(da,DM_CLASSID,1);
510c688c046SMatthew G Knepley   ierr = PetscTryMethod(mat,"MatSetupDM_C",(Mat,DM),(mat,da));CHKERRQ(ierr);
51147c6ae99SBarry Smith   PetscFunctionReturn(0);
51247c6ae99SBarry Smith }
51347c6ae99SBarry Smith 
5147087cfbeSBarry Smith PetscErrorCode  MatView_MPI_DA(Mat A,PetscViewer viewer)
51547c6ae99SBarry Smith {
5169a42bb27SBarry Smith   DM                da;
51747c6ae99SBarry Smith   PetscErrorCode    ierr;
51847c6ae99SBarry Smith   const char        *prefix;
51947c6ae99SBarry Smith   Mat               Anatural;
52047c6ae99SBarry Smith   AO                ao;
52147c6ae99SBarry Smith   PetscInt          rstart,rend,*petsc,i;
52247c6ae99SBarry Smith   IS                is;
52347c6ae99SBarry Smith   MPI_Comm          comm;
52474388724SJed Brown   PetscViewerFormat format;
52547c6ae99SBarry Smith 
52647c6ae99SBarry Smith   PetscFunctionBegin;
52774388724SJed Brown   /* Check whether we are just printing info, in which case MatView() already viewed everything we wanted to view */
52874388724SJed Brown   ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr);
52974388724SJed Brown   if (format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(0);
53074388724SJed Brown 
53147c6ae99SBarry Smith   ierr = PetscObjectGetComm((PetscObject)A,&comm);CHKERRQ(ierr);
532c688c046SMatthew G Knepley   ierr = MatGetDM(A, &da);CHKERRQ(ierr);
533ce94432eSBarry Smith   if (!da) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Matrix not generated from a DMDA");
53447c6ae99SBarry Smith 
535aa219208SBarry Smith   ierr = DMDAGetAO(da,&ao);CHKERRQ(ierr);
53647c6ae99SBarry Smith   ierr = MatGetOwnershipRange(A,&rstart,&rend);CHKERRQ(ierr);
537854ce69bSBarry Smith   ierr = PetscMalloc1(rend-rstart,&petsc);CHKERRQ(ierr);
53847c6ae99SBarry Smith   for (i=rstart; i<rend; i++) petsc[i-rstart] = i;
53947c6ae99SBarry Smith   ierr = AOApplicationToPetsc(ao,rend-rstart,petsc);CHKERRQ(ierr);
54047c6ae99SBarry Smith   ierr = ISCreateGeneral(comm,rend-rstart,petsc,PETSC_OWN_POINTER,&is);CHKERRQ(ierr);
54147c6ae99SBarry Smith 
54247c6ae99SBarry Smith   /* call viewer on natural ordering */
5437dae84e0SHong Zhang   ierr = MatCreateSubMatrix(A,is,is,MAT_INITIAL_MATRIX,&Anatural);CHKERRQ(ierr);
544fcfd50ebSBarry Smith   ierr = ISDestroy(&is);CHKERRQ(ierr);
54547c6ae99SBarry Smith   ierr = PetscObjectGetOptionsPrefix((PetscObject)A,&prefix);CHKERRQ(ierr);
54647c6ae99SBarry Smith   ierr = PetscObjectSetOptionsPrefix((PetscObject)Anatural,prefix);CHKERRQ(ierr);
54747c6ae99SBarry Smith   ierr = PetscObjectSetName((PetscObject)Anatural,((PetscObject)A)->name);CHKERRQ(ierr);
548539c167fSBarry Smith   ierr = MatView(Anatural,viewer);CHKERRQ(ierr);
549fcfd50ebSBarry Smith   ierr = MatDestroy(&Anatural);CHKERRQ(ierr);
55047c6ae99SBarry Smith   PetscFunctionReturn(0);
55147c6ae99SBarry Smith }
55247c6ae99SBarry Smith 
5537087cfbeSBarry Smith PetscErrorCode  MatLoad_MPI_DA(Mat A,PetscViewer viewer)
55447c6ae99SBarry Smith {
5559a42bb27SBarry Smith   DM             da;
55647c6ae99SBarry Smith   PetscErrorCode ierr;
55747c6ae99SBarry Smith   Mat            Anatural,Aapp;
55847c6ae99SBarry Smith   AO             ao;
559539c167fSBarry Smith   PetscInt       rstart,rend,*app,i,m,n,M,N;
56047c6ae99SBarry Smith   IS             is;
56147c6ae99SBarry Smith   MPI_Comm       comm;
56247c6ae99SBarry Smith 
56347c6ae99SBarry Smith   PetscFunctionBegin;
56447c6ae99SBarry Smith   ierr = PetscObjectGetComm((PetscObject)A,&comm);CHKERRQ(ierr);
565c688c046SMatthew G Knepley   ierr = MatGetDM(A, &da);CHKERRQ(ierr);
566ce94432eSBarry Smith   if (!da) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Matrix not generated from a DMDA");
56747c6ae99SBarry Smith 
56847c6ae99SBarry Smith   /* Load the matrix in natural ordering */
569ce94432eSBarry Smith   ierr = MatCreate(PetscObjectComm((PetscObject)A),&Anatural);CHKERRQ(ierr);
57047c6ae99SBarry Smith   ierr = MatSetType(Anatural,((PetscObject)A)->type_name);CHKERRQ(ierr);
571539c167fSBarry Smith   ierr = MatGetSize(A,&M,&N);CHKERRQ(ierr);
572539c167fSBarry Smith   ierr = MatGetLocalSize(A,&m,&n);CHKERRQ(ierr);
573539c167fSBarry Smith   ierr = MatSetSizes(Anatural,m,n,M,N);CHKERRQ(ierr);
57447c6ae99SBarry Smith   ierr = MatLoad(Anatural,viewer);CHKERRQ(ierr);
57547c6ae99SBarry Smith 
57647c6ae99SBarry Smith   /* Map natural ordering to application ordering and create IS */
577aa219208SBarry Smith   ierr = DMDAGetAO(da,&ao);CHKERRQ(ierr);
57847c6ae99SBarry Smith   ierr = MatGetOwnershipRange(Anatural,&rstart,&rend);CHKERRQ(ierr);
579854ce69bSBarry Smith   ierr = PetscMalloc1(rend-rstart,&app);CHKERRQ(ierr);
58047c6ae99SBarry Smith   for (i=rstart; i<rend; i++) app[i-rstart] = i;
58147c6ae99SBarry Smith   ierr = AOPetscToApplication(ao,rend-rstart,app);CHKERRQ(ierr);
58247c6ae99SBarry Smith   ierr = ISCreateGeneral(comm,rend-rstart,app,PETSC_OWN_POINTER,&is);CHKERRQ(ierr);
58347c6ae99SBarry Smith 
58447c6ae99SBarry Smith   /* Do permutation and replace header */
5857dae84e0SHong Zhang   ierr = MatCreateSubMatrix(Anatural,is,is,MAT_INITIAL_MATRIX,&Aapp);CHKERRQ(ierr);
58628be2f97SBarry Smith   ierr = MatHeaderReplace(A,&Aapp);CHKERRQ(ierr);
587fcfd50ebSBarry Smith   ierr = ISDestroy(&is);CHKERRQ(ierr);
588fcfd50ebSBarry Smith   ierr = MatDestroy(&Anatural);CHKERRQ(ierr);
58947c6ae99SBarry Smith   PetscFunctionReturn(0);
59047c6ae99SBarry Smith }
59147c6ae99SBarry Smith 
592b412c318SBarry Smith PetscErrorCode DMCreateMatrix_DA(DM da, Mat *J)
59347c6ae99SBarry Smith {
59447c6ae99SBarry Smith   PetscErrorCode ierr;
59547c6ae99SBarry Smith   PetscInt       dim,dof,nx,ny,nz,dims[3],starts[3],M,N,P;
59647c6ae99SBarry Smith   Mat            A;
59747c6ae99SBarry Smith   MPI_Comm       comm;
59819fd82e9SBarry Smith   MatType        Atype;
59937d0c07bSMatthew G Knepley   PetscSection   section, sectionGlobal;
600*5e26d47bSHong Zhang   void           (*aij)(void)=NULL,(*baij)(void)=NULL,(*sbaij)(void)=NULL,(*ell)(void)=NULL;
601b412c318SBarry Smith   MatType        mtype;
60247c6ae99SBarry Smith   PetscMPIInt    size;
60347c6ae99SBarry Smith   DM_DA          *dd = (DM_DA*)da->data;
60447c6ae99SBarry Smith 
60547c6ae99SBarry Smith   PetscFunctionBegin;
606607a6623SBarry Smith   ierr = MatInitializePackage();CHKERRQ(ierr);
607b412c318SBarry Smith   mtype = da->mattype;
60847c6ae99SBarry Smith 
60937d0c07bSMatthew G Knepley   ierr = DMGetDefaultSection(da, &section);CHKERRQ(ierr);
61037d0c07bSMatthew G Knepley   if (section) {
61137d0c07bSMatthew G Knepley     PetscInt  bs = -1;
61237d0c07bSMatthew G Knepley     PetscInt  localSize;
61337d0c07bSMatthew G Knepley     PetscBool isShell, isBlock, isSeqBlock, isMPIBlock, isSymBlock, isSymSeqBlock, isSymMPIBlock, isSymmetric;
61437d0c07bSMatthew G Knepley 
61537d0c07bSMatthew G Knepley     ierr = DMGetDefaultGlobalSection(da, &sectionGlobal);CHKERRQ(ierr);
61637d0c07bSMatthew G Knepley     ierr = PetscSectionGetConstrainedStorageSize(sectionGlobal, &localSize);CHKERRQ(ierr);
617b5579763SJed Brown     ierr = MatCreate(PetscObjectComm((PetscObject)da),&A);CHKERRQ(ierr);
618b5579763SJed Brown     ierr = MatSetSizes(A,localSize,localSize,PETSC_DETERMINE,PETSC_DETERMINE);CHKERRQ(ierr);
619b5579763SJed Brown     ierr = MatSetType(A,mtype);CHKERRQ(ierr);
62037d0c07bSMatthew G Knepley     ierr = PetscStrcmp(mtype,MATSHELL,&isShell);CHKERRQ(ierr);
62137d0c07bSMatthew G Knepley     ierr = PetscStrcmp(mtype,MATBAIJ,&isBlock);CHKERRQ(ierr);
62237d0c07bSMatthew G Knepley     ierr = PetscStrcmp(mtype,MATSEQBAIJ,&isSeqBlock);CHKERRQ(ierr);
62337d0c07bSMatthew G Knepley     ierr = PetscStrcmp(mtype,MATMPIBAIJ,&isMPIBlock);CHKERRQ(ierr);
62437d0c07bSMatthew G Knepley     ierr = PetscStrcmp(mtype,MATSBAIJ,&isSymBlock);CHKERRQ(ierr);
62537d0c07bSMatthew G Knepley     ierr = PetscStrcmp(mtype,MATSEQSBAIJ,&isSymSeqBlock);CHKERRQ(ierr);
62637d0c07bSMatthew G Knepley     ierr = PetscStrcmp(mtype,MATMPISBAIJ,&isSymMPIBlock);CHKERRQ(ierr);
62737d0c07bSMatthew G Knepley     /* Check for symmetric storage */
62837d0c07bSMatthew G Knepley     isSymmetric = (PetscBool) (isSymBlock || isSymSeqBlock || isSymMPIBlock);
62937d0c07bSMatthew G Knepley     if (isSymmetric) {
63037d0c07bSMatthew G Knepley       ierr = MatSetOption(*J, MAT_IGNORE_LOWER_TRIANGULAR, PETSC_TRUE);CHKERRQ(ierr);
63137d0c07bSMatthew G Knepley     }
63237d0c07bSMatthew G Knepley     if (!isShell) {
63337d0c07bSMatthew G Knepley       PetscInt *dnz, *onz, *dnzu, *onzu, bsLocal;
63437d0c07bSMatthew G Knepley 
63537d0c07bSMatthew G Knepley       if (bs < 0) {
63637d0c07bSMatthew G Knepley         if (isBlock || isSeqBlock || isMPIBlock || isSymBlock || isSymSeqBlock || isSymMPIBlock) {
63737d0c07bSMatthew G Knepley           PetscInt pStart, pEnd, p, dof;
63837d0c07bSMatthew G Knepley 
63937d0c07bSMatthew G Knepley           ierr = PetscSectionGetChart(sectionGlobal, &pStart, &pEnd);CHKERRQ(ierr);
64037d0c07bSMatthew G Knepley           for (p = pStart; p < pEnd; ++p) {
64137d0c07bSMatthew G Knepley             ierr = PetscSectionGetDof(sectionGlobal, p, &dof);CHKERRQ(ierr);
64237d0c07bSMatthew G Knepley             if (dof) {
64337d0c07bSMatthew G Knepley               bs = dof;
64437d0c07bSMatthew G Knepley               break;
64537d0c07bSMatthew G Knepley             }
64637d0c07bSMatthew G Knepley           }
64737d0c07bSMatthew G Knepley         } else {
64837d0c07bSMatthew G Knepley           bs = 1;
64937d0c07bSMatthew G Knepley         }
65037d0c07bSMatthew G Knepley         /* Must have same blocksize on all procs (some might have no points) */
65137d0c07bSMatthew G Knepley         bsLocal = bs;
652b2566f29SBarry Smith         ierr    = MPIU_Allreduce(&bsLocal, &bs, 1, MPIU_INT, MPI_MAX, PetscObjectComm((PetscObject)da));CHKERRQ(ierr);
65337d0c07bSMatthew G Knepley       }
6541795a4d1SJed Brown       ierr = PetscCalloc4(localSize/bs, &dnz, localSize/bs, &onz, localSize/bs, &dnzu, localSize/bs, &onzu);CHKERRQ(ierr);
655552f7358SJed Brown       /* ierr = DMPlexPreallocateOperator(dm, bs, section, sectionGlobal, dnz, onz, dnzu, onzu, *J, fillMatrix);CHKERRQ(ierr); */
65637d0c07bSMatthew G Knepley       ierr = PetscFree4(dnz, onz, dnzu, onzu);CHKERRQ(ierr);
65737d0c07bSMatthew G Knepley     }
65837d0c07bSMatthew G Knepley   }
65947c6ae99SBarry Smith   /*
66047c6ae99SBarry Smith                                   m
66147c6ae99SBarry Smith           ------------------------------------------------------
66247c6ae99SBarry Smith          |                                                     |
66347c6ae99SBarry Smith          |                                                     |
66447c6ae99SBarry Smith          |               ----------------------                |
66547c6ae99SBarry Smith          |               |                    |                |
66647c6ae99SBarry Smith       n  |           ny  |                    |                |
66747c6ae99SBarry Smith          |               |                    |                |
66847c6ae99SBarry Smith          |               .---------------------                |
66947c6ae99SBarry Smith          |             (xs,ys)     nx                          |
67047c6ae99SBarry Smith          |            .                                        |
67147c6ae99SBarry Smith          |         (gxs,gys)                                   |
67247c6ae99SBarry Smith          |                                                     |
67347c6ae99SBarry Smith           -----------------------------------------------------
67447c6ae99SBarry Smith   */
67547c6ae99SBarry Smith 
67647c6ae99SBarry Smith   /*
67747c6ae99SBarry Smith          nc - number of components per grid point
67847c6ae99SBarry Smith          col - number of colors needed in one direction for single component problem
67947c6ae99SBarry Smith 
68047c6ae99SBarry Smith   */
681e30e807fSPeter Brune   M   = dd->M;
682e30e807fSPeter Brune   N   = dd->N;
683e30e807fSPeter Brune   P   = dd->P;
684c73cfb54SMatthew G. Knepley   dim = da->dim;
685e30e807fSPeter Brune   dof = dd->w;
686e30e807fSPeter Brune   /* ierr = DMDAGetInfo(da,&dim,&M,&N,&P,0,0,0,&dof,0,0,0,0,0);CHKERRQ(ierr); */
687aa219208SBarry Smith   ierr = DMDAGetCorners(da,0,0,0,&nx,&ny,&nz);CHKERRQ(ierr);
68847c6ae99SBarry Smith   ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr);
68947c6ae99SBarry Smith   ierr = MatCreate(comm,&A);CHKERRQ(ierr);
69047c6ae99SBarry Smith   ierr = MatSetSizes(A,dof*nx*ny*nz,dof*nx*ny*nz,dof*M*N*P,dof*M*N*P);CHKERRQ(ierr);
691b412c318SBarry Smith   ierr = MatSetType(A,mtype);CHKERRQ(ierr);
69295ee5b0eSBarry Smith   ierr = MatSetDM(A,da);CHKERRQ(ierr);
693b06ff27eSHong Zhang   if (da->structure_only) {
694b06ff27eSHong Zhang     ierr = MatSetOption(A,MAT_STRUCTURE_ONLY,PETSC_TRUE);CHKERRQ(ierr);
695b06ff27eSHong Zhang   }
69647c6ae99SBarry Smith   ierr = MatGetType(A,&Atype);CHKERRQ(ierr);
69747c6ae99SBarry Smith   /*
698aa219208SBarry Smith      We do not provide a getmatrix function in the DMDA operations because
699aa219208SBarry Smith    the basic DMDA does not know about matrices. We think of DMDA as being more
70047c6ae99SBarry Smith    more low-level than matrices. This is kind of cheating but, cause sometimes
701aa219208SBarry Smith    we think of DMDA has higher level than matrices.
70247c6ae99SBarry Smith 
70347c6ae99SBarry Smith      We could switch based on Atype (or mtype), but we do not since the
70447c6ae99SBarry Smith    specialized setting routines depend only the particular preallocation
70547c6ae99SBarry Smith    details of the matrix, not the type itself.
70647c6ae99SBarry Smith   */
70747c6ae99SBarry Smith   ierr = PetscObjectQueryFunction((PetscObject)A,"MatMPIAIJSetPreallocation_C",&aij);CHKERRQ(ierr);
70847c6ae99SBarry Smith   if (!aij) {
70947c6ae99SBarry Smith     ierr = PetscObjectQueryFunction((PetscObject)A,"MatSeqAIJSetPreallocation_C",&aij);CHKERRQ(ierr);
71047c6ae99SBarry Smith   }
71147c6ae99SBarry Smith   if (!aij) {
71247c6ae99SBarry Smith     ierr = PetscObjectQueryFunction((PetscObject)A,"MatMPIBAIJSetPreallocation_C",&baij);CHKERRQ(ierr);
71347c6ae99SBarry Smith     if (!baij) {
71447c6ae99SBarry Smith       ierr = PetscObjectQueryFunction((PetscObject)A,"MatSeqBAIJSetPreallocation_C",&baij);CHKERRQ(ierr);
71547c6ae99SBarry Smith     }
71647c6ae99SBarry Smith     if (!baij) {
71747c6ae99SBarry Smith       ierr = PetscObjectQueryFunction((PetscObject)A,"MatMPISBAIJSetPreallocation_C",&sbaij);CHKERRQ(ierr);
71847c6ae99SBarry Smith       if (!sbaij) {
71947c6ae99SBarry Smith         ierr = PetscObjectQueryFunction((PetscObject)A,"MatSeqSBAIJSetPreallocation_C",&sbaij);CHKERRQ(ierr);
72047c6ae99SBarry Smith       }
721*5e26d47bSHong Zhang       if (!sbaij) {
722*5e26d47bSHong Zhang         ierr = PetscObjectQueryFunction((PetscObject)A,"MatMPIELLSetPreallocation_C",&ell);CHKERRQ(ierr);
723*5e26d47bSHong Zhang         if (!ell) {
724*5e26d47bSHong Zhang           ierr = PetscObjectQueryFunction((PetscObject)A,"MatSeqELLSetPreallocation_C",&ell);CHKERRQ(ierr);
725*5e26d47bSHong Zhang         }
726*5e26d47bSHong Zhang       }
72747c6ae99SBarry Smith     }
72847c6ae99SBarry Smith   }
72947c6ae99SBarry Smith   if (aij) {
73047c6ae99SBarry Smith     if (dim == 1) {
731ce308e1dSBarry Smith       if (dd->ofill) {
732ce308e1dSBarry Smith         ierr = DMCreateMatrix_DA_1d_MPIAIJ_Fill(da,A);CHKERRQ(ierr);
733ce308e1dSBarry Smith       } else {
734950540a4SJed Brown         ierr = DMCreateMatrix_DA_1d_MPIAIJ(da,A);CHKERRQ(ierr);
735ce308e1dSBarry Smith       }
73647c6ae99SBarry Smith     } else if (dim == 2) {
73747c6ae99SBarry Smith       if (dd->ofill) {
738950540a4SJed Brown         ierr = DMCreateMatrix_DA_2d_MPIAIJ_Fill(da,A);CHKERRQ(ierr);
73947c6ae99SBarry Smith       } else {
740950540a4SJed Brown         ierr = DMCreateMatrix_DA_2d_MPIAIJ(da,A);CHKERRQ(ierr);
74147c6ae99SBarry Smith       }
74247c6ae99SBarry Smith     } else if (dim == 3) {
74347c6ae99SBarry Smith       if (dd->ofill) {
744950540a4SJed Brown         ierr = DMCreateMatrix_DA_3d_MPIAIJ_Fill(da,A);CHKERRQ(ierr);
74547c6ae99SBarry Smith       } else {
746950540a4SJed Brown         ierr = DMCreateMatrix_DA_3d_MPIAIJ(da,A);CHKERRQ(ierr);
74747c6ae99SBarry Smith       }
74847c6ae99SBarry Smith     }
74947c6ae99SBarry Smith   } else if (baij) {
75047c6ae99SBarry Smith     if (dim == 2) {
751950540a4SJed Brown       ierr = DMCreateMatrix_DA_2d_MPIBAIJ(da,A);CHKERRQ(ierr);
75247c6ae99SBarry Smith     } else if (dim == 3) {
753950540a4SJed Brown       ierr = DMCreateMatrix_DA_3d_MPIBAIJ(da,A);CHKERRQ(ierr);
754ce94432eSBarry Smith     } else SETERRQ3(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"Not implemented for %D dimension and Matrix Type: %s in %D dimension! Send mail to petsc-maint@mcs.anl.gov for code",dim,Atype,dim);
75547c6ae99SBarry Smith   } else if (sbaij) {
75647c6ae99SBarry Smith     if (dim == 2) {
757950540a4SJed Brown       ierr = DMCreateMatrix_DA_2d_MPISBAIJ(da,A);CHKERRQ(ierr);
75847c6ae99SBarry Smith     } else if (dim == 3) {
759950540a4SJed Brown       ierr = DMCreateMatrix_DA_3d_MPISBAIJ(da,A);CHKERRQ(ierr);
760ce94432eSBarry Smith     } else SETERRQ3(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"Not implemented for %D dimension and Matrix Type: %s in %D dimension! Send mail to petsc-maint@mcs.anl.gov for code",dim,Atype,dim);
761*5e26d47bSHong Zhang   } else if (ell) {
762*5e26d47bSHong Zhang      if (dim ==2) {
763*5e26d47bSHong Zhang        ierr = DMCreateMatrix_DA_2d_MPIELL(da,A);CHKERRQ(ierr);
764*5e26d47bSHong Zhang      } else SETERRQ3(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"Not implemented for %D dimension and Matrix Type: %s in %D dimension! Send mail to petsc-maint@mcs.anl.gov for code",dim,Atype,dim);
765869776cdSLisandro Dalcin   }else {
76645b6f7e9SBarry Smith     ISLocalToGlobalMapping ltog;
767b026d285SBarry Smith     ierr = MatSetBlockSize(A,dof);CHKERRQ(ierr);
7682949035bSJed Brown     ierr = MatSetUp(A);CHKERRQ(ierr);
769b026d285SBarry Smith     ierr = DMGetLocalToGlobalMapping(da,&ltog);CHKERRQ(ierr);
770869776cdSLisandro Dalcin     ierr = MatSetLocalToGlobalMapping(A,ltog,ltog);CHKERRQ(ierr);
77147c6ae99SBarry Smith   }
772aa219208SBarry Smith   ierr = DMDAGetGhostCorners(da,&starts[0],&starts[1],&starts[2],&dims[0],&dims[1],&dims[2]);CHKERRQ(ierr);
77347c6ae99SBarry Smith   ierr = MatSetStencil(A,dim,dims,starts,dof);CHKERRQ(ierr);
774c688c046SMatthew G Knepley   ierr = MatSetDM(A,da);CHKERRQ(ierr);
77547c6ae99SBarry Smith   ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr);
77647c6ae99SBarry Smith   if (size > 1) {
77747c6ae99SBarry Smith     /* change viewer to display matrix in natural ordering */
77847c6ae99SBarry Smith     ierr = MatShellSetOperation(A, MATOP_VIEW, (void (*)(void))MatView_MPI_DA);CHKERRQ(ierr);
77947c6ae99SBarry Smith     ierr = MatShellSetOperation(A, MATOP_LOAD, (void (*)(void))MatLoad_MPI_DA);CHKERRQ(ierr);
78047c6ae99SBarry Smith   }
781b5579763SJed Brown   ierr = MatSetFromOptions(A);CHKERRQ(ierr);
78247c6ae99SBarry Smith   *J = A;
78347c6ae99SBarry Smith   PetscFunctionReturn(0);
78447c6ae99SBarry Smith }
78547c6ae99SBarry Smith 
78647c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/
787*5e26d47bSHong Zhang #undef __FUNCT__
788*5e26d47bSHong Zhang #define __FUNCT__ "DMCreateMatrix_DA_2d_MPIELL"
789*5e26d47bSHong Zhang PetscErrorCode DMCreateMatrix_DA_2d_MPIELL(DM da,Mat J)
790*5e26d47bSHong Zhang {
791*5e26d47bSHong Zhang   PetscErrorCode         ierr;
792*5e26d47bSHong Zhang   PetscInt               xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny,m,n,dim,s,*cols = NULL,k,nc,*rows = NULL,col,cnt,l,p;
793*5e26d47bSHong Zhang   PetscInt               lstart,lend,pstart,pend,*dnz,*onz;
794*5e26d47bSHong Zhang   MPI_Comm               comm;
795*5e26d47bSHong Zhang   PetscScalar            *values;
796*5e26d47bSHong Zhang   DMBoundaryType         bx,by;
797*5e26d47bSHong Zhang   ISLocalToGlobalMapping ltog;
798*5e26d47bSHong Zhang   DMDAStencilType        st;
799*5e26d47bSHong Zhang 
800*5e26d47bSHong Zhang   PetscFunctionBegin;
801*5e26d47bSHong Zhang   /*
802*5e26d47bSHong Zhang          nc - number of components per grid point
803*5e26d47bSHong Zhang          col - number of colors needed in one direction for single component problem
804*5e26d47bSHong Zhang 
805*5e26d47bSHong Zhang   */
806*5e26d47bSHong Zhang   ierr = DMDAGetInfo(da,&dim,&m,&n,0,0,0,0,&nc,&s,&bx,&by,0,&st);CHKERRQ(ierr);
807*5e26d47bSHong Zhang   col  = 2*s + 1;
808*5e26d47bSHong Zhang   ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr);
809*5e26d47bSHong Zhang   ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr);
810*5e26d47bSHong Zhang   ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr);
811*5e26d47bSHong Zhang 
812*5e26d47bSHong Zhang   ierr = PetscMalloc2(nc,&rows,col*col*nc*nc,&cols);CHKERRQ(ierr);
813*5e26d47bSHong Zhang   ierr = DMGetLocalToGlobalMapping(da,&ltog);CHKERRQ(ierr);
814*5e26d47bSHong Zhang 
815*5e26d47bSHong Zhang   ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr);
816*5e26d47bSHong Zhang   /* determine the matrix preallocation information */
817*5e26d47bSHong Zhang   ierr = MatPreallocateInitialize(comm,nc*nx*ny,nc*nx*ny,dnz,onz);CHKERRQ(ierr);
818*5e26d47bSHong Zhang   for (i=xs; i<xs+nx; i++) {
819*5e26d47bSHong Zhang 
820*5e26d47bSHong Zhang     pstart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
821*5e26d47bSHong Zhang     pend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
822*5e26d47bSHong Zhang 
823*5e26d47bSHong Zhang     for (j=ys; j<ys+ny; j++) {
824*5e26d47bSHong Zhang       slot = i - gxs + gnx*(j - gys);
825*5e26d47bSHong Zhang 
826*5e26d47bSHong Zhang       lstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
827*5e26d47bSHong Zhang       lend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
828*5e26d47bSHong Zhang 
829*5e26d47bSHong Zhang       cnt = 0;
830*5e26d47bSHong Zhang       for (k=0; k<nc; k++) {
831*5e26d47bSHong Zhang         for (l=lstart; l<lend+1; l++) {
832*5e26d47bSHong Zhang           for (p=pstart; p<pend+1; p++) {
833*5e26d47bSHong Zhang             if ((st == DMDA_STENCIL_BOX) || (!l || !p)) {  /* entries on star have either l = 0 or p = 0 */
834*5e26d47bSHong Zhang               cols[cnt++] = k + nc*(slot + gnx*l + p);
835*5e26d47bSHong Zhang             }
836*5e26d47bSHong Zhang           }
837*5e26d47bSHong Zhang         }
838*5e26d47bSHong Zhang         rows[k] = k + nc*(slot);
839*5e26d47bSHong Zhang       }
840*5e26d47bSHong Zhang       ierr = MatPreallocateSetLocal(ltog,nc,rows,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr);
841*5e26d47bSHong Zhang     }
842*5e26d47bSHong Zhang   }
843*5e26d47bSHong Zhang   ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr);
844*5e26d47bSHong Zhang   ierr = MatSeqELLSetPreallocation(J,0,dnz);CHKERRQ(ierr);
845*5e26d47bSHong Zhang   //ierr = MatMPIELLSetPreallocation(J,0,dnz,0,onz);CHKERRQ(ierr);
846*5e26d47bSHong Zhang   ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr);
847*5e26d47bSHong Zhang 
848*5e26d47bSHong Zhang   ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr);
849*5e26d47bSHong Zhang 
850*5e26d47bSHong Zhang   /*
851*5e26d47bSHong Zhang     For each node in the grid: we get the neighbors in the local (on processor ordering
852*5e26d47bSHong Zhang     that includes the ghost points) then MatSetValuesLocal() maps those indices to the global
853*5e26d47bSHong Zhang     PETSc ordering.
854*5e26d47bSHong Zhang   */
855*5e26d47bSHong Zhang   if (!da->prealloc_only) {
856*5e26d47bSHong Zhang     ierr = PetscCalloc1(col*col*nc*nc,&values);CHKERRQ(ierr);
857*5e26d47bSHong Zhang     for (i=xs; i<xs+nx; i++) {
858*5e26d47bSHong Zhang 
859*5e26d47bSHong Zhang       pstart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
860*5e26d47bSHong Zhang       pend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
861*5e26d47bSHong Zhang 
862*5e26d47bSHong Zhang       for (j=ys; j<ys+ny; j++) {
863*5e26d47bSHong Zhang         slot = i - gxs + gnx*(j - gys);
864*5e26d47bSHong Zhang 
865*5e26d47bSHong Zhang         lstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
866*5e26d47bSHong Zhang         lend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
867*5e26d47bSHong Zhang 
868*5e26d47bSHong Zhang         cnt = 0;
869*5e26d47bSHong Zhang         for (k=0; k<nc; k++) {
870*5e26d47bSHong Zhang           for (l=lstart; l<lend+1; l++) {
871*5e26d47bSHong Zhang             for (p=pstart; p<pend+1; p++) {
872*5e26d47bSHong Zhang               if ((st == DMDA_STENCIL_BOX) || (!l || !p)) {  /* entries on star have either l = 0 or p = 0 */
873*5e26d47bSHong Zhang                 cols[cnt++] = k + nc*(slot + gnx*l + p);
874*5e26d47bSHong Zhang               }
875*5e26d47bSHong Zhang             }
876*5e26d47bSHong Zhang           }
877*5e26d47bSHong Zhang           rows[k] = k + nc*(slot);
878*5e26d47bSHong Zhang         }
879*5e26d47bSHong Zhang         ierr = MatSetValuesLocal(J,nc,rows,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
880*5e26d47bSHong Zhang       }
881*5e26d47bSHong Zhang     }
882*5e26d47bSHong Zhang     ierr = PetscFree(values);CHKERRQ(ierr);
883*5e26d47bSHong Zhang     ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
884*5e26d47bSHong Zhang     ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
885*5e26d47bSHong Zhang     ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr);
886*5e26d47bSHong Zhang   }
887*5e26d47bSHong Zhang   ierr = PetscFree2(rows,cols);CHKERRQ(ierr);
888*5e26d47bSHong Zhang   PetscFunctionReturn(0);
889*5e26d47bSHong Zhang }
890*5e26d47bSHong Zhang 
891*5e26d47bSHong Zhang #undef __FUNCT__
892*5e26d47bSHong Zhang #define __FUNCT__ "DMCreateMatrix_DA_2d_MPIAIJ"
893950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_2d_MPIAIJ(DM da,Mat J)
89447c6ae99SBarry Smith {
89547c6ae99SBarry Smith   PetscErrorCode         ierr;
896c1154cd5SBarry Smith   PetscInt               xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny,m,n,dim,s,*cols = NULL,k,nc,*rows = NULL,col,cnt,l,p,M,N;
89747c6ae99SBarry Smith   PetscInt               lstart,lend,pstart,pend,*dnz,*onz;
89847c6ae99SBarry Smith   MPI_Comm               comm;
89947c6ae99SBarry Smith   PetscScalar            *values;
900bff4a2f0SMatthew G. Knepley   DMBoundaryType         bx,by;
90145b6f7e9SBarry Smith   ISLocalToGlobalMapping ltog;
902aa219208SBarry Smith   DMDAStencilType        st;
903c1154cd5SBarry Smith   PetscBool              removedups = PETSC_FALSE;
90447c6ae99SBarry Smith 
90547c6ae99SBarry Smith   PetscFunctionBegin;
90647c6ae99SBarry Smith   /*
90747c6ae99SBarry Smith          nc - number of components per grid point
90847c6ae99SBarry Smith          col - number of colors needed in one direction for single component problem
90947c6ae99SBarry Smith 
91047c6ae99SBarry Smith   */
911c1154cd5SBarry Smith   ierr = DMDAGetInfo(da,&dim,&m,&n,&M,&N,0,0,&nc,&s,&bx,&by,0,&st);CHKERRQ(ierr);
91247c6ae99SBarry Smith   col  = 2*s + 1;
913c1154cd5SBarry Smith   /*
914c1154cd5SBarry Smith        With one processor in periodic domains in a skinny dimension the code will label nonzero columns multiple times
915c1154cd5SBarry Smith        because of "wrapping" around the end of the domain hitting an entry already counted in the other direction.
916c1154cd5SBarry Smith   */
917c1154cd5SBarry Smith   if (M == 1 && 2*s >= m) removedups = PETSC_TRUE;
918c1154cd5SBarry Smith   if (N == 1 && 2*s >= n) removedups = PETSC_TRUE;
919aa219208SBarry Smith   ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr);
920aa219208SBarry Smith   ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr);
92147c6ae99SBarry Smith   ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr);
92247c6ae99SBarry Smith 
923dcca6d9dSJed Brown   ierr = PetscMalloc2(nc,&rows,col*col*nc*nc,&cols);CHKERRQ(ierr);
9241411c6eeSJed Brown   ierr = DMGetLocalToGlobalMapping(da,&ltog);CHKERRQ(ierr);
92547c6ae99SBarry Smith 
92606ca8cadSBarry Smith   ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr);
92747c6ae99SBarry Smith   /* determine the matrix preallocation information */
92847c6ae99SBarry Smith   ierr = MatPreallocateInitialize(comm,nc*nx*ny,nc*nx*ny,dnz,onz);CHKERRQ(ierr);
92947c6ae99SBarry Smith   for (i=xs; i<xs+nx; i++) {
93047c6ae99SBarry Smith 
931bff4a2f0SMatthew G. Knepley     pstart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
932bff4a2f0SMatthew G. Knepley     pend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
93347c6ae99SBarry Smith 
93447c6ae99SBarry Smith     for (j=ys; j<ys+ny; j++) {
93547c6ae99SBarry Smith       slot = i - gxs + gnx*(j - gys);
93647c6ae99SBarry Smith 
937bff4a2f0SMatthew G. Knepley       lstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
938bff4a2f0SMatthew G. Knepley       lend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
93947c6ae99SBarry Smith 
94047c6ae99SBarry Smith       cnt = 0;
94147c6ae99SBarry Smith       for (k=0; k<nc; k++) {
94247c6ae99SBarry Smith         for (l=lstart; l<lend+1; l++) {
94347c6ae99SBarry Smith           for (p=pstart; p<pend+1; p++) {
944aa219208SBarry Smith             if ((st == DMDA_STENCIL_BOX) || (!l || !p)) {  /* entries on star have either l = 0 or p = 0 */
94547c6ae99SBarry Smith               cols[cnt++] = k + nc*(slot + gnx*l + p);
94647c6ae99SBarry Smith             }
94747c6ae99SBarry Smith           }
94847c6ae99SBarry Smith         }
94947c6ae99SBarry Smith         rows[k] = k + nc*(slot);
95047c6ae99SBarry Smith       }
951c1154cd5SBarry Smith       if (removedups) {
952c1154cd5SBarry Smith         ierr = MatPreallocateSetLocalRemoveDups(ltog,nc,rows,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr);
953c1154cd5SBarry Smith       } else {
954784ac674SJed Brown         ierr = MatPreallocateSetLocal(ltog,nc,rows,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr);
95547c6ae99SBarry Smith       }
95647c6ae99SBarry Smith     }
957c1154cd5SBarry Smith   }
958f73d5cc4SBarry Smith   ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr);
95947c6ae99SBarry Smith   ierr = MatSeqAIJSetPreallocation(J,0,dnz);CHKERRQ(ierr);
96047c6ae99SBarry Smith   ierr = MatMPIAIJSetPreallocation(J,0,dnz,0,onz);CHKERRQ(ierr);
96147c6ae99SBarry Smith   ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr);
96247c6ae99SBarry Smith 
963784ac674SJed Brown   ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr);
96447c6ae99SBarry Smith 
96547c6ae99SBarry Smith   /*
96647c6ae99SBarry Smith     For each node in the grid: we get the neighbors in the local (on processor ordering
96747c6ae99SBarry Smith     that includes the ghost points) then MatSetValuesLocal() maps those indices to the global
96847c6ae99SBarry Smith     PETSc ordering.
96947c6ae99SBarry Smith   */
970fcfd50ebSBarry Smith   if (!da->prealloc_only) {
9711795a4d1SJed Brown     ierr = PetscCalloc1(col*col*nc*nc,&values);CHKERRQ(ierr);
97247c6ae99SBarry Smith     for (i=xs; i<xs+nx; i++) {
97347c6ae99SBarry Smith 
974bff4a2f0SMatthew G. Knepley       pstart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
975bff4a2f0SMatthew G. Knepley       pend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
97647c6ae99SBarry Smith 
97747c6ae99SBarry Smith       for (j=ys; j<ys+ny; j++) {
97847c6ae99SBarry Smith         slot = i - gxs + gnx*(j - gys);
97947c6ae99SBarry Smith 
980bff4a2f0SMatthew G. Knepley         lstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
981bff4a2f0SMatthew G. Knepley         lend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
98247c6ae99SBarry Smith 
98347c6ae99SBarry Smith         cnt = 0;
98447c6ae99SBarry Smith         for (k=0; k<nc; k++) {
98547c6ae99SBarry Smith           for (l=lstart; l<lend+1; l++) {
98647c6ae99SBarry Smith             for (p=pstart; p<pend+1; p++) {
987aa219208SBarry Smith               if ((st == DMDA_STENCIL_BOX) || (!l || !p)) {  /* entries on star have either l = 0 or p = 0 */
98847c6ae99SBarry Smith                 cols[cnt++] = k + nc*(slot + gnx*l + p);
98947c6ae99SBarry Smith               }
99047c6ae99SBarry Smith             }
99147c6ae99SBarry Smith           }
99247c6ae99SBarry Smith           rows[k] = k + nc*(slot);
99347c6ae99SBarry Smith         }
99447c6ae99SBarry Smith         ierr = MatSetValuesLocal(J,nc,rows,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
99547c6ae99SBarry Smith       }
99647c6ae99SBarry Smith     }
99747c6ae99SBarry Smith     ierr = PetscFree(values);CHKERRQ(ierr);
99847c6ae99SBarry Smith     ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
99947c6ae99SBarry Smith     ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1000189e4007SBarry Smith     ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr);
100147c6ae99SBarry Smith   }
100247c6ae99SBarry Smith   ierr = PetscFree2(rows,cols);CHKERRQ(ierr);
100347c6ae99SBarry Smith   PetscFunctionReturn(0);
100447c6ae99SBarry Smith }
100547c6ae99SBarry Smith 
1006950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_2d_MPIAIJ_Fill(DM da,Mat J)
100747c6ae99SBarry Smith {
100847c6ae99SBarry Smith   PetscErrorCode         ierr;
100947c6ae99SBarry Smith   PetscInt               xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny;
1010c1154cd5SBarry Smith   PetscInt               m,n,dim,s,*cols,k,nc,row,col,cnt,maxcnt = 0,l,p,M,N;
101147c6ae99SBarry Smith   PetscInt               lstart,lend,pstart,pend,*dnz,*onz;
101247c6ae99SBarry Smith   DM_DA                  *dd = (DM_DA*)da->data;
101347c6ae99SBarry Smith   PetscInt               ifill_col,*ofill = dd->ofill, *dfill = dd->dfill;
101447c6ae99SBarry Smith   MPI_Comm               comm;
101547c6ae99SBarry Smith   PetscScalar            *values;
1016bff4a2f0SMatthew G. Knepley   DMBoundaryType         bx,by;
101745b6f7e9SBarry Smith   ISLocalToGlobalMapping ltog;
1018aa219208SBarry Smith   DMDAStencilType        st;
1019c1154cd5SBarry Smith   PetscBool              removedups = PETSC_FALSE;
102047c6ae99SBarry Smith 
102147c6ae99SBarry Smith   PetscFunctionBegin;
102247c6ae99SBarry Smith   /*
102347c6ae99SBarry Smith          nc - number of components per grid point
102447c6ae99SBarry Smith          col - number of colors needed in one direction for single component problem
102547c6ae99SBarry Smith 
102647c6ae99SBarry Smith   */
1027c1154cd5SBarry Smith   ierr = DMDAGetInfo(da,&dim,&m,&n,&M,&N,0,0,&nc,&s,&bx,&by,0,&st);CHKERRQ(ierr);
102847c6ae99SBarry Smith   col  = 2*s + 1;
1029c1154cd5SBarry Smith   /*
1030c1154cd5SBarry Smith        With one processor in periodic domains in a skinny dimension the code will label nonzero columns multiple times
1031c1154cd5SBarry Smith        because of "wrapping" around the end of the domain hitting an entry already counted in the other direction.
1032c1154cd5SBarry Smith   */
1033c1154cd5SBarry Smith   if (M == 1 && 2*s >= m) removedups = PETSC_TRUE;
1034c1154cd5SBarry Smith   if (N == 1 && 2*s >= n) removedups = PETSC_TRUE;
1035aa219208SBarry Smith   ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr);
1036aa219208SBarry Smith   ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr);
103747c6ae99SBarry Smith   ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr);
103847c6ae99SBarry Smith 
10394b26d1cfSBarry Smith   ierr = PetscMalloc1(col*col*nc,&cols);CHKERRQ(ierr);
10401411c6eeSJed Brown   ierr = DMGetLocalToGlobalMapping(da,&ltog);CHKERRQ(ierr);
104147c6ae99SBarry Smith 
104206ca8cadSBarry Smith   ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr);
104347c6ae99SBarry Smith   /* determine the matrix preallocation information */
104447c6ae99SBarry Smith   ierr = MatPreallocateInitialize(comm,nc*nx*ny,nc*nx*ny,dnz,onz);CHKERRQ(ierr);
104547c6ae99SBarry Smith   for (i=xs; i<xs+nx; i++) {
104647c6ae99SBarry Smith 
1047bff4a2f0SMatthew G. Knepley     pstart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
1048bff4a2f0SMatthew G. Knepley     pend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
104947c6ae99SBarry Smith 
105047c6ae99SBarry Smith     for (j=ys; j<ys+ny; j++) {
105147c6ae99SBarry Smith       slot = i - gxs + gnx*(j - gys);
105247c6ae99SBarry Smith 
1053bff4a2f0SMatthew G. Knepley       lstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
1054bff4a2f0SMatthew G. Knepley       lend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
105547c6ae99SBarry Smith 
105647c6ae99SBarry Smith       for (k=0; k<nc; k++) {
105747c6ae99SBarry Smith         cnt = 0;
105847c6ae99SBarry Smith         for (l=lstart; l<lend+1; l++) {
105947c6ae99SBarry Smith           for (p=pstart; p<pend+1; p++) {
106047c6ae99SBarry Smith             if (l || p) {
1061aa219208SBarry Smith               if ((st == DMDA_STENCIL_BOX) || (!l || !p)) {  /* entries on star */
10628865f1eaSKarl Rupp                 for (ifill_col=ofill[k]; ifill_col<ofill[k+1]; ifill_col++) cols[cnt++] = ofill[ifill_col] + nc*(slot + gnx*l + p);
106347c6ae99SBarry Smith               }
106447c6ae99SBarry Smith             } else {
106547c6ae99SBarry Smith               if (dfill) {
10668865f1eaSKarl Rupp                 for (ifill_col=dfill[k]; ifill_col<dfill[k+1]; ifill_col++) cols[cnt++] = dfill[ifill_col] + nc*(slot + gnx*l + p);
106747c6ae99SBarry Smith               } else {
10688865f1eaSKarl Rupp                 for (ifill_col=0; ifill_col<nc; ifill_col++) cols[cnt++] = ifill_col + nc*(slot + gnx*l + p);
106947c6ae99SBarry Smith               }
107047c6ae99SBarry Smith             }
107147c6ae99SBarry Smith           }
107247c6ae99SBarry Smith         }
107347c6ae99SBarry Smith         row    = k + nc*(slot);
1074c0ab637bSBarry Smith         maxcnt = PetscMax(maxcnt,cnt);
1075c1154cd5SBarry Smith         if (removedups) {
1076c1154cd5SBarry Smith           ierr   = MatPreallocateSetLocalRemoveDups(ltog,1,&row,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr);
1077c1154cd5SBarry Smith         } else {
1078784ac674SJed Brown           ierr   = MatPreallocateSetLocal(ltog,1,&row,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr);
107947c6ae99SBarry Smith         }
108047c6ae99SBarry Smith       }
108147c6ae99SBarry Smith     }
1082c1154cd5SBarry Smith   }
108347c6ae99SBarry Smith   ierr = MatSeqAIJSetPreallocation(J,0,dnz);CHKERRQ(ierr);
108447c6ae99SBarry Smith   ierr = MatMPIAIJSetPreallocation(J,0,dnz,0,onz);CHKERRQ(ierr);
108547c6ae99SBarry Smith   ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr);
1086784ac674SJed Brown   ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr);
108747c6ae99SBarry Smith 
108847c6ae99SBarry Smith   /*
108947c6ae99SBarry Smith     For each node in the grid: we get the neighbors in the local (on processor ordering
109047c6ae99SBarry Smith     that includes the ghost points) then MatSetValuesLocal() maps those indices to the global
109147c6ae99SBarry Smith     PETSc ordering.
109247c6ae99SBarry Smith   */
1093fcfd50ebSBarry Smith   if (!da->prealloc_only) {
1094c0ab637bSBarry Smith     ierr = PetscCalloc1(maxcnt,&values);CHKERRQ(ierr);
109547c6ae99SBarry Smith     for (i=xs; i<xs+nx; i++) {
109647c6ae99SBarry Smith 
1097bff4a2f0SMatthew G. Knepley       pstart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
1098bff4a2f0SMatthew G. Knepley       pend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
109947c6ae99SBarry Smith 
110047c6ae99SBarry Smith       for (j=ys; j<ys+ny; j++) {
110147c6ae99SBarry Smith         slot = i - gxs + gnx*(j - gys);
110247c6ae99SBarry Smith 
1103bff4a2f0SMatthew G. Knepley         lstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
1104bff4a2f0SMatthew G. Knepley         lend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
110547c6ae99SBarry Smith 
110647c6ae99SBarry Smith         for (k=0; k<nc; k++) {
110747c6ae99SBarry Smith           cnt = 0;
110847c6ae99SBarry Smith           for (l=lstart; l<lend+1; l++) {
110947c6ae99SBarry Smith             for (p=pstart; p<pend+1; p++) {
111047c6ae99SBarry Smith               if (l || p) {
1111aa219208SBarry Smith                 if ((st == DMDA_STENCIL_BOX) || (!l || !p)) {  /* entries on star */
11128865f1eaSKarl Rupp                   for (ifill_col=ofill[k]; ifill_col<ofill[k+1]; ifill_col++) cols[cnt++] = ofill[ifill_col] + nc*(slot + gnx*l + p);
111347c6ae99SBarry Smith                 }
111447c6ae99SBarry Smith               } else {
111547c6ae99SBarry Smith                 if (dfill) {
11168865f1eaSKarl Rupp                   for (ifill_col=dfill[k]; ifill_col<dfill[k+1]; ifill_col++) cols[cnt++] = dfill[ifill_col] + nc*(slot + gnx*l + p);
111747c6ae99SBarry Smith                 } else {
11188865f1eaSKarl Rupp                   for (ifill_col=0; ifill_col<nc; ifill_col++) cols[cnt++] = ifill_col + nc*(slot + gnx*l + p);
111947c6ae99SBarry Smith                 }
112047c6ae99SBarry Smith               }
112147c6ae99SBarry Smith             }
112247c6ae99SBarry Smith           }
112347c6ae99SBarry Smith           row  = k + nc*(slot);
112447c6ae99SBarry Smith           ierr = MatSetValuesLocal(J,1,&row,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
112547c6ae99SBarry Smith         }
112647c6ae99SBarry Smith       }
112747c6ae99SBarry Smith     }
112847c6ae99SBarry Smith     ierr = PetscFree(values);CHKERRQ(ierr);
112947c6ae99SBarry Smith     ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
113047c6ae99SBarry Smith     ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1131189e4007SBarry Smith     ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr);
113247c6ae99SBarry Smith   }
113347c6ae99SBarry Smith   ierr = PetscFree(cols);CHKERRQ(ierr);
113447c6ae99SBarry Smith   PetscFunctionReturn(0);
113547c6ae99SBarry Smith }
113647c6ae99SBarry Smith 
113747c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/
113847c6ae99SBarry Smith 
1139950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_3d_MPIAIJ(DM da,Mat J)
114047c6ae99SBarry Smith {
114147c6ae99SBarry Smith   PetscErrorCode         ierr;
114247c6ae99SBarry Smith   PetscInt               xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny;
11430298fd71SBarry Smith   PetscInt               m,n,dim,s,*cols = NULL,k,nc,*rows = NULL,col,cnt,l,p,*dnz = NULL,*onz = NULL;
1144c1154cd5SBarry Smith   PetscInt               istart,iend,jstart,jend,kstart,kend,zs,nz,gzs,gnz,ii,jj,kk,M,N,P;
114547c6ae99SBarry Smith   MPI_Comm               comm;
114647c6ae99SBarry Smith   PetscScalar            *values;
1147bff4a2f0SMatthew G. Knepley   DMBoundaryType         bx,by,bz;
114845b6f7e9SBarry Smith   ISLocalToGlobalMapping ltog;
1149aa219208SBarry Smith   DMDAStencilType        st;
1150c1154cd5SBarry Smith   PetscBool              removedups = PETSC_FALSE;
115147c6ae99SBarry Smith 
115247c6ae99SBarry Smith   PetscFunctionBegin;
115347c6ae99SBarry Smith   /*
115447c6ae99SBarry Smith          nc - number of components per grid point
115547c6ae99SBarry Smith          col - number of colors needed in one direction for single component problem
115647c6ae99SBarry Smith 
115747c6ae99SBarry Smith   */
1158c1154cd5SBarry Smith   ierr = DMDAGetInfo(da,&dim,&m,&n,&p,&M,&N,&P,&nc,&s,&bx,&by,&bz,&st);CHKERRQ(ierr);
115947c6ae99SBarry Smith   col  = 2*s + 1;
116047c6ae99SBarry Smith 
1161c1154cd5SBarry Smith   /*
1162c1154cd5SBarry Smith        With one processor in periodic domains in a skinny dimension the code will label nonzero columns multiple times
1163c1154cd5SBarry Smith        because of "wrapping" around the end of the domain hitting an entry already counted in the other direction.
1164c1154cd5SBarry Smith   */
1165c1154cd5SBarry Smith   if (M == 1 && 2*s >= m) removedups = PETSC_TRUE;
1166c1154cd5SBarry Smith   if (N == 1 && 2*s >= n) removedups = PETSC_TRUE;
1167c1154cd5SBarry Smith   if (P == 1 && 2*s >= p) removedups = PETSC_TRUE;
1168c1154cd5SBarry Smith 
1169aa219208SBarry Smith   ierr = DMDAGetCorners(da,&xs,&ys,&zs,&nx,&ny,&nz);CHKERRQ(ierr);
1170aa219208SBarry Smith   ierr = DMDAGetGhostCorners(da,&gxs,&gys,&gzs,&gnx,&gny,&gnz);CHKERRQ(ierr);
117147c6ae99SBarry Smith   ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr);
117247c6ae99SBarry Smith 
1173dcca6d9dSJed Brown   ierr = PetscMalloc2(nc,&rows,col*col*col*nc*nc,&cols);CHKERRQ(ierr);
11741411c6eeSJed Brown   ierr = DMGetLocalToGlobalMapping(da,&ltog);CHKERRQ(ierr);
117547c6ae99SBarry Smith 
117606ca8cadSBarry Smith   ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr);
117747c6ae99SBarry Smith   /* determine the matrix preallocation information */
117847c6ae99SBarry Smith   ierr = MatPreallocateInitialize(comm,nc*nx*ny*nz,nc*nx*ny*nz,dnz,onz);CHKERRQ(ierr);
117947c6ae99SBarry Smith   for (i=xs; i<xs+nx; i++) {
1180bff4a2f0SMatthew G. Knepley     istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
1181bff4a2f0SMatthew G. Knepley     iend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
118247c6ae99SBarry Smith     for (j=ys; j<ys+ny; j++) {
1183bff4a2f0SMatthew G. Knepley       jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
1184bff4a2f0SMatthew G. Knepley       jend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
118547c6ae99SBarry Smith       for (k=zs; k<zs+nz; k++) {
1186bff4a2f0SMatthew G. Knepley         kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k));
1187bff4a2f0SMatthew G. Knepley         kend   = (bz == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,p-k-1));
118847c6ae99SBarry Smith 
118947c6ae99SBarry Smith         slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs);
119047c6ae99SBarry Smith 
119147c6ae99SBarry Smith         cnt = 0;
119247c6ae99SBarry Smith         for (l=0; l<nc; l++) {
119347c6ae99SBarry Smith           for (ii=istart; ii<iend+1; ii++) {
119447c6ae99SBarry Smith             for (jj=jstart; jj<jend+1; jj++) {
119547c6ae99SBarry Smith               for (kk=kstart; kk<kend+1; kk++) {
1196aa219208SBarry Smith                 if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/
119747c6ae99SBarry Smith                   cols[cnt++] = l + nc*(slot + ii + gnx*jj + gnx*gny*kk);
119847c6ae99SBarry Smith                 }
119947c6ae99SBarry Smith               }
120047c6ae99SBarry Smith             }
120147c6ae99SBarry Smith           }
120247c6ae99SBarry Smith           rows[l] = l + nc*(slot);
120347c6ae99SBarry Smith         }
1204c1154cd5SBarry Smith         if (removedups) {
1205c1154cd5SBarry Smith           ierr = MatPreallocateSetLocalRemoveDups(ltog,nc,rows,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr);
1206c1154cd5SBarry Smith         } else {
1207784ac674SJed Brown           ierr = MatPreallocateSetLocal(ltog,nc,rows,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr);
120847c6ae99SBarry Smith         }
120947c6ae99SBarry Smith       }
121047c6ae99SBarry Smith     }
1211c1154cd5SBarry Smith   }
1212f73d5cc4SBarry Smith   ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr);
121347c6ae99SBarry Smith   ierr = MatSeqAIJSetPreallocation(J,0,dnz);CHKERRQ(ierr);
121447c6ae99SBarry Smith   ierr = MatMPIAIJSetPreallocation(J,0,dnz,0,onz);CHKERRQ(ierr);
121547c6ae99SBarry Smith   ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr);
1216784ac674SJed Brown   ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr);
121747c6ae99SBarry Smith 
121847c6ae99SBarry Smith   /*
121947c6ae99SBarry Smith     For each node in the grid: we get the neighbors in the local (on processor ordering
122047c6ae99SBarry Smith     that includes the ghost points) then MatSetValuesLocal() maps those indices to the global
122147c6ae99SBarry Smith     PETSc ordering.
122247c6ae99SBarry Smith   */
1223fcfd50ebSBarry Smith   if (!da->prealloc_only) {
12241795a4d1SJed Brown     ierr = PetscCalloc1(col*col*col*nc*nc*nc,&values);CHKERRQ(ierr);
122547c6ae99SBarry Smith     for (i=xs; i<xs+nx; i++) {
1226bff4a2f0SMatthew G. Knepley       istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
1227bff4a2f0SMatthew G. Knepley       iend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
122847c6ae99SBarry Smith       for (j=ys; j<ys+ny; j++) {
1229bff4a2f0SMatthew G. Knepley         jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
1230bff4a2f0SMatthew G. Knepley         jend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
123147c6ae99SBarry Smith         for (k=zs; k<zs+nz; k++) {
1232bff4a2f0SMatthew G. Knepley           kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k));
1233bff4a2f0SMatthew G. Knepley           kend   = (bz == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,p-k-1));
123447c6ae99SBarry Smith 
123547c6ae99SBarry Smith           slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs);
123647c6ae99SBarry Smith 
123747c6ae99SBarry Smith           cnt = 0;
123847c6ae99SBarry Smith           for (l=0; l<nc; l++) {
123947c6ae99SBarry Smith             for (ii=istart; ii<iend+1; ii++) {
124047c6ae99SBarry Smith               for (jj=jstart; jj<jend+1; jj++) {
124147c6ae99SBarry Smith                 for (kk=kstart; kk<kend+1; kk++) {
1242aa219208SBarry Smith                   if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/
124347c6ae99SBarry Smith                     cols[cnt++] = l + nc*(slot + ii + gnx*jj + gnx*gny*kk);
124447c6ae99SBarry Smith                   }
124547c6ae99SBarry Smith                 }
124647c6ae99SBarry Smith               }
124747c6ae99SBarry Smith             }
124847c6ae99SBarry Smith             rows[l] = l + nc*(slot);
124947c6ae99SBarry Smith           }
125047c6ae99SBarry Smith           ierr = MatSetValuesLocal(J,nc,rows,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
125147c6ae99SBarry Smith         }
125247c6ae99SBarry Smith       }
125347c6ae99SBarry Smith     }
125447c6ae99SBarry Smith     ierr = PetscFree(values);CHKERRQ(ierr);
125547c6ae99SBarry Smith     ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
125647c6ae99SBarry Smith     ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1257189e4007SBarry Smith     ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr);
125847c6ae99SBarry Smith   }
125947c6ae99SBarry Smith   ierr = PetscFree2(rows,cols);CHKERRQ(ierr);
126047c6ae99SBarry Smith   PetscFunctionReturn(0);
126147c6ae99SBarry Smith }
126247c6ae99SBarry Smith 
126347c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/
126447c6ae99SBarry Smith 
1265ce308e1dSBarry Smith PetscErrorCode DMCreateMatrix_DA_1d_MPIAIJ_Fill(DM da,Mat J)
1266ce308e1dSBarry Smith {
1267ce308e1dSBarry Smith   PetscErrorCode         ierr;
1268ce308e1dSBarry Smith   DM_DA                  *dd = (DM_DA*)da->data;
1269ce308e1dSBarry Smith   PetscInt               xs,nx,i,j,gxs,gnx,row,k,l;
12708d4c968fSBarry Smith   PetscInt               m,dim,s,*cols = NULL,nc,cnt,maxcnt = 0,*ocols;
12710acb5bebSBarry Smith   PetscInt               *ofill = dd->ofill,*dfill = dd->dfill;
1272ce308e1dSBarry Smith   PetscScalar            *values;
1273bff4a2f0SMatthew G. Knepley   DMBoundaryType         bx;
127445b6f7e9SBarry Smith   ISLocalToGlobalMapping ltog;
1275ce308e1dSBarry Smith   PetscMPIInt            rank,size;
1276ce308e1dSBarry Smith 
1277ce308e1dSBarry Smith   PetscFunctionBegin;
1278bff4a2f0SMatthew G. Knepley   if (dd->bx == DM_BOUNDARY_PERIODIC) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"With fill provided not implemented with periodic boundary conditions");
1279ce94432eSBarry Smith   ierr = MPI_Comm_rank(PetscObjectComm((PetscObject)da),&rank);CHKERRQ(ierr);
1280ce94432eSBarry Smith   ierr = MPI_Comm_size(PetscObjectComm((PetscObject)da),&size);CHKERRQ(ierr);
1281ce308e1dSBarry Smith 
1282ce308e1dSBarry Smith   /*
1283ce308e1dSBarry Smith          nc - number of components per grid point
1284ce308e1dSBarry Smith 
1285ce308e1dSBarry Smith   */
1286ce308e1dSBarry Smith   ierr = DMDAGetInfo(da,&dim,&m,0,0,0,0,0,&nc,&s,&bx,0,0,0);CHKERRQ(ierr);
1287ce308e1dSBarry Smith   ierr = DMDAGetCorners(da,&xs,0,0,&nx,0,0);CHKERRQ(ierr);
1288ce308e1dSBarry Smith   ierr = DMDAGetGhostCorners(da,&gxs,0,0,&gnx,0,0);CHKERRQ(ierr);
1289ce308e1dSBarry Smith 
1290ce308e1dSBarry Smith   ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr);
12911795a4d1SJed Brown   ierr = PetscCalloc2(nx*nc,&cols,nx*nc,&ocols);CHKERRQ(ierr);
1292ce308e1dSBarry Smith 
1293ce308e1dSBarry Smith   /*
1294ce308e1dSBarry Smith         note should be smaller for first and last process with no periodic
1295ce308e1dSBarry Smith         does not handle dfill
1296ce308e1dSBarry Smith   */
1297ce308e1dSBarry Smith   cnt = 0;
1298ce308e1dSBarry Smith   /* coupling with process to the left */
1299ce308e1dSBarry Smith   for (i=0; i<s; i++) {
1300ce308e1dSBarry Smith     for (j=0; j<nc; j++) {
1301ce308e1dSBarry Smith       ocols[cnt] = ((!rank) ? 0 : (s - i)*(ofill[j+1] - ofill[j]));
13020acb5bebSBarry Smith       cols[cnt]  = dfill[j+1] - dfill[j] + (s + i)*(ofill[j+1] - ofill[j]);
1303c0ab637bSBarry Smith       maxcnt = PetscMax(maxcnt,ocols[cnt]+cols[cnt]);
1304ce308e1dSBarry Smith       cnt++;
1305ce308e1dSBarry Smith     }
1306ce308e1dSBarry Smith   }
1307ce308e1dSBarry Smith   for (i=s; i<nx-s; i++) {
1308ce308e1dSBarry Smith     for (j=0; j<nc; j++) {
13090acb5bebSBarry Smith       cols[cnt] = dfill[j+1] - dfill[j] + 2*s*(ofill[j+1] - ofill[j]);
1310c0ab637bSBarry Smith       maxcnt = PetscMax(maxcnt,ocols[cnt]+cols[cnt]);
1311ce308e1dSBarry Smith       cnt++;
1312ce308e1dSBarry Smith     }
1313ce308e1dSBarry Smith   }
1314ce308e1dSBarry Smith   /* coupling with process to the right */
1315ce308e1dSBarry Smith   for (i=nx-s; i<nx; i++) {
1316ce308e1dSBarry Smith     for (j=0; j<nc; j++) {
1317ce308e1dSBarry Smith       ocols[cnt] = ((rank == (size-1)) ? 0 : (i - nx + s + 1)*(ofill[j+1] - ofill[j]));
13180acb5bebSBarry Smith       cols[cnt]  = dfill[j+1] - dfill[j] + (s + nx - i - 1)*(ofill[j+1] - ofill[j]);
1319c0ab637bSBarry Smith       maxcnt = PetscMax(maxcnt,ocols[cnt]+cols[cnt]);
1320ce308e1dSBarry Smith       cnt++;
1321ce308e1dSBarry Smith     }
1322ce308e1dSBarry Smith   }
1323ce308e1dSBarry Smith 
1324ce308e1dSBarry Smith   ierr = MatSeqAIJSetPreallocation(J,0,cols);CHKERRQ(ierr);
1325ce308e1dSBarry Smith   ierr = MatMPIAIJSetPreallocation(J,0,cols,0,ocols);CHKERRQ(ierr);
1326ce308e1dSBarry Smith   ierr = PetscFree2(cols,ocols);CHKERRQ(ierr);
1327ce308e1dSBarry Smith 
1328ce308e1dSBarry Smith   ierr = DMGetLocalToGlobalMapping(da,&ltog);CHKERRQ(ierr);
1329ce308e1dSBarry Smith   ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr);
1330ce308e1dSBarry Smith 
1331ce308e1dSBarry Smith   /*
1332ce308e1dSBarry Smith     For each node in the grid: we get the neighbors in the local (on processor ordering
1333ce308e1dSBarry Smith     that includes the ghost points) then MatSetValuesLocal() maps those indices to the global
1334ce308e1dSBarry Smith     PETSc ordering.
1335ce308e1dSBarry Smith   */
1336ce308e1dSBarry Smith   if (!da->prealloc_only) {
1337c0ab637bSBarry Smith     ierr = PetscCalloc2(maxcnt,&values,maxcnt,&cols);CHKERRQ(ierr);
1338ce308e1dSBarry Smith 
1339ce308e1dSBarry Smith     row = xs*nc;
1340ce308e1dSBarry Smith     /* coupling with process to the left */
1341ce308e1dSBarry Smith     for (i=xs; i<xs+s; i++) {
1342ce308e1dSBarry Smith       for (j=0; j<nc; j++) {
1343ce308e1dSBarry Smith         cnt = 0;
1344ce308e1dSBarry Smith         if (rank) {
1345ce308e1dSBarry Smith           for (l=0; l<s; l++) {
1346ce308e1dSBarry Smith             for (k=ofill[j]; k<ofill[j+1]; k++) cols[cnt++] = (i - s + l)*nc + ofill[k];
1347ce308e1dSBarry Smith           }
1348ce308e1dSBarry Smith         }
13490acb5bebSBarry Smith         if (dfill) {
13500acb5bebSBarry Smith           for (k=dfill[j]; k<dfill[j+1]; k++) {
13510acb5bebSBarry Smith             cols[cnt++] = i*nc + dfill[k];
13520acb5bebSBarry Smith           }
13530acb5bebSBarry Smith         } else {
1354ce308e1dSBarry Smith           for (k=0; k<nc; k++) {
1355ce308e1dSBarry Smith             cols[cnt++] = i*nc + k;
1356ce308e1dSBarry Smith           }
13570acb5bebSBarry Smith         }
1358ce308e1dSBarry Smith         for (l=0; l<s; l++) {
1359ce308e1dSBarry Smith           for (k=ofill[j]; k<ofill[j+1]; k++) cols[cnt++] = (i + s - l)*nc + ofill[k];
1360ce308e1dSBarry Smith         }
1361ce308e1dSBarry Smith         ierr = MatSetValues(J,1,&row,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
1362ce308e1dSBarry Smith         row++;
1363ce308e1dSBarry Smith       }
1364ce308e1dSBarry Smith     }
1365ce308e1dSBarry Smith     for (i=xs+s; i<xs+nx-s; i++) {
1366ce308e1dSBarry Smith       for (j=0; j<nc; j++) {
1367ce308e1dSBarry Smith         cnt = 0;
1368ce308e1dSBarry Smith         for (l=0; l<s; l++) {
1369ce308e1dSBarry Smith           for (k=ofill[j]; k<ofill[j+1]; k++) cols[cnt++] = (i - s + l)*nc + ofill[k];
1370ce308e1dSBarry Smith         }
13710acb5bebSBarry Smith         if (dfill) {
13720acb5bebSBarry Smith           for (k=dfill[j]; k<dfill[j+1]; k++) {
13730acb5bebSBarry Smith             cols[cnt++] = i*nc + dfill[k];
13740acb5bebSBarry Smith           }
13750acb5bebSBarry Smith         } else {
1376ce308e1dSBarry Smith           for (k=0; k<nc; k++) {
1377ce308e1dSBarry Smith             cols[cnt++] = i*nc + k;
1378ce308e1dSBarry Smith           }
13790acb5bebSBarry Smith         }
1380ce308e1dSBarry Smith         for (l=0; l<s; l++) {
1381ce308e1dSBarry Smith           for (k=ofill[j]; k<ofill[j+1]; k++) cols[cnt++] = (i + s - l)*nc + ofill[k];
1382ce308e1dSBarry Smith         }
1383ce308e1dSBarry Smith         ierr = MatSetValues(J,1,&row,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
1384ce308e1dSBarry Smith         row++;
1385ce308e1dSBarry Smith       }
1386ce308e1dSBarry Smith     }
1387ce308e1dSBarry Smith     /* coupling with process to the right */
1388ce308e1dSBarry Smith     for (i=xs+nx-s; i<xs+nx; i++) {
1389ce308e1dSBarry Smith       for (j=0; j<nc; j++) {
1390ce308e1dSBarry Smith         cnt = 0;
1391ce308e1dSBarry Smith         for (l=0; l<s; l++) {
1392ce308e1dSBarry Smith           for (k=ofill[j]; k<ofill[j+1]; k++) cols[cnt++] = (i - s + l)*nc + ofill[k];
1393ce308e1dSBarry Smith         }
13940acb5bebSBarry Smith         if (dfill) {
13950acb5bebSBarry Smith           for (k=dfill[j]; k<dfill[j+1]; k++) {
13960acb5bebSBarry Smith             cols[cnt++] = i*nc + dfill[k];
13970acb5bebSBarry Smith           }
13980acb5bebSBarry Smith         } else {
1399ce308e1dSBarry Smith           for (k=0; k<nc; k++) {
1400ce308e1dSBarry Smith             cols[cnt++] = i*nc + k;
1401ce308e1dSBarry Smith           }
14020acb5bebSBarry Smith         }
1403ce308e1dSBarry Smith         if (rank < size-1) {
1404ce308e1dSBarry Smith           for (l=0; l<s; l++) {
1405ce308e1dSBarry Smith             for (k=ofill[j]; k<ofill[j+1]; k++) cols[cnt++] = (i + s - l)*nc + ofill[k];
1406ce308e1dSBarry Smith           }
1407ce308e1dSBarry Smith         }
1408ce308e1dSBarry Smith         ierr = MatSetValues(J,1,&row,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
1409ce308e1dSBarry Smith         row++;
1410ce308e1dSBarry Smith       }
1411ce308e1dSBarry Smith     }
1412c0ab637bSBarry Smith     ierr = PetscFree2(values,cols);CHKERRQ(ierr);
1413ce308e1dSBarry Smith     ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1414ce308e1dSBarry Smith     ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1415189e4007SBarry Smith     ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr);
1416ce308e1dSBarry Smith   }
1417ce308e1dSBarry Smith   PetscFunctionReturn(0);
1418ce308e1dSBarry Smith }
1419ce308e1dSBarry Smith 
1420ce308e1dSBarry Smith /* ---------------------------------------------------------------------------------*/
1421ce308e1dSBarry Smith 
1422950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_1d_MPIAIJ(DM da,Mat J)
142347c6ae99SBarry Smith {
142447c6ae99SBarry Smith   PetscErrorCode         ierr;
142547c6ae99SBarry Smith   PetscInt               xs,nx,i,i1,slot,gxs,gnx;
14260298fd71SBarry Smith   PetscInt               m,dim,s,*cols = NULL,nc,*rows = NULL,col,cnt,l;
142747c6ae99SBarry Smith   PetscInt               istart,iend;
142847c6ae99SBarry Smith   PetscScalar            *values;
1429bff4a2f0SMatthew G. Knepley   DMBoundaryType         bx;
143045b6f7e9SBarry Smith   ISLocalToGlobalMapping ltog;
143147c6ae99SBarry Smith 
143247c6ae99SBarry Smith   PetscFunctionBegin;
143347c6ae99SBarry Smith   /*
143447c6ae99SBarry Smith          nc - number of components per grid point
143547c6ae99SBarry Smith          col - number of colors needed in one direction for single component problem
143647c6ae99SBarry Smith 
143747c6ae99SBarry Smith   */
14381321219cSEthan Coon   ierr = DMDAGetInfo(da,&dim,&m,0,0,0,0,0,&nc,&s,&bx,0,0,0);CHKERRQ(ierr);
143947c6ae99SBarry Smith   col  = 2*s + 1;
144047c6ae99SBarry Smith 
1441aa219208SBarry Smith   ierr = DMDAGetCorners(da,&xs,0,0,&nx,0,0);CHKERRQ(ierr);
1442aa219208SBarry Smith   ierr = DMDAGetGhostCorners(da,&gxs,0,0,&gnx,0,0);CHKERRQ(ierr);
144347c6ae99SBarry Smith 
1444f73d5cc4SBarry Smith   ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr);
144547c6ae99SBarry Smith   ierr = MatSeqAIJSetPreallocation(J,col*nc,0);CHKERRQ(ierr);
144647c6ae99SBarry Smith   ierr = MatMPIAIJSetPreallocation(J,col*nc,0,col*nc,0);CHKERRQ(ierr);
144747c6ae99SBarry Smith 
14481411c6eeSJed Brown   ierr = DMGetLocalToGlobalMapping(da,&ltog);CHKERRQ(ierr);
1449784ac674SJed Brown   ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr);
145047c6ae99SBarry Smith 
145147c6ae99SBarry Smith   /*
145247c6ae99SBarry Smith     For each node in the grid: we get the neighbors in the local (on processor ordering
145347c6ae99SBarry Smith     that includes the ghost points) then MatSetValuesLocal() maps those indices to the global
145447c6ae99SBarry Smith     PETSc ordering.
145547c6ae99SBarry Smith   */
1456fcfd50ebSBarry Smith   if (!da->prealloc_only) {
1457dcca6d9dSJed Brown     ierr = PetscMalloc2(nc,&rows,col*nc*nc,&cols);CHKERRQ(ierr);
14581795a4d1SJed Brown     ierr = PetscCalloc1(col*nc*nc,&values);CHKERRQ(ierr);
145947c6ae99SBarry Smith     for (i=xs; i<xs+nx; i++) {
146047c6ae99SBarry Smith       istart = PetscMax(-s,gxs - i);
146147c6ae99SBarry Smith       iend   = PetscMin(s,gxs + gnx - i - 1);
146247c6ae99SBarry Smith       slot   = i - gxs;
146347c6ae99SBarry Smith 
146447c6ae99SBarry Smith       cnt = 0;
146547c6ae99SBarry Smith       for (l=0; l<nc; l++) {
146647c6ae99SBarry Smith         for (i1=istart; i1<iend+1; i1++) {
146747c6ae99SBarry Smith           cols[cnt++] = l + nc*(slot + i1);
146847c6ae99SBarry Smith         }
146947c6ae99SBarry Smith         rows[l] = l + nc*(slot);
147047c6ae99SBarry Smith       }
147147c6ae99SBarry Smith       ierr = MatSetValuesLocal(J,nc,rows,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
147247c6ae99SBarry Smith     }
147347c6ae99SBarry Smith     ierr = PetscFree(values);CHKERRQ(ierr);
147447c6ae99SBarry Smith     ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
147547c6ae99SBarry Smith     ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1476189e4007SBarry Smith     ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr);
147747c6ae99SBarry Smith     ierr = PetscFree2(rows,cols);CHKERRQ(ierr);
1478ce308e1dSBarry Smith   }
147947c6ae99SBarry Smith   PetscFunctionReturn(0);
148047c6ae99SBarry Smith }
148147c6ae99SBarry Smith 
1482950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_2d_MPIBAIJ(DM da,Mat J)
148347c6ae99SBarry Smith {
148447c6ae99SBarry Smith   PetscErrorCode         ierr;
148547c6ae99SBarry Smith   PetscInt               xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny;
148647c6ae99SBarry Smith   PetscInt               m,n,dim,s,*cols,nc,col,cnt,*dnz,*onz;
148747c6ae99SBarry Smith   PetscInt               istart,iend,jstart,jend,ii,jj;
148847c6ae99SBarry Smith   MPI_Comm               comm;
148947c6ae99SBarry Smith   PetscScalar            *values;
1490bff4a2f0SMatthew G. Knepley   DMBoundaryType         bx,by;
1491aa219208SBarry Smith   DMDAStencilType        st;
149245b6f7e9SBarry Smith   ISLocalToGlobalMapping ltog;
149347c6ae99SBarry Smith 
149447c6ae99SBarry Smith   PetscFunctionBegin;
149547c6ae99SBarry Smith   /*
149647c6ae99SBarry Smith      nc - number of components per grid point
149747c6ae99SBarry Smith      col - number of colors needed in one direction for single component problem
149847c6ae99SBarry Smith   */
14991321219cSEthan Coon   ierr = DMDAGetInfo(da,&dim,&m,&n,0,0,0,0,&nc,&s,&bx,&by,0,&st);CHKERRQ(ierr);
150047c6ae99SBarry Smith   col  = 2*s + 1;
150147c6ae99SBarry Smith 
1502aa219208SBarry Smith   ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr);
1503aa219208SBarry Smith   ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr);
150447c6ae99SBarry Smith   ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr);
150547c6ae99SBarry Smith 
1506785e854fSJed Brown   ierr = PetscMalloc1(col*col*nc*nc,&cols);CHKERRQ(ierr);
150747c6ae99SBarry Smith 
15081411c6eeSJed Brown   ierr = DMGetLocalToGlobalMapping(da,&ltog);CHKERRQ(ierr);
150947c6ae99SBarry Smith 
151047c6ae99SBarry Smith   /* determine the matrix preallocation information */
151147c6ae99SBarry Smith   ierr = MatPreallocateInitialize(comm,nx*ny,nx*ny,dnz,onz);CHKERRQ(ierr);
151247c6ae99SBarry Smith   for (i=xs; i<xs+nx; i++) {
1513bff4a2f0SMatthew G. Knepley     istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
1514bff4a2f0SMatthew G. Knepley     iend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
151547c6ae99SBarry Smith     for (j=ys; j<ys+ny; j++) {
1516bff4a2f0SMatthew G. Knepley       jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
1517bff4a2f0SMatthew G. Knepley       jend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
151847c6ae99SBarry Smith       slot   = i - gxs + gnx*(j - gys);
151947c6ae99SBarry Smith 
152047c6ae99SBarry Smith       /* Find block columns in block row */
152147c6ae99SBarry Smith       cnt = 0;
152247c6ae99SBarry Smith       for (ii=istart; ii<iend+1; ii++) {
152347c6ae99SBarry Smith         for (jj=jstart; jj<jend+1; jj++) {
1524aa219208SBarry Smith           if (st == DMDA_STENCIL_BOX || !ii || !jj) { /* BOX or on the STAR */
152547c6ae99SBarry Smith             cols[cnt++] = slot + ii + gnx*jj;
152647c6ae99SBarry Smith           }
152747c6ae99SBarry Smith         }
152847c6ae99SBarry Smith       }
1529d6e23781SBarry Smith       ierr = MatPreallocateSetLocalBlock(ltog,1,&slot,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr);
153047c6ae99SBarry Smith     }
153147c6ae99SBarry Smith   }
153247c6ae99SBarry Smith   ierr = MatSeqBAIJSetPreallocation(J,nc,0,dnz);CHKERRQ(ierr);
153347c6ae99SBarry Smith   ierr = MatMPIBAIJSetPreallocation(J,nc,0,dnz,0,onz);CHKERRQ(ierr);
153447c6ae99SBarry Smith   ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr);
153547c6ae99SBarry Smith 
1536784ac674SJed Brown   ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr);
153747c6ae99SBarry Smith 
153847c6ae99SBarry Smith   /*
153947c6ae99SBarry Smith     For each node in the grid: we get the neighbors in the local (on processor ordering
154047c6ae99SBarry Smith     that includes the ghost points) then MatSetValuesLocal() maps those indices to the global
154147c6ae99SBarry Smith     PETSc ordering.
154247c6ae99SBarry Smith   */
1543fcfd50ebSBarry Smith   if (!da->prealloc_only) {
15441795a4d1SJed Brown     ierr = PetscCalloc1(col*col*nc*nc,&values);CHKERRQ(ierr);
154547c6ae99SBarry Smith     for (i=xs; i<xs+nx; i++) {
1546bff4a2f0SMatthew G. Knepley       istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
1547bff4a2f0SMatthew G. Knepley       iend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
154847c6ae99SBarry Smith       for (j=ys; j<ys+ny; j++) {
1549bff4a2f0SMatthew G. Knepley         jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
1550bff4a2f0SMatthew G. Knepley         jend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
155147c6ae99SBarry Smith         slot = i - gxs + gnx*(j - gys);
155247c6ae99SBarry Smith         cnt  = 0;
155347c6ae99SBarry Smith         for (ii=istart; ii<iend+1; ii++) {
155447c6ae99SBarry Smith           for (jj=jstart; jj<jend+1; jj++) {
1555aa219208SBarry Smith             if (st == DMDA_STENCIL_BOX || !ii || !jj) { /* BOX or on the STAR */
155647c6ae99SBarry Smith               cols[cnt++] = slot + ii + gnx*jj;
155747c6ae99SBarry Smith             }
155847c6ae99SBarry Smith           }
155947c6ae99SBarry Smith         }
156047c6ae99SBarry Smith         ierr = MatSetValuesBlockedLocal(J,1,&slot,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
156147c6ae99SBarry Smith       }
156247c6ae99SBarry Smith     }
156347c6ae99SBarry Smith     ierr = PetscFree(values);CHKERRQ(ierr);
156447c6ae99SBarry Smith     ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
156547c6ae99SBarry Smith     ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1566189e4007SBarry Smith     ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr);
156747c6ae99SBarry Smith   }
156847c6ae99SBarry Smith   ierr = PetscFree(cols);CHKERRQ(ierr);
156947c6ae99SBarry Smith   PetscFunctionReturn(0);
157047c6ae99SBarry Smith }
157147c6ae99SBarry Smith 
1572950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_3d_MPIBAIJ(DM da,Mat J)
157347c6ae99SBarry Smith {
157447c6ae99SBarry Smith   PetscErrorCode         ierr;
157547c6ae99SBarry Smith   PetscInt               xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny;
157647c6ae99SBarry Smith   PetscInt               m,n,dim,s,*cols,k,nc,col,cnt,p,*dnz,*onz;
157747c6ae99SBarry Smith   PetscInt               istart,iend,jstart,jend,kstart,kend,zs,nz,gzs,gnz,ii,jj,kk;
157847c6ae99SBarry Smith   MPI_Comm               comm;
157947c6ae99SBarry Smith   PetscScalar            *values;
1580bff4a2f0SMatthew G. Knepley   DMBoundaryType         bx,by,bz;
1581aa219208SBarry Smith   DMDAStencilType        st;
158245b6f7e9SBarry Smith   ISLocalToGlobalMapping ltog;
158347c6ae99SBarry Smith 
158447c6ae99SBarry Smith   PetscFunctionBegin;
158547c6ae99SBarry Smith   /*
158647c6ae99SBarry Smith          nc - number of components per grid point
158747c6ae99SBarry Smith          col - number of colors needed in one direction for single component problem
158847c6ae99SBarry Smith 
158947c6ae99SBarry Smith   */
15901321219cSEthan Coon   ierr = DMDAGetInfo(da,&dim,&m,&n,&p,0,0,0,&nc,&s,&bx,&by,&bz,&st);CHKERRQ(ierr);
159147c6ae99SBarry Smith   col  = 2*s + 1;
159247c6ae99SBarry Smith 
1593aa219208SBarry Smith   ierr = DMDAGetCorners(da,&xs,&ys,&zs,&nx,&ny,&nz);CHKERRQ(ierr);
1594aa219208SBarry Smith   ierr = DMDAGetGhostCorners(da,&gxs,&gys,&gzs,&gnx,&gny,&gnz);CHKERRQ(ierr);
159547c6ae99SBarry Smith   ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr);
159647c6ae99SBarry Smith 
1597785e854fSJed Brown   ierr = PetscMalloc1(col*col*col,&cols);CHKERRQ(ierr);
159847c6ae99SBarry Smith 
15991411c6eeSJed Brown   ierr = DMGetLocalToGlobalMapping(da,&ltog);CHKERRQ(ierr);
160047c6ae99SBarry Smith 
160147c6ae99SBarry Smith   /* determine the matrix preallocation information */
160247c6ae99SBarry Smith   ierr = MatPreallocateInitialize(comm,nx*ny*nz,nx*ny*nz,dnz,onz);CHKERRQ(ierr);
160347c6ae99SBarry Smith   for (i=xs; i<xs+nx; i++) {
1604bff4a2f0SMatthew G. Knepley     istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
1605bff4a2f0SMatthew G. Knepley     iend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
160647c6ae99SBarry Smith     for (j=ys; j<ys+ny; j++) {
1607bff4a2f0SMatthew G. Knepley       jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
1608bff4a2f0SMatthew G. Knepley       jend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
160947c6ae99SBarry Smith       for (k=zs; k<zs+nz; k++) {
1610bff4a2f0SMatthew G. Knepley         kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k));
1611bff4a2f0SMatthew G. Knepley         kend   = (bz == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,p-k-1));
161247c6ae99SBarry Smith 
161347c6ae99SBarry Smith         slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs);
161447c6ae99SBarry Smith 
161547c6ae99SBarry Smith         /* Find block columns in block row */
161647c6ae99SBarry Smith         cnt = 0;
161747c6ae99SBarry Smith         for (ii=istart; ii<iend+1; ii++) {
161847c6ae99SBarry Smith           for (jj=jstart; jj<jend+1; jj++) {
161947c6ae99SBarry Smith             for (kk=kstart; kk<kend+1; kk++) {
1620aa219208SBarry Smith               if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/
162147c6ae99SBarry Smith                 cols[cnt++] = slot + ii + gnx*jj + gnx*gny*kk;
162247c6ae99SBarry Smith               }
162347c6ae99SBarry Smith             }
162447c6ae99SBarry Smith           }
162547c6ae99SBarry Smith         }
1626d6e23781SBarry Smith         ierr = MatPreallocateSetLocalBlock(ltog,1,&slot,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr);
162747c6ae99SBarry Smith       }
162847c6ae99SBarry Smith     }
162947c6ae99SBarry Smith   }
163047c6ae99SBarry Smith   ierr = MatSeqBAIJSetPreallocation(J,nc,0,dnz);CHKERRQ(ierr);
163147c6ae99SBarry Smith   ierr = MatMPIBAIJSetPreallocation(J,nc,0,dnz,0,onz);CHKERRQ(ierr);
163247c6ae99SBarry Smith   ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr);
163347c6ae99SBarry Smith 
1634784ac674SJed Brown   ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr);
163547c6ae99SBarry Smith 
163647c6ae99SBarry Smith   /*
163747c6ae99SBarry Smith     For each node in the grid: we get the neighbors in the local (on processor ordering
163847c6ae99SBarry Smith     that includes the ghost points) then MatSetValuesLocal() maps those indices to the global
163947c6ae99SBarry Smith     PETSc ordering.
164047c6ae99SBarry Smith   */
1641fcfd50ebSBarry Smith   if (!da->prealloc_only) {
16421795a4d1SJed Brown     ierr = PetscCalloc1(col*col*col*nc*nc,&values);CHKERRQ(ierr);
164347c6ae99SBarry Smith     for (i=xs; i<xs+nx; i++) {
1644bff4a2f0SMatthew G. Knepley       istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
1645bff4a2f0SMatthew G. Knepley       iend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
164647c6ae99SBarry Smith       for (j=ys; j<ys+ny; j++) {
1647bff4a2f0SMatthew G. Knepley         jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
1648bff4a2f0SMatthew G. Knepley         jend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
164947c6ae99SBarry Smith         for (k=zs; k<zs+nz; k++) {
1650bff4a2f0SMatthew G. Knepley           kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k));
1651bff4a2f0SMatthew G. Knepley           kend   = (bz == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,p-k-1));
165247c6ae99SBarry Smith 
165347c6ae99SBarry Smith           slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs);
165447c6ae99SBarry Smith 
165547c6ae99SBarry Smith           cnt = 0;
165647c6ae99SBarry Smith           for (ii=istart; ii<iend+1; ii++) {
165747c6ae99SBarry Smith             for (jj=jstart; jj<jend+1; jj++) {
165847c6ae99SBarry Smith               for (kk=kstart; kk<kend+1; kk++) {
1659aa219208SBarry Smith                 if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/
166047c6ae99SBarry Smith                   cols[cnt++] = slot + ii + gnx*jj + gnx*gny*kk;
166147c6ae99SBarry Smith                 }
166247c6ae99SBarry Smith               }
166347c6ae99SBarry Smith             }
166447c6ae99SBarry Smith           }
166547c6ae99SBarry Smith           ierr = MatSetValuesBlockedLocal(J,1,&slot,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
166647c6ae99SBarry Smith         }
166747c6ae99SBarry Smith       }
166847c6ae99SBarry Smith     }
166947c6ae99SBarry Smith     ierr = PetscFree(values);CHKERRQ(ierr);
167047c6ae99SBarry Smith     ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
167147c6ae99SBarry Smith     ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1672189e4007SBarry Smith     ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr);
167347c6ae99SBarry Smith   }
167447c6ae99SBarry Smith   ierr = PetscFree(cols);CHKERRQ(ierr);
167547c6ae99SBarry Smith   PetscFunctionReturn(0);
167647c6ae99SBarry Smith }
167747c6ae99SBarry Smith 
167847c6ae99SBarry Smith /*
167947c6ae99SBarry Smith   This helper is for of SBAIJ preallocation, to discard the lower-triangular values which are difficult to
168047c6ae99SBarry Smith   identify in the local ordering with periodic domain.
168147c6ae99SBarry Smith */
168247c6ae99SBarry Smith static PetscErrorCode L2GFilterUpperTriangular(ISLocalToGlobalMapping ltog,PetscInt *row,PetscInt *cnt,PetscInt col[])
168347c6ae99SBarry Smith {
168447c6ae99SBarry Smith   PetscErrorCode ierr;
168547c6ae99SBarry Smith   PetscInt       i,n;
168647c6ae99SBarry Smith 
168747c6ae99SBarry Smith   PetscFunctionBegin;
1688d6e23781SBarry Smith   ierr = ISLocalToGlobalMappingApplyBlock(ltog,1,row,row);CHKERRQ(ierr);
1689d6e23781SBarry Smith   ierr = ISLocalToGlobalMappingApplyBlock(ltog,*cnt,col,col);CHKERRQ(ierr);
169047c6ae99SBarry Smith   for (i=0,n=0; i<*cnt; i++) {
169147c6ae99SBarry Smith     if (col[i] >= *row) col[n++] = col[i];
169247c6ae99SBarry Smith   }
169347c6ae99SBarry Smith   *cnt = n;
169447c6ae99SBarry Smith   PetscFunctionReturn(0);
169547c6ae99SBarry Smith }
169647c6ae99SBarry Smith 
1697950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_2d_MPISBAIJ(DM da,Mat J)
169847c6ae99SBarry Smith {
169947c6ae99SBarry Smith   PetscErrorCode         ierr;
170047c6ae99SBarry Smith   PetscInt               xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny;
170147c6ae99SBarry Smith   PetscInt               m,n,dim,s,*cols,nc,col,cnt,*dnz,*onz;
170247c6ae99SBarry Smith   PetscInt               istart,iend,jstart,jend,ii,jj;
170347c6ae99SBarry Smith   MPI_Comm               comm;
170447c6ae99SBarry Smith   PetscScalar            *values;
1705bff4a2f0SMatthew G. Knepley   DMBoundaryType         bx,by;
1706aa219208SBarry Smith   DMDAStencilType        st;
170745b6f7e9SBarry Smith   ISLocalToGlobalMapping ltog;
170847c6ae99SBarry Smith 
170947c6ae99SBarry Smith   PetscFunctionBegin;
171047c6ae99SBarry Smith   /*
171147c6ae99SBarry Smith      nc - number of components per grid point
171247c6ae99SBarry Smith      col - number of colors needed in one direction for single component problem
171347c6ae99SBarry Smith   */
17141321219cSEthan Coon   ierr = DMDAGetInfo(da,&dim,&m,&n,0,0,0,0,&nc,&s,&bx,&by,0,&st);CHKERRQ(ierr);
171547c6ae99SBarry Smith   col  = 2*s + 1;
171647c6ae99SBarry Smith 
1717aa219208SBarry Smith   ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr);
1718aa219208SBarry Smith   ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr);
171947c6ae99SBarry Smith   ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr);
172047c6ae99SBarry Smith 
1721785e854fSJed Brown   ierr = PetscMalloc1(col*col*nc*nc,&cols);CHKERRQ(ierr);
172247c6ae99SBarry Smith 
17231411c6eeSJed Brown   ierr = DMGetLocalToGlobalMapping(da,&ltog);CHKERRQ(ierr);
172447c6ae99SBarry Smith 
172547c6ae99SBarry Smith   /* determine the matrix preallocation information */
1726eabe889fSLisandro Dalcin   ierr = MatPreallocateInitialize(comm,nx*ny,nx*ny,dnz,onz);CHKERRQ(ierr);
172747c6ae99SBarry Smith   for (i=xs; i<xs+nx; i++) {
1728bff4a2f0SMatthew G. Knepley     istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
1729bff4a2f0SMatthew G. Knepley     iend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
173047c6ae99SBarry Smith     for (j=ys; j<ys+ny; j++) {
1731bff4a2f0SMatthew G. Knepley       jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
1732bff4a2f0SMatthew G. Knepley       jend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
173347c6ae99SBarry Smith       slot   = i - gxs + gnx*(j - gys);
173447c6ae99SBarry Smith 
173547c6ae99SBarry Smith       /* Find block columns in block row */
173647c6ae99SBarry Smith       cnt = 0;
173747c6ae99SBarry Smith       for (ii=istart; ii<iend+1; ii++) {
173847c6ae99SBarry Smith         for (jj=jstart; jj<jend+1; jj++) {
1739aa219208SBarry Smith           if (st == DMDA_STENCIL_BOX || !ii || !jj) {
174047c6ae99SBarry Smith             cols[cnt++] = slot + ii + gnx*jj;
174147c6ae99SBarry Smith           }
174247c6ae99SBarry Smith         }
174347c6ae99SBarry Smith       }
174445b6f7e9SBarry Smith       ierr = L2GFilterUpperTriangular(ltog,&slot,&cnt,cols);CHKERRQ(ierr);
1745d6e23781SBarry Smith       ierr = MatPreallocateSymmetricSetBlock(slot,cnt,cols,dnz,onz);CHKERRQ(ierr);
174647c6ae99SBarry Smith     }
174747c6ae99SBarry Smith   }
174847c6ae99SBarry Smith   ierr = MatSeqSBAIJSetPreallocation(J,nc,0,dnz);CHKERRQ(ierr);
174947c6ae99SBarry Smith   ierr = MatMPISBAIJSetPreallocation(J,nc,0,dnz,0,onz);CHKERRQ(ierr);
175047c6ae99SBarry Smith   ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr);
175147c6ae99SBarry Smith 
1752784ac674SJed Brown   ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr);
175347c6ae99SBarry Smith 
175447c6ae99SBarry Smith   /*
175547c6ae99SBarry Smith     For each node in the grid: we get the neighbors in the local (on processor ordering
175647c6ae99SBarry Smith     that includes the ghost points) then MatSetValuesLocal() maps those indices to the global
175747c6ae99SBarry Smith     PETSc ordering.
175847c6ae99SBarry Smith   */
1759fcfd50ebSBarry Smith   if (!da->prealloc_only) {
17601795a4d1SJed Brown     ierr = PetscCalloc1(col*col*nc*nc,&values);CHKERRQ(ierr);
176147c6ae99SBarry Smith     for (i=xs; i<xs+nx; i++) {
1762bff4a2f0SMatthew G. Knepley       istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
1763bff4a2f0SMatthew G. Knepley       iend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
176447c6ae99SBarry Smith       for (j=ys; j<ys+ny; j++) {
1765bff4a2f0SMatthew G. Knepley         jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
1766bff4a2f0SMatthew G. Knepley         jend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
176747c6ae99SBarry Smith         slot   = i - gxs + gnx*(j - gys);
176847c6ae99SBarry Smith 
176947c6ae99SBarry Smith         /* Find block columns in block row */
177047c6ae99SBarry Smith         cnt = 0;
177147c6ae99SBarry Smith         for (ii=istart; ii<iend+1; ii++) {
177247c6ae99SBarry Smith           for (jj=jstart; jj<jend+1; jj++) {
1773aa219208SBarry Smith             if (st == DMDA_STENCIL_BOX || !ii || !jj) {
177447c6ae99SBarry Smith               cols[cnt++] = slot + ii + gnx*jj;
177547c6ae99SBarry Smith             }
177647c6ae99SBarry Smith           }
177747c6ae99SBarry Smith         }
177845b6f7e9SBarry Smith         ierr = L2GFilterUpperTriangular(ltog,&slot,&cnt,cols);CHKERRQ(ierr);
177947c6ae99SBarry Smith         ierr = MatSetValuesBlocked(J,1,&slot,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
178047c6ae99SBarry Smith       }
178147c6ae99SBarry Smith     }
178247c6ae99SBarry Smith     ierr = PetscFree(values);CHKERRQ(ierr);
178347c6ae99SBarry Smith     ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
178447c6ae99SBarry Smith     ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1785189e4007SBarry Smith     ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr);
178647c6ae99SBarry Smith   }
178747c6ae99SBarry Smith   ierr = PetscFree(cols);CHKERRQ(ierr);
178847c6ae99SBarry Smith   PetscFunctionReturn(0);
178947c6ae99SBarry Smith }
179047c6ae99SBarry Smith 
1791950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_3d_MPISBAIJ(DM da,Mat J)
179247c6ae99SBarry Smith {
179347c6ae99SBarry Smith   PetscErrorCode         ierr;
179447c6ae99SBarry Smith   PetscInt               xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny;
179547c6ae99SBarry Smith   PetscInt               m,n,dim,s,*cols,k,nc,col,cnt,p,*dnz,*onz;
179647c6ae99SBarry Smith   PetscInt               istart,iend,jstart,jend,kstart,kend,zs,nz,gzs,gnz,ii,jj,kk;
179747c6ae99SBarry Smith   MPI_Comm               comm;
179847c6ae99SBarry Smith   PetscScalar            *values;
1799bff4a2f0SMatthew G. Knepley   DMBoundaryType         bx,by,bz;
1800aa219208SBarry Smith   DMDAStencilType        st;
180145b6f7e9SBarry Smith   ISLocalToGlobalMapping ltog;
180247c6ae99SBarry Smith 
180347c6ae99SBarry Smith   PetscFunctionBegin;
180447c6ae99SBarry Smith   /*
180547c6ae99SBarry Smith      nc - number of components per grid point
180647c6ae99SBarry Smith      col - number of colors needed in one direction for single component problem
180747c6ae99SBarry Smith   */
18081321219cSEthan Coon   ierr = DMDAGetInfo(da,&dim,&m,&n,&p,0,0,0,&nc,&s,&bx,&by,&bz,&st);CHKERRQ(ierr);
180947c6ae99SBarry Smith   col  = 2*s + 1;
181047c6ae99SBarry Smith 
1811aa219208SBarry Smith   ierr = DMDAGetCorners(da,&xs,&ys,&zs,&nx,&ny,&nz);CHKERRQ(ierr);
1812aa219208SBarry Smith   ierr = DMDAGetGhostCorners(da,&gxs,&gys,&gzs,&gnx,&gny,&gnz);CHKERRQ(ierr);
181347c6ae99SBarry Smith   ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr);
181447c6ae99SBarry Smith 
181547c6ae99SBarry Smith   /* create the matrix */
1816785e854fSJed Brown   ierr = PetscMalloc1(col*col*col,&cols);CHKERRQ(ierr);
181747c6ae99SBarry Smith 
18181411c6eeSJed Brown   ierr = DMGetLocalToGlobalMapping(da,&ltog);CHKERRQ(ierr);
181947c6ae99SBarry Smith 
182047c6ae99SBarry Smith   /* determine the matrix preallocation information */
1821eabe889fSLisandro Dalcin   ierr = MatPreallocateInitialize(comm,nx*ny*nz,nx*ny*nz,dnz,onz);CHKERRQ(ierr);
182247c6ae99SBarry Smith   for (i=xs; i<xs+nx; i++) {
1823bff4a2f0SMatthew G. Knepley     istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
1824bff4a2f0SMatthew G. Knepley     iend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
182547c6ae99SBarry Smith     for (j=ys; j<ys+ny; j++) {
1826bff4a2f0SMatthew G. Knepley       jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
1827bff4a2f0SMatthew G. Knepley       jend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
182847c6ae99SBarry Smith       for (k=zs; k<zs+nz; k++) {
1829bff4a2f0SMatthew G. Knepley         kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k));
1830bff4a2f0SMatthew G. Knepley         kend   = (bz == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,p-k-1));
183147c6ae99SBarry Smith 
183247c6ae99SBarry Smith         slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs);
183347c6ae99SBarry Smith 
183447c6ae99SBarry Smith         /* Find block columns in block row */
183547c6ae99SBarry Smith         cnt = 0;
183647c6ae99SBarry Smith         for (ii=istart; ii<iend+1; ii++) {
183747c6ae99SBarry Smith           for (jj=jstart; jj<jend+1; jj++) {
183847c6ae99SBarry Smith             for (kk=kstart; kk<kend+1; kk++) {
1839aa219208SBarry Smith               if ((st == DMDA_STENCIL_BOX) || (!ii && !jj) || (!jj && !kk) || (!ii && !kk)) {
184047c6ae99SBarry Smith                 cols[cnt++] = slot + ii + gnx*jj + gnx*gny*kk;
184147c6ae99SBarry Smith               }
184247c6ae99SBarry Smith             }
184347c6ae99SBarry Smith           }
184447c6ae99SBarry Smith         }
184545b6f7e9SBarry Smith         ierr = L2GFilterUpperTriangular(ltog,&slot,&cnt,cols);CHKERRQ(ierr);
1846d6e23781SBarry Smith         ierr = MatPreallocateSymmetricSetBlock(slot,cnt,cols,dnz,onz);CHKERRQ(ierr);
184747c6ae99SBarry Smith       }
184847c6ae99SBarry Smith     }
184947c6ae99SBarry Smith   }
185047c6ae99SBarry Smith   ierr = MatSeqSBAIJSetPreallocation(J,nc,0,dnz);CHKERRQ(ierr);
185147c6ae99SBarry Smith   ierr = MatMPISBAIJSetPreallocation(J,nc,0,dnz,0,onz);CHKERRQ(ierr);
185247c6ae99SBarry Smith   ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr);
185347c6ae99SBarry Smith 
1854784ac674SJed Brown   ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr);
185547c6ae99SBarry Smith 
185647c6ae99SBarry Smith   /*
185747c6ae99SBarry Smith     For each node in the grid: we get the neighbors in the local (on processor ordering
185847c6ae99SBarry Smith     that includes the ghost points) then MatSetValuesLocal() maps those indices to the global
185947c6ae99SBarry Smith     PETSc ordering.
186047c6ae99SBarry Smith   */
1861fcfd50ebSBarry Smith   if (!da->prealloc_only) {
18621795a4d1SJed Brown     ierr = PetscCalloc1(col*col*col*nc*nc,&values);CHKERRQ(ierr);
186347c6ae99SBarry Smith     for (i=xs; i<xs+nx; i++) {
1864bff4a2f0SMatthew G. Knepley       istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
1865bff4a2f0SMatthew G. Knepley       iend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
186647c6ae99SBarry Smith       for (j=ys; j<ys+ny; j++) {
1867bff4a2f0SMatthew G. Knepley         jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
1868bff4a2f0SMatthew G. Knepley         jend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
186947c6ae99SBarry Smith         for (k=zs; k<zs+nz; k++) {
1870bff4a2f0SMatthew G. Knepley           kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k));
1871bff4a2f0SMatthew G. Knepley           kend   = (bz == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,p-k-1));
187247c6ae99SBarry Smith 
187347c6ae99SBarry Smith           slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs);
187447c6ae99SBarry Smith 
187547c6ae99SBarry Smith           cnt = 0;
187647c6ae99SBarry Smith           for (ii=istart; ii<iend+1; ii++) {
187747c6ae99SBarry Smith             for (jj=jstart; jj<jend+1; jj++) {
187847c6ae99SBarry Smith               for (kk=kstart; kk<kend+1; kk++) {
1879aa219208SBarry Smith                 if ((st == DMDA_STENCIL_BOX) || (!ii && !jj) || (!jj && !kk) || (!ii && !kk)) {
188047c6ae99SBarry Smith                   cols[cnt++] = slot + ii + gnx*jj + gnx*gny*kk;
188147c6ae99SBarry Smith                 }
188247c6ae99SBarry Smith               }
188347c6ae99SBarry Smith             }
188447c6ae99SBarry Smith           }
188545b6f7e9SBarry Smith           ierr = L2GFilterUpperTriangular(ltog,&slot,&cnt,cols);CHKERRQ(ierr);
188647c6ae99SBarry Smith           ierr = MatSetValuesBlocked(J,1,&slot,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
188747c6ae99SBarry Smith         }
188847c6ae99SBarry Smith       }
188947c6ae99SBarry Smith     }
189047c6ae99SBarry Smith     ierr = PetscFree(values);CHKERRQ(ierr);
189147c6ae99SBarry Smith     ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
189247c6ae99SBarry Smith     ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1893189e4007SBarry Smith     ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr);
189447c6ae99SBarry Smith   }
189547c6ae99SBarry Smith   ierr = PetscFree(cols);CHKERRQ(ierr);
189647c6ae99SBarry Smith   PetscFunctionReturn(0);
189747c6ae99SBarry Smith }
189847c6ae99SBarry Smith 
189947c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/
190047c6ae99SBarry Smith 
1901950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_3d_MPIAIJ_Fill(DM da,Mat J)
190247c6ae99SBarry Smith {
190347c6ae99SBarry Smith   PetscErrorCode         ierr;
190447c6ae99SBarry Smith   PetscInt               xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny;
1905c0ab637bSBarry Smith   PetscInt               m,n,dim,s,*cols,k,nc,row,col,cnt, maxcnt = 0,l,p,*dnz,*onz;
1906c1154cd5SBarry Smith   PetscInt               istart,iend,jstart,jend,kstart,kend,zs,nz,gzs,gnz,ii,jj,kk,M,N,P;
190747c6ae99SBarry Smith   DM_DA                  *dd = (DM_DA*)da->data;
190847c6ae99SBarry Smith   PetscInt               ifill_col,*dfill = dd->dfill,*ofill = dd->ofill;
190947c6ae99SBarry Smith   MPI_Comm               comm;
191047c6ae99SBarry Smith   PetscScalar            *values;
1911bff4a2f0SMatthew G. Knepley   DMBoundaryType         bx,by,bz;
191245b6f7e9SBarry Smith   ISLocalToGlobalMapping ltog;
1913aa219208SBarry Smith   DMDAStencilType        st;
1914c1154cd5SBarry Smith   PetscBool              removedups = PETSC_FALSE;
191547c6ae99SBarry Smith 
191647c6ae99SBarry Smith   PetscFunctionBegin;
191747c6ae99SBarry Smith   /*
191847c6ae99SBarry Smith          nc - number of components per grid point
191947c6ae99SBarry Smith          col - number of colors needed in one direction for single component problem
192047c6ae99SBarry Smith 
192147c6ae99SBarry Smith   */
1922c1154cd5SBarry Smith   ierr = DMDAGetInfo(da,&dim,&m,&n,&p,&M,&N,&P,&nc,&s,&bx,&by,&bz,&st);CHKERRQ(ierr);
192347c6ae99SBarry Smith   col  = 2*s + 1;
1924bff4a2f0SMatthew G. Knepley   if (bx == DM_BOUNDARY_PERIODIC && (m % col)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in X is divisible\n\
192547c6ae99SBarry Smith                  by 2*stencil_width + 1\n");
1926bff4a2f0SMatthew G. Knepley   if (by == DM_BOUNDARY_PERIODIC && (n % col)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Y is divisible\n\
192747c6ae99SBarry Smith                  by 2*stencil_width + 1\n");
1928bff4a2f0SMatthew G. Knepley   if (bz == DM_BOUNDARY_PERIODIC && (p % col)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Z is divisible\n\
192947c6ae99SBarry Smith                  by 2*stencil_width + 1\n");
193047c6ae99SBarry Smith 
1931c1154cd5SBarry Smith   /*
1932c1154cd5SBarry Smith        With one processor in periodic domains in a skinny dimension the code will label nonzero columns multiple times
1933c1154cd5SBarry Smith        because of "wrapping" around the end of the domain hitting an entry already counted in the other direction.
1934c1154cd5SBarry Smith   */
1935c1154cd5SBarry Smith   if (M == 1 && 2*s >= m) removedups = PETSC_TRUE;
1936c1154cd5SBarry Smith   if (N == 1 && 2*s >= n) removedups = PETSC_TRUE;
1937c1154cd5SBarry Smith   if (P == 1 && 2*s >= p) removedups = PETSC_TRUE;
1938c1154cd5SBarry Smith 
1939aa219208SBarry Smith   ierr = DMDAGetCorners(da,&xs,&ys,&zs,&nx,&ny,&nz);CHKERRQ(ierr);
1940aa219208SBarry Smith   ierr = DMDAGetGhostCorners(da,&gxs,&gys,&gzs,&gnx,&gny,&gnz);CHKERRQ(ierr);
194147c6ae99SBarry Smith   ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr);
194247c6ae99SBarry Smith 
1943785e854fSJed Brown   ierr = PetscMalloc1(col*col*col*nc,&cols);CHKERRQ(ierr);
19441411c6eeSJed Brown   ierr = DMGetLocalToGlobalMapping(da,&ltog);CHKERRQ(ierr);
194547c6ae99SBarry Smith 
194647c6ae99SBarry Smith   /* determine the matrix preallocation information */
194747c6ae99SBarry Smith   ierr = MatPreallocateInitialize(comm,nc*nx*ny*nz,nc*nx*ny*nz,dnz,onz);CHKERRQ(ierr);
194847c6ae99SBarry Smith 
194906ca8cadSBarry Smith   ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr);
195047c6ae99SBarry Smith   for (i=xs; i<xs+nx; i++) {
1951bff4a2f0SMatthew G. Knepley     istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
1952bff4a2f0SMatthew G. Knepley     iend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
195347c6ae99SBarry Smith     for (j=ys; j<ys+ny; j++) {
1954bff4a2f0SMatthew G. Knepley       jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
1955bff4a2f0SMatthew G. Knepley       jend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
195647c6ae99SBarry Smith       for (k=zs; k<zs+nz; k++) {
1957bff4a2f0SMatthew G. Knepley         kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k));
1958bff4a2f0SMatthew G. Knepley         kend   = (bz == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,p-k-1));
195947c6ae99SBarry Smith 
196047c6ae99SBarry Smith         slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs);
196147c6ae99SBarry Smith 
196247c6ae99SBarry Smith         for (l=0; l<nc; l++) {
196347c6ae99SBarry Smith           cnt = 0;
196447c6ae99SBarry Smith           for (ii=istart; ii<iend+1; ii++) {
196547c6ae99SBarry Smith             for (jj=jstart; jj<jend+1; jj++) {
196647c6ae99SBarry Smith               for (kk=kstart; kk<kend+1; kk++) {
196747c6ae99SBarry Smith                 if (ii || jj || kk) {
1968aa219208SBarry Smith                   if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/
19698865f1eaSKarl Rupp                     for (ifill_col=ofill[l]; ifill_col<ofill[l+1]; ifill_col++) cols[cnt++] = ofill[ifill_col] + nc*(slot + ii + gnx*jj + gnx*gny*kk);
197047c6ae99SBarry Smith                   }
197147c6ae99SBarry Smith                 } else {
197247c6ae99SBarry Smith                   if (dfill) {
19738865f1eaSKarl Rupp                     for (ifill_col=dfill[l]; ifill_col<dfill[l+1]; ifill_col++) cols[cnt++] = dfill[ifill_col] + nc*(slot + ii + gnx*jj + gnx*gny*kk);
197447c6ae99SBarry Smith                   } else {
19758865f1eaSKarl Rupp                     for (ifill_col=0; ifill_col<nc; ifill_col++) cols[cnt++] = ifill_col + nc*(slot + ii + gnx*jj + gnx*gny*kk);
197647c6ae99SBarry Smith                   }
197747c6ae99SBarry Smith                 }
197847c6ae99SBarry Smith               }
197947c6ae99SBarry Smith             }
198047c6ae99SBarry Smith           }
198147c6ae99SBarry Smith           row  = l + nc*(slot);
1982c0ab637bSBarry Smith           maxcnt = PetscMax(maxcnt,cnt);
1983c1154cd5SBarry Smith           if (removedups) {
1984c1154cd5SBarry Smith             ierr = MatPreallocateSetLocalRemoveDups(ltog,1,&row,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr);
1985c1154cd5SBarry Smith           } else {
1986784ac674SJed Brown             ierr = MatPreallocateSetLocal(ltog,1,&row,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr);
198747c6ae99SBarry Smith           }
198847c6ae99SBarry Smith         }
198947c6ae99SBarry Smith       }
199047c6ae99SBarry Smith     }
1991c1154cd5SBarry Smith   }
199247c6ae99SBarry Smith   ierr = MatSeqAIJSetPreallocation(J,0,dnz);CHKERRQ(ierr);
199347c6ae99SBarry Smith   ierr = MatMPIAIJSetPreallocation(J,0,dnz,0,onz);CHKERRQ(ierr);
199447c6ae99SBarry Smith   ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr);
1995784ac674SJed Brown   ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr);
199647c6ae99SBarry Smith 
199747c6ae99SBarry Smith   /*
199847c6ae99SBarry Smith     For each node in the grid: we get the neighbors in the local (on processor ordering
199947c6ae99SBarry Smith     that includes the ghost points) then MatSetValuesLocal() maps those indices to the global
200047c6ae99SBarry Smith     PETSc ordering.
200147c6ae99SBarry Smith   */
2002fcfd50ebSBarry Smith   if (!da->prealloc_only) {
2003c0ab637bSBarry Smith     ierr = PetscCalloc1(maxcnt,&values);CHKERRQ(ierr);
200447c6ae99SBarry Smith     for (i=xs; i<xs+nx; i++) {
2005bff4a2f0SMatthew G. Knepley       istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
2006bff4a2f0SMatthew G. Knepley       iend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
200747c6ae99SBarry Smith       for (j=ys; j<ys+ny; j++) {
2008bff4a2f0SMatthew G. Knepley         jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
2009bff4a2f0SMatthew G. Knepley         jend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
201047c6ae99SBarry Smith         for (k=zs; k<zs+nz; k++) {
2011bff4a2f0SMatthew G. Knepley           kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k));
2012bff4a2f0SMatthew G. Knepley           kend   = (bz == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,p-k-1));
201347c6ae99SBarry Smith 
201447c6ae99SBarry Smith           slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs);
201547c6ae99SBarry Smith 
201647c6ae99SBarry Smith           for (l=0; l<nc; l++) {
201747c6ae99SBarry Smith             cnt = 0;
201847c6ae99SBarry Smith             for (ii=istart; ii<iend+1; ii++) {
201947c6ae99SBarry Smith               for (jj=jstart; jj<jend+1; jj++) {
202047c6ae99SBarry Smith                 for (kk=kstart; kk<kend+1; kk++) {
202147c6ae99SBarry Smith                   if (ii || jj || kk) {
2022aa219208SBarry Smith                     if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/
20238865f1eaSKarl Rupp                       for (ifill_col=ofill[l]; ifill_col<ofill[l+1]; ifill_col++) cols[cnt++] = ofill[ifill_col] + nc*(slot + ii + gnx*jj + gnx*gny*kk);
202447c6ae99SBarry Smith                     }
202547c6ae99SBarry Smith                   } else {
202647c6ae99SBarry Smith                     if (dfill) {
20278865f1eaSKarl Rupp                       for (ifill_col=dfill[l]; ifill_col<dfill[l+1]; ifill_col++) cols[cnt++] = dfill[ifill_col] + nc*(slot + ii + gnx*jj + gnx*gny*kk);
202847c6ae99SBarry Smith                     } else {
20298865f1eaSKarl Rupp                       for (ifill_col=0; ifill_col<nc; ifill_col++) cols[cnt++] = ifill_col + nc*(slot + ii + gnx*jj + gnx*gny*kk);
203047c6ae99SBarry Smith                     }
203147c6ae99SBarry Smith                   }
203247c6ae99SBarry Smith                 }
203347c6ae99SBarry Smith               }
203447c6ae99SBarry Smith             }
203547c6ae99SBarry Smith             row  = l + nc*(slot);
203647c6ae99SBarry Smith             ierr = MatSetValuesLocal(J,1,&row,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
203747c6ae99SBarry Smith           }
203847c6ae99SBarry Smith         }
203947c6ae99SBarry Smith       }
204047c6ae99SBarry Smith     }
204147c6ae99SBarry Smith     ierr = PetscFree(values);CHKERRQ(ierr);
204247c6ae99SBarry Smith     ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
204347c6ae99SBarry Smith     ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2044189e4007SBarry Smith     ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr);
204547c6ae99SBarry Smith   }
204647c6ae99SBarry Smith   ierr = PetscFree(cols);CHKERRQ(ierr);
204747c6ae99SBarry Smith   PetscFunctionReturn(0);
204847c6ae99SBarry Smith }
2049