xref: /petsc/src/dm/impls/da/fdda.c (revision 711261dbbbbafbd91025daf565915c8e28cc040d)
147c6ae99SBarry Smith 
2af0996ceSBarry Smith #include <petsc/private/dmdaimpl.h> /*I      "petscdmda.h"     I*/
307475bc1SBarry Smith #include <petscmat.h>
447c6ae99SBarry Smith 
5e727c939SJed Brown extern PetscErrorCode DMCreateColoring_DA_1d_MPIAIJ(DM,ISColoringType,ISColoring*);
6e727c939SJed Brown extern PetscErrorCode DMCreateColoring_DA_2d_MPIAIJ(DM,ISColoringType,ISColoring*);
7e727c939SJed Brown extern PetscErrorCode DMCreateColoring_DA_2d_5pt_MPIAIJ(DM,ISColoringType,ISColoring*);
8e727c939SJed Brown extern PetscErrorCode DMCreateColoring_DA_3d_MPIAIJ(DM,ISColoringType,ISColoring*);
947c6ae99SBarry Smith 
/*
   Maps a ghost index i, which may be negative or greater than or equal to the
   upper bound m, into the 0:m-1 range using periodicity.

   Only a single wrap is applied, so i must lie in -m:2m-1 for the result to
   land in 0:m-1.

   Both arguments are fully parenthesized so expressions may be passed, but
   they are evaluated more than once: do not pass expressions with side effects.
*/
#define SetInRange(i,m) (((i) < 0) ? ((m)+(i)) : (((i) >= (m)) ? ((i)-(m)) : (i)))
1547c6ae99SBarry Smith 
16ce308e1dSBarry Smith static PetscErrorCode DMDASetBlockFills_Private(const PetscInt *dfill,PetscInt w,PetscInt **rfill)
1747c6ae99SBarry Smith {
1847c6ae99SBarry Smith   PetscErrorCode ierr;
1947c6ae99SBarry Smith   PetscInt       i,j,nz,*fill;
2047c6ae99SBarry Smith 
2147c6ae99SBarry Smith   PetscFunctionBegin;
2247c6ae99SBarry Smith   if (!dfill) PetscFunctionReturn(0);
2347c6ae99SBarry Smith 
2447c6ae99SBarry Smith   /* count number nonzeros */
2547c6ae99SBarry Smith   nz = 0;
2647c6ae99SBarry Smith   for (i=0; i<w; i++) {
2747c6ae99SBarry Smith     for (j=0; j<w; j++) {
2847c6ae99SBarry Smith       if (dfill[w*i+j]) nz++;
2947c6ae99SBarry Smith     }
3047c6ae99SBarry Smith   }
31854ce69bSBarry Smith   ierr = PetscMalloc1(nz + w + 1,&fill);CHKERRQ(ierr);
3247c6ae99SBarry Smith   /* construct modified CSR storage of nonzero structure */
33ce308e1dSBarry Smith   /*  fill[0 -- w] marks starts of each row of column indices (and end of last row)
34ce308e1dSBarry Smith    so fill[1] - fill[0] gives number of nonzeros in first row etc */
3547c6ae99SBarry Smith   nz = w + 1;
3647c6ae99SBarry Smith   for (i=0; i<w; i++) {
3747c6ae99SBarry Smith     fill[i] = nz;
3847c6ae99SBarry Smith     for (j=0; j<w; j++) {
3947c6ae99SBarry Smith       if (dfill[w*i+j]) {
4047c6ae99SBarry Smith         fill[nz] = j;
4147c6ae99SBarry Smith         nz++;
4247c6ae99SBarry Smith       }
4347c6ae99SBarry Smith     }
4447c6ae99SBarry Smith   }
4547c6ae99SBarry Smith   fill[w] = nz;
4647c6ae99SBarry Smith 
4747c6ae99SBarry Smith   *rfill = fill;
4847c6ae99SBarry Smith   PetscFunctionReturn(0);
4947c6ae99SBarry Smith }
5047c6ae99SBarry Smith 
5147c6ae99SBarry Smith /*@
52aa219208SBarry Smith     DMDASetBlockFills - Sets the fill pattern in each block for a multi-component problem
53950540a4SJed Brown     of the matrix returned by DMCreateMatrix().
5447c6ae99SBarry Smith 
55aa219208SBarry Smith     Logically Collective on DMDA
5647c6ae99SBarry Smith 
5747c6ae99SBarry Smith     Input Parameter:
5847c6ae99SBarry Smith +   da - the distributed array
590298fd71SBarry Smith .   dfill - the fill pattern in the diagonal block (may be NULL, means use dense block)
6047c6ae99SBarry Smith -   ofill - the fill pattern in the off-diagonal blocks
6147c6ae99SBarry Smith 
6247c6ae99SBarry Smith 
6347c6ae99SBarry Smith     Level: developer
6447c6ae99SBarry Smith 
6547c6ae99SBarry Smith     Notes: This only makes sense when you are doing multicomponent problems but using the
6647c6ae99SBarry Smith        MPIAIJ matrix format
6747c6ae99SBarry Smith 
6847c6ae99SBarry Smith            The format for dfill and ofill is a 2 dimensional dof by dof matrix with 1 entries
6947c6ae99SBarry Smith        representing coupling and 0 entries for missing coupling. For example
7047c6ae99SBarry Smith $             dfill[9] = {1, 0, 0,
7147c6ae99SBarry Smith $                         1, 1, 0,
7247c6ae99SBarry Smith $                         0, 1, 1}
7347c6ae99SBarry Smith        means that row 0 is coupled with only itself in the diagonal block, row 1 is coupled with
7447c6ae99SBarry Smith        itself and row 0 (in the diagonal block) and row 2 is coupled with itself and row 1 (in the
7547c6ae99SBarry Smith        diagonal block).
7647c6ae99SBarry Smith 
77aa219208SBarry Smith      DMDASetGetMatrix() allows you to provide general code for those more complicated nonzero patterns then
7847c6ae99SBarry Smith      can be represented in the dfill, ofill format
7947c6ae99SBarry Smith 
8047c6ae99SBarry Smith    Contributed by Glenn Hammond
8147c6ae99SBarry Smith 
828ddb5d8bSBarry Smith .seealso DMCreateMatrix(), DMDASetGetMatrix(), DMSetMatrixPreallocateOnly()
8347c6ae99SBarry Smith 
8447c6ae99SBarry Smith @*/
85ce308e1dSBarry Smith PetscErrorCode  DMDASetBlockFills(DM da,const PetscInt *dfill,const PetscInt *ofill)
8647c6ae99SBarry Smith {
8747c6ae99SBarry Smith   DM_DA          *dd = (DM_DA*)da->data;
8847c6ae99SBarry Smith   PetscErrorCode ierr;
89ae4f298aSBarry Smith   PetscInt       i,k,cnt = 1;
9047c6ae99SBarry Smith 
9147c6ae99SBarry Smith   PetscFunctionBegin;
92aa219208SBarry Smith   ierr = DMDASetBlockFills_Private(dfill,dd->w,&dd->dfill);CHKERRQ(ierr);
93aa219208SBarry Smith   ierr = DMDASetBlockFills_Private(ofill,dd->w,&dd->ofill);CHKERRQ(ierr);
94ae4f298aSBarry Smith 
95ae4f298aSBarry Smith   /* ofillcount tracks the columns of ofill that have any nonzero in thems; the value in each location is the number of
96ae4f298aSBarry Smith    columns to the left with any nonzeros in them plus 1 */
971795a4d1SJed Brown   ierr = PetscCalloc1(dd->w,&dd->ofillcols);CHKERRQ(ierr);
98ae4f298aSBarry Smith   for (i=0; i<dd->w; i++) {
99ae4f298aSBarry Smith     for (k=dd->ofill[i]; k<dd->ofill[i+1]; k++) dd->ofillcols[dd->ofill[k]] = 1;
100ae4f298aSBarry Smith   }
101ae4f298aSBarry Smith   for (i=0; i<dd->w; i++) {
102ae4f298aSBarry Smith     if (dd->ofillcols[i]) {
103ae4f298aSBarry Smith       dd->ofillcols[i] = cnt++;
104ae4f298aSBarry Smith     }
105ae4f298aSBarry Smith   }
10647c6ae99SBarry Smith   PetscFunctionReturn(0);
10747c6ae99SBarry Smith }
10847c6ae99SBarry Smith 
10947c6ae99SBarry Smith 
110b412c318SBarry Smith PetscErrorCode  DMCreateColoring_DA(DM da,ISColoringType ctype,ISColoring *coloring)
11147c6ae99SBarry Smith {
11247c6ae99SBarry Smith   PetscErrorCode   ierr;
11347c6ae99SBarry Smith   PetscInt         dim,m,n,p,nc;
114bff4a2f0SMatthew G. Knepley   DMBoundaryType bx,by,bz;
11547c6ae99SBarry Smith   MPI_Comm         comm;
11647c6ae99SBarry Smith   PetscMPIInt      size;
11747c6ae99SBarry Smith   PetscBool        isBAIJ;
11847c6ae99SBarry Smith   DM_DA            *dd = (DM_DA*)da->data;
11947c6ae99SBarry Smith 
12047c6ae99SBarry Smith   PetscFunctionBegin;
12147c6ae99SBarry Smith   /*
12247c6ae99SBarry Smith                                   m
12347c6ae99SBarry Smith           ------------------------------------------------------
12447c6ae99SBarry Smith          |                                                     |
12547c6ae99SBarry Smith          |                                                     |
12647c6ae99SBarry Smith          |               ----------------------                |
12747c6ae99SBarry Smith          |               |                    |                |
12847c6ae99SBarry Smith       n  |           yn  |                    |                |
12947c6ae99SBarry Smith          |               |                    |                |
13047c6ae99SBarry Smith          |               .---------------------                |
13147c6ae99SBarry Smith          |             (xs,ys)     xn                          |
13247c6ae99SBarry Smith          |            .                                        |
13347c6ae99SBarry Smith          |         (gxs,gys)                                   |
13447c6ae99SBarry Smith          |                                                     |
13547c6ae99SBarry Smith           -----------------------------------------------------
13647c6ae99SBarry Smith   */
13747c6ae99SBarry Smith 
13847c6ae99SBarry Smith   /*
13947c6ae99SBarry Smith          nc - number of components per grid point
14047c6ae99SBarry Smith          col - number of colors needed in one direction for single component problem
14147c6ae99SBarry Smith 
14247c6ae99SBarry Smith   */
1431321219cSEthan Coon   ierr = DMDAGetInfo(da,&dim,0,0,0,&m,&n,&p,&nc,0,&bx,&by,&bz,0);CHKERRQ(ierr);
14447c6ae99SBarry Smith 
14547c6ae99SBarry Smith   ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr);
14647c6ae99SBarry Smith   ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr);
1475bdb020cSBarry Smith   if (ctype == IS_COLORING_LOCAL) {
14847c6ae99SBarry Smith     if (size == 1) {
14947c6ae99SBarry Smith       ctype = IS_COLORING_GLOBAL;
15047c6ae99SBarry Smith     } else if (dim > 1) {
151bff4a2f0SMatthew G. Knepley       if ((m==1 && bx == DM_BOUNDARY_PERIODIC) || (n==1 && by == DM_BOUNDARY_PERIODIC) || (p==1 && bz == DM_BOUNDARY_PERIODIC)) {
1525bdb020cSBarry Smith         SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"IS_COLORING_LOCAL cannot be used for periodic boundary condition having both ends of the domain  on the same process");
15347c6ae99SBarry Smith       }
15447c6ae99SBarry Smith     }
15547c6ae99SBarry Smith   }
15647c6ae99SBarry Smith 
157aa219208SBarry Smith   /* Tell the DMDA it has 1 degree of freedom per grid point so that the coloring for BAIJ
15847c6ae99SBarry Smith      matrices is for the blocks, not the individual matrix elements  */
159b412c318SBarry Smith   ierr = PetscStrcmp(da->mattype,MATBAIJ,&isBAIJ);CHKERRQ(ierr);
160b412c318SBarry Smith   if (!isBAIJ) {ierr = PetscStrcmp(da->mattype,MATMPIBAIJ,&isBAIJ);CHKERRQ(ierr);}
161b412c318SBarry Smith   if (!isBAIJ) {ierr = PetscStrcmp(da->mattype,MATSEQBAIJ,&isBAIJ);CHKERRQ(ierr);}
16247c6ae99SBarry Smith   if (isBAIJ) {
16347c6ae99SBarry Smith     dd->w  = 1;
16447c6ae99SBarry Smith     dd->xs = dd->xs/nc;
16547c6ae99SBarry Smith     dd->xe = dd->xe/nc;
16647c6ae99SBarry Smith     dd->Xs = dd->Xs/nc;
16747c6ae99SBarry Smith     dd->Xe = dd->Xe/nc;
16847c6ae99SBarry Smith   }
16947c6ae99SBarry Smith 
17047c6ae99SBarry Smith   /*
171aa219208SBarry Smith      We do not provide a getcoloring function in the DMDA operations because
172aa219208SBarry Smith    the basic DMDA does not know about matrices. We think of DMDA as being more
17347c6ae99SBarry Smith    more low-level then matrices.
17447c6ae99SBarry Smith   */
17547c6ae99SBarry Smith   if (dim == 1) {
176e727c939SJed Brown     ierr = DMCreateColoring_DA_1d_MPIAIJ(da,ctype,coloring);CHKERRQ(ierr);
17747c6ae99SBarry Smith   } else if (dim == 2) {
178e727c939SJed Brown     ierr =  DMCreateColoring_DA_2d_MPIAIJ(da,ctype,coloring);CHKERRQ(ierr);
17947c6ae99SBarry Smith   } else if (dim == 3) {
180e727c939SJed Brown     ierr =  DMCreateColoring_DA_3d_MPIAIJ(da,ctype,coloring);CHKERRQ(ierr);
181ce94432eSBarry Smith   } else SETERRQ1(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"Not done for %D dimension, send us mail petsc-maint@mcs.anl.gov for code",dim);
18247c6ae99SBarry Smith   if (isBAIJ) {
18347c6ae99SBarry Smith     dd->w  = nc;
18447c6ae99SBarry Smith     dd->xs = dd->xs*nc;
18547c6ae99SBarry Smith     dd->xe = dd->xe*nc;
18647c6ae99SBarry Smith     dd->Xs = dd->Xs*nc;
18747c6ae99SBarry Smith     dd->Xe = dd->Xe*nc;
18847c6ae99SBarry Smith   }
18947c6ae99SBarry Smith   PetscFunctionReturn(0);
19047c6ae99SBarry Smith }
19147c6ae99SBarry Smith 
19247c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/
19347c6ae99SBarry Smith 
194e727c939SJed Brown PetscErrorCode DMCreateColoring_DA_2d_MPIAIJ(DM da,ISColoringType ctype,ISColoring *coloring)
19547c6ae99SBarry Smith {
19647c6ae99SBarry Smith   PetscErrorCode   ierr;
19747c6ae99SBarry Smith   PetscInt         xs,ys,nx,ny,i,j,ii,gxs,gys,gnx,gny,m,n,M,N,dim,s,k,nc,col;
19847c6ae99SBarry Smith   PetscInt         ncolors;
19947c6ae99SBarry Smith   MPI_Comm         comm;
200bff4a2f0SMatthew G. Knepley   DMBoundaryType bx,by;
201aa219208SBarry Smith   DMDAStencilType  st;
20247c6ae99SBarry Smith   ISColoringValue  *colors;
20347c6ae99SBarry Smith   DM_DA            *dd = (DM_DA*)da->data;
20447c6ae99SBarry Smith 
20547c6ae99SBarry Smith   PetscFunctionBegin;
20647c6ae99SBarry Smith   /*
20747c6ae99SBarry Smith          nc - number of components per grid point
20847c6ae99SBarry Smith          col - number of colors needed in one direction for single component problem
20947c6ae99SBarry Smith 
21047c6ae99SBarry Smith   */
2111321219cSEthan Coon   ierr = DMDAGetInfo(da,&dim,&m,&n,0,&M,&N,0,&nc,&s,&bx,&by,0,&st);CHKERRQ(ierr);
21247c6ae99SBarry Smith   col  = 2*s + 1;
213aa219208SBarry Smith   ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr);
214aa219208SBarry Smith   ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr);
21547c6ae99SBarry Smith   ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr);
21647c6ae99SBarry Smith 
21747c6ae99SBarry Smith   /* special case as taught to us by Paul Hovland */
218aa219208SBarry Smith   if (st == DMDA_STENCIL_STAR && s == 1) {
219e727c939SJed Brown     ierr = DMCreateColoring_DA_2d_5pt_MPIAIJ(da,ctype,coloring);CHKERRQ(ierr);
22047c6ae99SBarry Smith   } else {
22147c6ae99SBarry Smith 
222bff4a2f0SMatthew G. Knepley     if (bx == DM_BOUNDARY_PERIODIC && (m % col)) SETERRQ2(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in X (%d) is divisible\n\
22347c6ae99SBarry Smith                                                             by 2*stencil_width + 1 (%d)\n", m, col);
224bff4a2f0SMatthew G. Knepley     if (by == DM_BOUNDARY_PERIODIC && (n % col)) SETERRQ2(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Y (%d) is divisible\n\
22547c6ae99SBarry Smith                                                             by 2*stencil_width + 1 (%d)\n", n, col);
22647c6ae99SBarry Smith     if (ctype == IS_COLORING_GLOBAL) {
22747c6ae99SBarry Smith       if (!dd->localcoloring) {
228785e854fSJed Brown         ierr = PetscMalloc1(nc*nx*ny,&colors);CHKERRQ(ierr);
22947c6ae99SBarry Smith         ii   = 0;
23047c6ae99SBarry Smith         for (j=ys; j<ys+ny; j++) {
23147c6ae99SBarry Smith           for (i=xs; i<xs+nx; i++) {
23247c6ae99SBarry Smith             for (k=0; k<nc; k++) {
23347c6ae99SBarry Smith               colors[ii++] = k + nc*((i % col) + col*(j % col));
23447c6ae99SBarry Smith             }
23547c6ae99SBarry Smith           }
23647c6ae99SBarry Smith         }
23747c6ae99SBarry Smith         ncolors = nc + nc*(col-1 + col*(col-1));
238aaf3ff59SMatthew G. Knepley         ierr    = ISColoringCreate(comm,ncolors,nc*nx*ny,colors,PETSC_OWN_POINTER,&dd->localcoloring);CHKERRQ(ierr);
23947c6ae99SBarry Smith       }
24047c6ae99SBarry Smith       *coloring = dd->localcoloring;
2415bdb020cSBarry Smith     } else if (ctype == IS_COLORING_LOCAL) {
24247c6ae99SBarry Smith       if (!dd->ghostedcoloring) {
243785e854fSJed Brown         ierr = PetscMalloc1(nc*gnx*gny,&colors);CHKERRQ(ierr);
24447c6ae99SBarry Smith         ii   = 0;
24547c6ae99SBarry Smith         for (j=gys; j<gys+gny; j++) {
24647c6ae99SBarry Smith           for (i=gxs; i<gxs+gnx; i++) {
24747c6ae99SBarry Smith             for (k=0; k<nc; k++) {
24847c6ae99SBarry Smith               /* the complicated stuff is to handle periodic boundaries */
24947c6ae99SBarry Smith               colors[ii++] = k + nc*((SetInRange(i,m) % col) + col*(SetInRange(j,n) % col));
25047c6ae99SBarry Smith             }
25147c6ae99SBarry Smith           }
25247c6ae99SBarry Smith         }
25347c6ae99SBarry Smith         ncolors = nc + nc*(col - 1 + col*(col-1));
254aaf3ff59SMatthew G. Knepley         ierr    = ISColoringCreate(comm,ncolors,nc*gnx*gny,colors,PETSC_OWN_POINTER,&dd->ghostedcoloring);CHKERRQ(ierr);
25547c6ae99SBarry Smith         /* PetscIntView(ncolors,(PetscInt*)colors,0); */
25647c6ae99SBarry Smith 
2575bdb020cSBarry Smith         ierr = ISColoringSetType(dd->ghostedcoloring,IS_COLORING_LOCAL);CHKERRQ(ierr);
25847c6ae99SBarry Smith       }
25947c6ae99SBarry Smith       *coloring = dd->ghostedcoloring;
260ce94432eSBarry Smith     } else SETERRQ1(PetscObjectComm((PetscObject)da),PETSC_ERR_ARG_WRONG,"Unknown ISColoringType %d",(int)ctype);
26147c6ae99SBarry Smith   }
26247c6ae99SBarry Smith   ierr = ISColoringReference(*coloring);CHKERRQ(ierr);
26347c6ae99SBarry Smith   PetscFunctionReturn(0);
26447c6ae99SBarry Smith }
26547c6ae99SBarry Smith 
26647c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/
26747c6ae99SBarry Smith 
268e727c939SJed Brown PetscErrorCode DMCreateColoring_DA_3d_MPIAIJ(DM da,ISColoringType ctype,ISColoring *coloring)
26947c6ae99SBarry Smith {
27047c6ae99SBarry Smith   PetscErrorCode   ierr;
27147c6ae99SBarry Smith   PetscInt         xs,ys,nx,ny,i,j,gxs,gys,gnx,gny,m,n,p,dim,s,k,nc,col,zs,gzs,ii,l,nz,gnz,M,N,P;
27247c6ae99SBarry Smith   PetscInt         ncolors;
27347c6ae99SBarry Smith   MPI_Comm         comm;
274bff4a2f0SMatthew G. Knepley   DMBoundaryType bx,by,bz;
275aa219208SBarry Smith   DMDAStencilType  st;
27647c6ae99SBarry Smith   ISColoringValue  *colors;
27747c6ae99SBarry Smith   DM_DA            *dd = (DM_DA*)da->data;
27847c6ae99SBarry Smith 
27947c6ae99SBarry Smith   PetscFunctionBegin;
28047c6ae99SBarry Smith   /*
28147c6ae99SBarry Smith          nc - number of components per grid point
28247c6ae99SBarry Smith          col - number of colors needed in one direction for single component problem
28347c6ae99SBarry Smith 
28447c6ae99SBarry Smith   */
2851321219cSEthan Coon   ierr = DMDAGetInfo(da,&dim,&m,&n,&p,&M,&N,&P,&nc,&s,&bx,&by,&bz,&st);CHKERRQ(ierr);
28647c6ae99SBarry Smith   col  = 2*s + 1;
287bff4a2f0SMatthew G. Knepley   if (bx == DM_BOUNDARY_PERIODIC && (m % col)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in X is divisible\n\
28847c6ae99SBarry Smith                                                          by 2*stencil_width + 1\n");
289bff4a2f0SMatthew G. Knepley   if (by == DM_BOUNDARY_PERIODIC && (n % col)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Y is divisible\n\
29047c6ae99SBarry Smith                                                          by 2*stencil_width + 1\n");
291bff4a2f0SMatthew G. Knepley   if (bz == DM_BOUNDARY_PERIODIC && (p % col)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Z is divisible\n\
29247c6ae99SBarry Smith                                                          by 2*stencil_width + 1\n");
29347c6ae99SBarry Smith 
294aa219208SBarry Smith   ierr = DMDAGetCorners(da,&xs,&ys,&zs,&nx,&ny,&nz);CHKERRQ(ierr);
295aa219208SBarry Smith   ierr = DMDAGetGhostCorners(da,&gxs,&gys,&gzs,&gnx,&gny,&gnz);CHKERRQ(ierr);
29647c6ae99SBarry Smith   ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr);
29747c6ae99SBarry Smith 
29847c6ae99SBarry Smith   /* create the coloring */
29947c6ae99SBarry Smith   if (ctype == IS_COLORING_GLOBAL) {
30047c6ae99SBarry Smith     if (!dd->localcoloring) {
301785e854fSJed Brown       ierr = PetscMalloc1(nc*nx*ny*nz,&colors);CHKERRQ(ierr);
30247c6ae99SBarry Smith       ii   = 0;
30347c6ae99SBarry Smith       for (k=zs; k<zs+nz; k++) {
30447c6ae99SBarry Smith         for (j=ys; j<ys+ny; j++) {
30547c6ae99SBarry Smith           for (i=xs; i<xs+nx; i++) {
30647c6ae99SBarry Smith             for (l=0; l<nc; l++) {
30747c6ae99SBarry Smith               colors[ii++] = l + nc*((i % col) + col*(j % col) + col*col*(k % col));
30847c6ae99SBarry Smith             }
30947c6ae99SBarry Smith           }
31047c6ae99SBarry Smith         }
31147c6ae99SBarry Smith       }
31247c6ae99SBarry Smith       ncolors = nc + nc*(col-1 + col*(col-1)+ col*col*(col-1));
313aaf3ff59SMatthew G. Knepley       ierr    = ISColoringCreate(comm,ncolors,nc*nx*ny*nz,colors,PETSC_OWN_POINTER,&dd->localcoloring);CHKERRQ(ierr);
31447c6ae99SBarry Smith     }
31547c6ae99SBarry Smith     *coloring = dd->localcoloring;
3165bdb020cSBarry Smith   } else if (ctype == IS_COLORING_LOCAL) {
31747c6ae99SBarry Smith     if (!dd->ghostedcoloring) {
318785e854fSJed Brown       ierr = PetscMalloc1(nc*gnx*gny*gnz,&colors);CHKERRQ(ierr);
31947c6ae99SBarry Smith       ii   = 0;
32047c6ae99SBarry Smith       for (k=gzs; k<gzs+gnz; k++) {
32147c6ae99SBarry Smith         for (j=gys; j<gys+gny; j++) {
32247c6ae99SBarry Smith           for (i=gxs; i<gxs+gnx; i++) {
32347c6ae99SBarry Smith             for (l=0; l<nc; l++) {
32447c6ae99SBarry Smith               /* the complicated stuff is to handle periodic boundaries */
32547c6ae99SBarry Smith               colors[ii++] = l + nc*((SetInRange(i,m) % col) + col*(SetInRange(j,n) % col) + col*col*(SetInRange(k,p) % col));
32647c6ae99SBarry Smith             }
32747c6ae99SBarry Smith           }
32847c6ae99SBarry Smith         }
32947c6ae99SBarry Smith       }
33047c6ae99SBarry Smith       ncolors = nc + nc*(col-1 + col*(col-1)+ col*col*(col-1));
331aaf3ff59SMatthew G. Knepley       ierr    = ISColoringCreate(comm,ncolors,nc*gnx*gny*gnz,colors,PETSC_OWN_POINTER,&dd->ghostedcoloring);CHKERRQ(ierr);
3325bdb020cSBarry Smith       ierr    = ISColoringSetType(dd->ghostedcoloring,IS_COLORING_LOCAL);CHKERRQ(ierr);
33347c6ae99SBarry Smith     }
33447c6ae99SBarry Smith     *coloring = dd->ghostedcoloring;
335ce94432eSBarry Smith   } else SETERRQ1(PetscObjectComm((PetscObject)da),PETSC_ERR_ARG_WRONG,"Unknown ISColoringType %d",(int)ctype);
33647c6ae99SBarry Smith   ierr = ISColoringReference(*coloring);CHKERRQ(ierr);
33747c6ae99SBarry Smith   PetscFunctionReturn(0);
33847c6ae99SBarry Smith }
33947c6ae99SBarry Smith 
34047c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/
34147c6ae99SBarry Smith 
342e727c939SJed Brown PetscErrorCode DMCreateColoring_DA_1d_MPIAIJ(DM da,ISColoringType ctype,ISColoring *coloring)
34347c6ae99SBarry Smith {
34447c6ae99SBarry Smith   PetscErrorCode   ierr;
34547c6ae99SBarry Smith   PetscInt         xs,nx,i,i1,gxs,gnx,l,m,M,dim,s,nc,col;
34647c6ae99SBarry Smith   PetscInt         ncolors;
34747c6ae99SBarry Smith   MPI_Comm         comm;
348bff4a2f0SMatthew G. Knepley   DMBoundaryType bx;
34947c6ae99SBarry Smith   ISColoringValue  *colors;
35047c6ae99SBarry Smith   DM_DA            *dd = (DM_DA*)da->data;
35147c6ae99SBarry Smith 
35247c6ae99SBarry Smith   PetscFunctionBegin;
35347c6ae99SBarry Smith   /*
35447c6ae99SBarry Smith          nc - number of components per grid point
35547c6ae99SBarry Smith          col - number of colors needed in one direction for single component problem
35647c6ae99SBarry Smith 
35747c6ae99SBarry Smith   */
3581321219cSEthan Coon   ierr = DMDAGetInfo(da,&dim,&m,0,0,&M,0,0,&nc,&s,&bx,0,0,0);CHKERRQ(ierr);
35947c6ae99SBarry Smith   col  = 2*s + 1;
36047c6ae99SBarry Smith 
361bff4a2f0SMatthew G. Knepley   if (bx == DM_BOUNDARY_PERIODIC && (m % col)) SETERRQ2(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points %d is divisible\n\
36231e6f798SBarry Smith                                                           by 2*stencil_width + 1 %d\n",(int)m,(int)col);
36347c6ae99SBarry Smith 
364aa219208SBarry Smith   ierr = DMDAGetCorners(da,&xs,0,0,&nx,0,0);CHKERRQ(ierr);
365aa219208SBarry Smith   ierr = DMDAGetGhostCorners(da,&gxs,0,0,&gnx,0,0);CHKERRQ(ierr);
36647c6ae99SBarry Smith   ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr);
36747c6ae99SBarry Smith 
36847c6ae99SBarry Smith   /* create the coloring */
36947c6ae99SBarry Smith   if (ctype == IS_COLORING_GLOBAL) {
37047c6ae99SBarry Smith     if (!dd->localcoloring) {
371785e854fSJed Brown       ierr = PetscMalloc1(nc*nx,&colors);CHKERRQ(ierr);
372ae4f298aSBarry Smith       if (dd->ofillcols) {
373ae4f298aSBarry Smith         PetscInt tc = 0;
374ae4f298aSBarry Smith         for (i=0; i<nc; i++) tc += (PetscInt) (dd->ofillcols[i] > 0);
375ae4f298aSBarry Smith         i1 = 0;
376ae4f298aSBarry Smith         for (i=xs; i<xs+nx; i++) {
377ae4f298aSBarry Smith           for (l=0; l<nc; l++) {
378ae4f298aSBarry Smith             if (dd->ofillcols[l] && (i % col)) {
379ae4f298aSBarry Smith               colors[i1++] =  nc - 1 + tc*((i % col) - 1) + dd->ofillcols[l];
380ae4f298aSBarry Smith             } else {
381ae4f298aSBarry Smith               colors[i1++] = l;
382ae4f298aSBarry Smith             }
383ae4f298aSBarry Smith           }
384ae4f298aSBarry Smith         }
385ae4f298aSBarry Smith         ncolors = nc + 2*s*tc;
386ae4f298aSBarry Smith       } else {
38747c6ae99SBarry Smith         i1 = 0;
38847c6ae99SBarry Smith         for (i=xs; i<xs+nx; i++) {
38947c6ae99SBarry Smith           for (l=0; l<nc; l++) {
39047c6ae99SBarry Smith             colors[i1++] = l + nc*(i % col);
39147c6ae99SBarry Smith           }
39247c6ae99SBarry Smith         }
39347c6ae99SBarry Smith         ncolors = nc + nc*(col-1);
394ae4f298aSBarry Smith       }
395aaf3ff59SMatthew G. Knepley       ierr = ISColoringCreate(comm,ncolors,nc*nx,colors,PETSC_OWN_POINTER,&dd->localcoloring);CHKERRQ(ierr);
39647c6ae99SBarry Smith     }
39747c6ae99SBarry Smith     *coloring = dd->localcoloring;
3985bdb020cSBarry Smith   } else if (ctype == IS_COLORING_LOCAL) {
39947c6ae99SBarry Smith     if (!dd->ghostedcoloring) {
400785e854fSJed Brown       ierr = PetscMalloc1(nc*gnx,&colors);CHKERRQ(ierr);
40147c6ae99SBarry Smith       i1   = 0;
40247c6ae99SBarry Smith       for (i=gxs; i<gxs+gnx; i++) {
40347c6ae99SBarry Smith         for (l=0; l<nc; l++) {
40447c6ae99SBarry Smith           /* the complicated stuff is to handle periodic boundaries */
40547c6ae99SBarry Smith           colors[i1++] = l + nc*(SetInRange(i,m) % col);
40647c6ae99SBarry Smith         }
40747c6ae99SBarry Smith       }
40847c6ae99SBarry Smith       ncolors = nc + nc*(col-1);
409aaf3ff59SMatthew G. Knepley       ierr    = ISColoringCreate(comm,ncolors,nc*gnx,colors,PETSC_OWN_POINTER,&dd->ghostedcoloring);CHKERRQ(ierr);
4105bdb020cSBarry Smith       ierr    = ISColoringSetType(dd->ghostedcoloring,IS_COLORING_LOCAL);CHKERRQ(ierr);
41147c6ae99SBarry Smith     }
41247c6ae99SBarry Smith     *coloring = dd->ghostedcoloring;
413ce94432eSBarry Smith   } else SETERRQ1(PetscObjectComm((PetscObject)da),PETSC_ERR_ARG_WRONG,"Unknown ISColoringType %d",(int)ctype);
41447c6ae99SBarry Smith   ierr = ISColoringReference(*coloring);CHKERRQ(ierr);
41547c6ae99SBarry Smith   PetscFunctionReturn(0);
41647c6ae99SBarry Smith }
41747c6ae99SBarry Smith 
418e727c939SJed Brown PetscErrorCode DMCreateColoring_DA_2d_5pt_MPIAIJ(DM da,ISColoringType ctype,ISColoring *coloring)
41947c6ae99SBarry Smith {
42047c6ae99SBarry Smith   PetscErrorCode   ierr;
42147c6ae99SBarry Smith   PetscInt         xs,ys,nx,ny,i,j,ii,gxs,gys,gnx,gny,m,n,dim,s,k,nc;
42247c6ae99SBarry Smith   PetscInt         ncolors;
42347c6ae99SBarry Smith   MPI_Comm         comm;
424bff4a2f0SMatthew G. Knepley   DMBoundaryType bx,by;
42547c6ae99SBarry Smith   ISColoringValue  *colors;
42647c6ae99SBarry Smith   DM_DA            *dd = (DM_DA*)da->data;
42747c6ae99SBarry Smith 
42847c6ae99SBarry Smith   PetscFunctionBegin;
42947c6ae99SBarry Smith   /*
43047c6ae99SBarry Smith          nc - number of components per grid point
43147c6ae99SBarry Smith          col - number of colors needed in one direction for single component problem
43247c6ae99SBarry Smith 
43347c6ae99SBarry Smith   */
4341321219cSEthan Coon   ierr = DMDAGetInfo(da,&dim,&m,&n,0,0,0,0,&nc,&s,&bx,&by,0,0);CHKERRQ(ierr);
435aa219208SBarry Smith   ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr);
436aa219208SBarry Smith   ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr);
43747c6ae99SBarry Smith   ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr);
43847c6ae99SBarry Smith 
439bff4a2f0SMatthew G. Knepley   if (bx == DM_BOUNDARY_PERIODIC && (m % 5)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in X is divisible by 5\n");
440bff4a2f0SMatthew G. Knepley   if (by == DM_BOUNDARY_PERIODIC && (n % 5)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Y is divisible by 5\n");
44147c6ae99SBarry Smith 
44247c6ae99SBarry Smith   /* create the coloring */
44347c6ae99SBarry Smith   if (ctype == IS_COLORING_GLOBAL) {
44447c6ae99SBarry Smith     if (!dd->localcoloring) {
445785e854fSJed Brown       ierr = PetscMalloc1(nc*nx*ny,&colors);CHKERRQ(ierr);
44647c6ae99SBarry Smith       ii   = 0;
44747c6ae99SBarry Smith       for (j=ys; j<ys+ny; j++) {
44847c6ae99SBarry Smith         for (i=xs; i<xs+nx; i++) {
44947c6ae99SBarry Smith           for (k=0; k<nc; k++) {
45047c6ae99SBarry Smith             colors[ii++] = k + nc*((3*j+i) % 5);
45147c6ae99SBarry Smith           }
45247c6ae99SBarry Smith         }
45347c6ae99SBarry Smith       }
45447c6ae99SBarry Smith       ncolors = 5*nc;
455aaf3ff59SMatthew G. Knepley       ierr    = ISColoringCreate(comm,ncolors,nc*nx*ny,colors,PETSC_OWN_POINTER,&dd->localcoloring);CHKERRQ(ierr);
45647c6ae99SBarry Smith     }
45747c6ae99SBarry Smith     *coloring = dd->localcoloring;
4585bdb020cSBarry Smith   } else if (ctype == IS_COLORING_LOCAL) {
45947c6ae99SBarry Smith     if (!dd->ghostedcoloring) {
460785e854fSJed Brown       ierr = PetscMalloc1(nc*gnx*gny,&colors);CHKERRQ(ierr);
46147c6ae99SBarry Smith       ii = 0;
46247c6ae99SBarry Smith       for (j=gys; j<gys+gny; j++) {
46347c6ae99SBarry Smith         for (i=gxs; i<gxs+gnx; i++) {
46447c6ae99SBarry Smith           for (k=0; k<nc; k++) {
46547c6ae99SBarry Smith             colors[ii++] = k + nc*((3*SetInRange(j,n) + SetInRange(i,m)) % 5);
46647c6ae99SBarry Smith           }
46747c6ae99SBarry Smith         }
46847c6ae99SBarry Smith       }
46947c6ae99SBarry Smith       ncolors = 5*nc;
470aaf3ff59SMatthew G. Knepley       ierr    = ISColoringCreate(comm,ncolors,nc*gnx*gny,colors,PETSC_OWN_POINTER,&dd->ghostedcoloring);CHKERRQ(ierr);
4715bdb020cSBarry Smith       ierr    = ISColoringSetType(dd->ghostedcoloring,IS_COLORING_LOCAL);CHKERRQ(ierr);
47247c6ae99SBarry Smith     }
47347c6ae99SBarry Smith     *coloring = dd->ghostedcoloring;
474ce94432eSBarry Smith   } else SETERRQ1(PetscObjectComm((PetscObject)da),PETSC_ERR_ARG_WRONG,"Unknown ISColoringType %d",(int)ctype);
47547c6ae99SBarry Smith   PetscFunctionReturn(0);
47647c6ae99SBarry Smith }
47747c6ae99SBarry Smith 
47847c6ae99SBarry Smith /* =========================================================================== */
479950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_1d_MPIAIJ(DM,Mat);
480ce308e1dSBarry Smith extern PetscErrorCode DMCreateMatrix_DA_1d_MPIAIJ_Fill(DM,Mat);
481950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_2d_MPIAIJ(DM,Mat);
482950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_2d_MPIAIJ_Fill(DM,Mat);
483950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_3d_MPIAIJ(DM,Mat);
484950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_3d_MPIAIJ_Fill(DM,Mat);
485950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_2d_MPIBAIJ(DM,Mat);
486950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_3d_MPIBAIJ(DM,Mat);
487950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_2d_MPISBAIJ(DM,Mat);
488950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_3d_MPISBAIJ(DM,Mat);
4895e26d47bSHong Zhang extern PetscErrorCode DMCreateMatrix_DA_2d_MPIELL(DM,Mat);
490*711261dbSHong Zhang extern PetscErrorCode DMCreateMatrix_DA_3d_MPIELL(DM,Mat);
49147c6ae99SBarry Smith 
4928bbdbebaSMatthew G Knepley /*@C
493c688c046SMatthew G Knepley    MatSetupDM - Sets the DMDA that is to be used by the HYPRE_StructMatrix PETSc matrix
49447c6ae99SBarry Smith 
49547c6ae99SBarry Smith    Logically Collective on Mat
49647c6ae99SBarry Smith 
49747c6ae99SBarry Smith    Input Parameters:
49847c6ae99SBarry Smith +  mat - the matrix
49947c6ae99SBarry Smith -  da - the da
50047c6ae99SBarry Smith 
50147c6ae99SBarry Smith    Level: intermediate
50247c6ae99SBarry Smith 
50347c6ae99SBarry Smith @*/
504c688c046SMatthew G Knepley PetscErrorCode MatSetupDM(Mat mat,DM da)
50547c6ae99SBarry Smith {
50647c6ae99SBarry Smith   PetscErrorCode ierr;
50747c6ae99SBarry Smith 
50847c6ae99SBarry Smith   PetscFunctionBegin;
50947c6ae99SBarry Smith   PetscValidHeaderSpecific(mat,MAT_CLASSID,1);
51047c6ae99SBarry Smith   PetscValidHeaderSpecific(da,DM_CLASSID,1);
511c688c046SMatthew G Knepley   ierr = PetscTryMethod(mat,"MatSetupDM_C",(Mat,DM),(mat,da));CHKERRQ(ierr);
51247c6ae99SBarry Smith   PetscFunctionReturn(0);
51347c6ae99SBarry Smith }
51447c6ae99SBarry Smith 
5157087cfbeSBarry Smith PetscErrorCode  MatView_MPI_DA(Mat A,PetscViewer viewer)
51647c6ae99SBarry Smith {
5179a42bb27SBarry Smith   DM                da;
51847c6ae99SBarry Smith   PetscErrorCode    ierr;
51947c6ae99SBarry Smith   const char        *prefix;
52047c6ae99SBarry Smith   Mat               Anatural;
52147c6ae99SBarry Smith   AO                ao;
52247c6ae99SBarry Smith   PetscInt          rstart,rend,*petsc,i;
52347c6ae99SBarry Smith   IS                is;
52447c6ae99SBarry Smith   MPI_Comm          comm;
52574388724SJed Brown   PetscViewerFormat format;
52647c6ae99SBarry Smith 
52747c6ae99SBarry Smith   PetscFunctionBegin;
52874388724SJed Brown   /* Check whether we are just printing info, in which case MatView() already viewed everything we wanted to view */
52974388724SJed Brown   ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr);
53074388724SJed Brown   if (format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(0);
53174388724SJed Brown 
53247c6ae99SBarry Smith   ierr = PetscObjectGetComm((PetscObject)A,&comm);CHKERRQ(ierr);
533c688c046SMatthew G Knepley   ierr = MatGetDM(A, &da);CHKERRQ(ierr);
534ce94432eSBarry Smith   if (!da) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Matrix not generated from a DMDA");
53547c6ae99SBarry Smith 
536aa219208SBarry Smith   ierr = DMDAGetAO(da,&ao);CHKERRQ(ierr);
53747c6ae99SBarry Smith   ierr = MatGetOwnershipRange(A,&rstart,&rend);CHKERRQ(ierr);
538854ce69bSBarry Smith   ierr = PetscMalloc1(rend-rstart,&petsc);CHKERRQ(ierr);
53947c6ae99SBarry Smith   for (i=rstart; i<rend; i++) petsc[i-rstart] = i;
54047c6ae99SBarry Smith   ierr = AOApplicationToPetsc(ao,rend-rstart,petsc);CHKERRQ(ierr);
54147c6ae99SBarry Smith   ierr = ISCreateGeneral(comm,rend-rstart,petsc,PETSC_OWN_POINTER,&is);CHKERRQ(ierr);
54247c6ae99SBarry Smith 
54347c6ae99SBarry Smith   /* call viewer on natural ordering */
5447dae84e0SHong Zhang   ierr = MatCreateSubMatrix(A,is,is,MAT_INITIAL_MATRIX,&Anatural);CHKERRQ(ierr);
545fcfd50ebSBarry Smith   ierr = ISDestroy(&is);CHKERRQ(ierr);
54647c6ae99SBarry Smith   ierr = PetscObjectGetOptionsPrefix((PetscObject)A,&prefix);CHKERRQ(ierr);
54747c6ae99SBarry Smith   ierr = PetscObjectSetOptionsPrefix((PetscObject)Anatural,prefix);CHKERRQ(ierr);
54847c6ae99SBarry Smith   ierr = PetscObjectSetName((PetscObject)Anatural,((PetscObject)A)->name);CHKERRQ(ierr);
549539c167fSBarry Smith   ierr = MatView(Anatural,viewer);CHKERRQ(ierr);
550fcfd50ebSBarry Smith   ierr = MatDestroy(&Anatural);CHKERRQ(ierr);
55147c6ae99SBarry Smith   PetscFunctionReturn(0);
55247c6ae99SBarry Smith }
55347c6ae99SBarry Smith 
5547087cfbeSBarry Smith PetscErrorCode  MatLoad_MPI_DA(Mat A,PetscViewer viewer)
55547c6ae99SBarry Smith {
5569a42bb27SBarry Smith   DM             da;
55747c6ae99SBarry Smith   PetscErrorCode ierr;
55847c6ae99SBarry Smith   Mat            Anatural,Aapp;
55947c6ae99SBarry Smith   AO             ao;
560539c167fSBarry Smith   PetscInt       rstart,rend,*app,i,m,n,M,N;
56147c6ae99SBarry Smith   IS             is;
56247c6ae99SBarry Smith   MPI_Comm       comm;
56347c6ae99SBarry Smith 
56447c6ae99SBarry Smith   PetscFunctionBegin;
56547c6ae99SBarry Smith   ierr = PetscObjectGetComm((PetscObject)A,&comm);CHKERRQ(ierr);
566c688c046SMatthew G Knepley   ierr = MatGetDM(A, &da);CHKERRQ(ierr);
567ce94432eSBarry Smith   if (!da) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Matrix not generated from a DMDA");
56847c6ae99SBarry Smith 
56947c6ae99SBarry Smith   /* Load the matrix in natural ordering */
570ce94432eSBarry Smith   ierr = MatCreate(PetscObjectComm((PetscObject)A),&Anatural);CHKERRQ(ierr);
57147c6ae99SBarry Smith   ierr = MatSetType(Anatural,((PetscObject)A)->type_name);CHKERRQ(ierr);
572539c167fSBarry Smith   ierr = MatGetSize(A,&M,&N);CHKERRQ(ierr);
573539c167fSBarry Smith   ierr = MatGetLocalSize(A,&m,&n);CHKERRQ(ierr);
574539c167fSBarry Smith   ierr = MatSetSizes(Anatural,m,n,M,N);CHKERRQ(ierr);
57547c6ae99SBarry Smith   ierr = MatLoad(Anatural,viewer);CHKERRQ(ierr);
57647c6ae99SBarry Smith 
57747c6ae99SBarry Smith   /* Map natural ordering to application ordering and create IS */
578aa219208SBarry Smith   ierr = DMDAGetAO(da,&ao);CHKERRQ(ierr);
57947c6ae99SBarry Smith   ierr = MatGetOwnershipRange(Anatural,&rstart,&rend);CHKERRQ(ierr);
580854ce69bSBarry Smith   ierr = PetscMalloc1(rend-rstart,&app);CHKERRQ(ierr);
58147c6ae99SBarry Smith   for (i=rstart; i<rend; i++) app[i-rstart] = i;
58247c6ae99SBarry Smith   ierr = AOPetscToApplication(ao,rend-rstart,app);CHKERRQ(ierr);
58347c6ae99SBarry Smith   ierr = ISCreateGeneral(comm,rend-rstart,app,PETSC_OWN_POINTER,&is);CHKERRQ(ierr);
58447c6ae99SBarry Smith 
58547c6ae99SBarry Smith   /* Do permutation and replace header */
5867dae84e0SHong Zhang   ierr = MatCreateSubMatrix(Anatural,is,is,MAT_INITIAL_MATRIX,&Aapp);CHKERRQ(ierr);
58728be2f97SBarry Smith   ierr = MatHeaderReplace(A,&Aapp);CHKERRQ(ierr);
588fcfd50ebSBarry Smith   ierr = ISDestroy(&is);CHKERRQ(ierr);
589fcfd50ebSBarry Smith   ierr = MatDestroy(&Anatural);CHKERRQ(ierr);
59047c6ae99SBarry Smith   PetscFunctionReturn(0);
59147c6ae99SBarry Smith }
59247c6ae99SBarry Smith 
593b412c318SBarry Smith PetscErrorCode DMCreateMatrix_DA(DM da, Mat *J)
59447c6ae99SBarry Smith {
59547c6ae99SBarry Smith   PetscErrorCode ierr;
59647c6ae99SBarry Smith   PetscInt       dim,dof,nx,ny,nz,dims[3],starts[3],M,N,P;
59747c6ae99SBarry Smith   Mat            A;
59847c6ae99SBarry Smith   MPI_Comm       comm;
59919fd82e9SBarry Smith   MatType        Atype;
60037d0c07bSMatthew G Knepley   PetscSection   section, sectionGlobal;
6015e26d47bSHong Zhang   void           (*aij)(void)=NULL,(*baij)(void)=NULL,(*sbaij)(void)=NULL,(*ell)(void)=NULL;
602b412c318SBarry Smith   MatType        mtype;
60347c6ae99SBarry Smith   PetscMPIInt    size;
60447c6ae99SBarry Smith   DM_DA          *dd = (DM_DA*)da->data;
60547c6ae99SBarry Smith 
60647c6ae99SBarry Smith   PetscFunctionBegin;
607607a6623SBarry Smith   ierr = MatInitializePackage();CHKERRQ(ierr);
608b412c318SBarry Smith   mtype = da->mattype;
60947c6ae99SBarry Smith 
61037d0c07bSMatthew G Knepley   ierr = DMGetDefaultSection(da, &section);CHKERRQ(ierr);
61137d0c07bSMatthew G Knepley   if (section) {
61237d0c07bSMatthew G Knepley     PetscInt  bs = -1;
61337d0c07bSMatthew G Knepley     PetscInt  localSize;
61437d0c07bSMatthew G Knepley     PetscBool isShell, isBlock, isSeqBlock, isMPIBlock, isSymBlock, isSymSeqBlock, isSymMPIBlock, isSymmetric;
61537d0c07bSMatthew G Knepley 
61637d0c07bSMatthew G Knepley     ierr = DMGetDefaultGlobalSection(da, &sectionGlobal);CHKERRQ(ierr);
61737d0c07bSMatthew G Knepley     ierr = PetscSectionGetConstrainedStorageSize(sectionGlobal, &localSize);CHKERRQ(ierr);
618b5579763SJed Brown     ierr = MatCreate(PetscObjectComm((PetscObject)da),&A);CHKERRQ(ierr);
619b5579763SJed Brown     ierr = MatSetSizes(A,localSize,localSize,PETSC_DETERMINE,PETSC_DETERMINE);CHKERRQ(ierr);
620b5579763SJed Brown     ierr = MatSetType(A,mtype);CHKERRQ(ierr);
62137d0c07bSMatthew G Knepley     ierr = PetscStrcmp(mtype,MATSHELL,&isShell);CHKERRQ(ierr);
62237d0c07bSMatthew G Knepley     ierr = PetscStrcmp(mtype,MATBAIJ,&isBlock);CHKERRQ(ierr);
62337d0c07bSMatthew G Knepley     ierr = PetscStrcmp(mtype,MATSEQBAIJ,&isSeqBlock);CHKERRQ(ierr);
62437d0c07bSMatthew G Knepley     ierr = PetscStrcmp(mtype,MATMPIBAIJ,&isMPIBlock);CHKERRQ(ierr);
62537d0c07bSMatthew G Knepley     ierr = PetscStrcmp(mtype,MATSBAIJ,&isSymBlock);CHKERRQ(ierr);
62637d0c07bSMatthew G Knepley     ierr = PetscStrcmp(mtype,MATSEQSBAIJ,&isSymSeqBlock);CHKERRQ(ierr);
62737d0c07bSMatthew G Knepley     ierr = PetscStrcmp(mtype,MATMPISBAIJ,&isSymMPIBlock);CHKERRQ(ierr);
62837d0c07bSMatthew G Knepley     /* Check for symmetric storage */
62937d0c07bSMatthew G Knepley     isSymmetric = (PetscBool) (isSymBlock || isSymSeqBlock || isSymMPIBlock);
63037d0c07bSMatthew G Knepley     if (isSymmetric) {
63137d0c07bSMatthew G Knepley       ierr = MatSetOption(*J, MAT_IGNORE_LOWER_TRIANGULAR, PETSC_TRUE);CHKERRQ(ierr);
63237d0c07bSMatthew G Knepley     }
63337d0c07bSMatthew G Knepley     if (!isShell) {
63437d0c07bSMatthew G Knepley       PetscInt *dnz, *onz, *dnzu, *onzu, bsLocal;
63537d0c07bSMatthew G Knepley 
63637d0c07bSMatthew G Knepley       if (bs < 0) {
63737d0c07bSMatthew G Knepley         if (isBlock || isSeqBlock || isMPIBlock || isSymBlock || isSymSeqBlock || isSymMPIBlock) {
63837d0c07bSMatthew G Knepley           PetscInt pStart, pEnd, p, dof;
63937d0c07bSMatthew G Knepley 
64037d0c07bSMatthew G Knepley           ierr = PetscSectionGetChart(sectionGlobal, &pStart, &pEnd);CHKERRQ(ierr);
64137d0c07bSMatthew G Knepley           for (p = pStart; p < pEnd; ++p) {
64237d0c07bSMatthew G Knepley             ierr = PetscSectionGetDof(sectionGlobal, p, &dof);CHKERRQ(ierr);
64337d0c07bSMatthew G Knepley             if (dof) {
64437d0c07bSMatthew G Knepley               bs = dof;
64537d0c07bSMatthew G Knepley               break;
64637d0c07bSMatthew G Knepley             }
64737d0c07bSMatthew G Knepley           }
64837d0c07bSMatthew G Knepley         } else {
64937d0c07bSMatthew G Knepley           bs = 1;
65037d0c07bSMatthew G Knepley         }
65137d0c07bSMatthew G Knepley         /* Must have same blocksize on all procs (some might have no points) */
65237d0c07bSMatthew G Knepley         bsLocal = bs;
653b2566f29SBarry Smith         ierr    = MPIU_Allreduce(&bsLocal, &bs, 1, MPIU_INT, MPI_MAX, PetscObjectComm((PetscObject)da));CHKERRQ(ierr);
65437d0c07bSMatthew G Knepley       }
6551795a4d1SJed Brown       ierr = PetscCalloc4(localSize/bs, &dnz, localSize/bs, &onz, localSize/bs, &dnzu, localSize/bs, &onzu);CHKERRQ(ierr);
656552f7358SJed Brown       /* ierr = DMPlexPreallocateOperator(dm, bs, section, sectionGlobal, dnz, onz, dnzu, onzu, *J, fillMatrix);CHKERRQ(ierr); */
65737d0c07bSMatthew G Knepley       ierr = PetscFree4(dnz, onz, dnzu, onzu);CHKERRQ(ierr);
65837d0c07bSMatthew G Knepley     }
65937d0c07bSMatthew G Knepley   }
66047c6ae99SBarry Smith   /*
66147c6ae99SBarry Smith                                   m
66247c6ae99SBarry Smith           ------------------------------------------------------
66347c6ae99SBarry Smith          |                                                     |
66447c6ae99SBarry Smith          |                                                     |
66547c6ae99SBarry Smith          |               ----------------------                |
66647c6ae99SBarry Smith          |               |                    |                |
66747c6ae99SBarry Smith       n  |           ny  |                    |                |
66847c6ae99SBarry Smith          |               |                    |                |
66947c6ae99SBarry Smith          |               .---------------------                |
67047c6ae99SBarry Smith          |             (xs,ys)     nx                          |
67147c6ae99SBarry Smith          |            .                                        |
67247c6ae99SBarry Smith          |         (gxs,gys)                                   |
67347c6ae99SBarry Smith          |                                                     |
67447c6ae99SBarry Smith           -----------------------------------------------------
67547c6ae99SBarry Smith   */
67647c6ae99SBarry Smith 
67747c6ae99SBarry Smith   /*
67847c6ae99SBarry Smith          nc - number of components per grid point
67947c6ae99SBarry Smith          col - number of colors needed in one direction for single component problem
68047c6ae99SBarry Smith 
68147c6ae99SBarry Smith   */
682e30e807fSPeter Brune   M   = dd->M;
683e30e807fSPeter Brune   N   = dd->N;
684e30e807fSPeter Brune   P   = dd->P;
685c73cfb54SMatthew G. Knepley   dim = da->dim;
686e30e807fSPeter Brune   dof = dd->w;
687e30e807fSPeter Brune   /* ierr = DMDAGetInfo(da,&dim,&M,&N,&P,0,0,0,&dof,0,0,0,0,0);CHKERRQ(ierr); */
688aa219208SBarry Smith   ierr = DMDAGetCorners(da,0,0,0,&nx,&ny,&nz);CHKERRQ(ierr);
68947c6ae99SBarry Smith   ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr);
69047c6ae99SBarry Smith   ierr = MatCreate(comm,&A);CHKERRQ(ierr);
69147c6ae99SBarry Smith   ierr = MatSetSizes(A,dof*nx*ny*nz,dof*nx*ny*nz,dof*M*N*P,dof*M*N*P);CHKERRQ(ierr);
692b412c318SBarry Smith   ierr = MatSetType(A,mtype);CHKERRQ(ierr);
69395ee5b0eSBarry Smith   ierr = MatSetDM(A,da);CHKERRQ(ierr);
694b06ff27eSHong Zhang   if (da->structure_only) {
695b06ff27eSHong Zhang     ierr = MatSetOption(A,MAT_STRUCTURE_ONLY,PETSC_TRUE);CHKERRQ(ierr);
696b06ff27eSHong Zhang   }
69747c6ae99SBarry Smith   ierr = MatGetType(A,&Atype);CHKERRQ(ierr);
69847c6ae99SBarry Smith   /*
699aa219208SBarry Smith      We do not provide a getmatrix function in the DMDA operations because
700aa219208SBarry Smith    the basic DMDA does not know about matrices. We think of DMDA as being more
70147c6ae99SBarry Smith    more low-level than matrices. This is kind of cheating but, cause sometimes
702aa219208SBarry Smith    we think of DMDA has higher level than matrices.
70347c6ae99SBarry Smith 
70447c6ae99SBarry Smith      We could switch based on Atype (or mtype), but we do not since the
70547c6ae99SBarry Smith    specialized setting routines depend only the particular preallocation
70647c6ae99SBarry Smith    details of the matrix, not the type itself.
70747c6ae99SBarry Smith   */
70847c6ae99SBarry Smith   ierr = PetscObjectQueryFunction((PetscObject)A,"MatMPIAIJSetPreallocation_C",&aij);CHKERRQ(ierr);
70947c6ae99SBarry Smith   if (!aij) {
71047c6ae99SBarry Smith     ierr = PetscObjectQueryFunction((PetscObject)A,"MatSeqAIJSetPreallocation_C",&aij);CHKERRQ(ierr);
71147c6ae99SBarry Smith   }
71247c6ae99SBarry Smith   if (!aij) {
71347c6ae99SBarry Smith     ierr = PetscObjectQueryFunction((PetscObject)A,"MatMPIBAIJSetPreallocation_C",&baij);CHKERRQ(ierr);
71447c6ae99SBarry Smith     if (!baij) {
71547c6ae99SBarry Smith       ierr = PetscObjectQueryFunction((PetscObject)A,"MatSeqBAIJSetPreallocation_C",&baij);CHKERRQ(ierr);
71647c6ae99SBarry Smith     }
71747c6ae99SBarry Smith     if (!baij) {
71847c6ae99SBarry Smith       ierr = PetscObjectQueryFunction((PetscObject)A,"MatMPISBAIJSetPreallocation_C",&sbaij);CHKERRQ(ierr);
71947c6ae99SBarry Smith       if (!sbaij) {
72047c6ae99SBarry Smith         ierr = PetscObjectQueryFunction((PetscObject)A,"MatSeqSBAIJSetPreallocation_C",&sbaij);CHKERRQ(ierr);
72147c6ae99SBarry Smith       }
7225e26d47bSHong Zhang       if (!sbaij) {
7235e26d47bSHong Zhang         ierr = PetscObjectQueryFunction((PetscObject)A,"MatMPIELLSetPreallocation_C",&ell);CHKERRQ(ierr);
7245e26d47bSHong Zhang         if (!ell) {
7255e26d47bSHong Zhang           ierr = PetscObjectQueryFunction((PetscObject)A,"MatSeqELLSetPreallocation_C",&ell);CHKERRQ(ierr);
7265e26d47bSHong Zhang         }
7275e26d47bSHong Zhang       }
72847c6ae99SBarry Smith     }
72947c6ae99SBarry Smith   }
73047c6ae99SBarry Smith   if (aij) {
73147c6ae99SBarry Smith     if (dim == 1) {
732ce308e1dSBarry Smith       if (dd->ofill) {
733ce308e1dSBarry Smith         ierr = DMCreateMatrix_DA_1d_MPIAIJ_Fill(da,A);CHKERRQ(ierr);
734ce308e1dSBarry Smith       } else {
735950540a4SJed Brown         ierr = DMCreateMatrix_DA_1d_MPIAIJ(da,A);CHKERRQ(ierr);
736ce308e1dSBarry Smith       }
73747c6ae99SBarry Smith     } else if (dim == 2) {
73847c6ae99SBarry Smith       if (dd->ofill) {
739950540a4SJed Brown         ierr = DMCreateMatrix_DA_2d_MPIAIJ_Fill(da,A);CHKERRQ(ierr);
74047c6ae99SBarry Smith       } else {
741950540a4SJed Brown         ierr = DMCreateMatrix_DA_2d_MPIAIJ(da,A);CHKERRQ(ierr);
74247c6ae99SBarry Smith       }
74347c6ae99SBarry Smith     } else if (dim == 3) {
74447c6ae99SBarry Smith       if (dd->ofill) {
745950540a4SJed Brown         ierr = DMCreateMatrix_DA_3d_MPIAIJ_Fill(da,A);CHKERRQ(ierr);
74647c6ae99SBarry Smith       } else {
747950540a4SJed Brown         ierr = DMCreateMatrix_DA_3d_MPIAIJ(da,A);CHKERRQ(ierr);
74847c6ae99SBarry Smith       }
74947c6ae99SBarry Smith     }
75047c6ae99SBarry Smith   } else if (baij) {
75147c6ae99SBarry Smith     if (dim == 2) {
752950540a4SJed Brown       ierr = DMCreateMatrix_DA_2d_MPIBAIJ(da,A);CHKERRQ(ierr);
75347c6ae99SBarry Smith     } else if (dim == 3) {
754950540a4SJed Brown       ierr = DMCreateMatrix_DA_3d_MPIBAIJ(da,A);CHKERRQ(ierr);
755ce94432eSBarry Smith     } else SETERRQ3(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"Not implemented for %D dimension and Matrix Type: %s in %D dimension! Send mail to petsc-maint@mcs.anl.gov for code",dim,Atype,dim);
75647c6ae99SBarry Smith   } else if (sbaij) {
75747c6ae99SBarry Smith     if (dim == 2) {
758950540a4SJed Brown       ierr = DMCreateMatrix_DA_2d_MPISBAIJ(da,A);CHKERRQ(ierr);
75947c6ae99SBarry Smith     } else if (dim == 3) {
760950540a4SJed Brown       ierr = DMCreateMatrix_DA_3d_MPISBAIJ(da,A);CHKERRQ(ierr);
761ce94432eSBarry Smith     } else SETERRQ3(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"Not implemented for %D dimension and Matrix Type: %s in %D dimension! Send mail to petsc-maint@mcs.anl.gov for code",dim,Atype,dim);
7625e26d47bSHong Zhang   } else if (ell) {
7635e26d47bSHong Zhang      if (dim == 2) {
7645e26d47bSHong Zhang        ierr = DMCreateMatrix_DA_2d_MPIELL(da,A);CHKERRQ(ierr);
765*711261dbSHong Zhang      } else if (dim == 3) {
766*711261dbSHong Zhang        ierr = DMCreateMatrix_DA_3d_MPIELL(da,A);CHKERRQ(ierr);
7675e26d47bSHong Zhang      } else SETERRQ3(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"Not implemented for %D dimension and Matrix Type: %s in %D dimension! Send mail to petsc-maint@mcs.anl.gov for code",dim,Atype,dim);
768869776cdSLisandro Dalcin   }else {
76945b6f7e9SBarry Smith     ISLocalToGlobalMapping ltog;
770b026d285SBarry Smith     ierr = MatSetBlockSize(A,dof);CHKERRQ(ierr);
7712949035bSJed Brown     ierr = MatSetUp(A);CHKERRQ(ierr);
772b026d285SBarry Smith     ierr = DMGetLocalToGlobalMapping(da,&ltog);CHKERRQ(ierr);
773869776cdSLisandro Dalcin     ierr = MatSetLocalToGlobalMapping(A,ltog,ltog);CHKERRQ(ierr);
77447c6ae99SBarry Smith   }
775aa219208SBarry Smith   ierr = DMDAGetGhostCorners(da,&starts[0],&starts[1],&starts[2],&dims[0],&dims[1],&dims[2]);CHKERRQ(ierr);
77647c6ae99SBarry Smith   ierr = MatSetStencil(A,dim,dims,starts,dof);CHKERRQ(ierr);
777c688c046SMatthew G Knepley   ierr = MatSetDM(A,da);CHKERRQ(ierr);
77847c6ae99SBarry Smith   ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr);
77947c6ae99SBarry Smith   if (size > 1) {
78047c6ae99SBarry Smith     /* change viewer to display matrix in natural ordering */
78147c6ae99SBarry Smith     ierr = MatShellSetOperation(A, MATOP_VIEW, (void (*)(void))MatView_MPI_DA);CHKERRQ(ierr);
78247c6ae99SBarry Smith     ierr = MatShellSetOperation(A, MATOP_LOAD, (void (*)(void))MatLoad_MPI_DA);CHKERRQ(ierr);
78347c6ae99SBarry Smith   }
784b5579763SJed Brown   ierr = MatSetFromOptions(A);CHKERRQ(ierr);
78547c6ae99SBarry Smith   *J = A;
78647c6ae99SBarry Smith   PetscFunctionReturn(0);
78747c6ae99SBarry Smith }
78847c6ae99SBarry Smith 
78947c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/
7905e26d47bSHong Zhang PetscErrorCode DMCreateMatrix_DA_2d_MPIELL(DM da,Mat J)
7915e26d47bSHong Zhang {
7925e26d47bSHong Zhang   PetscErrorCode         ierr;
7935e26d47bSHong Zhang   PetscInt               xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny,m,n,dim,s,*cols = NULL,k,nc,*rows = NULL,col,cnt,l,p;
7945e26d47bSHong Zhang   PetscInt               lstart,lend,pstart,pend,*dnz,*onz;
7955e26d47bSHong Zhang   MPI_Comm               comm;
7965e26d47bSHong Zhang   PetscScalar            *values;
7975e26d47bSHong Zhang   DMBoundaryType         bx,by;
7985e26d47bSHong Zhang   ISLocalToGlobalMapping ltog;
7995e26d47bSHong Zhang   DMDAStencilType        st;
8005e26d47bSHong Zhang 
8015e26d47bSHong Zhang   PetscFunctionBegin;
8025e26d47bSHong Zhang   /*
8035e26d47bSHong Zhang          nc - number of components per grid point
8045e26d47bSHong Zhang          col - number of colors needed in one direction for single component problem
8055e26d47bSHong Zhang 
8065e26d47bSHong Zhang   */
8075e26d47bSHong Zhang   ierr = DMDAGetInfo(da,&dim,&m,&n,0,0,0,0,&nc,&s,&bx,&by,0,&st);CHKERRQ(ierr);
8085e26d47bSHong Zhang   col  = 2*s + 1;
8095e26d47bSHong Zhang   ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr);
8105e26d47bSHong Zhang   ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr);
8115e26d47bSHong Zhang   ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr);
8125e26d47bSHong Zhang 
8135e26d47bSHong Zhang   ierr = PetscMalloc2(nc,&rows,col*col*nc*nc,&cols);CHKERRQ(ierr);
8145e26d47bSHong Zhang   ierr = DMGetLocalToGlobalMapping(da,&ltog);CHKERRQ(ierr);
8155e26d47bSHong Zhang 
8165e26d47bSHong Zhang   ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr);
8175e26d47bSHong Zhang   /* determine the matrix preallocation information */
8185e26d47bSHong Zhang   ierr = MatPreallocateInitialize(comm,nc*nx*ny,nc*nx*ny,dnz,onz);CHKERRQ(ierr);
8195e26d47bSHong Zhang   for (i=xs; i<xs+nx; i++) {
8205e26d47bSHong Zhang 
8215e26d47bSHong Zhang     pstart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
8225e26d47bSHong Zhang     pend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
8235e26d47bSHong Zhang 
8245e26d47bSHong Zhang     for (j=ys; j<ys+ny; j++) {
8255e26d47bSHong Zhang       slot = i - gxs + gnx*(j - gys);
8265e26d47bSHong Zhang 
8275e26d47bSHong Zhang       lstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
8285e26d47bSHong Zhang       lend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
8295e26d47bSHong Zhang 
8305e26d47bSHong Zhang       cnt = 0;
8315e26d47bSHong Zhang       for (k=0; k<nc; k++) {
8325e26d47bSHong Zhang         for (l=lstart; l<lend+1; l++) {
8335e26d47bSHong Zhang           for (p=pstart; p<pend+1; p++) {
8345e26d47bSHong Zhang             if ((st == DMDA_STENCIL_BOX) || (!l || !p)) {  /* entries on star have either l = 0 or p = 0 */
8355e26d47bSHong Zhang               cols[cnt++] = k + nc*(slot + gnx*l + p);
8365e26d47bSHong Zhang             }
8375e26d47bSHong Zhang           }
8385e26d47bSHong Zhang         }
8395e26d47bSHong Zhang         rows[k] = k + nc*(slot);
8405e26d47bSHong Zhang       }
8415e26d47bSHong Zhang       ierr = MatPreallocateSetLocal(ltog,nc,rows,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr);
8425e26d47bSHong Zhang     }
8435e26d47bSHong Zhang   }
8445e26d47bSHong Zhang   ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr);
8455e26d47bSHong Zhang   ierr = MatSeqELLSetPreallocation(J,0,dnz);CHKERRQ(ierr);
846c1aae768SHong Zhang   ierr = MatMPIELLSetPreallocation(J,0,dnz,0,onz);CHKERRQ(ierr);
8475e26d47bSHong Zhang   ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr);
8485e26d47bSHong Zhang 
8495e26d47bSHong Zhang   ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr);
8505e26d47bSHong Zhang 
8515e26d47bSHong Zhang   /*
8525e26d47bSHong Zhang     For each node in the grid: we get the neighbors in the local (on processor ordering
8535e26d47bSHong Zhang     that includes the ghost points) then MatSetValuesLocal() maps those indices to the global
8545e26d47bSHong Zhang     PETSc ordering.
8555e26d47bSHong Zhang   */
8565e26d47bSHong Zhang   if (!da->prealloc_only) {
8575e26d47bSHong Zhang     ierr = PetscCalloc1(col*col*nc*nc,&values);CHKERRQ(ierr);
8585e26d47bSHong Zhang     for (i=xs; i<xs+nx; i++) {
8595e26d47bSHong Zhang 
8605e26d47bSHong Zhang       pstart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
8615e26d47bSHong Zhang       pend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
8625e26d47bSHong Zhang 
8635e26d47bSHong Zhang       for (j=ys; j<ys+ny; j++) {
8645e26d47bSHong Zhang         slot = i - gxs + gnx*(j - gys);
8655e26d47bSHong Zhang 
8665e26d47bSHong Zhang         lstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
8675e26d47bSHong Zhang         lend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
8685e26d47bSHong Zhang 
8695e26d47bSHong Zhang         cnt = 0;
8705e26d47bSHong Zhang         for (k=0; k<nc; k++) {
8715e26d47bSHong Zhang           for (l=lstart; l<lend+1; l++) {
8725e26d47bSHong Zhang             for (p=pstart; p<pend+1; p++) {
8735e26d47bSHong Zhang               if ((st == DMDA_STENCIL_BOX) || (!l || !p)) {  /* entries on star have either l = 0 or p = 0 */
8745e26d47bSHong Zhang                 cols[cnt++] = k + nc*(slot + gnx*l + p);
8755e26d47bSHong Zhang               }
8765e26d47bSHong Zhang             }
8775e26d47bSHong Zhang           }
8785e26d47bSHong Zhang           rows[k] = k + nc*(slot);
8795e26d47bSHong Zhang         }
8805e26d47bSHong Zhang         ierr = MatSetValuesLocal(J,nc,rows,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
8815e26d47bSHong Zhang       }
8825e26d47bSHong Zhang     }
8835e26d47bSHong Zhang     ierr = PetscFree(values);CHKERRQ(ierr);
8845e26d47bSHong Zhang     ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
8855e26d47bSHong Zhang     ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
8865e26d47bSHong Zhang     ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr);
8875e26d47bSHong Zhang   }
8885e26d47bSHong Zhang   ierr = PetscFree2(rows,cols);CHKERRQ(ierr);
8895e26d47bSHong Zhang   PetscFunctionReturn(0);
8905e26d47bSHong Zhang }
8915e26d47bSHong Zhang 
892*711261dbSHong Zhang PetscErrorCode DMCreateMatrix_DA_3d_MPIELL(DM da,Mat J)
893*711261dbSHong Zhang {
894*711261dbSHong Zhang   PetscErrorCode         ierr;
895*711261dbSHong Zhang   PetscInt               xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny;
896*711261dbSHong Zhang   PetscInt               m,n,dim,s,*cols = NULL,k,nc,*rows = NULL,col,cnt,l,p,*dnz = NULL,*onz = NULL;
897*711261dbSHong Zhang   PetscInt               istart,iend,jstart,jend,kstart,kend,zs,nz,gzs,gnz,ii,jj,kk,M,N,P;
898*711261dbSHong Zhang   MPI_Comm               comm;
899*711261dbSHong Zhang   PetscScalar            *values;
900*711261dbSHong Zhang   DMBoundaryType         bx,by,bz;
901*711261dbSHong Zhang   ISLocalToGlobalMapping ltog;
902*711261dbSHong Zhang   DMDAStencilType        st;
903*711261dbSHong Zhang 
904*711261dbSHong Zhang   PetscFunctionBegin;
905*711261dbSHong Zhang   /*
906*711261dbSHong Zhang          nc - number of components per grid point
907*711261dbSHong Zhang          col - number of colors needed in one direction for single component problem
908*711261dbSHong Zhang 
909*711261dbSHong Zhang   */
910*711261dbSHong Zhang   ierr = DMDAGetInfo(da,&dim,&m,&n,&p,&M,&N,&P,&nc,&s,&bx,&by,&bz,&st);CHKERRQ(ierr);
911*711261dbSHong Zhang   col  = 2*s + 1;
912*711261dbSHong Zhang   ierr = DMDAGetCorners(da,&xs,&ys,&zs,&nx,&ny,&nz);CHKERRQ(ierr);
913*711261dbSHong Zhang   ierr = DMDAGetGhostCorners(da,&gxs,&gys,&gzs,&gnx,&gny,&gnz);CHKERRQ(ierr);
914*711261dbSHong Zhang   ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr);
915*711261dbSHong Zhang 
916*711261dbSHong Zhang   ierr = PetscMalloc2(nc,&rows,col*col*col*nc*nc,&cols);CHKERRQ(ierr);
917*711261dbSHong Zhang   ierr = DMGetLocalToGlobalMapping(da,&ltog);CHKERRQ(ierr);
918*711261dbSHong Zhang 
919*711261dbSHong Zhang   ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr);
920*711261dbSHong Zhang   /* determine the matrix preallocation information */
921*711261dbSHong Zhang   ierr = MatPreallocateInitialize(comm,nc*nx*ny*nz,nc*nx*ny*nz,dnz,onz);CHKERRQ(ierr);
922*711261dbSHong Zhang   for (i=xs; i<xs+nx; i++) {
923*711261dbSHong Zhang     istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
924*711261dbSHong Zhang     iend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
925*711261dbSHong Zhang     for (j=ys; j<ys+ny; j++) {
926*711261dbSHong Zhang       jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
927*711261dbSHong Zhang       jend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
928*711261dbSHong Zhang       for (k=zs; k<zs+nz; k++) {
929*711261dbSHong Zhang         kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k));
930*711261dbSHong Zhang         kend   = (bz == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,p-k-1));
931*711261dbSHong Zhang 
932*711261dbSHong Zhang         slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs);
933*711261dbSHong Zhang 
934*711261dbSHong Zhang         cnt = 0;
935*711261dbSHong Zhang         for (l=0; l<nc; l++) {
936*711261dbSHong Zhang           for (ii=istart; ii<iend+1; ii++) {
937*711261dbSHong Zhang             for (jj=jstart; jj<jend+1; jj++) {
938*711261dbSHong Zhang               for (kk=kstart; kk<kend+1; kk++) {
939*711261dbSHong Zhang                 if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/
940*711261dbSHong Zhang                   cols[cnt++] = l + nc*(slot + ii + gnx*jj + gnx*gny*kk);
941*711261dbSHong Zhang                 }
942*711261dbSHong Zhang               }
943*711261dbSHong Zhang             }
944*711261dbSHong Zhang           }
945*711261dbSHong Zhang           rows[l] = l + nc*(slot);
946*711261dbSHong Zhang         }
947*711261dbSHong Zhang         ierr = MatPreallocateSetLocal(ltog,nc,rows,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr);
948*711261dbSHong Zhang       }
949*711261dbSHong Zhang     }
950*711261dbSHong Zhang   }
951*711261dbSHong Zhang   ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr);
952*711261dbSHong Zhang   ierr = MatSeqELLSetPreallocation(J,0,dnz);CHKERRQ(ierr);
953*711261dbSHong Zhang   ierr = MatMPIELLSetPreallocation(J,0,dnz,0,onz);CHKERRQ(ierr);
954*711261dbSHong Zhang   ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr);
955*711261dbSHong Zhang   ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr);
956*711261dbSHong Zhang 
957*711261dbSHong Zhang   /*
958*711261dbSHong Zhang     For each node in the grid: we get the neighbors in the local (on processor ordering
959*711261dbSHong Zhang     that includes the ghost points) then MatSetValuesLocal() maps those indices to the global
960*711261dbSHong Zhang     PETSc ordering.
961*711261dbSHong Zhang   */
962*711261dbSHong Zhang   if (!da->prealloc_only) {
963*711261dbSHong Zhang     ierr = PetscCalloc1(col*col*col*nc*nc*nc,&values);CHKERRQ(ierr);
964*711261dbSHong Zhang     for (i=xs; i<xs+nx; i++) {
965*711261dbSHong Zhang       istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
966*711261dbSHong Zhang       iend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
967*711261dbSHong Zhang       for (j=ys; j<ys+ny; j++) {
968*711261dbSHong Zhang         jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
969*711261dbSHong Zhang         jend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
970*711261dbSHong Zhang         for (k=zs; k<zs+nz; k++) {
971*711261dbSHong Zhang           kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k));
972*711261dbSHong Zhang           kend   = (bz == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,p-k-1));
973*711261dbSHong Zhang 
974*711261dbSHong Zhang           slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs);
975*711261dbSHong Zhang 
976*711261dbSHong Zhang           cnt = 0;
977*711261dbSHong Zhang           for (l=0; l<nc; l++) {
978*711261dbSHong Zhang             for (ii=istart; ii<iend+1; ii++) {
979*711261dbSHong Zhang               for (jj=jstart; jj<jend+1; jj++) {
980*711261dbSHong Zhang                 for (kk=kstart; kk<kend+1; kk++) {
981*711261dbSHong Zhang                   if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/
982*711261dbSHong Zhang                     cols[cnt++] = l + nc*(slot + ii + gnx*jj + gnx*gny*kk);
983*711261dbSHong Zhang                   }
984*711261dbSHong Zhang                 }
985*711261dbSHong Zhang               }
986*711261dbSHong Zhang             }
987*711261dbSHong Zhang             rows[l] = l + nc*(slot);
988*711261dbSHong Zhang           }
989*711261dbSHong Zhang           ierr = MatSetValuesLocal(J,nc,rows,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
990*711261dbSHong Zhang         }
991*711261dbSHong Zhang       }
992*711261dbSHong Zhang     }
993*711261dbSHong Zhang     ierr = PetscFree(values);CHKERRQ(ierr);
994*711261dbSHong Zhang     ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
995*711261dbSHong Zhang     ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
996*711261dbSHong Zhang     ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr);
997*711261dbSHong Zhang   }
998*711261dbSHong Zhang   ierr = PetscFree2(rows,cols);CHKERRQ(ierr);
999*711261dbSHong Zhang   PetscFunctionReturn(0);
1000*711261dbSHong Zhang }
1001*711261dbSHong Zhang 
1002950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_2d_MPIAIJ(DM da,Mat J)
100347c6ae99SBarry Smith {
100447c6ae99SBarry Smith   PetscErrorCode         ierr;
1005c1154cd5SBarry Smith   PetscInt               xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny,m,n,dim,s,*cols = NULL,k,nc,*rows = NULL,col,cnt,l,p,M,N;
100647c6ae99SBarry Smith   PetscInt               lstart,lend,pstart,pend,*dnz,*onz;
100747c6ae99SBarry Smith   MPI_Comm               comm;
100847c6ae99SBarry Smith   PetscScalar            *values;
1009bff4a2f0SMatthew G. Knepley   DMBoundaryType         bx,by;
101045b6f7e9SBarry Smith   ISLocalToGlobalMapping ltog;
1011aa219208SBarry Smith   DMDAStencilType        st;
1012c1154cd5SBarry Smith   PetscBool              removedups = PETSC_FALSE;
101347c6ae99SBarry Smith 
101447c6ae99SBarry Smith   PetscFunctionBegin;
101547c6ae99SBarry Smith   /*
101647c6ae99SBarry Smith          nc - number of components per grid point
101747c6ae99SBarry Smith          col - number of colors needed in one direction for single component problem
101847c6ae99SBarry Smith 
101947c6ae99SBarry Smith   */
1020c1154cd5SBarry Smith   ierr = DMDAGetInfo(da,&dim,&m,&n,&M,&N,0,0,&nc,&s,&bx,&by,0,&st);CHKERRQ(ierr);
102147c6ae99SBarry Smith   col  = 2*s + 1;
1022c1154cd5SBarry Smith   /*
1023c1154cd5SBarry Smith        With one processor in periodic domains in a skinny dimension the code will label nonzero columns multiple times
1024c1154cd5SBarry Smith        because of "wrapping" around the end of the domain hitting an entry already counted in the other direction.
1025c1154cd5SBarry Smith   */
1026c1154cd5SBarry Smith   if (M == 1 && 2*s >= m) removedups = PETSC_TRUE;
1027c1154cd5SBarry Smith   if (N == 1 && 2*s >= n) removedups = PETSC_TRUE;
1028aa219208SBarry Smith   ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr);
1029aa219208SBarry Smith   ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr);
103047c6ae99SBarry Smith   ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr);
103147c6ae99SBarry Smith 
1032dcca6d9dSJed Brown   ierr = PetscMalloc2(nc,&rows,col*col*nc*nc,&cols);CHKERRQ(ierr);
10331411c6eeSJed Brown   ierr = DMGetLocalToGlobalMapping(da,&ltog);CHKERRQ(ierr);
103447c6ae99SBarry Smith 
103506ca8cadSBarry Smith   ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr);
103647c6ae99SBarry Smith   /* determine the matrix preallocation information */
103747c6ae99SBarry Smith   ierr = MatPreallocateInitialize(comm,nc*nx*ny,nc*nx*ny,dnz,onz);CHKERRQ(ierr);
103847c6ae99SBarry Smith   for (i=xs; i<xs+nx; i++) {
103947c6ae99SBarry Smith 
1040bff4a2f0SMatthew G. Knepley     pstart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
1041bff4a2f0SMatthew G. Knepley     pend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
104247c6ae99SBarry Smith 
104347c6ae99SBarry Smith     for (j=ys; j<ys+ny; j++) {
104447c6ae99SBarry Smith       slot = i - gxs + gnx*(j - gys);
104547c6ae99SBarry Smith 
1046bff4a2f0SMatthew G. Knepley       lstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
1047bff4a2f0SMatthew G. Knepley       lend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
104847c6ae99SBarry Smith 
104947c6ae99SBarry Smith       cnt = 0;
105047c6ae99SBarry Smith       for (k=0; k<nc; k++) {
105147c6ae99SBarry Smith         for (l=lstart; l<lend+1; l++) {
105247c6ae99SBarry Smith           for (p=pstart; p<pend+1; p++) {
1053aa219208SBarry Smith             if ((st == DMDA_STENCIL_BOX) || (!l || !p)) {  /* entries on star have either l = 0 or p = 0 */
105447c6ae99SBarry Smith               cols[cnt++] = k + nc*(slot + gnx*l + p);
105547c6ae99SBarry Smith             }
105647c6ae99SBarry Smith           }
105747c6ae99SBarry Smith         }
105847c6ae99SBarry Smith         rows[k] = k + nc*(slot);
105947c6ae99SBarry Smith       }
1060c1154cd5SBarry Smith       if (removedups) {
1061c1154cd5SBarry Smith         ierr = MatPreallocateSetLocalRemoveDups(ltog,nc,rows,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr);
1062c1154cd5SBarry Smith       } else {
1063784ac674SJed Brown         ierr = MatPreallocateSetLocal(ltog,nc,rows,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr);
106447c6ae99SBarry Smith       }
106547c6ae99SBarry Smith     }
1066c1154cd5SBarry Smith   }
1067f73d5cc4SBarry Smith   ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr);
106847c6ae99SBarry Smith   ierr = MatSeqAIJSetPreallocation(J,0,dnz);CHKERRQ(ierr);
106947c6ae99SBarry Smith   ierr = MatMPIAIJSetPreallocation(J,0,dnz,0,onz);CHKERRQ(ierr);
107047c6ae99SBarry Smith   ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr);
107147c6ae99SBarry Smith 
1072784ac674SJed Brown   ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr);
107347c6ae99SBarry Smith 
107447c6ae99SBarry Smith   /*
107547c6ae99SBarry Smith     For each node in the grid: we get the neighbors in the local (on processor ordering
107647c6ae99SBarry Smith     that includes the ghost points) then MatSetValuesLocal() maps those indices to the global
107747c6ae99SBarry Smith     PETSc ordering.
107847c6ae99SBarry Smith   */
1079fcfd50ebSBarry Smith   if (!da->prealloc_only) {
10801795a4d1SJed Brown     ierr = PetscCalloc1(col*col*nc*nc,&values);CHKERRQ(ierr);
108147c6ae99SBarry Smith     for (i=xs; i<xs+nx; i++) {
108247c6ae99SBarry Smith 
1083bff4a2f0SMatthew G. Knepley       pstart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
1084bff4a2f0SMatthew G. Knepley       pend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
108547c6ae99SBarry Smith 
108647c6ae99SBarry Smith       for (j=ys; j<ys+ny; j++) {
108747c6ae99SBarry Smith         slot = i - gxs + gnx*(j - gys);
108847c6ae99SBarry Smith 
1089bff4a2f0SMatthew G. Knepley         lstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
1090bff4a2f0SMatthew G. Knepley         lend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
109147c6ae99SBarry Smith 
109247c6ae99SBarry Smith         cnt = 0;
109347c6ae99SBarry Smith         for (k=0; k<nc; k++) {
109447c6ae99SBarry Smith           for (l=lstart; l<lend+1; l++) {
109547c6ae99SBarry Smith             for (p=pstart; p<pend+1; p++) {
1096aa219208SBarry Smith               if ((st == DMDA_STENCIL_BOX) || (!l || !p)) {  /* entries on star have either l = 0 or p = 0 */
109747c6ae99SBarry Smith                 cols[cnt++] = k + nc*(slot + gnx*l + p);
109847c6ae99SBarry Smith               }
109947c6ae99SBarry Smith             }
110047c6ae99SBarry Smith           }
110147c6ae99SBarry Smith           rows[k] = k + nc*(slot);
110247c6ae99SBarry Smith         }
110347c6ae99SBarry Smith         ierr = MatSetValuesLocal(J,nc,rows,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
110447c6ae99SBarry Smith       }
110547c6ae99SBarry Smith     }
110647c6ae99SBarry Smith     ierr = PetscFree(values);CHKERRQ(ierr);
110747c6ae99SBarry Smith     ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
110847c6ae99SBarry Smith     ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1109189e4007SBarry Smith     ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr);
111047c6ae99SBarry Smith   }
111147c6ae99SBarry Smith   ierr = PetscFree2(rows,cols);CHKERRQ(ierr);
111247c6ae99SBarry Smith   PetscFunctionReturn(0);
111347c6ae99SBarry Smith }
111447c6ae99SBarry Smith 
1115950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_2d_MPIAIJ_Fill(DM da,Mat J)
111647c6ae99SBarry Smith {
111747c6ae99SBarry Smith   PetscErrorCode         ierr;
111847c6ae99SBarry Smith   PetscInt               xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny;
1119c1154cd5SBarry Smith   PetscInt               m,n,dim,s,*cols,k,nc,row,col,cnt,maxcnt = 0,l,p,M,N;
112047c6ae99SBarry Smith   PetscInt               lstart,lend,pstart,pend,*dnz,*onz;
112147c6ae99SBarry Smith   DM_DA                  *dd = (DM_DA*)da->data;
112247c6ae99SBarry Smith   PetscInt               ifill_col,*ofill = dd->ofill, *dfill = dd->dfill;
112347c6ae99SBarry Smith   MPI_Comm               comm;
112447c6ae99SBarry Smith   PetscScalar            *values;
1125bff4a2f0SMatthew G. Knepley   DMBoundaryType         bx,by;
112645b6f7e9SBarry Smith   ISLocalToGlobalMapping ltog;
1127aa219208SBarry Smith   DMDAStencilType        st;
1128c1154cd5SBarry Smith   PetscBool              removedups = PETSC_FALSE;
112947c6ae99SBarry Smith 
113047c6ae99SBarry Smith   PetscFunctionBegin;
113147c6ae99SBarry Smith   /*
113247c6ae99SBarry Smith          nc - number of components per grid point
113347c6ae99SBarry Smith          col - number of colors needed in one direction for single component problem
113447c6ae99SBarry Smith 
113547c6ae99SBarry Smith   */
1136c1154cd5SBarry Smith   ierr = DMDAGetInfo(da,&dim,&m,&n,&M,&N,0,0,&nc,&s,&bx,&by,0,&st);CHKERRQ(ierr);
113747c6ae99SBarry Smith   col  = 2*s + 1;
1138c1154cd5SBarry Smith   /*
1139c1154cd5SBarry Smith        With one processor in periodic domains in a skinny dimension the code will label nonzero columns multiple times
1140c1154cd5SBarry Smith        because of "wrapping" around the end of the domain hitting an entry already counted in the other direction.
1141c1154cd5SBarry Smith   */
1142c1154cd5SBarry Smith   if (M == 1 && 2*s >= m) removedups = PETSC_TRUE;
1143c1154cd5SBarry Smith   if (N == 1 && 2*s >= n) removedups = PETSC_TRUE;
1144aa219208SBarry Smith   ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr);
1145aa219208SBarry Smith   ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr);
114647c6ae99SBarry Smith   ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr);
114747c6ae99SBarry Smith 
11484b26d1cfSBarry Smith   ierr = PetscMalloc1(col*col*nc,&cols);CHKERRQ(ierr);
11491411c6eeSJed Brown   ierr = DMGetLocalToGlobalMapping(da,&ltog);CHKERRQ(ierr);
115047c6ae99SBarry Smith 
115106ca8cadSBarry Smith   ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr);
115247c6ae99SBarry Smith   /* determine the matrix preallocation information */
115347c6ae99SBarry Smith   ierr = MatPreallocateInitialize(comm,nc*nx*ny,nc*nx*ny,dnz,onz);CHKERRQ(ierr);
115447c6ae99SBarry Smith   for (i=xs; i<xs+nx; i++) {
115547c6ae99SBarry Smith 
1156bff4a2f0SMatthew G. Knepley     pstart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
1157bff4a2f0SMatthew G. Knepley     pend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
115847c6ae99SBarry Smith 
115947c6ae99SBarry Smith     for (j=ys; j<ys+ny; j++) {
116047c6ae99SBarry Smith       slot = i - gxs + gnx*(j - gys);
116147c6ae99SBarry Smith 
1162bff4a2f0SMatthew G. Knepley       lstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
1163bff4a2f0SMatthew G. Knepley       lend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
116447c6ae99SBarry Smith 
116547c6ae99SBarry Smith       for (k=0; k<nc; k++) {
116647c6ae99SBarry Smith         cnt = 0;
116747c6ae99SBarry Smith         for (l=lstart; l<lend+1; l++) {
116847c6ae99SBarry Smith           for (p=pstart; p<pend+1; p++) {
116947c6ae99SBarry Smith             if (l || p) {
1170aa219208SBarry Smith               if ((st == DMDA_STENCIL_BOX) || (!l || !p)) {  /* entries on star */
11718865f1eaSKarl Rupp                 for (ifill_col=ofill[k]; ifill_col<ofill[k+1]; ifill_col++) cols[cnt++] = ofill[ifill_col] + nc*(slot + gnx*l + p);
117247c6ae99SBarry Smith               }
117347c6ae99SBarry Smith             } else {
117447c6ae99SBarry Smith               if (dfill) {
11758865f1eaSKarl Rupp                 for (ifill_col=dfill[k]; ifill_col<dfill[k+1]; ifill_col++) cols[cnt++] = dfill[ifill_col] + nc*(slot + gnx*l + p);
117647c6ae99SBarry Smith               } else {
11778865f1eaSKarl Rupp                 for (ifill_col=0; ifill_col<nc; ifill_col++) cols[cnt++] = ifill_col + nc*(slot + gnx*l + p);
117847c6ae99SBarry Smith               }
117947c6ae99SBarry Smith             }
118047c6ae99SBarry Smith           }
118147c6ae99SBarry Smith         }
118247c6ae99SBarry Smith         row    = k + nc*(slot);
1183c0ab637bSBarry Smith         maxcnt = PetscMax(maxcnt,cnt);
1184c1154cd5SBarry Smith         if (removedups) {
1185c1154cd5SBarry Smith           ierr   = MatPreallocateSetLocalRemoveDups(ltog,1,&row,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr);
1186c1154cd5SBarry Smith         } else {
1187784ac674SJed Brown           ierr   = MatPreallocateSetLocal(ltog,1,&row,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr);
118847c6ae99SBarry Smith         }
118947c6ae99SBarry Smith       }
119047c6ae99SBarry Smith     }
1191c1154cd5SBarry Smith   }
119247c6ae99SBarry Smith   ierr = MatSeqAIJSetPreallocation(J,0,dnz);CHKERRQ(ierr);
119347c6ae99SBarry Smith   ierr = MatMPIAIJSetPreallocation(J,0,dnz,0,onz);CHKERRQ(ierr);
119447c6ae99SBarry Smith   ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr);
1195784ac674SJed Brown   ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr);
119647c6ae99SBarry Smith 
119747c6ae99SBarry Smith   /*
119847c6ae99SBarry Smith     For each node in the grid: we get the neighbors in the local (on processor ordering
119947c6ae99SBarry Smith     that includes the ghost points) then MatSetValuesLocal() maps those indices to the global
120047c6ae99SBarry Smith     PETSc ordering.
120147c6ae99SBarry Smith   */
1202fcfd50ebSBarry Smith   if (!da->prealloc_only) {
1203c0ab637bSBarry Smith     ierr = PetscCalloc1(maxcnt,&values);CHKERRQ(ierr);
120447c6ae99SBarry Smith     for (i=xs; i<xs+nx; i++) {
120547c6ae99SBarry Smith 
1206bff4a2f0SMatthew G. Knepley       pstart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
1207bff4a2f0SMatthew G. Knepley       pend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
120847c6ae99SBarry Smith 
120947c6ae99SBarry Smith       for (j=ys; j<ys+ny; j++) {
121047c6ae99SBarry Smith         slot = i - gxs + gnx*(j - gys);
121147c6ae99SBarry Smith 
1212bff4a2f0SMatthew G. Knepley         lstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
1213bff4a2f0SMatthew G. Knepley         lend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
121447c6ae99SBarry Smith 
121547c6ae99SBarry Smith         for (k=0; k<nc; k++) {
121647c6ae99SBarry Smith           cnt = 0;
121747c6ae99SBarry Smith           for (l=lstart; l<lend+1; l++) {
121847c6ae99SBarry Smith             for (p=pstart; p<pend+1; p++) {
121947c6ae99SBarry Smith               if (l || p) {
1220aa219208SBarry Smith                 if ((st == DMDA_STENCIL_BOX) || (!l || !p)) {  /* entries on star */
12218865f1eaSKarl Rupp                   for (ifill_col=ofill[k]; ifill_col<ofill[k+1]; ifill_col++) cols[cnt++] = ofill[ifill_col] + nc*(slot + gnx*l + p);
122247c6ae99SBarry Smith                 }
122347c6ae99SBarry Smith               } else {
122447c6ae99SBarry Smith                 if (dfill) {
12258865f1eaSKarl Rupp                   for (ifill_col=dfill[k]; ifill_col<dfill[k+1]; ifill_col++) cols[cnt++] = dfill[ifill_col] + nc*(slot + gnx*l + p);
122647c6ae99SBarry Smith                 } else {
12278865f1eaSKarl Rupp                   for (ifill_col=0; ifill_col<nc; ifill_col++) cols[cnt++] = ifill_col + nc*(slot + gnx*l + p);
122847c6ae99SBarry Smith                 }
122947c6ae99SBarry Smith               }
123047c6ae99SBarry Smith             }
123147c6ae99SBarry Smith           }
123247c6ae99SBarry Smith           row  = k + nc*(slot);
123347c6ae99SBarry Smith           ierr = MatSetValuesLocal(J,1,&row,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
123447c6ae99SBarry Smith         }
123547c6ae99SBarry Smith       }
123647c6ae99SBarry Smith     }
123747c6ae99SBarry Smith     ierr = PetscFree(values);CHKERRQ(ierr);
123847c6ae99SBarry Smith     ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
123947c6ae99SBarry Smith     ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1240189e4007SBarry Smith     ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr);
124147c6ae99SBarry Smith   }
124247c6ae99SBarry Smith   ierr = PetscFree(cols);CHKERRQ(ierr);
124347c6ae99SBarry Smith   PetscFunctionReturn(0);
124447c6ae99SBarry Smith }
124547c6ae99SBarry Smith 
124647c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/
124747c6ae99SBarry Smith 
1248950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_3d_MPIAIJ(DM da,Mat J)
124947c6ae99SBarry Smith {
125047c6ae99SBarry Smith   PetscErrorCode         ierr;
125147c6ae99SBarry Smith   PetscInt               xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny;
12520298fd71SBarry Smith   PetscInt               m,n,dim,s,*cols = NULL,k,nc,*rows = NULL,col,cnt,l,p,*dnz = NULL,*onz = NULL;
1253c1154cd5SBarry Smith   PetscInt               istart,iend,jstart,jend,kstart,kend,zs,nz,gzs,gnz,ii,jj,kk,M,N,P;
125447c6ae99SBarry Smith   MPI_Comm               comm;
125547c6ae99SBarry Smith   PetscScalar            *values;
1256bff4a2f0SMatthew G. Knepley   DMBoundaryType         bx,by,bz;
125745b6f7e9SBarry Smith   ISLocalToGlobalMapping ltog;
1258aa219208SBarry Smith   DMDAStencilType        st;
1259c1154cd5SBarry Smith   PetscBool              removedups = PETSC_FALSE;
126047c6ae99SBarry Smith 
126147c6ae99SBarry Smith   PetscFunctionBegin;
126247c6ae99SBarry Smith   /*
126347c6ae99SBarry Smith          nc - number of components per grid point
126447c6ae99SBarry Smith          col - number of colors needed in one direction for single component problem
126547c6ae99SBarry Smith 
126647c6ae99SBarry Smith   */
1267c1154cd5SBarry Smith   ierr = DMDAGetInfo(da,&dim,&m,&n,&p,&M,&N,&P,&nc,&s,&bx,&by,&bz,&st);CHKERRQ(ierr);
126847c6ae99SBarry Smith   col  = 2*s + 1;
126947c6ae99SBarry Smith 
1270c1154cd5SBarry Smith   /*
1271c1154cd5SBarry Smith        With one processor in periodic domains in a skinny dimension the code will label nonzero columns multiple times
1272c1154cd5SBarry Smith        because of "wrapping" around the end of the domain hitting an entry already counted in the other direction.
1273c1154cd5SBarry Smith   */
1274c1154cd5SBarry Smith   if (M == 1 && 2*s >= m) removedups = PETSC_TRUE;
1275c1154cd5SBarry Smith   if (N == 1 && 2*s >= n) removedups = PETSC_TRUE;
1276c1154cd5SBarry Smith   if (P == 1 && 2*s >= p) removedups = PETSC_TRUE;
1277c1154cd5SBarry Smith 
1278aa219208SBarry Smith   ierr = DMDAGetCorners(da,&xs,&ys,&zs,&nx,&ny,&nz);CHKERRQ(ierr);
1279aa219208SBarry Smith   ierr = DMDAGetGhostCorners(da,&gxs,&gys,&gzs,&gnx,&gny,&gnz);CHKERRQ(ierr);
128047c6ae99SBarry Smith   ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr);
128147c6ae99SBarry Smith 
1282dcca6d9dSJed Brown   ierr = PetscMalloc2(nc,&rows,col*col*col*nc*nc,&cols);CHKERRQ(ierr);
12831411c6eeSJed Brown   ierr = DMGetLocalToGlobalMapping(da,&ltog);CHKERRQ(ierr);
128447c6ae99SBarry Smith 
128506ca8cadSBarry Smith   ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr);
128647c6ae99SBarry Smith   /* determine the matrix preallocation information */
128747c6ae99SBarry Smith   ierr = MatPreallocateInitialize(comm,nc*nx*ny*nz,nc*nx*ny*nz,dnz,onz);CHKERRQ(ierr);
128847c6ae99SBarry Smith   for (i=xs; i<xs+nx; i++) {
1289bff4a2f0SMatthew G. Knepley     istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
1290bff4a2f0SMatthew G. Knepley     iend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
129147c6ae99SBarry Smith     for (j=ys; j<ys+ny; j++) {
1292bff4a2f0SMatthew G. Knepley       jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
1293bff4a2f0SMatthew G. Knepley       jend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
129447c6ae99SBarry Smith       for (k=zs; k<zs+nz; k++) {
1295bff4a2f0SMatthew G. Knepley         kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k));
1296bff4a2f0SMatthew G. Knepley         kend   = (bz == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,p-k-1));
129747c6ae99SBarry Smith 
129847c6ae99SBarry Smith         slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs);
129947c6ae99SBarry Smith 
130047c6ae99SBarry Smith         cnt = 0;
130147c6ae99SBarry Smith         for (l=0; l<nc; l++) {
130247c6ae99SBarry Smith           for (ii=istart; ii<iend+1; ii++) {
130347c6ae99SBarry Smith             for (jj=jstart; jj<jend+1; jj++) {
130447c6ae99SBarry Smith               for (kk=kstart; kk<kend+1; kk++) {
1305aa219208SBarry Smith                 if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/
130647c6ae99SBarry Smith                   cols[cnt++] = l + nc*(slot + ii + gnx*jj + gnx*gny*kk);
130747c6ae99SBarry Smith                 }
130847c6ae99SBarry Smith               }
130947c6ae99SBarry Smith             }
131047c6ae99SBarry Smith           }
131147c6ae99SBarry Smith           rows[l] = l + nc*(slot);
131247c6ae99SBarry Smith         }
1313c1154cd5SBarry Smith         if (removedups) {
1314c1154cd5SBarry Smith           ierr = MatPreallocateSetLocalRemoveDups(ltog,nc,rows,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr);
1315c1154cd5SBarry Smith         } else {
1316784ac674SJed Brown           ierr = MatPreallocateSetLocal(ltog,nc,rows,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr);
131747c6ae99SBarry Smith         }
131847c6ae99SBarry Smith       }
131947c6ae99SBarry Smith     }
1320c1154cd5SBarry Smith   }
1321f73d5cc4SBarry Smith   ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr);
132247c6ae99SBarry Smith   ierr = MatSeqAIJSetPreallocation(J,0,dnz);CHKERRQ(ierr);
132347c6ae99SBarry Smith   ierr = MatMPIAIJSetPreallocation(J,0,dnz,0,onz);CHKERRQ(ierr);
132447c6ae99SBarry Smith   ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr);
1325784ac674SJed Brown   ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr);
132647c6ae99SBarry Smith 
132747c6ae99SBarry Smith   /*
132847c6ae99SBarry Smith     For each node in the grid: we get the neighbors in the local (on processor ordering
132947c6ae99SBarry Smith     that includes the ghost points) then MatSetValuesLocal() maps those indices to the global
133047c6ae99SBarry Smith     PETSc ordering.
133147c6ae99SBarry Smith   */
1332fcfd50ebSBarry Smith   if (!da->prealloc_only) {
13331795a4d1SJed Brown     ierr = PetscCalloc1(col*col*col*nc*nc*nc,&values);CHKERRQ(ierr);
133447c6ae99SBarry Smith     for (i=xs; i<xs+nx; i++) {
1335bff4a2f0SMatthew G. Knepley       istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
1336bff4a2f0SMatthew G. Knepley       iend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
133747c6ae99SBarry Smith       for (j=ys; j<ys+ny; j++) {
1338bff4a2f0SMatthew G. Knepley         jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
1339bff4a2f0SMatthew G. Knepley         jend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
134047c6ae99SBarry Smith         for (k=zs; k<zs+nz; k++) {
1341bff4a2f0SMatthew G. Knepley           kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k));
1342bff4a2f0SMatthew G. Knepley           kend   = (bz == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,p-k-1));
134347c6ae99SBarry Smith 
134447c6ae99SBarry Smith           slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs);
134547c6ae99SBarry Smith 
134647c6ae99SBarry Smith           cnt = 0;
134747c6ae99SBarry Smith           for (l=0; l<nc; l++) {
134847c6ae99SBarry Smith             for (ii=istart; ii<iend+1; ii++) {
134947c6ae99SBarry Smith               for (jj=jstart; jj<jend+1; jj++) {
135047c6ae99SBarry Smith                 for (kk=kstart; kk<kend+1; kk++) {
1351aa219208SBarry Smith                   if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/
135247c6ae99SBarry Smith                     cols[cnt++] = l + nc*(slot + ii + gnx*jj + gnx*gny*kk);
135347c6ae99SBarry Smith                   }
135447c6ae99SBarry Smith                 }
135547c6ae99SBarry Smith               }
135647c6ae99SBarry Smith             }
135747c6ae99SBarry Smith             rows[l] = l + nc*(slot);
135847c6ae99SBarry Smith           }
135947c6ae99SBarry Smith           ierr = MatSetValuesLocal(J,nc,rows,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
136047c6ae99SBarry Smith         }
136147c6ae99SBarry Smith       }
136247c6ae99SBarry Smith     }
136347c6ae99SBarry Smith     ierr = PetscFree(values);CHKERRQ(ierr);
136447c6ae99SBarry Smith     ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
136547c6ae99SBarry Smith     ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1366189e4007SBarry Smith     ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr);
136747c6ae99SBarry Smith   }
136847c6ae99SBarry Smith   ierr = PetscFree2(rows,cols);CHKERRQ(ierr);
136947c6ae99SBarry Smith   PetscFunctionReturn(0);
137047c6ae99SBarry Smith }
137147c6ae99SBarry Smith 
137247c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/
137347c6ae99SBarry Smith 
1374ce308e1dSBarry Smith PetscErrorCode DMCreateMatrix_DA_1d_MPIAIJ_Fill(DM da,Mat J)
1375ce308e1dSBarry Smith {
1376ce308e1dSBarry Smith   PetscErrorCode         ierr;
1377ce308e1dSBarry Smith   DM_DA                  *dd = (DM_DA*)da->data;
1378ce308e1dSBarry Smith   PetscInt               xs,nx,i,j,gxs,gnx,row,k,l;
13798d4c968fSBarry Smith   PetscInt               m,dim,s,*cols = NULL,nc,cnt,maxcnt = 0,*ocols;
13800acb5bebSBarry Smith   PetscInt               *ofill = dd->ofill,*dfill = dd->dfill;
1381ce308e1dSBarry Smith   PetscScalar            *values;
1382bff4a2f0SMatthew G. Knepley   DMBoundaryType         bx;
138345b6f7e9SBarry Smith   ISLocalToGlobalMapping ltog;
1384ce308e1dSBarry Smith   PetscMPIInt            rank,size;
1385ce308e1dSBarry Smith 
1386ce308e1dSBarry Smith   PetscFunctionBegin;
1387bff4a2f0SMatthew G. Knepley   if (dd->bx == DM_BOUNDARY_PERIODIC) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"With fill provided not implemented with periodic boundary conditions");
1388ce94432eSBarry Smith   ierr = MPI_Comm_rank(PetscObjectComm((PetscObject)da),&rank);CHKERRQ(ierr);
1389ce94432eSBarry Smith   ierr = MPI_Comm_size(PetscObjectComm((PetscObject)da),&size);CHKERRQ(ierr);
1390ce308e1dSBarry Smith 
1391ce308e1dSBarry Smith   /*
1392ce308e1dSBarry Smith          nc - number of components per grid point
1393ce308e1dSBarry Smith 
1394ce308e1dSBarry Smith   */
1395ce308e1dSBarry Smith   ierr = DMDAGetInfo(da,&dim,&m,0,0,0,0,0,&nc,&s,&bx,0,0,0);CHKERRQ(ierr);
1396ce308e1dSBarry Smith   ierr = DMDAGetCorners(da,&xs,0,0,&nx,0,0);CHKERRQ(ierr);
1397ce308e1dSBarry Smith   ierr = DMDAGetGhostCorners(da,&gxs,0,0,&gnx,0,0);CHKERRQ(ierr);
1398ce308e1dSBarry Smith 
1399ce308e1dSBarry Smith   ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr);
14001795a4d1SJed Brown   ierr = PetscCalloc2(nx*nc,&cols,nx*nc,&ocols);CHKERRQ(ierr);
1401ce308e1dSBarry Smith 
1402ce308e1dSBarry Smith   /*
1403ce308e1dSBarry Smith         note should be smaller for first and last process with no periodic
1404ce308e1dSBarry Smith         does not handle dfill
1405ce308e1dSBarry Smith   */
1406ce308e1dSBarry Smith   cnt = 0;
1407ce308e1dSBarry Smith   /* coupling with process to the left */
1408ce308e1dSBarry Smith   for (i=0; i<s; i++) {
1409ce308e1dSBarry Smith     for (j=0; j<nc; j++) {
1410ce308e1dSBarry Smith       ocols[cnt] = ((!rank) ? 0 : (s - i)*(ofill[j+1] - ofill[j]));
14110acb5bebSBarry Smith       cols[cnt]  = dfill[j+1] - dfill[j] + (s + i)*(ofill[j+1] - ofill[j]);
1412c0ab637bSBarry Smith       maxcnt = PetscMax(maxcnt,ocols[cnt]+cols[cnt]);
1413ce308e1dSBarry Smith       cnt++;
1414ce308e1dSBarry Smith     }
1415ce308e1dSBarry Smith   }
1416ce308e1dSBarry Smith   for (i=s; i<nx-s; i++) {
1417ce308e1dSBarry Smith     for (j=0; j<nc; j++) {
14180acb5bebSBarry Smith       cols[cnt] = dfill[j+1] - dfill[j] + 2*s*(ofill[j+1] - ofill[j]);
1419c0ab637bSBarry Smith       maxcnt = PetscMax(maxcnt,ocols[cnt]+cols[cnt]);
1420ce308e1dSBarry Smith       cnt++;
1421ce308e1dSBarry Smith     }
1422ce308e1dSBarry Smith   }
1423ce308e1dSBarry Smith   /* coupling with process to the right */
1424ce308e1dSBarry Smith   for (i=nx-s; i<nx; i++) {
1425ce308e1dSBarry Smith     for (j=0; j<nc; j++) {
1426ce308e1dSBarry Smith       ocols[cnt] = ((rank == (size-1)) ? 0 : (i - nx + s + 1)*(ofill[j+1] - ofill[j]));
14270acb5bebSBarry Smith       cols[cnt]  = dfill[j+1] - dfill[j] + (s + nx - i - 1)*(ofill[j+1] - ofill[j]);
1428c0ab637bSBarry Smith       maxcnt = PetscMax(maxcnt,ocols[cnt]+cols[cnt]);
1429ce308e1dSBarry Smith       cnt++;
1430ce308e1dSBarry Smith     }
1431ce308e1dSBarry Smith   }
1432ce308e1dSBarry Smith 
1433ce308e1dSBarry Smith   ierr = MatSeqAIJSetPreallocation(J,0,cols);CHKERRQ(ierr);
1434ce308e1dSBarry Smith   ierr = MatMPIAIJSetPreallocation(J,0,cols,0,ocols);CHKERRQ(ierr);
1435ce308e1dSBarry Smith   ierr = PetscFree2(cols,ocols);CHKERRQ(ierr);
1436ce308e1dSBarry Smith 
1437ce308e1dSBarry Smith   ierr = DMGetLocalToGlobalMapping(da,&ltog);CHKERRQ(ierr);
1438ce308e1dSBarry Smith   ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr);
1439ce308e1dSBarry Smith 
1440ce308e1dSBarry Smith   /*
1441ce308e1dSBarry Smith     For each node in the grid: we get the neighbors in the local (on processor ordering
1442ce308e1dSBarry Smith     that includes the ghost points) then MatSetValuesLocal() maps those indices to the global
1443ce308e1dSBarry Smith     PETSc ordering.
1444ce308e1dSBarry Smith   */
1445ce308e1dSBarry Smith   if (!da->prealloc_only) {
1446c0ab637bSBarry Smith     ierr = PetscCalloc2(maxcnt,&values,maxcnt,&cols);CHKERRQ(ierr);
1447ce308e1dSBarry Smith 
1448ce308e1dSBarry Smith     row = xs*nc;
1449ce308e1dSBarry Smith     /* coupling with process to the left */
1450ce308e1dSBarry Smith     for (i=xs; i<xs+s; i++) {
1451ce308e1dSBarry Smith       for (j=0; j<nc; j++) {
1452ce308e1dSBarry Smith         cnt = 0;
1453ce308e1dSBarry Smith         if (rank) {
1454ce308e1dSBarry Smith           for (l=0; l<s; l++) {
1455ce308e1dSBarry Smith             for (k=ofill[j]; k<ofill[j+1]; k++) cols[cnt++] = (i - s + l)*nc + ofill[k];
1456ce308e1dSBarry Smith           }
1457ce308e1dSBarry Smith         }
14580acb5bebSBarry Smith         if (dfill) {
14590acb5bebSBarry Smith           for (k=dfill[j]; k<dfill[j+1]; k++) {
14600acb5bebSBarry Smith             cols[cnt++] = i*nc + dfill[k];
14610acb5bebSBarry Smith           }
14620acb5bebSBarry Smith         } else {
1463ce308e1dSBarry Smith           for (k=0; k<nc; k++) {
1464ce308e1dSBarry Smith             cols[cnt++] = i*nc + k;
1465ce308e1dSBarry Smith           }
14660acb5bebSBarry Smith         }
1467ce308e1dSBarry Smith         for (l=0; l<s; l++) {
1468ce308e1dSBarry Smith           for (k=ofill[j]; k<ofill[j+1]; k++) cols[cnt++] = (i + s - l)*nc + ofill[k];
1469ce308e1dSBarry Smith         }
1470ce308e1dSBarry Smith         ierr = MatSetValues(J,1,&row,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
1471ce308e1dSBarry Smith         row++;
1472ce308e1dSBarry Smith       }
1473ce308e1dSBarry Smith     }
1474ce308e1dSBarry Smith     for (i=xs+s; i<xs+nx-s; i++) {
1475ce308e1dSBarry Smith       for (j=0; j<nc; j++) {
1476ce308e1dSBarry Smith         cnt = 0;
1477ce308e1dSBarry Smith         for (l=0; l<s; l++) {
1478ce308e1dSBarry Smith           for (k=ofill[j]; k<ofill[j+1]; k++) cols[cnt++] = (i - s + l)*nc + ofill[k];
1479ce308e1dSBarry Smith         }
14800acb5bebSBarry Smith         if (dfill) {
14810acb5bebSBarry Smith           for (k=dfill[j]; k<dfill[j+1]; k++) {
14820acb5bebSBarry Smith             cols[cnt++] = i*nc + dfill[k];
14830acb5bebSBarry Smith           }
14840acb5bebSBarry Smith         } else {
1485ce308e1dSBarry Smith           for (k=0; k<nc; k++) {
1486ce308e1dSBarry Smith             cols[cnt++] = i*nc + k;
1487ce308e1dSBarry Smith           }
14880acb5bebSBarry Smith         }
1489ce308e1dSBarry Smith         for (l=0; l<s; l++) {
1490ce308e1dSBarry Smith           for (k=ofill[j]; k<ofill[j+1]; k++) cols[cnt++] = (i + s - l)*nc + ofill[k];
1491ce308e1dSBarry Smith         }
1492ce308e1dSBarry Smith         ierr = MatSetValues(J,1,&row,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
1493ce308e1dSBarry Smith         row++;
1494ce308e1dSBarry Smith       }
1495ce308e1dSBarry Smith     }
1496ce308e1dSBarry Smith     /* coupling with process to the right */
1497ce308e1dSBarry Smith     for (i=xs+nx-s; i<xs+nx; i++) {
1498ce308e1dSBarry Smith       for (j=0; j<nc; j++) {
1499ce308e1dSBarry Smith         cnt = 0;
1500ce308e1dSBarry Smith         for (l=0; l<s; l++) {
1501ce308e1dSBarry Smith           for (k=ofill[j]; k<ofill[j+1]; k++) cols[cnt++] = (i - s + l)*nc + ofill[k];
1502ce308e1dSBarry Smith         }
15030acb5bebSBarry Smith         if (dfill) {
15040acb5bebSBarry Smith           for (k=dfill[j]; k<dfill[j+1]; k++) {
15050acb5bebSBarry Smith             cols[cnt++] = i*nc + dfill[k];
15060acb5bebSBarry Smith           }
15070acb5bebSBarry Smith         } else {
1508ce308e1dSBarry Smith           for (k=0; k<nc; k++) {
1509ce308e1dSBarry Smith             cols[cnt++] = i*nc + k;
1510ce308e1dSBarry Smith           }
15110acb5bebSBarry Smith         }
1512ce308e1dSBarry Smith         if (rank < size-1) {
1513ce308e1dSBarry Smith           for (l=0; l<s; l++) {
1514ce308e1dSBarry Smith             for (k=ofill[j]; k<ofill[j+1]; k++) cols[cnt++] = (i + s - l)*nc + ofill[k];
1515ce308e1dSBarry Smith           }
1516ce308e1dSBarry Smith         }
1517ce308e1dSBarry Smith         ierr = MatSetValues(J,1,&row,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
1518ce308e1dSBarry Smith         row++;
1519ce308e1dSBarry Smith       }
1520ce308e1dSBarry Smith     }
1521c0ab637bSBarry Smith     ierr = PetscFree2(values,cols);CHKERRQ(ierr);
1522ce308e1dSBarry Smith     ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1523ce308e1dSBarry Smith     ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1524189e4007SBarry Smith     ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr);
1525ce308e1dSBarry Smith   }
1526ce308e1dSBarry Smith   PetscFunctionReturn(0);
1527ce308e1dSBarry Smith }
1528ce308e1dSBarry Smith 
1529ce308e1dSBarry Smith /* ---------------------------------------------------------------------------------*/
1530ce308e1dSBarry Smith 
1531950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_1d_MPIAIJ(DM da,Mat J)
153247c6ae99SBarry Smith {
153347c6ae99SBarry Smith   PetscErrorCode         ierr;
153447c6ae99SBarry Smith   PetscInt               xs,nx,i,i1,slot,gxs,gnx;
15350298fd71SBarry Smith   PetscInt               m,dim,s,*cols = NULL,nc,*rows = NULL,col,cnt,l;
153647c6ae99SBarry Smith   PetscInt               istart,iend;
153747c6ae99SBarry Smith   PetscScalar            *values;
1538bff4a2f0SMatthew G. Knepley   DMBoundaryType         bx;
153945b6f7e9SBarry Smith   ISLocalToGlobalMapping ltog;
154047c6ae99SBarry Smith 
154147c6ae99SBarry Smith   PetscFunctionBegin;
154247c6ae99SBarry Smith   /*
154347c6ae99SBarry Smith          nc - number of components per grid point
154447c6ae99SBarry Smith          col - number of colors needed in one direction for single component problem
154547c6ae99SBarry Smith 
154647c6ae99SBarry Smith   */
15471321219cSEthan Coon   ierr = DMDAGetInfo(da,&dim,&m,0,0,0,0,0,&nc,&s,&bx,0,0,0);CHKERRQ(ierr);
154847c6ae99SBarry Smith   col  = 2*s + 1;
154947c6ae99SBarry Smith 
1550aa219208SBarry Smith   ierr = DMDAGetCorners(da,&xs,0,0,&nx,0,0);CHKERRQ(ierr);
1551aa219208SBarry Smith   ierr = DMDAGetGhostCorners(da,&gxs,0,0,&gnx,0,0);CHKERRQ(ierr);
155247c6ae99SBarry Smith 
1553f73d5cc4SBarry Smith   ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr);
155447c6ae99SBarry Smith   ierr = MatSeqAIJSetPreallocation(J,col*nc,0);CHKERRQ(ierr);
155547c6ae99SBarry Smith   ierr = MatMPIAIJSetPreallocation(J,col*nc,0,col*nc,0);CHKERRQ(ierr);
155647c6ae99SBarry Smith 
15571411c6eeSJed Brown   ierr = DMGetLocalToGlobalMapping(da,&ltog);CHKERRQ(ierr);
1558784ac674SJed Brown   ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr);
155947c6ae99SBarry Smith 
156047c6ae99SBarry Smith   /*
156147c6ae99SBarry Smith     For each node in the grid: we get the neighbors in the local (on processor ordering
156247c6ae99SBarry Smith     that includes the ghost points) then MatSetValuesLocal() maps those indices to the global
156347c6ae99SBarry Smith     PETSc ordering.
156447c6ae99SBarry Smith   */
1565fcfd50ebSBarry Smith   if (!da->prealloc_only) {
1566dcca6d9dSJed Brown     ierr = PetscMalloc2(nc,&rows,col*nc*nc,&cols);CHKERRQ(ierr);
15671795a4d1SJed Brown     ierr = PetscCalloc1(col*nc*nc,&values);CHKERRQ(ierr);
156847c6ae99SBarry Smith     for (i=xs; i<xs+nx; i++) {
156947c6ae99SBarry Smith       istart = PetscMax(-s,gxs - i);
157047c6ae99SBarry Smith       iend   = PetscMin(s,gxs + gnx - i - 1);
157147c6ae99SBarry Smith       slot   = i - gxs;
157247c6ae99SBarry Smith 
157347c6ae99SBarry Smith       cnt = 0;
157447c6ae99SBarry Smith       for (l=0; l<nc; l++) {
157547c6ae99SBarry Smith         for (i1=istart; i1<iend+1; i1++) {
157647c6ae99SBarry Smith           cols[cnt++] = l + nc*(slot + i1);
157747c6ae99SBarry Smith         }
157847c6ae99SBarry Smith         rows[l] = l + nc*(slot);
157947c6ae99SBarry Smith       }
158047c6ae99SBarry Smith       ierr = MatSetValuesLocal(J,nc,rows,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
158147c6ae99SBarry Smith     }
158247c6ae99SBarry Smith     ierr = PetscFree(values);CHKERRQ(ierr);
158347c6ae99SBarry Smith     ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
158447c6ae99SBarry Smith     ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1585189e4007SBarry Smith     ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr);
158647c6ae99SBarry Smith     ierr = PetscFree2(rows,cols);CHKERRQ(ierr);
1587ce308e1dSBarry Smith   }
158847c6ae99SBarry Smith   PetscFunctionReturn(0);
158947c6ae99SBarry Smith }
159047c6ae99SBarry Smith 
1591950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_2d_MPIBAIJ(DM da,Mat J)
159247c6ae99SBarry Smith {
159347c6ae99SBarry Smith   PetscErrorCode         ierr;
159447c6ae99SBarry Smith   PetscInt               xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny;
159547c6ae99SBarry Smith   PetscInt               m,n,dim,s,*cols,nc,col,cnt,*dnz,*onz;
159647c6ae99SBarry Smith   PetscInt               istart,iend,jstart,jend,ii,jj;
159747c6ae99SBarry Smith   MPI_Comm               comm;
159847c6ae99SBarry Smith   PetscScalar            *values;
1599bff4a2f0SMatthew G. Knepley   DMBoundaryType         bx,by;
1600aa219208SBarry Smith   DMDAStencilType        st;
160145b6f7e9SBarry Smith   ISLocalToGlobalMapping ltog;
160247c6ae99SBarry Smith 
160347c6ae99SBarry Smith   PetscFunctionBegin;
160447c6ae99SBarry Smith   /*
160547c6ae99SBarry Smith      nc - number of components per grid point
160647c6ae99SBarry Smith      col - number of colors needed in one direction for single component problem
160747c6ae99SBarry Smith   */
16081321219cSEthan Coon   ierr = DMDAGetInfo(da,&dim,&m,&n,0,0,0,0,&nc,&s,&bx,&by,0,&st);CHKERRQ(ierr);
160947c6ae99SBarry Smith   col  = 2*s + 1;
161047c6ae99SBarry Smith 
1611aa219208SBarry Smith   ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr);
1612aa219208SBarry Smith   ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr);
161347c6ae99SBarry Smith   ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr);
161447c6ae99SBarry Smith 
1615785e854fSJed Brown   ierr = PetscMalloc1(col*col*nc*nc,&cols);CHKERRQ(ierr);
161647c6ae99SBarry Smith 
16171411c6eeSJed Brown   ierr = DMGetLocalToGlobalMapping(da,&ltog);CHKERRQ(ierr);
161847c6ae99SBarry Smith 
161947c6ae99SBarry Smith   /* determine the matrix preallocation information */
162047c6ae99SBarry Smith   ierr = MatPreallocateInitialize(comm,nx*ny,nx*ny,dnz,onz);CHKERRQ(ierr);
162147c6ae99SBarry Smith   for (i=xs; i<xs+nx; i++) {
1622bff4a2f0SMatthew G. Knepley     istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
1623bff4a2f0SMatthew G. Knepley     iend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
162447c6ae99SBarry Smith     for (j=ys; j<ys+ny; j++) {
1625bff4a2f0SMatthew G. Knepley       jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
1626bff4a2f0SMatthew G. Knepley       jend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
162747c6ae99SBarry Smith       slot   = i - gxs + gnx*(j - gys);
162847c6ae99SBarry Smith 
162947c6ae99SBarry Smith       /* Find block columns in block row */
163047c6ae99SBarry Smith       cnt = 0;
163147c6ae99SBarry Smith       for (ii=istart; ii<iend+1; ii++) {
163247c6ae99SBarry Smith         for (jj=jstart; jj<jend+1; jj++) {
1633aa219208SBarry Smith           if (st == DMDA_STENCIL_BOX || !ii || !jj) { /* BOX or on the STAR */
163447c6ae99SBarry Smith             cols[cnt++] = slot + ii + gnx*jj;
163547c6ae99SBarry Smith           }
163647c6ae99SBarry Smith         }
163747c6ae99SBarry Smith       }
1638d6e23781SBarry Smith       ierr = MatPreallocateSetLocalBlock(ltog,1,&slot,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr);
163947c6ae99SBarry Smith     }
164047c6ae99SBarry Smith   }
164147c6ae99SBarry Smith   ierr = MatSeqBAIJSetPreallocation(J,nc,0,dnz);CHKERRQ(ierr);
164247c6ae99SBarry Smith   ierr = MatMPIBAIJSetPreallocation(J,nc,0,dnz,0,onz);CHKERRQ(ierr);
164347c6ae99SBarry Smith   ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr);
164447c6ae99SBarry Smith 
1645784ac674SJed Brown   ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr);
164647c6ae99SBarry Smith 
164747c6ae99SBarry Smith   /*
164847c6ae99SBarry Smith     For each node in the grid: we get the neighbors in the local (on processor ordering
164947c6ae99SBarry Smith     that includes the ghost points) then MatSetValuesLocal() maps those indices to the global
165047c6ae99SBarry Smith     PETSc ordering.
165147c6ae99SBarry Smith   */
1652fcfd50ebSBarry Smith   if (!da->prealloc_only) {
16531795a4d1SJed Brown     ierr = PetscCalloc1(col*col*nc*nc,&values);CHKERRQ(ierr);
165447c6ae99SBarry Smith     for (i=xs; i<xs+nx; i++) {
1655bff4a2f0SMatthew G. Knepley       istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
1656bff4a2f0SMatthew G. Knepley       iend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
165747c6ae99SBarry Smith       for (j=ys; j<ys+ny; j++) {
1658bff4a2f0SMatthew G. Knepley         jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
1659bff4a2f0SMatthew G. Knepley         jend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
166047c6ae99SBarry Smith         slot = i - gxs + gnx*(j - gys);
166147c6ae99SBarry Smith         cnt  = 0;
166247c6ae99SBarry Smith         for (ii=istart; ii<iend+1; ii++) {
166347c6ae99SBarry Smith           for (jj=jstart; jj<jend+1; jj++) {
1664aa219208SBarry Smith             if (st == DMDA_STENCIL_BOX || !ii || !jj) { /* BOX or on the STAR */
166547c6ae99SBarry Smith               cols[cnt++] = slot + ii + gnx*jj;
166647c6ae99SBarry Smith             }
166747c6ae99SBarry Smith           }
166847c6ae99SBarry Smith         }
166947c6ae99SBarry Smith         ierr = MatSetValuesBlockedLocal(J,1,&slot,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
167047c6ae99SBarry Smith       }
167147c6ae99SBarry Smith     }
167247c6ae99SBarry Smith     ierr = PetscFree(values);CHKERRQ(ierr);
167347c6ae99SBarry Smith     ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
167447c6ae99SBarry Smith     ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1675189e4007SBarry Smith     ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr);
167647c6ae99SBarry Smith   }
167747c6ae99SBarry Smith   ierr = PetscFree(cols);CHKERRQ(ierr);
167847c6ae99SBarry Smith   PetscFunctionReturn(0);
167947c6ae99SBarry Smith }
168047c6ae99SBarry Smith 
1681950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_3d_MPIBAIJ(DM da,Mat J)
168247c6ae99SBarry Smith {
168347c6ae99SBarry Smith   PetscErrorCode         ierr;
168447c6ae99SBarry Smith   PetscInt               xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny;
168547c6ae99SBarry Smith   PetscInt               m,n,dim,s,*cols,k,nc,col,cnt,p,*dnz,*onz;
168647c6ae99SBarry Smith   PetscInt               istart,iend,jstart,jend,kstart,kend,zs,nz,gzs,gnz,ii,jj,kk;
168747c6ae99SBarry Smith   MPI_Comm               comm;
168847c6ae99SBarry Smith   PetscScalar            *values;
1689bff4a2f0SMatthew G. Knepley   DMBoundaryType         bx,by,bz;
1690aa219208SBarry Smith   DMDAStencilType        st;
169145b6f7e9SBarry Smith   ISLocalToGlobalMapping ltog;
169247c6ae99SBarry Smith 
169347c6ae99SBarry Smith   PetscFunctionBegin;
169447c6ae99SBarry Smith   /*
169547c6ae99SBarry Smith          nc - number of components per grid point
169647c6ae99SBarry Smith          col - number of colors needed in one direction for single component problem
169747c6ae99SBarry Smith 
169847c6ae99SBarry Smith   */
16991321219cSEthan Coon   ierr = DMDAGetInfo(da,&dim,&m,&n,&p,0,0,0,&nc,&s,&bx,&by,&bz,&st);CHKERRQ(ierr);
170047c6ae99SBarry Smith   col  = 2*s + 1;
170147c6ae99SBarry Smith 
1702aa219208SBarry Smith   ierr = DMDAGetCorners(da,&xs,&ys,&zs,&nx,&ny,&nz);CHKERRQ(ierr);
1703aa219208SBarry Smith   ierr = DMDAGetGhostCorners(da,&gxs,&gys,&gzs,&gnx,&gny,&gnz);CHKERRQ(ierr);
170447c6ae99SBarry Smith   ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr);
170547c6ae99SBarry Smith 
1706785e854fSJed Brown   ierr = PetscMalloc1(col*col*col,&cols);CHKERRQ(ierr);
170747c6ae99SBarry Smith 
17081411c6eeSJed Brown   ierr = DMGetLocalToGlobalMapping(da,&ltog);CHKERRQ(ierr);
170947c6ae99SBarry Smith 
171047c6ae99SBarry Smith   /* determine the matrix preallocation information */
171147c6ae99SBarry Smith   ierr = MatPreallocateInitialize(comm,nx*ny*nz,nx*ny*nz,dnz,onz);CHKERRQ(ierr);
171247c6ae99SBarry Smith   for (i=xs; i<xs+nx; i++) {
1713bff4a2f0SMatthew G. Knepley     istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
1714bff4a2f0SMatthew G. Knepley     iend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
171547c6ae99SBarry Smith     for (j=ys; j<ys+ny; j++) {
1716bff4a2f0SMatthew G. Knepley       jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
1717bff4a2f0SMatthew G. Knepley       jend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
171847c6ae99SBarry Smith       for (k=zs; k<zs+nz; k++) {
1719bff4a2f0SMatthew G. Knepley         kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k));
1720bff4a2f0SMatthew G. Knepley         kend   = (bz == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,p-k-1));
172147c6ae99SBarry Smith 
172247c6ae99SBarry Smith         slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs);
172347c6ae99SBarry Smith 
172447c6ae99SBarry Smith         /* Find block columns in block row */
172547c6ae99SBarry Smith         cnt = 0;
172647c6ae99SBarry Smith         for (ii=istart; ii<iend+1; ii++) {
172747c6ae99SBarry Smith           for (jj=jstart; jj<jend+1; jj++) {
172847c6ae99SBarry Smith             for (kk=kstart; kk<kend+1; kk++) {
1729aa219208SBarry Smith               if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/
173047c6ae99SBarry Smith                 cols[cnt++] = slot + ii + gnx*jj + gnx*gny*kk;
173147c6ae99SBarry Smith               }
173247c6ae99SBarry Smith             }
173347c6ae99SBarry Smith           }
173447c6ae99SBarry Smith         }
1735d6e23781SBarry Smith         ierr = MatPreallocateSetLocalBlock(ltog,1,&slot,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr);
173647c6ae99SBarry Smith       }
173747c6ae99SBarry Smith     }
173847c6ae99SBarry Smith   }
173947c6ae99SBarry Smith   ierr = MatSeqBAIJSetPreallocation(J,nc,0,dnz);CHKERRQ(ierr);
174047c6ae99SBarry Smith   ierr = MatMPIBAIJSetPreallocation(J,nc,0,dnz,0,onz);CHKERRQ(ierr);
174147c6ae99SBarry Smith   ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr);
174247c6ae99SBarry Smith 
1743784ac674SJed Brown   ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr);
174447c6ae99SBarry Smith 
174547c6ae99SBarry Smith   /*
174647c6ae99SBarry Smith     For each node in the grid: we get the neighbors in the local (on processor ordering
174747c6ae99SBarry Smith     that includes the ghost points) then MatSetValuesLocal() maps those indices to the global
174847c6ae99SBarry Smith     PETSc ordering.
174947c6ae99SBarry Smith   */
1750fcfd50ebSBarry Smith   if (!da->prealloc_only) {
17511795a4d1SJed Brown     ierr = PetscCalloc1(col*col*col*nc*nc,&values);CHKERRQ(ierr);
175247c6ae99SBarry Smith     for (i=xs; i<xs+nx; i++) {
1753bff4a2f0SMatthew G. Knepley       istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
1754bff4a2f0SMatthew G. Knepley       iend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
175547c6ae99SBarry Smith       for (j=ys; j<ys+ny; j++) {
1756bff4a2f0SMatthew G. Knepley         jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
1757bff4a2f0SMatthew G. Knepley         jend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
175847c6ae99SBarry Smith         for (k=zs; k<zs+nz; k++) {
1759bff4a2f0SMatthew G. Knepley           kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k));
1760bff4a2f0SMatthew G. Knepley           kend   = (bz == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,p-k-1));
176147c6ae99SBarry Smith 
176247c6ae99SBarry Smith           slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs);
176347c6ae99SBarry Smith 
176447c6ae99SBarry Smith           cnt = 0;
176547c6ae99SBarry Smith           for (ii=istart; ii<iend+1; ii++) {
176647c6ae99SBarry Smith             for (jj=jstart; jj<jend+1; jj++) {
176747c6ae99SBarry Smith               for (kk=kstart; kk<kend+1; kk++) {
1768aa219208SBarry Smith                 if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/
176947c6ae99SBarry Smith                   cols[cnt++] = slot + ii + gnx*jj + gnx*gny*kk;
177047c6ae99SBarry Smith                 }
177147c6ae99SBarry Smith               }
177247c6ae99SBarry Smith             }
177347c6ae99SBarry Smith           }
177447c6ae99SBarry Smith           ierr = MatSetValuesBlockedLocal(J,1,&slot,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
177547c6ae99SBarry Smith         }
177647c6ae99SBarry Smith       }
177747c6ae99SBarry Smith     }
177847c6ae99SBarry Smith     ierr = PetscFree(values);CHKERRQ(ierr);
177947c6ae99SBarry Smith     ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
178047c6ae99SBarry Smith     ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1781189e4007SBarry Smith     ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr);
178247c6ae99SBarry Smith   }
178347c6ae99SBarry Smith   ierr = PetscFree(cols);CHKERRQ(ierr);
178447c6ae99SBarry Smith   PetscFunctionReturn(0);
178547c6ae99SBarry Smith }
178647c6ae99SBarry Smith 
178747c6ae99SBarry Smith /*
178847c6ae99SBarry Smith   This helper is for SBAIJ preallocation, to discard the lower-triangular values which are difficult to
178947c6ae99SBarry Smith   identify in the local ordering with periodic domain.
179047c6ae99SBarry Smith */
179147c6ae99SBarry Smith static PetscErrorCode L2GFilterUpperTriangular(ISLocalToGlobalMapping ltog,PetscInt *row,PetscInt *cnt,PetscInt col[])
179247c6ae99SBarry Smith {
179347c6ae99SBarry Smith   PetscErrorCode ierr;
179447c6ae99SBarry Smith   PetscInt       i,n;
179547c6ae99SBarry Smith 
179647c6ae99SBarry Smith   PetscFunctionBegin;
1797d6e23781SBarry Smith   ierr = ISLocalToGlobalMappingApplyBlock(ltog,1,row,row);CHKERRQ(ierr);
1798d6e23781SBarry Smith   ierr = ISLocalToGlobalMappingApplyBlock(ltog,*cnt,col,col);CHKERRQ(ierr);
179947c6ae99SBarry Smith   for (i=0,n=0; i<*cnt; i++) {
180047c6ae99SBarry Smith     if (col[i] >= *row) col[n++] = col[i];
180147c6ae99SBarry Smith   }
180247c6ae99SBarry Smith   *cnt = n;
180347c6ae99SBarry Smith   PetscFunctionReturn(0);
180447c6ae99SBarry Smith }
180547c6ae99SBarry Smith 
1806950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_2d_MPISBAIJ(DM da,Mat J)
180747c6ae99SBarry Smith {
180847c6ae99SBarry Smith   PetscErrorCode         ierr;
180947c6ae99SBarry Smith   PetscInt               xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny;
181047c6ae99SBarry Smith   PetscInt               m,n,dim,s,*cols,nc,col,cnt,*dnz,*onz;
181147c6ae99SBarry Smith   PetscInt               istart,iend,jstart,jend,ii,jj;
181247c6ae99SBarry Smith   MPI_Comm               comm;
181347c6ae99SBarry Smith   PetscScalar            *values;
1814bff4a2f0SMatthew G. Knepley   DMBoundaryType         bx,by;
1815aa219208SBarry Smith   DMDAStencilType        st;
181645b6f7e9SBarry Smith   ISLocalToGlobalMapping ltog;
181747c6ae99SBarry Smith 
181847c6ae99SBarry Smith   PetscFunctionBegin;
181947c6ae99SBarry Smith   /*
182047c6ae99SBarry Smith      nc - number of components per grid point
182147c6ae99SBarry Smith      col - number of colors needed in one direction for single component problem
182247c6ae99SBarry Smith   */
18231321219cSEthan Coon   ierr = DMDAGetInfo(da,&dim,&m,&n,0,0,0,0,&nc,&s,&bx,&by,0,&st);CHKERRQ(ierr);
182447c6ae99SBarry Smith   col  = 2*s + 1;
182547c6ae99SBarry Smith 
1826aa219208SBarry Smith   ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr);
1827aa219208SBarry Smith   ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr);
182847c6ae99SBarry Smith   ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr);
182947c6ae99SBarry Smith 
1830785e854fSJed Brown   ierr = PetscMalloc1(col*col*nc*nc,&cols);CHKERRQ(ierr);
183147c6ae99SBarry Smith 
18321411c6eeSJed Brown   ierr = DMGetLocalToGlobalMapping(da,&ltog);CHKERRQ(ierr);
183347c6ae99SBarry Smith 
183447c6ae99SBarry Smith   /* determine the matrix preallocation information */
1835eabe889fSLisandro Dalcin   ierr = MatPreallocateInitialize(comm,nx*ny,nx*ny,dnz,onz);CHKERRQ(ierr);
183647c6ae99SBarry Smith   for (i=xs; i<xs+nx; i++) {
1837bff4a2f0SMatthew G. Knepley     istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
1838bff4a2f0SMatthew G. Knepley     iend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
183947c6ae99SBarry Smith     for (j=ys; j<ys+ny; j++) {
1840bff4a2f0SMatthew G. Knepley       jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
1841bff4a2f0SMatthew G. Knepley       jend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
184247c6ae99SBarry Smith       slot   = i - gxs + gnx*(j - gys);
184347c6ae99SBarry Smith 
184447c6ae99SBarry Smith       /* Find block columns in block row */
184547c6ae99SBarry Smith       cnt = 0;
184647c6ae99SBarry Smith       for (ii=istart; ii<iend+1; ii++) {
184747c6ae99SBarry Smith         for (jj=jstart; jj<jend+1; jj++) {
1848aa219208SBarry Smith           if (st == DMDA_STENCIL_BOX || !ii || !jj) {
184947c6ae99SBarry Smith             cols[cnt++] = slot + ii + gnx*jj;
185047c6ae99SBarry Smith           }
185147c6ae99SBarry Smith         }
185247c6ae99SBarry Smith       }
185345b6f7e9SBarry Smith       ierr = L2GFilterUpperTriangular(ltog,&slot,&cnt,cols);CHKERRQ(ierr);
1854d6e23781SBarry Smith       ierr = MatPreallocateSymmetricSetBlock(slot,cnt,cols,dnz,onz);CHKERRQ(ierr);
185547c6ae99SBarry Smith     }
185647c6ae99SBarry Smith   }
185747c6ae99SBarry Smith   ierr = MatSeqSBAIJSetPreallocation(J,nc,0,dnz);CHKERRQ(ierr);
185847c6ae99SBarry Smith   ierr = MatMPISBAIJSetPreallocation(J,nc,0,dnz,0,onz);CHKERRQ(ierr);
185947c6ae99SBarry Smith   ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr);
186047c6ae99SBarry Smith 
1861784ac674SJed Brown   ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr);
186247c6ae99SBarry Smith 
186347c6ae99SBarry Smith   /*
186447c6ae99SBarry Smith     For each node in the grid: we get the neighbors in the local (on processor ordering
186547c6ae99SBarry Smith     that includes the ghost points) then MatSetValuesLocal() maps those indices to the global
186647c6ae99SBarry Smith     PETSc ordering.
186747c6ae99SBarry Smith   */
1868fcfd50ebSBarry Smith   if (!da->prealloc_only) {
18691795a4d1SJed Brown     ierr = PetscCalloc1(col*col*nc*nc,&values);CHKERRQ(ierr);
187047c6ae99SBarry Smith     for (i=xs; i<xs+nx; i++) {
1871bff4a2f0SMatthew G. Knepley       istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
1872bff4a2f0SMatthew G. Knepley       iend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
187347c6ae99SBarry Smith       for (j=ys; j<ys+ny; j++) {
1874bff4a2f0SMatthew G. Knepley         jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
1875bff4a2f0SMatthew G. Knepley         jend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
187647c6ae99SBarry Smith         slot   = i - gxs + gnx*(j - gys);
187747c6ae99SBarry Smith 
187847c6ae99SBarry Smith         /* Find block columns in block row */
187947c6ae99SBarry Smith         cnt = 0;
188047c6ae99SBarry Smith         for (ii=istart; ii<iend+1; ii++) {
188147c6ae99SBarry Smith           for (jj=jstart; jj<jend+1; jj++) {
1882aa219208SBarry Smith             if (st == DMDA_STENCIL_BOX || !ii || !jj) {
188347c6ae99SBarry Smith               cols[cnt++] = slot + ii + gnx*jj;
188447c6ae99SBarry Smith             }
188547c6ae99SBarry Smith           }
188647c6ae99SBarry Smith         }
188745b6f7e9SBarry Smith         ierr = L2GFilterUpperTriangular(ltog,&slot,&cnt,cols);CHKERRQ(ierr);
188847c6ae99SBarry Smith         ierr = MatSetValuesBlocked(J,1,&slot,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
188947c6ae99SBarry Smith       }
189047c6ae99SBarry Smith     }
189147c6ae99SBarry Smith     ierr = PetscFree(values);CHKERRQ(ierr);
189247c6ae99SBarry Smith     ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
189347c6ae99SBarry Smith     ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1894189e4007SBarry Smith     ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr);
189547c6ae99SBarry Smith   }
189647c6ae99SBarry Smith   ierr = PetscFree(cols);CHKERRQ(ierr);
189747c6ae99SBarry Smith   PetscFunctionReturn(0);
189847c6ae99SBarry Smith }
189947c6ae99SBarry Smith 
1900950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_3d_MPISBAIJ(DM da,Mat J)
190147c6ae99SBarry Smith {
190247c6ae99SBarry Smith   PetscErrorCode         ierr;
190347c6ae99SBarry Smith   PetscInt               xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny;
190447c6ae99SBarry Smith   PetscInt               m,n,dim,s,*cols,k,nc,col,cnt,p,*dnz,*onz;
190547c6ae99SBarry Smith   PetscInt               istart,iend,jstart,jend,kstart,kend,zs,nz,gzs,gnz,ii,jj,kk;
190647c6ae99SBarry Smith   MPI_Comm               comm;
190747c6ae99SBarry Smith   PetscScalar            *values;
1908bff4a2f0SMatthew G. Knepley   DMBoundaryType         bx,by,bz;
1909aa219208SBarry Smith   DMDAStencilType        st;
191045b6f7e9SBarry Smith   ISLocalToGlobalMapping ltog;
191147c6ae99SBarry Smith 
191247c6ae99SBarry Smith   PetscFunctionBegin;
191347c6ae99SBarry Smith   /*
191447c6ae99SBarry Smith      nc - number of components per grid point
191547c6ae99SBarry Smith      col - number of colors needed in one direction for single component problem
191647c6ae99SBarry Smith   */
19171321219cSEthan Coon   ierr = DMDAGetInfo(da,&dim,&m,&n,&p,0,0,0,&nc,&s,&bx,&by,&bz,&st);CHKERRQ(ierr);
191847c6ae99SBarry Smith   col  = 2*s + 1;
191947c6ae99SBarry Smith 
1920aa219208SBarry Smith   ierr = DMDAGetCorners(da,&xs,&ys,&zs,&nx,&ny,&nz);CHKERRQ(ierr);
1921aa219208SBarry Smith   ierr = DMDAGetGhostCorners(da,&gxs,&gys,&gzs,&gnx,&gny,&gnz);CHKERRQ(ierr);
192247c6ae99SBarry Smith   ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr);
192347c6ae99SBarry Smith 
192447c6ae99SBarry Smith   /* create the matrix */
1925785e854fSJed Brown   ierr = PetscMalloc1(col*col*col,&cols);CHKERRQ(ierr);
192647c6ae99SBarry Smith 
19271411c6eeSJed Brown   ierr = DMGetLocalToGlobalMapping(da,&ltog);CHKERRQ(ierr);
192847c6ae99SBarry Smith 
192947c6ae99SBarry Smith   /* determine the matrix preallocation information */
1930eabe889fSLisandro Dalcin   ierr = MatPreallocateInitialize(comm,nx*ny*nz,nx*ny*nz,dnz,onz);CHKERRQ(ierr);
193147c6ae99SBarry Smith   for (i=xs; i<xs+nx; i++) {
1932bff4a2f0SMatthew G. Knepley     istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
1933bff4a2f0SMatthew G. Knepley     iend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
193447c6ae99SBarry Smith     for (j=ys; j<ys+ny; j++) {
1935bff4a2f0SMatthew G. Knepley       jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
1936bff4a2f0SMatthew G. Knepley       jend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
193747c6ae99SBarry Smith       for (k=zs; k<zs+nz; k++) {
1938bff4a2f0SMatthew G. Knepley         kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k));
1939bff4a2f0SMatthew G. Knepley         kend   = (bz == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,p-k-1));
194047c6ae99SBarry Smith 
194147c6ae99SBarry Smith         slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs);
194247c6ae99SBarry Smith 
194347c6ae99SBarry Smith         /* Find block columns in block row */
194447c6ae99SBarry Smith         cnt = 0;
194547c6ae99SBarry Smith         for (ii=istart; ii<iend+1; ii++) {
194647c6ae99SBarry Smith           for (jj=jstart; jj<jend+1; jj++) {
194747c6ae99SBarry Smith             for (kk=kstart; kk<kend+1; kk++) {
1948aa219208SBarry Smith               if ((st == DMDA_STENCIL_BOX) || (!ii && !jj) || (!jj && !kk) || (!ii && !kk)) {
194947c6ae99SBarry Smith                 cols[cnt++] = slot + ii + gnx*jj + gnx*gny*kk;
195047c6ae99SBarry Smith               }
195147c6ae99SBarry Smith             }
195247c6ae99SBarry Smith           }
195347c6ae99SBarry Smith         }
195445b6f7e9SBarry Smith         ierr = L2GFilterUpperTriangular(ltog,&slot,&cnt,cols);CHKERRQ(ierr);
1955d6e23781SBarry Smith         ierr = MatPreallocateSymmetricSetBlock(slot,cnt,cols,dnz,onz);CHKERRQ(ierr);
195647c6ae99SBarry Smith       }
195747c6ae99SBarry Smith     }
195847c6ae99SBarry Smith   }
195947c6ae99SBarry Smith   ierr = MatSeqSBAIJSetPreallocation(J,nc,0,dnz);CHKERRQ(ierr);
196047c6ae99SBarry Smith   ierr = MatMPISBAIJSetPreallocation(J,nc,0,dnz,0,onz);CHKERRQ(ierr);
196147c6ae99SBarry Smith   ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr);
196247c6ae99SBarry Smith 
1963784ac674SJed Brown   ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr);
196447c6ae99SBarry Smith 
196547c6ae99SBarry Smith   /*
196647c6ae99SBarry Smith     For each node in the grid: we get the neighbors in the local (on processor ordering
196747c6ae99SBarry Smith     that includes the ghost points) then MatSetValuesLocal() maps those indices to the global
196847c6ae99SBarry Smith     PETSc ordering.
196947c6ae99SBarry Smith   */
1970fcfd50ebSBarry Smith   if (!da->prealloc_only) {
19711795a4d1SJed Brown     ierr = PetscCalloc1(col*col*col*nc*nc,&values);CHKERRQ(ierr);
197247c6ae99SBarry Smith     for (i=xs; i<xs+nx; i++) {
1973bff4a2f0SMatthew G. Knepley       istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
1974bff4a2f0SMatthew G. Knepley       iend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
197547c6ae99SBarry Smith       for (j=ys; j<ys+ny; j++) {
1976bff4a2f0SMatthew G. Knepley         jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
1977bff4a2f0SMatthew G. Knepley         jend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
197847c6ae99SBarry Smith         for (k=zs; k<zs+nz; k++) {
1979bff4a2f0SMatthew G. Knepley           kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k));
1980bff4a2f0SMatthew G. Knepley           kend   = (bz == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,p-k-1));
198147c6ae99SBarry Smith 
198247c6ae99SBarry Smith           slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs);
198347c6ae99SBarry Smith 
198447c6ae99SBarry Smith           cnt = 0;
198547c6ae99SBarry Smith           for (ii=istart; ii<iend+1; ii++) {
198647c6ae99SBarry Smith             for (jj=jstart; jj<jend+1; jj++) {
198747c6ae99SBarry Smith               for (kk=kstart; kk<kend+1; kk++) {
1988aa219208SBarry Smith                 if ((st == DMDA_STENCIL_BOX) || (!ii && !jj) || (!jj && !kk) || (!ii && !kk)) {
198947c6ae99SBarry Smith                   cols[cnt++] = slot + ii + gnx*jj + gnx*gny*kk;
199047c6ae99SBarry Smith                 }
199147c6ae99SBarry Smith               }
199247c6ae99SBarry Smith             }
199347c6ae99SBarry Smith           }
199445b6f7e9SBarry Smith           ierr = L2GFilterUpperTriangular(ltog,&slot,&cnt,cols);CHKERRQ(ierr);
199547c6ae99SBarry Smith           ierr = MatSetValuesBlocked(J,1,&slot,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
199647c6ae99SBarry Smith         }
199747c6ae99SBarry Smith       }
199847c6ae99SBarry Smith     }
199947c6ae99SBarry Smith     ierr = PetscFree(values);CHKERRQ(ierr);
200047c6ae99SBarry Smith     ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
200147c6ae99SBarry Smith     ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2002189e4007SBarry Smith     ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr);
200347c6ae99SBarry Smith   }
200447c6ae99SBarry Smith   ierr = PetscFree(cols);CHKERRQ(ierr);
200547c6ae99SBarry Smith   PetscFunctionReturn(0);
200647c6ae99SBarry Smith }
200747c6ae99SBarry Smith 
200847c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/
200947c6ae99SBarry Smith 
/*
   DMCreateMatrix_DA_3d_MPIAIJ_Fill - Sets up the nonzero structure of the AIJ matrix J for a
   3d DMDA when per-component fill patterns (dd->dfill, dd->ofill) are in use.

   Parameters:
     da - the DMDA; its grid sizes, stencil, boundary types and the dfill/ofill arrays stored
          in its DM_DA data are read
     J  - the matrix that is preallocated and, unless da->prealloc_only is set, filled with
          the contents of a calloc'ed value buffer and assembled

   Every PETSc call is checked with CHKERRQ; the normal exit is PetscFunctionReturn(0).

   Notes:
     One matrix row is produced per (grid point, component l).
     For a fill array f, the entries f[f[l]] .. f[f[l+1]-1] are the component offsets coupled
     to component l. ofill is applied to neighbouring grid points, dfill to the grid point
     itself. dfill may be NULL, in which case all nc components of the point are coupled.
     ofill is dereferenced without a NULL check.
     The column enumeration is written out twice (counting pass and insertion pass); the two
     copies have to stay identical.
*/
2010950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_3d_MPIAIJ_Fill(DM da,Mat J)
201147c6ae99SBarry Smith {
201247c6ae99SBarry Smith   PetscErrorCode         ierr;
201347c6ae99SBarry Smith   PetscInt               xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny;
2014c0ab637bSBarry Smith   PetscInt               m,n,dim,s,*cols,k,nc,row,col,cnt, maxcnt = 0,l,p,*dnz,*onz;
2015c1154cd5SBarry Smith   PetscInt               istart,iend,jstart,jend,kstart,kend,zs,nz,gzs,gnz,ii,jj,kk,M,N,P;
201647c6ae99SBarry Smith   DM_DA                  *dd = (DM_DA*)da->data;
201747c6ae99SBarry Smith   PetscInt               ifill_col,*dfill = dd->dfill,*ofill = dd->ofill;
201847c6ae99SBarry Smith   MPI_Comm               comm;
201947c6ae99SBarry Smith   PetscScalar            *values;
2020bff4a2f0SMatthew G. Knepley   DMBoundaryType         bx,by,bz;
202145b6f7e9SBarry Smith   ISLocalToGlobalMapping ltog;
2022aa219208SBarry Smith   DMDAStencilType        st;
2023c1154cd5SBarry Smith   PetscBool              removedups = PETSC_FALSE;
202447c6ae99SBarry Smith 
202547c6ae99SBarry Smith   PetscFunctionBegin;
202647c6ae99SBarry Smith   /*
202747c6ae99SBarry Smith          nc - number of components per grid point
202847c6ae99SBarry Smith          col - number of colors needed in one direction for single component problem
202947c6ae99SBarry Smith 
203047c6ae99SBarry Smith   */
  /* m,n,p are the grid point counts in X,Y,Z (see the error messages below); s is the stencil width.
     M,N,P are presumably the process counts per direction, judging by the "one processor" comment
     further down - confirm against DMDAGetInfo(). */
2031c1154cd5SBarry Smith   ierr = DMDAGetInfo(da,&dim,&m,&n,&p,&M,&N,&P,&nc,&s,&bx,&by,&bz,&st);CHKERRQ(ierr);
  /* col is also the number of stencil offsets (-s..s) visited per direction in the loops below */
203247c6ae99SBarry Smith   col  = 2*s + 1;
  /* refuse periodic directions whose point count is not a multiple of col */
2033bff4a2f0SMatthew G. Knepley   if (bx == DM_BOUNDARY_PERIODIC && (m % col)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in X is divisible\n\
203447c6ae99SBarry Smith                  by 2*stencil_width + 1\n");
2035bff4a2f0SMatthew G. Knepley   if (by == DM_BOUNDARY_PERIODIC && (n % col)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Y is divisible\n\
203647c6ae99SBarry Smith                  by 2*stencil_width + 1\n");
2037bff4a2f0SMatthew G. Knepley   if (bz == DM_BOUNDARY_PERIODIC && (p % col)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Z is divisible\n\
203847c6ae99SBarry Smith                  by 2*stencil_width + 1\n");
203947c6ae99SBarry Smith 
2040c1154cd5SBarry Smith   /*
2041c1154cd5SBarry Smith        With one processor in periodic domains in a skinny dimension the code will label nonzero columns multiple times
2042c1154cd5SBarry Smith        because of "wrapping" around the end of the domain hitting an entry already counted in the other direction.
2043c1154cd5SBarry Smith   */
  /* removedups only selects which preallocation-counting routine is used in the first pass */
2044c1154cd5SBarry Smith   if (M == 1 && 2*s >= m) removedups = PETSC_TRUE;
2045c1154cd5SBarry Smith   if (N == 1 && 2*s >= n) removedups = PETSC_TRUE;
2046c1154cd5SBarry Smith   if (P == 1 && 2*s >= p) removedups = PETSC_TRUE;
2047c1154cd5SBarry Smith 
  /* (xs,ys,zs)/(nx,ny,nz): start and extent of the loops over grid points below;
     (gxs,gys,gzs)/(gnx,gny,gnz): origin and extent used to compute local slot numbers */
2048aa219208SBarry Smith   ierr = DMDAGetCorners(da,&xs,&ys,&zs,&nx,&ny,&nz);CHKERRQ(ierr);
2049aa219208SBarry Smith   ierr = DMDAGetGhostCorners(da,&gxs,&gys,&gzs,&gnx,&gny,&gnz);CHKERRQ(ierr);
205047c6ae99SBarry Smith   ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr);
205147c6ae99SBarry Smith 
  /* column work array for a single row: room for col^3 stencil points with nc columns each */
2052785e854fSJed Brown   ierr = PetscMalloc1(col*col*col*nc,&cols);CHKERRQ(ierr);
20531411c6eeSJed Brown   ierr = DMGetLocalToGlobalMapping(da,&ltog);CHKERRQ(ierr);
205447c6ae99SBarry Smith 
205547c6ae99SBarry Smith   /* determine the matrix preallocation information */
  /* NOTE(review): dnz and onz are not allocated anywhere else in this function; presumably
     MatPreallocateInitialize() sets them up and MatPreallocateFinalize() releases them - confirm */
205647c6ae99SBarry Smith   ierr = MatPreallocateInitialize(comm,nc*nx*ny*nz,nc*nx*ny*nz,dnz,onz);CHKERRQ(ierr);
205747c6ae99SBarry Smith 
205806ca8cadSBarry Smith   ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr);
  /* Pass 1: count the nonzeros of every row.
     In each direction the stencil offsets run over -s..s when that direction is periodic;
     otherwise they are clipped so that i+ii stays in 0..m-1 (likewise for j,n and k,p). */
205947c6ae99SBarry Smith   for (i=xs; i<xs+nx; i++) {
2060bff4a2f0SMatthew G. Knepley     istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
2061bff4a2f0SMatthew G. Knepley     iend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
206247c6ae99SBarry Smith     for (j=ys; j<ys+ny; j++) {
2063bff4a2f0SMatthew G. Knepley       jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
2064bff4a2f0SMatthew G. Knepley       jend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
206547c6ae99SBarry Smith       for (k=zs; k<zs+nz; k++) {
2066bff4a2f0SMatthew G. Knepley         kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k));
2067bff4a2f0SMatthew G. Knepley         kend   = (bz == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,p-k-1));
206847c6ae99SBarry Smith 
        /* number of grid point (i,j,k) relative to the ghost corner: x varies fastest, then y, then z */
206947c6ae99SBarry Smith         slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs);
207047c6ae99SBarry Smith 
        /* one matrix row per component l of this grid point */
207147c6ae99SBarry Smith         for (l=0; l<nc; l++) {
207247c6ae99SBarry Smith           cnt = 0;
207347c6ae99SBarry Smith           for (ii=istart; ii<iend+1; ii++) {
207447c6ae99SBarry Smith             for (jj=jstart; jj<jend+1; jj++) {
207547c6ae99SBarry Smith               for (kk=kstart; kk<kend+1; kk++) {
                /* nonzero offset: a neighbouring grid point, coupled through the ofill pattern of row l;
                   unless the stencil is a box, only offsets with at least two zero components are kept */
207647c6ae99SBarry Smith                 if (ii || jj || kk) {
2077aa219208SBarry Smith                   if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/
20788865f1eaSKarl Rupp                     for (ifill_col=ofill[l]; ifill_col<ofill[l+1]; ifill_col++) cols[cnt++] = ofill[ifill_col] + nc*(slot + ii + gnx*jj + gnx*gny*kk);
207947c6ae99SBarry Smith                   }
208047c6ae99SBarry Smith                 } else {
                  /* zero offset: the grid point itself; use the dfill pattern of row l,
                     or all nc components when no dfill was provided */
208147c6ae99SBarry Smith                   if (dfill) {
20828865f1eaSKarl Rupp                     for (ifill_col=dfill[l]; ifill_col<dfill[l+1]; ifill_col++) cols[cnt++] = dfill[ifill_col] + nc*(slot + ii + gnx*jj + gnx*gny*kk);
208347c6ae99SBarry Smith                   } else {
20848865f1eaSKarl Rupp                     for (ifill_col=0; ifill_col<nc; ifill_col++) cols[cnt++] = ifill_col + nc*(slot + ii + gnx*jj + gnx*gny*kk);
208547c6ae99SBarry Smith                   }
208647c6ae99SBarry Smith                 }
208747c6ae99SBarry Smith               }
208847c6ae99SBarry Smith             }
208947c6ae99SBarry Smith           }
          /* local row index of component l at this grid point */
209047c6ae99SBarry Smith           row  = l + nc*(slot);
          /* remember the longest row; it sizes the values buffer of the second pass */
2091c0ab637bSBarry Smith           maxcnt = PetscMax(maxcnt,cnt);
2092c1154cd5SBarry Smith           if (removedups) {
2093c1154cd5SBarry Smith             ierr = MatPreallocateSetLocalRemoveDups(ltog,1,&row,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr);
2094c1154cd5SBarry Smith           } else {
2095784ac674SJed Brown             ierr = MatPreallocateSetLocal(ltog,1,&row,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr);
209647c6ae99SBarry Smith           }
209747c6ae99SBarry Smith         }
209847c6ae99SBarry Smith       }
209947c6ae99SBarry Smith     }
2100c1154cd5SBarry Smith   }
  /* NOTE(review): both the Seq and the MPI preallocation routine are called unconditionally;
     presumably only the one matching the actual type of J has an effect - confirm */
210147c6ae99SBarry Smith   ierr = MatSeqAIJSetPreallocation(J,0,dnz);CHKERRQ(ierr);
210247c6ae99SBarry Smith   ierr = MatMPIAIJSetPreallocation(J,0,dnz,0,onz);CHKERRQ(ierr);
210347c6ae99SBarry Smith   ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr);
2104784ac674SJed Brown   ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr);
210547c6ae99SBarry Smith 
210647c6ae99SBarry Smith   /*
210747c6ae99SBarry Smith     For each node in the grid: we get the neighbors in the local (on processor ordering
210847c6ae99SBarry Smith     that includes the ghost points) then MatSetValuesLocal() maps those indices to the global
210947c6ae99SBarry Smith     PETSc ordering.
211047c6ae99SBarry Smith   */
  /* Pass 2 (skipped when only preallocation was requested): repeat exactly the same column
     enumeration as pass 1 and insert one row at a time. */
2111fcfd50ebSBarry Smith   if (!da->prealloc_only) {
    /* values is never written in this function, so assuming PetscCalloc1() zero-fills it,
       the entries inserted below are explicit zeros */
2112c0ab637bSBarry Smith     ierr = PetscCalloc1(maxcnt,&values);CHKERRQ(ierr);
211347c6ae99SBarry Smith     for (i=xs; i<xs+nx; i++) {
2114bff4a2f0SMatthew G. Knepley       istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
2115bff4a2f0SMatthew G. Knepley       iend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
211647c6ae99SBarry Smith       for (j=ys; j<ys+ny; j++) {
2117bff4a2f0SMatthew G. Knepley         jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
2118bff4a2f0SMatthew G. Knepley         jend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
211947c6ae99SBarry Smith         for (k=zs; k<zs+nz; k++) {
2120bff4a2f0SMatthew G. Knepley           kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k));
2121bff4a2f0SMatthew G. Knepley           kend   = (bz == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,p-k-1));
212247c6ae99SBarry Smith 
212347c6ae99SBarry Smith           slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs);
212447c6ae99SBarry Smith 
212547c6ae99SBarry Smith           for (l=0; l<nc; l++) {
212647c6ae99SBarry Smith             cnt = 0;
212747c6ae99SBarry Smith             for (ii=istart; ii<iend+1; ii++) {
212847c6ae99SBarry Smith               for (jj=jstart; jj<jend+1; jj++) {
212947c6ae99SBarry Smith                 for (kk=kstart; kk<kend+1; kk++) {
                  /* same neighbour (ofill) versus own point (dfill or dense) selection as in pass 1 */
213047c6ae99SBarry Smith                   if (ii || jj || kk) {
2131aa219208SBarry Smith                     if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/
21328865f1eaSKarl Rupp                       for (ifill_col=ofill[l]; ifill_col<ofill[l+1]; ifill_col++) cols[cnt++] = ofill[ifill_col] + nc*(slot + ii + gnx*jj + gnx*gny*kk);
213347c6ae99SBarry Smith                     }
213447c6ae99SBarry Smith                   } else {
213547c6ae99SBarry Smith                     if (dfill) {
21368865f1eaSKarl Rupp                       for (ifill_col=dfill[l]; ifill_col<dfill[l+1]; ifill_col++) cols[cnt++] = dfill[ifill_col] + nc*(slot + ii + gnx*jj + gnx*gny*kk);
213747c6ae99SBarry Smith                     } else {
21388865f1eaSKarl Rupp                       for (ifill_col=0; ifill_col<nc; ifill_col++) cols[cnt++] = ifill_col + nc*(slot + ii + gnx*jj + gnx*gny*kk);
213947c6ae99SBarry Smith                     }
214047c6ae99SBarry Smith                   }
214147c6ae99SBarry Smith                 }
214247c6ae99SBarry Smith               }
214347c6ae99SBarry Smith             }
214447c6ae99SBarry Smith             row  = l + nc*(slot);
            /* cnt never exceeds maxcnt from pass 1, so values holds enough entries for this row */
214547c6ae99SBarry Smith             ierr = MatSetValuesLocal(J,1,&row,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
214647c6ae99SBarry Smith           }
214747c6ae99SBarry Smith         }
214847c6ae99SBarry Smith       }
214947c6ae99SBarry Smith     }
215047c6ae99SBarry Smith     ierr = PetscFree(values);CHKERRQ(ierr);
215147c6ae99SBarry Smith     ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
215247c6ae99SBarry Smith     ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
    /* set only after assembly; presumably turns later insertions outside this pattern into errors - confirm */
2153189e4007SBarry Smith     ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr);
215447c6ae99SBarry Smith   }
  /* cols is released on both the prealloc-only and the fully assembled path */
215547c6ae99SBarry Smith   ierr = PetscFree(cols);CHKERRQ(ierr);
215647c6ae99SBarry Smith   PetscFunctionReturn(0);
215747c6ae99SBarry Smith }
2158