147c6ae99SBarry Smith 2af0996ceSBarry Smith #include <petsc/private/dmdaimpl.h> /*I "petscdmda.h" I*/ 307475bc1SBarry Smith #include <petscmat.h> 447c6ae99SBarry Smith 5e727c939SJed Brown extern PetscErrorCode DMCreateColoring_DA_1d_MPIAIJ(DM,ISColoringType,ISColoring*); 6e727c939SJed Brown extern PetscErrorCode DMCreateColoring_DA_2d_MPIAIJ(DM,ISColoringType,ISColoring*); 7e727c939SJed Brown extern PetscErrorCode DMCreateColoring_DA_2d_5pt_MPIAIJ(DM,ISColoringType,ISColoring*); 8e727c939SJed Brown extern PetscErrorCode DMCreateColoring_DA_3d_MPIAIJ(DM,ISColoringType,ISColoring*); 947c6ae99SBarry Smith 1047c6ae99SBarry Smith /* 1147c6ae99SBarry Smith For ghost i that may be negative or greater than the upper bound this 1247c6ae99SBarry Smith maps it into the 0:m-1 range using periodicity 1347c6ae99SBarry Smith */ 1447c6ae99SBarry Smith #define SetInRange(i,m) ((i < 0) ? m+i : ((i >= m) ? i-m : i)) 1547c6ae99SBarry Smith 16ce308e1dSBarry Smith static PetscErrorCode DMDASetBlockFills_Private(const PetscInt *dfill,PetscInt w,PetscInt **rfill) 1747c6ae99SBarry Smith { 1847c6ae99SBarry Smith PetscErrorCode ierr; 1947c6ae99SBarry Smith PetscInt i,j,nz,*fill; 2047c6ae99SBarry Smith 2147c6ae99SBarry Smith PetscFunctionBegin; 2247c6ae99SBarry Smith if (!dfill) PetscFunctionReturn(0); 2347c6ae99SBarry Smith 2447c6ae99SBarry Smith /* count number nonzeros */ 2547c6ae99SBarry Smith nz = 0; 2647c6ae99SBarry Smith for (i=0; i<w; i++) { 2747c6ae99SBarry Smith for (j=0; j<w; j++) { 2847c6ae99SBarry Smith if (dfill[w*i+j]) nz++; 2947c6ae99SBarry Smith } 3047c6ae99SBarry Smith } 31854ce69bSBarry Smith ierr = PetscMalloc1(nz + w + 1,&fill);CHKERRQ(ierr); 3247c6ae99SBarry Smith /* construct modified CSR storage of nonzero structure */ 33ce308e1dSBarry Smith /* fill[0 -- w] marks starts of each row of column indices (and end of last row) 34ce308e1dSBarry Smith so fill[1] - fill[0] gives number of nonzeros in first row etc */ 3547c6ae99SBarry Smith nz = w + 1; 3647c6ae99SBarry Smith for 
(i=0; i<w; i++) { 3747c6ae99SBarry Smith fill[i] = nz; 3847c6ae99SBarry Smith for (j=0; j<w; j++) { 3947c6ae99SBarry Smith if (dfill[w*i+j]) { 4047c6ae99SBarry Smith fill[nz] = j; 4147c6ae99SBarry Smith nz++; 4247c6ae99SBarry Smith } 4347c6ae99SBarry Smith } 4447c6ae99SBarry Smith } 4547c6ae99SBarry Smith fill[w] = nz; 4647c6ae99SBarry Smith 4747c6ae99SBarry Smith *rfill = fill; 4847c6ae99SBarry Smith PetscFunctionReturn(0); 4947c6ae99SBarry Smith } 5047c6ae99SBarry Smith 5147c6ae99SBarry Smith /*@ 52aa219208SBarry Smith DMDASetBlockFills - Sets the fill pattern in each block for a multi-component problem 53950540a4SJed Brown of the matrix returned by DMCreateMatrix(). 5447c6ae99SBarry Smith 55aa219208SBarry Smith Logically Collective on DMDA 5647c6ae99SBarry Smith 5747c6ae99SBarry Smith Input Parameter: 5847c6ae99SBarry Smith + da - the distributed array 590298fd71SBarry Smith . dfill - the fill pattern in the diagonal block (may be NULL, means use dense block) 6047c6ae99SBarry Smith - ofill - the fill pattern in the off-diagonal blocks 6147c6ae99SBarry Smith 6247c6ae99SBarry Smith 6347c6ae99SBarry Smith Level: developer 6447c6ae99SBarry Smith 6547c6ae99SBarry Smith Notes: This only makes sense when you are doing multicomponent problems but using the 6647c6ae99SBarry Smith MPIAIJ matrix format 6747c6ae99SBarry Smith 6847c6ae99SBarry Smith The format for dfill and ofill is a 2 dimensional dof by dof matrix with 1 entries 6947c6ae99SBarry Smith representing coupling and 0 entries for missing coupling. For example 7047c6ae99SBarry Smith $ dfill[9] = {1, 0, 0, 7147c6ae99SBarry Smith $ 1, 1, 0, 7247c6ae99SBarry Smith $ 0, 1, 1} 7347c6ae99SBarry Smith means that row 0 is coupled with only itself in the diagonal block, row 1 is coupled with 7447c6ae99SBarry Smith itself and row 0 (in the diagonal block) and row 2 is coupled with itself and row 1 (in the 7547c6ae99SBarry Smith diagonal block). 
7647c6ae99SBarry Smith 77aa219208SBarry Smith DMDASetGetMatrix() allows you to provide general code for those more complicated nonzero patterns then 7847c6ae99SBarry Smith can be represented in the dfill, ofill format 7947c6ae99SBarry Smith 8047c6ae99SBarry Smith Contributed by Glenn Hammond 8147c6ae99SBarry Smith 828ddb5d8bSBarry Smith .seealso DMCreateMatrix(), DMDASetGetMatrix(), DMSetMatrixPreallocateOnly() 8347c6ae99SBarry Smith 8447c6ae99SBarry Smith @*/ 85ce308e1dSBarry Smith PetscErrorCode DMDASetBlockFills(DM da,const PetscInt *dfill,const PetscInt *ofill) 8647c6ae99SBarry Smith { 8747c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 8847c6ae99SBarry Smith PetscErrorCode ierr; 89ae4f298aSBarry Smith PetscInt i,k,cnt = 1; 9047c6ae99SBarry Smith 9147c6ae99SBarry Smith PetscFunctionBegin; 92aa219208SBarry Smith ierr = DMDASetBlockFills_Private(dfill,dd->w,&dd->dfill);CHKERRQ(ierr); 93aa219208SBarry Smith ierr = DMDASetBlockFills_Private(ofill,dd->w,&dd->ofill);CHKERRQ(ierr); 94ae4f298aSBarry Smith 95ae4f298aSBarry Smith /* ofillcount tracks the columns of ofill that have any nonzero in thems; the value in each location is the number of 96ae4f298aSBarry Smith columns to the left with any nonzeros in them plus 1 */ 971795a4d1SJed Brown ierr = PetscCalloc1(dd->w,&dd->ofillcols);CHKERRQ(ierr); 98ae4f298aSBarry Smith for (i=0; i<dd->w; i++) { 99ae4f298aSBarry Smith for (k=dd->ofill[i]; k<dd->ofill[i+1]; k++) dd->ofillcols[dd->ofill[k]] = 1; 100ae4f298aSBarry Smith } 101ae4f298aSBarry Smith for (i=0; i<dd->w; i++) { 102ae4f298aSBarry Smith if (dd->ofillcols[i]) { 103ae4f298aSBarry Smith dd->ofillcols[i] = cnt++; 104ae4f298aSBarry Smith } 105ae4f298aSBarry Smith } 10647c6ae99SBarry Smith PetscFunctionReturn(0); 10747c6ae99SBarry Smith } 10847c6ae99SBarry Smith 10947c6ae99SBarry Smith 110b412c318SBarry Smith PetscErrorCode DMCreateColoring_DA(DM da,ISColoringType ctype,ISColoring *coloring) 11147c6ae99SBarry Smith { 11247c6ae99SBarry Smith PetscErrorCode ierr; 
11347c6ae99SBarry Smith PetscInt dim,m,n,p,nc; 114bff4a2f0SMatthew G. Knepley DMBoundaryType bx,by,bz; 11547c6ae99SBarry Smith MPI_Comm comm; 11647c6ae99SBarry Smith PetscMPIInt size; 11747c6ae99SBarry Smith PetscBool isBAIJ; 11847c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 11947c6ae99SBarry Smith 12047c6ae99SBarry Smith PetscFunctionBegin; 12147c6ae99SBarry Smith /* 12247c6ae99SBarry Smith m 12347c6ae99SBarry Smith ------------------------------------------------------ 12447c6ae99SBarry Smith | | 12547c6ae99SBarry Smith | | 12647c6ae99SBarry Smith | ---------------------- | 12747c6ae99SBarry Smith | | | | 12847c6ae99SBarry Smith n | yn | | | 12947c6ae99SBarry Smith | | | | 13047c6ae99SBarry Smith | .--------------------- | 13147c6ae99SBarry Smith | (xs,ys) xn | 13247c6ae99SBarry Smith | . | 13347c6ae99SBarry Smith | (gxs,gys) | 13447c6ae99SBarry Smith | | 13547c6ae99SBarry Smith ----------------------------------------------------- 13647c6ae99SBarry Smith */ 13747c6ae99SBarry Smith 13847c6ae99SBarry Smith /* 13947c6ae99SBarry Smith nc - number of components per grid point 14047c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 14147c6ae99SBarry Smith 14247c6ae99SBarry Smith */ 1431321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,0,0,0,&m,&n,&p,&nc,0,&bx,&by,&bz,0);CHKERRQ(ierr); 14447c6ae99SBarry Smith 14547c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 14647c6ae99SBarry Smith ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 1475bdb020cSBarry Smith if (ctype == IS_COLORING_LOCAL) { 14847c6ae99SBarry Smith if (size == 1) { 14947c6ae99SBarry Smith ctype = IS_COLORING_GLOBAL; 15047c6ae99SBarry Smith } else if (dim > 1) { 151bff4a2f0SMatthew G. 
Knepley if ((m==1 && bx == DM_BOUNDARY_PERIODIC) || (n==1 && by == DM_BOUNDARY_PERIODIC) || (p==1 && bz == DM_BOUNDARY_PERIODIC)) { 1525bdb020cSBarry Smith SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"IS_COLORING_LOCAL cannot be used for periodic boundary condition having both ends of the domain on the same process"); 15347c6ae99SBarry Smith } 15447c6ae99SBarry Smith } 15547c6ae99SBarry Smith } 15647c6ae99SBarry Smith 157aa219208SBarry Smith /* Tell the DMDA it has 1 degree of freedom per grid point so that the coloring for BAIJ 15847c6ae99SBarry Smith matrices is for the blocks, not the individual matrix elements */ 159b412c318SBarry Smith ierr = PetscStrcmp(da->mattype,MATBAIJ,&isBAIJ);CHKERRQ(ierr); 160b412c318SBarry Smith if (!isBAIJ) {ierr = PetscStrcmp(da->mattype,MATMPIBAIJ,&isBAIJ);CHKERRQ(ierr);} 161b412c318SBarry Smith if (!isBAIJ) {ierr = PetscStrcmp(da->mattype,MATSEQBAIJ,&isBAIJ);CHKERRQ(ierr);} 16247c6ae99SBarry Smith if (isBAIJ) { 16347c6ae99SBarry Smith dd->w = 1; 16447c6ae99SBarry Smith dd->xs = dd->xs/nc; 16547c6ae99SBarry Smith dd->xe = dd->xe/nc; 16647c6ae99SBarry Smith dd->Xs = dd->Xs/nc; 16747c6ae99SBarry Smith dd->Xe = dd->Xe/nc; 16847c6ae99SBarry Smith } 16947c6ae99SBarry Smith 17047c6ae99SBarry Smith /* 171aa219208SBarry Smith We do not provide a getcoloring function in the DMDA operations because 172aa219208SBarry Smith the basic DMDA does not know about matrices. We think of DMDA as being more 17347c6ae99SBarry Smith more low-level then matrices. 
17447c6ae99SBarry Smith */ 17547c6ae99SBarry Smith if (dim == 1) { 176e727c939SJed Brown ierr = DMCreateColoring_DA_1d_MPIAIJ(da,ctype,coloring);CHKERRQ(ierr); 17747c6ae99SBarry Smith } else if (dim == 2) { 178e727c939SJed Brown ierr = DMCreateColoring_DA_2d_MPIAIJ(da,ctype,coloring);CHKERRQ(ierr); 17947c6ae99SBarry Smith } else if (dim == 3) { 180e727c939SJed Brown ierr = DMCreateColoring_DA_3d_MPIAIJ(da,ctype,coloring);CHKERRQ(ierr); 181ce94432eSBarry Smith } else SETERRQ1(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"Not done for %D dimension, send us mail petsc-maint@mcs.anl.gov for code",dim); 18247c6ae99SBarry Smith if (isBAIJ) { 18347c6ae99SBarry Smith dd->w = nc; 18447c6ae99SBarry Smith dd->xs = dd->xs*nc; 18547c6ae99SBarry Smith dd->xe = dd->xe*nc; 18647c6ae99SBarry Smith dd->Xs = dd->Xs*nc; 18747c6ae99SBarry Smith dd->Xe = dd->Xe*nc; 18847c6ae99SBarry Smith } 18947c6ae99SBarry Smith PetscFunctionReturn(0); 19047c6ae99SBarry Smith } 19147c6ae99SBarry Smith 19247c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/ 19347c6ae99SBarry Smith 194e727c939SJed Brown PetscErrorCode DMCreateColoring_DA_2d_MPIAIJ(DM da,ISColoringType ctype,ISColoring *coloring) 19547c6ae99SBarry Smith { 19647c6ae99SBarry Smith PetscErrorCode ierr; 19747c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,ii,gxs,gys,gnx,gny,m,n,M,N,dim,s,k,nc,col; 19847c6ae99SBarry Smith PetscInt ncolors; 19947c6ae99SBarry Smith MPI_Comm comm; 200bff4a2f0SMatthew G. 
Knepley DMBoundaryType bx,by; 201aa219208SBarry Smith DMDAStencilType st; 20247c6ae99SBarry Smith ISColoringValue *colors; 20347c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 20447c6ae99SBarry Smith 20547c6ae99SBarry Smith PetscFunctionBegin; 20647c6ae99SBarry Smith /* 20747c6ae99SBarry Smith nc - number of components per grid point 20847c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 20947c6ae99SBarry Smith 21047c6ae99SBarry Smith */ 2111321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,0,&M,&N,0,&nc,&s,&bx,&by,0,&st);CHKERRQ(ierr); 21247c6ae99SBarry Smith col = 2*s + 1; 213aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr); 214aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr); 21547c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 21647c6ae99SBarry Smith 21747c6ae99SBarry Smith /* special case as taught to us by Paul Hovland */ 218aa219208SBarry Smith if (st == DMDA_STENCIL_STAR && s == 1) { 219e727c939SJed Brown ierr = DMCreateColoring_DA_2d_5pt_MPIAIJ(da,ctype,coloring);CHKERRQ(ierr); 22047c6ae99SBarry Smith } else { 22147c6ae99SBarry Smith 222bff4a2f0SMatthew G. Knepley if (bx == DM_BOUNDARY_PERIODIC && (m % col)) SETERRQ2(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in X (%d) is divisible\n\ 22347c6ae99SBarry Smith by 2*stencil_width + 1 (%d)\n", m, col); 224bff4a2f0SMatthew G. 
Knepley if (by == DM_BOUNDARY_PERIODIC && (n % col)) SETERRQ2(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Y (%d) is divisible\n\ 22547c6ae99SBarry Smith by 2*stencil_width + 1 (%d)\n", n, col); 22647c6ae99SBarry Smith if (ctype == IS_COLORING_GLOBAL) { 22747c6ae99SBarry Smith if (!dd->localcoloring) { 228785e854fSJed Brown ierr = PetscMalloc1(nc*nx*ny,&colors);CHKERRQ(ierr); 22947c6ae99SBarry Smith ii = 0; 23047c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 23147c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 23247c6ae99SBarry Smith for (k=0; k<nc; k++) { 23347c6ae99SBarry Smith colors[ii++] = k + nc*((i % col) + col*(j % col)); 23447c6ae99SBarry Smith } 23547c6ae99SBarry Smith } 23647c6ae99SBarry Smith } 23747c6ae99SBarry Smith ncolors = nc + nc*(col-1 + col*(col-1)); 238aaf3ff59SMatthew G. Knepley ierr = ISColoringCreate(comm,ncolors,nc*nx*ny,colors,PETSC_OWN_POINTER,&dd->localcoloring);CHKERRQ(ierr); 23947c6ae99SBarry Smith } 24047c6ae99SBarry Smith *coloring = dd->localcoloring; 2415bdb020cSBarry Smith } else if (ctype == IS_COLORING_LOCAL) { 24247c6ae99SBarry Smith if (!dd->ghostedcoloring) { 243785e854fSJed Brown ierr = PetscMalloc1(nc*gnx*gny,&colors);CHKERRQ(ierr); 24447c6ae99SBarry Smith ii = 0; 24547c6ae99SBarry Smith for (j=gys; j<gys+gny; j++) { 24647c6ae99SBarry Smith for (i=gxs; i<gxs+gnx; i++) { 24747c6ae99SBarry Smith for (k=0; k<nc; k++) { 24847c6ae99SBarry Smith /* the complicated stuff is to handle periodic boundaries */ 24947c6ae99SBarry Smith colors[ii++] = k + nc*((SetInRange(i,m) % col) + col*(SetInRange(j,n) % col)); 25047c6ae99SBarry Smith } 25147c6ae99SBarry Smith } 25247c6ae99SBarry Smith } 25347c6ae99SBarry Smith ncolors = nc + nc*(col - 1 + col*(col-1)); 254aaf3ff59SMatthew G. 
Knepley ierr = ISColoringCreate(comm,ncolors,nc*gnx*gny,colors,PETSC_OWN_POINTER,&dd->ghostedcoloring);CHKERRQ(ierr); 25547c6ae99SBarry Smith /* PetscIntView(ncolors,(PetscInt*)colors,0); */ 25647c6ae99SBarry Smith 2575bdb020cSBarry Smith ierr = ISColoringSetType(dd->ghostedcoloring,IS_COLORING_LOCAL);CHKERRQ(ierr); 25847c6ae99SBarry Smith } 25947c6ae99SBarry Smith *coloring = dd->ghostedcoloring; 260ce94432eSBarry Smith } else SETERRQ1(PetscObjectComm((PetscObject)da),PETSC_ERR_ARG_WRONG,"Unknown ISColoringType %d",(int)ctype); 26147c6ae99SBarry Smith } 26247c6ae99SBarry Smith ierr = ISColoringReference(*coloring);CHKERRQ(ierr); 26347c6ae99SBarry Smith PetscFunctionReturn(0); 26447c6ae99SBarry Smith } 26547c6ae99SBarry Smith 26647c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/ 26747c6ae99SBarry Smith 268e727c939SJed Brown PetscErrorCode DMCreateColoring_DA_3d_MPIAIJ(DM da,ISColoringType ctype,ISColoring *coloring) 26947c6ae99SBarry Smith { 27047c6ae99SBarry Smith PetscErrorCode ierr; 27147c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,gxs,gys,gnx,gny,m,n,p,dim,s,k,nc,col,zs,gzs,ii,l,nz,gnz,M,N,P; 27247c6ae99SBarry Smith PetscInt ncolors; 27347c6ae99SBarry Smith MPI_Comm comm; 274bff4a2f0SMatthew G. Knepley DMBoundaryType bx,by,bz; 275aa219208SBarry Smith DMDAStencilType st; 27647c6ae99SBarry Smith ISColoringValue *colors; 27747c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 27847c6ae99SBarry Smith 27947c6ae99SBarry Smith PetscFunctionBegin; 28047c6ae99SBarry Smith /* 28147c6ae99SBarry Smith nc - number of components per grid point 28247c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 28347c6ae99SBarry Smith 28447c6ae99SBarry Smith */ 2851321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,&p,&M,&N,&P,&nc,&s,&bx,&by,&bz,&st);CHKERRQ(ierr); 28647c6ae99SBarry Smith col = 2*s + 1; 287bff4a2f0SMatthew G. 
Knepley if (bx == DM_BOUNDARY_PERIODIC && (m % col)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in X is divisible\n\ 28847c6ae99SBarry Smith by 2*stencil_width + 1\n"); 289bff4a2f0SMatthew G. Knepley if (by == DM_BOUNDARY_PERIODIC && (n % col)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Y is divisible\n\ 29047c6ae99SBarry Smith by 2*stencil_width + 1\n"); 291bff4a2f0SMatthew G. Knepley if (bz == DM_BOUNDARY_PERIODIC && (p % col)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Z is divisible\n\ 29247c6ae99SBarry Smith by 2*stencil_width + 1\n"); 29347c6ae99SBarry Smith 294aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,&zs,&nx,&ny,&nz);CHKERRQ(ierr); 295aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,&gzs,&gnx,&gny,&gnz);CHKERRQ(ierr); 29647c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 29747c6ae99SBarry Smith 29847c6ae99SBarry Smith /* create the coloring */ 29947c6ae99SBarry Smith if (ctype == IS_COLORING_GLOBAL) { 30047c6ae99SBarry Smith if (!dd->localcoloring) { 301785e854fSJed Brown ierr = PetscMalloc1(nc*nx*ny*nz,&colors);CHKERRQ(ierr); 30247c6ae99SBarry Smith ii = 0; 30347c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 30447c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 30547c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 30647c6ae99SBarry Smith for (l=0; l<nc; l++) { 30747c6ae99SBarry Smith colors[ii++] = l + nc*((i % col) + col*(j % col) + col*col*(k % col)); 30847c6ae99SBarry Smith } 30947c6ae99SBarry Smith } 31047c6ae99SBarry Smith } 31147c6ae99SBarry Smith } 31247c6ae99SBarry Smith ncolors = nc + nc*(col-1 + col*(col-1)+ col*col*(col-1)); 313aaf3ff59SMatthew G. 
Knepley ierr = ISColoringCreate(comm,ncolors,nc*nx*ny*nz,colors,PETSC_OWN_POINTER,&dd->localcoloring);CHKERRQ(ierr); 31447c6ae99SBarry Smith } 31547c6ae99SBarry Smith *coloring = dd->localcoloring; 3165bdb020cSBarry Smith } else if (ctype == IS_COLORING_LOCAL) { 31747c6ae99SBarry Smith if (!dd->ghostedcoloring) { 318785e854fSJed Brown ierr = PetscMalloc1(nc*gnx*gny*gnz,&colors);CHKERRQ(ierr); 31947c6ae99SBarry Smith ii = 0; 32047c6ae99SBarry Smith for (k=gzs; k<gzs+gnz; k++) { 32147c6ae99SBarry Smith for (j=gys; j<gys+gny; j++) { 32247c6ae99SBarry Smith for (i=gxs; i<gxs+gnx; i++) { 32347c6ae99SBarry Smith for (l=0; l<nc; l++) { 32447c6ae99SBarry Smith /* the complicated stuff is to handle periodic boundaries */ 32547c6ae99SBarry Smith colors[ii++] = l + nc*((SetInRange(i,m) % col) + col*(SetInRange(j,n) % col) + col*col*(SetInRange(k,p) % col)); 32647c6ae99SBarry Smith } 32747c6ae99SBarry Smith } 32847c6ae99SBarry Smith } 32947c6ae99SBarry Smith } 33047c6ae99SBarry Smith ncolors = nc + nc*(col-1 + col*(col-1)+ col*col*(col-1)); 331aaf3ff59SMatthew G. 
Knepley ierr = ISColoringCreate(comm,ncolors,nc*gnx*gny*gnz,colors,PETSC_OWN_POINTER,&dd->ghostedcoloring);CHKERRQ(ierr); 3325bdb020cSBarry Smith ierr = ISColoringSetType(dd->ghostedcoloring,IS_COLORING_LOCAL);CHKERRQ(ierr); 33347c6ae99SBarry Smith } 33447c6ae99SBarry Smith *coloring = dd->ghostedcoloring; 335ce94432eSBarry Smith } else SETERRQ1(PetscObjectComm((PetscObject)da),PETSC_ERR_ARG_WRONG,"Unknown ISColoringType %d",(int)ctype); 33647c6ae99SBarry Smith ierr = ISColoringReference(*coloring);CHKERRQ(ierr); 33747c6ae99SBarry Smith PetscFunctionReturn(0); 33847c6ae99SBarry Smith } 33947c6ae99SBarry Smith 34047c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/ 34147c6ae99SBarry Smith 342e727c939SJed Brown PetscErrorCode DMCreateColoring_DA_1d_MPIAIJ(DM da,ISColoringType ctype,ISColoring *coloring) 34347c6ae99SBarry Smith { 34447c6ae99SBarry Smith PetscErrorCode ierr; 34547c6ae99SBarry Smith PetscInt xs,nx,i,i1,gxs,gnx,l,m,M,dim,s,nc,col; 34647c6ae99SBarry Smith PetscInt ncolors; 34747c6ae99SBarry Smith MPI_Comm comm; 348bff4a2f0SMatthew G. Knepley DMBoundaryType bx; 34947c6ae99SBarry Smith ISColoringValue *colors; 35047c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 35147c6ae99SBarry Smith 35247c6ae99SBarry Smith PetscFunctionBegin; 35347c6ae99SBarry Smith /* 35447c6ae99SBarry Smith nc - number of components per grid point 35547c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 35647c6ae99SBarry Smith 35747c6ae99SBarry Smith */ 3581321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,0,0,&M,0,0,&nc,&s,&bx,0,0,0);CHKERRQ(ierr); 35947c6ae99SBarry Smith col = 2*s + 1; 36047c6ae99SBarry Smith 361bff4a2f0SMatthew G. 
Knepley if (bx == DM_BOUNDARY_PERIODIC && (m % col)) SETERRQ2(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points %d is divisible\n\ 36231e6f798SBarry Smith by 2*stencil_width + 1 %d\n",(int)m,(int)col); 36347c6ae99SBarry Smith 364aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,0,0,&nx,0,0);CHKERRQ(ierr); 365aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,0,0,&gnx,0,0);CHKERRQ(ierr); 36647c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 36747c6ae99SBarry Smith 36847c6ae99SBarry Smith /* create the coloring */ 36947c6ae99SBarry Smith if (ctype == IS_COLORING_GLOBAL) { 37047c6ae99SBarry Smith if (!dd->localcoloring) { 371785e854fSJed Brown ierr = PetscMalloc1(nc*nx,&colors);CHKERRQ(ierr); 372ae4f298aSBarry Smith if (dd->ofillcols) { 373ae4f298aSBarry Smith PetscInt tc = 0; 374ae4f298aSBarry Smith for (i=0; i<nc; i++) tc += (PetscInt) (dd->ofillcols[i] > 0); 375ae4f298aSBarry Smith i1 = 0; 376ae4f298aSBarry Smith for (i=xs; i<xs+nx; i++) { 377ae4f298aSBarry Smith for (l=0; l<nc; l++) { 378ae4f298aSBarry Smith if (dd->ofillcols[l] && (i % col)) { 379ae4f298aSBarry Smith colors[i1++] = nc - 1 + tc*((i % col) - 1) + dd->ofillcols[l]; 380ae4f298aSBarry Smith } else { 381ae4f298aSBarry Smith colors[i1++] = l; 382ae4f298aSBarry Smith } 383ae4f298aSBarry Smith } 384ae4f298aSBarry Smith } 385ae4f298aSBarry Smith ncolors = nc + 2*s*tc; 386ae4f298aSBarry Smith } else { 38747c6ae99SBarry Smith i1 = 0; 38847c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 38947c6ae99SBarry Smith for (l=0; l<nc; l++) { 39047c6ae99SBarry Smith colors[i1++] = l + nc*(i % col); 39147c6ae99SBarry Smith } 39247c6ae99SBarry Smith } 39347c6ae99SBarry Smith ncolors = nc + nc*(col-1); 394ae4f298aSBarry Smith } 395aaf3ff59SMatthew G. 
Knepley ierr = ISColoringCreate(comm,ncolors,nc*nx,colors,PETSC_OWN_POINTER,&dd->localcoloring);CHKERRQ(ierr); 39647c6ae99SBarry Smith } 39747c6ae99SBarry Smith *coloring = dd->localcoloring; 3985bdb020cSBarry Smith } else if (ctype == IS_COLORING_LOCAL) { 39947c6ae99SBarry Smith if (!dd->ghostedcoloring) { 400785e854fSJed Brown ierr = PetscMalloc1(nc*gnx,&colors);CHKERRQ(ierr); 40147c6ae99SBarry Smith i1 = 0; 40247c6ae99SBarry Smith for (i=gxs; i<gxs+gnx; i++) { 40347c6ae99SBarry Smith for (l=0; l<nc; l++) { 40447c6ae99SBarry Smith /* the complicated stuff is to handle periodic boundaries */ 40547c6ae99SBarry Smith colors[i1++] = l + nc*(SetInRange(i,m) % col); 40647c6ae99SBarry Smith } 40747c6ae99SBarry Smith } 40847c6ae99SBarry Smith ncolors = nc + nc*(col-1); 409aaf3ff59SMatthew G. Knepley ierr = ISColoringCreate(comm,ncolors,nc*gnx,colors,PETSC_OWN_POINTER,&dd->ghostedcoloring);CHKERRQ(ierr); 4105bdb020cSBarry Smith ierr = ISColoringSetType(dd->ghostedcoloring,IS_COLORING_LOCAL);CHKERRQ(ierr); 41147c6ae99SBarry Smith } 41247c6ae99SBarry Smith *coloring = dd->ghostedcoloring; 413ce94432eSBarry Smith } else SETERRQ1(PetscObjectComm((PetscObject)da),PETSC_ERR_ARG_WRONG,"Unknown ISColoringType %d",(int)ctype); 41447c6ae99SBarry Smith ierr = ISColoringReference(*coloring);CHKERRQ(ierr); 41547c6ae99SBarry Smith PetscFunctionReturn(0); 41647c6ae99SBarry Smith } 41747c6ae99SBarry Smith 418e727c939SJed Brown PetscErrorCode DMCreateColoring_DA_2d_5pt_MPIAIJ(DM da,ISColoringType ctype,ISColoring *coloring) 41947c6ae99SBarry Smith { 42047c6ae99SBarry Smith PetscErrorCode ierr; 42147c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,ii,gxs,gys,gnx,gny,m,n,dim,s,k,nc; 42247c6ae99SBarry Smith PetscInt ncolors; 42347c6ae99SBarry Smith MPI_Comm comm; 424bff4a2f0SMatthew G. 
Knepley DMBoundaryType bx,by; 42547c6ae99SBarry Smith ISColoringValue *colors; 42647c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 42747c6ae99SBarry Smith 42847c6ae99SBarry Smith PetscFunctionBegin; 42947c6ae99SBarry Smith /* 43047c6ae99SBarry Smith nc - number of components per grid point 43147c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 43247c6ae99SBarry Smith 43347c6ae99SBarry Smith */ 4341321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,0,0,0,0,&nc,&s,&bx,&by,0,0);CHKERRQ(ierr); 435aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr); 436aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr); 43747c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 43847c6ae99SBarry Smith 439bff4a2f0SMatthew G. Knepley if (bx == DM_BOUNDARY_PERIODIC && (m % 5)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in X is divisible by 5\n"); 440bff4a2f0SMatthew G. Knepley if (by == DM_BOUNDARY_PERIODIC && (n % 5)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Y is divisible by 5\n"); 44147c6ae99SBarry Smith 44247c6ae99SBarry Smith /* create the coloring */ 44347c6ae99SBarry Smith if (ctype == IS_COLORING_GLOBAL) { 44447c6ae99SBarry Smith if (!dd->localcoloring) { 445785e854fSJed Brown ierr = PetscMalloc1(nc*nx*ny,&colors);CHKERRQ(ierr); 44647c6ae99SBarry Smith ii = 0; 44747c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 44847c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 44947c6ae99SBarry Smith for (k=0; k<nc; k++) { 45047c6ae99SBarry Smith colors[ii++] = k + nc*((3*j+i) % 5); 45147c6ae99SBarry Smith } 45247c6ae99SBarry Smith } 45347c6ae99SBarry Smith } 45447c6ae99SBarry Smith ncolors = 5*nc; 455aaf3ff59SMatthew G. 
Knepley ierr = ISColoringCreate(comm,ncolors,nc*nx*ny,colors,PETSC_OWN_POINTER,&dd->localcoloring);CHKERRQ(ierr); 45647c6ae99SBarry Smith } 45747c6ae99SBarry Smith *coloring = dd->localcoloring; 4585bdb020cSBarry Smith } else if (ctype == IS_COLORING_LOCAL) { 45947c6ae99SBarry Smith if (!dd->ghostedcoloring) { 460785e854fSJed Brown ierr = PetscMalloc1(nc*gnx*gny,&colors);CHKERRQ(ierr); 46147c6ae99SBarry Smith ii = 0; 46247c6ae99SBarry Smith for (j=gys; j<gys+gny; j++) { 46347c6ae99SBarry Smith for (i=gxs; i<gxs+gnx; i++) { 46447c6ae99SBarry Smith for (k=0; k<nc; k++) { 46547c6ae99SBarry Smith colors[ii++] = k + nc*((3*SetInRange(j,n) + SetInRange(i,m)) % 5); 46647c6ae99SBarry Smith } 46747c6ae99SBarry Smith } 46847c6ae99SBarry Smith } 46947c6ae99SBarry Smith ncolors = 5*nc; 470aaf3ff59SMatthew G. Knepley ierr = ISColoringCreate(comm,ncolors,nc*gnx*gny,colors,PETSC_OWN_POINTER,&dd->ghostedcoloring);CHKERRQ(ierr); 4715bdb020cSBarry Smith ierr = ISColoringSetType(dd->ghostedcoloring,IS_COLORING_LOCAL);CHKERRQ(ierr); 47247c6ae99SBarry Smith } 47347c6ae99SBarry Smith *coloring = dd->ghostedcoloring; 474ce94432eSBarry Smith } else SETERRQ1(PetscObjectComm((PetscObject)da),PETSC_ERR_ARG_WRONG,"Unknown ISColoringType %d",(int)ctype); 47547c6ae99SBarry Smith PetscFunctionReturn(0); 47647c6ae99SBarry Smith } 47747c6ae99SBarry Smith 47847c6ae99SBarry Smith /* =========================================================================== */ 479950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_1d_MPIAIJ(DM,Mat); 480ce308e1dSBarry Smith extern PetscErrorCode DMCreateMatrix_DA_1d_MPIAIJ_Fill(DM,Mat); 481950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_2d_MPIAIJ(DM,Mat); 482950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_2d_MPIAIJ_Fill(DM,Mat); 483950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_3d_MPIAIJ(DM,Mat); 484950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_3d_MPIAIJ_Fill(DM,Mat); 485950540a4SJed Brown extern PetscErrorCode 
DMCreateMatrix_DA_2d_MPIBAIJ(DM,Mat); 486950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_3d_MPIBAIJ(DM,Mat); 487950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_2d_MPISBAIJ(DM,Mat); 488950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_3d_MPISBAIJ(DM,Mat); 489d4002b98SHong Zhang extern PetscErrorCode DMCreateMatrix_DA_2d_MPISELL(DM,Mat); 490d4002b98SHong Zhang extern PetscErrorCode DMCreateMatrix_DA_3d_MPISELL(DM,Mat); 491e584696dSStefano Zampini extern PetscErrorCode DMCreateMatrix_DA_IS(DM,Mat); 49247c6ae99SBarry Smith 4938bbdbebaSMatthew G Knepley /*@C 494c688c046SMatthew G Knepley MatSetupDM - Sets the DMDA that is to be used by the HYPRE_StructMatrix PETSc matrix 49547c6ae99SBarry Smith 49647c6ae99SBarry Smith Logically Collective on Mat 49747c6ae99SBarry Smith 49847c6ae99SBarry Smith Input Parameters: 49947c6ae99SBarry Smith + mat - the matrix 50047c6ae99SBarry Smith - da - the da 50147c6ae99SBarry Smith 50247c6ae99SBarry Smith Level: intermediate 50347c6ae99SBarry Smith 50447c6ae99SBarry Smith @*/ 505c688c046SMatthew G Knepley PetscErrorCode MatSetupDM(Mat mat,DM da) 50647c6ae99SBarry Smith { 50747c6ae99SBarry Smith PetscErrorCode ierr; 50847c6ae99SBarry Smith 50947c6ae99SBarry Smith PetscFunctionBegin; 51047c6ae99SBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 51147c6ae99SBarry Smith PetscValidHeaderSpecific(da,DM_CLASSID,1); 512c688c046SMatthew G Knepley ierr = PetscTryMethod(mat,"MatSetupDM_C",(Mat,DM),(mat,da));CHKERRQ(ierr); 51347c6ae99SBarry Smith PetscFunctionReturn(0); 51447c6ae99SBarry Smith } 51547c6ae99SBarry Smith 5167087cfbeSBarry Smith PetscErrorCode MatView_MPI_DA(Mat A,PetscViewer viewer) 51747c6ae99SBarry Smith { 5189a42bb27SBarry Smith DM da; 51947c6ae99SBarry Smith PetscErrorCode ierr; 52047c6ae99SBarry Smith const char *prefix; 52147c6ae99SBarry Smith Mat Anatural; 52247c6ae99SBarry Smith AO ao; 52347c6ae99SBarry Smith PetscInt rstart,rend,*petsc,i; 52447c6ae99SBarry Smith IS is; 52547c6ae99SBarry 
Smith MPI_Comm comm; 52674388724SJed Brown PetscViewerFormat format; 52747c6ae99SBarry Smith 52847c6ae99SBarry Smith PetscFunctionBegin; 52974388724SJed Brown /* Check whether we are just printing info, in which case MatView() already viewed everything we wanted to view */ 53074388724SJed Brown ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 53174388724SJed Brown if (format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(0); 53274388724SJed Brown 53347c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)A,&comm);CHKERRQ(ierr); 534c688c046SMatthew G Knepley ierr = MatGetDM(A, &da);CHKERRQ(ierr); 535ce94432eSBarry Smith if (!da) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Matrix not generated from a DMDA"); 53647c6ae99SBarry Smith 537aa219208SBarry Smith ierr = DMDAGetAO(da,&ao);CHKERRQ(ierr); 53847c6ae99SBarry Smith ierr = MatGetOwnershipRange(A,&rstart,&rend);CHKERRQ(ierr); 539854ce69bSBarry Smith ierr = PetscMalloc1(rend-rstart,&petsc);CHKERRQ(ierr); 54047c6ae99SBarry Smith for (i=rstart; i<rend; i++) petsc[i-rstart] = i; 54147c6ae99SBarry Smith ierr = AOApplicationToPetsc(ao,rend-rstart,petsc);CHKERRQ(ierr); 54247c6ae99SBarry Smith ierr = ISCreateGeneral(comm,rend-rstart,petsc,PETSC_OWN_POINTER,&is);CHKERRQ(ierr); 54347c6ae99SBarry Smith 54447c6ae99SBarry Smith /* call viewer on natural ordering */ 5457dae84e0SHong Zhang ierr = MatCreateSubMatrix(A,is,is,MAT_INITIAL_MATRIX,&Anatural);CHKERRQ(ierr); 546fcfd50ebSBarry Smith ierr = ISDestroy(&is);CHKERRQ(ierr); 54747c6ae99SBarry Smith ierr = PetscObjectGetOptionsPrefix((PetscObject)A,&prefix);CHKERRQ(ierr); 54847c6ae99SBarry Smith ierr = PetscObjectSetOptionsPrefix((PetscObject)Anatural,prefix);CHKERRQ(ierr); 54947c6ae99SBarry Smith ierr = PetscObjectSetName((PetscObject)Anatural,((PetscObject)A)->name);CHKERRQ(ierr); 550*f0ed2f47SStefano Zampini ((PetscObject)Anatural)->donotPetscObjectPrintClassNamePrefixType = PETSC_TRUE; 
551539c167fSBarry Smith ierr = MatView(Anatural,viewer);CHKERRQ(ierr); 552*f0ed2f47SStefano Zampini ((PetscObject)Anatural)->donotPetscObjectPrintClassNamePrefixType = PETSC_FALSE; 553fcfd50ebSBarry Smith ierr = MatDestroy(&Anatural);CHKERRQ(ierr); 55447c6ae99SBarry Smith PetscFunctionReturn(0); 55547c6ae99SBarry Smith } 55647c6ae99SBarry Smith 5577087cfbeSBarry Smith PetscErrorCode MatLoad_MPI_DA(Mat A,PetscViewer viewer) 55847c6ae99SBarry Smith { 5599a42bb27SBarry Smith DM da; 56047c6ae99SBarry Smith PetscErrorCode ierr; 56147c6ae99SBarry Smith Mat Anatural,Aapp; 56247c6ae99SBarry Smith AO ao; 563539c167fSBarry Smith PetscInt rstart,rend,*app,i,m,n,M,N; 56447c6ae99SBarry Smith IS is; 56547c6ae99SBarry Smith MPI_Comm comm; 56647c6ae99SBarry Smith 56747c6ae99SBarry Smith PetscFunctionBegin; 56847c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)A,&comm);CHKERRQ(ierr); 569c688c046SMatthew G Knepley ierr = MatGetDM(A, &da);CHKERRQ(ierr); 570ce94432eSBarry Smith if (!da) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Matrix not generated from a DMDA"); 57147c6ae99SBarry Smith 57247c6ae99SBarry Smith /* Load the matrix in natural ordering */ 573ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&Anatural);CHKERRQ(ierr); 57447c6ae99SBarry Smith ierr = MatSetType(Anatural,((PetscObject)A)->type_name);CHKERRQ(ierr); 575539c167fSBarry Smith ierr = MatGetSize(A,&M,&N);CHKERRQ(ierr); 576539c167fSBarry Smith ierr = MatGetLocalSize(A,&m,&n);CHKERRQ(ierr); 577539c167fSBarry Smith ierr = MatSetSizes(Anatural,m,n,M,N);CHKERRQ(ierr); 57847c6ae99SBarry Smith ierr = MatLoad(Anatural,viewer);CHKERRQ(ierr); 57947c6ae99SBarry Smith 58047c6ae99SBarry Smith /* Map natural ordering to application ordering and create IS */ 581aa219208SBarry Smith ierr = DMDAGetAO(da,&ao);CHKERRQ(ierr); 58247c6ae99SBarry Smith ierr = MatGetOwnershipRange(Anatural,&rstart,&rend);CHKERRQ(ierr); 583854ce69bSBarry Smith ierr = 
PetscMalloc1(rend-rstart,&app);CHKERRQ(ierr); 58447c6ae99SBarry Smith for (i=rstart; i<rend; i++) app[i-rstart] = i; 58547c6ae99SBarry Smith ierr = AOPetscToApplication(ao,rend-rstart,app);CHKERRQ(ierr); 58647c6ae99SBarry Smith ierr = ISCreateGeneral(comm,rend-rstart,app,PETSC_OWN_POINTER,&is);CHKERRQ(ierr); 58747c6ae99SBarry Smith 58847c6ae99SBarry Smith /* Do permutation and replace header */ 5897dae84e0SHong Zhang ierr = MatCreateSubMatrix(Anatural,is,is,MAT_INITIAL_MATRIX,&Aapp);CHKERRQ(ierr); 59028be2f97SBarry Smith ierr = MatHeaderReplace(A,&Aapp);CHKERRQ(ierr); 591fcfd50ebSBarry Smith ierr = ISDestroy(&is);CHKERRQ(ierr); 592fcfd50ebSBarry Smith ierr = MatDestroy(&Anatural);CHKERRQ(ierr); 59347c6ae99SBarry Smith PetscFunctionReturn(0); 59447c6ae99SBarry Smith } 59547c6ae99SBarry Smith 596b412c318SBarry Smith PetscErrorCode DMCreateMatrix_DA(DM da, Mat *J) 59747c6ae99SBarry Smith { 59847c6ae99SBarry Smith PetscErrorCode ierr; 59947c6ae99SBarry Smith PetscInt dim,dof,nx,ny,nz,dims[3],starts[3],M,N,P; 60047c6ae99SBarry Smith Mat A; 60147c6ae99SBarry Smith MPI_Comm comm; 60219fd82e9SBarry Smith MatType Atype; 60337d0c07bSMatthew G Knepley PetscSection section, sectionGlobal; 604e584696dSStefano Zampini void (*aij)(void)=NULL,(*baij)(void)=NULL,(*sbaij)(void)=NULL,(*sell)(void)=NULL,(*is)(void)=NULL; 605b412c318SBarry Smith MatType mtype; 60647c6ae99SBarry Smith PetscMPIInt size; 60747c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 60847c6ae99SBarry Smith 60947c6ae99SBarry Smith PetscFunctionBegin; 610607a6623SBarry Smith ierr = MatInitializePackage();CHKERRQ(ierr); 611b412c318SBarry Smith mtype = da->mattype; 61247c6ae99SBarry Smith 61337d0c07bSMatthew G Knepley ierr = DMGetDefaultSection(da, §ion);CHKERRQ(ierr); 61437d0c07bSMatthew G Knepley if (section) { 61537d0c07bSMatthew G Knepley PetscInt bs = -1; 61637d0c07bSMatthew G Knepley PetscInt localSize; 61737d0c07bSMatthew G Knepley PetscBool isShell, isBlock, isSeqBlock, isMPIBlock, isSymBlock, isSymSeqBlock, 
isSymMPIBlock, isSymmetric; 61837d0c07bSMatthew G Knepley 61937d0c07bSMatthew G Knepley ierr = DMGetDefaultGlobalSection(da, §ionGlobal);CHKERRQ(ierr); 62037d0c07bSMatthew G Knepley ierr = PetscSectionGetConstrainedStorageSize(sectionGlobal, &localSize);CHKERRQ(ierr); 621b5579763SJed Brown ierr = MatCreate(PetscObjectComm((PetscObject)da),&A);CHKERRQ(ierr); 622b5579763SJed Brown ierr = MatSetSizes(A,localSize,localSize,PETSC_DETERMINE,PETSC_DETERMINE);CHKERRQ(ierr); 623b5579763SJed Brown ierr = MatSetType(A,mtype);CHKERRQ(ierr); 62437d0c07bSMatthew G Knepley ierr = PetscStrcmp(mtype,MATSHELL,&isShell);CHKERRQ(ierr); 62537d0c07bSMatthew G Knepley ierr = PetscStrcmp(mtype,MATBAIJ,&isBlock);CHKERRQ(ierr); 62637d0c07bSMatthew G Knepley ierr = PetscStrcmp(mtype,MATSEQBAIJ,&isSeqBlock);CHKERRQ(ierr); 62737d0c07bSMatthew G Knepley ierr = PetscStrcmp(mtype,MATMPIBAIJ,&isMPIBlock);CHKERRQ(ierr); 62837d0c07bSMatthew G Knepley ierr = PetscStrcmp(mtype,MATSBAIJ,&isSymBlock);CHKERRQ(ierr); 62937d0c07bSMatthew G Knepley ierr = PetscStrcmp(mtype,MATSEQSBAIJ,&isSymSeqBlock);CHKERRQ(ierr); 63037d0c07bSMatthew G Knepley ierr = PetscStrcmp(mtype,MATMPISBAIJ,&isSymMPIBlock);CHKERRQ(ierr); 63137d0c07bSMatthew G Knepley /* Check for symmetric storage */ 63237d0c07bSMatthew G Knepley isSymmetric = (PetscBool) (isSymBlock || isSymSeqBlock || isSymMPIBlock); 63337d0c07bSMatthew G Knepley if (isSymmetric) { 63437d0c07bSMatthew G Knepley ierr = MatSetOption(*J, MAT_IGNORE_LOWER_TRIANGULAR, PETSC_TRUE);CHKERRQ(ierr); 63537d0c07bSMatthew G Knepley } 63637d0c07bSMatthew G Knepley if (!isShell) { 63737d0c07bSMatthew G Knepley PetscInt *dnz, *onz, *dnzu, *onzu, bsLocal; 63837d0c07bSMatthew G Knepley 63937d0c07bSMatthew G Knepley if (bs < 0) { 64037d0c07bSMatthew G Knepley if (isBlock || isSeqBlock || isMPIBlock || isSymBlock || isSymSeqBlock || isSymMPIBlock) { 64137d0c07bSMatthew G Knepley PetscInt pStart, pEnd, p, dof; 64237d0c07bSMatthew G Knepley 64337d0c07bSMatthew G Knepley ierr = 
PetscSectionGetChart(sectionGlobal, &pStart, &pEnd);CHKERRQ(ierr); 64437d0c07bSMatthew G Knepley for (p = pStart; p < pEnd; ++p) { 64537d0c07bSMatthew G Knepley ierr = PetscSectionGetDof(sectionGlobal, p, &dof);CHKERRQ(ierr); 64637d0c07bSMatthew G Knepley if (dof) { 64737d0c07bSMatthew G Knepley bs = dof; 64837d0c07bSMatthew G Knepley break; 64937d0c07bSMatthew G Knepley } 65037d0c07bSMatthew G Knepley } 65137d0c07bSMatthew G Knepley } else { 65237d0c07bSMatthew G Knepley bs = 1; 65337d0c07bSMatthew G Knepley } 65437d0c07bSMatthew G Knepley /* Must have same blocksize on all procs (some might have no points) */ 65537d0c07bSMatthew G Knepley bsLocal = bs; 656b2566f29SBarry Smith ierr = MPIU_Allreduce(&bsLocal, &bs, 1, MPIU_INT, MPI_MAX, PetscObjectComm((PetscObject)da));CHKERRQ(ierr); 65737d0c07bSMatthew G Knepley } 6581795a4d1SJed Brown ierr = PetscCalloc4(localSize/bs, &dnz, localSize/bs, &onz, localSize/bs, &dnzu, localSize/bs, &onzu);CHKERRQ(ierr); 659552f7358SJed Brown /* ierr = DMPlexPreallocateOperator(dm, bs, section, sectionGlobal, dnz, onz, dnzu, onzu, *J, fillMatrix);CHKERRQ(ierr); */ 66037d0c07bSMatthew G Knepley ierr = PetscFree4(dnz, onz, dnzu, onzu);CHKERRQ(ierr); 66137d0c07bSMatthew G Knepley } 66237d0c07bSMatthew G Knepley } 66347c6ae99SBarry Smith /* 66447c6ae99SBarry Smith m 66547c6ae99SBarry Smith ------------------------------------------------------ 66647c6ae99SBarry Smith | | 66747c6ae99SBarry Smith | | 66847c6ae99SBarry Smith | ---------------------- | 66947c6ae99SBarry Smith | | | | 67047c6ae99SBarry Smith n | ny | | | 67147c6ae99SBarry Smith | | | | 67247c6ae99SBarry Smith | .--------------------- | 67347c6ae99SBarry Smith | (xs,ys) nx | 67447c6ae99SBarry Smith | . 
| 67547c6ae99SBarry Smith | (gxs,gys) | 67647c6ae99SBarry Smith | | 67747c6ae99SBarry Smith ----------------------------------------------------- 67847c6ae99SBarry Smith */ 67947c6ae99SBarry Smith 68047c6ae99SBarry Smith /* 68147c6ae99SBarry Smith nc - number of components per grid point 68247c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 68347c6ae99SBarry Smith 68447c6ae99SBarry Smith */ 685e30e807fSPeter Brune M = dd->M; 686e30e807fSPeter Brune N = dd->N; 687e30e807fSPeter Brune P = dd->P; 688c73cfb54SMatthew G. Knepley dim = da->dim; 689e30e807fSPeter Brune dof = dd->w; 690e30e807fSPeter Brune /* ierr = DMDAGetInfo(da,&dim,&M,&N,&P,0,0,0,&dof,0,0,0,0,0);CHKERRQ(ierr); */ 691aa219208SBarry Smith ierr = DMDAGetCorners(da,0,0,0,&nx,&ny,&nz);CHKERRQ(ierr); 69247c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 69347c6ae99SBarry Smith ierr = MatCreate(comm,&A);CHKERRQ(ierr); 69447c6ae99SBarry Smith ierr = MatSetSizes(A,dof*nx*ny*nz,dof*nx*ny*nz,dof*M*N*P,dof*M*N*P);CHKERRQ(ierr); 695b412c318SBarry Smith ierr = MatSetType(A,mtype);CHKERRQ(ierr); 69695ee5b0eSBarry Smith ierr = MatSetDM(A,da);CHKERRQ(ierr); 697b06ff27eSHong Zhang if (da->structure_only) { 698b06ff27eSHong Zhang ierr = MatSetOption(A,MAT_STRUCTURE_ONLY,PETSC_TRUE);CHKERRQ(ierr); 699b06ff27eSHong Zhang } 70047c6ae99SBarry Smith ierr = MatGetType(A,&Atype);CHKERRQ(ierr); 70147c6ae99SBarry Smith /* 702aa219208SBarry Smith We do not provide a getmatrix function in the DMDA operations because 703aa219208SBarry Smith the basic DMDA does not know about matrices. We think of DMDA as being more 70447c6ae99SBarry Smith more low-level than matrices. This is kind of cheating but, cause sometimes 705aa219208SBarry Smith we think of DMDA has higher level than matrices. 
70647c6ae99SBarry Smith 70747c6ae99SBarry Smith We could switch based on Atype (or mtype), but we do not since the 70847c6ae99SBarry Smith specialized setting routines depend only the particular preallocation 70947c6ae99SBarry Smith details of the matrix, not the type itself. 71047c6ae99SBarry Smith */ 71147c6ae99SBarry Smith ierr = PetscObjectQueryFunction((PetscObject)A,"MatMPIAIJSetPreallocation_C",&aij);CHKERRQ(ierr); 71247c6ae99SBarry Smith if (!aij) { 71347c6ae99SBarry Smith ierr = PetscObjectQueryFunction((PetscObject)A,"MatSeqAIJSetPreallocation_C",&aij);CHKERRQ(ierr); 71447c6ae99SBarry Smith } 71547c6ae99SBarry Smith if (!aij) { 71647c6ae99SBarry Smith ierr = PetscObjectQueryFunction((PetscObject)A,"MatMPIBAIJSetPreallocation_C",&baij);CHKERRQ(ierr); 71747c6ae99SBarry Smith if (!baij) { 71847c6ae99SBarry Smith ierr = PetscObjectQueryFunction((PetscObject)A,"MatSeqBAIJSetPreallocation_C",&baij);CHKERRQ(ierr); 71947c6ae99SBarry Smith } 72047c6ae99SBarry Smith if (!baij) { 72147c6ae99SBarry Smith ierr = PetscObjectQueryFunction((PetscObject)A,"MatMPISBAIJSetPreallocation_C",&sbaij);CHKERRQ(ierr); 72247c6ae99SBarry Smith if (!sbaij) { 72347c6ae99SBarry Smith ierr = PetscObjectQueryFunction((PetscObject)A,"MatSeqSBAIJSetPreallocation_C",&sbaij);CHKERRQ(ierr); 72447c6ae99SBarry Smith } 7255e26d47bSHong Zhang if (!sbaij) { 726d4002b98SHong Zhang ierr = PetscObjectQueryFunction((PetscObject)A,"MatMPISELLSetPreallocation_C",&sell);CHKERRQ(ierr); 727d4002b98SHong Zhang if (!sell) { 728d4002b98SHong Zhang ierr = PetscObjectQueryFunction((PetscObject)A,"MatSeqSELLSetPreallocation_C",&sell);CHKERRQ(ierr); 7295e26d47bSHong Zhang } 7305e26d47bSHong Zhang } 731e584696dSStefano Zampini if (!sell) { 732e584696dSStefano Zampini ierr = PetscObjectQueryFunction((PetscObject)A,"MatISSetPreallocation_C",&is);CHKERRQ(ierr); 733e584696dSStefano Zampini } 73447c6ae99SBarry Smith } 73547c6ae99SBarry Smith } 73647c6ae99SBarry Smith if (aij) { 73747c6ae99SBarry Smith if (dim == 1) { 
738ce308e1dSBarry Smith if (dd->ofill) { 739ce308e1dSBarry Smith ierr = DMCreateMatrix_DA_1d_MPIAIJ_Fill(da,A);CHKERRQ(ierr); 740ce308e1dSBarry Smith } else { 741950540a4SJed Brown ierr = DMCreateMatrix_DA_1d_MPIAIJ(da,A);CHKERRQ(ierr); 742ce308e1dSBarry Smith } 74347c6ae99SBarry Smith } else if (dim == 2) { 74447c6ae99SBarry Smith if (dd->ofill) { 745950540a4SJed Brown ierr = DMCreateMatrix_DA_2d_MPIAIJ_Fill(da,A);CHKERRQ(ierr); 74647c6ae99SBarry Smith } else { 747950540a4SJed Brown ierr = DMCreateMatrix_DA_2d_MPIAIJ(da,A);CHKERRQ(ierr); 74847c6ae99SBarry Smith } 74947c6ae99SBarry Smith } else if (dim == 3) { 75047c6ae99SBarry Smith if (dd->ofill) { 751950540a4SJed Brown ierr = DMCreateMatrix_DA_3d_MPIAIJ_Fill(da,A);CHKERRQ(ierr); 75247c6ae99SBarry Smith } else { 753950540a4SJed Brown ierr = DMCreateMatrix_DA_3d_MPIAIJ(da,A);CHKERRQ(ierr); 75447c6ae99SBarry Smith } 75547c6ae99SBarry Smith } 75647c6ae99SBarry Smith } else if (baij) { 75747c6ae99SBarry Smith if (dim == 2) { 758950540a4SJed Brown ierr = DMCreateMatrix_DA_2d_MPIBAIJ(da,A);CHKERRQ(ierr); 75947c6ae99SBarry Smith } else if (dim == 3) { 760950540a4SJed Brown ierr = DMCreateMatrix_DA_3d_MPIBAIJ(da,A);CHKERRQ(ierr); 761ce94432eSBarry Smith } else SETERRQ3(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"Not implemented for %D dimension and Matrix Type: %s in %D dimension! Send mail to petsc-maint@mcs.anl.gov for code",dim,Atype,dim); 76247c6ae99SBarry Smith } else if (sbaij) { 76347c6ae99SBarry Smith if (dim == 2) { 764950540a4SJed Brown ierr = DMCreateMatrix_DA_2d_MPISBAIJ(da,A);CHKERRQ(ierr); 76547c6ae99SBarry Smith } else if (dim == 3) { 766950540a4SJed Brown ierr = DMCreateMatrix_DA_3d_MPISBAIJ(da,A);CHKERRQ(ierr); 767ce94432eSBarry Smith } else SETERRQ3(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"Not implemented for %D dimension and Matrix Type: %s in %D dimension! 
Send mail to petsc-maint@mcs.anl.gov for code",dim,Atype,dim); 768d4002b98SHong Zhang } else if (sell) { 7695e26d47bSHong Zhang if (dim == 2) { 770d4002b98SHong Zhang ierr = DMCreateMatrix_DA_2d_MPISELL(da,A);CHKERRQ(ierr); 771711261dbSHong Zhang } else if (dim == 3) { 772d4002b98SHong Zhang ierr = DMCreateMatrix_DA_3d_MPISELL(da,A);CHKERRQ(ierr); 7735e26d47bSHong Zhang } else SETERRQ3(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"Not implemented for %D dimension and Matrix Type: %s in %D dimension! Send mail to petsc-maint@mcs.anl.gov for code",dim,Atype,dim); 774e584696dSStefano Zampini } else if (is) { 775e584696dSStefano Zampini ierr = DMCreateMatrix_DA_IS(da,A);CHKERRQ(ierr); 776869776cdSLisandro Dalcin } else { 77745b6f7e9SBarry Smith ISLocalToGlobalMapping ltog; 778e584696dSStefano Zampini 779b026d285SBarry Smith ierr = MatSetBlockSize(A,dof);CHKERRQ(ierr); 7802949035bSJed Brown ierr = MatSetUp(A);CHKERRQ(ierr); 781b026d285SBarry Smith ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 782869776cdSLisandro Dalcin ierr = MatSetLocalToGlobalMapping(A,ltog,ltog);CHKERRQ(ierr); 78347c6ae99SBarry Smith } 784aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&starts[0],&starts[1],&starts[2],&dims[0],&dims[1],&dims[2]);CHKERRQ(ierr); 78547c6ae99SBarry Smith ierr = MatSetStencil(A,dim,dims,starts,dof);CHKERRQ(ierr); 786c688c046SMatthew G Knepley ierr = MatSetDM(A,da);CHKERRQ(ierr); 78747c6ae99SBarry Smith ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 78847c6ae99SBarry Smith if (size > 1) { 78947c6ae99SBarry Smith /* change viewer to display matrix in natural ordering */ 7900c0fd78eSBarry Smith ierr = MatSetOperation(A, MATOP_VIEW, (void (*)(void))MatView_MPI_DA);CHKERRQ(ierr); 7910c0fd78eSBarry Smith ierr = MatSetOperation(A, MATOP_LOAD, (void (*)(void))MatLoad_MPI_DA);CHKERRQ(ierr); 79247c6ae99SBarry Smith } 793b5579763SJed Brown ierr = MatSetFromOptions(A);CHKERRQ(ierr); 79447c6ae99SBarry Smith *J = A; 79547c6ae99SBarry Smith PetscFunctionReturn(0); 
79647c6ae99SBarry Smith } 79747c6ae99SBarry Smith 79847c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/ 799e584696dSStefano Zampini PetscErrorCode DMCreateMatrix_DA_IS(DM dm,Mat J) 800e584696dSStefano Zampini { 801e584696dSStefano Zampini DM_DA *da = (DM_DA*)dm->data; 802e584696dSStefano Zampini Mat lJ; 803e584696dSStefano Zampini ISLocalToGlobalMapping ltog; 804e584696dSStefano Zampini IS is_loc_filt, is_glob; 80505339c03SStefano Zampini const PetscInt *e_loc,*idx; 80605339c03SStefano Zampini PetscInt i,nel,nen,dnz,nv,dof,dim,*gidx,nb; 807e584696dSStefano Zampini PetscErrorCode ierr; 808e584696dSStefano Zampini 809e584696dSStefano Zampini /* The l2g map of DMDA has all ghosted nodes, and e_loc is a subset of all the local nodes (including the ghosted) 810e584696dSStefano Zampini We need to filter the local indices that are represented through the DMDAGetElements decomposition 811e584696dSStefano Zampini This is because the size of the local matrices in MATIS is the local size of the l2g map */ 812e584696dSStefano Zampini PetscFunctionBegin; 813e584696dSStefano Zampini dof = da->w; 814e584696dSStefano Zampini dim = dm->dim; 81505339c03SStefano Zampini 81605339c03SStefano Zampini ierr = MatSetBlockSize(J,dof);CHKERRQ(ierr); 81705339c03SStefano Zampini 81805339c03SStefano Zampini /* get local elements indices in local DMDA numbering */ 819e584696dSStefano Zampini ierr = DMDAGetElements(dm,&nel,&nen,&e_loc);CHKERRQ(ierr); /* this will throw an error if the stencil type is not DMDA_STENCIL_BOX */ 820e584696dSStefano Zampini ierr = ISCreateBlock(PetscObjectComm((PetscObject)dm),dof,nel*nen,e_loc,PETSC_COPY_VALUES,&is_loc_filt);CHKERRQ(ierr); 821e584696dSStefano Zampini ierr = DMDARestoreElements(dm,&nel,&nen,&e_loc);CHKERRQ(ierr); 82205339c03SStefano Zampini 82305339c03SStefano Zampini /* obtain a consistent local ordering for MATIS */ 824e584696dSStefano Zampini ierr = ISSortRemoveDups(is_loc_filt);CHKERRQ(ierr); 
82505339c03SStefano Zampini ierr = ISBlockGetLocalSize(is_loc_filt,&nb);CHKERRQ(ierr); 82605339c03SStefano Zampini ierr = DMGetLocalToGlobalMapping(dm,<og);CHKERRQ(ierr); 82705339c03SStefano Zampini ierr = ISLocalToGlobalMappingGetSize(ltog,&nv);CHKERRQ(ierr); 82805339c03SStefano Zampini ierr = PetscMalloc1(PetscMax(nb,nv/dof),&gidx);CHKERRQ(ierr); 82905339c03SStefano Zampini ierr = ISBlockGetIndices(is_loc_filt,&idx);CHKERRQ(ierr); 83005339c03SStefano Zampini ierr = ISLocalToGlobalMappingApplyBlock(ltog,nb,idx,gidx);CHKERRQ(ierr); 83105339c03SStefano Zampini ierr = ISBlockRestoreIndices(is_loc_filt,&idx);CHKERRQ(ierr); 83205339c03SStefano Zampini ierr = ISCreateBlock(PetscObjectComm((PetscObject)dm),dof,nb,gidx,PETSC_USE_POINTER,&is_glob);CHKERRQ(ierr); 833e584696dSStefano Zampini ierr = ISLocalToGlobalMappingCreateIS(is_glob,<og);CHKERRQ(ierr); 834e584696dSStefano Zampini ierr = ISDestroy(&is_glob);CHKERRQ(ierr); 835e584696dSStefano Zampini ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 836e584696dSStefano Zampini ierr = ISLocalToGlobalMappingDestroy(<og);CHKERRQ(ierr); 83705339c03SStefano Zampini 838e584696dSStefano Zampini /* We also attach a l2g map to the local matrices to have MatSetValueLocal to work */ 839e584696dSStefano Zampini ierr = MatISGetLocalMat(J,&lJ);CHKERRQ(ierr); 840e584696dSStefano Zampini ierr = ISLocalToGlobalMappingCreateIS(is_loc_filt,<og);CHKERRQ(ierr); 841e584696dSStefano Zampini ierr = ISDestroy(&is_loc_filt);CHKERRQ(ierr); 84205339c03SStefano Zampini ierr = ISCreateStride(PetscObjectComm((PetscObject)lJ),nv/dof,0,1,&is_glob);CHKERRQ(ierr); 84305339c03SStefano Zampini ierr = ISGetIndices(is_glob,&idx);CHKERRQ(ierr); 84405339c03SStefano Zampini ierr = ISGlobalToLocalMappingApplyBlock(ltog,IS_GTOLM_MASK,nv/dof,idx,&nb,gidx);CHKERRQ(ierr); 84505339c03SStefano Zampini ierr = ISRestoreIndices(is_glob,&idx);CHKERRQ(ierr); 846e584696dSStefano Zampini ierr = ISDestroy(&is_glob);CHKERRQ(ierr); 847e584696dSStefano Zampini ierr = 
ISLocalToGlobalMappingDestroy(<og);CHKERRQ(ierr); 848722d6fa8SStefano Zampini ierr = ISCreateBlock(PETSC_COMM_SELF,dof,nb,gidx,PETSC_USE_POINTER,&is_loc_filt);CHKERRQ(ierr); 849e584696dSStefano Zampini ierr = ISLocalToGlobalMappingCreateIS(is_loc_filt,<og);CHKERRQ(ierr); 850e584696dSStefano Zampini ierr = ISDestroy(&is_loc_filt);CHKERRQ(ierr); 851e584696dSStefano Zampini ierr = MatSetLocalToGlobalMapping(lJ,ltog,ltog);CHKERRQ(ierr); 852e584696dSStefano Zampini ierr = ISLocalToGlobalMappingDestroy(<og);CHKERRQ(ierr); 85305339c03SStefano Zampini ierr = PetscFree(gidx);CHKERRQ(ierr); 85405339c03SStefano Zampini 855e584696dSStefano Zampini /* Preallocation (not exact) */ 856e584696dSStefano Zampini switch (da->elementtype) { 857e584696dSStefano Zampini case DMDA_ELEMENT_P1: 858e584696dSStefano Zampini case DMDA_ELEMENT_Q1: 859e584696dSStefano Zampini dnz = 1; 860e584696dSStefano Zampini for (i=0; i<dim; i++) dnz *= 3; 861e584696dSStefano Zampini dnz *= dof; 862e584696dSStefano Zampini break; 863e584696dSStefano Zampini default: 864e584696dSStefano Zampini SETERRQ1(PetscObjectComm((PetscObject)dm),PETSC_ERR_SUP,"Unhandled element type %d",da->elementtype); 865e584696dSStefano Zampini break; 866e584696dSStefano Zampini } 867e584696dSStefano Zampini ierr = MatSeqAIJSetPreallocation(lJ,dnz,NULL);CHKERRQ(ierr); 868e584696dSStefano Zampini ierr = MatSeqBAIJSetPreallocation(lJ,dof,dnz/dof,NULL);CHKERRQ(ierr); 869e584696dSStefano Zampini ierr = MatSeqSBAIJSetPreallocation(lJ,dof,dnz/dof,NULL);CHKERRQ(ierr); 870e584696dSStefano Zampini ierr = MatISRestoreLocalMat(J,&lJ);CHKERRQ(ierr); 871e584696dSStefano Zampini PetscFunctionReturn(0); 872e584696dSStefano Zampini } 873e584696dSStefano Zampini 874d4002b98SHong Zhang PetscErrorCode DMCreateMatrix_DA_2d_MPISELL(DM da,Mat J) 8755e26d47bSHong Zhang { 8765e26d47bSHong Zhang PetscErrorCode ierr; 8775e26d47bSHong Zhang PetscInt xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny,m,n,dim,s,*cols = NULL,k,nc,*rows = NULL,col,cnt,l,p; 8785e26d47bSHong 
Zhang PetscInt lstart,lend,pstart,pend,*dnz,*onz; 8795e26d47bSHong Zhang MPI_Comm comm; 8805e26d47bSHong Zhang PetscScalar *values; 8815e26d47bSHong Zhang DMBoundaryType bx,by; 8825e26d47bSHong Zhang ISLocalToGlobalMapping ltog; 8835e26d47bSHong Zhang DMDAStencilType st; 8845e26d47bSHong Zhang 8855e26d47bSHong Zhang PetscFunctionBegin; 8865e26d47bSHong Zhang /* 8875e26d47bSHong Zhang nc - number of components per grid point 8885e26d47bSHong Zhang col - number of colors needed in one direction for single component problem 8895e26d47bSHong Zhang 8905e26d47bSHong Zhang */ 8915e26d47bSHong Zhang ierr = DMDAGetInfo(da,&dim,&m,&n,0,0,0,0,&nc,&s,&bx,&by,0,&st);CHKERRQ(ierr); 8925e26d47bSHong Zhang col = 2*s + 1; 8935e26d47bSHong Zhang ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr); 8945e26d47bSHong Zhang ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr); 8955e26d47bSHong Zhang ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 8965e26d47bSHong Zhang 8975e26d47bSHong Zhang ierr = PetscMalloc2(nc,&rows,col*col*nc*nc,&cols);CHKERRQ(ierr); 8985e26d47bSHong Zhang ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 8995e26d47bSHong Zhang 9005e26d47bSHong Zhang ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr); 9015e26d47bSHong Zhang /* determine the matrix preallocation information */ 9025e26d47bSHong Zhang ierr = MatPreallocateInitialize(comm,nc*nx*ny,nc*nx*ny,dnz,onz);CHKERRQ(ierr); 9035e26d47bSHong Zhang for (i=xs; i<xs+nx; i++) { 9045e26d47bSHong Zhang 9055e26d47bSHong Zhang pstart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 9065e26d47bSHong Zhang pend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 9075e26d47bSHong Zhang 9085e26d47bSHong Zhang for (j=ys; j<ys+ny; j++) { 9095e26d47bSHong Zhang slot = i - gxs + gnx*(j - gys); 9105e26d47bSHong Zhang 9115e26d47bSHong Zhang lstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 9125e26d47bSHong Zhang lend = (by == DM_BOUNDARY_PERIODIC) ? 
s : (PetscMin(s,n-j-1)); 9135e26d47bSHong Zhang 9145e26d47bSHong Zhang cnt = 0; 9155e26d47bSHong Zhang for (k=0; k<nc; k++) { 9165e26d47bSHong Zhang for (l=lstart; l<lend+1; l++) { 9175e26d47bSHong Zhang for (p=pstart; p<pend+1; p++) { 9185e26d47bSHong Zhang if ((st == DMDA_STENCIL_BOX) || (!l || !p)) { /* entries on star have either l = 0 or p = 0 */ 9195e26d47bSHong Zhang cols[cnt++] = k + nc*(slot + gnx*l + p); 9205e26d47bSHong Zhang } 9215e26d47bSHong Zhang } 9225e26d47bSHong Zhang } 9235e26d47bSHong Zhang rows[k] = k + nc*(slot); 9245e26d47bSHong Zhang } 9255e26d47bSHong Zhang ierr = MatPreallocateSetLocal(ltog,nc,rows,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr); 9265e26d47bSHong Zhang } 9275e26d47bSHong Zhang } 9285e26d47bSHong Zhang ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr); 929d4002b98SHong Zhang ierr = MatSeqSELLSetPreallocation(J,0,dnz);CHKERRQ(ierr); 930d4002b98SHong Zhang ierr = MatMPISELLSetPreallocation(J,0,dnz,0,onz);CHKERRQ(ierr); 9315e26d47bSHong Zhang ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 9325e26d47bSHong Zhang 9335e26d47bSHong Zhang ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 9345e26d47bSHong Zhang 9355e26d47bSHong Zhang /* 9365e26d47bSHong Zhang For each node in the grid: we get the neighbors in the local (on processor ordering 9375e26d47bSHong Zhang that includes the ghost points) then MatSetValuesLocal() maps those indices to the global 9385e26d47bSHong Zhang PETSc ordering. 9395e26d47bSHong Zhang */ 9405e26d47bSHong Zhang if (!da->prealloc_only) { 9415e26d47bSHong Zhang ierr = PetscCalloc1(col*col*nc*nc,&values);CHKERRQ(ierr); 9425e26d47bSHong Zhang for (i=xs; i<xs+nx; i++) { 9435e26d47bSHong Zhang 9445e26d47bSHong Zhang pstart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 9455e26d47bSHong Zhang pend = (bx == DM_BOUNDARY_PERIODIC) ? 
s : (PetscMin(s,m-i-1)); 9465e26d47bSHong Zhang 9475e26d47bSHong Zhang for (j=ys; j<ys+ny; j++) { 9485e26d47bSHong Zhang slot = i - gxs + gnx*(j - gys); 9495e26d47bSHong Zhang 9505e26d47bSHong Zhang lstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 9515e26d47bSHong Zhang lend = (by == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 9525e26d47bSHong Zhang 9535e26d47bSHong Zhang cnt = 0; 9545e26d47bSHong Zhang for (k=0; k<nc; k++) { 9555e26d47bSHong Zhang for (l=lstart; l<lend+1; l++) { 9565e26d47bSHong Zhang for (p=pstart; p<pend+1; p++) { 9575e26d47bSHong Zhang if ((st == DMDA_STENCIL_BOX) || (!l || !p)) { /* entries on star have either l = 0 or p = 0 */ 9585e26d47bSHong Zhang cols[cnt++] = k + nc*(slot + gnx*l + p); 9595e26d47bSHong Zhang } 9605e26d47bSHong Zhang } 9615e26d47bSHong Zhang } 9625e26d47bSHong Zhang rows[k] = k + nc*(slot); 9635e26d47bSHong Zhang } 9645e26d47bSHong Zhang ierr = MatSetValuesLocal(J,nc,rows,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 9655e26d47bSHong Zhang } 9665e26d47bSHong Zhang } 9675e26d47bSHong Zhang ierr = PetscFree(values);CHKERRQ(ierr); 9685e26d47bSHong Zhang ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 9695e26d47bSHong Zhang ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 9705e26d47bSHong Zhang ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr); 9715e26d47bSHong Zhang } 9725e26d47bSHong Zhang ierr = PetscFree2(rows,cols);CHKERRQ(ierr); 9735e26d47bSHong Zhang PetscFunctionReturn(0); 9745e26d47bSHong Zhang } 9755e26d47bSHong Zhang 976d4002b98SHong Zhang PetscErrorCode DMCreateMatrix_DA_3d_MPISELL(DM da,Mat J) 977711261dbSHong Zhang { 978711261dbSHong Zhang PetscErrorCode ierr; 979711261dbSHong Zhang PetscInt xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny; 980711261dbSHong Zhang PetscInt m,n,dim,s,*cols = NULL,k,nc,*rows = NULL,col,cnt,l,p,*dnz = NULL,*onz = NULL; 981711261dbSHong Zhang PetscInt istart,iend,jstart,jend,kstart,kend,zs,nz,gzs,gnz,ii,jj,kk,M,N,P; 
982711261dbSHong Zhang MPI_Comm comm; 983711261dbSHong Zhang PetscScalar *values; 984711261dbSHong Zhang DMBoundaryType bx,by,bz; 985711261dbSHong Zhang ISLocalToGlobalMapping ltog; 986711261dbSHong Zhang DMDAStencilType st; 987711261dbSHong Zhang 988711261dbSHong Zhang PetscFunctionBegin; 989711261dbSHong Zhang /* 990711261dbSHong Zhang nc - number of components per grid point 991711261dbSHong Zhang col - number of colors needed in one direction for single component problem 992711261dbSHong Zhang 993711261dbSHong Zhang */ 994711261dbSHong Zhang ierr = DMDAGetInfo(da,&dim,&m,&n,&p,&M,&N,&P,&nc,&s,&bx,&by,&bz,&st);CHKERRQ(ierr); 995711261dbSHong Zhang col = 2*s + 1; 996711261dbSHong Zhang ierr = DMDAGetCorners(da,&xs,&ys,&zs,&nx,&ny,&nz);CHKERRQ(ierr); 997711261dbSHong Zhang ierr = DMDAGetGhostCorners(da,&gxs,&gys,&gzs,&gnx,&gny,&gnz);CHKERRQ(ierr); 998711261dbSHong Zhang ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 999711261dbSHong Zhang 1000711261dbSHong Zhang ierr = PetscMalloc2(nc,&rows,col*col*col*nc*nc,&cols);CHKERRQ(ierr); 1001711261dbSHong Zhang ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 1002711261dbSHong Zhang 1003711261dbSHong Zhang ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr); 1004711261dbSHong Zhang /* determine the matrix preallocation information */ 1005711261dbSHong Zhang ierr = MatPreallocateInitialize(comm,nc*nx*ny*nz,nc*nx*ny*nz,dnz,onz);CHKERRQ(ierr); 1006711261dbSHong Zhang for (i=xs; i<xs+nx; i++) { 1007711261dbSHong Zhang istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 1008711261dbSHong Zhang iend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 1009711261dbSHong Zhang for (j=ys; j<ys+ny; j++) { 1010711261dbSHong Zhang jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 1011711261dbSHong Zhang jend = (by == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 1012711261dbSHong Zhang for (k=zs; k<zs+nz; k++) { 1013711261dbSHong Zhang kstart = (bz == DM_BOUNDARY_PERIODIC) ? 
-s : (PetscMax(-s,-k)); 1014711261dbSHong Zhang kend = (bz == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,p-k-1)); 1015711261dbSHong Zhang 1016711261dbSHong Zhang slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 1017711261dbSHong Zhang 1018711261dbSHong Zhang cnt = 0; 1019711261dbSHong Zhang for (l=0; l<nc; l++) { 1020711261dbSHong Zhang for (ii=istart; ii<iend+1; ii++) { 1021711261dbSHong Zhang for (jj=jstart; jj<jend+1; jj++) { 1022711261dbSHong Zhang for (kk=kstart; kk<kend+1; kk++) { 1023711261dbSHong Zhang if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/ 1024711261dbSHong Zhang cols[cnt++] = l + nc*(slot + ii + gnx*jj + gnx*gny*kk); 1025711261dbSHong Zhang } 1026711261dbSHong Zhang } 1027711261dbSHong Zhang } 1028711261dbSHong Zhang } 1029711261dbSHong Zhang rows[l] = l + nc*(slot); 1030711261dbSHong Zhang } 1031711261dbSHong Zhang ierr = MatPreallocateSetLocal(ltog,nc,rows,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr); 1032711261dbSHong Zhang } 1033711261dbSHong Zhang } 1034711261dbSHong Zhang } 1035711261dbSHong Zhang ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr); 1036d4002b98SHong Zhang ierr = MatSeqSELLSetPreallocation(J,0,dnz);CHKERRQ(ierr); 1037d4002b98SHong Zhang ierr = MatMPISELLSetPreallocation(J,0,dnz,0,onz);CHKERRQ(ierr); 1038711261dbSHong Zhang ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 1039711261dbSHong Zhang ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 1040711261dbSHong Zhang 1041711261dbSHong Zhang /* 1042711261dbSHong Zhang For each node in the grid: we get the neighbors in the local (on processor ordering 1043711261dbSHong Zhang that includes the ghost points) then MatSetValuesLocal() maps those indices to the global 1044711261dbSHong Zhang PETSc ordering. 
1045711261dbSHong Zhang */ 1046711261dbSHong Zhang if (!da->prealloc_only) { 1047711261dbSHong Zhang ierr = PetscCalloc1(col*col*col*nc*nc*nc,&values);CHKERRQ(ierr); 1048711261dbSHong Zhang for (i=xs; i<xs+nx; i++) { 1049711261dbSHong Zhang istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 1050711261dbSHong Zhang iend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 1051711261dbSHong Zhang for (j=ys; j<ys+ny; j++) { 1052711261dbSHong Zhang jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 1053711261dbSHong Zhang jend = (by == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 1054711261dbSHong Zhang for (k=zs; k<zs+nz; k++) { 1055711261dbSHong Zhang kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k)); 1056711261dbSHong Zhang kend = (bz == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,p-k-1)); 1057711261dbSHong Zhang 1058711261dbSHong Zhang slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 1059711261dbSHong Zhang 1060711261dbSHong Zhang cnt = 0; 1061711261dbSHong Zhang for (l=0; l<nc; l++) { 1062711261dbSHong Zhang for (ii=istart; ii<iend+1; ii++) { 1063711261dbSHong Zhang for (jj=jstart; jj<jend+1; jj++) { 1064711261dbSHong Zhang for (kk=kstart; kk<kend+1; kk++) { 1065711261dbSHong Zhang if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/ 1066711261dbSHong Zhang cols[cnt++] = l + nc*(slot + ii + gnx*jj + gnx*gny*kk); 1067711261dbSHong Zhang } 1068711261dbSHong Zhang } 1069711261dbSHong Zhang } 1070711261dbSHong Zhang } 1071711261dbSHong Zhang rows[l] = l + nc*(slot); 1072711261dbSHong Zhang } 1073711261dbSHong Zhang ierr = MatSetValuesLocal(J,nc,rows,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 1074711261dbSHong Zhang } 1075711261dbSHong Zhang } 1076711261dbSHong Zhang } 1077711261dbSHong Zhang ierr = PetscFree(values);CHKERRQ(ierr); 1078711261dbSHong Zhang ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1079711261dbSHong Zhang ierr = 
MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1080711261dbSHong Zhang ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr); 1081711261dbSHong Zhang } 1082711261dbSHong Zhang ierr = PetscFree2(rows,cols);CHKERRQ(ierr); 1083711261dbSHong Zhang PetscFunctionReturn(0); 1084711261dbSHong Zhang } 1085711261dbSHong Zhang

/*
   DMCreateMatrix_DA_2d_MPIAIJ - Preallocates the AIJ matrix J with the nonzero pattern implied by the
   stencil of the two-dimensional DMDA da, attaches the DMDA local-to-global mapping to J and, unless
   da->prealloc_only is set, inserts explicit zeros at every stencil location and assembles J.

   Input Parameters:
+  da - the DMDA supplying grid sizes, stencil width/type and boundary types
-  J  - the matrix to preallocate (both the SeqAIJ and MPIAIJ preallocation routines are called)

   Notes:
   Every one of the nc components at a grid point is coupled to all nc components at each stencil point.
   After assembly MAT_NEW_NONZERO_LOCATION_ERR is set on J.
*/
PetscErrorCode DMCreateMatrix_DA_2d_MPIAIJ(DM da,Mat J)
{
  PetscErrorCode         ierr;
  PetscInt               xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny,m,n,dim,s,*cols = NULL,k,nc,*rows = NULL,col,cnt,l,p,M,N;
  PetscInt               lstart,lend,pstart,pend,*dnz,*onz;
  MPI_Comm               comm;
  PetscScalar            *values;
  DMBoundaryType         bx,by;
  ISLocalToGlobalMapping ltog;
  DMDAStencilType        st;
  PetscBool              removedups = PETSC_FALSE;

  PetscFunctionBegin;
  /*
         nc - number of components per grid point
         col - number of colors needed in one direction for single component problem

     DMDAGetInfo() returns the three global sizes first and the three process counts after them, so the
     unused global z size must be skipped explicitly; otherwise M and N would receive the global z size
     and the number of processes in x instead of the number of processes in x and y.
  */
  ierr = DMDAGetInfo(da,&dim,&m,&n,0,&M,&N,0,&nc,&s,&bx,&by,0,&st);CHKERRQ(ierr);
  col  = 2*s + 1;
  /*
       With one processor in periodic domains in a skinny dimension the code will label nonzero columns multiple times
       because of "wrapping" around the end of the domain hitting an entry already counted in the other direction.
  */
  if (M == 1 && 2*s >= m) removedups = PETSC_TRUE;
  if (N == 1 && 2*s >= n) removedups = PETSC_TRUE;
  ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr);
  ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr);
  ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr);

  ierr = PetscMalloc2(nc,&rows,col*col*nc*nc,&cols);CHKERRQ(ierr);
  ierr = DMGetLocalToGlobalMapping(da,&ltog);CHKERRQ(ierr);

  ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr);
  /* determine the matrix preallocation information */
  ierr = MatPreallocateInitialize(comm,nc*nx*ny,nc*nx*ny,dnz,onz);CHKERRQ(ierr);
  for (i=xs; i<xs+nx; i++) {

    /* stencil extent in x; clipped at the physical boundary unless x is periodic */
    pstart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
    pend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));

    for (j=ys; j<ys+ny; j++) {
      /* index of grid point (i,j) in the ghosted local ordering */
      slot = i - gxs + gnx*(j - gys);

      lstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
      lend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));

      cnt = 0;
      for (k=0; k<nc; k++) {
        for (l=lstart; l<lend+1; l++) {
          for (p=pstart; p<pend+1; p++) {
            if ((st == DMDA_STENCIL_BOX) || (!l || !p)) {  /* entries on star have either l = 0 or p = 0 */
              cols[cnt++] = k + nc*(slot + gnx*l + p);
            }
          }
        }
        rows[k] = k + nc*(slot);
      }
      if (removedups) {
        ierr = MatPreallocateSetLocalRemoveDups(ltog,nc,rows,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr);
      } else {
        ierr = MatPreallocateSetLocal(ltog,nc,rows,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr);
      }
    }
  }
  ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr);
  ierr = MatSeqAIJSetPreallocation(J,0,dnz);CHKERRQ(ierr);
  ierr = MatMPIAIJSetPreallocation(J,0,dnz,0,onz);CHKERRQ(ierr);
  ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr);

  ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr);

  /*
    For each node in the grid: we get the neighbors in the local (on processor ordering
    that includes the ghost points) then MatSetValuesLocal() maps those indices to the global
    PETSc ordering.
  */
  if (!da->prealloc_only) {
    ierr = PetscCalloc1(col*col*nc*nc,&values);CHKERRQ(ierr);
    for (i=xs; i<xs+nx; i++) {

      pstart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
      pend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));

      for (j=ys; j<ys+ny; j++) {
        slot = i - gxs + gnx*(j - gys);

        lstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
        lend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));

        cnt = 0;
        for (k=0; k<nc; k++) {
          for (l=lstart; l<lend+1; l++) {
            for (p=pstart; p<pend+1; p++) {
              if ((st == DMDA_STENCIL_BOX) || (!l || !p)) {  /* entries on star have either l = 0 or p = 0 */
                cols[cnt++] = k + nc*(slot + gnx*l + p);
              }
            }
          }
          rows[k] = k + nc*(slot);
        }
        ierr = MatSetValuesLocal(J,nc,rows,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
      }
    }
    ierr = PetscFree(values);CHKERRQ(ierr);
    ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
    ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
    ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr);
  }
  ierr = PetscFree2(rows,cols);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

/*
   DMCreateMatrix_DA_2d_MPIAIJ_Fill - Same job as DMCreateMatrix_DA_2d_MPIAIJ() but the coupling between
   components is restricted by the fill patterns stored in the DM_DA data: dd->dfill for the coupling
   within a grid point and dd->ofill for the coupling to the other stencil points.

   Input Parameters:
+  da - the DMDA supplying grid sizes, stencil width/type, boundary types and fill patterns
-  J  - the matrix to preallocate and, unless da->prealloc_only is set, fill with explicit zeros

   Notes:
   A fill array is read as compressed rows: fill[k] .. fill[k+1]-1 index the entries belonging to
   component k and each such entry is the index of a coupled component. A NULL dfill means that all nc
   components at a grid point are coupled. ofill is dereferenced unconditionally.
   NOTE(review): presumably this routine is only selected when ofill has been set - confirm at the caller.
*/
PetscErrorCode DMCreateMatrix_DA_2d_MPIAIJ_Fill(DM da,Mat J)
{
  PetscErrorCode         ierr;
  PetscInt               xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny;
  PetscInt               m,n,dim,s,*cols,k,nc,row,col,cnt,maxcnt = 0,l,p,M,N;
  PetscInt               lstart,lend,pstart,pend,*dnz,*onz;
  DM_DA                  *dd = (DM_DA*)da->data;
  PetscInt               ifill_col,*ofill = dd->ofill, *dfill = dd->dfill;
  MPI_Comm               comm;
  PetscScalar            *values;
  DMBoundaryType         bx,by;
  ISLocalToGlobalMapping ltog;
  DMDAStencilType        st;
  PetscBool              removedups = PETSC_FALSE;

  PetscFunctionBegin;
  /*
         nc - number of components per grid point
         col - number of colors needed in one direction for single component problem

     The global z size is skipped explicitly so that M and N receive the number of processes in x and y
     (DMDAGetInfo() returns the three global sizes before the three process counts).
  */
  ierr = DMDAGetInfo(da,&dim,&m,&n,0,&M,&N,0,&nc,&s,&bx,&by,0,&st);CHKERRQ(ierr);
  col  = 2*s + 1;
  /*
       With one processor in periodic domains in a skinny dimension the code will label nonzero columns multiple times
       because of "wrapping" around the end of the domain hitting an entry already counted in the other direction.
  */
  if (M == 1 && 2*s >= m) removedups = PETSC_TRUE;
  if (N == 1 && 2*s >= n) removedups = PETSC_TRUE;
  ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr);
  ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr);
  ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr);

  /* one row at a time is processed, so cols only has to hold a single row */
  ierr = PetscMalloc1(col*col*nc,&cols);CHKERRQ(ierr);
  ierr = DMGetLocalToGlobalMapping(da,&ltog);CHKERRQ(ierr);

  ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr);
  /* determine the matrix preallocation information */
  ierr = MatPreallocateInitialize(comm,nc*nx*ny,nc*nx*ny,dnz,onz);CHKERRQ(ierr);
  for (i=xs; i<xs+nx; i++) {

    pstart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
    pend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));

    for (j=ys; j<ys+ny; j++) {
      slot = i - gxs + gnx*(j - gys);

      lstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
      lend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));

      for (k=0; k<nc; k++) {
        cnt = 0;
        for (l=lstart; l<lend+1; l++) {
          for (p=pstart; p<pend+1; p++) {
            if (l || p) {
              /* a neighboring grid point: couple through ofill */
              if ((st == DMDA_STENCIL_BOX) || (!l || !p)) {  /* entries on star */
                for (ifill_col=ofill[k]; ifill_col<ofill[k+1]; ifill_col++) cols[cnt++] = ofill[ifill_col] + nc*(slot + gnx*l + p);
              }
            } else {
              /* the grid point itself: couple through dfill, or fully when no dfill was given */
              if (dfill) {
                for (ifill_col=dfill[k]; ifill_col<dfill[k+1]; ifill_col++) cols[cnt++] = dfill[ifill_col] + nc*(slot + gnx*l + p);
              } else {
                for (ifill_col=0; ifill_col<nc; ifill_col++) cols[cnt++] = ifill_col + nc*(slot + gnx*l + p);
              }
            }
          }
        }
        row    = k + nc*(slot);
        maxcnt = PetscMax(maxcnt,cnt);  /* longest row; sizes the zero buffer used below */
        if (removedups) {
          ierr = MatPreallocateSetLocalRemoveDups(ltog,1,&row,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr);
        } else {
          ierr = MatPreallocateSetLocal(ltog,1,&row,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr);
        }
      }
    }
  }
  ierr = MatSeqAIJSetPreallocation(J,0,dnz);CHKERRQ(ierr);
  ierr = MatMPIAIJSetPreallocation(J,0,dnz,0,onz);CHKERRQ(ierr);
  ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr);
  ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr);

  /*
    For each node in the grid: we get the neighbors in the local (on processor ordering
    that includes the ghost points) then MatSetValuesLocal() maps those indices to the global
    PETSc ordering.
  */
  if (!da->prealloc_only) {
    ierr = PetscCalloc1(maxcnt,&values);CHKERRQ(ierr);
    for (i=xs; i<xs+nx; i++) {

      pstart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
      pend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));

      for (j=ys; j<ys+ny; j++) {
        slot = i - gxs + gnx*(j - gys);

        lstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
        lend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));

        for (k=0; k<nc; k++) {
          cnt = 0;
          for (l=lstart; l<lend+1; l++) {
            for (p=pstart; p<pend+1; p++) {
              if (l || p) {
                if ((st == DMDA_STENCIL_BOX) || (!l || !p)) {  /* entries on star */
                  for (ifill_col=ofill[k]; ifill_col<ofill[k+1]; ifill_col++) cols[cnt++] = ofill[ifill_col] + nc*(slot + gnx*l + p);
                }
              } else {
                if (dfill) {
                  for (ifill_col=dfill[k]; ifill_col<dfill[k+1]; ifill_col++) cols[cnt++] = dfill[ifill_col] + nc*(slot + gnx*l + p);
                } else {
                  for (ifill_col=0; ifill_col<nc; ifill_col++) cols[cnt++] = ifill_col + nc*(slot + gnx*l + p);
                }
              }
            }
          }
          row  = k + nc*(slot);
          ierr = MatSetValuesLocal(J,1,&row,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
        }
      }
    }
    ierr = PetscFree(values);CHKERRQ(ierr);
    ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
    ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
    ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr);
  }
  ierr = PetscFree(cols);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

/* ---------------------------------------------------------------------------------*/

/*
   DMCreateMatrix_DA_3d_MPIAIJ - Preallocates the AIJ matrix J with the nonzero pattern implied by the
   stencil of the three-dimensional DMDA da, attaches the DMDA local-to-global mapping to J and, unless
   da->prealloc_only is set, inserts explicit zeros at every stencil location and assembles J.

   Input Parameters:
+  da - the DMDA supplying grid sizes, stencil width/type and boundary types
-  J  - the matrix to preallocate (both the SeqAIJ and MPIAIJ preallocation routines are called)

   Notes:
   Every one of the nc components at a grid point is coupled to all nc components at each stencil point.
   After assembly MAT_NEW_NONZERO_LOCATION_ERR is set on J.
*/
PetscErrorCode DMCreateMatrix_DA_3d_MPIAIJ(DM da,Mat J)
{
  PetscErrorCode         ierr;
  PetscInt               xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny;
  PetscInt               m,n,dim,s,*cols = NULL,k,nc,*rows = NULL,col,cnt,l,p,*dnz = NULL,*onz = NULL;
  PetscInt               istart,iend,jstart,jend,kstart,kend,zs,nz,gzs,gnz,ii,jj,kk,M,N,P;
  MPI_Comm               comm;
  PetscScalar            *values;
  DMBoundaryType         bx,by,bz;
  ISLocalToGlobalMapping ltog;
  DMDAStencilType        st;
  PetscBool              removedups = PETSC_FALSE;

  PetscFunctionBegin;
  /*
         nc - number of components per grid point
         col - number of colors needed in one direction for single component problem

  */
  ierr = DMDAGetInfo(da,&dim,&m,&n,&p,&M,&N,&P,&nc,&s,&bx,&by,&bz,&st);CHKERRQ(ierr);
  col  = 2*s + 1;

  /*
       With one processor in periodic domains in a skinny dimension the code will label nonzero columns multiple times
       because of "wrapping" around the end of the domain hitting an entry already counted in the other direction.
  */
  if (M == 1 && 2*s >= m) removedups = PETSC_TRUE;
  if (N == 1 && 2*s >= n) removedups = PETSC_TRUE;
  if (P == 1 && 2*s >= p) removedups = PETSC_TRUE;

  ierr = DMDAGetCorners(da,&xs,&ys,&zs,&nx,&ny,&nz);CHKERRQ(ierr);
  ierr = DMDAGetGhostCorners(da,&gxs,&gys,&gzs,&gnx,&gny,&gnz);CHKERRQ(ierr);
  ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr);

  ierr = PetscMalloc2(nc,&rows,col*col*col*nc*nc,&cols);CHKERRQ(ierr);
  ierr = DMGetLocalToGlobalMapping(da,&ltog);CHKERRQ(ierr);

  ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr);
  /* determine the matrix preallocation information */
  ierr = MatPreallocateInitialize(comm,nc*nx*ny*nz,nc*nx*ny*nz,dnz,onz);CHKERRQ(ierr);
  for (i=xs; i<xs+nx; i++) {
    /* stencil extent in each direction; clipped at the physical boundary unless periodic */
    istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
    iend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
    for (j=ys; j<ys+ny; j++) {
      jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
      jend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
      for (k=zs; k<zs+nz; k++) {
        kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k));
        kend   = (bz == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,p-k-1));

        /* index of grid point (i,j,k) in the ghosted local ordering */
        slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs);

        cnt = 0;
        for (l=0; l<nc; l++) {
          for (ii=istart; ii<iend+1; ii++) {
            for (jj=jstart; jj<jend+1; jj++) {
              for (kk=kstart; kk<kend+1; kk++) {
                if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/
                  cols[cnt++] = l + nc*(slot + ii + gnx*jj + gnx*gny*kk);
                }
              }
            }
          }
          rows[l] = l + nc*(slot);
        }
        if (removedups) {
          ierr = MatPreallocateSetLocalRemoveDups(ltog,nc,rows,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr);
        } else {
          ierr = MatPreallocateSetLocal(ltog,nc,rows,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr);
        }
      }
    }
  }
  ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr);
  ierr = MatSeqAIJSetPreallocation(J,0,dnz);CHKERRQ(ierr);
  ierr = MatMPIAIJSetPreallocation(J,0,dnz,0,onz);CHKERRQ(ierr);
  ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr);
  ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr);

  /*
    For each node in the grid: we get the neighbors in the local (on processor ordering
    that includes the ghost points) then MatSetValuesLocal() maps those indices to the global
    PETSc ordering.
  */
  if (!da->prealloc_only) {
    /* nc rows times at most col*col*col*nc columns are inserted per grid point */
    ierr = PetscCalloc1(col*col*col*nc*nc,&values);CHKERRQ(ierr);
    for (i=xs; i<xs+nx; i++) {
      istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
      iend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
      for (j=ys; j<ys+ny; j++) {
        jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
        jend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
        for (k=zs; k<zs+nz; k++) {
          kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k));
          kend   = (bz == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,p-k-1));

          slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs);

          cnt = 0;
          for (l=0; l<nc; l++) {
            for (ii=istart; ii<iend+1; ii++) {
              for (jj=jstart; jj<jend+1; jj++) {
                for (kk=kstart; kk<kend+1; kk++) {
                  if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/
                    cols[cnt++] = l + nc*(slot + ii + gnx*jj + gnx*gny*kk);
                  }
                }
              }
            }
            rows[l] = l + nc*(slot);
          }
          ierr = MatSetValuesLocal(J,nc,rows,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
        }
      }
    }
    ierr = PetscFree(values);CHKERRQ(ierr);
    ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
    ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
    ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr);
  }
  ierr = PetscFree2(rows,cols);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

/* ---------------------------------------------------------------------------------*/

/*
   DMCreateMatrix_DA_1d_MPIAIJ_Fill - Preallocates the AIJ matrix J for the one-dimensional DMDA da using
   the component fill patterns stored in the DM_DA data (dd->dfill within a grid point, dd->ofill towards
   the neighboring grid points) and, unless da->prealloc_only is set, inserts explicit zeros at those
   locations and assembles J.

   Input Parameters:
+  da - the DMDA supplying the grid size, stencil width and fill patterns
-  J  - the matrix to preallocate (both the SeqAIJ and MPIAIJ preallocation routines are called)

   Notes:
   Periodic boundaries are rejected with PETSC_ERR_SUP.

   A fill array is read as compressed rows: fill[j] .. fill[j+1]-1 index the entries belonging to
   component j and each such entry is the index of a coupled component. A NULL dfill means that all nc
   components at a grid point are coupled; this is honored both when counting and when inserting.
   ofill is dereferenced unconditionally.
   NOTE(review): presumably this routine is only selected when ofill has been set - confirm at the caller.

   Row lengths are derived per grid point from the number of neighbors that actually exist inside
   0..m-1 and from how many of them fall into the locally owned range xs..xs+nx-1. This keeps the counts
   inside the nx*nc sized work arrays for every nx (including nx < 2*s) and makes the inserted pattern
   agree with the preallocated counts on the first and last process for s > 1.

   Columns are inserted with MatSetValues() using global indices of the form (grid index)*nc + component.
*/
PetscErrorCode DMCreateMatrix_DA_1d_MPIAIJ_Fill(DM da,Mat J)
{
  PetscErrorCode         ierr;
  DM_DA                  *dd = (DM_DA*)da->data;
  PetscInt               xs,nx,i,j,row,k,l;
  PetscInt               m,dim,s,*cols = NULL,nc,cnt,maxcnt = 0,*ocols;
  PetscInt               nleft,nright,nleftloc,nrightloc,nd,no;
  PetscInt               *ofill = dd->ofill,*dfill = dd->dfill;
  PetscScalar            *values;
  DMBoundaryType         bx;
  ISLocalToGlobalMapping ltog;

  PetscFunctionBegin;
  if (dd->bx == DM_BOUNDARY_PERIODIC) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"With fill provided not implemented with periodic boundary conditions");

  /*
         nc - number of components per grid point

  */
  ierr = DMDAGetInfo(da,&dim,&m,0,0,0,0,0,&nc,&s,&bx,0,0,0);CHKERRQ(ierr);
  ierr = DMDAGetCorners(da,&xs,0,0,&nx,0,0);CHKERRQ(ierr);

  ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr);
  ierr = PetscCalloc2(nx*nc,&cols,nx*nc,&ocols);CHKERRQ(ierr);

  /* count, for every locally owned row, the nonzeros in the diagonal (cols) and off-diagonal (ocols) part */
  cnt = 0;
  for (i=xs; i<xs+nx; i++) {
    nleft     = PetscMin(s,i);                 /* neighbors to the left that lie inside the domain */
    nright    = PetscMin(s,m-1-i);             /* neighbors to the right that lie inside the domain */
    nleftloc  = PetscMin(nleft,i-xs);          /* ... of which this many are locally owned */
    nrightloc = PetscMin(nright,xs+nx-1-i);
    for (j=0; j<nc; j++) {
      no         = ofill[j+1] - ofill[j];
      nd         = dfill ? dfill[j+1] - dfill[j] : nc;
      cols[cnt]  = nd + (nleftloc + nrightloc)*no;
      ocols[cnt] = (nleft - nleftloc + nright - nrightloc)*no;
      maxcnt     = PetscMax(maxcnt,ocols[cnt]+cols[cnt]);
      cnt++;
    }
  }

  ierr = MatSeqAIJSetPreallocation(J,0,cols);CHKERRQ(ierr);
  ierr = MatMPIAIJSetPreallocation(J,0,cols,0,ocols);CHKERRQ(ierr);
  ierr = PetscFree2(cols,ocols);CHKERRQ(ierr);

  ierr = DMGetLocalToGlobalMapping(da,&ltog);CHKERRQ(ierr);
  ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr);

  /*
    For each node in the grid: the columns of its neighbors are generated directly in the global
    ordering and inserted with MatSetValues().
  */
  if (!da->prealloc_only) {
    /* maxcnt is the longest row counted above, so one row of columns/zeros always fits */
    ierr = PetscCalloc2(maxcnt,&values,maxcnt,&cols);CHKERRQ(ierr);

    row = xs*nc;
    for (i=xs; i<xs+nx; i++) {
      for (j=0; j<nc; j++) {
        cnt = 0;
        /* neighbors to the left, nearest last */
        for (l=PetscMax(i-s,0); l<i; l++) {
          for (k=ofill[j]; k<ofill[j+1]; k++) cols[cnt++] = l*nc + ofill[k];
        }
        /* the grid point itself */
        if (dfill) {
          for (k=dfill[j]; k<dfill[j+1]; k++) {
            cols[cnt++] = i*nc + dfill[k];
          }
        } else {
          for (k=0; k<nc; k++) {
            cols[cnt++] = i*nc + k;
          }
        }
        /* neighbors to the right, farthest first */
        for (l=PetscMin(i+s,m-1); l>i; l--) {
          for (k=ofill[j]; k<ofill[j+1]; k++) cols[cnt++] = l*nc + ofill[k];
        }
        ierr = MatSetValues(J,1,&row,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
        row++;
      }
    }
    ierr = PetscFree2(values,cols);CHKERRQ(ierr);
    ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
    ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
    ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr);
  }
  PetscFunctionReturn(0);
}

/* ---------------------------------------------------------------------------------*/

/*
   DMCreateMatrix_DA_1d_MPIAIJ - Preallocates the AIJ matrix J for the one-dimensional DMDA da with
   (2*s+1)*nc nonzeros per row (the same bound is used for the diagonal and the off-diagonal part),
   attaches the DMDA local-to-global mapping to J and, unless da->prealloc_only is set, inserts explicit
   zeros at every stencil location and assembles J.

   Input Parameters:
+  da - the DMDA supplying the stencil width and the number of components
-  J  - the matrix to preallocate (both the SeqAIJ and MPIAIJ preallocation routines are called)

   Notes:
   The stencil of a grid point is clipped to the ghosted local range gxs .. gxs+gnx-1.
   After assembly MAT_NEW_NONZERO_LOCATION_ERR is set on J.
*/
PetscErrorCode DMCreateMatrix_DA_1d_MPIAIJ(DM da,Mat J)
{
  PetscErrorCode         ierr;
  PetscInt               xs,nx,i,i1,slot,gxs,gnx;
  PetscInt               m,dim,s,*cols = NULL,nc,*rows = NULL,col,cnt,l;
  PetscInt               istart,iend;
  PetscScalar            *values;
  DMBoundaryType         bx;
  ISLocalToGlobalMapping ltog;

  PetscFunctionBegin;
  /*
         nc - number of components per grid point
         col - number of colors needed in one direction for single component problem

  */
  ierr = DMDAGetInfo(da,&dim,&m,0,0,0,0,0,&nc,&s,&bx,0,0,0);CHKERRQ(ierr);
  col  = 2*s + 1;

  ierr = DMDAGetCorners(da,&xs,0,0,&nx,0,0);CHKERRQ(ierr);
  ierr = DMDAGetGhostCorners(da,&gxs,0,0,&gnx,0,0);CHKERRQ(ierr);

  ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr);
  ierr = MatSeqAIJSetPreallocation(J,col*nc,0);CHKERRQ(ierr);
  ierr = MatMPIAIJSetPreallocation(J,col*nc,0,col*nc,0);CHKERRQ(ierr);

  ierr = DMGetLocalToGlobalMapping(da,&ltog);CHKERRQ(ierr);
  ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr);

  /*
    For each node in the grid: we get the neighbors in the local (on processor ordering
    that includes the ghost points) then MatSetValuesLocal() maps those indices to the global
    PETSc ordering.
  */
  if (!da->prealloc_only) {
    ierr = PetscMalloc2(nc,&rows,col*nc*nc,&cols);CHKERRQ(ierr);
    ierr = PetscCalloc1(col*nc*nc,&values);CHKERRQ(ierr);
    for (i=xs; i<xs+nx; i++) {
      /* stencil offsets that stay inside the ghosted local range */
      istart = PetscMax(-s,gxs - i);
      iend   = PetscMin(s,gxs + gnx - i - 1);
      slot   = i - gxs;

      cnt = 0;
      for (l=0; l<nc; l++) {
        for (i1=istart; i1<iend+1; i1++) {
          cols[cnt++] = l + nc*(slot + i1);
        }
        rows[l] = l + nc*(slot);
      }
      ierr = MatSetValuesLocal(J,nc,rows,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
    }
    ierr = PetscFree(values);CHKERRQ(ierr);
    ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
    ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
    ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr);
    ierr = PetscFree2(rows,cols);CHKERRQ(ierr);
  }
  PetscFunctionReturn(0);
}

1675950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_2d_MPIBAIJ(DM da,Mat J) 167647c6ae99SBarry Smith { 167747c6ae99SBarry Smith PetscErrorCode ierr; 167847c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny; 167947c6ae99SBarry Smith PetscInt m,n,dim,s,*cols,nc,col,cnt,*dnz,*onz; 168047c6ae99SBarry Smith PetscInt istart,iend,jstart,jend,ii,jj; 168147c6ae99SBarry
Smith MPI_Comm comm; 168247c6ae99SBarry Smith PetscScalar *values; 1683bff4a2f0SMatthew G. Knepley DMBoundaryType bx,by; 1684aa219208SBarry Smith DMDAStencilType st; 168545b6f7e9SBarry Smith ISLocalToGlobalMapping ltog; 168647c6ae99SBarry Smith 168747c6ae99SBarry Smith PetscFunctionBegin; 168847c6ae99SBarry Smith /* 168947c6ae99SBarry Smith nc - number of components per grid point 169047c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 169147c6ae99SBarry Smith */ 16921321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,0,0,0,0,&nc,&s,&bx,&by,0,&st);CHKERRQ(ierr); 169347c6ae99SBarry Smith col = 2*s + 1; 169447c6ae99SBarry Smith 1695aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr); 1696aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr); 169747c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 169847c6ae99SBarry Smith 1699785e854fSJed Brown ierr = PetscMalloc1(col*col*nc*nc,&cols);CHKERRQ(ierr); 170047c6ae99SBarry Smith 17011411c6eeSJed Brown ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 170247c6ae99SBarry Smith 170347c6ae99SBarry Smith /* determine the matrix preallocation information */ 170447c6ae99SBarry Smith ierr = MatPreallocateInitialize(comm,nx*ny,nx*ny,dnz,onz);CHKERRQ(ierr); 170547c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 1706bff4a2f0SMatthew G. Knepley istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 1707bff4a2f0SMatthew G. Knepley iend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 170847c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 1709bff4a2f0SMatthew G. Knepley jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 1710bff4a2f0SMatthew G. Knepley jend = (by == DM_BOUNDARY_PERIODIC) ? 
s : (PetscMin(s,n-j-1)); 171147c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys); 171247c6ae99SBarry Smith 171347c6ae99SBarry Smith /* Find block columns in block row */ 171447c6ae99SBarry Smith cnt = 0; 171547c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 171647c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 1717aa219208SBarry Smith if (st == DMDA_STENCIL_BOX || !ii || !jj) { /* BOX or on the STAR */ 171847c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj; 171947c6ae99SBarry Smith } 172047c6ae99SBarry Smith } 172147c6ae99SBarry Smith } 1722d6e23781SBarry Smith ierr = MatPreallocateSetLocalBlock(ltog,1,&slot,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr); 172347c6ae99SBarry Smith } 172447c6ae99SBarry Smith } 172547c6ae99SBarry Smith ierr = MatSeqBAIJSetPreallocation(J,nc,0,dnz);CHKERRQ(ierr); 172647c6ae99SBarry Smith ierr = MatMPIBAIJSetPreallocation(J,nc,0,dnz,0,onz);CHKERRQ(ierr); 172747c6ae99SBarry Smith ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 172847c6ae99SBarry Smith 1729784ac674SJed Brown ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 173047c6ae99SBarry Smith 173147c6ae99SBarry Smith /* 173247c6ae99SBarry Smith For each node in the grid: we get the neighbors in the local (on processor ordering 173347c6ae99SBarry Smith that includes the ghost points) then MatSetValuesLocal() maps those indices to the global 173447c6ae99SBarry Smith PETSc ordering. 173547c6ae99SBarry Smith */ 1736fcfd50ebSBarry Smith if (!da->prealloc_only) { 17371795a4d1SJed Brown ierr = PetscCalloc1(col*col*nc*nc,&values);CHKERRQ(ierr); 173847c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 1739bff4a2f0SMatthew G. Knepley istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 1740bff4a2f0SMatthew G. Knepley iend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 174147c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 1742bff4a2f0SMatthew G. Knepley jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 1743bff4a2f0SMatthew G. 
Knepley jend = (by == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 174447c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys); 174547c6ae99SBarry Smith cnt = 0; 174647c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 174747c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 1748aa219208SBarry Smith if (st == DMDA_STENCIL_BOX || !ii || !jj) { /* BOX or on the STAR */ 174947c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj; 175047c6ae99SBarry Smith } 175147c6ae99SBarry Smith } 175247c6ae99SBarry Smith } 175347c6ae99SBarry Smith ierr = MatSetValuesBlockedLocal(J,1,&slot,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 175447c6ae99SBarry Smith } 175547c6ae99SBarry Smith } 175647c6ae99SBarry Smith ierr = PetscFree(values);CHKERRQ(ierr); 175747c6ae99SBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 175847c6ae99SBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1759189e4007SBarry Smith ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr); 176047c6ae99SBarry Smith } 176147c6ae99SBarry Smith ierr = PetscFree(cols);CHKERRQ(ierr); 176247c6ae99SBarry Smith PetscFunctionReturn(0); 176347c6ae99SBarry Smith } 176447c6ae99SBarry Smith 1765950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_3d_MPIBAIJ(DM da,Mat J) 176647c6ae99SBarry Smith { 176747c6ae99SBarry Smith PetscErrorCode ierr; 176847c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny; 176947c6ae99SBarry Smith PetscInt m,n,dim,s,*cols,k,nc,col,cnt,p,*dnz,*onz; 177047c6ae99SBarry Smith PetscInt istart,iend,jstart,jend,kstart,kend,zs,nz,gzs,gnz,ii,jj,kk; 177147c6ae99SBarry Smith MPI_Comm comm; 177247c6ae99SBarry Smith PetscScalar *values; 1773bff4a2f0SMatthew G. 
Knepley DMBoundaryType bx,by,bz; 1774aa219208SBarry Smith DMDAStencilType st; 177545b6f7e9SBarry Smith ISLocalToGlobalMapping ltog; 177647c6ae99SBarry Smith 177747c6ae99SBarry Smith PetscFunctionBegin; 177847c6ae99SBarry Smith /* 177947c6ae99SBarry Smith nc - number of components per grid point 178047c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 178147c6ae99SBarry Smith 178247c6ae99SBarry Smith */ 17831321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,&p,0,0,0,&nc,&s,&bx,&by,&bz,&st);CHKERRQ(ierr); 178447c6ae99SBarry Smith col = 2*s + 1; 178547c6ae99SBarry Smith 1786aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,&zs,&nx,&ny,&nz);CHKERRQ(ierr); 1787aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,&gzs,&gnx,&gny,&gnz);CHKERRQ(ierr); 178847c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 178947c6ae99SBarry Smith 1790785e854fSJed Brown ierr = PetscMalloc1(col*col*col,&cols);CHKERRQ(ierr); 179147c6ae99SBarry Smith 17921411c6eeSJed Brown ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 179347c6ae99SBarry Smith 179447c6ae99SBarry Smith /* determine the matrix preallocation information */ 179547c6ae99SBarry Smith ierr = MatPreallocateInitialize(comm,nx*ny*nz,nx*ny*nz,dnz,onz);CHKERRQ(ierr); 179647c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 1797bff4a2f0SMatthew G. Knepley istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 1798bff4a2f0SMatthew G. Knepley iend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 179947c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 1800bff4a2f0SMatthew G. Knepley jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 1801bff4a2f0SMatthew G. Knepley jend = (by == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 180247c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 1803bff4a2f0SMatthew G. Knepley kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k)); 1804bff4a2f0SMatthew G. 
Knepley kend = (bz == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,p-k-1)); 180547c6ae99SBarry Smith 180647c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 180747c6ae99SBarry Smith 180847c6ae99SBarry Smith /* Find block columns in block row */ 180947c6ae99SBarry Smith cnt = 0; 181047c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 181147c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 181247c6ae99SBarry Smith for (kk=kstart; kk<kend+1; kk++) { 1813aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/ 181447c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj + gnx*gny*kk; 181547c6ae99SBarry Smith } 181647c6ae99SBarry Smith } 181747c6ae99SBarry Smith } 181847c6ae99SBarry Smith } 1819d6e23781SBarry Smith ierr = MatPreallocateSetLocalBlock(ltog,1,&slot,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr); 182047c6ae99SBarry Smith } 182147c6ae99SBarry Smith } 182247c6ae99SBarry Smith } 182347c6ae99SBarry Smith ierr = MatSeqBAIJSetPreallocation(J,nc,0,dnz);CHKERRQ(ierr); 182447c6ae99SBarry Smith ierr = MatMPIBAIJSetPreallocation(J,nc,0,dnz,0,onz);CHKERRQ(ierr); 182547c6ae99SBarry Smith ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 182647c6ae99SBarry Smith 1827784ac674SJed Brown ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 182847c6ae99SBarry Smith 182947c6ae99SBarry Smith /* 183047c6ae99SBarry Smith For each node in the grid: we get the neighbors in the local (on processor ordering 183147c6ae99SBarry Smith that includes the ghost points) then MatSetValuesLocal() maps those indices to the global 183247c6ae99SBarry Smith PETSc ordering. 183347c6ae99SBarry Smith */ 1834fcfd50ebSBarry Smith if (!da->prealloc_only) { 18351795a4d1SJed Brown ierr = PetscCalloc1(col*col*col*nc*nc,&values);CHKERRQ(ierr); 183647c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 1837bff4a2f0SMatthew G. Knepley istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 1838bff4a2f0SMatthew G. 
Knepley iend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 183947c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 1840bff4a2f0SMatthew G. Knepley jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 1841bff4a2f0SMatthew G. Knepley jend = (by == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 184247c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 1843bff4a2f0SMatthew G. Knepley kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k)); 1844bff4a2f0SMatthew G. Knepley kend = (bz == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,p-k-1)); 184547c6ae99SBarry Smith 184647c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 184747c6ae99SBarry Smith 184847c6ae99SBarry Smith cnt = 0; 184947c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 185047c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 185147c6ae99SBarry Smith for (kk=kstart; kk<kend+1; kk++) { 1852aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/ 185347c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj + gnx*gny*kk; 185447c6ae99SBarry Smith } 185547c6ae99SBarry Smith } 185647c6ae99SBarry Smith } 185747c6ae99SBarry Smith } 185847c6ae99SBarry Smith ierr = MatSetValuesBlockedLocal(J,1,&slot,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 185947c6ae99SBarry Smith } 186047c6ae99SBarry Smith } 186147c6ae99SBarry Smith } 186247c6ae99SBarry Smith ierr = PetscFree(values);CHKERRQ(ierr); 186347c6ae99SBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 186447c6ae99SBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1865189e4007SBarry Smith ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr); 186647c6ae99SBarry Smith } 186747c6ae99SBarry Smith ierr = PetscFree(cols);CHKERRQ(ierr); 186847c6ae99SBarry Smith PetscFunctionReturn(0); 186947c6ae99SBarry Smith } 187047c6ae99SBarry Smith 187147c6ae99SBarry Smith /* 187247c6ae99SBarry Smith This helper is for 
of SBAIJ preallocation, to discard the lower-triangular values which are difficult to 187347c6ae99SBarry Smith identify in the local ordering with periodic domain. 187447c6ae99SBarry Smith */ 187547c6ae99SBarry Smith static PetscErrorCode L2GFilterUpperTriangular(ISLocalToGlobalMapping ltog,PetscInt *row,PetscInt *cnt,PetscInt col[]) 187647c6ae99SBarry Smith { 187747c6ae99SBarry Smith PetscErrorCode ierr; 187847c6ae99SBarry Smith PetscInt i,n; 187947c6ae99SBarry Smith 188047c6ae99SBarry Smith PetscFunctionBegin; 1881d6e23781SBarry Smith ierr = ISLocalToGlobalMappingApplyBlock(ltog,1,row,row);CHKERRQ(ierr); 1882d6e23781SBarry Smith ierr = ISLocalToGlobalMappingApplyBlock(ltog,*cnt,col,col);CHKERRQ(ierr); 188347c6ae99SBarry Smith for (i=0,n=0; i<*cnt; i++) { 188447c6ae99SBarry Smith if (col[i] >= *row) col[n++] = col[i]; 188547c6ae99SBarry Smith } 188647c6ae99SBarry Smith *cnt = n; 188747c6ae99SBarry Smith PetscFunctionReturn(0); 188847c6ae99SBarry Smith } 188947c6ae99SBarry Smith 1890950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_2d_MPISBAIJ(DM da,Mat J) 189147c6ae99SBarry Smith { 189247c6ae99SBarry Smith PetscErrorCode ierr; 189347c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny; 189447c6ae99SBarry Smith PetscInt m,n,dim,s,*cols,nc,col,cnt,*dnz,*onz; 189547c6ae99SBarry Smith PetscInt istart,iend,jstart,jend,ii,jj; 189647c6ae99SBarry Smith MPI_Comm comm; 189747c6ae99SBarry Smith PetscScalar *values; 1898bff4a2f0SMatthew G. 
Knepley DMBoundaryType bx,by; 1899aa219208SBarry Smith DMDAStencilType st; 190045b6f7e9SBarry Smith ISLocalToGlobalMapping ltog; 190147c6ae99SBarry Smith 190247c6ae99SBarry Smith PetscFunctionBegin; 190347c6ae99SBarry Smith /* 190447c6ae99SBarry Smith nc - number of components per grid point 190547c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 190647c6ae99SBarry Smith */ 19071321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,0,0,0,0,&nc,&s,&bx,&by,0,&st);CHKERRQ(ierr); 190847c6ae99SBarry Smith col = 2*s + 1; 190947c6ae99SBarry Smith 1910aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr); 1911aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr); 191247c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 191347c6ae99SBarry Smith 1914785e854fSJed Brown ierr = PetscMalloc1(col*col*nc*nc,&cols);CHKERRQ(ierr); 191547c6ae99SBarry Smith 19161411c6eeSJed Brown ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 191747c6ae99SBarry Smith 191847c6ae99SBarry Smith /* determine the matrix preallocation information */ 1919eabe889fSLisandro Dalcin ierr = MatPreallocateInitialize(comm,nx*ny,nx*ny,dnz,onz);CHKERRQ(ierr); 192047c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 1921bff4a2f0SMatthew G. Knepley istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 1922bff4a2f0SMatthew G. Knepley iend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 192347c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 1924bff4a2f0SMatthew G. Knepley jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 1925bff4a2f0SMatthew G. Knepley jend = (by == DM_BOUNDARY_PERIODIC) ? 
s : (PetscMin(s,n-j-1)); 192647c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys); 192747c6ae99SBarry Smith 192847c6ae99SBarry Smith /* Find block columns in block row */ 192947c6ae99SBarry Smith cnt = 0; 193047c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 193147c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 1932aa219208SBarry Smith if (st == DMDA_STENCIL_BOX || !ii || !jj) { 193347c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj; 193447c6ae99SBarry Smith } 193547c6ae99SBarry Smith } 193647c6ae99SBarry Smith } 193745b6f7e9SBarry Smith ierr = L2GFilterUpperTriangular(ltog,&slot,&cnt,cols);CHKERRQ(ierr); 1938d6e23781SBarry Smith ierr = MatPreallocateSymmetricSetBlock(slot,cnt,cols,dnz,onz);CHKERRQ(ierr); 193947c6ae99SBarry Smith } 194047c6ae99SBarry Smith } 194147c6ae99SBarry Smith ierr = MatSeqSBAIJSetPreallocation(J,nc,0,dnz);CHKERRQ(ierr); 194247c6ae99SBarry Smith ierr = MatMPISBAIJSetPreallocation(J,nc,0,dnz,0,onz);CHKERRQ(ierr); 194347c6ae99SBarry Smith ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 194447c6ae99SBarry Smith 1945784ac674SJed Brown ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 194647c6ae99SBarry Smith 194747c6ae99SBarry Smith /* 194847c6ae99SBarry Smith For each node in the grid: we get the neighbors in the local (on processor ordering 194947c6ae99SBarry Smith that includes the ghost points) then MatSetValuesLocal() maps those indices to the global 195047c6ae99SBarry Smith PETSc ordering. 195147c6ae99SBarry Smith */ 1952fcfd50ebSBarry Smith if (!da->prealloc_only) { 19531795a4d1SJed Brown ierr = PetscCalloc1(col*col*nc*nc,&values);CHKERRQ(ierr); 195447c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 1955bff4a2f0SMatthew G. Knepley istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 1956bff4a2f0SMatthew G. Knepley iend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 195747c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 1958bff4a2f0SMatthew G. Knepley jstart = (by == DM_BOUNDARY_PERIODIC) ? 
-s : (PetscMax(-s,-j)); 1959bff4a2f0SMatthew G. Knepley jend = (by == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 196047c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys); 196147c6ae99SBarry Smith 196247c6ae99SBarry Smith /* Find block columns in block row */ 196347c6ae99SBarry Smith cnt = 0; 196447c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 196547c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 1966aa219208SBarry Smith if (st == DMDA_STENCIL_BOX || !ii || !jj) { 196747c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj; 196847c6ae99SBarry Smith } 196947c6ae99SBarry Smith } 197047c6ae99SBarry Smith } 197145b6f7e9SBarry Smith ierr = L2GFilterUpperTriangular(ltog,&slot,&cnt,cols);CHKERRQ(ierr); 197247c6ae99SBarry Smith ierr = MatSetValuesBlocked(J,1,&slot,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 197347c6ae99SBarry Smith } 197447c6ae99SBarry Smith } 197547c6ae99SBarry Smith ierr = PetscFree(values);CHKERRQ(ierr); 197647c6ae99SBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 197747c6ae99SBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1978189e4007SBarry Smith ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr); 197947c6ae99SBarry Smith } 198047c6ae99SBarry Smith ierr = PetscFree(cols);CHKERRQ(ierr); 198147c6ae99SBarry Smith PetscFunctionReturn(0); 198247c6ae99SBarry Smith } 198347c6ae99SBarry Smith 1984950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_3d_MPISBAIJ(DM da,Mat J) 198547c6ae99SBarry Smith { 198647c6ae99SBarry Smith PetscErrorCode ierr; 198747c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny; 198847c6ae99SBarry Smith PetscInt m,n,dim,s,*cols,k,nc,col,cnt,p,*dnz,*onz; 198947c6ae99SBarry Smith PetscInt istart,iend,jstart,jend,kstart,kend,zs,nz,gzs,gnz,ii,jj,kk; 199047c6ae99SBarry Smith MPI_Comm comm; 199147c6ae99SBarry Smith PetscScalar *values; 1992bff4a2f0SMatthew G. 
Knepley DMBoundaryType bx,by,bz; 1993aa219208SBarry Smith DMDAStencilType st; 199445b6f7e9SBarry Smith ISLocalToGlobalMapping ltog; 199547c6ae99SBarry Smith 199647c6ae99SBarry Smith PetscFunctionBegin; 199747c6ae99SBarry Smith /* 199847c6ae99SBarry Smith nc - number of components per grid point 199947c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 200047c6ae99SBarry Smith */ 20011321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,&p,0,0,0,&nc,&s,&bx,&by,&bz,&st);CHKERRQ(ierr); 200247c6ae99SBarry Smith col = 2*s + 1; 200347c6ae99SBarry Smith 2004aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,&zs,&nx,&ny,&nz);CHKERRQ(ierr); 2005aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,&gzs,&gnx,&gny,&gnz);CHKERRQ(ierr); 200647c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 200747c6ae99SBarry Smith 200847c6ae99SBarry Smith /* create the matrix */ 2009785e854fSJed Brown ierr = PetscMalloc1(col*col*col,&cols);CHKERRQ(ierr); 201047c6ae99SBarry Smith 20111411c6eeSJed Brown ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 201247c6ae99SBarry Smith 201347c6ae99SBarry Smith /* determine the matrix preallocation information */ 2014eabe889fSLisandro Dalcin ierr = MatPreallocateInitialize(comm,nx*ny*nz,nx*ny*nz,dnz,onz);CHKERRQ(ierr); 201547c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 2016bff4a2f0SMatthew G. Knepley istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 2017bff4a2f0SMatthew G. Knepley iend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 201847c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 2019bff4a2f0SMatthew G. Knepley jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 2020bff4a2f0SMatthew G. Knepley jend = (by == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 202147c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 2022bff4a2f0SMatthew G. Knepley kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k)); 2023bff4a2f0SMatthew G. 
Knepley kend = (bz == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,p-k-1)); 202447c6ae99SBarry Smith 202547c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 202647c6ae99SBarry Smith 202747c6ae99SBarry Smith /* Find block columns in block row */ 202847c6ae99SBarry Smith cnt = 0; 202947c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 203047c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 203147c6ae99SBarry Smith for (kk=kstart; kk<kend+1; kk++) { 2032aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || (!ii && !jj) || (!jj && !kk) || (!ii && !kk)) { 203347c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj + gnx*gny*kk; 203447c6ae99SBarry Smith } 203547c6ae99SBarry Smith } 203647c6ae99SBarry Smith } 203747c6ae99SBarry Smith } 203845b6f7e9SBarry Smith ierr = L2GFilterUpperTriangular(ltog,&slot,&cnt,cols);CHKERRQ(ierr); 2039d6e23781SBarry Smith ierr = MatPreallocateSymmetricSetBlock(slot,cnt,cols,dnz,onz);CHKERRQ(ierr); 204047c6ae99SBarry Smith } 204147c6ae99SBarry Smith } 204247c6ae99SBarry Smith } 204347c6ae99SBarry Smith ierr = MatSeqSBAIJSetPreallocation(J,nc,0,dnz);CHKERRQ(ierr); 204447c6ae99SBarry Smith ierr = MatMPISBAIJSetPreallocation(J,nc,0,dnz,0,onz);CHKERRQ(ierr); 204547c6ae99SBarry Smith ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 204647c6ae99SBarry Smith 2047784ac674SJed Brown ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 204847c6ae99SBarry Smith 204947c6ae99SBarry Smith /* 205047c6ae99SBarry Smith For each node in the grid: we get the neighbors in the local (on processor ordering 205147c6ae99SBarry Smith that includes the ghost points) then MatSetValuesLocal() maps those indices to the global 205247c6ae99SBarry Smith PETSc ordering. 205347c6ae99SBarry Smith */ 2054fcfd50ebSBarry Smith if (!da->prealloc_only) { 20551795a4d1SJed Brown ierr = PetscCalloc1(col*col*col*nc*nc,&values);CHKERRQ(ierr); 205647c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 2057bff4a2f0SMatthew G. 
Knepley istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 2058bff4a2f0SMatthew G. Knepley iend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 205947c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 2060bff4a2f0SMatthew G. Knepley jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 2061bff4a2f0SMatthew G. Knepley jend = (by == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 206247c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 2063bff4a2f0SMatthew G. Knepley kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k)); 2064bff4a2f0SMatthew G. Knepley kend = (bz == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,p-k-1)); 206547c6ae99SBarry Smith 206647c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 206747c6ae99SBarry Smith 206847c6ae99SBarry Smith cnt = 0; 206947c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 207047c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 207147c6ae99SBarry Smith for (kk=kstart; kk<kend+1; kk++) { 2072aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || (!ii && !jj) || (!jj && !kk) || (!ii && !kk)) { 207347c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj + gnx*gny*kk; 207447c6ae99SBarry Smith } 207547c6ae99SBarry Smith } 207647c6ae99SBarry Smith } 207747c6ae99SBarry Smith } 207845b6f7e9SBarry Smith ierr = L2GFilterUpperTriangular(ltog,&slot,&cnt,cols);CHKERRQ(ierr); 207947c6ae99SBarry Smith ierr = MatSetValuesBlocked(J,1,&slot,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 208047c6ae99SBarry Smith } 208147c6ae99SBarry Smith } 208247c6ae99SBarry Smith } 208347c6ae99SBarry Smith ierr = PetscFree(values);CHKERRQ(ierr); 208447c6ae99SBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 208547c6ae99SBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2086189e4007SBarry Smith ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr); 208747c6ae99SBarry Smith } 208847c6ae99SBarry Smith ierr = PetscFree(cols);CHKERRQ(ierr); 
208947c6ae99SBarry Smith PetscFunctionReturn(0); 209047c6ae99SBarry Smith } 209147c6ae99SBarry Smith 209247c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/ 209347c6ae99SBarry Smith 2094950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_3d_MPIAIJ_Fill(DM da,Mat J) 209547c6ae99SBarry Smith { 209647c6ae99SBarry Smith PetscErrorCode ierr; 209747c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny; 2098c0ab637bSBarry Smith PetscInt m,n,dim,s,*cols,k,nc,row,col,cnt, maxcnt = 0,l,p,*dnz,*onz; 2099c1154cd5SBarry Smith PetscInt istart,iend,jstart,jend,kstart,kend,zs,nz,gzs,gnz,ii,jj,kk,M,N,P; 210047c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 210147c6ae99SBarry Smith PetscInt ifill_col,*dfill = dd->dfill,*ofill = dd->ofill; 210247c6ae99SBarry Smith MPI_Comm comm; 210347c6ae99SBarry Smith PetscScalar *values; 2104bff4a2f0SMatthew G. Knepley DMBoundaryType bx,by,bz; 210545b6f7e9SBarry Smith ISLocalToGlobalMapping ltog; 2106aa219208SBarry Smith DMDAStencilType st; 2107c1154cd5SBarry Smith PetscBool removedups = PETSC_FALSE; 210847c6ae99SBarry Smith 210947c6ae99SBarry Smith PetscFunctionBegin; 211047c6ae99SBarry Smith /* 211147c6ae99SBarry Smith nc - number of components per grid point 211247c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 211347c6ae99SBarry Smith 211447c6ae99SBarry Smith */ 2115c1154cd5SBarry Smith ierr = DMDAGetInfo(da,&dim,&m,&n,&p,&M,&N,&P,&nc,&s,&bx,&by,&bz,&st);CHKERRQ(ierr); 211647c6ae99SBarry Smith col = 2*s + 1; 2117bff4a2f0SMatthew G. Knepley if (bx == DM_BOUNDARY_PERIODIC && (m % col)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in X is divisible\n\ 211847c6ae99SBarry Smith by 2*stencil_width + 1\n"); 2119bff4a2f0SMatthew G. 
Knepley if (by == DM_BOUNDARY_PERIODIC && (n % col)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Y is divisible\n\ 212047c6ae99SBarry Smith by 2*stencil_width + 1\n"); 2121bff4a2f0SMatthew G. Knepley if (bz == DM_BOUNDARY_PERIODIC && (p % col)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Z is divisible\n\ 212247c6ae99SBarry Smith by 2*stencil_width + 1\n"); 212347c6ae99SBarry Smith 2124c1154cd5SBarry Smith /* 2125c1154cd5SBarry Smith With one processor in periodic domains in a skinny dimension the code will label nonzero columns multiple times 2126c1154cd5SBarry Smith because of "wrapping" around the end of the domain hitting an entry already counted in the other direction. 2127c1154cd5SBarry Smith */ 2128c1154cd5SBarry Smith if (M == 1 && 2*s >= m) removedups = PETSC_TRUE; 2129c1154cd5SBarry Smith if (N == 1 && 2*s >= n) removedups = PETSC_TRUE; 2130c1154cd5SBarry Smith if (P == 1 && 2*s >= p) removedups = PETSC_TRUE; 2131c1154cd5SBarry Smith 2132aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,&zs,&nx,&ny,&nz);CHKERRQ(ierr); 2133aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,&gzs,&gnx,&gny,&gnz);CHKERRQ(ierr); 213447c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 213547c6ae99SBarry Smith 2136785e854fSJed Brown ierr = PetscMalloc1(col*col*col*nc,&cols);CHKERRQ(ierr); 21371411c6eeSJed Brown ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 213847c6ae99SBarry Smith 213947c6ae99SBarry Smith /* determine the matrix preallocation information */ 214047c6ae99SBarry Smith ierr = MatPreallocateInitialize(comm,nc*nx*ny*nz,nc*nx*ny*nz,dnz,onz);CHKERRQ(ierr); 214147c6ae99SBarry Smith 214206ca8cadSBarry Smith ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr); 214347c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 2144bff4a2f0SMatthew G. Knepley istart = (bx == DM_BOUNDARY_PERIODIC) ? 
-s : (PetscMax(-s,-i)); 2145bff4a2f0SMatthew G. Knepley iend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 214647c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 2147bff4a2f0SMatthew G. Knepley jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 2148bff4a2f0SMatthew G. Knepley jend = (by == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 214947c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 2150bff4a2f0SMatthew G. Knepley kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k)); 2151bff4a2f0SMatthew G. Knepley kend = (bz == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,p-k-1)); 215247c6ae99SBarry Smith 215347c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 215447c6ae99SBarry Smith 215547c6ae99SBarry Smith for (l=0; l<nc; l++) { 215647c6ae99SBarry Smith cnt = 0; 215747c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 215847c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 215947c6ae99SBarry Smith for (kk=kstart; kk<kend+1; kk++) { 216047c6ae99SBarry Smith if (ii || jj || kk) { 2161aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/ 21628865f1eaSKarl Rupp for (ifill_col=ofill[l]; ifill_col<ofill[l+1]; ifill_col++) cols[cnt++] = ofill[ifill_col] + nc*(slot + ii + gnx*jj + gnx*gny*kk); 216347c6ae99SBarry Smith } 216447c6ae99SBarry Smith } else { 216547c6ae99SBarry Smith if (dfill) { 21668865f1eaSKarl Rupp for (ifill_col=dfill[l]; ifill_col<dfill[l+1]; ifill_col++) cols[cnt++] = dfill[ifill_col] + nc*(slot + ii + gnx*jj + gnx*gny*kk); 216747c6ae99SBarry Smith } else { 21688865f1eaSKarl Rupp for (ifill_col=0; ifill_col<nc; ifill_col++) cols[cnt++] = ifill_col + nc*(slot + ii + gnx*jj + gnx*gny*kk); 216947c6ae99SBarry Smith } 217047c6ae99SBarry Smith } 217147c6ae99SBarry Smith } 217247c6ae99SBarry Smith } 217347c6ae99SBarry Smith } 217447c6ae99SBarry Smith row = l + nc*(slot); 2175c0ab637bSBarry Smith maxcnt = PetscMax(maxcnt,cnt); 2176c1154cd5SBarry 
Smith if (removedups) { 2177c1154cd5SBarry Smith ierr = MatPreallocateSetLocalRemoveDups(ltog,1,&row,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr); 2178c1154cd5SBarry Smith } else { 2179784ac674SJed Brown ierr = MatPreallocateSetLocal(ltog,1,&row,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr); 218047c6ae99SBarry Smith } 218147c6ae99SBarry Smith } 218247c6ae99SBarry Smith } 218347c6ae99SBarry Smith } 2184c1154cd5SBarry Smith } 218547c6ae99SBarry Smith ierr = MatSeqAIJSetPreallocation(J,0,dnz);CHKERRQ(ierr); 218647c6ae99SBarry Smith ierr = MatMPIAIJSetPreallocation(J,0,dnz,0,onz);CHKERRQ(ierr); 218747c6ae99SBarry Smith ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 2188784ac674SJed Brown ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 218947c6ae99SBarry Smith 219047c6ae99SBarry Smith /* 219147c6ae99SBarry Smith For each node in the grid: we get the neighbors in the local (on processor ordering 219247c6ae99SBarry Smith that includes the ghost points) then MatSetValuesLocal() maps those indices to the global 219347c6ae99SBarry Smith PETSc ordering. 219447c6ae99SBarry Smith */ 2195fcfd50ebSBarry Smith if (!da->prealloc_only) { 2196c0ab637bSBarry Smith ierr = PetscCalloc1(maxcnt,&values);CHKERRQ(ierr); 219747c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 2198bff4a2f0SMatthew G. Knepley istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 2199bff4a2f0SMatthew G. Knepley iend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 220047c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 2201bff4a2f0SMatthew G. Knepley jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 2202bff4a2f0SMatthew G. Knepley jend = (by == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 220347c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 2204bff4a2f0SMatthew G. Knepley kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k)); 2205bff4a2f0SMatthew G. Knepley kend = (bz == DM_BOUNDARY_PERIODIC) ? 
s : (PetscMin(s,p-k-1)); 220647c6ae99SBarry Smith 220747c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 220847c6ae99SBarry Smith 220947c6ae99SBarry Smith for (l=0; l<nc; l++) { 221047c6ae99SBarry Smith cnt = 0; 221147c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 221247c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 221347c6ae99SBarry Smith for (kk=kstart; kk<kend+1; kk++) { 221447c6ae99SBarry Smith if (ii || jj || kk) { 2215aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/ 22168865f1eaSKarl Rupp for (ifill_col=ofill[l]; ifill_col<ofill[l+1]; ifill_col++) cols[cnt++] = ofill[ifill_col] + nc*(slot + ii + gnx*jj + gnx*gny*kk); 221747c6ae99SBarry Smith } 221847c6ae99SBarry Smith } else { 221947c6ae99SBarry Smith if (dfill) { 22208865f1eaSKarl Rupp for (ifill_col=dfill[l]; ifill_col<dfill[l+1]; ifill_col++) cols[cnt++] = dfill[ifill_col] + nc*(slot + ii + gnx*jj + gnx*gny*kk); 222147c6ae99SBarry Smith } else { 22228865f1eaSKarl Rupp for (ifill_col=0; ifill_col<nc; ifill_col++) cols[cnt++] = ifill_col + nc*(slot + ii + gnx*jj + gnx*gny*kk); 222347c6ae99SBarry Smith } 222447c6ae99SBarry Smith } 222547c6ae99SBarry Smith } 222647c6ae99SBarry Smith } 222747c6ae99SBarry Smith } 222847c6ae99SBarry Smith row = l + nc*(slot); 222947c6ae99SBarry Smith ierr = MatSetValuesLocal(J,1,&row,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 223047c6ae99SBarry Smith } 223147c6ae99SBarry Smith } 223247c6ae99SBarry Smith } 223347c6ae99SBarry Smith } 223447c6ae99SBarry Smith ierr = PetscFree(values);CHKERRQ(ierr); 223547c6ae99SBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 223647c6ae99SBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2237189e4007SBarry Smith ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr); 223847c6ae99SBarry Smith } 223947c6ae99SBarry Smith ierr = PetscFree(cols);CHKERRQ(ierr); 
224047c6ae99SBarry Smith PetscFunctionReturn(0); 224147c6ae99SBarry Smith } 2242