147c6ae99SBarry Smith 24035e84dSBarry Smith #include <petsc-private/dmdaimpl.h> /*I "petscdmda.h" I*/ 307475bc1SBarry Smith #include <petscmat.h> 4b45d2f2cSJed Brown #include <petsc-private/matimpl.h> 547c6ae99SBarry Smith 6e727c939SJed Brown extern PetscErrorCode DMCreateColoring_DA_1d_MPIAIJ(DM,ISColoringType,ISColoring*); 7e727c939SJed Brown extern PetscErrorCode DMCreateColoring_DA_2d_MPIAIJ(DM,ISColoringType,ISColoring*); 8e727c939SJed Brown extern PetscErrorCode DMCreateColoring_DA_2d_5pt_MPIAIJ(DM,ISColoringType,ISColoring*); 9e727c939SJed Brown extern PetscErrorCode DMCreateColoring_DA_3d_MPIAIJ(DM,ISColoringType,ISColoring*); 1047c6ae99SBarry Smith 1147c6ae99SBarry Smith /* 1247c6ae99SBarry Smith For ghost i that may be negative or greater than the upper bound this 1347c6ae99SBarry Smith maps it into the 0:m-1 range using periodicity 1447c6ae99SBarry Smith */ 1547c6ae99SBarry Smith #define SetInRange(i,m) ((i < 0) ? m+i : ((i >= m) ? i-m : i)) 1647c6ae99SBarry Smith 1747c6ae99SBarry Smith #undef __FUNCT__ 18aa219208SBarry Smith #define __FUNCT__ "DMDASetBlockFills_Private" 19ce308e1dSBarry Smith static PetscErrorCode DMDASetBlockFills_Private(const PetscInt *dfill,PetscInt w,PetscInt **rfill) 2047c6ae99SBarry Smith { 2147c6ae99SBarry Smith PetscErrorCode ierr; 2247c6ae99SBarry Smith PetscInt i,j,nz,*fill; 2347c6ae99SBarry Smith 2447c6ae99SBarry Smith PetscFunctionBegin; 2547c6ae99SBarry Smith if (!dfill) PetscFunctionReturn(0); 2647c6ae99SBarry Smith 2747c6ae99SBarry Smith /* count number nonzeros */ 2847c6ae99SBarry Smith nz = 0; 2947c6ae99SBarry Smith for (i=0; i<w; i++) { 3047c6ae99SBarry Smith for (j=0; j<w; j++) { 3147c6ae99SBarry Smith if (dfill[w*i+j]) nz++; 3247c6ae99SBarry Smith } 3347c6ae99SBarry Smith } 3447c6ae99SBarry Smith ierr = PetscMalloc((nz + w + 1)*sizeof(PetscInt),&fill);CHKERRQ(ierr); 3547c6ae99SBarry Smith /* construct modified CSR storage of nonzero structure */ 36ce308e1dSBarry Smith /* fill[0 -- w] marks starts of each row of column indices (and end of last row) 37ce308e1dSBarry Smith so fill[1] - fill[0] gives number of nonzeros in first row etc */ 3847c6ae99SBarry Smith nz = w + 1; 3947c6ae99SBarry Smith for (i=0; i<w; i++) { 4047c6ae99SBarry Smith fill[i] = nz; 4147c6ae99SBarry Smith for (j=0; j<w; j++) { 4247c6ae99SBarry Smith if (dfill[w*i+j]) { 4347c6ae99SBarry Smith fill[nz] = j; 4447c6ae99SBarry Smith nz++; 4547c6ae99SBarry Smith } 4647c6ae99SBarry Smith } 4747c6ae99SBarry Smith } 4847c6ae99SBarry Smith fill[w] = nz; 4947c6ae99SBarry Smith 5047c6ae99SBarry Smith *rfill = fill; 5147c6ae99SBarry Smith PetscFunctionReturn(0); 5247c6ae99SBarry Smith } 5347c6ae99SBarry Smith 5447c6ae99SBarry Smith #undef __FUNCT__ 55aa219208SBarry Smith #define __FUNCT__ "DMDASetBlockFills" 5647c6ae99SBarry Smith /*@ 57aa219208SBarry Smith DMDASetBlockFills - Sets the fill pattern in each block for a multi-component problem 58950540a4SJed Brown of the matrix returned by DMCreateMatrix(). 5947c6ae99SBarry Smith 60aa219208SBarry Smith Logically Collective on DMDA 6147c6ae99SBarry Smith 6247c6ae99SBarry Smith Input Parameter: 6347c6ae99SBarry Smith + da - the distributed array 640298fd71SBarry Smith . dfill - the fill pattern in the diagonal block (may be NULL, means use dense block) 6547c6ae99SBarry Smith - ofill - the fill pattern in the off-diagonal blocks 6647c6ae99SBarry Smith 6747c6ae99SBarry Smith 6847c6ae99SBarry Smith Level: developer 6947c6ae99SBarry Smith 7047c6ae99SBarry Smith Notes: This only makes sense when you are doing multicomponent problems but using the 7147c6ae99SBarry Smith MPIAIJ matrix format 7247c6ae99SBarry Smith 7347c6ae99SBarry Smith The format for dfill and ofill is a 2 dimensional dof by dof matrix with 1 entries 7447c6ae99SBarry Smith representing coupling and 0 entries for missing coupling. For example 7547c6ae99SBarry Smith $ dfill[9] = {1, 0, 0, 7647c6ae99SBarry Smith $ 1, 1, 0, 7747c6ae99SBarry Smith $ 0, 1, 1} 7847c6ae99SBarry Smith means that row 0 is coupled with only itself in the diagonal block, row 1 is coupled with 7947c6ae99SBarry Smith itself and row 0 (in the diagonal block) and row 2 is coupled with itself and row 1 (in the 8047c6ae99SBarry Smith diagonal block). 8147c6ae99SBarry Smith 82aa219208SBarry Smith DMDASetGetMatrix() allows you to provide general code for those more complicated nonzero patterns then 8347c6ae99SBarry Smith can be represented in the dfill, ofill format 8447c6ae99SBarry Smith 8547c6ae99SBarry Smith Contributed by Glenn Hammond 8647c6ae99SBarry Smith 878ddb5d8bSBarry Smith .seealso DMCreateMatrix(), DMDASetGetMatrix(), DMSetMatrixPreallocateOnly() 8847c6ae99SBarry Smith 8947c6ae99SBarry Smith @*/ 90ce308e1dSBarry Smith PetscErrorCode DMDASetBlockFills(DM da,const PetscInt *dfill,const PetscInt *ofill) 9147c6ae99SBarry Smith { 9247c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 9347c6ae99SBarry Smith PetscErrorCode ierr; 94ae4f298aSBarry Smith PetscInt i,k,cnt = 1; 9547c6ae99SBarry Smith 9647c6ae99SBarry Smith PetscFunctionBegin; 97aa219208SBarry Smith ierr = DMDASetBlockFills_Private(dfill,dd->w,&dd->dfill);CHKERRQ(ierr); 98aa219208SBarry Smith ierr = DMDASetBlockFills_Private(ofill,dd->w,&dd->ofill);CHKERRQ(ierr); 99ae4f298aSBarry Smith 100ae4f298aSBarry Smith /* ofillcount tracks the columns of ofill that have any nonzero in thems; the value in each location is the number of 101ae4f298aSBarry Smith columns to the left with any nonzeros in them plus 1 */ 102ae4f298aSBarry Smith ierr = PetscMalloc(dd->w*sizeof(PetscBool),&dd->ofillcols);CHKERRQ(ierr); 103ae4f298aSBarry Smith ierr = PetscMemzero(dd->ofillcols,dd->w*sizeof(PetscBool));CHKERRQ(ierr); 104ae4f298aSBarry Smith for (i=0; i<dd->w; i++) { 105ae4f298aSBarry Smith for (k=dd->ofill[i]; k<dd->ofill[i+1]; k++) dd->ofillcols[dd->ofill[k]] = 1; 106ae4f298aSBarry Smith } 107ae4f298aSBarry Smith for (i=0; i<dd->w; i++) { 108ae4f298aSBarry Smith if (dd->ofillcols[i]) { 109ae4f298aSBarry Smith dd->ofillcols[i] = cnt++; 110ae4f298aSBarry Smith } 111ae4f298aSBarry Smith } 11247c6ae99SBarry Smith PetscFunctionReturn(0); 11347c6ae99SBarry Smith } 11447c6ae99SBarry Smith 11547c6ae99SBarry Smith 11647c6ae99SBarry Smith #undef __FUNCT__ 117e727c939SJed Brown #define __FUNCT__ "DMCreateColoring_DA" 11819fd82e9SBarry Smith PetscErrorCode DMCreateColoring_DA(DM da,ISColoringType ctype,MatType mtype,ISColoring *coloring) 11947c6ae99SBarry Smith { 12047c6ae99SBarry Smith PetscErrorCode ierr; 12147c6ae99SBarry Smith PetscInt dim,m,n,p,nc; 1221321219cSEthan Coon DMDABoundaryType bx,by,bz; 12347c6ae99SBarry Smith MPI_Comm comm; 12447c6ae99SBarry Smith PetscMPIInt size; 12547c6ae99SBarry Smith PetscBool isBAIJ; 12647c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 12747c6ae99SBarry Smith 12847c6ae99SBarry Smith PetscFunctionBegin; 12947c6ae99SBarry Smith /* 13047c6ae99SBarry Smith m 13147c6ae99SBarry Smith ------------------------------------------------------ 13247c6ae99SBarry Smith | | 13347c6ae99SBarry Smith | | 13447c6ae99SBarry Smith | ---------------------- | 13547c6ae99SBarry Smith | | | | 13647c6ae99SBarry Smith n | yn | | | 13747c6ae99SBarry Smith | | | | 13847c6ae99SBarry Smith | .--------------------- | 13947c6ae99SBarry Smith | (xs,ys) xn | 14047c6ae99SBarry Smith | . | 14147c6ae99SBarry Smith | (gxs,gys) | 14247c6ae99SBarry Smith | | 14347c6ae99SBarry Smith ----------------------------------------------------- 14447c6ae99SBarry Smith */ 14547c6ae99SBarry Smith 14647c6ae99SBarry Smith /* 14747c6ae99SBarry Smith nc - number of components per grid point 14847c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 14947c6ae99SBarry Smith 15047c6ae99SBarry Smith */ 1511321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,0,0,0,&m,&n,&p,&nc,0,&bx,&by,&bz,0);CHKERRQ(ierr); 15247c6ae99SBarry Smith 15347c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 15447c6ae99SBarry Smith ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 15547c6ae99SBarry Smith if (ctype == IS_COLORING_GHOSTED) { 15647c6ae99SBarry Smith if (size == 1) { 15747c6ae99SBarry Smith ctype = IS_COLORING_GLOBAL; 15847c6ae99SBarry Smith } else if (dim > 1) { 1591321219cSEthan Coon if ((m==1 && bx == DMDA_BOUNDARY_PERIODIC) || (n==1 && by == DMDA_BOUNDARY_PERIODIC) || (p==1 && bz == DMDA_BOUNDARY_PERIODIC)) { 160ce94432eSBarry Smith SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"IS_COLORING_GHOSTED cannot be used for periodic boundary condition having both ends of the domain on the same process"); 16147c6ae99SBarry Smith } 16247c6ae99SBarry Smith } 16347c6ae99SBarry Smith } 16447c6ae99SBarry Smith 165aa219208SBarry Smith /* Tell the DMDA it has 1 degree of freedom per grid point so that the coloring for BAIJ 16647c6ae99SBarry Smith matrices is for the blocks, not the individual matrix elements */ 1674833614aSSatish Balay ierr = PetscStrcmp(mtype,MATBAIJ,&isBAIJ);CHKERRQ(ierr); 1684833614aSSatish Balay if (!isBAIJ) {ierr = PetscStrcmp(mtype,MATMPIBAIJ,&isBAIJ);CHKERRQ(ierr);} 16947c6ae99SBarry Smith if (!isBAIJ) {ierr = PetscStrcmp(mtype,MATSEQBAIJ,&isBAIJ);CHKERRQ(ierr);} 17047c6ae99SBarry Smith if (isBAIJ) { 17147c6ae99SBarry Smith dd->w = 1; 17247c6ae99SBarry Smith dd->xs = dd->xs/nc; 17347c6ae99SBarry Smith dd->xe = dd->xe/nc; 17447c6ae99SBarry Smith dd->Xs = dd->Xs/nc; 17547c6ae99SBarry Smith dd->Xe = dd->Xe/nc; 17647c6ae99SBarry Smith } 17747c6ae99SBarry Smith 17847c6ae99SBarry Smith /* 179aa219208SBarry Smith We do not provide a getcoloring function in the DMDA operations because 180aa219208SBarry Smith the basic DMDA does not know about matrices. We think of DMDA as being more 18147c6ae99SBarry Smith more low-level then matrices. 18247c6ae99SBarry Smith */ 18347c6ae99SBarry Smith if (dim == 1) { 184e727c939SJed Brown ierr = DMCreateColoring_DA_1d_MPIAIJ(da,ctype,coloring);CHKERRQ(ierr); 18547c6ae99SBarry Smith } else if (dim == 2) { 186e727c939SJed Brown ierr = DMCreateColoring_DA_2d_MPIAIJ(da,ctype,coloring);CHKERRQ(ierr); 18747c6ae99SBarry Smith } else if (dim == 3) { 188e727c939SJed Brown ierr = DMCreateColoring_DA_3d_MPIAIJ(da,ctype,coloring);CHKERRQ(ierr); 189ce94432eSBarry Smith } else SETERRQ1(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"Not done for %D dimension, send us mail petsc-maint@mcs.anl.gov for code",dim); 19047c6ae99SBarry Smith if (isBAIJ) { 19147c6ae99SBarry Smith dd->w = nc; 19247c6ae99SBarry Smith dd->xs = dd->xs*nc; 19347c6ae99SBarry Smith dd->xe = dd->xe*nc; 19447c6ae99SBarry Smith dd->Xs = dd->Xs*nc; 19547c6ae99SBarry Smith dd->Xe = dd->Xe*nc; 19647c6ae99SBarry Smith } 19747c6ae99SBarry Smith PetscFunctionReturn(0); 19847c6ae99SBarry Smith } 19947c6ae99SBarry Smith 20047c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/ 20147c6ae99SBarry Smith 20247c6ae99SBarry Smith #undef __FUNCT__ 203e727c939SJed Brown #define __FUNCT__ "DMCreateColoring_DA_2d_MPIAIJ" 204e727c939SJed Brown PetscErrorCode DMCreateColoring_DA_2d_MPIAIJ(DM da,ISColoringType ctype,ISColoring *coloring) 20547c6ae99SBarry Smith { 20647c6ae99SBarry Smith PetscErrorCode ierr; 20747c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,ii,gxs,gys,gnx,gny,m,n,M,N,dim,s,k,nc,col; 20847c6ae99SBarry Smith PetscInt ncolors; 20947c6ae99SBarry Smith MPI_Comm comm; 2101321219cSEthan Coon DMDABoundaryType bx,by; 211aa219208SBarry Smith DMDAStencilType st; 21247c6ae99SBarry Smith ISColoringValue *colors; 21347c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 21447c6ae99SBarry Smith 21547c6ae99SBarry Smith PetscFunctionBegin; 21647c6ae99SBarry Smith /* 21747c6ae99SBarry Smith nc - number of components per grid point 21847c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 21947c6ae99SBarry Smith 22047c6ae99SBarry Smith */ 2211321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,0,&M,&N,0,&nc,&s,&bx,&by,0,&st);CHKERRQ(ierr); 22247c6ae99SBarry Smith col = 2*s + 1; 223aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr); 224aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr); 22547c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 22647c6ae99SBarry Smith 22747c6ae99SBarry Smith /* special case as taught to us by Paul Hovland */ 228aa219208SBarry Smith if (st == DMDA_STENCIL_STAR && s == 1) { 229e727c939SJed Brown ierr = DMCreateColoring_DA_2d_5pt_MPIAIJ(da,ctype,coloring);CHKERRQ(ierr); 23047c6ae99SBarry Smith } else { 23147c6ae99SBarry Smith 232ce94432eSBarry Smith if (bx == DMDA_BOUNDARY_PERIODIC && (m % col)) SETERRQ2(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in X (%d) is divisible\n\ 23347c6ae99SBarry Smith by 2*stencil_width + 1 (%d)\n", m, col); 234ce94432eSBarry Smith if (by == DMDA_BOUNDARY_PERIODIC && (n % col)) SETERRQ2(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Y (%d) is divisible\n\ 23547c6ae99SBarry Smith by 2*stencil_width + 1 (%d)\n", n, col); 23647c6ae99SBarry Smith if (ctype == IS_COLORING_GLOBAL) { 23747c6ae99SBarry Smith if (!dd->localcoloring) { 23847c6ae99SBarry Smith ierr = PetscMalloc(nc*nx*ny*sizeof(ISColoringValue),&colors);CHKERRQ(ierr); 23947c6ae99SBarry Smith ii = 0; 24047c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 24147c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 24247c6ae99SBarry Smith for (k=0; k<nc; k++) { 24347c6ae99SBarry Smith colors[ii++] = k + nc*((i % col) + col*(j % col)); 24447c6ae99SBarry Smith } 24547c6ae99SBarry Smith } 24647c6ae99SBarry Smith } 24747c6ae99SBarry Smith ncolors = nc + nc*(col-1 + col*(col-1)); 24847c6ae99SBarry Smith ierr = ISColoringCreate(comm,ncolors,nc*nx*ny,colors,&dd->localcoloring);CHKERRQ(ierr); 24947c6ae99SBarry Smith } 25047c6ae99SBarry Smith *coloring = dd->localcoloring; 25147c6ae99SBarry Smith } else if (ctype == IS_COLORING_GHOSTED) { 25247c6ae99SBarry Smith if (!dd->ghostedcoloring) { 25347c6ae99SBarry Smith ierr = PetscMalloc(nc*gnx*gny*sizeof(ISColoringValue),&colors);CHKERRQ(ierr); 25447c6ae99SBarry Smith ii = 0; 25547c6ae99SBarry Smith for (j=gys; j<gys+gny; j++) { 25647c6ae99SBarry Smith for (i=gxs; i<gxs+gnx; i++) { 25747c6ae99SBarry Smith for (k=0; k<nc; k++) { 25847c6ae99SBarry Smith /* the complicated stuff is to handle periodic boundaries */ 25947c6ae99SBarry Smith colors[ii++] = k + nc*((SetInRange(i,m) % col) + col*(SetInRange(j,n) % col)); 26047c6ae99SBarry Smith } 26147c6ae99SBarry Smith } 26247c6ae99SBarry Smith } 26347c6ae99SBarry Smith ncolors = nc + nc*(col - 1 + col*(col-1)); 26447c6ae99SBarry Smith ierr = ISColoringCreate(comm,ncolors,nc*gnx*gny,colors,&dd->ghostedcoloring);CHKERRQ(ierr); 26547c6ae99SBarry Smith /* PetscIntView(ncolors,(PetscInt*)colors,0); */ 26647c6ae99SBarry Smith 26747c6ae99SBarry Smith ierr = ISColoringSetType(dd->ghostedcoloring,IS_COLORING_GHOSTED);CHKERRQ(ierr); 26847c6ae99SBarry Smith } 26947c6ae99SBarry Smith *coloring = dd->ghostedcoloring; 270ce94432eSBarry Smith } else SETERRQ1(PetscObjectComm((PetscObject)da),PETSC_ERR_ARG_WRONG,"Unknown ISColoringType %d",(int)ctype); 27147c6ae99SBarry Smith } 27247c6ae99SBarry Smith ierr = ISColoringReference(*coloring);CHKERRQ(ierr); 27347c6ae99SBarry Smith PetscFunctionReturn(0); 27447c6ae99SBarry Smith } 27547c6ae99SBarry Smith 27647c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/ 27747c6ae99SBarry Smith 27847c6ae99SBarry Smith #undef __FUNCT__ 279e727c939SJed Brown #define __FUNCT__ "DMCreateColoring_DA_3d_MPIAIJ" 280e727c939SJed Brown PetscErrorCode DMCreateColoring_DA_3d_MPIAIJ(DM da,ISColoringType ctype,ISColoring *coloring) 28147c6ae99SBarry Smith { 28247c6ae99SBarry Smith PetscErrorCode ierr; 28347c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,gxs,gys,gnx,gny,m,n,p,dim,s,k,nc,col,zs,gzs,ii,l,nz,gnz,M,N,P; 28447c6ae99SBarry Smith PetscInt ncolors; 28547c6ae99SBarry Smith MPI_Comm comm; 2861321219cSEthan Coon DMDABoundaryType bx,by,bz; 287aa219208SBarry Smith DMDAStencilType st; 28847c6ae99SBarry Smith ISColoringValue *colors; 28947c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 29047c6ae99SBarry Smith 29147c6ae99SBarry Smith PetscFunctionBegin; 29247c6ae99SBarry Smith /* 29347c6ae99SBarry Smith nc - number of components per grid point 29447c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 29547c6ae99SBarry Smith 29647c6ae99SBarry Smith */ 2971321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,&p,&M,&N,&P,&nc,&s,&bx,&by,&bz,&st);CHKERRQ(ierr); 29847c6ae99SBarry Smith col = 2*s + 1; 299ce94432eSBarry Smith if (bx == DMDA_BOUNDARY_PERIODIC && (m % col)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in X is divisible\n\ 30047c6ae99SBarry Smith by 2*stencil_width + 1\n"); 301ce94432eSBarry Smith if (by == DMDA_BOUNDARY_PERIODIC && (n % col)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Y is divisible\n\ 30247c6ae99SBarry Smith by 2*stencil_width + 1\n"); 303ce94432eSBarry Smith if (bz == DMDA_BOUNDARY_PERIODIC && (p % col)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Z is divisible\n\ 30447c6ae99SBarry Smith by 2*stencil_width + 1\n"); 30547c6ae99SBarry Smith 306aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,&zs,&nx,&ny,&nz);CHKERRQ(ierr); 307aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,&gzs,&gnx,&gny,&gnz);CHKERRQ(ierr); 30847c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 30947c6ae99SBarry Smith 31047c6ae99SBarry Smith /* create the coloring */ 31147c6ae99SBarry Smith if (ctype == IS_COLORING_GLOBAL) { 31247c6ae99SBarry Smith if (!dd->localcoloring) { 31347c6ae99SBarry Smith ierr = PetscMalloc(nc*nx*ny*nz*sizeof(ISColoringValue),&colors);CHKERRQ(ierr); 31447c6ae99SBarry Smith ii = 0; 31547c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 31647c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 31747c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 31847c6ae99SBarry Smith for (l=0; l<nc; l++) { 31947c6ae99SBarry Smith colors[ii++] = l + nc*((i % col) + col*(j % col) + col*col*(k % col)); 32047c6ae99SBarry Smith } 32147c6ae99SBarry Smith } 32247c6ae99SBarry Smith } 32347c6ae99SBarry Smith } 32447c6ae99SBarry Smith ncolors = nc + nc*(col-1 + col*(col-1)+ col*col*(col-1)); 32547c6ae99SBarry Smith ierr = ISColoringCreate(comm,ncolors,nc*nx*ny*nz,colors,&dd->localcoloring);CHKERRQ(ierr); 32647c6ae99SBarry Smith } 32747c6ae99SBarry Smith *coloring = dd->localcoloring; 32847c6ae99SBarry Smith } else if (ctype == IS_COLORING_GHOSTED) { 32947c6ae99SBarry Smith if (!dd->ghostedcoloring) { 33047c6ae99SBarry Smith ierr = PetscMalloc(nc*gnx*gny*gnz*sizeof(ISColoringValue),&colors);CHKERRQ(ierr); 33147c6ae99SBarry Smith ii = 0; 33247c6ae99SBarry Smith for (k=gzs; k<gzs+gnz; k++) { 33347c6ae99SBarry Smith for (j=gys; j<gys+gny; j++) { 33447c6ae99SBarry Smith for (i=gxs; i<gxs+gnx; i++) { 33547c6ae99SBarry Smith for (l=0; l<nc; l++) { 33647c6ae99SBarry Smith /* the complicated stuff is to handle periodic boundaries */ 33747c6ae99SBarry Smith colors[ii++] = l + nc*((SetInRange(i,m) % col) + col*(SetInRange(j,n) % col) + col*col*(SetInRange(k,p) % col)); 33847c6ae99SBarry Smith } 33947c6ae99SBarry Smith } 34047c6ae99SBarry Smith } 34147c6ae99SBarry Smith } 34247c6ae99SBarry Smith ncolors = nc + nc*(col-1 + col*(col-1)+ col*col*(col-1)); 34347c6ae99SBarry Smith ierr = ISColoringCreate(comm,ncolors,nc*gnx*gny*gnz,colors,&dd->ghostedcoloring);CHKERRQ(ierr); 34447c6ae99SBarry Smith ierr = ISColoringSetType(dd->ghostedcoloring,IS_COLORING_GHOSTED);CHKERRQ(ierr); 34547c6ae99SBarry Smith } 34647c6ae99SBarry Smith *coloring = dd->ghostedcoloring; 347ce94432eSBarry Smith } else SETERRQ1(PetscObjectComm((PetscObject)da),PETSC_ERR_ARG_WRONG,"Unknown ISColoringType %d",(int)ctype); 34847c6ae99SBarry Smith ierr = ISColoringReference(*coloring);CHKERRQ(ierr); 34947c6ae99SBarry Smith PetscFunctionReturn(0); 35047c6ae99SBarry Smith } 35147c6ae99SBarry Smith 35247c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/ 35347c6ae99SBarry Smith 35447c6ae99SBarry Smith #undef __FUNCT__ 355e727c939SJed Brown #define __FUNCT__ "DMCreateColoring_DA_1d_MPIAIJ" 356e727c939SJed Brown PetscErrorCode DMCreateColoring_DA_1d_MPIAIJ(DM da,ISColoringType ctype,ISColoring *coloring) 35747c6ae99SBarry Smith { 35847c6ae99SBarry Smith PetscErrorCode ierr; 35947c6ae99SBarry Smith PetscInt xs,nx,i,i1,gxs,gnx,l,m,M,dim,s,nc,col; 36047c6ae99SBarry Smith PetscInt ncolors; 36147c6ae99SBarry Smith MPI_Comm comm; 3621321219cSEthan Coon DMDABoundaryType bx; 36347c6ae99SBarry Smith ISColoringValue *colors; 36447c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 36547c6ae99SBarry Smith 36647c6ae99SBarry Smith PetscFunctionBegin; 36747c6ae99SBarry Smith /* 36847c6ae99SBarry Smith nc - number of components per grid point 36947c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 37047c6ae99SBarry Smith 37147c6ae99SBarry Smith */ 3721321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,0,0,&M,0,0,&nc,&s,&bx,0,0,0);CHKERRQ(ierr); 37347c6ae99SBarry Smith col = 2*s + 1; 37447c6ae99SBarry Smith 375ce94432eSBarry Smith if (bx == DMDA_BOUNDARY_PERIODIC && (m % col)) SETERRQ2(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points %d is divisible\n\ 37631e6f798SBarry Smith by 2*stencil_width + 1 %d\n",(int)m,(int)col); 37747c6ae99SBarry Smith 378aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,0,0,&nx,0,0);CHKERRQ(ierr); 379aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,0,0,&gnx,0,0);CHKERRQ(ierr); 38047c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 38147c6ae99SBarry Smith 38247c6ae99SBarry Smith /* create the coloring */ 38347c6ae99SBarry Smith if (ctype == IS_COLORING_GLOBAL) { 38447c6ae99SBarry Smith if (!dd->localcoloring) { 38547c6ae99SBarry Smith ierr = PetscMalloc(nc*nx*sizeof(ISColoringValue),&colors);CHKERRQ(ierr); 386ae4f298aSBarry Smith if (dd->ofillcols) { 387ae4f298aSBarry Smith PetscInt tc = 0; 388ae4f298aSBarry Smith for (i=0; i<nc; i++) tc += (PetscInt) (dd->ofillcols[i] > 0); 389ae4f298aSBarry Smith i1 = 0; 390ae4f298aSBarry Smith for (i=xs; i<xs+nx; i++) { 391ae4f298aSBarry Smith for (l=0; l<nc; l++) { 392ae4f298aSBarry Smith if (dd->ofillcols[l] && (i % col)) { 393ae4f298aSBarry Smith colors[i1++] = nc - 1 + tc*((i % col) - 1) + dd->ofillcols[l]; 394ae4f298aSBarry Smith } else { 395ae4f298aSBarry Smith colors[i1++] = l; 396ae4f298aSBarry Smith } 397ae4f298aSBarry Smith } 398ae4f298aSBarry Smith } 399ae4f298aSBarry Smith ncolors = nc + 2*s*tc; 400ae4f298aSBarry Smith } else { 40147c6ae99SBarry Smith i1 = 0; 40247c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 40347c6ae99SBarry Smith for (l=0; l<nc; l++) { 40447c6ae99SBarry Smith colors[i1++] = l + nc*(i % col); 40547c6ae99SBarry Smith } 40647c6ae99SBarry Smith } 40747c6ae99SBarry Smith ncolors = nc + nc*(col-1); 408ae4f298aSBarry Smith } 40947c6ae99SBarry Smith ierr = ISColoringCreate(comm,ncolors,nc*nx,colors,&dd->localcoloring);CHKERRQ(ierr); 41047c6ae99SBarry Smith } 41147c6ae99SBarry Smith *coloring = dd->localcoloring; 41247c6ae99SBarry Smith } else if (ctype == IS_COLORING_GHOSTED) { 41347c6ae99SBarry Smith if (!dd->ghostedcoloring) { 41447c6ae99SBarry Smith ierr = PetscMalloc(nc*gnx*sizeof(ISColoringValue),&colors);CHKERRQ(ierr); 41547c6ae99SBarry Smith i1 = 0; 41647c6ae99SBarry Smith for (i=gxs; i<gxs+gnx; i++) { 41747c6ae99SBarry Smith for (l=0; l<nc; l++) { 41847c6ae99SBarry Smith /* the complicated stuff is to handle periodic boundaries */ 41947c6ae99SBarry Smith colors[i1++] = l + nc*(SetInRange(i,m) % col); 42047c6ae99SBarry Smith } 42147c6ae99SBarry Smith } 42247c6ae99SBarry Smith ncolors = nc + nc*(col-1); 42347c6ae99SBarry Smith ierr = ISColoringCreate(comm,ncolors,nc*gnx,colors,&dd->ghostedcoloring);CHKERRQ(ierr); 42447c6ae99SBarry Smith ierr = ISColoringSetType(dd->ghostedcoloring,IS_COLORING_GHOSTED);CHKERRQ(ierr); 42547c6ae99SBarry Smith } 42647c6ae99SBarry Smith *coloring = dd->ghostedcoloring; 427ce94432eSBarry Smith } else SETERRQ1(PetscObjectComm((PetscObject)da),PETSC_ERR_ARG_WRONG,"Unknown ISColoringType %d",(int)ctype); 42847c6ae99SBarry Smith ierr = ISColoringReference(*coloring);CHKERRQ(ierr); 42947c6ae99SBarry Smith PetscFunctionReturn(0); 43047c6ae99SBarry Smith } 43147c6ae99SBarry Smith 43247c6ae99SBarry Smith #undef __FUNCT__ 433e727c939SJed Brown #define __FUNCT__ "DMCreateColoring_DA_2d_5pt_MPIAIJ" 434e727c939SJed Brown PetscErrorCode DMCreateColoring_DA_2d_5pt_MPIAIJ(DM da,ISColoringType ctype,ISColoring *coloring) 43547c6ae99SBarry Smith { 43647c6ae99SBarry Smith PetscErrorCode ierr; 43747c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,ii,gxs,gys,gnx,gny,m,n,dim,s,k,nc; 43847c6ae99SBarry Smith PetscInt ncolors; 43947c6ae99SBarry Smith MPI_Comm comm; 4401321219cSEthan Coon DMDABoundaryType bx,by; 44147c6ae99SBarry Smith ISColoringValue *colors; 44247c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 44347c6ae99SBarry Smith 44447c6ae99SBarry Smith PetscFunctionBegin; 44547c6ae99SBarry Smith /* 44647c6ae99SBarry Smith nc - number of components per grid point 44747c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 44847c6ae99SBarry Smith 44947c6ae99SBarry Smith */ 4501321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,0,0,0,0,&nc,&s,&bx,&by,0,0);CHKERRQ(ierr); 451aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr); 452aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr); 45347c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 45447c6ae99SBarry Smith 455ce94432eSBarry Smith if (bx == DMDA_BOUNDARY_PERIODIC && (m % 5)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in X is divisible by 5\n"); 456ce94432eSBarry Smith if (by == DMDA_BOUNDARY_PERIODIC && (n % 5)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Y is divisible by 5\n"); 45747c6ae99SBarry Smith 45847c6ae99SBarry Smith /* create the coloring */ 45947c6ae99SBarry Smith if (ctype == IS_COLORING_GLOBAL) { 46047c6ae99SBarry Smith if (!dd->localcoloring) { 46147c6ae99SBarry Smith ierr = PetscMalloc(nc*nx*ny*sizeof(ISColoringValue),&colors);CHKERRQ(ierr); 46247c6ae99SBarry Smith ii = 0; 46347c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 46447c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 46547c6ae99SBarry Smith for (k=0; k<nc; k++) { 46647c6ae99SBarry Smith colors[ii++] = k + nc*((3*j+i) % 5); 46747c6ae99SBarry Smith } 46847c6ae99SBarry Smith } 46947c6ae99SBarry Smith } 47047c6ae99SBarry Smith ncolors = 5*nc; 47147c6ae99SBarry Smith ierr = ISColoringCreate(comm,ncolors,nc*nx*ny,colors,&dd->localcoloring);CHKERRQ(ierr); 47247c6ae99SBarry Smith } 47347c6ae99SBarry Smith *coloring = dd->localcoloring; 47447c6ae99SBarry Smith } else if (ctype == IS_COLORING_GHOSTED) { 47547c6ae99SBarry Smith if (!dd->ghostedcoloring) { 47647c6ae99SBarry Smith ierr = PetscMalloc(nc*gnx*gny*sizeof(ISColoringValue),&colors);CHKERRQ(ierr); 47747c6ae99SBarry Smith ii = 0; 47847c6ae99SBarry Smith for (j=gys; j<gys+gny; j++) { 47947c6ae99SBarry Smith for (i=gxs; i<gxs+gnx; i++) { 48047c6ae99SBarry Smith for (k=0; k<nc; k++) { 48147c6ae99SBarry Smith colors[ii++] = k + nc*((3*SetInRange(j,n) + SetInRange(i,m)) % 5); 48247c6ae99SBarry Smith } 48347c6ae99SBarry Smith } 48447c6ae99SBarry Smith } 48547c6ae99SBarry Smith ncolors = 5*nc; 48647c6ae99SBarry Smith ierr = ISColoringCreate(comm,ncolors,nc*gnx*gny,colors,&dd->ghostedcoloring);CHKERRQ(ierr); 48747c6ae99SBarry Smith ierr = ISColoringSetType(dd->ghostedcoloring,IS_COLORING_GHOSTED);CHKERRQ(ierr); 48847c6ae99SBarry Smith } 48947c6ae99SBarry Smith *coloring = dd->ghostedcoloring; 490ce94432eSBarry Smith } else SETERRQ1(PetscObjectComm((PetscObject)da),PETSC_ERR_ARG_WRONG,"Unknown ISColoringType %d",(int)ctype); 49147c6ae99SBarry Smith PetscFunctionReturn(0); 49247c6ae99SBarry Smith } 49347c6ae99SBarry Smith 49447c6ae99SBarry Smith /* =========================================================================== */ 495950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_1d_MPIAIJ(DM,Mat); 496ce308e1dSBarry Smith extern PetscErrorCode DMCreateMatrix_DA_1d_MPIAIJ_Fill(DM,Mat); 497950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_2d_MPIAIJ(DM,Mat); 498950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_2d_MPIAIJ_Fill(DM,Mat); 499950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_3d_MPIAIJ(DM,Mat); 500950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_3d_MPIAIJ_Fill(DM,Mat); 501950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_2d_MPIBAIJ(DM,Mat); 502950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_3d_MPIBAIJ(DM,Mat); 503950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_2d_MPISBAIJ(DM,Mat); 504950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_3d_MPISBAIJ(DM,Mat); 50547c6ae99SBarry Smith 50647c6ae99SBarry Smith #undef __FUNCT__ 507c688c046SMatthew G Knepley #define __FUNCT__ "MatSetupDM" 5088bbdbebaSMatthew G Knepley /*@C 509c688c046SMatthew G Knepley MatSetupDM - Sets the DMDA that is to be used by the HYPRE_StructMatrix PETSc matrix 51047c6ae99SBarry Smith 51147c6ae99SBarry Smith Logically Collective on Mat 51247c6ae99SBarry Smith 51347c6ae99SBarry Smith Input Parameters: 51447c6ae99SBarry Smith + mat - the matrix 51547c6ae99SBarry Smith - da - the da 51647c6ae99SBarry Smith 51747c6ae99SBarry Smith Level: intermediate 51847c6ae99SBarry Smith 51947c6ae99SBarry Smith @*/ 520c688c046SMatthew G Knepley PetscErrorCode MatSetupDM(Mat mat,DM da) 52147c6ae99SBarry Smith { 52247c6ae99SBarry Smith PetscErrorCode ierr; 52347c6ae99SBarry Smith 52447c6ae99SBarry Smith PetscFunctionBegin; 52547c6ae99SBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 52647c6ae99SBarry Smith PetscValidHeaderSpecific(da,DM_CLASSID,1); 527c688c046SMatthew G Knepley ierr = PetscTryMethod(mat,"MatSetupDM_C",(Mat,DM),(mat,da));CHKERRQ(ierr); 52847c6ae99SBarry Smith PetscFunctionReturn(0); 52947c6ae99SBarry Smith } 53047c6ae99SBarry Smith 53147c6ae99SBarry Smith #undef __FUNCT__ 53247c6ae99SBarry Smith #define __FUNCT__ "MatView_MPI_DA" 5337087cfbeSBarry Smith PetscErrorCode MatView_MPI_DA(Mat A,PetscViewer viewer) 53447c6ae99SBarry Smith { 5359a42bb27SBarry Smith DM da; 53647c6ae99SBarry Smith PetscErrorCode ierr; 53747c6ae99SBarry Smith const char *prefix; 53847c6ae99SBarry Smith Mat Anatural; 53947c6ae99SBarry Smith AO ao; 54047c6ae99SBarry Smith PetscInt rstart,rend,*petsc,i; 54147c6ae99SBarry Smith IS is; 54247c6ae99SBarry Smith MPI_Comm comm; 54374388724SJed Brown PetscViewerFormat format; 54447c6ae99SBarry Smith 54547c6ae99SBarry Smith PetscFunctionBegin; 54674388724SJed Brown /* Check whether we are just printing info, in which case MatView() already viewed everything we wanted to view */ 54774388724SJed Brown ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 54874388724SJed Brown if (format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(0); 54974388724SJed Brown 55047c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)A,&comm);CHKERRQ(ierr); 551c688c046SMatthew G Knepley ierr = MatGetDM(A, &da);CHKERRQ(ierr); 552ce94432eSBarry Smith if (!da) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Matrix not generated from a DMDA"); 55347c6ae99SBarry Smith 554aa219208SBarry Smith ierr = DMDAGetAO(da,&ao);CHKERRQ(ierr); 55547c6ae99SBarry Smith ierr = MatGetOwnershipRange(A,&rstart,&rend);CHKERRQ(ierr); 55647c6ae99SBarry Smith ierr = PetscMalloc((rend-rstart)*sizeof(PetscInt),&petsc);CHKERRQ(ierr); 55747c6ae99SBarry Smith for (i=rstart; i<rend; i++) petsc[i-rstart] = i; 55847c6ae99SBarry Smith ierr = AOApplicationToPetsc(ao,rend-rstart,petsc);CHKERRQ(ierr); 55947c6ae99SBarry Smith ierr = ISCreateGeneral(comm,rend-rstart,petsc,PETSC_OWN_POINTER,&is);CHKERRQ(ierr); 56047c6ae99SBarry Smith 56147c6ae99SBarry Smith /* call viewer on natural ordering */ 56247c6ae99SBarry Smith ierr = MatGetSubMatrix(A,is,is,MAT_INITIAL_MATRIX,&Anatural);CHKERRQ(ierr); 563fcfd50ebSBarry Smith ierr = ISDestroy(&is);CHKERRQ(ierr); 56447c6ae99SBarry Smith ierr = PetscObjectGetOptionsPrefix((PetscObject)A,&prefix);CHKERRQ(ierr); 56547c6ae99SBarry Smith ierr = PetscObjectSetOptionsPrefix((PetscObject)Anatural,prefix);CHKERRQ(ierr); 56647c6ae99SBarry Smith ierr = PetscObjectSetName((PetscObject)Anatural,((PetscObject)A)->name);CHKERRQ(ierr); 56747c6ae99SBarry Smith ierr = MatView(Anatural,viewer);CHKERRQ(ierr); 568fcfd50ebSBarry Smith ierr = MatDestroy(&Anatural);CHKERRQ(ierr); 56947c6ae99SBarry Smith PetscFunctionReturn(0); 57047c6ae99SBarry Smith } 57147c6ae99SBarry Smith 57247c6ae99SBarry Smith #undef __FUNCT__ 57347c6ae99SBarry Smith #define __FUNCT__ "MatLoad_MPI_DA" 5747087cfbeSBarry Smith PetscErrorCode MatLoad_MPI_DA(Mat A,PetscViewer viewer) 57547c6ae99SBarry Smith { 5769a42bb27SBarry Smith DM da; 57747c6ae99SBarry Smith PetscErrorCode ierr; 57847c6ae99SBarry Smith Mat Anatural,Aapp; 57947c6ae99SBarry Smith AO ao; 58047c6ae99SBarry Smith PetscInt rstart,rend,*app,i; 58147c6ae99SBarry Smith IS is; 58247c6ae99SBarry Smith MPI_Comm comm; 58347c6ae99SBarry Smith 58447c6ae99SBarry Smith PetscFunctionBegin; 58547c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)A,&comm);CHKERRQ(ierr); 586c688c046SMatthew G Knepley ierr = MatGetDM(A, &da);CHKERRQ(ierr); 587ce94432eSBarry Smith if (!da) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Matrix not generated from a DMDA"); 58847c6ae99SBarry Smith 58947c6ae99SBarry Smith /* Load the matrix in natural ordering */ 590ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&Anatural);CHKERRQ(ierr); 59147c6ae99SBarry Smith ierr = MatSetType(Anatural,((PetscObject)A)->type_name);CHKERRQ(ierr); 59247c6ae99SBarry Smith ierr = MatSetSizes(Anatural,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 59347c6ae99SBarry Smith ierr = MatLoad(Anatural,viewer);CHKERRQ(ierr); 59447c6ae99SBarry Smith 59547c6ae99SBarry Smith /* Map natural ordering to application ordering and create IS */ 596aa219208SBarry Smith ierr = DMDAGetAO(da,&ao);CHKERRQ(ierr); 59747c6ae99SBarry Smith ierr = MatGetOwnershipRange(Anatural,&rstart,&rend);CHKERRQ(ierr); 59847c6ae99SBarry Smith ierr = PetscMalloc((rend-rstart)*sizeof(PetscInt),&app);CHKERRQ(ierr); 59947c6ae99SBarry Smith for (i=rstart; i<rend; i++) app[i-rstart] = i; 60047c6ae99SBarry Smith ierr = AOPetscToApplication(ao,rend-rstart,app);CHKERRQ(ierr); 60147c6ae99SBarry Smith ierr = ISCreateGeneral(comm,rend-rstart,app,PETSC_OWN_POINTER,&is);CHKERRQ(ierr); 60247c6ae99SBarry Smith 60347c6ae99SBarry Smith /* Do permutation and replace header */ 60447c6ae99SBarry Smith ierr = MatGetSubMatrix(Anatural,is,is,MAT_INITIAL_MATRIX,&Aapp);CHKERRQ(ierr); 60547c6ae99SBarry Smith ierr = MatHeaderReplace(A,Aapp);CHKERRQ(ierr); 606fcfd50ebSBarry Smith ierr = ISDestroy(&is);CHKERRQ(ierr); 607fcfd50ebSBarry Smith ierr = MatDestroy(&Anatural);CHKERRQ(ierr); 60847c6ae99SBarry Smith PetscFunctionReturn(0); 60947c6ae99SBarry Smith } 61047c6ae99SBarry Smith 61147c6ae99SBarry Smith #undef __FUNCT__ 612950540a4SJed Brown #define __FUNCT__ "DMCreateMatrix_DA" 61319fd82e9SBarry Smith PetscErrorCode DMCreateMatrix_DA(DM da, MatType mtype,Mat *J) 61447c6ae99SBarry Smith { 61547c6ae99SBarry Smith PetscErrorCode ierr; 61647c6ae99SBarry Smith PetscInt dim,dof,nx,ny,nz,dims[3],starts[3],M,N,P; 61747c6ae99SBarry Smith Mat A; 61847c6ae99SBarry Smith MPI_Comm comm; 61919fd82e9SBarry Smith MatType Atype; 62037d0c07bSMatthew G Knepley PetscSection section, sectionGlobal; 6210298fd71SBarry Smith void (*aij)(void)=NULL,(*baij)(void)=NULL,(*sbaij)(void)=NULL; 62247c6ae99SBarry Smith MatType ttype[256]; 62347c6ae99SBarry Smith PetscBool flg; 62447c6ae99SBarry Smith PetscMPIInt size; 62547c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 62647c6ae99SBarry Smith 62747c6ae99SBarry Smith PetscFunctionBegin; 628519f805aSKarl Rupp #if !defined(PETSC_USE_DYNAMIC_LIBRARIES) 629607a6623SBarry Smith ierr = MatInitializePackage();CHKERRQ(ierr); 63047c6ae99SBarry Smith #endif 6315da5aae0SJed Brown if (!mtype) mtype = MATAIJ; 63247c6ae99SBarry Smith ierr = PetscStrcpy((char*)ttype,mtype);CHKERRQ(ierr); 633ce94432eSBarry Smith ierr = PetscOptionsBegin(PetscObjectComm((PetscObject)da),((PetscObject)da)->prefix,"DMDA options","Mat");CHKERRQ(ierr); 634dd85299cSBarry Smith ierr = PetscOptionsList("-dm_mat_type","Matrix type","MatSetType",MatList,mtype,(char*)ttype,256,&flg);CHKERRQ(ierr); 63547c6ae99SBarry Smith ierr = PetscOptionsEnd(); 63647c6ae99SBarry Smith 63737d0c07bSMatthew G Knepley ierr = DMGetDefaultSection(da, §ion);CHKERRQ(ierr); 63837d0c07bSMatthew G Knepley if (section) { 63937d0c07bSMatthew G Knepley PetscInt bs = -1; 64037d0c07bSMatthew G Knepley PetscInt localSize; 64137d0c07bSMatthew G Knepley PetscBool isShell, isBlock, isSeqBlock, isMPIBlock, isSymBlock, isSymSeqBlock, isSymMPIBlock, isSymmetric; 64237d0c07bSMatthew G Knepley 64337d0c07bSMatthew G Knepley ierr = DMGetDefaultGlobalSection(da, §ionGlobal);CHKERRQ(ierr); 64437d0c07bSMatthew G Knepley ierr = PetscSectionGetConstrainedStorageSize(sectionGlobal, &localSize);CHKERRQ(ierr); 64582f516ccSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)da), J);CHKERRQ(ierr); 64637d0c07bSMatthew G Knepley ierr = MatSetSizes(*J, localSize, localSize, PETSC_DETERMINE, PETSC_DETERMINE);CHKERRQ(ierr); 64737d0c07bSMatthew G Knepley ierr = MatSetType(*J, mtype);CHKERRQ(ierr); 64837d0c07bSMatthew G Knepley ierr = MatSetFromOptions(*J);CHKERRQ(ierr); 64937d0c07bSMatthew G Knepley ierr = PetscStrcmp(mtype, MATSHELL, &isShell);CHKERRQ(ierr); 65037d0c07bSMatthew G Knepley ierr = PetscStrcmp(mtype, MATBAIJ, &isBlock);CHKERRQ(ierr); 65137d0c07bSMatthew G Knepley ierr = PetscStrcmp(mtype, MATSEQBAIJ, &isSeqBlock);CHKERRQ(ierr); 65237d0c07bSMatthew G Knepley ierr = PetscStrcmp(mtype, MATMPIBAIJ, &isMPIBlock);CHKERRQ(ierr); 65337d0c07bSMatthew G Knepley ierr = PetscStrcmp(mtype, MATSBAIJ, &isSymBlock);CHKERRQ(ierr); 65437d0c07bSMatthew G Knepley ierr = PetscStrcmp(mtype, MATSEQSBAIJ, &isSymSeqBlock);CHKERRQ(ierr); 65537d0c07bSMatthew G Knepley ierr = PetscStrcmp(mtype, MATMPISBAIJ, &isSymMPIBlock);CHKERRQ(ierr); 65637d0c07bSMatthew G Knepley /* Check for symmetric storage */ 65737d0c07bSMatthew G Knepley isSymmetric = (PetscBool) (isSymBlock || isSymSeqBlock || isSymMPIBlock); 65837d0c07bSMatthew G Knepley if (isSymmetric) { 65937d0c07bSMatthew G Knepley ierr = MatSetOption(*J, MAT_IGNORE_LOWER_TRIANGULAR, PETSC_TRUE);CHKERRQ(ierr); 66037d0c07bSMatthew G Knepley } 66137d0c07bSMatthew G Knepley if (!isShell) { 66237d0c07bSMatthew G Knepley PetscInt *dnz, *onz, *dnzu, *onzu, bsLocal; 66337d0c07bSMatthew G Knepley 66437d0c07bSMatthew G Knepley if (bs < 0) { 66537d0c07bSMatthew G Knepley if (isBlock || isSeqBlock || isMPIBlock || isSymBlock || isSymSeqBlock || isSymMPIBlock) { 66637d0c07bSMatthew G Knepley PetscInt pStart, pEnd, p, dof; 66737d0c07bSMatthew G Knepley 66837d0c07bSMatthew G Knepley ierr = PetscSectionGetChart(sectionGlobal, &pStart, &pEnd);CHKERRQ(ierr); 66937d0c07bSMatthew G Knepley for (p = pStart; p < pEnd; ++p) { 67037d0c07bSMatthew G Knepley ierr = PetscSectionGetDof(sectionGlobal, p, &dof);CHKERRQ(ierr); 67137d0c07bSMatthew G Knepley if (dof) { 67237d0c07bSMatthew G Knepley bs = dof; 67337d0c07bSMatthew G Knepley break; 67437d0c07bSMatthew G Knepley } 67537d0c07bSMatthew G Knepley } 67637d0c07bSMatthew G Knepley } else { 67737d0c07bSMatthew G Knepley bs = 1; 67837d0c07bSMatthew G Knepley } 67937d0c07bSMatthew G Knepley /* Must have same blocksize on all procs (some might have no points) */ 68037d0c07bSMatthew G Knepley bsLocal = bs; 68182f516ccSBarry Smith ierr = MPI_Allreduce(&bsLocal, &bs, 1, MPIU_INT, MPI_MAX, PetscObjectComm((PetscObject)da));CHKERRQ(ierr); 68237d0c07bSMatthew G Knepley } 68337d0c07bSMatthew G Knepley ierr = PetscMalloc4(localSize/bs, PetscInt, &dnz, localSize/bs, PetscInt, &onz, localSize/bs, PetscInt, &dnzu, localSize/bs, PetscInt, &onzu);CHKERRQ(ierr); 68437d0c07bSMatthew G Knepley ierr = PetscMemzero(dnz, localSize/bs * sizeof(PetscInt));CHKERRQ(ierr); 68537d0c07bSMatthew G Knepley ierr = PetscMemzero(onz, localSize/bs * sizeof(PetscInt));CHKERRQ(ierr); 68637d0c07bSMatthew G Knepley ierr = PetscMemzero(dnzu, localSize/bs * sizeof(PetscInt));CHKERRQ(ierr); 68737d0c07bSMatthew G Knepley ierr = PetscMemzero(onzu, localSize/bs * sizeof(PetscInt));CHKERRQ(ierr); 688552f7358SJed Brown /* ierr = DMPlexPreallocateOperator(dm, bs, section, sectionGlobal, dnz, onz, dnzu, onzu, *J, fillMatrix);CHKERRQ(ierr); */ 68937d0c07bSMatthew G Knepley ierr = PetscFree4(dnz, onz, dnzu, onzu);CHKERRQ(ierr); 69037d0c07bSMatthew G Knepley } 69137d0c07bSMatthew G Knepley } 69247c6ae99SBarry Smith /* 69347c6ae99SBarry Smith m 69447c6ae99SBarry Smith ------------------------------------------------------ 69547c6ae99SBarry Smith | | 69647c6ae99SBarry Smith | | 69747c6ae99SBarry Smith | ---------------------- | 69847c6ae99SBarry Smith | | | | 69947c6ae99SBarry Smith n | ny | | | 70047c6ae99SBarry Smith | | | | 70147c6ae99SBarry Smith | .--------------------- | 70247c6ae99SBarry Smith | (xs,ys) nx | 70347c6ae99SBarry Smith | . | 70447c6ae99SBarry Smith | (gxs,gys) | 70547c6ae99SBarry Smith | | 70647c6ae99SBarry Smith ----------------------------------------------------- 70747c6ae99SBarry Smith */ 70847c6ae99SBarry Smith 70947c6ae99SBarry Smith /* 71047c6ae99SBarry Smith nc - number of components per grid point 71147c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 71247c6ae99SBarry Smith 71347c6ae99SBarry Smith */ 714e30e807fSPeter Brune M = dd->M; 715e30e807fSPeter Brune N = dd->N; 716e30e807fSPeter Brune P = dd->P; 717e30e807fSPeter Brune dim = dd->dim; 718e30e807fSPeter Brune dof = dd->w; 719e30e807fSPeter Brune /* ierr = DMDAGetInfo(da,&dim,&M,&N,&P,0,0,0,&dof,0,0,0,0,0);CHKERRQ(ierr); */ 720aa219208SBarry Smith ierr = DMDAGetCorners(da,0,0,0,&nx,&ny,&nz);CHKERRQ(ierr); 72147c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 72247c6ae99SBarry Smith ierr = MatCreate(comm,&A);CHKERRQ(ierr); 72347c6ae99SBarry Smith ierr = MatSetSizes(A,dof*nx*ny*nz,dof*nx*ny*nz,dof*M*N*P,dof*M*N*P);CHKERRQ(ierr); 72419fd82e9SBarry Smith ierr = MatSetType(A,(MatType)ttype);CHKERRQ(ierr); 72595ee5b0eSBarry Smith ierr = MatSetDM(A,da);CHKERRQ(ierr); 72647c6ae99SBarry Smith ierr = MatSetFromOptions(A);CHKERRQ(ierr); 72747c6ae99SBarry Smith ierr = MatGetType(A,&Atype);CHKERRQ(ierr); 72847c6ae99SBarry Smith /* 729aa219208SBarry Smith We do not provide a getmatrix function in the DMDA operations because 730aa219208SBarry Smith the basic DMDA does not know about matrices. We think of DMDA as being more 73147c6ae99SBarry Smith more low-level than matrices. This is kind of cheating but, cause sometimes 732aa219208SBarry Smith we think of DMDA has higher level than matrices. 73347c6ae99SBarry Smith 73447c6ae99SBarry Smith We could switch based on Atype (or mtype), but we do not since the 73547c6ae99SBarry Smith specialized setting routines depend only the particular preallocation 73647c6ae99SBarry Smith details of the matrix, not the type itself. 73747c6ae99SBarry Smith */ 73847c6ae99SBarry Smith ierr = PetscObjectQueryFunction((PetscObject)A,"MatMPIAIJSetPreallocation_C",&aij);CHKERRQ(ierr); 73947c6ae99SBarry Smith if (!aij) { 74047c6ae99SBarry Smith ierr = PetscObjectQueryFunction((PetscObject)A,"MatSeqAIJSetPreallocation_C",&aij);CHKERRQ(ierr); 74147c6ae99SBarry Smith } 74247c6ae99SBarry Smith if (!aij) { 74347c6ae99SBarry Smith ierr = PetscObjectQueryFunction((PetscObject)A,"MatMPIBAIJSetPreallocation_C",&baij);CHKERRQ(ierr); 74447c6ae99SBarry Smith if (!baij) { 74547c6ae99SBarry Smith ierr = PetscObjectQueryFunction((PetscObject)A,"MatSeqBAIJSetPreallocation_C",&baij);CHKERRQ(ierr); 74647c6ae99SBarry Smith } 74747c6ae99SBarry Smith if (!baij) { 74847c6ae99SBarry Smith ierr = PetscObjectQueryFunction((PetscObject)A,"MatMPISBAIJSetPreallocation_C",&sbaij);CHKERRQ(ierr); 74947c6ae99SBarry Smith if (!sbaij) { 75047c6ae99SBarry Smith ierr = PetscObjectQueryFunction((PetscObject)A,"MatSeqSBAIJSetPreallocation_C",&sbaij);CHKERRQ(ierr); 75147c6ae99SBarry Smith } 75247c6ae99SBarry Smith } 75347c6ae99SBarry Smith } 75447c6ae99SBarry Smith if (aij) { 75547c6ae99SBarry Smith if (dim == 1) { 756ce308e1dSBarry Smith if (dd->ofill) { 757ce308e1dSBarry Smith ierr = DMCreateMatrix_DA_1d_MPIAIJ_Fill(da,A);CHKERRQ(ierr); 758ce308e1dSBarry Smith } else { 759950540a4SJed Brown ierr = DMCreateMatrix_DA_1d_MPIAIJ(da,A);CHKERRQ(ierr); 760ce308e1dSBarry Smith } 76147c6ae99SBarry Smith } else if (dim == 2) { 76247c6ae99SBarry Smith if (dd->ofill) { 763950540a4SJed Brown ierr = DMCreateMatrix_DA_2d_MPIAIJ_Fill(da,A);CHKERRQ(ierr); 76447c6ae99SBarry Smith } else { 765950540a4SJed Brown ierr = DMCreateMatrix_DA_2d_MPIAIJ(da,A);CHKERRQ(ierr); 76647c6ae99SBarry Smith } 76747c6ae99SBarry Smith } else if (dim == 3) { 76847c6ae99SBarry Smith if (dd->ofill) { 769950540a4SJed Brown ierr = DMCreateMatrix_DA_3d_MPIAIJ_Fill(da,A);CHKERRQ(ierr); 77047c6ae99SBarry Smith } else { 771950540a4SJed Brown ierr = DMCreateMatrix_DA_3d_MPIAIJ(da,A);CHKERRQ(ierr); 77247c6ae99SBarry Smith } 77347c6ae99SBarry Smith } 77447c6ae99SBarry Smith } else if (baij) { 77547c6ae99SBarry Smith if (dim == 2) { 776950540a4SJed Brown ierr = DMCreateMatrix_DA_2d_MPIBAIJ(da,A);CHKERRQ(ierr); 77747c6ae99SBarry Smith } else if (dim == 3) { 778950540a4SJed Brown ierr = DMCreateMatrix_DA_3d_MPIBAIJ(da,A);CHKERRQ(ierr); 779ce94432eSBarry Smith } else SETERRQ3(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"Not implemented for %D dimension and Matrix Type: %s in %D dimension! Send mail to petsc-maint@mcs.anl.gov for code",dim,Atype,dim); 78047c6ae99SBarry Smith } else if (sbaij) { 78147c6ae99SBarry Smith if (dim == 2) { 782950540a4SJed Brown ierr = DMCreateMatrix_DA_2d_MPISBAIJ(da,A);CHKERRQ(ierr); 78347c6ae99SBarry Smith } else if (dim == 3) { 784950540a4SJed Brown ierr = DMCreateMatrix_DA_3d_MPISBAIJ(da,A);CHKERRQ(ierr); 785ce94432eSBarry Smith } else SETERRQ3(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"Not implemented for %D dimension and Matrix Type: %s in %D dimension! Send mail to petsc-maint@mcs.anl.gov for code",dim,Atype,dim); 786869776cdSLisandro Dalcin } else { 787869776cdSLisandro Dalcin ISLocalToGlobalMapping ltog,ltogb; 788869776cdSLisandro Dalcin ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 789869776cdSLisandro Dalcin ierr = DMGetLocalToGlobalMappingBlock(da,<ogb);CHKERRQ(ierr); 7902949035bSJed Brown ierr = MatSetUp(A);CHKERRQ(ierr); 791869776cdSLisandro Dalcin ierr = MatSetLocalToGlobalMapping(A,ltog,ltog);CHKERRQ(ierr); 792869776cdSLisandro Dalcin ierr = MatSetLocalToGlobalMappingBlock(A,ltogb,ltogb);CHKERRQ(ierr); 79347c6ae99SBarry Smith } 794aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&starts[0],&starts[1],&starts[2],&dims[0],&dims[1],&dims[2]);CHKERRQ(ierr); 79547c6ae99SBarry Smith ierr = MatSetStencil(A,dim,dims,starts,dof);CHKERRQ(ierr); 796c688c046SMatthew G Knepley ierr = MatSetDM(A,da);CHKERRQ(ierr); 79747c6ae99SBarry Smith ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 79847c6ae99SBarry Smith if (size > 1) { 79947c6ae99SBarry Smith /* change viewer to display matrix in natural ordering */ 80047c6ae99SBarry Smith ierr = MatShellSetOperation(A, MATOP_VIEW, (void (*)(void))MatView_MPI_DA);CHKERRQ(ierr); 80147c6ae99SBarry Smith ierr = MatShellSetOperation(A, MATOP_LOAD, (void (*)(void))MatLoad_MPI_DA);CHKERRQ(ierr); 80247c6ae99SBarry Smith } 80347c6ae99SBarry Smith *J = A; 80447c6ae99SBarry Smith PetscFunctionReturn(0); 80547c6ae99SBarry Smith } 80647c6ae99SBarry Smith 80747c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/ 80847c6ae99SBarry Smith #undef __FUNCT__ 809950540a4SJed Brown #define __FUNCT__ "DMCreateMatrix_DA_2d_MPIAIJ" 810950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_2d_MPIAIJ(DM da,Mat J) 81147c6ae99SBarry Smith { 81247c6ae99SBarry Smith PetscErrorCode ierr; 8130298fd71SBarry Smith PetscInt xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny,m,n,dim,s,*cols = NULL,k,nc,*rows = NULL,col,cnt,l,p; 81447c6ae99SBarry Smith PetscInt lstart,lend,pstart,pend,*dnz,*onz; 81547c6ae99SBarry Smith MPI_Comm comm; 81647c6ae99SBarry Smith PetscScalar *values; 8171321219cSEthan Coon DMDABoundaryType bx,by; 81847c6ae99SBarry Smith ISLocalToGlobalMapping ltog,ltogb; 819aa219208SBarry Smith DMDAStencilType st; 82047c6ae99SBarry Smith 82147c6ae99SBarry Smith PetscFunctionBegin; 82247c6ae99SBarry Smith /* 82347c6ae99SBarry Smith nc - number of components per grid point 82447c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 82547c6ae99SBarry Smith 82647c6ae99SBarry Smith */ 8271321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,0,0,0,0,&nc,&s,&bx,&by,0,&st);CHKERRQ(ierr); 82847c6ae99SBarry Smith col = 2*s + 1; 829aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr); 830aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr); 83147c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 83247c6ae99SBarry Smith 83347c6ae99SBarry Smith ierr = PetscMalloc2(nc,PetscInt,&rows,col*col*nc*nc,PetscInt,&cols);CHKERRQ(ierr); 8341411c6eeSJed Brown ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 8351411c6eeSJed Brown ierr = DMGetLocalToGlobalMappingBlock(da,<ogb);CHKERRQ(ierr); 83647c6ae99SBarry Smith 83747c6ae99SBarry Smith /* determine the matrix preallocation information */ 83847c6ae99SBarry Smith ierr = MatPreallocateInitialize(comm,nc*nx*ny,nc*nx*ny,dnz,onz);CHKERRQ(ierr); 83947c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 84047c6ae99SBarry Smith 8411321219cSEthan Coon pstart = (bx == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 8421321219cSEthan Coon pend = (bx == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 84347c6ae99SBarry Smith 84447c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 84547c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys); 84647c6ae99SBarry Smith 8471321219cSEthan Coon lstart = (by == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 8481321219cSEthan Coon lend = (by == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 84947c6ae99SBarry Smith 85047c6ae99SBarry Smith cnt = 0; 85147c6ae99SBarry Smith for (k=0; k<nc; k++) { 85247c6ae99SBarry Smith for (l=lstart; l<lend+1; l++) { 85347c6ae99SBarry Smith for (p=pstart; p<pend+1; p++) { 854aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || (!l || !p)) { /* entries on star have either l = 0 or p = 0 */ 85547c6ae99SBarry Smith cols[cnt++] = k + nc*(slot + gnx*l + p); 85647c6ae99SBarry Smith } 85747c6ae99SBarry Smith } 85847c6ae99SBarry Smith } 85947c6ae99SBarry Smith rows[k] = k + nc*(slot); 86047c6ae99SBarry Smith } 861784ac674SJed Brown ierr = MatPreallocateSetLocal(ltog,nc,rows,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr); 86247c6ae99SBarry Smith } 86347c6ae99SBarry Smith } 864f73d5cc4SBarry Smith ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr); 86547c6ae99SBarry Smith ierr = MatSeqAIJSetPreallocation(J,0,dnz);CHKERRQ(ierr); 86647c6ae99SBarry Smith ierr = MatMPIAIJSetPreallocation(J,0,dnz,0,onz);CHKERRQ(ierr); 86747c6ae99SBarry Smith ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 86847c6ae99SBarry Smith 869784ac674SJed Brown ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 870784ac674SJed Brown ierr = MatSetLocalToGlobalMappingBlock(J,ltogb,ltogb);CHKERRQ(ierr); 87147c6ae99SBarry Smith 87247c6ae99SBarry Smith /* 87347c6ae99SBarry Smith For each node in the grid: we get the neighbors in the local (on processor ordering 87447c6ae99SBarry Smith that includes the ghost points) then MatSetValuesLocal() maps those indices to the global 87547c6ae99SBarry Smith PETSc ordering. 87647c6ae99SBarry Smith */ 877fcfd50ebSBarry Smith if (!da->prealloc_only) { 87847c6ae99SBarry Smith ierr = PetscMalloc(col*col*nc*nc*sizeof(PetscScalar),&values);CHKERRQ(ierr); 87947c6ae99SBarry Smith ierr = PetscMemzero(values,col*col*nc*nc*sizeof(PetscScalar));CHKERRQ(ierr); 88047c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 88147c6ae99SBarry Smith 8821321219cSEthan Coon pstart = (bx == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 8831321219cSEthan Coon pend = (bx == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 88447c6ae99SBarry Smith 88547c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 88647c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys); 88747c6ae99SBarry Smith 8881321219cSEthan Coon lstart = (by == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 8891321219cSEthan Coon lend = (by == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 89047c6ae99SBarry Smith 89147c6ae99SBarry Smith cnt = 0; 89247c6ae99SBarry Smith for (k=0; k<nc; k++) { 89347c6ae99SBarry Smith for (l=lstart; l<lend+1; l++) { 89447c6ae99SBarry Smith for (p=pstart; p<pend+1; p++) { 895aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || (!l || !p)) { /* entries on star have either l = 0 or p = 0 */ 89647c6ae99SBarry Smith cols[cnt++] = k + nc*(slot + gnx*l + p); 89747c6ae99SBarry Smith } 89847c6ae99SBarry Smith } 89947c6ae99SBarry Smith } 90047c6ae99SBarry Smith rows[k] = k + nc*(slot); 90147c6ae99SBarry Smith } 90247c6ae99SBarry Smith ierr = MatSetValuesLocal(J,nc,rows,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 90347c6ae99SBarry Smith } 90447c6ae99SBarry Smith } 90547c6ae99SBarry Smith ierr = PetscFree(values);CHKERRQ(ierr); 90647c6ae99SBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 90747c6ae99SBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 90847c6ae99SBarry Smith } 90947c6ae99SBarry Smith ierr = PetscFree2(rows,cols);CHKERRQ(ierr); 91047c6ae99SBarry Smith PetscFunctionReturn(0); 91147c6ae99SBarry Smith } 91247c6ae99SBarry Smith 91347c6ae99SBarry Smith #undef __FUNCT__ 914950540a4SJed Brown #define __FUNCT__ "DMCreateMatrix_DA_2d_MPIAIJ_Fill" 915950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_2d_MPIAIJ_Fill(DM da,Mat J) 91647c6ae99SBarry Smith { 91747c6ae99SBarry Smith PetscErrorCode ierr; 91847c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny; 91947c6ae99SBarry Smith PetscInt m,n,dim,s,*cols,k,nc,row,col,cnt,l,p; 92047c6ae99SBarry Smith PetscInt lstart,lend,pstart,pend,*dnz,*onz; 92147c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 92247c6ae99SBarry Smith PetscInt ifill_col,*ofill = dd->ofill, *dfill = dd->dfill; 92347c6ae99SBarry Smith MPI_Comm comm; 92447c6ae99SBarry Smith PetscScalar *values; 9251321219cSEthan Coon DMDABoundaryType bx,by; 92647c6ae99SBarry Smith ISLocalToGlobalMapping ltog,ltogb; 927aa219208SBarry Smith DMDAStencilType st; 92847c6ae99SBarry Smith 92947c6ae99SBarry Smith PetscFunctionBegin; 93047c6ae99SBarry Smith /* 93147c6ae99SBarry Smith nc - number of components per grid point 93247c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 93347c6ae99SBarry Smith 93447c6ae99SBarry Smith */ 9351321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,0,0,0,0,&nc,&s,&bx,&by,0,&st);CHKERRQ(ierr); 93647c6ae99SBarry Smith col = 2*s + 1; 937aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr); 938aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr); 93947c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 94047c6ae99SBarry Smith 94147c6ae99SBarry Smith ierr = PetscMalloc(col*col*nc*nc*sizeof(PetscInt),&cols);CHKERRQ(ierr); 9421411c6eeSJed Brown ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 9431411c6eeSJed Brown ierr = DMGetLocalToGlobalMappingBlock(da,<ogb);CHKERRQ(ierr); 94447c6ae99SBarry Smith 94547c6ae99SBarry Smith /* determine the matrix preallocation information */ 94647c6ae99SBarry Smith ierr = MatPreallocateInitialize(comm,nc*nx*ny,nc*nx*ny,dnz,onz);CHKERRQ(ierr); 94747c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 94847c6ae99SBarry Smith 9491321219cSEthan Coon pstart = (bx == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 9501321219cSEthan Coon pend = (bx == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 95147c6ae99SBarry Smith 95247c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 95347c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys); 95447c6ae99SBarry Smith 9551321219cSEthan Coon lstart = (by == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 9561321219cSEthan Coon lend = (by == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 95747c6ae99SBarry Smith 95847c6ae99SBarry Smith for (k=0; k<nc; k++) { 95947c6ae99SBarry Smith cnt = 0; 96047c6ae99SBarry Smith for (l=lstart; l<lend+1; l++) { 96147c6ae99SBarry Smith for (p=pstart; p<pend+1; p++) { 96247c6ae99SBarry Smith if (l || p) { 963aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || (!l || !p)) { /* entries on star */ 9648865f1eaSKarl Rupp for (ifill_col=ofill[k]; ifill_col<ofill[k+1]; ifill_col++) cols[cnt++] = ofill[ifill_col] + nc*(slot + gnx*l + p); 96547c6ae99SBarry Smith } 96647c6ae99SBarry Smith } else { 96747c6ae99SBarry Smith if (dfill) { 9688865f1eaSKarl Rupp for (ifill_col=dfill[k]; ifill_col<dfill[k+1]; ifill_col++) cols[cnt++] = dfill[ifill_col] + nc*(slot + gnx*l + p); 96947c6ae99SBarry Smith } else { 9708865f1eaSKarl Rupp for (ifill_col=0; ifill_col<nc; ifill_col++) cols[cnt++] = ifill_col + nc*(slot + gnx*l + p); 97147c6ae99SBarry Smith } 97247c6ae99SBarry Smith } 97347c6ae99SBarry Smith } 97447c6ae99SBarry Smith } 97547c6ae99SBarry Smith row = k + nc*(slot); 976784ac674SJed Brown ierr = MatPreallocateSetLocal(ltog,1,&row,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr); 97747c6ae99SBarry Smith } 97847c6ae99SBarry Smith } 97947c6ae99SBarry Smith } 98047c6ae99SBarry Smith ierr = MatSeqAIJSetPreallocation(J,0,dnz);CHKERRQ(ierr); 98147c6ae99SBarry Smith ierr = MatMPIAIJSetPreallocation(J,0,dnz,0,onz);CHKERRQ(ierr); 98247c6ae99SBarry Smith ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 983784ac674SJed Brown ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 984784ac674SJed Brown ierr = MatSetLocalToGlobalMappingBlock(J,ltogb,ltogb);CHKERRQ(ierr); 98547c6ae99SBarry Smith 98647c6ae99SBarry Smith /* 98747c6ae99SBarry Smith For each node in the grid: we get the neighbors in the local (on processor ordering 98847c6ae99SBarry Smith that includes the ghost points) then MatSetValuesLocal() maps those indices to the global 98947c6ae99SBarry Smith PETSc ordering. 99047c6ae99SBarry Smith */ 991fcfd50ebSBarry Smith if (!da->prealloc_only) { 99247c6ae99SBarry Smith ierr = PetscMalloc(col*col*nc*nc*sizeof(PetscScalar),&values);CHKERRQ(ierr); 99347c6ae99SBarry Smith ierr = PetscMemzero(values,col*col*nc*nc*sizeof(PetscScalar));CHKERRQ(ierr); 99447c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 99547c6ae99SBarry Smith 9961321219cSEthan Coon pstart = (bx == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 9971321219cSEthan Coon pend = (bx == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 99847c6ae99SBarry Smith 99947c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 100047c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys); 100147c6ae99SBarry Smith 10021321219cSEthan Coon lstart = (by == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 10031321219cSEthan Coon lend = (by == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 100447c6ae99SBarry Smith 100547c6ae99SBarry Smith for (k=0; k<nc; k++) { 100647c6ae99SBarry Smith cnt = 0; 100747c6ae99SBarry Smith for (l=lstart; l<lend+1; l++) { 100847c6ae99SBarry Smith for (p=pstart; p<pend+1; p++) { 100947c6ae99SBarry Smith if (l || p) { 1010aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || (!l || !p)) { /* entries on star */ 10118865f1eaSKarl Rupp for (ifill_col=ofill[k]; ifill_col<ofill[k+1]; ifill_col++) cols[cnt++] = ofill[ifill_col] + nc*(slot + gnx*l + p); 101247c6ae99SBarry Smith } 101347c6ae99SBarry Smith } else { 101447c6ae99SBarry Smith if (dfill) { 10158865f1eaSKarl Rupp for (ifill_col=dfill[k]; ifill_col<dfill[k+1]; ifill_col++) cols[cnt++] = dfill[ifill_col] + nc*(slot + gnx*l + p); 101647c6ae99SBarry Smith } else { 10178865f1eaSKarl Rupp for (ifill_col=0; ifill_col<nc; ifill_col++) cols[cnt++] = ifill_col + nc*(slot + gnx*l + p); 101847c6ae99SBarry Smith } 101947c6ae99SBarry Smith } 102047c6ae99SBarry Smith } 102147c6ae99SBarry Smith } 102247c6ae99SBarry Smith row = k + nc*(slot); 102347c6ae99SBarry Smith ierr = MatSetValuesLocal(J,1,&row,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 102447c6ae99SBarry Smith } 102547c6ae99SBarry Smith } 102647c6ae99SBarry Smith } 102747c6ae99SBarry Smith ierr = PetscFree(values);CHKERRQ(ierr); 102847c6ae99SBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 102947c6ae99SBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 103047c6ae99SBarry Smith } 103147c6ae99SBarry Smith ierr = PetscFree(cols);CHKERRQ(ierr); 103247c6ae99SBarry Smith PetscFunctionReturn(0); 103347c6ae99SBarry Smith } 103447c6ae99SBarry Smith 103547c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/ 103647c6ae99SBarry Smith 103747c6ae99SBarry Smith #undef __FUNCT__ 1038950540a4SJed Brown #define __FUNCT__ "DMCreateMatrix_DA_3d_MPIAIJ" 1039950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_3d_MPIAIJ(DM da,Mat J) 104047c6ae99SBarry Smith { 104147c6ae99SBarry Smith PetscErrorCode ierr; 104247c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny; 10430298fd71SBarry Smith PetscInt m,n,dim,s,*cols = NULL,k,nc,*rows = NULL,col,cnt,l,p,*dnz = NULL,*onz = NULL; 104447c6ae99SBarry Smith PetscInt istart,iend,jstart,jend,kstart,kend,zs,nz,gzs,gnz,ii,jj,kk; 104547c6ae99SBarry Smith MPI_Comm comm; 104647c6ae99SBarry Smith PetscScalar *values; 10471321219cSEthan Coon DMDABoundaryType bx,by,bz; 104847c6ae99SBarry Smith ISLocalToGlobalMapping ltog,ltogb; 1049aa219208SBarry Smith DMDAStencilType st; 105047c6ae99SBarry Smith 105147c6ae99SBarry Smith PetscFunctionBegin; 105247c6ae99SBarry Smith /* 105347c6ae99SBarry Smith nc - number of components per grid point 105447c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 105547c6ae99SBarry Smith 105647c6ae99SBarry Smith */ 10571321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,&p,0,0,0,&nc,&s,&bx,&by,&bz,&st);CHKERRQ(ierr); 105847c6ae99SBarry Smith col = 2*s + 1; 105947c6ae99SBarry Smith 1060aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,&zs,&nx,&ny,&nz);CHKERRQ(ierr); 1061aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,&gzs,&gnx,&gny,&gnz);CHKERRQ(ierr); 106247c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 106347c6ae99SBarry Smith 106447c6ae99SBarry Smith ierr = PetscMalloc2(nc,PetscInt,&rows,col*col*col*nc*nc,PetscInt,&cols);CHKERRQ(ierr); 10651411c6eeSJed Brown ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 10661411c6eeSJed Brown ierr = DMGetLocalToGlobalMappingBlock(da,<ogb);CHKERRQ(ierr); 106747c6ae99SBarry Smith 106847c6ae99SBarry Smith /* determine the matrix preallocation information */ 106947c6ae99SBarry Smith ierr = MatPreallocateInitialize(comm,nc*nx*ny*nz,nc*nx*ny*nz,dnz,onz);CHKERRQ(ierr); 107047c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 10711321219cSEthan Coon istart = (bx == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 10721321219cSEthan Coon iend = (bx == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 107347c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 10741321219cSEthan Coon jstart = (by == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 10751321219cSEthan Coon jend = (by == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 107647c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 10771321219cSEthan Coon kstart = (bz == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k)); 10781321219cSEthan Coon kend = (bz == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,p-k-1)); 107947c6ae99SBarry Smith 108047c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 108147c6ae99SBarry Smith 108247c6ae99SBarry Smith cnt = 0; 108347c6ae99SBarry Smith for (l=0; l<nc; l++) { 108447c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 108547c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 108647c6ae99SBarry Smith for (kk=kstart; kk<kend+1; kk++) { 1087aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/ 108847c6ae99SBarry Smith cols[cnt++] = l + nc*(slot + ii + gnx*jj + gnx*gny*kk); 108947c6ae99SBarry Smith } 109047c6ae99SBarry Smith } 109147c6ae99SBarry Smith } 109247c6ae99SBarry Smith } 109347c6ae99SBarry Smith rows[l] = l + nc*(slot); 109447c6ae99SBarry Smith } 1095784ac674SJed Brown ierr = MatPreallocateSetLocal(ltog,nc,rows,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr); 109647c6ae99SBarry Smith } 109747c6ae99SBarry Smith } 109847c6ae99SBarry Smith } 1099f73d5cc4SBarry Smith ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr); 110047c6ae99SBarry Smith ierr = MatSeqAIJSetPreallocation(J,0,dnz);CHKERRQ(ierr); 110147c6ae99SBarry Smith ierr = MatMPIAIJSetPreallocation(J,0,dnz,0,onz);CHKERRQ(ierr); 110247c6ae99SBarry Smith ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 1103784ac674SJed Brown ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 1104784ac674SJed Brown ierr = MatSetLocalToGlobalMappingBlock(J,ltogb,ltogb);CHKERRQ(ierr); 110547c6ae99SBarry Smith 110647c6ae99SBarry Smith /* 110747c6ae99SBarry Smith For each node in the grid: we get the neighbors in the local (on processor ordering 110847c6ae99SBarry Smith that includes the ghost points) then MatSetValuesLocal() maps those indices to the global 110947c6ae99SBarry Smith PETSc ordering. 111047c6ae99SBarry Smith */ 1111fcfd50ebSBarry Smith if (!da->prealloc_only) { 111247c6ae99SBarry Smith ierr = PetscMalloc(col*col*col*nc*nc*nc*sizeof(PetscScalar),&values);CHKERRQ(ierr); 111347c6ae99SBarry Smith ierr = PetscMemzero(values,col*col*col*nc*nc*nc*sizeof(PetscScalar));CHKERRQ(ierr); 111447c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 11151321219cSEthan Coon istart = (bx == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 11161321219cSEthan Coon iend = (bx == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 111747c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 11181321219cSEthan Coon jstart = (by == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 11191321219cSEthan Coon jend = (by == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 112047c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 11211321219cSEthan Coon kstart = (bz == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k)); 11221321219cSEthan Coon kend = (bz == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,p-k-1)); 112347c6ae99SBarry Smith 112447c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 112547c6ae99SBarry Smith 112647c6ae99SBarry Smith cnt = 0; 112747c6ae99SBarry Smith for (l=0; l<nc; l++) { 112847c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 112947c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 113047c6ae99SBarry Smith for (kk=kstart; kk<kend+1; kk++) { 1131aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/ 113247c6ae99SBarry Smith cols[cnt++] = l + nc*(slot + ii + gnx*jj + gnx*gny*kk); 113347c6ae99SBarry Smith } 113447c6ae99SBarry Smith } 113547c6ae99SBarry Smith } 113647c6ae99SBarry Smith } 113747c6ae99SBarry Smith rows[l] = l + nc*(slot); 113847c6ae99SBarry Smith } 113947c6ae99SBarry Smith ierr = MatSetValuesLocal(J,nc,rows,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 114047c6ae99SBarry Smith } 114147c6ae99SBarry Smith } 114247c6ae99SBarry Smith } 114347c6ae99SBarry Smith ierr = PetscFree(values);CHKERRQ(ierr); 114447c6ae99SBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 114547c6ae99SBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 114647c6ae99SBarry Smith } 114747c6ae99SBarry Smith ierr = PetscFree2(rows,cols);CHKERRQ(ierr); 114847c6ae99SBarry Smith PetscFunctionReturn(0); 114947c6ae99SBarry Smith } 115047c6ae99SBarry Smith 115147c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/ 115247c6ae99SBarry Smith 115347c6ae99SBarry Smith #undef __FUNCT__ 1154ce308e1dSBarry Smith #define __FUNCT__ "DMCreateMatrix_DA_1d_MPIAIJ_Fill" 1155ce308e1dSBarry Smith PetscErrorCode DMCreateMatrix_DA_1d_MPIAIJ_Fill(DM da,Mat J) 1156ce308e1dSBarry Smith { 1157ce308e1dSBarry Smith PetscErrorCode ierr; 1158ce308e1dSBarry Smith DM_DA *dd = (DM_DA*)da->data; 1159ce308e1dSBarry Smith PetscInt xs,nx,i,j,gxs,gnx,row,k,l; 11600298fd71SBarry Smith PetscInt m,dim,s,*cols = NULL,nc,col,cnt,*ocols; 1161*0acb5bebSBarry Smith PetscInt *ofill = dd->ofill,*dfill = dd->dfill; 1162ce308e1dSBarry Smith PetscScalar *values; 1163ce308e1dSBarry Smith DMDABoundaryType bx; 1164ce308e1dSBarry Smith ISLocalToGlobalMapping ltog,ltogb; 1165ce308e1dSBarry Smith PetscMPIInt rank,size; 1166ce308e1dSBarry Smith 1167ce308e1dSBarry Smith PetscFunctionBegin; 1168ce94432eSBarry Smith if (dd->bx == DMDA_BOUNDARY_PERIODIC) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"With fill provided not implemented with periodic boundary conditions"); 1169ce94432eSBarry Smith ierr = MPI_Comm_rank(PetscObjectComm((PetscObject)da),&rank);CHKERRQ(ierr); 1170ce94432eSBarry Smith ierr = MPI_Comm_size(PetscObjectComm((PetscObject)da),&size);CHKERRQ(ierr); 1171ce308e1dSBarry Smith 1172ce308e1dSBarry Smith /* 1173ce308e1dSBarry Smith nc - number of components per grid point 1174ce308e1dSBarry Smith col - number of colors needed in one direction for single component problem 1175ce308e1dSBarry Smith 1176ce308e1dSBarry Smith */ 1177ce308e1dSBarry Smith ierr = DMDAGetInfo(da,&dim,&m,0,0,0,0,0,&nc,&s,&bx,0,0,0);CHKERRQ(ierr); 1178ce308e1dSBarry Smith col = 2*s + 1; 1179ce308e1dSBarry Smith 1180ce308e1dSBarry Smith ierr = DMDAGetCorners(da,&xs,0,0,&nx,0,0);CHKERRQ(ierr); 1181ce308e1dSBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,0,0,&gnx,0,0);CHKERRQ(ierr); 1182ce308e1dSBarry Smith 1183ce308e1dSBarry Smith ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr); 1184ce308e1dSBarry Smith ierr = PetscMalloc2(nx*nc,PetscInt,&cols,nx*nc,PetscInt,&ocols);CHKERRQ(ierr); 1185ce308e1dSBarry Smith ierr = PetscMemzero(cols,nx*nc*sizeof(PetscInt));CHKERRQ(ierr); 1186ce308e1dSBarry Smith ierr = PetscMemzero(ocols,nx*nc*sizeof(PetscInt));CHKERRQ(ierr); 1187ce308e1dSBarry Smith 1188ce308e1dSBarry Smith /* 1189ce308e1dSBarry Smith note should be smaller for first and last process with no periodic 1190ce308e1dSBarry Smith does not handle dfill 1191ce308e1dSBarry Smith */ 1192ce308e1dSBarry Smith cnt = 0; 1193ce308e1dSBarry Smith /* coupling with process to the left */ 1194ce308e1dSBarry Smith for (i=0; i<s; i++) { 1195ce308e1dSBarry Smith for (j=0; j<nc; j++) { 1196ce308e1dSBarry Smith ocols[cnt] = ((!rank) ? 0 : (s - i)*(ofill[j+1] - ofill[j])); 1197*0acb5bebSBarry Smith cols[cnt] = dfill[j+1] - dfill[j] + (s + i)*(ofill[j+1] - ofill[j]); 1198ce308e1dSBarry Smith cnt++; 1199ce308e1dSBarry Smith } 1200ce308e1dSBarry Smith } 1201ce308e1dSBarry Smith for (i=s; i<nx-s; i++) { 1202ce308e1dSBarry Smith for (j=0; j<nc; j++) { 1203*0acb5bebSBarry Smith cols[cnt] = dfill[j+1] - dfill[j] + 2*s*(ofill[j+1] - ofill[j]); 1204ce308e1dSBarry Smith cnt++; 1205ce308e1dSBarry Smith } 1206ce308e1dSBarry Smith } 1207ce308e1dSBarry Smith /* coupling with process to the right */ 1208ce308e1dSBarry Smith for (i=nx-s; i<nx; i++) { 1209ce308e1dSBarry Smith for (j=0; j<nc; j++) { 1210ce308e1dSBarry Smith ocols[cnt] = ((rank == (size-1)) ? 0 : (i - nx + s + 1)*(ofill[j+1] - ofill[j])); 1211*0acb5bebSBarry Smith cols[cnt] = dfill[j+1] - dfill[j] + (s + nx - i - 1)*(ofill[j+1] - ofill[j]); 1212ce308e1dSBarry Smith cnt++; 1213ce308e1dSBarry Smith } 1214ce308e1dSBarry Smith } 1215ce308e1dSBarry Smith 1216ce308e1dSBarry Smith ierr = MatSeqAIJSetPreallocation(J,0,cols);CHKERRQ(ierr); 1217ce308e1dSBarry Smith ierr = MatMPIAIJSetPreallocation(J,0,cols,0,ocols);CHKERRQ(ierr); 1218ce308e1dSBarry Smith ierr = PetscFree2(cols,ocols);CHKERRQ(ierr); 1219ce308e1dSBarry Smith 1220ce308e1dSBarry Smith ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 1221ce308e1dSBarry Smith ierr = DMGetLocalToGlobalMappingBlock(da,<ogb);CHKERRQ(ierr); 1222ce308e1dSBarry Smith ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 1223ce308e1dSBarry Smith ierr = MatSetLocalToGlobalMappingBlock(J,ltogb,ltogb);CHKERRQ(ierr); 1224ce308e1dSBarry Smith 1225ce308e1dSBarry Smith /* 1226ce308e1dSBarry Smith For each node in the grid: we get the neighbors in the local (on processor ordering 1227ce308e1dSBarry Smith that includes the ghost points) then MatSetValuesLocal() maps those indices to the global 1228ce308e1dSBarry Smith PETSc ordering. 1229ce308e1dSBarry Smith */ 1230ce308e1dSBarry Smith if (!da->prealloc_only) { 1231ce308e1dSBarry Smith ierr = PetscMalloc(col*nc*nc*sizeof(PetscInt),&cols);CHKERRQ(ierr); 1232ce308e1dSBarry Smith ierr = PetscMalloc(col*nc*nc*sizeof(PetscScalar),&values);CHKERRQ(ierr); 1233ce308e1dSBarry Smith ierr = PetscMemzero(values,col*nc*nc*sizeof(PetscScalar));CHKERRQ(ierr); 1234ce308e1dSBarry Smith 1235ce308e1dSBarry Smith row = xs*nc; 1236ce308e1dSBarry Smith /* coupling with process to the left */ 1237ce308e1dSBarry Smith for (i=xs; i<xs+s; i++) { 1238ce308e1dSBarry Smith for (j=0; j<nc; j++) { 1239ce308e1dSBarry Smith cnt = 0; 1240ce308e1dSBarry Smith if (rank) { 1241ce308e1dSBarry Smith for (l=0; l<s; l++) { 1242ce308e1dSBarry Smith for (k=ofill[j]; k<ofill[j+1]; k++) cols[cnt++] = (i - s + l)*nc + ofill[k]; 1243ce308e1dSBarry Smith } 1244ce308e1dSBarry Smith } 1245*0acb5bebSBarry Smith if (dfill) { 1246*0acb5bebSBarry Smith for (k=dfill[j]; k<dfill[j+1]; k++) { 1247*0acb5bebSBarry Smith cols[cnt++] = i*nc + dfill[k]; 1248*0acb5bebSBarry Smith } 1249*0acb5bebSBarry Smith } else { 1250ce308e1dSBarry Smith for (k=0; k<nc; k++) { 1251ce308e1dSBarry Smith cols[cnt++] = i*nc + k; 1252ce308e1dSBarry Smith } 1253*0acb5bebSBarry Smith } 1254ce308e1dSBarry Smith for (l=0; l<s; l++) { 1255ce308e1dSBarry Smith for (k=ofill[j]; k<ofill[j+1]; k++) cols[cnt++] = (i + s - l)*nc + ofill[k]; 1256ce308e1dSBarry Smith } 1257ce308e1dSBarry Smith ierr = MatSetValues(J,1,&row,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 1258ce308e1dSBarry Smith row++; 1259ce308e1dSBarry Smith } 1260ce308e1dSBarry Smith } 1261ce308e1dSBarry Smith for (i=xs+s; i<xs+nx-s; i++) { 1262ce308e1dSBarry Smith for (j=0; j<nc; j++) { 1263ce308e1dSBarry Smith cnt = 0; 1264ce308e1dSBarry Smith for (l=0; l<s; l++) { 1265ce308e1dSBarry Smith for (k=ofill[j]; k<ofill[j+1]; k++) cols[cnt++] = (i - s + l)*nc + ofill[k]; 1266ce308e1dSBarry Smith } 1267*0acb5bebSBarry Smith if (dfill) { 1268*0acb5bebSBarry Smith for (k=dfill[j]; k<dfill[j+1]; k++) { 1269*0acb5bebSBarry Smith cols[cnt++] = i*nc + dfill[k]; 1270*0acb5bebSBarry Smith } 1271*0acb5bebSBarry Smith } else { 1272ce308e1dSBarry Smith for (k=0; k<nc; k++) { 1273ce308e1dSBarry Smith cols[cnt++] = i*nc + k; 1274ce308e1dSBarry Smith } 1275*0acb5bebSBarry Smith } 1276ce308e1dSBarry Smith for (l=0; l<s; l++) { 1277ce308e1dSBarry Smith for (k=ofill[j]; k<ofill[j+1]; k++) cols[cnt++] = (i + s - l)*nc + ofill[k]; 1278ce308e1dSBarry Smith } 1279ce308e1dSBarry Smith ierr = MatSetValues(J,1,&row,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 1280ce308e1dSBarry Smith row++; 1281ce308e1dSBarry Smith } 1282ce308e1dSBarry Smith } 1283ce308e1dSBarry Smith /* coupling with process to the right */ 1284ce308e1dSBarry Smith for (i=xs+nx-s; i<xs+nx; i++) { 1285ce308e1dSBarry Smith for (j=0; j<nc; j++) { 1286ce308e1dSBarry Smith cnt = 0; 1287ce308e1dSBarry Smith for (l=0; l<s; l++) { 1288ce308e1dSBarry Smith for (k=ofill[j]; k<ofill[j+1]; k++) cols[cnt++] = (i - s + l)*nc + ofill[k]; 1289ce308e1dSBarry Smith } 1290*0acb5bebSBarry Smith if (dfill) { 1291*0acb5bebSBarry Smith for (k=dfill[j]; k<dfill[j+1]; k++) { 1292*0acb5bebSBarry Smith cols[cnt++] = i*nc + dfill[k]; 1293*0acb5bebSBarry Smith } 1294*0acb5bebSBarry Smith } else { 1295ce308e1dSBarry Smith for (k=0; k<nc; k++) { 1296ce308e1dSBarry Smith cols[cnt++] = i*nc + k; 1297ce308e1dSBarry Smith } 1298*0acb5bebSBarry Smith } 1299ce308e1dSBarry Smith if (rank < size-1) { 1300ce308e1dSBarry Smith for (l=0; l<s; l++) { 1301ce308e1dSBarry Smith for (k=ofill[j]; k<ofill[j+1]; k++) cols[cnt++] = (i + s - l)*nc + ofill[k]; 1302ce308e1dSBarry Smith } 1303ce308e1dSBarry Smith } 1304ce308e1dSBarry Smith ierr = MatSetValues(J,1,&row,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 1305ce308e1dSBarry Smith row++; 1306ce308e1dSBarry Smith } 1307ce308e1dSBarry Smith } 1308ce308e1dSBarry Smith ierr = PetscFree(values);CHKERRQ(ierr); 1309ce308e1dSBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1310ce308e1dSBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1311ce308e1dSBarry Smith ierr = PetscFree(cols);CHKERRQ(ierr); 1312ce308e1dSBarry Smith } 1313ce308e1dSBarry Smith PetscFunctionReturn(0); 1314ce308e1dSBarry Smith } 1315ce308e1dSBarry Smith 1316ce308e1dSBarry Smith /* ---------------------------------------------------------------------------------*/ 1317ce308e1dSBarry Smith 1318ce308e1dSBarry Smith #undef __FUNCT__ 1319950540a4SJed Brown #define __FUNCT__ "DMCreateMatrix_DA_1d_MPIAIJ" 1320950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_1d_MPIAIJ(DM da,Mat J) 132147c6ae99SBarry Smith { 132247c6ae99SBarry Smith PetscErrorCode ierr; 132347c6ae99SBarry Smith PetscInt xs,nx,i,i1,slot,gxs,gnx; 13240298fd71SBarry Smith PetscInt m,dim,s,*cols = NULL,nc,*rows = NULL,col,cnt,l; 132547c6ae99SBarry Smith PetscInt istart,iend; 132647c6ae99SBarry Smith PetscScalar *values; 13271321219cSEthan Coon DMDABoundaryType bx; 132847c6ae99SBarry Smith ISLocalToGlobalMapping ltog,ltogb; 132947c6ae99SBarry Smith 133047c6ae99SBarry Smith PetscFunctionBegin; 133147c6ae99SBarry Smith /* 133247c6ae99SBarry Smith nc - number of components per grid point 133347c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 133447c6ae99SBarry Smith 133547c6ae99SBarry Smith */ 13361321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,0,0,0,0,0,&nc,&s,&bx,0,0,0);CHKERRQ(ierr); 133747c6ae99SBarry Smith col = 2*s + 1; 133847c6ae99SBarry Smith 1339aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,0,0,&nx,0,0);CHKERRQ(ierr); 1340aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,0,0,&gnx,0,0);CHKERRQ(ierr); 134147c6ae99SBarry Smith 1342f73d5cc4SBarry Smith ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr); 134347c6ae99SBarry Smith ierr = MatSeqAIJSetPreallocation(J,col*nc,0);CHKERRQ(ierr); 134447c6ae99SBarry Smith ierr = MatMPIAIJSetPreallocation(J,col*nc,0,col*nc,0);CHKERRQ(ierr); 134547c6ae99SBarry Smith 13461411c6eeSJed Brown ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 13471411c6eeSJed Brown ierr = DMGetLocalToGlobalMappingBlock(da,<ogb);CHKERRQ(ierr); 1348784ac674SJed Brown ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 1349784ac674SJed Brown ierr = MatSetLocalToGlobalMappingBlock(J,ltogb,ltogb);CHKERRQ(ierr); 135047c6ae99SBarry Smith 135147c6ae99SBarry Smith /* 135247c6ae99SBarry Smith For each node in the grid: we get the neighbors in the local (on processor ordering 135347c6ae99SBarry Smith that includes the ghost points) then MatSetValuesLocal() maps those indices to the global 135447c6ae99SBarry Smith PETSc ordering. 135547c6ae99SBarry Smith */ 1356fcfd50ebSBarry Smith if (!da->prealloc_only) { 1357ce308e1dSBarry Smith ierr = PetscMalloc2(nc,PetscInt,&rows,col*nc*nc,PetscInt,&cols);CHKERRQ(ierr); 135847c6ae99SBarry Smith ierr = PetscMalloc(col*nc*nc*sizeof(PetscScalar),&values);CHKERRQ(ierr); 135947c6ae99SBarry Smith ierr = PetscMemzero(values,col*nc*nc*sizeof(PetscScalar));CHKERRQ(ierr); 136047c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 136147c6ae99SBarry Smith istart = PetscMax(-s,gxs - i); 136247c6ae99SBarry Smith iend = PetscMin(s,gxs + gnx - i - 1); 136347c6ae99SBarry Smith slot = i - gxs; 136447c6ae99SBarry Smith 136547c6ae99SBarry Smith cnt = 0; 136647c6ae99SBarry Smith for (l=0; l<nc; l++) { 136747c6ae99SBarry Smith for (i1=istart; i1<iend+1; i1++) { 136847c6ae99SBarry Smith cols[cnt++] = l + nc*(slot + i1); 136947c6ae99SBarry Smith } 137047c6ae99SBarry Smith rows[l] = l + nc*(slot); 137147c6ae99SBarry Smith } 137247c6ae99SBarry Smith ierr = MatSetValuesLocal(J,nc,rows,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 137347c6ae99SBarry Smith } 137447c6ae99SBarry Smith ierr = PetscFree(values);CHKERRQ(ierr); 137547c6ae99SBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 137647c6ae99SBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 137747c6ae99SBarry Smith ierr = PetscFree2(rows,cols);CHKERRQ(ierr); 1378ce308e1dSBarry Smith } 137947c6ae99SBarry Smith PetscFunctionReturn(0); 138047c6ae99SBarry Smith } 138147c6ae99SBarry Smith 138247c6ae99SBarry Smith #undef __FUNCT__ 1383950540a4SJed Brown #define __FUNCT__ "DMCreateMatrix_DA_2d_MPIBAIJ" 1384950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_2d_MPIBAIJ(DM da,Mat J) 138547c6ae99SBarry Smith { 138647c6ae99SBarry Smith PetscErrorCode ierr; 138747c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny; 138847c6ae99SBarry Smith PetscInt m,n,dim,s,*cols,nc,col,cnt,*dnz,*onz; 138947c6ae99SBarry Smith PetscInt istart,iend,jstart,jend,ii,jj; 139047c6ae99SBarry Smith MPI_Comm comm; 139147c6ae99SBarry Smith PetscScalar *values; 13921321219cSEthan Coon DMDABoundaryType bx,by; 1393aa219208SBarry Smith DMDAStencilType st; 139447c6ae99SBarry Smith ISLocalToGlobalMapping ltog,ltogb; 139547c6ae99SBarry Smith 139647c6ae99SBarry Smith PetscFunctionBegin; 139747c6ae99SBarry Smith /* 139847c6ae99SBarry Smith nc - number of components per grid point 139947c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 140047c6ae99SBarry Smith */ 14011321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,0,0,0,0,&nc,&s,&bx,&by,0,&st);CHKERRQ(ierr); 140247c6ae99SBarry Smith col = 2*s + 1; 140347c6ae99SBarry Smith 1404aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr); 1405aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr); 140647c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 140747c6ae99SBarry Smith 140847c6ae99SBarry Smith ierr = PetscMalloc(col*col*nc*nc*sizeof(PetscInt),&cols);CHKERRQ(ierr); 140947c6ae99SBarry Smith 14101411c6eeSJed Brown ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 14111411c6eeSJed Brown ierr = DMGetLocalToGlobalMappingBlock(da,<ogb);CHKERRQ(ierr); 141247c6ae99SBarry Smith 141347c6ae99SBarry Smith /* determine the matrix preallocation information */ 141447c6ae99SBarry Smith ierr = MatPreallocateInitialize(comm,nx*ny,nx*ny,dnz,onz);CHKERRQ(ierr); 141547c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 14161321219cSEthan Coon istart = (bx == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 14171321219cSEthan Coon iend = (bx == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 141847c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 14191321219cSEthan Coon jstart = (by == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 14201321219cSEthan Coon jend = (by == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 142147c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys); 142247c6ae99SBarry Smith 142347c6ae99SBarry Smith /* Find block columns in block row */ 142447c6ae99SBarry Smith cnt = 0; 142547c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 142647c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 1427aa219208SBarry Smith if (st == DMDA_STENCIL_BOX || !ii || !jj) { /* BOX or on the STAR */ 142847c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj; 142947c6ae99SBarry Smith } 143047c6ae99SBarry Smith } 143147c6ae99SBarry Smith } 1432784ac674SJed Brown ierr = MatPreallocateSetLocal(ltogb,1,&slot,ltogb,cnt,cols,dnz,onz);CHKERRQ(ierr); 143347c6ae99SBarry Smith } 143447c6ae99SBarry Smith } 143547c6ae99SBarry Smith ierr = MatSeqBAIJSetPreallocation(J,nc,0,dnz);CHKERRQ(ierr); 143647c6ae99SBarry Smith ierr = MatMPIBAIJSetPreallocation(J,nc,0,dnz,0,onz);CHKERRQ(ierr); 143747c6ae99SBarry Smith ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 143847c6ae99SBarry Smith 1439784ac674SJed Brown ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 1440784ac674SJed Brown ierr = MatSetLocalToGlobalMappingBlock(J,ltogb,ltogb);CHKERRQ(ierr); 144147c6ae99SBarry Smith 144247c6ae99SBarry Smith /* 144347c6ae99SBarry Smith For each node in the grid: we get the neighbors in the local (on processor ordering 144447c6ae99SBarry Smith that includes the ghost points) then MatSetValuesLocal() maps those indices to the global 144547c6ae99SBarry Smith PETSc ordering. 144647c6ae99SBarry Smith */ 1447fcfd50ebSBarry Smith if (!da->prealloc_only) { 144847c6ae99SBarry Smith ierr = PetscMalloc(col*col*nc*nc*sizeof(PetscScalar),&values);CHKERRQ(ierr); 144947c6ae99SBarry Smith ierr = PetscMemzero(values,col*col*nc*nc*sizeof(PetscScalar));CHKERRQ(ierr); 145047c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 14511321219cSEthan Coon istart = (bx == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 14521321219cSEthan Coon iend = (bx == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 145347c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 14541321219cSEthan Coon jstart = (by == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 14551321219cSEthan Coon jend = (by == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 145647c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys); 145747c6ae99SBarry Smith cnt = 0; 145847c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 145947c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 1460aa219208SBarry Smith if (st == DMDA_STENCIL_BOX || !ii || !jj) { /* BOX or on the STAR */ 146147c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj; 146247c6ae99SBarry Smith } 146347c6ae99SBarry Smith } 146447c6ae99SBarry Smith } 146547c6ae99SBarry Smith ierr = MatSetValuesBlockedLocal(J,1,&slot,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 146647c6ae99SBarry Smith } 146747c6ae99SBarry Smith } 146847c6ae99SBarry Smith ierr = PetscFree(values);CHKERRQ(ierr); 146947c6ae99SBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 147047c6ae99SBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 147147c6ae99SBarry Smith } 147247c6ae99SBarry Smith ierr = PetscFree(cols);CHKERRQ(ierr); 147347c6ae99SBarry Smith PetscFunctionReturn(0); 147447c6ae99SBarry Smith } 147547c6ae99SBarry Smith 147647c6ae99SBarry Smith #undef __FUNCT__ 1477950540a4SJed Brown #define __FUNCT__ "DMCreateMatrix_DA_3d_MPIBAIJ" 1478950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_3d_MPIBAIJ(DM da,Mat J) 147947c6ae99SBarry Smith { 148047c6ae99SBarry Smith PetscErrorCode ierr; 148147c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny; 148247c6ae99SBarry Smith PetscInt m,n,dim,s,*cols,k,nc,col,cnt,p,*dnz,*onz; 148347c6ae99SBarry Smith PetscInt istart,iend,jstart,jend,kstart,kend,zs,nz,gzs,gnz,ii,jj,kk; 148447c6ae99SBarry Smith MPI_Comm comm; 148547c6ae99SBarry Smith PetscScalar *values; 14861321219cSEthan Coon DMDABoundaryType bx,by,bz; 1487aa219208SBarry Smith DMDAStencilType st; 148847c6ae99SBarry Smith ISLocalToGlobalMapping ltog,ltogb; 148947c6ae99SBarry Smith 149047c6ae99SBarry Smith PetscFunctionBegin; 149147c6ae99SBarry Smith /* 149247c6ae99SBarry Smith nc - number of components per grid point 149347c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 149447c6ae99SBarry Smith 149547c6ae99SBarry Smith */ 14961321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,&p,0,0,0,&nc,&s,&bx,&by,&bz,&st);CHKERRQ(ierr); 149747c6ae99SBarry Smith col = 2*s + 1; 149847c6ae99SBarry Smith 1499aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,&zs,&nx,&ny,&nz);CHKERRQ(ierr); 1500aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,&gzs,&gnx,&gny,&gnz);CHKERRQ(ierr); 150147c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 150247c6ae99SBarry Smith 150347c6ae99SBarry Smith ierr = PetscMalloc(col*col*col*sizeof(PetscInt),&cols);CHKERRQ(ierr); 150447c6ae99SBarry Smith 15051411c6eeSJed Brown ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 15061411c6eeSJed Brown ierr = DMGetLocalToGlobalMappingBlock(da,<ogb);CHKERRQ(ierr); 150747c6ae99SBarry Smith 150847c6ae99SBarry Smith /* determine the matrix preallocation information */ 150947c6ae99SBarry Smith ierr = MatPreallocateInitialize(comm,nx*ny*nz,nx*ny*nz,dnz,onz);CHKERRQ(ierr); 151047c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 15111321219cSEthan Coon istart = (bx == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 15121321219cSEthan Coon iend = (bx == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 151347c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 15141321219cSEthan Coon jstart = (by == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 15151321219cSEthan Coon jend = (by == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 151647c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 15171321219cSEthan Coon kstart = (bz == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k)); 15181321219cSEthan Coon kend = (bz == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,p-k-1)); 151947c6ae99SBarry Smith 152047c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 152147c6ae99SBarry Smith 152247c6ae99SBarry Smith /* Find block columns in block row */ 152347c6ae99SBarry Smith cnt = 0; 152447c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 152547c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 152647c6ae99SBarry Smith for (kk=kstart; kk<kend+1; kk++) { 1527aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/ 152847c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj + gnx*gny*kk; 152947c6ae99SBarry Smith } 153047c6ae99SBarry Smith } 153147c6ae99SBarry Smith } 153247c6ae99SBarry Smith } 1533784ac674SJed Brown ierr = MatPreallocateSetLocal(ltogb,1,&slot,ltogb,cnt,cols,dnz,onz);CHKERRQ(ierr); 153447c6ae99SBarry Smith } 153547c6ae99SBarry Smith } 153647c6ae99SBarry Smith } 153747c6ae99SBarry Smith ierr = MatSeqBAIJSetPreallocation(J,nc,0,dnz);CHKERRQ(ierr); 153847c6ae99SBarry Smith ierr = MatMPIBAIJSetPreallocation(J,nc,0,dnz,0,onz);CHKERRQ(ierr); 153947c6ae99SBarry Smith ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 154047c6ae99SBarry Smith 1541784ac674SJed Brown ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 1542784ac674SJed Brown ierr = MatSetLocalToGlobalMappingBlock(J,ltogb,ltogb);CHKERRQ(ierr); 154347c6ae99SBarry Smith 154447c6ae99SBarry Smith /* 154547c6ae99SBarry Smith For each node in the grid: we get the neighbors in the local (on processor ordering 154647c6ae99SBarry Smith that includes the ghost points) then MatSetValuesLocal() maps those indices to the global 154747c6ae99SBarry Smith PETSc ordering. 154847c6ae99SBarry Smith */ 1549fcfd50ebSBarry Smith if (!da->prealloc_only) { 155047c6ae99SBarry Smith ierr = PetscMalloc(col*col*col*nc*nc*sizeof(PetscScalar),&values);CHKERRQ(ierr); 155147c6ae99SBarry Smith ierr = PetscMemzero(values,col*col*col*nc*nc*sizeof(PetscScalar));CHKERRQ(ierr); 155247c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 15531321219cSEthan Coon istart = (bx == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 15541321219cSEthan Coon iend = (bx == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 155547c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 15561321219cSEthan Coon jstart = (by == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 15571321219cSEthan Coon jend = (by == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 155847c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 15591321219cSEthan Coon kstart = (bz == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k)); 15601321219cSEthan Coon kend = (bz == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,p-k-1)); 156147c6ae99SBarry Smith 156247c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 156347c6ae99SBarry Smith 156447c6ae99SBarry Smith cnt = 0; 156547c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 156647c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 156747c6ae99SBarry Smith for (kk=kstart; kk<kend+1; kk++) { 1568aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/ 156947c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj + gnx*gny*kk; 157047c6ae99SBarry Smith } 157147c6ae99SBarry Smith } 157247c6ae99SBarry Smith } 157347c6ae99SBarry Smith } 157447c6ae99SBarry Smith ierr = MatSetValuesBlockedLocal(J,1,&slot,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 157547c6ae99SBarry Smith } 157647c6ae99SBarry Smith } 157747c6ae99SBarry Smith } 157847c6ae99SBarry Smith ierr = PetscFree(values);CHKERRQ(ierr); 157947c6ae99SBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 158047c6ae99SBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 158147c6ae99SBarry Smith } 158247c6ae99SBarry Smith ierr = PetscFree(cols);CHKERRQ(ierr); 158347c6ae99SBarry Smith PetscFunctionReturn(0); 158447c6ae99SBarry Smith } 158547c6ae99SBarry Smith 158647c6ae99SBarry Smith #undef __FUNCT__ 158747c6ae99SBarry Smith #define __FUNCT__ "L2GFilterUpperTriangular" 158847c6ae99SBarry Smith /* 158947c6ae99SBarry Smith This helper is for of SBAIJ preallocation, to discard the lower-triangular values which are difficult to 159047c6ae99SBarry Smith identify in the local ordering with periodic domain. 159147c6ae99SBarry Smith */ 159247c6ae99SBarry Smith static PetscErrorCode L2GFilterUpperTriangular(ISLocalToGlobalMapping ltog,PetscInt *row,PetscInt *cnt,PetscInt col[]) 159347c6ae99SBarry Smith { 159447c6ae99SBarry Smith PetscErrorCode ierr; 159547c6ae99SBarry Smith PetscInt i,n; 159647c6ae99SBarry Smith 159747c6ae99SBarry Smith PetscFunctionBegin; 159847c6ae99SBarry Smith ierr = ISLocalToGlobalMappingApply(ltog,1,row,row);CHKERRQ(ierr); 159947c6ae99SBarry Smith ierr = ISLocalToGlobalMappingApply(ltog,*cnt,col,col);CHKERRQ(ierr); 160047c6ae99SBarry Smith for (i=0,n=0; i<*cnt; i++) { 160147c6ae99SBarry Smith if (col[i] >= *row) col[n++] = col[i]; 160247c6ae99SBarry Smith } 160347c6ae99SBarry Smith *cnt = n; 160447c6ae99SBarry Smith PetscFunctionReturn(0); 160547c6ae99SBarry Smith } 160647c6ae99SBarry Smith 160747c6ae99SBarry Smith #undef __FUNCT__ 1608950540a4SJed Brown #define __FUNCT__ "DMCreateMatrix_DA_2d_MPISBAIJ" 1609950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_2d_MPISBAIJ(DM da,Mat J) 161047c6ae99SBarry Smith { 161147c6ae99SBarry Smith PetscErrorCode ierr; 161247c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny; 161347c6ae99SBarry Smith PetscInt m,n,dim,s,*cols,nc,col,cnt,*dnz,*onz; 161447c6ae99SBarry Smith PetscInt istart,iend,jstart,jend,ii,jj; 161547c6ae99SBarry Smith MPI_Comm comm; 161647c6ae99SBarry Smith PetscScalar *values; 16171321219cSEthan Coon DMDABoundaryType bx,by; 1618aa219208SBarry Smith DMDAStencilType st; 161947c6ae99SBarry Smith ISLocalToGlobalMapping ltog,ltogb; 162047c6ae99SBarry Smith 162147c6ae99SBarry Smith PetscFunctionBegin; 162247c6ae99SBarry Smith /* 162347c6ae99SBarry Smith nc - number of components per grid point 162447c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 162547c6ae99SBarry Smith */ 16261321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,0,0,0,0,&nc,&s,&bx,&by,0,&st);CHKERRQ(ierr); 162747c6ae99SBarry Smith col = 2*s + 1; 162847c6ae99SBarry Smith 1629aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr); 1630aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr); 163147c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 163247c6ae99SBarry Smith 163347c6ae99SBarry Smith ierr = PetscMalloc(col*col*nc*nc*sizeof(PetscInt),&cols);CHKERRQ(ierr); 163447c6ae99SBarry Smith 16351411c6eeSJed Brown ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 16361411c6eeSJed Brown ierr = DMGetLocalToGlobalMappingBlock(da,<ogb);CHKERRQ(ierr); 163747c6ae99SBarry Smith 163847c6ae99SBarry Smith /* determine the matrix preallocation information */ 1639eabe889fSLisandro Dalcin ierr = MatPreallocateInitialize(comm,nx*ny,nx*ny,dnz,onz);CHKERRQ(ierr); 164047c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 16411321219cSEthan Coon istart = (bx == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 16421321219cSEthan Coon iend = (bx == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 164347c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 16441321219cSEthan Coon jstart = (by == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 16451321219cSEthan Coon jend = (by == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 164647c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys); 164747c6ae99SBarry Smith 164847c6ae99SBarry Smith /* Find block columns in block row */ 164947c6ae99SBarry Smith cnt = 0; 165047c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 165147c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 1652aa219208SBarry Smith if (st == DMDA_STENCIL_BOX || !ii || !jj) { 165347c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj; 165447c6ae99SBarry Smith } 165547c6ae99SBarry Smith } 165647c6ae99SBarry Smith } 165747c6ae99SBarry Smith ierr = L2GFilterUpperTriangular(ltogb,&slot,&cnt,cols);CHKERRQ(ierr); 165847c6ae99SBarry Smith ierr = MatPreallocateSymmetricSet(slot,cnt,cols,dnz,onz);CHKERRQ(ierr); 165947c6ae99SBarry Smith } 166047c6ae99SBarry Smith } 166147c6ae99SBarry Smith ierr = MatSeqSBAIJSetPreallocation(J,nc,0,dnz);CHKERRQ(ierr); 166247c6ae99SBarry Smith ierr = MatMPISBAIJSetPreallocation(J,nc,0,dnz,0,onz);CHKERRQ(ierr); 166347c6ae99SBarry Smith ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 166447c6ae99SBarry Smith 1665784ac674SJed Brown ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 1666784ac674SJed Brown ierr = MatSetLocalToGlobalMappingBlock(J,ltogb,ltogb);CHKERRQ(ierr); 166747c6ae99SBarry Smith 166847c6ae99SBarry Smith /* 166947c6ae99SBarry Smith For each node in the grid: we get the neighbors in the local (on processor ordering 167047c6ae99SBarry Smith that includes the ghost points) then MatSetValuesLocal() maps those indices to the global 167147c6ae99SBarry Smith PETSc ordering. 167247c6ae99SBarry Smith */ 1673fcfd50ebSBarry Smith if (!da->prealloc_only) { 167447c6ae99SBarry Smith ierr = PetscMalloc(col*col*nc*nc*sizeof(PetscScalar),&values);CHKERRQ(ierr); 167547c6ae99SBarry Smith ierr = PetscMemzero(values,col*col*nc*nc*sizeof(PetscScalar));CHKERRQ(ierr); 167647c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 16771321219cSEthan Coon istart = (bx == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 16781321219cSEthan Coon iend = (bx == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 167947c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 16801321219cSEthan Coon jstart = (by == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 16811321219cSEthan Coon jend = (by == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 168247c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys); 168347c6ae99SBarry Smith 168447c6ae99SBarry Smith /* Find block columns in block row */ 168547c6ae99SBarry Smith cnt = 0; 168647c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 168747c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 1688aa219208SBarry Smith if (st == DMDA_STENCIL_BOX || !ii || !jj) { 168947c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj; 169047c6ae99SBarry Smith } 169147c6ae99SBarry Smith } 169247c6ae99SBarry Smith } 169347c6ae99SBarry Smith ierr = L2GFilterUpperTriangular(ltogb,&slot,&cnt,cols);CHKERRQ(ierr); 169447c6ae99SBarry Smith ierr = MatSetValuesBlocked(J,1,&slot,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 169547c6ae99SBarry Smith } 169647c6ae99SBarry Smith } 169747c6ae99SBarry Smith ierr = PetscFree(values);CHKERRQ(ierr); 169847c6ae99SBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 169947c6ae99SBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 170047c6ae99SBarry Smith } 170147c6ae99SBarry Smith ierr = PetscFree(cols);CHKERRQ(ierr); 170247c6ae99SBarry Smith PetscFunctionReturn(0); 170347c6ae99SBarry Smith } 170447c6ae99SBarry Smith 170547c6ae99SBarry Smith #undef __FUNCT__ 1706950540a4SJed Brown #define __FUNCT__ "DMCreateMatrix_DA_3d_MPISBAIJ" 1707950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_3d_MPISBAIJ(DM da,Mat J) 170847c6ae99SBarry Smith { 170947c6ae99SBarry Smith PetscErrorCode ierr; 171047c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny; 171147c6ae99SBarry Smith PetscInt m,n,dim,s,*cols,k,nc,col,cnt,p,*dnz,*onz; 171247c6ae99SBarry Smith PetscInt istart,iend,jstart,jend,kstart,kend,zs,nz,gzs,gnz,ii,jj,kk; 171347c6ae99SBarry Smith MPI_Comm comm; 171447c6ae99SBarry Smith PetscScalar *values; 17151321219cSEthan Coon DMDABoundaryType bx,by,bz; 1716aa219208SBarry Smith DMDAStencilType st; 171747c6ae99SBarry Smith ISLocalToGlobalMapping ltog,ltogb; 171847c6ae99SBarry Smith 171947c6ae99SBarry Smith PetscFunctionBegin; 172047c6ae99SBarry Smith /* 172147c6ae99SBarry Smith nc - number of components per grid point 172247c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 172347c6ae99SBarry Smith */ 17241321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,&p,0,0,0,&nc,&s,&bx,&by,&bz,&st);CHKERRQ(ierr); 172547c6ae99SBarry Smith col = 2*s + 1; 172647c6ae99SBarry Smith 1727aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,&zs,&nx,&ny,&nz);CHKERRQ(ierr); 1728aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,&gzs,&gnx,&gny,&gnz);CHKERRQ(ierr); 172947c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 173047c6ae99SBarry Smith 173147c6ae99SBarry Smith /* create the matrix */ 173247c6ae99SBarry Smith ierr = PetscMalloc(col*col*col*sizeof(PetscInt),&cols);CHKERRQ(ierr); 173347c6ae99SBarry Smith 17341411c6eeSJed Brown ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 17351411c6eeSJed Brown ierr = DMGetLocalToGlobalMappingBlock(da,<ogb);CHKERRQ(ierr); 173647c6ae99SBarry Smith 173747c6ae99SBarry Smith /* determine the matrix preallocation information */ 1738eabe889fSLisandro Dalcin ierr = MatPreallocateInitialize(comm,nx*ny*nz,nx*ny*nz,dnz,onz);CHKERRQ(ierr); 173947c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 17401321219cSEthan Coon istart = (bx == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 17411321219cSEthan Coon iend = (bx == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 174247c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 17431321219cSEthan Coon jstart = (by == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 17441321219cSEthan Coon jend = (by == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 174547c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 17461321219cSEthan Coon kstart = (bz == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k)); 17471321219cSEthan Coon kend = (bz == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,p-k-1)); 174847c6ae99SBarry Smith 174947c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 175047c6ae99SBarry Smith 175147c6ae99SBarry Smith /* Find block columns in block row */ 175247c6ae99SBarry Smith cnt = 0; 175347c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 175447c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 175547c6ae99SBarry Smith for (kk=kstart; kk<kend+1; kk++) { 1756aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || (!ii && !jj) || (!jj && !kk) || (!ii && !kk)) { 175747c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj + gnx*gny*kk; 175847c6ae99SBarry Smith } 175947c6ae99SBarry Smith } 176047c6ae99SBarry Smith } 176147c6ae99SBarry Smith } 176247c6ae99SBarry Smith ierr = L2GFilterUpperTriangular(ltogb,&slot,&cnt,cols);CHKERRQ(ierr); 176347c6ae99SBarry Smith ierr = MatPreallocateSymmetricSet(slot,cnt,cols,dnz,onz);CHKERRQ(ierr); 176447c6ae99SBarry Smith } 176547c6ae99SBarry Smith } 176647c6ae99SBarry Smith } 176747c6ae99SBarry Smith ierr = MatSeqSBAIJSetPreallocation(J,nc,0,dnz);CHKERRQ(ierr); 176847c6ae99SBarry Smith ierr = MatMPISBAIJSetPreallocation(J,nc,0,dnz,0,onz);CHKERRQ(ierr); 176947c6ae99SBarry Smith ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 177047c6ae99SBarry Smith 1771784ac674SJed Brown ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 1772784ac674SJed Brown ierr = MatSetLocalToGlobalMappingBlock(J,ltogb,ltogb);CHKERRQ(ierr); 177347c6ae99SBarry Smith 177447c6ae99SBarry Smith /* 177547c6ae99SBarry Smith For each node in the grid: we get the neighbors in the local (on processor ordering 177647c6ae99SBarry Smith that includes the ghost points) then MatSetValuesLocal() maps those indices to the global 177747c6ae99SBarry Smith PETSc ordering. 177847c6ae99SBarry Smith */ 1779fcfd50ebSBarry Smith if (!da->prealloc_only) { 178047c6ae99SBarry Smith ierr = PetscMalloc(col*col*col*nc*nc*sizeof(PetscScalar),&values);CHKERRQ(ierr); 178147c6ae99SBarry Smith ierr = PetscMemzero(values,col*col*col*nc*nc*sizeof(PetscScalar));CHKERRQ(ierr); 178247c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 17831321219cSEthan Coon istart = (bx == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 17841321219cSEthan Coon iend = (bx == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 178547c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 17861321219cSEthan Coon jstart = (by == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 17871321219cSEthan Coon jend = (by == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 178847c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 17891321219cSEthan Coon kstart = (bz == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k)); 17901321219cSEthan Coon kend = (bz == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,p-k-1)); 179147c6ae99SBarry Smith 179247c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 179347c6ae99SBarry Smith 179447c6ae99SBarry Smith cnt = 0; 179547c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 179647c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 179747c6ae99SBarry Smith for (kk=kstart; kk<kend+1; kk++) { 1798aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || (!ii && !jj) || (!jj && !kk) || (!ii && !kk)) { 179947c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj + gnx*gny*kk; 180047c6ae99SBarry Smith } 180147c6ae99SBarry Smith } 180247c6ae99SBarry Smith } 180347c6ae99SBarry Smith } 180447c6ae99SBarry Smith ierr = L2GFilterUpperTriangular(ltogb,&slot,&cnt,cols);CHKERRQ(ierr); 180547c6ae99SBarry Smith ierr = MatSetValuesBlocked(J,1,&slot,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 180647c6ae99SBarry Smith } 180747c6ae99SBarry Smith } 180847c6ae99SBarry Smith } 180947c6ae99SBarry Smith ierr = PetscFree(values);CHKERRQ(ierr); 181047c6ae99SBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 181147c6ae99SBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 181247c6ae99SBarry Smith } 181347c6ae99SBarry Smith ierr = PetscFree(cols);CHKERRQ(ierr); 181447c6ae99SBarry Smith PetscFunctionReturn(0); 181547c6ae99SBarry Smith } 181647c6ae99SBarry Smith 181747c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/ 181847c6ae99SBarry Smith 181947c6ae99SBarry Smith #undef __FUNCT__ 1820950540a4SJed Brown #define __FUNCT__ "DMCreateMatrix_DA_3d_MPIAIJ_Fill" 1821950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_3d_MPIAIJ_Fill(DM da,Mat J) 182247c6ae99SBarry Smith { 182347c6ae99SBarry Smith PetscErrorCode ierr; 182447c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny; 182547c6ae99SBarry Smith PetscInt m,n,dim,s,*cols,k,nc,row,col,cnt,l,p,*dnz,*onz; 182647c6ae99SBarry Smith PetscInt istart,iend,jstart,jend,kstart,kend,zs,nz,gzs,gnz,ii,jj,kk; 182747c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 182847c6ae99SBarry Smith PetscInt ifill_col,*dfill = dd->dfill,*ofill = dd->ofill; 182947c6ae99SBarry Smith MPI_Comm comm; 183047c6ae99SBarry Smith PetscScalar *values; 18311321219cSEthan Coon DMDABoundaryType bx,by,bz; 183247c6ae99SBarry Smith ISLocalToGlobalMapping ltog,ltogb; 1833aa219208SBarry Smith DMDAStencilType st; 183447c6ae99SBarry Smith 183547c6ae99SBarry Smith PetscFunctionBegin; 183647c6ae99SBarry Smith /* 183747c6ae99SBarry Smith nc - number of components per grid point 183847c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 183947c6ae99SBarry Smith 184047c6ae99SBarry Smith */ 18411321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,&p,0,0,0,&nc,&s,&bx,&by,&bz,&st);CHKERRQ(ierr); 184247c6ae99SBarry Smith col = 2*s + 1; 1843ce94432eSBarry Smith if (bx == DMDA_BOUNDARY_PERIODIC && (m % col)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in X is divisible\n\ 184447c6ae99SBarry Smith by 2*stencil_width + 1\n"); 1845ce94432eSBarry Smith if (by == DMDA_BOUNDARY_PERIODIC && (n % col)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Y is divisible\n\ 184647c6ae99SBarry Smith by 2*stencil_width + 1\n"); 1847ce94432eSBarry Smith if (bz == DMDA_BOUNDARY_PERIODIC && (p % col)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Z is divisible\n\ 184847c6ae99SBarry Smith by 2*stencil_width + 1\n"); 184947c6ae99SBarry Smith 1850aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,&zs,&nx,&ny,&nz);CHKERRQ(ierr); 1851aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,&gzs,&gnx,&gny,&gnz);CHKERRQ(ierr); 185247c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 185347c6ae99SBarry Smith 185447c6ae99SBarry Smith ierr = PetscMalloc(col*col*col*nc*sizeof(PetscInt),&cols);CHKERRQ(ierr); 18551411c6eeSJed Brown ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 18561411c6eeSJed Brown ierr = DMGetLocalToGlobalMappingBlock(da,<ogb);CHKERRQ(ierr); 185747c6ae99SBarry Smith 185847c6ae99SBarry Smith /* determine the matrix preallocation information */ 185947c6ae99SBarry Smith ierr = MatPreallocateInitialize(comm,nc*nx*ny*nz,nc*nx*ny*nz,dnz,onz);CHKERRQ(ierr); 186047c6ae99SBarry Smith 186147c6ae99SBarry Smith 186247c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 18631321219cSEthan Coon istart = (bx == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 18641321219cSEthan Coon iend = (bx == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 186547c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 18661321219cSEthan Coon jstart = (by == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 18671321219cSEthan Coon jend = (by == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 186847c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 18691321219cSEthan Coon kstart = (bz == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k)); 18701321219cSEthan Coon kend = (bz == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,p-k-1)); 187147c6ae99SBarry Smith 187247c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 187347c6ae99SBarry Smith 187447c6ae99SBarry Smith for (l=0; l<nc; l++) { 187547c6ae99SBarry Smith cnt = 0; 187647c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 187747c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 187847c6ae99SBarry Smith for (kk=kstart; kk<kend+1; kk++) { 187947c6ae99SBarry Smith if (ii || jj || kk) { 1880aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/ 18818865f1eaSKarl Rupp for (ifill_col=ofill[l]; ifill_col<ofill[l+1]; ifill_col++) cols[cnt++] = ofill[ifill_col] + nc*(slot + ii + gnx*jj + gnx*gny*kk); 188247c6ae99SBarry Smith } 188347c6ae99SBarry Smith } else { 188447c6ae99SBarry Smith if (dfill) { 18858865f1eaSKarl Rupp for (ifill_col=dfill[l]; ifill_col<dfill[l+1]; ifill_col++) cols[cnt++] = dfill[ifill_col] + nc*(slot + ii + gnx*jj + gnx*gny*kk); 188647c6ae99SBarry Smith } else { 18878865f1eaSKarl Rupp for (ifill_col=0; ifill_col<nc; ifill_col++) cols[cnt++] = ifill_col + nc*(slot + ii + gnx*jj + gnx*gny*kk); 188847c6ae99SBarry Smith } 188947c6ae99SBarry Smith } 189047c6ae99SBarry Smith } 189147c6ae99SBarry Smith } 189247c6ae99SBarry Smith } 189347c6ae99SBarry Smith row = l + nc*(slot); 1894784ac674SJed Brown ierr = MatPreallocateSetLocal(ltog,1,&row,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr); 189547c6ae99SBarry Smith } 189647c6ae99SBarry Smith } 189747c6ae99SBarry Smith } 189847c6ae99SBarry Smith } 189947c6ae99SBarry Smith ierr = MatSeqAIJSetPreallocation(J,0,dnz);CHKERRQ(ierr); 190047c6ae99SBarry Smith ierr = MatMPIAIJSetPreallocation(J,0,dnz,0,onz);CHKERRQ(ierr); 190147c6ae99SBarry Smith ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 1902784ac674SJed Brown ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 1903784ac674SJed Brown ierr = MatSetLocalToGlobalMappingBlock(J,ltogb,ltogb);CHKERRQ(ierr); 190447c6ae99SBarry Smith 190547c6ae99SBarry Smith /* 190647c6ae99SBarry Smith For each node in the grid: we get the neighbors in the local (on processor ordering 190747c6ae99SBarry Smith that includes the ghost points) then MatSetValuesLocal() maps those indices to the global 190847c6ae99SBarry Smith PETSc ordering. 190947c6ae99SBarry Smith */ 1910fcfd50ebSBarry Smith if (!da->prealloc_only) { 191147c6ae99SBarry Smith ierr = PetscMalloc(col*col*col*nc*nc*nc*sizeof(PetscScalar),&values);CHKERRQ(ierr); 191247c6ae99SBarry Smith ierr = PetscMemzero(values,col*col*col*nc*nc*nc*sizeof(PetscScalar));CHKERRQ(ierr); 191347c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 19141321219cSEthan Coon istart = (bx == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 19151321219cSEthan Coon iend = (bx == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 191647c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 19171321219cSEthan Coon jstart = (by == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 19181321219cSEthan Coon jend = (by == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 191947c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 19201321219cSEthan Coon kstart = (bz == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k)); 19211321219cSEthan Coon kend = (bz == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,p-k-1)); 192247c6ae99SBarry Smith 192347c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 192447c6ae99SBarry Smith 192547c6ae99SBarry Smith for (l=0; l<nc; l++) { 192647c6ae99SBarry Smith cnt = 0; 192747c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 192847c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 192947c6ae99SBarry Smith for (kk=kstart; kk<kend+1; kk++) { 193047c6ae99SBarry Smith if (ii || jj || kk) { 1931aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/ 19328865f1eaSKarl Rupp for (ifill_col=ofill[l]; ifill_col<ofill[l+1]; ifill_col++) cols[cnt++] = ofill[ifill_col] + nc*(slot + ii + gnx*jj + gnx*gny*kk); 193347c6ae99SBarry Smith } 193447c6ae99SBarry Smith } else { 193547c6ae99SBarry Smith if (dfill) { 19368865f1eaSKarl Rupp for (ifill_col=dfill[l]; ifill_col<dfill[l+1]; ifill_col++) cols[cnt++] = dfill[ifill_col] + nc*(slot + ii + gnx*jj + gnx*gny*kk); 193747c6ae99SBarry Smith } else { 19388865f1eaSKarl Rupp for (ifill_col=0; ifill_col<nc; ifill_col++) cols[cnt++] = ifill_col + nc*(slot + ii + gnx*jj + gnx*gny*kk); 193947c6ae99SBarry Smith } 194047c6ae99SBarry Smith } 194147c6ae99SBarry Smith } 194247c6ae99SBarry Smith } 194347c6ae99SBarry Smith } 194447c6ae99SBarry Smith row = l + nc*(slot); 194547c6ae99SBarry Smith ierr = MatSetValuesLocal(J,1,&row,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 194647c6ae99SBarry Smith } 194747c6ae99SBarry Smith } 194847c6ae99SBarry Smith } 194947c6ae99SBarry Smith } 195047c6ae99SBarry Smith ierr = PetscFree(values);CHKERRQ(ierr); 195147c6ae99SBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 195247c6ae99SBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 195347c6ae99SBarry Smith } 195447c6ae99SBarry Smith ierr = PetscFree(cols);CHKERRQ(ierr); 195547c6ae99SBarry Smith PetscFunctionReturn(0); 195647c6ae99SBarry Smith } 1957