147c6ae99SBarry Smith 2af0996ceSBarry Smith #include <petsc/private/dmdaimpl.h> /*I "petscdmda.h" I*/ 307475bc1SBarry Smith #include <petscmat.h> 447c6ae99SBarry Smith 5e727c939SJed Brown extern PetscErrorCode DMCreateColoring_DA_1d_MPIAIJ(DM,ISColoringType,ISColoring*); 6e727c939SJed Brown extern PetscErrorCode DMCreateColoring_DA_2d_MPIAIJ(DM,ISColoringType,ISColoring*); 7e727c939SJed Brown extern PetscErrorCode DMCreateColoring_DA_2d_5pt_MPIAIJ(DM,ISColoringType,ISColoring*); 8e727c939SJed Brown extern PetscErrorCode DMCreateColoring_DA_3d_MPIAIJ(DM,ISColoringType,ISColoring*); 947c6ae99SBarry Smith 1047c6ae99SBarry Smith /* 1147c6ae99SBarry Smith For ghost i that may be negative or greater than the upper bound this 1247c6ae99SBarry Smith maps it into the 0:m-1 range using periodicity 1347c6ae99SBarry Smith */ 1447c6ae99SBarry Smith #define SetInRange(i,m) ((i < 0) ? m+i : ((i >= m) ? i-m : i)) 1547c6ae99SBarry Smith 16ce308e1dSBarry Smith static PetscErrorCode DMDASetBlockFills_Private(const PetscInt *dfill,PetscInt w,PetscInt **rfill) 1747c6ae99SBarry Smith { 1847c6ae99SBarry Smith PetscErrorCode ierr; 1947c6ae99SBarry Smith PetscInt i,j,nz,*fill; 2047c6ae99SBarry Smith 2147c6ae99SBarry Smith PetscFunctionBegin; 2247c6ae99SBarry Smith if (!dfill) PetscFunctionReturn(0); 2347c6ae99SBarry Smith 2447c6ae99SBarry Smith /* count number nonzeros */ 2547c6ae99SBarry Smith nz = 0; 2647c6ae99SBarry Smith for (i=0; i<w; i++) { 2747c6ae99SBarry Smith for (j=0; j<w; j++) { 2847c6ae99SBarry Smith if (dfill[w*i+j]) nz++; 2947c6ae99SBarry Smith } 3047c6ae99SBarry Smith } 31854ce69bSBarry Smith ierr = PetscMalloc1(nz + w + 1,&fill);CHKERRQ(ierr); 3247c6ae99SBarry Smith /* construct modified CSR storage of nonzero structure */ 33ce308e1dSBarry Smith /* fill[0 -- w] marks starts of each row of column indices (and end of last row) 34ce308e1dSBarry Smith so fill[1] - fill[0] gives number of nonzeros in first row etc */ 3547c6ae99SBarry Smith nz = w + 1; 3647c6ae99SBarry Smith for 
(i=0; i<w; i++) { 3747c6ae99SBarry Smith fill[i] = nz; 3847c6ae99SBarry Smith for (j=0; j<w; j++) { 3947c6ae99SBarry Smith if (dfill[w*i+j]) { 4047c6ae99SBarry Smith fill[nz] = j; 4147c6ae99SBarry Smith nz++; 4247c6ae99SBarry Smith } 4347c6ae99SBarry Smith } 4447c6ae99SBarry Smith } 4547c6ae99SBarry Smith fill[w] = nz; 4647c6ae99SBarry Smith 4747c6ae99SBarry Smith *rfill = fill; 4847c6ae99SBarry Smith PetscFunctionReturn(0); 4947c6ae99SBarry Smith } 5047c6ae99SBarry Smith 5147c6ae99SBarry Smith /*@ 52aa219208SBarry Smith DMDASetBlockFills - Sets the fill pattern in each block for a multi-component problem 53950540a4SJed Brown of the matrix returned by DMCreateMatrix(). 5447c6ae99SBarry Smith 55aa219208SBarry Smith Logically Collective on DMDA 5647c6ae99SBarry Smith 5747c6ae99SBarry Smith Input Parameter: 5847c6ae99SBarry Smith + da - the distributed array 590298fd71SBarry Smith . dfill - the fill pattern in the diagonal block (may be NULL, means use dense block) 6047c6ae99SBarry Smith - ofill - the fill pattern in the off-diagonal blocks 6147c6ae99SBarry Smith 6247c6ae99SBarry Smith 6347c6ae99SBarry Smith Level: developer 6447c6ae99SBarry Smith 65*95452b02SPatrick Sanan Notes: 66*95452b02SPatrick Sanan This only makes sense when you are doing multicomponent problems but using the 6747c6ae99SBarry Smith MPIAIJ matrix format 6847c6ae99SBarry Smith 6947c6ae99SBarry Smith The format for dfill and ofill is a 2 dimensional dof by dof matrix with 1 entries 7047c6ae99SBarry Smith representing coupling and 0 entries for missing coupling. For example 7147c6ae99SBarry Smith $ dfill[9] = {1, 0, 0, 7247c6ae99SBarry Smith $ 1, 1, 0, 7347c6ae99SBarry Smith $ 0, 1, 1} 7447c6ae99SBarry Smith means that row 0 is coupled with only itself in the diagonal block, row 1 is coupled with 7547c6ae99SBarry Smith itself and row 0 (in the diagonal block) and row 2 is coupled with itself and row 1 (in the 7647c6ae99SBarry Smith diagonal block). 
7747c6ae99SBarry Smith 78aa219208SBarry Smith DMDASetGetMatrix() allows you to provide general code for those more complicated nonzero patterns then 7947c6ae99SBarry Smith can be represented in the dfill, ofill format 8047c6ae99SBarry Smith 8147c6ae99SBarry Smith Contributed by Glenn Hammond 8247c6ae99SBarry Smith 838ddb5d8bSBarry Smith .seealso DMCreateMatrix(), DMDASetGetMatrix(), DMSetMatrixPreallocateOnly() 8447c6ae99SBarry Smith 8547c6ae99SBarry Smith @*/ 86ce308e1dSBarry Smith PetscErrorCode DMDASetBlockFills(DM da,const PetscInt *dfill,const PetscInt *ofill) 8747c6ae99SBarry Smith { 8847c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 8947c6ae99SBarry Smith PetscErrorCode ierr; 90ae4f298aSBarry Smith PetscInt i,k,cnt = 1; 9147c6ae99SBarry Smith 9247c6ae99SBarry Smith PetscFunctionBegin; 93aa219208SBarry Smith ierr = DMDASetBlockFills_Private(dfill,dd->w,&dd->dfill);CHKERRQ(ierr); 94aa219208SBarry Smith ierr = DMDASetBlockFills_Private(ofill,dd->w,&dd->ofill);CHKERRQ(ierr); 95ae4f298aSBarry Smith 96ae4f298aSBarry Smith /* ofillcount tracks the columns of ofill that have any nonzero in thems; the value in each location is the number of 97ae4f298aSBarry Smith columns to the left with any nonzeros in them plus 1 */ 981795a4d1SJed Brown ierr = PetscCalloc1(dd->w,&dd->ofillcols);CHKERRQ(ierr); 99ae4f298aSBarry Smith for (i=0; i<dd->w; i++) { 100ae4f298aSBarry Smith for (k=dd->ofill[i]; k<dd->ofill[i+1]; k++) dd->ofillcols[dd->ofill[k]] = 1; 101ae4f298aSBarry Smith } 102ae4f298aSBarry Smith for (i=0; i<dd->w; i++) { 103ae4f298aSBarry Smith if (dd->ofillcols[i]) { 104ae4f298aSBarry Smith dd->ofillcols[i] = cnt++; 105ae4f298aSBarry Smith } 106ae4f298aSBarry Smith } 10747c6ae99SBarry Smith PetscFunctionReturn(0); 10847c6ae99SBarry Smith } 10947c6ae99SBarry Smith 11047c6ae99SBarry Smith 111b412c318SBarry Smith PetscErrorCode DMCreateColoring_DA(DM da,ISColoringType ctype,ISColoring *coloring) 11247c6ae99SBarry Smith { 11347c6ae99SBarry Smith PetscErrorCode ierr; 
11447c6ae99SBarry Smith PetscInt dim,m,n,p,nc; 115bff4a2f0SMatthew G. Knepley DMBoundaryType bx,by,bz; 11647c6ae99SBarry Smith MPI_Comm comm; 11747c6ae99SBarry Smith PetscMPIInt size; 11847c6ae99SBarry Smith PetscBool isBAIJ; 11947c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 12047c6ae99SBarry Smith 12147c6ae99SBarry Smith PetscFunctionBegin; 12247c6ae99SBarry Smith /* 12347c6ae99SBarry Smith m 12447c6ae99SBarry Smith ------------------------------------------------------ 12547c6ae99SBarry Smith | | 12647c6ae99SBarry Smith | | 12747c6ae99SBarry Smith | ---------------------- | 12847c6ae99SBarry Smith | | | | 12947c6ae99SBarry Smith n | yn | | | 13047c6ae99SBarry Smith | | | | 13147c6ae99SBarry Smith | .--------------------- | 13247c6ae99SBarry Smith | (xs,ys) xn | 13347c6ae99SBarry Smith | . | 13447c6ae99SBarry Smith | (gxs,gys) | 13547c6ae99SBarry Smith | | 13647c6ae99SBarry Smith ----------------------------------------------------- 13747c6ae99SBarry Smith */ 13847c6ae99SBarry Smith 13947c6ae99SBarry Smith /* 14047c6ae99SBarry Smith nc - number of components per grid point 14147c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 14247c6ae99SBarry Smith 14347c6ae99SBarry Smith */ 1441321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,0,0,0,&m,&n,&p,&nc,0,&bx,&by,&bz,0);CHKERRQ(ierr); 14547c6ae99SBarry Smith 14647c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 14747c6ae99SBarry Smith ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 1485bdb020cSBarry Smith if (ctype == IS_COLORING_LOCAL) { 14947c6ae99SBarry Smith if (size == 1) { 15047c6ae99SBarry Smith ctype = IS_COLORING_GLOBAL; 15147c6ae99SBarry Smith } else if (dim > 1) { 152bff4a2f0SMatthew G. 
Knepley if ((m==1 && bx == DM_BOUNDARY_PERIODIC) || (n==1 && by == DM_BOUNDARY_PERIODIC) || (p==1 && bz == DM_BOUNDARY_PERIODIC)) { 1535bdb020cSBarry Smith SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"IS_COLORING_LOCAL cannot be used for periodic boundary condition having both ends of the domain on the same process"); 15447c6ae99SBarry Smith } 15547c6ae99SBarry Smith } 15647c6ae99SBarry Smith } 15747c6ae99SBarry Smith 158aa219208SBarry Smith /* Tell the DMDA it has 1 degree of freedom per grid point so that the coloring for BAIJ 15947c6ae99SBarry Smith matrices is for the blocks, not the individual matrix elements */ 160b412c318SBarry Smith ierr = PetscStrcmp(da->mattype,MATBAIJ,&isBAIJ);CHKERRQ(ierr); 161b412c318SBarry Smith if (!isBAIJ) {ierr = PetscStrcmp(da->mattype,MATMPIBAIJ,&isBAIJ);CHKERRQ(ierr);} 162b412c318SBarry Smith if (!isBAIJ) {ierr = PetscStrcmp(da->mattype,MATSEQBAIJ,&isBAIJ);CHKERRQ(ierr);} 16347c6ae99SBarry Smith if (isBAIJ) { 16447c6ae99SBarry Smith dd->w = 1; 16547c6ae99SBarry Smith dd->xs = dd->xs/nc; 16647c6ae99SBarry Smith dd->xe = dd->xe/nc; 16747c6ae99SBarry Smith dd->Xs = dd->Xs/nc; 16847c6ae99SBarry Smith dd->Xe = dd->Xe/nc; 16947c6ae99SBarry Smith } 17047c6ae99SBarry Smith 17147c6ae99SBarry Smith /* 172aa219208SBarry Smith We do not provide a getcoloring function in the DMDA operations because 173aa219208SBarry Smith the basic DMDA does not know about matrices. We think of DMDA as being more 17447c6ae99SBarry Smith more low-level then matrices. 
17547c6ae99SBarry Smith */ 17647c6ae99SBarry Smith if (dim == 1) { 177e727c939SJed Brown ierr = DMCreateColoring_DA_1d_MPIAIJ(da,ctype,coloring);CHKERRQ(ierr); 17847c6ae99SBarry Smith } else if (dim == 2) { 179e727c939SJed Brown ierr = DMCreateColoring_DA_2d_MPIAIJ(da,ctype,coloring);CHKERRQ(ierr); 18047c6ae99SBarry Smith } else if (dim == 3) { 181e727c939SJed Brown ierr = DMCreateColoring_DA_3d_MPIAIJ(da,ctype,coloring);CHKERRQ(ierr); 182ce94432eSBarry Smith } else SETERRQ1(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"Not done for %D dimension, send us mail petsc-maint@mcs.anl.gov for code",dim); 18347c6ae99SBarry Smith if (isBAIJ) { 18447c6ae99SBarry Smith dd->w = nc; 18547c6ae99SBarry Smith dd->xs = dd->xs*nc; 18647c6ae99SBarry Smith dd->xe = dd->xe*nc; 18747c6ae99SBarry Smith dd->Xs = dd->Xs*nc; 18847c6ae99SBarry Smith dd->Xe = dd->Xe*nc; 18947c6ae99SBarry Smith } 19047c6ae99SBarry Smith PetscFunctionReturn(0); 19147c6ae99SBarry Smith } 19247c6ae99SBarry Smith 19347c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/ 19447c6ae99SBarry Smith 195e727c939SJed Brown PetscErrorCode DMCreateColoring_DA_2d_MPIAIJ(DM da,ISColoringType ctype,ISColoring *coloring) 19647c6ae99SBarry Smith { 19747c6ae99SBarry Smith PetscErrorCode ierr; 19847c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,ii,gxs,gys,gnx,gny,m,n,M,N,dim,s,k,nc,col; 19947c6ae99SBarry Smith PetscInt ncolors; 20047c6ae99SBarry Smith MPI_Comm comm; 201bff4a2f0SMatthew G. 
Knepley DMBoundaryType bx,by; 202aa219208SBarry Smith DMDAStencilType st; 20347c6ae99SBarry Smith ISColoringValue *colors; 20447c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 20547c6ae99SBarry Smith 20647c6ae99SBarry Smith PetscFunctionBegin; 20747c6ae99SBarry Smith /* 20847c6ae99SBarry Smith nc - number of components per grid point 20947c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 21047c6ae99SBarry Smith 21147c6ae99SBarry Smith */ 2121321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,0,&M,&N,0,&nc,&s,&bx,&by,0,&st);CHKERRQ(ierr); 21347c6ae99SBarry Smith col = 2*s + 1; 214aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr); 215aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr); 21647c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 21747c6ae99SBarry Smith 21847c6ae99SBarry Smith /* special case as taught to us by Paul Hovland */ 219aa219208SBarry Smith if (st == DMDA_STENCIL_STAR && s == 1) { 220e727c939SJed Brown ierr = DMCreateColoring_DA_2d_5pt_MPIAIJ(da,ctype,coloring);CHKERRQ(ierr); 22147c6ae99SBarry Smith } else { 22247c6ae99SBarry Smith 223bff4a2f0SMatthew G. Knepley if (bx == DM_BOUNDARY_PERIODIC && (m % col)) SETERRQ2(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in X (%d) is divisible\n\ 22447c6ae99SBarry Smith by 2*stencil_width + 1 (%d)\n", m, col); 225bff4a2f0SMatthew G. 
Knepley if (by == DM_BOUNDARY_PERIODIC && (n % col)) SETERRQ2(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Y (%d) is divisible\n\ 22647c6ae99SBarry Smith by 2*stencil_width + 1 (%d)\n", n, col); 22747c6ae99SBarry Smith if (ctype == IS_COLORING_GLOBAL) { 22847c6ae99SBarry Smith if (!dd->localcoloring) { 229785e854fSJed Brown ierr = PetscMalloc1(nc*nx*ny,&colors);CHKERRQ(ierr); 23047c6ae99SBarry Smith ii = 0; 23147c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 23247c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 23347c6ae99SBarry Smith for (k=0; k<nc; k++) { 23447c6ae99SBarry Smith colors[ii++] = k + nc*((i % col) + col*(j % col)); 23547c6ae99SBarry Smith } 23647c6ae99SBarry Smith } 23747c6ae99SBarry Smith } 23847c6ae99SBarry Smith ncolors = nc + nc*(col-1 + col*(col-1)); 239aaf3ff59SMatthew G. Knepley ierr = ISColoringCreate(comm,ncolors,nc*nx*ny,colors,PETSC_OWN_POINTER,&dd->localcoloring);CHKERRQ(ierr); 24047c6ae99SBarry Smith } 24147c6ae99SBarry Smith *coloring = dd->localcoloring; 2425bdb020cSBarry Smith } else if (ctype == IS_COLORING_LOCAL) { 24347c6ae99SBarry Smith if (!dd->ghostedcoloring) { 244785e854fSJed Brown ierr = PetscMalloc1(nc*gnx*gny,&colors);CHKERRQ(ierr); 24547c6ae99SBarry Smith ii = 0; 24647c6ae99SBarry Smith for (j=gys; j<gys+gny; j++) { 24747c6ae99SBarry Smith for (i=gxs; i<gxs+gnx; i++) { 24847c6ae99SBarry Smith for (k=0; k<nc; k++) { 24947c6ae99SBarry Smith /* the complicated stuff is to handle periodic boundaries */ 25047c6ae99SBarry Smith colors[ii++] = k + nc*((SetInRange(i,m) % col) + col*(SetInRange(j,n) % col)); 25147c6ae99SBarry Smith } 25247c6ae99SBarry Smith } 25347c6ae99SBarry Smith } 25447c6ae99SBarry Smith ncolors = nc + nc*(col - 1 + col*(col-1)); 255aaf3ff59SMatthew G. 
Knepley ierr = ISColoringCreate(comm,ncolors,nc*gnx*gny,colors,PETSC_OWN_POINTER,&dd->ghostedcoloring);CHKERRQ(ierr); 25647c6ae99SBarry Smith /* PetscIntView(ncolors,(PetscInt*)colors,0); */ 25747c6ae99SBarry Smith 2585bdb020cSBarry Smith ierr = ISColoringSetType(dd->ghostedcoloring,IS_COLORING_LOCAL);CHKERRQ(ierr); 25947c6ae99SBarry Smith } 26047c6ae99SBarry Smith *coloring = dd->ghostedcoloring; 261ce94432eSBarry Smith } else SETERRQ1(PetscObjectComm((PetscObject)da),PETSC_ERR_ARG_WRONG,"Unknown ISColoringType %d",(int)ctype); 26247c6ae99SBarry Smith } 26347c6ae99SBarry Smith ierr = ISColoringReference(*coloring);CHKERRQ(ierr); 26447c6ae99SBarry Smith PetscFunctionReturn(0); 26547c6ae99SBarry Smith } 26647c6ae99SBarry Smith 26747c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/ 26847c6ae99SBarry Smith 269e727c939SJed Brown PetscErrorCode DMCreateColoring_DA_3d_MPIAIJ(DM da,ISColoringType ctype,ISColoring *coloring) 27047c6ae99SBarry Smith { 27147c6ae99SBarry Smith PetscErrorCode ierr; 27247c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,gxs,gys,gnx,gny,m,n,p,dim,s,k,nc,col,zs,gzs,ii,l,nz,gnz,M,N,P; 27347c6ae99SBarry Smith PetscInt ncolors; 27447c6ae99SBarry Smith MPI_Comm comm; 275bff4a2f0SMatthew G. Knepley DMBoundaryType bx,by,bz; 276aa219208SBarry Smith DMDAStencilType st; 27747c6ae99SBarry Smith ISColoringValue *colors; 27847c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 27947c6ae99SBarry Smith 28047c6ae99SBarry Smith PetscFunctionBegin; 28147c6ae99SBarry Smith /* 28247c6ae99SBarry Smith nc - number of components per grid point 28347c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 28447c6ae99SBarry Smith 28547c6ae99SBarry Smith */ 2861321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,&p,&M,&N,&P,&nc,&s,&bx,&by,&bz,&st);CHKERRQ(ierr); 28747c6ae99SBarry Smith col = 2*s + 1; 288bff4a2f0SMatthew G. 
Knepley if (bx == DM_BOUNDARY_PERIODIC && (m % col)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in X is divisible\n\ 28947c6ae99SBarry Smith by 2*stencil_width + 1\n"); 290bff4a2f0SMatthew G. Knepley if (by == DM_BOUNDARY_PERIODIC && (n % col)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Y is divisible\n\ 29147c6ae99SBarry Smith by 2*stencil_width + 1\n"); 292bff4a2f0SMatthew G. Knepley if (bz == DM_BOUNDARY_PERIODIC && (p % col)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Z is divisible\n\ 29347c6ae99SBarry Smith by 2*stencil_width + 1\n"); 29447c6ae99SBarry Smith 295aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,&zs,&nx,&ny,&nz);CHKERRQ(ierr); 296aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,&gzs,&gnx,&gny,&gnz);CHKERRQ(ierr); 29747c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 29847c6ae99SBarry Smith 29947c6ae99SBarry Smith /* create the coloring */ 30047c6ae99SBarry Smith if (ctype == IS_COLORING_GLOBAL) { 30147c6ae99SBarry Smith if (!dd->localcoloring) { 302785e854fSJed Brown ierr = PetscMalloc1(nc*nx*ny*nz,&colors);CHKERRQ(ierr); 30347c6ae99SBarry Smith ii = 0; 30447c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 30547c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 30647c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 30747c6ae99SBarry Smith for (l=0; l<nc; l++) { 30847c6ae99SBarry Smith colors[ii++] = l + nc*((i % col) + col*(j % col) + col*col*(k % col)); 30947c6ae99SBarry Smith } 31047c6ae99SBarry Smith } 31147c6ae99SBarry Smith } 31247c6ae99SBarry Smith } 31347c6ae99SBarry Smith ncolors = nc + nc*(col-1 + col*(col-1)+ col*col*(col-1)); 314aaf3ff59SMatthew G. 
Knepley ierr = ISColoringCreate(comm,ncolors,nc*nx*ny*nz,colors,PETSC_OWN_POINTER,&dd->localcoloring);CHKERRQ(ierr); 31547c6ae99SBarry Smith } 31647c6ae99SBarry Smith *coloring = dd->localcoloring; 3175bdb020cSBarry Smith } else if (ctype == IS_COLORING_LOCAL) { 31847c6ae99SBarry Smith if (!dd->ghostedcoloring) { 319785e854fSJed Brown ierr = PetscMalloc1(nc*gnx*gny*gnz,&colors);CHKERRQ(ierr); 32047c6ae99SBarry Smith ii = 0; 32147c6ae99SBarry Smith for (k=gzs; k<gzs+gnz; k++) { 32247c6ae99SBarry Smith for (j=gys; j<gys+gny; j++) { 32347c6ae99SBarry Smith for (i=gxs; i<gxs+gnx; i++) { 32447c6ae99SBarry Smith for (l=0; l<nc; l++) { 32547c6ae99SBarry Smith /* the complicated stuff is to handle periodic boundaries */ 32647c6ae99SBarry Smith colors[ii++] = l + nc*((SetInRange(i,m) % col) + col*(SetInRange(j,n) % col) + col*col*(SetInRange(k,p) % col)); 32747c6ae99SBarry Smith } 32847c6ae99SBarry Smith } 32947c6ae99SBarry Smith } 33047c6ae99SBarry Smith } 33147c6ae99SBarry Smith ncolors = nc + nc*(col-1 + col*(col-1)+ col*col*(col-1)); 332aaf3ff59SMatthew G. 
Knepley ierr = ISColoringCreate(comm,ncolors,nc*gnx*gny*gnz,colors,PETSC_OWN_POINTER,&dd->ghostedcoloring);CHKERRQ(ierr); 3335bdb020cSBarry Smith ierr = ISColoringSetType(dd->ghostedcoloring,IS_COLORING_LOCAL);CHKERRQ(ierr); 33447c6ae99SBarry Smith } 33547c6ae99SBarry Smith *coloring = dd->ghostedcoloring; 336ce94432eSBarry Smith } else SETERRQ1(PetscObjectComm((PetscObject)da),PETSC_ERR_ARG_WRONG,"Unknown ISColoringType %d",(int)ctype); 33747c6ae99SBarry Smith ierr = ISColoringReference(*coloring);CHKERRQ(ierr); 33847c6ae99SBarry Smith PetscFunctionReturn(0); 33947c6ae99SBarry Smith } 34047c6ae99SBarry Smith 34147c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/ 34247c6ae99SBarry Smith 343e727c939SJed Brown PetscErrorCode DMCreateColoring_DA_1d_MPIAIJ(DM da,ISColoringType ctype,ISColoring *coloring) 34447c6ae99SBarry Smith { 34547c6ae99SBarry Smith PetscErrorCode ierr; 34647c6ae99SBarry Smith PetscInt xs,nx,i,i1,gxs,gnx,l,m,M,dim,s,nc,col; 34747c6ae99SBarry Smith PetscInt ncolors; 34847c6ae99SBarry Smith MPI_Comm comm; 349bff4a2f0SMatthew G. Knepley DMBoundaryType bx; 35047c6ae99SBarry Smith ISColoringValue *colors; 35147c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 35247c6ae99SBarry Smith 35347c6ae99SBarry Smith PetscFunctionBegin; 35447c6ae99SBarry Smith /* 35547c6ae99SBarry Smith nc - number of components per grid point 35647c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 35747c6ae99SBarry Smith 35847c6ae99SBarry Smith */ 3591321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,0,0,&M,0,0,&nc,&s,&bx,0,0,0);CHKERRQ(ierr); 36047c6ae99SBarry Smith col = 2*s + 1; 36147c6ae99SBarry Smith 362bff4a2f0SMatthew G. 
Knepley if (bx == DM_BOUNDARY_PERIODIC && (m % col)) SETERRQ2(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points %d is divisible\n\ 36331e6f798SBarry Smith by 2*stencil_width + 1 %d\n",(int)m,(int)col); 36447c6ae99SBarry Smith 365aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,0,0,&nx,0,0);CHKERRQ(ierr); 366aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,0,0,&gnx,0,0);CHKERRQ(ierr); 36747c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 36847c6ae99SBarry Smith 36947c6ae99SBarry Smith /* create the coloring */ 37047c6ae99SBarry Smith if (ctype == IS_COLORING_GLOBAL) { 37147c6ae99SBarry Smith if (!dd->localcoloring) { 372785e854fSJed Brown ierr = PetscMalloc1(nc*nx,&colors);CHKERRQ(ierr); 373ae4f298aSBarry Smith if (dd->ofillcols) { 374ae4f298aSBarry Smith PetscInt tc = 0; 375ae4f298aSBarry Smith for (i=0; i<nc; i++) tc += (PetscInt) (dd->ofillcols[i] > 0); 376ae4f298aSBarry Smith i1 = 0; 377ae4f298aSBarry Smith for (i=xs; i<xs+nx; i++) { 378ae4f298aSBarry Smith for (l=0; l<nc; l++) { 379ae4f298aSBarry Smith if (dd->ofillcols[l] && (i % col)) { 380ae4f298aSBarry Smith colors[i1++] = nc - 1 + tc*((i % col) - 1) + dd->ofillcols[l]; 381ae4f298aSBarry Smith } else { 382ae4f298aSBarry Smith colors[i1++] = l; 383ae4f298aSBarry Smith } 384ae4f298aSBarry Smith } 385ae4f298aSBarry Smith } 386ae4f298aSBarry Smith ncolors = nc + 2*s*tc; 387ae4f298aSBarry Smith } else { 38847c6ae99SBarry Smith i1 = 0; 38947c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 39047c6ae99SBarry Smith for (l=0; l<nc; l++) { 39147c6ae99SBarry Smith colors[i1++] = l + nc*(i % col); 39247c6ae99SBarry Smith } 39347c6ae99SBarry Smith } 39447c6ae99SBarry Smith ncolors = nc + nc*(col-1); 395ae4f298aSBarry Smith } 396aaf3ff59SMatthew G. 
Knepley ierr = ISColoringCreate(comm,ncolors,nc*nx,colors,PETSC_OWN_POINTER,&dd->localcoloring);CHKERRQ(ierr); 39747c6ae99SBarry Smith } 39847c6ae99SBarry Smith *coloring = dd->localcoloring; 3995bdb020cSBarry Smith } else if (ctype == IS_COLORING_LOCAL) { 40047c6ae99SBarry Smith if (!dd->ghostedcoloring) { 401785e854fSJed Brown ierr = PetscMalloc1(nc*gnx,&colors);CHKERRQ(ierr); 40247c6ae99SBarry Smith i1 = 0; 40347c6ae99SBarry Smith for (i=gxs; i<gxs+gnx; i++) { 40447c6ae99SBarry Smith for (l=0; l<nc; l++) { 40547c6ae99SBarry Smith /* the complicated stuff is to handle periodic boundaries */ 40647c6ae99SBarry Smith colors[i1++] = l + nc*(SetInRange(i,m) % col); 40747c6ae99SBarry Smith } 40847c6ae99SBarry Smith } 40947c6ae99SBarry Smith ncolors = nc + nc*(col-1); 410aaf3ff59SMatthew G. Knepley ierr = ISColoringCreate(comm,ncolors,nc*gnx,colors,PETSC_OWN_POINTER,&dd->ghostedcoloring);CHKERRQ(ierr); 4115bdb020cSBarry Smith ierr = ISColoringSetType(dd->ghostedcoloring,IS_COLORING_LOCAL);CHKERRQ(ierr); 41247c6ae99SBarry Smith } 41347c6ae99SBarry Smith *coloring = dd->ghostedcoloring; 414ce94432eSBarry Smith } else SETERRQ1(PetscObjectComm((PetscObject)da),PETSC_ERR_ARG_WRONG,"Unknown ISColoringType %d",(int)ctype); 41547c6ae99SBarry Smith ierr = ISColoringReference(*coloring);CHKERRQ(ierr); 41647c6ae99SBarry Smith PetscFunctionReturn(0); 41747c6ae99SBarry Smith } 41847c6ae99SBarry Smith 419e727c939SJed Brown PetscErrorCode DMCreateColoring_DA_2d_5pt_MPIAIJ(DM da,ISColoringType ctype,ISColoring *coloring) 42047c6ae99SBarry Smith { 42147c6ae99SBarry Smith PetscErrorCode ierr; 42247c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,ii,gxs,gys,gnx,gny,m,n,dim,s,k,nc; 42347c6ae99SBarry Smith PetscInt ncolors; 42447c6ae99SBarry Smith MPI_Comm comm; 425bff4a2f0SMatthew G. 
Knepley DMBoundaryType bx,by; 42647c6ae99SBarry Smith ISColoringValue *colors; 42747c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 42847c6ae99SBarry Smith 42947c6ae99SBarry Smith PetscFunctionBegin; 43047c6ae99SBarry Smith /* 43147c6ae99SBarry Smith nc - number of components per grid point 43247c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 43347c6ae99SBarry Smith 43447c6ae99SBarry Smith */ 4351321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,0,0,0,0,&nc,&s,&bx,&by,0,0);CHKERRQ(ierr); 436aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr); 437aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr); 43847c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 43947c6ae99SBarry Smith 440bff4a2f0SMatthew G. Knepley if (bx == DM_BOUNDARY_PERIODIC && (m % 5)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in X is divisible by 5\n"); 441bff4a2f0SMatthew G. Knepley if (by == DM_BOUNDARY_PERIODIC && (n % 5)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Y is divisible by 5\n"); 44247c6ae99SBarry Smith 44347c6ae99SBarry Smith /* create the coloring */ 44447c6ae99SBarry Smith if (ctype == IS_COLORING_GLOBAL) { 44547c6ae99SBarry Smith if (!dd->localcoloring) { 446785e854fSJed Brown ierr = PetscMalloc1(nc*nx*ny,&colors);CHKERRQ(ierr); 44747c6ae99SBarry Smith ii = 0; 44847c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 44947c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 45047c6ae99SBarry Smith for (k=0; k<nc; k++) { 45147c6ae99SBarry Smith colors[ii++] = k + nc*((3*j+i) % 5); 45247c6ae99SBarry Smith } 45347c6ae99SBarry Smith } 45447c6ae99SBarry Smith } 45547c6ae99SBarry Smith ncolors = 5*nc; 456aaf3ff59SMatthew G. 
Knepley ierr = ISColoringCreate(comm,ncolors,nc*nx*ny,colors,PETSC_OWN_POINTER,&dd->localcoloring);CHKERRQ(ierr); 45747c6ae99SBarry Smith } 45847c6ae99SBarry Smith *coloring = dd->localcoloring; 4595bdb020cSBarry Smith } else if (ctype == IS_COLORING_LOCAL) { 46047c6ae99SBarry Smith if (!dd->ghostedcoloring) { 461785e854fSJed Brown ierr = PetscMalloc1(nc*gnx*gny,&colors);CHKERRQ(ierr); 46247c6ae99SBarry Smith ii = 0; 46347c6ae99SBarry Smith for (j=gys; j<gys+gny; j++) { 46447c6ae99SBarry Smith for (i=gxs; i<gxs+gnx; i++) { 46547c6ae99SBarry Smith for (k=0; k<nc; k++) { 46647c6ae99SBarry Smith colors[ii++] = k + nc*((3*SetInRange(j,n) + SetInRange(i,m)) % 5); 46747c6ae99SBarry Smith } 46847c6ae99SBarry Smith } 46947c6ae99SBarry Smith } 47047c6ae99SBarry Smith ncolors = 5*nc; 471aaf3ff59SMatthew G. Knepley ierr = ISColoringCreate(comm,ncolors,nc*gnx*gny,colors,PETSC_OWN_POINTER,&dd->ghostedcoloring);CHKERRQ(ierr); 4725bdb020cSBarry Smith ierr = ISColoringSetType(dd->ghostedcoloring,IS_COLORING_LOCAL);CHKERRQ(ierr); 47347c6ae99SBarry Smith } 47447c6ae99SBarry Smith *coloring = dd->ghostedcoloring; 475ce94432eSBarry Smith } else SETERRQ1(PetscObjectComm((PetscObject)da),PETSC_ERR_ARG_WRONG,"Unknown ISColoringType %d",(int)ctype); 47647c6ae99SBarry Smith PetscFunctionReturn(0); 47747c6ae99SBarry Smith } 47847c6ae99SBarry Smith 47947c6ae99SBarry Smith /* =========================================================================== */ 480950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_1d_MPIAIJ(DM,Mat); 481ce308e1dSBarry Smith extern PetscErrorCode DMCreateMatrix_DA_1d_MPIAIJ_Fill(DM,Mat); 482950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_2d_MPIAIJ(DM,Mat); 483950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_2d_MPIAIJ_Fill(DM,Mat); 484950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_3d_MPIAIJ(DM,Mat); 485950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_3d_MPIAIJ_Fill(DM,Mat); 486950540a4SJed Brown extern PetscErrorCode 
DMCreateMatrix_DA_2d_MPIBAIJ(DM,Mat); 487950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_3d_MPIBAIJ(DM,Mat); 488950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_2d_MPISBAIJ(DM,Mat); 489950540a4SJed Brown extern PetscErrorCode DMCreateMatrix_DA_3d_MPISBAIJ(DM,Mat); 490d4002b98SHong Zhang extern PetscErrorCode DMCreateMatrix_DA_2d_MPISELL(DM,Mat); 491d4002b98SHong Zhang extern PetscErrorCode DMCreateMatrix_DA_3d_MPISELL(DM,Mat); 492e584696dSStefano Zampini extern PetscErrorCode DMCreateMatrix_DA_IS(DM,Mat); 49347c6ae99SBarry Smith 4948bbdbebaSMatthew G Knepley /*@C 495c688c046SMatthew G Knepley MatSetupDM - Sets the DMDA that is to be used by the HYPRE_StructMatrix PETSc matrix 49647c6ae99SBarry Smith 49747c6ae99SBarry Smith Logically Collective on Mat 49847c6ae99SBarry Smith 49947c6ae99SBarry Smith Input Parameters: 50047c6ae99SBarry Smith + mat - the matrix 50147c6ae99SBarry Smith - da - the da 50247c6ae99SBarry Smith 50347c6ae99SBarry Smith Level: intermediate 50447c6ae99SBarry Smith 50547c6ae99SBarry Smith @*/ 506c688c046SMatthew G Knepley PetscErrorCode MatSetupDM(Mat mat,DM da) 50747c6ae99SBarry Smith { 50847c6ae99SBarry Smith PetscErrorCode ierr; 50947c6ae99SBarry Smith 51047c6ae99SBarry Smith PetscFunctionBegin; 51147c6ae99SBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 51247c6ae99SBarry Smith PetscValidHeaderSpecific(da,DM_CLASSID,1); 513c688c046SMatthew G Knepley ierr = PetscTryMethod(mat,"MatSetupDM_C",(Mat,DM),(mat,da));CHKERRQ(ierr); 51447c6ae99SBarry Smith PetscFunctionReturn(0); 51547c6ae99SBarry Smith } 51647c6ae99SBarry Smith 5177087cfbeSBarry Smith PetscErrorCode MatView_MPI_DA(Mat A,PetscViewer viewer) 51847c6ae99SBarry Smith { 5199a42bb27SBarry Smith DM da; 52047c6ae99SBarry Smith PetscErrorCode ierr; 52147c6ae99SBarry Smith const char *prefix; 52247c6ae99SBarry Smith Mat Anatural; 52347c6ae99SBarry Smith AO ao; 52447c6ae99SBarry Smith PetscInt rstart,rend,*petsc,i; 52547c6ae99SBarry Smith IS is; 52647c6ae99SBarry 
Smith MPI_Comm comm; 52774388724SJed Brown PetscViewerFormat format; 52847c6ae99SBarry Smith 52947c6ae99SBarry Smith PetscFunctionBegin; 53074388724SJed Brown /* Check whether we are just printing info, in which case MatView() already viewed everything we wanted to view */ 53174388724SJed Brown ierr = PetscViewerGetFormat(viewer,&format);CHKERRQ(ierr); 53274388724SJed Brown if (format == PETSC_VIEWER_ASCII_INFO || format == PETSC_VIEWER_ASCII_INFO_DETAIL) PetscFunctionReturn(0); 53374388724SJed Brown 53447c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)A,&comm);CHKERRQ(ierr); 535c688c046SMatthew G Knepley ierr = MatGetDM(A, &da);CHKERRQ(ierr); 536ce94432eSBarry Smith if (!da) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Matrix not generated from a DMDA"); 53747c6ae99SBarry Smith 538aa219208SBarry Smith ierr = DMDAGetAO(da,&ao);CHKERRQ(ierr); 53947c6ae99SBarry Smith ierr = MatGetOwnershipRange(A,&rstart,&rend);CHKERRQ(ierr); 540854ce69bSBarry Smith ierr = PetscMalloc1(rend-rstart,&petsc);CHKERRQ(ierr); 54147c6ae99SBarry Smith for (i=rstart; i<rend; i++) petsc[i-rstart] = i; 54247c6ae99SBarry Smith ierr = AOApplicationToPetsc(ao,rend-rstart,petsc);CHKERRQ(ierr); 54347c6ae99SBarry Smith ierr = ISCreateGeneral(comm,rend-rstart,petsc,PETSC_OWN_POINTER,&is);CHKERRQ(ierr); 54447c6ae99SBarry Smith 54547c6ae99SBarry Smith /* call viewer on natural ordering */ 5467dae84e0SHong Zhang ierr = MatCreateSubMatrix(A,is,is,MAT_INITIAL_MATRIX,&Anatural);CHKERRQ(ierr); 547fcfd50ebSBarry Smith ierr = ISDestroy(&is);CHKERRQ(ierr); 54847c6ae99SBarry Smith ierr = PetscObjectGetOptionsPrefix((PetscObject)A,&prefix);CHKERRQ(ierr); 54947c6ae99SBarry Smith ierr = PetscObjectSetOptionsPrefix((PetscObject)Anatural,prefix);CHKERRQ(ierr); 55047c6ae99SBarry Smith ierr = PetscObjectSetName((PetscObject)Anatural,((PetscObject)A)->name);CHKERRQ(ierr); 551539c167fSBarry Smith ierr = MatView(Anatural,viewer);CHKERRQ(ierr); 552fcfd50ebSBarry Smith ierr = 
MatDestroy(&Anatural);CHKERRQ(ierr); 55347c6ae99SBarry Smith PetscFunctionReturn(0); 55447c6ae99SBarry Smith } 55547c6ae99SBarry Smith 5567087cfbeSBarry Smith PetscErrorCode MatLoad_MPI_DA(Mat A,PetscViewer viewer) 55747c6ae99SBarry Smith { 5589a42bb27SBarry Smith DM da; 55947c6ae99SBarry Smith PetscErrorCode ierr; 56047c6ae99SBarry Smith Mat Anatural,Aapp; 56147c6ae99SBarry Smith AO ao; 562539c167fSBarry Smith PetscInt rstart,rend,*app,i,m,n,M,N; 56347c6ae99SBarry Smith IS is; 56447c6ae99SBarry Smith MPI_Comm comm; 56547c6ae99SBarry Smith 56647c6ae99SBarry Smith PetscFunctionBegin; 56747c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)A,&comm);CHKERRQ(ierr); 568c688c046SMatthew G Knepley ierr = MatGetDM(A, &da);CHKERRQ(ierr); 569ce94432eSBarry Smith if (!da) SETERRQ(PetscObjectComm((PetscObject)A),PETSC_ERR_ARG_WRONG,"Matrix not generated from a DMDA"); 57047c6ae99SBarry Smith 57147c6ae99SBarry Smith /* Load the matrix in natural ordering */ 572ce94432eSBarry Smith ierr = MatCreate(PetscObjectComm((PetscObject)A),&Anatural);CHKERRQ(ierr); 57347c6ae99SBarry Smith ierr = MatSetType(Anatural,((PetscObject)A)->type_name);CHKERRQ(ierr); 574539c167fSBarry Smith ierr = MatGetSize(A,&M,&N);CHKERRQ(ierr); 575539c167fSBarry Smith ierr = MatGetLocalSize(A,&m,&n);CHKERRQ(ierr); 576539c167fSBarry Smith ierr = MatSetSizes(Anatural,m,n,M,N);CHKERRQ(ierr); 57747c6ae99SBarry Smith ierr = MatLoad(Anatural,viewer);CHKERRQ(ierr); 57847c6ae99SBarry Smith 57947c6ae99SBarry Smith /* Map natural ordering to application ordering and create IS */ 580aa219208SBarry Smith ierr = DMDAGetAO(da,&ao);CHKERRQ(ierr); 58147c6ae99SBarry Smith ierr = MatGetOwnershipRange(Anatural,&rstart,&rend);CHKERRQ(ierr); 582854ce69bSBarry Smith ierr = PetscMalloc1(rend-rstart,&app);CHKERRQ(ierr); 58347c6ae99SBarry Smith for (i=rstart; i<rend; i++) app[i-rstart] = i; 58447c6ae99SBarry Smith ierr = AOPetscToApplication(ao,rend-rstart,app);CHKERRQ(ierr); 58547c6ae99SBarry Smith ierr = 
ISCreateGeneral(comm,rend-rstart,app,PETSC_OWN_POINTER,&is);CHKERRQ(ierr); 58647c6ae99SBarry Smith 58747c6ae99SBarry Smith /* Do permutation and replace header */ 5887dae84e0SHong Zhang ierr = MatCreateSubMatrix(Anatural,is,is,MAT_INITIAL_MATRIX,&Aapp);CHKERRQ(ierr); 58928be2f97SBarry Smith ierr = MatHeaderReplace(A,&Aapp);CHKERRQ(ierr); 590fcfd50ebSBarry Smith ierr = ISDestroy(&is);CHKERRQ(ierr); 591fcfd50ebSBarry Smith ierr = MatDestroy(&Anatural);CHKERRQ(ierr); 59247c6ae99SBarry Smith PetscFunctionReturn(0); 59347c6ae99SBarry Smith } 59447c6ae99SBarry Smith 595b412c318SBarry Smith PetscErrorCode DMCreateMatrix_DA(DM da, Mat *J) 59647c6ae99SBarry Smith { 59747c6ae99SBarry Smith PetscErrorCode ierr; 59847c6ae99SBarry Smith PetscInt dim,dof,nx,ny,nz,dims[3],starts[3],M,N,P; 59947c6ae99SBarry Smith Mat A; 60047c6ae99SBarry Smith MPI_Comm comm; 60119fd82e9SBarry Smith MatType Atype; 60237d0c07bSMatthew G Knepley PetscSection section, sectionGlobal; 603e584696dSStefano Zampini void (*aij)(void)=NULL,(*baij)(void)=NULL,(*sbaij)(void)=NULL,(*sell)(void)=NULL,(*is)(void)=NULL; 604b412c318SBarry Smith MatType mtype; 60547c6ae99SBarry Smith PetscMPIInt size; 60647c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 60747c6ae99SBarry Smith 60847c6ae99SBarry Smith PetscFunctionBegin; 609607a6623SBarry Smith ierr = MatInitializePackage();CHKERRQ(ierr); 610b412c318SBarry Smith mtype = da->mattype; 61147c6ae99SBarry Smith 61237d0c07bSMatthew G Knepley ierr = DMGetDefaultSection(da, §ion);CHKERRQ(ierr); 61337d0c07bSMatthew G Knepley if (section) { 61437d0c07bSMatthew G Knepley PetscInt bs = -1; 61537d0c07bSMatthew G Knepley PetscInt localSize; 61637d0c07bSMatthew G Knepley PetscBool isShell, isBlock, isSeqBlock, isMPIBlock, isSymBlock, isSymSeqBlock, isSymMPIBlock, isSymmetric; 61737d0c07bSMatthew G Knepley 61837d0c07bSMatthew G Knepley ierr = DMGetDefaultGlobalSection(da, §ionGlobal);CHKERRQ(ierr); 61937d0c07bSMatthew G Knepley ierr = 
PetscSectionGetConstrainedStorageSize(sectionGlobal, &localSize);CHKERRQ(ierr); 620b5579763SJed Brown ierr = MatCreate(PetscObjectComm((PetscObject)da),&A);CHKERRQ(ierr); 621b5579763SJed Brown ierr = MatSetSizes(A,localSize,localSize,PETSC_DETERMINE,PETSC_DETERMINE);CHKERRQ(ierr); 622b5579763SJed Brown ierr = MatSetType(A,mtype);CHKERRQ(ierr); 62337d0c07bSMatthew G Knepley ierr = PetscStrcmp(mtype,MATSHELL,&isShell);CHKERRQ(ierr); 62437d0c07bSMatthew G Knepley ierr = PetscStrcmp(mtype,MATBAIJ,&isBlock);CHKERRQ(ierr); 62537d0c07bSMatthew G Knepley ierr = PetscStrcmp(mtype,MATSEQBAIJ,&isSeqBlock);CHKERRQ(ierr); 62637d0c07bSMatthew G Knepley ierr = PetscStrcmp(mtype,MATMPIBAIJ,&isMPIBlock);CHKERRQ(ierr); 62737d0c07bSMatthew G Knepley ierr = PetscStrcmp(mtype,MATSBAIJ,&isSymBlock);CHKERRQ(ierr); 62837d0c07bSMatthew G Knepley ierr = PetscStrcmp(mtype,MATSEQSBAIJ,&isSymSeqBlock);CHKERRQ(ierr); 62937d0c07bSMatthew G Knepley ierr = PetscStrcmp(mtype,MATMPISBAIJ,&isSymMPIBlock);CHKERRQ(ierr); 63037d0c07bSMatthew G Knepley /* Check for symmetric storage */ 63137d0c07bSMatthew G Knepley isSymmetric = (PetscBool) (isSymBlock || isSymSeqBlock || isSymMPIBlock); 63237d0c07bSMatthew G Knepley if (isSymmetric) { 63337d0c07bSMatthew G Knepley ierr = MatSetOption(*J, MAT_IGNORE_LOWER_TRIANGULAR, PETSC_TRUE);CHKERRQ(ierr); 63437d0c07bSMatthew G Knepley } 63537d0c07bSMatthew G Knepley if (!isShell) { 63637d0c07bSMatthew G Knepley PetscInt *dnz, *onz, *dnzu, *onzu, bsLocal; 63737d0c07bSMatthew G Knepley 63837d0c07bSMatthew G Knepley if (bs < 0) { 63937d0c07bSMatthew G Knepley if (isBlock || isSeqBlock || isMPIBlock || isSymBlock || isSymSeqBlock || isSymMPIBlock) { 64037d0c07bSMatthew G Knepley PetscInt pStart, pEnd, p, dof; 64137d0c07bSMatthew G Knepley 64237d0c07bSMatthew G Knepley ierr = PetscSectionGetChart(sectionGlobal, &pStart, &pEnd);CHKERRQ(ierr); 64337d0c07bSMatthew G Knepley for (p = pStart; p < pEnd; ++p) { 64437d0c07bSMatthew G Knepley ierr = 
PetscSectionGetDof(sectionGlobal, p, &dof);CHKERRQ(ierr); 64537d0c07bSMatthew G Knepley if (dof) { 64637d0c07bSMatthew G Knepley bs = dof; 64737d0c07bSMatthew G Knepley break; 64837d0c07bSMatthew G Knepley } 64937d0c07bSMatthew G Knepley } 65037d0c07bSMatthew G Knepley } else { 65137d0c07bSMatthew G Knepley bs = 1; 65237d0c07bSMatthew G Knepley } 65337d0c07bSMatthew G Knepley /* Must have same blocksize on all procs (some might have no points) */ 65437d0c07bSMatthew G Knepley bsLocal = bs; 655b2566f29SBarry Smith ierr = MPIU_Allreduce(&bsLocal, &bs, 1, MPIU_INT, MPI_MAX, PetscObjectComm((PetscObject)da));CHKERRQ(ierr); 65637d0c07bSMatthew G Knepley } 6571795a4d1SJed Brown ierr = PetscCalloc4(localSize/bs, &dnz, localSize/bs, &onz, localSize/bs, &dnzu, localSize/bs, &onzu);CHKERRQ(ierr); 658552f7358SJed Brown /* ierr = DMPlexPreallocateOperator(dm, bs, section, sectionGlobal, dnz, onz, dnzu, onzu, *J, fillMatrix);CHKERRQ(ierr); */ 65937d0c07bSMatthew G Knepley ierr = PetscFree4(dnz, onz, dnzu, onzu);CHKERRQ(ierr); 66037d0c07bSMatthew G Knepley } 66137d0c07bSMatthew G Knepley } 66247c6ae99SBarry Smith /* 66347c6ae99SBarry Smith m 66447c6ae99SBarry Smith ------------------------------------------------------ 66547c6ae99SBarry Smith | | 66647c6ae99SBarry Smith | | 66747c6ae99SBarry Smith | ---------------------- | 66847c6ae99SBarry Smith | | | | 66947c6ae99SBarry Smith n | ny | | | 67047c6ae99SBarry Smith | | | | 67147c6ae99SBarry Smith | .--------------------- | 67247c6ae99SBarry Smith | (xs,ys) nx | 67347c6ae99SBarry Smith | . 
| 67447c6ae99SBarry Smith | (gxs,gys) | 67547c6ae99SBarry Smith | | 67647c6ae99SBarry Smith ----------------------------------------------------- 67747c6ae99SBarry Smith */ 67847c6ae99SBarry Smith 67947c6ae99SBarry Smith /* 68047c6ae99SBarry Smith nc - number of components per grid point 68147c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 68247c6ae99SBarry Smith 68347c6ae99SBarry Smith */ 684e30e807fSPeter Brune M = dd->M; 685e30e807fSPeter Brune N = dd->N; 686e30e807fSPeter Brune P = dd->P; 687c73cfb54SMatthew G. Knepley dim = da->dim; 688e30e807fSPeter Brune dof = dd->w; 689e30e807fSPeter Brune /* ierr = DMDAGetInfo(da,&dim,&M,&N,&P,0,0,0,&dof,0,0,0,0,0);CHKERRQ(ierr); */ 690aa219208SBarry Smith ierr = DMDAGetCorners(da,0,0,0,&nx,&ny,&nz);CHKERRQ(ierr); 69147c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 69247c6ae99SBarry Smith ierr = MatCreate(comm,&A);CHKERRQ(ierr); 69347c6ae99SBarry Smith ierr = MatSetSizes(A,dof*nx*ny*nz,dof*nx*ny*nz,dof*M*N*P,dof*M*N*P);CHKERRQ(ierr); 694b412c318SBarry Smith ierr = MatSetType(A,mtype);CHKERRQ(ierr); 69595ee5b0eSBarry Smith ierr = MatSetDM(A,da);CHKERRQ(ierr); 696b06ff27eSHong Zhang if (da->structure_only) { 697b06ff27eSHong Zhang ierr = MatSetOption(A,MAT_STRUCTURE_ONLY,PETSC_TRUE);CHKERRQ(ierr); 698b06ff27eSHong Zhang } 69947c6ae99SBarry Smith ierr = MatGetType(A,&Atype);CHKERRQ(ierr); 70047c6ae99SBarry Smith /* 701aa219208SBarry Smith We do not provide a getmatrix function in the DMDA operations because 702aa219208SBarry Smith the basic DMDA does not know about matrices. We think of DMDA as being more 70347c6ae99SBarry Smith more low-level than matrices. This is kind of cheating but, cause sometimes 704aa219208SBarry Smith we think of DMDA has higher level than matrices. 
70547c6ae99SBarry Smith 70647c6ae99SBarry Smith We could switch based on Atype (or mtype), but we do not since the 70747c6ae99SBarry Smith specialized setting routines depend only the particular preallocation 70847c6ae99SBarry Smith details of the matrix, not the type itself. 70947c6ae99SBarry Smith */ 71047c6ae99SBarry Smith ierr = PetscObjectQueryFunction((PetscObject)A,"MatMPIAIJSetPreallocation_C",&aij);CHKERRQ(ierr); 71147c6ae99SBarry Smith if (!aij) { 71247c6ae99SBarry Smith ierr = PetscObjectQueryFunction((PetscObject)A,"MatSeqAIJSetPreallocation_C",&aij);CHKERRQ(ierr); 71347c6ae99SBarry Smith } 71447c6ae99SBarry Smith if (!aij) { 71547c6ae99SBarry Smith ierr = PetscObjectQueryFunction((PetscObject)A,"MatMPIBAIJSetPreallocation_C",&baij);CHKERRQ(ierr); 71647c6ae99SBarry Smith if (!baij) { 71747c6ae99SBarry Smith ierr = PetscObjectQueryFunction((PetscObject)A,"MatSeqBAIJSetPreallocation_C",&baij);CHKERRQ(ierr); 71847c6ae99SBarry Smith } 71947c6ae99SBarry Smith if (!baij) { 72047c6ae99SBarry Smith ierr = PetscObjectQueryFunction((PetscObject)A,"MatMPISBAIJSetPreallocation_C",&sbaij);CHKERRQ(ierr); 72147c6ae99SBarry Smith if (!sbaij) { 72247c6ae99SBarry Smith ierr = PetscObjectQueryFunction((PetscObject)A,"MatSeqSBAIJSetPreallocation_C",&sbaij);CHKERRQ(ierr); 72347c6ae99SBarry Smith } 7245e26d47bSHong Zhang if (!sbaij) { 725d4002b98SHong Zhang ierr = PetscObjectQueryFunction((PetscObject)A,"MatMPISELLSetPreallocation_C",&sell);CHKERRQ(ierr); 726d4002b98SHong Zhang if (!sell) { 727d4002b98SHong Zhang ierr = PetscObjectQueryFunction((PetscObject)A,"MatSeqSELLSetPreallocation_C",&sell);CHKERRQ(ierr); 7285e26d47bSHong Zhang } 7295e26d47bSHong Zhang } 730e584696dSStefano Zampini if (!sell) { 731e584696dSStefano Zampini ierr = PetscObjectQueryFunction((PetscObject)A,"MatISSetPreallocation_C",&is);CHKERRQ(ierr); 732e584696dSStefano Zampini } 73347c6ae99SBarry Smith } 73447c6ae99SBarry Smith } 73547c6ae99SBarry Smith if (aij) { 73647c6ae99SBarry Smith if (dim == 1) { 
737ce308e1dSBarry Smith if (dd->ofill) { 738ce308e1dSBarry Smith ierr = DMCreateMatrix_DA_1d_MPIAIJ_Fill(da,A);CHKERRQ(ierr); 739ce308e1dSBarry Smith } else { 740950540a4SJed Brown ierr = DMCreateMatrix_DA_1d_MPIAIJ(da,A);CHKERRQ(ierr); 741ce308e1dSBarry Smith } 74247c6ae99SBarry Smith } else if (dim == 2) { 74347c6ae99SBarry Smith if (dd->ofill) { 744950540a4SJed Brown ierr = DMCreateMatrix_DA_2d_MPIAIJ_Fill(da,A);CHKERRQ(ierr); 74547c6ae99SBarry Smith } else { 746950540a4SJed Brown ierr = DMCreateMatrix_DA_2d_MPIAIJ(da,A);CHKERRQ(ierr); 74747c6ae99SBarry Smith } 74847c6ae99SBarry Smith } else if (dim == 3) { 74947c6ae99SBarry Smith if (dd->ofill) { 750950540a4SJed Brown ierr = DMCreateMatrix_DA_3d_MPIAIJ_Fill(da,A);CHKERRQ(ierr); 75147c6ae99SBarry Smith } else { 752950540a4SJed Brown ierr = DMCreateMatrix_DA_3d_MPIAIJ(da,A);CHKERRQ(ierr); 75347c6ae99SBarry Smith } 75447c6ae99SBarry Smith } 75547c6ae99SBarry Smith } else if (baij) { 75647c6ae99SBarry Smith if (dim == 2) { 757950540a4SJed Brown ierr = DMCreateMatrix_DA_2d_MPIBAIJ(da,A);CHKERRQ(ierr); 75847c6ae99SBarry Smith } else if (dim == 3) { 759950540a4SJed Brown ierr = DMCreateMatrix_DA_3d_MPIBAIJ(da,A);CHKERRQ(ierr); 760ce94432eSBarry Smith } else SETERRQ3(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"Not implemented for %D dimension and Matrix Type: %s in %D dimension! Send mail to petsc-maint@mcs.anl.gov for code",dim,Atype,dim); 76147c6ae99SBarry Smith } else if (sbaij) { 76247c6ae99SBarry Smith if (dim == 2) { 763950540a4SJed Brown ierr = DMCreateMatrix_DA_2d_MPISBAIJ(da,A);CHKERRQ(ierr); 76447c6ae99SBarry Smith } else if (dim == 3) { 765950540a4SJed Brown ierr = DMCreateMatrix_DA_3d_MPISBAIJ(da,A);CHKERRQ(ierr); 766ce94432eSBarry Smith } else SETERRQ3(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"Not implemented for %D dimension and Matrix Type: %s in %D dimension! 
Send mail to petsc-maint@mcs.anl.gov for code",dim,Atype,dim); 767d4002b98SHong Zhang } else if (sell) { 7685e26d47bSHong Zhang if (dim == 2) { 769d4002b98SHong Zhang ierr = DMCreateMatrix_DA_2d_MPISELL(da,A);CHKERRQ(ierr); 770711261dbSHong Zhang } else if (dim == 3) { 771d4002b98SHong Zhang ierr = DMCreateMatrix_DA_3d_MPISELL(da,A);CHKERRQ(ierr); 7725e26d47bSHong Zhang } else SETERRQ3(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"Not implemented for %D dimension and Matrix Type: %s in %D dimension! Send mail to petsc-maint@mcs.anl.gov for code",dim,Atype,dim); 773e584696dSStefano Zampini } else if (is) { 774e584696dSStefano Zampini ierr = DMCreateMatrix_DA_IS(da,A);CHKERRQ(ierr); 775869776cdSLisandro Dalcin } else { 77645b6f7e9SBarry Smith ISLocalToGlobalMapping ltog; 777e584696dSStefano Zampini 778b026d285SBarry Smith ierr = MatSetBlockSize(A,dof);CHKERRQ(ierr); 7792949035bSJed Brown ierr = MatSetUp(A);CHKERRQ(ierr); 780b026d285SBarry Smith ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 781869776cdSLisandro Dalcin ierr = MatSetLocalToGlobalMapping(A,ltog,ltog);CHKERRQ(ierr); 78247c6ae99SBarry Smith } 783aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&starts[0],&starts[1],&starts[2],&dims[0],&dims[1],&dims[2]);CHKERRQ(ierr); 78447c6ae99SBarry Smith ierr = MatSetStencil(A,dim,dims,starts,dof);CHKERRQ(ierr); 785c688c046SMatthew G Knepley ierr = MatSetDM(A,da);CHKERRQ(ierr); 78647c6ae99SBarry Smith ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 78747c6ae99SBarry Smith if (size > 1) { 78847c6ae99SBarry Smith /* change viewer to display matrix in natural ordering */ 7890c0fd78eSBarry Smith ierr = MatSetOperation(A, MATOP_VIEW, (void (*)(void))MatView_MPI_DA);CHKERRQ(ierr); 7900c0fd78eSBarry Smith ierr = MatSetOperation(A, MATOP_LOAD, (void (*)(void))MatLoad_MPI_DA);CHKERRQ(ierr); 79147c6ae99SBarry Smith } 792b5579763SJed Brown ierr = MatSetFromOptions(A);CHKERRQ(ierr); 79347c6ae99SBarry Smith *J = A; 79447c6ae99SBarry Smith PetscFunctionReturn(0); 
79547c6ae99SBarry Smith } 79647c6ae99SBarry Smith 79747c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/ 798e584696dSStefano Zampini PetscErrorCode DMCreateMatrix_DA_IS(DM dm,Mat J) 799e584696dSStefano Zampini { 800e584696dSStefano Zampini DM_DA *da = (DM_DA*)dm->data; 801e584696dSStefano Zampini Mat lJ; 802e584696dSStefano Zampini ISLocalToGlobalMapping ltog; 803e584696dSStefano Zampini IS is_loc_filt, is_glob; 80405339c03SStefano Zampini const PetscInt *e_loc,*idx; 80505339c03SStefano Zampini PetscInt i,nel,nen,dnz,nv,dof,dim,*gidx,nb; 806e584696dSStefano Zampini PetscErrorCode ierr; 807e584696dSStefano Zampini 808e584696dSStefano Zampini /* The l2g map of DMDA has all ghosted nodes, and e_loc is a subset of all the local nodes (including the ghosted) 809e584696dSStefano Zampini We need to filter the local indices that are represented through the DMDAGetElements decomposition 810e584696dSStefano Zampini This is because the size of the local matrices in MATIS is the local size of the l2g map */ 811e584696dSStefano Zampini PetscFunctionBegin; 812e584696dSStefano Zampini dof = da->w; 813e584696dSStefano Zampini dim = dm->dim; 81405339c03SStefano Zampini 81505339c03SStefano Zampini ierr = MatSetBlockSize(J,dof);CHKERRQ(ierr); 81605339c03SStefano Zampini 81705339c03SStefano Zampini /* get local elements indices in local DMDA numbering */ 818e584696dSStefano Zampini ierr = DMDAGetElements(dm,&nel,&nen,&e_loc);CHKERRQ(ierr); /* this will throw an error if the stencil type is not DMDA_STENCIL_BOX */ 819e584696dSStefano Zampini ierr = ISCreateBlock(PetscObjectComm((PetscObject)dm),dof,nel*nen,e_loc,PETSC_COPY_VALUES,&is_loc_filt);CHKERRQ(ierr); 820e584696dSStefano Zampini ierr = DMDARestoreElements(dm,&nel,&nen,&e_loc);CHKERRQ(ierr); 82105339c03SStefano Zampini 82205339c03SStefano Zampini /* obtain a consistent local ordering for MATIS */ 823e584696dSStefano Zampini ierr = ISSortRemoveDups(is_loc_filt);CHKERRQ(ierr); 
82405339c03SStefano Zampini ierr = ISBlockGetLocalSize(is_loc_filt,&nb);CHKERRQ(ierr); 82505339c03SStefano Zampini ierr = DMGetLocalToGlobalMapping(dm,<og);CHKERRQ(ierr); 82605339c03SStefano Zampini ierr = ISLocalToGlobalMappingGetSize(ltog,&nv);CHKERRQ(ierr); 82705339c03SStefano Zampini ierr = PetscMalloc1(PetscMax(nb,nv/dof),&gidx);CHKERRQ(ierr); 82805339c03SStefano Zampini ierr = ISBlockGetIndices(is_loc_filt,&idx);CHKERRQ(ierr); 82905339c03SStefano Zampini ierr = ISLocalToGlobalMappingApplyBlock(ltog,nb,idx,gidx);CHKERRQ(ierr); 83005339c03SStefano Zampini ierr = ISBlockRestoreIndices(is_loc_filt,&idx);CHKERRQ(ierr); 83105339c03SStefano Zampini ierr = ISCreateBlock(PetscObjectComm((PetscObject)dm),dof,nb,gidx,PETSC_USE_POINTER,&is_glob);CHKERRQ(ierr); 832e584696dSStefano Zampini ierr = ISLocalToGlobalMappingCreateIS(is_glob,<og);CHKERRQ(ierr); 833e584696dSStefano Zampini ierr = ISDestroy(&is_glob);CHKERRQ(ierr); 834e584696dSStefano Zampini ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 835e584696dSStefano Zampini ierr = ISLocalToGlobalMappingDestroy(<og);CHKERRQ(ierr); 83605339c03SStefano Zampini 837e584696dSStefano Zampini /* We also attach a l2g map to the local matrices to have MatSetValueLocal to work */ 838e584696dSStefano Zampini ierr = MatISGetLocalMat(J,&lJ);CHKERRQ(ierr); 839e584696dSStefano Zampini ierr = ISLocalToGlobalMappingCreateIS(is_loc_filt,<og);CHKERRQ(ierr); 840e584696dSStefano Zampini ierr = ISDestroy(&is_loc_filt);CHKERRQ(ierr); 84105339c03SStefano Zampini ierr = ISCreateStride(PetscObjectComm((PetscObject)lJ),nv/dof,0,1,&is_glob);CHKERRQ(ierr); 84205339c03SStefano Zampini ierr = ISGetIndices(is_glob,&idx);CHKERRQ(ierr); 84305339c03SStefano Zampini ierr = ISGlobalToLocalMappingApplyBlock(ltog,IS_GTOLM_MASK,nv/dof,idx,&nb,gidx);CHKERRQ(ierr); 84405339c03SStefano Zampini ierr = ISRestoreIndices(is_glob,&idx);CHKERRQ(ierr); 845e584696dSStefano Zampini ierr = ISDestroy(&is_glob);CHKERRQ(ierr); 846e584696dSStefano Zampini ierr = 
ISLocalToGlobalMappingDestroy(<og);CHKERRQ(ierr); 847722d6fa8SStefano Zampini ierr = ISCreateBlock(PETSC_COMM_SELF,dof,nb,gidx,PETSC_USE_POINTER,&is_loc_filt);CHKERRQ(ierr); 848e584696dSStefano Zampini ierr = ISLocalToGlobalMappingCreateIS(is_loc_filt,<og);CHKERRQ(ierr); 849e584696dSStefano Zampini ierr = ISDestroy(&is_loc_filt);CHKERRQ(ierr); 850e584696dSStefano Zampini ierr = MatSetLocalToGlobalMapping(lJ,ltog,ltog);CHKERRQ(ierr); 851e584696dSStefano Zampini ierr = ISLocalToGlobalMappingDestroy(<og);CHKERRQ(ierr); 85205339c03SStefano Zampini ierr = PetscFree(gidx);CHKERRQ(ierr); 85305339c03SStefano Zampini 854e584696dSStefano Zampini /* Preallocation (not exact) */ 855e584696dSStefano Zampini switch (da->elementtype) { 856e584696dSStefano Zampini case DMDA_ELEMENT_P1: 857e584696dSStefano Zampini case DMDA_ELEMENT_Q1: 858e584696dSStefano Zampini dnz = 1; 859e584696dSStefano Zampini for (i=0; i<dim; i++) dnz *= 3; 860e584696dSStefano Zampini dnz *= dof; 861e584696dSStefano Zampini break; 862e584696dSStefano Zampini default: 863e584696dSStefano Zampini SETERRQ1(PetscObjectComm((PetscObject)dm),PETSC_ERR_SUP,"Unhandled element type %d",da->elementtype); 864e584696dSStefano Zampini break; 865e584696dSStefano Zampini } 866e584696dSStefano Zampini ierr = MatSeqAIJSetPreallocation(lJ,dnz,NULL);CHKERRQ(ierr); 867e584696dSStefano Zampini ierr = MatSeqBAIJSetPreallocation(lJ,dof,dnz/dof,NULL);CHKERRQ(ierr); 868e584696dSStefano Zampini ierr = MatSeqSBAIJSetPreallocation(lJ,dof,dnz/dof,NULL);CHKERRQ(ierr); 869e584696dSStefano Zampini ierr = MatISRestoreLocalMat(J,&lJ);CHKERRQ(ierr); 870e584696dSStefano Zampini PetscFunctionReturn(0); 871e584696dSStefano Zampini } 872e584696dSStefano Zampini 873d4002b98SHong Zhang PetscErrorCode DMCreateMatrix_DA_2d_MPISELL(DM da,Mat J) 8745e26d47bSHong Zhang { 8755e26d47bSHong Zhang PetscErrorCode ierr; 8765e26d47bSHong Zhang PetscInt xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny,m,n,dim,s,*cols = NULL,k,nc,*rows = NULL,col,cnt,l,p; 8775e26d47bSHong 
Zhang PetscInt lstart,lend,pstart,pend,*dnz,*onz; 8785e26d47bSHong Zhang MPI_Comm comm; 8795e26d47bSHong Zhang PetscScalar *values; 8805e26d47bSHong Zhang DMBoundaryType bx,by; 8815e26d47bSHong Zhang ISLocalToGlobalMapping ltog; 8825e26d47bSHong Zhang DMDAStencilType st; 8835e26d47bSHong Zhang 8845e26d47bSHong Zhang PetscFunctionBegin; 8855e26d47bSHong Zhang /* 8865e26d47bSHong Zhang nc - number of components per grid point 8875e26d47bSHong Zhang col - number of colors needed in one direction for single component problem 8885e26d47bSHong Zhang 8895e26d47bSHong Zhang */ 8905e26d47bSHong Zhang ierr = DMDAGetInfo(da,&dim,&m,&n,0,0,0,0,&nc,&s,&bx,&by,0,&st);CHKERRQ(ierr); 8915e26d47bSHong Zhang col = 2*s + 1; 8925e26d47bSHong Zhang ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr); 8935e26d47bSHong Zhang ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr); 8945e26d47bSHong Zhang ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 8955e26d47bSHong Zhang 8965e26d47bSHong Zhang ierr = PetscMalloc2(nc,&rows,col*col*nc*nc,&cols);CHKERRQ(ierr); 8975e26d47bSHong Zhang ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 8985e26d47bSHong Zhang 8995e26d47bSHong Zhang ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr); 9005e26d47bSHong Zhang /* determine the matrix preallocation information */ 9015e26d47bSHong Zhang ierr = MatPreallocateInitialize(comm,nc*nx*ny,nc*nx*ny,dnz,onz);CHKERRQ(ierr); 9025e26d47bSHong Zhang for (i=xs; i<xs+nx; i++) { 9035e26d47bSHong Zhang 9045e26d47bSHong Zhang pstart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 9055e26d47bSHong Zhang pend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 9065e26d47bSHong Zhang 9075e26d47bSHong Zhang for (j=ys; j<ys+ny; j++) { 9085e26d47bSHong Zhang slot = i - gxs + gnx*(j - gys); 9095e26d47bSHong Zhang 9105e26d47bSHong Zhang lstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 9115e26d47bSHong Zhang lend = (by == DM_BOUNDARY_PERIODIC) ? 
s : (PetscMin(s,n-j-1)); 9125e26d47bSHong Zhang 9135e26d47bSHong Zhang cnt = 0; 9145e26d47bSHong Zhang for (k=0; k<nc; k++) { 9155e26d47bSHong Zhang for (l=lstart; l<lend+1; l++) { 9165e26d47bSHong Zhang for (p=pstart; p<pend+1; p++) { 9175e26d47bSHong Zhang if ((st == DMDA_STENCIL_BOX) || (!l || !p)) { /* entries on star have either l = 0 or p = 0 */ 9185e26d47bSHong Zhang cols[cnt++] = k + nc*(slot + gnx*l + p); 9195e26d47bSHong Zhang } 9205e26d47bSHong Zhang } 9215e26d47bSHong Zhang } 9225e26d47bSHong Zhang rows[k] = k + nc*(slot); 9235e26d47bSHong Zhang } 9245e26d47bSHong Zhang ierr = MatPreallocateSetLocal(ltog,nc,rows,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr); 9255e26d47bSHong Zhang } 9265e26d47bSHong Zhang } 9275e26d47bSHong Zhang ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr); 928d4002b98SHong Zhang ierr = MatSeqSELLSetPreallocation(J,0,dnz);CHKERRQ(ierr); 929d4002b98SHong Zhang ierr = MatMPISELLSetPreallocation(J,0,dnz,0,onz);CHKERRQ(ierr); 9305e26d47bSHong Zhang ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 9315e26d47bSHong Zhang 9325e26d47bSHong Zhang ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 9335e26d47bSHong Zhang 9345e26d47bSHong Zhang /* 9355e26d47bSHong Zhang For each node in the grid: we get the neighbors in the local (on processor ordering 9365e26d47bSHong Zhang that includes the ghost points) then MatSetValuesLocal() maps those indices to the global 9375e26d47bSHong Zhang PETSc ordering. 9385e26d47bSHong Zhang */ 9395e26d47bSHong Zhang if (!da->prealloc_only) { 9405e26d47bSHong Zhang ierr = PetscCalloc1(col*col*nc*nc,&values);CHKERRQ(ierr); 9415e26d47bSHong Zhang for (i=xs; i<xs+nx; i++) { 9425e26d47bSHong Zhang 9435e26d47bSHong Zhang pstart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 9445e26d47bSHong Zhang pend = (bx == DM_BOUNDARY_PERIODIC) ? 
s : (PetscMin(s,m-i-1)); 9455e26d47bSHong Zhang 9465e26d47bSHong Zhang for (j=ys; j<ys+ny; j++) { 9475e26d47bSHong Zhang slot = i - gxs + gnx*(j - gys); 9485e26d47bSHong Zhang 9495e26d47bSHong Zhang lstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 9505e26d47bSHong Zhang lend = (by == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 9515e26d47bSHong Zhang 9525e26d47bSHong Zhang cnt = 0; 9535e26d47bSHong Zhang for (k=0; k<nc; k++) { 9545e26d47bSHong Zhang for (l=lstart; l<lend+1; l++) { 9555e26d47bSHong Zhang for (p=pstart; p<pend+1; p++) { 9565e26d47bSHong Zhang if ((st == DMDA_STENCIL_BOX) || (!l || !p)) { /* entries on star have either l = 0 or p = 0 */ 9575e26d47bSHong Zhang cols[cnt++] = k + nc*(slot + gnx*l + p); 9585e26d47bSHong Zhang } 9595e26d47bSHong Zhang } 9605e26d47bSHong Zhang } 9615e26d47bSHong Zhang rows[k] = k + nc*(slot); 9625e26d47bSHong Zhang } 9635e26d47bSHong Zhang ierr = MatSetValuesLocal(J,nc,rows,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 9645e26d47bSHong Zhang } 9655e26d47bSHong Zhang } 9665e26d47bSHong Zhang ierr = PetscFree(values);CHKERRQ(ierr); 9675e26d47bSHong Zhang ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 9685e26d47bSHong Zhang ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 9695e26d47bSHong Zhang ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr); 9705e26d47bSHong Zhang } 9715e26d47bSHong Zhang ierr = PetscFree2(rows,cols);CHKERRQ(ierr); 9725e26d47bSHong Zhang PetscFunctionReturn(0); 9735e26d47bSHong Zhang } 9745e26d47bSHong Zhang 975d4002b98SHong Zhang PetscErrorCode DMCreateMatrix_DA_3d_MPISELL(DM da,Mat J) 976711261dbSHong Zhang { 977711261dbSHong Zhang PetscErrorCode ierr; 978711261dbSHong Zhang PetscInt xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny; 979711261dbSHong Zhang PetscInt m,n,dim,s,*cols = NULL,k,nc,*rows = NULL,col,cnt,l,p,*dnz = NULL,*onz = NULL; 980711261dbSHong Zhang PetscInt istart,iend,jstart,jend,kstart,kend,zs,nz,gzs,gnz,ii,jj,kk,M,N,P; 
981711261dbSHong Zhang MPI_Comm comm; 982711261dbSHong Zhang PetscScalar *values; 983711261dbSHong Zhang DMBoundaryType bx,by,bz; 984711261dbSHong Zhang ISLocalToGlobalMapping ltog; 985711261dbSHong Zhang DMDAStencilType st; 986711261dbSHong Zhang 987711261dbSHong Zhang PetscFunctionBegin; 988711261dbSHong Zhang /* 989711261dbSHong Zhang nc - number of components per grid point 990711261dbSHong Zhang col - number of colors needed in one direction for single component problem 991711261dbSHong Zhang 992711261dbSHong Zhang */ 993711261dbSHong Zhang ierr = DMDAGetInfo(da,&dim,&m,&n,&p,&M,&N,&P,&nc,&s,&bx,&by,&bz,&st);CHKERRQ(ierr); 994711261dbSHong Zhang col = 2*s + 1; 995711261dbSHong Zhang ierr = DMDAGetCorners(da,&xs,&ys,&zs,&nx,&ny,&nz);CHKERRQ(ierr); 996711261dbSHong Zhang ierr = DMDAGetGhostCorners(da,&gxs,&gys,&gzs,&gnx,&gny,&gnz);CHKERRQ(ierr); 997711261dbSHong Zhang ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 998711261dbSHong Zhang 999711261dbSHong Zhang ierr = PetscMalloc2(nc,&rows,col*col*col*nc*nc,&cols);CHKERRQ(ierr); 1000711261dbSHong Zhang ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 1001711261dbSHong Zhang 1002711261dbSHong Zhang ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr); 1003711261dbSHong Zhang /* determine the matrix preallocation information */ 1004711261dbSHong Zhang ierr = MatPreallocateInitialize(comm,nc*nx*ny*nz,nc*nx*ny*nz,dnz,onz);CHKERRQ(ierr); 1005711261dbSHong Zhang for (i=xs; i<xs+nx; i++) { 1006711261dbSHong Zhang istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 1007711261dbSHong Zhang iend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 1008711261dbSHong Zhang for (j=ys; j<ys+ny; j++) { 1009711261dbSHong Zhang jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 1010711261dbSHong Zhang jend = (by == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 1011711261dbSHong Zhang for (k=zs; k<zs+nz; k++) { 1012711261dbSHong Zhang kstart = (bz == DM_BOUNDARY_PERIODIC) ? 
-s : (PetscMax(-s,-k)); 1013711261dbSHong Zhang kend = (bz == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,p-k-1)); 1014711261dbSHong Zhang 1015711261dbSHong Zhang slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 1016711261dbSHong Zhang 1017711261dbSHong Zhang cnt = 0; 1018711261dbSHong Zhang for (l=0; l<nc; l++) { 1019711261dbSHong Zhang for (ii=istart; ii<iend+1; ii++) { 1020711261dbSHong Zhang for (jj=jstart; jj<jend+1; jj++) { 1021711261dbSHong Zhang for (kk=kstart; kk<kend+1; kk++) { 1022711261dbSHong Zhang if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/ 1023711261dbSHong Zhang cols[cnt++] = l + nc*(slot + ii + gnx*jj + gnx*gny*kk); 1024711261dbSHong Zhang } 1025711261dbSHong Zhang } 1026711261dbSHong Zhang } 1027711261dbSHong Zhang } 1028711261dbSHong Zhang rows[l] = l + nc*(slot); 1029711261dbSHong Zhang } 1030711261dbSHong Zhang ierr = MatPreallocateSetLocal(ltog,nc,rows,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr); 1031711261dbSHong Zhang } 1032711261dbSHong Zhang } 1033711261dbSHong Zhang } 1034711261dbSHong Zhang ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr); 1035d4002b98SHong Zhang ierr = MatSeqSELLSetPreallocation(J,0,dnz);CHKERRQ(ierr); 1036d4002b98SHong Zhang ierr = MatMPISELLSetPreallocation(J,0,dnz,0,onz);CHKERRQ(ierr); 1037711261dbSHong Zhang ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 1038711261dbSHong Zhang ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 1039711261dbSHong Zhang 1040711261dbSHong Zhang /* 1041711261dbSHong Zhang For each node in the grid: we get the neighbors in the local (on processor ordering 1042711261dbSHong Zhang that includes the ghost points) then MatSetValuesLocal() maps those indices to the global 1043711261dbSHong Zhang PETSc ordering. 
1044711261dbSHong Zhang */ 1045711261dbSHong Zhang if (!da->prealloc_only) { 1046711261dbSHong Zhang ierr = PetscCalloc1(col*col*col*nc*nc*nc,&values);CHKERRQ(ierr); 1047711261dbSHong Zhang for (i=xs; i<xs+nx; i++) { 1048711261dbSHong Zhang istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 1049711261dbSHong Zhang iend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 1050711261dbSHong Zhang for (j=ys; j<ys+ny; j++) { 1051711261dbSHong Zhang jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 1052711261dbSHong Zhang jend = (by == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 1053711261dbSHong Zhang for (k=zs; k<zs+nz; k++) { 1054711261dbSHong Zhang kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k)); 1055711261dbSHong Zhang kend = (bz == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,p-k-1)); 1056711261dbSHong Zhang 1057711261dbSHong Zhang slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 1058711261dbSHong Zhang 1059711261dbSHong Zhang cnt = 0; 1060711261dbSHong Zhang for (l=0; l<nc; l++) { 1061711261dbSHong Zhang for (ii=istart; ii<iend+1; ii++) { 1062711261dbSHong Zhang for (jj=jstart; jj<jend+1; jj++) { 1063711261dbSHong Zhang for (kk=kstart; kk<kend+1; kk++) { 1064711261dbSHong Zhang if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/ 1065711261dbSHong Zhang cols[cnt++] = l + nc*(slot + ii + gnx*jj + gnx*gny*kk); 1066711261dbSHong Zhang } 1067711261dbSHong Zhang } 1068711261dbSHong Zhang } 1069711261dbSHong Zhang } 1070711261dbSHong Zhang rows[l] = l + nc*(slot); 1071711261dbSHong Zhang } 1072711261dbSHong Zhang ierr = MatSetValuesLocal(J,nc,rows,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 1073711261dbSHong Zhang } 1074711261dbSHong Zhang } 1075711261dbSHong Zhang } 1076711261dbSHong Zhang ierr = PetscFree(values);CHKERRQ(ierr); 1077711261dbSHong Zhang ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1078711261dbSHong Zhang ierr = 
MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1079711261dbSHong Zhang ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr); 1080711261dbSHong Zhang } 1081711261dbSHong Zhang ierr = PetscFree2(rows,cols);CHKERRQ(ierr); 1082711261dbSHong Zhang PetscFunctionReturn(0); 1083711261dbSHong Zhang } 1084711261dbSHong Zhang
/*
   DMCreateMatrix_DA_2d_MPIAIJ - Sets the nonzero structure of J for a 2d DMDA, coupling all nc
   components of a grid point with all nc components of every point in its stencil.

   Input Parameters:
+  da - the DMDA
-  J  - the matrix; its block size, AIJ preallocation and local-to-global mapping are set here

   Notes:
   Pass 1 builds, per grid point, the list of coupled columns in the local (ghosted) numbering and
   hands it to the MatPreallocate macros. Pass 2, skipped when da->prealloc_only is set, inserts
   explicit zeros at the same locations, assembles J and sets MAT_NEW_NONZERO_LOCATION_ERR.
*/
PetscErrorCode DMCreateMatrix_DA_2d_MPIAIJ(DM da,Mat J)
{
  PetscErrorCode         ierr;
  PetscInt               xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny,m,n,s,*cols = NULL,k,nc,*rows = NULL,col,cnt,l,p;
  PetscInt               lstart,lend,pstart,pend,*dnz,*onz;
  MPI_Comm               comm;
  PetscScalar            *values;
  DMBoundaryType         bx,by;
  ISLocalToGlobalMapping ltog;
  DMDAStencilType        st;
  PetscBool              removedups = PETSC_FALSE;

  PetscFunctionBegin;
  /*
         nc - number of components per grid point
         col - number of colors needed in one direction for single component problem

     DMDAGetInfo() takes the three global sizes first and the three process counts after them;
     only the global sizes m (x) and n (y) are needed here.
  */
  ierr = DMDAGetInfo(da,NULL,&m,&n,NULL,NULL,NULL,NULL,&nc,&s,&bx,&by,NULL,&st);CHKERRQ(ierr);
  col  = 2*s + 1;
  /*
       In a skinny periodic direction (extent <= 2*s) the stencil wraps around the end of the domain and
       reaches an entry already counted from the other side, so the column list contains duplicates.
       That depends only on the extent, not on the process layout, so test the extents directly.
       Taking the duplicate-removing path when it is not strictly needed is harmless.
  */
  if (2*s >= m || 2*s >= n) removedups = PETSC_TRUE;
  ierr = DMDAGetCorners(da,&xs,&ys,NULL,&nx,&ny,NULL);CHKERRQ(ierr);
  ierr = DMDAGetGhostCorners(da,&gxs,&gys,NULL,&gnx,&gny,NULL);CHKERRQ(ierr);
  ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr);

  /* one row index per component; at most col*col stencil points times nc columns for each of them */
  ierr = PetscMalloc2(nc,&rows,col*col*nc*nc,&cols);CHKERRQ(ierr);
  ierr = DMGetLocalToGlobalMapping(da,&ltog);CHKERRQ(ierr);

  ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr);
  /* determine the matrix preallocation information */
  ierr = MatPreallocateInitialize(comm,nc*nx*ny,nc*nx*ny,dnz,onz);CHKERRQ(ierr);
  for (i=xs; i<xs+nx; i++) {

    /* x offsets of the stencil: full width when periodic, otherwise clipped to [0,m-1] */
    pstart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
    pend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));

    for (j=ys; j<ys+ny; j++) {
      /* index of grid point (i,j) in the ghosted local array */
      slot = i - gxs + gnx*(j - gys);

      lstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
      lend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));

      cnt = 0;
      for (k=0; k<nc; k++) {
        for (l=lstart; l<lend+1; l++) {
          for (p=pstart; p<pend+1; p++) {
            if ((st == DMDA_STENCIL_BOX) || (!l || !p)) {  /* entries on star have either l = 0 or p = 0 */
              cols[cnt++] = k + nc*(slot + gnx*l + p);
            }
          }
        }
        rows[k] = k + nc*(slot);
      }
      if (removedups) {
        ierr = MatPreallocateSetLocalRemoveDups(ltog,nc,rows,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr);
      } else {
        ierr = MatPreallocateSetLocal(ltog,nc,rows,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr);
      }
    }
  }
  ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr);
  ierr = MatSeqAIJSetPreallocation(J,0,dnz);CHKERRQ(ierr);
  ierr = MatMPIAIJSetPreallocation(J,0,dnz,0,onz);CHKERRQ(ierr);
  ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr);

  ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr);

  /*
    For each node in the grid: we get the neighbors in the local (on processor ordering
    that includes the ghost points) then MatSetValuesLocal() maps those indices to the global
    PETSc ordering.
  */
  if (!da->prealloc_only) {
    /* zero block large enough for nc rows times the longest possible column list */
    ierr = PetscCalloc1(col*col*nc*nc,&values);CHKERRQ(ierr);
    for (i=xs; i<xs+nx; i++) {

      pstart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
      pend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));

      for (j=ys; j<ys+ny; j++) {
        slot = i - gxs + gnx*(j - gys);

        lstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
        lend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));

        cnt = 0;
        for (k=0; k<nc; k++) {
          for (l=lstart; l<lend+1; l++) {
            for (p=pstart; p<pend+1; p++) {
              if ((st == DMDA_STENCIL_BOX) || (!l || !p)) {  /* entries on star have either l = 0 or p = 0 */
                cols[cnt++] = k + nc*(slot + gnx*l + p);
              }
            }
          }
          rows[k] = k + nc*(slot);
        }
        ierr = MatSetValuesLocal(J,nc,rows,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
      }
    }
    ierr = PetscFree(values);CHKERRQ(ierr);
    ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
    ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
    ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr);
  }
  ierr = PetscFree2(rows,cols);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

/*
   DMCreateMatrix_DA_2d_MPIAIJ_Fill - Sets the nonzero structure of J for a 2d DMDA when block
   fill patterns are stored in the DMDA (dd->dfill, dd->ofill).

   Input Parameters:
+  da - the DMDA
-  J  - the matrix; its block size, AIJ preallocation and local-to-global mapping are set here

   Notes:
   The fill arrays use the modified CSR layout: fill[k] .. fill[k+1]-1 index the entries of the same
   array that hold the component numbers coupled to component k. ofill is applied to every stencil
   neighbour and is dereferenced unconditionally, so it must be non-NULL here. dfill is applied to
   the grid point itself; a NULL dfill couples all nc components.

   Rows are handled one component at a time. Pass 1 preallocates and records the longest row in
   maxcnt; pass 2, skipped when da->prealloc_only is set, inserts explicit zeros, assembles J and
   sets MAT_NEW_NONZERO_LOCATION_ERR.
*/
PetscErrorCode DMCreateMatrix_DA_2d_MPIAIJ_Fill(DM da,Mat J)
{
  PetscErrorCode         ierr;
  PetscInt               xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny;
  PetscInt               m,n,s,*cols,k,nc,row,col,cnt,maxcnt = 0,l,p;
  PetscInt               lstart,lend,pstart,pend,*dnz,*onz;
  DM_DA                  *dd = (DM_DA*)da->data;
  PetscInt               ifill_col,*ofill = dd->ofill, *dfill = dd->dfill;
  MPI_Comm               comm;
  PetscScalar            *values;
  DMBoundaryType         bx,by;
  ISLocalToGlobalMapping ltog;
  DMDAStencilType        st;
  PetscBool              removedups = PETSC_FALSE;

  PetscFunctionBegin;
  /*
         nc - number of components per grid point
         col - number of colors needed in one direction for single component problem

     DMDAGetInfo() takes the three global sizes first and the three process counts after them;
     only the global sizes m (x) and n (y) are needed here.
  */
  ierr = DMDAGetInfo(da,NULL,&m,&n,NULL,NULL,NULL,NULL,&nc,&s,&bx,&by,NULL,&st);CHKERRQ(ierr);
  col  = 2*s + 1;
  /*
       In a skinny periodic direction (extent <= 2*s) the stencil wraps around the end of the domain and
       reaches an entry already counted from the other side, so the column list contains duplicates.
       That depends only on the extent, not on the process layout, so test the extents directly.
       Taking the duplicate-removing path when it is not strictly needed is harmless.
  */
  if (2*s >= m || 2*s >= n) removedups = PETSC_TRUE;
  ierr = DMDAGetCorners(da,&xs,&ys,NULL,&nx,&ny,NULL);CHKERRQ(ierr);
  ierr = DMDAGetGhostCorners(da,&gxs,&gys,NULL,&gnx,&gny,NULL);CHKERRQ(ierr);
  ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr);

  /* a single row touches at most col*col stencil points with at most nc components each */
  ierr = PetscMalloc1(col*col*nc,&cols);CHKERRQ(ierr);
  ierr = DMGetLocalToGlobalMapping(da,&ltog);CHKERRQ(ierr);

  ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr);
  /* determine the matrix preallocation information */
  ierr = MatPreallocateInitialize(comm,nc*nx*ny,nc*nx*ny,dnz,onz);CHKERRQ(ierr);
  for (i=xs; i<xs+nx; i++) {

    /* x offsets of the stencil: full width when periodic, otherwise clipped to [0,m-1] */
    pstart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
    pend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));

    for (j=ys; j<ys+ny; j++) {
      /* index of grid point (i,j) in the ghosted local array */
      slot = i - gxs + gnx*(j - gys);

      lstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
      lend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));

      for (k=0; k<nc; k++) {
        cnt = 0;
        for (l=lstart; l<lend+1; l++) {
          for (p=pstart; p<pend+1; p++) {
            if (l || p) {
              /* a neighbouring grid point: use the off-diagonal fill pattern */
              if ((st == DMDA_STENCIL_BOX) || (!l || !p)) {  /* entries on star */
                for (ifill_col=ofill[k]; ifill_col<ofill[k+1]; ifill_col++) cols[cnt++] = ofill[ifill_col] + nc*(slot + gnx*l + p);
              }
            } else {
              /* the grid point itself: diagonal fill pattern, or dense when none was given */
              if (dfill) {
                for (ifill_col=dfill[k]; ifill_col<dfill[k+1]; ifill_col++) cols[cnt++] = dfill[ifill_col] + nc*(slot + gnx*l + p);
              } else {
                for (ifill_col=0; ifill_col<nc; ifill_col++) cols[cnt++] = ifill_col + nc*(slot + gnx*l + p);
              }
            }
          }
        }
        row    = k + nc*(slot);
        /* record the length before the duplicate-removing macro can shrink cnt */
        maxcnt = PetscMax(maxcnt,cnt);
        if (removedups) {
          ierr = MatPreallocateSetLocalRemoveDups(ltog,1,&row,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr);
        } else {
          ierr = MatPreallocateSetLocal(ltog,1,&row,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr);
        }
      }
    }
  }
  ierr = MatSeqAIJSetPreallocation(J,0,dnz);CHKERRQ(ierr);
  ierr = MatMPIAIJSetPreallocation(J,0,dnz,0,onz);CHKERRQ(ierr);
  ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr);
  ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr);

  /*
    For each node in the grid: we get the neighbors in the local (on processor ordering
    that includes the ghost points) then MatSetValuesLocal() maps those indices to the global
    PETSc ordering.
  */
  if (!da->prealloc_only) {
    /* one zero per column of the longest row found during preallocation */
    ierr = PetscCalloc1(maxcnt,&values);CHKERRQ(ierr);
    for (i=xs; i<xs+nx; i++) {

      pstart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
      pend   = (bx == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));

      for (j=ys; j<ys+ny; j++) {
        slot = i - gxs + gnx*(j - gys);

        lstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
        lend   = (by == DM_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));

        for (k=0; k<nc; k++) {
          cnt = 0;
          for (l=lstart; l<lend+1; l++) {
            for (p=pstart; p<pend+1; p++) {
              if (l || p) {
                if ((st == DMDA_STENCIL_BOX) || (!l || !p)) {  /* entries on star */
                  for (ifill_col=ofill[k]; ifill_col<ofill[k+1]; ifill_col++) cols[cnt++] = ofill[ifill_col] + nc*(slot + gnx*l + p);
                }
              } else {
                if (dfill) {
                  for (ifill_col=dfill[k]; ifill_col<dfill[k+1]; ifill_col++) cols[cnt++] = dfill[ifill_col] + nc*(slot + gnx*l + p);
                } else {
                  for (ifill_col=0; ifill_col<nc; ifill_col++) cols[cnt++] = ifill_col + nc*(slot + gnx*l + p);
                }
              }
            }
          }
          row  = k + nc*(slot);
          ierr = MatSetValuesLocal(J,1,&row,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
        }
      }
    }
    ierr = PetscFree(values);CHKERRQ(ierr);
    ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
    ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
    ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr);
  }
  ierr = PetscFree(cols);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}
132847c6ae99SBarry Smith 132947c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/ 133047c6ae99SBarry Smith 1331950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_3d_MPIAIJ(DM da,Mat J) 133247c6ae99SBarry Smith { 133347c6ae99SBarry Smith PetscErrorCode ierr; 133447c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny; 13350298fd71SBarry Smith PetscInt m,n,dim,s,*cols = NULL,k,nc,*rows = NULL,col,cnt,l,p,*dnz = NULL,*onz = NULL; 1336c1154cd5SBarry Smith PetscInt istart,iend,jstart,jend,kstart,kend,zs,nz,gzs,gnz,ii,jj,kk,M,N,P; 133747c6ae99SBarry Smith MPI_Comm comm; 133847c6ae99SBarry Smith PetscScalar *values; 1339bff4a2f0SMatthew G.
Knepley DMBoundaryType bx,by,bz; 134045b6f7e9SBarry Smith ISLocalToGlobalMapping ltog; 1341aa219208SBarry Smith DMDAStencilType st; 1342c1154cd5SBarry Smith PetscBool removedups = PETSC_FALSE; 134347c6ae99SBarry Smith 134447c6ae99SBarry Smith PetscFunctionBegin; 134547c6ae99SBarry Smith /* 134647c6ae99SBarry Smith nc - number of components per grid point 134747c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 134847c6ae99SBarry Smith 134947c6ae99SBarry Smith */ 1350c1154cd5SBarry Smith ierr = DMDAGetInfo(da,&dim,&m,&n,&p,&M,&N,&P,&nc,&s,&bx,&by,&bz,&st);CHKERRQ(ierr); 135147c6ae99SBarry Smith col = 2*s + 1; 135247c6ae99SBarry Smith 1353c1154cd5SBarry Smith /* 1354c1154cd5SBarry Smith With one processor in periodic domains in a skinny dimension the code will label nonzero columns multiple times 1355c1154cd5SBarry Smith because of "wrapping" around the end of the domain hitting an entry already counted in the other direction. 1356c1154cd5SBarry Smith */ 1357c1154cd5SBarry Smith if (M == 1 && 2*s >= m) removedups = PETSC_TRUE; 1358c1154cd5SBarry Smith if (N == 1 && 2*s >= n) removedups = PETSC_TRUE; 1359c1154cd5SBarry Smith if (P == 1 && 2*s >= p) removedups = PETSC_TRUE; 1360c1154cd5SBarry Smith 1361aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,&zs,&nx,&ny,&nz);CHKERRQ(ierr); 1362aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,&gzs,&gnx,&gny,&gnz);CHKERRQ(ierr); 136347c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 136447c6ae99SBarry Smith 1365dcca6d9dSJed Brown ierr = PetscMalloc2(nc,&rows,col*col*col*nc*nc,&cols);CHKERRQ(ierr); 13661411c6eeSJed Brown ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 136747c6ae99SBarry Smith 136806ca8cadSBarry Smith ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr); 136947c6ae99SBarry Smith /* determine the matrix preallocation information */ 137047c6ae99SBarry Smith ierr = 
MatPreallocateInitialize(comm,nc*nx*ny*nz,nc*nx*ny*nz,dnz,onz);CHKERRQ(ierr); 137147c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 1372bff4a2f0SMatthew G. Knepley istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 1373bff4a2f0SMatthew G. Knepley iend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 137447c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 1375bff4a2f0SMatthew G. Knepley jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 1376bff4a2f0SMatthew G. Knepley jend = (by == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 137747c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 1378bff4a2f0SMatthew G. Knepley kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k)); 1379bff4a2f0SMatthew G. Knepley kend = (bz == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,p-k-1)); 138047c6ae99SBarry Smith 138147c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 138247c6ae99SBarry Smith 138347c6ae99SBarry Smith cnt = 0; 138447c6ae99SBarry Smith for (l=0; l<nc; l++) { 138547c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 138647c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 138747c6ae99SBarry Smith for (kk=kstart; kk<kend+1; kk++) { 1388aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/ 138947c6ae99SBarry Smith cols[cnt++] = l + nc*(slot + ii + gnx*jj + gnx*gny*kk); 139047c6ae99SBarry Smith } 139147c6ae99SBarry Smith } 139247c6ae99SBarry Smith } 139347c6ae99SBarry Smith } 139447c6ae99SBarry Smith rows[l] = l + nc*(slot); 139547c6ae99SBarry Smith } 1396c1154cd5SBarry Smith if (removedups) { 1397c1154cd5SBarry Smith ierr = MatPreallocateSetLocalRemoveDups(ltog,nc,rows,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr); 1398c1154cd5SBarry Smith } else { 1399784ac674SJed Brown ierr = MatPreallocateSetLocal(ltog,nc,rows,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr); 140047c6ae99SBarry Smith } 140147c6ae99SBarry Smith } 140247c6ae99SBarry Smith } 1403c1154cd5SBarry Smith } 
1404f73d5cc4SBarry Smith ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr); 140547c6ae99SBarry Smith ierr = MatSeqAIJSetPreallocation(J,0,dnz);CHKERRQ(ierr); 140647c6ae99SBarry Smith ierr = MatMPIAIJSetPreallocation(J,0,dnz,0,onz);CHKERRQ(ierr); 140747c6ae99SBarry Smith ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 1408784ac674SJed Brown ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 140947c6ae99SBarry Smith 141047c6ae99SBarry Smith /* 141147c6ae99SBarry Smith For each node in the grid: we get the neighbors in the local (on processor ordering 141247c6ae99SBarry Smith that includes the ghost points) then MatSetValuesLocal() maps those indices to the global 141347c6ae99SBarry Smith PETSc ordering. 141447c6ae99SBarry Smith */ 1415fcfd50ebSBarry Smith if (!da->prealloc_only) { 14161795a4d1SJed Brown ierr = PetscCalloc1(col*col*col*nc*nc*nc,&values);CHKERRQ(ierr); 141747c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 1418bff4a2f0SMatthew G. Knepley istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 1419bff4a2f0SMatthew G. Knepley iend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 142047c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 1421bff4a2f0SMatthew G. Knepley jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 1422bff4a2f0SMatthew G. Knepley jend = (by == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 142347c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 1424bff4a2f0SMatthew G. Knepley kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k)); 1425bff4a2f0SMatthew G. Knepley kend = (bz == DM_BOUNDARY_PERIODIC) ? 
s : (PetscMin(s,p-k-1)); 142647c6ae99SBarry Smith 142747c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 142847c6ae99SBarry Smith 142947c6ae99SBarry Smith cnt = 0; 143047c6ae99SBarry Smith for (l=0; l<nc; l++) { 143147c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 143247c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 143347c6ae99SBarry Smith for (kk=kstart; kk<kend+1; kk++) { 1434aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/ 143547c6ae99SBarry Smith cols[cnt++] = l + nc*(slot + ii + gnx*jj + gnx*gny*kk); 143647c6ae99SBarry Smith } 143747c6ae99SBarry Smith } 143847c6ae99SBarry Smith } 143947c6ae99SBarry Smith } 144047c6ae99SBarry Smith rows[l] = l + nc*(slot); 144147c6ae99SBarry Smith } 144247c6ae99SBarry Smith ierr = MatSetValuesLocal(J,nc,rows,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 144347c6ae99SBarry Smith } 144447c6ae99SBarry Smith } 144547c6ae99SBarry Smith } 144647c6ae99SBarry Smith ierr = PetscFree(values);CHKERRQ(ierr); 144747c6ae99SBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 144847c6ae99SBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1449189e4007SBarry Smith ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr); 145047c6ae99SBarry Smith } 145147c6ae99SBarry Smith ierr = PetscFree2(rows,cols);CHKERRQ(ierr); 145247c6ae99SBarry Smith PetscFunctionReturn(0); 145347c6ae99SBarry Smith } 145447c6ae99SBarry Smith 145547c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/ 145647c6ae99SBarry Smith
/*
   DMCreateMatrix_DA_1d_MPIAIJ_Fill - Sets the nonzero structure of J for a non-periodic 1d DMDA
   when block fill patterns are stored in the DMDA (dd->dfill, dd->ofill).

   Input Parameters:
+  da - the DMDA; a periodic x boundary is rejected with PETSC_ERR_SUP
-  J  - the matrix; its block size, AIJ preallocation and local-to-global mapping are set here

   Notes:
   The fill arrays use the modified CSR layout: fill[j] .. fill[j+1]-1 index the entries of the same
   array that hold the component numbers coupled to component j. ofill is applied to every stencil
   neighbour and is dereferenced unconditionally, so it must be non-NULL here. dfill is applied to
   the grid point itself; a NULL dfill couples all nc components, in the counting pass as well as
   in the insertion pass.

   Grid point i is coupled to the points max(0,i-s) .. min(m-1,i+s). Both passes use that clamped
   range, so the counts stay inside the nx*nc work arrays for any local size and every in-domain
   neighbour that is preallocated is also inserted. Rows and columns are global indices
   (grid point * nc + component) passed to MatSetValues(); a column belongs to the diagonal block
   when its grid point lies in the locally owned range [xs,xs+nx).

   Unless da->prealloc_only is set, explicit zeros are inserted, J is assembled and
   MAT_NEW_NONZERO_LOCATION_ERR is set.
*/
PetscErrorCode DMCreateMatrix_DA_1d_MPIAIJ_Fill(DM da,Mat J)
{
  PetscErrorCode         ierr;
  DM_DA                  *dd = (DM_DA*)da->data;
  PetscInt               xs,nx,xe,m,s,nc,i,j,k,g,lo,hi,nin,nout,nd,no,row,cnt,maxcnt = 0;
  PetscInt               *dnnz = NULL,*onnz = NULL,*cols = NULL;
  PetscInt               *ofill = dd->ofill,*dfill = dd->dfill;
  PetscScalar            *values;
  ISLocalToGlobalMapping ltog;

  PetscFunctionBegin;
  if (dd->bx == DM_BOUNDARY_PERIODIC) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"With fill provided not implemented with periodic boundary conditions");

  /*
         m  - global number of grid points
         nc - number of components per grid point
         s  - stencil width
  */
  ierr = DMDAGetInfo(da,NULL,&m,NULL,NULL,NULL,NULL,NULL,&nc,&s,NULL,NULL,NULL,NULL);CHKERRQ(ierr);
  ierr = DMDAGetCorners(da,&xs,NULL,NULL,&nx,NULL,NULL);CHKERRQ(ierr);
  xe   = xs + nx; /* one past the last locally owned grid point */

  ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr);
  ierr = PetscCalloc2(nx*nc,&dnnz,nx*nc,&onnz);CHKERRQ(ierr);

  /* count, for every local row, the columns in the diagonal and off-diagonal blocks */
  cnt = 0;
  for (i=xs; i<xe; i++) {
    lo   = PetscMax(0,i-s);
    hi   = PetscMin(m-1,i+s);
    nin  = PetscMin(hi,xe-1) - PetscMax(lo,xs); /* neighbours owned by this process (i itself excluded) */
    nout = (hi - lo) - nin;                     /* neighbours owned by other processes */
    for (j=0; j<nc; j++) {
      nd         = dfill ? dfill[j+1] - dfill[j] : nc;
      no         = ofill[j+1] - ofill[j];
      dnnz[cnt]  = nd + nin*no;
      onnz[cnt]  = nout*no;
      maxcnt     = PetscMax(maxcnt,dnnz[cnt]+onnz[cnt]);
      cnt++;
    }
  }

  ierr = MatSeqAIJSetPreallocation(J,0,dnnz);CHKERRQ(ierr);
  ierr = MatMPIAIJSetPreallocation(J,0,dnnz,0,onnz);CHKERRQ(ierr);
  ierr = PetscFree2(dnnz,onnz);CHKERRQ(ierr);

  ierr = DMGetLocalToGlobalMapping(da,&ltog);CHKERRQ(ierr);
  ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr);

  /*
    For each locally owned row insert explicit zeros at every coupled column, using global
    indices directly.
  */
  if (!da->prealloc_only) {
    ierr = PetscCalloc2(maxcnt,&values,maxcnt,&cols);CHKERRQ(ierr);

    row = xs*nc;
    for (i=xs; i<xe; i++) {
      lo = PetscMax(0,i-s);
      hi = PetscMin(m-1,i+s);
      for (j=0; j<nc; j++) {
        cnt = 0;
        for (g=lo; g<=hi; g++) {
          if (g != i) {
            /* a neighbouring grid point: off-diagonal fill pattern */
            for (k=ofill[j]; k<ofill[j+1]; k++) cols[cnt++] = g*nc + ofill[k];
          } else if (dfill) {
            /* the grid point itself: diagonal fill pattern */
            for (k=dfill[j]; k<dfill[j+1]; k++) cols[cnt++] = g*nc + dfill[k];
          } else {
            /* the grid point itself with no pattern given: dense block */
            for (k=0; k<nc; k++) cols[cnt++] = g*nc + k;
          }
        }
        ierr = MatSetValues(J,1,&row,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
        row++;
      }
    }
    ierr = PetscFree2(values,cols);CHKERRQ(ierr);
    ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
    ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
    ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr);
  }
  PetscFunctionReturn(0);
}
1611ce308e1dSBarry Smith 1612ce308e1dSBarry Smith /* ---------------------------------------------------------------------------------*/ 1613ce308e1dSBarry Smith 1614950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_1d_MPIAIJ(DM da,Mat J) 161547c6ae99SBarry Smith { 161647c6ae99SBarry Smith PetscErrorCode ierr; 161747c6ae99SBarry Smith PetscInt xs,nx,i,i1,slot,gxs,gnx; 16180298fd71SBarry Smith PetscInt m,dim,s,*cols = NULL,nc,*rows = NULL,col,cnt,l; 161947c6ae99SBarry Smith PetscInt istart,iend; 162047c6ae99SBarry Smith PetscScalar *values; 1621bff4a2f0SMatthew G. Knepley DMBoundaryType bx; 162245b6f7e9SBarry Smith ISLocalToGlobalMapping ltog; 162347c6ae99SBarry Smith 162447c6ae99SBarry Smith PetscFunctionBegin; 162547c6ae99SBarry Smith /* 162647c6ae99SBarry Smith nc - number of components per grid point 162747c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 162847c6ae99SBarry Smith 162947c6ae99SBarry Smith */ 16301321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,0,0,0,0,0,&nc,&s,&bx,0,0,0);CHKERRQ(ierr); 163147c6ae99SBarry Smith col = 2*s + 1; 163247c6ae99SBarry Smith 1633aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,0,0,&nx,0,0);CHKERRQ(ierr); 1634aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,0,0,&gnx,0,0);CHKERRQ(ierr); 163547c6ae99SBarry Smith 1636f73d5cc4SBarry Smith ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr); 163747c6ae99SBarry Smith ierr = MatSeqAIJSetPreallocation(J,col*nc,0);CHKERRQ(ierr); 163847c6ae99SBarry Smith ierr = MatMPIAIJSetPreallocation(J,col*nc,0,col*nc,0);CHKERRQ(ierr); 163947c6ae99SBarry Smith 16401411c6eeSJed Brown ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 1641784ac674SJed Brown ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 164247c6ae99SBarry Smith 164347c6ae99SBarry Smith /* 164447c6ae99SBarry Smith For each node in the grid: we get the neighbors in the local (on processor
ordering 164547c6ae99SBarry Smith that includes the ghost points) then MatSetValuesLocal() maps those indices to the global 164647c6ae99SBarry Smith PETSc ordering. 164747c6ae99SBarry Smith */ 1648fcfd50ebSBarry Smith if (!da->prealloc_only) { 1649dcca6d9dSJed Brown ierr = PetscMalloc2(nc,&rows,col*nc*nc,&cols);CHKERRQ(ierr); 16501795a4d1SJed Brown ierr = PetscCalloc1(col*nc*nc,&values);CHKERRQ(ierr); 165147c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 165247c6ae99SBarry Smith istart = PetscMax(-s,gxs - i); 165347c6ae99SBarry Smith iend = PetscMin(s,gxs + gnx - i - 1); 165447c6ae99SBarry Smith slot = i - gxs; 165547c6ae99SBarry Smith 165647c6ae99SBarry Smith cnt = 0; 165747c6ae99SBarry Smith for (l=0; l<nc; l++) { 165847c6ae99SBarry Smith for (i1=istart; i1<iend+1; i1++) { 165947c6ae99SBarry Smith cols[cnt++] = l + nc*(slot + i1); 166047c6ae99SBarry Smith } 166147c6ae99SBarry Smith rows[l] = l + nc*(slot); 166247c6ae99SBarry Smith } 166347c6ae99SBarry Smith ierr = MatSetValuesLocal(J,nc,rows,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 166447c6ae99SBarry Smith } 166547c6ae99SBarry Smith ierr = PetscFree(values);CHKERRQ(ierr); 166647c6ae99SBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 166747c6ae99SBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1668189e4007SBarry Smith ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr); 166947c6ae99SBarry Smith ierr = PetscFree2(rows,cols);CHKERRQ(ierr); 1670ce308e1dSBarry Smith } 167147c6ae99SBarry Smith PetscFunctionReturn(0); 167247c6ae99SBarry Smith } 167347c6ae99SBarry Smith 1674950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_2d_MPIBAIJ(DM da,Mat J) 167547c6ae99SBarry Smith { 167647c6ae99SBarry Smith PetscErrorCode ierr; 167747c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny; 167847c6ae99SBarry Smith PetscInt m,n,dim,s,*cols,nc,col,cnt,*dnz,*onz; 167947c6ae99SBarry Smith PetscInt istart,iend,jstart,jend,ii,jj; 168047c6ae99SBarry 
Smith MPI_Comm comm; 168147c6ae99SBarry Smith PetscScalar *values; 1682bff4a2f0SMatthew G. Knepley DMBoundaryType bx,by; 1683aa219208SBarry Smith DMDAStencilType st; 168445b6f7e9SBarry Smith ISLocalToGlobalMapping ltog; 168547c6ae99SBarry Smith 168647c6ae99SBarry Smith PetscFunctionBegin; 168747c6ae99SBarry Smith /* 168847c6ae99SBarry Smith nc - number of components per grid point 168947c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 169047c6ae99SBarry Smith */ 16911321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,0,0,0,0,&nc,&s,&bx,&by,0,&st);CHKERRQ(ierr); 169247c6ae99SBarry Smith col = 2*s + 1; 169347c6ae99SBarry Smith 1694aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr); 1695aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr); 169647c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 169747c6ae99SBarry Smith 1698785e854fSJed Brown ierr = PetscMalloc1(col*col*nc*nc,&cols);CHKERRQ(ierr); 169947c6ae99SBarry Smith 17001411c6eeSJed Brown ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 170147c6ae99SBarry Smith 170247c6ae99SBarry Smith /* determine the matrix preallocation information */ 170347c6ae99SBarry Smith ierr = MatPreallocateInitialize(comm,nx*ny,nx*ny,dnz,onz);CHKERRQ(ierr); 170447c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 1705bff4a2f0SMatthew G. Knepley istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 1706bff4a2f0SMatthew G. Knepley iend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 170747c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 1708bff4a2f0SMatthew G. Knepley jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 1709bff4a2f0SMatthew G. Knepley jend = (by == DM_BOUNDARY_PERIODIC) ? 
s : (PetscMin(s,n-j-1)); 171047c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys); 171147c6ae99SBarry Smith 171247c6ae99SBarry Smith /* Find block columns in block row */ 171347c6ae99SBarry Smith cnt = 0; 171447c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 171547c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 1716aa219208SBarry Smith if (st == DMDA_STENCIL_BOX || !ii || !jj) { /* BOX or on the STAR */ 171747c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj; 171847c6ae99SBarry Smith } 171947c6ae99SBarry Smith } 172047c6ae99SBarry Smith } 1721d6e23781SBarry Smith ierr = MatPreallocateSetLocalBlock(ltog,1,&slot,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr); 172247c6ae99SBarry Smith } 172347c6ae99SBarry Smith } 172447c6ae99SBarry Smith ierr = MatSeqBAIJSetPreallocation(J,nc,0,dnz);CHKERRQ(ierr); 172547c6ae99SBarry Smith ierr = MatMPIBAIJSetPreallocation(J,nc,0,dnz,0,onz);CHKERRQ(ierr); 172647c6ae99SBarry Smith ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 172747c6ae99SBarry Smith 1728784ac674SJed Brown ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 172947c6ae99SBarry Smith 173047c6ae99SBarry Smith /* 173147c6ae99SBarry Smith For each node in the grid: we get the neighbors in the local (on processor ordering 173247c6ae99SBarry Smith that includes the ghost points) then MatSetValuesLocal() maps those indices to the global 173347c6ae99SBarry Smith PETSc ordering. 173447c6ae99SBarry Smith */ 1735fcfd50ebSBarry Smith if (!da->prealloc_only) { 17361795a4d1SJed Brown ierr = PetscCalloc1(col*col*nc*nc,&values);CHKERRQ(ierr); 173747c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 1738bff4a2f0SMatthew G. Knepley istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 1739bff4a2f0SMatthew G. Knepley iend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 174047c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 1741bff4a2f0SMatthew G. Knepley jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 1742bff4a2f0SMatthew G. 
Knepley jend = (by == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 174347c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys); 174447c6ae99SBarry Smith cnt = 0; 174547c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 174647c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 1747aa219208SBarry Smith if (st == DMDA_STENCIL_BOX || !ii || !jj) { /* BOX or on the STAR */ 174847c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj; 174947c6ae99SBarry Smith } 175047c6ae99SBarry Smith } 175147c6ae99SBarry Smith } 175247c6ae99SBarry Smith ierr = MatSetValuesBlockedLocal(J,1,&slot,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 175347c6ae99SBarry Smith } 175447c6ae99SBarry Smith } 175547c6ae99SBarry Smith ierr = PetscFree(values);CHKERRQ(ierr); 175647c6ae99SBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 175747c6ae99SBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1758189e4007SBarry Smith ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr); 175947c6ae99SBarry Smith } 176047c6ae99SBarry Smith ierr = PetscFree(cols);CHKERRQ(ierr); 176147c6ae99SBarry Smith PetscFunctionReturn(0); 176247c6ae99SBarry Smith } 176347c6ae99SBarry Smith 1764950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_3d_MPIBAIJ(DM da,Mat J) 176547c6ae99SBarry Smith { 176647c6ae99SBarry Smith PetscErrorCode ierr; 176747c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny; 176847c6ae99SBarry Smith PetscInt m,n,dim,s,*cols,k,nc,col,cnt,p,*dnz,*onz; 176947c6ae99SBarry Smith PetscInt istart,iend,jstart,jend,kstart,kend,zs,nz,gzs,gnz,ii,jj,kk; 177047c6ae99SBarry Smith MPI_Comm comm; 177147c6ae99SBarry Smith PetscScalar *values; 1772bff4a2f0SMatthew G. 
Knepley DMBoundaryType bx,by,bz; 1773aa219208SBarry Smith DMDAStencilType st; 177445b6f7e9SBarry Smith ISLocalToGlobalMapping ltog; 177547c6ae99SBarry Smith 177647c6ae99SBarry Smith PetscFunctionBegin; 177747c6ae99SBarry Smith /* 177847c6ae99SBarry Smith nc - number of components per grid point 177947c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 178047c6ae99SBarry Smith 178147c6ae99SBarry Smith */ 17821321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,&p,0,0,0,&nc,&s,&bx,&by,&bz,&st);CHKERRQ(ierr); 178347c6ae99SBarry Smith col = 2*s + 1; 178447c6ae99SBarry Smith 1785aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,&zs,&nx,&ny,&nz);CHKERRQ(ierr); 1786aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,&gzs,&gnx,&gny,&gnz);CHKERRQ(ierr); 178747c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 178847c6ae99SBarry Smith 1789785e854fSJed Brown ierr = PetscMalloc1(col*col*col,&cols);CHKERRQ(ierr); 179047c6ae99SBarry Smith 17911411c6eeSJed Brown ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 179247c6ae99SBarry Smith 179347c6ae99SBarry Smith /* determine the matrix preallocation information */ 179447c6ae99SBarry Smith ierr = MatPreallocateInitialize(comm,nx*ny*nz,nx*ny*nz,dnz,onz);CHKERRQ(ierr); 179547c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 1796bff4a2f0SMatthew G. Knepley istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 1797bff4a2f0SMatthew G. Knepley iend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 179847c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 1799bff4a2f0SMatthew G. Knepley jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 1800bff4a2f0SMatthew G. Knepley jend = (by == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 180147c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 1802bff4a2f0SMatthew G. Knepley kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k)); 1803bff4a2f0SMatthew G. 
Knepley kend = (bz == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,p-k-1)); 180447c6ae99SBarry Smith 180547c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 180647c6ae99SBarry Smith 180747c6ae99SBarry Smith /* Find block columns in block row */ 180847c6ae99SBarry Smith cnt = 0; 180947c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 181047c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 181147c6ae99SBarry Smith for (kk=kstart; kk<kend+1; kk++) { 1812aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/ 181347c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj + gnx*gny*kk; 181447c6ae99SBarry Smith } 181547c6ae99SBarry Smith } 181647c6ae99SBarry Smith } 181747c6ae99SBarry Smith } 1818d6e23781SBarry Smith ierr = MatPreallocateSetLocalBlock(ltog,1,&slot,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr); 181947c6ae99SBarry Smith } 182047c6ae99SBarry Smith } 182147c6ae99SBarry Smith } 182247c6ae99SBarry Smith ierr = MatSeqBAIJSetPreallocation(J,nc,0,dnz);CHKERRQ(ierr); 182347c6ae99SBarry Smith ierr = MatMPIBAIJSetPreallocation(J,nc,0,dnz,0,onz);CHKERRQ(ierr); 182447c6ae99SBarry Smith ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 182547c6ae99SBarry Smith 1826784ac674SJed Brown ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 182747c6ae99SBarry Smith 182847c6ae99SBarry Smith /* 182947c6ae99SBarry Smith For each node in the grid: we get the neighbors in the local (on processor ordering 183047c6ae99SBarry Smith that includes the ghost points) then MatSetValuesLocal() maps those indices to the global 183147c6ae99SBarry Smith PETSc ordering. 183247c6ae99SBarry Smith */ 1833fcfd50ebSBarry Smith if (!da->prealloc_only) { 18341795a4d1SJed Brown ierr = PetscCalloc1(col*col*col*nc*nc,&values);CHKERRQ(ierr); 183547c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 1836bff4a2f0SMatthew G. Knepley istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 1837bff4a2f0SMatthew G. 
Knepley iend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 183847c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 1839bff4a2f0SMatthew G. Knepley jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 1840bff4a2f0SMatthew G. Knepley jend = (by == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 184147c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 1842bff4a2f0SMatthew G. Knepley kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k)); 1843bff4a2f0SMatthew G. Knepley kend = (bz == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,p-k-1)); 184447c6ae99SBarry Smith 184547c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 184647c6ae99SBarry Smith 184747c6ae99SBarry Smith cnt = 0; 184847c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 184947c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 185047c6ae99SBarry Smith for (kk=kstart; kk<kend+1; kk++) { 1851aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/ 185247c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj + gnx*gny*kk; 185347c6ae99SBarry Smith } 185447c6ae99SBarry Smith } 185547c6ae99SBarry Smith } 185647c6ae99SBarry Smith } 185747c6ae99SBarry Smith ierr = MatSetValuesBlockedLocal(J,1,&slot,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 185847c6ae99SBarry Smith } 185947c6ae99SBarry Smith } 186047c6ae99SBarry Smith } 186147c6ae99SBarry Smith ierr = PetscFree(values);CHKERRQ(ierr); 186247c6ae99SBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 186347c6ae99SBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1864189e4007SBarry Smith ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr); 186547c6ae99SBarry Smith } 186647c6ae99SBarry Smith ierr = PetscFree(cols);CHKERRQ(ierr); 186747c6ae99SBarry Smith PetscFunctionReturn(0); 186847c6ae99SBarry Smith } 186947c6ae99SBarry Smith 187047c6ae99SBarry Smith /* 187147c6ae99SBarry Smith This helper is for 
of SBAIJ preallocation, to discard the lower-triangular values which are difficult to 187247c6ae99SBarry Smith identify in the local ordering with periodic domain. 187347c6ae99SBarry Smith */ 187447c6ae99SBarry Smith static PetscErrorCode L2GFilterUpperTriangular(ISLocalToGlobalMapping ltog,PetscInt *row,PetscInt *cnt,PetscInt col[]) 187547c6ae99SBarry Smith { 187647c6ae99SBarry Smith PetscErrorCode ierr; 187747c6ae99SBarry Smith PetscInt i,n; 187847c6ae99SBarry Smith 187947c6ae99SBarry Smith PetscFunctionBegin; 1880d6e23781SBarry Smith ierr = ISLocalToGlobalMappingApplyBlock(ltog,1,row,row);CHKERRQ(ierr); 1881d6e23781SBarry Smith ierr = ISLocalToGlobalMappingApplyBlock(ltog,*cnt,col,col);CHKERRQ(ierr); 188247c6ae99SBarry Smith for (i=0,n=0; i<*cnt; i++) { 188347c6ae99SBarry Smith if (col[i] >= *row) col[n++] = col[i]; 188447c6ae99SBarry Smith } 188547c6ae99SBarry Smith *cnt = n; 188647c6ae99SBarry Smith PetscFunctionReturn(0); 188747c6ae99SBarry Smith } 188847c6ae99SBarry Smith 1889950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_2d_MPISBAIJ(DM da,Mat J) 189047c6ae99SBarry Smith { 189147c6ae99SBarry Smith PetscErrorCode ierr; 189247c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny; 189347c6ae99SBarry Smith PetscInt m,n,dim,s,*cols,nc,col,cnt,*dnz,*onz; 189447c6ae99SBarry Smith PetscInt istart,iend,jstart,jend,ii,jj; 189547c6ae99SBarry Smith MPI_Comm comm; 189647c6ae99SBarry Smith PetscScalar *values; 1897bff4a2f0SMatthew G. 
Knepley DMBoundaryType bx,by; 1898aa219208SBarry Smith DMDAStencilType st; 189945b6f7e9SBarry Smith ISLocalToGlobalMapping ltog; 190047c6ae99SBarry Smith 190147c6ae99SBarry Smith PetscFunctionBegin; 190247c6ae99SBarry Smith /* 190347c6ae99SBarry Smith nc - number of components per grid point 190447c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 190547c6ae99SBarry Smith */ 19061321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,0,0,0,0,&nc,&s,&bx,&by,0,&st);CHKERRQ(ierr); 190747c6ae99SBarry Smith col = 2*s + 1; 190847c6ae99SBarry Smith 1909aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr); 1910aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr); 191147c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 191247c6ae99SBarry Smith 1913785e854fSJed Brown ierr = PetscMalloc1(col*col*nc*nc,&cols);CHKERRQ(ierr); 191447c6ae99SBarry Smith 19151411c6eeSJed Brown ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 191647c6ae99SBarry Smith 191747c6ae99SBarry Smith /* determine the matrix preallocation information */ 1918eabe889fSLisandro Dalcin ierr = MatPreallocateInitialize(comm,nx*ny,nx*ny,dnz,onz);CHKERRQ(ierr); 191947c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 1920bff4a2f0SMatthew G. Knepley istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 1921bff4a2f0SMatthew G. Knepley iend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 192247c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 1923bff4a2f0SMatthew G. Knepley jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 1924bff4a2f0SMatthew G. Knepley jend = (by == DM_BOUNDARY_PERIODIC) ? 
s : (PetscMin(s,n-j-1)); 192547c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys); 192647c6ae99SBarry Smith 192747c6ae99SBarry Smith /* Find block columns in block row */ 192847c6ae99SBarry Smith cnt = 0; 192947c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 193047c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 1931aa219208SBarry Smith if (st == DMDA_STENCIL_BOX || !ii || !jj) { 193247c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj; 193347c6ae99SBarry Smith } 193447c6ae99SBarry Smith } 193547c6ae99SBarry Smith } 193645b6f7e9SBarry Smith ierr = L2GFilterUpperTriangular(ltog,&slot,&cnt,cols);CHKERRQ(ierr); 1937d6e23781SBarry Smith ierr = MatPreallocateSymmetricSetBlock(slot,cnt,cols,dnz,onz);CHKERRQ(ierr); 193847c6ae99SBarry Smith } 193947c6ae99SBarry Smith } 194047c6ae99SBarry Smith ierr = MatSeqSBAIJSetPreallocation(J,nc,0,dnz);CHKERRQ(ierr); 194147c6ae99SBarry Smith ierr = MatMPISBAIJSetPreallocation(J,nc,0,dnz,0,onz);CHKERRQ(ierr); 194247c6ae99SBarry Smith ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 194347c6ae99SBarry Smith 1944784ac674SJed Brown ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 194547c6ae99SBarry Smith 194647c6ae99SBarry Smith /* 194747c6ae99SBarry Smith For each node in the grid: we get the neighbors in the local (on processor ordering 194847c6ae99SBarry Smith that includes the ghost points) then MatSetValuesLocal() maps those indices to the global 194947c6ae99SBarry Smith PETSc ordering. 195047c6ae99SBarry Smith */ 1951fcfd50ebSBarry Smith if (!da->prealloc_only) { 19521795a4d1SJed Brown ierr = PetscCalloc1(col*col*nc*nc,&values);CHKERRQ(ierr); 195347c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 1954bff4a2f0SMatthew G. Knepley istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 1955bff4a2f0SMatthew G. Knepley iend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 195647c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 1957bff4a2f0SMatthew G. Knepley jstart = (by == DM_BOUNDARY_PERIODIC) ? 
-s : (PetscMax(-s,-j)); 1958bff4a2f0SMatthew G. Knepley jend = (by == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 195947c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys); 196047c6ae99SBarry Smith 196147c6ae99SBarry Smith /* Find block columns in block row */ 196247c6ae99SBarry Smith cnt = 0; 196347c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 196447c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 1965aa219208SBarry Smith if (st == DMDA_STENCIL_BOX || !ii || !jj) { 196647c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj; 196747c6ae99SBarry Smith } 196847c6ae99SBarry Smith } 196947c6ae99SBarry Smith } 197045b6f7e9SBarry Smith ierr = L2GFilterUpperTriangular(ltog,&slot,&cnt,cols);CHKERRQ(ierr); 197147c6ae99SBarry Smith ierr = MatSetValuesBlocked(J,1,&slot,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 197247c6ae99SBarry Smith } 197347c6ae99SBarry Smith } 197447c6ae99SBarry Smith ierr = PetscFree(values);CHKERRQ(ierr); 197547c6ae99SBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 197647c6ae99SBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1977189e4007SBarry Smith ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr); 197847c6ae99SBarry Smith } 197947c6ae99SBarry Smith ierr = PetscFree(cols);CHKERRQ(ierr); 198047c6ae99SBarry Smith PetscFunctionReturn(0); 198147c6ae99SBarry Smith } 198247c6ae99SBarry Smith 1983950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_3d_MPISBAIJ(DM da,Mat J) 198447c6ae99SBarry Smith { 198547c6ae99SBarry Smith PetscErrorCode ierr; 198647c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny; 198747c6ae99SBarry Smith PetscInt m,n,dim,s,*cols,k,nc,col,cnt,p,*dnz,*onz; 198847c6ae99SBarry Smith PetscInt istart,iend,jstart,jend,kstart,kend,zs,nz,gzs,gnz,ii,jj,kk; 198947c6ae99SBarry Smith MPI_Comm comm; 199047c6ae99SBarry Smith PetscScalar *values; 1991bff4a2f0SMatthew G. 
Knepley DMBoundaryType bx,by,bz; 1992aa219208SBarry Smith DMDAStencilType st; 199345b6f7e9SBarry Smith ISLocalToGlobalMapping ltog; 199447c6ae99SBarry Smith 199547c6ae99SBarry Smith PetscFunctionBegin; 199647c6ae99SBarry Smith /* 199747c6ae99SBarry Smith nc - number of components per grid point 199847c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 199947c6ae99SBarry Smith */ 20001321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,&p,0,0,0,&nc,&s,&bx,&by,&bz,&st);CHKERRQ(ierr); 200147c6ae99SBarry Smith col = 2*s + 1; 200247c6ae99SBarry Smith 2003aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,&zs,&nx,&ny,&nz);CHKERRQ(ierr); 2004aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,&gzs,&gnx,&gny,&gnz);CHKERRQ(ierr); 200547c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 200647c6ae99SBarry Smith 200747c6ae99SBarry Smith /* create the matrix */ 2008785e854fSJed Brown ierr = PetscMalloc1(col*col*col,&cols);CHKERRQ(ierr); 200947c6ae99SBarry Smith 20101411c6eeSJed Brown ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 201147c6ae99SBarry Smith 201247c6ae99SBarry Smith /* determine the matrix preallocation information */ 2013eabe889fSLisandro Dalcin ierr = MatPreallocateInitialize(comm,nx*ny*nz,nx*ny*nz,dnz,onz);CHKERRQ(ierr); 201447c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 2015bff4a2f0SMatthew G. Knepley istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 2016bff4a2f0SMatthew G. Knepley iend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 201747c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 2018bff4a2f0SMatthew G. Knepley jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 2019bff4a2f0SMatthew G. Knepley jend = (by == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 202047c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 2021bff4a2f0SMatthew G. Knepley kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k)); 2022bff4a2f0SMatthew G. 
Knepley kend = (bz == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,p-k-1)); 202347c6ae99SBarry Smith 202447c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 202547c6ae99SBarry Smith 202647c6ae99SBarry Smith /* Find block columns in block row */ 202747c6ae99SBarry Smith cnt = 0; 202847c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 202947c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 203047c6ae99SBarry Smith for (kk=kstart; kk<kend+1; kk++) { 2031aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || (!ii && !jj) || (!jj && !kk) || (!ii && !kk)) { 203247c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj + gnx*gny*kk; 203347c6ae99SBarry Smith } 203447c6ae99SBarry Smith } 203547c6ae99SBarry Smith } 203647c6ae99SBarry Smith } 203745b6f7e9SBarry Smith ierr = L2GFilterUpperTriangular(ltog,&slot,&cnt,cols);CHKERRQ(ierr); 2038d6e23781SBarry Smith ierr = MatPreallocateSymmetricSetBlock(slot,cnt,cols,dnz,onz);CHKERRQ(ierr); 203947c6ae99SBarry Smith } 204047c6ae99SBarry Smith } 204147c6ae99SBarry Smith } 204247c6ae99SBarry Smith ierr = MatSeqSBAIJSetPreallocation(J,nc,0,dnz);CHKERRQ(ierr); 204347c6ae99SBarry Smith ierr = MatMPISBAIJSetPreallocation(J,nc,0,dnz,0,onz);CHKERRQ(ierr); 204447c6ae99SBarry Smith ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 204547c6ae99SBarry Smith 2046784ac674SJed Brown ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 204747c6ae99SBarry Smith 204847c6ae99SBarry Smith /* 204947c6ae99SBarry Smith For each node in the grid: we get the neighbors in the local (on processor ordering 205047c6ae99SBarry Smith that includes the ghost points) then MatSetValuesLocal() maps those indices to the global 205147c6ae99SBarry Smith PETSc ordering. 205247c6ae99SBarry Smith */ 2053fcfd50ebSBarry Smith if (!da->prealloc_only) { 20541795a4d1SJed Brown ierr = PetscCalloc1(col*col*col*nc*nc,&values);CHKERRQ(ierr); 205547c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 2056bff4a2f0SMatthew G. 
Knepley istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 2057bff4a2f0SMatthew G. Knepley iend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 205847c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 2059bff4a2f0SMatthew G. Knepley jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 2060bff4a2f0SMatthew G. Knepley jend = (by == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 206147c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 2062bff4a2f0SMatthew G. Knepley kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k)); 2063bff4a2f0SMatthew G. Knepley kend = (bz == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,p-k-1)); 206447c6ae99SBarry Smith 206547c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 206647c6ae99SBarry Smith 206747c6ae99SBarry Smith cnt = 0; 206847c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 206947c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 207047c6ae99SBarry Smith for (kk=kstart; kk<kend+1; kk++) { 2071aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || (!ii && !jj) || (!jj && !kk) || (!ii && !kk)) { 207247c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj + gnx*gny*kk; 207347c6ae99SBarry Smith } 207447c6ae99SBarry Smith } 207547c6ae99SBarry Smith } 207647c6ae99SBarry Smith } 207745b6f7e9SBarry Smith ierr = L2GFilterUpperTriangular(ltog,&slot,&cnt,cols);CHKERRQ(ierr); 207847c6ae99SBarry Smith ierr = MatSetValuesBlocked(J,1,&slot,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 207947c6ae99SBarry Smith } 208047c6ae99SBarry Smith } 208147c6ae99SBarry Smith } 208247c6ae99SBarry Smith ierr = PetscFree(values);CHKERRQ(ierr); 208347c6ae99SBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 208447c6ae99SBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2085189e4007SBarry Smith ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr); 208647c6ae99SBarry Smith } 208747c6ae99SBarry Smith ierr = PetscFree(cols);CHKERRQ(ierr); 
208847c6ae99SBarry Smith PetscFunctionReturn(0); 208947c6ae99SBarry Smith } 209047c6ae99SBarry Smith 209147c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/ 209247c6ae99SBarry Smith 2093950540a4SJed Brown PetscErrorCode DMCreateMatrix_DA_3d_MPIAIJ_Fill(DM da,Mat J) 209447c6ae99SBarry Smith { 209547c6ae99SBarry Smith PetscErrorCode ierr; 209647c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny; 2097c0ab637bSBarry Smith PetscInt m,n,dim,s,*cols,k,nc,row,col,cnt, maxcnt = 0,l,p,*dnz,*onz; 2098c1154cd5SBarry Smith PetscInt istart,iend,jstart,jend,kstart,kend,zs,nz,gzs,gnz,ii,jj,kk,M,N,P; 209947c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 210047c6ae99SBarry Smith PetscInt ifill_col,*dfill = dd->dfill,*ofill = dd->ofill; 210147c6ae99SBarry Smith MPI_Comm comm; 210247c6ae99SBarry Smith PetscScalar *values; 2103bff4a2f0SMatthew G. Knepley DMBoundaryType bx,by,bz; 210445b6f7e9SBarry Smith ISLocalToGlobalMapping ltog; 2105aa219208SBarry Smith DMDAStencilType st; 2106c1154cd5SBarry Smith PetscBool removedups = PETSC_FALSE; 210747c6ae99SBarry Smith 210847c6ae99SBarry Smith PetscFunctionBegin; 210947c6ae99SBarry Smith /* 211047c6ae99SBarry Smith nc - number of components per grid point 211147c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 211247c6ae99SBarry Smith 211347c6ae99SBarry Smith */ 2114c1154cd5SBarry Smith ierr = DMDAGetInfo(da,&dim,&m,&n,&p,&M,&N,&P,&nc,&s,&bx,&by,&bz,&st);CHKERRQ(ierr); 211547c6ae99SBarry Smith col = 2*s + 1; 2116bff4a2f0SMatthew G. Knepley if (bx == DM_BOUNDARY_PERIODIC && (m % col)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in X is divisible\n\ 211747c6ae99SBarry Smith by 2*stencil_width + 1\n"); 2118bff4a2f0SMatthew G. 
Knepley if (by == DM_BOUNDARY_PERIODIC && (n % col)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Y is divisible\n\ 211947c6ae99SBarry Smith by 2*stencil_width + 1\n"); 2120bff4a2f0SMatthew G. Knepley if (bz == DM_BOUNDARY_PERIODIC && (p % col)) SETERRQ(PetscObjectComm((PetscObject)da),PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Z is divisible\n\ 212147c6ae99SBarry Smith by 2*stencil_width + 1\n"); 212247c6ae99SBarry Smith 2123c1154cd5SBarry Smith /* 2124c1154cd5SBarry Smith With one processor in periodic domains in a skinny dimension the code will label nonzero columns multiple times 2125c1154cd5SBarry Smith because of "wrapping" around the end of the domain hitting an entry already counted in the other direction. 2126c1154cd5SBarry Smith */ 2127c1154cd5SBarry Smith if (M == 1 && 2*s >= m) removedups = PETSC_TRUE; 2128c1154cd5SBarry Smith if (N == 1 && 2*s >= n) removedups = PETSC_TRUE; 2129c1154cd5SBarry Smith if (P == 1 && 2*s >= p) removedups = PETSC_TRUE; 2130c1154cd5SBarry Smith 2131aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,&zs,&nx,&ny,&nz);CHKERRQ(ierr); 2132aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,&gzs,&gnx,&gny,&gnz);CHKERRQ(ierr); 213347c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 213447c6ae99SBarry Smith 2135785e854fSJed Brown ierr = PetscMalloc1(col*col*col*nc,&cols);CHKERRQ(ierr); 21361411c6eeSJed Brown ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 213747c6ae99SBarry Smith 213847c6ae99SBarry Smith /* determine the matrix preallocation information */ 213947c6ae99SBarry Smith ierr = MatPreallocateInitialize(comm,nc*nx*ny*nz,nc*nx*ny*nz,dnz,onz);CHKERRQ(ierr); 214047c6ae99SBarry Smith 214106ca8cadSBarry Smith ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr); 214247c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 2143bff4a2f0SMatthew G. Knepley istart = (bx == DM_BOUNDARY_PERIODIC) ? 
-s : (PetscMax(-s,-i)); 2144bff4a2f0SMatthew G. Knepley iend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 214547c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 2146bff4a2f0SMatthew G. Knepley jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 2147bff4a2f0SMatthew G. Knepley jend = (by == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 214847c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 2149bff4a2f0SMatthew G. Knepley kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k)); 2150bff4a2f0SMatthew G. Knepley kend = (bz == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,p-k-1)); 215147c6ae99SBarry Smith 215247c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 215347c6ae99SBarry Smith 215447c6ae99SBarry Smith for (l=0; l<nc; l++) { 215547c6ae99SBarry Smith cnt = 0; 215647c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 215747c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 215847c6ae99SBarry Smith for (kk=kstart; kk<kend+1; kk++) { 215947c6ae99SBarry Smith if (ii || jj || kk) { 2160aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/ 21618865f1eaSKarl Rupp for (ifill_col=ofill[l]; ifill_col<ofill[l+1]; ifill_col++) cols[cnt++] = ofill[ifill_col] + nc*(slot + ii + gnx*jj + gnx*gny*kk); 216247c6ae99SBarry Smith } 216347c6ae99SBarry Smith } else { 216447c6ae99SBarry Smith if (dfill) { 21658865f1eaSKarl Rupp for (ifill_col=dfill[l]; ifill_col<dfill[l+1]; ifill_col++) cols[cnt++] = dfill[ifill_col] + nc*(slot + ii + gnx*jj + gnx*gny*kk); 216647c6ae99SBarry Smith } else { 21678865f1eaSKarl Rupp for (ifill_col=0; ifill_col<nc; ifill_col++) cols[cnt++] = ifill_col + nc*(slot + ii + gnx*jj + gnx*gny*kk); 216847c6ae99SBarry Smith } 216947c6ae99SBarry Smith } 217047c6ae99SBarry Smith } 217147c6ae99SBarry Smith } 217247c6ae99SBarry Smith } 217347c6ae99SBarry Smith row = l + nc*(slot); 2174c0ab637bSBarry Smith maxcnt = PetscMax(maxcnt,cnt); 2175c1154cd5SBarry 
Smith if (removedups) { 2176c1154cd5SBarry Smith ierr = MatPreallocateSetLocalRemoveDups(ltog,1,&row,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr); 2177c1154cd5SBarry Smith } else { 2178784ac674SJed Brown ierr = MatPreallocateSetLocal(ltog,1,&row,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr); 217947c6ae99SBarry Smith } 218047c6ae99SBarry Smith } 218147c6ae99SBarry Smith } 218247c6ae99SBarry Smith } 2183c1154cd5SBarry Smith } 218447c6ae99SBarry Smith ierr = MatSeqAIJSetPreallocation(J,0,dnz);CHKERRQ(ierr); 218547c6ae99SBarry Smith ierr = MatMPIAIJSetPreallocation(J,0,dnz,0,onz);CHKERRQ(ierr); 218647c6ae99SBarry Smith ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 2187784ac674SJed Brown ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 218847c6ae99SBarry Smith 218947c6ae99SBarry Smith /* 219047c6ae99SBarry Smith For each node in the grid: we get the neighbors in the local (on processor ordering 219147c6ae99SBarry Smith that includes the ghost points) then MatSetValuesLocal() maps those indices to the global 219247c6ae99SBarry Smith PETSc ordering. 219347c6ae99SBarry Smith */ 2194fcfd50ebSBarry Smith if (!da->prealloc_only) { 2195c0ab637bSBarry Smith ierr = PetscCalloc1(maxcnt,&values);CHKERRQ(ierr); 219647c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 2197bff4a2f0SMatthew G. Knepley istart = (bx == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 2198bff4a2f0SMatthew G. Knepley iend = (bx == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 219947c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 2200bff4a2f0SMatthew G. Knepley jstart = (by == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 2201bff4a2f0SMatthew G. Knepley jend = (by == DM_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 220247c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 2203bff4a2f0SMatthew G. Knepley kstart = (bz == DM_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k)); 2204bff4a2f0SMatthew G. Knepley kend = (bz == DM_BOUNDARY_PERIODIC) ? 
s : (PetscMin(s,p-k-1)); 220547c6ae99SBarry Smith 220647c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 220747c6ae99SBarry Smith 220847c6ae99SBarry Smith for (l=0; l<nc; l++) { 220947c6ae99SBarry Smith cnt = 0; 221047c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 221147c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 221247c6ae99SBarry Smith for (kk=kstart; kk<kend+1; kk++) { 221347c6ae99SBarry Smith if (ii || jj || kk) { 2214aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/ 22158865f1eaSKarl Rupp for (ifill_col=ofill[l]; ifill_col<ofill[l+1]; ifill_col++) cols[cnt++] = ofill[ifill_col] + nc*(slot + ii + gnx*jj + gnx*gny*kk); 221647c6ae99SBarry Smith } 221747c6ae99SBarry Smith } else { 221847c6ae99SBarry Smith if (dfill) { 22198865f1eaSKarl Rupp for (ifill_col=dfill[l]; ifill_col<dfill[l+1]; ifill_col++) cols[cnt++] = dfill[ifill_col] + nc*(slot + ii + gnx*jj + gnx*gny*kk); 222047c6ae99SBarry Smith } else { 22218865f1eaSKarl Rupp for (ifill_col=0; ifill_col<nc; ifill_col++) cols[cnt++] = ifill_col + nc*(slot + ii + gnx*jj + gnx*gny*kk); 222247c6ae99SBarry Smith } 222347c6ae99SBarry Smith } 222447c6ae99SBarry Smith } 222547c6ae99SBarry Smith } 222647c6ae99SBarry Smith } 222747c6ae99SBarry Smith row = l + nc*(slot); 222847c6ae99SBarry Smith ierr = MatSetValuesLocal(J,1,&row,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 222947c6ae99SBarry Smith } 223047c6ae99SBarry Smith } 223147c6ae99SBarry Smith } 223247c6ae99SBarry Smith } 223347c6ae99SBarry Smith ierr = PetscFree(values);CHKERRQ(ierr); 223447c6ae99SBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 223547c6ae99SBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2236189e4007SBarry Smith ierr = MatSetOption(J,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_TRUE);CHKERRQ(ierr); 223747c6ae99SBarry Smith } 223847c6ae99SBarry Smith ierr = PetscFree(cols);CHKERRQ(ierr); 
223947c6ae99SBarry Smith PetscFunctionReturn(0); 224047c6ae99SBarry Smith } 2241