147c6ae99SBarry Smith 2c6db04a5SJed Brown #include <private/daimpl.h> /*I "petscdmda.h" I*/ 3c6db04a5SJed Brown #include <petscmat.h> /*I "petscmat.h" I*/ 4c6db04a5SJed Brown #include <private/matimpl.h> 547c6ae99SBarry Smith 609573ac7SBarry Smith extern PetscErrorCode DMGetColoring_DA_1d_MPIAIJ(DM,ISColoringType,ISColoring *); 709573ac7SBarry Smith extern PetscErrorCode DMGetColoring_DA_2d_MPIAIJ(DM,ISColoringType,ISColoring *); 809573ac7SBarry Smith extern PetscErrorCode DMGetColoring_DA_2d_5pt_MPIAIJ(DM,ISColoringType,ISColoring *); 909573ac7SBarry Smith extern PetscErrorCode DMGetColoring_DA_3d_MPIAIJ(DM,ISColoringType,ISColoring *); 1047c6ae99SBarry Smith 1147c6ae99SBarry Smith /* 1247c6ae99SBarry Smith For ghost i that may be negative or greater than the upper bound this 1347c6ae99SBarry Smith maps it into the 0:m-1 range using periodicity 1447c6ae99SBarry Smith */ 1547c6ae99SBarry Smith #define SetInRange(i,m) ((i < 0) ? m+i:((i >= m) ? i-m:i)) 1647c6ae99SBarry Smith 1747c6ae99SBarry Smith #undef __FUNCT__ 18aa219208SBarry Smith #define __FUNCT__ "DMDASetBlockFills_Private" 19aa219208SBarry Smith static PetscErrorCode DMDASetBlockFills_Private(PetscInt *dfill,PetscInt w,PetscInt **rfill) 2047c6ae99SBarry Smith { 2147c6ae99SBarry Smith PetscErrorCode ierr; 2247c6ae99SBarry Smith PetscInt i,j,nz,*fill; 2347c6ae99SBarry Smith 2447c6ae99SBarry Smith PetscFunctionBegin; 2547c6ae99SBarry Smith if (!dfill) PetscFunctionReturn(0); 2647c6ae99SBarry Smith 2747c6ae99SBarry Smith /* count number nonzeros */ 2847c6ae99SBarry Smith nz = 0; 2947c6ae99SBarry Smith for (i=0; i<w; i++) { 3047c6ae99SBarry Smith for (j=0; j<w; j++) { 3147c6ae99SBarry Smith if (dfill[w*i+j]) nz++; 3247c6ae99SBarry Smith } 3347c6ae99SBarry Smith } 3447c6ae99SBarry Smith ierr = PetscMalloc((nz + w + 1)*sizeof(PetscInt),&fill);CHKERRQ(ierr); 3547c6ae99SBarry Smith /* construct modified CSR storage of nonzero structure */ 3647c6ae99SBarry Smith nz = w + 1; 3747c6ae99SBarry Smith for (i=0; i<w; i++) 
{ 3847c6ae99SBarry Smith fill[i] = nz; 3947c6ae99SBarry Smith for (j=0; j<w; j++) { 4047c6ae99SBarry Smith if (dfill[w*i+j]) { 4147c6ae99SBarry Smith fill[nz] = j; 4247c6ae99SBarry Smith nz++; 4347c6ae99SBarry Smith } 4447c6ae99SBarry Smith } 4547c6ae99SBarry Smith } 4647c6ae99SBarry Smith fill[w] = nz; 4747c6ae99SBarry Smith 4847c6ae99SBarry Smith *rfill = fill; 4947c6ae99SBarry Smith PetscFunctionReturn(0); 5047c6ae99SBarry Smith } 5147c6ae99SBarry Smith 5247c6ae99SBarry Smith #undef __FUNCT__ 53aa219208SBarry Smith #define __FUNCT__ "DMDASetBlockFills" 5447c6ae99SBarry Smith /*@ 55aa219208SBarry Smith DMDASetBlockFills - Sets the fill pattern in each block for a multi-component problem 5694013140SBarry Smith of the matrix returned by DMGetMatrix(). 5747c6ae99SBarry Smith 58aa219208SBarry Smith Logically Collective on DMDA 5947c6ae99SBarry Smith 6047c6ae99SBarry Smith Input Parameter: 6147c6ae99SBarry Smith + da - the distributed array 6247c6ae99SBarry Smith . dfill - the fill pattern in the diagonal block (may be PETSC_NULL, means use dense block) 6347c6ae99SBarry Smith - ofill - the fill pattern in the off-diagonal blocks 6447c6ae99SBarry Smith 6547c6ae99SBarry Smith 6647c6ae99SBarry Smith Level: developer 6747c6ae99SBarry Smith 6847c6ae99SBarry Smith Notes: This only makes sense when you are doing multicomponent problems but using the 6947c6ae99SBarry Smith MPIAIJ matrix format 7047c6ae99SBarry Smith 7147c6ae99SBarry Smith The format for dfill and ofill is a 2 dimensional dof by dof matrix with 1 entries 7247c6ae99SBarry Smith representing coupling and 0 entries for missing coupling. 
For example 7347c6ae99SBarry Smith $ dfill[9] = {1, 0, 0, 7447c6ae99SBarry Smith $ 1, 1, 0, 7547c6ae99SBarry Smith $ 0, 1, 1} 7647c6ae99SBarry Smith means that row 0 is coupled with only itself in the diagonal block, row 1 is coupled with 7747c6ae99SBarry Smith itself and row 0 (in the diagonal block) and row 2 is coupled with itself and row 1 (in the 7847c6ae99SBarry Smith diagonal block). 7947c6ae99SBarry Smith 80aa219208SBarry Smith DMDASetGetMatrix() allows you to provide general code for those more complicated nonzero patterns then 8147c6ae99SBarry Smith can be represented in the dfill, ofill format 8247c6ae99SBarry Smith 8347c6ae99SBarry Smith Contributed by Glenn Hammond 8447c6ae99SBarry Smith 85aa219208SBarry Smith .seealso DMGetMatrix(), DMDASetGetMatrix(), DMDASetMatPreallocateOnly() 8647c6ae99SBarry Smith 8747c6ae99SBarry Smith @*/ 887087cfbeSBarry Smith PetscErrorCode DMDASetBlockFills(DM da,PetscInt *dfill,PetscInt *ofill) 8947c6ae99SBarry Smith { 9047c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 9147c6ae99SBarry Smith PetscErrorCode ierr; 9247c6ae99SBarry Smith 9347c6ae99SBarry Smith PetscFunctionBegin; 94aa219208SBarry Smith ierr = DMDASetBlockFills_Private(dfill,dd->w,&dd->dfill);CHKERRQ(ierr); 95aa219208SBarry Smith ierr = DMDASetBlockFills_Private(ofill,dd->w,&dd->ofill);CHKERRQ(ierr); 9647c6ae99SBarry Smith PetscFunctionReturn(0); 9747c6ae99SBarry Smith } 9847c6ae99SBarry Smith 9947c6ae99SBarry Smith 10047c6ae99SBarry Smith #undef __FUNCT__ 10194013140SBarry Smith #define __FUNCT__ "DMGetColoring_DA" 1027087cfbeSBarry Smith PetscErrorCode DMGetColoring_DA(DM da,ISColoringType ctype,const MatType mtype,ISColoring *coloring) 10347c6ae99SBarry Smith { 10447c6ae99SBarry Smith PetscErrorCode ierr; 10547c6ae99SBarry Smith PetscInt dim,m,n,p,nc; 1061321219cSEthan Coon DMDABoundaryType bx,by,bz; 10747c6ae99SBarry Smith MPI_Comm comm; 10847c6ae99SBarry Smith PetscMPIInt size; 10947c6ae99SBarry Smith PetscBool isBAIJ; 11047c6ae99SBarry Smith DM_DA *dd = 
(DM_DA*)da->data; 11147c6ae99SBarry Smith 11247c6ae99SBarry Smith PetscFunctionBegin; 11347c6ae99SBarry Smith /* 11447c6ae99SBarry Smith m 11547c6ae99SBarry Smith ------------------------------------------------------ 11647c6ae99SBarry Smith | | 11747c6ae99SBarry Smith | | 11847c6ae99SBarry Smith | ---------------------- | 11947c6ae99SBarry Smith | | | | 12047c6ae99SBarry Smith n | yn | | | 12147c6ae99SBarry Smith | | | | 12247c6ae99SBarry Smith | .--------------------- | 12347c6ae99SBarry Smith | (xs,ys) xn | 12447c6ae99SBarry Smith | . | 12547c6ae99SBarry Smith | (gxs,gys) | 12647c6ae99SBarry Smith | | 12747c6ae99SBarry Smith ----------------------------------------------------- 12847c6ae99SBarry Smith */ 12947c6ae99SBarry Smith 13047c6ae99SBarry Smith /* 13147c6ae99SBarry Smith nc - number of components per grid point 13247c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 13347c6ae99SBarry Smith 13447c6ae99SBarry Smith */ 1351321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,0,0,0,&m,&n,&p,&nc,0,&bx,&by,&bz,0);CHKERRQ(ierr); 13647c6ae99SBarry Smith 13747c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 13847c6ae99SBarry Smith ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 13947c6ae99SBarry Smith if (ctype == IS_COLORING_GHOSTED){ 14047c6ae99SBarry Smith if (size == 1) { 14147c6ae99SBarry Smith ctype = IS_COLORING_GLOBAL; 14247c6ae99SBarry Smith } else if (dim > 1){ 1431321219cSEthan Coon if ((m==1 && bx == DMDA_BOUNDARY_PERIODIC) || (n==1 && by == DMDA_BOUNDARY_PERIODIC) || (p==1 && bz == DMDA_BOUNDARY_PERIODIC)){ 14447c6ae99SBarry Smith SETERRQ(((PetscObject)da)->comm,PETSC_ERR_SUP,"IS_COLORING_GHOSTED cannot be used for periodic boundary condition having both ends of the domain on the same process"); 14547c6ae99SBarry Smith } 14647c6ae99SBarry Smith } 14747c6ae99SBarry Smith } 14847c6ae99SBarry Smith 149aa219208SBarry Smith /* Tell the DMDA it has 1 degree of freedom per grid point so 
that the coloring for BAIJ 15047c6ae99SBarry Smith matrices is for the blocks, not the individual matrix elements */ 151*4833614aSSatish Balay ierr = PetscStrcmp(mtype,MATBAIJ,&isBAIJ);CHKERRQ(ierr); 152*4833614aSSatish Balay if (!isBAIJ) {ierr = PetscStrcmp(mtype,MATMPIBAIJ,&isBAIJ);CHKERRQ(ierr);} 15347c6ae99SBarry Smith if (!isBAIJ) {ierr = PetscStrcmp(mtype,MATSEQBAIJ,&isBAIJ);CHKERRQ(ierr);} 15447c6ae99SBarry Smith if (isBAIJ) { 15547c6ae99SBarry Smith dd->w = 1; 15647c6ae99SBarry Smith dd->xs = dd->xs/nc; 15747c6ae99SBarry Smith dd->xe = dd->xe/nc; 15847c6ae99SBarry Smith dd->Xs = dd->Xs/nc; 15947c6ae99SBarry Smith dd->Xe = dd->Xe/nc; 16047c6ae99SBarry Smith } 16147c6ae99SBarry Smith 16247c6ae99SBarry Smith /* 163aa219208SBarry Smith We do not provide a getcoloring function in the DMDA operations because 164aa219208SBarry Smith the basic DMDA does not know about matrices. We think of DMDA as being more 16547c6ae99SBarry Smith more low-level then matrices. 16647c6ae99SBarry Smith */ 16747c6ae99SBarry Smith if (dim == 1) { 16894013140SBarry Smith ierr = DMGetColoring_DA_1d_MPIAIJ(da,ctype,coloring);CHKERRQ(ierr); 16947c6ae99SBarry Smith } else if (dim == 2) { 17094013140SBarry Smith ierr = DMGetColoring_DA_2d_MPIAIJ(da,ctype,coloring);CHKERRQ(ierr); 17147c6ae99SBarry Smith } else if (dim == 3) { 17294013140SBarry Smith ierr = DMGetColoring_DA_3d_MPIAIJ(da,ctype,coloring);CHKERRQ(ierr); 17371cd77b2SBarry Smith } else SETERRQ1(((PetscObject)da)->comm,PETSC_ERR_SUP,"Not done for %D dimension, send us mail petsc-maint@mcs.anl.gov for code",dim); 17447c6ae99SBarry Smith if (isBAIJ) { 17547c6ae99SBarry Smith dd->w = nc; 17647c6ae99SBarry Smith dd->xs = dd->xs*nc; 17747c6ae99SBarry Smith dd->xe = dd->xe*nc; 17847c6ae99SBarry Smith dd->Xs = dd->Xs*nc; 17947c6ae99SBarry Smith dd->Xe = dd->Xe*nc; 18047c6ae99SBarry Smith } 18147c6ae99SBarry Smith PetscFunctionReturn(0); 18247c6ae99SBarry Smith } 18347c6ae99SBarry Smith 18447c6ae99SBarry Smith /* 
---------------------------------------------------------------------------------*/ 18547c6ae99SBarry Smith 18647c6ae99SBarry Smith #undef __FUNCT__ 18794013140SBarry Smith #define __FUNCT__ "DMGetColoring_DA_2d_MPIAIJ" 18894013140SBarry Smith PetscErrorCode DMGetColoring_DA_2d_MPIAIJ(DM da,ISColoringType ctype,ISColoring *coloring) 18947c6ae99SBarry Smith { 19047c6ae99SBarry Smith PetscErrorCode ierr; 19147c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,ii,gxs,gys,gnx,gny,m,n,M,N,dim,s,k,nc,col; 19247c6ae99SBarry Smith PetscInt ncolors; 19347c6ae99SBarry Smith MPI_Comm comm; 1941321219cSEthan Coon DMDABoundaryType bx,by; 195aa219208SBarry Smith DMDAStencilType st; 19647c6ae99SBarry Smith ISColoringValue *colors; 19747c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 19847c6ae99SBarry Smith 19947c6ae99SBarry Smith PetscFunctionBegin; 20047c6ae99SBarry Smith /* 20147c6ae99SBarry Smith nc - number of components per grid point 20247c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 20347c6ae99SBarry Smith 20447c6ae99SBarry Smith */ 2051321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,0,&M,&N,0,&nc,&s,&bx,&by,0,&st);CHKERRQ(ierr); 20647c6ae99SBarry Smith col = 2*s + 1; 207aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr); 208aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr); 20947c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 21047c6ae99SBarry Smith 21147c6ae99SBarry Smith /* special case as taught to us by Paul Hovland */ 212aa219208SBarry Smith if (st == DMDA_STENCIL_STAR && s == 1) { 21394013140SBarry Smith ierr = DMGetColoring_DA_2d_5pt_MPIAIJ(da,ctype,coloring);CHKERRQ(ierr); 21447c6ae99SBarry Smith } else { 21547c6ae99SBarry Smith 2161321219cSEthan Coon if (bx == DMDA_BOUNDARY_PERIODIC && (m % col)){ 21747c6ae99SBarry Smith SETERRQ2(((PetscObject)da)->comm,PETSC_ERR_SUP,"For coloring efficiency ensure number of grid 
points in X (%d) is divisible\n\ 21847c6ae99SBarry Smith by 2*stencil_width + 1 (%d)\n", m, col); 21947c6ae99SBarry Smith } 2201321219cSEthan Coon if (by == DMDA_BOUNDARY_PERIODIC && (n % col)){ 22147c6ae99SBarry Smith SETERRQ2(((PetscObject)da)->comm,PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Y (%d) is divisible\n\ 22247c6ae99SBarry Smith by 2*stencil_width + 1 (%d)\n", n, col); 22347c6ae99SBarry Smith } 22447c6ae99SBarry Smith if (ctype == IS_COLORING_GLOBAL) { 22547c6ae99SBarry Smith if (!dd->localcoloring) { 22647c6ae99SBarry Smith ierr = PetscMalloc(nc*nx*ny*sizeof(ISColoringValue),&colors);CHKERRQ(ierr); 22747c6ae99SBarry Smith ii = 0; 22847c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 22947c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 23047c6ae99SBarry Smith for (k=0; k<nc; k++) { 23147c6ae99SBarry Smith colors[ii++] = k + nc*((i % col) + col*(j % col)); 23247c6ae99SBarry Smith } 23347c6ae99SBarry Smith } 23447c6ae99SBarry Smith } 23547c6ae99SBarry Smith ncolors = nc + nc*(col-1 + col*(col-1)); 23647c6ae99SBarry Smith ierr = ISColoringCreate(comm,ncolors,nc*nx*ny,colors,&dd->localcoloring);CHKERRQ(ierr); 23747c6ae99SBarry Smith } 23847c6ae99SBarry Smith *coloring = dd->localcoloring; 23947c6ae99SBarry Smith } else if (ctype == IS_COLORING_GHOSTED) { 24047c6ae99SBarry Smith if (!dd->ghostedcoloring) { 24147c6ae99SBarry Smith ierr = PetscMalloc(nc*gnx*gny*sizeof(ISColoringValue),&colors);CHKERRQ(ierr); 24247c6ae99SBarry Smith ii = 0; 24347c6ae99SBarry Smith for (j=gys; j<gys+gny; j++) { 24447c6ae99SBarry Smith for (i=gxs; i<gxs+gnx; i++) { 24547c6ae99SBarry Smith for (k=0; k<nc; k++) { 24647c6ae99SBarry Smith /* the complicated stuff is to handle periodic boundaries */ 24747c6ae99SBarry Smith colors[ii++] = k + nc*((SetInRange(i,m) % col) + col*(SetInRange(j,n) % col)); 24847c6ae99SBarry Smith } 24947c6ae99SBarry Smith } 25047c6ae99SBarry Smith } 25147c6ae99SBarry Smith ncolors = nc + nc*(col - 1 + col*(col-1)); 25247c6ae99SBarry 
Smith ierr = ISColoringCreate(comm,ncolors,nc*gnx*gny,colors,&dd->ghostedcoloring);CHKERRQ(ierr); 25347c6ae99SBarry Smith /* PetscIntView(ncolors,(PetscInt *)colors,0); */ 25447c6ae99SBarry Smith 25547c6ae99SBarry Smith ierr = ISColoringSetType(dd->ghostedcoloring,IS_COLORING_GHOSTED);CHKERRQ(ierr); 25647c6ae99SBarry Smith } 25747c6ae99SBarry Smith *coloring = dd->ghostedcoloring; 25847c6ae99SBarry Smith } else SETERRQ1(((PetscObject)da)->comm,PETSC_ERR_ARG_WRONG,"Unknown ISColoringType %d",(int)ctype); 25947c6ae99SBarry Smith } 26047c6ae99SBarry Smith ierr = ISColoringReference(*coloring);CHKERRQ(ierr); 26147c6ae99SBarry Smith PetscFunctionReturn(0); 26247c6ae99SBarry Smith } 26347c6ae99SBarry Smith 26447c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/ 26547c6ae99SBarry Smith 26647c6ae99SBarry Smith #undef __FUNCT__ 26794013140SBarry Smith #define __FUNCT__ "DMGetColoring_DA_3d_MPIAIJ" 26894013140SBarry Smith PetscErrorCode DMGetColoring_DA_3d_MPIAIJ(DM da,ISColoringType ctype,ISColoring *coloring) 26947c6ae99SBarry Smith { 27047c6ae99SBarry Smith PetscErrorCode ierr; 27147c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,gxs,gys,gnx,gny,m,n,p,dim,s,k,nc,col,zs,gzs,ii,l,nz,gnz,M,N,P; 27247c6ae99SBarry Smith PetscInt ncolors; 27347c6ae99SBarry Smith MPI_Comm comm; 2741321219cSEthan Coon DMDABoundaryType bx,by,bz; 275aa219208SBarry Smith DMDAStencilType st; 27647c6ae99SBarry Smith ISColoringValue *colors; 27747c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 27847c6ae99SBarry Smith 27947c6ae99SBarry Smith PetscFunctionBegin; 28047c6ae99SBarry Smith /* 28147c6ae99SBarry Smith nc - number of components per grid point 28247c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 28347c6ae99SBarry Smith 28447c6ae99SBarry Smith */ 2851321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,&p,&M,&N,&P,&nc,&s,&bx,&by,&bz,&st);CHKERRQ(ierr); 28647c6ae99SBarry Smith col = 2*s + 1; 
2871321219cSEthan Coon if (bx == DMDA_BOUNDARY_PERIODIC && (m % col)){ 28847c6ae99SBarry Smith SETERRQ(((PetscObject)da)->comm,PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in X is divisible\n\ 28947c6ae99SBarry Smith by 2*stencil_width + 1\n"); 29047c6ae99SBarry Smith } 2911321219cSEthan Coon if (by == DMDA_BOUNDARY_PERIODIC && (n % col)){ 29247c6ae99SBarry Smith SETERRQ(((PetscObject)da)->comm,PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Y is divisible\n\ 29347c6ae99SBarry Smith by 2*stencil_width + 1\n"); 29447c6ae99SBarry Smith } 2951321219cSEthan Coon if (bz == DMDA_BOUNDARY_PERIODIC && (p % col)){ 29647c6ae99SBarry Smith SETERRQ(((PetscObject)da)->comm,PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Z is divisible\n\ 29747c6ae99SBarry Smith by 2*stencil_width + 1\n"); 29847c6ae99SBarry Smith } 29947c6ae99SBarry Smith 300aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,&zs,&nx,&ny,&nz);CHKERRQ(ierr); 301aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,&gzs,&gnx,&gny,&gnz);CHKERRQ(ierr); 30247c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 30347c6ae99SBarry Smith 30447c6ae99SBarry Smith /* create the coloring */ 30547c6ae99SBarry Smith if (ctype == IS_COLORING_GLOBAL) { 30647c6ae99SBarry Smith if (!dd->localcoloring) { 30747c6ae99SBarry Smith ierr = PetscMalloc(nc*nx*ny*nz*sizeof(ISColoringValue),&colors);CHKERRQ(ierr); 30847c6ae99SBarry Smith ii = 0; 30947c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 31047c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 31147c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 31247c6ae99SBarry Smith for (l=0; l<nc; l++) { 31347c6ae99SBarry Smith colors[ii++] = l + nc*((i % col) + col*(j % col) + col*col*(k % col)); 31447c6ae99SBarry Smith } 31547c6ae99SBarry Smith } 31647c6ae99SBarry Smith } 31747c6ae99SBarry Smith } 31847c6ae99SBarry Smith ncolors = nc + nc*(col-1 + col*(col-1)+ col*col*(col-1)); 31947c6ae99SBarry 
Smith ierr = ISColoringCreate(comm,ncolors,nc*nx*ny*nz,colors,&dd->localcoloring);CHKERRQ(ierr); 32047c6ae99SBarry Smith } 32147c6ae99SBarry Smith *coloring = dd->localcoloring; 32247c6ae99SBarry Smith } else if (ctype == IS_COLORING_GHOSTED) { 32347c6ae99SBarry Smith if (!dd->ghostedcoloring) { 32447c6ae99SBarry Smith ierr = PetscMalloc(nc*gnx*gny*gnz*sizeof(ISColoringValue),&colors);CHKERRQ(ierr); 32547c6ae99SBarry Smith ii = 0; 32647c6ae99SBarry Smith for (k=gzs; k<gzs+gnz; k++) { 32747c6ae99SBarry Smith for (j=gys; j<gys+gny; j++) { 32847c6ae99SBarry Smith for (i=gxs; i<gxs+gnx; i++) { 32947c6ae99SBarry Smith for (l=0; l<nc; l++) { 33047c6ae99SBarry Smith /* the complicated stuff is to handle periodic boundaries */ 33147c6ae99SBarry Smith colors[ii++] = l + nc*((SetInRange(i,m) % col) + col*(SetInRange(j,n) % col) + col*col*(SetInRange(k,p) % col)); 33247c6ae99SBarry Smith } 33347c6ae99SBarry Smith } 33447c6ae99SBarry Smith } 33547c6ae99SBarry Smith } 33647c6ae99SBarry Smith ncolors = nc + nc*(col-1 + col*(col-1)+ col*col*(col-1)); 33747c6ae99SBarry Smith ierr = ISColoringCreate(comm,ncolors,nc*gnx*gny*gnz,colors,&dd->ghostedcoloring);CHKERRQ(ierr); 33847c6ae99SBarry Smith ierr = ISColoringSetType(dd->ghostedcoloring,IS_COLORING_GHOSTED);CHKERRQ(ierr); 33947c6ae99SBarry Smith } 34047c6ae99SBarry Smith *coloring = dd->ghostedcoloring; 34147c6ae99SBarry Smith } else SETERRQ1(((PetscObject)da)->comm,PETSC_ERR_ARG_WRONG,"Unknown ISColoringType %d",(int)ctype); 34247c6ae99SBarry Smith ierr = ISColoringReference(*coloring);CHKERRQ(ierr); 34347c6ae99SBarry Smith PetscFunctionReturn(0); 34447c6ae99SBarry Smith } 34547c6ae99SBarry Smith 34647c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/ 34747c6ae99SBarry Smith 34847c6ae99SBarry Smith #undef __FUNCT__ 34994013140SBarry Smith #define __FUNCT__ "DMGetColoring_DA_1d_MPIAIJ" 35094013140SBarry Smith PetscErrorCode DMGetColoring_DA_1d_MPIAIJ(DM da,ISColoringType 
ctype,ISColoring *coloring) 35147c6ae99SBarry Smith { 35247c6ae99SBarry Smith PetscErrorCode ierr; 35347c6ae99SBarry Smith PetscInt xs,nx,i,i1,gxs,gnx,l,m,M,dim,s,nc,col; 35447c6ae99SBarry Smith PetscInt ncolors; 35547c6ae99SBarry Smith MPI_Comm comm; 3561321219cSEthan Coon DMDABoundaryType bx; 35747c6ae99SBarry Smith ISColoringValue *colors; 35847c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 35947c6ae99SBarry Smith 36047c6ae99SBarry Smith PetscFunctionBegin; 36147c6ae99SBarry Smith /* 36247c6ae99SBarry Smith nc - number of components per grid point 36347c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 36447c6ae99SBarry Smith 36547c6ae99SBarry Smith */ 3661321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,0,0,&M,0,0,&nc,&s,&bx,0,0,0);CHKERRQ(ierr); 36747c6ae99SBarry Smith col = 2*s + 1; 36847c6ae99SBarry Smith 3691321219cSEthan Coon if (bx == DMDA_BOUNDARY_PERIODIC && (m % col)) { 37031e6f798SBarry Smith SETERRQ2(((PetscObject)da)->comm,PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points %d is divisible\n\ 37131e6f798SBarry Smith by 2*stencil_width + 1 %d\n",(int)m,(int)col); 37247c6ae99SBarry Smith } 37347c6ae99SBarry Smith 374aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,0,0,&nx,0,0);CHKERRQ(ierr); 375aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,0,0,&gnx,0,0);CHKERRQ(ierr); 37647c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 37747c6ae99SBarry Smith 37847c6ae99SBarry Smith /* create the coloring */ 37947c6ae99SBarry Smith if (ctype == IS_COLORING_GLOBAL) { 38047c6ae99SBarry Smith if (!dd->localcoloring) { 38147c6ae99SBarry Smith ierr = PetscMalloc(nc*nx*sizeof(ISColoringValue),&colors);CHKERRQ(ierr); 38247c6ae99SBarry Smith i1 = 0; 38347c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 38447c6ae99SBarry Smith for (l=0; l<nc; l++) { 38547c6ae99SBarry Smith colors[i1++] = l + nc*(i % col); 38647c6ae99SBarry Smith } 38747c6ae99SBarry Smith } 
38847c6ae99SBarry Smith ncolors = nc + nc*(col-1); 38947c6ae99SBarry Smith ierr = ISColoringCreate(comm,ncolors,nc*nx,colors,&dd->localcoloring);CHKERRQ(ierr); 39047c6ae99SBarry Smith } 39147c6ae99SBarry Smith *coloring = dd->localcoloring; 39247c6ae99SBarry Smith } else if (ctype == IS_COLORING_GHOSTED) { 39347c6ae99SBarry Smith if (!dd->ghostedcoloring) { 39447c6ae99SBarry Smith ierr = PetscMalloc(nc*gnx*sizeof(ISColoringValue),&colors);CHKERRQ(ierr); 39547c6ae99SBarry Smith i1 = 0; 39647c6ae99SBarry Smith for (i=gxs; i<gxs+gnx; i++) { 39747c6ae99SBarry Smith for (l=0; l<nc; l++) { 39847c6ae99SBarry Smith /* the complicated stuff is to handle periodic boundaries */ 39947c6ae99SBarry Smith colors[i1++] = l + nc*(SetInRange(i,m) % col); 40047c6ae99SBarry Smith } 40147c6ae99SBarry Smith } 40247c6ae99SBarry Smith ncolors = nc + nc*(col-1); 40347c6ae99SBarry Smith ierr = ISColoringCreate(comm,ncolors,nc*gnx,colors,&dd->ghostedcoloring);CHKERRQ(ierr); 40447c6ae99SBarry Smith ierr = ISColoringSetType(dd->ghostedcoloring,IS_COLORING_GHOSTED);CHKERRQ(ierr); 40547c6ae99SBarry Smith } 40647c6ae99SBarry Smith *coloring = dd->ghostedcoloring; 40747c6ae99SBarry Smith } else SETERRQ1(((PetscObject)da)->comm,PETSC_ERR_ARG_WRONG,"Unknown ISColoringType %d",(int)ctype); 40847c6ae99SBarry Smith ierr = ISColoringReference(*coloring);CHKERRQ(ierr); 40947c6ae99SBarry Smith PetscFunctionReturn(0); 41047c6ae99SBarry Smith } 41147c6ae99SBarry Smith 41247c6ae99SBarry Smith #undef __FUNCT__ 41394013140SBarry Smith #define __FUNCT__ "DMGetColoring_DA_2d_5pt_MPIAIJ" 41494013140SBarry Smith PetscErrorCode DMGetColoring_DA_2d_5pt_MPIAIJ(DM da,ISColoringType ctype,ISColoring *coloring) 41547c6ae99SBarry Smith { 41647c6ae99SBarry Smith PetscErrorCode ierr; 41747c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,ii,gxs,gys,gnx,gny,m,n,dim,s,k,nc; 41847c6ae99SBarry Smith PetscInt ncolors; 41947c6ae99SBarry Smith MPI_Comm comm; 4201321219cSEthan Coon DMDABoundaryType bx,by; 42147c6ae99SBarry Smith 
ISColoringValue *colors; 42247c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 42347c6ae99SBarry Smith 42447c6ae99SBarry Smith PetscFunctionBegin; 42547c6ae99SBarry Smith /* 42647c6ae99SBarry Smith nc - number of components per grid point 42747c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 42847c6ae99SBarry Smith 42947c6ae99SBarry Smith */ 4301321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,0,0,0,0,&nc,&s,&bx,&by,0,0);CHKERRQ(ierr); 431aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr); 432aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr); 43347c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 43447c6ae99SBarry Smith 4351321219cSEthan Coon if (bx == DMDA_BOUNDARY_PERIODIC && (m % 5)){ 43647c6ae99SBarry Smith SETERRQ(((PetscObject)da)->comm,PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in X is divisible\n\ 43747c6ae99SBarry Smith by 5\n"); 43847c6ae99SBarry Smith } 4391321219cSEthan Coon if (by == DMDA_BOUNDARY_PERIODIC && (n % 5)){ 44047c6ae99SBarry Smith SETERRQ(((PetscObject)da)->comm,PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Y is divisible\n\ 44147c6ae99SBarry Smith by 5\n"); 44247c6ae99SBarry Smith } 44347c6ae99SBarry Smith 44447c6ae99SBarry Smith /* create the coloring */ 44547c6ae99SBarry Smith if (ctype == IS_COLORING_GLOBAL) { 44647c6ae99SBarry Smith if (!dd->localcoloring) { 44747c6ae99SBarry Smith ierr = PetscMalloc(nc*nx*ny*sizeof(ISColoringValue),&colors);CHKERRQ(ierr); 44847c6ae99SBarry Smith ii = 0; 44947c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 45047c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 45147c6ae99SBarry Smith for (k=0; k<nc; k++) { 45247c6ae99SBarry Smith colors[ii++] = k + nc*((3*j+i) % 5); 45347c6ae99SBarry Smith } 45447c6ae99SBarry Smith } 45547c6ae99SBarry Smith } 45647c6ae99SBarry Smith ncolors = 5*nc; 45747c6ae99SBarry Smith ierr 
= ISColoringCreate(comm,ncolors,nc*nx*ny,colors,&dd->localcoloring);CHKERRQ(ierr); 45847c6ae99SBarry Smith } 45947c6ae99SBarry Smith *coloring = dd->localcoloring; 46047c6ae99SBarry Smith } else if (ctype == IS_COLORING_GHOSTED) { 46147c6ae99SBarry Smith if (!dd->ghostedcoloring) { 46247c6ae99SBarry Smith ierr = PetscMalloc(nc*gnx*gny*sizeof(ISColoringValue),&colors);CHKERRQ(ierr); 46347c6ae99SBarry Smith ii = 0; 46447c6ae99SBarry Smith for (j=gys; j<gys+gny; j++) { 46547c6ae99SBarry Smith for (i=gxs; i<gxs+gnx; i++) { 46647c6ae99SBarry Smith for (k=0; k<nc; k++) { 46747c6ae99SBarry Smith colors[ii++] = k + nc*((3*SetInRange(j,n) + SetInRange(i,m)) % 5); 46847c6ae99SBarry Smith } 46947c6ae99SBarry Smith } 47047c6ae99SBarry Smith } 47147c6ae99SBarry Smith ncolors = 5*nc; 47247c6ae99SBarry Smith ierr = ISColoringCreate(comm,ncolors,nc*gnx*gny,colors,&dd->ghostedcoloring);CHKERRQ(ierr); 47347c6ae99SBarry Smith ierr = ISColoringSetType(dd->ghostedcoloring,IS_COLORING_GHOSTED);CHKERRQ(ierr); 47447c6ae99SBarry Smith } 47547c6ae99SBarry Smith *coloring = dd->ghostedcoloring; 47647c6ae99SBarry Smith } else SETERRQ1(((PetscObject)da)->comm,PETSC_ERR_ARG_WRONG,"Unknown ISColoringType %d",(int)ctype); 47747c6ae99SBarry Smith PetscFunctionReturn(0); 47847c6ae99SBarry Smith } 47947c6ae99SBarry Smith 48047c6ae99SBarry Smith /* =========================================================================== */ 48109573ac7SBarry Smith extern PetscErrorCode DMGetMatrix_DA_1d_MPIAIJ(DM,Mat); 48209573ac7SBarry Smith extern PetscErrorCode DMGetMatrix_DA_2d_MPIAIJ(DM,Mat); 48309573ac7SBarry Smith extern PetscErrorCode DMGetMatrix_DA_2d_MPIAIJ_Fill(DM,Mat); 48409573ac7SBarry Smith extern PetscErrorCode DMGetMatrix_DA_3d_MPIAIJ(DM,Mat); 48509573ac7SBarry Smith extern PetscErrorCode DMGetMatrix_DA_3d_MPIAIJ_Fill(DM,Mat); 48609573ac7SBarry Smith extern PetscErrorCode DMGetMatrix_DA_2d_MPIBAIJ(DM,Mat); 48709573ac7SBarry Smith extern PetscErrorCode DMGetMatrix_DA_3d_MPIBAIJ(DM,Mat); 
48809573ac7SBarry Smith extern PetscErrorCode DMGetMatrix_DA_2d_MPISBAIJ(DM,Mat); 48909573ac7SBarry Smith extern PetscErrorCode DMGetMatrix_DA_3d_MPISBAIJ(DM,Mat); 49047c6ae99SBarry Smith 49147c6ae99SBarry Smith #undef __FUNCT__ 49295ee5b0eSBarry Smith #define __FUNCT__ "MatSetDM" 49347c6ae99SBarry Smith /*@ 49495ee5b0eSBarry Smith MatSetDM - Sets the DMDA that is to be used by the HYPRE_StructMatrix PETSc matrix 49547c6ae99SBarry Smith 49647c6ae99SBarry Smith Logically Collective on Mat 49747c6ae99SBarry Smith 49847c6ae99SBarry Smith Input Parameters: 49947c6ae99SBarry Smith + mat - the matrix 50047c6ae99SBarry Smith - da - the da 50147c6ae99SBarry Smith 50247c6ae99SBarry Smith Level: intermediate 50347c6ae99SBarry Smith 50447c6ae99SBarry Smith @*/ 50595ee5b0eSBarry Smith PetscErrorCode MatSetDM(Mat mat,DM da) 50647c6ae99SBarry Smith { 50747c6ae99SBarry Smith PetscErrorCode ierr; 50847c6ae99SBarry Smith 50947c6ae99SBarry Smith PetscFunctionBegin; 51047c6ae99SBarry Smith PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 51147c6ae99SBarry Smith PetscValidHeaderSpecific(da,DM_CLASSID,1); 51295ee5b0eSBarry Smith ierr = PetscTryMethod(mat,"MatSetDM_C",(Mat,DM),(mat,da));CHKERRQ(ierr); 51347c6ae99SBarry Smith PetscFunctionReturn(0); 51447c6ae99SBarry Smith } 51547c6ae99SBarry Smith 51647c6ae99SBarry Smith EXTERN_C_BEGIN 51747c6ae99SBarry Smith #undef __FUNCT__ 51847c6ae99SBarry Smith #define __FUNCT__ "MatView_MPI_DA" 5197087cfbeSBarry Smith PetscErrorCode MatView_MPI_DA(Mat A,PetscViewer viewer) 52047c6ae99SBarry Smith { 5219a42bb27SBarry Smith DM da; 52247c6ae99SBarry Smith PetscErrorCode ierr; 52347c6ae99SBarry Smith const char *prefix; 52447c6ae99SBarry Smith Mat Anatural; 52547c6ae99SBarry Smith AO ao; 52647c6ae99SBarry Smith PetscInt rstart,rend,*petsc,i; 52747c6ae99SBarry Smith IS is; 52847c6ae99SBarry Smith MPI_Comm comm; 52947c6ae99SBarry Smith 53047c6ae99SBarry Smith PetscFunctionBegin; 53147c6ae99SBarry Smith ierr = 
PetscObjectGetComm((PetscObject)A,&comm);CHKERRQ(ierr); 5323c0c59f3SBarry Smith ierr = PetscObjectQuery((PetscObject)A,"DM",(PetscObject*)&da);CHKERRQ(ierr); 533aa219208SBarry Smith if (!da) SETERRQ(((PetscObject)A)->comm,PETSC_ERR_ARG_WRONG,"Matrix not generated from a DMDA"); 53447c6ae99SBarry Smith 535aa219208SBarry Smith ierr = DMDAGetAO(da,&ao);CHKERRQ(ierr); 53647c6ae99SBarry Smith ierr = MatGetOwnershipRange(A,&rstart,&rend);CHKERRQ(ierr); 53747c6ae99SBarry Smith ierr = PetscMalloc((rend-rstart)*sizeof(PetscInt),&petsc);CHKERRQ(ierr); 53847c6ae99SBarry Smith for (i=rstart; i<rend; i++) petsc[i-rstart] = i; 53947c6ae99SBarry Smith ierr = AOApplicationToPetsc(ao,rend-rstart,petsc);CHKERRQ(ierr); 54047c6ae99SBarry Smith ierr = ISCreateGeneral(comm,rend-rstart,petsc,PETSC_OWN_POINTER,&is);CHKERRQ(ierr); 54147c6ae99SBarry Smith 54247c6ae99SBarry Smith /* call viewer on natural ordering */ 54347c6ae99SBarry Smith ierr = MatGetSubMatrix(A,is,is,MAT_INITIAL_MATRIX,&Anatural);CHKERRQ(ierr); 544fcfd50ebSBarry Smith ierr = ISDestroy(&is);CHKERRQ(ierr); 54547c6ae99SBarry Smith ierr = PetscObjectGetOptionsPrefix((PetscObject)A,&prefix);CHKERRQ(ierr); 54647c6ae99SBarry Smith ierr = PetscObjectSetOptionsPrefix((PetscObject)Anatural,prefix);CHKERRQ(ierr); 54747c6ae99SBarry Smith ierr = PetscObjectSetName((PetscObject)Anatural,((PetscObject)A)->name);CHKERRQ(ierr); 54847c6ae99SBarry Smith ierr = MatView(Anatural,viewer);CHKERRQ(ierr); 549fcfd50ebSBarry Smith ierr = MatDestroy(&Anatural);CHKERRQ(ierr); 55047c6ae99SBarry Smith PetscFunctionReturn(0); 55147c6ae99SBarry Smith } 55247c6ae99SBarry Smith EXTERN_C_END 55347c6ae99SBarry Smith 55447c6ae99SBarry Smith EXTERN_C_BEGIN 55547c6ae99SBarry Smith #undef __FUNCT__ 55647c6ae99SBarry Smith #define __FUNCT__ "MatLoad_MPI_DA" 5577087cfbeSBarry Smith PetscErrorCode MatLoad_MPI_DA(Mat A,PetscViewer viewer) 55847c6ae99SBarry Smith { 5599a42bb27SBarry Smith DM da; 56047c6ae99SBarry Smith PetscErrorCode ierr; 56147c6ae99SBarry Smith 
Mat Anatural,Aapp; 56247c6ae99SBarry Smith AO ao; 56347c6ae99SBarry Smith PetscInt rstart,rend,*app,i; 56447c6ae99SBarry Smith IS is; 56547c6ae99SBarry Smith MPI_Comm comm; 56647c6ae99SBarry Smith 56747c6ae99SBarry Smith PetscFunctionBegin; 56847c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)A,&comm);CHKERRQ(ierr); 5693c0c59f3SBarry Smith ierr = PetscObjectQuery((PetscObject)A,"DM",(PetscObject*)&da);CHKERRQ(ierr); 570aa219208SBarry Smith if (!da) SETERRQ(((PetscObject)A)->comm,PETSC_ERR_ARG_WRONG,"Matrix not generated from a DMDA"); 57147c6ae99SBarry Smith 57247c6ae99SBarry Smith /* Load the matrix in natural ordering */ 57347c6ae99SBarry Smith ierr = MatCreate(((PetscObject)A)->comm,&Anatural);CHKERRQ(ierr); 57447c6ae99SBarry Smith ierr = MatSetType(Anatural,((PetscObject)A)->type_name);CHKERRQ(ierr); 57547c6ae99SBarry Smith ierr = MatSetSizes(Anatural,A->rmap->n,A->cmap->n,A->rmap->N,A->cmap->N);CHKERRQ(ierr); 57647c6ae99SBarry Smith ierr = MatLoad(Anatural,viewer);CHKERRQ(ierr); 57747c6ae99SBarry Smith 57847c6ae99SBarry Smith /* Map natural ordering to application ordering and create IS */ 579aa219208SBarry Smith ierr = DMDAGetAO(da,&ao);CHKERRQ(ierr); 58047c6ae99SBarry Smith ierr = MatGetOwnershipRange(Anatural,&rstart,&rend);CHKERRQ(ierr); 58147c6ae99SBarry Smith ierr = PetscMalloc((rend-rstart)*sizeof(PetscInt),&app);CHKERRQ(ierr); 58247c6ae99SBarry Smith for (i=rstart; i<rend; i++) app[i-rstart] = i; 58347c6ae99SBarry Smith ierr = AOPetscToApplication(ao,rend-rstart,app);CHKERRQ(ierr); 58447c6ae99SBarry Smith ierr = ISCreateGeneral(comm,rend-rstart,app,PETSC_OWN_POINTER,&is);CHKERRQ(ierr); 58547c6ae99SBarry Smith 58647c6ae99SBarry Smith /* Do permutation and replace header */ 58747c6ae99SBarry Smith ierr = MatGetSubMatrix(Anatural,is,is,MAT_INITIAL_MATRIX,&Aapp);CHKERRQ(ierr); 58847c6ae99SBarry Smith ierr = MatHeaderReplace(A,Aapp);CHKERRQ(ierr); 589fcfd50ebSBarry Smith ierr = ISDestroy(&is);CHKERRQ(ierr); 590fcfd50ebSBarry Smith ierr = 
MatDestroy(&Anatural);CHKERRQ(ierr); 59147c6ae99SBarry Smith PetscFunctionReturn(0); 59247c6ae99SBarry Smith } 59347c6ae99SBarry Smith EXTERN_C_END 59447c6ae99SBarry Smith 59547c6ae99SBarry Smith #undef __FUNCT__ 59694013140SBarry Smith #define __FUNCT__ "DMGetMatrix_DA" 5977087cfbeSBarry Smith PetscErrorCode DMGetMatrix_DA(DM da, const MatType mtype,Mat *J) 59847c6ae99SBarry Smith { 59947c6ae99SBarry Smith PetscErrorCode ierr; 60047c6ae99SBarry Smith PetscInt dim,dof,nx,ny,nz,dims[3],starts[3],M,N,P; 60147c6ae99SBarry Smith Mat A; 60247c6ae99SBarry Smith MPI_Comm comm; 60347c6ae99SBarry Smith const MatType Atype; 60447c6ae99SBarry Smith void (*aij)(void)=PETSC_NULL,(*baij)(void)=PETSC_NULL,(*sbaij)(void)=PETSC_NULL; 60547c6ae99SBarry Smith MatType ttype[256]; 60647c6ae99SBarry Smith PetscBool flg; 60747c6ae99SBarry Smith PetscMPIInt size; 60847c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 60947c6ae99SBarry Smith 61047c6ae99SBarry Smith PetscFunctionBegin; 61147c6ae99SBarry Smith #ifndef PETSC_USE_DYNAMIC_LIBRARIES 61247c6ae99SBarry Smith ierr = MatInitializePackage(PETSC_NULL);CHKERRQ(ierr); 61347c6ae99SBarry Smith #endif 6145da5aae0SJed Brown if (!mtype) mtype = MATAIJ; 61547c6ae99SBarry Smith ierr = PetscStrcpy((char*)ttype,mtype);CHKERRQ(ierr); 616aa219208SBarry Smith ierr = PetscOptionsBegin(((PetscObject)da)->comm,((PetscObject)da)->prefix,"DMDA options","Mat");CHKERRQ(ierr); 61747c6ae99SBarry Smith ierr = PetscOptionsList("-da_mat_type","Matrix type","MatSetType",MatList,mtype,(char*)ttype,256,&flg);CHKERRQ(ierr); 61847c6ae99SBarry Smith ierr = PetscOptionsEnd(); 61947c6ae99SBarry Smith 62047c6ae99SBarry Smith /* 62147c6ae99SBarry Smith m 62247c6ae99SBarry Smith ------------------------------------------------------ 62347c6ae99SBarry Smith | | 62447c6ae99SBarry Smith | | 62547c6ae99SBarry Smith | ---------------------- | 62647c6ae99SBarry Smith | | | | 62747c6ae99SBarry Smith n | ny | | | 62847c6ae99SBarry Smith | | | | 62947c6ae99SBarry Smith | 
.--------------------- | 63047c6ae99SBarry Smith | (xs,ys) nx | 63147c6ae99SBarry Smith | . | 63247c6ae99SBarry Smith | (gxs,gys) | 63347c6ae99SBarry Smith | | 63447c6ae99SBarry Smith ----------------------------------------------------- 63547c6ae99SBarry Smith */ 63647c6ae99SBarry Smith 63747c6ae99SBarry Smith /* 63847c6ae99SBarry Smith nc - number of components per grid point 63947c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 64047c6ae99SBarry Smith 64147c6ae99SBarry Smith */ 6421321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&M,&N,&P,0,0,0,&dof,0,0,0,0,0);CHKERRQ(ierr); 643aa219208SBarry Smith ierr = DMDAGetCorners(da,0,0,0,&nx,&ny,&nz);CHKERRQ(ierr); 64447c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 64547c6ae99SBarry Smith ierr = MatCreate(comm,&A);CHKERRQ(ierr); 64647c6ae99SBarry Smith ierr = MatSetSizes(A,dof*nx*ny*nz,dof*nx*ny*nz,dof*M*N*P,dof*M*N*P);CHKERRQ(ierr); 64747c6ae99SBarry Smith ierr = MatSetType(A,(const MatType)ttype);CHKERRQ(ierr); 64895ee5b0eSBarry Smith ierr = MatSetDM(A,da);CHKERRQ(ierr); 64947c6ae99SBarry Smith ierr = MatSetFromOptions(A);CHKERRQ(ierr); 65047c6ae99SBarry Smith ierr = MatGetType(A,&Atype);CHKERRQ(ierr); 65147c6ae99SBarry Smith /* 652aa219208SBarry Smith We do not provide a getmatrix function in the DMDA operations because 653aa219208SBarry Smith the basic DMDA does not know about matrices. We think of DMDA as being more 65447c6ae99SBarry Smith more low-level than matrices. This is kind of cheating but, cause sometimes 655aa219208SBarry Smith we think of DMDA has higher level than matrices. 65647c6ae99SBarry Smith 65747c6ae99SBarry Smith We could switch based on Atype (or mtype), but we do not since the 65847c6ae99SBarry Smith specialized setting routines depend only the particular preallocation 65947c6ae99SBarry Smith details of the matrix, not the type itself. 
66047c6ae99SBarry Smith */ 66147c6ae99SBarry Smith ierr = PetscObjectQueryFunction((PetscObject)A,"MatMPIAIJSetPreallocation_C",&aij);CHKERRQ(ierr); 66247c6ae99SBarry Smith if (!aij) { 66347c6ae99SBarry Smith ierr = PetscObjectQueryFunction((PetscObject)A,"MatSeqAIJSetPreallocation_C",&aij);CHKERRQ(ierr); 66447c6ae99SBarry Smith } 66547c6ae99SBarry Smith if (!aij) { 66647c6ae99SBarry Smith ierr = PetscObjectQueryFunction((PetscObject)A,"MatMPIBAIJSetPreallocation_C",&baij);CHKERRQ(ierr); 66747c6ae99SBarry Smith if (!baij) { 66847c6ae99SBarry Smith ierr = PetscObjectQueryFunction((PetscObject)A,"MatSeqBAIJSetPreallocation_C",&baij);CHKERRQ(ierr); 66947c6ae99SBarry Smith } 67047c6ae99SBarry Smith if (!baij){ 67147c6ae99SBarry Smith ierr = PetscObjectQueryFunction((PetscObject)A,"MatMPISBAIJSetPreallocation_C",&sbaij);CHKERRQ(ierr); 67247c6ae99SBarry Smith if (!sbaij) { 67347c6ae99SBarry Smith ierr = PetscObjectQueryFunction((PetscObject)A,"MatSeqSBAIJSetPreallocation_C",&sbaij);CHKERRQ(ierr); 67447c6ae99SBarry Smith } 67547c6ae99SBarry Smith } 67647c6ae99SBarry Smith } 67747c6ae99SBarry Smith if (aij) { 67847c6ae99SBarry Smith if (dim == 1) { 67994013140SBarry Smith ierr = DMGetMatrix_DA_1d_MPIAIJ(da,A);CHKERRQ(ierr); 68047c6ae99SBarry Smith } else if (dim == 2) { 68147c6ae99SBarry Smith if (dd->ofill) { 68294013140SBarry Smith ierr = DMGetMatrix_DA_2d_MPIAIJ_Fill(da,A);CHKERRQ(ierr); 68347c6ae99SBarry Smith } else { 68494013140SBarry Smith ierr = DMGetMatrix_DA_2d_MPIAIJ(da,A);CHKERRQ(ierr); 68547c6ae99SBarry Smith } 68647c6ae99SBarry Smith } else if (dim == 3) { 68747c6ae99SBarry Smith if (dd->ofill) { 68894013140SBarry Smith ierr = DMGetMatrix_DA_3d_MPIAIJ_Fill(da,A);CHKERRQ(ierr); 68947c6ae99SBarry Smith } else { 69094013140SBarry Smith ierr = DMGetMatrix_DA_3d_MPIAIJ(da,A);CHKERRQ(ierr); 69147c6ae99SBarry Smith } 69247c6ae99SBarry Smith } 69347c6ae99SBarry Smith } else if (baij) { 69447c6ae99SBarry Smith if (dim == 2) { 69594013140SBarry Smith ierr = 
DMGetMatrix_DA_2d_MPIBAIJ(da,A);CHKERRQ(ierr); 69647c6ae99SBarry Smith } else if (dim == 3) { 69794013140SBarry Smith ierr = DMGetMatrix_DA_3d_MPIBAIJ(da,A);CHKERRQ(ierr); 69847c6ae99SBarry Smith } else { 699b17742caSSean Farley SETERRQ3(((PetscObject)da)->comm,PETSC_ERR_SUP,"Not implemented for %D dimension and Matrix Type: %s in %D dimension!\n" \ 700b17742caSSean Farley "Send mail to petsc-maint@mcs.anl.gov for code",dim,Atype,dim); 70147c6ae99SBarry Smith } 70247c6ae99SBarry Smith } else if (sbaij) { 70347c6ae99SBarry Smith if (dim == 2) { 70494013140SBarry Smith ierr = DMGetMatrix_DA_2d_MPISBAIJ(da,A);CHKERRQ(ierr); 70547c6ae99SBarry Smith } else if (dim == 3) { 70694013140SBarry Smith ierr = DMGetMatrix_DA_3d_MPISBAIJ(da,A);CHKERRQ(ierr); 70747c6ae99SBarry Smith } else { 708b17742caSSean Farley SETERRQ3(((PetscObject)da)->comm,PETSC_ERR_SUP,"Not implemented for %D dimension and Matrix Type: %s in %D dimension!\n" \ 709b17742caSSean Farley "Send mail to petsc-maint@mcs.anl.gov for code",dim,Atype,dim); 71047c6ae99SBarry Smith } 71147c6ae99SBarry Smith } 712aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&starts[0],&starts[1],&starts[2],&dims[0],&dims[1],&dims[2]);CHKERRQ(ierr); 71347c6ae99SBarry Smith ierr = MatSetStencil(A,dim,dims,starts,dof);CHKERRQ(ierr); 7143c0c59f3SBarry Smith ierr = PetscObjectCompose((PetscObject)A,"DM",(PetscObject)da);CHKERRQ(ierr); 71547c6ae99SBarry Smith ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 71647c6ae99SBarry Smith if (size > 1) { 71747c6ae99SBarry Smith /* change viewer to display matrix in natural ordering */ 71847c6ae99SBarry Smith ierr = MatShellSetOperation(A, MATOP_VIEW, (void (*)(void)) MatView_MPI_DA);CHKERRQ(ierr); 71947c6ae99SBarry Smith ierr = MatShellSetOperation(A, MATOP_LOAD, (void (*)(void)) MatLoad_MPI_DA);CHKERRQ(ierr); 72047c6ae99SBarry Smith } 72147c6ae99SBarry Smith *J = A; 72247c6ae99SBarry Smith PetscFunctionReturn(0); 72347c6ae99SBarry Smith } 72447c6ae99SBarry Smith 72547c6ae99SBarry Smith /* 
---------------------------------------------------------------------------------*/ 72647c6ae99SBarry Smith #undef __FUNCT__ 72794013140SBarry Smith #define __FUNCT__ "DMGetMatrix_DA_2d_MPIAIJ" 72894013140SBarry Smith PetscErrorCode DMGetMatrix_DA_2d_MPIAIJ(DM da,Mat J) 72947c6ae99SBarry Smith { 73047c6ae99SBarry Smith PetscErrorCode ierr; 73147c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny,m,n,dim,s,*cols = PETSC_NULL,k,nc,*rows = PETSC_NULL,col,cnt,l,p; 73247c6ae99SBarry Smith PetscInt lstart,lend,pstart,pend,*dnz,*onz; 73347c6ae99SBarry Smith MPI_Comm comm; 73447c6ae99SBarry Smith PetscScalar *values; 7351321219cSEthan Coon DMDABoundaryType bx,by; 73647c6ae99SBarry Smith ISLocalToGlobalMapping ltog,ltogb; 737aa219208SBarry Smith DMDAStencilType st; 73847c6ae99SBarry Smith 73947c6ae99SBarry Smith PetscFunctionBegin; 74047c6ae99SBarry Smith /* 74147c6ae99SBarry Smith nc - number of components per grid point 74247c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 74347c6ae99SBarry Smith 74447c6ae99SBarry Smith */ 7451321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,0,0,0,0,&nc,&s,&bx,&by,0,&st);CHKERRQ(ierr); 74647c6ae99SBarry Smith col = 2*s + 1; 747aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr); 748aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr); 74947c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 75047c6ae99SBarry Smith 75147c6ae99SBarry Smith ierr = PetscMalloc2(nc,PetscInt,&rows,col*col*nc*nc,PetscInt,&cols);CHKERRQ(ierr); 7521411c6eeSJed Brown ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 7531411c6eeSJed Brown ierr = DMGetLocalToGlobalMappingBlock(da,<ogb);CHKERRQ(ierr); 75447c6ae99SBarry Smith 75547c6ae99SBarry Smith /* determine the matrix preallocation information */ 75647c6ae99SBarry Smith ierr = MatPreallocateInitialize(comm,nc*nx*ny,nc*nx*ny,dnz,onz);CHKERRQ(ierr); 
75747c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 75847c6ae99SBarry Smith 7591321219cSEthan Coon pstart = (bx == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 7601321219cSEthan Coon pend = (bx == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 76147c6ae99SBarry Smith 76247c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 76347c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys); 76447c6ae99SBarry Smith 7651321219cSEthan Coon lstart = (by == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 7661321219cSEthan Coon lend = (by == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 76747c6ae99SBarry Smith 76847c6ae99SBarry Smith cnt = 0; 76947c6ae99SBarry Smith for (k=0; k<nc; k++) { 77047c6ae99SBarry Smith for (l=lstart; l<lend+1; l++) { 77147c6ae99SBarry Smith for (p=pstart; p<pend+1; p++) { 772aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || (!l || !p)) { /* entries on star have either l = 0 or p = 0 */ 77347c6ae99SBarry Smith cols[cnt++] = k + nc*(slot + gnx*l + p); 77447c6ae99SBarry Smith } 77547c6ae99SBarry Smith } 77647c6ae99SBarry Smith } 77747c6ae99SBarry Smith rows[k] = k + nc*(slot); 77847c6ae99SBarry Smith } 779784ac674SJed Brown ierr = MatPreallocateSetLocal(ltog,nc,rows,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr); 78047c6ae99SBarry Smith } 78147c6ae99SBarry Smith } 78247c6ae99SBarry Smith ierr = MatSeqAIJSetPreallocation(J,0,dnz);CHKERRQ(ierr); 78347c6ae99SBarry Smith ierr = MatMPIAIJSetPreallocation(J,0,dnz,0,onz);CHKERRQ(ierr); 78447c6ae99SBarry Smith ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr); 78547c6ae99SBarry Smith ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 78647c6ae99SBarry Smith 787784ac674SJed Brown ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 788784ac674SJed Brown ierr = MatSetLocalToGlobalMappingBlock(J,ltogb,ltogb);CHKERRQ(ierr); 78947c6ae99SBarry Smith 79047c6ae99SBarry Smith /* 79147c6ae99SBarry Smith For each node in the grid: we get the neighbors in the local (on processor ordering 79247c6ae99SBarry Smith that 
includes the ghost points) then MatSetValuesLocal() maps those indices to the global 79347c6ae99SBarry Smith PETSc ordering. 79447c6ae99SBarry Smith */ 795fcfd50ebSBarry Smith if (!da->prealloc_only) { 79647c6ae99SBarry Smith ierr = PetscMalloc(col*col*nc*nc*sizeof(PetscScalar),&values);CHKERRQ(ierr); 79747c6ae99SBarry Smith ierr = PetscMemzero(values,col*col*nc*nc*sizeof(PetscScalar));CHKERRQ(ierr); 79847c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 79947c6ae99SBarry Smith 8001321219cSEthan Coon pstart = (bx == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 8011321219cSEthan Coon pend = (bx == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 80247c6ae99SBarry Smith 80347c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 80447c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys); 80547c6ae99SBarry Smith 8061321219cSEthan Coon lstart = (by == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 8071321219cSEthan Coon lend = (by == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 80847c6ae99SBarry Smith 80947c6ae99SBarry Smith cnt = 0; 81047c6ae99SBarry Smith for (k=0; k<nc; k++) { 81147c6ae99SBarry Smith for (l=lstart; l<lend+1; l++) { 81247c6ae99SBarry Smith for (p=pstart; p<pend+1; p++) { 813aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || (!l || !p)) { /* entries on star have either l = 0 or p = 0 */ 81447c6ae99SBarry Smith cols[cnt++] = k + nc*(slot + gnx*l + p); 81547c6ae99SBarry Smith } 81647c6ae99SBarry Smith } 81747c6ae99SBarry Smith } 81847c6ae99SBarry Smith rows[k] = k + nc*(slot); 81947c6ae99SBarry Smith } 82047c6ae99SBarry Smith ierr = MatSetValuesLocal(J,nc,rows,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 82147c6ae99SBarry Smith } 82247c6ae99SBarry Smith } 82347c6ae99SBarry Smith ierr = PetscFree(values);CHKERRQ(ierr); 82447c6ae99SBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 82547c6ae99SBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 82647c6ae99SBarry Smith } 82747c6ae99SBarry Smith ierr = 
PetscFree2(rows,cols);CHKERRQ(ierr); 82847c6ae99SBarry Smith PetscFunctionReturn(0); 82947c6ae99SBarry Smith } 83047c6ae99SBarry Smith 83147c6ae99SBarry Smith #undef __FUNCT__ 83294013140SBarry Smith #define __FUNCT__ "DMGetMatrix_DA_2d_MPIAIJ_Fill" 83394013140SBarry Smith PetscErrorCode DMGetMatrix_DA_2d_MPIAIJ_Fill(DM da,Mat J) 83447c6ae99SBarry Smith { 83547c6ae99SBarry Smith PetscErrorCode ierr; 83647c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny; 83747c6ae99SBarry Smith PetscInt m,n,dim,s,*cols,k,nc,row,col,cnt,l,p; 83847c6ae99SBarry Smith PetscInt lstart,lend,pstart,pend,*dnz,*onz; 83947c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 84047c6ae99SBarry Smith PetscInt ifill_col,*ofill = dd->ofill, *dfill = dd->dfill; 84147c6ae99SBarry Smith MPI_Comm comm; 84247c6ae99SBarry Smith PetscScalar *values; 8431321219cSEthan Coon DMDABoundaryType bx,by; 84447c6ae99SBarry Smith ISLocalToGlobalMapping ltog,ltogb; 845aa219208SBarry Smith DMDAStencilType st; 84647c6ae99SBarry Smith 84747c6ae99SBarry Smith PetscFunctionBegin; 84847c6ae99SBarry Smith /* 84947c6ae99SBarry Smith nc - number of components per grid point 85047c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 85147c6ae99SBarry Smith 85247c6ae99SBarry Smith */ 8531321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,0,0,0,0,&nc,&s,&bx,&by,0,&st);CHKERRQ(ierr); 85447c6ae99SBarry Smith col = 2*s + 1; 855aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr); 856aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr); 85747c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 85847c6ae99SBarry Smith 85947c6ae99SBarry Smith ierr = PetscMalloc(col*col*nc*nc*sizeof(PetscInt),&cols);CHKERRQ(ierr); 8601411c6eeSJed Brown ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 8611411c6eeSJed Brown ierr = DMGetLocalToGlobalMappingBlock(da,<ogb);CHKERRQ(ierr); 
86247c6ae99SBarry Smith 86347c6ae99SBarry Smith /* determine the matrix preallocation information */ 86447c6ae99SBarry Smith ierr = MatPreallocateInitialize(comm,nc*nx*ny,nc*nx*ny,dnz,onz);CHKERRQ(ierr); 86547c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 86647c6ae99SBarry Smith 8671321219cSEthan Coon pstart = (bx == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 8681321219cSEthan Coon pend = (bx == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 86947c6ae99SBarry Smith 87047c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 87147c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys); 87247c6ae99SBarry Smith 8731321219cSEthan Coon lstart = (by == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 8741321219cSEthan Coon lend = (by == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 87547c6ae99SBarry Smith 87647c6ae99SBarry Smith for (k=0; k<nc; k++) { 87747c6ae99SBarry Smith cnt = 0; 87847c6ae99SBarry Smith for (l=lstart; l<lend+1; l++) { 87947c6ae99SBarry Smith for (p=pstart; p<pend+1; p++) { 88047c6ae99SBarry Smith if (l || p) { 881aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || (!l || !p)) { /* entries on star */ 88247c6ae99SBarry Smith for (ifill_col=ofill[k]; ifill_col<ofill[k+1]; ifill_col++) 88347c6ae99SBarry Smith cols[cnt++] = ofill[ifill_col] + nc*(slot + gnx*l + p); 88447c6ae99SBarry Smith } 88547c6ae99SBarry Smith } else { 88647c6ae99SBarry Smith if (dfill) { 88747c6ae99SBarry Smith for (ifill_col=dfill[k]; ifill_col<dfill[k+1]; ifill_col++) 88847c6ae99SBarry Smith cols[cnt++] = dfill[ifill_col] + nc*(slot + gnx*l + p); 88947c6ae99SBarry Smith } else { 89047c6ae99SBarry Smith for (ifill_col=0; ifill_col<nc; ifill_col++) 89147c6ae99SBarry Smith cols[cnt++] = ifill_col + nc*(slot + gnx*l + p); 89247c6ae99SBarry Smith } 89347c6ae99SBarry Smith } 89447c6ae99SBarry Smith } 89547c6ae99SBarry Smith } 89647c6ae99SBarry Smith row = k + nc*(slot); 897784ac674SJed Brown ierr = MatPreallocateSetLocal(ltog,1,&row,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr); 
89847c6ae99SBarry Smith } 89947c6ae99SBarry Smith } 90047c6ae99SBarry Smith } 90147c6ae99SBarry Smith ierr = MatSeqAIJSetPreallocation(J,0,dnz);CHKERRQ(ierr); 90247c6ae99SBarry Smith ierr = MatMPIAIJSetPreallocation(J,0,dnz,0,onz);CHKERRQ(ierr); 90347c6ae99SBarry Smith ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 904784ac674SJed Brown ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 905784ac674SJed Brown ierr = MatSetLocalToGlobalMappingBlock(J,ltogb,ltogb);CHKERRQ(ierr); 90647c6ae99SBarry Smith 90747c6ae99SBarry Smith /* 90847c6ae99SBarry Smith For each node in the grid: we get the neighbors in the local (on processor ordering 90947c6ae99SBarry Smith that includes the ghost points) then MatSetValuesLocal() maps those indices to the global 91047c6ae99SBarry Smith PETSc ordering. 91147c6ae99SBarry Smith */ 912fcfd50ebSBarry Smith if (!da->prealloc_only) { 91347c6ae99SBarry Smith ierr = PetscMalloc(col*col*nc*nc*sizeof(PetscScalar),&values);CHKERRQ(ierr); 91447c6ae99SBarry Smith ierr = PetscMemzero(values,col*col*nc*nc*sizeof(PetscScalar));CHKERRQ(ierr); 91547c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 91647c6ae99SBarry Smith 9171321219cSEthan Coon pstart = (bx == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 9181321219cSEthan Coon pend = (bx == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 91947c6ae99SBarry Smith 92047c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 92147c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys); 92247c6ae99SBarry Smith 9231321219cSEthan Coon lstart = (by == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 9241321219cSEthan Coon lend = (by == DMDA_BOUNDARY_PERIODIC) ? 
s : (PetscMin(s,n-j-1)); 92547c6ae99SBarry Smith 92647c6ae99SBarry Smith for (k=0; k<nc; k++) { 92747c6ae99SBarry Smith cnt = 0; 92847c6ae99SBarry Smith for (l=lstart; l<lend+1; l++) { 92947c6ae99SBarry Smith for (p=pstart; p<pend+1; p++) { 93047c6ae99SBarry Smith if (l || p) { 931aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || (!l || !p)) { /* entries on star */ 93247c6ae99SBarry Smith for (ifill_col=ofill[k]; ifill_col<ofill[k+1]; ifill_col++) 93347c6ae99SBarry Smith cols[cnt++] = ofill[ifill_col] + nc*(slot + gnx*l + p); 93447c6ae99SBarry Smith } 93547c6ae99SBarry Smith } else { 93647c6ae99SBarry Smith if (dfill) { 93747c6ae99SBarry Smith for (ifill_col=dfill[k]; ifill_col<dfill[k+1]; ifill_col++) 93847c6ae99SBarry Smith cols[cnt++] = dfill[ifill_col] + nc*(slot + gnx*l + p); 93947c6ae99SBarry Smith } else { 94047c6ae99SBarry Smith for (ifill_col=0; ifill_col<nc; ifill_col++) 94147c6ae99SBarry Smith cols[cnt++] = ifill_col + nc*(slot + gnx*l + p); 94247c6ae99SBarry Smith } 94347c6ae99SBarry Smith } 94447c6ae99SBarry Smith } 94547c6ae99SBarry Smith } 94647c6ae99SBarry Smith row = k + nc*(slot); 94747c6ae99SBarry Smith ierr = MatSetValuesLocal(J,1,&row,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 94847c6ae99SBarry Smith } 94947c6ae99SBarry Smith } 95047c6ae99SBarry Smith } 95147c6ae99SBarry Smith ierr = PetscFree(values);CHKERRQ(ierr); 95247c6ae99SBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 95347c6ae99SBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 95447c6ae99SBarry Smith } 95547c6ae99SBarry Smith ierr = PetscFree(cols);CHKERRQ(ierr); 95647c6ae99SBarry Smith PetscFunctionReturn(0); 95747c6ae99SBarry Smith } 95847c6ae99SBarry Smith 95947c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/ 96047c6ae99SBarry Smith 96147c6ae99SBarry Smith #undef __FUNCT__ 96294013140SBarry Smith #define __FUNCT__ "DMGetMatrix_DA_3d_MPIAIJ" 96394013140SBarry Smith 
/*
   DMGetMatrix_DA_3d_MPIAIJ - Preallocates an AIJ matrix for a 3d DMDA and,
   unless da->prealloc_only is set, inserts explicit zeros at every stencil
   location and assembles the matrix.

   Input Parameters:
+  da - the 3d distributed array
-  J  - the matrix; its sizes and type must already be set

   Notes:
   Every component of a grid point is coupled to every component of each
   stencil neighbour.  For a box stencil the neighbours are all offsets
   (ii,jj,kk) within s of the point; otherwise only those offsets where at
   least two of ii, jj, kk are zero.  In a direction that is not
   DMDA_BOUNDARY_PERIODIC the offsets are clipped so that they stay inside the
   global grid.
*/
PetscErrorCode DMGetMatrix_DA_3d_MPIAIJ(DM da,Mat J)
{
  PetscErrorCode         ierr;
  PetscInt               xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny;
  PetscInt               m,n,dim,s,*cols = PETSC_NULL,k,nc,*rows = PETSC_NULL,col,cnt,l,p,*dnz = PETSC_NULL,*onz = PETSC_NULL;
  PetscInt               istart,iend,jstart,jend,kstart,kend,zs,nz,gzs,gnz,ii,jj,kk;
  MPI_Comm               comm;
  PetscScalar            *values;
  DMDABoundaryType       bx,by,bz;
  ISLocalToGlobalMapping ltog,ltogb;
  DMDAStencilType        st;

  PetscFunctionBegin;
  /*
         nc - number of components per grid point
         col - number of colors needed in one direction for single component problem

  */
  /* note: p receives the global grid size in z here; l indexes the components */
  ierr = DMDAGetInfo(da,&dim,&m,&n,&p,0,0,0,&nc,&s,&bx,&by,&bz,&st);CHKERRQ(ierr);
  col    = 2*s + 1;

  ierr = DMDAGetCorners(da,&xs,&ys,&zs,&nx,&ny,&nz);CHKERRQ(ierr);
  ierr = DMDAGetGhostCorners(da,&gxs,&gys,&gzs,&gnx,&gny,&gnz);CHKERRQ(ierr);
  ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr);

  ierr = PetscMalloc2(nc,PetscInt,&rows,col*col*col*nc*nc,PetscInt,&cols);CHKERRQ(ierr);
  ierr = DMGetLocalToGlobalMapping(da,&ltog);CHKERRQ(ierr);
  ierr = DMGetLocalToGlobalMappingBlock(da,&ltogb);CHKERRQ(ierr);

  /* determine the matrix preallocation information */
  ierr = MatPreallocateInitialize(comm,nc*nx*ny*nz,nc*nx*ny*nz,dnz,onz);CHKERRQ(ierr);
  for (i=xs; i<xs+nx; i++) {
    istart = (bx == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
    iend   = (bx == DMDA_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
    for (j=ys; j<ys+ny; j++) {
      jstart = (by == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
      jend   = (by == DMDA_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
      for (k=zs; k<zs+nz; k++) {
        kstart = (bz == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k));
        kend   = (bz == DMDA_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,p-k-1));

        /* index of grid point (i,j,k) in the local (ghosted) numbering */
        slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs);

        cnt  = 0;
        for (l=0; l<nc; l++) {
          for (ii=istart; ii<iend+1; ii++) {
            for (jj=jstart; jj<jend+1; jj++) {
              for (kk=kstart; kk<kend+1; kk++) {
                if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/
                  cols[cnt++]  = l + nc*(slot + ii + gnx*jj + gnx*gny*kk);
                }
              }
            }
          }
          rows[l] = l + nc*(slot);
        }
        ierr = MatPreallocateSetLocal(ltog,nc,rows,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr);
      }
    }
  }
  ierr = MatSeqAIJSetPreallocation(J,0,dnz);CHKERRQ(ierr);
  ierr = MatMPIAIJSetPreallocation(J,0,dnz,0,onz);CHKERRQ(ierr);
  ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr);
  ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr);
  ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr);
  ierr = MatSetLocalToGlobalMappingBlock(J,ltogb,ltogb);CHKERRQ(ierr);

  /*
    For each node in the grid: we get the neighbors in the local (on processor ordering
    that includes the ghost points) then MatSetValuesLocal() maps those indices to the global
    PETSc ordering.
  */
  if (!da->prealloc_only) {
    /*
       MatSetValuesLocal() below reads nc rows times cnt columns with
       cnt <= nc*col*col*col, so col*col*col*nc*nc zeros are sufficient.
    */
    ierr = PetscMalloc(col*col*col*nc*nc*sizeof(PetscScalar),&values);CHKERRQ(ierr);
    ierr = PetscMemzero(values,col*col*col*nc*nc*sizeof(PetscScalar));CHKERRQ(ierr);
    for (i=xs; i<xs+nx; i++) {
      istart = (bx == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i));
      iend   = (bx == DMDA_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,m-i-1));
      for (j=ys; j<ys+ny; j++) {
        jstart = (by == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j));
        jend   = (by == DMDA_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,n-j-1));
        for (k=zs; k<zs+nz; k++) {
          kstart = (bz == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k));
          kend   = (bz == DMDA_BOUNDARY_PERIODIC) ?  s : (PetscMin(s,p-k-1));

          slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs);

          cnt  = 0;
          for (l=0; l<nc; l++) {
            for (ii=istart; ii<iend+1; ii++) {
              for (jj=jstart; jj<jend+1; jj++) {
                for (kk=kstart; kk<kend+1; kk++) {
                  if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/
                    cols[cnt++]  = l + nc*(slot + ii + gnx*jj + gnx*gny*kk);
                  }
                }
              }
            }
            rows[l]      = l + nc*(slot);
          }
          ierr = MatSetValuesLocal(J,nc,rows,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
        }
      }
    }
    ierr = PetscFree(values);CHKERRQ(ierr);
    ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
    ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
  }
  ierr = PetscFree2(rows,cols);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

/* ---------------------------------------------------------------------------------*/

#undef __FUNCT__
#define __FUNCT__ "DMGetMatrix_DA_1d_MPIAIJ"
/*
   DMGetMatrix_DA_1d_MPIAIJ - Preallocates an AIJ matrix for a 1d DMDA and,
   unless da->prealloc_only is set, inserts explicit zeros at every stencil
   location and assembles the matrix.

   Input Parameters:
+  da - the 1d distributed array
-  J  - the matrix; its sizes and type must already be set

   Notes:
   Unlike the 2d and 3d routines no per-row counts are computed: every row is
   preallocated with col*nc entries in both the diagonal and the off-diagonal
   part.  The stencil offsets are clipped to the local ghosted range
   [gxs, gxs+gnx).
*/
PetscErrorCode DMGetMatrix_DA_1d_MPIAIJ(DM da,Mat J)
{
  PetscErrorCode         ierr;
  PetscInt               xs,nx,i,i1,slot,gxs,gnx;
  PetscInt               m,dim,s,*cols = PETSC_NULL,nc,*rows = PETSC_NULL,col,cnt,l;
  PetscInt               istart,iend;
  PetscScalar            *values;
  DMDABoundaryType       bx;
  ISLocalToGlobalMapping ltog,ltogb;

  PetscFunctionBegin;
  /*
         nc - number of components per grid point
         col - number of colors needed in one direction for single component problem

  */
  ierr = DMDAGetInfo(da,&dim,&m,0,0,0,0,0,&nc,&s,&bx,0,0,0);CHKERRQ(ierr);
  col    = 2*s + 1;

  ierr = DMDAGetCorners(da,&xs,0,0,&nx,0,0);CHKERRQ(ierr);
  ierr = DMDAGetGhostCorners(da,&gxs,0,0,&gnx,0,0);CHKERRQ(ierr);

  ierr = MatSeqAIJSetPreallocation(J,col*nc,0);CHKERRQ(ierr);
  ierr = MatMPIAIJSetPreallocation(J,col*nc,0,col*nc,0);CHKERRQ(ierr);
  ierr = MatSetBlockSize(J,nc);CHKERRQ(ierr);
  ierr = PetscMalloc2(nc,PetscInt,&rows,col*nc*nc,PetscInt,&cols);CHKERRQ(ierr);

  ierr = DMGetLocalToGlobalMapping(da,&ltog);CHKERRQ(ierr);
  ierr = DMGetLocalToGlobalMappingBlock(da,&ltogb);CHKERRQ(ierr);
  ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr);
  ierr = MatSetLocalToGlobalMappingBlock(J,ltogb,ltogb);CHKERRQ(ierr);

  /*
    For each node in the grid: we get the neighbors in the local (on processor ordering
    that includes the ghost points) then MatSetValuesLocal() maps those indices to the global
    PETSc ordering.
  */
  if (!da->prealloc_only) {
    ierr = PetscMalloc(col*nc*nc*sizeof(PetscScalar),&values);CHKERRQ(ierr);
    ierr = PetscMemzero(values,col*nc*nc*sizeof(PetscScalar));CHKERRQ(ierr);
    for (i=xs; i<xs+nx; i++) {
      /* keep the stencil inside the ghosted local range */
      istart = PetscMax(-s,gxs - i);
      iend   = PetscMin(s,gxs + gnx - i - 1);
      slot   = i - gxs;

      cnt  = 0;
      for (l=0; l<nc; l++) {
        for (i1=istart; i1<iend+1; i1++) {
          cols[cnt++] = l + nc*(slot + i1);
        }
        rows[l]      = l + nc*(slot);
      }
      ierr = MatSetValuesLocal(J,nc,rows,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr);
    }
    ierr = PetscFree(values);CHKERRQ(ierr);
    ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
    ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
  }
  ierr = PetscFree2(rows,cols);CHKERRQ(ierr);
  PetscFunctionReturn(0);
}

#undef __FUNCT__
#define __FUNCT__ "DMGetMatrix_DA_2d_MPIBAIJ"
PetscErrorCode DMGetMatrix_DA_2d_MPIBAIJ(DM da,Mat J)
{
  PetscErrorCode         ierr;
  PetscInt               xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny;
  PetscInt               m,n,dim,s,*cols,nc,col,cnt,*dnz,*onz;
  PetscInt               istart,iend,jstart,jend,ii,jj;
  MPI_Comm               comm;
  PetscScalar            *values;
  DMDABoundaryType       bx,by;
1152aa219208SBarry Smith DMDAStencilType st; 115347c6ae99SBarry Smith ISLocalToGlobalMapping ltog,ltogb; 115447c6ae99SBarry Smith 115547c6ae99SBarry Smith PetscFunctionBegin; 115647c6ae99SBarry Smith /* 115747c6ae99SBarry Smith nc - number of components per grid point 115847c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 115947c6ae99SBarry Smith */ 11601321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,0,0,0,0,&nc,&s,&bx,&by,0,&st);CHKERRQ(ierr); 116147c6ae99SBarry Smith col = 2*s + 1; 116247c6ae99SBarry Smith 1163aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr); 1164aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr); 116547c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 116647c6ae99SBarry Smith 116747c6ae99SBarry Smith ierr = PetscMalloc(col*col*nc*nc*sizeof(PetscInt),&cols);CHKERRQ(ierr); 116847c6ae99SBarry Smith 11691411c6eeSJed Brown ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 11701411c6eeSJed Brown ierr = DMGetLocalToGlobalMappingBlock(da,<ogb);CHKERRQ(ierr); 117147c6ae99SBarry Smith 117247c6ae99SBarry Smith /* determine the matrix preallocation information */ 117347c6ae99SBarry Smith ierr = MatPreallocateInitialize(comm,nx*ny,nx*ny,dnz,onz);CHKERRQ(ierr); 117447c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 11751321219cSEthan Coon istart = (bx == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 11761321219cSEthan Coon iend = (bx == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 117747c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 11781321219cSEthan Coon jstart = (by == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 11791321219cSEthan Coon jend = (by == DMDA_BOUNDARY_PERIODIC) ? 
s : (PetscMin(s,n-j-1)); 118047c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys); 118147c6ae99SBarry Smith 118247c6ae99SBarry Smith /* Find block columns in block row */ 118347c6ae99SBarry Smith cnt = 0; 118447c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 118547c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 1186aa219208SBarry Smith if (st == DMDA_STENCIL_BOX || !ii || !jj) { /* BOX or on the STAR */ 118747c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj; 118847c6ae99SBarry Smith } 118947c6ae99SBarry Smith } 119047c6ae99SBarry Smith } 1191784ac674SJed Brown ierr = MatPreallocateSetLocal(ltogb,1,&slot,ltogb,cnt,cols,dnz,onz);CHKERRQ(ierr); 119247c6ae99SBarry Smith } 119347c6ae99SBarry Smith } 119447c6ae99SBarry Smith ierr = MatSeqBAIJSetPreallocation(J,nc,0,dnz);CHKERRQ(ierr); 119547c6ae99SBarry Smith ierr = MatMPIBAIJSetPreallocation(J,nc,0,dnz,0,onz);CHKERRQ(ierr); 119647c6ae99SBarry Smith ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 119747c6ae99SBarry Smith 1198784ac674SJed Brown ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 1199784ac674SJed Brown ierr = MatSetLocalToGlobalMappingBlock(J,ltogb,ltogb);CHKERRQ(ierr); 120047c6ae99SBarry Smith 120147c6ae99SBarry Smith /* 120247c6ae99SBarry Smith For each node in the grid: we get the neighbors in the local (on processor ordering 120347c6ae99SBarry Smith that includes the ghost points) then MatSetValuesLocal() maps those indices to the global 120447c6ae99SBarry Smith PETSc ordering. 120547c6ae99SBarry Smith */ 1206fcfd50ebSBarry Smith if (!da->prealloc_only) { 120747c6ae99SBarry Smith ierr = PetscMalloc(col*col*nc*nc*sizeof(PetscScalar),&values);CHKERRQ(ierr); 120847c6ae99SBarry Smith ierr = PetscMemzero(values,col*col*nc*nc*sizeof(PetscScalar));CHKERRQ(ierr); 120947c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 12101321219cSEthan Coon istart = (bx == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 12111321219cSEthan Coon iend = (bx == DMDA_BOUNDARY_PERIODIC) ? 
s : (PetscMin(s,m-i-1)); 121247c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 12131321219cSEthan Coon jstart = (by == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 12141321219cSEthan Coon jend = (by == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 121547c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys); 121647c6ae99SBarry Smith cnt = 0; 121747c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 121847c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 1219aa219208SBarry Smith if (st == DMDA_STENCIL_BOX || !ii || !jj) { /* BOX or on the STAR */ 122047c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj; 122147c6ae99SBarry Smith } 122247c6ae99SBarry Smith } 122347c6ae99SBarry Smith } 122447c6ae99SBarry Smith ierr = MatSetValuesBlockedLocal(J,1,&slot,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 122547c6ae99SBarry Smith } 122647c6ae99SBarry Smith } 122747c6ae99SBarry Smith ierr = PetscFree(values);CHKERRQ(ierr); 122847c6ae99SBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 122947c6ae99SBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 123047c6ae99SBarry Smith } 123147c6ae99SBarry Smith ierr = PetscFree(cols);CHKERRQ(ierr); 123247c6ae99SBarry Smith PetscFunctionReturn(0); 123347c6ae99SBarry Smith } 123447c6ae99SBarry Smith 123547c6ae99SBarry Smith #undef __FUNCT__ 123694013140SBarry Smith #define __FUNCT__ "DMGetMatrix_DA_3d_MPIBAIJ" 123794013140SBarry Smith PetscErrorCode DMGetMatrix_DA_3d_MPIBAIJ(DM da,Mat J) 123847c6ae99SBarry Smith { 123947c6ae99SBarry Smith PetscErrorCode ierr; 124047c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny; 124147c6ae99SBarry Smith PetscInt m,n,dim,s,*cols,k,nc,col,cnt,p,*dnz,*onz; 124247c6ae99SBarry Smith PetscInt istart,iend,jstart,jend,kstart,kend,zs,nz,gzs,gnz,ii,jj,kk; 124347c6ae99SBarry Smith MPI_Comm comm; 124447c6ae99SBarry Smith PetscScalar *values; 12451321219cSEthan Coon DMDABoundaryType bx,by,bz; 1246aa219208SBarry Smith DMDAStencilType st; 
124747c6ae99SBarry Smith ISLocalToGlobalMapping ltog,ltogb; 124847c6ae99SBarry Smith 124947c6ae99SBarry Smith PetscFunctionBegin; 125047c6ae99SBarry Smith /* 125147c6ae99SBarry Smith nc - number of components per grid point 125247c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 125347c6ae99SBarry Smith 125447c6ae99SBarry Smith */ 12551321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,&p,0,0,0,&nc,&s,&bx,&by,&bz,&st);CHKERRQ(ierr); 125647c6ae99SBarry Smith col = 2*s + 1; 125747c6ae99SBarry Smith 1258aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,&zs,&nx,&ny,&nz);CHKERRQ(ierr); 1259aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,&gzs,&gnx,&gny,&gnz);CHKERRQ(ierr); 126047c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 126147c6ae99SBarry Smith 126247c6ae99SBarry Smith ierr = PetscMalloc(col*col*col*sizeof(PetscInt),&cols);CHKERRQ(ierr); 126347c6ae99SBarry Smith 12641411c6eeSJed Brown ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 12651411c6eeSJed Brown ierr = DMGetLocalToGlobalMappingBlock(da,<ogb);CHKERRQ(ierr); 126647c6ae99SBarry Smith 126747c6ae99SBarry Smith /* determine the matrix preallocation information */ 126847c6ae99SBarry Smith ierr = MatPreallocateInitialize(comm,nx*ny*nz,nx*ny*nz,dnz,onz);CHKERRQ(ierr); 126947c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 12701321219cSEthan Coon istart = (bx == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 12711321219cSEthan Coon iend = (bx == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 127247c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 12731321219cSEthan Coon jstart = (by == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 12741321219cSEthan Coon jend = (by == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 127547c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 12761321219cSEthan Coon kstart = (bz == DMDA_BOUNDARY_PERIODIC) ? 
-s : (PetscMax(-s,-k)); 12771321219cSEthan Coon kend = (bz == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,p-k-1)); 127847c6ae99SBarry Smith 127947c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 128047c6ae99SBarry Smith 128147c6ae99SBarry Smith /* Find block columns in block row */ 128247c6ae99SBarry Smith cnt = 0; 128347c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 128447c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 128547c6ae99SBarry Smith for (kk=kstart; kk<kend+1; kk++) { 1286aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/ 128747c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj + gnx*gny*kk; 128847c6ae99SBarry Smith } 128947c6ae99SBarry Smith } 129047c6ae99SBarry Smith } 129147c6ae99SBarry Smith } 1292784ac674SJed Brown ierr = MatPreallocateSetLocal(ltogb,1,&slot,ltogb,cnt,cols,dnz,onz);CHKERRQ(ierr); 129347c6ae99SBarry Smith } 129447c6ae99SBarry Smith } 129547c6ae99SBarry Smith } 129647c6ae99SBarry Smith ierr = MatSeqBAIJSetPreallocation(J,nc,0,dnz);CHKERRQ(ierr); 129747c6ae99SBarry Smith ierr = MatMPIBAIJSetPreallocation(J,nc,0,dnz,0,onz);CHKERRQ(ierr); 129847c6ae99SBarry Smith ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 129947c6ae99SBarry Smith 1300784ac674SJed Brown ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 1301784ac674SJed Brown ierr = MatSetLocalToGlobalMappingBlock(J,ltogb,ltogb);CHKERRQ(ierr); 130247c6ae99SBarry Smith 130347c6ae99SBarry Smith /* 130447c6ae99SBarry Smith For each node in the grid: we get the neighbors in the local (on processor ordering 130547c6ae99SBarry Smith that includes the ghost points) then MatSetValuesLocal() maps those indices to the global 130647c6ae99SBarry Smith PETSc ordering. 
130747c6ae99SBarry Smith */ 1308fcfd50ebSBarry Smith if (!da->prealloc_only) { 130947c6ae99SBarry Smith ierr = PetscMalloc(col*col*col*nc*nc*sizeof(PetscScalar),&values);CHKERRQ(ierr); 131047c6ae99SBarry Smith ierr = PetscMemzero(values,col*col*col*nc*nc*sizeof(PetscScalar));CHKERRQ(ierr); 131147c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 13121321219cSEthan Coon istart = (bx == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 13131321219cSEthan Coon iend = (bx == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 131447c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 13151321219cSEthan Coon jstart = (by == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 13161321219cSEthan Coon jend = (by == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 131747c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 13181321219cSEthan Coon kstart = (bz == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k)); 13191321219cSEthan Coon kend = (bz == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,p-k-1)); 132047c6ae99SBarry Smith 132147c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 132247c6ae99SBarry Smith 132347c6ae99SBarry Smith cnt = 0; 132447c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 132547c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 132647c6ae99SBarry Smith for (kk=kstart; kk<kend+1; kk++) { 1327aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/ 132847c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj + gnx*gny*kk; 132947c6ae99SBarry Smith } 133047c6ae99SBarry Smith } 133147c6ae99SBarry Smith } 133247c6ae99SBarry Smith } 133347c6ae99SBarry Smith ierr = MatSetValuesBlockedLocal(J,1,&slot,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 133447c6ae99SBarry Smith } 133547c6ae99SBarry Smith } 133647c6ae99SBarry Smith } 133747c6ae99SBarry Smith ierr = PetscFree(values);CHKERRQ(ierr); 133847c6ae99SBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 133947c6ae99SBarry 
Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 134047c6ae99SBarry Smith } 134147c6ae99SBarry Smith ierr = PetscFree(cols);CHKERRQ(ierr); 134247c6ae99SBarry Smith PetscFunctionReturn(0); 134347c6ae99SBarry Smith } 134447c6ae99SBarry Smith 134547c6ae99SBarry Smith #undef __FUNCT__ 134647c6ae99SBarry Smith #define __FUNCT__ "L2GFilterUpperTriangular" 134747c6ae99SBarry Smith /* 134847c6ae99SBarry Smith This helper is for of SBAIJ preallocation, to discard the lower-triangular values which are difficult to 134947c6ae99SBarry Smith identify in the local ordering with periodic domain. 135047c6ae99SBarry Smith */ 135147c6ae99SBarry Smith static PetscErrorCode L2GFilterUpperTriangular(ISLocalToGlobalMapping ltog,PetscInt *row,PetscInt *cnt,PetscInt col[]) 135247c6ae99SBarry Smith { 135347c6ae99SBarry Smith PetscErrorCode ierr; 135447c6ae99SBarry Smith PetscInt i,n; 135547c6ae99SBarry Smith 135647c6ae99SBarry Smith PetscFunctionBegin; 135747c6ae99SBarry Smith ierr = ISLocalToGlobalMappingApply(ltog,1,row,row);CHKERRQ(ierr); 135847c6ae99SBarry Smith ierr = ISLocalToGlobalMappingApply(ltog,*cnt,col,col);CHKERRQ(ierr); 135947c6ae99SBarry Smith for (i=0,n=0; i<*cnt; i++) { 136047c6ae99SBarry Smith if (col[i] >= *row) col[n++] = col[i]; 136147c6ae99SBarry Smith } 136247c6ae99SBarry Smith *cnt = n; 136347c6ae99SBarry Smith PetscFunctionReturn(0); 136447c6ae99SBarry Smith } 136547c6ae99SBarry Smith 136647c6ae99SBarry Smith #undef __FUNCT__ 136794013140SBarry Smith #define __FUNCT__ "DMGetMatrix_DA_2d_MPISBAIJ" 136894013140SBarry Smith PetscErrorCode DMGetMatrix_DA_2d_MPISBAIJ(DM da,Mat J) 136947c6ae99SBarry Smith { 137047c6ae99SBarry Smith PetscErrorCode ierr; 137147c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny; 137247c6ae99SBarry Smith PetscInt m,n,dim,s,*cols,nc,col,cnt,*dnz,*onz; 137347c6ae99SBarry Smith PetscInt istart,iend,jstart,jend,ii,jj; 137447c6ae99SBarry Smith MPI_Comm comm; 137547c6ae99SBarry Smith PetscScalar *values; 
13761321219cSEthan Coon DMDABoundaryType bx,by; 1377aa219208SBarry Smith DMDAStencilType st; 137847c6ae99SBarry Smith ISLocalToGlobalMapping ltog,ltogb; 137947c6ae99SBarry Smith 138047c6ae99SBarry Smith PetscFunctionBegin; 138147c6ae99SBarry Smith /* 138247c6ae99SBarry Smith nc - number of components per grid point 138347c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 138447c6ae99SBarry Smith */ 13851321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,0,0,0,0,&nc,&s,&bx,&by,0,&st);CHKERRQ(ierr); 138647c6ae99SBarry Smith col = 2*s + 1; 138747c6ae99SBarry Smith 1388aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,0,&nx,&ny,0);CHKERRQ(ierr); 1389aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,0,&gnx,&gny,0);CHKERRQ(ierr); 139047c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 139147c6ae99SBarry Smith 139247c6ae99SBarry Smith ierr = PetscMalloc(col*col*nc*nc*sizeof(PetscInt),&cols);CHKERRQ(ierr); 139347c6ae99SBarry Smith 13941411c6eeSJed Brown ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 13951411c6eeSJed Brown ierr = DMGetLocalToGlobalMappingBlock(da,<ogb);CHKERRQ(ierr); 139647c6ae99SBarry Smith 139747c6ae99SBarry Smith /* determine the matrix preallocation information */ 139847c6ae99SBarry Smith ierr = MatPreallocateSymmetricInitialize(comm,nx*ny,nx*ny,dnz,onz);CHKERRQ(ierr); 139947c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 14001321219cSEthan Coon istart = (bx == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 14011321219cSEthan Coon iend = (bx == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 140247c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 14031321219cSEthan Coon jstart = (by == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 14041321219cSEthan Coon jend = (by == DMDA_BOUNDARY_PERIODIC) ? 
s : (PetscMin(s,n-j-1)); 140547c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys); 140647c6ae99SBarry Smith 140747c6ae99SBarry Smith /* Find block columns in block row */ 140847c6ae99SBarry Smith cnt = 0; 140947c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 141047c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 1411aa219208SBarry Smith if (st == DMDA_STENCIL_BOX || !ii || !jj) { 141247c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj; 141347c6ae99SBarry Smith } 141447c6ae99SBarry Smith } 141547c6ae99SBarry Smith } 141647c6ae99SBarry Smith ierr = L2GFilterUpperTriangular(ltogb,&slot,&cnt,cols);CHKERRQ(ierr); 141747c6ae99SBarry Smith ierr = MatPreallocateSymmetricSet(slot,cnt,cols,dnz,onz);CHKERRQ(ierr); 141847c6ae99SBarry Smith } 141947c6ae99SBarry Smith } 142047c6ae99SBarry Smith ierr = MatSeqSBAIJSetPreallocation(J,nc,0,dnz);CHKERRQ(ierr); 142147c6ae99SBarry Smith ierr = MatMPISBAIJSetPreallocation(J,nc,0,dnz,0,onz);CHKERRQ(ierr); 142247c6ae99SBarry Smith ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 142347c6ae99SBarry Smith 1424784ac674SJed Brown ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 1425784ac674SJed Brown ierr = MatSetLocalToGlobalMappingBlock(J,ltogb,ltogb);CHKERRQ(ierr); 142647c6ae99SBarry Smith 142747c6ae99SBarry Smith /* 142847c6ae99SBarry Smith For each node in the grid: we get the neighbors in the local (on processor ordering 142947c6ae99SBarry Smith that includes the ghost points) then MatSetValuesLocal() maps those indices to the global 143047c6ae99SBarry Smith PETSc ordering. 143147c6ae99SBarry Smith */ 1432fcfd50ebSBarry Smith if (!da->prealloc_only) { 143347c6ae99SBarry Smith ierr = PetscMalloc(col*col*nc*nc*sizeof(PetscScalar),&values);CHKERRQ(ierr); 143447c6ae99SBarry Smith ierr = PetscMemzero(values,col*col*nc*nc*sizeof(PetscScalar));CHKERRQ(ierr); 143547c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 14361321219cSEthan Coon istart = (bx == DMDA_BOUNDARY_PERIODIC) ? 
-s : (PetscMax(-s,-i)); 14371321219cSEthan Coon iend = (bx == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 143847c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 14391321219cSEthan Coon jstart = (by == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 14401321219cSEthan Coon jend = (by == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 144147c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys); 144247c6ae99SBarry Smith 144347c6ae99SBarry Smith /* Find block columns in block row */ 144447c6ae99SBarry Smith cnt = 0; 144547c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 144647c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 1447aa219208SBarry Smith if (st == DMDA_STENCIL_BOX || !ii || !jj) { 144847c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj; 144947c6ae99SBarry Smith } 145047c6ae99SBarry Smith } 145147c6ae99SBarry Smith } 145247c6ae99SBarry Smith ierr = L2GFilterUpperTriangular(ltogb,&slot,&cnt,cols);CHKERRQ(ierr); 145347c6ae99SBarry Smith ierr = MatSetValuesBlocked(J,1,&slot,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 145447c6ae99SBarry Smith } 145547c6ae99SBarry Smith } 145647c6ae99SBarry Smith ierr = PetscFree(values);CHKERRQ(ierr); 145747c6ae99SBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 145847c6ae99SBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 145947c6ae99SBarry Smith } 146047c6ae99SBarry Smith ierr = PetscFree(cols);CHKERRQ(ierr); 146147c6ae99SBarry Smith PetscFunctionReturn(0); 146247c6ae99SBarry Smith } 146347c6ae99SBarry Smith 146447c6ae99SBarry Smith #undef __FUNCT__ 146594013140SBarry Smith #define __FUNCT__ "DMGetMatrix_DA_3d_MPISBAIJ" 146694013140SBarry Smith PetscErrorCode DMGetMatrix_DA_3d_MPISBAIJ(DM da,Mat J) 146747c6ae99SBarry Smith { 146847c6ae99SBarry Smith PetscErrorCode ierr; 146947c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny; 147047c6ae99SBarry Smith PetscInt m,n,dim,s,*cols,k,nc,col,cnt,p,*dnz,*onz; 147147c6ae99SBarry Smith PetscInt 
istart,iend,jstart,jend,kstart,kend,zs,nz,gzs,gnz,ii,jj,kk; 147247c6ae99SBarry Smith MPI_Comm comm; 147347c6ae99SBarry Smith PetscScalar *values; 14741321219cSEthan Coon DMDABoundaryType bx,by,bz; 1475aa219208SBarry Smith DMDAStencilType st; 147647c6ae99SBarry Smith ISLocalToGlobalMapping ltog,ltogb; 147747c6ae99SBarry Smith 147847c6ae99SBarry Smith PetscFunctionBegin; 147947c6ae99SBarry Smith /* 148047c6ae99SBarry Smith nc - number of components per grid point 148147c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 148247c6ae99SBarry Smith */ 14831321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,&p,0,0,0,&nc,&s,&bx,&by,&bz,&st);CHKERRQ(ierr); 148447c6ae99SBarry Smith col = 2*s + 1; 148547c6ae99SBarry Smith 1486aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,&zs,&nx,&ny,&nz);CHKERRQ(ierr); 1487aa219208SBarry Smith ierr = DMDAGetGhostCorners(da,&gxs,&gys,&gzs,&gnx,&gny,&gnz);CHKERRQ(ierr); 148847c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 148947c6ae99SBarry Smith 149047c6ae99SBarry Smith /* create the matrix */ 149147c6ae99SBarry Smith ierr = PetscMalloc(col*col*col*sizeof(PetscInt),&cols);CHKERRQ(ierr); 149247c6ae99SBarry Smith 14931411c6eeSJed Brown ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 14941411c6eeSJed Brown ierr = DMGetLocalToGlobalMappingBlock(da,<ogb);CHKERRQ(ierr); 149547c6ae99SBarry Smith 149647c6ae99SBarry Smith /* determine the matrix preallocation information */ 149747c6ae99SBarry Smith ierr = MatPreallocateSymmetricInitialize(comm,nx*ny*nz,nx*ny*nz,dnz,onz);CHKERRQ(ierr); 149847c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 14991321219cSEthan Coon istart = (bx == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 15001321219cSEthan Coon iend = (bx == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 150147c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 15021321219cSEthan Coon jstart = (by == DMDA_BOUNDARY_PERIODIC) ? 
-s : (PetscMax(-s,-j)); 15031321219cSEthan Coon jend = (by == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 150447c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 15051321219cSEthan Coon kstart = (bz == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k)); 15061321219cSEthan Coon kend = (bz == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,p-k-1)); 150747c6ae99SBarry Smith 150847c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 150947c6ae99SBarry Smith 151047c6ae99SBarry Smith /* Find block columns in block row */ 151147c6ae99SBarry Smith cnt = 0; 151247c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 151347c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 151447c6ae99SBarry Smith for (kk=kstart; kk<kend+1; kk++) { 1515aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || (!ii && !jj) || (!jj && !kk) || (!ii && !kk)) { 151647c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj + gnx*gny*kk; 151747c6ae99SBarry Smith } 151847c6ae99SBarry Smith } 151947c6ae99SBarry Smith } 152047c6ae99SBarry Smith } 152147c6ae99SBarry Smith ierr = L2GFilterUpperTriangular(ltogb,&slot,&cnt,cols);CHKERRQ(ierr); 152247c6ae99SBarry Smith ierr = MatPreallocateSymmetricSet(slot,cnt,cols,dnz,onz);CHKERRQ(ierr); 152347c6ae99SBarry Smith } 152447c6ae99SBarry Smith } 152547c6ae99SBarry Smith } 152647c6ae99SBarry Smith ierr = MatSeqSBAIJSetPreallocation(J,nc,0,dnz);CHKERRQ(ierr); 152747c6ae99SBarry Smith ierr = MatMPISBAIJSetPreallocation(J,nc,0,dnz,0,onz);CHKERRQ(ierr); 152847c6ae99SBarry Smith ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 152947c6ae99SBarry Smith 1530784ac674SJed Brown ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 1531784ac674SJed Brown ierr = MatSetLocalToGlobalMappingBlock(J,ltogb,ltogb);CHKERRQ(ierr); 153247c6ae99SBarry Smith 153347c6ae99SBarry Smith /* 153447c6ae99SBarry Smith For each node in the grid: we get the neighbors in the local (on processor ordering 153547c6ae99SBarry Smith that includes the ghost points) then 
MatSetValuesLocal() maps those indices to the global 153647c6ae99SBarry Smith PETSc ordering. 153747c6ae99SBarry Smith */ 1538fcfd50ebSBarry Smith if (!da->prealloc_only) { 153947c6ae99SBarry Smith ierr = PetscMalloc(col*col*col*nc*nc*sizeof(PetscScalar),&values);CHKERRQ(ierr); 154047c6ae99SBarry Smith ierr = PetscMemzero(values,col*col*col*nc*nc*sizeof(PetscScalar));CHKERRQ(ierr); 154147c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 15421321219cSEthan Coon istart = (bx == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 15431321219cSEthan Coon iend = (bx == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 154447c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 15451321219cSEthan Coon jstart = (by == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 15461321219cSEthan Coon jend = (by == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 154747c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 15481321219cSEthan Coon kstart = (bz == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k)); 15491321219cSEthan Coon kend = (bz == DMDA_BOUNDARY_PERIODIC) ? 
s : (PetscMin(s,p-k-1)); 155047c6ae99SBarry Smith 155147c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 155247c6ae99SBarry Smith 155347c6ae99SBarry Smith cnt = 0; 155447c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 155547c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 155647c6ae99SBarry Smith for (kk=kstart; kk<kend+1; kk++) { 1557aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || (!ii && !jj) || (!jj && !kk) || (!ii && !kk)) { 155847c6ae99SBarry Smith cols[cnt++] = slot + ii + gnx*jj + gnx*gny*kk; 155947c6ae99SBarry Smith } 156047c6ae99SBarry Smith } 156147c6ae99SBarry Smith } 156247c6ae99SBarry Smith } 156347c6ae99SBarry Smith ierr = L2GFilterUpperTriangular(ltogb,&slot,&cnt,cols);CHKERRQ(ierr); 156447c6ae99SBarry Smith ierr = MatSetValuesBlocked(J,1,&slot,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 156547c6ae99SBarry Smith } 156647c6ae99SBarry Smith } 156747c6ae99SBarry Smith } 156847c6ae99SBarry Smith ierr = PetscFree(values);CHKERRQ(ierr); 156947c6ae99SBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 157047c6ae99SBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 157147c6ae99SBarry Smith } 157247c6ae99SBarry Smith ierr = PetscFree(cols);CHKERRQ(ierr); 157347c6ae99SBarry Smith PetscFunctionReturn(0); 157447c6ae99SBarry Smith } 157547c6ae99SBarry Smith 157647c6ae99SBarry Smith /* ---------------------------------------------------------------------------------*/ 157747c6ae99SBarry Smith 157847c6ae99SBarry Smith #undef __FUNCT__ 157994013140SBarry Smith #define __FUNCT__ "DMGetMatrix_DA_3d_MPIAIJ_Fill" 158094013140SBarry Smith PetscErrorCode DMGetMatrix_DA_3d_MPIAIJ_Fill(DM da,Mat J) 158147c6ae99SBarry Smith { 158247c6ae99SBarry Smith PetscErrorCode ierr; 158347c6ae99SBarry Smith PetscInt xs,ys,nx,ny,i,j,slot,gxs,gys,gnx,gny; 158447c6ae99SBarry Smith PetscInt m,n,dim,s,*cols,k,nc,row,col,cnt,l,p,*dnz,*onz; 158547c6ae99SBarry Smith PetscInt 
istart,iend,jstart,jend,kstart,kend,zs,nz,gzs,gnz,ii,jj,kk; 158647c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 158747c6ae99SBarry Smith PetscInt ifill_col,*dfill = dd->dfill,*ofill = dd->ofill; 158847c6ae99SBarry Smith MPI_Comm comm; 158947c6ae99SBarry Smith PetscScalar *values; 15901321219cSEthan Coon DMDABoundaryType bx,by,bz; 159147c6ae99SBarry Smith ISLocalToGlobalMapping ltog,ltogb; 1592aa219208SBarry Smith DMDAStencilType st; 159347c6ae99SBarry Smith 159447c6ae99SBarry Smith PetscFunctionBegin; 159547c6ae99SBarry Smith /* 159647c6ae99SBarry Smith nc - number of components per grid point 159747c6ae99SBarry Smith col - number of colors needed in one direction for single component problem 159847c6ae99SBarry Smith 159947c6ae99SBarry Smith */ 16001321219cSEthan Coon ierr = DMDAGetInfo(da,&dim,&m,&n,&p,0,0,0,&nc,&s,&bx,&by,&bz,&st);CHKERRQ(ierr); 160147c6ae99SBarry Smith col = 2*s + 1; 16021321219cSEthan Coon if (bx == DMDA_BOUNDARY_PERIODIC && (m % col)){ 160347c6ae99SBarry Smith SETERRQ(((PetscObject)da)->comm,PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in X is divisible\n\ 160447c6ae99SBarry Smith by 2*stencil_width + 1\n"); 160547c6ae99SBarry Smith } 16061321219cSEthan Coon if (by == DMDA_BOUNDARY_PERIODIC && (n % col)){ 160747c6ae99SBarry Smith SETERRQ(((PetscObject)da)->comm,PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Y is divisible\n\ 160847c6ae99SBarry Smith by 2*stencil_width + 1\n"); 160947c6ae99SBarry Smith } 16101321219cSEthan Coon if (bz == DMDA_BOUNDARY_PERIODIC && (p % col)){ 161147c6ae99SBarry Smith SETERRQ(((PetscObject)da)->comm,PETSC_ERR_SUP,"For coloring efficiency ensure number of grid points in Z is divisible\n\ 161247c6ae99SBarry Smith by 2*stencil_width + 1\n"); 161347c6ae99SBarry Smith } 161447c6ae99SBarry Smith 1615aa219208SBarry Smith ierr = DMDAGetCorners(da,&xs,&ys,&zs,&nx,&ny,&nz);CHKERRQ(ierr); 1616aa219208SBarry Smith ierr = 
DMDAGetGhostCorners(da,&gxs,&gys,&gzs,&gnx,&gny,&gnz);CHKERRQ(ierr); 161747c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject)da,&comm);CHKERRQ(ierr); 161847c6ae99SBarry Smith 161947c6ae99SBarry Smith ierr = PetscMalloc(col*col*col*nc*sizeof(PetscInt),&cols);CHKERRQ(ierr); 16201411c6eeSJed Brown ierr = DMGetLocalToGlobalMapping(da,<og);CHKERRQ(ierr); 16211411c6eeSJed Brown ierr = DMGetLocalToGlobalMappingBlock(da,<ogb);CHKERRQ(ierr); 162247c6ae99SBarry Smith 162347c6ae99SBarry Smith /* determine the matrix preallocation information */ 162447c6ae99SBarry Smith ierr = MatPreallocateInitialize(comm,nc*nx*ny*nz,nc*nx*ny*nz,dnz,onz);CHKERRQ(ierr); 162547c6ae99SBarry Smith 162647c6ae99SBarry Smith 162747c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 16281321219cSEthan Coon istart = (bx == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 16291321219cSEthan Coon iend = (bx == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 163047c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 16311321219cSEthan Coon jstart = (by == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 16321321219cSEthan Coon jend = (by == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 163347c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 16341321219cSEthan Coon kstart = (bz == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k)); 16351321219cSEthan Coon kend = (bz == DMDA_BOUNDARY_PERIODIC) ? 
s : (PetscMin(s,p-k-1)); 163647c6ae99SBarry Smith 163747c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 163847c6ae99SBarry Smith 163947c6ae99SBarry Smith for (l=0; l<nc; l++) { 164047c6ae99SBarry Smith cnt = 0; 164147c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 164247c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 164347c6ae99SBarry Smith for (kk=kstart; kk<kend+1; kk++) { 164447c6ae99SBarry Smith if (ii || jj || kk) { 1645aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/ 164647c6ae99SBarry Smith for (ifill_col=ofill[l]; ifill_col<ofill[l+1]; ifill_col++) 164747c6ae99SBarry Smith cols[cnt++] = ofill[ifill_col] + nc*(slot + ii + gnx*jj + gnx*gny*kk); 164847c6ae99SBarry Smith } 164947c6ae99SBarry Smith } else { 165047c6ae99SBarry Smith if (dfill) { 165147c6ae99SBarry Smith for (ifill_col=dfill[l]; ifill_col<dfill[l+1]; ifill_col++) 165247c6ae99SBarry Smith cols[cnt++] = dfill[ifill_col] + nc*(slot + ii + gnx*jj + gnx*gny*kk); 165347c6ae99SBarry Smith } else { 165447c6ae99SBarry Smith for (ifill_col=0; ifill_col<nc; ifill_col++) 165547c6ae99SBarry Smith cols[cnt++] = ifill_col + nc*(slot + ii + gnx*jj + gnx*gny*kk); 165647c6ae99SBarry Smith } 165747c6ae99SBarry Smith } 165847c6ae99SBarry Smith } 165947c6ae99SBarry Smith } 166047c6ae99SBarry Smith } 166147c6ae99SBarry Smith row = l + nc*(slot); 1662784ac674SJed Brown ierr = MatPreallocateSetLocal(ltog,1,&row,ltog,cnt,cols,dnz,onz);CHKERRQ(ierr); 166347c6ae99SBarry Smith } 166447c6ae99SBarry Smith } 166547c6ae99SBarry Smith } 166647c6ae99SBarry Smith } 166747c6ae99SBarry Smith ierr = MatSeqAIJSetPreallocation(J,0,dnz);CHKERRQ(ierr); 166847c6ae99SBarry Smith ierr = MatMPIAIJSetPreallocation(J,0,dnz,0,onz);CHKERRQ(ierr); 166947c6ae99SBarry Smith ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 1670784ac674SJed Brown ierr = MatSetLocalToGlobalMapping(J,ltog,ltog);CHKERRQ(ierr); 1671784ac674SJed Brown ierr = 
MatSetLocalToGlobalMappingBlock(J,ltogb,ltogb);CHKERRQ(ierr); 167247c6ae99SBarry Smith 167347c6ae99SBarry Smith /* 167447c6ae99SBarry Smith For each node in the grid: we get the neighbors in the local (on processor ordering 167547c6ae99SBarry Smith that includes the ghost points) then MatSetValuesLocal() maps those indices to the global 167647c6ae99SBarry Smith PETSc ordering. 167747c6ae99SBarry Smith */ 1678fcfd50ebSBarry Smith if (!da->prealloc_only) { 167947c6ae99SBarry Smith ierr = PetscMalloc(col*col*col*nc*nc*nc*sizeof(PetscScalar),&values);CHKERRQ(ierr); 168047c6ae99SBarry Smith ierr = PetscMemzero(values,col*col*col*nc*nc*nc*sizeof(PetscScalar));CHKERRQ(ierr); 168147c6ae99SBarry Smith for (i=xs; i<xs+nx; i++) { 16821321219cSEthan Coon istart = (bx == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-i)); 16831321219cSEthan Coon iend = (bx == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,m-i-1)); 168447c6ae99SBarry Smith for (j=ys; j<ys+ny; j++) { 16851321219cSEthan Coon jstart = (by == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-j)); 16861321219cSEthan Coon jend = (by == DMDA_BOUNDARY_PERIODIC) ? s : (PetscMin(s,n-j-1)); 168747c6ae99SBarry Smith for (k=zs; k<zs+nz; k++) { 16881321219cSEthan Coon kstart = (bz == DMDA_BOUNDARY_PERIODIC) ? -s : (PetscMax(-s,-k)); 16891321219cSEthan Coon kend = (bz == DMDA_BOUNDARY_PERIODIC) ? 
s : (PetscMin(s,p-k-1)); 169047c6ae99SBarry Smith 169147c6ae99SBarry Smith slot = i - gxs + gnx*(j - gys) + gnx*gny*(k - gzs); 169247c6ae99SBarry Smith 169347c6ae99SBarry Smith for (l=0; l<nc; l++) { 169447c6ae99SBarry Smith cnt = 0; 169547c6ae99SBarry Smith for (ii=istart; ii<iend+1; ii++) { 169647c6ae99SBarry Smith for (jj=jstart; jj<jend+1; jj++) { 169747c6ae99SBarry Smith for (kk=kstart; kk<kend+1; kk++) { 169847c6ae99SBarry Smith if (ii || jj || kk) { 1699aa219208SBarry Smith if ((st == DMDA_STENCIL_BOX) || ((!ii && !jj) || (!jj && !kk) || (!ii && !kk))) {/* entries on star*/ 170047c6ae99SBarry Smith for (ifill_col=ofill[l]; ifill_col<ofill[l+1]; ifill_col++) 170147c6ae99SBarry Smith cols[cnt++] = ofill[ifill_col] + nc*(slot + ii + gnx*jj + gnx*gny*kk); 170247c6ae99SBarry Smith } 170347c6ae99SBarry Smith } else { 170447c6ae99SBarry Smith if (dfill) { 170547c6ae99SBarry Smith for (ifill_col=dfill[l]; ifill_col<dfill[l+1]; ifill_col++) 170647c6ae99SBarry Smith cols[cnt++] = dfill[ifill_col] + nc*(slot + ii + gnx*jj + gnx*gny*kk); 170747c6ae99SBarry Smith } else { 170847c6ae99SBarry Smith for (ifill_col=0; ifill_col<nc; ifill_col++) 170947c6ae99SBarry Smith cols[cnt++] = ifill_col + nc*(slot + ii + gnx*jj + gnx*gny*kk); 171047c6ae99SBarry Smith } 171147c6ae99SBarry Smith } 171247c6ae99SBarry Smith } 171347c6ae99SBarry Smith } 171447c6ae99SBarry Smith } 171547c6ae99SBarry Smith row = l + nc*(slot); 171647c6ae99SBarry Smith ierr = MatSetValuesLocal(J,1,&row,cnt,cols,values,INSERT_VALUES);CHKERRQ(ierr); 171747c6ae99SBarry Smith } 171847c6ae99SBarry Smith } 171947c6ae99SBarry Smith } 172047c6ae99SBarry Smith } 172147c6ae99SBarry Smith ierr = PetscFree(values);CHKERRQ(ierr); 172247c6ae99SBarry Smith ierr = MatAssemblyBegin(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 172347c6ae99SBarry Smith ierr = MatAssemblyEnd(J,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 172447c6ae99SBarry Smith } 172547c6ae99SBarry Smith ierr = PetscFree(cols);CHKERRQ(ierr); 172647c6ae99SBarry Smith 
PetscFunctionReturn(0); 172747c6ae99SBarry Smith } 1728