17d0a6c19SBarry Smith 247c6ae99SBarry Smith /* 347c6ae99SBarry Smith Code for manipulating distributed regular 3d arrays in parallel. 447c6ae99SBarry Smith File created by Peter Mell 7/14/95 547c6ae99SBarry Smith */ 647c6ae99SBarry Smith 7b45d2f2cSJed Brown #include <petsc-private/daimpl.h> /*I "petscdmda.h" I*/ 847c6ae99SBarry Smith 947c6ae99SBarry Smith #undef __FUNCT__ 109a42bb27SBarry Smith #define __FUNCT__ "DMView_DA_3d" 119a42bb27SBarry Smith PetscErrorCode DMView_DA_3d(DM da,PetscViewer viewer) 1247c6ae99SBarry Smith { 1347c6ae99SBarry Smith PetscErrorCode ierr; 1447c6ae99SBarry Smith PetscMPIInt rank; 159a42bb27SBarry Smith PetscBool iascii,isdraw,isbinary; 1647c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 179a42bb27SBarry Smith #if defined(PETSC_HAVE_MATLAB_ENGINE) 189a42bb27SBarry Smith PetscBool ismatlab; 199a42bb27SBarry Smith #endif 2047c6ae99SBarry Smith 2147c6ae99SBarry Smith PetscFunctionBegin; 2247c6ae99SBarry Smith ierr = MPI_Comm_rank(((PetscObject)da)->comm,&rank);CHKERRQ(ierr); 2347c6ae99SBarry Smith 24*251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERASCII,&iascii);CHKERRQ(ierr); 25*251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERDRAW,&isdraw);CHKERRQ(ierr); 26*251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERBINARY,&isbinary);CHKERRQ(ierr); 279a42bb27SBarry Smith #if defined(PETSC_HAVE_MATLAB_ENGINE) 28*251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare((PetscObject)viewer,PETSCVIEWERMATLAB,&ismatlab);CHKERRQ(ierr); 299a42bb27SBarry Smith #endif 3047c6ae99SBarry Smith if (iascii) { 3147c6ae99SBarry Smith PetscViewerFormat format; 3247c6ae99SBarry Smith 337b23a99aSBarry Smith ierr = PetscViewerASCIISynchronizedAllow(viewer,PETSC_TRUE);CHKERRQ(ierr); 3447c6ae99SBarry Smith ierr = PetscViewerGetFormat(viewer, &format);CHKERRQ(ierr); 3547c6ae99SBarry Smith if (format != PETSC_VIEWER_ASCII_VTK && format != 
PETSC_VIEWER_ASCII_VTK_CELL) { 36aa219208SBarry Smith DMDALocalInfo info; 37aa219208SBarry Smith ierr = DMDAGetLocalInfo(da,&info);CHKERRQ(ierr); 3847c6ae99SBarry Smith ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Processor [%d] M %D N %D P %D m %D n %D p %D w %D s %D\n",rank,dd->M,dd->N,dd->P,dd->m,dd->n,dd->p,dd->w,dd->s);CHKERRQ(ierr); 3947c6ae99SBarry Smith ierr = PetscViewerASCIISynchronizedPrintf(viewer,"X range of indices: %D %D, Y range of indices: %D %D, Z range of indices: %D %D\n", 4047c6ae99SBarry Smith info.xs,info.xs+info.xm,info.ys,info.ys+info.ym,info.zs,info.zs+info.zm);CHKERRQ(ierr); 4147c6ae99SBarry Smith #if !defined(PETSC_USE_COMPLEX) 4247c6ae99SBarry Smith if (dd->coordinates) { 4347c6ae99SBarry Smith PetscInt last; 4447c6ae99SBarry Smith const PetscReal *coors; 4547c6ae99SBarry Smith ierr = VecGetArrayRead(dd->coordinates,&coors);CHKERRQ(ierr); 4647c6ae99SBarry Smith ierr = VecGetLocalSize(dd->coordinates,&last);CHKERRQ(ierr); 4747c6ae99SBarry Smith last = last - 3; 4847c6ae99SBarry Smith ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Lower left corner %G %G %G : Upper right %G %G %G\n",coors[0],coors[1],coors[2],coors[last],coors[last+1],coors[last+2]);CHKERRQ(ierr); 4947c6ae99SBarry Smith ierr = VecRestoreArrayRead(dd->coordinates,&coors);CHKERRQ(ierr); 5047c6ae99SBarry Smith } 5147c6ae99SBarry Smith #endif 5247c6ae99SBarry Smith ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 537b23a99aSBarry Smith ierr = PetscViewerASCIISynchronizedAllow(viewer,PETSC_FALSE);CHKERRQ(ierr); 54616157d6SJed Brown } else { 55616157d6SJed Brown ierr = DMView_DA_VTK(da,viewer);CHKERRQ(ierr); 5647c6ae99SBarry Smith } 5747c6ae99SBarry Smith } else if (isdraw) { 5847c6ae99SBarry Smith PetscDraw draw; 5947c6ae99SBarry Smith PetscReal ymin = -1.0,ymax = (PetscReal)dd->N; 6047c6ae99SBarry Smith PetscReal xmin = -1.0,xmax = (PetscReal)((dd->M+2)*dd->P),x,y,ycoord,xcoord; 6147c6ae99SBarry Smith PetscInt k,plane,base,*idx; 6247c6ae99SBarry Smith char node[10]; 
6347c6ae99SBarry Smith PetscBool isnull; 6447c6ae99SBarry Smith 6547c6ae99SBarry Smith ierr = PetscViewerDrawGetDraw(viewer,0,&draw);CHKERRQ(ierr); 6647c6ae99SBarry Smith ierr = PetscDrawIsNull(draw,&isnull);CHKERRQ(ierr); if (isnull) PetscFunctionReturn(0); 6747c6ae99SBarry Smith ierr = PetscDrawSetCoordinates(draw,xmin,ymin,xmax,ymax);CHKERRQ(ierr); 6847c6ae99SBarry Smith ierr = PetscDrawSynchronizedClear(draw);CHKERRQ(ierr); 6947c6ae99SBarry Smith 7047c6ae99SBarry Smith /* first processor draw all node lines */ 7147c6ae99SBarry Smith if (!rank) { 7247c6ae99SBarry Smith for (k=0; k<dd->P; k++) { 7347c6ae99SBarry Smith ymin = 0.0; ymax = (PetscReal)(dd->N - 1); 7447c6ae99SBarry Smith for (xmin=(PetscReal)(k*(dd->M+1)); xmin<(PetscReal)(dd->M+(k*(dd->M+1))); xmin++) { 7547c6ae99SBarry Smith ierr = PetscDrawLine(draw,xmin,ymin,xmin,ymax,PETSC_DRAW_BLACK);CHKERRQ(ierr); 7647c6ae99SBarry Smith } 7747c6ae99SBarry Smith 7847c6ae99SBarry Smith xmin = (PetscReal)(k*(dd->M+1)); xmax = xmin + (PetscReal)(dd->M - 1); 7947c6ae99SBarry Smith for (ymin=0; ymin<(PetscReal)dd->N; ymin++) { 8047c6ae99SBarry Smith ierr = PetscDrawLine(draw,xmin,ymin,xmax,ymin,PETSC_DRAW_BLACK);CHKERRQ(ierr); 8147c6ae99SBarry Smith } 8247c6ae99SBarry Smith } 8347c6ae99SBarry Smith } 8447c6ae99SBarry Smith ierr = PetscDrawSynchronizedFlush(draw);CHKERRQ(ierr); 8547c6ae99SBarry Smith ierr = PetscDrawPause(draw);CHKERRQ(ierr); 8647c6ae99SBarry Smith 8747c6ae99SBarry Smith for (k=0; k<dd->P; k++) { /*Go through and draw for each plane*/ 8847c6ae99SBarry Smith if ((k >= dd->zs) && (k < dd->ze)) { 8947c6ae99SBarry Smith /* draw my box */ 9047c6ae99SBarry Smith ymin = dd->ys; 9147c6ae99SBarry Smith ymax = dd->ye - 1; 9247c6ae99SBarry Smith xmin = dd->xs/dd->w + (dd->M+1)*k; 9347c6ae99SBarry Smith xmax =(dd->xe-1)/dd->w + (dd->M+1)*k; 9447c6ae99SBarry Smith 9547c6ae99SBarry Smith ierr = PetscDrawLine(draw,xmin,ymin,xmax,ymin,PETSC_DRAW_RED);CHKERRQ(ierr); 9647c6ae99SBarry Smith ierr = 
PetscDrawLine(draw,xmin,ymin,xmin,ymax,PETSC_DRAW_RED);CHKERRQ(ierr); 9747c6ae99SBarry Smith ierr = PetscDrawLine(draw,xmin,ymax,xmax,ymax,PETSC_DRAW_RED);CHKERRQ(ierr); 9847c6ae99SBarry Smith ierr = PetscDrawLine(draw,xmax,ymin,xmax,ymax,PETSC_DRAW_RED);CHKERRQ(ierr); 9947c6ae99SBarry Smith 10047c6ae99SBarry Smith xmin = dd->xs/dd->w; 10147c6ae99SBarry Smith xmax =(dd->xe-1)/dd->w; 10247c6ae99SBarry Smith 10347c6ae99SBarry Smith /* put in numbers*/ 10447c6ae99SBarry Smith base = (dd->base+(dd->xe-dd->xs)*(dd->ye-dd->ys)*(k-dd->zs))/dd->w; 10547c6ae99SBarry Smith 10647c6ae99SBarry Smith /* Identify which processor owns the box */ 10747c6ae99SBarry Smith sprintf(node,"%d",rank); 10847c6ae99SBarry Smith ierr = PetscDrawString(draw,xmin+(dd->M+1)*k+.2,ymin+.3,PETSC_DRAW_RED,node);CHKERRQ(ierr); 10947c6ae99SBarry Smith 11047c6ae99SBarry Smith for (y=ymin; y<=ymax; y++) { 11147c6ae99SBarry Smith for (x=xmin+(dd->M+1)*k; x<=xmax+(dd->M+1)*k; x++) { 11247c6ae99SBarry Smith sprintf(node,"%d",(int)base++); 11347c6ae99SBarry Smith ierr = PetscDrawString(draw,x,y,PETSC_DRAW_BLACK,node);CHKERRQ(ierr); 11447c6ae99SBarry Smith } 11547c6ae99SBarry Smith } 11647c6ae99SBarry Smith 11747c6ae99SBarry Smith } 11847c6ae99SBarry Smith } 11947c6ae99SBarry Smith ierr = PetscDrawSynchronizedFlush(draw);CHKERRQ(ierr); 12047c6ae99SBarry Smith ierr = PetscDrawPause(draw);CHKERRQ(ierr); 12147c6ae99SBarry Smith 12247c6ae99SBarry Smith for (k=0-dd->s; k<dd->P+dd->s; k++) { 12347c6ae99SBarry Smith /* Go through and draw for each plane */ 12447c6ae99SBarry Smith if ((k >= dd->Zs) && (k < dd->Ze)) { 12547c6ae99SBarry Smith 12647c6ae99SBarry Smith /* overlay ghost numbers, useful for error checking */ 12747c6ae99SBarry Smith base = (dd->Xe-dd->Xs)*(dd->Ye-dd->Ys)*(k-dd->Zs); idx = dd->idx; 12847c6ae99SBarry Smith plane=k; 12947c6ae99SBarry Smith /* Keep z wrap around points on the dradrawg */ 13047c6ae99SBarry Smith if (k<0) { plane=dd->P+k; } 13147c6ae99SBarry Smith if (k>=dd->P) { plane=k-dd->P; } 
13247c6ae99SBarry Smith ymin = dd->Ys; ymax = dd->Ye; 13347c6ae99SBarry Smith xmin = (dd->M+1)*plane*dd->w; 13447c6ae99SBarry Smith xmax = (dd->M+1)*plane*dd->w+dd->M*dd->w; 13547c6ae99SBarry Smith for (y=ymin; y<ymax; y++) { 13647c6ae99SBarry Smith for (x=xmin+dd->Xs; x<xmin+dd->Xe; x+=dd->w) { 13747c6ae99SBarry Smith sprintf(node,"%d",(int)(idx[base]/dd->w)); 13847c6ae99SBarry Smith ycoord = y; 13947c6ae99SBarry Smith /*Keep y wrap around points on drawing */ 14047c6ae99SBarry Smith if (y<0) { ycoord = dd->N+y; } 14147c6ae99SBarry Smith 14247c6ae99SBarry Smith if (y>=dd->N) { ycoord = y-dd->N; } 14347c6ae99SBarry Smith xcoord = x; /* Keep x wrap points on drawing */ 14447c6ae99SBarry Smith 14547c6ae99SBarry Smith if (x<xmin) { xcoord = xmax - (xmin-x); } 14647c6ae99SBarry Smith if (x>=xmax) { xcoord = xmin + (x-xmax); } 14747c6ae99SBarry Smith ierr = PetscDrawString(draw,xcoord/dd->w,ycoord,PETSC_DRAW_BLUE,node);CHKERRQ(ierr); 14847c6ae99SBarry Smith base+=dd->w; 14947c6ae99SBarry Smith } 15047c6ae99SBarry Smith } 15147c6ae99SBarry Smith } 15247c6ae99SBarry Smith } 15347c6ae99SBarry Smith ierr = PetscDrawSynchronizedFlush(draw);CHKERRQ(ierr); 15447c6ae99SBarry Smith ierr = PetscDrawPause(draw);CHKERRQ(ierr); 1559a42bb27SBarry Smith } else if (isbinary){ 1569a42bb27SBarry Smith ierr = DMView_DA_Binary(da,viewer);CHKERRQ(ierr); 1579a42bb27SBarry Smith #if defined(PETSC_HAVE_MATLAB_ENGINE) 1589a42bb27SBarry Smith } else if (ismatlab) { 1599a42bb27SBarry Smith ierr = DMView_DA_Matlab(da,viewer);CHKERRQ(ierr); 1609a42bb27SBarry Smith #endif 161aa219208SBarry Smith } else SETERRQ1(((PetscObject)da)->comm,PETSC_ERR_SUP,"Viewer type %s not supported for DMDA 1d",((PetscObject)viewer)->type_name); 16247c6ae99SBarry Smith PetscFunctionReturn(0); 16347c6ae99SBarry Smith } 16447c6ae99SBarry Smith 16547c6ae99SBarry Smith #undef __FUNCT__ 1669a42bb27SBarry Smith #define __FUNCT__ "DMSetUp_DA_3D" 1677087cfbeSBarry Smith PetscErrorCode DMSetUp_DA_3D(DM da) 16847c6ae99SBarry 
Smith { 16947c6ae99SBarry Smith DM_DA *dd = (DM_DA*)da->data; 17047c6ae99SBarry Smith const PetscInt M = dd->M; 17147c6ae99SBarry Smith const PetscInt N = dd->N; 17247c6ae99SBarry Smith const PetscInt P = dd->P; 17347c6ae99SBarry Smith PetscInt m = dd->m; 17447c6ae99SBarry Smith PetscInt n = dd->n; 17547c6ae99SBarry Smith PetscInt p = dd->p; 17647c6ae99SBarry Smith const PetscInt dof = dd->w; 17747c6ae99SBarry Smith const PetscInt s = dd->s; 1781321219cSEthan Coon const DMDABoundaryType bx = dd->bx; 1791321219cSEthan Coon const DMDABoundaryType by = dd->by; 1801321219cSEthan Coon const DMDABoundaryType bz = dd->bz; 181aa219208SBarry Smith const DMDAStencilType stencil_type = dd->stencil_type; 18247c6ae99SBarry Smith PetscInt *lx = dd->lx; 18347c6ae99SBarry Smith PetscInt *ly = dd->ly; 18447c6ae99SBarry Smith PetscInt *lz = dd->lz; 18547c6ae99SBarry Smith MPI_Comm comm; 18647c6ae99SBarry Smith PetscMPIInt rank,size; 187ce00eea3SSatish Balay PetscInt xs = 0,xe,ys = 0,ye,zs = 0,ze,x = 0,y = 0,z = 0; 188ce00eea3SSatish Balay PetscInt Xs,Xe,Ys,Ye,Zs,Ze,IXs,IXe,IYs,IYe,IZs,IZe,start,end,pm; 189ce00eea3SSatish Balay PetscInt left,right,up,down,bottom,top,i,j,k,*idx,*idx_cpy,nn; 190ce00eea3SSatish Balay const PetscInt *idx_full; 19147c6ae99SBarry Smith PetscInt n0,n1,n2,n3,n4,n5,n6,n7,n8,n9,n10,n11,n12,n14; 19247c6ae99SBarry Smith PetscInt n15,n16,n17,n18,n19,n20,n21,n22,n23,n24,n25,n26; 193db87c5ecSEthan Coon PetscInt *bases,*ldims,base,x_t,y_t,z_t,s_t,count,s_x,s_y,s_z; 19447c6ae99SBarry Smith PetscInt sn0 = 0,sn1 = 0,sn2 = 0,sn3 = 0,sn5 = 0,sn6 = 0,sn7 = 0; 19547c6ae99SBarry Smith PetscInt sn8 = 0,sn9 = 0,sn11 = 0,sn15 = 0,sn24 = 0,sn25 = 0,sn26 = 0; 19647c6ae99SBarry Smith PetscInt sn17 = 0,sn18 = 0,sn19 = 0,sn20 = 0,sn21 = 0,sn23 = 0; 19747c6ae99SBarry Smith Vec local,global; 19847c6ae99SBarry Smith VecScatter ltog,gtol; 199ce00eea3SSatish Balay IS to,from,ltogis; 2006f951b95Secoon PetscBool twod; 20147c6ae99SBarry Smith PetscErrorCode ierr; 20247c6ae99SBarry Smith 
2036f951b95Secoon 20447c6ae99SBarry Smith PetscFunctionBegin; 20547c6ae99SBarry Smith if (dof < 1) SETERRQ1(((PetscObject)da)->comm,PETSC_ERR_ARG_OUTOFRANGE,"Must have 1 or more degrees of freedom per node: %D",dof); 20647c6ae99SBarry Smith if (s < 0) SETERRQ1(((PetscObject)da)->comm,PETSC_ERR_ARG_OUTOFRANGE,"Stencil width cannot be negative: %D",s); 20747c6ae99SBarry Smith ierr = PetscObjectGetComm((PetscObject) da, &comm);CHKERRQ(ierr); 2083855c12bSBarry Smith #if !defined(PETSC_USE_64BIT_INDICES) 2093855c12bSBarry Smith if (((Petsc64bitInt) M)*((Petsc64bitInt) N)*((Petsc64bitInt) P)*((Petsc64bitInt) dof) > (Petsc64bitInt) PETSC_MPI_INT_MAX) SETERRQ3(comm,PETSC_ERR_INT_OVERFLOW,"Mesh of %D by %D by %D (dof) is too large for 32 bit indices",M,N,dof); 2103855c12bSBarry Smith #endif 2113855c12bSBarry Smith 21247c6ae99SBarry Smith ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 21347c6ae99SBarry Smith ierr = MPI_Comm_rank(comm,&rank);CHKERRQ(ierr); 21447c6ae99SBarry Smith 21547c6ae99SBarry Smith dd->dim = 3; 21647c6ae99SBarry Smith ierr = PetscMalloc(dof*sizeof(char*),&dd->fieldname);CHKERRQ(ierr); 21747c6ae99SBarry Smith ierr = PetscMemzero(dd->fieldname,dof*sizeof(char*));CHKERRQ(ierr); 21847c6ae99SBarry Smith 21947c6ae99SBarry Smith if (m != PETSC_DECIDE) { 22047c6ae99SBarry Smith if (m < 1) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Non-positive number of processors in X direction: %D",m); 22147c6ae99SBarry Smith else if (m > size) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Too many processors in X direction: %D %d",m,size); 22247c6ae99SBarry Smith } 22347c6ae99SBarry Smith if (n != PETSC_DECIDE) { 22447c6ae99SBarry Smith if (n < 1) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Non-positive number of processors in Y direction: %D",n); 22547c6ae99SBarry Smith else if (n > size) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Too many processors in Y direction: %D %d",n,size); 22647c6ae99SBarry Smith } 22747c6ae99SBarry Smith if (p != 
PETSC_DECIDE) { 22847c6ae99SBarry Smith if (p < 1) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Non-positive number of processors in Z direction: %D",p); 22947c6ae99SBarry Smith else if (p > size) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Too many processors in Z direction: %D %d",p,size); 23047c6ae99SBarry Smith } 2310716a85fSBarry Smith if ((m > 0) && (n > 0) && (p > 0) && (m*n*p != size)) SETERRQ4(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"m %D * n %D * p %D != size %d",m,n,p,size); 23247c6ae99SBarry Smith 23347c6ae99SBarry Smith /* Partition the array among the processors */ 23447c6ae99SBarry Smith if (m == PETSC_DECIDE && n != PETSC_DECIDE && p != PETSC_DECIDE) { 23547c6ae99SBarry Smith m = size/(n*p); 23647c6ae99SBarry Smith } else if (m != PETSC_DECIDE && n == PETSC_DECIDE && p != PETSC_DECIDE) { 23747c6ae99SBarry Smith n = size/(m*p); 23847c6ae99SBarry Smith } else if (m != PETSC_DECIDE && n != PETSC_DECIDE && p == PETSC_DECIDE) { 23947c6ae99SBarry Smith p = size/(m*n); 24047c6ae99SBarry Smith } else if (m == PETSC_DECIDE && n == PETSC_DECIDE && p != PETSC_DECIDE) { 24147c6ae99SBarry Smith /* try for squarish distribution */ 2428f1a2a5eSBarry Smith m = (int)(0.5 + sqrt(((double)M)*((double)size)/((double)N*p))); 24347c6ae99SBarry Smith if (!m) m = 1; 24447c6ae99SBarry Smith while (m > 0) { 24547c6ae99SBarry Smith n = size/(m*p); 24647c6ae99SBarry Smith if (m*n*p == size) break; 24747c6ae99SBarry Smith m--; 24847c6ae99SBarry Smith } 24947c6ae99SBarry Smith if (!m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"bad p value: p = %D",p); 25047c6ae99SBarry Smith if (M > N && m < n) {PetscInt _m = m; m = n; n = _m;} 25147c6ae99SBarry Smith } else if (m == PETSC_DECIDE && n != PETSC_DECIDE && p == PETSC_DECIDE) { 25247c6ae99SBarry Smith /* try for squarish distribution */ 2538f1a2a5eSBarry Smith m = (int)(0.5 + sqrt(((double)M)*((double)size)/((double)P*n))); 25447c6ae99SBarry Smith if (!m) m = 1; 25547c6ae99SBarry Smith while (m > 0) { 
25647c6ae99SBarry Smith p = size/(m*n); 25747c6ae99SBarry Smith if (m*n*p == size) break; 25847c6ae99SBarry Smith m--; 25947c6ae99SBarry Smith } 26047c6ae99SBarry Smith if (!m) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"bad n value: n = %D",n); 26147c6ae99SBarry Smith if (M > P && m < p) {PetscInt _m = m; m = p; p = _m;} 26247c6ae99SBarry Smith } else if (m != PETSC_DECIDE && n == PETSC_DECIDE && p == PETSC_DECIDE) { 26347c6ae99SBarry Smith /* try for squarish distribution */ 2648f1a2a5eSBarry Smith n = (int)(0.5 + sqrt(((double)N)*((double)size)/((double)P*m))); 26547c6ae99SBarry Smith if (!n) n = 1; 26647c6ae99SBarry Smith while (n > 0) { 26747c6ae99SBarry Smith p = size/(m*n); 26847c6ae99SBarry Smith if (m*n*p == size) break; 26947c6ae99SBarry Smith n--; 27047c6ae99SBarry Smith } 27147c6ae99SBarry Smith if (!n) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"bad m value: m = %D",n); 27247c6ae99SBarry Smith if (N > P && n < p) {PetscInt _n = n; n = p; p = _n;} 27347c6ae99SBarry Smith } else if (m == PETSC_DECIDE && n == PETSC_DECIDE && p == PETSC_DECIDE) { 27447c6ae99SBarry Smith /* try for squarish distribution */ 2758f1a2a5eSBarry Smith n = (PetscInt)(0.5 + pow(((double)N*N)*((double)size)/((double)P*M),(double)(1./3.))); 27647c6ae99SBarry Smith if (!n) n = 1; 27747c6ae99SBarry Smith while (n > 0) { 27847c6ae99SBarry Smith pm = size/n; 27947c6ae99SBarry Smith if (n*pm == size) break; 28047c6ae99SBarry Smith n--; 28147c6ae99SBarry Smith } 28247c6ae99SBarry Smith if (!n) n = 1; 2838f1a2a5eSBarry Smith m = (PetscInt)(0.5 + sqrt(((double)M)*((double)size)/((double)P*n))); 28447c6ae99SBarry Smith if (!m) m = 1; 28547c6ae99SBarry Smith while (m > 0) { 28647c6ae99SBarry Smith p = size/(m*n); 28747c6ae99SBarry Smith if (m*n*p == size) break; 28847c6ae99SBarry Smith m--; 28947c6ae99SBarry Smith } 29047c6ae99SBarry Smith if (M > P && m < p) {PetscInt _m = m; m = p; p = _m;} 29147c6ae99SBarry Smith } else if (m*n*p != size) 
SETERRQ(((PetscObject)da)->comm,PETSC_ERR_ARG_OUTOFRANGE,"Given Bad partition"); 29247c6ae99SBarry Smith 29347c6ae99SBarry Smith if (m*n*p != size) SETERRQ(((PetscObject)da)->comm,PETSC_ERR_PLIB,"Could not find good partition"); 29447c6ae99SBarry Smith if (M < m) SETERRQ2(((PetscObject)da)->comm,PETSC_ERR_ARG_OUTOFRANGE,"Partition in x direction is too fine! %D %D",M,m); 29547c6ae99SBarry Smith if (N < n) SETERRQ2(((PetscObject)da)->comm,PETSC_ERR_ARG_OUTOFRANGE,"Partition in y direction is too fine! %D %D",N,n); 29647c6ae99SBarry Smith if (P < p) SETERRQ2(((PetscObject)da)->comm,PETSC_ERR_ARG_OUTOFRANGE,"Partition in z direction is too fine! %D %D",P,p); 29747c6ae99SBarry Smith 29847c6ae99SBarry Smith /* 29947c6ae99SBarry Smith Determine locally owned region 30047c6ae99SBarry Smith [x, y, or z]s is the first local node number, [x, y, z] is the number of local nodes 30147c6ae99SBarry Smith */ 30247c6ae99SBarry Smith 30347c6ae99SBarry Smith if (!lx) { 30447c6ae99SBarry Smith ierr = PetscMalloc(m*sizeof(PetscInt), &dd->lx);CHKERRQ(ierr); 30547c6ae99SBarry Smith lx = dd->lx; 30647c6ae99SBarry Smith for (i=0; i<m; i++) { 30747c6ae99SBarry Smith lx[i] = M/m + ((M % m) > (i % m)); 30847c6ae99SBarry Smith } 30947c6ae99SBarry Smith } 31047c6ae99SBarry Smith x = lx[rank % m]; 31147c6ae99SBarry Smith xs = 0; 31247c6ae99SBarry Smith for (i=0; i<(rank%m); i++) { xs += lx[i];} 31330729d88SBarry Smith if ((x < s) && ((m > 1) || (bx == DMDA_BOUNDARY_PERIODIC))) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Local x-width of domain x %D is smaller than stencil width s %D",x,s); 31447c6ae99SBarry Smith 31547c6ae99SBarry Smith if (!ly) { 31647c6ae99SBarry Smith ierr = PetscMalloc(n*sizeof(PetscInt), &dd->ly);CHKERRQ(ierr); 31747c6ae99SBarry Smith ly = dd->ly; 31847c6ae99SBarry Smith for (i=0; i<n; i++) { 31947c6ae99SBarry Smith ly[i] = N/n + ((N % n) > (i % n)); 32047c6ae99SBarry Smith } 32147c6ae99SBarry Smith } 32247c6ae99SBarry Smith y = ly[(rank % (m*n))/m]; 
32330729d88SBarry Smith if ((y < s) && ((n > 1) || (by == DMDA_BOUNDARY_PERIODIC))) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Local y-width of domain y %D is smaller than stencil width s %D",y,s); 32430729d88SBarry Smith 32547c6ae99SBarry Smith ys = 0; 32647c6ae99SBarry Smith for (i=0; i<(rank % (m*n))/m; i++) { ys += ly[i];} 32747c6ae99SBarry Smith 32847c6ae99SBarry Smith if (!lz) { 32947c6ae99SBarry Smith ierr = PetscMalloc(p*sizeof(PetscInt), &dd->lz);CHKERRQ(ierr); 33047c6ae99SBarry Smith lz = dd->lz; 33147c6ae99SBarry Smith for (i=0; i<p; i++) { 33247c6ae99SBarry Smith lz[i] = P/p + ((P % p) > (i % p)); 33347c6ae99SBarry Smith } 33447c6ae99SBarry Smith } 33547c6ae99SBarry Smith z = lz[rank/(m*n)]; 336bcea557cSEthan Coon 337fdc81ce8SEthan Coon /* note this is different than x- and y-, as we will handle as an important special 338fdc81ce8SEthan Coon case when p=P=1 and DMDA_BOUNDARY_PERIODIC and s > z. This is to deal with 2D problems 339fdc81ce8SEthan Coon in a 3D code. Additional code for this case is noted with "2d case" comments */ 3406f951b95Secoon twod = PETSC_FALSE; 3416f951b95Secoon if (P == 1) { 3426f951b95Secoon twod = PETSC_TRUE; 34330729d88SBarry Smith } else if ((z < s) && ((p > 1) || (bz == DMDA_BOUNDARY_PERIODIC))) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_OUTOFRANGE,"Local z-width of domain z %D is smaller than stencil width s %D",z,s); 34447c6ae99SBarry Smith zs = 0; 34547c6ae99SBarry Smith for (i=0; i<(rank/(m*n)); i++) { zs += lz[i];} 34647c6ae99SBarry Smith ye = ys + y; 34747c6ae99SBarry Smith xe = xs + x; 34847c6ae99SBarry Smith ze = zs + z; 34947c6ae99SBarry Smith 35047c6ae99SBarry Smith /* determine ghost region */ 35147c6ae99SBarry Smith /* Assume No Periodicity */ 352ce00eea3SSatish Balay if (xs-s > 0) { Xs = xs - s; IXs = xs - s; } else { Xs = 0; IXs = 0; } 353ce00eea3SSatish Balay if (xe+s <= M) { Xe = xe + s; IXe = xe + s; } else { Xe = M; IXe = M; } 354ce00eea3SSatish Balay if (ys-s > 0) { Ys = ys - s; IYs = ys - s; } else { Ys 
= 0; IYs = 0; } 355ce00eea3SSatish Balay if (ye+s <= N) { Ye = ye + s; IYe = ye + s; } else { Ye = N; IYe = N; } 356ce00eea3SSatish Balay if (zs-s > 0) { Zs = zs - s; IZs = zs - s; } else { Zs = 0; IZs = 0; } 357ce00eea3SSatish Balay if (ze+s <= P) { Ze = ze + s; IZe = ze + s; } else { Ze = P; IZe = P; } 35847c6ae99SBarry Smith 359ce00eea3SSatish Balay /* fix for periodicity/ghosted */ 3601321219cSEthan Coon if (bx) { Xs = xs - s; Xe = xe + s; } 3611321219cSEthan Coon if (bx == DMDA_BOUNDARY_PERIODIC) { IXs = xs - s; IXe = xe + s; } 3621321219cSEthan Coon if (by) { Ys = ys - s; Ye = ye + s; } 3631321219cSEthan Coon if (by == DMDA_BOUNDARY_PERIODIC) { IYs = ys - s; IYe = ye + s; } 3641321219cSEthan Coon if (bz) { Zs = zs - s; Ze = ze + s; } 3651321219cSEthan Coon if (bz == DMDA_BOUNDARY_PERIODIC) { IZs = zs - s; IZe = ze + s; } 36647c6ae99SBarry Smith 36747c6ae99SBarry Smith /* Resize all X parameters to reflect w */ 368ce00eea3SSatish Balay s_x = s; 36947c6ae99SBarry Smith s_y = s; 37047c6ae99SBarry Smith s_z = s; 37147c6ae99SBarry Smith 37247c6ae99SBarry Smith /* determine starting point of each processor */ 37347c6ae99SBarry Smith nn = x*y*z; 37447c6ae99SBarry Smith ierr = PetscMalloc2(size+1,PetscInt,&bases,size,PetscInt,&ldims);CHKERRQ(ierr); 37547c6ae99SBarry Smith ierr = MPI_Allgather(&nn,1,MPIU_INT,ldims,1,MPIU_INT,comm);CHKERRQ(ierr); 37647c6ae99SBarry Smith bases[0] = 0; 37747c6ae99SBarry Smith for (i=1; i<=size; i++) { 37847c6ae99SBarry Smith bases[i] = ldims[i-1]; 37947c6ae99SBarry Smith } 38047c6ae99SBarry Smith for (i=1; i<=size; i++) { 38147c6ae99SBarry Smith bases[i] += bases[i-1]; 38247c6ae99SBarry Smith } 383ce00eea3SSatish Balay base = bases[rank]*dof; 38447c6ae99SBarry Smith 38547c6ae99SBarry Smith /* allocate the base parallel and sequential vectors */ 386ce00eea3SSatish Balay dd->Nlocal = x*y*z*dof; 387778a2246SBarry Smith ierr = VecCreateMPIWithArray(comm,dof,dd->Nlocal,PETSC_DECIDE,0,&global);CHKERRQ(ierr); 388ce00eea3SSatish Balay dd->nlocal 
= (Xe-Xs)*(Ye-Ys)*(Ze-Zs)*dof; 389778a2246SBarry Smith ierr = VecCreateSeqWithArray(PETSC_COMM_SELF,dof,dd->nlocal,0,&local);CHKERRQ(ierr); 39047c6ae99SBarry Smith 39147c6ae99SBarry Smith /* generate appropriate vector scatters */ 39247c6ae99SBarry Smith /* local to global inserts non-ghost point region into global */ 39347c6ae99SBarry Smith ierr = VecGetOwnershipRange(global,&start,&end);CHKERRQ(ierr); 394ce00eea3SSatish Balay ierr = ISCreateStride(comm,x*y*z*dof,start,1,&to);CHKERRQ(ierr); 39547c6ae99SBarry Smith 396db87c5ecSEthan Coon count = x*y*z; 397ce00eea3SSatish Balay ierr = PetscMalloc(x*y*z*sizeof(PetscInt),&idx);CHKERRQ(ierr); 398ce00eea3SSatish Balay left = xs - Xs; right = left + x; 39947c6ae99SBarry Smith bottom = ys - Ys; top = bottom + y; 40047c6ae99SBarry Smith down = zs - Zs; up = down + z; 40147c6ae99SBarry Smith count = 0; 40247c6ae99SBarry Smith for (i=down; i<up; i++) { 40347c6ae99SBarry Smith for (j=bottom; j<top; j++) { 404ce00eea3SSatish Balay for (k=left; k<right; k++) { 405ce00eea3SSatish Balay idx[count++] = (i*(Ye-Ys) + j)*(Xe-Xs) + k; 40647c6ae99SBarry Smith } 40747c6ae99SBarry Smith } 40847c6ae99SBarry Smith } 40947c6ae99SBarry Smith 41047c6ae99SBarry Smith ierr = ISCreateBlock(comm,dof,count,idx,PETSC_OWN_POINTER,&from);CHKERRQ(ierr); 41147c6ae99SBarry Smith ierr = VecScatterCreate(local,from,global,to,<og);CHKERRQ(ierr); 41247c6ae99SBarry Smith ierr = PetscLogObjectParent(da,ltog);CHKERRQ(ierr); 413fcfd50ebSBarry Smith ierr = ISDestroy(&from);CHKERRQ(ierr); 414fcfd50ebSBarry Smith ierr = ISDestroy(&to);CHKERRQ(ierr); 41547c6ae99SBarry Smith 416ce00eea3SSatish Balay /* global to local must include ghost points within the domain, 417ce00eea3SSatish Balay but not ghost points outside the domain that aren't periodic */ 418aa219208SBarry Smith if (stencil_type == DMDA_STENCIL_BOX) { 419db87c5ecSEthan Coon count = (IXe-IXs)*(IYe-IYs)*(IZe-IZs); 420db87c5ecSEthan Coon ierr = PetscMalloc(count*sizeof(PetscInt),&idx);CHKERRQ(ierr); 
421ce00eea3SSatish Balay 422ce00eea3SSatish Balay left = IXs - Xs; right = left + (IXe-IXs); 423ce00eea3SSatish Balay bottom = IYs - Ys; top = bottom + (IYe-IYs); 424ce00eea3SSatish Balay down = IZs - Zs; up = down + (IZe-IZs); 425ce00eea3SSatish Balay count = 0; 426ce00eea3SSatish Balay for (i=down; i<up; i++) { 427ce00eea3SSatish Balay for (j=bottom; j<top; j++) { 428ce00eea3SSatish Balay for (k=left; k<right; k++) { 429ce00eea3SSatish Balay idx[count++] = (i*(Ye-Ys) + j)*(Xe-Xs) + k; 430ce00eea3SSatish Balay } 431ce00eea3SSatish Balay } 432ce00eea3SSatish Balay } 433ce00eea3SSatish Balay ierr = ISCreateBlock(comm,dof,count,idx,PETSC_OWN_POINTER,&to);CHKERRQ(ierr); 434ce00eea3SSatish Balay 43547c6ae99SBarry Smith } else { 43647c6ae99SBarry Smith /* This is way ugly! We need to list the funny cross type region */ 437db87c5ecSEthan Coon count = ((ys-IYs) + (IYe-ye))*x*z + ((xs-IXs) + (IXe-xe))*y*z + ((zs-IZs) + (IZe-ze))*x*y + x*y*z; 438db87c5ecSEthan Coon ierr = PetscMalloc(count*sizeof(PetscInt),&idx);CHKERRQ(ierr); 439ce00eea3SSatish Balay 440ce00eea3SSatish Balay left = xs - Xs; right = left + x; 44147c6ae99SBarry Smith bottom = ys - Ys; top = bottom + y; 44247c6ae99SBarry Smith down = zs - Zs; up = down + z; 44347c6ae99SBarry Smith count = 0; 444ce00eea3SSatish Balay /* the bottom chunck */ 445ce00eea3SSatish Balay for (i=(IZs-Zs); i<down; i++) { 44647c6ae99SBarry Smith for (j=bottom; j<top; j++) { 447ce00eea3SSatish Balay for (k=left; k<right; k++) idx[count++] = (i*(Ye-Ys) + j)*(Xe-Xs) + k; 44847c6ae99SBarry Smith } 44947c6ae99SBarry Smith } 45047c6ae99SBarry Smith /* the middle piece */ 45147c6ae99SBarry Smith for (i=down; i<up; i++) { 45247c6ae99SBarry Smith /* front */ 453ce00eea3SSatish Balay for (j=(IYs-Ys); j<bottom; j++) { 454ce00eea3SSatish Balay for (k=left; k<right; k++) idx[count++] = (i*(Ye-Ys) + j)*(Xe-Xs) + k; 45547c6ae99SBarry Smith } 45647c6ae99SBarry Smith /* middle */ 45747c6ae99SBarry Smith for (j=bottom; j<top; j++) { 458ce00eea3SSatish 
Balay for (k=IXs-Xs; k<IXe-Xs; k++) idx[count++] = (i*(Ye-Ys) + j)*(Xe-Xs) + k; 45947c6ae99SBarry Smith } 46047c6ae99SBarry Smith /* back */ 461ce00eea3SSatish Balay for (j=top; j<top+IYe-ye; j++) { 462ce00eea3SSatish Balay for (k=left; k<right; k++) idx[count++] = (i*(Ye-Ys) + j)*(Xe-Xs) + k; 46347c6ae99SBarry Smith } 46447c6ae99SBarry Smith } 46547c6ae99SBarry Smith /* the top piece */ 466ce00eea3SSatish Balay for (i=up; i<up+IZe-ze; i++) { 46747c6ae99SBarry Smith for (j=bottom; j<top; j++) { 468ce00eea3SSatish Balay for (k=left; k<right; k++) idx[count++] = (i*(Ye-Ys) + j)*(Xe-Xs) + k; 46947c6ae99SBarry Smith } 47047c6ae99SBarry Smith } 47147c6ae99SBarry Smith ierr = ISCreateBlock(comm,dof,count,idx,PETSC_OWN_POINTER,&to);CHKERRQ(ierr); 47247c6ae99SBarry Smith } 47347c6ae99SBarry Smith 47447c6ae99SBarry Smith /* determine who lies on each side of use stored in n24 n25 n26 47547c6ae99SBarry Smith n21 n22 n23 47647c6ae99SBarry Smith n18 n19 n20 47747c6ae99SBarry Smith 47847c6ae99SBarry Smith n15 n16 n17 47947c6ae99SBarry Smith n12 n14 48047c6ae99SBarry Smith n9 n10 n11 48147c6ae99SBarry Smith 48247c6ae99SBarry Smith n6 n7 n8 48347c6ae99SBarry Smith n3 n4 n5 48447c6ae99SBarry Smith n0 n1 n2 48547c6ae99SBarry Smith */ 48647c6ae99SBarry Smith 48747c6ae99SBarry Smith /* Solve for X,Y, and Z Periodic Case First, Then Modify Solution */ 48847c6ae99SBarry Smith /* Assume Nodes are Internal to the Cube */ 48947c6ae99SBarry Smith n0 = rank - m*n - m - 1; 49047c6ae99SBarry Smith n1 = rank - m*n - m; 49147c6ae99SBarry Smith n2 = rank - m*n - m + 1; 49247c6ae99SBarry Smith n3 = rank - m*n -1; 49347c6ae99SBarry Smith n4 = rank - m*n; 49447c6ae99SBarry Smith n5 = rank - m*n + 1; 49547c6ae99SBarry Smith n6 = rank - m*n + m - 1; 49647c6ae99SBarry Smith n7 = rank - m*n + m; 49747c6ae99SBarry Smith n8 = rank - m*n + m + 1; 49847c6ae99SBarry Smith 49947c6ae99SBarry Smith n9 = rank - m - 1; 50047c6ae99SBarry Smith n10 = rank - m; 50147c6ae99SBarry Smith n11 = rank - m + 1; 
50247c6ae99SBarry Smith n12 = rank - 1; 50347c6ae99SBarry Smith n14 = rank + 1; 50447c6ae99SBarry Smith n15 = rank + m - 1; 50547c6ae99SBarry Smith n16 = rank + m; 50647c6ae99SBarry Smith n17 = rank + m + 1; 50747c6ae99SBarry Smith 50847c6ae99SBarry Smith n18 = rank + m*n - m - 1; 50947c6ae99SBarry Smith n19 = rank + m*n - m; 51047c6ae99SBarry Smith n20 = rank + m*n - m + 1; 51147c6ae99SBarry Smith n21 = rank + m*n - 1; 51247c6ae99SBarry Smith n22 = rank + m*n; 51347c6ae99SBarry Smith n23 = rank + m*n + 1; 51447c6ae99SBarry Smith n24 = rank + m*n + m - 1; 51547c6ae99SBarry Smith n25 = rank + m*n + m; 51647c6ae99SBarry Smith n26 = rank + m*n + m + 1; 51747c6ae99SBarry Smith 51847c6ae99SBarry Smith /* Assume Pieces are on Faces of Cube */ 51947c6ae99SBarry Smith 52047c6ae99SBarry Smith if (xs == 0) { /* First assume not corner or edge */ 52147c6ae99SBarry Smith n0 = rank -1 - (m*n); 52247c6ae99SBarry Smith n3 = rank + m -1 - (m*n); 52347c6ae99SBarry Smith n6 = rank + 2*m -1 - (m*n); 52447c6ae99SBarry Smith n9 = rank -1; 52547c6ae99SBarry Smith n12 = rank + m -1; 52647c6ae99SBarry Smith n15 = rank + 2*m -1; 52747c6ae99SBarry Smith n18 = rank -1 + (m*n); 52847c6ae99SBarry Smith n21 = rank + m -1 + (m*n); 52947c6ae99SBarry Smith n24 = rank + 2*m -1 + (m*n); 53047c6ae99SBarry Smith } 53147c6ae99SBarry Smith 532ce00eea3SSatish Balay if (xe == M) { /* First assume not corner or edge */ 53347c6ae99SBarry Smith n2 = rank -2*m +1 - (m*n); 53447c6ae99SBarry Smith n5 = rank - m +1 - (m*n); 53547c6ae99SBarry Smith n8 = rank +1 - (m*n); 53647c6ae99SBarry Smith n11 = rank -2*m +1; 53747c6ae99SBarry Smith n14 = rank - m +1; 53847c6ae99SBarry Smith n17 = rank +1; 53947c6ae99SBarry Smith n20 = rank -2*m +1 + (m*n); 54047c6ae99SBarry Smith n23 = rank - m +1 + (m*n); 54147c6ae99SBarry Smith n26 = rank +1 + (m*n); 54247c6ae99SBarry Smith } 54347c6ae99SBarry Smith 54447c6ae99SBarry Smith if (ys==0) { /* First assume not corner or edge */ 54547c6ae99SBarry Smith n0 = rank + m * (n-1) -1 - 
(m*n); 54647c6ae99SBarry Smith n1 = rank + m * (n-1) - (m*n); 54747c6ae99SBarry Smith n2 = rank + m * (n-1) +1 - (m*n); 54847c6ae99SBarry Smith n9 = rank + m * (n-1) -1; 54947c6ae99SBarry Smith n10 = rank + m * (n-1); 55047c6ae99SBarry Smith n11 = rank + m * (n-1) +1; 55147c6ae99SBarry Smith n18 = rank + m * (n-1) -1 + (m*n); 55247c6ae99SBarry Smith n19 = rank + m * (n-1) + (m*n); 55347c6ae99SBarry Smith n20 = rank + m * (n-1) +1 + (m*n); 55447c6ae99SBarry Smith } 55547c6ae99SBarry Smith 55647c6ae99SBarry Smith if (ye == N) { /* First assume not corner or edge */ 55747c6ae99SBarry Smith n6 = rank - m * (n-1) -1 - (m*n); 55847c6ae99SBarry Smith n7 = rank - m * (n-1) - (m*n); 55947c6ae99SBarry Smith n8 = rank - m * (n-1) +1 - (m*n); 56047c6ae99SBarry Smith n15 = rank - m * (n-1) -1; 56147c6ae99SBarry Smith n16 = rank - m * (n-1); 56247c6ae99SBarry Smith n17 = rank - m * (n-1) +1; 56347c6ae99SBarry Smith n24 = rank - m * (n-1) -1 + (m*n); 56447c6ae99SBarry Smith n25 = rank - m * (n-1) + (m*n); 56547c6ae99SBarry Smith n26 = rank - m * (n-1) +1 + (m*n); 56647c6ae99SBarry Smith } 56747c6ae99SBarry Smith 56847c6ae99SBarry Smith if (zs == 0) { /* First assume not corner or edge */ 56947c6ae99SBarry Smith n0 = size - (m*n) + rank - m - 1; 57047c6ae99SBarry Smith n1 = size - (m*n) + rank - m; 57147c6ae99SBarry Smith n2 = size - (m*n) + rank - m + 1; 57247c6ae99SBarry Smith n3 = size - (m*n) + rank - 1; 57347c6ae99SBarry Smith n4 = size - (m*n) + rank; 57447c6ae99SBarry Smith n5 = size - (m*n) + rank + 1; 57547c6ae99SBarry Smith n6 = size - (m*n) + rank + m - 1; 57647c6ae99SBarry Smith n7 = size - (m*n) + rank + m ; 57747c6ae99SBarry Smith n8 = size - (m*n) + rank + m + 1; 57847c6ae99SBarry Smith } 57947c6ae99SBarry Smith 58047c6ae99SBarry Smith if (ze == P) { /* First assume not corner or edge */ 58147c6ae99SBarry Smith n18 = (m*n) - (size-rank) - m - 1; 58247c6ae99SBarry Smith n19 = (m*n) - (size-rank) - m; 58347c6ae99SBarry Smith n20 = (m*n) - (size-rank) - m + 1; 
58447c6ae99SBarry Smith n21 = (m*n) - (size-rank) - 1; 58547c6ae99SBarry Smith n22 = (m*n) - (size-rank); 58647c6ae99SBarry Smith n23 = (m*n) - (size-rank) + 1; 58747c6ae99SBarry Smith n24 = (m*n) - (size-rank) + m - 1; 58847c6ae99SBarry Smith n25 = (m*n) - (size-rank) + m; 58947c6ae99SBarry Smith n26 = (m*n) - (size-rank) + m + 1; 59047c6ae99SBarry Smith } 59147c6ae99SBarry Smith 59247c6ae99SBarry Smith if ((xs==0) && (zs==0)) { /* Assume an edge, not corner */ 59347c6ae99SBarry Smith n0 = size - m*n + rank + m-1 - m; 59447c6ae99SBarry Smith n3 = size - m*n + rank + m-1; 59547c6ae99SBarry Smith n6 = size - m*n + rank + m-1 + m; 59647c6ae99SBarry Smith } 59747c6ae99SBarry Smith 59847c6ae99SBarry Smith if ((xs==0) && (ze==P)) { /* Assume an edge, not corner */ 59947c6ae99SBarry Smith n18 = m*n - (size - rank) + m-1 - m; 60047c6ae99SBarry Smith n21 = m*n - (size - rank) + m-1; 60147c6ae99SBarry Smith n24 = m*n - (size - rank) + m-1 + m; 60247c6ae99SBarry Smith } 60347c6ae99SBarry Smith 60447c6ae99SBarry Smith if ((xs==0) && (ys==0)) { /* Assume an edge, not corner */ 60547c6ae99SBarry Smith n0 = rank + m*n -1 - m*n; 60647c6ae99SBarry Smith n9 = rank + m*n -1; 60747c6ae99SBarry Smith n18 = rank + m*n -1 + m*n; 60847c6ae99SBarry Smith } 60947c6ae99SBarry Smith 61047c6ae99SBarry Smith if ((xs==0) && (ye==N)) { /* Assume an edge, not corner */ 61147c6ae99SBarry Smith n6 = rank - m*(n-1) + m-1 - m*n; 61247c6ae99SBarry Smith n15 = rank - m*(n-1) + m-1; 61347c6ae99SBarry Smith n24 = rank - m*(n-1) + m-1 + m*n; 61447c6ae99SBarry Smith } 61547c6ae99SBarry Smith 616ce00eea3SSatish Balay if ((xe==M) && (zs==0)) { /* Assume an edge, not corner */ 61747c6ae99SBarry Smith n2 = size - (m*n-rank) - (m-1) - m; 61847c6ae99SBarry Smith n5 = size - (m*n-rank) - (m-1); 61947c6ae99SBarry Smith n8 = size - (m*n-rank) - (m-1) + m; 62047c6ae99SBarry Smith } 62147c6ae99SBarry Smith 622ce00eea3SSatish Balay if ((xe==M) && (ze==P)) { /* Assume an edge, not corner */ 62347c6ae99SBarry Smith n20 
= m*n - (size - rank) - (m-1) - m; 62447c6ae99SBarry Smith n23 = m*n - (size - rank) - (m-1); 62547c6ae99SBarry Smith n26 = m*n - (size - rank) - (m-1) + m; 62647c6ae99SBarry Smith } 62747c6ae99SBarry Smith 628ce00eea3SSatish Balay if ((xe==M) && (ys==0)) { /* Assume an edge, not corner */ 62947c6ae99SBarry Smith n2 = rank + m*(n-1) - (m-1) - m*n; 63047c6ae99SBarry Smith n11 = rank + m*(n-1) - (m-1); 63147c6ae99SBarry Smith n20 = rank + m*(n-1) - (m-1) + m*n; 63247c6ae99SBarry Smith } 63347c6ae99SBarry Smith 634ce00eea3SSatish Balay if ((xe==M) && (ye==N)) { /* Assume an edge, not corner */ 63547c6ae99SBarry Smith n8 = rank - m*n +1 - m*n; 63647c6ae99SBarry Smith n17 = rank - m*n +1; 63747c6ae99SBarry Smith n26 = rank - m*n +1 + m*n; 63847c6ae99SBarry Smith } 63947c6ae99SBarry Smith 64047c6ae99SBarry Smith if ((ys==0) && (zs==0)) { /* Assume an edge, not corner */ 64147c6ae99SBarry Smith n0 = size - m + rank -1; 64247c6ae99SBarry Smith n1 = size - m + rank; 64347c6ae99SBarry Smith n2 = size - m + rank +1; 64447c6ae99SBarry Smith } 64547c6ae99SBarry Smith 64647c6ae99SBarry Smith if ((ys==0) && (ze==P)) { /* Assume an edge, not corner */ 64747c6ae99SBarry Smith n18 = m*n - (size - rank) + m*(n-1) -1; 64847c6ae99SBarry Smith n19 = m*n - (size - rank) + m*(n-1); 64947c6ae99SBarry Smith n20 = m*n - (size - rank) + m*(n-1) +1; 65047c6ae99SBarry Smith } 65147c6ae99SBarry Smith 65247c6ae99SBarry Smith if ((ye==N) && (zs==0)) { /* Assume an edge, not corner */ 65347c6ae99SBarry Smith n6 = size - (m*n-rank) - m * (n-1) -1; 65447c6ae99SBarry Smith n7 = size - (m*n-rank) - m * (n-1); 65547c6ae99SBarry Smith n8 = size - (m*n-rank) - m * (n-1) +1; 65647c6ae99SBarry Smith } 65747c6ae99SBarry Smith 65847c6ae99SBarry Smith if ((ye==N) && (ze==P)) { /* Assume an edge, not corner */ 65947c6ae99SBarry Smith n24 = rank - (size-m) -1; 66047c6ae99SBarry Smith n25 = rank - (size-m); 66147c6ae99SBarry Smith n26 = rank - (size-m) +1; 66247c6ae99SBarry Smith } 66347c6ae99SBarry Smith 
66447c6ae99SBarry Smith /* Check for Corners */ 66547c6ae99SBarry Smith if ((xs==0) && (ys==0) && (zs==0)) { n0 = size -1;} 66647c6ae99SBarry Smith if ((xs==0) && (ys==0) && (ze==P)) { n18 = m*n-1;} 66747c6ae99SBarry Smith if ((xs==0) && (ye==N) && (zs==0)) { n6 = (size-1)-m*(n-1);} 66847c6ae99SBarry Smith if ((xs==0) && (ye==N) && (ze==P)) { n24 = m-1;} 669ce00eea3SSatish Balay if ((xe==M) && (ys==0) && (zs==0)) { n2 = size-m;} 670ce00eea3SSatish Balay if ((xe==M) && (ys==0) && (ze==P)) { n20 = m*n-m;} 671ce00eea3SSatish Balay if ((xe==M) && (ye==N) && (zs==0)) { n8 = size-m*n;} 672ce00eea3SSatish Balay if ((xe==M) && (ye==N) && (ze==P)) { n26 = 0;} 67347c6ae99SBarry Smith 67447c6ae99SBarry Smith /* Check for when not X,Y, and Z Periodic */ 67547c6ae99SBarry Smith 67647c6ae99SBarry Smith /* If not X periodic */ 6771321219cSEthan Coon if (bx != DMDA_BOUNDARY_PERIODIC) { 67847c6ae99SBarry Smith if (xs==0) {n0 = n3 = n6 = n9 = n12 = n15 = n18 = n21 = n24 = -2;} 679ce00eea3SSatish Balay if (xe==M) {n2 = n5 = n8 = n11 = n14 = n17 = n20 = n23 = n26 = -2;} 68047c6ae99SBarry Smith } 68147c6ae99SBarry Smith 68247c6ae99SBarry Smith /* If not Y periodic */ 6831321219cSEthan Coon if (by != DMDA_BOUNDARY_PERIODIC) { 68447c6ae99SBarry Smith if (ys==0) {n0 = n1 = n2 = n9 = n10 = n11 = n18 = n19 = n20 = -2;} 68547c6ae99SBarry Smith if (ye==N) {n6 = n7 = n8 = n15 = n16 = n17 = n24 = n25 = n26 = -2;} 68647c6ae99SBarry Smith } 68747c6ae99SBarry Smith 68847c6ae99SBarry Smith /* If not Z periodic */ 6891321219cSEthan Coon if (bz != DMDA_BOUNDARY_PERIODIC) { 69047c6ae99SBarry Smith if (zs==0) {n0 = n1 = n2 = n3 = n4 = n5 = n6 = n7 = n8 = -2;} 69147c6ae99SBarry Smith if (ze==P) {n18 = n19 = n20 = n21 = n22 = n23 = n24 = n25 = n26 = -2;} 69247c6ae99SBarry Smith } 69347c6ae99SBarry Smith 69447c6ae99SBarry Smith ierr = PetscMalloc(27*sizeof(PetscInt),&dd->neighbors);CHKERRQ(ierr); 69547c6ae99SBarry Smith dd->neighbors[0] = n0; 69647c6ae99SBarry Smith dd->neighbors[1] = n1; 
69747c6ae99SBarry Smith dd->neighbors[2] = n2; 69847c6ae99SBarry Smith dd->neighbors[3] = n3; 69947c6ae99SBarry Smith dd->neighbors[4] = n4; 70047c6ae99SBarry Smith dd->neighbors[5] = n5; 70147c6ae99SBarry Smith dd->neighbors[6] = n6; 70247c6ae99SBarry Smith dd->neighbors[7] = n7; 70347c6ae99SBarry Smith dd->neighbors[8] = n8; 70447c6ae99SBarry Smith dd->neighbors[9] = n9; 70547c6ae99SBarry Smith dd->neighbors[10] = n10; 70647c6ae99SBarry Smith dd->neighbors[11] = n11; 70747c6ae99SBarry Smith dd->neighbors[12] = n12; 70847c6ae99SBarry Smith dd->neighbors[13] = rank; 70947c6ae99SBarry Smith dd->neighbors[14] = n14; 71047c6ae99SBarry Smith dd->neighbors[15] = n15; 71147c6ae99SBarry Smith dd->neighbors[16] = n16; 71247c6ae99SBarry Smith dd->neighbors[17] = n17; 71347c6ae99SBarry Smith dd->neighbors[18] = n18; 71447c6ae99SBarry Smith dd->neighbors[19] = n19; 71547c6ae99SBarry Smith dd->neighbors[20] = n20; 71647c6ae99SBarry Smith dd->neighbors[21] = n21; 71747c6ae99SBarry Smith dd->neighbors[22] = n22; 71847c6ae99SBarry Smith dd->neighbors[23] = n23; 71947c6ae99SBarry Smith dd->neighbors[24] = n24; 72047c6ae99SBarry Smith dd->neighbors[25] = n25; 72147c6ae99SBarry Smith dd->neighbors[26] = n26; 72247c6ae99SBarry Smith 72347c6ae99SBarry Smith /* If star stencil then delete the corner neighbors */ 724aa219208SBarry Smith if (stencil_type == DMDA_STENCIL_STAR) { 72547c6ae99SBarry Smith /* save information about corner neighbors */ 72647c6ae99SBarry Smith sn0 = n0; sn1 = n1; sn2 = n2; sn3 = n3; sn5 = n5; sn6 = n6; sn7 = n7; 72747c6ae99SBarry Smith sn8 = n8; sn9 = n9; sn11 = n11; sn15 = n15; sn17 = n17; sn18 = n18; 72847c6ae99SBarry Smith sn19 = n19; sn20 = n20; sn21 = n21; sn23 = n23; sn24 = n24; sn25 = n25; 72947c6ae99SBarry Smith sn26 = n26; 73047c6ae99SBarry Smith n0 = n1 = n2 = n3 = n5 = n6 = n7 = n8 = n9 = n11 = 73147c6ae99SBarry Smith n15 = n17 = n18 = n19 = n20 = n21 = n23 = n24 = n25 = n26 = -1; 73247c6ae99SBarry Smith } 73347c6ae99SBarry Smith 73447c6ae99SBarry 
Smith 73547c6ae99SBarry Smith ierr = PetscMalloc((Xe-Xs)*(Ye-Ys)*(Ze-Zs)*sizeof(PetscInt),&idx);CHKERRQ(ierr); 73647c6ae99SBarry Smith ierr = PetscLogObjectMemory(da,(Xe-Xs)*(Ye-Ys)*(Ze-Zs)*sizeof(PetscInt));CHKERRQ(ierr); 73747c6ae99SBarry Smith 73847c6ae99SBarry Smith nn = 0; 73947c6ae99SBarry Smith /* Bottom Level */ 74047c6ae99SBarry Smith for (k=0; k<s_z; k++) { 74147c6ae99SBarry Smith for (i=1; i<=s_y; i++) { 74247c6ae99SBarry Smith if (n0 >= 0) { /* left below */ 743ce00eea3SSatish Balay x_t = lx[n0 % m]; 74447c6ae99SBarry Smith y_t = ly[(n0 % (m*n))/m]; 74547c6ae99SBarry Smith z_t = lz[n0 / (m*n)]; 74647c6ae99SBarry Smith s_t = bases[n0] + x_t*y_t*z_t - (s_y-i)*x_t - s_x - (s_z-k-1)*x_t*y_t; 7476f951b95Secoon if (twod && (s_t < 0)) {s_t = bases[n0] + x_t*y_t*z_t - (s_y-i)*x_t - s_x;} /* 2D case */ 74847c6ae99SBarry Smith for (j=0; j<s_x; j++) { idx[nn++] = s_t++;} 74947c6ae99SBarry Smith } 75047c6ae99SBarry Smith if (n1 >= 0) { /* directly below */ 75147c6ae99SBarry Smith x_t = x; 75247c6ae99SBarry Smith y_t = ly[(n1 % (m*n))/m]; 75347c6ae99SBarry Smith z_t = lz[n1 / (m*n)]; 75447c6ae99SBarry Smith s_t = bases[n1] + x_t*y_t*z_t - (s_y+1-i)*x_t - (s_z-k-1)*x_t*y_t; 7556f951b95Secoon if (twod && (s_t < 0)) {s_t = bases[n1] + x_t*y_t*z_t - (s_y+1-i)*x_t;} /* 2D case */ 75647c6ae99SBarry Smith for (j=0; j<x_t; j++) { idx[nn++] = s_t++;} 75747c6ae99SBarry Smith } 75847c6ae99SBarry Smith if (n2 >= 0) { /* right below */ 759ce00eea3SSatish Balay x_t = lx[n2 % m]; 76047c6ae99SBarry Smith y_t = ly[(n2 % (m*n))/m]; 76147c6ae99SBarry Smith z_t = lz[n2 / (m*n)]; 76247c6ae99SBarry Smith s_t = bases[n2] + x_t*y_t*z_t - (s_y+1-i)*x_t - (s_z-k-1)*x_t*y_t; 7636f951b95Secoon if (twod && (s_t < 0)) {s_t = bases[n2] + x_t*y_t*z_t - (s_y+1-i)*x_t;} /* 2D case */ 76447c6ae99SBarry Smith for (j=0; j<s_x; j++) { idx[nn++] = s_t++;} 76547c6ae99SBarry Smith } 76647c6ae99SBarry Smith } 76747c6ae99SBarry Smith 76847c6ae99SBarry Smith for (i=0; i<y; i++) { 76947c6ae99SBarry Smith if 
(n3 >= 0) { /* directly left */ 770ce00eea3SSatish Balay x_t = lx[n3 % m]; 77147c6ae99SBarry Smith y_t = y; 77247c6ae99SBarry Smith z_t = lz[n3 / (m*n)]; 77347c6ae99SBarry Smith s_t = bases[n3] + (i+1)*x_t - s_x + x_t*y_t*z_t - (s_z-k)*x_t*y_t; 7746f951b95Secoon if (twod && (s_t < 0)) {s_t = bases[n3] + (i+1)*x_t - s_x + x_t*y_t*z_t - x_t*y_t;} /* 2D case */ 77547c6ae99SBarry Smith for (j=0; j<s_x; j++) { idx[nn++] = s_t++;} 77647c6ae99SBarry Smith } 77747c6ae99SBarry Smith 77847c6ae99SBarry Smith if (n4 >= 0) { /* middle */ 77947c6ae99SBarry Smith x_t = x; 78047c6ae99SBarry Smith y_t = y; 78147c6ae99SBarry Smith z_t = lz[n4 / (m*n)]; 78247c6ae99SBarry Smith s_t = bases[n4] + i*x_t + x_t*y_t*z_t - (s_z-k)*x_t*y_t; 7836f951b95Secoon if (twod && (s_t < 0)) {s_t = bases[n4] + i*x_t + x_t*y_t*z_t - x_t*y_t;} /* 2D case */ 78447c6ae99SBarry Smith for (j=0; j<x_t; j++) { idx[nn++] = s_t++;} 78547c6ae99SBarry Smith } 78647c6ae99SBarry Smith 78747c6ae99SBarry Smith if (n5 >= 0) { /* directly right */ 788ce00eea3SSatish Balay x_t = lx[n5 % m]; 78947c6ae99SBarry Smith y_t = y; 79047c6ae99SBarry Smith z_t = lz[n5 / (m*n)]; 79147c6ae99SBarry Smith s_t = bases[n5] + i*x_t + x_t*y_t*z_t - (s_z-k)*x_t*y_t; 7926f951b95Secoon if (twod && (s_t < 0)) {s_t = bases[n5] + i*x_t + x_t*y_t*z_t - x_t*y_t;} /* 2D case */ 79347c6ae99SBarry Smith for (j=0; j<s_x; j++) { idx[nn++] = s_t++;} 79447c6ae99SBarry Smith } 79547c6ae99SBarry Smith } 79647c6ae99SBarry Smith 79747c6ae99SBarry Smith for (i=1; i<=s_y; i++) { 79847c6ae99SBarry Smith if (n6 >= 0) { /* left above */ 799ce00eea3SSatish Balay x_t = lx[n6 % m]; 80047c6ae99SBarry Smith y_t = ly[(n6 % (m*n))/m]; 80147c6ae99SBarry Smith z_t = lz[n6 / (m*n)]; 80247c6ae99SBarry Smith s_t = bases[n6] + i*x_t - s_x + x_t*y_t*z_t - (s_z-k)*x_t*y_t; 8036f951b95Secoon if (twod && (s_t < 0)) {s_t = bases[n6] + i*x_t - s_x + x_t*y_t*z_t - x_t*y_t;} /* 2D case */ 80447c6ae99SBarry Smith for (j=0; j<s_x; j++) { idx[nn++] = s_t++;} 80547c6ae99SBarry Smith } 
80647c6ae99SBarry Smith if (n7 >= 0) { /* directly above */ 80747c6ae99SBarry Smith x_t = x; 80847c6ae99SBarry Smith y_t = ly[(n7 % (m*n))/m]; 80947c6ae99SBarry Smith z_t = lz[n7 / (m*n)]; 81047c6ae99SBarry Smith s_t = bases[n7] + (i-1)*x_t + x_t*y_t*z_t - (s_z-k)*x_t*y_t; 8116f951b95Secoon if (twod && (s_t < 0)) {s_t = bases[n7] + (i-1)*x_t + x_t*y_t*z_t - x_t*y_t;} /* 2D case */ 81247c6ae99SBarry Smith for (j=0; j<x_t; j++) { idx[nn++] = s_t++;} 81347c6ae99SBarry Smith } 81447c6ae99SBarry Smith if (n8 >= 0) { /* right above */ 815ce00eea3SSatish Balay x_t = lx[n8 % m]; 81647c6ae99SBarry Smith y_t = ly[(n8 % (m*n))/m]; 81747c6ae99SBarry Smith z_t = lz[n8 / (m*n)]; 81847c6ae99SBarry Smith s_t = bases[n8] + (i-1)*x_t + x_t*y_t*z_t - (s_z-k)*x_t*y_t; 8196f951b95Secoon if (twod && (s_t < 0)) {s_t = bases[n8] + (i-1)*x_t + x_t*y_t*z_t - x_t*y_t;} /* 2D case */ 82047c6ae99SBarry Smith for (j=0; j<s_x; j++) { idx[nn++] = s_t++;} 82147c6ae99SBarry Smith } 82247c6ae99SBarry Smith } 82347c6ae99SBarry Smith } 82447c6ae99SBarry Smith 82547c6ae99SBarry Smith /* Middle Level */ 82647c6ae99SBarry Smith for (k=0; k<z; k++) { 82747c6ae99SBarry Smith for (i=1; i<=s_y; i++) { 82847c6ae99SBarry Smith if (n9 >= 0) { /* left below */ 829ce00eea3SSatish Balay x_t = lx[n9 % m]; 83047c6ae99SBarry Smith y_t = ly[(n9 % (m*n))/m]; 83147c6ae99SBarry Smith /* z_t = z; */ 83247c6ae99SBarry Smith s_t = bases[n9] - (s_y-i)*x_t -s_x + (k+1)*x_t*y_t; 83347c6ae99SBarry Smith for (j=0; j<s_x; j++) { idx[nn++] = s_t++;} 83447c6ae99SBarry Smith } 83547c6ae99SBarry Smith if (n10 >= 0) { /* directly below */ 83647c6ae99SBarry Smith x_t = x; 83747c6ae99SBarry Smith y_t = ly[(n10 % (m*n))/m]; 83847c6ae99SBarry Smith /* z_t = z; */ 83947c6ae99SBarry Smith s_t = bases[n10] - (s_y+1-i)*x_t + (k+1)*x_t*y_t; 84047c6ae99SBarry Smith for (j=0; j<x_t; j++) { idx[nn++] = s_t++;} 84147c6ae99SBarry Smith } 84247c6ae99SBarry Smith if (n11 >= 0) { /* right below */ 843ce00eea3SSatish Balay x_t = lx[n11 % m]; 
84447c6ae99SBarry Smith y_t = ly[(n11 % (m*n))/m]; 84547c6ae99SBarry Smith /* z_t = z; */ 84647c6ae99SBarry Smith s_t = bases[n11] - (s_y+1-i)*x_t + (k+1)*x_t*y_t; 84747c6ae99SBarry Smith for (j=0; j<s_x; j++) { idx[nn++] = s_t++;} 84847c6ae99SBarry Smith } 84947c6ae99SBarry Smith } 85047c6ae99SBarry Smith 85147c6ae99SBarry Smith for (i=0; i<y; i++) { 85247c6ae99SBarry Smith if (n12 >= 0) { /* directly left */ 853ce00eea3SSatish Balay x_t = lx[n12 % m]; 85447c6ae99SBarry Smith y_t = y; 85547c6ae99SBarry Smith /* z_t = z; */ 85647c6ae99SBarry Smith s_t = bases[n12] + (i+1)*x_t - s_x + k*x_t*y_t; 85747c6ae99SBarry Smith for (j=0; j<s_x; j++) { idx[nn++] = s_t++;} 85847c6ae99SBarry Smith } 85947c6ae99SBarry Smith 86047c6ae99SBarry Smith /* Interior */ 86147c6ae99SBarry Smith s_t = bases[rank] + i*x + k*x*y; 86247c6ae99SBarry Smith for (j=0; j<x; j++) { idx[nn++] = s_t++;} 86347c6ae99SBarry Smith 86447c6ae99SBarry Smith if (n14 >= 0) { /* directly right */ 865ce00eea3SSatish Balay x_t = lx[n14 % m]; 86647c6ae99SBarry Smith y_t = y; 86747c6ae99SBarry Smith /* z_t = z; */ 86847c6ae99SBarry Smith s_t = bases[n14] + i*x_t + k*x_t*y_t; 86947c6ae99SBarry Smith for (j=0; j<s_x; j++) { idx[nn++] = s_t++;} 87047c6ae99SBarry Smith } 87147c6ae99SBarry Smith } 87247c6ae99SBarry Smith 87347c6ae99SBarry Smith for (i=1; i<=s_y; i++) { 87447c6ae99SBarry Smith if (n15 >= 0) { /* left above */ 875ce00eea3SSatish Balay x_t = lx[n15 % m]; 87647c6ae99SBarry Smith y_t = ly[(n15 % (m*n))/m]; 87747c6ae99SBarry Smith /* z_t = z; */ 87847c6ae99SBarry Smith s_t = bases[n15] + i*x_t - s_x + k*x_t*y_t; 87947c6ae99SBarry Smith for (j=0; j<s_x; j++) { idx[nn++] = s_t++;} 88047c6ae99SBarry Smith } 88147c6ae99SBarry Smith if (n16 >= 0) { /* directly above */ 88247c6ae99SBarry Smith x_t = x; 88347c6ae99SBarry Smith y_t = ly[(n16 % (m*n))/m]; 88447c6ae99SBarry Smith /* z_t = z; */ 88547c6ae99SBarry Smith s_t = bases[n16] + (i-1)*x_t + k*x_t*y_t; 88647c6ae99SBarry Smith for (j=0; j<x_t; j++) { idx[nn++] 
= s_t++;} 88747c6ae99SBarry Smith } 88847c6ae99SBarry Smith if (n17 >= 0) { /* right above */ 889ce00eea3SSatish Balay x_t = lx[n17 % m]; 89047c6ae99SBarry Smith y_t = ly[(n17 % (m*n))/m]; 89147c6ae99SBarry Smith /* z_t = z; */ 89247c6ae99SBarry Smith s_t = bases[n17] + (i-1)*x_t + k*x_t*y_t; 89347c6ae99SBarry Smith for (j=0; j<s_x; j++) { idx[nn++] = s_t++;} 89447c6ae99SBarry Smith } 89547c6ae99SBarry Smith } 89647c6ae99SBarry Smith } 89747c6ae99SBarry Smith 89847c6ae99SBarry Smith /* Upper Level */ 89947c6ae99SBarry Smith for (k=0; k<s_z; k++) { 90047c6ae99SBarry Smith for (i=1; i<=s_y; i++) { 90147c6ae99SBarry Smith if (n18 >= 0) { /* left below */ 902ce00eea3SSatish Balay x_t = lx[n18 % m]; 90347c6ae99SBarry Smith y_t = ly[(n18 % (m*n))/m]; 90447c6ae99SBarry Smith /* z_t = lz[n18 / (m*n)]; */ 90547c6ae99SBarry Smith s_t = bases[n18] - (s_y-i)*x_t -s_x + (k+1)*x_t*y_t; 9066f951b95Secoon if (twod && (s_t >= M*N*P)) {s_t = bases[n18] - (s_y-i)*x_t -s_x + x_t*y_t;} /* 2d case */ 90747c6ae99SBarry Smith for (j=0; j<s_x; j++) { idx[nn++] = s_t++;} 90847c6ae99SBarry Smith } 90947c6ae99SBarry Smith if (n19 >= 0) { /* directly below */ 91047c6ae99SBarry Smith x_t = x; 91147c6ae99SBarry Smith y_t = ly[(n19 % (m*n))/m]; 91247c6ae99SBarry Smith /* z_t = lz[n19 / (m*n)]; */ 91347c6ae99SBarry Smith s_t = bases[n19] - (s_y+1-i)*x_t + (k+1)*x_t*y_t; 9146f951b95Secoon if (twod && (s_t >= M*N*P)) {s_t = bases[n19] - (s_y+1-i)*x_t + x_t*y_t;} /* 2d case */ 91547c6ae99SBarry Smith for (j=0; j<x_t; j++) { idx[nn++] = s_t++;} 91647c6ae99SBarry Smith } 91747c6ae99SBarry Smith if (n20 >= 0) { /* right below */ 918ce00eea3SSatish Balay x_t = lx[n20 % m]; 91947c6ae99SBarry Smith y_t = ly[(n20 % (m*n))/m]; 92047c6ae99SBarry Smith /* z_t = lz[n20 / (m*n)]; */ 92147c6ae99SBarry Smith s_t = bases[n20] - (s_y+1-i)*x_t + (k+1)*x_t*y_t; 9226f951b95Secoon if (twod && (s_t >= M*N*P)) {s_t = bases[n20] - (s_y+1-i)*x_t + x_t*y_t;} /* 2d case */ 92347c6ae99SBarry Smith for (j=0; j<s_x; j++) { 
idx[nn++] = s_t++;} 92447c6ae99SBarry Smith } 92547c6ae99SBarry Smith } 92647c6ae99SBarry Smith 92747c6ae99SBarry Smith for (i=0; i<y; i++) { 92847c6ae99SBarry Smith if (n21 >= 0) { /* directly left */ 929ce00eea3SSatish Balay x_t = lx[n21 % m]; 93047c6ae99SBarry Smith y_t = y; 93147c6ae99SBarry Smith /* z_t = lz[n21 / (m*n)]; */ 93247c6ae99SBarry Smith s_t = bases[n21] + (i+1)*x_t - s_x + k*x_t*y_t; 9336f951b95Secoon if (twod && (s_t >= M*N*P)) {s_t = bases[n21] + (i+1)*x_t - s_x;} /* 2d case */ 93447c6ae99SBarry Smith for (j=0; j<s_x; j++) { idx[nn++] = s_t++;} 93547c6ae99SBarry Smith } 93647c6ae99SBarry Smith 93747c6ae99SBarry Smith if (n22 >= 0) { /* middle */ 93847c6ae99SBarry Smith x_t = x; 93947c6ae99SBarry Smith y_t = y; 94047c6ae99SBarry Smith /* z_t = lz[n22 / (m*n)]; */ 94147c6ae99SBarry Smith s_t = bases[n22] + i*x_t + k*x_t*y_t; 9426f951b95Secoon if (twod && (s_t >= M*N*P)) {s_t = bases[n22] + i*x_t;} /* 2d case */ 94347c6ae99SBarry Smith for (j=0; j<x_t; j++) { idx[nn++] = s_t++;} 94447c6ae99SBarry Smith } 94547c6ae99SBarry Smith 94647c6ae99SBarry Smith if (n23 >= 0) { /* directly right */ 947ce00eea3SSatish Balay x_t = lx[n23 % m]; 94847c6ae99SBarry Smith y_t = y; 94947c6ae99SBarry Smith /* z_t = lz[n23 / (m*n)]; */ 95047c6ae99SBarry Smith s_t = bases[n23] + i*x_t + k*x_t*y_t; 9516f951b95Secoon if (twod && (s_t >= M*N*P)) {s_t = bases[n23] + i*x_t;} /* 2d case */ 95247c6ae99SBarry Smith for (j=0; j<s_x; j++) { idx[nn++] = s_t++;} 95347c6ae99SBarry Smith } 95447c6ae99SBarry Smith } 95547c6ae99SBarry Smith 95647c6ae99SBarry Smith for (i=1; i<=s_y; i++) { 95747c6ae99SBarry Smith if (n24 >= 0) { /* left above */ 958ce00eea3SSatish Balay x_t = lx[n24 % m]; 95947c6ae99SBarry Smith y_t = ly[(n24 % (m*n))/m]; 96047c6ae99SBarry Smith /* z_t = lz[n24 / (m*n)]; */ 96147c6ae99SBarry Smith s_t = bases[n24] + i*x_t - s_x + k*x_t*y_t; 9626f951b95Secoon if (twod && (s_t >= M*N*P)) {s_t = bases[n24] + i*x_t - s_x;} /* 2d case */ 96347c6ae99SBarry Smith for (j=0; 
j<s_x; j++) { idx[nn++] = s_t++;} 96447c6ae99SBarry Smith } 96547c6ae99SBarry Smith if (n25 >= 0) { /* directly above */ 96647c6ae99SBarry Smith x_t = x; 96747c6ae99SBarry Smith y_t = ly[(n25 % (m*n))/m]; 96847c6ae99SBarry Smith /* z_t = lz[n25 / (m*n)]; */ 96947c6ae99SBarry Smith s_t = bases[n25] + (i-1)*x_t + k*x_t*y_t; 9706f951b95Secoon if (twod && (s_t >= M*N*P)) {s_t = bases[n25] + (i-1)*x_t;} /* 2d case */ 97147c6ae99SBarry Smith for (j=0; j<x_t; j++) { idx[nn++] = s_t++;} 97247c6ae99SBarry Smith } 97347c6ae99SBarry Smith if (n26 >= 0) { /* right above */ 974ce00eea3SSatish Balay x_t = lx[n26 % m]; 97547c6ae99SBarry Smith y_t = ly[(n26 % (m*n))/m]; 97647c6ae99SBarry Smith /* z_t = lz[n26 / (m*n)]; */ 97747c6ae99SBarry Smith s_t = bases[n26] + (i-1)*x_t + k*x_t*y_t; 9786f951b95Secoon if (twod && (s_t >= M*N*P)) {s_t = bases[n26] + (i-1)*x_t;} /* 2d case */ 97947c6ae99SBarry Smith for (j=0; j<s_x; j++) { idx[nn++] = s_t++;} 98047c6ae99SBarry Smith } 98147c6ae99SBarry Smith } 98247c6ae99SBarry Smith } 983ce00eea3SSatish Balay 984ce00eea3SSatish Balay ierr = ISCreateBlock(comm,dof,nn,idx,PETSC_COPY_VALUES,&from);CHKERRQ(ierr); 98547c6ae99SBarry Smith ierr = VecScatterCreate(global,from,local,to,>ol);CHKERRQ(ierr); 98647c6ae99SBarry Smith ierr = PetscLogObjectParent(da,gtol);CHKERRQ(ierr); 987fcfd50ebSBarry Smith ierr = ISDestroy(&to);CHKERRQ(ierr); 988fcfd50ebSBarry Smith ierr = ISDestroy(&from);CHKERRQ(ierr); 98947c6ae99SBarry Smith 990aa219208SBarry Smith if (stencil_type == DMDA_STENCIL_STAR) { 99147c6ae99SBarry Smith n0 = sn0; n1 = sn1; n2 = sn2; n3 = sn3; n5 = sn5; n6 = sn6; n7 = sn7; 99247c6ae99SBarry Smith n8 = sn8; n9 = sn9; n11 = sn11; n15 = sn15; n17 = sn17; n18 = sn18; 99347c6ae99SBarry Smith n19 = sn19; n20 = sn20; n21 = sn21; n23 = sn23; n24 = sn24; n25 = sn25; 99447c6ae99SBarry Smith n26 = sn26; 995ce00eea3SSatish Balay } 99647c6ae99SBarry Smith 997ce00eea3SSatish Balay if ((stencil_type == DMDA_STENCIL_STAR) || 9981321219cSEthan Coon (bx != 
DMDA_BOUNDARY_PERIODIC && bx) || 9991321219cSEthan Coon (by != DMDA_BOUNDARY_PERIODIC && by) || 10001321219cSEthan Coon (bz != DMDA_BOUNDARY_PERIODIC && bz)) { 1001ce00eea3SSatish Balay /* 1002ce00eea3SSatish Balay Recompute the local to global mappings, this time keeping the 1003ce00eea3SSatish Balay information about the cross corner processor numbers. 1004ce00eea3SSatish Balay */ 100547c6ae99SBarry Smith nn = 0; 100647c6ae99SBarry Smith /* Bottom Level */ 100747c6ae99SBarry Smith for (k=0; k<s_z; k++) { 100847c6ae99SBarry Smith for (i=1; i<=s_y; i++) { 100947c6ae99SBarry Smith if (n0 >= 0) { /* left below */ 1010ce00eea3SSatish Balay x_t = lx[n0 % m]; 101147c6ae99SBarry Smith y_t = ly[(n0 % (m*n))/m]; 101247c6ae99SBarry Smith z_t = lz[n0 / (m*n)]; 101347c6ae99SBarry Smith s_t = bases[n0] + x_t*y_t*z_t - (s_y-i)*x_t - s_x - (s_z-k-1)*x_t*y_t; 101447c6ae99SBarry Smith for (j=0; j<s_x; j++) { idx[nn++] = s_t++;} 1015ce00eea3SSatish Balay } else if (Xs-xs < 0 && Ys-ys < 0 && Zs-zs < 0) { 1016ce00eea3SSatish Balay for (j=0; j<s_x; j++) { idx[nn++] = -1;} 101747c6ae99SBarry Smith } 101847c6ae99SBarry Smith if (n1 >= 0) { /* directly below */ 101947c6ae99SBarry Smith x_t = x; 102047c6ae99SBarry Smith y_t = ly[(n1 % (m*n))/m]; 102147c6ae99SBarry Smith z_t = lz[n1 / (m*n)]; 102247c6ae99SBarry Smith s_t = bases[n1] + x_t*y_t*z_t - (s_y+1-i)*x_t - (s_z-k-1)*x_t*y_t; 102347c6ae99SBarry Smith for (j=0; j<x_t; j++) { idx[nn++] = s_t++;} 1024ce00eea3SSatish Balay } else if (Ys-ys < 0 && Zs-zs < 0) { 1025ce00eea3SSatish Balay for (j=0; j<x; j++) { idx[nn++] = -1;} 102647c6ae99SBarry Smith } 102747c6ae99SBarry Smith if (n2 >= 0) { /* right below */ 1028ce00eea3SSatish Balay x_t = lx[n2 % m]; 102947c6ae99SBarry Smith y_t = ly[(n2 % (m*n))/m]; 103047c6ae99SBarry Smith z_t = lz[n2 / (m*n)]; 103147c6ae99SBarry Smith s_t = bases[n2] + x_t*y_t*z_t - (s_y+1-i)*x_t - (s_z-k-1)*x_t*y_t; 103247c6ae99SBarry Smith for (j=0; j<s_x; j++) { idx[nn++] = s_t++;} 1033ce00eea3SSatish Balay } else 
if (xe-Xe < 0 && Ys-ys < 0 && Zs-zs < 0) { 1034ce00eea3SSatish Balay for (j=0; j<s_x; j++) { idx[nn++] = -1;} 103547c6ae99SBarry Smith } 103647c6ae99SBarry Smith } 103747c6ae99SBarry Smith 103847c6ae99SBarry Smith for (i=0; i<y; i++) { 103947c6ae99SBarry Smith if (n3 >= 0) { /* directly left */ 1040ce00eea3SSatish Balay x_t = lx[n3 % m]; 104147c6ae99SBarry Smith y_t = y; 104247c6ae99SBarry Smith z_t = lz[n3 / (m*n)]; 104347c6ae99SBarry Smith s_t = bases[n3] + (i+1)*x_t - s_x + x_t*y_t*z_t - (s_z-k)*x_t*y_t; 104447c6ae99SBarry Smith for (j=0; j<s_x; j++) { idx[nn++] = s_t++;} 1045ce00eea3SSatish Balay } else if (Xs-xs < 0 && Zs-zs < 0) { 1046ce00eea3SSatish Balay for (j=0; j<s_x; j++) { idx[nn++] = -1;} 104747c6ae99SBarry Smith } 104847c6ae99SBarry Smith 104947c6ae99SBarry Smith if (n4 >= 0) { /* middle */ 105047c6ae99SBarry Smith x_t = x; 105147c6ae99SBarry Smith y_t = y; 105247c6ae99SBarry Smith z_t = lz[n4 / (m*n)]; 105347c6ae99SBarry Smith s_t = bases[n4] + i*x_t + x_t*y_t*z_t - (s_z-k)*x_t*y_t; 105447c6ae99SBarry Smith for (j=0; j<x_t; j++) { idx[nn++] = s_t++;} 1055ce00eea3SSatish Balay } else if (Zs-zs < 0) { 1056ce00eea3SSatish Balay for (j=0; j<x; j++) { idx[nn++] = -1;} 105747c6ae99SBarry Smith } 105847c6ae99SBarry Smith 105947c6ae99SBarry Smith if (n5 >= 0) { /* directly right */ 1060ce00eea3SSatish Balay x_t = lx[n5 % m]; 106147c6ae99SBarry Smith y_t = y; 106247c6ae99SBarry Smith z_t = lz[n5 / (m*n)]; 106347c6ae99SBarry Smith s_t = bases[n5] + i*x_t + x_t*y_t*z_t - (s_z-k)*x_t*y_t; 106447c6ae99SBarry Smith for (j=0; j<s_x; j++) { idx[nn++] = s_t++;} 1065ce00eea3SSatish Balay } else if (xe-Xe < 0 && Zs-zs < 0) { 1066ce00eea3SSatish Balay for (j=0; j<s_x; j++) { idx[nn++] = -1;} 106747c6ae99SBarry Smith } 106847c6ae99SBarry Smith } 106947c6ae99SBarry Smith 107047c6ae99SBarry Smith for (i=1; i<=s_y; i++) { 107147c6ae99SBarry Smith if (n6 >= 0) { /* left above */ 1072ce00eea3SSatish Balay x_t = lx[n6 % m]; 107347c6ae99SBarry Smith y_t = ly[(n6 % (m*n))/m]; 
107447c6ae99SBarry Smith z_t = lz[n6 / (m*n)]; 107547c6ae99SBarry Smith s_t = bases[n6] + i*x_t - s_x + x_t*y_t*z_t - (s_z-k)*x_t*y_t; 107647c6ae99SBarry Smith for (j=0; j<s_x; j++) { idx[nn++] = s_t++;} 1077ce00eea3SSatish Balay } else if (Xs-xs < 0 && ye-Ye < 0 && Zs-zs < 0) { 1078ce00eea3SSatish Balay for (j=0; j<s_x; j++) { idx[nn++] = -1;} 107947c6ae99SBarry Smith } 108047c6ae99SBarry Smith if (n7 >= 0) { /* directly above */ 108147c6ae99SBarry Smith x_t = x; 108247c6ae99SBarry Smith y_t = ly[(n7 % (m*n))/m]; 108347c6ae99SBarry Smith z_t = lz[n7 / (m*n)]; 108447c6ae99SBarry Smith s_t = bases[n7] + (i-1)*x_t + x_t*y_t*z_t - (s_z-k)*x_t*y_t; 108547c6ae99SBarry Smith for (j=0; j<x_t; j++) { idx[nn++] = s_t++;} 1086ce00eea3SSatish Balay } else if (ye-Ye < 0 && Zs-zs < 0) { 1087ce00eea3SSatish Balay for (j=0; j<x; j++) { idx[nn++] = -1;} 108847c6ae99SBarry Smith } 108947c6ae99SBarry Smith if (n8 >= 0) { /* right above */ 1090ce00eea3SSatish Balay x_t = lx[n8 % m]; 109147c6ae99SBarry Smith y_t = ly[(n8 % (m*n))/m]; 109247c6ae99SBarry Smith z_t = lz[n8 / (m*n)]; 109347c6ae99SBarry Smith s_t = bases[n8] + (i-1)*x_t + x_t*y_t*z_t - (s_z-k)*x_t*y_t; 109447c6ae99SBarry Smith for (j=0; j<s_x; j++) { idx[nn++] = s_t++;} 1095ce00eea3SSatish Balay } else if (xe-Xe < 0 && ye-Ye < 0 && Zs-zs < 0) { 1096ce00eea3SSatish Balay for (j=0; j<s_x; j++) { idx[nn++] = -1;} 109747c6ae99SBarry Smith } 109847c6ae99SBarry Smith } 109947c6ae99SBarry Smith } 110047c6ae99SBarry Smith 110147c6ae99SBarry Smith /* Middle Level */ 110247c6ae99SBarry Smith for (k=0; k<z; k++) { 110347c6ae99SBarry Smith for (i=1; i<=s_y; i++) { 110447c6ae99SBarry Smith if (n9 >= 0) { /* left below */ 1105ce00eea3SSatish Balay x_t = lx[n9 % m]; 110647c6ae99SBarry Smith y_t = ly[(n9 % (m*n))/m]; 110747c6ae99SBarry Smith /* z_t = z; */ 110847c6ae99SBarry Smith s_t = bases[n9] - (s_y-i)*x_t -s_x + (k+1)*x_t*y_t; 110947c6ae99SBarry Smith for (j=0; j<s_x; j++) { idx[nn++] = s_t++;} 1110ce00eea3SSatish Balay } else if 
(Xs-xs < 0 && Ys-ys < 0) { 1111ce00eea3SSatish Balay for (j=0; j<s_x; j++) { idx[nn++] = -1;} 111247c6ae99SBarry Smith } 111347c6ae99SBarry Smith if (n10 >= 0) { /* directly below */ 111447c6ae99SBarry Smith x_t = x; 111547c6ae99SBarry Smith y_t = ly[(n10 % (m*n))/m]; 111647c6ae99SBarry Smith /* z_t = z; */ 111747c6ae99SBarry Smith s_t = bases[n10] - (s_y+1-i)*x_t + (k+1)*x_t*y_t; 111847c6ae99SBarry Smith for (j=0; j<x_t; j++) { idx[nn++] = s_t++;} 1119ce00eea3SSatish Balay } else if (Ys-ys < 0) { 1120ce00eea3SSatish Balay for (j=0; j<x; j++) { idx[nn++] = -1;} 112147c6ae99SBarry Smith } 112247c6ae99SBarry Smith if (n11 >= 0) { /* right below */ 1123ce00eea3SSatish Balay x_t = lx[n11 % m]; 112447c6ae99SBarry Smith y_t = ly[(n11 % (m*n))/m]; 112547c6ae99SBarry Smith /* z_t = z; */ 112647c6ae99SBarry Smith s_t = bases[n11] - (s_y+1-i)*x_t + (k+1)*x_t*y_t; 112747c6ae99SBarry Smith for (j=0; j<s_x; j++) { idx[nn++] = s_t++;} 1128ce00eea3SSatish Balay } else if (xe-Xe < 0 && Ys-ys < 0) { 1129ce00eea3SSatish Balay for (j=0; j<s_x; j++) { idx[nn++] = -1;} 113047c6ae99SBarry Smith } 113147c6ae99SBarry Smith } 113247c6ae99SBarry Smith 113347c6ae99SBarry Smith for (i=0; i<y; i++) { 113447c6ae99SBarry Smith if (n12 >= 0) { /* directly left */ 1135ce00eea3SSatish Balay x_t = lx[n12 % m]; 113647c6ae99SBarry Smith y_t = y; 113747c6ae99SBarry Smith /* z_t = z; */ 113847c6ae99SBarry Smith s_t = bases[n12] + (i+1)*x_t - s_x + k*x_t*y_t; 113947c6ae99SBarry Smith for (j=0; j<s_x; j++) { idx[nn++] = s_t++;} 1140ce00eea3SSatish Balay } else if (Xs-xs < 0) { 1141ce00eea3SSatish Balay for (j=0; j<s_x; j++) { idx[nn++] = -1;} 114247c6ae99SBarry Smith } 114347c6ae99SBarry Smith 114447c6ae99SBarry Smith /* Interior */ 114547c6ae99SBarry Smith s_t = bases[rank] + i*x + k*x*y; 114647c6ae99SBarry Smith for (j=0; j<x; j++) { idx[nn++] = s_t++;} 114747c6ae99SBarry Smith 114847c6ae99SBarry Smith if (n14 >= 0) { /* directly right */ 1149ce00eea3SSatish Balay x_t = lx[n14 % m]; 115047c6ae99SBarry 
Smith y_t = y; 115147c6ae99SBarry Smith /* z_t = z; */ 115247c6ae99SBarry Smith s_t = bases[n14] + i*x_t + k*x_t*y_t; 115347c6ae99SBarry Smith for (j=0; j<s_x; j++) { idx[nn++] = s_t++;} 1154ce00eea3SSatish Balay } else if (xe-Xe < 0) { 1155ce00eea3SSatish Balay for (j=0; j<s_x; j++) { idx[nn++] = -1;} 115647c6ae99SBarry Smith } 115747c6ae99SBarry Smith } 115847c6ae99SBarry Smith 115947c6ae99SBarry Smith for (i=1; i<=s_y; i++) { 116047c6ae99SBarry Smith if (n15 >= 0) { /* left above */ 1161ce00eea3SSatish Balay x_t = lx[n15 % m]; 116247c6ae99SBarry Smith y_t = ly[(n15 % (m*n))/m]; 116347c6ae99SBarry Smith /* z_t = z; */ 116447c6ae99SBarry Smith s_t = bases[n15] + i*x_t - s_x + k*x_t*y_t; 116547c6ae99SBarry Smith for (j=0; j<s_x; j++) { idx[nn++] = s_t++;} 1166ce00eea3SSatish Balay } else if (Xs-xs < 0 && ye-Ye < 0) { 1167ce00eea3SSatish Balay for (j=0; j<s_x; j++) { idx[nn++] = -1;} 116847c6ae99SBarry Smith } 116947c6ae99SBarry Smith if (n16 >= 0) { /* directly above */ 117047c6ae99SBarry Smith x_t = x; 117147c6ae99SBarry Smith y_t = ly[(n16 % (m*n))/m]; 117247c6ae99SBarry Smith /* z_t = z; */ 117347c6ae99SBarry Smith s_t = bases[n16] + (i-1)*x_t + k*x_t*y_t; 117447c6ae99SBarry Smith for (j=0; j<x_t; j++) { idx[nn++] = s_t++;} 1175ce00eea3SSatish Balay } else if (ye-Ye < 0) { 1176ce00eea3SSatish Balay for (j=0; j<x; j++) { idx[nn++] = -1;} 117747c6ae99SBarry Smith } 117847c6ae99SBarry Smith if (n17 >= 0) { /* right above */ 1179ce00eea3SSatish Balay x_t = lx[n17 % m]; 118047c6ae99SBarry Smith y_t = ly[(n17 % (m*n))/m]; 118147c6ae99SBarry Smith /* z_t = z; */ 118247c6ae99SBarry Smith s_t = bases[n17] + (i-1)*x_t + k*x_t*y_t; 118347c6ae99SBarry Smith for (j=0; j<s_x; j++) { idx[nn++] = s_t++;} 1184ce00eea3SSatish Balay } else if (xe-Xe < 0 && ye-Ye < 0) { 1185ce00eea3SSatish Balay for (j=0; j<s_x; j++) { idx[nn++] = -1;} 118647c6ae99SBarry Smith } 118747c6ae99SBarry Smith } 118847c6ae99SBarry Smith } 118947c6ae99SBarry Smith 119047c6ae99SBarry Smith /* Upper Level */ 
119147c6ae99SBarry Smith for (k=0; k<s_z; k++) { 119247c6ae99SBarry Smith for (i=1; i<=s_y; i++) { 119347c6ae99SBarry Smith if (n18 >= 0) { /* left below */ 1194ce00eea3SSatish Balay x_t = lx[n18 % m]; 119547c6ae99SBarry Smith y_t = ly[(n18 % (m*n))/m]; 119647c6ae99SBarry Smith /* z_t = lz[n18 / (m*n)]; */ 119747c6ae99SBarry Smith s_t = bases[n18] - (s_y-i)*x_t -s_x + (k+1)*x_t*y_t; 119847c6ae99SBarry Smith for (j=0; j<s_x; j++) { idx[nn++] = s_t++;} 1199ce00eea3SSatish Balay } else if (Xs-xs < 0 && Ys-ys < 0 && ze-Ze < 0) { 1200ce00eea3SSatish Balay for (j=0; j<s_x; j++) { idx[nn++] = -1;} 120147c6ae99SBarry Smith } 120247c6ae99SBarry Smith if (n19 >= 0) { /* directly below */ 120347c6ae99SBarry Smith x_t = x; 120447c6ae99SBarry Smith y_t = ly[(n19 % (m*n))/m]; 120547c6ae99SBarry Smith /* z_t = lz[n19 / (m*n)]; */ 120647c6ae99SBarry Smith s_t = bases[n19] - (s_y+1-i)*x_t + (k+1)*x_t*y_t; 120747c6ae99SBarry Smith for (j=0; j<x_t; j++) { idx[nn++] = s_t++;} 1208ce00eea3SSatish Balay } else if (Ys-ys < 0 && ze-Ze < 0) { 1209ce00eea3SSatish Balay for (j=0; j<x; j++) { idx[nn++] = -1;} 121047c6ae99SBarry Smith } 121147c6ae99SBarry Smith if (n20 >= 0) { /* right below */ 1212ce00eea3SSatish Balay x_t = lx[n20 % m]; 121347c6ae99SBarry Smith y_t = ly[(n20 % (m*n))/m]; 121447c6ae99SBarry Smith /* z_t = lz[n20 / (m*n)]; */ 121547c6ae99SBarry Smith s_t = bases[n20] - (s_y+1-i)*x_t + (k+1)*x_t*y_t; 121647c6ae99SBarry Smith for (j=0; j<s_x; j++) { idx[nn++] = s_t++;} 1217ce00eea3SSatish Balay } else if (xe-Xe < 0 && Ys-ys < 0 && ze-Ze < 0) { 1218ce00eea3SSatish Balay for (j=0; j<s_x; j++) { idx[nn++] = -1;} 121947c6ae99SBarry Smith } 122047c6ae99SBarry Smith } 122147c6ae99SBarry Smith 122247c6ae99SBarry Smith for (i=0; i<y; i++) { 122347c6ae99SBarry Smith if (n21 >= 0) { /* directly left */ 1224ce00eea3SSatish Balay x_t = lx[n21 % m]; 122547c6ae99SBarry Smith y_t = y; 122647c6ae99SBarry Smith /* z_t = lz[n21 / (m*n)]; */ 122747c6ae99SBarry Smith s_t = bases[n21] + (i+1)*x_t - 
s_x + k*x_t*y_t; 122847c6ae99SBarry Smith for (j=0; j<s_x; j++) { idx[nn++] = s_t++;} 1229ce00eea3SSatish Balay } else if (Xs-xs < 0 && ze-Ze < 0) { 1230ce00eea3SSatish Balay for (j=0; j<s_x; j++) { idx[nn++] = -1;} 123147c6ae99SBarry Smith } 123247c6ae99SBarry Smith 123347c6ae99SBarry Smith if (n22 >= 0) { /* middle */ 123447c6ae99SBarry Smith x_t = x; 123547c6ae99SBarry Smith y_t = y; 123647c6ae99SBarry Smith /* z_t = lz[n22 / (m*n)]; */ 123747c6ae99SBarry Smith s_t = bases[n22] + i*x_t + k*x_t*y_t; 123847c6ae99SBarry Smith for (j=0; j<x_t; j++) { idx[nn++] = s_t++;} 1239ce00eea3SSatish Balay } else if (ze-Ze < 0) { 1240ce00eea3SSatish Balay for (j=0; j<x; j++) { idx[nn++] = -1;} 124147c6ae99SBarry Smith } 124247c6ae99SBarry Smith 124347c6ae99SBarry Smith if (n23 >= 0) { /* directly right */ 1244ce00eea3SSatish Balay x_t = lx[n23 % m]; 124547c6ae99SBarry Smith y_t = y; 124647c6ae99SBarry Smith /* z_t = lz[n23 / (m*n)]; */ 124747c6ae99SBarry Smith s_t = bases[n23] + i*x_t + k*x_t*y_t; 124847c6ae99SBarry Smith for (j=0; j<s_x; j++) { idx[nn++] = s_t++;} 1249ce00eea3SSatish Balay } else if (xe-Xe < 0 && ze-Ze < 0) { 1250ce00eea3SSatish Balay for (j=0; j<s_x; j++) { idx[nn++] = -1;} 125147c6ae99SBarry Smith } 125247c6ae99SBarry Smith } 125347c6ae99SBarry Smith 125447c6ae99SBarry Smith for (i=1; i<=s_y; i++) { 125547c6ae99SBarry Smith if (n24 >= 0) { /* left above */ 1256ce00eea3SSatish Balay x_t = lx[n24 % m]; 125747c6ae99SBarry Smith y_t = ly[(n24 % (m*n))/m]; 125847c6ae99SBarry Smith /* z_t = lz[n24 / (m*n)]; */ 125947c6ae99SBarry Smith s_t = bases[n24] + i*x_t - s_x + k*x_t*y_t; 126047c6ae99SBarry Smith for (j=0; j<s_x; j++) { idx[nn++] = s_t++;} 1261ce00eea3SSatish Balay } else if (Xs-xs < 0 && ye-Ye < 0 && ze-Ze < 0) { 1262ce00eea3SSatish Balay for (j=0; j<s_x; j++) { idx[nn++] = -1;} 126347c6ae99SBarry Smith } 126447c6ae99SBarry Smith if (n25 >= 0) { /* directly above */ 126547c6ae99SBarry Smith x_t = x; 126647c6ae99SBarry Smith y_t = ly[(n25 % (m*n))/m]; 
126747c6ae99SBarry Smith /* z_t = lz[n25 / (m*n)]; */ 126847c6ae99SBarry Smith s_t = bases[n25] + (i-1)*x_t + k*x_t*y_t; 126947c6ae99SBarry Smith for (j=0; j<x_t; j++) { idx[nn++] = s_t++;} 1270ce00eea3SSatish Balay } else if (ye-Ye < 0 && ze-Ze < 0) { 1271ce00eea3SSatish Balay for (j=0; j<x; j++) { idx[nn++] = -1;} 127247c6ae99SBarry Smith } 127347c6ae99SBarry Smith if (n26 >= 0) { /* right above */ 1274ce00eea3SSatish Balay x_t = lx[n26 % m]; 127547c6ae99SBarry Smith y_t = ly[(n26 % (m*n))/m]; 127647c6ae99SBarry Smith /* z_t = lz[n26 / (m*n)]; */ 127747c6ae99SBarry Smith s_t = bases[n26] + (i-1)*x_t + k*x_t*y_t; 127847c6ae99SBarry Smith for (j=0; j<s_x; j++) { idx[nn++] = s_t++;} 1279ce00eea3SSatish Balay } else if (xe-Xe < 0 && ye-Ye < 0 && ze-Ze < 0) { 1280ce00eea3SSatish Balay for (j=0; j<s_x; j++) { idx[nn++] = -1;} 128147c6ae99SBarry Smith } 128247c6ae99SBarry Smith } 128347c6ae99SBarry Smith } 128447c6ae99SBarry Smith } 128547c6ae99SBarry Smith /* 128647c6ae99SBarry Smith Set the local to global ordering in the global vector, this allows use 128747c6ae99SBarry Smith of VecSetValuesLocal(). 
128847c6ae99SBarry Smith */ 1289ce00eea3SSatish Balay ierr = ISCreateBlock(comm,dof,nn,idx,PETSC_OWN_POINTER,<ogis);CHKERRQ(ierr); 1290ce00eea3SSatish Balay ierr = PetscMalloc(nn*dof*sizeof(PetscInt),&idx_cpy);CHKERRQ(ierr); 1291db87c5ecSEthan Coon ierr = PetscLogObjectMemory(da,nn*dof*sizeof(PetscInt));CHKERRQ(ierr); 1292ce00eea3SSatish Balay ierr = ISGetIndices(ltogis, &idx_full); 1293ce00eea3SSatish Balay ierr = PetscMemcpy(idx_cpy,idx_full,nn*dof*sizeof(PetscInt));CHKERRQ(ierr); 1294ce00eea3SSatish Balay ierr = ISRestoreIndices(ltogis, &idx_full); 1295ce00eea3SSatish Balay ierr = ISLocalToGlobalMappingCreateIS(ltogis,&da->ltogmap);CHKERRQ(ierr); 1296ce00eea3SSatish Balay ierr = PetscLogObjectParent(da,da->ltogmap);CHKERRQ(ierr); 1297fcfd50ebSBarry Smith ierr = ISDestroy(<ogis);CHKERRQ(ierr); 12981411c6eeSJed Brown ierr = ISLocalToGlobalMappingBlock(da->ltogmap,dd->w,&da->ltogmapb);CHKERRQ(ierr); 12991411c6eeSJed Brown ierr = PetscLogObjectParent(da,da->ltogmap);CHKERRQ(ierr); 130047c6ae99SBarry Smith 1301ce00eea3SSatish Balay ierr = PetscFree2(bases,ldims);CHKERRQ(ierr); 1302ce00eea3SSatish Balay dd->m = m; dd->n = n; dd->p = p; 1303ce00eea3SSatish Balay /* note petsc expects xs/xe/Xs/Xe to be multiplied by #dofs in many places */ 1304ce00eea3SSatish Balay dd->xs = xs*dof; dd->xe = xe*dof; dd->ys = ys; dd->ye = ye; dd->zs = zs; dd->ze = ze; 1305ce00eea3SSatish Balay dd->Xs = Xs*dof; dd->Xe = Xe*dof; dd->Ys = Ys; dd->Ye = Ye; dd->Zs = Zs; dd->Ze = Ze; 1306ce00eea3SSatish Balay 1307fcfd50ebSBarry Smith ierr = VecDestroy(&local);CHKERRQ(ierr); 1308fcfd50ebSBarry Smith ierr = VecDestroy(&global);CHKERRQ(ierr); 1309ce00eea3SSatish Balay 1310ce00eea3SSatish Balay dd->gtol = gtol; 1311ce00eea3SSatish Balay dd->ltog = ltog; 1312ce00eea3SSatish Balay dd->idx = idx_cpy; 1313ce00eea3SSatish Balay dd->Nl = nn*dof; 1314ce00eea3SSatish Balay dd->base = base; 1315ce00eea3SSatish Balay da->ops->view = DMView_DA_3d; 131647c6ae99SBarry Smith dd->ltol = PETSC_NULL; 
131747c6ae99SBarry Smith dd->ao = PETSC_NULL; 1318ce00eea3SSatish Balay 131947c6ae99SBarry Smith PetscFunctionReturn(0); 132047c6ae99SBarry Smith } 1321564755cdSBarry Smith 132247c6ae99SBarry Smith 132347c6ae99SBarry Smith #undef __FUNCT__ 1324aa219208SBarry Smith #define __FUNCT__ "DMDACreate3d" 132547c6ae99SBarry Smith /*@C 1326aa219208SBarry Smith DMDACreate3d - Creates an object that will manage the communication of three-dimensional 132747c6ae99SBarry Smith regular array data that is distributed across some processors. 132847c6ae99SBarry Smith 132947c6ae99SBarry Smith Collective on MPI_Comm 133047c6ae99SBarry Smith 133147c6ae99SBarry Smith Input Parameters: 133247c6ae99SBarry Smith + comm - MPI communicator 13331321219cSEthan Coon . bx,by,bz - type of ghost nodes the array have. 13341321219cSEthan Coon Use one of DMDA_BOUNDARY_NONE, DMDA_BOUNDARY_GHOSTED, DMDA_BOUNDARY_PERIODIC. 1335aa219208SBarry Smith . stencil_type - Type of stencil (DMDA_STENCIL_STAR or DMDA_STENCIL_BOX) 133647c6ae99SBarry Smith . M,N,P - global dimension in each direction of the array (use -M, -N, and or -P to indicate that it may be set to a different value 133747c6ae99SBarry Smith from the command line with -da_grid_x <M> -da_grid_y <N> -da_grid_z <P>) 133847c6ae99SBarry Smith . m,n,p - corresponding number of processors in each dimension 133947c6ae99SBarry Smith (or PETSC_DECIDE to have calculated) 134047c6ae99SBarry Smith . dof - number of degrees of freedom per node 134110d7c030SMatthew G Knepley . s - stencil width 134210d7c030SMatthew G Knepley - lx, ly, lz - arrays containing the number of nodes in each cell along 134347c6ae99SBarry Smith the x, y, and z coordinates, or PETSC_NULL. If non-null, these 134447c6ae99SBarry Smith must be of length as m,n,p and the corresponding 134547c6ae99SBarry Smith m,n, or p cannot be PETSC_DECIDE. 
Sum of the lx[] entries must be M, sum of 134647c6ae99SBarry Smith the ly[] must be N, sum of the lz[] must be P 134747c6ae99SBarry Smith 134847c6ae99SBarry Smith Output Parameter: 134947c6ae99SBarry Smith . da - the resulting distributed array object 135047c6ae99SBarry Smith 135147c6ae99SBarry Smith Options Database Key: 1352aa219208SBarry Smith + -da_view - Calls DMView() at the conclusion of DMDACreate3d() 135347c6ae99SBarry Smith . -da_grid_x <nx> - number of grid points in x direction, if M < 0 135447c6ae99SBarry Smith . -da_grid_y <ny> - number of grid points in y direction, if N < 0 135547c6ae99SBarry Smith . -da_grid_z <nz> - number of grid points in z direction, if P < 0 135647c6ae99SBarry Smith . -da_processors_x <MX> - number of processors in x direction 135747c6ae99SBarry Smith . -da_processors_y <MY> - number of processors in y direction 135847c6ae99SBarry Smith . -da_processors_z <MZ> - number of processors in z direction 1359e0f5d30fSBarry Smith . -da_refine_x <rx> - refinement ratio in x direction 1360e0f5d30fSBarry Smith . -da_refine_y <ry> - refinement ratio in y direction 1361e0f5d30fSBarry Smith . -da_refine_z <rz> - refinement ratio in z direction 1362e0f5d30fSBarry Smith - -da_refine <n> - refine the DMDA n times before creating it, if M, N, or P < 0 136347c6ae99SBarry Smith 136447c6ae99SBarry Smith Level: beginner 136547c6ae99SBarry Smith 136647c6ae99SBarry Smith Notes: 1367aa219208SBarry Smith The stencil type DMDA_STENCIL_STAR with width 1 corresponds to the 1368aa219208SBarry Smith standard 7-pt stencil, while DMDA_STENCIL_BOX with width 1 denotes 136947c6ae99SBarry Smith the standard 27-pt stencil. 137047c6ae99SBarry Smith 1371aa219208SBarry Smith The array data itself is NOT stored in the DMDA, it is stored in Vec objects; 1372564755cdSBarry Smith the appropriate vector objects can be obtained with calls to DMCreateGlobalVector() 1373564755cdSBarry Smith and DMCreateLocalVector() and calls to VecDuplicate() if more are needed. 
137447c6ae99SBarry Smith 137547c6ae99SBarry Smith .keywords: distributed array, create, three-dimensional 137647c6ae99SBarry Smith 1377aa219208SBarry Smith .seealso: DMDestroy(), DMView(), DMDACreate1d(), DMDACreate2d(), DMGlobalToLocalBegin(), DMDAGetRefinementFactor(), 1378aa219208SBarry Smith DMGlobalToLocalEnd(), DMLocalToGlobalBegin(), DMDALocalToLocalBegin(), DMDALocalToLocalEnd(), DMDASetRefinementFactor(), 1379d461ba97SBarry Smith DMDAGetInfo(), DMCreateGlobalVector(), DMCreateLocalVector(), DMDACreateNaturalVector(), DMLoad(), DMDAGetOwnershipRanges() 138047c6ae99SBarry Smith 138147c6ae99SBarry Smith @*/ 13821321219cSEthan Coon PetscErrorCode DMDACreate3d(MPI_Comm comm,DMDABoundaryType bx,DMDABoundaryType by,DMDABoundaryType bz,DMDAStencilType stencil_type,PetscInt M, 13839a42bb27SBarry Smith PetscInt N,PetscInt P,PetscInt m,PetscInt n,PetscInt p,PetscInt dof,PetscInt s,const PetscInt lx[],const PetscInt ly[],const PetscInt lz[],DM *da) 138447c6ae99SBarry Smith { 138547c6ae99SBarry Smith PetscErrorCode ierr; 138647c6ae99SBarry Smith 138747c6ae99SBarry Smith PetscFunctionBegin; 1388aa219208SBarry Smith ierr = DMDACreate(comm, da);CHKERRQ(ierr); 1389aa219208SBarry Smith ierr = DMDASetDim(*da, 3);CHKERRQ(ierr); 1390aa219208SBarry Smith ierr = DMDASetSizes(*da, M, N, P);CHKERRQ(ierr); 1391aa219208SBarry Smith ierr = DMDASetNumProcs(*da, m, n, p);CHKERRQ(ierr); 13921321219cSEthan Coon ierr = DMDASetBoundaryType(*da, bx, by, bz);CHKERRQ(ierr); 1393aa219208SBarry Smith ierr = DMDASetDof(*da, dof);CHKERRQ(ierr); 1394aa219208SBarry Smith ierr = DMDASetStencilType(*da, stencil_type);CHKERRQ(ierr); 1395aa219208SBarry Smith ierr = DMDASetStencilWidth(*da, s);CHKERRQ(ierr); 1396aa219208SBarry Smith ierr = DMDASetOwnershipRanges(*da, lx, ly, lz);CHKERRQ(ierr); 139747c6ae99SBarry Smith /* This violates the behavior for other classes, but right now users expect negative dimensions to be handled this way */ 13989a42bb27SBarry Smith ierr = 
DMSetFromOptions(*da);CHKERRQ(ierr); 13999a42bb27SBarry Smith ierr = DMSetUp(*da);CHKERRQ(ierr); 14007242296bSJed Brown ierr = DMView_DA_Private(*da);CHKERRQ(ierr); 140147c6ae99SBarry Smith PetscFunctionReturn(0); 140247c6ae99SBarry Smith } 1403