1c4762a1bSJed Brown 2c4762a1bSJed Brown static char help[] = "Tests MatCreateSubmatrix() in parallel."; 3c4762a1bSJed Brown 4c4762a1bSJed Brown #include <petscmat.h> 5c4762a1bSJed Brown #include <../src/mat/impls/aij/mpi/mpiaij.h> 6c4762a1bSJed Brown 7c4762a1bSJed Brown PetscErrorCode ISGetSeqIS_SameColDist_Private(Mat mat,IS isrow,IS iscol,IS *isrow_d,IS *iscol_d,IS *iscol_o,const PetscInt *garray[]) 8c4762a1bSJed Brown { 9c4762a1bSJed Brown PetscErrorCode ierr; 10c4762a1bSJed Brown Vec x,cmap; 11c4762a1bSJed Brown const PetscInt *is_idx; 12c4762a1bSJed Brown PetscScalar *xarray,*cmaparray; 13c4762a1bSJed Brown PetscInt ncols,isstart,*idx,m,rstart,count; 14c4762a1bSJed Brown Mat_MPIAIJ *a=(Mat_MPIAIJ*)mat->data; 15c4762a1bSJed Brown Mat B=a->B; 16c4762a1bSJed Brown Vec lvec=a->lvec,lcmap; 17c4762a1bSJed Brown PetscInt i,cstart,cend,Bn=B->cmap->N; 18c4762a1bSJed Brown MPI_Comm comm; 19c4762a1bSJed Brown PetscMPIInt rank; 20c4762a1bSJed Brown VecScatter Mvctx; 21c4762a1bSJed Brown 22c4762a1bSJed Brown PetscFunctionBegin; 23c4762a1bSJed Brown ierr = PetscObjectGetComm((PetscObject)mat,&comm);CHKERRQ(ierr); 24ffc4695bSBarry Smith ierr = MPI_Comm_rank(comm,&rank);CHKERRMPI(ierr); 25c4762a1bSJed Brown ierr = ISGetLocalSize(iscol,&ncols);CHKERRQ(ierr); 26c4762a1bSJed Brown 27c4762a1bSJed Brown /* (1) iscol is a sub-column vector of mat, pad it with '-1.' to form a full vector x */ 28c4762a1bSJed Brown ierr = MatCreateVecs(mat,&x,NULL);CHKERRQ(ierr); 29c4762a1bSJed Brown ierr = VecDuplicate(x,&cmap);CHKERRQ(ierr); 30c4762a1bSJed Brown ierr = VecSet(x,-1.0);CHKERRQ(ierr); 31c4762a1bSJed Brown ierr = VecSet(cmap,-1.0);CHKERRQ(ierr); 32c4762a1bSJed Brown 33c4762a1bSJed Brown ierr = VecDuplicate(lvec,&lcmap);CHKERRQ(ierr); 34c4762a1bSJed Brown 35c4762a1bSJed Brown /* Get start indices */ 36ffc4695bSBarry Smith ierr = MPI_Scan(&ncols,&isstart,1,MPIU_INT,MPI_SUM,comm);CHKERRMPI(ierr); 37c4762a1bSJed Brown isstart -= ncols; 38c4762a1bSJed Brown ierr = MatGetOwnershipRangeColumn(mat,&cstart,&cend);CHKERRQ(ierr); 39c4762a1bSJed Brown 40c4762a1bSJed Brown ierr = ISGetIndices(iscol,&is_idx);CHKERRQ(ierr); 41c4762a1bSJed Brown ierr = VecGetArray(x,&xarray);CHKERRQ(ierr); 42c4762a1bSJed Brown ierr = VecGetArray(cmap,&cmaparray);CHKERRQ(ierr); 43c4762a1bSJed Brown ierr = PetscMalloc1(ncols,&idx);CHKERRQ(ierr); 44c4762a1bSJed Brown for (i=0; i<ncols; i++) { 45c4762a1bSJed Brown xarray[is_idx[i]-cstart] = (PetscScalar)is_idx[i]; 46c4762a1bSJed Brown cmaparray[is_idx[i]-cstart] = (PetscScalar)(i + isstart); /* global index of iscol[i] */ 47c4762a1bSJed Brown idx[i] = is_idx[i]-cstart; /* local index of iscol[i] */ 48c4762a1bSJed Brown } 49c4762a1bSJed Brown ierr = VecRestoreArray(x,&xarray);CHKERRQ(ierr); 50c4762a1bSJed Brown ierr = VecRestoreArray(cmap,&cmaparray);CHKERRQ(ierr); 51c4762a1bSJed Brown ierr = ISRestoreIndices(iscol,&is_idx);CHKERRQ(ierr); 52c4762a1bSJed Brown 53c4762a1bSJed Brown /* Get iscol_d */ 54c4762a1bSJed Brown ierr = ISCreateGeneral(PETSC_COMM_SELF,ncols,idx,PETSC_OWN_POINTER,iscol_d);CHKERRQ(ierr); 55c4762a1bSJed Brown ierr = ISGetBlockSize(iscol,&i);CHKERRQ(ierr); 56c4762a1bSJed Brown ierr = ISSetBlockSize(*iscol_d,i);CHKERRQ(ierr); 57c4762a1bSJed Brown 58c4762a1bSJed Brown /* Get isrow_d */ 59c4762a1bSJed Brown ierr = ISGetLocalSize(isrow,&m);CHKERRQ(ierr); 60c4762a1bSJed Brown rstart = mat->rmap->rstart; 61c4762a1bSJed Brown ierr = PetscMalloc1(m,&idx);CHKERRQ(ierr); 62c4762a1bSJed Brown ierr = ISGetIndices(isrow,&is_idx);CHKERRQ(ierr); 63c4762a1bSJed Brown for (i=0; i<m; i++) idx[i] = is_idx[i]-rstart; 64c4762a1bSJed Brown ierr = ISRestoreIndices(isrow,&is_idx);CHKERRQ(ierr); 65c4762a1bSJed Brown 66c4762a1bSJed Brown ierr = ISCreateGeneral(PETSC_COMM_SELF,m,idx,PETSC_OWN_POINTER,isrow_d);CHKERRQ(ierr); 67c4762a1bSJed Brown ierr = ISGetBlockSize(isrow,&i);CHKERRQ(ierr); 68c4762a1bSJed Brown ierr = ISSetBlockSize(*isrow_d,i);CHKERRQ(ierr); 69c4762a1bSJed Brown 70c4762a1bSJed Brown /* (2) Scatter x and cmap using aij->Mvctx to get their off-process portions (see MatMult_MPIAIJ) */ 71c4762a1bSJed Brown #if 0 72c4762a1bSJed Brown if (!a->Mvctx_mpi1) { 73c4762a1bSJed Brown /* a->Mvctx causes random 'count' in o-build? See src/mat/tests/runex59_2 */ 74c4762a1bSJed Brown a->Mvctx_mpi1_flg = PETSC_TRUE; 75c4762a1bSJed Brown ierr = MatSetUpMultiply_MPIAIJ(mat);CHKERRQ(ierr); 76c4762a1bSJed Brown } 77c4762a1bSJed Brown Mvctx = a->Mvctx_mpi1; 78c4762a1bSJed Brown #endif 79c4762a1bSJed Brown Mvctx = a->Mvctx; 80c4762a1bSJed Brown ierr = VecScatterBegin(Mvctx,x,lvec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 81c4762a1bSJed Brown ierr = VecScatterEnd(Mvctx,x,lvec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 82c4762a1bSJed Brown 83c4762a1bSJed Brown ierr = VecScatterBegin(Mvctx,cmap,lcmap,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 84c4762a1bSJed Brown ierr = VecScatterEnd(Mvctx,cmap,lcmap,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 85c4762a1bSJed Brown 86c4762a1bSJed Brown /* (3) create sequential iscol_o (a subset of iscol) and isgarray */ 87c4762a1bSJed Brown /* off-process column indices */ 88c4762a1bSJed Brown count = 0; 89c4762a1bSJed Brown PetscInt *cmap1; 90c4762a1bSJed Brown ierr = PetscMalloc1(Bn,&idx);CHKERRQ(ierr); 91c4762a1bSJed Brown ierr = PetscMalloc1(Bn,&cmap1);CHKERRQ(ierr); 92c4762a1bSJed Brown 93c4762a1bSJed Brown ierr = VecGetArray(lvec,&xarray);CHKERRQ(ierr); 94c4762a1bSJed Brown ierr = VecGetArray(lcmap,&cmaparray);CHKERRQ(ierr); 95c4762a1bSJed Brown for (i=0; i<Bn; i++) { 96c4762a1bSJed Brown if (PetscRealPart(xarray[i]) > -1.0) { 97c4762a1bSJed Brown idx[count] = i; /* local column index in off-diagonal part B */ 98c4762a1bSJed Brown cmap1[count] = (PetscInt)(PetscRealPart(cmaparray[i])); /* column index in submat */ 99c4762a1bSJed Brown count++; 100c4762a1bSJed Brown } 101c4762a1bSJed Brown } 102c4762a1bSJed Brown printf("[%d] Bn %d, count %d\n",rank,Bn,count); 103c4762a1bSJed Brown ierr = VecRestoreArray(lvec,&xarray);CHKERRQ(ierr); 104c4762a1bSJed Brown ierr = VecRestoreArray(lcmap,&cmaparray);CHKERRQ(ierr); 105c4762a1bSJed Brown if (count != 6) { 106c4762a1bSJed Brown printf("[%d] count %d != 6 lvec:\n",rank,count); 107c4762a1bSJed Brown ierr = VecView(lvec,0);CHKERRQ(ierr); 108c4762a1bSJed Brown 109c4762a1bSJed Brown printf("[%d] count %d != 6 lcmap:\n",rank,count); 110c4762a1bSJed Brown ierr = VecView(lcmap,0);CHKERRQ(ierr); 111*98921bdaSJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"count %d != 6",count); 112c4762a1bSJed Brown } 113c4762a1bSJed Brown 114c4762a1bSJed Brown ierr = ISCreateGeneral(PETSC_COMM_SELF,count,idx,PETSC_COPY_VALUES,iscol_o);CHKERRQ(ierr); 115c4762a1bSJed Brown /* cannot ensure iscol_o has same blocksize as iscol! */ 116c4762a1bSJed Brown 117c4762a1bSJed Brown ierr = PetscFree(idx);CHKERRQ(ierr); 118c4762a1bSJed Brown 119c4762a1bSJed Brown *garray = cmap1; 120c4762a1bSJed Brown 121c4762a1bSJed Brown ierr = VecDestroy(&x);CHKERRQ(ierr); 122c4762a1bSJed Brown ierr = VecDestroy(&cmap);CHKERRQ(ierr); 123c4762a1bSJed Brown ierr = VecDestroy(&lcmap);CHKERRQ(ierr); 124c4762a1bSJed Brown PetscFunctionReturn(0); 125c4762a1bSJed Brown } 126c4762a1bSJed Brown 127c4762a1bSJed Brown int main(int argc,char **args) 128c4762a1bSJed Brown { 129c4762a1bSJed Brown Mat C,A; 130c4762a1bSJed Brown PetscInt i,j,m = 3,n = 2,rstart,rend; 131c4762a1bSJed Brown PetscMPIInt size,rank; 132c4762a1bSJed Brown PetscErrorCode ierr; 133c4762a1bSJed Brown PetscScalar v; 134c4762a1bSJed Brown IS isrow,iscol; 135c4762a1bSJed Brown 136c4762a1bSJed Brown ierr = PetscInitialize(&argc,&args,(char*)0,help);if (ierr) return ierr; 137ffc4695bSBarry Smith ierr = MPI_Comm_rank(PETSC_COMM_WORLD,&rank);CHKERRMPI(ierr); 138ffc4695bSBarry Smith ierr = MPI_Comm_size(PETSC_COMM_WORLD,&size);CHKERRMPI(ierr); 139c4762a1bSJed Brown n = 2*size; 140c4762a1bSJed Brown 141c4762a1bSJed Brown ierr = MatCreate(PETSC_COMM_WORLD,&C);CHKERRQ(ierr); 142c4762a1bSJed Brown ierr = MatSetSizes(C,PETSC_DECIDE,PETSC_DECIDE,m*n,m*n);CHKERRQ(ierr); 143c4762a1bSJed Brown ierr = MatSetFromOptions(C);CHKERRQ(ierr); 144c4762a1bSJed Brown ierr = MatSetUp(C);CHKERRQ(ierr); 145c4762a1bSJed Brown 146c4762a1bSJed Brown /* 147c4762a1bSJed Brown This is JUST to generate a nice test matrix, all processors fill up 148c4762a1bSJed Brown the entire matrix. This is not something one would ever do in practice. 149c4762a1bSJed Brown */ 150c4762a1bSJed Brown ierr = MatGetOwnershipRange(C,&rstart,&rend);CHKERRQ(ierr); 151c4762a1bSJed Brown for (i=rstart; i<rend; i++) { 152c4762a1bSJed Brown for (j=0; j<m*n; j++) { 153c4762a1bSJed Brown v = i + j + 1; 154c4762a1bSJed Brown ierr = MatSetValues(C,1,&i,1,&j,&v,INSERT_VALUES);CHKERRQ(ierr); 155c4762a1bSJed Brown } 156c4762a1bSJed Brown } 157c4762a1bSJed Brown 158c4762a1bSJed Brown ierr = MatAssemblyBegin(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 159c4762a1bSJed Brown ierr = MatAssemblyEnd(C,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 160c4762a1bSJed Brown 161c4762a1bSJed Brown /* 162c4762a1bSJed Brown Generate a new matrix consisting of every second row and column of 163c4762a1bSJed Brown the original matrix 164c4762a1bSJed Brown */ 165c4762a1bSJed Brown ierr = MatGetOwnershipRange(C,&rstart,&rend);CHKERRQ(ierr); 166c4762a1bSJed Brown /* Create parallel IS with the rows we want on THIS processor */ 167c4762a1bSJed Brown ierr = ISCreateStride(PETSC_COMM_WORLD,(rend-rstart)/2,rstart,2,&isrow);CHKERRQ(ierr); 168c4762a1bSJed Brown /* Create parallel IS with the rows we want on THIS processor (same as rows for now) */ 169c4762a1bSJed Brown ierr = ISCreateStride(PETSC_COMM_WORLD,(rend-rstart)/2,rstart,2,&iscol);CHKERRQ(ierr); 170c4762a1bSJed Brown 171c4762a1bSJed Brown IS iscol_d,isrow_d,iscol_o; 172c4762a1bSJed Brown const PetscInt *garray; 173c4762a1bSJed Brown ierr = ISGetSeqIS_SameColDist_Private(C,isrow,iscol,&isrow_d,&iscol_d,&iscol_o,&garray);CHKERRQ(ierr); 174c4762a1bSJed Brown 175c4762a1bSJed Brown ierr = ISDestroy(&isrow_d);CHKERRQ(ierr); 176c4762a1bSJed Brown ierr = ISDestroy(&iscol_d);CHKERRQ(ierr); 177c4762a1bSJed Brown ierr = ISDestroy(&iscol_o);CHKERRQ(ierr); 178c4762a1bSJed Brown ierr = PetscFree(garray);CHKERRQ(ierr); 179c4762a1bSJed Brown 180c4762a1bSJed Brown ierr = MatCreateSubMatrix(C,isrow,iscol,MAT_INITIAL_MATRIX,&A);CHKERRQ(ierr); 181c4762a1bSJed Brown ierr = MatCreateSubMatrix(C,isrow,iscol,MAT_REUSE_MATRIX,&A);CHKERRQ(ierr); 182c4762a1bSJed Brown 183c4762a1bSJed Brown ierr = ISDestroy(&isrow);CHKERRQ(ierr); 184c4762a1bSJed Brown ierr = ISDestroy(&iscol);CHKERRQ(ierr); 185c4762a1bSJed Brown ierr = MatDestroy(&A);CHKERRQ(ierr); 186c4762a1bSJed Brown ierr = MatDestroy(&C);CHKERRQ(ierr); 187c4762a1bSJed Brown ierr = PetscFinalize(); 188c4762a1bSJed Brown return ierr; 189c4762a1bSJed Brown } 190