1c4762a1bSJed Brown 2c4762a1bSJed Brown static char help[] = "Tests MatIncreaseOverlap(), MatCreateSubMatrices() for parallel MatSBAIJ format.\n"; 3c4762a1bSJed Brown /* Example of usage: 4c4762a1bSJed Brown mpiexec -n 2 ./ex92 -nd 2 -ov 3 -mat_block_size 2 -view_id 0 -test_overlap -test_submat 5c4762a1bSJed Brown */ 6c4762a1bSJed Brown #include <petscmat.h> 7c4762a1bSJed Brown 8c4762a1bSJed Brown int main(int argc,char **args) 9c4762a1bSJed Brown { 10c4762a1bSJed Brown Mat A,Atrans,sA,*submatA,*submatsA; 11c4762a1bSJed Brown PetscErrorCode ierr; 12c4762a1bSJed Brown PetscMPIInt size,rank; 13c4762a1bSJed Brown PetscInt bs=1,mbs=10,ov=1,i,j,k,*rows,*cols,nd=2,*idx,rstart,rend,sz,M,N,Mbs; 14c4762a1bSJed Brown PetscScalar *vals,rval,one=1.0; 15c4762a1bSJed Brown IS *is1,*is2; 16c4762a1bSJed Brown PetscRandom rand; 17c4762a1bSJed Brown PetscBool flg,TestOverlap,TestSubMat,TestAllcols,test_sorted=PETSC_FALSE; 18c4762a1bSJed Brown PetscInt vid = -1; 19c4762a1bSJed Brown #if defined(PETSC_USE_LOG) 20c4762a1bSJed Brown PetscLogStage stages[2]; 21c4762a1bSJed Brown #endif 22c4762a1bSJed Brown 23c4762a1bSJed Brown ierr = PetscInitialize(&argc,&args,(char*)0,help);if (ierr) return ierr; 245f80ce2aSJacob Faibussowitsch CHKERRMPI(MPI_Comm_size(PETSC_COMM_WORLD,&size)); 255f80ce2aSJacob Faibussowitsch CHKERRMPI(MPI_Comm_rank(PETSC_COMM_WORLD,&rank)); 26c4762a1bSJed Brown 275f80ce2aSJacob Faibussowitsch CHKERRQ(PetscOptionsGetInt(NULL,NULL,"-mat_block_size",&bs,NULL)); 285f80ce2aSJacob Faibussowitsch CHKERRQ(PetscOptionsGetInt(NULL,NULL,"-mat_mbs",&mbs,NULL)); 295f80ce2aSJacob Faibussowitsch CHKERRQ(PetscOptionsGetInt(NULL,NULL,"-ov",&ov,NULL)); 305f80ce2aSJacob Faibussowitsch CHKERRQ(PetscOptionsGetInt(NULL,NULL,"-nd",&nd,NULL)); 315f80ce2aSJacob Faibussowitsch CHKERRQ(PetscOptionsGetInt(NULL,NULL,"-view_id",&vid,NULL)); 325f80ce2aSJacob Faibussowitsch CHKERRQ(PetscOptionsHasName(NULL,NULL, "-test_overlap", &TestOverlap)); 335f80ce2aSJacob Faibussowitsch CHKERRQ(PetscOptionsHasName(NULL,NULL, "-test_submat", &TestSubMat)); 345f80ce2aSJacob Faibussowitsch CHKERRQ(PetscOptionsHasName(NULL,NULL, "-test_allcols", &TestAllcols)); 355f80ce2aSJacob Faibussowitsch CHKERRQ(PetscOptionsGetBool(NULL,NULL,"-test_sorted",&test_sorted,NULL)); 36c4762a1bSJed Brown 375f80ce2aSJacob Faibussowitsch CHKERRQ(MatCreate(PETSC_COMM_WORLD,&A)); 385f80ce2aSJacob Faibussowitsch CHKERRQ(MatSetSizes(A,mbs*bs,mbs*bs,PETSC_DECIDE,PETSC_DECIDE)); 395f80ce2aSJacob Faibussowitsch CHKERRQ(MatSetType(A,MATBAIJ)); 405f80ce2aSJacob Faibussowitsch CHKERRQ(MatSeqBAIJSetPreallocation(A,bs,PETSC_DEFAULT,NULL)); 415f80ce2aSJacob Faibussowitsch CHKERRQ(MatMPIBAIJSetPreallocation(A,bs,PETSC_DEFAULT,NULL,PETSC_DEFAULT,NULL)); 42c4762a1bSJed Brown 435f80ce2aSJacob Faibussowitsch CHKERRQ(PetscRandomCreate(PETSC_COMM_WORLD,&rand)); 445f80ce2aSJacob Faibussowitsch CHKERRQ(PetscRandomSetFromOptions(rand)); 45c4762a1bSJed Brown 465f80ce2aSJacob Faibussowitsch CHKERRQ(MatGetOwnershipRange(A,&rstart,&rend)); 475f80ce2aSJacob Faibussowitsch CHKERRQ(MatGetSize(A,&M,&N)); 48c4762a1bSJed Brown Mbs = M/bs; 49c4762a1bSJed Brown 505f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(bs,&rows)); 515f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(bs,&cols)); 525f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(bs*bs,&vals)); 535f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(M,&idx)); 54c4762a1bSJed Brown 55c4762a1bSJed Brown /* Now set blocks of values */ 56c4762a1bSJed Brown for (j=0; j<bs*bs; j++) vals[j] = 0.0; 57c4762a1bSJed Brown for (i=0; i<Mbs; i++) { 58c4762a1bSJed Brown cols[0] = i*bs; rows[0] = i*bs; 59c4762a1bSJed Brown for (j=1; j<bs; j++) { 60c4762a1bSJed Brown rows[j] = rows[j-1]+1; 61c4762a1bSJed Brown cols[j] = cols[j-1]+1; 62c4762a1bSJed Brown } 635f80ce2aSJacob Faibussowitsch CHKERRQ(MatSetValues(A,bs,rows,bs,cols,vals,ADD_VALUES)); 64c4762a1bSJed Brown } 65c4762a1bSJed Brown /* second, add random blocks */ 66c4762a1bSJed Brown for (i=0; i<20*bs; i++) { 675f80ce2aSJacob Faibussowitsch CHKERRQ(PetscRandomGetValue(rand,&rval)); 68c4762a1bSJed Brown cols[0] = bs*(PetscInt)(PetscRealPart(rval)*Mbs); 695f80ce2aSJacob Faibussowitsch CHKERRQ(PetscRandomGetValue(rand,&rval)); 70c4762a1bSJed Brown rows[0] = rstart + bs*(PetscInt)(PetscRealPart(rval)*mbs); 71c4762a1bSJed Brown for (j=1; j<bs; j++) { 72c4762a1bSJed Brown rows[j] = rows[j-1]+1; 73c4762a1bSJed Brown cols[j] = cols[j-1]+1; 74c4762a1bSJed Brown } 75c4762a1bSJed Brown 76c4762a1bSJed Brown for (j=0; j<bs*bs; j++) { 775f80ce2aSJacob Faibussowitsch CHKERRQ(PetscRandomGetValue(rand,&rval)); 78c4762a1bSJed Brown vals[j] = rval; 79c4762a1bSJed Brown } 805f80ce2aSJacob Faibussowitsch CHKERRQ(MatSetValues(A,bs,rows,bs,cols,vals,ADD_VALUES)); 81c4762a1bSJed Brown } 82c4762a1bSJed Brown 835f80ce2aSJacob Faibussowitsch CHKERRQ(MatAssemblyBegin(A,MAT_FINAL_ASSEMBLY)); 845f80ce2aSJacob Faibussowitsch CHKERRQ(MatAssemblyEnd(A,MAT_FINAL_ASSEMBLY)); 85c4762a1bSJed Brown 86c4762a1bSJed Brown /* make A a symmetric matrix: A <- A^T + A */ 875f80ce2aSJacob Faibussowitsch CHKERRQ(MatTranspose(A,MAT_INITIAL_MATRIX, &Atrans)); 885f80ce2aSJacob Faibussowitsch CHKERRQ(MatAXPY(A,one,Atrans,DIFFERENT_NONZERO_PATTERN)); 895f80ce2aSJacob Faibussowitsch CHKERRQ(MatDestroy(&Atrans)); 905f80ce2aSJacob Faibussowitsch CHKERRQ(MatTranspose(A,MAT_INITIAL_MATRIX, &Atrans)); 915f80ce2aSJacob Faibussowitsch CHKERRQ(MatEqual(A, Atrans, &flg)); 92c4762a1bSJed Brown if (flg) { 935f80ce2aSJacob Faibussowitsch CHKERRQ(MatSetOption(A,MAT_SYMMETRIC,PETSC_TRUE)); 94c4762a1bSJed Brown } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"A+A^T is non-symmetric"); 955f80ce2aSJacob Faibussowitsch CHKERRQ(MatDestroy(&Atrans)); 96c4762a1bSJed Brown 97c4762a1bSJed Brown /* create a SeqSBAIJ matrix sA (= A) */ 985f80ce2aSJacob Faibussowitsch CHKERRQ(MatConvert(A,MATSBAIJ,MAT_INITIAL_MATRIX,&sA)); 99c4762a1bSJed Brown if (vid >= 0 && vid < size) { 1005f80ce2aSJacob Faibussowitsch CHKERRQ(PetscViewerASCIIPrintf(PETSC_VIEWER_STDOUT_WORLD,"A:\n")); 1015f80ce2aSJacob Faibussowitsch CHKERRQ(MatView(A,PETSC_VIEWER_STDOUT_WORLD)); 1025f80ce2aSJacob Faibussowitsch CHKERRQ(PetscViewerASCIIPrintf(PETSC_VIEWER_STDOUT_WORLD,"sA:\n")); 1035f80ce2aSJacob Faibussowitsch CHKERRQ(MatView(sA,PETSC_VIEWER_STDOUT_WORLD)); 104c4762a1bSJed Brown } 105c4762a1bSJed Brown 106c4762a1bSJed Brown /* Test sA==A through MatMult() */ 1075f80ce2aSJacob Faibussowitsch CHKERRQ(MatMultEqual(A,sA,10,&flg)); 108*28b400f6SJacob Faibussowitsch PetscCheck(flg,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONG,"Error in MatConvert(): A != sA"); 109c4762a1bSJed Brown 110c4762a1bSJed Brown /* Test MatIncreaseOverlap() */ 1115f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(nd,&is1)); 1125f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(nd,&is2)); 113c4762a1bSJed Brown 114c4762a1bSJed Brown for (i=0; i<nd; i++) { 115c4762a1bSJed Brown if (!TestAllcols) { 1165f80ce2aSJacob Faibussowitsch CHKERRQ(PetscRandomGetValue(rand,&rval)); 117c4762a1bSJed Brown sz = (PetscInt)((0.5+0.2*PetscRealPart(rval))*mbs); /* 0.5*mbs < sz < 0.7*mbs */ 118c4762a1bSJed Brown 119c4762a1bSJed Brown for (j=0; j<sz; j++) { 1205f80ce2aSJacob Faibussowitsch CHKERRQ(PetscRandomGetValue(rand,&rval)); 121c4762a1bSJed Brown idx[j*bs] = bs*(PetscInt)(PetscRealPart(rval)*Mbs); 122c4762a1bSJed Brown for (k=1; k<bs; k++) idx[j*bs+k] = idx[j*bs]+k; 123c4762a1bSJed Brown } 1245f80ce2aSJacob Faibussowitsch CHKERRQ(ISCreateGeneral(PETSC_COMM_SELF,sz*bs,idx,PETSC_COPY_VALUES,is1+i)); 1255f80ce2aSJacob Faibussowitsch CHKERRQ(ISCreateGeneral(PETSC_COMM_SELF,sz*bs,idx,PETSC_COPY_VALUES,is2+i)); 126c4762a1bSJed Brown if (rank == vid) { 1275f80ce2aSJacob Faibussowitsch CHKERRQ(PetscPrintf(PETSC_COMM_SELF," [%d] IS sz[%" PetscInt_FMT "]: %" PetscInt_FMT "\n",rank,i,sz)); 1285f80ce2aSJacob Faibussowitsch CHKERRQ(ISView(is2[i],PETSC_VIEWER_STDOUT_SELF)); 129c4762a1bSJed Brown } 130a5b23f4aSJose E. Roman } else { /* Test all rows and columns */ 131c4762a1bSJed Brown sz = M; 1325f80ce2aSJacob Faibussowitsch CHKERRQ(ISCreateStride(PETSC_COMM_SELF,sz,0,1,is1+i)); 1335f80ce2aSJacob Faibussowitsch CHKERRQ(ISCreateStride(PETSC_COMM_SELF,sz,0,1,is2+i)); 134c4762a1bSJed Brown 135c4762a1bSJed Brown if (rank == vid) { 136c4762a1bSJed Brown PetscBool colflag; 1375f80ce2aSJacob Faibussowitsch CHKERRQ(ISIdentity(is2[i],&colflag)); 1385f80ce2aSJacob Faibussowitsch CHKERRQ(PetscPrintf(PETSC_COMM_SELF,"[%d] is2[%" PetscInt_FMT "], colflag %d\n",rank,i,colflag)); 1395f80ce2aSJacob Faibussowitsch CHKERRQ(ISView(is2[i],PETSC_VIEWER_STDOUT_SELF)); 140c4762a1bSJed Brown } 141c4762a1bSJed Brown } 142c4762a1bSJed Brown } 143c4762a1bSJed Brown 1445f80ce2aSJacob Faibussowitsch CHKERRQ(PetscLogStageRegister("MatOv_SBAIJ",&stages[0])); 1455f80ce2aSJacob Faibussowitsch CHKERRQ(PetscLogStageRegister("MatOv_BAIJ",&stages[1])); 146c4762a1bSJed Brown 147c4762a1bSJed Brown /* Test MatIncreaseOverlap */ 148c4762a1bSJed Brown if (TestOverlap) { 1495f80ce2aSJacob Faibussowitsch CHKERRQ(PetscLogStagePush(stages[0])); 1505f80ce2aSJacob Faibussowitsch CHKERRQ(MatIncreaseOverlap(sA,nd,is2,ov)); 1515f80ce2aSJacob Faibussowitsch CHKERRQ(PetscLogStagePop()); 152c4762a1bSJed Brown 1535f80ce2aSJacob Faibussowitsch CHKERRQ(PetscLogStagePush(stages[1])); 1545f80ce2aSJacob Faibussowitsch CHKERRQ(MatIncreaseOverlap(A,nd,is1,ov)); 1555f80ce2aSJacob Faibussowitsch CHKERRQ(PetscLogStagePop()); 156c4762a1bSJed Brown 157c4762a1bSJed Brown if (rank == vid) { 1585f80ce2aSJacob Faibussowitsch CHKERRQ(PetscPrintf(PETSC_COMM_SELF,"\n[%d] IS from BAIJ:\n",rank)); 1595f80ce2aSJacob Faibussowitsch CHKERRQ(ISView(is1[0],PETSC_VIEWER_STDOUT_SELF)); 1605f80ce2aSJacob Faibussowitsch CHKERRQ(PetscPrintf(PETSC_COMM_SELF,"\n[%d] IS from SBAIJ:\n",rank)); 1615f80ce2aSJacob Faibussowitsch CHKERRQ(ISView(is2[0],PETSC_VIEWER_STDOUT_SELF)); 162c4762a1bSJed Brown } 163c4762a1bSJed Brown 164c4762a1bSJed Brown for (i=0; i<nd; ++i) { 1655f80ce2aSJacob Faibussowitsch CHKERRQ(ISEqual(is1[i],is2[i],&flg)); 166c4762a1bSJed Brown if (!flg) { 167dd400576SPatrick Sanan if (rank == 0) { 1685f80ce2aSJacob Faibussowitsch CHKERRQ(ISSort(is1[i])); 1695f80ce2aSJacob Faibussowitsch CHKERRQ(ISSort(is2[i])); 170c4762a1bSJed Brown } 17198921bdaSJacob Faibussowitsch SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"i=%" PetscInt_FMT ", is1 != is2",i); 172c4762a1bSJed Brown } 173c4762a1bSJed Brown } 174c4762a1bSJed Brown } 175c4762a1bSJed Brown 176c4762a1bSJed Brown /* Test MatCreateSubmatrices */ 177c4762a1bSJed Brown if (TestSubMat) { 178c4762a1bSJed Brown if (test_sorted) { 179c4762a1bSJed Brown for (i = 0; i < nd; ++i) { 1805f80ce2aSJacob Faibussowitsch CHKERRQ(ISSort(is1[i])); 181c4762a1bSJed Brown } 182c4762a1bSJed Brown } 1835f80ce2aSJacob Faibussowitsch CHKERRQ(MatCreateSubMatrices(A,nd,is1,is1,MAT_INITIAL_MATRIX,&submatA)); 1845f80ce2aSJacob Faibussowitsch CHKERRQ(MatCreateSubMatrices(sA,nd,is1,is1,MAT_INITIAL_MATRIX,&submatsA)); 185c4762a1bSJed Brown 1865f80ce2aSJacob Faibussowitsch CHKERRQ(MatMultEqual(A,sA,10,&flg)); 187*28b400f6SJacob Faibussowitsch PetscCheck(flg,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"A != sA"); 188c4762a1bSJed Brown 189c4762a1bSJed Brown /* Now test MatCreateSubmatrices with MAT_REUSE_MATRIX option */ 1905f80ce2aSJacob Faibussowitsch CHKERRQ(MatCreateSubMatrices(A,nd,is1,is1,MAT_REUSE_MATRIX,&submatA)); 1915f80ce2aSJacob Faibussowitsch CHKERRQ(MatCreateSubMatrices(sA,nd,is1,is1,MAT_REUSE_MATRIX,&submatsA)); 1925f80ce2aSJacob Faibussowitsch CHKERRQ(MatMultEqual(A,sA,10,&flg)); 193*28b400f6SJacob Faibussowitsch PetscCheck(flg,PETSC_COMM_SELF,PETSC_ERR_ARG_WRONGSTATE,"MatCreateSubmatrices(): A != sA"); 194c4762a1bSJed Brown 1955f80ce2aSJacob Faibussowitsch CHKERRQ(MatDestroySubMatrices(nd,&submatA)); 1965f80ce2aSJacob Faibussowitsch CHKERRQ(MatDestroySubMatrices(nd,&submatsA)); 197c4762a1bSJed Brown } 198c4762a1bSJed Brown 199c4762a1bSJed Brown /* Free allocated memory */ 200c4762a1bSJed Brown for (i=0; i<nd; ++i) { 2015f80ce2aSJacob Faibussowitsch CHKERRQ(ISDestroy(&is1[i])); 2025f80ce2aSJacob Faibussowitsch CHKERRQ(ISDestroy(&is2[i])); 203c4762a1bSJed Brown } 2045f80ce2aSJacob Faibussowitsch CHKERRQ(PetscFree(is1)); 2055f80ce2aSJacob Faibussowitsch CHKERRQ(PetscFree(is2)); 2065f80ce2aSJacob Faibussowitsch CHKERRQ(PetscFree(idx)); 2075f80ce2aSJacob Faibussowitsch CHKERRQ(PetscFree(rows)); 2085f80ce2aSJacob Faibussowitsch CHKERRQ(PetscFree(cols)); 2095f80ce2aSJacob Faibussowitsch CHKERRQ(PetscFree(vals)); 2105f80ce2aSJacob Faibussowitsch CHKERRQ(MatDestroy(&A)); 2115f80ce2aSJacob Faibussowitsch CHKERRQ(MatDestroy(&sA)); 2125f80ce2aSJacob Faibussowitsch CHKERRQ(PetscRandomDestroy(&rand)); 213c4762a1bSJed Brown ierr = PetscFinalize(); 214c4762a1bSJed Brown return ierr; 215c4762a1bSJed Brown } 216c4762a1bSJed Brown 217c4762a1bSJed Brown /*TEST 218c4762a1bSJed Brown 219c4762a1bSJed Brown test: 220c4762a1bSJed Brown args: -ov {{1 3}} -mat_block_size {{2 8}} -test_overlap -test_submat 221c4762a1bSJed Brown output_file: output/ex92_1.out 222c4762a1bSJed Brown 223c4762a1bSJed Brown test: 224c4762a1bSJed Brown suffix: 2 225c4762a1bSJed Brown nsize: {{3 4}} 226c4762a1bSJed Brown args: -ov {{1 3}} -mat_block_size {{2 8}} -test_overlap -test_submat 227c4762a1bSJed Brown output_file: output/ex92_1.out 228c4762a1bSJed Brown 229c4762a1bSJed Brown test: 230c4762a1bSJed Brown suffix: 3 231c4762a1bSJed Brown nsize: {{3 4}} 232c4762a1bSJed Brown args: -ov {{1 3}} -mat_block_size {{2 8}} -test_overlap -test_allcols 233c4762a1bSJed Brown output_file: output/ex92_1.out 234c4762a1bSJed Brown 235c4762a1bSJed Brown test: 236c4762a1bSJed Brown suffix: 3_sorted 237c4762a1bSJed Brown nsize: {{3 4}} 238c4762a1bSJed Brown args: -ov {{1 3}} -mat_block_size {{2 8}} -test_overlap -test_allcols -test_sorted 239c4762a1bSJed Brown output_file: output/ex92_1.out 240c4762a1bSJed Brown 241c4762a1bSJed Brown test: 242c4762a1bSJed Brown suffix: 4 243c4762a1bSJed Brown nsize: {{3 4}} 244c4762a1bSJed Brown args: -ov {{1 3}} -mat_block_size {{2 8}} -test_submat -test_allcols 245c4762a1bSJed Brown output_file: output/ex92_1.out 246c4762a1bSJed Brown 247c4762a1bSJed Brown TEST*/ 248