1c4762a1bSJed Brown static char help[]= "Test PetscSFFCompose when the ilocal arrays are not identity nor dense\n\n"; 2c4762a1bSJed Brown 3c4762a1bSJed Brown #include <petsc.h> 4c4762a1bSJed Brown #include <petscsf.h> 5c4762a1bSJed Brown 6c4762a1bSJed Brown int main(int argc, char **argv) 7c4762a1bSJed Brown { 8c4762a1bSJed Brown PetscSF sfA, sfB, sfBA, sfAAm, sfBBm, sfAm, sfBm; 9c4762a1bSJed Brown PetscInt nrootsA, nleavesA, nrootsB, nleavesB; 10c4762a1bSJed Brown PetscInt *ilocalA, *ilocalB; 11c4762a1bSJed Brown PetscSFNode *iremoteA, *iremoteB; 12c4762a1bSJed Brown PetscMPIInt rank,size; 13c4762a1bSJed Brown PetscInt i,m,n,k,nl = 2,mA,mB,nldataA,nldataB; 14c4762a1bSJed Brown PetscInt *rdA,*rdB,*ldA,*ldB; 15c4762a1bSJed Brown PetscBool inverse = PETSC_FALSE; 16c4762a1bSJed Brown 17*b122ec5aSJacob Faibussowitsch CHKERRQ(PetscInitialize(&argc,&argv,NULL,help)); 185f80ce2aSJacob Faibussowitsch CHKERRQ(PetscOptionsGetInt(NULL,NULL,"-nl",&nl,NULL)); 195f80ce2aSJacob Faibussowitsch CHKERRQ(PetscOptionsGetBool(NULL,NULL,"-explicit_inverse",&inverse,NULL)); 205f80ce2aSJacob Faibussowitsch CHKERRMPI(MPI_Comm_size(PETSC_COMM_WORLD,&size)); 215f80ce2aSJacob Faibussowitsch CHKERRMPI(MPI_Comm_rank(PETSC_COMM_WORLD,&rank)); 22c4762a1bSJed Brown 235f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFCreate(PETSC_COMM_WORLD, &sfA)); 245f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFCreate(PETSC_COMM_WORLD, &sfB)); 255f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFSetFromOptions(sfA)); 265f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFSetFromOptions(sfB)); 27c4762a1bSJed Brown 28c4762a1bSJed Brown n = 4*nl*size; 29c4762a1bSJed Brown m = 2*nl; 30c4762a1bSJed Brown k = nl; 31c4762a1bSJed Brown 32dd400576SPatrick Sanan nldataA = rank == 0 ? n : 0; 33c4762a1bSJed Brown nldataB = 3*nl; 34c4762a1bSJed Brown 35c4762a1bSJed Brown nrootsA = m; 36dd400576SPatrick Sanan nleavesA = rank == 0 ? size*m : 0; 37dd400576SPatrick Sanan nrootsB = rank == 0 ? n : 0; 38c4762a1bSJed Brown nleavesB = k; 39c4762a1bSJed Brown 405f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(nleavesA, &ilocalA)); 415f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(nleavesA, &iremoteA)); 425f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(nleavesB, &ilocalB)); 435f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc1(nleavesB, &iremoteB)); 44c4762a1bSJed Brown 45c4762a1bSJed Brown /* sf A bcast is equivalent to a sparse gather on process 0 46c4762a1bSJed Brown process 0 receives data in the middle [nl,3*nl] of the leaf data array for A */ 47c4762a1bSJed Brown for (i = 0; i < nleavesA; i++) { 48c4762a1bSJed Brown iremoteA[i].rank = i/m; 49c4762a1bSJed Brown iremoteA[i].index = i%m; 50c4762a1bSJed Brown ilocalA[i] = nl + i/m * 4*nl + i%m; 51c4762a1bSJed Brown } 52c4762a1bSJed Brown 53c4762a1bSJed Brown /* sf B bcast is equivalent to a sparse scatter from process 0 54c4762a1bSJed Brown process 0 sends data from [nl,2*nl] of the leaf data array for A 55c4762a1bSJed Brown each process receives, in reverse order, in the middle [nl,2*nl] of the leaf data array for B */ 56c4762a1bSJed Brown for (i = 0; i < nleavesB; i++) { 57c4762a1bSJed Brown iremoteB[i].rank = 0; 58c4762a1bSJed Brown iremoteB[i].index = rank * 4*nl + nl + i%m; 59c4762a1bSJed Brown ilocalB[i] = 2*nl - i - 1; 60c4762a1bSJed Brown } 615f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFSetGraph(sfA, nrootsA, nleavesA, ilocalA, PETSC_OWN_POINTER, iremoteA, PETSC_OWN_POINTER)); 625f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFSetGraph(sfB, nrootsB, nleavesB, ilocalB, PETSC_OWN_POINTER, iremoteB, PETSC_OWN_POINTER)); 635f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFSetUp(sfA)); 645f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFSetUp(sfB)); 655f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectSetName((PetscObject)sfA, "sfA")); 665f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectSetName((PetscObject)sfB, "sfB")); 675f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFViewFromOptions(sfA, NULL, "-view")); 685f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFViewFromOptions(sfB, NULL, "-view")); 69c4762a1bSJed Brown 705f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFGetLeafRange(sfA, NULL, &mA)); 715f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFGetLeafRange(sfB, NULL, &mB)); 725f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc2(nrootsA, &rdA, nldataA, &ldA)); 735f80ce2aSJacob Faibussowitsch CHKERRQ(PetscMalloc2(nrootsB, &rdB, nldataB, &ldB)); 74c4762a1bSJed Brown for (i = 0; i < nrootsA; i++) rdA[i] = m*rank + i; 75c4762a1bSJed Brown for (i = 0; i < nldataA; i++) ldA[i] = -1; 76c4762a1bSJed Brown for (i = 0; i < nldataB; i++) ldB[i] = -1; 77c4762a1bSJed Brown 785f80ce2aSJacob Faibussowitsch CHKERRQ(PetscViewerASCIIPrintf(PETSC_VIEWER_STDOUT_WORLD, "BcastB(BcastA)\n")); 795f80ce2aSJacob Faibussowitsch CHKERRQ(PetscViewerASCIIPrintf(PETSC_VIEWER_STDOUT_WORLD, "A: root data\n")); 805f80ce2aSJacob Faibussowitsch CHKERRQ(PetscIntView(nrootsA, rdA, PETSC_VIEWER_STDOUT_WORLD)); 815f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFBcastBegin(sfA, MPIU_INT, rdA, ldA,MPI_REPLACE)); 825f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFBcastEnd(sfA, MPIU_INT, rdA, ldA,MPI_REPLACE)); 835f80ce2aSJacob Faibussowitsch CHKERRQ(PetscViewerASCIIPrintf(PETSC_VIEWER_STDOUT_WORLD, "A: leaf data (all)\n")); 845f80ce2aSJacob Faibussowitsch CHKERRQ(PetscIntView(nldataA, ldA, PETSC_VIEWER_STDOUT_WORLD)); 855f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFBcastBegin(sfB, MPIU_INT, ldA, ldB,MPI_REPLACE)); 865f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFBcastEnd(sfB, MPIU_INT, ldA, ldB,MPI_REPLACE)); 875f80ce2aSJacob Faibussowitsch CHKERRQ(PetscViewerASCIIPrintf(PETSC_VIEWER_STDOUT_WORLD, "B: leaf data (all)\n")); 885f80ce2aSJacob Faibussowitsch CHKERRQ(PetscIntView(nldataB, ldB, PETSC_VIEWER_STDOUT_WORLD)); 89c4762a1bSJed Brown 905f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFCompose(sfA, sfB, &sfBA)); 915f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFSetFromOptions(sfBA)); 925f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFSetUp(sfBA)); 935f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectSetName((PetscObject)sfBA, "sfBA")); 945f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFViewFromOptions(sfBA, NULL, "-view")); 95c4762a1bSJed Brown 96c4762a1bSJed Brown for (i = 0; i < nldataB; i++) ldB[i] = -1; 975f80ce2aSJacob Faibussowitsch CHKERRQ(PetscViewerASCIIPrintf(PETSC_VIEWER_STDOUT_WORLD, "BcastBA\n")); 985f80ce2aSJacob Faibussowitsch CHKERRQ(PetscViewerASCIIPrintf(PETSC_VIEWER_STDOUT_WORLD, "BA: root data\n")); 995f80ce2aSJacob Faibussowitsch CHKERRQ(PetscIntView(nrootsA, rdA, PETSC_VIEWER_STDOUT_WORLD)); 1005f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFBcastBegin(sfBA, MPIU_INT, rdA, ldB,MPI_REPLACE)); 1015f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFBcastEnd(sfBA, MPIU_INT, rdA, ldB,MPI_REPLACE)); 1025f80ce2aSJacob Faibussowitsch CHKERRQ(PetscViewerASCIIPrintf(PETSC_VIEWER_STDOUT_WORLD, "BA: leaf data (all)\n")); 1035f80ce2aSJacob Faibussowitsch CHKERRQ(PetscIntView(nldataB, ldB, PETSC_VIEWER_STDOUT_WORLD)); 104c4762a1bSJed Brown 1055f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFCreateInverseSF(sfA, &sfAm)); 1065f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFSetFromOptions(sfAm)); 1075f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectSetName((PetscObject)sfAm, "sfAm")); 1085f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFViewFromOptions(sfAm, NULL, "-view")); 109c4762a1bSJed Brown 110c4762a1bSJed Brown if (!inverse) { 1115f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFComposeInverse(sfA, sfA, &sfAAm)); 112c4762a1bSJed Brown } else { 1135f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFCompose(sfA, sfAm, &sfAAm)); 114c4762a1bSJed Brown } 1155f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFSetFromOptions(sfAAm)); 1165f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFSetUp(sfAAm)); 1175f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectSetName((PetscObject)sfAAm, "sfAAm")); 1185f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFViewFromOptions(sfAAm, NULL, "-view")); 119c4762a1bSJed Brown 1205f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFCreateInverseSF(sfB, &sfBm)); 1215f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFSetFromOptions(sfBm)); 1225f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectSetName((PetscObject)sfBm, "sfBm")); 1235f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFViewFromOptions(sfBm, NULL, "-view")); 124c4762a1bSJed Brown 125c4762a1bSJed Brown if (!inverse) { 1265f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFComposeInverse(sfB, sfB, &sfBBm)); 127c4762a1bSJed Brown } else { 1285f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFCompose(sfB, sfBm, &sfBBm)); 129c4762a1bSJed Brown } 1305f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFSetFromOptions(sfBBm)); 1315f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFSetUp(sfBBm)); 1325f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectSetName((PetscObject)sfBBm, "sfBBm")); 1335f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFViewFromOptions(sfBBm, NULL, "-view")); 134c4762a1bSJed Brown 1355f80ce2aSJacob Faibussowitsch CHKERRQ(PetscFree2(rdA, ldA)); 1365f80ce2aSJacob Faibussowitsch CHKERRQ(PetscFree2(rdB, ldB)); 137c4762a1bSJed Brown 1385f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFDestroy(&sfA)); 1395f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFDestroy(&sfB)); 1405f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFDestroy(&sfBA)); 1415f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFDestroy(&sfAm)); 1425f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFDestroy(&sfBm)); 1435f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFDestroy(&sfAAm)); 1445f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFDestroy(&sfBBm)); 145c4762a1bSJed Brown 146*b122ec5aSJacob Faibussowitsch CHKERRQ(PetscFinalize()); 147*b122ec5aSJacob Faibussowitsch return 0; 148c4762a1bSJed Brown } 149c4762a1bSJed Brown 150c4762a1bSJed Brown /*TEST 151c4762a1bSJed Brown 152c4762a1bSJed Brown test: 153c4762a1bSJed Brown suffix: 1 154c4762a1bSJed Brown args: -view -explicit_inverse {{0 1}} 155c4762a1bSJed Brown 156c4762a1bSJed Brown test: 157c4762a1bSJed Brown nsize: 7 158c4762a1bSJed Brown filter: grep -v "type" | grep -v "sort" 159c4762a1bSJed Brown suffix: 2 160c4762a1bSJed Brown args: -view -nl 5 -explicit_inverse {{0 1}} 161c4762a1bSJed Brown 162c4762a1bSJed Brown # we cannot test for -sf_window_flavor dynamic because SFCompose with sparse leaves may change the root data pointer only locally, and this is not supported by the dynamic case 163c4762a1bSJed Brown test: 164c4762a1bSJed Brown nsize: 7 165c4762a1bSJed Brown suffix: 2_window 166c4762a1bSJed Brown filter: grep -v "type" | grep -v "sort" 167c4762a1bSJed Brown output_file: output/ex5_2.out 168c4762a1bSJed Brown args: -view -nl 5 -explicit_inverse {{0 1}} -sf_type window -sf_window_sync {{fence lock active}} -sf_window_flavor {{create allocate}} 169dfd57a17SPierre Jolivet requires: defined(PETSC_HAVE_MPI_ONE_SIDED) defined(PETSC_HAVE_MPI_FEATURE_DYNAMIC_WINDOW) 170c4762a1bSJed Brown 171c4762a1bSJed Brown # The nightly test suite with MPICH uses ch3:sock, which is broken when winsize == 0 in some of the processes 172c4762a1bSJed Brown test: 173c4762a1bSJed Brown nsize: 7 174c4762a1bSJed Brown suffix: 2_window_shared 175c4762a1bSJed Brown filter: grep -v "type" | grep -v "sort" 176c4762a1bSJed Brown output_file: output/ex5_2.out 177c4762a1bSJed Brown args: -view -nl 5 -explicit_inverse {{0 1}} -sf_type window -sf_window_sync {{fence lock active}} -sf_window_flavor shared 178dfd57a17SPierre Jolivet requires: defined(PETSC_HAVE_MPI_PROCESS_SHARED_MEMORY) !defined(PETSC_HAVE_MPICH_NUMVERSION) defined(PETSC_HAVE_MPI_ONE_SIDED) 179c4762a1bSJed Brown 180c4762a1bSJed Brown TEST*/ 181