1c4762a1bSJed Brown static char help[] = "Test PetscSFFCompose when the ilocal array is not the identity\n\n"; 2c4762a1bSJed Brown 3c4762a1bSJed Brown #include <petscsf.h> 4c4762a1bSJed Brown 59371c9d4SSatish Balay int main(int argc, char **argv) { 6c4762a1bSJed Brown PetscSF sfA, sfB, sfBA; 7c4762a1bSJed Brown PetscInt nrootsA, nleavesA, nrootsB, nleavesB; 8c4762a1bSJed Brown PetscInt *ilocalA, *ilocalB; 9c4762a1bSJed Brown PetscSFNode *iremoteA, *iremoteB; 10c4762a1bSJed Brown Vec a, b, ba; 11c4762a1bSJed Brown const PetscScalar *arrayR; 12c4762a1bSJed Brown PetscScalar *arrayW; 13c4762a1bSJed Brown PetscMPIInt size; 14c4762a1bSJed Brown PetscInt i; 15c4762a1bSJed Brown PetscInt maxleafB; 16c4762a1bSJed Brown PetscBool flag = PETSC_FALSE; 17c4762a1bSJed Brown 18327415f7SBarry Smith PetscFunctionBeginUser; 199566063dSJacob Faibussowitsch PetscCall(PetscInitialize(&argc, &argv, NULL, help)); 209566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PETSC_COMM_WORLD, &size)); 214643bc0bSVaclav Hapla PetscCheck(size == 1, PETSC_COMM_WORLD, PETSC_ERR_USER, "Only coded for one MPI process"); 22c4762a1bSJed Brown 239566063dSJacob Faibussowitsch PetscCall(PetscSFCreate(PETSC_COMM_WORLD, &sfA)); 249566063dSJacob Faibussowitsch PetscCall(PetscSFCreate(PETSC_COMM_WORLD, &sfB)); 259566063dSJacob Faibussowitsch PetscCall(PetscSFSetFromOptions(sfA)); 269566063dSJacob Faibussowitsch PetscCall(PetscSFSetFromOptions(sfB)); 27c4762a1bSJed Brown 289566063dSJacob Faibussowitsch PetscCall(PetscOptionsGetBool(NULL, NULL, "-sparse_sfB", &flag, NULL)); 29c4762a1bSJed Brown 30c4762a1bSJed Brown if (flag) { 31c4762a1bSJed Brown /* sfA permutes indices, sfB has sparse leaf space. */ 32c4762a1bSJed Brown nrootsA = 3; 33c4762a1bSJed Brown nleavesA = 3; 34c4762a1bSJed Brown nrootsB = 3; 35c4762a1bSJed Brown nleavesB = 2; 36c4762a1bSJed Brown } else { 37c4762a1bSJed Brown /* sfA reverses indices, sfB is identity */ 38c4762a1bSJed Brown nrootsA = nrootsB = nleavesA = nleavesB = 4; 39c4762a1bSJed Brown } 409566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nleavesA, &ilocalA)); 419566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nleavesA, &iremoteA)); 429566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nleavesB, &ilocalB)); 439566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nleavesB, &iremoteB)); 44c4762a1bSJed Brown 45c4762a1bSJed Brown for (i = 0; i < nleavesA; i++) { 46c4762a1bSJed Brown iremoteA[i].rank = 0; 47c4762a1bSJed Brown iremoteA[i].index = i; 48c4762a1bSJed Brown if (flag) { 49c4762a1bSJed Brown ilocalA[i] = (i + 1) % nleavesA; 50c4762a1bSJed Brown } else { 51c4762a1bSJed Brown ilocalA[i] = nleavesA - i - 1; 52c4762a1bSJed Brown } 53c4762a1bSJed Brown } 54c4762a1bSJed Brown 55c4762a1bSJed Brown for (i = 0; i < nleavesB; i++) { 56c4762a1bSJed Brown iremoteB[i].rank = 0; 57c4762a1bSJed Brown if (flag) { 58c4762a1bSJed Brown ilocalB[i] = nleavesB - i; 59c4762a1bSJed Brown iremoteB[i].index = nleavesB - i - 1; 60c4762a1bSJed Brown } else { 61c4762a1bSJed Brown ilocalB[i] = i; 62c4762a1bSJed Brown iremoteB[i].index = i; 63c4762a1bSJed Brown } 64c4762a1bSJed Brown } 65c4762a1bSJed Brown 669566063dSJacob Faibussowitsch PetscCall(PetscSFSetGraph(sfA, nrootsA, nleavesA, ilocalA, PETSC_OWN_POINTER, iremoteA, PETSC_OWN_POINTER)); 679566063dSJacob Faibussowitsch PetscCall(PetscSFSetGraph(sfB, nrootsB, nleavesB, ilocalB, PETSC_OWN_POINTER, iremoteB, PETSC_OWN_POINTER)); 689566063dSJacob Faibussowitsch PetscCall(PetscSFSetUp(sfA)); 699566063dSJacob Faibussowitsch PetscCall(PetscSFSetUp(sfB)); 709566063dSJacob Faibussowitsch PetscCall(PetscObjectSetName((PetscObject)sfA, "sfA")); 719566063dSJacob Faibussowitsch PetscCall(PetscObjectSetName((PetscObject)sfB, "sfB")); 72c4762a1bSJed Brown 739566063dSJacob Faibussowitsch PetscCall(VecCreateSeq(PETSC_COMM_WORLD, nrootsA, &a)); 749566063dSJacob Faibussowitsch PetscCall(VecCreateSeq(PETSC_COMM_WORLD, nleavesA, &b)); 759566063dSJacob Faibussowitsch PetscCall(PetscSFGetLeafRange(sfB, NULL, &maxleafB)); 769566063dSJacob Faibussowitsch PetscCall(VecCreateSeq(PETSC_COMM_WORLD, maxleafB + 1, &ba)); 779566063dSJacob Faibussowitsch PetscCall(VecGetArray(a, &arrayW)); 78*ad540459SPierre Jolivet for (i = 0; i < nrootsA; i++) arrayW[i] = (PetscScalar)i; 799566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(a, &arrayW)); 80c4762a1bSJed Brown 819566063dSJacob Faibussowitsch PetscCall(PetscPrintf(PETSC_COMM_WORLD, "Initial Vec A\n")); 829566063dSJacob Faibussowitsch PetscCall(VecView(a, NULL)); 839566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(a, &arrayR)); 849566063dSJacob Faibussowitsch PetscCall(VecGetArray(b, &arrayW)); 85c4762a1bSJed Brown 869566063dSJacob Faibussowitsch PetscCall(PetscSFBcastBegin(sfA, MPIU_SCALAR, arrayR, arrayW, MPI_REPLACE)); 879566063dSJacob Faibussowitsch PetscCall(PetscSFBcastEnd(sfA, MPIU_SCALAR, arrayR, arrayW, MPI_REPLACE)); 889566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(b, &arrayW)); 899566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(a, &arrayR)); 909566063dSJacob Faibussowitsch PetscCall(PetscPrintf(PETSC_COMM_WORLD, "\nBroadcast A->B over sfA\n")); 919566063dSJacob Faibussowitsch PetscCall(VecView(b, NULL)); 92c4762a1bSJed Brown 939566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(b, &arrayR)); 949566063dSJacob Faibussowitsch PetscCall(VecGetArray(ba, &arrayW)); 95c4762a1bSJed Brown arrayW[0] = 10.0; /* Not touched by bcast */ 969566063dSJacob Faibussowitsch PetscCall(PetscSFBcastBegin(sfB, MPIU_SCALAR, arrayR, arrayW, MPI_REPLACE)); 979566063dSJacob Faibussowitsch PetscCall(PetscSFBcastEnd(sfB, MPIU_SCALAR, arrayR, arrayW, MPI_REPLACE)); 989566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(b, &arrayR)); 999566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(ba, &arrayW)); 100c4762a1bSJed Brown 1019566063dSJacob Faibussowitsch PetscCall(PetscPrintf(PETSC_COMM_WORLD, "\nBroadcast B->BA over sfB\n")); 1029566063dSJacob Faibussowitsch PetscCall(VecView(ba, NULL)); 103c4762a1bSJed Brown 1049566063dSJacob Faibussowitsch PetscCall(PetscSFCompose(sfA, sfB, &sfBA)); 1059566063dSJacob Faibussowitsch PetscCall(PetscSFSetFromOptions(sfBA)); 1069566063dSJacob Faibussowitsch PetscCall(PetscObjectSetName((PetscObject)sfBA, "(sfB o sfA)")); 1079566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(a, &arrayR)); 1089566063dSJacob Faibussowitsch PetscCall(VecGetArray(ba, &arrayW)); 109c4762a1bSJed Brown arrayW[0] = 11.0; /* Not touched by bcast */ 1109566063dSJacob Faibussowitsch PetscCall(PetscSFBcastBegin(sfBA, MPIU_SCALAR, arrayR, arrayW, MPI_REPLACE)); 1119566063dSJacob Faibussowitsch PetscCall(PetscSFBcastEnd(sfBA, MPIU_SCALAR, arrayR, arrayW, MPI_REPLACE)); 1129566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(ba, &arrayW)); 1139566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(a, &arrayR)); 1149566063dSJacob Faibussowitsch PetscCall(PetscPrintf(PETSC_COMM_WORLD, "\nBroadcast A->BA over sfBA (sfB o sfA)\n")); 1159566063dSJacob Faibussowitsch PetscCall(VecView(ba, NULL)); 116c4762a1bSJed Brown 1179566063dSJacob Faibussowitsch PetscCall(VecDestroy(&ba)); 1189566063dSJacob Faibussowitsch PetscCall(VecDestroy(&b)); 1199566063dSJacob Faibussowitsch PetscCall(VecDestroy(&a)); 120c4762a1bSJed Brown 1219566063dSJacob Faibussowitsch PetscCall(PetscSFView(sfA, NULL)); 1229566063dSJacob Faibussowitsch PetscCall(PetscSFView(sfB, NULL)); 1239566063dSJacob Faibussowitsch PetscCall(PetscSFView(sfBA, NULL)); 1249566063dSJacob Faibussowitsch PetscCall(PetscSFDestroy(&sfA)); 1259566063dSJacob Faibussowitsch PetscCall(PetscSFDestroy(&sfB)); 1269566063dSJacob Faibussowitsch PetscCall(PetscSFDestroy(&sfBA)); 127c4762a1bSJed Brown 1289566063dSJacob Faibussowitsch PetscCall(PetscFinalize()); 129b122ec5aSJacob Faibussowitsch return 0; 130c4762a1bSJed Brown } 131c4762a1bSJed Brown 132c4762a1bSJed Brown /*TEST 133c4762a1bSJed Brown 134c4762a1bSJed Brown test: 135c4762a1bSJed Brown suffix: 1 136c4762a1bSJed Brown 137c4762a1bSJed Brown test: 138c4762a1bSJed Brown suffix: 2 139c4762a1bSJed Brown filter: grep -v "type" | grep -v "sort" 140c4762a1bSJed Brown args: -sparse_sfB 141c4762a1bSJed Brown 142c4762a1bSJed Brown test: 143c4762a1bSJed Brown suffix: 2_window 144c4762a1bSJed Brown filter: grep -v "type" | grep -v "sort" 145c4762a1bSJed Brown output_file: output/ex4_2.out 146c4762a1bSJed Brown args: -sparse_sfB -sf_type window -sf_window_sync {{fence active lock}} -sf_window_flavor {{create dynamic allocate}} 147dfd57a17SPierre Jolivet requires: defined(PETSC_HAVE_MPI_ONE_SIDED) defined(PETSC_HAVE_MPI_FEATURE_DYNAMIC_WINDOW) 148c4762a1bSJed Brown 149c4762a1bSJed Brown # The nightly test suite with MPICH uses ch3:sock, which is broken when winsize == 0 in some of the processes 150c4762a1bSJed Brown test: 151c4762a1bSJed Brown suffix: 2_window_shared 152c4762a1bSJed Brown filter: grep -v "type" | grep -v "sort" 153c4762a1bSJed Brown output_file: output/ex4_2.out 154c4762a1bSJed Brown args: -sparse_sfB -sf_type window -sf_window_sync {{fence active lock}} -sf_window_flavor shared 155dfd57a17SPierre Jolivet requires: defined(PETSC_HAVE_MPI_PROCESS_SHARED_MEMORY) !defined(PETSC_HAVE_MPICH_NUMVERSION) defined(PETSC_HAVE_MPI_ONE_SIDED) 156c4762a1bSJed Brown 157c4762a1bSJed Brown TEST*/ 158