1c4762a1bSJed Brown static const char help[] = "Test overlapped communication on a single star forest (PetscSF)\n\n"; 2c4762a1bSJed Brown 3c4762a1bSJed Brown #include <petscvec.h> 4c4762a1bSJed Brown #include <petscsf.h> 5c4762a1bSJed Brown #include <petscviewer.h> 6c4762a1bSJed Brown 7*9371c9d4SSatish Balay int main(int argc, char **argv) { 8c4762a1bSJed Brown PetscSF sf; 9c4762a1bSJed Brown Vec A, Aout; 10c4762a1bSJed Brown Vec B, Bout; 11c4762a1bSJed Brown PetscScalar *bufA; 12c4762a1bSJed Brown PetscScalar *bufAout; 13c4762a1bSJed Brown PetscScalar *bufB; 14c4762a1bSJed Brown PetscScalar *bufBout; 15c4762a1bSJed Brown PetscMPIInt rank, size; 16c4762a1bSJed Brown PetscInt nroots, nleaves; 17c4762a1bSJed Brown PetscInt i; 18c4762a1bSJed Brown PetscInt *ilocal; 19c4762a1bSJed Brown PetscSFNode *iremote; 20c4762a1bSJed Brown 21327415f7SBarry Smith PetscFunctionBeginUser; 229566063dSJacob Faibussowitsch PetscCall(PetscInitialize(&argc, &argv, NULL, help)); 239566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_rank(PETSC_COMM_WORLD, &rank)); 249566063dSJacob Faibussowitsch PetscCallMPI(MPI_Comm_size(PETSC_COMM_WORLD, &size)); 25c4762a1bSJed Brown 2608401ef6SPierre Jolivet PetscCheck(size == 2, PETSC_COMM_WORLD, PETSC_ERR_USER, "Only coded for two MPI processes"); 27c4762a1bSJed Brown 289566063dSJacob Faibussowitsch PetscCall(PetscSFCreate(PETSC_COMM_WORLD, &sf)); 299566063dSJacob Faibussowitsch PetscCall(PetscSFSetFromOptions(sf)); 30c4762a1bSJed Brown 31c4762a1bSJed Brown nleaves = 2; 32c4762a1bSJed Brown nroots = 1; 339566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nleaves, &ilocal)); 34c4762a1bSJed Brown 35*9371c9d4SSatish Balay for (i = 0; i < nleaves; i++) { ilocal[i] = i; } 36c4762a1bSJed Brown 379566063dSJacob Faibussowitsch PetscCall(PetscMalloc1(nleaves, &iremote)); 38c4762a1bSJed Brown if (rank == 0) { 39c4762a1bSJed Brown iremote[0].rank = 0; 40c4762a1bSJed Brown iremote[0].index = 0; 41c4762a1bSJed Brown iremote[1].rank = 1; 42c4762a1bSJed Brown iremote[1].index = 0; 43c4762a1bSJed Brown } else { 44c4762a1bSJed Brown iremote[0].rank = 1; 45c4762a1bSJed Brown iremote[0].index = 0; 46c4762a1bSJed Brown iremote[1].rank = 0; 47c4762a1bSJed Brown iremote[1].index = 0; 48c4762a1bSJed Brown } 499566063dSJacob Faibussowitsch PetscCall(PetscSFSetGraph(sf, nroots, nleaves, ilocal, PETSC_OWN_POINTER, iremote, PETSC_OWN_POINTER)); 509566063dSJacob Faibussowitsch PetscCall(PetscSFSetUp(sf)); 519566063dSJacob Faibussowitsch PetscCall(PetscSFView(sf, PETSC_VIEWER_STDOUT_WORLD)); 529566063dSJacob Faibussowitsch PetscCall(VecCreate(PETSC_COMM_WORLD, &A)); 539566063dSJacob Faibussowitsch PetscCall(VecSetSizes(A, 2, PETSC_DETERMINE)); 549566063dSJacob Faibussowitsch PetscCall(VecSetFromOptions(A)); 559566063dSJacob Faibussowitsch PetscCall(VecSetUp(A)); 56c4762a1bSJed Brown 579566063dSJacob Faibussowitsch PetscCall(VecDuplicate(A, &B)); 589566063dSJacob Faibussowitsch PetscCall(VecDuplicate(A, &Aout)); 599566063dSJacob Faibussowitsch PetscCall(VecDuplicate(A, &Bout)); 609566063dSJacob Faibussowitsch PetscCall(VecGetArray(A, &bufA)); 619566063dSJacob Faibussowitsch PetscCall(VecGetArray(B, &bufB)); 62c4762a1bSJed Brown for (i = 0; i < 2; i++) { 63c4762a1bSJed Brown bufA[i] = (PetscScalar)rank; 64c4762a1bSJed Brown bufB[i] = (PetscScalar)(rank) + 10.0; 65c4762a1bSJed Brown } 669566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(A, &bufA)); 679566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(B, &bufB)); 68c4762a1bSJed Brown 699566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(A, (const PetscScalar **)&bufA)); 709566063dSJacob Faibussowitsch PetscCall(VecGetArrayRead(B, (const PetscScalar **)&bufB)); 719566063dSJacob Faibussowitsch PetscCall(VecGetArray(Aout, &bufAout)); 729566063dSJacob Faibussowitsch PetscCall(VecGetArray(Bout, &bufBout)); 739566063dSJacob Faibussowitsch PetscCall(PetscSFBcastBegin(sf, MPIU_SCALAR, (const void *)bufA, (void *)bufAout, MPI_REPLACE)); 749566063dSJacob Faibussowitsch PetscCall(PetscSFBcastBegin(sf, MPIU_SCALAR, (const void *)bufB, (void *)bufBout, MPI_REPLACE)); 759566063dSJacob Faibussowitsch PetscCall(PetscSFBcastEnd(sf, MPIU_SCALAR, (const void *)bufA, (void *)bufAout, MPI_REPLACE)); 769566063dSJacob Faibussowitsch PetscCall(PetscSFBcastEnd(sf, MPIU_SCALAR, (const void *)bufB, (void *)bufBout, MPI_REPLACE)); 779566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(A, (const PetscScalar **)&bufA)); 789566063dSJacob Faibussowitsch PetscCall(VecRestoreArrayRead(B, (const PetscScalar **)&bufB)); 799566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(Aout, &bufAout)); 809566063dSJacob Faibussowitsch PetscCall(VecRestoreArray(Bout, &bufBout)); 81c4762a1bSJed Brown 829566063dSJacob Faibussowitsch PetscCall(VecView(Aout, PETSC_VIEWER_STDOUT_WORLD)); 839566063dSJacob Faibussowitsch PetscCall(VecView(Bout, PETSC_VIEWER_STDOUT_WORLD)); 849566063dSJacob Faibussowitsch PetscCall(VecDestroy(&A)); 859566063dSJacob Faibussowitsch PetscCall(VecDestroy(&B)); 869566063dSJacob Faibussowitsch PetscCall(VecDestroy(&Aout)); 879566063dSJacob Faibussowitsch PetscCall(VecDestroy(&Bout)); 889566063dSJacob Faibussowitsch PetscCall(PetscSFDestroy(&sf)); 89c4762a1bSJed Brown 909566063dSJacob Faibussowitsch PetscCall(PetscFinalize()); 91b122ec5aSJacob Faibussowitsch return 0; 92c4762a1bSJed Brown } 93c4762a1bSJed Brown 94c4762a1bSJed Brown /*TEST 95c4762a1bSJed Brown 96c4762a1bSJed Brown test: 97c4762a1bSJed Brown suffix: basic 98c4762a1bSJed Brown nsize: 2 99c4762a1bSJed Brown filter: grep -v "type" | grep -v "sort" 100c4762a1bSJed Brown args: -sf_type basic 101c4762a1bSJed Brown 102c4762a1bSJed Brown test: 103c4762a1bSJed Brown suffix: window 104c4762a1bSJed Brown nsize: 2 105c4762a1bSJed Brown filter: grep -v "type" | grep -v "sort" 106c4762a1bSJed Brown output_file: output/ex2_basic.out 107c4762a1bSJed Brown args: -sf_type window -sf_window_sync {{fence active lock}} -sf_window_flavor {{create dynamic allocate}} 108dfd57a17SPierre Jolivet requires: defined(PETSC_HAVE_MPI_ONE_SIDED) defined(PETSC_HAVE_MPI_FEATURE_DYNAMIC_WINDOW) 109c4762a1bSJed Brown 110c4762a1bSJed Brown # The nightly test suite with MPICH uses ch3:sock, which is broken when winsize == 0 in some of the processes 111c4762a1bSJed Brown test: 112c4762a1bSJed Brown suffix: window_shared 113c4762a1bSJed Brown nsize: 2 114c4762a1bSJed Brown filter: grep -v "type" | grep -v "sort" 115c4762a1bSJed Brown output_file: output/ex2_basic.out 116c4762a1bSJed Brown args: -sf_type window -sf_window_sync {{fence active lock}} -sf_window_flavor shared 117dfd57a17SPierre Jolivet requires: defined(PETSC_HAVE_MPI_PROCESS_SHARED_MEMORY) !defined(PETSC_HAVE_MPICH_NUMVERSION) defined(PETSC_HAVE_MPI_ONE_SIDED) 118c4762a1bSJed Brown 119c4762a1bSJed Brown TEST*/ 120