xref: /petsc/src/vec/is/sf/tutorials/ex2.c (revision 9566063d113dddea24716c546802770db7481bc0)
/* Help text passed to PetscInitialize() in main(). */
static const char help[] = "Test overlapped communication on a single star forest (PetscSF)\n\n";
2c4762a1bSJed Brown 
3c4762a1bSJed Brown #include <petscvec.h>
4c4762a1bSJed Brown #include <petscsf.h>
5c4762a1bSJed Brown #include <petscviewer.h>
6c4762a1bSJed Brown 
7c4762a1bSJed Brown int main(int argc, char **argv)
8c4762a1bSJed Brown {
9c4762a1bSJed Brown   PetscSF     sf;
10c4762a1bSJed Brown   Vec         A,Aout;
11c4762a1bSJed Brown   Vec         B,Bout;
12c4762a1bSJed Brown   PetscScalar *bufA;
13c4762a1bSJed Brown   PetscScalar *bufAout;
14c4762a1bSJed Brown   PetscScalar *bufB;
15c4762a1bSJed Brown   PetscScalar *bufBout;
16c4762a1bSJed Brown   PetscMPIInt rank, size;
17c4762a1bSJed Brown   PetscInt    nroots, nleaves;
18c4762a1bSJed Brown   PetscInt    i;
19c4762a1bSJed Brown   PetscInt    *ilocal;
20c4762a1bSJed Brown   PetscSFNode *iremote;
21c4762a1bSJed Brown 
22*9566063dSJacob Faibussowitsch   PetscCall(PetscInitialize(&argc,&argv,NULL,help));
23*9566063dSJacob Faibussowitsch   PetscCallMPI(MPI_Comm_rank(PETSC_COMM_WORLD,&rank));
24*9566063dSJacob Faibussowitsch   PetscCallMPI(MPI_Comm_size(PETSC_COMM_WORLD,&size));
25c4762a1bSJed Brown 
262c71b3e2SJacob Faibussowitsch   PetscCheckFalse(size != 2,PETSC_COMM_WORLD, PETSC_ERR_USER, "Only coded for two MPI processes");
27c4762a1bSJed Brown 
28*9566063dSJacob Faibussowitsch   PetscCall(PetscSFCreate(PETSC_COMM_WORLD,&sf));
29*9566063dSJacob Faibussowitsch   PetscCall(PetscSFSetFromOptions(sf));
30c4762a1bSJed Brown 
31c4762a1bSJed Brown   nleaves = 2;
32c4762a1bSJed Brown   nroots = 1;
33*9566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(nleaves,&ilocal));
34c4762a1bSJed Brown 
35c4762a1bSJed Brown   for (i = 0; i<nleaves; i++) {
36c4762a1bSJed Brown     ilocal[i] = i;
37c4762a1bSJed Brown   }
38c4762a1bSJed Brown 
39*9566063dSJacob Faibussowitsch   PetscCall(PetscMalloc1(nleaves,&iremote));
40c4762a1bSJed Brown   if (rank == 0) {
41c4762a1bSJed Brown     iremote[0].rank = 0;
42c4762a1bSJed Brown     iremote[0].index = 0;
43c4762a1bSJed Brown     iremote[1].rank = 1;
44c4762a1bSJed Brown     iremote[1].index = 0;
45c4762a1bSJed Brown   } else {
46c4762a1bSJed Brown     iremote[0].rank = 1;
47c4762a1bSJed Brown     iremote[0].index = 0;
48c4762a1bSJed Brown     iremote[1].rank = 0;
49c4762a1bSJed Brown     iremote[1].index = 0;
50c4762a1bSJed Brown   }
51*9566063dSJacob Faibussowitsch   PetscCall(PetscSFSetGraph(sf,nroots,nleaves,ilocal,PETSC_OWN_POINTER,iremote,PETSC_OWN_POINTER));
52*9566063dSJacob Faibussowitsch   PetscCall(PetscSFSetUp(sf));
53*9566063dSJacob Faibussowitsch   PetscCall(PetscSFView(sf,PETSC_VIEWER_STDOUT_WORLD));
54*9566063dSJacob Faibussowitsch   PetscCall(VecCreate(PETSC_COMM_WORLD,&A));
55*9566063dSJacob Faibussowitsch   PetscCall(VecSetSizes(A,2,PETSC_DETERMINE));
56*9566063dSJacob Faibussowitsch   PetscCall(VecSetFromOptions(A));
57*9566063dSJacob Faibussowitsch   PetscCall(VecSetUp(A));
58c4762a1bSJed Brown 
59*9566063dSJacob Faibussowitsch   PetscCall(VecDuplicate(A,&B));
60*9566063dSJacob Faibussowitsch   PetscCall(VecDuplicate(A,&Aout));
61*9566063dSJacob Faibussowitsch   PetscCall(VecDuplicate(A,&Bout));
62*9566063dSJacob Faibussowitsch   PetscCall(VecGetArray(A,&bufA));
63*9566063dSJacob Faibussowitsch   PetscCall(VecGetArray(B,&bufB));
64c4762a1bSJed Brown   for (i=0; i<2; i++) {
65c4762a1bSJed Brown     bufA[i] = (PetscScalar)rank;
66c4762a1bSJed Brown     bufB[i] = (PetscScalar)(rank) + 10.0;
67c4762a1bSJed Brown   }
68*9566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(A,&bufA));
69*9566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(B,&bufB));
70c4762a1bSJed Brown 
71*9566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(A,(const PetscScalar**)&bufA));
72*9566063dSJacob Faibussowitsch   PetscCall(VecGetArrayRead(B,(const PetscScalar**)&bufB));
73*9566063dSJacob Faibussowitsch   PetscCall(VecGetArray(Aout,&bufAout));
74*9566063dSJacob Faibussowitsch   PetscCall(VecGetArray(Bout,&bufBout));
75*9566063dSJacob Faibussowitsch   PetscCall(PetscSFBcastBegin(sf,MPIU_SCALAR,(const void*)bufA,(void *)bufAout,MPI_REPLACE));
76*9566063dSJacob Faibussowitsch   PetscCall(PetscSFBcastBegin(sf,MPIU_SCALAR,(const void*)bufB,(void *)bufBout,MPI_REPLACE));
77*9566063dSJacob Faibussowitsch   PetscCall(PetscSFBcastEnd(sf,MPIU_SCALAR,(const void*)bufA,(void *)bufAout,MPI_REPLACE));
78*9566063dSJacob Faibussowitsch   PetscCall(PetscSFBcastEnd(sf,MPIU_SCALAR,(const void*)bufB,(void *)bufBout,MPI_REPLACE));
79*9566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(A,(const PetscScalar**)&bufA));
80*9566063dSJacob Faibussowitsch   PetscCall(VecRestoreArrayRead(B,(const PetscScalar**)&bufB));
81*9566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(Aout,&bufAout));
82*9566063dSJacob Faibussowitsch   PetscCall(VecRestoreArray(Bout,&bufBout));
83c4762a1bSJed Brown 
84*9566063dSJacob Faibussowitsch   PetscCall(VecView(Aout,PETSC_VIEWER_STDOUT_WORLD));
85*9566063dSJacob Faibussowitsch   PetscCall(VecView(Bout,PETSC_VIEWER_STDOUT_WORLD));
86*9566063dSJacob Faibussowitsch   PetscCall(VecDestroy(&A));
87*9566063dSJacob Faibussowitsch   PetscCall(VecDestroy(&B));
88*9566063dSJacob Faibussowitsch   PetscCall(VecDestroy(&Aout));
89*9566063dSJacob Faibussowitsch   PetscCall(VecDestroy(&Bout));
90*9566063dSJacob Faibussowitsch   PetscCall(PetscSFDestroy(&sf));
91c4762a1bSJed Brown 
92*9566063dSJacob Faibussowitsch   PetscCall(PetscFinalize());
93b122ec5aSJacob Faibussowitsch   return 0;
94c4762a1bSJed Brown }
95c4762a1bSJed Brown 
/*TEST

   test:
      suffix: basic
      nsize: 2
      filter: grep -v "type" | grep -v "sort"
      args: -sf_type basic

   test:
      suffix: window
      nsize: 2
      filter: grep -v "type" | grep -v "sort"
      output_file: output/ex2_basic.out
      args: -sf_type window -sf_window_sync {{fence active lock}} -sf_window_flavor {{create dynamic allocate}}
      requires: defined(PETSC_HAVE_MPI_ONE_SIDED) defined(PETSC_HAVE_MPI_FEATURE_DYNAMIC_WINDOW)

   # The nightly test suite with MPICH uses ch3:sock, which is broken when winsize == 0 in some of the processes
   test:
      suffix: window_shared
      nsize: 2
      filter: grep -v "type" | grep -v "sort"
      output_file: output/ex2_basic.out
      args: -sf_type window -sf_window_sync {{fence active lock}} -sf_window_flavor shared
      requires: defined(PETSC_HAVE_MPI_PROCESS_SHARED_MEMORY) !defined(PETSC_HAVE_MPICH_NUMVERSION) defined(PETSC_HAVE_MPI_ONE_SIDED)

TEST*/
122