1936c5a86SJed Brown /* 2936c5a86SJed Brown A star forest (SF) describes a communication pattern 3936c5a86SJed Brown */ 426bd1501SBarry Smith #if !defined(PETSCSF_H) 526bd1501SBarry Smith #define PETSCSF_H 62c8e378dSBarry Smith #include <petscsys.h> 7dd5b3ca6SJunchao Zhang #include <petscis.h> 80c312b8eSJed Brown #include <petscsftypes.h> 9936c5a86SJed Brown 10014dd563SJed Brown PETSC_EXTERN PetscClassId PETSCSF_CLASSID; 11936c5a86SJed Brown 125af141bcSJed Brown /*J 13dd5b3ca6SJunchao Zhang PetscSFType - String with the name of a PetscSF type 145af141bcSJed Brown 155af141bcSJed Brown Level: beginner 165af141bcSJed Brown 175af141bcSJed Brown .seealso: PetscSFSetType(), PetscSF 185af141bcSJed Brown J*/ 195af141bcSJed Brown typedef const char *PetscSFType; 20ac762476SJed Brown #define PETSCSFBASIC "basic" 21027eff8aSJunchao Zhang #define PETSCSFNEIGHBOR "neighbor" 22dd5b3ca6SJunchao Zhang #define PETSCSFALLGATHERV "allgatherv" 23dd5b3ca6SJunchao Zhang #define PETSCSFALLGATHER "allgather" 24dd5b3ca6SJunchao Zhang #define PETSCSFGATHERV "gatherv" 25dd5b3ca6SJunchao Zhang #define PETSCSFGATHER "gather" 26dd5b3ca6SJunchao Zhang #define PETSCSFALLTOALL "alltoall" 27ed658588SBarry Smith #define PETSCSFWINDOW "window" 285af141bcSJed Brown 29936c5a86SJed Brown /*E 30dd5b3ca6SJunchao Zhang PetscSFPattern - Pattern of the PetscSF graph 31dd5b3ca6SJunchao Zhang 32dd5b3ca6SJunchao Zhang $ PETSCSF_PATTERN_GENERAL - A general graph. One sets the graph with PetscSFSetGraph() and usually does not use this enum directly. 33dd5b3ca6SJunchao Zhang $ PETSCSF_PATTERN_ALLGATHER - A graph that every rank gathers all roots from all ranks (like MPI_Allgather/v). One sets the graph with PetscSFSetGraphWithPattern(). 34dd5b3ca6SJunchao Zhang $ PETSCSF_PATTERN_GATHER - A graph that rank 0 gathers all roots from all ranks (like MPI_Gather/v with root=0). One sets the graph with PetscSFSetGraphWithPattern(). 35dd5b3ca6SJunchao Zhang $ PETSCSF_PATTERN_ALLTOALL - A graph that every rank gathers different roots from all ranks (like MPI_Alltoall). One sets the graph with PetscSFSetGraphWithPattern(). 36dd5b3ca6SJunchao Zhang In an ALLTOALL graph, we assume each process has <size> leaves and <size> roots, with each leaf connecting to a remote root. Here <size> is 37dd5b3ca6SJunchao Zhang the size of the communicator. This does not mean one can not communicate multiple data items between a pair of processes. One just needs to 38dd5b3ca6SJunchao Zhang create a new MPI datatype for the multiple data items, e.g., by MPI_Type_contiguous. 39dd5b3ca6SJunchao Zhang Level: beginner 40dd5b3ca6SJunchao Zhang 41dd5b3ca6SJunchao Zhang .seealso: PetscSFSetGraph(), PetscSFSetGraphWithPattern() 42dd5b3ca6SJunchao Zhang E*/ 43dd5b3ca6SJunchao Zhang typedef enum {PETSCSF_PATTERN_GENERAL=0,PETSCSF_PATTERN_ALLGATHER,PETSCSF_PATTERN_GATHER,PETSCSF_PATTERN_ALLTOALL} PetscSFPattern; 44dd5b3ca6SJunchao Zhang 45dd5b3ca6SJunchao Zhang /*E 465af141bcSJed Brown PetscSFWindowSyncType - Type of synchronization for PETSCSFWINDOW 47936c5a86SJed Brown 485af141bcSJed Brown $ PETSCSF_WINDOW_SYNC_FENCE - simplest model, synchronizing across communicator 495af141bcSJed Brown $ PETSCSF_WINDOW_SYNC_LOCK - passive model, less synchronous, requires less setup than PETSCSF_WINDOW_SYNC_ACTIVE, but may require more handshakes 505af141bcSJed Brown $ PETSCSF_WINDOW_SYNC_ACTIVE - active model, provides most information to MPI implementation, needs to construct 2-way process groups (more setup than PETSCSF_WINDOW_SYNC_LOCK) 51936c5a86SJed Brown 52e84a5f06SJed Brown Level: advanced 53936c5a86SJed Brown 54e84a5f06SJed Brown .seealso: PetscSFWindowSetSyncType(), PetscSFWindowGetSyncType() 55936c5a86SJed Brown E*/ 565af141bcSJed Brown typedef enum {PETSCSF_WINDOW_SYNC_FENCE,PETSCSF_WINDOW_SYNC_LOCK,PETSCSF_WINDOW_SYNC_ACTIVE} PetscSFWindowSyncType; 575af141bcSJed Brown PETSC_EXTERN const char *const PetscSFWindowSyncTypes[]; 58936c5a86SJed Brown 59e84a5f06SJed Brown /*E 605b0d146aSStefano Zampini PetscSFWindowFlavorType - Flavor for the creation of MPI windows for PETSCSFWINDOW 615b0d146aSStefano Zampini 625b0d146aSStefano Zampini $ PETSCSF_WINDOW_FLAVOR_CREATE - Use MPI_Win_create, no reusage 635b0d146aSStefano Zampini $ PETSCSF_WINDOW_FLAVOR_DYNAMIC - Use MPI_Win_create_dynamic and dynamically attach pointers 645b0d146aSStefano Zampini $ PETSCSF_WINDOW_FLAVOR_ALLOCATE - Use MPI_Win_allocate 655b0d146aSStefano Zampini $ PETSCSF_WINDOW_FLAVOR_SHARED - Use MPI_Win_allocate_shared 665b0d146aSStefano Zampini 675b0d146aSStefano Zampini Level: advanced 685b0d146aSStefano Zampini 695b0d146aSStefano Zampini .seealso: PetscSFWindowSetFlavorType(), PetscSFWindowGetFlavorType() 705b0d146aSStefano Zampini E*/ 715b0d146aSStefano Zampini typedef enum {PETSCSF_WINDOW_FLAVOR_CREATE,PETSCSF_WINDOW_FLAVOR_DYNAMIC,PETSCSF_WINDOW_FLAVOR_ALLOCATE,PETSCSF_WINDOW_FLAVOR_SHARED} PetscSFWindowFlavorType; 725b0d146aSStefano Zampini PETSC_EXTERN const char *const PetscSFWindowFlavorTypes[]; 735b0d146aSStefano Zampini 745b0d146aSStefano Zampini /*E 75e84a5f06SJed Brown PetscSFDuplicateOption - Aspects to preserve when duplicating a PetscSF 76e84a5f06SJed Brown 77e84a5f06SJed Brown $ PETSCSF_DUPLICATE_CONFONLY - configuration only, user must call PetscSFSetGraph() 78e84a5f06SJed Brown $ PETSCSF_DUPLICATE_RANKS - communication ranks preserved, but different graph (allows simpler setup after calling PetscSFSetGraph()) 79e84a5f06SJed Brown $ PETSCSF_DUPLICATE_GRAPH - entire graph duplicated 80e84a5f06SJed Brown 81e84a5f06SJed Brown Level: beginner 82e84a5f06SJed Brown 83e84a5f06SJed Brown .seealso: PetscSFDuplicate() 84e84a5f06SJed Brown E*/ 85e84a5f06SJed Brown typedef enum {PETSCSF_DUPLICATE_CONFONLY,PETSCSF_DUPLICATE_RANKS,PETSCSF_DUPLICATE_GRAPH} PetscSFDuplicateOption; 86e84a5f06SJed Brown PETSC_EXTERN const char *const PetscSFDuplicateOptions[]; 87090c6444SJed Brown 88adc40e5bSBarry Smith PETSC_EXTERN PetscFunctionList PetscSFList; 89bdf89e91SBarry Smith PETSC_EXTERN PetscErrorCode PetscSFRegister(const char[],PetscErrorCode (*)(PetscSF)); 905af141bcSJed Brown 91607a6623SBarry Smith PETSC_EXTERN PetscErrorCode PetscSFInitializePackage(void); 92014dd563SJed Brown PETSC_EXTERN PetscErrorCode PetscSFFinalizePackage(void); 9379c40355SBarry Smith PETSC_EXTERN PetscErrorCode PetscSFCreate(MPI_Comm,PetscSF*); 94014dd563SJed Brown PETSC_EXTERN PetscErrorCode PetscSFDestroy(PetscSF*); 955af141bcSJed Brown PETSC_EXTERN PetscErrorCode PetscSFSetType(PetscSF,PetscSFType); 9629046d53SLisandro Dalcin PETSC_EXTERN PetscErrorCode PetscSFGetType(PetscSF,PetscSFType*); 97014dd563SJed Brown PETSC_EXTERN PetscErrorCode PetscSFView(PetscSF,PetscViewer); 98fe2efc57SMark PETSC_EXTERN PetscErrorCode PetscSFViewFromOptions(PetscSF,PetscObject,const char[]); 995af141bcSJed Brown PETSC_EXTERN PetscErrorCode PetscSFSetUp(PetscSF); 100014dd563SJed Brown PETSC_EXTERN PetscErrorCode PetscSFSetFromOptions(PetscSF); 101e84a5f06SJed Brown PETSC_EXTERN PetscErrorCode PetscSFDuplicate(PetscSF,PetscSFDuplicateOption,PetscSF*); 1025af141bcSJed Brown PETSC_EXTERN PetscErrorCode PetscSFWindowSetSyncType(PetscSF,PetscSFWindowSyncType); 1035af141bcSJed Brown PETSC_EXTERN PetscErrorCode PetscSFWindowGetSyncType(PetscSF,PetscSFWindowSyncType*); 1045b0d146aSStefano Zampini PETSC_EXTERN PetscErrorCode PetscSFWindowSetFlavorType(PetscSF,PetscSFWindowFlavorType); 1055b0d146aSStefano Zampini PETSC_EXTERN PetscErrorCode PetscSFWindowGetFlavorType(PetscSF,PetscSFWindowFlavorType*); 106*2eb0eadbSSatish Balay PETSC_EXTERN PetscErrorCode PetscSFWindowSetInfo(PetscSF,MPI_Info); 107*2eb0eadbSSatish Balay PETSC_EXTERN PetscErrorCode PetscSFWindowGetInfo(PetscSF,MPI_Info*); 108014dd563SJed Brown PETSC_EXTERN PetscErrorCode PetscSFSetRankOrder(PetscSF,PetscBool); 10963f4a732SJed Brown PETSC_EXTERN PetscErrorCode PetscSFSetGraph(PetscSF,PetscInt,PetscInt,const PetscInt*,PetscCopyMode,const PetscSFNode*,PetscCopyMode); 110dd5b3ca6SJunchao Zhang PETSC_EXTERN PetscErrorCode PetscSFSetGraphWithPattern(PetscSF,PetscLayout,PetscSFPattern); 11179c40355SBarry Smith PETSC_EXTERN PetscErrorCode PetscSFGetGraph(PetscSF,PetscInt*,PetscInt*,const PetscInt**,const PetscSFNode**); 112f723732fSJed Brown PETSC_EXTERN PetscErrorCode PetscSFGetLeafRange(PetscSF,PetscInt*,PetscInt*); 11379c40355SBarry Smith PETSC_EXTERN PetscErrorCode PetscSFCreateEmbeddedSF(PetscSF,PetscInt,const PetscInt*,PetscSF*); 1142f5fb4c2SMatthew G. Knepley PETSC_EXTERN PetscErrorCode PetscSFCreateEmbeddedLeafSF(PetscSF,PetscInt,const PetscInt *, PetscSF *); 115014dd563SJed Brown PETSC_EXTERN PetscErrorCode PetscSFReset(PetscSF); 116b5a8e515SJed Brown PETSC_EXTERN PetscErrorCode PetscSFSetUpRanks(PetscSF,MPI_Group); 117dec1416fSJunchao Zhang PETSC_EXTERN PetscErrorCode PetscSFGetRootRanks(PetscSF,PetscInt*,const PetscMPIInt**,const PetscInt**,const PetscInt**,const PetscInt**); 1188750ddebSJunchao Zhang PETSC_EXTERN PetscErrorCode PetscSFGetLeafRanks(PetscSF,PetscInt*,const PetscMPIInt**,const PetscInt**,const PetscInt**); 119014dd563SJed Brown PETSC_EXTERN PetscErrorCode PetscSFGetGroups(PetscSF,MPI_Group*,MPI_Group*); 120014dd563SJed Brown PETSC_EXTERN PetscErrorCode PetscSFGetMultiSF(PetscSF,PetscSF*); 121014dd563SJed Brown PETSC_EXTERN PetscErrorCode PetscSFCreateInverseSF(PetscSF,PetscSF*); 122936c5a86SJed Brown 1233482bfa8SJunchao Zhang /* Reduce rootdata to leafdata using provided operation */ 1243482bfa8SJunchao Zhang PETSC_EXTERN PetscErrorCode PetscSFBcastAndOpBegin(PetscSF,MPI_Datatype,const void*,void*,MPI_Op) 1253482bfa8SJunchao Zhang PetscAttrMPIPointerWithType(3,2) PetscAttrMPIPointerWithType(4,2); 1263482bfa8SJunchao Zhang PETSC_EXTERN PetscErrorCode PetscSFBcastAndOpEnd(PetscSF,MPI_Datatype,const void*,void*,MPI_Op) 1273482bfa8SJunchao Zhang PetscAttrMPIPointerWithType(3,2) PetscAttrMPIPointerWithType(4,2); 128936c5a86SJed Brown /* Reduce leafdata into rootdata using provided operation */ 12979c40355SBarry Smith PETSC_EXTERN PetscErrorCode PetscSFReduceBegin(PetscSF,MPI_Datatype,const void*,void *,MPI_Op) 13019436ca2SJed Brown PetscAttrMPIPointerWithType(3,2) PetscAttrMPIPointerWithType(4,2); 13179c40355SBarry Smith PETSC_EXTERN PetscErrorCode PetscSFReduceEnd(PetscSF,MPI_Datatype,const void*,void*,MPI_Op) 13219436ca2SJed Brown PetscAttrMPIPointerWithType(3,2) PetscAttrMPIPointerWithType(4,2); 133936c5a86SJed Brown /* Atomically modifies (using provided operation) rootdata using leafdata from each leaf, value at root at time of modification is returned in leafupdate. */ 13479c40355SBarry Smith PETSC_EXTERN PetscErrorCode PetscSFFetchAndOpBegin(PetscSF,MPI_Datatype,void*,const void*,void*,MPI_Op) 135894dd566SJed Brown PetscAttrMPIPointerWithType(3,2) PetscAttrMPIPointerWithType(4,2) PetscAttrMPIPointerWithType(5,2); 13679c40355SBarry Smith PETSC_EXTERN PetscErrorCode PetscSFFetchAndOpEnd(PetscSF,MPI_Datatype,void*,const void*,void*,MPI_Op) 137894dd566SJed Brown PetscAttrMPIPointerWithType(3,2) PetscAttrMPIPointerWithType(4,2) PetscAttrMPIPointerWithType(5,2); 138936c5a86SJed Brown /* Compute the degree of every root vertex (number of leaves in its star) */ 13979c40355SBarry Smith PETSC_EXTERN PetscErrorCode PetscSFComputeDegreeBegin(PetscSF,const PetscInt**); 14079c40355SBarry Smith PETSC_EXTERN PetscErrorCode PetscSFComputeDegreeEnd(PetscSF,const PetscInt**); 14166dfcd1aSVaclav Hapla PETSC_EXTERN PetscErrorCode PetscSFComputeMultiRootOriginalNumbering(PetscSF,const PetscInt[],PetscInt*,PetscInt*[]); 142936c5a86SJed Brown /* Concatenate data from all leaves into roots */ 14379c40355SBarry Smith PETSC_EXTERN PetscErrorCode PetscSFGatherBegin(PetscSF,MPI_Datatype,const void*,void*) 144894dd566SJed Brown PetscAttrMPIPointerWithType(3,2) PetscAttrMPIPointerWithType(4,2); 14579c40355SBarry Smith PETSC_EXTERN PetscErrorCode PetscSFGatherEnd(PetscSF,MPI_Datatype,const void*,void*) 146894dd566SJed Brown PetscAttrMPIPointerWithType(3,2) PetscAttrMPIPointerWithType(4,2); 147936c5a86SJed Brown /* Distribute distinct values to each leaf from roots */ 14879c40355SBarry Smith PETSC_EXTERN PetscErrorCode PetscSFScatterBegin(PetscSF,MPI_Datatype,const void*,void*) 149894dd566SJed Brown PetscAttrMPIPointerWithType(3,2) PetscAttrMPIPointerWithType(4,2); 15079c40355SBarry Smith PETSC_EXTERN PetscErrorCode PetscSFScatterEnd(PetscSF,MPI_Datatype,const void*,void*) 151894dd566SJed Brown PetscAttrMPIPointerWithType(3,2) PetscAttrMPIPointerWithType(4,2); 152936c5a86SJed Brown 153a7b3aa13SAta Mesgarnejad PETSC_EXTERN PetscErrorCode PetscSFCompose(PetscSF,PetscSF,PetscSF*); 15404c0ada0SJunchao Zhang PETSC_EXTERN PetscErrorCode PetscSFComposeInverse(PetscSF,PetscSF,PetscSF*); 155a7b3aa13SAta Mesgarnejad 1568bfbc91cSJed Brown #if defined(MPI_REPLACE) 1578bfbc91cSJed Brown # define MPIU_REPLACE MPI_REPLACE 1588bfbc91cSJed Brown #else 1598bfbc91cSJed Brown /* When using an old MPI such that MPI_REPLACE is not defined, we do not pass MPI_REPLACE to MPI at all. Instead, we 1608bfbc91cSJed Brown * use it as a flag for our own reducer in the PETSCSFBASIC implementation. This could be any unique value unlikely to 1618bfbc91cSJed Brown * collide with another MPI_Op so we'll just use the value that has been used by every version of MPICH since 1628bfbc91cSJed Brown * MPICH2-1.0.6. */ 1638bfbc91cSJed Brown # define MPIU_REPLACE (MPI_Op)(0x5800000d) 1648bfbc91cSJed Brown #endif 1658bfbc91cSJed Brown 166dec1416fSJunchao Zhang PETSC_DEPRECATED_FUNCTION("Use PetscSFGetRootRanks (since v3.12)") 167dec1416fSJunchao Zhang PETSC_STATIC_INLINE PetscErrorCode PetscSFGetRanks(PetscSF sf,PetscInt *nranks,const PetscMPIInt **ranks,const PetscInt **roffset,const PetscInt **rmine,const PetscInt **rremote) { 168dec1416fSJunchao Zhang return PetscSFGetRootRanks(sf,nranks,ranks,roffset,rmine,rremote); 169dec1416fSJunchao Zhang } 170e2652d4cSJunchao Zhang 171c73c85a0SVaclav Hapla /*@C 172c73c85a0SVaclav Hapla PetscSFBcastBegin - begin pointwise broadcast to be concluded with call to PetscSFBcastEnd() 173c73c85a0SVaclav Hapla 174c73c85a0SVaclav Hapla Collective on PetscSF 175c73c85a0SVaclav Hapla 176c73c85a0SVaclav Hapla Input Arguments: 177c73c85a0SVaclav Hapla + sf - star forest on which to communicate 178c73c85a0SVaclav Hapla . unit - data type associated with each node 179c73c85a0SVaclav Hapla - rootdata - buffer to broadcast 180c73c85a0SVaclav Hapla 181c73c85a0SVaclav Hapla Output Arguments: 182c73c85a0SVaclav Hapla . leafdata - buffer to update with values from each leaf's respective root 183c73c85a0SVaclav Hapla 184c73c85a0SVaclav Hapla Level: intermediate 185c73c85a0SVaclav Hapla 1868eeec653SVaclav Hapla .seealso: PetscSFCreate(), PetscSFSetGraph(), PetscSFView(), PetscSFBcastEnd(), PetscSFReduceBegin(), PetscSFBcastAndOpBegin() 187c73c85a0SVaclav Hapla @*/ 188e2652d4cSJunchao Zhang PETSC_STATIC_INLINE PetscErrorCode PetscSFBcastBegin(PetscSF sf,MPI_Datatype unit,const void* rootdata,void* leafdata) { 189e2652d4cSJunchao Zhang return PetscSFBcastAndOpBegin(sf,unit,rootdata,leafdata,MPIU_REPLACE); 190e2652d4cSJunchao Zhang } 191c73c85a0SVaclav Hapla 192c73c85a0SVaclav Hapla /*@C 193c73c85a0SVaclav Hapla PetscSFBcastEnd - end a broadcast operation started with PetscSFBcastBegin() 194c73c85a0SVaclav Hapla 195c73c85a0SVaclav Hapla Collective 196c73c85a0SVaclav Hapla 197c73c85a0SVaclav Hapla Input Arguments: 198c73c85a0SVaclav Hapla + sf - star forest 199c73c85a0SVaclav Hapla . unit - data type 200c73c85a0SVaclav Hapla - rootdata - buffer to broadcast 201c73c85a0SVaclav Hapla 202c73c85a0SVaclav Hapla Output Arguments: 203c73c85a0SVaclav Hapla . leafdata - buffer to update with values from each leaf's respective root 204c73c85a0SVaclav Hapla 205c73c85a0SVaclav Hapla Level: intermediate 206c73c85a0SVaclav Hapla 207c73c85a0SVaclav Hapla .seealso: PetscSFSetGraph(), PetscSFReduceEnd() 208c73c85a0SVaclav Hapla @*/ 209e2652d4cSJunchao Zhang PETSC_STATIC_INLINE PetscErrorCode PetscSFBcastEnd(PetscSF sf,MPI_Datatype unit,const void* rootdata,void* leafdata) { 210e2652d4cSJunchao Zhang return PetscSFBcastAndOpEnd(sf,unit,rootdata,leafdata,MPIU_REPLACE); 211e2652d4cSJunchao Zhang } 212e2652d4cSJunchao Zhang 213936c5a86SJed Brown #endif 214