xref: /petsc/src/vec/is/sf/impls/basic/gather/sfgather.c (revision 3ba1676111f5c958fe6c2729b46ca4d523958bb3)
1dd5b3ca6SJunchao Zhang #include <../src/vec/is/sf/impls/basic/gatherv/sfgatherv.h>
2cd620004SJunchao Zhang #include <../src/vec/is/sf/impls/basic/allgather/sfallgather.h>
3dd5b3ca6SJunchao Zhang 
4dd5b3ca6SJunchao Zhang /* Reuse the type. The difference is some fields (i.e., displs, recvcounts) are not used in Gather, which is not a big deal */
5dd5b3ca6SJunchao Zhang typedef PetscSF_Allgatherv PetscSF_Gather;
6dd5b3ca6SJunchao Zhang 
7d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode PetscSFBcastBegin_Gather(PetscSF sf, MPI_Datatype unit, PetscMemType rootmtype, const void *rootdata, PetscMemType leafmtype, void *leafdata, MPI_Op op)
8d71ae5a4SJacob Faibussowitsch {
9cd620004SJunchao Zhang   PetscSFLink  link;
10855db38dSJunchao Zhang   PetscMPIInt  sendcount;
11dd5b3ca6SJunchao Zhang   MPI_Comm     comm;
12cd620004SJunchao Zhang   void        *rootbuf = NULL, *leafbuf = NULL;
13cd620004SJunchao Zhang   MPI_Request *req;
14dd5b3ca6SJunchao Zhang 
15dd5b3ca6SJunchao Zhang   PetscFunctionBegin;
169566063dSJacob Faibussowitsch   PetscCall(PetscSFLinkCreate(sf, unit, rootmtype, rootdata, leafmtype, leafdata, op, PETSCSF_BCAST, &link));
179566063dSJacob Faibussowitsch   PetscCall(PetscSFLinkPackRootData(sf, link, PETSCSF_REMOTE, rootdata));
189566063dSJacob Faibussowitsch   PetscCall(PetscSFLinkCopyRootBufferInCaseNotUseGpuAwareMPI(sf, link, PETSC_TRUE /* device2host before sending */));
199566063dSJacob Faibussowitsch   PetscCall(PetscObjectGetComm((PetscObject)sf, &comm));
209566063dSJacob Faibussowitsch   PetscCall(PetscMPIIntCast(sf->nroots, &sendcount));
219566063dSJacob Faibussowitsch   PetscCall(PetscSFLinkGetMPIBuffersAndRequests(sf, link, PETSCSF_ROOT2LEAF, &rootbuf, &leafbuf, &req, NULL));
229566063dSJacob Faibussowitsch   PetscCall(PetscSFLinkSyncStreamBeforeCallMPI(sf, link, PETSCSF_ROOT2LEAF));
239566063dSJacob Faibussowitsch   PetscCallMPI(MPIU_Igather(rootbuf == leafbuf ? MPI_IN_PLACE : rootbuf, sendcount, unit, leafbuf, sendcount, unit, 0 /*rank 0*/, comm, req));
24*3ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
25dd5b3ca6SJunchao Zhang }
26dd5b3ca6SJunchao Zhang 
27d71ae5a4SJacob Faibussowitsch static PetscErrorCode PetscSFReduceBegin_Gather(PetscSF sf, MPI_Datatype unit, PetscMemType leafmtype, const void *leafdata, PetscMemType rootmtype, void *rootdata, MPI_Op op)
28d71ae5a4SJacob Faibussowitsch {
29cd620004SJunchao Zhang   PetscSFLink  link;
30dd5b3ca6SJunchao Zhang   PetscMPIInt  recvcount;
31dd5b3ca6SJunchao Zhang   MPI_Comm     comm;
32cd620004SJunchao Zhang   void        *rootbuf = NULL, *leafbuf = NULL;
33cd620004SJunchao Zhang   MPI_Request *req;
34dd5b3ca6SJunchao Zhang 
35dd5b3ca6SJunchao Zhang   PetscFunctionBegin;
369566063dSJacob Faibussowitsch   PetscCall(PetscSFLinkCreate(sf, unit, rootmtype, rootdata, leafmtype, leafdata, op, PETSCSF_REDUCE, &link));
379566063dSJacob Faibussowitsch   PetscCall(PetscSFLinkPackLeafData(sf, link, PETSCSF_REMOTE, leafdata));
389566063dSJacob Faibussowitsch   PetscCall(PetscSFLinkCopyLeafBufferInCaseNotUseGpuAwareMPI(sf, link, PETSC_TRUE /* device2host before sending */));
399566063dSJacob Faibussowitsch   PetscCall(PetscObjectGetComm((PetscObject)sf, &comm));
409566063dSJacob Faibussowitsch   PetscCall(PetscMPIIntCast(sf->nroots, &recvcount));
419566063dSJacob Faibussowitsch   PetscCall(PetscSFLinkGetMPIBuffersAndRequests(sf, link, PETSCSF_LEAF2ROOT, &rootbuf, &leafbuf, &req, NULL));
429566063dSJacob Faibussowitsch   PetscCall(PetscSFLinkSyncStreamBeforeCallMPI(sf, link, PETSCSF_LEAF2ROOT));
439566063dSJacob Faibussowitsch   PetscCallMPI(MPIU_Iscatter(leafbuf, recvcount, unit, rootbuf == leafbuf ? MPI_IN_PLACE : rootbuf, recvcount, unit, 0 /*rank 0*/, comm, req));
44*3ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
45dd5b3ca6SJunchao Zhang }
46dd5b3ca6SJunchao Zhang 
47d71ae5a4SJacob Faibussowitsch PETSC_INTERN PetscErrorCode PetscSFCreate_Gather(PetscSF sf)
48d71ae5a4SJacob Faibussowitsch {
49dd5b3ca6SJunchao Zhang   PetscSF_Gather *dat = (PetscSF_Gather *)sf->data;
50dd5b3ca6SJunchao Zhang 
51dd5b3ca6SJunchao Zhang   PetscFunctionBegin;
52ad227feaSJunchao Zhang   sf->ops->BcastEnd  = PetscSFBcastEnd_Basic;
53cd620004SJunchao Zhang   sf->ops->ReduceEnd = PetscSFReduceEnd_Basic;
54cd620004SJunchao Zhang 
55dd5b3ca6SJunchao Zhang   /* Inherit from Allgatherv */
56dd5b3ca6SJunchao Zhang   sf->ops->Reset         = PetscSFReset_Allgatherv;
57dd5b3ca6SJunchao Zhang   sf->ops->Destroy       = PetscSFDestroy_Allgatherv;
58dd5b3ca6SJunchao Zhang   sf->ops->GetGraph      = PetscSFGetGraph_Allgatherv;
59dd5b3ca6SJunchao Zhang   sf->ops->GetRootRanks  = PetscSFGetRootRanks_Allgatherv;
60dd5b3ca6SJunchao Zhang   sf->ops->GetLeafRanks  = PetscSFGetLeafRanks_Allgatherv;
61dd5b3ca6SJunchao Zhang   sf->ops->FetchAndOpEnd = PetscSFFetchAndOpEnd_Allgatherv;
62dd5b3ca6SJunchao Zhang   sf->ops->CreateLocalSF = PetscSFCreateLocalSF_Allgatherv;
63dd5b3ca6SJunchao Zhang 
64cd620004SJunchao Zhang   /* Inherit from Allgather */
65cd620004SJunchao Zhang   sf->ops->SetUp = PetscSFSetUp_Allgather;
66cd620004SJunchao Zhang 
67dd5b3ca6SJunchao Zhang   /* Inherit from Gatherv */
68dd5b3ca6SJunchao Zhang   sf->ops->FetchAndOpBegin = PetscSFFetchAndOpBegin_Gatherv;
69dd5b3ca6SJunchao Zhang 
70dd5b3ca6SJunchao Zhang   /* Gather stuff */
71ad227feaSJunchao Zhang   sf->ops->BcastBegin  = PetscSFBcastBegin_Gather;
72dd5b3ca6SJunchao Zhang   sf->ops->ReduceBegin = PetscSFReduceBegin_Gather;
73dd5b3ca6SJunchao Zhang 
744dfa11a4SJacob Faibussowitsch   PetscCall(PetscNew(&dat));
75dd5b3ca6SJunchao Zhang   sf->data = (void *)dat;
76*3ba16761SJacob Faibussowitsch   PetscFunctionReturn(PETSC_SUCCESS);
77dd5b3ca6SJunchao Zhang }
78