1dd5b3ca6SJunchao Zhang 2dd5b3ca6SJunchao Zhang #include <../src/vec/is/sf/impls/basic/gatherv/sfgatherv.h> 3dd5b3ca6SJunchao Zhang 4eb02082bSJunchao Zhang /* Reuse the type. The difference is some fields (displs, recvcounts) are only significant 5eb02082bSJunchao Zhang on rank 0 in Gatherv. On other ranks they are harmless NULL. 6eb02082bSJunchao Zhang */ 7eb02082bSJunchao Zhang typedef PetscSF_Allgatherv PetscSF_Gatherv; 8eb02082bSJunchao Zhang 9ad227feaSJunchao Zhang PETSC_INTERN PetscErrorCode PetscSFBcastBegin_Gatherv(PetscSF sf,MPI_Datatype unit,PetscMemType rootmtype,const void *rootdata,PetscMemType leafmtype,void *leafdata,MPI_Op op) 10dd5b3ca6SJunchao Zhang { 11cd620004SJunchao Zhang PetscSFLink link; 12855db38dSJunchao Zhang PetscMPIInt sendcount; 13dd5b3ca6SJunchao Zhang MPI_Comm comm; 14dd5b3ca6SJunchao Zhang PetscSF_Gatherv *dat = (PetscSF_Gatherv*)sf->data; 15cd620004SJunchao Zhang void *rootbuf = NULL,*leafbuf = NULL; /* buffer seen by MPI */ 16cd620004SJunchao Zhang MPI_Request *req; 17dd5b3ca6SJunchao Zhang 18dd5b3ca6SJunchao Zhang PetscFunctionBegin; 19*9566063dSJacob Faibussowitsch PetscCall(PetscSFLinkCreate(sf,unit,rootmtype,rootdata,leafmtype,leafdata,op,PETSCSF_BCAST,&link)); 20*9566063dSJacob Faibussowitsch PetscCall(PetscSFLinkPackRootData(sf,link,PETSCSF_REMOTE,rootdata)); 21*9566063dSJacob Faibussowitsch PetscCall(PetscSFLinkCopyRootBufferInCaseNotUseGpuAwareMPI(sf,link,PETSC_TRUE/* device2host before sending */)); 22*9566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)sf,&comm)); 23*9566063dSJacob Faibussowitsch PetscCall(PetscMPIIntCast(sf->nroots,&sendcount)); 24*9566063dSJacob Faibussowitsch PetscCall(PetscSFLinkGetMPIBuffersAndRequests(sf,link,PETSCSF_ROOT2LEAF,&rootbuf,&leafbuf,&req,NULL)); 25*9566063dSJacob Faibussowitsch PetscCall(PetscSFLinkSyncStreamBeforeCallMPI(sf,link,PETSCSF_ROOT2LEAF)); 26*9566063dSJacob Faibussowitsch PetscCallMPI(MPIU_Igatherv(rootbuf,sendcount,unit,leafbuf,dat->recvcounts,dat->displs,unit,0/*rank 0*/,comm,req)); 27dd5b3ca6SJunchao Zhang PetscFunctionReturn(0); 28dd5b3ca6SJunchao Zhang } 29dd5b3ca6SJunchao Zhang 30eb02082bSJunchao Zhang static PetscErrorCode PetscSFReduceBegin_Gatherv(PetscSF sf,MPI_Datatype unit,PetscMemType leafmtype,const void *leafdata,PetscMemType rootmtype,void *rootdata,MPI_Op op) 31dd5b3ca6SJunchao Zhang { 32cd620004SJunchao Zhang PetscSFLink link; 33dd5b3ca6SJunchao Zhang PetscMPIInt recvcount; 34dd5b3ca6SJunchao Zhang MPI_Comm comm; 35dd5b3ca6SJunchao Zhang PetscSF_Gatherv *dat = (PetscSF_Gatherv*)sf->data; 36cd620004SJunchao Zhang void *rootbuf = NULL,*leafbuf = NULL; /* buffer seen by MPI */ 37cd620004SJunchao Zhang MPI_Request *req; 38dd5b3ca6SJunchao Zhang 39dd5b3ca6SJunchao Zhang PetscFunctionBegin; 40*9566063dSJacob Faibussowitsch PetscCall(PetscSFLinkCreate(sf,unit,rootmtype,rootdata,leafmtype,leafdata,op,PETSCSF_REDUCE,&link)); 41*9566063dSJacob Faibussowitsch PetscCall(PetscSFLinkPackLeafData(sf,link,PETSCSF_REMOTE,leafdata)); 42*9566063dSJacob Faibussowitsch PetscCall(PetscSFLinkCopyLeafBufferInCaseNotUseGpuAwareMPI(sf,link,PETSC_TRUE/* device2host before sending */)); 43*9566063dSJacob Faibussowitsch PetscCall(PetscObjectGetComm((PetscObject)sf,&comm)); 44*9566063dSJacob Faibussowitsch PetscCall(PetscMPIIntCast(sf->nroots,&recvcount)); 45*9566063dSJacob Faibussowitsch PetscCall(PetscSFLinkGetMPIBuffersAndRequests(sf,link,PETSCSF_LEAF2ROOT,&rootbuf,&leafbuf,&req,NULL)); 46*9566063dSJacob Faibussowitsch PetscCall(PetscSFLinkSyncStreamBeforeCallMPI(sf,link,PETSCSF_LEAF2ROOT)); 47*9566063dSJacob Faibussowitsch PetscCallMPI(MPIU_Iscatterv(leafbuf,dat->recvcounts,dat->displs,unit,rootbuf,recvcount,unit,0,comm,req)); 48dd5b3ca6SJunchao Zhang PetscFunctionReturn(0); 49dd5b3ca6SJunchao Zhang } 50dd5b3ca6SJunchao Zhang 51eb02082bSJunchao Zhang PETSC_INTERN PetscErrorCode PetscSFFetchAndOpBegin_Gatherv(PetscSF sf,MPI_Datatype unit,PetscMemType rootmtype,void *rootdata,PetscMemType leafmtype,const void *leafdata,void *leafupdate,MPI_Op op) 52dd5b3ca6SJunchao Zhang { 53dd5b3ca6SJunchao Zhang PetscFunctionBegin; 54dd5b3ca6SJunchao Zhang /* In Gatherv, each root only has one leaf. So we just need to bcast rootdata to leafupdate and then reduce leafdata to rootdata */ 55*9566063dSJacob Faibussowitsch PetscCall(PetscSFBcastBegin(sf,unit,rootdata,leafupdate,MPI_REPLACE)); 56*9566063dSJacob Faibussowitsch PetscCall(PetscSFBcastEnd(sf,unit,rootdata,leafupdate,MPI_REPLACE)); 57*9566063dSJacob Faibussowitsch PetscCall(PetscSFReduceBegin(sf,unit,leafdata,rootdata,op)); 58dd5b3ca6SJunchao Zhang PetscFunctionReturn(0); 59dd5b3ca6SJunchao Zhang } 60dd5b3ca6SJunchao Zhang 61dd5b3ca6SJunchao Zhang PETSC_INTERN PetscErrorCode PetscSFCreate_Gatherv(PetscSF sf) 62dd5b3ca6SJunchao Zhang { 63dd5b3ca6SJunchao Zhang PetscSF_Gatherv *dat = (PetscSF_Gatherv*)sf->data; 64dd5b3ca6SJunchao Zhang 65dd5b3ca6SJunchao Zhang PetscFunctionBegin; 66ad227feaSJunchao Zhang sf->ops->BcastEnd = PetscSFBcastEnd_Basic; 67cd620004SJunchao Zhang sf->ops->ReduceEnd = PetscSFReduceEnd_Basic; 68cd620004SJunchao Zhang 69dd5b3ca6SJunchao Zhang /* Inherit from Allgatherv */ 70dd5b3ca6SJunchao Zhang sf->ops->SetUp = PetscSFSetUp_Allgatherv; 71dd5b3ca6SJunchao Zhang sf->ops->Reset = PetscSFReset_Allgatherv; 72dd5b3ca6SJunchao Zhang sf->ops->Destroy = PetscSFDestroy_Allgatherv; 73dd5b3ca6SJunchao Zhang sf->ops->GetGraph = PetscSFGetGraph_Allgatherv; 74dd5b3ca6SJunchao Zhang sf->ops->GetLeafRanks = PetscSFGetLeafRanks_Allgatherv; 75dd5b3ca6SJunchao Zhang sf->ops->GetRootRanks = PetscSFGetRootRanks_Allgatherv; 76dd5b3ca6SJunchao Zhang sf->ops->FetchAndOpEnd = PetscSFFetchAndOpEnd_Allgatherv; 77dd5b3ca6SJunchao Zhang sf->ops->CreateLocalSF = PetscSFCreateLocalSF_Allgatherv; 78dd5b3ca6SJunchao Zhang 79dd5b3ca6SJunchao Zhang /* Gatherv stuff */ 80ad227feaSJunchao Zhang sf->ops->BcastBegin = PetscSFBcastBegin_Gatherv; 81dd5b3ca6SJunchao Zhang sf->ops->ReduceBegin = PetscSFReduceBegin_Gatherv; 82dd5b3ca6SJunchao Zhang sf->ops->FetchAndOpBegin = PetscSFFetchAndOpBegin_Gatherv; 83dd5b3ca6SJunchao Zhang 84*9566063dSJacob Faibussowitsch PetscCall(PetscNewLog(sf,&dat)); 85dd5b3ca6SJunchao Zhang sf->data = (void*)dat; 86dd5b3ca6SJunchao Zhang PetscFunctionReturn(0); 87dd5b3ca6SJunchao Zhang } 88