1*dd5b3ca6SJunchao Zhang 2*dd5b3ca6SJunchao Zhang #include <../src/vec/is/sf/impls/basic/gatherv/sfgatherv.h> 3*dd5b3ca6SJunchao Zhang 4*dd5b3ca6SJunchao Zhang PETSC_INTERN PetscErrorCode PetscSFBcastAndOpBegin_Gatherv(PetscSF sf,MPI_Datatype unit,const void *rootdata,void *leafdata,MPI_Op op) 5*dd5b3ca6SJunchao Zhang { 6*dd5b3ca6SJunchao Zhang PetscErrorCode ierr; 7*dd5b3ca6SJunchao Zhang PetscSFPack_Gatherv link; 8*dd5b3ca6SJunchao Zhang PetscMPIInt rank,sendcount; 9*dd5b3ca6SJunchao Zhang MPI_Comm comm; 10*dd5b3ca6SJunchao Zhang void *recvbuf; 11*dd5b3ca6SJunchao Zhang PetscSF_Gatherv *dat = (PetscSF_Gatherv*)sf->data; 12*dd5b3ca6SJunchao Zhang 13*dd5b3ca6SJunchao Zhang PetscFunctionBegin; 14*dd5b3ca6SJunchao Zhang ierr = PetscSFPackGet_Gatherv(sf,unit,rootdata,&link);CHKERRQ(ierr); 15*dd5b3ca6SJunchao Zhang ierr = PetscObjectGetComm((PetscObject)sf,&comm);CHKERRQ(ierr); 16*dd5b3ca6SJunchao Zhang ierr = PetscMPIIntCast(sf->nroots,&sendcount);CHKERRQ(ierr); 17*dd5b3ca6SJunchao Zhang ierr = MPI_Comm_rank(comm,&rank);CHKERRQ(ierr); 18*dd5b3ca6SJunchao Zhang 19*dd5b3ca6SJunchao Zhang if (op == MPIU_REPLACE) { 20*dd5b3ca6SJunchao Zhang recvbuf = leafdata; 21*dd5b3ca6SJunchao Zhang } else { 22*dd5b3ca6SJunchao Zhang if (!link->leaf && !rank) {ierr = PetscMalloc(sf->nleaves*link->unitbytes,&link->leaf);CHKERRQ(ierr);} /* Alloate leafbuf on rank 0 */ 23*dd5b3ca6SJunchao Zhang recvbuf = link->leaf; 24*dd5b3ca6SJunchao Zhang } 25*dd5b3ca6SJunchao Zhang 26*dd5b3ca6SJunchao Zhang ierr = MPIU_Igatherv(rootdata,sendcount,unit,recvbuf,dat->recvcounts,dat->displs,unit,0/*rank 0*/,comm,&link->request);CHKERRQ(ierr); 27*dd5b3ca6SJunchao Zhang PetscFunctionReturn(0); 28*dd5b3ca6SJunchao Zhang } 29*dd5b3ca6SJunchao Zhang 30*dd5b3ca6SJunchao Zhang static PetscErrorCode PetscSFReduceBegin_Gatherv(PetscSF sf,MPI_Datatype unit,const void *leafdata,void *rootdata,MPI_Op op) 31*dd5b3ca6SJunchao Zhang { 32*dd5b3ca6SJunchao Zhang PetscErrorCode ierr; 33*dd5b3ca6SJunchao Zhang PetscSFPack_Gatherv link; 34*dd5b3ca6SJunchao Zhang PetscMPIInt recvcount; 35*dd5b3ca6SJunchao Zhang MPI_Comm comm; 36*dd5b3ca6SJunchao Zhang void *recvbuf; 37*dd5b3ca6SJunchao Zhang PetscSF_Gatherv *dat = (PetscSF_Gatherv*)sf->data; 38*dd5b3ca6SJunchao Zhang 39*dd5b3ca6SJunchao Zhang PetscFunctionBegin; 40*dd5b3ca6SJunchao Zhang ierr = PetscSFPackGet_Gatherv(sf,unit,leafdata,&link);CHKERRQ(ierr); 41*dd5b3ca6SJunchao Zhang ierr = PetscObjectGetComm((PetscObject)sf,&comm);CHKERRQ(ierr); 42*dd5b3ca6SJunchao Zhang 43*dd5b3ca6SJunchao Zhang if (op == MPIU_REPLACE) { 44*dd5b3ca6SJunchao Zhang recvbuf = rootdata; 45*dd5b3ca6SJunchao Zhang } else { 46*dd5b3ca6SJunchao Zhang if (!link->root) {ierr = PetscMalloc(sf->nroots*link->unitbytes,&link->root);CHKERRQ(ierr);} 47*dd5b3ca6SJunchao Zhang recvbuf = link->root; 48*dd5b3ca6SJunchao Zhang } 49*dd5b3ca6SJunchao Zhang 50*dd5b3ca6SJunchao Zhang ierr = PetscMPIIntCast(sf->nroots,&recvcount);CHKERRQ(ierr); 51*dd5b3ca6SJunchao Zhang ierr = MPIU_Iscatterv(leafdata,dat->recvcounts,dat->displs,unit,recvbuf,recvcount,unit,0,comm,&link->request);CHKERRQ(ierr); 52*dd5b3ca6SJunchao Zhang PetscFunctionReturn(0); 53*dd5b3ca6SJunchao Zhang } 54*dd5b3ca6SJunchao Zhang 55*dd5b3ca6SJunchao Zhang PETSC_INTERN PetscErrorCode PetscSFFetchAndOpBegin_Gatherv(PetscSF sf,MPI_Datatype unit,void *rootdata,const void *leafdata,void *leafupdate,MPI_Op op) 56*dd5b3ca6SJunchao Zhang { 57*dd5b3ca6SJunchao Zhang PetscErrorCode ierr; 58*dd5b3ca6SJunchao Zhang 59*dd5b3ca6SJunchao Zhang PetscFunctionBegin; 60*dd5b3ca6SJunchao Zhang /* In Gatherv, each root only has one leaf. So we just need to bcast rootdata to leafupdate and then reduce leafdata to rootdata */ 61*dd5b3ca6SJunchao Zhang ierr = PetscSFBcastAndOpBegin(sf,unit,rootdata,leafupdate,MPIU_REPLACE);CHKERRQ(ierr); 62*dd5b3ca6SJunchao Zhang ierr = PetscSFBcastAndOpEnd(sf,unit,rootdata,leafupdate,MPIU_REPLACE);CHKERRQ(ierr); 63*dd5b3ca6SJunchao Zhang ierr = PetscSFReduceBegin(sf,unit,leafdata,rootdata,op);CHKERRQ(ierr); 64*dd5b3ca6SJunchao Zhang PetscFunctionReturn(0); 65*dd5b3ca6SJunchao Zhang } 66*dd5b3ca6SJunchao Zhang 67*dd5b3ca6SJunchao Zhang PETSC_INTERN PetscErrorCode PetscSFCreate_Gatherv(PetscSF sf) 68*dd5b3ca6SJunchao Zhang { 69*dd5b3ca6SJunchao Zhang PetscErrorCode ierr; 70*dd5b3ca6SJunchao Zhang PetscSF_Gatherv *dat = (PetscSF_Gatherv*)sf->data; 71*dd5b3ca6SJunchao Zhang 72*dd5b3ca6SJunchao Zhang PetscFunctionBegin; 73*dd5b3ca6SJunchao Zhang /* Inherit from Allgatherv */ 74*dd5b3ca6SJunchao Zhang sf->ops->SetUp = PetscSFSetUp_Allgatherv; 75*dd5b3ca6SJunchao Zhang sf->ops->Reset = PetscSFReset_Allgatherv; 76*dd5b3ca6SJunchao Zhang sf->ops->Destroy = PetscSFDestroy_Allgatherv; 77*dd5b3ca6SJunchao Zhang sf->ops->GetGraph = PetscSFGetGraph_Allgatherv; 78*dd5b3ca6SJunchao Zhang sf->ops->GetLeafRanks = PetscSFGetLeafRanks_Allgatherv; 79*dd5b3ca6SJunchao Zhang sf->ops->GetRootRanks = PetscSFGetRootRanks_Allgatherv; 80*dd5b3ca6SJunchao Zhang sf->ops->BcastAndOpEnd = PetscSFBcastAndOpEnd_Allgatherv; 81*dd5b3ca6SJunchao Zhang sf->ops->ReduceEnd = PetscSFReduceEnd_Allgatherv; 82*dd5b3ca6SJunchao Zhang sf->ops->FetchAndOpEnd = PetscSFFetchAndOpEnd_Allgatherv; 83*dd5b3ca6SJunchao Zhang sf->ops->CreateLocalSF = PetscSFCreateLocalSF_Allgatherv; 84*dd5b3ca6SJunchao Zhang 85*dd5b3ca6SJunchao Zhang /* Gatherv stuff */ 86*dd5b3ca6SJunchao Zhang sf->ops->BcastAndOpBegin = PetscSFBcastAndOpBegin_Gatherv; 87*dd5b3ca6SJunchao Zhang sf->ops->ReduceBegin = PetscSFReduceBegin_Gatherv; 88*dd5b3ca6SJunchao Zhang sf->ops->FetchAndOpBegin = PetscSFFetchAndOpBegin_Gatherv; 89*dd5b3ca6SJunchao Zhang 90*dd5b3ca6SJunchao Zhang ierr = PetscNewLog(sf,&dat);CHKERRQ(ierr); 91*dd5b3ca6SJunchao Zhang sf->data = (void*)dat; 92*dd5b3ca6SJunchao Zhang PetscFunctionReturn(0); 93*dd5b3ca6SJunchao Zhang } 94