1c4762a1bSJed Brown static char help[]= "Test PetscSFFetchAndOp on patterned SF graphs. PetscSFFetchAndOp internally uses PetscSFBcastAndOp \n\ 2c4762a1bSJed Brown and PetscSFReduce. So it is a good test to see if they all work for patterned graphs.\n\ 3c4762a1bSJed Brown Run with ./prog -op [replace | sum]\n\n"; 4c4762a1bSJed Brown 5c4762a1bSJed Brown #include <petscvec.h> 6c4762a1bSJed Brown #include <petscsf.h> 7c4762a1bSJed Brown int main(int argc,char **argv) 8c4762a1bSJed Brown { 9c4762a1bSJed Brown PetscErrorCode ierr; 10c4762a1bSJed Brown PetscInt i,N=10,low,high,nleaves; 11c4762a1bSJed Brown PetscMPIInt size,rank; 12c4762a1bSJed Brown Vec x,y,y2,gy2; 13c4762a1bSJed Brown PetscScalar *rootdata,*leafdata,*leafupdate; 14c4762a1bSJed Brown PetscLayout layout; 15c4762a1bSJed Brown PetscSF gathersf,allgathersf,alltoallsf; 16c4762a1bSJed Brown MPI_Op op=MPI_SUM; 17c4762a1bSJed Brown char opname[64]; 18c4762a1bSJed Brown const char *mpiopname; 19c4762a1bSJed Brown PetscBool flag,isreplace,issum; 20c4762a1bSJed Brown 21c4762a1bSJed Brown ierr = PetscInitialize(&argc,&argv,(char*)0,help);if (ierr) return ierr; 22*5f80ce2aSJacob Faibussowitsch CHKERRMPI(MPI_Comm_size(PETSC_COMM_WORLD,&size)); 23*5f80ce2aSJacob Faibussowitsch CHKERRMPI(MPI_Comm_rank(PETSC_COMM_WORLD,&rank)); 24c4762a1bSJed Brown 25*5f80ce2aSJacob Faibussowitsch CHKERRQ(PetscOptionsGetString(NULL,NULL,"-op",opname,sizeof(opname),&flag)); 26*5f80ce2aSJacob Faibussowitsch CHKERRQ(PetscStrcmp(opname,"replace",&isreplace)); 27*5f80ce2aSJacob Faibussowitsch CHKERRQ(PetscStrcmp(opname,"sum",&issum)); 28c4762a1bSJed Brown 2983df288dSJunchao Zhang if (isreplace) {op = MPI_REPLACE; mpiopname = "MPI_REPLACE";} 30c4762a1bSJed Brown else if (issum) {op = MPIU_SUM; mpiopname = "MPI_SUM";} 3198921bdaSJacob Faibussowitsch else SETERRQ(PETSC_COMM_WORLD,PETSC_ERR_ARG_WRONG,"Unsupported argument (%s) to -op, which must be 'replace' or 'sum'",opname); 32c4762a1bSJed Brown 33*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecCreate(PETSC_COMM_WORLD,&x)); 34*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecSetFromOptions(x)); 35*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecSetSizes(x,PETSC_DECIDE,N)); 36c4762a1bSJed Brown 37c4762a1bSJed Brown /*-------------------------------------*/ 38c4762a1bSJed Brown /* PETSCSF_PATTERN_GATHER */ 39c4762a1bSJed Brown /*-------------------------------------*/ 40c4762a1bSJed Brown 41c4762a1bSJed Brown /* set MPI vec x to [1, 2, .., N] */ 42*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecGetOwnershipRange(x,&low,&high)); 43*5f80ce2aSJacob Faibussowitsch for (i=low; i<high; i++) CHKERRQ(VecSetValue(x,i,(PetscScalar)i+1.0,INSERT_VALUES)); 44*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecAssemblyBegin(x)); 45*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecAssemblyEnd(x)); 46c4762a1bSJed Brown 47c4762a1bSJed Brown /* Create the gather SF */ 48*5f80ce2aSJacob Faibussowitsch CHKERRQ(PetscPrintf(PETSC_COMM_WORLD,"\nTesting PetscSFFetchAndOp on a PETSCSF_PATTERN_GATHER graph with op = %s\n",mpiopname)); 49*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecGetLayout(x,&layout)); 50*5f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFCreate(PETSC_COMM_WORLD,&gathersf)); 51*5f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFSetGraphWithPattern(gathersf,layout,PETSCSF_PATTERN_GATHER)); 52c4762a1bSJed Brown 53c4762a1bSJed Brown /* Create the leaf vector y (seq vector) and its duplicate y2 working as leafupdate */ 54*5f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFGetGraph(gathersf,NULL,&nleaves,NULL,NULL)); 55*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecCreateSeq(PETSC_COMM_SELF,nleaves,&y)); 56*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecDuplicate(y,&y2)); 57c4762a1bSJed Brown 58*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecGetArray(x,&rootdata)); 59*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecGetArray(y,&leafdata)); 60*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecGetArray(y2,&leafupdate)); 61c4762a1bSJed Brown 62c4762a1bSJed Brown /* Bcast x to y,to initialize y = [1,N], then scale y to make leafupdate = y = [2,2*N] */ 63*5f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFBcastBegin(gathersf,MPIU_SCALAR,rootdata,leafdata,MPI_REPLACE)); 64*5f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFBcastEnd(gathersf,MPIU_SCALAR,rootdata,leafdata,MPI_REPLACE)); 65*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecRestoreArray(y,&leafdata)); 66*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecScale(y,2)); 67*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecGetArray(y,&leafdata)); 68c4762a1bSJed Brown 69c4762a1bSJed Brown /* FetchAndOp x to y */ 70*5f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFFetchAndOpBegin(gathersf,MPIU_SCALAR,rootdata,leafdata,leafupdate,op)); 71*5f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFFetchAndOpEnd(gathersf,MPIU_SCALAR,rootdata,leafdata,leafupdate,op)); 72c4762a1bSJed Brown 73c4762a1bSJed Brown /* View roots (x) and leafupdate (y2). Since this is a gather graph, leafudpate = rootdata = [1,N], then rootdata += leafdata, i.e., [3,3*N] */ 74*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecCreateMPIWithArray(PETSC_COMM_WORLD,1,nleaves,PETSC_DECIDE,leafupdate,&gy2)); 75*5f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectSetName((PetscObject)x,"rootdata")); 76*5f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectSetName((PetscObject)gy2,"leafupdate")); 77c4762a1bSJed Brown 78*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecView(x,PETSC_VIEWER_STDOUT_WORLD)); 79*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecView(gy2,PETSC_VIEWER_STDOUT_WORLD)); 80*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecDestroy(&gy2)); 81c4762a1bSJed Brown 82*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecRestoreArray(y2,&leafupdate)); 83*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecDestroy(&y2)); 84c4762a1bSJed Brown 85*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecRestoreArray(y,&leafdata)); 86*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecDestroy(&y)); 87c4762a1bSJed Brown 88*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecRestoreArray(x,&rootdata)); 89*5f80ce2aSJacob Faibussowitsch /* CHKERRQ(VecDestroy(&x)); */ /* We will reuse x in ALLGATHER, so do not destroy it */ 90c4762a1bSJed Brown 91*5f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFDestroy(&gathersf)); 92c4762a1bSJed Brown 93c4762a1bSJed Brown /*-------------------------------------*/ 94c4762a1bSJed Brown /* PETSCSF_PATTERN_ALLGATHER */ 95c4762a1bSJed Brown /*-------------------------------------*/ 96c4762a1bSJed Brown 97c4762a1bSJed Brown /* set MPI vec x to [1, 2, .., N] */ 98*5f80ce2aSJacob Faibussowitsch for (i=low; i<high; i++) CHKERRQ(VecSetValue(x,i,(PetscScalar)i+1.0,INSERT_VALUES)); 99*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecAssemblyBegin(x)); 100*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecAssemblyEnd(x)); 101c4762a1bSJed Brown 102c4762a1bSJed Brown /* Create the allgather SF */ 103*5f80ce2aSJacob Faibussowitsch CHKERRQ(PetscPrintf(PETSC_COMM_WORLD,"\nTesting PetscSFFetchAndOp on a PETSCSF_PATTERN_ALLGATHER graph with op = %s\n",mpiopname)); 104*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecGetLayout(x,&layout)); 105*5f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFCreate(PETSC_COMM_WORLD,&allgathersf)); 106*5f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFSetGraphWithPattern(allgathersf,layout,PETSCSF_PATTERN_ALLGATHER)); 107c4762a1bSJed Brown 108c4762a1bSJed Brown /* Create the leaf vector y (seq vector) and its duplicate y2 working as leafupdate */ 109*5f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFGetGraph(allgathersf,NULL,&nleaves,NULL,NULL)); 110*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecCreateSeq(PETSC_COMM_SELF,nleaves,&y)); 111*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecDuplicate(y,&y2)); 112c4762a1bSJed Brown 113*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecGetArray(x,&rootdata)); 114*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecGetArray(y,&leafdata)); 115*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecGetArray(y2,&leafupdate)); 116c4762a1bSJed Brown 117c4762a1bSJed Brown /* Bcast x to y, to initialize y = [1,N], then scale y to make leafupdate = y = [2,2*N] */ 118*5f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFBcastBegin(allgathersf,MPIU_SCALAR,rootdata,leafdata,MPI_REPLACE)); 119*5f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFBcastEnd(allgathersf,MPIU_SCALAR,rootdata,leafdata,MPI_REPLACE)); 120*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecRestoreArray(y,&leafdata)); 121*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecScale(y,2)); 122*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecGetArray(y,&leafdata)); 123c4762a1bSJed Brown 124c4762a1bSJed Brown /* FetchAndOp x to y */ 125*5f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFFetchAndOpBegin(allgathersf,MPIU_SCALAR,rootdata,leafdata,leafupdate,op)); 126*5f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFFetchAndOpEnd(allgathersf,MPIU_SCALAR,rootdata,leafdata,leafupdate,op)); 127c4762a1bSJed Brown 128c4762a1bSJed Brown /* View roots (x) and leafupdate (y2). Since this is an allgather graph, we have (suppose ranks get updates in ascending order) 129c4762a1bSJed Brown rank 0: leafupdate = rootdata = [1,N], rootdata += leafdata = [3,3*N] 130c4762a1bSJed Brown rank 1: leafupdate = rootdata = [3,3*N], rootdata += leafdata = [5,5*N] 131c4762a1bSJed Brown rank 2: leafupdate = rootdata = [5,5*N], rootdata += leafdata = [7,7*N] 132c4762a1bSJed Brown ... 133c4762a1bSJed Brown */ 134*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecCreateMPIWithArray(PETSC_COMM_WORLD,1,nleaves,PETSC_DECIDE,leafupdate,&gy2)); 135*5f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectSetName((PetscObject)x,"rootdata")); 136*5f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectSetName((PetscObject)gy2,"leafupdate")); 137c4762a1bSJed Brown 138*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecView(x,PETSC_VIEWER_STDOUT_WORLD)); 139*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecView(gy2,PETSC_VIEWER_STDOUT_WORLD)); 140*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecDestroy(&gy2)); 141c4762a1bSJed Brown 142*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecRestoreArray(y2,&leafupdate)); 143*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecDestroy(&y2)); 144c4762a1bSJed Brown 145*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecRestoreArray(y,&leafdata)); 146*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecDestroy(&y)); 147c4762a1bSJed Brown 148*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecRestoreArray(x,&rootdata)); 149*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecDestroy(&x)); /* We won't reuse x in ALLGATHER, so destroy it */ 150c4762a1bSJed Brown 151*5f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFDestroy(&allgathersf)); 152c4762a1bSJed Brown 153c4762a1bSJed Brown /*-------------------------------------*/ 154c4762a1bSJed Brown /* PETSCSF_PATTERN_ALLTOALL */ 155c4762a1bSJed Brown /*-------------------------------------*/ 156c4762a1bSJed Brown 157*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecCreate(PETSC_COMM_WORLD,&x)); 158*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecSetFromOptions(x)); 159*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecSetSizes(x,size,PETSC_DECIDE)); 160c4762a1bSJed Brown 161c4762a1bSJed Brown /* set MPI vec x to [1, 2, .., size^2] */ 162*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecGetOwnershipRange(x,&low,&high)); 163*5f80ce2aSJacob Faibussowitsch for (i=low; i<high; i++) CHKERRQ(VecSetValue(x,i,(PetscScalar)i+1.0,INSERT_VALUES)); 164*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecAssemblyBegin(x)); 165*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecAssemblyEnd(x)); 166c4762a1bSJed Brown 167c4762a1bSJed Brown /* Create the alltoall SF */ 168*5f80ce2aSJacob Faibussowitsch CHKERRQ(PetscPrintf(PETSC_COMM_WORLD,"\nTesting PetscSFFetchAndOp on a PETSCSF_PATTERN_ALLTOALL graph with op = %s\n",mpiopname)); 169*5f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFCreate(PETSC_COMM_WORLD,&alltoallsf)); 170*5f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFSetGraphWithPattern(alltoallsf,NULL/*insignificant*/,PETSCSF_PATTERN_ALLTOALL)); 171c4762a1bSJed Brown 172c4762a1bSJed Brown /* Create the leaf vector y (seq vector) and its duplicate y2 working as leafupdate */ 173*5f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFGetGraph(alltoallsf,NULL,&nleaves,NULL,NULL)); 174*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecCreateSeq(PETSC_COMM_SELF,nleaves,&y)); 175*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecDuplicate(y,&y2)); 176c4762a1bSJed Brown 177*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecGetArray(x,&rootdata)); 178*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecGetArray(y,&leafdata)); 179*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecGetArray(y2,&leafupdate)); 180c4762a1bSJed Brown 181c4762a1bSJed Brown /* Bcast x to y, to initialize y = 1+rank+size*i, with i=0..size-1 */ 182*5f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFBcastBegin(alltoallsf,MPIU_SCALAR,rootdata,leafdata,MPI_REPLACE)); 183*5f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFBcastEnd(alltoallsf,MPIU_SCALAR,rootdata,leafdata,MPI_REPLACE)); 184c4762a1bSJed Brown 185c4762a1bSJed Brown /* FetchAndOp x to y */ 186*5f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFFetchAndOpBegin(alltoallsf,MPIU_SCALAR,rootdata,leafdata,leafupdate,op)); 187*5f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFFetchAndOpEnd(alltoallsf,MPIU_SCALAR,rootdata,leafdata,leafupdate,op)); 188c4762a1bSJed Brown 189c4762a1bSJed Brown /* View roots (x) and leafupdate (y2). Since this is an alltoall graph, each root has only one leaf. 190c4762a1bSJed Brown So, leafupdate = rootdata = 1+rank+size*i, i=0..size-1; and rootdata += leafdata, i.e., rootdata = [2,2*N] 191c4762a1bSJed Brown */ 192*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecCreateMPIWithArray(PETSC_COMM_WORLD,1,nleaves,PETSC_DECIDE,leafupdate,&gy2)); 193*5f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectSetName((PetscObject)x,"rootdata")); 194*5f80ce2aSJacob Faibussowitsch CHKERRQ(PetscObjectSetName((PetscObject)gy2,"leafupdate")); 195c4762a1bSJed Brown 196*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecView(x,PETSC_VIEWER_STDOUT_WORLD)); 197*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecView(gy2,PETSC_VIEWER_STDOUT_WORLD)); 198*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecDestroy(&gy2)); 199c4762a1bSJed Brown 200*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecRestoreArray(y2,&leafupdate)); 201*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecDestroy(&y2)); 202c4762a1bSJed Brown 203*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecRestoreArray(y,&leafdata)); 204*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecDestroy(&y)); 205c4762a1bSJed Brown 206*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecRestoreArray(x,&rootdata)); 207*5f80ce2aSJacob Faibussowitsch CHKERRQ(VecDestroy(&x)); 208c4762a1bSJed Brown 209*5f80ce2aSJacob Faibussowitsch CHKERRQ(PetscSFDestroy(&alltoallsf)); 210c4762a1bSJed Brown 211c4762a1bSJed Brown ierr = PetscFinalize(); 212c4762a1bSJed Brown return ierr; 213c4762a1bSJed Brown } 214c4762a1bSJed Brown 215c4762a1bSJed Brown /*TEST 216c4762a1bSJed Brown 217c4762a1bSJed Brown test: 218c4762a1bSJed Brown # N=10 is divisible by nsize, to trigger Allgather/Gather in SF 219f424265bSStefano Zampini #MPI_Sendrecv_replace is broken with 20210400300 220f424265bSStefano Zampini requires: !defined(PETSC_HAVE_I_MPI_NUMVERSION) 221c4762a1bSJed Brown nsize: 2 222c4762a1bSJed Brown args: -op replace 223c4762a1bSJed Brown 224c4762a1bSJed Brown test: 225c4762a1bSJed Brown suffix: 2 226c4762a1bSJed Brown nsize: 2 227c4762a1bSJed Brown args: -op sum 228c4762a1bSJed Brown 229c4762a1bSJed Brown # N=10 is not divisible by nsize, to trigger Allgatherv/Gatherv in SF 230c4762a1bSJed Brown test: 231f424265bSStefano Zampini #MPI_Sendrecv_replace is broken with 20210400300 232f424265bSStefano Zampini requires: !defined(PETSC_HAVE_I_MPI_NUMVERSION) 233c4762a1bSJed Brown suffix: 3 234c4762a1bSJed Brown nsize: 3 235c4762a1bSJed Brown args: -op replace 236c4762a1bSJed Brown 237c4762a1bSJed Brown test: 238c4762a1bSJed Brown suffix: 4 239c4762a1bSJed Brown nsize: 3 240c4762a1bSJed Brown args: -op sum 241c4762a1bSJed Brown 242c4762a1bSJed Brown TEST*/ 243