12e68589bSMark F. Adams /* 22e68589bSMark F. Adams GAMG geometric-algebric multiogrid PC - Mark Adams 2011 32e68589bSMark F. Adams */ 42e68589bSMark F. Adams 52e68589bSMark F. Adams #include <../src/ksp/pc/impls/gamg/gamg.h> /*I "petscpc.h" I*/ 6b45d2f2cSJed Brown #include <petsc-private/kspimpl.h> 72e68589bSMark F. Adams 82e68589bSMark F. Adams #if defined(PETSC_HAVE_TRIANGLE) 92e68589bSMark F. Adams #define REAL PetscReal 102e68589bSMark F. Adams #include <triangle.h> 112e68589bSMark F. Adams #endif 122e68589bSMark F. Adams 132e68589bSMark F. Adams #include <petscblaslapack.h> 142e68589bSMark F. Adams 15c8b0795cSMark F. Adams /* Private context for the GAMG preconditioner */ 16c8b0795cSMark F. Adams typedef struct { 17c8b0795cSMark F. Adams PetscInt lid; /* local vertex index */ 18c8b0795cSMark F. Adams PetscInt degree; /* vertex degree */ 19c8b0795cSMark F. Adams } GAMGNode; 202fa5cd67SKarl Rupp 210cbbd2e1SMark F. Adams int petsc_geo_mg_compare(const void *a, const void *b) 22c8b0795cSMark F. Adams { 23c8b0795cSMark F. Adams return (((GAMGNode*)a)->degree - ((GAMGNode*)b)->degree); 24c8b0795cSMark F. Adams } 25c8b0795cSMark F. Adams 262e68589bSMark F. Adams /* -------------------------------------------------------------------------- */ 272e68589bSMark F. Adams /* 282e68589bSMark F. Adams PCSetCoordinates_GEO 292e68589bSMark F. Adams 302e68589bSMark F. Adams Input Parameter: 312e68589bSMark F. Adams . pc - the preconditioner context 322e68589bSMark F. Adams */ 332e68589bSMark F. Adams #undef __FUNCT__ 342e68589bSMark F. Adams #define __FUNCT__ "PCSetCoordinates_GEO" 35302f38e8SMark F. Adams PetscErrorCode PCSetCoordinates_GEO(PC pc, PetscInt ndm, PetscInt a_nloc, PetscReal *coords) 362e68589bSMark F. Adams { 372e68589bSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 382e68589bSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 392e68589bSMark F. Adams PetscErrorCode ierr; 402e68589bSMark F. Adams PetscInt arrsz,bs,my0,kk,ii,nloc,Iend; 412e68589bSMark F. Adams Mat Amat = pc->pmat; 422e68589bSMark F. Adams 432e68589bSMark F. Adams PetscFunctionBegin; 442e68589bSMark F. Adams PetscValidHeaderSpecific(Amat, MAT_CLASSID, 1); 452e68589bSMark F. Adams ierr = MatGetBlockSize(Amat, &bs);CHKERRQ(ierr); 46a2f3521dSMark F. Adams 472e68589bSMark F. Adams ierr = MatGetOwnershipRange(Amat, &my0, &Iend);CHKERRQ(ierr); 482e68589bSMark F. Adams nloc = (Iend-my0)/bs; 49a2f3521dSMark F. Adams 50ce94432eSBarry Smith if (nloc!=a_nloc) SETERRQ2(PetscObjectComm((PetscObject)Amat),PETSC_ERR_ARG_WRONG, "Stokes not supported nloc = %d %d.",a_nloc,nloc); 51ce94432eSBarry Smith if ((Iend-my0)%bs!=0) SETERRQ1(PetscObjectComm((PetscObject)Amat),PETSC_ERR_ARG_WRONG, "Bad local size %d.",nloc); 522e68589bSMark F. Adams 53c8b0795cSMark F. Adams pc_gamg->data_cell_rows = 1; 54ce94432eSBarry Smith if (coords==0 && nloc > 0) SETERRQ(PetscObjectComm((PetscObject)Amat),PETSC_ERR_ARG_WRONG, "Need coordinates for pc_gamg_type 'geo'."); 55c8b0795cSMark F. Adams pc_gamg->data_cell_cols = ndm; /* coordinates */ 562e68589bSMark F. Adams 57c8b0795cSMark F. Adams arrsz = nloc*pc_gamg->data_cell_rows*pc_gamg->data_cell_cols; 582e68589bSMark F. Adams 592e68589bSMark F. Adams /* create data - syntactic sugar that should be refactored at some point */ 602e68589bSMark F. Adams if (pc_gamg->data==0 || (pc_gamg->data_sz != arrsz)) { 612e68589bSMark F. Adams ierr = PetscFree(pc_gamg->data);CHKERRQ(ierr); 62854ce69bSBarry Smith ierr = PetscMalloc1(arrsz+1, &pc_gamg->data);CHKERRQ(ierr); 632e68589bSMark F. Adams } 642e68589bSMark F. Adams for (kk=0; kk<arrsz; kk++) pc_gamg->data[kk] = -999.; 652e68589bSMark F. Adams pc_gamg->data[arrsz] = -99.; 662e68589bSMark F. Adams /* copy data in - column oriented */ 672e68589bSMark F. Adams for (kk = 0; kk < nloc; kk++) { 682e68589bSMark F. Adams for (ii = 0; ii < ndm; ii++) { 692e68589bSMark F. Adams pc_gamg->data[ii*nloc + kk] = coords[kk*ndm + ii]; 702e68589bSMark F. Adams } 712e68589bSMark F. Adams } 7271959b99SBarry Smith if (pc_gamg->data[arrsz] != -99.) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"pc_gamg->data[arrsz %D] %g != -99.",arrsz,pc_gamg->data[arrsz]); 732e68589bSMark F. Adams pc_gamg->data_sz = arrsz; 742e68589bSMark F. Adams PetscFunctionReturn(0); 752e68589bSMark F. Adams } 762e68589bSMark F. Adams 772e68589bSMark F. Adams /* -------------------------------------------------------------------------- */ 782e68589bSMark F. Adams /* 792e68589bSMark F. Adams PCSetData_GEO 802e68589bSMark F. Adams 812e68589bSMark F. Adams Input Parameter: 822e68589bSMark F. Adams . pc - 832e68589bSMark F. Adams */ 842e68589bSMark F. Adams #undef __FUNCT__ 852e68589bSMark F. Adams #define __FUNCT__ "PCSetData_GEO" 86b8cd405aSMark F. Adams PetscErrorCode PCSetData_GEO(PC pc, Mat m) 872e68589bSMark F. Adams { 882e68589bSMark F. Adams PetscFunctionBegin; 89ce94432eSBarry Smith SETERRQ(PetscObjectComm((PetscObject)pc),PETSC_ERR_PLIB,"GEO MG needs coordinates"); 902e68589bSMark F. Adams } 912e68589bSMark F. Adams 922e68589bSMark F. Adams /* -------------------------------------------------------------------------- */ 932e68589bSMark F. Adams /* 942e68589bSMark F. Adams PCSetFromOptions_GEO 952e68589bSMark F. Adams 962e68589bSMark F. Adams Input Parameter: 972e68589bSMark F. Adams . pc - 982e68589bSMark F. Adams */ 992e68589bSMark F. Adams #undef __FUNCT__ 1002e68589bSMark F. Adams #define __FUNCT__ "PCSetFromOptions_GEO" 1018c34d3f5SBarry Smith PetscErrorCode PCSetFromOptions_GEO(PetscOptions *PetscOptionsObject,PC pc) 1022e68589bSMark F. Adams { 1032e68589bSMark F. Adams PetscErrorCode ierr; 1042e68589bSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 1052e68589bSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 1062e68589bSMark F. Adams 1072e68589bSMark F. Adams PetscFunctionBegin; 108e55864a3SBarry Smith ierr = PetscOptionsHead(PetscOptionsObject,"GAMG-GEO options");CHKERRQ(ierr); 1092e68589bSMark F. Adams { 1102e68589bSMark F. Adams /* -pc_gamg_sa_nsmooths */ 1112e68589bSMark F. Adams /* pc_gamg_sa->smooths = 0; */ 1122e68589bSMark F. Adams /* ierr = PetscOptionsInt("-pc_gamg_agg_nsmooths", */ 1132e68589bSMark F. Adams /* "smoothing steps for smoothed aggregation, usually 1 (0)", */ 1142e68589bSMark F. Adams /* "PCGAMGSetNSmooths_AGG", */ 1152e68589bSMark F. Adams /* pc_gamg_sa->smooths, */ 1162e68589bSMark F. Adams /* &pc_gamg_sa->smooths, */ 1172e68589bSMark F. Adams /* &flag); */ 1182e68589bSMark F. Adams /* CHKERRQ(ierr); */ 1192e68589bSMark F. Adams } 1202e68589bSMark F. Adams ierr = PetscOptionsTail();CHKERRQ(ierr); 1212e68589bSMark F. Adams 1222e68589bSMark F. Adams if (pc_gamg->verbose) { 123ce94432eSBarry Smith PetscPrintf(PetscObjectComm((PetscObject)pc),"[%d]%s done\n",0,__FUNCT__); 1242e68589bSMark F. Adams } 1252e68589bSMark F. Adams PetscFunctionReturn(0); 1262e68589bSMark F. Adams } 1272e68589bSMark F. Adams 1282e68589bSMark F. Adams /* -------------------------------------------------------------------------- */ 1292e68589bSMark F. Adams /* 1302e68589bSMark F. Adams triangulateAndFormProl 1312e68589bSMark F. Adams 1322e68589bSMark F. Adams Input Parameter: 1332e68589bSMark F. Adams . selected_2 - list of selected local ID, includes selected ghosts 134a2f3521dSMark F. Adams . data_stride - 135a2f3521dSMark F. Adams . coords[2*data_stride] - column vector of local coordinates w/ ghosts 136b43b03e9SMark F. Adams . nselected_1 - selected IDs that go with base (1) graph 1370cbbd2e1SMark F. Adams . clid_lid_1[nselected_1] - lids of selected (c) nodes ??????????? 1380cbbd2e1SMark F. Adams . agg_lists_1 - list of aggregates 1392e68589bSMark F. Adams . crsGID[selected.size()] - global index for prolongation operator 1402e68589bSMark F. Adams . bs - block size 1412e68589bSMark F. Adams Output Parameter: 1422e68589bSMark F. Adams . a_Prol - prolongation operator 1432e68589bSMark F. Adams . a_worst_best - measure of worst missed fine vertex, 0 is no misses 1442e68589bSMark F. Adams */ 1452e68589bSMark F. Adams #undef __FUNCT__ 1462e68589bSMark F. Adams #define __FUNCT__ "triangulateAndFormProl" 1470cbbd2e1SMark F. Adams static PetscErrorCode triangulateAndFormProl(IS selected_2, /* list of selected local ID, includes selected ghosts */ 148a2f3521dSMark F. Adams const PetscInt data_stride, 1492e68589bSMark F. Adams const PetscReal coords[], /* column vector of local coordinates w/ ghosts */ 150b43b03e9SMark F. Adams const PetscInt nselected_1, /* list of selected local ID, includes selected ghosts */ 151b43b03e9SMark F. Adams const PetscInt clid_lid_1[], 1520cbbd2e1SMark F. Adams const PetscCoarsenData *agg_lists_1, /* selected_1 vertices of aggregate unselected vertices */ 1532e68589bSMark F. Adams const PetscInt crsGID[], 1542e68589bSMark F. Adams const PetscInt bs, 1552e68589bSMark F. Adams Mat a_Prol, /* prolongation operator (output) */ 1561147fc2aSKarl Rupp PetscReal *a_worst_best) /* measure of worst missed fine vertex, 0 is no misses */ 1572e68589bSMark F. Adams { 1582e68589bSMark F. Adams #if defined(PETSC_HAVE_TRIANGLE) 1592e68589bSMark F. Adams PetscErrorCode ierr; 160b43b03e9SMark F. Adams PetscInt jj,tid,tt,idx,nselected_2; 1612e68589bSMark F. Adams struct triangulateio in,mid; 1620cbbd2e1SMark F. Adams const PetscInt *selected_idx_2; 163*73911c69SBarry Smith PetscMPIInt rank; 1642e68589bSMark F. Adams PetscInt Istart,Iend,nFineLoc,myFine0; 1652e68589bSMark F. Adams int kk,nPlotPts,sid; 1663b4367a7SBarry Smith MPI_Comm comm; 167c8b0795cSMark F. Adams PetscReal tm; 168c8b0795cSMark F. Adams 1696e111a19SKarl Rupp PetscFunctionBegin; 1703b4367a7SBarry Smith ierr = PetscObjectGetComm((PetscObject)a_Prol,&comm);CHKERRQ(ierr); 1713b4367a7SBarry Smith ierr = MPI_Comm_rank(comm,&rank);CHKERRQ(ierr); 172c8b0795cSMark F. Adams ierr = ISGetSize(selected_2, &nselected_2);CHKERRQ(ierr); 1732e68589bSMark F. Adams if (nselected_2 == 1 || nselected_2 == 2) { /* 0 happens on idle processors */ 1742e68589bSMark F. Adams *a_worst_best = 100.0; /* this will cause a stop, but not globalized (should not happen) */ 175806fa848SBarry Smith } else *a_worst_best = 0.0; 1763b4367a7SBarry Smith ierr = MPI_Allreduce(a_worst_best, &tm, 1, MPIU_REAL, MPIU_MAX, comm);CHKERRQ(ierr); 177c8b0795cSMark F. Adams if (tm > 0.0) { 178c8b0795cSMark F. Adams *a_worst_best = 100.0; 1792e68589bSMark F. Adams PetscFunctionReturn(0); 1802e68589bSMark F. Adams } 1812e68589bSMark F. Adams ierr = MatGetOwnershipRange(a_Prol, &Istart, &Iend);CHKERRQ(ierr); 1822e68589bSMark F. Adams nFineLoc = (Iend-Istart)/bs; myFine0 = Istart/bs; 1832e68589bSMark F. Adams nPlotPts = nFineLoc; /* locals */ 1842e68589bSMark F. Adams /* traingle */ 1852e68589bSMark F. Adams /* Define input points - in*/ 1862e68589bSMark F. Adams in.numberofpoints = nselected_2; 1872e68589bSMark F. Adams in.numberofpointattributes = 0; 1882e68589bSMark F. Adams /* get nselected points */ 189785e854fSJed Brown ierr = PetscMalloc1(2*(nselected_2), &in.pointlist);CHKERRQ(ierr); 1902e68589bSMark F. Adams ierr = ISGetIndices(selected_2, &selected_idx_2);CHKERRQ(ierr); 1912e68589bSMark F. Adams 1922e68589bSMark F. Adams for (kk=0,sid=0; kk<nselected_2; kk++,sid += 2) { 1932e68589bSMark F. Adams PetscInt lid = selected_idx_2[kk]; 1942e68589bSMark F. Adams in.pointlist[sid] = coords[lid]; 195a2f3521dSMark F. Adams in.pointlist[sid+1] = coords[data_stride + lid]; 1962e68589bSMark F. Adams if (lid>=nFineLoc) nPlotPts++; 1972e68589bSMark F. Adams } 19871959b99SBarry Smith if (sid != 2*nselected_2) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"sid %D != 2*nselected_2 %D",sid,nselected_2); 1992e68589bSMark F. Adams 2002e68589bSMark F. Adams in.numberofsegments = 0; 2012e68589bSMark F. Adams in.numberofedges = 0; 2022e68589bSMark F. Adams in.numberofholes = 0; 2032e68589bSMark F. Adams in.numberofregions = 0; 2042e68589bSMark F. Adams in.trianglelist = 0; 2052e68589bSMark F. Adams in.segmentmarkerlist = 0; 2062e68589bSMark F. Adams in.pointattributelist = 0; 2072e68589bSMark F. Adams in.pointmarkerlist = 0; 2082e68589bSMark F. Adams in.triangleattributelist = 0; 2092e68589bSMark F. Adams in.trianglearealist = 0; 2102e68589bSMark F. Adams in.segmentlist = 0; 2112e68589bSMark F. Adams in.holelist = 0; 2122e68589bSMark F. Adams in.regionlist = 0; 2132e68589bSMark F. Adams in.edgelist = 0; 2142e68589bSMark F. Adams in.edgemarkerlist = 0; 2152e68589bSMark F. Adams in.normlist = 0; 2162fa5cd67SKarl Rupp 2172e68589bSMark F. Adams /* triangulate */ 2182e68589bSMark F. Adams mid.pointlist = 0; /* Not needed if -N switch used. */ 2192e68589bSMark F. Adams /* Not needed if -N switch used or number of point attributes is zero: */ 2202e68589bSMark F. Adams mid.pointattributelist = 0; 2212e68589bSMark F. Adams mid.pointmarkerlist = 0; /* Not needed if -N or -B switch used. */ 2222e68589bSMark F. Adams mid.trianglelist = 0; /* Not needed if -E switch used. */ 2232e68589bSMark F. Adams /* Not needed if -E switch used or number of triangle attributes is zero: */ 2242e68589bSMark F. Adams mid.triangleattributelist = 0; 2252e68589bSMark F. Adams mid.neighborlist = 0; /* Needed only if -n switch used. */ 2262e68589bSMark F. Adams /* Needed only if segments are output (-p or -c) and -P not used: */ 2272e68589bSMark F. Adams mid.segmentlist = 0; 2282e68589bSMark F. Adams /* Needed only if segments are output (-p or -c) and -P and -B not used: */ 2292e68589bSMark F. Adams mid.segmentmarkerlist = 0; 2302e68589bSMark F. Adams mid.edgelist = 0; /* Needed only if -e switch used. */ 2312e68589bSMark F. Adams mid.edgemarkerlist = 0; /* Needed if -e used and -B not used. */ 2322e68589bSMark F. Adams mid.numberoftriangles = 0; 2332e68589bSMark F. Adams 2342e68589bSMark F. Adams /* Triangulate the points. Switches are chosen to read and write a */ 2352e68589bSMark F. Adams /* PSLG (p), preserve the convex hull (c), number everything from */ 2362e68589bSMark F. Adams /* zero (z), assign a regional attribute to each element (A), and */ 2372e68589bSMark F. Adams /* produce an edge list (e), a Voronoi diagram (v), and a triangle */ 2382e68589bSMark F. Adams /* neighbor list (n). */ 2392e68589bSMark F. Adams if (nselected_2 != 0) { /* inactive processor */ 2402e68589bSMark F. Adams char args[] = "npczQ"; /* c is needed ? */ 2412e68589bSMark F. Adams triangulate(args, &in, &mid, (struct triangulateio*) NULL); 2422e68589bSMark F. Adams /* output .poly files for 'showme' */ 2432e68589bSMark F. Adams if (!PETSC_TRUE) { 2442e68589bSMark F. Adams static int level = 1; 2452e68589bSMark F. Adams FILE *file; char fname[32]; 2462e68589bSMark F. Adams 247c5df96a5SBarry Smith sprintf(fname,"C%d_%d.poly",level,rank); file = fopen(fname, "w"); 2482e68589bSMark F. Adams /*First line: <# of vertices> <dimension (must be 2)> <# of attributes> <# of boundary markers (0 or 1)>*/ 2492e68589bSMark F. Adams fprintf(file, "%d %d %d %d\n",in.numberofpoints,2,0,0); 2502e68589bSMark F. Adams /*Following lines: <vertex #> <x> <y> */ 2512e68589bSMark F. Adams for (kk=0,sid=0; kk<in.numberofpoints; kk++,sid += 2) { 2522e68589bSMark F. Adams fprintf(file, "%d %e %e\n",kk,in.pointlist[sid],in.pointlist[sid+1]); 2532e68589bSMark F. Adams } 2542e68589bSMark F. Adams /*One line: <# of segments> <# of boundary markers (0 or 1)> */ 2552e68589bSMark F. Adams fprintf(file, "%d %d\n",0,0); 2562e68589bSMark F. Adams /*Following lines: <segment #> <endpoint> <endpoint> [boundary marker] */ 2572e68589bSMark F. Adams /* One line: <# of holes> */ 2582e68589bSMark F. Adams fprintf(file, "%d\n",0); 2592e68589bSMark F. Adams /* Following lines: <hole #> <x> <y> */ 2602e68589bSMark F. Adams /* Optional line: <# of regional attributes and/or area constraints> */ 2612e68589bSMark F. Adams /* Optional following lines: <region #> <x> <y> <attribute> <maximum area> */ 2622e68589bSMark F. Adams fclose(file); 2632e68589bSMark F. Adams 2642e68589bSMark F. Adams /* elems */ 265c5df96a5SBarry Smith sprintf(fname,"C%d_%d.ele",level,rank); file = fopen(fname, "w"); 2662e68589bSMark F. Adams /* First line: <# of triangles> <nodes per triangle> <# of attributes> */ 2672e68589bSMark F. Adams fprintf(file, "%d %d %d\n",mid.numberoftriangles,3,0); 2682e68589bSMark F. Adams /* Remaining lines: <triangle #> <node> <node> <node> ... [attributes] */ 2692e68589bSMark F. Adams for (kk=0,sid=0; kk<mid.numberoftriangles; kk++,sid += 3) { 2702e68589bSMark F. Adams fprintf(file, "%d %d %d %d\n",kk,mid.trianglelist[sid],mid.trianglelist[sid+1],mid.trianglelist[sid+2]); 2712e68589bSMark F. Adams } 2722e68589bSMark F. Adams fclose(file); 2732e68589bSMark F. Adams 274c5df96a5SBarry Smith sprintf(fname,"C%d_%d.node",level,rank); file = fopen(fname, "w"); 2752e68589bSMark F. Adams /* First line: <# of vertices> <dimension (must be 2)> <# of attributes> <# of boundary markers (0 or 1)> */ 2762e68589bSMark F. Adams /* fprintf(file, "%d %d %d %d\n",in.numberofpoints,2,0,0); */ 2772e68589bSMark F. Adams fprintf(file, "%d %d %d %d\n",nPlotPts,2,0,0); 2782e68589bSMark F. Adams /*Following lines: <vertex #> <x> <y> */ 2792e68589bSMark F. Adams for (kk=0,sid=0; kk<in.numberofpoints; kk++,sid+=2) { 2802e68589bSMark F. Adams fprintf(file, "%d %e %e\n",kk,in.pointlist[sid],in.pointlist[sid+1]); 2812e68589bSMark F. Adams } 2822e68589bSMark F. Adams 2832e68589bSMark F. Adams sid /= 2; 2842e68589bSMark F. Adams for (jj=0; jj<nFineLoc; jj++) { 2852e68589bSMark F. Adams PetscBool sel = PETSC_TRUE; 2862e68589bSMark F. Adams for (kk=0; kk<nselected_2 && sel; kk++) { 2872e68589bSMark F. Adams PetscInt lid = selected_idx_2[kk]; 2882e68589bSMark F. Adams if (lid == jj) sel = PETSC_FALSE; 2892e68589bSMark F. Adams } 2902fa5cd67SKarl Rupp if (sel) fprintf(file, "%d %e %e\n",sid++,coords[jj],coords[data_stride + jj]); 2912e68589bSMark F. Adams } 2922e68589bSMark F. Adams fclose(file); 29371959b99SBarry Smith if (sid != nPlotPts) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"sid %D != nPlotPts %D",sid,nPlotPts); 2942e68589bSMark F. Adams level++; 2952e68589bSMark F. Adams } 2962e68589bSMark F. Adams } 2970cbbd2e1SMark F. Adams #if defined PETSC_GAMG_USE_LOG 2980cbbd2e1SMark F. Adams ierr = PetscLogEventBegin(petsc_gamg_setup_events[FIND_V],0,0,0,0);CHKERRQ(ierr); 2992e68589bSMark F. Adams #endif 3002e68589bSMark F. Adams { /* form P - setup some maps */ 3010cbbd2e1SMark F. Adams PetscInt clid,mm,*nTri,*node_tri; 3022e68589bSMark F. Adams 303785e854fSJed Brown ierr = PetscMalloc1(nselected_2, &node_tri);CHKERRQ(ierr); 304785e854fSJed Brown ierr = PetscMalloc1(nselected_2, &nTri);CHKERRQ(ierr); 3052e68589bSMark F. Adams 3062e68589bSMark F. Adams /* need list of triangles on node */ 3072e68589bSMark F. Adams for (kk=0; kk<nselected_2; kk++) nTri[kk] = 0; 3082e68589bSMark F. Adams for (tid=0,kk=0; tid<mid.numberoftriangles; tid++) { 3092e68589bSMark F. Adams for (jj=0; jj<3; jj++) { 3102e68589bSMark F. Adams PetscInt cid = mid.trianglelist[kk++]; 3112e68589bSMark F. Adams if (nTri[cid] == 0) node_tri[cid] = tid; 3122e68589bSMark F. Adams nTri[cid]++; 3132e68589bSMark F. Adams } 3142e68589bSMark F. Adams } 3152e68589bSMark F. Adams #define EPS 1.e-12 3162e68589bSMark F. Adams /* find points and set prolongation */ 3170cbbd2e1SMark F. Adams for (mm = clid = 0; mm < nFineLoc; mm++) { 318e78576d6SMark F. Adams PetscBool ise; 319e78576d6SMark F. Adams ierr = PetscCDEmptyAt(agg_lists_1,mm,&ise);CHKERRQ(ierr); 320e78576d6SMark F. Adams if (!ise) { 3210cbbd2e1SMark F. Adams const PetscInt lid = mm; 322c41eeb4cSKarl Rupp /* for (clid_iterator=0;clid_iterator<nselected_1;clid_iterator++) { */ 3232e68589bSMark F. Adams PetscScalar AA[3][3]; 3242e68589bSMark F. Adams PetscBLASInt N=3,NRHS=1,LDA=3,IPIV[3],LDB=3,INFO; 32541b27cdeSMark F. Adams PetscCDPos pos; 326e78576d6SMark F. Adams ierr = PetscCDGetHeadPos(agg_lists_1,lid,&pos);CHKERRQ(ierr); 327e78576d6SMark F. Adams while (pos) { 328e78576d6SMark F. Adams PetscInt flid; 329ffc955d6SMark F. Adams ierr = PetscLLNGetID(pos, &flid);CHKERRQ(ierr); 330e78576d6SMark F. Adams ierr = PetscCDGetNextPos(agg_lists_1,lid,&pos);CHKERRQ(ierr); 3310cbbd2e1SMark F. Adams 3322e68589bSMark F. Adams if (flid < nFineLoc) { /* could be a ghost */ 3332e68589bSMark F. Adams PetscInt bestTID = -1; PetscReal best_alpha = 1.e10; 3342e68589bSMark F. Adams const PetscInt fgid = flid + myFine0; 3352e68589bSMark F. Adams /* compute shape function for gid */ 336a2f3521dSMark F. Adams const PetscReal fcoord[3] = {coords[flid],coords[data_stride+flid],1.0}; 3372e68589bSMark F. Adams PetscBool haveit =PETSC_FALSE; PetscScalar alpha[3]; PetscInt clids[3]; 3382fa5cd67SKarl Rupp 3392e68589bSMark F. Adams /* look for it */ 3400cbbd2e1SMark F. Adams for (tid = node_tri[clid], jj=0; 3412e68589bSMark F. Adams jj < 5 && !haveit && tid != -1; 3422e68589bSMark F. Adams jj++) { 3432e68589bSMark F. Adams for (tt=0; tt<3; tt++) { 3442e68589bSMark F. Adams PetscInt cid2 = mid.trianglelist[3*tid + tt]; 3452e68589bSMark F. Adams PetscInt lid2 = selected_idx_2[cid2]; 346a2f3521dSMark F. Adams AA[tt][0] = coords[lid2]; AA[tt][1] = coords[data_stride + lid2]; AA[tt][2] = 1.0; 3472e68589bSMark F. Adams clids[tt] = cid2; /* store for interp */ 3482e68589bSMark F. Adams } 3492e68589bSMark F. Adams 3502e68589bSMark F. Adams for (tt=0; tt<3; tt++) alpha[tt] = (PetscScalar)fcoord[tt]; 3512e68589bSMark F. Adams 3522e68589bSMark F. Adams /* SUBROUTINE DGESV(N, NRHS, A, LDA, IPIV, B, LDB, INFO) */ 3538b83055fSJed Brown PetscStackCallBLAS("LAPACKgesv",LAPACKgesv_(&N, &NRHS, (PetscScalar*)AA, &LDA, IPIV, alpha, &LDB, &INFO)); 3542e68589bSMark F. Adams { 3552e68589bSMark F. Adams PetscBool have=PETSC_TRUE; PetscReal lowest=1.e10; 3562e68589bSMark F. Adams for (tt = 0, idx = 0; tt < 3; tt++) { 3572e68589bSMark F. Adams if (PetscRealPart(alpha[tt]) > (1.0+EPS) || PetscRealPart(alpha[tt]) < -EPS) have = PETSC_FALSE; 3582e68589bSMark F. Adams if (PetscRealPart(alpha[tt]) < lowest) { 3592e68589bSMark F. Adams lowest = PetscRealPart(alpha[tt]); 3602e68589bSMark F. Adams idx = tt; 3612e68589bSMark F. Adams } 3622e68589bSMark F. Adams } 3632e68589bSMark F. Adams haveit = have; 3642e68589bSMark F. Adams } 3652e68589bSMark F. Adams tid = mid.neighborlist[3*tid + idx]; 3662e68589bSMark F. Adams } 3672e68589bSMark F. Adams 3682e68589bSMark F. Adams if (!haveit) { 3692e68589bSMark F. Adams /* brute force */ 3702e68589bSMark F. Adams for (tid=0; tid<mid.numberoftriangles && !haveit; tid++) { 3712e68589bSMark F. Adams for (tt=0; tt<3; tt++) { 3722e68589bSMark F. Adams PetscInt cid2 = mid.trianglelist[3*tid + tt]; 3732e68589bSMark F. Adams PetscInt lid2 = selected_idx_2[cid2]; 374a2f3521dSMark F. Adams AA[tt][0] = coords[lid2]; AA[tt][1] = coords[data_stride + lid2]; AA[tt][2] = 1.0; 3752e68589bSMark F. Adams clids[tt] = cid2; /* store for interp */ 3762e68589bSMark F. Adams } 3772e68589bSMark F. Adams for (tt=0; tt<3; tt++) alpha[tt] = fcoord[tt]; 3782e68589bSMark F. Adams /* SUBROUTINE DGESV(N, NRHS, A, LDA, IPIV, B, LDB, INFO) */ 3798b83055fSJed Brown PetscStackCallBLAS("LAPACKgesv",LAPACKgesv_(&N, &NRHS, (PetscScalar*)AA, &LDA, IPIV, alpha, &LDB, &INFO)); 3802e68589bSMark F. Adams { 3812e68589bSMark F. Adams PetscBool have=PETSC_TRUE; PetscReal worst=0.0, v; 3822e68589bSMark F. Adams for (tt=0; tt<3 && have; tt++) { 3832e68589bSMark F. Adams if (PetscRealPart(alpha[tt]) > 1.0+EPS || PetscRealPart(alpha[tt]) < -EPS) have=PETSC_FALSE; 3842e68589bSMark F. Adams if ((v=PetscAbs(PetscRealPart(alpha[tt])-0.5)) > worst) worst = v; 3852e68589bSMark F. Adams } 3862e68589bSMark F. Adams if (worst < best_alpha) { 3872e68589bSMark F. Adams best_alpha = worst; bestTID = tid; 3882e68589bSMark F. Adams } 3892e68589bSMark F. Adams haveit = have; 3902e68589bSMark F. Adams } 3912e68589bSMark F. Adams } 3922e68589bSMark F. Adams } 3932e68589bSMark F. Adams if (!haveit) { 3942e68589bSMark F. Adams if (best_alpha > *a_worst_best) *a_worst_best = best_alpha; 3952e68589bSMark F. Adams /* use best one */ 3962e68589bSMark F. Adams for (tt=0; tt<3; tt++) { 3972e68589bSMark F. Adams PetscInt cid2 = mid.trianglelist[3*bestTID + tt]; 3982e68589bSMark F. Adams PetscInt lid2 = selected_idx_2[cid2]; 399a2f3521dSMark F. Adams AA[tt][0] = coords[lid2]; AA[tt][1] = coords[data_stride + lid2]; AA[tt][2] = 1.0; 4002e68589bSMark F. Adams clids[tt] = cid2; /* store for interp */ 4012e68589bSMark F. Adams } 4022e68589bSMark F. Adams for (tt=0; tt<3; tt++) alpha[tt] = fcoord[tt]; 4032e68589bSMark F. Adams /* SUBROUTINE DGESV(N, NRHS, A, LDA, IPIV, B, LDB, INFO) */ 4048b83055fSJed Brown PetscStackCallBLAS("LAPACKgesv",LAPACKgesv_(&N, &NRHS, (PetscScalar*)AA, &LDA, IPIV, alpha, &LDB, &INFO)); 4052e68589bSMark F. Adams } 4062e68589bSMark F. Adams 4072e68589bSMark F. Adams /* put in row of P */ 4082e68589bSMark F. Adams for (idx=0; idx<3; idx++) { 4092e68589bSMark F. Adams PetscScalar shp = alpha[idx]; 4102e68589bSMark F. Adams if (PetscAbs(PetscRealPart(shp)) > 1.e-6) { 4112e68589bSMark F. Adams PetscInt cgid = crsGID[clids[idx]]; 4122e68589bSMark F. Adams PetscInt jj = cgid*bs, ii = fgid*bs; /* need to gloalize */ 4132e68589bSMark F. Adams for (tt=0; tt < bs; tt++, ii++, jj++) { 4142e68589bSMark F. Adams ierr = MatSetValues(a_Prol,1,&ii,1,&jj,&shp,INSERT_VALUES);CHKERRQ(ierr); 4152e68589bSMark F. Adams } 4162e68589bSMark F. Adams } 4172e68589bSMark F. Adams } 4182e68589bSMark F. Adams } 4190cbbd2e1SMark F. Adams } /* aggregates iterations */ 4200cbbd2e1SMark F. Adams clid++; 4210cbbd2e1SMark F. Adams } /* a coarse agg */ 4220cbbd2e1SMark F. Adams } /* for all fine nodes */ 4230cbbd2e1SMark F. Adams 4242e68589bSMark F. Adams ierr = ISRestoreIndices(selected_2, &selected_idx_2);CHKERRQ(ierr); 4252e68589bSMark F. Adams ierr = MatAssemblyBegin(a_Prol,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 4262e68589bSMark F. Adams ierr = MatAssemblyEnd(a_Prol,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 4272e68589bSMark F. Adams 4282e68589bSMark F. Adams ierr = PetscFree(node_tri);CHKERRQ(ierr); 4292e68589bSMark F. Adams ierr = PetscFree(nTri);CHKERRQ(ierr); 4302e68589bSMark F. Adams } 4310cbbd2e1SMark F. Adams #if defined PETSC_GAMG_USE_LOG 4320cbbd2e1SMark F. Adams ierr = PetscLogEventEnd(petsc_gamg_setup_events[FIND_V],0,0,0,0);CHKERRQ(ierr); 4332e68589bSMark F. Adams #endif 4342e68589bSMark F. Adams free(mid.trianglelist); 4352e68589bSMark F. Adams free(mid.neighborlist); 4362e68589bSMark F. Adams ierr = PetscFree(in.pointlist);CHKERRQ(ierr); 4372e68589bSMark F. Adams PetscFunctionReturn(0); 4382e68589bSMark F. Adams #else 4393b4367a7SBarry Smith SETERRQ(PetscObjectComm((PetscObject)a_Prol),PETSC_ERR_PLIB,"configure with TRIANGLE to use geometric MG"); 4402e68589bSMark F. Adams #endif 4412e68589bSMark F. Adams } 4422e68589bSMark F. Adams /* -------------------------------------------------------------------------- */ 4432e68589bSMark F. Adams /* 4442e68589bSMark F. Adams getGIDsOnSquareGraph - square graph, get 4452e68589bSMark F. Adams 4462e68589bSMark F. Adams Input Parameter: 4470cbbd2e1SMark F. Adams . nselected_1 - selected local indices (includes ghosts in input Gmat1) 448b43b03e9SMark F. Adams . clid_lid_1 - [nselected_1] lids of selected nodes 4492e68589bSMark F. Adams . Gmat1 - graph that goes with 'selected_1' 4502e68589bSMark F. Adams Output Parameter: 4512e68589bSMark F. Adams . a_selected_2 - selected local indices (includes ghosts in output a_Gmat_2) 4522e68589bSMark F. Adams . a_Gmat_2 - graph that is squared of 'Gmat_1' 4532e68589bSMark F. Adams . a_crsGID[a_selected_2.size()] - map of global IDs of coarse grid nodes 4542e68589bSMark F. Adams */ 4552e68589bSMark F. Adams #undef __FUNCT__ 4562e68589bSMark F. Adams #define __FUNCT__ "getGIDsOnSquareGraph" 4572fa5cd67SKarl Rupp static PetscErrorCode getGIDsOnSquareGraph(const PetscInt nselected_1,const PetscInt clid_lid_1[],const Mat Gmat1,IS *a_selected_2,Mat *a_Gmat_2,PetscInt **a_crsGID) 4582e68589bSMark F. Adams { 4592e68589bSMark F. Adams PetscErrorCode ierr; 460*73911c69SBarry Smith PetscMPIInt size; 461b43b03e9SMark F. Adams PetscInt *crsGID, kk,my0,Iend,nloc; 4623b4367a7SBarry Smith MPI_Comm comm; 4632e68589bSMark F. Adams 4642e68589bSMark F. Adams PetscFunctionBegin; 4653b4367a7SBarry Smith ierr = PetscObjectGetComm((PetscObject)Gmat1,&comm);CHKERRQ(ierr); 4663b4367a7SBarry Smith ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 4672e68589bSMark F. Adams ierr = MatGetOwnershipRange(Gmat1,&my0,&Iend);CHKERRQ(ierr); /* AIJ */ 4682e68589bSMark F. Adams nloc = Iend - my0; /* this does not change */ 4692e68589bSMark F. Adams 470c5df96a5SBarry Smith if (size == 1) { /* not much to do in serial */ 471785e854fSJed Brown ierr = PetscMalloc1(nselected_1, &crsGID);CHKERRQ(ierr); 472b43b03e9SMark F. Adams for (kk=0; kk<nselected_1; kk++) crsGID[kk] = kk; 4732e68589bSMark F. Adams *a_Gmat_2 = 0; 474806fa848SBarry Smith ierr = ISCreateGeneral(PETSC_COMM_SELF,nselected_1,clid_lid_1,PETSC_COPY_VALUES,a_selected_2);CHKERRQ(ierr); 475806fa848SBarry Smith } else { 476b43b03e9SMark F. Adams PetscInt idx,num_fine_ghosts,num_crs_ghost,myCrs0; 4772e68589bSMark F. Adams Mat_MPIAIJ *mpimat2; 4782e68589bSMark F. Adams Mat Gmat2; 4792e68589bSMark F. Adams Vec locState; 4802e68589bSMark F. Adams PetscScalar *cpcol_state; 4812e68589bSMark F. Adams 4822e68589bSMark F. Adams /* scan my coarse zero gid, set 'lid_state' with coarse GID */ 483b43b03e9SMark F. Adams kk = nselected_1; 4843b4367a7SBarry Smith MPI_Scan(&kk, &myCrs0, 1, MPIU_INT, MPIU_SUM, comm); 485b43b03e9SMark F. Adams myCrs0 -= nselected_1; 4862e68589bSMark F. Adams 487b43b03e9SMark F. Adams if (a_Gmat_2) { /* output */ 4882e68589bSMark F. Adams /* grow graph to get wider set of selected vertices to cover fine grid, invalidates 'llist' */ 4892e68589bSMark F. Adams ierr = MatTransposeMatMult(Gmat1, Gmat1, MAT_INITIAL_MATRIX, PETSC_DEFAULT, &Gmat2);CHKERRQ(ierr); 4902e68589bSMark F. Adams *a_Gmat_2 = Gmat2; /* output */ 491806fa848SBarry Smith } else Gmat2 = Gmat1; /* use local to get crsGIDs at least */ 4922e68589bSMark F. Adams /* get coarse grid GIDS for selected (locals and ghosts) */ 4932e68589bSMark F. Adams mpimat2 = (Mat_MPIAIJ*)Gmat2->data; 4942a7a6963SBarry Smith ierr = MatCreateVecs(Gmat2, &locState, 0);CHKERRQ(ierr); 4952e68589bSMark F. Adams ierr = VecSet(locState, (PetscScalar)(PetscReal)(-1));CHKERRQ(ierr); /* set with UNKNOWN state */ 496b43b03e9SMark F. Adams for (kk=0; kk<nselected_1; kk++) { 497b43b03e9SMark F. Adams PetscInt fgid = clid_lid_1[kk] + my0; 4982e68589bSMark F. Adams PetscScalar v = (PetscScalar)(kk+myCrs0); 4992e68589bSMark F. Adams ierr = VecSetValues(locState, 1, &fgid, &v, INSERT_VALUES);CHKERRQ(ierr); /* set with PID */ 5002e68589bSMark F. Adams } 5012e68589bSMark F. Adams ierr = VecAssemblyBegin(locState);CHKERRQ(ierr); 5022e68589bSMark F. Adams ierr = VecAssemblyEnd(locState);CHKERRQ(ierr); 5032e68589bSMark F. Adams ierr = VecScatterBegin(mpimat2->Mvctx,locState,mpimat2->lvec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 5042e68589bSMark F. Adams ierr = VecScatterEnd(mpimat2->Mvctx,locState,mpimat2->lvec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 5052e68589bSMark F. Adams ierr = VecGetLocalSize(mpimat2->lvec, &num_fine_ghosts);CHKERRQ(ierr); 5062e68589bSMark F. Adams ierr = VecGetArray(mpimat2->lvec, &cpcol_state);CHKERRQ(ierr); 5072e68589bSMark F. Adams for (kk=0,num_crs_ghost=0; kk<num_fine_ghosts; kk++) { 5082e68589bSMark F. Adams if ((PetscInt)PetscRealPart(cpcol_state[kk]) != -1) num_crs_ghost++; 5092e68589bSMark F. Adams } 510854ce69bSBarry Smith ierr = PetscMalloc1(nselected_1+num_crs_ghost, &crsGID);CHKERRQ(ierr); /* output */ 5112e68589bSMark F. Adams { 5122e68589bSMark F. Adams PetscInt *selected_set; 513854ce69bSBarry Smith ierr = PetscMalloc1(nselected_1+num_crs_ghost, &selected_set);CHKERRQ(ierr); 5142e68589bSMark F. Adams /* do ghost of 'crsGID' */ 515b43b03e9SMark F. Adams for (kk=0,idx=nselected_1; kk<num_fine_ghosts; kk++) { 5162e68589bSMark F. Adams if ((PetscInt)PetscRealPart(cpcol_state[kk]) != -1) { 5172e68589bSMark F. Adams PetscInt cgid = (PetscInt)PetscRealPart(cpcol_state[kk]); 5182e68589bSMark F. Adams selected_set[idx] = nloc + kk; 5192e68589bSMark F. Adams crsGID[idx++] = cgid; 5202e68589bSMark F. Adams } 5212e68589bSMark F. Adams } 52271959b99SBarry Smith if (idx != (nselected_1+num_crs_ghost)) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_PLIB,"idx %D != (nselected_1 %D + num_crs_ghost %D)",idx,nselected_1,num_crs_ghost); 5232e68589bSMark F. Adams ierr = VecRestoreArray(mpimat2->lvec, &cpcol_state);CHKERRQ(ierr); 5242e68589bSMark F. Adams /* do locals in 'crsGID' */ 5252e68589bSMark F. Adams ierr = VecGetArray(locState, &cpcol_state);CHKERRQ(ierr); 5262e68589bSMark F. Adams for (kk=0,idx=0; kk<nloc; kk++) { 5272e68589bSMark F. Adams if ((PetscInt)PetscRealPart(cpcol_state[kk]) != -1) { 5282e68589bSMark F. Adams PetscInt cgid = (PetscInt)PetscRealPart(cpcol_state[kk]); 5292e68589bSMark F. Adams selected_set[idx] = kk; 5302e68589bSMark F. Adams crsGID[idx++] = cgid; 5312e68589bSMark F. Adams } 5322e68589bSMark F. Adams } 53371959b99SBarry Smith if (idx != nselected_1) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"idx %D != nselected_1 %D",idx,nselected_1); 5342e68589bSMark F. Adams ierr = VecRestoreArray(locState, &cpcol_state);CHKERRQ(ierr); 5352e68589bSMark F. Adams 5362e68589bSMark F. Adams if (a_selected_2 != 0) { /* output */ 537806fa848SBarry Smith ierr = ISCreateGeneral(PETSC_COMM_SELF,(nselected_1+num_crs_ghost),selected_set,PETSC_OWN_POINTER,a_selected_2);CHKERRQ(ierr); 538806fa848SBarry Smith } else { 5392e68589bSMark F. Adams ierr = PetscFree(selected_set);CHKERRQ(ierr); 5402e68589bSMark F. Adams } 5410cbbd2e1SMark F. Adams } 5422e68589bSMark F. Adams ierr = VecDestroy(&locState);CHKERRQ(ierr); 5432e68589bSMark F. Adams } 5442e68589bSMark F. Adams *a_crsGID = crsGID; /* output */ 5452e68589bSMark F. Adams PetscFunctionReturn(0); 5462e68589bSMark F. Adams } 5472e68589bSMark F. Adams 5482e68589bSMark F. Adams /* -------------------------------------------------------------------------- */ 5492e68589bSMark F. Adams /* 550fd1112cbSBarry Smith PCGAMGGraph_GEO 5512e68589bSMark F. Adams 5522e68589bSMark F. Adams Input Parameter: 5532e68589bSMark F. Adams . pc - this 5542e68589bSMark F. Adams . Amat - matrix on this fine level 5552e68589bSMark F. Adams Output Parameter: 556c8b0795cSMark F. Adams . a_Gmat 5572e68589bSMark F. Adams */ 5582e68589bSMark F. Adams #undef __FUNCT__ 559fd1112cbSBarry Smith #define __FUNCT__ "PCGAMGGraph_GEO" 560fd1112cbSBarry Smith PetscErrorCode PCGAMGGraph_GEO(PC pc,const Mat Amat,Mat *a_Gmat) 561c8b0795cSMark F. Adams { 562c8b0795cSMark F. Adams PetscErrorCode ierr; 563c8b0795cSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 564c8b0795cSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 565c8b0795cSMark F. Adams const PetscInt verbose = pc_gamg->verbose; 566c8b0795cSMark F. Adams const PetscReal vfilter = pc_gamg->threshold; 5673b4367a7SBarry Smith MPI_Comm comm; 568c8b0795cSMark F. Adams Mat Gmat; 5690cbbd2e1SMark F. Adams PetscBool set,flg,symm; 5706e111a19SKarl Rupp 571c8b0795cSMark F. Adams PetscFunctionBegin; 5723b4367a7SBarry Smith ierr = PetscObjectGetComm((PetscObject)Amat,&comm);CHKERRQ(ierr); 573fd1112cbSBarry Smith ierr = PetscLogEventBegin(PC_GAMGGraph_GEO,0,0,0,0);CHKERRQ(ierr); 574c8b0795cSMark F. Adams 5750cbbd2e1SMark F. Adams ierr = MatIsSymmetricKnown(Amat, &set, &flg);CHKERRQ(ierr); 576263489e9SJed Brown symm = (PetscBool)!(set && flg); 5770cbbd2e1SMark F. Adams 5782d7fac45SMark F. Adams ierr = PCGAMGCreateGraph(Amat, &Gmat);CHKERRQ(ierr); 5792d7fac45SMark F. Adams ierr = PCGAMGFilterGraph(&Gmat, vfilter, symm, verbose);CHKERRQ(ierr); 580c8b0795cSMark F. Adams 581c8b0795cSMark F. Adams *a_Gmat = Gmat; 582fd1112cbSBarry Smith ierr = PetscLogEventEnd(PC_GAMGGraph_GEO,0,0,0,0);CHKERRQ(ierr); 583c8b0795cSMark F. Adams PetscFunctionReturn(0); 584c8b0795cSMark F. Adams } 585c8b0795cSMark F. Adams 586c8b0795cSMark F. Adams /* -------------------------------------------------------------------------- */ 587c8b0795cSMark F. Adams /* 588fd1112cbSBarry Smith PCGAMGCoarsen_GEO 589c8b0795cSMark F. Adams 590c8b0795cSMark F. Adams Input Parameter: 591e0940f08SMark F. Adams . a_pc - this 592e0940f08SMark F. Adams . a_Gmat - graph 593c8b0795cSMark F. Adams Output Parameter: 594c8b0795cSMark F. Adams . a_llist_parent - linked list from selected indices for data locality only 595c8b0795cSMark F. Adams */ 596c8b0795cSMark F. Adams #undef __FUNCT__ 597fd1112cbSBarry Smith #define __FUNCT__ "PCGAMGCoarsen_GEO" 598fd1112cbSBarry Smith PetscErrorCode PCGAMGCoarsen_GEO(PC a_pc,Mat *a_Gmat,PetscCoarsenData **a_llist_parent) 599c8b0795cSMark F. Adams { 600c8b0795cSMark F. Adams PetscErrorCode ierr; 601e0940f08SMark F. Adams PC_MG *mg = (PC_MG*)a_pc->data; 602c8b0795cSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 603c8b0795cSMark F. Adams PetscInt Istart,Iend,nloc,kk,Ii,ncols; 6040cbbd2e1SMark F. Adams IS perm; 605c8b0795cSMark F. Adams GAMGNode *gnodes; 606c8b0795cSMark F. Adams PetscInt *permute; 607e0940f08SMark F. Adams Mat Gmat = *a_Gmat; 6083b4367a7SBarry Smith MPI_Comm comm; 609b43b03e9SMark F. Adams MatCoarsen crs; 610c8b0795cSMark F. Adams 611c8b0795cSMark F. Adams PetscFunctionBegin; 6123b4367a7SBarry Smith ierr = PetscObjectGetComm((PetscObject)a_pc,&comm);CHKERRQ(ierr); 6130cbbd2e1SMark F. Adams ierr = PetscLogEventBegin(PC_GAMGCoarsen_GEO,0,0,0,0);CHKERRQ(ierr); 614c8b0795cSMark F. Adams ierr = MatGetOwnershipRange(Gmat, &Istart, &Iend);CHKERRQ(ierr); 615c8b0795cSMark F. Adams nloc = (Iend-Istart); 616c8b0795cSMark F. Adams 617c8b0795cSMark F. Adams /* create random permutation with sort for geo-mg */ 618785e854fSJed Brown ierr = PetscMalloc1(nloc, &gnodes);CHKERRQ(ierr); 619785e854fSJed Brown ierr = PetscMalloc1(nloc, &permute);CHKERRQ(ierr); 620c8b0795cSMark F. Adams 621c8b0795cSMark F. Adams for (Ii=Istart; Ii<Iend; Ii++) { /* locals only? */ 622c8b0795cSMark F. Adams ierr = MatGetRow(Gmat,Ii,&ncols,0,0);CHKERRQ(ierr); 623c8b0795cSMark F. Adams { 624c8b0795cSMark F. Adams PetscInt lid = Ii - Istart; 625c8b0795cSMark F. Adams gnodes[lid].lid = lid; 626c8b0795cSMark F. Adams gnodes[lid].degree = ncols; 627c8b0795cSMark F. Adams } 628c8b0795cSMark F. Adams ierr = MatRestoreRow(Gmat,Ii,&ncols,0,0);CHKERRQ(ierr); 629c8b0795cSMark F. Adams } 630c8b0795cSMark F. Adams /* randomize */ 631c8b0795cSMark F. Adams srand(1); /* make deterministic */ 632c8b0795cSMark F. Adams if (PETSC_TRUE) { 633c8b0795cSMark F. Adams PetscBool *bIndexSet; 634785e854fSJed Brown ierr = PetscMalloc1(nloc, &bIndexSet);CHKERRQ(ierr); 635c8b0795cSMark F. Adams for (Ii = 0; Ii < nloc; Ii++) bIndexSet[Ii] = PETSC_FALSE; 6362fa5cd67SKarl Rupp for (Ii = 0; Ii < nloc; Ii++) { 637c8b0795cSMark F. Adams PetscInt iSwapIndex = rand()%nloc; 6382fa5cd67SKarl Rupp if (!bIndexSet[iSwapIndex] && iSwapIndex != Ii) { 639c8b0795cSMark F. Adams GAMGNode iTemp = gnodes[iSwapIndex]; 640c8b0795cSMark F. Adams gnodes[iSwapIndex] = gnodes[Ii]; 641c8b0795cSMark F. Adams gnodes[Ii] = iTemp; 642c8b0795cSMark F. Adams bIndexSet[Ii] = PETSC_TRUE; 643c8b0795cSMark F. Adams bIndexSet[iSwapIndex] = PETSC_TRUE; 644c8b0795cSMark F. Adams } 645c8b0795cSMark F. Adams } 646c8b0795cSMark F. Adams ierr = PetscFree(bIndexSet);CHKERRQ(ierr); 647c8b0795cSMark F. Adams } 648c8b0795cSMark F. Adams /* only sort locals */ 6490cbbd2e1SMark F. Adams qsort(gnodes, nloc, sizeof(GAMGNode), petsc_geo_mg_compare); 650c8b0795cSMark F. Adams /* create IS of permutation */ 6512fa5cd67SKarl Rupp for (kk=0; kk<nloc; kk++) permute[kk] = gnodes[kk].lid; /* locals only */ 652806fa848SBarry Smith ierr = ISCreateGeneral(PETSC_COMM_SELF, nloc, permute, PETSC_OWN_POINTER, &perm);CHKERRQ(ierr); 653c8b0795cSMark F. Adams 654c8b0795cSMark F. Adams ierr = PetscFree(gnodes);CHKERRQ(ierr); 655c8b0795cSMark F. Adams 656c8b0795cSMark F. Adams /* get MIS aggs */ 657b43b03e9SMark F. Adams 6583b4367a7SBarry Smith ierr = MatCoarsenCreate(comm, &crs);CHKERRQ(ierr); 659b43b03e9SMark F. Adams ierr = MatCoarsenSetType(crs, MATCOARSENMIS);CHKERRQ(ierr); 660b43b03e9SMark F. Adams ierr = MatCoarsenSetGreedyOrdering(crs, perm);CHKERRQ(ierr); 661b43b03e9SMark F. Adams ierr = MatCoarsenSetAdjacency(crs, Gmat);CHKERRQ(ierr); 662b43b03e9SMark F. Adams ierr = MatCoarsenSetVerbose(crs, pc_gamg->verbose);CHKERRQ(ierr); 663b43b03e9SMark F. Adams ierr = MatCoarsenSetStrictAggs(crs, PETSC_FALSE);CHKERRQ(ierr); 664b43b03e9SMark F. Adams ierr = MatCoarsenApply(crs);CHKERRQ(ierr); 6650cbbd2e1SMark F. Adams ierr = MatCoarsenGetData(crs, a_llist_parent);CHKERRQ(ierr); 666b43b03e9SMark F. Adams ierr = MatCoarsenDestroy(&crs);CHKERRQ(ierr); 667c8b0795cSMark F. Adams 668c8b0795cSMark F. Adams ierr = ISDestroy(&perm);CHKERRQ(ierr); 6690cbbd2e1SMark F. Adams ierr = PetscLogEventEnd(PC_GAMGCoarsen_GEO,0,0,0,0);CHKERRQ(ierr); 670c8b0795cSMark F. Adams PetscFunctionReturn(0); 671c8b0795cSMark F. Adams } 672c8b0795cSMark F. Adams 673c8b0795cSMark F. Adams /* -------------------------------------------------------------------------- */ 674c8b0795cSMark F. Adams /* 6750cbbd2e1SMark F. Adams PCGAMGProlongator_GEO 676c8b0795cSMark F. Adams 677c8b0795cSMark F. Adams Input Parameter: 678c8b0795cSMark F. Adams . pc - this 679c8b0795cSMark F. Adams . Amat - matrix on this fine level 680c8b0795cSMark F. Adams . Graph - used to get ghost data for nodes in 6810cbbd2e1SMark F. Adams . selected_1 - [nselected] 6820cbbd2e1SMark F. Adams . agg_lists - [nselected] 683c8b0795cSMark F. Adams Output Parameter: 684c8b0795cSMark F. Adams . a_P_out - prolongation operator to the next level 685c8b0795cSMark F. Adams */ 686c8b0795cSMark F. Adams #undef __FUNCT__ 6870cbbd2e1SMark F. Adams #define __FUNCT__ "PCGAMGProlongator_GEO" 6882fa5cd67SKarl Rupp PetscErrorCode PCGAMGProlongator_GEO(PC pc,const Mat Amat,const Mat Gmat,PetscCoarsenData *agg_lists,Mat *a_P_out) 6892e68589bSMark F. Adams { 6902e68589bSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 6912e68589bSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 6922e68589bSMark F. Adams const PetscInt verbose = pc_gamg->verbose; 693c8b0795cSMark F. Adams const PetscInt dim = pc_gamg->data_cell_cols, data_cols = pc_gamg->data_cell_cols; 6942e68589bSMark F. Adams PetscErrorCode ierr; 695b43b03e9SMark F. Adams PetscInt Istart,Iend,nloc,my0,jj,kk,ncols,nLocalSelected,bs,*clid_flid; 696c8b0795cSMark F. Adams Mat Prol; 697c5df96a5SBarry Smith PetscMPIInt rank, size; 6983b4367a7SBarry Smith MPI_Comm comm; 6990cbbd2e1SMark F. Adams IS selected_2,selected_1; 7002e68589bSMark F. Adams const PetscInt *selected_idx; 7012e68589bSMark F. Adams 7022e68589bSMark F. Adams PetscFunctionBegin; 7033b4367a7SBarry Smith ierr = PetscObjectGetComm((PetscObject)Amat,&comm);CHKERRQ(ierr); 7040cbbd2e1SMark F. Adams ierr = PetscLogEventBegin(PC_GAMGProlongator_GEO,0,0,0,0);CHKERRQ(ierr); 7053b4367a7SBarry Smith ierr = MPI_Comm_rank(comm,&rank);CHKERRQ(ierr); 7063b4367a7SBarry Smith ierr = MPI_Comm_size(comm,&size);CHKERRQ(ierr); 7072e68589bSMark F. Adams ierr = MatGetOwnershipRange(Amat, &Istart, &Iend);CHKERRQ(ierr); 7082e68589bSMark F. Adams ierr = MatGetBlockSize(Amat, &bs);CHKERRQ(ierr); 70971959b99SBarry Smith nloc = (Iend-Istart)/bs; my0 = Istart/bs; 71071959b99SBarry Smith if ((Iend-Istart) % bs) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_PLIB,"(Iend %D - Istart %D) % bs %D",Iend,Istart,bs); 7112e68589bSMark F. Adams 7122e68589bSMark F. Adams /* get 'nLocalSelected' */ 71341b27cdeSMark F. Adams ierr = PetscCDGetMIS(agg_lists, &selected_1);CHKERRQ(ierr); 714b43b03e9SMark F. Adams ierr = ISGetSize(selected_1, &jj);CHKERRQ(ierr); 715785e854fSJed Brown ierr = PetscMalloc1(jj, &clid_flid);CHKERRQ(ierr); 7162e68589bSMark F. Adams ierr = ISGetIndices(selected_1, &selected_idx);CHKERRQ(ierr); 717c8b0795cSMark F. Adams for (kk=0,nLocalSelected=0; kk<jj; kk++) { 7182e68589bSMark F. Adams PetscInt lid = selected_idx[kk]; 719b43b03e9SMark F. Adams if (lid<nloc) { 7200cbbd2e1SMark F. Adams ierr = MatGetRow(Gmat,lid+my0,&ncols,0,0);CHKERRQ(ierr); 7212fa5cd67SKarl Rupp if (ncols>1) clid_flid[nLocalSelected++] = lid; /* fiter out singletons */ 7220cbbd2e1SMark F. Adams ierr = MatRestoreRow(Gmat,lid+my0,&ncols,0,0);CHKERRQ(ierr); 723b43b03e9SMark F. Adams } 7242e68589bSMark F. Adams } 7252e68589bSMark F. Adams ierr = ISRestoreIndices(selected_1, &selected_idx);CHKERRQ(ierr); 726a2f3521dSMark F. Adams ierr = ISDestroy(&selected_1);CHKERRQ(ierr); /* this is selected_1 in serial */ 7272e68589bSMark F. Adams 7282e68589bSMark F. Adams /* create prolongator, create P matrix */ 7293b4367a7SBarry Smith ierr = MatCreate(comm, &Prol);CHKERRQ(ierr); 730806fa848SBarry Smith ierr = MatSetSizes(Prol,nloc*bs,nLocalSelected*bs,PETSC_DETERMINE,PETSC_DETERMINE);CHKERRQ(ierr); 731a2f3521dSMark F. Adams ierr = MatSetBlockSizes(Prol, bs, bs);CHKERRQ(ierr); 732a2f3521dSMark F. Adams ierr = MatSetType(Prol, MATAIJ);CHKERRQ(ierr); 7330298fd71SBarry Smith ierr = MatSeqAIJSetPreallocation(Prol,3*data_cols,NULL);CHKERRQ(ierr); 7340298fd71SBarry Smith ierr = MatMPIAIJSetPreallocation(Prol,3*data_cols,NULL,3*data_cols,NULL);CHKERRQ(ierr); 7353b4367a7SBarry Smith /* ierr = MatCreateAIJ(comm, */ 736a2f3521dSMark F. Adams /* nloc*bs, nLocalSelected*bs, */ 737a2f3521dSMark F. Adams /* PETSC_DETERMINE, PETSC_DETERMINE, */ 7380298fd71SBarry Smith /* 3*data_cols, NULL, */ 7390298fd71SBarry Smith /* 3*data_cols, NULL, */ 740a2f3521dSMark F. Adams /* &Prol); */ 741a2f3521dSMark F. Adams /* CHKERRQ(ierr); */ 7422e68589bSMark F. Adams 743c8b0795cSMark F. Adams /* can get all points "removed" - but not on geomg */ 7442e68589bSMark F. Adams ierr = MatGetSize(Prol, &kk, &jj);CHKERRQ(ierr); 7452e68589bSMark F. Adams if (jj==0) { 7463b4367a7SBarry Smith if (verbose) PetscPrintf(comm,"[%d]%s ERROE: no selected points on coarse grid\n",rank,__FUNCT__); 747b43b03e9SMark F. Adams ierr = PetscFree(clid_flid);CHKERRQ(ierr); 7482e68589bSMark F. Adams ierr = MatDestroy(&Prol);CHKERRQ(ierr); 7490298fd71SBarry Smith *a_P_out = NULL; /* out */ 7502e68589bSMark F. Adams PetscFunctionReturn(0); 7512e68589bSMark F. Adams } 7522e68589bSMark F. Adams 7532e68589bSMark F. Adams { 7542e68589bSMark F. Adams PetscReal *coords; 755a2f3521dSMark F. Adams PetscInt data_stride; 7560298fd71SBarry Smith PetscInt *crsGID = NULL; 7572e68589bSMark F. Adams Mat Gmat2; 7582e68589bSMark F. Adams 75971959b99SBarry Smith if (dim != data_cols) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_PLIB,"dim %D != data_cols %D",dim,data_cols); 7602e68589bSMark F. Adams /* grow ghost data for better coarse grid cover of fine grid */ 7610cbbd2e1SMark F. Adams #if defined PETSC_GAMG_USE_LOG 7620cbbd2e1SMark F. Adams ierr = PetscLogEventBegin(petsc_gamg_setup_events[SET5],0,0,0,0);CHKERRQ(ierr); 7632e68589bSMark F. Adams #endif 764a2f3521dSMark F. Adams /* messy method, squares graph and gets some data */ 765806fa848SBarry Smith ierr = getGIDsOnSquareGraph(nLocalSelected, clid_flid, Gmat, &selected_2, &Gmat2, &crsGID);CHKERRQ(ierr); 7662e68589bSMark F. Adams /* llist is now not valid wrt squared graph, but will work as iterator in 'triangulateAndFormProl' */ 7670cbbd2e1SMark F. Adams #if defined PETSC_GAMG_USE_LOG 7680cbbd2e1SMark F. Adams ierr = PetscLogEventEnd(petsc_gamg_setup_events[SET5],0,0,0,0);CHKERRQ(ierr); 7692e68589bSMark F. Adams #endif 7702e68589bSMark F. Adams /* create global vector of coorindates in 'coords' */ 771c5df96a5SBarry Smith if (size > 1) { 772806fa848SBarry Smith ierr = PCGAMGGetDataWithGhosts(Gmat2, dim, pc_gamg->data, &data_stride, &coords);CHKERRQ(ierr); 773806fa848SBarry Smith } else { 774c8b0795cSMark F. Adams coords = (PetscReal*)pc_gamg->data; 775a2f3521dSMark F. Adams data_stride = pc_gamg->data_sz/pc_gamg->data_cell_cols; 7762e68589bSMark F. Adams } 7772e68589bSMark F. Adams ierr = MatDestroy(&Gmat2);CHKERRQ(ierr); 7782e68589bSMark F. Adams 7792e68589bSMark F. Adams /* triangulate */ 7802e68589bSMark F. Adams if (dim == 2) { 781c8b0795cSMark F. Adams PetscReal metric,tm; 7820cbbd2e1SMark F. Adams #if defined PETSC_GAMG_USE_LOG 7830cbbd2e1SMark F. Adams ierr = PetscLogEventBegin(petsc_gamg_setup_events[SET6],0,0,0,0);CHKERRQ(ierr); 7842e68589bSMark F. Adams #endif 785806fa848SBarry Smith ierr = triangulateAndFormProl(selected_2, data_stride, coords,nLocalSelected, clid_flid, agg_lists, crsGID, bs, Prol, &metric);CHKERRQ(ierr); 7860cbbd2e1SMark F. Adams #if defined PETSC_GAMG_USE_LOG 7870cbbd2e1SMark F. Adams ierr = PetscLogEventEnd(petsc_gamg_setup_events[SET6],0,0,0,0);CHKERRQ(ierr); 7882e68589bSMark F. Adams #endif 7892e68589bSMark F. Adams ierr = PetscFree(crsGID);CHKERRQ(ierr); 7902e68589bSMark F. Adams 7912e68589bSMark F. Adams /* clean up and create coordinates for coarse grid (output) */ 792c5df96a5SBarry Smith if (size > 1) ierr = PetscFree(coords);CHKERRQ(ierr); 7932e68589bSMark F. Adams 7943b4367a7SBarry Smith ierr = MPI_Allreduce(&metric, &tm, 1, MPIU_REAL, MPIU_MAX, comm);CHKERRQ(ierr); 795c8b0795cSMark F. Adams if (tm > 1.) { /* needs to be globalized - should not happen */ 7963b4367a7SBarry Smith if (verbose) PetscPrintf(comm,"[%d]%s failed metric for coarse grid %e\n",rank,__FUNCT__,tm); 7972e68589bSMark F. Adams ierr = MatDestroy(&Prol);CHKERRQ(ierr); 7980298fd71SBarry Smith Prol = NULL; 799806fa848SBarry Smith } else if (metric > .0) { 8003b4367a7SBarry Smith if (verbose) PetscPrintf(comm,"[%d]%s worst metric for coarse grid = %e\n",rank,__FUNCT__,metric); 8012e68589bSMark F. Adams } 8023b4367a7SBarry Smith } else SETERRQ(comm,PETSC_ERR_PLIB,"3D not implemented for 'geo' AMG"); 8032e68589bSMark F. Adams { /* create next coords - output */ 8042e68589bSMark F. Adams PetscReal *crs_crds; 805785e854fSJed Brown ierr = PetscMalloc1(dim*nLocalSelected, &crs_crds);CHKERRQ(ierr); 8062e68589bSMark F. Adams for (kk=0; kk<nLocalSelected; kk++) { /* grab local select nodes to promote - output */ 807b43b03e9SMark F. Adams PetscInt lid = clid_flid[kk]; 808c8b0795cSMark F. Adams for (jj=0; jj<dim; jj++) crs_crds[jj*nLocalSelected + kk] = pc_gamg->data[jj*nloc + lid]; 8092e68589bSMark F. Adams } 810c8b0795cSMark F. Adams 811c8b0795cSMark F. Adams ierr = PetscFree(pc_gamg->data);CHKERRQ(ierr); 812c8b0795cSMark F. Adams pc_gamg->data = crs_crds; /* out */ 813c8b0795cSMark F. Adams pc_gamg->data_sz = dim*nLocalSelected; 8142e68589bSMark F. Adams } 815a2f3521dSMark F. Adams ierr = ISDestroy(&selected_2);CHKERRQ(ierr); 8162e68589bSMark F. Adams } 817a2f3521dSMark F. Adams 8182e68589bSMark F. Adams *a_P_out = Prol; /* out */ 819b43b03e9SMark F. Adams ierr = PetscFree(clid_flid);CHKERRQ(ierr); 8200cbbd2e1SMark F. Adams ierr = PetscLogEventEnd(PC_GAMGProlongator_GEO,0,0,0,0);CHKERRQ(ierr); 821c8b0795cSMark F. Adams PetscFunctionReturn(0); 822c8b0795cSMark F. Adams } 823c8b0795cSMark F. Adams 8249b8ffb57SJed Brown #undef __FUNCT__ 8259b8ffb57SJed Brown #define __FUNCT__ "PCDestroy_GAMG_GEO" 8269b8ffb57SJed Brown static PetscErrorCode PCDestroy_GAMG_GEO(PC pc) 8279b8ffb57SJed Brown { 8289b8ffb57SJed Brown PetscErrorCode ierr; 8299b8ffb57SJed Brown 8309b8ffb57SJed Brown PetscFunctionBegin; 8319b8ffb57SJed Brown ierr = PetscObjectComposeFunction((PetscObject)pc,"PCSetCoordinates_C",NULL);CHKERRQ(ierr); 8329b8ffb57SJed Brown PetscFunctionReturn(0); 8339b8ffb57SJed Brown } 8349b8ffb57SJed Brown 835c8b0795cSMark F. Adams /* -------------------------------------------------------------------------- */ 836c8b0795cSMark F. Adams /* 837c8b0795cSMark F. Adams PCCreateGAMG_GEO 838c8b0795cSMark F. Adams 839c8b0795cSMark F. Adams Input Parameter: 840c8b0795cSMark F. Adams . pc - 841c8b0795cSMark F. Adams */ 842c8b0795cSMark F. Adams #undef __FUNCT__ 843c8b0795cSMark F. Adams #define __FUNCT__ "PCCreateGAMG_GEO" 844c8b0795cSMark F. Adams PetscErrorCode PCCreateGAMG_GEO(PC pc) 845c8b0795cSMark F. Adams { 846c8b0795cSMark F. Adams PetscErrorCode ierr; 847c8b0795cSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 848c8b0795cSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 849c8b0795cSMark F. Adams 850c8b0795cSMark F. Adams PetscFunctionBegin; 8511ab5ffc9SJed Brown pc_gamg->ops->setfromoptions = PCSetFromOptions_GEO; 8529b8ffb57SJed Brown pc_gamg->ops->destroy = PCDestroy_GAMG_GEO; 853c8b0795cSMark F. Adams /* reset does not do anything; setup not virtual */ 854c8b0795cSMark F. Adams 855c8b0795cSMark F. Adams /* set internal function pointers */ 856fd1112cbSBarry Smith pc_gamg->ops->graph = PCGAMGGraph_GEO; 857fd1112cbSBarry Smith pc_gamg->ops->coarsen = PCGAMGCoarsen_GEO; 8581ab5ffc9SJed Brown pc_gamg->ops->prolongator = PCGAMGProlongator_GEO; 859fd1112cbSBarry Smith pc_gamg->ops->optprolongator = NULL; 8601ab5ffc9SJed Brown pc_gamg->ops->createdefaultdata = PCSetData_GEO; 861c8b0795cSMark F. Adams 862bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCSetCoordinates_C",PCSetCoordinates_GEO);CHKERRQ(ierr); 8632e68589bSMark F. Adams PetscFunctionReturn(0); 8642e68589bSMark F. Adams } 865