12e68589bSMark F. Adams /* 22e68589bSMark F. Adams GAMG geometric-algebric multiogrid PC - Mark Adams 2011 32e68589bSMark F. Adams */ 42e68589bSMark F. Adams 52e68589bSMark F. Adams #include <../src/ksp/pc/impls/gamg/gamg.h> /*I "petscpc.h" I*/ 6b45d2f2cSJed Brown #include <petsc-private/kspimpl.h> 72e68589bSMark F. Adams 82e68589bSMark F. Adams #include <assert.h> 92e68589bSMark F. Adams #include <petscblaslapack.h> 102e68589bSMark F. Adams 112e68589bSMark F. Adams typedef struct { 12c8b0795cSMark F. Adams PetscInt nsmooths; 13c8b0795cSMark F. Adams PetscBool sym_graph; 14ef4ad70eSMark F. Adams PetscBool square_graph; 152e68589bSMark F. Adams }PC_GAMG_AGG; 162e68589bSMark F. Adams 172e68589bSMark F. Adams #undef __FUNCT__ 182e68589bSMark F. Adams #define __FUNCT__ "PCGAMGSetNSmooths" 192e68589bSMark F. Adams /*@ 202e68589bSMark F. Adams PCGAMGSetNSmooths - Set number of smoothing steps (1 is typical) 212e68589bSMark F. Adams 222e68589bSMark F. Adams Not Collective on PC 232e68589bSMark F. Adams 242e68589bSMark F. Adams Input Parameters: 252e68589bSMark F. Adams . pc - the preconditioner context 262e68589bSMark F. Adams 272e68589bSMark F. Adams Options Database Key: 282e68589bSMark F. Adams . -pc_gamg_agg_nsmooths 292e68589bSMark F. Adams 302e68589bSMark F. Adams Level: intermediate 312e68589bSMark F. Adams 322e68589bSMark F. Adams Concepts: Aggregation AMG preconditioner 332e68589bSMark F. Adams 342e68589bSMark F. Adams .seealso: () 352e68589bSMark F. Adams @*/ 362e68589bSMark F. Adams PetscErrorCode PCGAMGSetNSmooths(PC pc, PetscInt n) 372e68589bSMark F. Adams { 382e68589bSMark F. Adams PetscErrorCode ierr; 392e68589bSMark F. Adams 402e68589bSMark F. Adams PetscFunctionBegin; 412e68589bSMark F. Adams PetscValidHeaderSpecific(pc,PC_CLASSID,1); 422e68589bSMark F. Adams ierr = PetscTryMethod(pc,"PCGAMGSetNSmooths_C",(PC,PetscInt),(pc,n));CHKERRQ(ierr); 432e68589bSMark F. Adams PetscFunctionReturn(0); 442e68589bSMark F. Adams } 452e68589bSMark F. Adams 462e68589bSMark F. Adams EXTERN_C_BEGIN 472e68589bSMark F. Adams #undef __FUNCT__ 482e68589bSMark F. Adams #define __FUNCT__ "PCGAMGSetNSmooths_GAMG" 492e68589bSMark F. Adams PetscErrorCode PCGAMGSetNSmooths_GAMG(PC pc, PetscInt n) 502e68589bSMark F. Adams { 512e68589bSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 522e68589bSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 53c8b0795cSMark F. Adams PC_GAMG_AGG *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx; 542e68589bSMark F. Adams 552e68589bSMark F. Adams PetscFunctionBegin; 56c8b0795cSMark F. Adams pc_gamg_agg->nsmooths = n; 57c8b0795cSMark F. Adams PetscFunctionReturn(0); 58c8b0795cSMark F. Adams } 59c8b0795cSMark F. Adams EXTERN_C_END 60c8b0795cSMark F. Adams 61c8b0795cSMark F. Adams #undef __FUNCT__ 62c8b0795cSMark F. Adams #define __FUNCT__ "PCGAMGSetSymGraph" 63c8b0795cSMark F. Adams /*@ 64c8b0795cSMark F. Adams PCGAMGSetSymGraph - 65c8b0795cSMark F. Adams 66c8b0795cSMark F. Adams Not Collective on PC 67c8b0795cSMark F. Adams 68c8b0795cSMark F. Adams Input Parameters: 69c8b0795cSMark F. Adams . pc - the preconditioner context 70c8b0795cSMark F. Adams 71c8b0795cSMark F. Adams Options Database Key: 72c8b0795cSMark F. Adams . -pc_gamg_sym_graph 73c8b0795cSMark F. Adams 74c8b0795cSMark F. Adams Level: intermediate 75c8b0795cSMark F. Adams 76c8b0795cSMark F. Adams Concepts: Aggregation AMG preconditioner 77c8b0795cSMark F. Adams 78c8b0795cSMark F. Adams .seealso: () 79c8b0795cSMark F. Adams @*/ 80c8b0795cSMark F. Adams PetscErrorCode PCGAMGSetSymGraph(PC pc, PetscBool n) 81c8b0795cSMark F. Adams { 82c8b0795cSMark F. Adams PetscErrorCode ierr; 83c8b0795cSMark F. Adams 84c8b0795cSMark F. Adams PetscFunctionBegin; 85c8b0795cSMark F. Adams PetscValidHeaderSpecific(pc,PC_CLASSID,1); 86c8b0795cSMark F. Adams ierr = PetscTryMethod(pc,"PCGAMGSetSymGraph_C",(PC,PetscBool),(pc,n));CHKERRQ(ierr); 87c8b0795cSMark F. Adams PetscFunctionReturn(0); 88c8b0795cSMark F. Adams } 89c8b0795cSMark F. Adams 90c8b0795cSMark F. Adams EXTERN_C_BEGIN 91c8b0795cSMark F. Adams #undef __FUNCT__ 92c8b0795cSMark F. Adams #define __FUNCT__ "PCGAMGSetSymGraph_GAMG" 93c8b0795cSMark F. Adams PetscErrorCode PCGAMGSetSymGraph_GAMG(PC pc, PetscBool n) 94c8b0795cSMark F. Adams { 95c8b0795cSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 96c8b0795cSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 97c8b0795cSMark F. Adams PC_GAMG_AGG *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx; 98c8b0795cSMark F. Adams 99c8b0795cSMark F. Adams PetscFunctionBegin; 100c8b0795cSMark F. Adams pc_gamg_agg->sym_graph = n; 1012e68589bSMark F. Adams PetscFunctionReturn(0); 1022e68589bSMark F. Adams } 1032e68589bSMark F. Adams EXTERN_C_END 1042e68589bSMark F. Adams 105ef4ad70eSMark F. Adams #undef __FUNCT__ 106ef4ad70eSMark F. Adams #define __FUNCT__ "PCGAMGSetSquareGraph" 107ef4ad70eSMark F. Adams /*@ 108ef4ad70eSMark F. Adams PCGAMGSetSquareGraph - 109ef4ad70eSMark F. Adams 110ef4ad70eSMark F. Adams Not Collective on PC 111ef4ad70eSMark F. Adams 112ef4ad70eSMark F. Adams Input Parameters: 113ef4ad70eSMark F. Adams . pc - the preconditioner context 114ef4ad70eSMark F. Adams 115ef4ad70eSMark F. Adams Options Database Key: 116ef4ad70eSMark F. Adams . -pc_gamg_square_graph 117ef4ad70eSMark F. Adams 118ef4ad70eSMark F. Adams Level: intermediate 119ef4ad70eSMark F. Adams 120ef4ad70eSMark F. Adams Concepts: Aggregation AMG preconditioner 121ef4ad70eSMark F. Adams 122ef4ad70eSMark F. Adams .seealso: () 123ef4ad70eSMark F. Adams @*/ 124ef4ad70eSMark F. Adams PetscErrorCode PCGAMGSetSquareGraph(PC pc, PetscBool n) 125ef4ad70eSMark F. Adams { 126ef4ad70eSMark F. Adams PetscErrorCode ierr; 127ef4ad70eSMark F. Adams 128ef4ad70eSMark F. Adams PetscFunctionBegin; 129ef4ad70eSMark F. Adams PetscValidHeaderSpecific(pc,PC_CLASSID,1); 130ef4ad70eSMark F. Adams ierr = PetscTryMethod(pc,"PCGAMGSetSquareGraph_C",(PC,PetscBool),(pc,n));CHKERRQ(ierr); 131ef4ad70eSMark F. Adams PetscFunctionReturn(0); 132ef4ad70eSMark F. Adams } 133ef4ad70eSMark F. Adams 134ef4ad70eSMark F. Adams EXTERN_C_BEGIN 135ef4ad70eSMark F. Adams #undef __FUNCT__ 136ef4ad70eSMark F. Adams #define __FUNCT__ "PCGAMGSetSquareGraph_GAMG" 137ef4ad70eSMark F. Adams PetscErrorCode PCGAMGSetSquareGraph_GAMG(PC pc, PetscBool n) 138ef4ad70eSMark F. Adams { 139ef4ad70eSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 140ef4ad70eSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 141ef4ad70eSMark F. Adams PC_GAMG_AGG *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx; 142ef4ad70eSMark F. Adams 143ef4ad70eSMark F. Adams PetscFunctionBegin; 144ef4ad70eSMark F. Adams pc_gamg_agg->square_graph = n; 145ef4ad70eSMark F. Adams PetscFunctionReturn(0); 146ef4ad70eSMark F. Adams } 147ef4ad70eSMark F. Adams EXTERN_C_END 148ef4ad70eSMark F. Adams 1492e68589bSMark F. Adams /* -------------------------------------------------------------------------- */ 1502e68589bSMark F. Adams /* 1512e68589bSMark F. Adams PCSetFromOptions_GAMG_AGG 1522e68589bSMark F. Adams 1532e68589bSMark F. Adams Input Parameter: 1542e68589bSMark F. Adams . pc - 1552e68589bSMark F. Adams */ 1562e68589bSMark F. Adams #undef __FUNCT__ 1572e68589bSMark F. Adams #define __FUNCT__ "PCSetFromOptions_GAMG_AGG" 1582e68589bSMark F. Adams PetscErrorCode PCSetFromOptions_GAMG_AGG( PC pc ) 1592e68589bSMark F. Adams { 1602e68589bSMark F. Adams PetscErrorCode ierr; 1612e68589bSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 1622e68589bSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 163c8b0795cSMark F. Adams PC_GAMG_AGG *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx; 1642e68589bSMark F. Adams PetscBool flag; 1652e68589bSMark F. Adams 1662e68589bSMark F. Adams PetscFunctionBegin; 1672e68589bSMark F. Adams /* call base class */ 1682e68589bSMark F. Adams ierr = PCSetFromOptions_GAMG( pc ); CHKERRQ(ierr); 1692e68589bSMark F. Adams 1702e68589bSMark F. Adams ierr = PetscOptionsHead("GAMG-AGG options"); CHKERRQ(ierr); 1712e68589bSMark F. Adams { 1722e68589bSMark F. Adams /* -pc_gamg_agg_nsmooths */ 173c8b0795cSMark F. Adams pc_gamg_agg->nsmooths = 0; 1742e68589bSMark F. Adams ierr = PetscOptionsInt("-pc_gamg_agg_nsmooths", 1752e68589bSMark F. Adams "smoothing steps for smoothed aggregation, usually 1 (0)", 1762e68589bSMark F. Adams "PCGAMGSetNSmooths", 177c8b0795cSMark F. Adams pc_gamg_agg->nsmooths, 178c8b0795cSMark F. Adams &pc_gamg_agg->nsmooths, 179c8b0795cSMark F. Adams &flag); 180c8b0795cSMark F. Adams CHKERRQ(ierr); 181c8b0795cSMark F. Adams 182c8b0795cSMark F. Adams /* -pc_gamg_sym_graph */ 183c8b0795cSMark F. Adams pc_gamg_agg->sym_graph = PETSC_FALSE; 184c8b0795cSMark F. Adams ierr = PetscOptionsBool("-pc_gamg_sym_graph", 185581a99e3SJed Brown "Set for asymmetric matrices", 186c8b0795cSMark F. Adams "PCGAMGSetSymGraph", 187c8b0795cSMark F. Adams pc_gamg_agg->sym_graph, 188c8b0795cSMark F. Adams &pc_gamg_agg->sym_graph, 1892e68589bSMark F. Adams &flag); 1902e68589bSMark F. Adams CHKERRQ(ierr); 191ef4ad70eSMark F. Adams 192ef4ad70eSMark F. Adams /* -pc_gamg_square_graph */ 193ef4ad70eSMark F. Adams pc_gamg_agg->square_graph = PETSC_TRUE; 194ef4ad70eSMark F. Adams ierr = PetscOptionsBool("-pc_gamg_square_graph", 1950cbbd2e1SMark F. Adams "For faster coarsening and lower coarse grid complexity", 196ef4ad70eSMark F. Adams "PCGAMGSetSquareGraph", 197ef4ad70eSMark F. Adams pc_gamg_agg->square_graph, 198ef4ad70eSMark F. Adams &pc_gamg_agg->square_graph, 199ef4ad70eSMark F. Adams &flag); 200ef4ad70eSMark F. Adams CHKERRQ(ierr); 2012e68589bSMark F. Adams } 2022e68589bSMark F. Adams ierr = PetscOptionsTail();CHKERRQ(ierr); 2032e68589bSMark F. Adams 2042e68589bSMark F. Adams PetscFunctionReturn(0); 2052e68589bSMark F. Adams } 2062e68589bSMark F. Adams 2072e68589bSMark F. Adams /* -------------------------------------------------------------------------- */ 2082e68589bSMark F. Adams /* 2092e68589bSMark F. Adams PCDestroy_AGG 2102e68589bSMark F. Adams 2112e68589bSMark F. Adams Input Parameter: 2122e68589bSMark F. Adams . pc - 2132e68589bSMark F. Adams */ 2142e68589bSMark F. Adams #undef __FUNCT__ 2152e68589bSMark F. Adams #define __FUNCT__ "PCDestroy_AGG" 2162e68589bSMark F. Adams PetscErrorCode PCDestroy_AGG( PC pc ) 2172e68589bSMark F. Adams { 2182e68589bSMark F. Adams PetscErrorCode ierr; 2192e68589bSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 2202e68589bSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 221c8b0795cSMark F. Adams PC_GAMG_AGG *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx; 2222e68589bSMark F. Adams 2232e68589bSMark F. Adams PetscFunctionBegin; 224c8b0795cSMark F. Adams if( pc_gamg_agg ) { 225c8b0795cSMark F. Adams ierr = PetscFree(pc_gamg_agg);CHKERRQ(ierr); 226c8b0795cSMark F. Adams pc_gamg_agg = 0; 2272e68589bSMark F. Adams } 2282e68589bSMark F. Adams 2292e68589bSMark F. Adams /* call base class */ 2302e68589bSMark F. Adams ierr = PCDestroy_GAMG( pc );CHKERRQ(ierr); 2312e68589bSMark F. Adams 2322e68589bSMark F. Adams PetscFunctionReturn(0); 2332e68589bSMark F. Adams } 2342e68589bSMark F. Adams 2352e68589bSMark F. Adams /* -------------------------------------------------------------------------- */ 2362e68589bSMark F. Adams /* 2372e68589bSMark F. Adams PCSetCoordinates_AGG 238302f38e8SMark F. Adams - collective 2392e68589bSMark F. Adams 2402e68589bSMark F. Adams Input Parameter: 2412e68589bSMark F. Adams . pc - the preconditioner context 242*a2f3521dSMark F. Adams . ndm - dimesion of data (used for dof/vertex for Stokes) 243302f38e8SMark F. Adams . a_nloc - number of vertices local 244302f38e8SMark F. Adams . coords - [a_nloc][ndm] - interleaved coordinate data: {x_0, y_0, z_0, x_1, y_1, ...} 2452e68589bSMark F. Adams */ 2462e68589bSMark F. Adams EXTERN_C_BEGIN 2472e68589bSMark F. Adams #undef __FUNCT__ 2482e68589bSMark F. Adams #define __FUNCT__ "PCSetCoordinates_AGG" 249302f38e8SMark F. Adams PetscErrorCode PCSetCoordinates_AGG( PC pc, PetscInt ndm, PetscInt a_nloc, PetscReal *coords ) 2502e68589bSMark F. Adams { 2512e68589bSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 2522e68589bSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 2532e68589bSMark F. Adams PetscErrorCode ierr; 254*a2f3521dSMark F. Adams PetscInt arrsz,kk,ii,jj,nloc,ndatarows,bs; 255*a2f3521dSMark F. Adams Mat mat = pc->pmat; 256*a2f3521dSMark F. Adams /* MPI_Comm wcomm = ((PetscObject)pc)->comm; */ 2572e68589bSMark F. Adams 2582e68589bSMark F. Adams PetscFunctionBegin; 259*a2f3521dSMark F. Adams PetscValidHeaderSpecific(pc,PC_CLASSID,1); 260*a2f3521dSMark F. Adams PetscValidHeaderSpecific(mat,MAT_CLASSID,1); 261302f38e8SMark F. Adams nloc = a_nloc; 2622e68589bSMark F. Adams 2632e68589bSMark F. Adams /* SA: null space vectors */ 264*a2f3521dSMark F. Adams ierr = MatGetBlockSize( mat, &bs ); CHKERRQ( ierr ); /* this does not work for Stokes */ 265c8b0795cSMark F. Adams if( coords && bs==1 ) pc_gamg->data_cell_cols = 1; /* scalar w/ coords and SA (not needed) */ 266*a2f3521dSMark F. Adams else if( coords ) { 267*a2f3521dSMark F. Adams if(ndm > bs) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_LIB,"degrees of motion %d > block size %d",ndm,bs); 268*a2f3521dSMark F. Adams pc_gamg->data_cell_cols = (ndm==2 ? (bs+1) : (bs+3)); /* elasticity */ 269*a2f3521dSMark F. Adams } 270c8b0795cSMark F. Adams else pc_gamg->data_cell_cols = bs; /* no data, force SA with constant null space vectors */ 271*a2f3521dSMark F. Adams pc_gamg->data_cell_rows = ndatarows = bs; 272*a2f3521dSMark F. Adams assert(pc_gamg->data_cell_cols>0); 273c8b0795cSMark F. Adams arrsz = nloc*pc_gamg->data_cell_rows*pc_gamg->data_cell_cols; 2742e68589bSMark F. Adams 2752e68589bSMark F. Adams /* create data - syntactic sugar that should be refactored at some point */ 2762e68589bSMark F. Adams if (pc_gamg->data==0 || (pc_gamg->data_sz != arrsz)) { 2772e68589bSMark F. Adams ierr = PetscFree( pc_gamg->data ); CHKERRQ(ierr); 278302f38e8SMark F. Adams ierr = PetscMalloc((arrsz+1)*sizeof(PetscReal), &pc_gamg->data ); CHKERRQ(ierr); 279*a2f3521dSMark F. Adams /* pc_gamg->data != null if nloc==0: flag for called */ 2802e68589bSMark F. Adams } 2812e68589bSMark F. Adams /* copy data in - column oriented */ 2822e68589bSMark F. Adams for(kk=0;kk<nloc;kk++){ 283302f38e8SMark F. Adams const PetscInt M = nloc*pc_gamg->data_cell_rows; 284*a2f3521dSMark F. Adams PetscReal *data = &pc_gamg->data[kk*ndatarows]; 285c8b0795cSMark F. Adams if( pc_gamg->data_cell_cols==1 ) *data = 1.0; 2862e68589bSMark F. Adams else { 287*a2f3521dSMark F. Adams for(ii=0;ii<ndatarows;ii++) 288*a2f3521dSMark F. Adams for(jj=0;jj<ndatarows;jj++) 2892e68589bSMark F. Adams if(ii==jj)data[ii*M + jj] = 1.0; /* translational modes */ 2902e68589bSMark F. Adams else data[ii*M + jj] = 0.0; 2912e68589bSMark F. Adams if( coords ) { 2922e68589bSMark F. Adams if( ndm == 2 ){ /* rotational modes */ 2932e68589bSMark F. Adams data += 2*M; 2942e68589bSMark F. Adams data[0] = -coords[2*kk+1]; 2952e68589bSMark F. Adams data[1] = coords[2*kk]; 2962e68589bSMark F. Adams } 2972e68589bSMark F. Adams else { 2982e68589bSMark F. Adams data += 3*M; 2992e68589bSMark F. Adams data[0] = 0.0; data[M+0] = coords[3*kk+2]; data[2*M+0] = -coords[3*kk+1]; 3002e68589bSMark F. Adams data[1] = -coords[3*kk+2]; data[M+1] = 0.0; data[2*M+1] = coords[3*kk]; 3012e68589bSMark F. Adams data[2] = coords[3*kk+1]; data[M+2] = -coords[3*kk]; data[2*M+2] = 0.0; 3022e68589bSMark F. Adams } 3032e68589bSMark F. Adams } 3042e68589bSMark F. Adams } 3052e68589bSMark F. Adams } 3062e68589bSMark F. Adams 3072e68589bSMark F. Adams pc_gamg->data_sz = arrsz; 3082e68589bSMark F. Adams 3092e68589bSMark F. Adams PetscFunctionReturn(0); 3102e68589bSMark F. Adams } 3112e68589bSMark F. Adams EXTERN_C_END 3122e68589bSMark F. Adams 313b43b03e9SMark F. Adams typedef PetscInt NState; 314b43b03e9SMark F. Adams static const NState NOT_DONE=-2; 315b43b03e9SMark F. Adams static const NState DELETED=-1; 316b43b03e9SMark F. Adams static const NState REMOVED=-3; 317b43b03e9SMark F. Adams #define IS_SELECTED(s) (s!=DELETED && s!=NOT_DONE && s!=REMOVED) 318b43b03e9SMark F. Adams 319c8b0795cSMark F. Adams /* -------------------------------------------------------------------------- */ 320c8b0795cSMark F. Adams /* 321b43b03e9SMark F. Adams smoothAggs - greedy grab of with G1 (unsquared graph) -- AIJ specific 322b43b03e9SMark F. Adams - AGG-MG specific: clears singletons out of 'selected_2' 323c8b0795cSMark F. Adams 324c8b0795cSMark F. Adams Input Parameter: 325c8b0795cSMark F. Adams . Gmat_2 - glabal matrix of graph (data not defined) 326c8b0795cSMark F. Adams . Gmat_1 - base graph to grab with 327c8b0795cSMark F. Adams Input/Output Parameter: 3280cbbd2e1SMark F. Adams . aggs_2 - linked list of aggs with gids ) 329c8b0795cSMark F. Adams */ 330c8b0795cSMark F. Adams #undef __FUNCT__ 331c8b0795cSMark F. Adams #define __FUNCT__ "smoothAggs" 3320cbbd2e1SMark F. Adams static PetscErrorCode smoothAggs( const Mat Gmat_2, /* base (squared) graph */ 3330cbbd2e1SMark F. Adams const Mat Gmat_1, /* base graph */ 3340cbbd2e1SMark F. Adams /* const IS selected_2, [nselected local] selected vertices */ 3350cbbd2e1SMark F. Adams PetscCoarsenData *aggs_2 /* [nselected local] global ID of aggregate */ 336c8b0795cSMark F. Adams ) 337c8b0795cSMark F. Adams { 338c8b0795cSMark F. Adams PetscErrorCode ierr; 339c8b0795cSMark F. Adams PetscBool isMPI; 340c8b0795cSMark F. Adams Mat_SeqAIJ *matA_1, *matB_1=0, *matA_2, *matB_2=0; 341c8b0795cSMark F. Adams MPI_Comm wcomm = ((PetscObject)Gmat_2)->comm; 3420cbbd2e1SMark F. Adams PetscMPIInt mype,npe; 3430cbbd2e1SMark F. Adams PetscInt lid,*ii,*idx,ix,Iend,my0,kk,n,j; 344c8b0795cSMark F. Adams Mat_MPIAIJ *mpimat_2 = 0, *mpimat_1=0; 345c8b0795cSMark F. Adams const PetscInt nloc = Gmat_2->rmap->n; 3460cbbd2e1SMark F. Adams PetscScalar *cpcol_1_state,*cpcol_2_state,*cpcol_2_par_orig,*lid_parent_gid; 3470cbbd2e1SMark F. Adams PetscInt *lid_cprowID_1; 348c8b0795cSMark F. Adams NState *lid_state; 3490cbbd2e1SMark F. Adams Vec ghost_par_orig2; 350c8b0795cSMark F. Adams 351c8b0795cSMark F. Adams PetscFunctionBegin; 352c8b0795cSMark F. Adams ierr = MPI_Comm_rank( wcomm, &mype ); CHKERRQ(ierr); 3530cbbd2e1SMark F. Adams ierr = MPI_Comm_size( wcomm, &npe ); CHKERRQ(ierr); 354c8b0795cSMark F. Adams ierr = MatGetOwnershipRange(Gmat_1,&my0,&Iend); CHKERRQ(ierr); 355c8b0795cSMark F. Adams 3560cbbd2e1SMark F. Adams if( PETSC_FALSE ) { 357c8b0795cSMark F. Adams PetscViewer viewer; char fname[32]; static int llev=0; 358c8b0795cSMark F. Adams sprintf(fname,"Gmat2_%d.m",llev++); 359c8b0795cSMark F. Adams PetscViewerASCIIOpen(wcomm,fname,&viewer); 360c8b0795cSMark F. Adams ierr = PetscViewerSetFormat( viewer, PETSC_VIEWER_ASCII_MATLAB); CHKERRQ(ierr); 361c8b0795cSMark F. Adams ierr = MatView(Gmat_2, viewer ); CHKERRQ(ierr); 362c8b0795cSMark F. Adams ierr = PetscViewerDestroy( &viewer ); 363c8b0795cSMark F. Adams } 364c8b0795cSMark F. Adams 365c8b0795cSMark F. Adams /* get submatrices */ 366251f4c67SDmitry Karpeev ierr = PetscObjectTypeCompare( (PetscObject)Gmat_1, MATMPIAIJ, &isMPI ); CHKERRQ(ierr); 367c8b0795cSMark F. Adams if(isMPI) { 368c8b0795cSMark F. Adams /* grab matrix objects */ 369c8b0795cSMark F. Adams mpimat_2 = (Mat_MPIAIJ*)Gmat_2->data; 370c8b0795cSMark F. Adams mpimat_1 = (Mat_MPIAIJ*)Gmat_1->data; 371c8b0795cSMark F. Adams matA_1 = (Mat_SeqAIJ*)mpimat_1->A->data; 372c8b0795cSMark F. Adams matB_1 = (Mat_SeqAIJ*)mpimat_1->B->data; 373c8b0795cSMark F. Adams matA_2 = (Mat_SeqAIJ*)mpimat_2->A->data; 374c8b0795cSMark F. Adams matB_2 = (Mat_SeqAIJ*)mpimat_2->B->data; 375c8b0795cSMark F. Adams 376c8b0795cSMark F. Adams /* force compressed row storage for B matrix in AuxMat */ 377c8b0795cSMark F. Adams matB_1->compressedrow.check = PETSC_TRUE; 378c8b0795cSMark F. Adams ierr = MatCheckCompressedRow(mpimat_1->B,&matB_1->compressedrow,matB_1->i,Gmat_1->rmap->n,-1.0); 379c8b0795cSMark F. Adams CHKERRQ(ierr); 380c8b0795cSMark F. Adams 381c8b0795cSMark F. Adams ierr = PetscMalloc( nloc*sizeof(PetscInt), &lid_cprowID_1 ); CHKERRQ(ierr); 3820cbbd2e1SMark F. Adams for( lid = 0 ; lid < nloc ; lid++ ) lid_cprowID_1[lid] = -1; 383c8b0795cSMark F. Adams for (ix=0; ix<matB_1->compressedrow.nrows; ix++) { 384c8b0795cSMark F. Adams PetscInt lid = matB_1->compressedrow.rindex[ix]; 385c8b0795cSMark F. Adams lid_cprowID_1[lid] = ix; 386c8b0795cSMark F. Adams } 387c8b0795cSMark F. Adams } 388c8b0795cSMark F. Adams else { 389c8b0795cSMark F. Adams matA_1 = (Mat_SeqAIJ*)Gmat_1->data; 390c8b0795cSMark F. Adams matA_2 = (Mat_SeqAIJ*)Gmat_2->data; 3910cbbd2e1SMark F. Adams lid_cprowID_1 = PETSC_NULL; 392c8b0795cSMark F. Adams } 393c8b0795cSMark F. Adams assert( matA_1 && !matA_1->compressedrow.use ); 394c8b0795cSMark F. Adams assert( matB_1==0 || matB_1->compressedrow.use ); 395c8b0795cSMark F. Adams assert( matA_2 && !matA_2->compressedrow.use ); 396c8b0795cSMark F. Adams assert( matB_2==0 || matB_2->compressedrow.use ); 397c8b0795cSMark F. Adams 398c8b0795cSMark F. Adams /* get state of locals and selected gid for deleted */ 399c8b0795cSMark F. Adams ierr = PetscMalloc( nloc*sizeof(NState), &lid_state ); CHKERRQ(ierr); 4000cbbd2e1SMark F. Adams ierr = PetscMalloc( nloc*sizeof(PetscScalar), &lid_parent_gid ); CHKERRQ(ierr); 401c8b0795cSMark F. Adams for( lid = 0 ; lid < nloc ; lid++ ) { 4020cbbd2e1SMark F. Adams lid_parent_gid[lid] = -1.0; 403c8b0795cSMark F. Adams lid_state[lid] = DELETED; 404c8b0795cSMark F. Adams } 4050cbbd2e1SMark F. Adams 4060cbbd2e1SMark F. Adams /* set lid_state */ 4070cbbd2e1SMark F. Adams for( lid = 0 ; lid < nloc ; lid++ ) { 40841b27cdeSMark F. Adams PetscCDPos pos; 409e78576d6SMark F. Adams ierr = PetscCDGetHeadPos(aggs_2,lid,&pos); CHKERRQ(ierr); 410e78576d6SMark F. Adams if( pos ) { 411e78576d6SMark F. Adams PetscInt gid1; 412ffc955d6SMark F. Adams ierr = PetscLLNGetID( pos, &gid1 ); CHKERRQ(ierr); assert(gid1==lid+my0); 4130cbbd2e1SMark F. Adams lid_state[lid] = gid1; 414b43b03e9SMark F. Adams } 415b43b03e9SMark F. Adams } 4160cbbd2e1SMark F. Adams 4170cbbd2e1SMark F. Adams /* map local to selected local, DELETED means a ghost owns it */ 418c8b0795cSMark F. Adams for(lid=kk=0;lid<nloc;lid++){ 419c8b0795cSMark F. Adams NState state = lid_state[lid]; 420c8b0795cSMark F. Adams if( IS_SELECTED(state) ){ 42141b27cdeSMark F. Adams PetscCDPos pos; 422e78576d6SMark F. Adams ierr = PetscCDGetHeadPos(aggs_2,lid,&pos); CHKERRQ(ierr); 423e78576d6SMark F. Adams while(pos){ 424e78576d6SMark F. Adams PetscInt gid1; 425ffc955d6SMark F. Adams ierr = PetscLLNGetID( pos, &gid1 ); CHKERRQ(ierr); 426e78576d6SMark F. Adams ierr = PetscCDGetNextPos(aggs_2,lid,&pos); CHKERRQ(ierr); 427e78576d6SMark F. Adams 4280cbbd2e1SMark F. Adams if( gid1 >= my0 && gid1 < Iend ){ 4290cbbd2e1SMark F. Adams lid_parent_gid[gid1-my0] = (PetscScalar)(lid + my0); 430c8b0795cSMark F. Adams } 431c8b0795cSMark F. Adams } 4320cbbd2e1SMark F. Adams } 4330cbbd2e1SMark F. Adams } 4340cbbd2e1SMark F. Adams /* get 'cpcol_1/2_state' & cpcol_2_par_orig - uses mpimat_1/2->lvec for temp space */ 435c8b0795cSMark F. Adams if (isMPI) { 436c8b0795cSMark F. Adams Vec tempVec; 437c8b0795cSMark F. Adams /* get 'cpcol_1_state' */ 438c8b0795cSMark F. Adams ierr = MatGetVecs( Gmat_1, &tempVec, 0 ); CHKERRQ(ierr); 439c8b0795cSMark F. Adams for(kk=0,j=my0;kk<nloc;kk++,j++){ 440c8b0795cSMark F. Adams PetscScalar v = (PetscScalar)lid_state[kk]; 441c8b0795cSMark F. Adams ierr = VecSetValues( tempVec, 1, &j, &v, INSERT_VALUES ); CHKERRQ(ierr); 442c8b0795cSMark F. Adams } 443c8b0795cSMark F. Adams ierr = VecAssemblyBegin( tempVec ); CHKERRQ(ierr); 444c8b0795cSMark F. Adams ierr = VecAssemblyEnd( tempVec ); CHKERRQ(ierr); 445c8b0795cSMark F. Adams ierr = VecScatterBegin(mpimat_1->Mvctx,tempVec, mpimat_1->lvec,INSERT_VALUES,SCATTER_FORWARD); 446c8b0795cSMark F. Adams CHKERRQ(ierr); 447c8b0795cSMark F. Adams ierr = VecScatterEnd(mpimat_1->Mvctx,tempVec, mpimat_1->lvec,INSERT_VALUES,SCATTER_FORWARD); 448c8b0795cSMark F. Adams CHKERRQ(ierr); 449c8b0795cSMark F. Adams ierr = VecGetArray( mpimat_1->lvec, &cpcol_1_state ); CHKERRQ(ierr); 450c8b0795cSMark F. Adams /* get 'cpcol_2_state' */ 451c8b0795cSMark F. Adams ierr = VecScatterBegin(mpimat_2->Mvctx,tempVec, mpimat_2->lvec,INSERT_VALUES,SCATTER_FORWARD); 452c8b0795cSMark F. Adams CHKERRQ(ierr); 453c8b0795cSMark F. Adams ierr = VecScatterEnd(mpimat_2->Mvctx,tempVec, mpimat_2->lvec,INSERT_VALUES,SCATTER_FORWARD); 454c8b0795cSMark F. Adams CHKERRQ(ierr); 455c8b0795cSMark F. Adams ierr = VecGetArray( mpimat_2->lvec, &cpcol_2_state ); CHKERRQ(ierr); 4560cbbd2e1SMark F. Adams /* get 'cpcol_2_par_orig' */ 4570cbbd2e1SMark F. Adams for(kk=0,j=my0;kk<nloc;kk++,j++){ 4580cbbd2e1SMark F. Adams PetscScalar v = (PetscScalar)lid_parent_gid[kk]; 4590cbbd2e1SMark F. Adams ierr = VecSetValues( tempVec, 1, &j, &v, INSERT_VALUES ); CHKERRQ(ierr); 4600cbbd2e1SMark F. Adams } 4610cbbd2e1SMark F. Adams ierr = VecAssemblyBegin( tempVec ); CHKERRQ(ierr); 4620cbbd2e1SMark F. Adams ierr = VecAssemblyEnd( tempVec ); CHKERRQ(ierr); 4630cbbd2e1SMark F. Adams ierr = VecDuplicate( mpimat_2->lvec, &ghost_par_orig2 ); CHKERRQ(ierr); 4640cbbd2e1SMark F. Adams ierr = VecScatterBegin(mpimat_2->Mvctx,tempVec, ghost_par_orig2,INSERT_VALUES,SCATTER_FORWARD); 4650cbbd2e1SMark F. Adams CHKERRQ(ierr); 4660cbbd2e1SMark F. Adams ierr = VecScatterEnd(mpimat_2->Mvctx,tempVec, ghost_par_orig2,INSERT_VALUES,SCATTER_FORWARD); 4670cbbd2e1SMark F. Adams CHKERRQ(ierr); 4680cbbd2e1SMark F. Adams ierr = VecGetArray( ghost_par_orig2, &cpcol_2_par_orig ); CHKERRQ(ierr); 4690cbbd2e1SMark F. Adams 470c8b0795cSMark F. Adams ierr = VecDestroy( &tempVec ); CHKERRQ(ierr); 471c8b0795cSMark F. Adams } /* ismpi */ 472c8b0795cSMark F. Adams 473c8b0795cSMark F. Adams /* doit */ 474c8b0795cSMark F. Adams for(lid=0;lid<nloc;lid++){ 475c8b0795cSMark F. Adams NState state = lid_state[lid]; 4760cbbd2e1SMark F. Adams if( IS_SELECTED(state) ) { 4770cbbd2e1SMark F. Adams /* steal locals */ 478c8b0795cSMark F. Adams ii = matA_1->i; n = ii[lid+1] - ii[lid]; 479c8b0795cSMark F. Adams idx = matA_1->j + ii[lid]; 480c8b0795cSMark F. Adams for (j=0; j<n; j++) { 4810cbbd2e1SMark F. Adams PetscInt lidj = idx[j], sgid; 482c8b0795cSMark F. Adams NState statej = lid_state[lidj]; 4830cbbd2e1SMark F. Adams if (statej==DELETED && (sgid=(PetscInt)PetscRealPart(lid_parent_gid[lidj])) != lid+my0) { /* steal local */ 4840cbbd2e1SMark F. Adams lid_parent_gid[lidj] = (PetscScalar)(lid+my0); /* send this if sgid is not local */ 4850cbbd2e1SMark F. Adams if( sgid >= my0 && sgid < Iend ){ /* I'm stealing this local from a local sgid */ 4860cbbd2e1SMark F. Adams PetscInt hav=0,slid=sgid-my0,gidj=lidj+my0; 48741b27cdeSMark F. Adams PetscCDPos pos,last=PETSC_NULL; 488c8b0795cSMark F. Adams /* looking for local from local so id_llist_2 works */ 489e78576d6SMark F. Adams ierr = PetscCDGetHeadPos(aggs_2,slid,&pos); CHKERRQ(ierr); 490e78576d6SMark F. Adams while(pos){ 491e78576d6SMark F. Adams PetscInt gid; 492ffc955d6SMark F. Adams ierr = PetscLLNGetID( pos, &gid ); CHKERRQ(ierr); 4930cbbd2e1SMark F. Adams if( gid == gidj ) { 4940cbbd2e1SMark F. Adams assert(last); 49541b27cdeSMark F. Adams ierr = PetscCDRemoveNextNode( aggs_2, slid, last ); CHKERRQ(ierr); 49641b27cdeSMark F. Adams ierr = PetscCDAppendNode( aggs_2, lid, pos ); CHKERRQ(ierr); 4970cbbd2e1SMark F. Adams hav = 1; 498c8b0795cSMark F. Adams break; 499c8b0795cSMark F. Adams } 5000cbbd2e1SMark F. Adams else last = pos; 501e78576d6SMark F. Adams 502e78576d6SMark F. Adams ierr = PetscCDGetNextPos(aggs_2,slid,&pos); CHKERRQ(ierr); 503c8b0795cSMark F. Adams } 504c8b0795cSMark F. Adams if(hav!=1){ 505c8b0795cSMark F. Adams if(hav==0)SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"failed to find adj in 'selected' lists - structurally unsymmetric matrix"); 506c8b0795cSMark F. Adams SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"found node %d times???",hav); 507c8b0795cSMark F. Adams } 508c8b0795cSMark F. Adams } 5090cbbd2e1SMark F. Adams else{ /* I'm stealing this local, owned by a ghost */ 510c8b0795cSMark F. Adams assert(sgid==-1); 51141b27cdeSMark F. Adams ierr = PetscCDAppendID( aggs_2, lid, lidj+my0 ); CHKERRQ(ierr); 512c8b0795cSMark F. Adams } 513c8b0795cSMark F. Adams } 5140cbbd2e1SMark F. Adams } /* local neighbors */ 515c8b0795cSMark F. Adams } 516c8b0795cSMark F. Adams else if( state == DELETED && lid_cprowID_1 ) { 5170cbbd2e1SMark F. Adams PetscInt sgidold = (PetscInt)PetscRealPart(lid_parent_gid[lid]); 518c8b0795cSMark F. Adams /* see if I have a selected ghost neighbor that will steal me */ 519c8b0795cSMark F. Adams if( (ix=lid_cprowID_1[lid]) != -1 ){ 520c8b0795cSMark F. Adams ii = matB_1->compressedrow.i; n = ii[ix+1] - ii[ix]; 521c8b0795cSMark F. Adams idx = matB_1->j + ii[ix]; 522c8b0795cSMark F. Adams for( j=0 ; j<n ; j++ ) { 523c8b0795cSMark F. Adams PetscInt cpid = idx[j]; 524c8b0795cSMark F. Adams NState statej = (NState)PetscRealPart(cpcol_1_state[cpid]); 525c8b0795cSMark F. Adams if( IS_SELECTED(statej) && sgidold != (PetscInt)statej ) { /* ghost will steal this, remove from my list */ 5260cbbd2e1SMark F. Adams lid_parent_gid[lid] = (PetscScalar)statej; /* send who selected */ 5270cbbd2e1SMark F. Adams if( sgidold>=my0 && sgidold<Iend ) { /* this was mine */ 5280cbbd2e1SMark F. Adams PetscInt hav=0,oldslidj=sgidold-my0; 52941b27cdeSMark F. Adams PetscCDPos pos,last=PETSC_NULL; 5300cbbd2e1SMark F. Adams /* remove from 'oldslidj' list */ 531e78576d6SMark F. Adams ierr = PetscCDGetHeadPos(aggs_2,oldslidj,&pos); CHKERRQ(ierr); 532e78576d6SMark F. Adams while( pos ) { 533e78576d6SMark F. Adams PetscInt gid; 534ffc955d6SMark F. Adams ierr = PetscLLNGetID( pos, &gid ); CHKERRQ(ierr); 5350cbbd2e1SMark F. Adams if( lid+my0 == gid ) { 5360cbbd2e1SMark F. Adams /* id_llist_2[lastid] = id_llist_2[flid]; /\* remove lid from oldslidj list *\/ */ 5370cbbd2e1SMark F. Adams assert(last); 53841b27cdeSMark F. Adams ierr = PetscCDRemoveNextNode( aggs_2, oldslidj, last ); CHKERRQ(ierr); 5390cbbd2e1SMark F. Adams /* ghost (PetscScalar)statej will add this later */ 5400cbbd2e1SMark F. Adams hav = 1; 541c8b0795cSMark F. Adams break; 542c8b0795cSMark F. Adams } 5430cbbd2e1SMark F. Adams else last = pos; 544e78576d6SMark F. Adams 545e78576d6SMark F. Adams ierr = PetscCDGetNextPos(aggs_2,oldslidj,&pos); CHKERRQ(ierr); 546c8b0795cSMark F. Adams } 547c8b0795cSMark F. Adams if(hav!=1){ 548c8b0795cSMark F. Adams if(hav==0)SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"failed to find adj in 'selected' lists - structurally unsymmetric matrix"); 549c8b0795cSMark F. Adams SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"found node %d times???",hav); 550c8b0795cSMark F. Adams } 551c8b0795cSMark F. Adams } 5520cbbd2e1SMark F. Adams else { 5530cbbd2e1SMark F. Adams /* ghosts remove this later */ 5540cbbd2e1SMark F. Adams } 555c8b0795cSMark F. Adams } 556c8b0795cSMark F. Adams } 557c8b0795cSMark F. Adams } 558c8b0795cSMark F. Adams } /* selected/deleted */ 559c8b0795cSMark F. Adams } /* node loop */ 560c8b0795cSMark F. Adams 561c8b0795cSMark F. Adams if( isMPI ) { 5620cbbd2e1SMark F. Adams PetscScalar *cpcol_2_parent,*cpcol_2_gid; 5630cbbd2e1SMark F. Adams Vec tempVec,ghostgids2,ghostparents2; 5640cbbd2e1SMark F. Adams PetscInt cpid,nghost_2; 5650cbbd2e1SMark F. Adams GAMGHashTable gid_cpid; 566c8b0795cSMark F. Adams 5670cbbd2e1SMark F. Adams ierr = VecGetSize( mpimat_2->lvec, &nghost_2 ); CHKERRQ(ierr); 568c8b0795cSMark F. Adams ierr = MatGetVecs( Gmat_2, &tempVec, 0 ); CHKERRQ(ierr); 5690cbbd2e1SMark F. Adams 5700cbbd2e1SMark F. Adams /* get 'cpcol_2_parent' */ 571c8b0795cSMark F. Adams for(kk=0,j=my0;kk<nloc;kk++,j++){ 5720cbbd2e1SMark F. Adams ierr = VecSetValues( tempVec, 1, &j, &lid_parent_gid[kk], INSERT_VALUES ); CHKERRQ(ierr); 573c8b0795cSMark F. Adams } 574c8b0795cSMark F. Adams ierr = VecAssemblyBegin( tempVec ); CHKERRQ(ierr); 575c8b0795cSMark F. Adams ierr = VecAssemblyEnd( tempVec ); CHKERRQ(ierr); 5760cbbd2e1SMark F. Adams ierr = VecDuplicate( mpimat_2->lvec, &ghostparents2 ); CHKERRQ(ierr); 5770cbbd2e1SMark F. Adams ierr = VecScatterBegin(mpimat_2->Mvctx,tempVec, ghostparents2,INSERT_VALUES,SCATTER_FORWARD); 578c8b0795cSMark F. Adams CHKERRQ(ierr); 5790cbbd2e1SMark F. Adams ierr = VecScatterEnd(mpimat_2->Mvctx,tempVec, ghostparents2,INSERT_VALUES,SCATTER_FORWARD); 580c8b0795cSMark F. Adams CHKERRQ(ierr); 5810cbbd2e1SMark F. Adams ierr = VecGetArray( ghostparents2, &cpcol_2_parent ); CHKERRQ(ierr); 5820cbbd2e1SMark F. Adams 5830cbbd2e1SMark F. Adams /* get 'cpcol_2_gid' */ 5840cbbd2e1SMark F. Adams for(kk=0,j=my0;kk<nloc;kk++,j++){ 5850cbbd2e1SMark F. Adams PetscScalar v = (PetscScalar)j; 5860cbbd2e1SMark F. Adams ierr = VecSetValues( tempVec, 1, &j, &v, INSERT_VALUES ); CHKERRQ(ierr); 5870cbbd2e1SMark F. Adams } 5880cbbd2e1SMark F. Adams ierr = VecAssemblyBegin( tempVec ); CHKERRQ(ierr); 5890cbbd2e1SMark F. Adams ierr = VecAssemblyEnd( tempVec ); CHKERRQ(ierr); 5900cbbd2e1SMark F. Adams ierr = VecDuplicate( mpimat_2->lvec, &ghostgids2 ); CHKERRQ(ierr); 5910cbbd2e1SMark F. Adams ierr = VecScatterBegin(mpimat_2->Mvctx,tempVec, ghostgids2,INSERT_VALUES,SCATTER_FORWARD); 5920cbbd2e1SMark F. Adams CHKERRQ(ierr); 5930cbbd2e1SMark F. Adams ierr = VecScatterEnd(mpimat_2->Mvctx,tempVec, ghostgids2,INSERT_VALUES,SCATTER_FORWARD); 5940cbbd2e1SMark F. Adams CHKERRQ(ierr); 5950cbbd2e1SMark F. Adams ierr = VecGetArray( ghostgids2, &cpcol_2_gid ); CHKERRQ(ierr); 5960cbbd2e1SMark F. Adams 597c8b0795cSMark F. Adams ierr = VecDestroy( &tempVec ); CHKERRQ(ierr); 598c8b0795cSMark F. Adams 5990cbbd2e1SMark F. Adams /* look for deleted ghosts and add to table */ 6000cbbd2e1SMark F. Adams ierr = GAMGTableCreate( 2*nghost_2, &gid_cpid ); CHKERRQ(ierr); 6010cbbd2e1SMark F. Adams for( cpid = 0 ; cpid < nghost_2 ; cpid++ ) { 6020cbbd2e1SMark F. Adams NState state = (NState)PetscRealPart(cpcol_2_state[cpid]); 6030cbbd2e1SMark F. Adams if( state==DELETED ) { 6040cbbd2e1SMark F. Adams PetscInt sgid_new = (PetscInt)PetscRealPart(cpcol_2_parent[cpid]); 6050cbbd2e1SMark F. Adams PetscInt sgid_old = (PetscInt)PetscRealPart(cpcol_2_par_orig[cpid]); 6060cbbd2e1SMark F. Adams if( sgid_old == -1 && sgid_new != -1 ) { 6070cbbd2e1SMark F. Adams PetscInt gid = (PetscInt)PetscRealPart(cpcol_2_gid[cpid]); 6080cbbd2e1SMark F. Adams ierr = GAMGTableAdd( &gid_cpid, gid, cpid ); CHKERRQ(ierr); 6090cbbd2e1SMark F. Adams } 6100cbbd2e1SMark F. Adams } 6110cbbd2e1SMark F. Adams } 612c8b0795cSMark F. Adams 6130cbbd2e1SMark F. Adams /* look for deleted ghosts and see if they moved - remove it */ 614c8b0795cSMark F. Adams for(lid=0;lid<nloc;lid++){ 615c8b0795cSMark F. Adams NState state = lid_state[lid]; 616c8b0795cSMark F. Adams if( IS_SELECTED(state) ){ 61741b27cdeSMark F. Adams PetscCDPos pos,last=PETSC_NULL; 618c8b0795cSMark F. Adams /* look for deleted ghosts and see if they moved */ 619e78576d6SMark F. Adams ierr = PetscCDGetHeadPos(aggs_2,lid,&pos); CHKERRQ(ierr); 620e78576d6SMark F. Adams while(pos){ 621e78576d6SMark F. Adams PetscInt gid; 622ffc955d6SMark F. Adams ierr = PetscLLNGetID( pos, &gid ); CHKERRQ(ierr); 623e78576d6SMark F. Adams 6240cbbd2e1SMark F. Adams if( gid < my0 || gid >= Iend ) { 6250cbbd2e1SMark F. Adams ierr = GAMGTableFind( &gid_cpid, gid, &cpid ); CHKERRQ(ierr); 6260cbbd2e1SMark F. Adams if( cpid != -1 ) { 6270cbbd2e1SMark F. Adams /* a moved ghost - */ 6280cbbd2e1SMark F. Adams /* id_llist_2[lastid] = id_llist_2[flid]; /\* remove 'flid' from list *\/ */ 62941b27cdeSMark F. Adams ierr = PetscCDRemoveNextNode( aggs_2, lid, last ); CHKERRQ(ierr); 6300cbbd2e1SMark F. Adams } 6310cbbd2e1SMark F. Adams else last = pos; 6320cbbd2e1SMark F. Adams } 6330cbbd2e1SMark F. Adams else last = pos; 634e78576d6SMark F. Adams 635e78576d6SMark F. Adams ierr = PetscCDGetNextPos(aggs_2,lid,&pos); CHKERRQ(ierr); 636c8b0795cSMark F. Adams } /* loop over list of deleted */ 637c8b0795cSMark F. Adams } /* selected */ 638c8b0795cSMark F. Adams } 6390cbbd2e1SMark F. Adams ierr = GAMGTableDestroy( &gid_cpid ); CHKERRQ(ierr); 640c8b0795cSMark F. Adams 6410cbbd2e1SMark F. Adams /* look at ghosts, see if they changed - and it */ 6420cbbd2e1SMark F. Adams for( cpid = 0 ; cpid < nghost_2 ; cpid++ ){ 6430cbbd2e1SMark F. Adams PetscInt sgid_new = (PetscInt)PetscRealPart(cpcol_2_parent[cpid]); 6440cbbd2e1SMark F. Adams if( sgid_new >= my0 && sgid_new < Iend ) { /* this is mine */ 6450cbbd2e1SMark F. Adams PetscInt gid = (PetscInt)PetscRealPart(cpcol_2_gid[cpid]); 6460cbbd2e1SMark F. Adams PetscInt slid_new=sgid_new-my0,hav=0; 64741b27cdeSMark F. Adams PetscCDPos pos; 6480cbbd2e1SMark F. Adams /* search for this gid to see if I have it */ 649e78576d6SMark F. Adams ierr = PetscCDGetHeadPos(aggs_2,slid_new,&pos); CHKERRQ(ierr); 650e78576d6SMark F. Adams while(pos){ 651e78576d6SMark F. Adams PetscInt gidj; 652ffc955d6SMark F. Adams ierr = PetscLLNGetID( pos, &gidj ); CHKERRQ(ierr); 653e78576d6SMark F. Adams ierr = PetscCDGetNextPos(aggs_2,slid_new,&pos); CHKERRQ(ierr); 654e78576d6SMark F. Adams 6550cbbd2e1SMark F. Adams if( gidj == gid ) { hav = 1; break; } 656c8b0795cSMark F. Adams } 657c8b0795cSMark F. Adams if( hav != 1 ){ 658ffc955d6SMark F. Adams /* insert 'flidj' into head of llist */ 65941b27cdeSMark F. Adams ierr = PetscCDAppendID( aggs_2, slid_new, gid ); CHKERRQ(ierr); 660c8b0795cSMark F. Adams } 661c8b0795cSMark F. Adams } 662c8b0795cSMark F. Adams } 663c8b0795cSMark F. Adams 6640cbbd2e1SMark F. Adams ierr = VecRestoreArray( mpimat_1->lvec, &cpcol_1_state ); CHKERRQ(ierr); 6650cbbd2e1SMark F. Adams ierr = VecRestoreArray( mpimat_2->lvec, &cpcol_2_state ); CHKERRQ(ierr); 6660cbbd2e1SMark F. Adams ierr = VecRestoreArray( ghostparents2, &cpcol_2_parent ); CHKERRQ(ierr); 6670cbbd2e1SMark F. Adams ierr = VecRestoreArray( ghostgids2, &cpcol_2_gid ); CHKERRQ(ierr); 668c8b0795cSMark F. Adams ierr = PetscFree( lid_cprowID_1 ); CHKERRQ(ierr); 6690cbbd2e1SMark F. Adams ierr = VecDestroy( &ghostgids2 ); CHKERRQ(ierr); 6700cbbd2e1SMark F. Adams ierr = VecDestroy( &ghostparents2 ); CHKERRQ(ierr); 6710cbbd2e1SMark F. Adams ierr = VecDestroy( &ghost_par_orig2 ); CHKERRQ(ierr); 672c8b0795cSMark F. Adams } 673c8b0795cSMark F. Adams 6740cbbd2e1SMark F. Adams ierr = PetscFree( lid_parent_gid ); CHKERRQ(ierr); 675c8b0795cSMark F. Adams ierr = PetscFree( lid_state ); CHKERRQ(ierr); 676c8b0795cSMark F. Adams 677c8b0795cSMark F. Adams PetscFunctionReturn(0); 678c8b0795cSMark F. Adams } 6792e68589bSMark F. Adams 6802e68589bSMark F. Adams /* -------------------------------------------------------------------------- */ 6812e68589bSMark F. Adams /* 682*a2f3521dSMark F. Adams PCSetData_AGG - called if data is not set with PCSetCoordinates. 683*a2f3521dSMark F. Adams Looks in Mat for near null space. 684*a2f3521dSMark F. Adams Does not work for Stokes 6852e68589bSMark F. Adams 6862e68589bSMark F. Adams Input Parameter: 6872e68589bSMark F. Adams . pc - 688*a2f3521dSMark F. Adams . a_A - matrix to get (near) null space out of. 6892e68589bSMark F. Adams */ 6902e68589bSMark F. Adams #undef __FUNCT__ 6912e68589bSMark F. Adams #define __FUNCT__ "PCSetData_AGG" 692b8cd405aSMark F. Adams PetscErrorCode PCSetData_AGG( PC pc, Mat a_A ) 6932e68589bSMark F. Adams { 6942e68589bSMark F. Adams PetscErrorCode ierr; 695b8cd405aSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 696b8cd405aSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 697b8cd405aSMark F. Adams MatNullSpace mnull; 698b8cd405aSMark F. Adams 6992e68589bSMark F. Adams PetscFunctionBegin; 700b8cd405aSMark F. Adams ierr = MatGetNearNullSpace( a_A, &mnull ); CHKERRQ(ierr); 701b8cd405aSMark F. Adams if( !mnull ) { 702*a2f3521dSMark F. Adams PetscInt bs,NN,MM; 703*a2f3521dSMark F. Adams ierr = MatGetBlockSize( a_A, &bs ); CHKERRQ( ierr ); /* this does not work for Stokes */ 704*a2f3521dSMark F. Adams ierr = MatGetLocalSize( a_A, &MM, &NN ); CHKERRQ( ierr ); 705*a2f3521dSMark F. Adams /* this does not work for Stokes */ 706*a2f3521dSMark F. Adams ierr = PCSetCoordinates_AGG( pc, bs, MM/bs, PETSC_NULL ); CHKERRQ(ierr); 707b8cd405aSMark F. Adams } 708b8cd405aSMark F. Adams else { 709b8cd405aSMark F. Adams PetscReal *nullvec; 710b8cd405aSMark F. Adams PetscBool has_const; 711b8cd405aSMark F. Adams PetscInt i,j,mlocal,nvec,bs; 712b8cd405aSMark F. Adams const Vec *vecs; const PetscScalar *v; 713b8cd405aSMark F. Adams ierr = MatGetLocalSize(a_A,&mlocal,PETSC_NULL);CHKERRQ(ierr); 714b8cd405aSMark F. Adams ierr = MatNullSpaceGetVecs( mnull, &has_const, &nvec, &vecs ); CHKERRQ(ierr); 715b8cd405aSMark F. Adams ierr = PetscMalloc((nvec+!!has_const)*mlocal*sizeof *nullvec,&nullvec);CHKERRQ(ierr); 716b8cd405aSMark F. Adams if (has_const) for (i=0; i<mlocal; i++) nullvec[i] = 1.0; 717b8cd405aSMark F. Adams for (i=0; i<nvec; i++) { 718b8cd405aSMark F. Adams ierr = VecGetArrayRead(vecs[i],&v);CHKERRQ(ierr); 719b8cd405aSMark F. Adams for (j=0; j<mlocal; j++) nullvec[(i+!!has_const)*mlocal + j] = PetscRealPart(v[j]); 720b8cd405aSMark F. Adams ierr = VecRestoreArrayRead(vecs[i],&v);CHKERRQ(ierr); 721b8cd405aSMark F. Adams } 722b8cd405aSMark F. Adams pc_gamg->data = nullvec; 723b8cd405aSMark F. Adams pc_gamg->data_cell_cols = (nvec+!!has_const); 724*a2f3521dSMark F. Adams ierr = MatGetBlockSize( a_A, &bs ); CHKERRQ( ierr ); /* this does not work for Stokes */ 725b8cd405aSMark F. Adams pc_gamg->data_cell_rows = bs; 726b8cd405aSMark F. Adams } 7272e68589bSMark F. Adams PetscFunctionReturn(0); 7282e68589bSMark F. Adams } 7292e68589bSMark F. Adams 7302e68589bSMark F. Adams /* -------------------------------------------------------------------------- */ 7312e68589bSMark F. Adams /* 7322e68589bSMark F. Adams formProl0 7332e68589bSMark F. Adams 7342e68589bSMark F. Adams Input Parameter: 7350cbbd2e1SMark F. Adams . agg_llists - list of arrays with aggregates 7362e68589bSMark F. Adams . bs - block size 7370cbbd2e1SMark F. Adams . nSAvec - column bs of new P 7380cbbd2e1SMark F. Adams . my0crs - global index of start of locals 7392e68589bSMark F. Adams . data_stride - bs*(nloc nodes + ghost nodes) 7402e68589bSMark F. Adams . data_in[data_stride*nSAvec] - local data on fine grid 7412e68589bSMark F. Adams . flid_fgid[data_stride/bs] - make local to global IDs, includes ghosts in 'locals_llist' 7422e68589bSMark F. Adams Output Parameter: 7432e68589bSMark F. Adams . a_data_out - in with fine grid data (w/ghosts), out with coarse grid data 7442e68589bSMark F. Adams . a_Prol - prolongation operator 7452e68589bSMark F. Adams */ 7462e68589bSMark F. Adams #undef __FUNCT__ 7472e68589bSMark F. Adams #define __FUNCT__ "formProl0" 7480cbbd2e1SMark F. Adams static PetscErrorCode formProl0(const PetscCoarsenData *agg_llists,/* list from selected vertices of aggregate unselected vertices */ 7490cbbd2e1SMark F. Adams const PetscInt bs, /* (row) block size */ 7500cbbd2e1SMark F. Adams const PetscInt nSAvec, /* column bs */ 7510cbbd2e1SMark F. Adams const PetscInt my0crs, /* global index of start of locals */ 7520cbbd2e1SMark F. Adams const PetscInt data_stride, /* (nloc+nghost)*bs */ 7530cbbd2e1SMark F. Adams PetscReal data_in[], /* [data_stride][nSAvec] */ 7540cbbd2e1SMark F. Adams const PetscInt flid_fgid[], /* [data_stride/bs] */ 7552e68589bSMark F. Adams PetscReal **a_data_out, 7562e68589bSMark F. Adams Mat a_Prol /* prolongation operator (output)*/ 7572e68589bSMark F. Adams ) 7582e68589bSMark F. Adams { 7592e68589bSMark F. Adams PetscErrorCode ierr; 7600cbbd2e1SMark F. Adams PetscInt Istart,my0,Iend,nloc,clid,flid,aggID,kk,jj,ii,mm,ndone,nSelected,minsz,nghosts,out_data_stride; 7612e68589bSMark F. Adams MPI_Comm wcomm = ((PetscObject)a_Prol)->comm; 7622e68589bSMark F. Adams PetscMPIInt mype, npe; 7632e68589bSMark F. Adams PetscReal *out_data; 76441b27cdeSMark F. Adams PetscCDPos pos; 7650cbbd2e1SMark F. Adams GAMGHashTable fgid_flid; 7660cbbd2e1SMark F. Adams 767797e13b7SMark F. Adams /* #define OUT_AGGS */ 7689057884aSMark F. Adams #ifdef OUT_AGGS 769f7620de1SMatthew G Knepley static PetscInt llev = 0; char fname[32]; FILE *file = PETSC_NULL; PetscInt pM; 7709057884aSMark F. Adams #endif 7712e68589bSMark F. Adams 7722e68589bSMark F. Adams PetscFunctionBegin; 7732e68589bSMark F. Adams ierr = MPI_Comm_rank(wcomm,&mype);CHKERRQ(ierr); 7742e68589bSMark F. Adams ierr = MPI_Comm_size(wcomm,&npe);CHKERRQ(ierr); 7752e68589bSMark F. Adams ierr = MatGetOwnershipRange( a_Prol, &Istart, &Iend ); CHKERRQ(ierr); 7760cbbd2e1SMark F. Adams nloc = (Iend-Istart)/bs; my0 = Istart/bs; assert((Iend-Istart)%bs==0); 7770cbbd2e1SMark F. Adams Iend /= bs; 7780cbbd2e1SMark F. Adams nghosts = data_stride/bs - nloc; 7792e68589bSMark F. Adams 7800cbbd2e1SMark F. Adams ierr = GAMGTableCreate( 2*nghosts, &fgid_flid ); CHKERRQ(ierr); 7810cbbd2e1SMark F. Adams for(kk=0;kk<nghosts;kk++) { 7820cbbd2e1SMark F. Adams ierr = GAMGTableAdd( &fgid_flid, flid_fgid[nloc+kk], nloc+kk ); CHKERRQ(ierr); 7832e68589bSMark F. Adams } 7842e68589bSMark F. Adams 7850cbbd2e1SMark F. Adams #ifdef OUT_AGGS 7860cbbd2e1SMark F. Adams sprintf(fname,"aggs_%d_%d.m",llev++,mype); 7870cbbd2e1SMark F. Adams if(llev==1) { 7880cbbd2e1SMark F. Adams file = fopen(fname,"w"); 7890cbbd2e1SMark F. Adams } 7900cbbd2e1SMark F. Adams MatGetSize( a_Prol, &pM, &jj ); 7910cbbd2e1SMark F. Adams #endif 7920cbbd2e1SMark F. Adams 7930cbbd2e1SMark F. Adams /* count selected -- same as number of cols of P */ 7940cbbd2e1SMark F. Adams for(nSelected=mm=0;mm<nloc;mm++) { 795e78576d6SMark F. Adams PetscBool ise; 796e78576d6SMark F. Adams ierr = PetscCDEmptyAt( agg_llists, mm, &ise ); CHKERRQ(ierr); 797e78576d6SMark F. Adams if( !ise ) nSelected++; 7980cbbd2e1SMark F. Adams } 7990cbbd2e1SMark F. Adams ierr = MatGetOwnershipRangeColumn( a_Prol, &ii, &jj ); CHKERRQ(ierr); 8000cbbd2e1SMark F. Adams assert((ii/nSAvec)==my0crs); assert(nSelected==(jj-ii)/nSAvec); 8010cbbd2e1SMark F. Adams 8022e68589bSMark F. Adams /* aloc space for coarse point data (output) */ 8030cbbd2e1SMark F. Adams out_data_stride = nSelected*nSAvec; 8040cbbd2e1SMark F. Adams ierr = PetscMalloc( out_data_stride*nSAvec*sizeof(PetscReal), &out_data ); CHKERRQ(ierr); 8050cbbd2e1SMark F. Adams for(ii=0;ii<out_data_stride*nSAvec;ii++) { 8060cbbd2e1SMark F. Adams out_data[ii]=1.e300; 8070cbbd2e1SMark F. Adams } 8080cbbd2e1SMark F. Adams *a_data_out = out_data; /* output - stride nSelected*nSAvec */ 8092e68589bSMark F. Adams 8102e68589bSMark F. Adams /* find points and set prolongation */ 811c8b0795cSMark F. Adams minsz = 100; 8122e68589bSMark F. Adams ndone = 0; 8130cbbd2e1SMark F. Adams for( mm = clid = 0 ; mm < nloc ; mm++ ){ 814e78576d6SMark F. Adams ierr = PetscCDSizeAt( agg_llists, mm, &jj ); CHKERRQ(ierr); 815e78576d6SMark F. Adams if( jj > 0 ) { 8160cbbd2e1SMark F. Adams const PetscInt lid = mm, cgid = my0crs + clid; 8170cbbd2e1SMark F. Adams PetscInt cids[100]; /* max bs */ 8180cbbd2e1SMark F. Adams PetscBLASInt asz=jj,M=asz*bs,N=nSAvec,INFO; 8192e68589bSMark F. Adams PetscBLASInt Mdata=M+((N-M>0)?N-M:0),LDA=Mdata,LWORK=N*bs; 8202e68589bSMark F. Adams PetscScalar *qqc,*qqr,*TAU,*WORK; 8212e68589bSMark F. Adams PetscInt *fids; 82265d7b583SSatish Balay PetscReal *data; 8230cbbd2e1SMark F. Adams /* count agg */ 8240cbbd2e1SMark F. Adams if( asz<minsz ) minsz = asz; 8250cbbd2e1SMark F. Adams 8260cbbd2e1SMark F. Adams /* get block */ 8272e68589bSMark F. Adams ierr = PetscMalloc( (Mdata*N)*sizeof(PetscScalar), &qqc ); CHKERRQ(ierr); 8282e68589bSMark F. Adams ierr = PetscMalloc( (M*N)*sizeof(PetscScalar), &qqr ); CHKERRQ(ierr); 8292e68589bSMark F. Adams ierr = PetscMalloc( N*sizeof(PetscScalar), &TAU ); CHKERRQ(ierr); 8302e68589bSMark F. Adams ierr = PetscMalloc( LWORK*sizeof(PetscScalar), &WORK ); CHKERRQ(ierr); 8312e68589bSMark F. Adams ierr = PetscMalloc( M*sizeof(PetscInt), &fids ); CHKERRQ(ierr); 8322e68589bSMark F. Adams 8332e68589bSMark F. Adams aggID = 0; 834e78576d6SMark F. Adams ierr = PetscCDGetHeadPos(agg_llists,lid,&pos); CHKERRQ(ierr); 835e78576d6SMark F. Adams while(pos){ 836e78576d6SMark F. Adams PetscInt gid1; 837ffc955d6SMark F. Adams ierr = PetscLLNGetID( pos, &gid1 ); CHKERRQ(ierr); 838e78576d6SMark F. Adams ierr = PetscCDGetNextPos(agg_llists,lid,&pos); CHKERRQ(ierr); 839e78576d6SMark F. Adams 8400cbbd2e1SMark F. Adams if( gid1 >= my0 && gid1 < Iend ) flid = gid1 - my0; 8410cbbd2e1SMark F. Adams else { 8420cbbd2e1SMark F. Adams ierr = GAMGTableFind( &fgid_flid, gid1, &flid ); CHKERRQ(ierr); 8430cbbd2e1SMark F. Adams assert(flid>=0); 8440cbbd2e1SMark F. Adams } 8452e68589bSMark F. Adams /* copy in B_i matrix - column oriented */ 84665d7b583SSatish Balay data = &data_in[flid*bs]; 8472e68589bSMark F. Adams for( kk = ii = 0; ii < bs ; ii++ ) { 8482e68589bSMark F. Adams for( jj = 0; jj < N ; jj++ ) { 8490cbbd2e1SMark F. Adams PetscReal d = data[jj*data_stride + ii]; 8500cbbd2e1SMark F. Adams qqc[jj*Mdata + aggID*bs + ii] = d; 8512e68589bSMark F. Adams } 8522e68589bSMark F. Adams } 8539057884aSMark F. Adams #ifdef OUT_AGGS 854b2a4f308SMark F. Adams if(llev==1) { 8559057884aSMark F. Adams char str[] = "plot(%e,%e,'r*'), hold on,\n", col[] = "rgbkmc", sim[] = "*os+h>d<vx^"; 8560cbbd2e1SMark F. Adams PetscInt MM,pi,pj; 8570cbbd2e1SMark F. Adams str[12] = col[(clid+17*mype)%6]; str[13] = sim[(clid+17*mype)%11]; 858f7620de1SMatthew G Knepley MM = (PetscInt)(PetscSqrtReal((PetscReal)pM)); 8590cbbd2e1SMark F. Adams pj = gid1/MM; pi = gid1%MM; 860b2a4f308SMark F. Adams fprintf(file,str,(double)pi,(double)pj); 861b2a4f308SMark F. Adams /* fprintf(file,str,data[2*data_stride+1],-data[2*data_stride]); */ 8629057884aSMark F. Adams } 8639057884aSMark F. Adams #endif 8642e68589bSMark F. Adams /* set fine IDs */ 8652e68589bSMark F. Adams for(kk=0;kk<bs;kk++) fids[aggID*bs + kk] = flid_fgid[flid]*bs + kk; 8662e68589bSMark F. Adams 8672e68589bSMark F. Adams aggID++; 8680cbbd2e1SMark F. Adams } 8692e68589bSMark F. Adams 8702e68589bSMark F. Adams /* pad with zeros */ 8712e68589bSMark F. Adams for( ii = asz*bs; ii < Mdata ; ii++ ) { 8722e68589bSMark F. Adams for( jj = 0; jj < N ; jj++, kk++ ) { 8732e68589bSMark F. Adams qqc[jj*Mdata + ii] = .0; 8742e68589bSMark F. Adams } 8752e68589bSMark F. Adams } 8762e68589bSMark F. Adams 8772e68589bSMark F. Adams ndone += aggID; 8782e68589bSMark F. Adams /* QR */ 8792e68589bSMark F. Adams LAPACKgeqrf_( &Mdata, &N, qqc, &LDA, TAU, WORK, &LWORK, &INFO ); 8802e68589bSMark F. Adams if( INFO != 0 ) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"xGEQRS error"); 8812e68589bSMark F. Adams /* get R - column oriented - output B_{i+1} */ 8822e68589bSMark F. Adams { 8832e68589bSMark F. Adams PetscReal *data = &out_data[clid*nSAvec]; 8842e68589bSMark F. Adams for( jj = 0; jj < nSAvec ; jj++ ) { 8852e68589bSMark F. Adams for( ii = 0; ii < nSAvec ; ii++ ) { 8860cbbd2e1SMark F. Adams assert(data[jj*out_data_stride + ii] == 1.e300); 8870cbbd2e1SMark F. Adams if( ii <= jj ) data[jj*out_data_stride + ii] = PetscRealPart(qqc[jj*Mdata + ii]); 8880cbbd2e1SMark F. Adams else data[jj*out_data_stride + ii] = 0.; 8892e68589bSMark F. Adams } 8902e68589bSMark F. Adams } 8912e68589bSMark F. Adams } 8922e68589bSMark F. Adams 8932e68589bSMark F. Adams /* get Q - row oriented */ 8942e68589bSMark F. Adams LAPACKungqr_( &Mdata, &N, &N, qqc, &LDA, TAU, WORK, &LWORK, &INFO ); 8952e68589bSMark F. Adams if( INFO != 0 ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"xORGQR error arg %d",-INFO); 8962e68589bSMark F. Adams 8972e68589bSMark F. Adams for( ii = 0 ; ii < M ; ii++ ){ 8982e68589bSMark F. Adams for( jj = 0 ; jj < N ; jj++ ) { 8992e68589bSMark F. Adams qqr[N*ii + jj] = qqc[jj*Mdata + ii]; 9002e68589bSMark F. Adams } 9012e68589bSMark F. Adams } 9022e68589bSMark F. Adams 9032e68589bSMark F. Adams /* add diagonal block of P0 */ 904c8b0795cSMark F. Adams for(kk=0;kk<N;kk++) { 905c8b0795cSMark F. Adams cids[kk] = N*cgid + kk; /* global col IDs in P0 */ 906c8b0795cSMark F. Adams } 9072e68589bSMark F. Adams ierr = MatSetValues(a_Prol,M,fids,N,cids,qqr,INSERT_VALUES); CHKERRQ(ierr); 9082e68589bSMark F. Adams 9092e68589bSMark F. Adams ierr = PetscFree( qqc ); CHKERRQ(ierr); 9102e68589bSMark F. Adams ierr = PetscFree( qqr ); CHKERRQ(ierr); 9112e68589bSMark F. Adams ierr = PetscFree( TAU ); CHKERRQ(ierr); 9122e68589bSMark F. Adams ierr = PetscFree( WORK ); CHKERRQ(ierr); 9132e68589bSMark F. Adams ierr = PetscFree( fids ); CHKERRQ(ierr); 914b43b03e9SMark F. Adams clid++; 9150cbbd2e1SMark F. Adams } /* coarse agg */ 9160cbbd2e1SMark F. Adams } /* for all fine nodes */ 9170cbbd2e1SMark F. Adams ierr = MatAssemblyBegin(a_Prol,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 9180cbbd2e1SMark F. Adams ierr = MatAssemblyEnd(a_Prol,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 9192e68589bSMark F. Adams 920c8b0795cSMark F. Adams /* ierr = MPI_Allreduce( &ndone, &ii, 1, MPIU_INT, MPIU_SUM, wcomm ); */ 9212e68589bSMark F. Adams /* MatGetSize( a_Prol, &kk, &jj ); */ 922c8b0795cSMark F. Adams /* ierr = MPI_Allreduce( &minsz, &jj, 1, MPIU_INT, MPIU_MIN, wcomm ); */ 923e78576d6SMark F. Adams /* PetscPrintf(wcomm," **** [%d]%s %d total done, %d nodes (%d local done), min agg. size = %d\n",mype,__FUNCT__,ii,kk/bs,ndone,jj); */ 9242e68589bSMark F. Adams 9259057884aSMark F. Adams #ifdef OUT_AGGS 926b2a4f308SMark F. Adams if(llev==1) fclose(file); 9279057884aSMark F. Adams #endif 9280cbbd2e1SMark F. Adams ierr = GAMGTableDestroy( &fgid_flid ); CHKERRQ(ierr); 9292e68589bSMark F. Adams 9302e68589bSMark F. Adams PetscFunctionReturn(0); 9312e68589bSMark F. Adams } 9322e68589bSMark F. Adams 9332e68589bSMark F. Adams /* -------------------------------------------------------------------------- */ 9342e68589bSMark F. Adams /* 935c8b0795cSMark F. Adams PCGAMGgraph_AGG 9362e68589bSMark F. Adams 9372e68589bSMark F. Adams Input Parameter: 9382e68589bSMark F. Adams . pc - this 9392e68589bSMark F. Adams . Amat - matrix on this fine level 9402e68589bSMark F. Adams Output Parameter: 941c8b0795cSMark F. Adams . a_Gmat - 9422e68589bSMark F. Adams */ 9432e68589bSMark F. Adams #undef __FUNCT__ 944c8b0795cSMark F. Adams #define __FUNCT__ "PCGAMGgraph_AGG" 945c8b0795cSMark F. Adams PetscErrorCode PCGAMGgraph_AGG( PC pc, 9462e68589bSMark F. Adams const Mat Amat, 947c8b0795cSMark F. Adams Mat *a_Gmat 948c8b0795cSMark F. Adams ) 949c8b0795cSMark F. Adams { 950c8b0795cSMark F. Adams PetscErrorCode ierr; 951c8b0795cSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 952c8b0795cSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 953c8b0795cSMark F. Adams const PetscInt verbose = pc_gamg->verbose; 954c8b0795cSMark F. Adams const PetscReal vfilter = pc_gamg->threshold; 955c8b0795cSMark F. Adams PC_GAMG_AGG *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx; 956c8b0795cSMark F. Adams PetscMPIInt mype,npe; 957e0940f08SMark F. Adams Mat Gmat; 958c8b0795cSMark F. Adams MPI_Comm wcomm = ((PetscObject)Amat)->comm; 9590cbbd2e1SMark F. Adams PetscBool set,flg,symm; 960c8b0795cSMark F. Adams 961c8b0795cSMark F. Adams PetscFunctionBegin; 9620cbbd2e1SMark F. Adams #if defined PETSC_USE_LOG 9630cbbd2e1SMark F. Adams ierr = PetscLogEventBegin(PC_GAMGGgraph_AGG,0,0,0,0);CHKERRQ(ierr); 9640cbbd2e1SMark F. Adams #endif 965c8b0795cSMark F. Adams ierr = MPI_Comm_rank( wcomm, &mype); CHKERRQ(ierr); 966c8b0795cSMark F. Adams ierr = MPI_Comm_size( wcomm, &npe); CHKERRQ(ierr); 967c8b0795cSMark F. Adams 9680cbbd2e1SMark F. Adams ierr = MatIsSymmetricKnown(Amat, &set, &flg); CHKERRQ(ierr); 969263489e9SJed Brown symm = (PetscBool)(pc_gamg_agg->sym_graph || !(set && flg)); 9700cbbd2e1SMark F. Adams 9712d7fac45SMark F. Adams ierr = PCGAMGCreateGraph( Amat, &Gmat ); CHKERRQ( ierr ); 9722d7fac45SMark F. Adams ierr = PCGAMGFilterGraph( &Gmat, vfilter, symm, verbose ); CHKERRQ( ierr ); 973c8b0795cSMark F. Adams 974e0940f08SMark F. Adams *a_Gmat = Gmat; 975c8b0795cSMark F. Adams 9760cbbd2e1SMark F. Adams #if defined PETSC_USE_LOG 9770cbbd2e1SMark F. Adams ierr = PetscLogEventEnd(PC_GAMGGgraph_AGG,0,0,0,0);CHKERRQ(ierr); 9780cbbd2e1SMark F. Adams #endif 979c8b0795cSMark F. Adams PetscFunctionReturn(0); 980c8b0795cSMark F. Adams } 981c8b0795cSMark F. Adams 982c8b0795cSMark F. Adams /* -------------------------------------------------------------------------- */ 983c8b0795cSMark F. Adams /* 984b43b03e9SMark F. Adams PCGAMGCoarsen_AGG 985c8b0795cSMark F. Adams 986c8b0795cSMark F. Adams Input Parameter: 987e0940f08SMark F. Adams . a_pc - this 988e0940f08SMark F. Adams Input/Output Parameter: 9890cbbd2e1SMark F. Adams . a_Gmat1 - graph on this fine level - coarsening can change this (squares it) 990c8b0795cSMark F. Adams Output Parameter: 9910cbbd2e1SMark F. Adams . agg_lists - list of aggregates 992c8b0795cSMark F. Adams */ 993c8b0795cSMark F. Adams #undef __FUNCT__ 994b43b03e9SMark F. Adams #define __FUNCT__ "PCGAMGCoarsen_AGG" 995e0940f08SMark F. Adams PetscErrorCode PCGAMGCoarsen_AGG( PC a_pc, 996e0940f08SMark F. Adams Mat *a_Gmat1, 9970cbbd2e1SMark F. Adams PetscCoarsenData **agg_lists 998c8b0795cSMark F. Adams ) 999c8b0795cSMark F. Adams { 1000c8b0795cSMark F. Adams PetscErrorCode ierr; 1001e0940f08SMark F. Adams PC_MG *mg = (PC_MG*)a_pc->data; 1002c8b0795cSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 1003c8b0795cSMark F. Adams PC_GAMG_AGG *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx; 10040cbbd2e1SMark F. Adams Mat mat,Gmat2, Gmat1 = *a_Gmat1; /* squared graph */ 10050cbbd2e1SMark F. Adams IS perm; 1006c8b0795cSMark F. Adams PetscInt Ii,nloc,bs,n,m; 1007c8b0795cSMark F. Adams PetscInt *permute; 1008c8b0795cSMark F. Adams PetscBool *bIndexSet; 1009b43b03e9SMark F. Adams MatCoarsen crs; 1010e0940f08SMark F. Adams MPI_Comm wcomm = ((PetscObject)Gmat1)->comm; 10110cbbd2e1SMark F. Adams PetscMPIInt mype,npe; 1012c8b0795cSMark F. Adams 1013c8b0795cSMark F. Adams PetscFunctionBegin; 10140cbbd2e1SMark F. Adams #if defined PETSC_USE_LOG 10150cbbd2e1SMark F. Adams ierr = PetscLogEventBegin(PC_GAMGCoarsen_AGG,0,0,0,0);CHKERRQ(ierr); 10160cbbd2e1SMark F. Adams #endif 10170cbbd2e1SMark F. Adams ierr = MPI_Comm_rank( wcomm, &mype); CHKERRQ(ierr); 10180cbbd2e1SMark F. Adams ierr = MPI_Comm_size( wcomm, &npe); CHKERRQ(ierr); 1019e0940f08SMark F. Adams ierr = MatGetLocalSize( Gmat1, &n, &m ); CHKERRQ(ierr); 1020e0940f08SMark F. Adams ierr = MatGetBlockSize( Gmat1, &bs ); CHKERRQ(ierr); assert(bs==1); 1021c8b0795cSMark F. Adams nloc = n/bs; 1022c8b0795cSMark F. Adams 1023e0940f08SMark F. Adams if( pc_gamg_agg->square_graph ) { 1024e0940f08SMark F. Adams ierr = MatTransposeMatMult( Gmat1, Gmat1, MAT_INITIAL_MATRIX, PETSC_DEFAULT, &Gmat2 ); 1025e0940f08SMark F. Adams CHKERRQ(ierr); 1026e0940f08SMark F. Adams } 1027e0940f08SMark F. Adams else Gmat2 = Gmat1; 1028c8b0795cSMark F. Adams 1029c8b0795cSMark F. Adams /* get MIS aggs */ 1030c8b0795cSMark F. Adams /* randomize */ 1031c8b0795cSMark F. Adams ierr = PetscMalloc( nloc*sizeof(PetscInt), &permute ); CHKERRQ(ierr); 1032c8b0795cSMark F. Adams ierr = PetscMalloc( nloc*sizeof(PetscBool), &bIndexSet ); CHKERRQ(ierr); 1033c8b0795cSMark F. Adams for ( Ii = 0; Ii < nloc ; Ii++ ){ 1034c8b0795cSMark F. Adams bIndexSet[Ii] = PETSC_FALSE; 1035c8b0795cSMark F. Adams permute[Ii] = Ii; 1036c8b0795cSMark F. Adams } 1037c8b0795cSMark F. Adams srand(1); /* make deterministic */ 1038c8b0795cSMark F. Adams for ( Ii = 0; Ii < nloc ; Ii++ ) { 1039c8b0795cSMark F. Adams PetscInt iSwapIndex = rand()%nloc; 1040c8b0795cSMark F. Adams if (!bIndexSet[iSwapIndex] && iSwapIndex != Ii) { 1041c8b0795cSMark F. Adams PetscInt iTemp = permute[iSwapIndex]; 1042c8b0795cSMark F. Adams permute[iSwapIndex] = permute[Ii]; 1043c8b0795cSMark F. Adams permute[Ii] = iTemp; 1044c8b0795cSMark F. Adams bIndexSet[iSwapIndex] = PETSC_TRUE; 1045c8b0795cSMark F. Adams } 1046c8b0795cSMark F. Adams } 1047c8b0795cSMark F. Adams ierr = PetscFree( bIndexSet ); CHKERRQ(ierr); 1048c8b0795cSMark F. Adams 1049c8b0795cSMark F. Adams ierr = ISCreateGeneral(PETSC_COMM_SELF, nloc, permute, PETSC_USE_POINTER, &perm); 1050c8b0795cSMark F. Adams CHKERRQ(ierr); 10510cbbd2e1SMark F. Adams #if defined PETSC_GAMG_USE_LOG 10520cbbd2e1SMark F. Adams ierr = PetscLogEventBegin(petsc_gamg_setup_events[SET4],0,0,0,0);CHKERRQ(ierr); 1053b43b03e9SMark F. Adams #endif 1054b43b03e9SMark F. Adams ierr = MatCoarsenCreate( wcomm, &crs ); CHKERRQ(ierr); 10559057884aSMark F. Adams /* ierr = MatCoarsenSetType( crs, MATCOARSENMIS ); CHKERRQ(ierr); */ 10569057884aSMark F. Adams ierr = MatCoarsenSetFromOptions( crs ); CHKERRQ(ierr); 1057b43b03e9SMark F. Adams ierr = MatCoarsenSetGreedyOrdering( crs, perm ); CHKERRQ(ierr); 1058b43b03e9SMark F. Adams ierr = MatCoarsenSetAdjacency( crs, Gmat2 ); CHKERRQ(ierr); 1059b43b03e9SMark F. Adams ierr = MatCoarsenSetVerbose( crs, pc_gamg->verbose ); CHKERRQ(ierr); 1060b43b03e9SMark F. Adams ierr = MatCoarsenSetStrictAggs( crs, PETSC_TRUE ); CHKERRQ(ierr); 1061b43b03e9SMark F. Adams ierr = MatCoarsenApply( crs ); CHKERRQ(ierr); 10620cbbd2e1SMark F. Adams ierr = MatCoarsenGetData( crs, agg_lists ); CHKERRQ(ierr); /* output */ 1063b43b03e9SMark F. Adams ierr = MatCoarsenDestroy( &crs ); CHKERRQ(ierr); 1064b43b03e9SMark F. Adams 1065c8b0795cSMark F. Adams ierr = ISDestroy( &perm ); CHKERRQ(ierr); 1066c8b0795cSMark F. Adams ierr = PetscFree( permute ); CHKERRQ(ierr); 10670cbbd2e1SMark F. Adams #if defined PETSC_GAMG_USE_LOG 10680cbbd2e1SMark F. Adams ierr = PetscLogEventEnd(petsc_gamg_setup_events[SET4],0,0,0,0);CHKERRQ(ierr); 1069b43b03e9SMark F. Adams #endif 1070c8b0795cSMark F. Adams /* smooth aggs */ 1071e0940f08SMark F. Adams if( Gmat2 != Gmat1 ) { 10720cbbd2e1SMark F. Adams const PetscCoarsenData *llist = *agg_lists; 10730cbbd2e1SMark F. Adams ierr = smoothAggs( Gmat2, Gmat1, *agg_lists ); CHKERRQ(ierr); 1074c8b0795cSMark F. Adams ierr = MatDestroy( &Gmat1 ); CHKERRQ(ierr); 1075e0940f08SMark F. Adams *a_Gmat1 = Gmat2; /* output */ 107641b27cdeSMark F. Adams ierr = PetscCDGetMat( llist, &mat ); CHKERRQ(ierr); 10770cbbd2e1SMark F. Adams if(mat) SETERRQ(wcomm,PETSC_ERR_ARG_WRONG, "Auxilary matrix with squared graph????"); 1078ef4ad70eSMark F. Adams } 10790cbbd2e1SMark F. Adams else { 10800cbbd2e1SMark F. Adams const PetscCoarsenData *llist = *agg_lists; 10810cbbd2e1SMark F. Adams /* see if we have a matrix that takes pecedence (returned from MatCoarsenAppply) */ 108241b27cdeSMark F. Adams ierr = PetscCDGetMat( llist, &mat ); CHKERRQ(ierr); 10830cbbd2e1SMark F. Adams if( mat ) { 10840cbbd2e1SMark F. Adams ierr = MatDestroy( &Gmat1 ); CHKERRQ(ierr); 10850cbbd2e1SMark F. Adams *a_Gmat1 = mat; /* output */ 10860cbbd2e1SMark F. Adams } 10870cbbd2e1SMark F. Adams } 10880cbbd2e1SMark F. Adams #if defined PETSC_USE_LOG 10890cbbd2e1SMark F. Adams ierr = PetscLogEventEnd(PC_GAMGCoarsen_AGG,0,0,0,0);CHKERRQ(ierr); 10900cbbd2e1SMark F. Adams #endif 1091c8b0795cSMark F. Adams PetscFunctionReturn(0); 1092c8b0795cSMark F. Adams } 1093c8b0795cSMark F. Adams 1094c8b0795cSMark F. Adams /* -------------------------------------------------------------------------- */ 1095c8b0795cSMark F. Adams /* 10960cbbd2e1SMark F. Adams PCGAMGProlongator_AGG 1097c8b0795cSMark F. Adams 1098c8b0795cSMark F. Adams Input Parameter: 1099c8b0795cSMark F. Adams . pc - this 1100c8b0795cSMark F. Adams . Amat - matrix on this fine level 1101c8b0795cSMark F. Adams . Graph - used to get ghost data for nodes in 11020cbbd2e1SMark F. Adams . agg_lists - list of aggregates 1103c8b0795cSMark F. Adams Output Parameter: 1104c8b0795cSMark F. Adams . a_P_out - prolongation operator to the next level 1105c8b0795cSMark F. Adams */ 1106c8b0795cSMark F. Adams #undef __FUNCT__ 11070cbbd2e1SMark F. Adams #define __FUNCT__ "PCGAMGProlongator_AGG" 11080cbbd2e1SMark F. Adams PetscErrorCode PCGAMGProlongator_AGG( PC pc, 1109c8b0795cSMark F. Adams const Mat Amat, 1110c8b0795cSMark F. Adams const Mat Gmat, 11110cbbd2e1SMark F. Adams PetscCoarsenData *agg_lists, 1112c8b0795cSMark F. Adams Mat *a_P_out 11132e68589bSMark F. Adams ) 11142e68589bSMark F. Adams { 11152e68589bSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 11162e68589bSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 11172e68589bSMark F. Adams const PetscInt verbose = pc_gamg->verbose; 1118c8b0795cSMark F. Adams const PetscInt data_cols = pc_gamg->data_cell_cols; 11192e68589bSMark F. Adams PetscErrorCode ierr; 1120c8b0795cSMark F. Adams PetscInt Istart,Iend,nloc,ii,jj,kk,my0,nLocalSelected,bs; 1121c8b0795cSMark F. Adams Mat Prol; 11222e68589bSMark F. Adams PetscMPIInt mype, npe; 11232e68589bSMark F. Adams MPI_Comm wcomm = ((PetscObject)Amat)->comm; 11240cbbd2e1SMark F. Adams const PetscInt col_bs = data_cols; 1125c8b0795cSMark F. Adams PetscReal *data_w_ghost; 1126c8b0795cSMark F. Adams PetscInt myCrs0, nbnodes=0, *flid_fgid; 11272e68589bSMark F. Adams 11282e68589bSMark F. Adams PetscFunctionBegin; 11290cbbd2e1SMark F. Adams #if defined PETSC_USE_LOG 11300cbbd2e1SMark F. Adams ierr = PetscLogEventBegin(PC_GAMGProlongator_AGG,0,0,0,0);CHKERRQ(ierr); 11310cbbd2e1SMark F. Adams #endif 11322e68589bSMark F. Adams ierr = MPI_Comm_rank( wcomm, &mype); CHKERRQ(ierr); 11332e68589bSMark F. Adams ierr = MPI_Comm_size( wcomm, &npe); CHKERRQ(ierr); 11342e68589bSMark F. Adams ierr = MatGetOwnershipRange( Amat, &Istart, &Iend ); CHKERRQ(ierr); 1135c8b0795cSMark F. Adams ierr = MatGetBlockSize( Amat, &bs ); CHKERRQ( ierr ); 1136c8b0795cSMark F. Adams nloc = (Iend-Istart)/bs; my0 = Istart/bs; assert((Iend-Istart)%bs==0); 11372e68589bSMark F. Adams 11382e68589bSMark F. Adams /* get 'nLocalSelected' */ 11390cbbd2e1SMark F. Adams for( ii=0, nLocalSelected = 0 ; ii < nloc ; ii++ ){ 1140e78576d6SMark F. Adams PetscBool ise; 11410cbbd2e1SMark F. Adams /* filter out singletons 0 or 1? */ 1142e78576d6SMark F. Adams ierr = PetscCDEmptyAt( agg_lists, ii, &ise ); CHKERRQ(ierr); 1143e78576d6SMark F. Adams if( !ise ) nLocalSelected++; 11442e68589bSMark F. Adams } 11452e68589bSMark F. Adams 11462e68589bSMark F. Adams /* create prolongator, create P matrix */ 1147*a2f3521dSMark F. Adams ierr = MatCreate( wcomm, &Prol ); CHKERRQ(ierr); 1148*a2f3521dSMark F. Adams ierr = MatSetSizes(Prol,nloc*bs,nLocalSelected*col_bs,PETSC_DETERMINE,PETSC_DETERMINE); 11492e68589bSMark F. Adams CHKERRQ(ierr); 1150*a2f3521dSMark F. Adams ierr = MatSetBlockSizes( Prol, bs, col_bs ); CHKERRQ(ierr); 1151*a2f3521dSMark F. Adams ierr = MatSetType( Prol, MATAIJ ); CHKERRQ(ierr); 1152*a2f3521dSMark F. Adams ierr = MatSeqAIJSetPreallocation( Prol, data_cols, PETSC_NULL); CHKERRQ(ierr); 1153*a2f3521dSMark F. Adams ierr = MatMPIAIJSetPreallocation(Prol,data_cols, PETSC_NULL,data_cols, PETSC_NULL);CHKERRQ(ierr); 1154*a2f3521dSMark F. Adams /* nloc*bs, nLocalSelected*col_bs, */ 1155*a2f3521dSMark F. Adams /* PETSC_DETERMINE, PETSC_DETERMINE, */ 1156*a2f3521dSMark F. Adams /* data_cols, PETSC_NULL, data_cols, PETSC_NULL, */ 1157*a2f3521dSMark F. Adams /* &Prol ); */ 11582e68589bSMark F. Adams 11592e68589bSMark F. Adams /* can get all points "removed" */ 1160c8b0795cSMark F. Adams ierr = MatGetSize( Prol, &kk, &ii ); CHKERRQ(ierr); 1161c8b0795cSMark F. Adams if( ii==0 ) { 11622e68589bSMark F. Adams if( verbose ) { 1163c8b0795cSMark F. Adams PetscPrintf(wcomm,"[%d]%s no selected points on coarse grid\n",mype,__FUNCT__); 11642e68589bSMark F. Adams } 11652e68589bSMark F. Adams ierr = MatDestroy( &Prol ); CHKERRQ(ierr); 11662e68589bSMark F. Adams *a_P_out = PETSC_NULL; /* out */ 11672e68589bSMark F. Adams PetscFunctionReturn(0); 11682e68589bSMark F. Adams } 1169c8b0795cSMark F. Adams if( verbose ) { 1170e78576d6SMark F. Adams PetscPrintf(wcomm,"\t\t[%d]%s New grid %d nodes\n",mype,__FUNCT__,ii/col_bs); 1171c8b0795cSMark F. Adams } 1172c8b0795cSMark F. Adams ierr = MatGetOwnershipRangeColumn( Prol, &myCrs0, &kk ); CHKERRQ(ierr); 11730cbbd2e1SMark F. Adams 11740cbbd2e1SMark F. Adams assert((kk-myCrs0)%col_bs==0); 1175c8b0795cSMark F. Adams myCrs0 = myCrs0/col_bs; 11760cbbd2e1SMark F. Adams assert((kk/col_bs-myCrs0)==nLocalSelected); 11772e68589bSMark F. Adams 11782e68589bSMark F. Adams /* create global vector of data in 'data_w_ghost' */ 11790cbbd2e1SMark F. Adams #if defined PETSC_GAMG_USE_LOG 11800cbbd2e1SMark F. Adams ierr = PetscLogEventBegin(petsc_gamg_setup_events[SET7],0,0,0,0);CHKERRQ(ierr); 11812e68589bSMark F. Adams #endif 1182c8b0795cSMark F. Adams if (npe > 1) { /* */ 11832e68589bSMark F. Adams PetscReal *tmp_gdata,*tmp_ldata,*tp2; 11842e68589bSMark F. Adams ierr = PetscMalloc( nloc*sizeof(PetscReal), &tmp_ldata ); CHKERRQ(ierr); 11852e68589bSMark F. Adams for( jj = 0 ; jj < data_cols ; jj++ ){ 1186c8b0795cSMark F. Adams for( kk = 0 ; kk < bs ; kk++) { 1187*a2f3521dSMark F. Adams PetscInt ii,stride; 1188c8b0795cSMark F. Adams const PetscReal *tp = pc_gamg->data + jj*bs*nloc + kk; 1189c8b0795cSMark F. Adams for( ii = 0 ; ii < nloc ; ii++, tp += bs ){ 11902e68589bSMark F. Adams tmp_ldata[ii] = *tp; 11912e68589bSMark F. Adams } 1192*a2f3521dSMark F. Adams ierr = PCGAMGGetDataWithGhosts( Gmat, 1, tmp_ldata, &stride, &tmp_gdata ); 11932e68589bSMark F. Adams CHKERRQ(ierr); 1194*a2f3521dSMark F. Adams 11952e68589bSMark F. Adams if(jj==0 && kk==0) { /* now I know how many todal nodes - allocate */ 1196*a2f3521dSMark F. Adams ierr = PetscMalloc( stride*bs*data_cols*sizeof(PetscReal), &data_w_ghost ); CHKERRQ(ierr); 1197*a2f3521dSMark F. Adams nbnodes = bs*stride; 11982e68589bSMark F. Adams } 1199*a2f3521dSMark F. Adams tp2 = data_w_ghost + jj*bs*stride + kk; 1200*a2f3521dSMark F. Adams for( ii = 0 ; ii < stride ; ii++, tp2 += bs ){ 12012e68589bSMark F. Adams *tp2 = tmp_gdata[ii]; 12022e68589bSMark F. Adams } 12032e68589bSMark F. Adams ierr = PetscFree( tmp_gdata ); CHKERRQ(ierr); 12042e68589bSMark F. Adams } 12052e68589bSMark F. Adams } 12062e68589bSMark F. Adams ierr = PetscFree( tmp_ldata ); CHKERRQ(ierr); 12072e68589bSMark F. Adams } 12082e68589bSMark F. Adams else { 1209c8b0795cSMark F. Adams nbnodes = bs*nloc; 1210c8b0795cSMark F. Adams data_w_ghost = (PetscReal*)pc_gamg->data; 12112e68589bSMark F. Adams } 12122e68589bSMark F. Adams 12132e68589bSMark F. Adams /* get P0 */ 12142e68589bSMark F. Adams if( npe > 1 ){ 12152e68589bSMark F. Adams PetscReal *fid_glid_loc,*fiddata; 1216*a2f3521dSMark F. Adams PetscInt stride; 12172e68589bSMark F. Adams 12182e68589bSMark F. Adams ierr = PetscMalloc( nloc*sizeof(PetscReal), &fid_glid_loc ); CHKERRQ(ierr); 12192e68589bSMark F. Adams for(kk=0;kk<nloc;kk++) fid_glid_loc[kk] = (PetscReal)(my0+kk); 1220*a2f3521dSMark F. Adams ierr = PCGAMGGetDataWithGhosts( Gmat, 1, fid_glid_loc, &stride, &fiddata ); 12212e68589bSMark F. Adams CHKERRQ(ierr); 1222*a2f3521dSMark F. Adams ierr = PetscMalloc( stride*sizeof(PetscInt), &flid_fgid ); CHKERRQ(ierr); 1223*a2f3521dSMark F. Adams for(kk=0;kk<stride;kk++) flid_fgid[kk] = (PetscInt)fiddata[kk]; 12242e68589bSMark F. Adams ierr = PetscFree( fiddata ); CHKERRQ(ierr); 1225*a2f3521dSMark F. Adams 1226*a2f3521dSMark F. Adams assert(stride==nbnodes/bs); 12272e68589bSMark F. Adams ierr = PetscFree( fid_glid_loc ); CHKERRQ(ierr); 12282e68589bSMark F. Adams } 12292e68589bSMark F. Adams else { 12302e68589bSMark F. Adams ierr = PetscMalloc( nloc*sizeof(PetscInt), &flid_fgid ); CHKERRQ(ierr); 12312e68589bSMark F. Adams for(kk=0;kk<nloc;kk++) flid_fgid[kk] = my0 + kk; 12322e68589bSMark F. Adams } 12330cbbd2e1SMark F. Adams #if defined PETSC_GAMG_USE_LOG 12340cbbd2e1SMark F. Adams ierr = PetscLogEventEnd(petsc_gamg_setup_events[SET7],0,0,0,0);CHKERRQ(ierr); 12350cbbd2e1SMark F. Adams ierr = PetscLogEventBegin(petsc_gamg_setup_events[SET8],0,0,0,0);CHKERRQ(ierr); 12362e68589bSMark F. Adams #endif 1237c8b0795cSMark F. Adams { 1238ffc955d6SMark F. Adams PetscReal *data_out = PETSC_NULL; 12390cbbd2e1SMark F. Adams ierr = formProl0( agg_lists, bs, data_cols, myCrs0, nbnodes, 1240c8b0795cSMark F. Adams data_w_ghost, flid_fgid, &data_out, Prol ); 12412e68589bSMark F. Adams CHKERRQ(ierr); 1242c8b0795cSMark F. Adams ierr = PetscFree( pc_gamg->data ); CHKERRQ( ierr ); 1243c8b0795cSMark F. Adams pc_gamg->data = data_out; 1244c8b0795cSMark F. Adams pc_gamg->data_cell_rows = data_cols; 1245c8b0795cSMark F. Adams pc_gamg->data_sz = data_cols*data_cols*nLocalSelected; 1246c8b0795cSMark F. Adams } 12470cbbd2e1SMark F. Adams #if defined PETSC_GAMG_USE_LOG 12480cbbd2e1SMark F. Adams ierr = PetscLogEventEnd(petsc_gamg_setup_events[SET8],0,0,0,0);CHKERRQ(ierr); 1249c8b0795cSMark F. Adams #endif 12502e68589bSMark F. Adams if (npe > 1) ierr = PetscFree( data_w_ghost ); CHKERRQ(ierr); 12512e68589bSMark F. Adams ierr = PetscFree( flid_fgid ); CHKERRQ(ierr); 12522e68589bSMark F. Adams 1253c8b0795cSMark F. Adams /* attach block size of columns */ 1254c8b0795cSMark F. Adams if( pc_gamg->col_bs_id == -1 ) { 1255c8b0795cSMark F. Adams ierr = PetscObjectComposedDataRegister( &pc_gamg->col_bs_id ); assert(pc_gamg->col_bs_id != -1 ); 1256c8b0795cSMark F. Adams } 1257c8b0795cSMark F. Adams ierr = PetscObjectComposedDataSetInt( (PetscObject)Prol, pc_gamg->col_bs_id, data_cols ); CHKERRQ(ierr); 1258c8b0795cSMark F. Adams 1259c8b0795cSMark F. Adams *a_P_out = Prol; /* out */ 12600cbbd2e1SMark F. Adams #if defined PETSC_USE_LOG 12610cbbd2e1SMark F. Adams ierr = PetscLogEventEnd(PC_GAMGProlongator_AGG,0,0,0,0);CHKERRQ(ierr); 12620cbbd2e1SMark F. Adams #endif 1263c8b0795cSMark F. Adams PetscFunctionReturn(0); 1264c8b0795cSMark F. Adams } 1265c8b0795cSMark F. Adams 1266c8b0795cSMark F. Adams /* -------------------------------------------------------------------------- */ 1267c8b0795cSMark F. Adams /* 12680cbbd2e1SMark F. Adams PCGAMGOptprol_AGG 1269c8b0795cSMark F. Adams 1270c8b0795cSMark F. Adams Input Parameter: 1271c8b0795cSMark F. Adams . pc - this 1272c8b0795cSMark F. Adams . Amat - matrix on this fine level 1273c8b0795cSMark F. Adams In/Output Parameter: 1274c8b0795cSMark F. Adams . a_P_out - prolongation operator to the next level 1275c8b0795cSMark F. Adams */ 1276c8b0795cSMark F. Adams #undef __FUNCT__ 12770cbbd2e1SMark F. Adams #define __FUNCT__ "PCGAMGOptprol_AGG" 12780cbbd2e1SMark F. Adams PetscErrorCode PCGAMGOptprol_AGG( PC pc, 1279c8b0795cSMark F. Adams const Mat Amat, 1280c8b0795cSMark F. Adams Mat *a_P 1281c8b0795cSMark F. Adams ) 1282c8b0795cSMark F. Adams { 1283c8b0795cSMark F. Adams PetscErrorCode ierr; 1284c8b0795cSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 1285c8b0795cSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 1286c8b0795cSMark F. Adams const PetscInt verbose = pc_gamg->verbose; 1287c8b0795cSMark F. Adams PC_GAMG_AGG *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx; 1288c8b0795cSMark F. Adams PetscInt jj; 1289c8b0795cSMark F. Adams PetscMPIInt mype,npe; 1290c8b0795cSMark F. Adams Mat Prol = *a_P; 1291c8b0795cSMark F. Adams MPI_Comm wcomm = ((PetscObject)Amat)->comm; 1292c8b0795cSMark F. Adams 1293c8b0795cSMark F. Adams PetscFunctionBegin; 12940cbbd2e1SMark F. Adams #if defined PETSC_USE_LOG 12950cbbd2e1SMark F. Adams ierr = PetscLogEventBegin(PC_GAMGOptprol_AGG,0,0,0,0);CHKERRQ(ierr); 12960cbbd2e1SMark F. Adams #endif 1297c8b0795cSMark F. Adams ierr = MPI_Comm_rank( wcomm, &mype); CHKERRQ(ierr); 1298c8b0795cSMark F. Adams ierr = MPI_Comm_size( wcomm, &npe); CHKERRQ(ierr); 1299c8b0795cSMark F. Adams 13002e68589bSMark F. Adams /* smooth P0 */ 1301c8b0795cSMark F. Adams for( jj = 0 ; jj < pc_gamg_agg->nsmooths ; jj++ ){ 13022e68589bSMark F. Adams Mat tMat; 13032e68589bSMark F. Adams Vec diag; 13042e68589bSMark F. Adams PetscReal alpha, emax, emin; 13050cbbd2e1SMark F. Adams #if defined PETSC_GAMG_USE_LOG 13060cbbd2e1SMark F. Adams ierr = PetscLogEventBegin(petsc_gamg_setup_events[SET9],0,0,0,0);CHKERRQ(ierr); 13072e68589bSMark F. Adams #endif 13082e68589bSMark F. Adams if( jj == 0 ) { 13092e68589bSMark F. Adams KSP eksp; 13102e68589bSMark F. Adams Vec bb, xx; 13112e68589bSMark F. Adams PC pc; 13122e68589bSMark F. Adams ierr = MatGetVecs( Amat, &bb, 0 ); CHKERRQ(ierr); 13132e68589bSMark F. Adams ierr = MatGetVecs( Amat, &xx, 0 ); CHKERRQ(ierr); 13142e68589bSMark F. Adams { 13152e68589bSMark F. Adams PetscRandom rctx; 13162e68589bSMark F. Adams ierr = PetscRandomCreate(wcomm,&rctx);CHKERRQ(ierr); 13172e68589bSMark F. Adams ierr = PetscRandomSetFromOptions(rctx);CHKERRQ(ierr); 13182e68589bSMark F. Adams ierr = VecSetRandom(bb,rctx);CHKERRQ(ierr); 13192e68589bSMark F. Adams ierr = PetscRandomDestroy( &rctx ); CHKERRQ(ierr); 13202e68589bSMark F. Adams } 13212e68589bSMark F. Adams ierr = KSPCreate(wcomm,&eksp); CHKERRQ(ierr); 1322db36e5aeSMark F. Adams ierr = KSPAppendOptionsPrefix( eksp, "gamg_est_"); CHKERRQ(ierr); 13232e68589bSMark F. Adams ierr = KSPSetFromOptions( eksp ); CHKERRQ(ierr); 13242e68589bSMark F. Adams ierr = KSPSetInitialGuessNonzero( eksp, PETSC_FALSE ); CHKERRQ(ierr); 13252e68589bSMark F. Adams ierr = KSPSetOperators( eksp, Amat, Amat, SAME_NONZERO_PATTERN ); 13262e68589bSMark F. Adams CHKERRQ( ierr ); 13272e68589bSMark F. Adams ierr = KSPGetPC( eksp, &pc ); CHKERRQ( ierr ); 13282e68589bSMark F. Adams ierr = PCSetType( pc, PCJACOBI ); CHKERRQ(ierr); /* smoother */ 13292e68589bSMark F. Adams ierr = KSPSetTolerances(eksp,PETSC_DEFAULT,PETSC_DEFAULT,PETSC_DEFAULT,10); 13302e68589bSMark F. Adams CHKERRQ(ierr); 13312e68589bSMark F. Adams ierr = KSPSetNormType( eksp, KSP_NORM_NONE ); CHKERRQ(ierr); 13322e68589bSMark F. Adams ierr = KSPSetComputeSingularValues( eksp,PETSC_TRUE ); CHKERRQ(ierr); 13332e68589bSMark F. Adams 13342e68589bSMark F. Adams /* solve - keep stuff out of logging */ 13352e68589bSMark F. Adams ierr = PetscLogEventDeactivate(KSP_Solve);CHKERRQ(ierr); 13362e68589bSMark F. Adams ierr = PetscLogEventDeactivate(PC_Apply);CHKERRQ(ierr); 13372e68589bSMark F. Adams ierr = KSPSolve( eksp, bb, xx ); CHKERRQ(ierr); 13382e68589bSMark F. Adams ierr = PetscLogEventActivate(KSP_Solve);CHKERRQ(ierr); 13392e68589bSMark F. Adams ierr = PetscLogEventActivate(PC_Apply);CHKERRQ(ierr); 13402e68589bSMark F. Adams 13412e68589bSMark F. Adams ierr = KSPComputeExtremeSingularValues( eksp, &emax, &emin ); CHKERRQ(ierr); 13422e68589bSMark F. Adams if( verbose ) { 1343c8b0795cSMark F. Adams PetscPrintf(wcomm,"\t\t\t%s smooth P0: max eigen=%e min=%e PC=%s\n", 13442e68589bSMark F. Adams __FUNCT__,emax,emin,PCJACOBI); 13452e68589bSMark F. Adams } 13462e68589bSMark F. Adams ierr = VecDestroy( &xx ); CHKERRQ(ierr); 13472e68589bSMark F. Adams ierr = VecDestroy( &bb ); CHKERRQ(ierr); 13482e68589bSMark F. Adams ierr = KSPDestroy( &eksp ); CHKERRQ(ierr); 13492e68589bSMark F. Adams 13502e68589bSMark F. Adams if( pc_gamg->emax_id == -1 ) { 13512e68589bSMark F. Adams ierr = PetscObjectComposedDataRegister( &pc_gamg->emax_id ); 13522e68589bSMark F. Adams assert(pc_gamg->emax_id != -1 ); 13532e68589bSMark F. Adams } 13542e68589bSMark F. Adams ierr = PetscObjectComposedDataSetScalar( (PetscObject)Amat, pc_gamg->emax_id, emax ); CHKERRQ(ierr); 13552e68589bSMark F. Adams } 13562e68589bSMark F. Adams 13572e68589bSMark F. Adams /* smooth P1 := (I - omega/lam D^{-1}A)P0 */ 13582e68589bSMark F. Adams ierr = MatMatMult( Amat, Prol, MAT_INITIAL_MATRIX, PETSC_DEFAULT, &tMat ); CHKERRQ(ierr); 13592e68589bSMark F. Adams ierr = MatGetVecs( Amat, &diag, 0 ); CHKERRQ(ierr); 13602e68589bSMark F. Adams ierr = MatGetDiagonal( Amat, diag ); CHKERRQ(ierr); /* effectively PCJACOBI */ 13612e68589bSMark F. Adams ierr = VecReciprocal( diag ); CHKERRQ(ierr); 13622e68589bSMark F. Adams ierr = MatDiagonalScale( tMat, diag, 0 ); CHKERRQ(ierr); 13632e68589bSMark F. Adams ierr = VecDestroy( &diag ); CHKERRQ(ierr); 13642e68589bSMark F. Adams alpha = -1.5/emax; 13652e68589bSMark F. Adams ierr = MatAYPX( tMat, alpha, Prol, SUBSET_NONZERO_PATTERN ); CHKERRQ(ierr); 13662e68589bSMark F. Adams ierr = MatDestroy( &Prol ); CHKERRQ(ierr); 13672e68589bSMark F. Adams Prol = tMat; 13680cbbd2e1SMark F. Adams #if defined PETSC_GAMG_USE_LOG 13690cbbd2e1SMark F. Adams ierr = PetscLogEventEnd(petsc_gamg_setup_events[SET9],0,0,0,0);CHKERRQ(ierr); 13702e68589bSMark F. Adams #endif 13712e68589bSMark F. Adams } 13720cbbd2e1SMark F. Adams #if defined PETSC_USE_LOG 13730cbbd2e1SMark F. Adams ierr = PetscLogEventEnd(PC_GAMGOptprol_AGG,0,0,0,0);CHKERRQ(ierr); 13740cbbd2e1SMark F. Adams #endif 1375c8b0795cSMark F. Adams *a_P = Prol; 1376c8b0795cSMark F. Adams 1377c8b0795cSMark F. Adams PetscFunctionReturn(0); 13782e68589bSMark F. Adams } 13792e68589bSMark F. Adams 1380c8b0795cSMark F. Adams /* -------------------------------------------------------------------------- */ 1381c8b0795cSMark F. Adams /* 1382*a2f3521dSMark F. Adams PCGAMGKKTProl_AGG 1383*a2f3521dSMark F. Adams 1384*a2f3521dSMark F. Adams Input Parameter: 1385*a2f3521dSMark F. Adams . pc - this 1386*a2f3521dSMark F. Adams . Prol11 - matrix on this fine level 1387*a2f3521dSMark F. Adams . A21 - matrix on this fine level 1388*a2f3521dSMark F. Adams In/Output Parameter: 1389*a2f3521dSMark F. Adams . a_P22 - prolongation operator to the next level 1390*a2f3521dSMark F. Adams */ 1391*a2f3521dSMark F. Adams #undef __FUNCT__ 1392*a2f3521dSMark F. Adams #define __FUNCT__ "PCGAMGKKTProl_AGG" 1393*a2f3521dSMark F. Adams PetscErrorCode PCGAMGKKTProl_AGG( PC pc, 1394*a2f3521dSMark F. Adams const Mat Prol11, 1395*a2f3521dSMark F. Adams const Mat A21, 1396*a2f3521dSMark F. Adams Mat *a_P22 1397*a2f3521dSMark F. Adams ) 1398*a2f3521dSMark F. Adams { 1399*a2f3521dSMark F. Adams PetscErrorCode ierr; 1400*a2f3521dSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 1401*a2f3521dSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 1402*a2f3521dSMark F. Adams const PetscInt verbose = pc_gamg->verbose; 1403*a2f3521dSMark F. Adams /* PC_GAMG_AGG *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx; */ 1404*a2f3521dSMark F. Adams PetscMPIInt mype,npe; 1405*a2f3521dSMark F. Adams Mat Prol22,Tmat,Gmat; 1406*a2f3521dSMark F. Adams MPI_Comm wcomm = ((PetscObject)pc)->comm; 1407*a2f3521dSMark F. Adams PetscCoarsenData *agg_lists; 1408*a2f3521dSMark F. Adams 1409*a2f3521dSMark F. Adams PetscFunctionBegin; 1410*a2f3521dSMark F. Adams #if defined PETSC_USE_LOG 1411*a2f3521dSMark F. Adams ierr = PetscLogEventBegin(PC_GAMGKKTProl_AGG,0,0,0,0); CHKERRQ(ierr); 1412*a2f3521dSMark F. Adams #endif 1413*a2f3521dSMark F. Adams ierr = MPI_Comm_rank( wcomm, &mype); CHKERRQ(ierr); 1414*a2f3521dSMark F. Adams ierr = MPI_Comm_size( wcomm, &npe); CHKERRQ(ierr); 1415*a2f3521dSMark F. Adams 1416*a2f3521dSMark F. Adams /* form C graph */ 1417*a2f3521dSMark F. Adams ierr = MatMatMult( A21, Prol11, MAT_INITIAL_MATRIX, PETSC_DEFAULT, &Tmat); CHKERRQ(ierr); 1418*a2f3521dSMark F. Adams ierr = MatMatTransposeMult(Tmat, Tmat, MAT_INITIAL_MATRIX, PETSC_DEFAULT, &Gmat ); CHKERRQ(ierr); 1419*a2f3521dSMark F. Adams ierr = MatDestroy(&Tmat); CHKERRQ(ierr); 1420*a2f3521dSMark F. Adams ierr = PCGAMGFilterGraph(&Gmat, 0.0, PETSC_FALSE, verbose); CHKERRQ(ierr); 1421*a2f3521dSMark F. Adams 1422*a2f3521dSMark F. Adams /* coarsen constraints */ 1423*a2f3521dSMark F. Adams { 1424*a2f3521dSMark F. Adams MatCoarsen crs; 1425*a2f3521dSMark F. Adams ierr = MatCoarsenCreate( wcomm, &crs ); CHKERRQ(ierr); 1426*a2f3521dSMark F. Adams ierr = MatCoarsenSetType( crs, MATCOARSENMIS ); CHKERRQ(ierr); 1427*a2f3521dSMark F. Adams ierr = MatCoarsenSetAdjacency( crs, Gmat ); CHKERRQ(ierr); 1428*a2f3521dSMark F. Adams ierr = MatCoarsenSetVerbose( crs, verbose ); CHKERRQ(ierr); 1429*a2f3521dSMark F. Adams ierr = MatCoarsenSetStrictAggs( crs, PETSC_TRUE ); CHKERRQ(ierr); 1430*a2f3521dSMark F. Adams ierr = MatCoarsenApply( crs ); CHKERRQ(ierr); 1431*a2f3521dSMark F. Adams ierr = MatCoarsenGetData( crs, &agg_lists ); CHKERRQ(ierr); 1432*a2f3521dSMark F. Adams ierr = MatCoarsenDestroy( &crs ); CHKERRQ(ierr); 1433*a2f3521dSMark F. Adams } 1434*a2f3521dSMark F. Adams 1435*a2f3521dSMark F. Adams /* form simple prolongation 'Prol22' */ 1436*a2f3521dSMark F. Adams { 1437*a2f3521dSMark F. Adams PetscInt ii,mm,clid,my0,nloc,nLocalSelected; 1438*a2f3521dSMark F. Adams PetscScalar val = 1.0; 1439*a2f3521dSMark F. Adams /* get 'nLocalSelected' */ 1440*a2f3521dSMark F. Adams ierr = MatGetLocalSize( Gmat, &nloc, &ii ); CHKERRQ(ierr); 1441*a2f3521dSMark F. Adams for( ii=0, nLocalSelected = 0 ; ii < nloc ; ii++ ){ 1442*a2f3521dSMark F. Adams PetscBool ise; 1443*a2f3521dSMark F. Adams /* filter out singletons 0 or 1? */ 1444*a2f3521dSMark F. Adams ierr = PetscCDEmptyAt( agg_lists, ii, &ise ); CHKERRQ(ierr); 1445*a2f3521dSMark F. Adams if( !ise ) nLocalSelected++; 1446*a2f3521dSMark F. Adams } 1447*a2f3521dSMark F. Adams 1448*a2f3521dSMark F. Adams ierr = MatCreate(wcomm,&Prol22);CHKERRQ(ierr); 1449*a2f3521dSMark F. Adams ierr = MatSetSizes( Prol22,nloc, nLocalSelected, 1450*a2f3521dSMark F. Adams PETSC_DETERMINE, PETSC_DETERMINE); 1451*a2f3521dSMark F. Adams CHKERRQ(ierr); 1452*a2f3521dSMark F. Adams ierr = MatSetType( Prol22, MATAIJ ); CHKERRQ(ierr); 1453*a2f3521dSMark F. Adams ierr = MatSeqAIJSetPreallocation(Prol22,1,PETSC_NULL); CHKERRQ(ierr); 1454*a2f3521dSMark F. Adams ierr = MatMPIAIJSetPreallocation(Prol22,1,PETSC_NULL,1,PETSC_NULL); 1455*a2f3521dSMark F. Adams CHKERRQ(ierr); 1456*a2f3521dSMark F. Adams /* ierr = MatCreateAIJ( wcomm, */ 1457*a2f3521dSMark F. Adams /* nloc, nLocalSelected, */ 1458*a2f3521dSMark F. Adams /* PETSC_DETERMINE, PETSC_DETERMINE, */ 1459*a2f3521dSMark F. Adams /* 1, PETSC_NULL, 1, PETSC_NULL, */ 1460*a2f3521dSMark F. Adams /* &Prol22 ); */ 1461*a2f3521dSMark F. Adams 1462*a2f3521dSMark F. Adams ierr = MatGetOwnershipRange( Prol22, &my0, &ii ); CHKERRQ(ierr); 1463*a2f3521dSMark F. Adams nloc = ii - my0; 1464*a2f3521dSMark F. Adams 1465*a2f3521dSMark F. Adams /* make aggregates */ 1466*a2f3521dSMark F. Adams for( mm = clid = 0 ; mm < nloc ; mm++ ){ 1467*a2f3521dSMark F. Adams ierr = PetscCDSizeAt( agg_lists, mm, &ii ); CHKERRQ(ierr); 1468*a2f3521dSMark F. Adams if( ii > 0 ) { 1469*a2f3521dSMark F. Adams PetscInt asz=ii,cgid=my0+clid,rids[1000]; 1470*a2f3521dSMark F. Adams PetscCDPos pos; 1471*a2f3521dSMark F. Adams if(asz>1000)SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Very large aggregate: %d",asz); 1472*a2f3521dSMark F. Adams ii = 0; 1473*a2f3521dSMark F. Adams ierr = PetscCDGetHeadPos(agg_lists,mm,&pos); CHKERRQ(ierr); 1474*a2f3521dSMark F. Adams while(pos){ 1475*a2f3521dSMark F. Adams PetscInt gid1; 1476*a2f3521dSMark F. Adams ierr = PetscLLNGetID( pos, &gid1 ); CHKERRQ(ierr); 1477*a2f3521dSMark F. Adams ierr = PetscCDGetNextPos(agg_lists,mm,&pos); CHKERRQ(ierr); 1478*a2f3521dSMark F. Adams 1479*a2f3521dSMark F. Adams rids[ii++] = gid1; 1480*a2f3521dSMark F. Adams } 1481*a2f3521dSMark F. Adams assert(ii==asz); 1482*a2f3521dSMark F. Adams /* add diagonal block of P0 */ 1483*a2f3521dSMark F. Adams ierr = MatSetValues(Prol22,asz,rids,1,&cgid,&val,INSERT_VALUES); CHKERRQ(ierr); 1484*a2f3521dSMark F. Adams 1485*a2f3521dSMark F. Adams clid++; 1486*a2f3521dSMark F. Adams } /* coarse agg */ 1487*a2f3521dSMark F. Adams } /* for all fine nodes */ 1488*a2f3521dSMark F. Adams ierr = MatAssemblyBegin(Prol22,MAT_FINAL_ASSEMBLY); CHKERRQ(ierr); 1489*a2f3521dSMark F. Adams ierr = MatAssemblyEnd(Prol22,MAT_FINAL_ASSEMBLY); CHKERRQ(ierr); 1490*a2f3521dSMark F. Adams } 1491*a2f3521dSMark F. Adams 1492*a2f3521dSMark F. Adams /* clean up */ 1493*a2f3521dSMark F. Adams ierr = MatDestroy( &Gmat ); CHKERRQ(ierr); 1494*a2f3521dSMark F. Adams ierr = PetscCDDestroy( agg_lists ); CHKERRQ(ierr); 1495*a2f3521dSMark F. Adams #if defined PETSC_USE_LOG 1496*a2f3521dSMark F. Adams ierr = PetscLogEventEnd(PC_GAMGKKTProl_AGG,0,0,0,0);CHKERRQ(ierr); 1497*a2f3521dSMark F. Adams #endif 1498*a2f3521dSMark F. Adams *a_P22 = Prol22; 1499*a2f3521dSMark F. Adams 1500*a2f3521dSMark F. Adams PetscFunctionReturn(0); 1501*a2f3521dSMark F. Adams } 1502*a2f3521dSMark F. Adams 1503*a2f3521dSMark F. Adams /* -------------------------------------------------------------------------- */ 1504*a2f3521dSMark F. Adams /* 1505c8b0795cSMark F. Adams PCCreateGAMG_AGG 15062e68589bSMark F. Adams 1507c8b0795cSMark F. Adams Input Parameter: 1508c8b0795cSMark F. Adams . pc - 1509c8b0795cSMark F. Adams */ 1510c8b0795cSMark F. Adams #undef __FUNCT__ 1511c8b0795cSMark F. Adams #define __FUNCT__ "PCCreateGAMG_AGG" 1512c8b0795cSMark F. Adams PetscErrorCode PCCreateGAMG_AGG( PC pc ) 1513c8b0795cSMark F. Adams { 1514c8b0795cSMark F. Adams PetscErrorCode ierr; 1515c8b0795cSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 1516c8b0795cSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 1517c8b0795cSMark F. Adams PC_GAMG_AGG *pc_gamg_agg; 15182e68589bSMark F. Adams 1519c8b0795cSMark F. Adams PetscFunctionBegin; 1520c8b0795cSMark F. Adams /* create sub context for SA */ 1521c8b0795cSMark F. Adams ierr = PetscNewLog( pc, PC_GAMG_AGG, &pc_gamg_agg ); CHKERRQ(ierr); 1522c8b0795cSMark F. Adams assert(!pc_gamg->subctx); 1523c8b0795cSMark F. Adams pc_gamg->subctx = pc_gamg_agg; 1524c8b0795cSMark F. Adams 1525c8b0795cSMark F. Adams pc->ops->setfromoptions = PCSetFromOptions_GAMG_AGG; 1526c8b0795cSMark F. Adams pc->ops->destroy = PCDestroy_AGG; 1527c8b0795cSMark F. Adams /* reset does not do anything; setup not virtual */ 1528c8b0795cSMark F. Adams 1529c8b0795cSMark F. Adams /* set internal function pointers */ 1530c8b0795cSMark F. Adams pc_gamg->graph = PCGAMGgraph_AGG; 1531b43b03e9SMark F. Adams pc_gamg->coarsen = PCGAMGCoarsen_AGG; 15320cbbd2e1SMark F. Adams pc_gamg->prolongator = PCGAMGProlongator_AGG; 15330cbbd2e1SMark F. Adams pc_gamg->optprol = PCGAMGOptprol_AGG; 1534*a2f3521dSMark F. Adams pc_gamg->formkktprol = PCGAMGKKTProl_AGG; 1535c8b0795cSMark F. Adams 1536c8b0795cSMark F. Adams pc_gamg->createdefaultdata = PCSetData_AGG; 1537c8b0795cSMark F. Adams 1538c8b0795cSMark F. Adams ierr = PetscObjectComposeFunctionDynamic( (PetscObject)pc, 1539c8b0795cSMark F. Adams "PCSetCoordinates_C", 1540c8b0795cSMark F. Adams "PCSetCoordinates_AGG", 1541c8b0795cSMark F. Adams PCSetCoordinates_AGG); 15422e68589bSMark F. Adams PetscFunctionReturn(0); 15432e68589bSMark F. Adams } 1544