12e68589bSMark F. Adams /* 22e68589bSMark F. Adams GAMG geometric-algebric multiogrid PC - Mark Adams 2011 32e68589bSMark F. Adams */ 42e68589bSMark F. Adams 52e68589bSMark F. Adams #include <../src/ksp/pc/impls/gamg/gamg.h> /*I "petscpc.h" I*/ 62e68589bSMark F. Adams #include <private/kspimpl.h> 72e68589bSMark F. Adams 82e68589bSMark F. Adams #include <assert.h> 92e68589bSMark F. Adams #include <petscblaslapack.h> 102e68589bSMark F. Adams 112e68589bSMark F. Adams typedef struct { 12c8b0795cSMark F. Adams PetscInt nsmooths; 13c8b0795cSMark F. Adams Mat aux_mat; 14c8b0795cSMark F. Adams PetscBool sym_graph; 15ef4ad70eSMark F. Adams PetscBool square_graph; 162e68589bSMark F. Adams }PC_GAMG_AGG; 172e68589bSMark F. Adams 182e68589bSMark F. Adams #undef __FUNCT__ 192e68589bSMark F. Adams #define __FUNCT__ "PCGAMGSetNSmooths" 202e68589bSMark F. Adams /*@ 212e68589bSMark F. Adams PCGAMGSetNSmooths - Set number of smoothing steps (1 is typical) 222e68589bSMark F. Adams 232e68589bSMark F. Adams Not Collective on PC 242e68589bSMark F. Adams 252e68589bSMark F. Adams Input Parameters: 262e68589bSMark F. Adams . pc - the preconditioner context 272e68589bSMark F. Adams 282e68589bSMark F. Adams Options Database Key: 292e68589bSMark F. Adams . -pc_gamg_agg_nsmooths 302e68589bSMark F. Adams 312e68589bSMark F. Adams Level: intermediate 322e68589bSMark F. Adams 332e68589bSMark F. Adams Concepts: Aggregation AMG preconditioner 342e68589bSMark F. Adams 352e68589bSMark F. Adams .seealso: () 362e68589bSMark F. Adams @*/ 372e68589bSMark F. Adams PetscErrorCode PCGAMGSetNSmooths(PC pc, PetscInt n) 382e68589bSMark F. Adams { 392e68589bSMark F. Adams PetscErrorCode ierr; 402e68589bSMark F. Adams 412e68589bSMark F. Adams PetscFunctionBegin; 422e68589bSMark F. Adams PetscValidHeaderSpecific(pc,PC_CLASSID,1); 432e68589bSMark F. Adams ierr = PetscTryMethod(pc,"PCGAMGSetNSmooths_C",(PC,PetscInt),(pc,n));CHKERRQ(ierr); 442e68589bSMark F. Adams PetscFunctionReturn(0); 452e68589bSMark F. Adams } 462e68589bSMark F. Adams 472e68589bSMark F. Adams EXTERN_C_BEGIN 482e68589bSMark F. Adams #undef __FUNCT__ 492e68589bSMark F. Adams #define __FUNCT__ "PCGAMGSetNSmooths_GAMG" 502e68589bSMark F. Adams PetscErrorCode PCGAMGSetNSmooths_GAMG(PC pc, PetscInt n) 512e68589bSMark F. Adams { 522e68589bSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 532e68589bSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 54c8b0795cSMark F. Adams PC_GAMG_AGG *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx; 552e68589bSMark F. Adams 562e68589bSMark F. Adams PetscFunctionBegin; 57c8b0795cSMark F. Adams pc_gamg_agg->nsmooths = n; 58c8b0795cSMark F. Adams PetscFunctionReturn(0); 59c8b0795cSMark F. Adams } 60c8b0795cSMark F. Adams EXTERN_C_END 61c8b0795cSMark F. Adams 62c8b0795cSMark F. Adams #undef __FUNCT__ 63c8b0795cSMark F. Adams #define __FUNCT__ "PCGAMGSetSymGraph" 64c8b0795cSMark F. Adams /*@ 65c8b0795cSMark F. Adams PCGAMGSetSymGraph - 66c8b0795cSMark F. Adams 67c8b0795cSMark F. Adams Not Collective on PC 68c8b0795cSMark F. Adams 69c8b0795cSMark F. Adams Input Parameters: 70c8b0795cSMark F. Adams . pc - the preconditioner context 71c8b0795cSMark F. Adams 72c8b0795cSMark F. Adams Options Database Key: 73c8b0795cSMark F. Adams . -pc_gamg_sym_graph 74c8b0795cSMark F. Adams 75c8b0795cSMark F. Adams Level: intermediate 76c8b0795cSMark F. Adams 77c8b0795cSMark F. Adams Concepts: Aggregation AMG preconditioner 78c8b0795cSMark F. Adams 79c8b0795cSMark F. Adams .seealso: () 80c8b0795cSMark F. Adams @*/ 81c8b0795cSMark F. Adams PetscErrorCode PCGAMGSetSymGraph(PC pc, PetscBool n) 82c8b0795cSMark F. Adams { 83c8b0795cSMark F. Adams PetscErrorCode ierr; 84c8b0795cSMark F. Adams 85c8b0795cSMark F. Adams PetscFunctionBegin; 86c8b0795cSMark F. Adams PetscValidHeaderSpecific(pc,PC_CLASSID,1); 87c8b0795cSMark F. Adams ierr = PetscTryMethod(pc,"PCGAMGSetSymGraph_C",(PC,PetscBool),(pc,n));CHKERRQ(ierr); 88c8b0795cSMark F. Adams PetscFunctionReturn(0); 89c8b0795cSMark F. Adams } 90c8b0795cSMark F. Adams 91c8b0795cSMark F. Adams EXTERN_C_BEGIN 92c8b0795cSMark F. Adams #undef __FUNCT__ 93c8b0795cSMark F. Adams #define __FUNCT__ "PCGAMGSetSymGraph_GAMG" 94c8b0795cSMark F. Adams PetscErrorCode PCGAMGSetSymGraph_GAMG(PC pc, PetscBool n) 95c8b0795cSMark F. Adams { 96c8b0795cSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 97c8b0795cSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 98c8b0795cSMark F. Adams PC_GAMG_AGG *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx; 99c8b0795cSMark F. Adams 100c8b0795cSMark F. Adams PetscFunctionBegin; 101c8b0795cSMark F. Adams pc_gamg_agg->sym_graph = n; 1022e68589bSMark F. Adams PetscFunctionReturn(0); 1032e68589bSMark F. Adams } 1042e68589bSMark F. Adams EXTERN_C_END 1052e68589bSMark F. Adams 106ef4ad70eSMark F. Adams #undef __FUNCT__ 107ef4ad70eSMark F. Adams #define __FUNCT__ "PCGAMGSetSquareGraph" 108ef4ad70eSMark F. Adams /*@ 109ef4ad70eSMark F. Adams PCGAMGSetSquareGraph - 110ef4ad70eSMark F. Adams 111ef4ad70eSMark F. Adams Not Collective on PC 112ef4ad70eSMark F. Adams 113ef4ad70eSMark F. Adams Input Parameters: 114ef4ad70eSMark F. Adams . pc - the preconditioner context 115ef4ad70eSMark F. Adams 116ef4ad70eSMark F. Adams Options Database Key: 117ef4ad70eSMark F. Adams . -pc_gamg_square_graph 118ef4ad70eSMark F. Adams 119ef4ad70eSMark F. Adams Level: intermediate 120ef4ad70eSMark F. Adams 121ef4ad70eSMark F. Adams Concepts: Aggregation AMG preconditioner 122ef4ad70eSMark F. Adams 123ef4ad70eSMark F. Adams .seealso: () 124ef4ad70eSMark F. Adams @*/ 125ef4ad70eSMark F. Adams PetscErrorCode PCGAMGSetSquareGraph(PC pc, PetscBool n) 126ef4ad70eSMark F. Adams { 127ef4ad70eSMark F. Adams PetscErrorCode ierr; 128ef4ad70eSMark F. Adams 129ef4ad70eSMark F. Adams PetscFunctionBegin; 130ef4ad70eSMark F. Adams PetscValidHeaderSpecific(pc,PC_CLASSID,1); 131ef4ad70eSMark F. Adams ierr = PetscTryMethod(pc,"PCGAMGSetSquareGraph_C",(PC,PetscBool),(pc,n));CHKERRQ(ierr); 132ef4ad70eSMark F. Adams PetscFunctionReturn(0); 133ef4ad70eSMark F. Adams } 134ef4ad70eSMark F. Adams 135ef4ad70eSMark F. Adams EXTERN_C_BEGIN 136ef4ad70eSMark F. Adams #undef __FUNCT__ 137ef4ad70eSMark F. Adams #define __FUNCT__ "PCGAMGSetSquareGraph_GAMG" 138ef4ad70eSMark F. Adams PetscErrorCode PCGAMGSetSquareGraph_GAMG(PC pc, PetscBool n) 139ef4ad70eSMark F. Adams { 140ef4ad70eSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 141ef4ad70eSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 142ef4ad70eSMark F. Adams PC_GAMG_AGG *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx; 143ef4ad70eSMark F. Adams 144ef4ad70eSMark F. Adams PetscFunctionBegin; 145ef4ad70eSMark F. Adams pc_gamg_agg->square_graph = n; 146ef4ad70eSMark F. Adams PetscFunctionReturn(0); 147ef4ad70eSMark F. Adams } 148ef4ad70eSMark F. Adams EXTERN_C_END 149ef4ad70eSMark F. Adams 1502e68589bSMark F. Adams /* -------------------------------------------------------------------------- */ 1512e68589bSMark F. Adams /* 1522e68589bSMark F. Adams PCSetFromOptions_GAMG_AGG 1532e68589bSMark F. Adams 1542e68589bSMark F. Adams Input Parameter: 1552e68589bSMark F. Adams . pc - 1562e68589bSMark F. Adams */ 1572e68589bSMark F. Adams #undef __FUNCT__ 1582e68589bSMark F. Adams #define __FUNCT__ "PCSetFromOptions_GAMG_AGG" 1592e68589bSMark F. Adams PetscErrorCode PCSetFromOptions_GAMG_AGG( PC pc ) 1602e68589bSMark F. Adams { 1612e68589bSMark F. Adams PetscErrorCode ierr; 1622e68589bSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 1632e68589bSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 164c8b0795cSMark F. Adams PC_GAMG_AGG *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx; 1652e68589bSMark F. Adams PetscBool flag; 1662e68589bSMark F. Adams 1672e68589bSMark F. Adams PetscFunctionBegin; 1682e68589bSMark F. Adams /* call base class */ 1692e68589bSMark F. Adams ierr = PCSetFromOptions_GAMG( pc ); CHKERRQ(ierr); 1702e68589bSMark F. Adams 1712e68589bSMark F. Adams ierr = PetscOptionsHead("GAMG-AGG options"); CHKERRQ(ierr); 1722e68589bSMark F. Adams { 1732e68589bSMark F. Adams /* -pc_gamg_agg_nsmooths */ 174c8b0795cSMark F. Adams pc_gamg_agg->nsmooths = 0; 1752e68589bSMark F. Adams ierr = PetscOptionsInt("-pc_gamg_agg_nsmooths", 1762e68589bSMark F. Adams "smoothing steps for smoothed aggregation, usually 1 (0)", 1772e68589bSMark F. Adams "PCGAMGSetNSmooths", 178c8b0795cSMark F. Adams pc_gamg_agg->nsmooths, 179c8b0795cSMark F. Adams &pc_gamg_agg->nsmooths, 180c8b0795cSMark F. Adams &flag); 181c8b0795cSMark F. Adams CHKERRQ(ierr); 182c8b0795cSMark F. Adams 183c8b0795cSMark F. Adams /* -pc_gamg_sym_graph */ 184c8b0795cSMark F. Adams pc_gamg_agg->sym_graph = PETSC_FALSE; 185c8b0795cSMark F. Adams ierr = PetscOptionsBool("-pc_gamg_sym_graph", 186*581a99e3SJed Brown "Set for asymmetric matrices", 187c8b0795cSMark F. Adams "PCGAMGSetSymGraph", 188c8b0795cSMark F. Adams pc_gamg_agg->sym_graph, 189c8b0795cSMark F. Adams &pc_gamg_agg->sym_graph, 1902e68589bSMark F. Adams &flag); 1912e68589bSMark F. Adams CHKERRQ(ierr); 192ef4ad70eSMark F. Adams 193ef4ad70eSMark F. Adams /* -pc_gamg_square_graph */ 194ef4ad70eSMark F. Adams pc_gamg_agg->square_graph = PETSC_TRUE; 195ef4ad70eSMark F. Adams ierr = PetscOptionsBool("-pc_gamg_square_graph", 196*581a99e3SJed Brown "Set for asymmetric matrices", 197ef4ad70eSMark F. Adams "PCGAMGSetSquareGraph", 198ef4ad70eSMark F. Adams pc_gamg_agg->square_graph, 199ef4ad70eSMark F. Adams &pc_gamg_agg->square_graph, 200ef4ad70eSMark F. Adams &flag); 201ef4ad70eSMark F. Adams CHKERRQ(ierr); 2022e68589bSMark F. Adams } 2032e68589bSMark F. Adams ierr = PetscOptionsTail();CHKERRQ(ierr); 2042e68589bSMark F. Adams 2052e68589bSMark F. Adams PetscFunctionReturn(0); 2062e68589bSMark F. Adams } 2072e68589bSMark F. Adams 2082e68589bSMark F. Adams /* -------------------------------------------------------------------------- */ 2092e68589bSMark F. Adams /* 2102e68589bSMark F. Adams PCDestroy_AGG 2112e68589bSMark F. Adams 2122e68589bSMark F. Adams Input Parameter: 2132e68589bSMark F. Adams . pc - 2142e68589bSMark F. Adams */ 2152e68589bSMark F. Adams #undef __FUNCT__ 2162e68589bSMark F. Adams #define __FUNCT__ "PCDestroy_AGG" 2172e68589bSMark F. Adams PetscErrorCode PCDestroy_AGG( PC pc ) 2182e68589bSMark F. Adams { 2192e68589bSMark F. Adams PetscErrorCode ierr; 2202e68589bSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 2212e68589bSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 222c8b0795cSMark F. Adams PC_GAMG_AGG *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx; 2232e68589bSMark F. Adams 2242e68589bSMark F. Adams PetscFunctionBegin; 225c8b0795cSMark F. Adams if( pc_gamg_agg ) { 226c8b0795cSMark F. Adams ierr = PetscFree(pc_gamg_agg);CHKERRQ(ierr); 227c8b0795cSMark F. Adams pc_gamg_agg = 0; 2282e68589bSMark F. Adams } 2292e68589bSMark F. Adams 2302e68589bSMark F. Adams /* call base class */ 2312e68589bSMark F. Adams ierr = PCDestroy_GAMG( pc );CHKERRQ(ierr); 2322e68589bSMark F. Adams 2332e68589bSMark F. Adams PetscFunctionReturn(0); 2342e68589bSMark F. Adams } 2352e68589bSMark F. Adams 2362e68589bSMark F. Adams /* -------------------------------------------------------------------------- */ 2372e68589bSMark F. Adams /* 2382e68589bSMark F. Adams PCSetCoordinates_AGG 2392e68589bSMark F. Adams 2402e68589bSMark F. Adams Input Parameter: 2412e68589bSMark F. Adams . pc - the preconditioner context 2422e68589bSMark F. Adams */ 2432e68589bSMark F. Adams EXTERN_C_BEGIN 2442e68589bSMark F. Adams #undef __FUNCT__ 2452e68589bSMark F. Adams #define __FUNCT__ "PCSetCoordinates_AGG" 2462e68589bSMark F. Adams PetscErrorCode PCSetCoordinates_AGG( PC pc, PetscInt ndm, PetscReal *coords ) 2472e68589bSMark F. Adams { 2482e68589bSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 2492e68589bSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 2502e68589bSMark F. Adams PetscErrorCode ierr; 2512e68589bSMark F. Adams PetscInt arrsz,bs,my0,kk,ii,jj,nloc,Iend; 2522e68589bSMark F. Adams Mat Amat = pc->pmat; 2532e68589bSMark F. Adams 2542e68589bSMark F. Adams PetscFunctionBegin; 2552e68589bSMark F. Adams PetscValidHeaderSpecific( Amat, MAT_CLASSID, 1 ); 2562e68589bSMark F. Adams ierr = MatGetBlockSize( Amat, &bs ); CHKERRQ( ierr ); 2572e68589bSMark F. Adams ierr = MatGetOwnershipRange( Amat, &my0, &Iend ); CHKERRQ(ierr); 2582e68589bSMark F. Adams nloc = (Iend-my0)/bs; 2592e68589bSMark F. Adams if((Iend-my0)%bs!=0) SETERRQ1(((PetscObject)Amat)->comm,PETSC_ERR_ARG_WRONG, "Bad local size %d.",nloc); 2602e68589bSMark F. Adams 2612e68589bSMark F. Adams /* SA: null space vectors */ 262c8b0795cSMark F. Adams if( coords && bs==1 ) pc_gamg->data_cell_cols = 1; /* scalar w/ coords and SA (not needed) */ 263c8b0795cSMark F. Adams else if( coords ) pc_gamg->data_cell_cols = (ndm==2 ? 3 : 6); /* elasticity */ 264c8b0795cSMark F. Adams else pc_gamg->data_cell_cols = bs; /* no data, force SA with constant null space vectors */ 265c8b0795cSMark F. Adams pc_gamg->data_cell_rows = bs; 2662e68589bSMark F. Adams 267c8b0795cSMark F. Adams arrsz = nloc*pc_gamg->data_cell_rows*pc_gamg->data_cell_cols; 2682e68589bSMark F. Adams 2692e68589bSMark F. Adams /* create data - syntactic sugar that should be refactored at some point */ 2702e68589bSMark F. Adams if (pc_gamg->data==0 || (pc_gamg->data_sz != arrsz)) { 2712e68589bSMark F. Adams ierr = PetscFree( pc_gamg->data ); CHKERRQ(ierr); 272c8b0795cSMark F. Adams ierr = PetscMalloc(arrsz*sizeof(PetscReal), &pc_gamg->data ); CHKERRQ(ierr); 2732e68589bSMark F. Adams } 2742e68589bSMark F. Adams /* copy data in - column oriented */ 2752e68589bSMark F. Adams for(kk=0;kk<nloc;kk++){ 2762e68589bSMark F. Adams const PetscInt M = Iend - my0; 2772e68589bSMark F. Adams PetscReal *data = &pc_gamg->data[kk*bs]; 278c8b0795cSMark F. Adams if( pc_gamg->data_cell_cols==1 ) *data = 1.0; 2792e68589bSMark F. Adams else { 2802e68589bSMark F. Adams for(ii=0;ii<bs;ii++) 2812e68589bSMark F. Adams for(jj=0;jj<bs;jj++) 2822e68589bSMark F. Adams if(ii==jj)data[ii*M + jj] = 1.0; /* translational modes */ 2832e68589bSMark F. Adams else data[ii*M + jj] = 0.0; 2842e68589bSMark F. Adams if( coords ) { 2852e68589bSMark F. Adams if( ndm == 2 ){ /* rotational modes */ 2862e68589bSMark F. Adams data += 2*M; 2872e68589bSMark F. Adams data[0] = -coords[2*kk+1]; 2882e68589bSMark F. Adams data[1] = coords[2*kk]; 2892e68589bSMark F. Adams } 2902e68589bSMark F. Adams else { 2912e68589bSMark F. Adams data += 3*M; 2922e68589bSMark F. Adams data[0] = 0.0; data[M+0] = coords[3*kk+2]; data[2*M+0] = -coords[3*kk+1]; 2932e68589bSMark F. Adams data[1] = -coords[3*kk+2]; data[M+1] = 0.0; data[2*M+1] = coords[3*kk]; 2942e68589bSMark F. Adams data[2] = coords[3*kk+1]; data[M+2] = -coords[3*kk]; data[2*M+2] = 0.0; 2952e68589bSMark F. Adams } 2962e68589bSMark F. Adams } 2972e68589bSMark F. Adams } 2982e68589bSMark F. Adams } 2992e68589bSMark F. Adams 3002e68589bSMark F. Adams pc_gamg->data_sz = arrsz; 3012e68589bSMark F. Adams 3022e68589bSMark F. Adams PetscFunctionReturn(0); 3032e68589bSMark F. Adams } 3042e68589bSMark F. Adams EXTERN_C_END 3052e68589bSMark F. Adams 306b43b03e9SMark F. Adams typedef PetscInt NState; 307b43b03e9SMark F. Adams static const NState NOT_DONE=-2; 308b43b03e9SMark F. Adams static const NState DELETED=-1; 309b43b03e9SMark F. Adams static const NState REMOVED=-3; 310b43b03e9SMark F. Adams #define IS_SELECTED(s) (s!=DELETED && s!=NOT_DONE && s!=REMOVED) 311b43b03e9SMark F. Adams 312c8b0795cSMark F. Adams /* -------------------------------------------------------------------------- */ 313c8b0795cSMark F. Adams /* 314b43b03e9SMark F. Adams smoothAggs - greedy grab of with G1 (unsquared graph) -- AIJ specific 315b43b03e9SMark F. Adams - AGG-MG specific: clears singletons out of 'selected_2' 316c8b0795cSMark F. Adams 317c8b0795cSMark F. Adams Input Parameter: 318c8b0795cSMark F. Adams . Gmat_2 - glabal matrix of graph (data not defined) 319c8b0795cSMark F. Adams . Gmat_1 - base graph to grab with 320c8b0795cSMark F. Adams . selected_2 - 321c8b0795cSMark F. Adams Input/Output Parameter: 322c8b0795cSMark F. Adams . llist_aggs_2 - linked list of aggs, ghost lids are based on Gmat_2 (squared graph) 323c8b0795cSMark F. Adams */ 324c8b0795cSMark F. Adams #undef __FUNCT__ 325c8b0795cSMark F. Adams #define __FUNCT__ "smoothAggs" 326c8b0795cSMark F. Adams PetscErrorCode smoothAggs( const Mat Gmat_2, /* base (squared) graph */ 327c8b0795cSMark F. Adams const Mat Gmat_1, /* base graph, could be unsymmetic */ 328c8b0795cSMark F. Adams const IS selected_2, /* [nselected total] selected vertices */ 329c8b0795cSMark F. Adams IS llist_aggs_2 /* [nloc_nghost] global ID of aggregate */ 330c8b0795cSMark F. Adams ) 331c8b0795cSMark F. Adams { 332c8b0795cSMark F. Adams PetscErrorCode ierr; 333c8b0795cSMark F. Adams PetscBool isMPI; 334c8b0795cSMark F. Adams Mat_SeqAIJ *matA_1, *matB_1=0, *matA_2, *matB_2=0; 335c8b0795cSMark F. Adams MPI_Comm wcomm = ((PetscObject)Gmat_2)->comm; 336c8b0795cSMark F. Adams PetscMPIInt mype; 337b43b03e9SMark F. Adams PetscInt lid,*ii,*idx,ix,Iend,my0,nnodes_2,kk,n,j; 338c8b0795cSMark F. Adams Mat_MPIAIJ *mpimat_2 = 0, *mpimat_1=0; 339c8b0795cSMark F. Adams const PetscInt nloc = Gmat_2->rmap->n; 340c8b0795cSMark F. Adams PetscScalar *cpcol_1_state,*cpcol_2_state,*deleted_parent_gid; 341c8b0795cSMark F. Adams PetscInt *lid_cprowID_1,*id_llist_2,*lid_cprowID_2; 342c8b0795cSMark F. Adams NState *lid_state; 343c8b0795cSMark F. Adams 344c8b0795cSMark F. Adams PetscFunctionBegin; 345c8b0795cSMark F. Adams ierr = MPI_Comm_rank( wcomm, &mype ); CHKERRQ(ierr); 346c8b0795cSMark F. Adams ierr = MatGetOwnershipRange(Gmat_1,&my0,&Iend); CHKERRQ(ierr); 347c8b0795cSMark F. Adams 348c8b0795cSMark F. Adams if( !PETSC_TRUE ) { 349c8b0795cSMark F. Adams PetscViewer viewer; char fname[32]; static int llev=0; 350c8b0795cSMark F. Adams sprintf(fname,"Gmat2_%d.m",llev++); 351c8b0795cSMark F. Adams PetscViewerASCIIOpen(wcomm,fname,&viewer); 352c8b0795cSMark F. Adams ierr = PetscViewerSetFormat( viewer, PETSC_VIEWER_ASCII_MATLAB); CHKERRQ(ierr); 353c8b0795cSMark F. Adams ierr = MatView(Gmat_2, viewer ); CHKERRQ(ierr); 354c8b0795cSMark F. Adams ierr = PetscViewerDestroy( &viewer ); 355c8b0795cSMark F. Adams } 356c8b0795cSMark F. Adams 357c8b0795cSMark F. Adams { /* copy linked list into temp buffer - should not work directly on pointer */ 358c8b0795cSMark F. Adams const PetscInt *llist_idx; 359c8b0795cSMark F. Adams ierr = ISGetSize( llist_aggs_2, &nnodes_2 ); CHKERRQ(ierr); 360c8b0795cSMark F. Adams ierr = PetscMalloc( nnodes_2*sizeof(PetscInt), &id_llist_2 ); CHKERRQ(ierr); 361c8b0795cSMark F. Adams ierr = ISGetIndices( llist_aggs_2, &llist_idx ); CHKERRQ(ierr); 362c8b0795cSMark F. Adams for(lid=0;lid<nnodes_2;lid++) id_llist_2[lid] = llist_idx[lid]; 363c8b0795cSMark F. Adams ierr = ISRestoreIndices( llist_aggs_2, &llist_idx ); CHKERRQ(ierr); 364c8b0795cSMark F. Adams } 365c8b0795cSMark F. Adams 366c8b0795cSMark F. Adams /* get submatrices */ 367c8b0795cSMark F. Adams ierr = PetscTypeCompare( (PetscObject)Gmat_1, MATMPIAIJ, &isMPI ); CHKERRQ(ierr); 368c8b0795cSMark F. Adams if(isMPI) { 369c8b0795cSMark F. Adams /* grab matrix objects */ 370c8b0795cSMark F. Adams mpimat_2 = (Mat_MPIAIJ*)Gmat_2->data; 371c8b0795cSMark F. Adams mpimat_1 = (Mat_MPIAIJ*)Gmat_1->data; 372c8b0795cSMark F. Adams matA_1 = (Mat_SeqAIJ*)mpimat_1->A->data; 373c8b0795cSMark F. Adams matB_1 = (Mat_SeqAIJ*)mpimat_1->B->data; 374c8b0795cSMark F. Adams matA_2 = (Mat_SeqAIJ*)mpimat_2->A->data; 375c8b0795cSMark F. Adams matB_2 = (Mat_SeqAIJ*)mpimat_2->B->data; 376c8b0795cSMark F. Adams 377c8b0795cSMark F. Adams /* force compressed row storage for B matrix in AuxMat */ 378c8b0795cSMark F. Adams matB_1->compressedrow.check = PETSC_TRUE; 379c8b0795cSMark F. Adams ierr = MatCheckCompressedRow(mpimat_1->B,&matB_1->compressedrow,matB_1->i,Gmat_1->rmap->n,-1.0); 380c8b0795cSMark F. Adams CHKERRQ(ierr); 381c8b0795cSMark F. Adams 382c8b0795cSMark F. Adams ierr = PetscMalloc( nloc*sizeof(PetscInt), &lid_cprowID_2 ); CHKERRQ(ierr); 383c8b0795cSMark F. Adams ierr = PetscMalloc( nloc*sizeof(PetscInt), &lid_cprowID_1 ); CHKERRQ(ierr); 384c8b0795cSMark F. Adams for(lid=0;lid<nloc;lid++) lid_cprowID_1[lid] = lid_cprowID_2[lid] = -1; 385c8b0795cSMark F. Adams for (ix=0; ix<matB_1->compressedrow.nrows; ix++) { 386c8b0795cSMark F. Adams PetscInt lid = matB_1->compressedrow.rindex[ix]; 387c8b0795cSMark F. Adams lid_cprowID_1[lid] = ix; 388c8b0795cSMark F. Adams } 389c8b0795cSMark F. Adams for (ix=0; ix<matB_2->compressedrow.nrows; ix++) { 390c8b0795cSMark F. Adams PetscInt lid = matB_2->compressedrow.rindex[ix]; 391c8b0795cSMark F. Adams lid_cprowID_2[lid] = ix; 392c8b0795cSMark F. Adams } 393c8b0795cSMark F. Adams } 394c8b0795cSMark F. Adams else { 395c8b0795cSMark F. Adams matA_1 = (Mat_SeqAIJ*)Gmat_1->data; 396c8b0795cSMark F. Adams matA_2 = (Mat_SeqAIJ*)Gmat_2->data; 397c8b0795cSMark F. Adams lid_cprowID_2 = lid_cprowID_1 = 0; 398c8b0795cSMark F. Adams } 399c8b0795cSMark F. Adams assert( matA_1 && !matA_1->compressedrow.use ); 400c8b0795cSMark F. Adams assert( matB_1==0 || matB_1->compressedrow.use ); 401c8b0795cSMark F. Adams assert( matA_2 && !matA_2->compressedrow.use ); 402c8b0795cSMark F. Adams assert( matB_2==0 || matB_2->compressedrow.use ); 403c8b0795cSMark F. Adams 404c8b0795cSMark F. Adams /* get state of locals and selected gid for deleted */ 405c8b0795cSMark F. Adams ierr = PetscMalloc( nloc*sizeof(NState), &lid_state ); CHKERRQ(ierr); 406c8b0795cSMark F. Adams ierr = PetscMalloc( nloc*sizeof(PetscScalar), &deleted_parent_gid ); CHKERRQ(ierr); 407c8b0795cSMark F. Adams for( lid = 0 ; lid < nloc ; lid++ ) { 408c8b0795cSMark F. Adams deleted_parent_gid[lid] = -1.0; 409c8b0795cSMark F. Adams lid_state[lid] = DELETED; 410c8b0795cSMark F. Adams } 411c8b0795cSMark F. Adams /* set index into compressed row 'lid_cprowID', not -1 means its a boundary node */ 412c8b0795cSMark F. Adams { 413b43b03e9SMark F. Adams PetscInt nSelected; 414c8b0795cSMark F. Adams const PetscInt *selected_idx; 415c8b0795cSMark F. Adams /* set local selected */ 416c8b0795cSMark F. Adams ierr = ISGetSize( selected_2, &nSelected ); CHKERRQ(ierr); 417c8b0795cSMark F. Adams ierr = ISGetIndices( selected_2, &selected_idx ); CHKERRQ(ierr); 418c8b0795cSMark F. Adams for(kk=0;kk<nSelected;kk++){ 419c8b0795cSMark F. Adams PetscInt lid = selected_idx[kk]; 420c8b0795cSMark F. Adams if(lid<nloc) lid_state[lid] = (NState)(lid+my0); /* selected flag */ 421c8b0795cSMark F. Adams else break; 422b43b03e9SMark F. Adams /* remove singletons */ 423b43b03e9SMark F. Adams ii = matA_2->i; n = ii[lid+1] - ii[lid]; 424b43b03e9SMark F. Adams if( n < 2 ) { 425b43b03e9SMark F. Adams if(!lid_cprowID_2 || (ix=lid_cprowID_2[lid])==-1 || (matB_2->compressedrow.i[ix+1]-matB_2->compressedrow.i[ix])==0){ 426b43b03e9SMark F. Adams lid_state[lid] = REMOVED; 427b43b03e9SMark F. Adams } 428b43b03e9SMark F. Adams } 429c8b0795cSMark F. Adams } 430c8b0795cSMark F. Adams ierr = ISRestoreIndices( selected_2, &selected_idx ); CHKERRQ(ierr); 431c8b0795cSMark F. Adams } 432c8b0795cSMark F. Adams /* map local to selected local, -1 means a ghost owns it */ 433c8b0795cSMark F. Adams for(lid=kk=0;lid<nloc;lid++){ 434c8b0795cSMark F. Adams NState state = lid_state[lid]; 435c8b0795cSMark F. Adams if( IS_SELECTED(state) ){ 436c8b0795cSMark F. Adams PetscInt flid = lid; 437c8b0795cSMark F. Adams do{ 438c8b0795cSMark F. Adams if(flid<nloc){ 439c8b0795cSMark F. Adams deleted_parent_gid[flid] = (PetscScalar)(lid + my0); 440c8b0795cSMark F. Adams } 441c8b0795cSMark F. Adams kk++; 442c8b0795cSMark F. Adams } while( (flid=id_llist_2[flid]) != -1 ); 443c8b0795cSMark F. Adams } 444c8b0795cSMark F. Adams } 445c8b0795cSMark F. Adams /* get 'cpcol_1_state', 'cpcol_2_state' - uses mpimat_1->lvec & mpimat_2->lvec for temp space */ 446c8b0795cSMark F. Adams if (isMPI) { 447c8b0795cSMark F. Adams Vec tempVec; 448c8b0795cSMark F. Adams 449c8b0795cSMark F. Adams /* get 'cpcol_1_state' */ 450c8b0795cSMark F. Adams ierr = MatGetVecs( Gmat_1, &tempVec, 0 ); CHKERRQ(ierr); 451c8b0795cSMark F. Adams for(kk=0,j=my0;kk<nloc;kk++,j++){ 452c8b0795cSMark F. Adams PetscScalar v = (PetscScalar)lid_state[kk]; 453c8b0795cSMark F. Adams ierr = VecSetValues( tempVec, 1, &j, &v, INSERT_VALUES ); CHKERRQ(ierr); 454c8b0795cSMark F. Adams } 455c8b0795cSMark F. Adams ierr = VecAssemblyBegin( tempVec ); CHKERRQ(ierr); 456c8b0795cSMark F. Adams ierr = VecAssemblyEnd( tempVec ); CHKERRQ(ierr); 457c8b0795cSMark F. Adams ierr = VecScatterBegin(mpimat_1->Mvctx,tempVec, mpimat_1->lvec,INSERT_VALUES,SCATTER_FORWARD); 458c8b0795cSMark F. Adams CHKERRQ(ierr); 459c8b0795cSMark F. Adams ierr = VecScatterEnd(mpimat_1->Mvctx,tempVec, mpimat_1->lvec,INSERT_VALUES,SCATTER_FORWARD); 460c8b0795cSMark F. Adams CHKERRQ(ierr); 461c8b0795cSMark F. Adams ierr = VecGetArray( mpimat_1->lvec, &cpcol_1_state ); CHKERRQ(ierr); 462c8b0795cSMark F. Adams ierr = VecDestroy( &tempVec ); CHKERRQ(ierr); 463c8b0795cSMark F. Adams 464c8b0795cSMark F. Adams /* get 'cpcol_2_state' */ 465c8b0795cSMark F. Adams ierr = MatGetVecs( Gmat_2, &tempVec, 0 ); CHKERRQ(ierr); 466c8b0795cSMark F. Adams for(kk=0,j=my0;kk<nloc;kk++,j++){ 467c8b0795cSMark F. Adams PetscScalar v = (PetscScalar)lid_state[kk]; 468c8b0795cSMark F. Adams ierr = VecSetValues( tempVec, 1, &j, &v, INSERT_VALUES ); CHKERRQ(ierr); 469c8b0795cSMark F. Adams } 470c8b0795cSMark F. Adams ierr = VecAssemblyBegin( tempVec ); CHKERRQ(ierr); 471c8b0795cSMark F. Adams ierr = VecAssemblyEnd( tempVec ); CHKERRQ(ierr); 472c8b0795cSMark F. Adams ierr = VecScatterBegin(mpimat_2->Mvctx,tempVec, mpimat_2->lvec,INSERT_VALUES,SCATTER_FORWARD); 473c8b0795cSMark F. Adams CHKERRQ(ierr); 474c8b0795cSMark F. Adams ierr = VecScatterEnd(mpimat_2->Mvctx,tempVec, mpimat_2->lvec,INSERT_VALUES,SCATTER_FORWARD); 475c8b0795cSMark F. Adams CHKERRQ(ierr); 476c8b0795cSMark F. Adams ierr = VecGetArray( mpimat_2->lvec, &cpcol_2_state ); CHKERRQ(ierr); 477c8b0795cSMark F. Adams ierr = VecDestroy( &tempVec ); CHKERRQ(ierr); 478c8b0795cSMark F. Adams } /* ismpi */ 479c8b0795cSMark F. Adams 480c8b0795cSMark F. Adams /* doit */ 481c8b0795cSMark F. Adams for(lid=0;lid<nloc;lid++){ 482c8b0795cSMark F. Adams NState state = lid_state[lid]; 483c8b0795cSMark F. Adams if( IS_SELECTED(state) ) { /* steal locals */ 484c8b0795cSMark F. Adams ii = matA_1->i; n = ii[lid+1] - ii[lid]; 485c8b0795cSMark F. Adams idx = matA_1->j + ii[lid]; 486c8b0795cSMark F. Adams for (j=0; j<n; j++) { 487c8b0795cSMark F. Adams PetscInt flid, lidj = idx[j], sgid; 488c8b0795cSMark F. Adams NState statej = lid_state[lidj]; 48974778d6cSJed Brown if (statej==DELETED && (sgid=(PetscInt)PetscRealPart(deleted_parent_gid[lidj])) != lid+my0) { /* steal local */ 490c8b0795cSMark F. Adams deleted_parent_gid[lidj] = (PetscScalar)(lid+my0); /* send this with _2 */ 491c8b0795cSMark F. Adams if( sgid >= my0 && sgid < my0+nloc ){ /* I'm stealing this local from a local */ 492c8b0795cSMark F. Adams PetscInt hav=0, flid2=sgid-my0, lastid; 493c8b0795cSMark F. Adams /* looking for local from local so id_llist_2 works */ 494c8b0795cSMark F. Adams for( lastid=flid2, flid=id_llist_2[flid2] ; flid!=-1 ; flid=id_llist_2[flid] ) { 495c8b0795cSMark F. Adams if( flid == lidj ) { 496c8b0795cSMark F. Adams id_llist_2[lastid] = id_llist_2[flid]; /* remove lidj from list */ 497c8b0795cSMark F. Adams id_llist_2[flid] = id_llist_2[lid]; id_llist_2[lid] = flid; /* insert 'lidj' into head of llist */ 498c8b0795cSMark F. Adams hav++; 499c8b0795cSMark F. Adams break; 500c8b0795cSMark F. Adams } 501c8b0795cSMark F. Adams lastid = flid; 502c8b0795cSMark F. Adams } 503c8b0795cSMark F. Adams if(hav!=1){ 504c8b0795cSMark F. Adams if(hav==0)SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"failed to find adj in 'selected' lists - structurally unsymmetric matrix"); 505c8b0795cSMark F. Adams SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"found node %d times???",hav); 506c8b0795cSMark F. Adams } 507c8b0795cSMark F. Adams } 508c8b0795cSMark F. Adams else{ /* I'm stealing this local, owned by a ghost - ok to use _2, local */ 509c8b0795cSMark F. Adams assert(sgid==-1); 510c8b0795cSMark F. Adams id_llist_2[lidj] = id_llist_2[lid]; id_llist_2[lid] = lidj; /* insert 'lidj' into head of llist */ 511c8b0795cSMark F. Adams /* local remove at end, off add/rm at end */ 512c8b0795cSMark F. Adams } 513c8b0795cSMark F. Adams } 514c8b0795cSMark F. Adams } 515c8b0795cSMark F. Adams } 516c8b0795cSMark F. Adams else if( state == DELETED && lid_cprowID_1 ) { 51774778d6cSJed Brown PetscInt sgidold = (PetscInt)PetscRealPart(deleted_parent_gid[lid]); 518c8b0795cSMark F. Adams /* see if I have a selected ghost neighbor that will steal me */ 519c8b0795cSMark F. Adams if( (ix=lid_cprowID_1[lid]) != -1 ){ 520c8b0795cSMark F. Adams ii = matB_1->compressedrow.i; n = ii[ix+1] - ii[ix]; 521c8b0795cSMark F. Adams idx = matB_1->j + ii[ix]; 522c8b0795cSMark F. Adams for( j=0 ; j<n ; j++ ) { 523c8b0795cSMark F. Adams PetscInt cpid = idx[j]; 524c8b0795cSMark F. Adams NState statej = (NState)PetscRealPart(cpcol_1_state[cpid]); 525c8b0795cSMark F. Adams if( IS_SELECTED(statej) && sgidold != (PetscInt)statej ) { /* ghost will steal this, remove from my list */ 526c8b0795cSMark F. Adams deleted_parent_gid[lid] = (PetscScalar)statej; /* send who selected with _2 */ 527c8b0795cSMark F. Adams if( sgidold>=my0 && sgidold<(my0+nloc) ) { /* this was mine */ 528c8b0795cSMark F. Adams PetscInt lastid,hav=0,flid,oldslidj=sgidold-my0; 529c8b0795cSMark F. Adams /* remove from 'oldslidj' list, local so _2 is OK */ 530c8b0795cSMark F. Adams for( lastid=oldslidj, flid=id_llist_2[oldslidj] ; flid != -1 ; flid=id_llist_2[flid] ) { 531c8b0795cSMark F. Adams if( flid == lid ) { 532c8b0795cSMark F. Adams id_llist_2[lastid] = id_llist_2[flid]; /* remove lid from oldslidj list */ 533c8b0795cSMark F. Adams hav++; 534c8b0795cSMark F. Adams break; 535c8b0795cSMark F. Adams } 536c8b0795cSMark F. Adams lastid = flid; 537c8b0795cSMark F. Adams } 538c8b0795cSMark F. Adams if(hav!=1){ 539c8b0795cSMark F. Adams if(hav==0)SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"failed to find adj in 'selected' lists - structurally unsymmetric matrix"); 540c8b0795cSMark F. Adams SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"found node %d times???",hav); 541c8b0795cSMark F. Adams } 542c8b0795cSMark F. Adams id_llist_2[lid] = -1; /* terminate linked list - needed? */ 543c8b0795cSMark F. Adams } 544c8b0795cSMark F. Adams else assert(id_llist_2[lid] == -1); 545c8b0795cSMark F. Adams } 546c8b0795cSMark F. Adams } 547c8b0795cSMark F. Adams } 548c8b0795cSMark F. Adams } /* selected/deleted */ 549c8b0795cSMark F. Adams else assert(state == REMOVED || !lid_cprowID_1); 550c8b0795cSMark F. Adams } /* node loop */ 551c8b0795cSMark F. Adams 552c8b0795cSMark F. Adams if( isMPI ) { 553c8b0795cSMark F. Adams PetscScalar *cpcol_2_sel_gid; 554c8b0795cSMark F. Adams Vec tempVec; 555c8b0795cSMark F. Adams PetscInt cpid; 556c8b0795cSMark F. Adams 557c8b0795cSMark F. Adams ierr = VecRestoreArray( mpimat_1->lvec, &cpcol_1_state ); CHKERRQ(ierr); 558c8b0795cSMark F. Adams ierr = VecRestoreArray( mpimat_2->lvec, &cpcol_2_state ); CHKERRQ(ierr); 559c8b0795cSMark F. Adams 560c8b0795cSMark F. Adams /* get 'cpcol_2_sel_gid' */ 561c8b0795cSMark F. Adams ierr = MatGetVecs( Gmat_2, &tempVec, 0 ); CHKERRQ(ierr); 562c8b0795cSMark F. Adams for(kk=0,j=my0;kk<nloc;kk++,j++){ 563c8b0795cSMark F. Adams ierr = VecSetValues( tempVec, 1, &j, &deleted_parent_gid[kk], INSERT_VALUES ); CHKERRQ(ierr); 564c8b0795cSMark F. Adams } 565c8b0795cSMark F. Adams ierr = VecAssemblyBegin( tempVec ); CHKERRQ(ierr); 566c8b0795cSMark F. Adams ierr = VecAssemblyEnd( tempVec ); CHKERRQ(ierr); 567c8b0795cSMark F. Adams ierr = VecScatterBegin(mpimat_2->Mvctx,tempVec, mpimat_2->lvec,INSERT_VALUES,SCATTER_FORWARD); 568c8b0795cSMark F. Adams CHKERRQ(ierr); 569c8b0795cSMark F. Adams ierr = VecScatterEnd(mpimat_2->Mvctx,tempVec, mpimat_2->lvec,INSERT_VALUES,SCATTER_FORWARD); 570c8b0795cSMark F. Adams CHKERRQ(ierr); 571c8b0795cSMark F. Adams ierr = VecDestroy( &tempVec ); CHKERRQ(ierr); 572c8b0795cSMark F. Adams 573c8b0795cSMark F. Adams ierr = VecGetArray( mpimat_2->lvec, &cpcol_2_sel_gid ); CHKERRQ(ierr); 574c8b0795cSMark F. Adams 575c8b0795cSMark F. Adams /* look for deleted ghosts and see if they moved */ 576c8b0795cSMark F. Adams for(lid=0;lid<nloc;lid++){ 577c8b0795cSMark F. Adams NState state = lid_state[lid]; 578c8b0795cSMark F. Adams if( IS_SELECTED(state) ){ 579c8b0795cSMark F. Adams PetscInt flid,lastid,old_sgid=lid+my0; 580c8b0795cSMark F. Adams /* look for deleted ghosts and see if they moved */ 581c8b0795cSMark F. Adams for( lastid=lid, flid=id_llist_2[lid] ; flid!=-1 ; flid=id_llist_2[flid] ) { 582c8b0795cSMark F. Adams if( flid>=nloc ) { 58374778d6cSJed Brown PetscInt cpid = flid-nloc, sgid_new = (PetscInt)PetscRealPart(cpcol_2_sel_gid[cpid]); 584c8b0795cSMark F. Adams if( sgid_new != old_sgid && sgid_new != -1 ) { 585c8b0795cSMark F. Adams id_llist_2[lastid] = id_llist_2[flid]; /* remove 'flid' from list */ 586c8b0795cSMark F. Adams id_llist_2[flid] = -1; 587c8b0795cSMark F. Adams flid = lastid; 588c8b0795cSMark F. Adams } /* if it changed parents */ 589c8b0795cSMark F. Adams else lastid = flid; 590c8b0795cSMark F. Adams } /* for ghost nodes */ 591c8b0795cSMark F. Adams else lastid = flid; 592c8b0795cSMark F. Adams } /* loop over list of deleted */ 593c8b0795cSMark F. Adams } /* selected */ 594c8b0795cSMark F. Adams } 595c8b0795cSMark F. Adams 596c8b0795cSMark F. Adams /* look at ghosts, see if they changed, and moved here */ 597c8b0795cSMark F. Adams for(cpid=0;cpid<nnodes_2-nloc;cpid++){ 59874778d6cSJed Brown PetscInt sgid_new = (PetscInt)PetscRealPart(cpcol_2_sel_gid[cpid]); 599c8b0795cSMark F. Adams if( sgid_new>=my0 && sgid_new<(my0+nloc) ) { /* this is mine */ 600c8b0795cSMark F. Adams PetscInt lastid,flid,slid_new=sgid_new-my0,flidj=nloc+cpid,hav=0; 601c8b0795cSMark F. Adams for( lastid=slid_new, flid=id_llist_2[slid_new] ; flid != -1 ; flid=id_llist_2[flid] ) { 602c8b0795cSMark F. Adams if( flid == flidj ) { 603c8b0795cSMark F. Adams hav++; 604c8b0795cSMark F. Adams break; 605c8b0795cSMark F. Adams } 606c8b0795cSMark F. Adams lastid = flid; 607c8b0795cSMark F. Adams } 608c8b0795cSMark F. Adams if( hav != 1 ){ 609c8b0795cSMark F. Adams assert(id_llist_2[flidj] == -1); 610c8b0795cSMark F. Adams id_llist_2[flidj] = id_llist_2[slid_new]; id_llist_2[slid_new] = flidj; /* insert 'flidj' into head of llist */ 611c8b0795cSMark F. Adams } 612c8b0795cSMark F. Adams } 613c8b0795cSMark F. Adams } 614c8b0795cSMark F. Adams 615c8b0795cSMark F. Adams ierr = VecRestoreArray( mpimat_2->lvec, &cpcol_2_sel_gid ); CHKERRQ(ierr); 616c8b0795cSMark F. Adams ierr = PetscFree( lid_cprowID_1 ); CHKERRQ(ierr); 617c8b0795cSMark F. Adams ierr = PetscFree( lid_cprowID_2 ); CHKERRQ(ierr); 618c8b0795cSMark F. Adams } 619c8b0795cSMark F. Adams 620c8b0795cSMark F. Adams /* copy out new aggs */ 621c8b0795cSMark F. Adams ierr = ISGeneralSetIndices(llist_aggs_2, nnodes_2, id_llist_2, PETSC_COPY_VALUES ); CHKERRQ(ierr); 622c8b0795cSMark F. Adams 623c8b0795cSMark F. Adams ierr = PetscFree( id_llist_2 ); CHKERRQ(ierr); 624c8b0795cSMark F. Adams ierr = PetscFree( deleted_parent_gid ); CHKERRQ(ierr); 625c8b0795cSMark F. Adams ierr = PetscFree( lid_state ); CHKERRQ(ierr); 626c8b0795cSMark F. Adams 627c8b0795cSMark F. Adams PetscFunctionReturn(0); 628c8b0795cSMark F. Adams } 6292e68589bSMark F. Adams 6302e68589bSMark F. Adams /* -------------------------------------------------------------------------- */ 6312e68589bSMark F. Adams /* 6322e68589bSMark F. Adams PCSetData_AGG 6332e68589bSMark F. Adams 6342e68589bSMark F. Adams Input Parameter: 6352e68589bSMark F. Adams . pc - 6362e68589bSMark F. Adams */ 6372e68589bSMark F. Adams #undef __FUNCT__ 6382e68589bSMark F. Adams #define __FUNCT__ "PCSetData_AGG" 6392e68589bSMark F. Adams PetscErrorCode PCSetData_AGG( PC pc ) 6402e68589bSMark F. Adams { 6412e68589bSMark F. Adams PetscErrorCode ierr; 6422e68589bSMark F. Adams PetscFunctionBegin; 6432e68589bSMark F. Adams ierr = PCSetCoordinates_AGG( pc, -1, PETSC_NULL ); CHKERRQ(ierr); 6442e68589bSMark F. Adams PetscFunctionReturn(0); 6452e68589bSMark F. Adams } 6462e68589bSMark F. Adams 6472e68589bSMark F. Adams /* -------------------------------------------------------------------------- */ 6482e68589bSMark F. Adams /* 6492e68589bSMark F. Adams formProl0 6502e68589bSMark F. Adams 6512e68589bSMark F. Adams Input Parameter: 6522e68589bSMark F. Adams . selected - list of selected local ID, includes selected ghosts 6532e68589bSMark F. Adams . locals_llist - linked list with aggregates 6542e68589bSMark F. Adams . bs - block size 6552e68589bSMark F. Adams . nSAvec - num columns of new P 6562e68589bSMark F. Adams . my0crs - global index of locals 6572e68589bSMark F. Adams . data_stride - bs*(nloc nodes + ghost nodes) 6582e68589bSMark F. Adams . data_in[data_stride*nSAvec] - local data on fine grid 6592e68589bSMark F. Adams . flid_fgid[data_stride/bs] - make local to global IDs, includes ghosts in 'locals_llist' 6602e68589bSMark F. Adams Output Parameter: 6612e68589bSMark F. Adams . a_data_out - in with fine grid data (w/ghosts), out with coarse grid data 6622e68589bSMark F. Adams . a_Prol - prolongation operator 6632e68589bSMark F. Adams */ 6642e68589bSMark F. Adams #undef __FUNCT__ 6652e68589bSMark F. Adams #define __FUNCT__ "formProl0" 6662e68589bSMark F. Adams PetscErrorCode formProl0( IS selected, /* list of selected local ID, includes selected ghosts */ 6672e68589bSMark F. Adams IS locals_llist, /* linked list from selected vertices of aggregate unselected vertices */ 6682e68589bSMark F. Adams const PetscInt bs, 6692e68589bSMark F. Adams const PetscInt nSAvec, 6702e68589bSMark F. Adams const PetscInt my0crs, 6712e68589bSMark F. Adams const PetscInt data_stride, 6722e68589bSMark F. Adams PetscReal data_in[], 6732e68589bSMark F. Adams const PetscInt flid_fgid[], 6742e68589bSMark F. Adams PetscReal **a_data_out, 6752e68589bSMark F. Adams Mat a_Prol /* prolongation operator (output)*/ 6762e68589bSMark F. Adams ) 6772e68589bSMark F. Adams { 6782e68589bSMark F. Adams PetscErrorCode ierr; 679b43b03e9SMark F. Adams PetscInt Istart,Iend,nFineLoc,clid,flid,aggID,kk,jj,ii,mm,nLocalSelected,ndone,nSelected,minsz; 6802e68589bSMark F. Adams MPI_Comm wcomm = ((PetscObject)a_Prol)->comm; 6812e68589bSMark F. Adams PetscMPIInt mype, npe; 6822e68589bSMark F. Adams const PetscInt *selected_idx,*llist_idx; 6832e68589bSMark F. Adams PetscReal *out_data; 6842adcac29SMark F. Adams /* #define OUT_AGGS */ 6859057884aSMark F. Adams #ifdef OUT_AGGS 6869057884aSMark F. Adams static PetscInt llev = 0; char fname[32]; FILE *file; 6879057884aSMark F. Adams sprintf(fname,"aggs_%d.m",llev++); 688b2a4f308SMark F. Adams if(llev==1) { 6899057884aSMark F. Adams file = fopen(fname,"w"); 6909057884aSMark F. Adams fprintf(file,"figure,\n"); 691b2a4f308SMark F. Adams } 6929057884aSMark F. Adams #endif 6932e68589bSMark F. Adams 6942e68589bSMark F. Adams PetscFunctionBegin; 6952e68589bSMark F. Adams ierr = MPI_Comm_rank(wcomm,&mype);CHKERRQ(ierr); 6962e68589bSMark F. Adams ierr = MPI_Comm_size(wcomm,&npe);CHKERRQ(ierr); 6972e68589bSMark F. Adams ierr = MatGetOwnershipRange( a_Prol, &Istart, &Iend ); CHKERRQ(ierr); 6982e68589bSMark F. Adams nFineLoc = (Iend-Istart)/bs; assert((Iend-Istart)%bs==0); 6992e68589bSMark F. Adams 700c8b0795cSMark F. Adams ierr = ISGetSize( selected, &nSelected ); CHKERRQ(ierr); 7012e68589bSMark F. Adams ierr = ISGetIndices( selected, &selected_idx ); CHKERRQ(ierr); 702b43b03e9SMark F. Adams ierr = ISGetIndices( locals_llist, &llist_idx ); CHKERRQ(ierr); 7032e68589bSMark F. Adams for(kk=0,nLocalSelected=0;kk<nSelected;kk++){ 7042e68589bSMark F. Adams PetscInt lid = selected_idx[kk]; 705b43b03e9SMark F. Adams if( lid<nFineLoc && llist_idx[lid] != -1 ) nLocalSelected++; 7062e68589bSMark F. Adams } 7072e68589bSMark F. Adams 7082e68589bSMark F. Adams /* aloc space for coarse point data (output) */ 7092e68589bSMark F. Adams #define DATA_OUT_STRIDE (nLocalSelected*nSAvec) 710c8b0795cSMark F. Adams ierr = PetscMalloc( DATA_OUT_STRIDE*nSAvec*sizeof(PetscReal), &out_data ); CHKERRQ(ierr); 711c8b0795cSMark F. Adams for(ii=0;ii<DATA_OUT_STRIDE*nSAvec;ii++) out_data[ii]=1.e300; 7122e68589bSMark F. Adams *a_data_out = out_data; /* output - stride nLocalSelected*nSAvec */ 7132e68589bSMark F. Adams 7142e68589bSMark F. Adams /* find points and set prolongation */ 715c8b0795cSMark F. Adams minsz = 100; 7162e68589bSMark F. Adams ndone = 0; 717b43b03e9SMark F. Adams for( mm = clid = 0 ; mm < nSelected ; mm++ ){ 718b43b03e9SMark F. Adams PetscInt lid = selected_idx[mm]; 7192e68589bSMark F. Adams PetscInt cgid = my0crs + clid, cids[100]; 720b43b03e9SMark F. Adams if( lid>=nFineLoc || llist_idx[lid]==-1 ) continue; /* skip ghost or singleton */ 721b43b03e9SMark F. Adams 7222e68589bSMark F. Adams /* count agg */ 7232e68589bSMark F. Adams aggID = 0; 724b43b03e9SMark F. Adams flid = selected_idx[mm]; assert(flid != -1); 7252e68589bSMark F. Adams do{ 7262e68589bSMark F. Adams aggID++; 7272e68589bSMark F. Adams } while( (flid=llist_idx[flid]) != -1 ); 728c8b0795cSMark F. Adams if( aggID<minsz ) minsz = aggID; 7292e68589bSMark F. Adams 7302e68589bSMark F. Adams /* get block */ 7312e68589bSMark F. Adams { 7322e68589bSMark F. Adams PetscBLASInt asz=aggID,M=asz*bs,N=nSAvec,INFO; 7332e68589bSMark F. Adams PetscBLASInt Mdata=M+((N-M>0)?N-M:0),LDA=Mdata,LWORK=N*bs; 7342e68589bSMark F. Adams PetscScalar *qqc,*qqr,*TAU,*WORK; 7352e68589bSMark F. Adams PetscInt *fids; 7362e68589bSMark F. Adams 7372e68589bSMark F. Adams ierr = PetscMalloc( (Mdata*N)*sizeof(PetscScalar), &qqc ); CHKERRQ(ierr); 7382e68589bSMark F. Adams ierr = PetscMalloc( (M*N)*sizeof(PetscScalar), &qqr ); CHKERRQ(ierr); 7392e68589bSMark F. Adams ierr = PetscMalloc( N*sizeof(PetscScalar), &TAU ); CHKERRQ(ierr); 7402e68589bSMark F. Adams ierr = PetscMalloc( LWORK*sizeof(PetscScalar), &WORK ); CHKERRQ(ierr); 7412e68589bSMark F. Adams ierr = PetscMalloc( M*sizeof(PetscInt), &fids ); CHKERRQ(ierr); 7422e68589bSMark F. Adams 743b43b03e9SMark F. Adams flid = selected_idx[mm]; 7442e68589bSMark F. Adams aggID = 0; 7452e68589bSMark F. Adams do{ 7462e68589bSMark F. Adams /* copy in B_i matrix - column oriented */ 7472e68589bSMark F. Adams PetscReal *data = &data_in[flid*bs]; 7482e68589bSMark F. Adams for( kk = ii = 0; ii < bs ; ii++ ) { 7492e68589bSMark F. Adams for( jj = 0; jj < N ; jj++ ) { 7502e68589bSMark F. Adams qqc[jj*Mdata + aggID*bs + ii] = data[jj*data_stride + ii]; 7512e68589bSMark F. Adams } 7522e68589bSMark F. Adams } 7539057884aSMark F. Adams #ifdef OUT_AGGS 754b2a4f308SMark F. Adams if(llev==1) { 7559057884aSMark F. Adams char str[] = "plot(%e,%e,'r*'), hold on,\n", col[] = "rgbkmc", sim[] = "*os+h>d<vx^"; 756b2a4f308SMark F. Adams PetscInt M,pi,pj,gid=Istart+flid; 7579057884aSMark F. Adams str[12] = col[clid%6]; str[13] = sim[(clid/6)%11]; 758b2a4f308SMark F. Adams M = (PetscInt)(PetscSqrtScalar((PetscScalar)nFineLoc*npe)); 759b2a4f308SMark F. Adams pj = gid/M; pi = gid%M; 760b2a4f308SMark F. Adams fprintf(file,str,(double)pi,(double)pj); 761b2a4f308SMark F. Adams /* fprintf(file,str,data[2*data_stride+1],-data[2*data_stride]); */ 7629057884aSMark F. Adams } 7639057884aSMark F. Adams #endif 7642e68589bSMark F. Adams /* set fine IDs */ 7652e68589bSMark F. Adams for(kk=0;kk<bs;kk++) fids[aggID*bs + kk] = flid_fgid[flid]*bs + kk; 7662e68589bSMark F. Adams 7672e68589bSMark F. Adams aggID++; 7682e68589bSMark F. Adams }while( (flid=llist_idx[flid]) != -1 ); 7692e68589bSMark F. Adams 7702e68589bSMark F. Adams /* pad with zeros */ 7712e68589bSMark F. Adams for( ii = asz*bs; ii < Mdata ; ii++ ) { 7722e68589bSMark F. Adams for( jj = 0; jj < N ; jj++, kk++ ) { 7732e68589bSMark F. Adams qqc[jj*Mdata + ii] = .0; 7742e68589bSMark F. Adams } 7752e68589bSMark F. Adams } 7762e68589bSMark F. Adams 7772e68589bSMark F. Adams ndone += aggID; 7782e68589bSMark F. Adams /* QR */ 7792e68589bSMark F. Adams LAPACKgeqrf_( &Mdata, &N, qqc, &LDA, TAU, WORK, &LWORK, &INFO ); 7802e68589bSMark F. Adams if( INFO != 0 ) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"xGEQRS error"); 7812e68589bSMark F. Adams /* get R - column oriented - output B_{i+1} */ 7822e68589bSMark F. Adams { 7832e68589bSMark F. Adams PetscReal *data = &out_data[clid*nSAvec]; 7842e68589bSMark F. Adams for( jj = 0; jj < nSAvec ; jj++ ) { 7852e68589bSMark F. Adams for( ii = 0; ii < nSAvec ; ii++ ) { 7862e68589bSMark F. Adams assert(data[jj*DATA_OUT_STRIDE + ii] == 1.e300); 7872e68589bSMark F. Adams if( ii <= jj ) data[jj*DATA_OUT_STRIDE + ii] = PetscRealPart(qqc[jj*Mdata + ii]); 7882e68589bSMark F. Adams else data[jj*DATA_OUT_STRIDE + ii] = 0.; 7892e68589bSMark F. Adams } 7902e68589bSMark F. Adams } 7912e68589bSMark F. Adams } 7922e68589bSMark F. Adams 7932e68589bSMark F. Adams /* get Q - row oriented */ 7942e68589bSMark F. Adams LAPACKungqr_( &Mdata, &N, &N, qqc, &LDA, TAU, WORK, &LWORK, &INFO ); 7952e68589bSMark F. Adams if( INFO != 0 ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"xORGQR error arg %d",-INFO); 7962e68589bSMark F. Adams 7972e68589bSMark F. Adams for( ii = 0 ; ii < M ; ii++ ){ 7982e68589bSMark F. Adams for( jj = 0 ; jj < N ; jj++ ) { 7992e68589bSMark F. Adams qqr[N*ii + jj] = qqc[jj*Mdata + ii]; 8002e68589bSMark F. Adams } 8012e68589bSMark F. Adams } 8022e68589bSMark F. Adams 8032e68589bSMark F. Adams /* add diagonal block of P0 */ 804c8b0795cSMark F. Adams for(kk=0;kk<N;kk++) { 805c8b0795cSMark F. Adams cids[kk] = N*cgid + kk; /* global col IDs in P0 */ 806c8b0795cSMark F. Adams } 8072e68589bSMark F. Adams ierr = MatSetValues(a_Prol,M,fids,N,cids,qqr,INSERT_VALUES); CHKERRQ(ierr); 8082e68589bSMark F. Adams 8092e68589bSMark F. Adams ierr = PetscFree( qqc ); CHKERRQ(ierr); 8102e68589bSMark F. Adams ierr = PetscFree( qqr ); CHKERRQ(ierr); 8112e68589bSMark F. Adams ierr = PetscFree( TAU ); CHKERRQ(ierr); 8122e68589bSMark F. Adams ierr = PetscFree( WORK ); CHKERRQ(ierr); 8132e68589bSMark F. Adams ierr = PetscFree( fids ); CHKERRQ(ierr); 8142e68589bSMark F. Adams } /* scoping */ 815b43b03e9SMark F. Adams clid++; 8162e68589bSMark F. Adams } /* for all coarse nodes */ 8172e68589bSMark F. Adams 818c8b0795cSMark F. Adams /* ierr = MPI_Allreduce( &ndone, &ii, 1, MPIU_INT, MPIU_SUM, wcomm ); */ 8192e68589bSMark F. Adams /* MatGetSize( a_Prol, &kk, &jj ); */ 820c8b0795cSMark F. Adams /* ierr = MPI_Allreduce( &minsz, &jj, 1, MPIU_INT, MPIU_MIN, wcomm ); */ 821ef4ad70eSMark F. Adams /* PetscPrintf(PETSC_COMM_WORLD," **** [%d]%s %d total done, %d nodes (%d local done), min agg. size = %d\n",mype,__FUNCT__,ii,kk/bs,ndone,jj); */ 8222e68589bSMark F. Adams 8239057884aSMark F. Adams #ifdef OUT_AGGS 824b2a4f308SMark F. Adams if(llev==1) fclose(file); 8259057884aSMark F. Adams #endif 8262e68589bSMark F. Adams ierr = ISRestoreIndices( selected, &selected_idx ); CHKERRQ(ierr); 8272e68589bSMark F. Adams ierr = ISRestoreIndices( locals_llist, &llist_idx ); CHKERRQ(ierr); 8282e68589bSMark F. Adams ierr = MatAssemblyBegin(a_Prol,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 8292e68589bSMark F. Adams ierr = MatAssemblyEnd(a_Prol,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 8302e68589bSMark F. Adams 8312e68589bSMark F. Adams PetscFunctionReturn(0); 8322e68589bSMark F. Adams } 8332e68589bSMark F. Adams 8342e68589bSMark F. Adams /* -------------------------------------------------------------------------- */ 8352e68589bSMark F. Adams /* 836c8b0795cSMark F. Adams PCGAMGgraph_AGG 8372e68589bSMark F. Adams 8382e68589bSMark F. Adams Input Parameter: 8392e68589bSMark F. Adams . pc - this 8402e68589bSMark F. Adams . Amat - matrix on this fine level 8412e68589bSMark F. Adams Output Parameter: 842c8b0795cSMark F. Adams . a_Gmat - 8432e68589bSMark F. Adams */ 8442e68589bSMark F. Adams #undef __FUNCT__ 845c8b0795cSMark F. Adams #define __FUNCT__ "PCGAMGgraph_AGG" 846c8b0795cSMark F. Adams PetscErrorCode PCGAMGgraph_AGG( PC pc, 8472e68589bSMark F. Adams const Mat Amat, 848c8b0795cSMark F. Adams Mat *a_Gmat 849c8b0795cSMark F. Adams ) 850c8b0795cSMark F. Adams { 851c8b0795cSMark F. Adams PetscErrorCode ierr; 852c8b0795cSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 853c8b0795cSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 854c8b0795cSMark F. Adams const PetscInt verbose = pc_gamg->verbose; 855c8b0795cSMark F. Adams const PetscReal vfilter = pc_gamg->threshold; 856c8b0795cSMark F. Adams PC_GAMG_AGG *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx; 857c8b0795cSMark F. Adams PetscMPIInt mype,npe; 858c8b0795cSMark F. Adams Mat Gmat, Gmat2; 859c8b0795cSMark F. Adams MPI_Comm wcomm = ((PetscObject)Amat)->comm; 860c8b0795cSMark F. Adams 861c8b0795cSMark F. Adams PetscFunctionBegin; 862c8b0795cSMark F. Adams ierr = MPI_Comm_rank( wcomm, &mype); CHKERRQ(ierr); 863c8b0795cSMark F. Adams ierr = MPI_Comm_size( wcomm, &npe); CHKERRQ(ierr); 864c8b0795cSMark F. Adams 865c8b0795cSMark F. Adams ierr = createSimpleGraph( Amat, &Gmat ); CHKERRQ( ierr ); 866c8b0795cSMark F. Adams ierr = scaleFilterGraph( &Gmat, vfilter, pc_gamg_agg->sym_graph, verbose ); CHKERRQ( ierr ); 867c8b0795cSMark F. Adams 868ef4ad70eSMark F. Adams if( pc_gamg_agg->square_graph ) { 869c8b0795cSMark F. Adams ierr = MatTransposeMatMult( Gmat, Gmat, MAT_INITIAL_MATRIX, PETSC_DEFAULT, &Gmat2 ); 870c8b0795cSMark F. Adams CHKERRQ(ierr); 871c8b0795cSMark F. Adams /* attach auxilary matrix */ 872c8b0795cSMark F. Adams pc_gamg_agg->aux_mat = Gmat; 873c8b0795cSMark F. Adams *a_Gmat = Gmat2; 874ef4ad70eSMark F. Adams } 875ef4ad70eSMark F. Adams else { 876ef4ad70eSMark F. Adams *a_Gmat = Gmat; assert(pc_gamg_agg->aux_mat == 0); 877ef4ad70eSMark F. Adams } 878c8b0795cSMark F. Adams 879c8b0795cSMark F. Adams PetscFunctionReturn(0); 880c8b0795cSMark F. Adams } 881c8b0795cSMark F. Adams 882c8b0795cSMark F. Adams /* -------------------------------------------------------------------------- */ 883c8b0795cSMark F. Adams /* 884b43b03e9SMark F. Adams PCGAMGCoarsen_AGG 885c8b0795cSMark F. Adams 886c8b0795cSMark F. Adams Input Parameter: 887c8b0795cSMark F. Adams . pc - this 888c8b0795cSMark F. Adams . Gmat2 - matrix on this fine level 889c8b0795cSMark F. Adams Output Parameter: 890c8b0795cSMark F. Adams . a_selected - prolongation operator to the next level 891c8b0795cSMark F. Adams . a_llist_parent - data of coarse grid points (num local columns in 'a_P_out') 892c8b0795cSMark F. Adams */ 893c8b0795cSMark F. Adams #undef __FUNCT__ 894b43b03e9SMark F. Adams #define __FUNCT__ "PCGAMGCoarsen_AGG" 895b43b03e9SMark F. Adams PetscErrorCode PCGAMGCoarsen_AGG( PC pc, 896c8b0795cSMark F. Adams const Mat Gmat2, 897c8b0795cSMark F. Adams IS *a_selected, 898c8b0795cSMark F. Adams IS *a_llist_parent 899c8b0795cSMark F. Adams ) 900c8b0795cSMark F. Adams { 901c8b0795cSMark F. Adams PetscErrorCode ierr; 902c8b0795cSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 903c8b0795cSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 904c8b0795cSMark F. Adams PC_GAMG_AGG *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx; 905c8b0795cSMark F. Adams Mat Gmat1; /* unsquared graph (not symetrized!) */ 906c8b0795cSMark F. Adams IS perm, selected, llist_parent; 907c8b0795cSMark F. Adams PetscInt Ii,nloc,bs,n,m; 908c8b0795cSMark F. Adams PetscInt *permute; 909c8b0795cSMark F. Adams PetscBool *bIndexSet; 910b43b03e9SMark F. Adams MatCoarsen crs; 911b43b03e9SMark F. Adams MPI_Comm wcomm = ((PetscObject)Gmat2)->comm; 912c8b0795cSMark F. Adams /* PetscMPIInt mype,npe; */ 913c8b0795cSMark F. Adams 914c8b0795cSMark F. Adams PetscFunctionBegin; 915c8b0795cSMark F. Adams /* ierr = MPI_Comm_rank( wcomm, &mype); CHKERRQ(ierr); */ 916c8b0795cSMark F. Adams /* ierr = MPI_Comm_size( wcomm, &npe); CHKERRQ(ierr); */ 917c8b0795cSMark F. Adams ierr = MatGetLocalSize( Gmat2, &n, &m ); CHKERRQ(ierr); 918c8b0795cSMark F. Adams ierr = MatGetBlockSize( Gmat2, &bs ); CHKERRQ(ierr); assert(bs==1); 919c8b0795cSMark F. Adams nloc = n/bs; 920c8b0795cSMark F. Adams 921c8b0795cSMark F. Adams /* get unsquared graph */ 922c8b0795cSMark F. Adams Gmat1 = pc_gamg_agg->aux_mat; pc_gamg_agg->aux_mat = 0; 923c8b0795cSMark F. Adams 924c8b0795cSMark F. Adams /* get MIS aggs */ 925c8b0795cSMark F. Adams /* randomize */ 926c8b0795cSMark F. Adams ierr = PetscMalloc( nloc*sizeof(PetscInt), &permute ); CHKERRQ(ierr); 927c8b0795cSMark F. Adams ierr = PetscMalloc( nloc*sizeof(PetscBool), &bIndexSet ); CHKERRQ(ierr); 928c8b0795cSMark F. Adams for ( Ii = 0; Ii < nloc ; Ii++ ){ 929c8b0795cSMark F. Adams bIndexSet[Ii] = PETSC_FALSE; 930c8b0795cSMark F. Adams permute[Ii] = Ii; 931c8b0795cSMark F. Adams } 932c8b0795cSMark F. Adams srand(1); /* make deterministic */ 933c8b0795cSMark F. Adams for ( Ii = 0; Ii < nloc ; Ii++ ) { 934c8b0795cSMark F. Adams PetscInt iSwapIndex = rand()%nloc; 935c8b0795cSMark F. Adams if (!bIndexSet[iSwapIndex] && iSwapIndex != Ii) { 936c8b0795cSMark F. Adams PetscInt iTemp = permute[iSwapIndex]; 937c8b0795cSMark F. Adams permute[iSwapIndex] = permute[Ii]; 938c8b0795cSMark F. Adams permute[Ii] = iTemp; 939c8b0795cSMark F. Adams bIndexSet[iSwapIndex] = PETSC_TRUE; 940c8b0795cSMark F. Adams } 941c8b0795cSMark F. Adams } 942c8b0795cSMark F. Adams ierr = PetscFree( bIndexSet ); CHKERRQ(ierr); 943c8b0795cSMark F. Adams 944c8b0795cSMark F. Adams ierr = ISCreateGeneral(PETSC_COMM_SELF, nloc, permute, PETSC_USE_POINTER, &perm); 945c8b0795cSMark F. Adams CHKERRQ(ierr); 946b43b03e9SMark F. Adams #if defined PETSC_USE_LOG 947b43b03e9SMark F. Adams ierr = PetscLogEventBegin(gamg_setup_events[SET4],0,0,0,0);CHKERRQ(ierr); 948b43b03e9SMark F. Adams #endif 949b43b03e9SMark F. Adams ierr = MatCoarsenCreate( wcomm, &crs ); CHKERRQ(ierr); 9509057884aSMark F. Adams /* ierr = MatCoarsenSetType( crs, MATCOARSENMIS ); CHKERRQ(ierr); */ 9519057884aSMark F. Adams ierr = MatCoarsenSetFromOptions( crs ); CHKERRQ(ierr); 952b43b03e9SMark F. Adams ierr = MatCoarsenSetGreedyOrdering( crs, perm ); CHKERRQ(ierr); 953b43b03e9SMark F. Adams ierr = MatCoarsenSetAdjacency( crs, Gmat2 ); CHKERRQ(ierr); 954b43b03e9SMark F. Adams ierr = MatCoarsenSetVerbose( crs, pc_gamg->verbose ); CHKERRQ(ierr); 955b43b03e9SMark F. Adams ierr = MatCoarsenSetStrictAggs( crs, PETSC_TRUE ); CHKERRQ(ierr); 956b43b03e9SMark F. Adams ierr = MatCoarsenApply( crs ); CHKERRQ(ierr); 957b43b03e9SMark F. Adams ierr = MatCoarsenGetMISAggLists( crs, &selected, &llist_parent ); CHKERRQ(ierr); 958b43b03e9SMark F. Adams ierr = MatCoarsenDestroy( &crs ); CHKERRQ(ierr); 959b43b03e9SMark F. Adams 960c8b0795cSMark F. Adams ierr = ISDestroy( &perm ); CHKERRQ(ierr); 961c8b0795cSMark F. Adams ierr = PetscFree( permute ); CHKERRQ(ierr); 962b43b03e9SMark F. Adams #if defined PETSC_USE_LOG 963b43b03e9SMark F. Adams ierr = PetscLogEventEnd(gamg_setup_events[SET4],0,0,0,0);CHKERRQ(ierr); 964b43b03e9SMark F. Adams #endif 965c8b0795cSMark F. Adams /* smooth aggs */ 966ef4ad70eSMark F. Adams if( Gmat1 ) { 967c8b0795cSMark F. Adams ierr = smoothAggs( Gmat2, Gmat1, selected, llist_parent ); CHKERRQ(ierr); 968c8b0795cSMark F. Adams ierr = MatDestroy( &Gmat1 ); CHKERRQ(ierr); 969ef4ad70eSMark F. Adams } 970c8b0795cSMark F. Adams 971c8b0795cSMark F. Adams *a_selected = selected; 972c8b0795cSMark F. Adams *a_llist_parent = llist_parent; 973c8b0795cSMark F. Adams 974c8b0795cSMark F. Adams PetscFunctionReturn(0); 975c8b0795cSMark F. Adams } 976c8b0795cSMark F. Adams 977c8b0795cSMark F. Adams /* -------------------------------------------------------------------------- */ 978c8b0795cSMark F. Adams /* 979c8b0795cSMark F. Adams PCGAMGprolongator_AGG 980c8b0795cSMark F. Adams 981c8b0795cSMark F. Adams Input Parameter: 982c8b0795cSMark F. Adams . pc - this 983c8b0795cSMark F. Adams . Amat - matrix on this fine level 984c8b0795cSMark F. Adams . Graph - used to get ghost data for nodes in 985c8b0795cSMark F. Adams . selected - [nselected inc. chosts] 986c8b0795cSMark F. Adams . llist_parent - [nloc + Gmat.nghost] linked list 987c8b0795cSMark F. Adams Output Parameter: 988c8b0795cSMark F. Adams . a_P_out - prolongation operator to the next level 989c8b0795cSMark F. Adams */ 990c8b0795cSMark F. Adams #undef __FUNCT__ 991c8b0795cSMark F. Adams #define __FUNCT__ "PCGAMGprolongator_AGG" 992c8b0795cSMark F. Adams PetscErrorCode PCGAMGprolongator_AGG( PC pc, 993c8b0795cSMark F. Adams const Mat Amat, 994c8b0795cSMark F. Adams const Mat Gmat, 995c8b0795cSMark F. Adams IS selected, 996c8b0795cSMark F. Adams IS llist_parent, 997c8b0795cSMark F. Adams Mat *a_P_out 9982e68589bSMark F. Adams ) 9992e68589bSMark F. Adams { 10002e68589bSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 10012e68589bSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 10022e68589bSMark F. Adams const PetscInt verbose = pc_gamg->verbose; 1003c8b0795cSMark F. Adams const PetscInt data_cols = pc_gamg->data_cell_cols; 10042e68589bSMark F. Adams PetscErrorCode ierr; 1005c8b0795cSMark F. Adams PetscInt Istart,Iend,nloc,ii,jj,kk,my0,nLocalSelected,bs; 1006c8b0795cSMark F. Adams Mat Prol; 10072e68589bSMark F. Adams PetscMPIInt mype, npe; 10082e68589bSMark F. Adams MPI_Comm wcomm = ((PetscObject)Amat)->comm; 1009b43b03e9SMark F. Adams const PetscInt *selected_idx,*llist_idx,col_bs=data_cols; 1010c8b0795cSMark F. Adams PetscReal *data_w_ghost; 1011c8b0795cSMark F. Adams PetscInt myCrs0, nbnodes=0, *flid_fgid; 10122e68589bSMark F. Adams 10132e68589bSMark F. Adams PetscFunctionBegin; 10142e68589bSMark F. Adams ierr = MPI_Comm_rank( wcomm, &mype); CHKERRQ(ierr); 10152e68589bSMark F. Adams ierr = MPI_Comm_size( wcomm, &npe); CHKERRQ(ierr); 10162e68589bSMark F. Adams ierr = MatGetOwnershipRange( Amat, &Istart, &Iend ); CHKERRQ(ierr); 1017c8b0795cSMark F. Adams ierr = MatGetBlockSize( Amat, &bs ); CHKERRQ( ierr ); 1018c8b0795cSMark F. Adams nloc = (Iend-Istart)/bs; my0 = Istart/bs; assert((Iend-Istart)%bs==0); 10192e68589bSMark F. Adams 10202e68589bSMark F. Adams /* get 'nLocalSelected' */ 1021c8b0795cSMark F. Adams ierr = ISGetSize( selected, &kk ); CHKERRQ(ierr); 1022c8b0795cSMark F. Adams ierr = ISGetIndices( selected, &selected_idx ); CHKERRQ(ierr); 1023b43b03e9SMark F. Adams ierr = ISGetIndices( llist_parent, &llist_idx ); CHKERRQ(ierr); 1024c8b0795cSMark F. Adams for(ii=0,nLocalSelected=0;ii<kk;ii++){ 1025c8b0795cSMark F. Adams PetscInt lid = selected_idx[ii]; 1026b43b03e9SMark F. Adams /* filter out singletons */ 1027b43b03e9SMark F. Adams if( lid<nloc && llist_idx[lid] != -1) nLocalSelected++; 10282e68589bSMark F. Adams } 1029c8b0795cSMark F. Adams ierr = ISRestoreIndices( selected, &selected_idx ); CHKERRQ(ierr); 1030b43b03e9SMark F. Adams ierr = ISRestoreIndices( llist_parent, &llist_idx ); CHKERRQ(ierr); 10312e68589bSMark F. Adams 10322e68589bSMark F. Adams /* create prolongator, create P matrix */ 103369b1f4b7SBarry Smith ierr = MatCreateAIJ( wcomm, 1034c8b0795cSMark F. Adams nloc*bs, nLocalSelected*col_bs, 10352e68589bSMark F. Adams PETSC_DETERMINE, PETSC_DETERMINE, 10362e68589bSMark F. Adams data_cols, PETSC_NULL, data_cols, PETSC_NULL, 10372e68589bSMark F. Adams &Prol ); 10382e68589bSMark F. Adams CHKERRQ(ierr); 10392e68589bSMark F. Adams 10402e68589bSMark F. Adams /* can get all points "removed" */ 1041c8b0795cSMark F. Adams ierr = MatGetSize( Prol, &kk, &ii ); CHKERRQ(ierr); 1042c8b0795cSMark F. Adams if( ii==0 ) { 10432e68589bSMark F. Adams if( verbose ) { 1044c8b0795cSMark F. Adams PetscPrintf(wcomm,"[%d]%s no selected points on coarse grid\n",mype,__FUNCT__); 10452e68589bSMark F. Adams } 10462e68589bSMark F. Adams ierr = MatDestroy( &Prol ); CHKERRQ(ierr); 10472e68589bSMark F. Adams *a_P_out = PETSC_NULL; /* out */ 10482e68589bSMark F. Adams PetscFunctionReturn(0); 10492e68589bSMark F. Adams } 1050c8b0795cSMark F. Adams if( verbose ) { 1051ef4ad70eSMark F. Adams PetscPrintf(PETSC_COMM_WORLD,"\t\t[%d]%s New grid %d nodes\n",mype,__FUNCT__,ii/col_bs); 1052c8b0795cSMark F. Adams } 1053c8b0795cSMark F. Adams ierr = MatGetOwnershipRangeColumn( Prol, &myCrs0, &kk ); CHKERRQ(ierr); 1054c8b0795cSMark F. Adams myCrs0 = myCrs0/col_bs; 10552e68589bSMark F. Adams 10562e68589bSMark F. Adams /* create global vector of data in 'data_w_ghost' */ 10572e68589bSMark F. Adams #if defined PETSC_USE_LOG 10582e68589bSMark F. Adams ierr = PetscLogEventBegin(gamg_setup_events[SET7],0,0,0,0);CHKERRQ(ierr); 10592e68589bSMark F. Adams #endif 1060c8b0795cSMark F. Adams if (npe > 1) { /* */ 10612e68589bSMark F. Adams PetscReal *tmp_gdata,*tmp_ldata,*tp2; 10622e68589bSMark F. Adams ierr = PetscMalloc( nloc*sizeof(PetscReal), &tmp_ldata ); CHKERRQ(ierr); 10632e68589bSMark F. Adams for( jj = 0 ; jj < data_cols ; jj++ ){ 1064c8b0795cSMark F. Adams for( kk = 0 ; kk < bs ; kk++) { 10652e68589bSMark F. Adams PetscInt ii,nnodes; 1066c8b0795cSMark F. Adams const PetscReal *tp = pc_gamg->data + jj*bs*nloc + kk; 1067c8b0795cSMark F. Adams for( ii = 0 ; ii < nloc ; ii++, tp += bs ){ 10682e68589bSMark F. Adams tmp_ldata[ii] = *tp; 10692e68589bSMark F. Adams } 10702e68589bSMark F. Adams ierr = getDataWithGhosts( Gmat, 1, tmp_ldata, &nnodes, &tmp_gdata ); 10712e68589bSMark F. Adams CHKERRQ(ierr); 10722e68589bSMark F. Adams if(jj==0 && kk==0) { /* now I know how many todal nodes - allocate */ 1073c8b0795cSMark F. Adams ierr = PetscMalloc( nnodes*bs*data_cols*sizeof(PetscReal), &data_w_ghost ); CHKERRQ(ierr); 1074c8b0795cSMark F. Adams nbnodes = bs*nnodes; 10752e68589bSMark F. Adams } 1076c8b0795cSMark F. Adams tp2 = data_w_ghost + jj*bs*nnodes + kk; 1077c8b0795cSMark F. Adams for( ii = 0 ; ii < nnodes ; ii++, tp2 += bs ){ 10782e68589bSMark F. Adams *tp2 = tmp_gdata[ii]; 10792e68589bSMark F. Adams } 10802e68589bSMark F. Adams ierr = PetscFree( tmp_gdata ); CHKERRQ(ierr); 10812e68589bSMark F. Adams } 10822e68589bSMark F. Adams } 10832e68589bSMark F. Adams ierr = PetscFree( tmp_ldata ); CHKERRQ(ierr); 10842e68589bSMark F. Adams } 10852e68589bSMark F. Adams else { 1086c8b0795cSMark F. Adams nbnodes = bs*nloc; 1087c8b0795cSMark F. Adams data_w_ghost = (PetscReal*)pc_gamg->data; 10882e68589bSMark F. Adams } 10892e68589bSMark F. Adams 10902e68589bSMark F. Adams /* get P0 */ 10912e68589bSMark F. Adams if( npe > 1 ){ 10922e68589bSMark F. Adams PetscReal *fid_glid_loc,*fiddata; 10932e68589bSMark F. Adams PetscInt nnodes; 10942e68589bSMark F. Adams 10952e68589bSMark F. Adams ierr = PetscMalloc( nloc*sizeof(PetscReal), &fid_glid_loc ); CHKERRQ(ierr); 10962e68589bSMark F. Adams for(kk=0;kk<nloc;kk++) fid_glid_loc[kk] = (PetscReal)(my0+kk); 10972e68589bSMark F. Adams ierr = getDataWithGhosts( Gmat, 1, fid_glid_loc, &nnodes, &fiddata ); 10982e68589bSMark F. Adams CHKERRQ(ierr); 10992e68589bSMark F. Adams ierr = PetscMalloc( nnodes*sizeof(PetscInt), &flid_fgid ); CHKERRQ(ierr); 11002e68589bSMark F. Adams for(kk=0;kk<nnodes;kk++) flid_fgid[kk] = (PetscInt)fiddata[kk]; 11012e68589bSMark F. Adams ierr = PetscFree( fiddata ); CHKERRQ(ierr); 1102c8b0795cSMark F. Adams assert(nnodes==nbnodes/bs); 11032e68589bSMark F. Adams ierr = PetscFree( fid_glid_loc ); CHKERRQ(ierr); 11042e68589bSMark F. Adams } 11052e68589bSMark F. Adams else { 11062e68589bSMark F. Adams ierr = PetscMalloc( nloc*sizeof(PetscInt), &flid_fgid ); CHKERRQ(ierr); 11072e68589bSMark F. Adams for(kk=0;kk<nloc;kk++) flid_fgid[kk] = my0 + kk; 11082e68589bSMark F. Adams } 11092e68589bSMark F. Adams #if defined PETSC_USE_LOG 11102e68589bSMark F. Adams ierr = PetscLogEventEnd(gamg_setup_events[SET7],0,0,0,0);CHKERRQ(ierr); 1111c8b0795cSMark F. Adams ierr = PetscLogEventBegin(gamg_setup_events[SET8],0,0,0,0);CHKERRQ(ierr); 11122e68589bSMark F. Adams #endif 1113c8b0795cSMark F. Adams { 1114c8b0795cSMark F. Adams PetscReal *data_out; 1115c8b0795cSMark F. Adams ierr = formProl0( selected, llist_parent, bs, data_cols, myCrs0, nbnodes, 1116c8b0795cSMark F. Adams data_w_ghost, flid_fgid, &data_out, Prol ); 11172e68589bSMark F. Adams CHKERRQ(ierr); 1118c8b0795cSMark F. Adams ierr = PetscFree( pc_gamg->data ); CHKERRQ( ierr ); 1119c8b0795cSMark F. Adams pc_gamg->data = data_out; 1120c8b0795cSMark F. Adams pc_gamg->data_cell_rows = data_cols; 1121c8b0795cSMark F. Adams pc_gamg->data_sz = data_cols*data_cols*nLocalSelected; 1122c8b0795cSMark F. Adams } 1123c8b0795cSMark F. Adams #if defined PETSC_USE_LOG 1124c8b0795cSMark F. Adams ierr = PetscLogEventEnd(gamg_setup_events[SET8],0,0,0,0);CHKERRQ(ierr); 1125c8b0795cSMark F. Adams #endif 11262e68589bSMark F. Adams if (npe > 1) ierr = PetscFree( data_w_ghost ); CHKERRQ(ierr); 11272e68589bSMark F. Adams ierr = PetscFree( flid_fgid ); CHKERRQ(ierr); 11282e68589bSMark F. Adams 1129c8b0795cSMark F. Adams /* attach block size of columns */ 1130c8b0795cSMark F. Adams if( pc_gamg->col_bs_id == -1 ) { 1131c8b0795cSMark F. Adams ierr = PetscObjectComposedDataRegister( &pc_gamg->col_bs_id ); assert(pc_gamg->col_bs_id != -1 ); 1132c8b0795cSMark F. Adams } 1133c8b0795cSMark F. Adams ierr = PetscObjectComposedDataSetInt( (PetscObject)Prol, pc_gamg->col_bs_id, data_cols ); CHKERRQ(ierr); 1134c8b0795cSMark F. Adams 1135c8b0795cSMark F. Adams *a_P_out = Prol; /* out */ 1136c8b0795cSMark F. Adams 1137c8b0795cSMark F. Adams PetscFunctionReturn(0); 1138c8b0795cSMark F. Adams } 1139c8b0795cSMark F. Adams 1140c8b0795cSMark F. Adams /* -------------------------------------------------------------------------- */ 1141c8b0795cSMark F. Adams /* 1142c8b0795cSMark F. Adams PCGAMGoptprol_AGG 1143c8b0795cSMark F. Adams 1144c8b0795cSMark F. Adams Input Parameter: 1145c8b0795cSMark F. Adams . pc - this 1146c8b0795cSMark F. Adams . Amat - matrix on this fine level 1147c8b0795cSMark F. Adams In/Output Parameter: 1148c8b0795cSMark F. Adams . a_P_out - prolongation operator to the next level 1149c8b0795cSMark F. Adams */ 1150c8b0795cSMark F. Adams #undef __FUNCT__ 1151c8b0795cSMark F. Adams #define __FUNCT__ "PCGAMGoptprol_AGG" 1152c8b0795cSMark F. Adams PetscErrorCode PCGAMGoptprol_AGG( PC pc, 1153c8b0795cSMark F. Adams const Mat Amat, 1154c8b0795cSMark F. Adams Mat *a_P 1155c8b0795cSMark F. Adams ) 1156c8b0795cSMark F. Adams { 1157c8b0795cSMark F. Adams PetscErrorCode ierr; 1158c8b0795cSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 1159c8b0795cSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 1160c8b0795cSMark F. Adams const PetscInt verbose = pc_gamg->verbose; 1161c8b0795cSMark F. Adams PC_GAMG_AGG *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx; 1162c8b0795cSMark F. Adams PetscInt jj; 1163c8b0795cSMark F. Adams PetscMPIInt mype,npe; 1164c8b0795cSMark F. Adams Mat Prol = *a_P; 1165c8b0795cSMark F. Adams MPI_Comm wcomm = ((PetscObject)Amat)->comm; 1166c8b0795cSMark F. Adams 1167c8b0795cSMark F. Adams PetscFunctionBegin; 1168c8b0795cSMark F. Adams ierr = MPI_Comm_rank( wcomm, &mype); CHKERRQ(ierr); 1169c8b0795cSMark F. Adams ierr = MPI_Comm_size( wcomm, &npe); CHKERRQ(ierr); 1170c8b0795cSMark F. Adams 11712e68589bSMark F. Adams /* smooth P0 */ 1172c8b0795cSMark F. Adams for( jj = 0 ; jj < pc_gamg_agg->nsmooths ; jj++ ){ 11732e68589bSMark F. Adams Mat tMat; 11742e68589bSMark F. Adams Vec diag; 11752e68589bSMark F. Adams PetscReal alpha, emax, emin; 11762e68589bSMark F. Adams #if defined PETSC_USE_LOG 11772e68589bSMark F. Adams ierr = PetscLogEventBegin(gamg_setup_events[SET9],0,0,0,0);CHKERRQ(ierr); 11782e68589bSMark F. Adams #endif 11792e68589bSMark F. Adams if( jj == 0 ) { 11802e68589bSMark F. Adams KSP eksp; 11812e68589bSMark F. Adams Vec bb, xx; 11822e68589bSMark F. Adams PC pc; 11832e68589bSMark F. Adams ierr = MatGetVecs( Amat, &bb, 0 ); CHKERRQ(ierr); 11842e68589bSMark F. Adams ierr = MatGetVecs( Amat, &xx, 0 ); CHKERRQ(ierr); 11852e68589bSMark F. Adams { 11862e68589bSMark F. Adams PetscRandom rctx; 11872e68589bSMark F. Adams ierr = PetscRandomCreate(wcomm,&rctx);CHKERRQ(ierr); 11882e68589bSMark F. Adams ierr = PetscRandomSetFromOptions(rctx);CHKERRQ(ierr); 11892e68589bSMark F. Adams ierr = VecSetRandom(bb,rctx);CHKERRQ(ierr); 11902e68589bSMark F. Adams ierr = PetscRandomDestroy( &rctx ); CHKERRQ(ierr); 11912e68589bSMark F. Adams } 11922e68589bSMark F. Adams ierr = KSPCreate(wcomm,&eksp); CHKERRQ(ierr); 11932e68589bSMark F. Adams ierr = KSPAppendOptionsPrefix( eksp, "est_"); CHKERRQ(ierr); 11942e68589bSMark F. Adams ierr = KSPSetFromOptions( eksp ); CHKERRQ(ierr); 11952e68589bSMark F. Adams ierr = KSPSetInitialGuessNonzero( eksp, PETSC_FALSE ); CHKERRQ(ierr); 11962e68589bSMark F. Adams ierr = KSPSetOperators( eksp, Amat, Amat, SAME_NONZERO_PATTERN ); 11972e68589bSMark F. Adams CHKERRQ( ierr ); 11982e68589bSMark F. Adams ierr = KSPGetPC( eksp, &pc ); CHKERRQ( ierr ); 11992e68589bSMark F. Adams ierr = PCSetType( pc, PCJACOBI ); CHKERRQ(ierr); /* smoother */ 12002e68589bSMark F. Adams ierr = KSPSetTolerances(eksp,PETSC_DEFAULT,PETSC_DEFAULT,PETSC_DEFAULT,10); 12012e68589bSMark F. Adams CHKERRQ(ierr); 12022e68589bSMark F. Adams ierr = KSPSetNormType( eksp, KSP_NORM_NONE ); CHKERRQ(ierr); 12032e68589bSMark F. Adams ierr = KSPSetComputeSingularValues( eksp,PETSC_TRUE ); CHKERRQ(ierr); 12042e68589bSMark F. Adams 12052e68589bSMark F. Adams /* solve - keep stuff out of logging */ 12062e68589bSMark F. Adams ierr = PetscLogEventDeactivate(KSP_Solve);CHKERRQ(ierr); 12072e68589bSMark F. Adams ierr = PetscLogEventDeactivate(PC_Apply);CHKERRQ(ierr); 12082e68589bSMark F. Adams ierr = KSPSolve( eksp, bb, xx ); CHKERRQ(ierr); 12092e68589bSMark F. Adams ierr = PetscLogEventActivate(KSP_Solve);CHKERRQ(ierr); 12102e68589bSMark F. Adams ierr = PetscLogEventActivate(PC_Apply);CHKERRQ(ierr); 12112e68589bSMark F. Adams 12122e68589bSMark F. Adams ierr = KSPComputeExtremeSingularValues( eksp, &emax, &emin ); CHKERRQ(ierr); 12132e68589bSMark F. Adams if( verbose ) { 1214c8b0795cSMark F. Adams PetscPrintf(wcomm,"\t\t\t%s smooth P0: max eigen=%e min=%e PC=%s\n", 12152e68589bSMark F. Adams __FUNCT__,emax,emin,PCJACOBI); 12162e68589bSMark F. Adams } 12172e68589bSMark F. Adams ierr = VecDestroy( &xx ); CHKERRQ(ierr); 12182e68589bSMark F. Adams ierr = VecDestroy( &bb ); CHKERRQ(ierr); 12192e68589bSMark F. Adams ierr = KSPDestroy( &eksp ); CHKERRQ(ierr); 12202e68589bSMark F. Adams 12212e68589bSMark F. Adams if( pc_gamg->emax_id == -1 ) { 12222e68589bSMark F. Adams ierr = PetscObjectComposedDataRegister( &pc_gamg->emax_id ); 12232e68589bSMark F. Adams assert(pc_gamg->emax_id != -1 ); 12242e68589bSMark F. Adams } 12252e68589bSMark F. Adams ierr = PetscObjectComposedDataSetScalar( (PetscObject)Amat, pc_gamg->emax_id, emax ); CHKERRQ(ierr); 12262e68589bSMark F. Adams } 12272e68589bSMark F. Adams 12282e68589bSMark F. Adams /* smooth P1 := (I - omega/lam D^{-1}A)P0 */ 12292e68589bSMark F. Adams ierr = MatMatMult( Amat, Prol, MAT_INITIAL_MATRIX, PETSC_DEFAULT, &tMat ); CHKERRQ(ierr); 12302e68589bSMark F. Adams ierr = MatGetVecs( Amat, &diag, 0 ); CHKERRQ(ierr); 12312e68589bSMark F. Adams ierr = MatGetDiagonal( Amat, diag ); CHKERRQ(ierr); /* effectively PCJACOBI */ 12322e68589bSMark F. Adams ierr = VecReciprocal( diag ); CHKERRQ(ierr); 12332e68589bSMark F. Adams ierr = MatDiagonalScale( tMat, diag, 0 ); CHKERRQ(ierr); 12342e68589bSMark F. Adams ierr = VecDestroy( &diag ); CHKERRQ(ierr); 12352e68589bSMark F. Adams alpha = -1.5/emax; 12362e68589bSMark F. Adams ierr = MatAYPX( tMat, alpha, Prol, SUBSET_NONZERO_PATTERN ); CHKERRQ(ierr); 12372e68589bSMark F. Adams ierr = MatDestroy( &Prol ); CHKERRQ(ierr); 12382e68589bSMark F. Adams Prol = tMat; 12392e68589bSMark F. Adams #if defined PETSC_USE_LOG 12402e68589bSMark F. Adams ierr = PetscLogEventEnd(gamg_setup_events[SET9],0,0,0,0);CHKERRQ(ierr); 12412e68589bSMark F. Adams #endif 12422e68589bSMark F. Adams } 12432e68589bSMark F. Adams 1244c8b0795cSMark F. Adams *a_P = Prol; 1245c8b0795cSMark F. Adams 1246c8b0795cSMark F. Adams PetscFunctionReturn(0); 12472e68589bSMark F. Adams } 12482e68589bSMark F. Adams 1249c8b0795cSMark F. Adams /* -------------------------------------------------------------------------- */ 1250c8b0795cSMark F. Adams /* 1251c8b0795cSMark F. Adams PCCreateGAMG_AGG 12522e68589bSMark F. Adams 1253c8b0795cSMark F. Adams Input Parameter: 1254c8b0795cSMark F. Adams . pc - 1255c8b0795cSMark F. Adams */ 1256c8b0795cSMark F. Adams #undef __FUNCT__ 1257c8b0795cSMark F. Adams #define __FUNCT__ "PCCreateGAMG_AGG" 1258c8b0795cSMark F. Adams PetscErrorCode PCCreateGAMG_AGG( PC pc ) 1259c8b0795cSMark F. Adams { 1260c8b0795cSMark F. Adams PetscErrorCode ierr; 1261c8b0795cSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 1262c8b0795cSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 1263c8b0795cSMark F. Adams PC_GAMG_AGG *pc_gamg_agg; 12642e68589bSMark F. Adams 1265c8b0795cSMark F. Adams PetscFunctionBegin; 1266c8b0795cSMark F. Adams /* create sub context for SA */ 1267c8b0795cSMark F. Adams ierr = PetscNewLog( pc, PC_GAMG_AGG, &pc_gamg_agg ); CHKERRQ(ierr); 1268c8b0795cSMark F. Adams assert(!pc_gamg->subctx); 1269c8b0795cSMark F. Adams pc_gamg->subctx = pc_gamg_agg; 1270c8b0795cSMark F. Adams 1271c8b0795cSMark F. Adams pc->ops->setfromoptions = PCSetFromOptions_GAMG_AGG; 1272c8b0795cSMark F. Adams pc->ops->destroy = PCDestroy_AGG; 1273c8b0795cSMark F. Adams /* reset does not do anything; setup not virtual */ 1274c8b0795cSMark F. Adams 1275c8b0795cSMark F. Adams /* set internal function pointers */ 1276c8b0795cSMark F. Adams pc_gamg->graph = PCGAMGgraph_AGG; 1277b43b03e9SMark F. Adams pc_gamg->coarsen = PCGAMGCoarsen_AGG; 1278c8b0795cSMark F. Adams pc_gamg->prolongator = PCGAMGprolongator_AGG; 1279c8b0795cSMark F. Adams pc_gamg->optprol = PCGAMGoptprol_AGG; 1280c8b0795cSMark F. Adams 1281c8b0795cSMark F. Adams pc_gamg->createdefaultdata = PCSetData_AGG; 1282c8b0795cSMark F. Adams 1283c8b0795cSMark F. Adams ierr = PetscObjectComposeFunctionDynamic( (PetscObject)pc, 1284c8b0795cSMark F. Adams "PCSetCoordinates_C", 1285c8b0795cSMark F. Adams "PCSetCoordinates_AGG", 1286c8b0795cSMark F. Adams PCSetCoordinates_AGG); 12872e68589bSMark F. Adams PetscFunctionReturn(0); 12882e68589bSMark F. Adams } 1289