12e68589bSMark F. Adams /* 22e68589bSMark F. Adams GAMG geometric-algebric multiogrid PC - Mark Adams 2011 32e68589bSMark F. Adams */ 42e68589bSMark F. Adams 52e68589bSMark F. Adams #include <../src/ksp/pc/impls/gamg/gamg.h> /*I "petscpc.h" I*/ 62e68589bSMark F. Adams #include <private/kspimpl.h> 72e68589bSMark F. Adams 82e68589bSMark F. Adams #include <assert.h> 92e68589bSMark F. Adams #include <petscblaslapack.h> 102e68589bSMark F. Adams 112e68589bSMark F. Adams typedef struct { 12*c8b0795cSMark F. Adams PetscInt nsmooths; 13*c8b0795cSMark F. Adams Mat aux_mat; 14*c8b0795cSMark F. Adams PetscBool sym_graph; 152e68589bSMark F. Adams }PC_GAMG_AGG; 162e68589bSMark F. Adams 172e68589bSMark F. Adams #undef __FUNCT__ 182e68589bSMark F. Adams #define __FUNCT__ "PCGAMGSetNSmooths" 192e68589bSMark F. Adams /*@ 202e68589bSMark F. Adams PCGAMGSetNSmooths - Set number of smoothing steps (1 is typical) 212e68589bSMark F. Adams 222e68589bSMark F. Adams Not Collective on PC 232e68589bSMark F. Adams 242e68589bSMark F. Adams Input Parameters: 252e68589bSMark F. Adams . pc - the preconditioner context 262e68589bSMark F. Adams 272e68589bSMark F. Adams Options Database Key: 282e68589bSMark F. Adams . -pc_gamg_agg_nsmooths 292e68589bSMark F. Adams 302e68589bSMark F. Adams Level: intermediate 312e68589bSMark F. Adams 322e68589bSMark F. Adams Concepts: Aggregation AMG preconditioner 332e68589bSMark F. Adams 342e68589bSMark F. Adams .seealso: () 352e68589bSMark F. Adams @*/ 362e68589bSMark F. Adams PetscErrorCode PCGAMGSetNSmooths(PC pc, PetscInt n) 372e68589bSMark F. Adams { 382e68589bSMark F. Adams PetscErrorCode ierr; 392e68589bSMark F. Adams 402e68589bSMark F. Adams PetscFunctionBegin; 412e68589bSMark F. Adams PetscValidHeaderSpecific(pc,PC_CLASSID,1); 422e68589bSMark F. Adams ierr = PetscTryMethod(pc,"PCGAMGSetNSmooths_C",(PC,PetscInt),(pc,n));CHKERRQ(ierr); 432e68589bSMark F. Adams PetscFunctionReturn(0); 442e68589bSMark F. Adams } 452e68589bSMark F. Adams 462e68589bSMark F. Adams EXTERN_C_BEGIN 472e68589bSMark F. Adams #undef __FUNCT__ 482e68589bSMark F. Adams #define __FUNCT__ "PCGAMGSetNSmooths_GAMG" 492e68589bSMark F. Adams PetscErrorCode PCGAMGSetNSmooths_GAMG(PC pc, PetscInt n) 502e68589bSMark F. Adams { 512e68589bSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 522e68589bSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 53*c8b0795cSMark F. Adams PC_GAMG_AGG *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx; 542e68589bSMark F. Adams 552e68589bSMark F. Adams PetscFunctionBegin; 56*c8b0795cSMark F. Adams pc_gamg_agg->nsmooths = n; 57*c8b0795cSMark F. Adams PetscFunctionReturn(0); 58*c8b0795cSMark F. Adams } 59*c8b0795cSMark F. Adams EXTERN_C_END 60*c8b0795cSMark F. Adams 61*c8b0795cSMark F. Adams #undef __FUNCT__ 62*c8b0795cSMark F. Adams #define __FUNCT__ "PCGAMGSetSymGraph" 63*c8b0795cSMark F. Adams /*@ 64*c8b0795cSMark F. Adams PCGAMGSetSymGraph - 65*c8b0795cSMark F. Adams 66*c8b0795cSMark F. Adams Not Collective on PC 67*c8b0795cSMark F. Adams 68*c8b0795cSMark F. Adams Input Parameters: 69*c8b0795cSMark F. Adams . pc - the preconditioner context 70*c8b0795cSMark F. Adams 71*c8b0795cSMark F. Adams Options Database Key: 72*c8b0795cSMark F. Adams . -pc_gamg_sym_graph 73*c8b0795cSMark F. Adams 74*c8b0795cSMark F. Adams Level: intermediate 75*c8b0795cSMark F. Adams 76*c8b0795cSMark F. Adams Concepts: Aggregation AMG preconditioner 77*c8b0795cSMark F. Adams 78*c8b0795cSMark F. Adams .seealso: () 79*c8b0795cSMark F. Adams @*/ 80*c8b0795cSMark F. Adams PetscErrorCode PCGAMGSetSymGraph(PC pc, PetscBool n) 81*c8b0795cSMark F. Adams { 82*c8b0795cSMark F. Adams PetscErrorCode ierr; 83*c8b0795cSMark F. Adams 84*c8b0795cSMark F. Adams PetscFunctionBegin; 85*c8b0795cSMark F. Adams PetscValidHeaderSpecific(pc,PC_CLASSID,1); 86*c8b0795cSMark F. Adams ierr = PetscTryMethod(pc,"PCGAMGSetSymGraph_C",(PC,PetscBool),(pc,n));CHKERRQ(ierr); 87*c8b0795cSMark F. Adams PetscFunctionReturn(0); 88*c8b0795cSMark F. Adams } 89*c8b0795cSMark F. Adams 90*c8b0795cSMark F. Adams EXTERN_C_BEGIN 91*c8b0795cSMark F. Adams #undef __FUNCT__ 92*c8b0795cSMark F. Adams #define __FUNCT__ "PCGAMGSetSymGraph_GAMG" 93*c8b0795cSMark F. Adams PetscErrorCode PCGAMGSetSymGraph_GAMG(PC pc, PetscBool n) 94*c8b0795cSMark F. Adams { 95*c8b0795cSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 96*c8b0795cSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 97*c8b0795cSMark F. Adams PC_GAMG_AGG *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx; 98*c8b0795cSMark F. Adams 99*c8b0795cSMark F. Adams PetscFunctionBegin; 100*c8b0795cSMark F. Adams pc_gamg_agg->sym_graph = n; 1012e68589bSMark F. Adams PetscFunctionReturn(0); 1022e68589bSMark F. Adams } 1032e68589bSMark F. Adams EXTERN_C_END 1042e68589bSMark F. Adams 1052e68589bSMark F. Adams /* -------------------------------------------------------------------------- */ 1062e68589bSMark F. Adams /* 1072e68589bSMark F. Adams PCSetFromOptions_GAMG_AGG 1082e68589bSMark F. Adams 1092e68589bSMark F. Adams Input Parameter: 1102e68589bSMark F. Adams . pc - 1112e68589bSMark F. Adams */ 1122e68589bSMark F. Adams #undef __FUNCT__ 1132e68589bSMark F. Adams #define __FUNCT__ "PCSetFromOptions_GAMG_AGG" 1142e68589bSMark F. Adams PetscErrorCode PCSetFromOptions_GAMG_AGG( PC pc ) 1152e68589bSMark F. Adams { 1162e68589bSMark F. Adams PetscErrorCode ierr; 1172e68589bSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 1182e68589bSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 119*c8b0795cSMark F. Adams PC_GAMG_AGG *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx; 1202e68589bSMark F. Adams PetscBool flag; 1212e68589bSMark F. Adams 1222e68589bSMark F. Adams PetscFunctionBegin; 1232e68589bSMark F. Adams /* call base class */ 1242e68589bSMark F. Adams ierr = PCSetFromOptions_GAMG( pc ); CHKERRQ(ierr); 1252e68589bSMark F. Adams 1262e68589bSMark F. Adams ierr = PetscOptionsHead("GAMG-AGG options"); CHKERRQ(ierr); 1272e68589bSMark F. Adams { 1282e68589bSMark F. Adams /* -pc_gamg_agg_nsmooths */ 129*c8b0795cSMark F. Adams pc_gamg_agg->nsmooths = 0; 1302e68589bSMark F. Adams ierr = PetscOptionsInt("-pc_gamg_agg_nsmooths", 1312e68589bSMark F. Adams "smoothing steps for smoothed aggregation, usually 1 (0)", 1322e68589bSMark F. Adams "PCGAMGSetNSmooths", 133*c8b0795cSMark F. Adams pc_gamg_agg->nsmooths, 134*c8b0795cSMark F. Adams &pc_gamg_agg->nsmooths, 135*c8b0795cSMark F. Adams &flag); 136*c8b0795cSMark F. Adams CHKERRQ(ierr); 137*c8b0795cSMark F. Adams 138*c8b0795cSMark F. Adams /* -pc_gamg_sym_graph */ 139*c8b0795cSMark F. Adams pc_gamg_agg->sym_graph = PETSC_FALSE; 140*c8b0795cSMark F. Adams ierr = PetscOptionsBool("-pc_gamg_sym_graph", 141*c8b0795cSMark F. Adams "Set for asymetric matrices", 142*c8b0795cSMark F. Adams "PCGAMGSetSymGraph", 143*c8b0795cSMark F. Adams pc_gamg_agg->sym_graph, 144*c8b0795cSMark F. Adams &pc_gamg_agg->sym_graph, 1452e68589bSMark F. Adams &flag); 1462e68589bSMark F. Adams CHKERRQ(ierr); 1472e68589bSMark F. Adams } 1482e68589bSMark F. Adams ierr = PetscOptionsTail();CHKERRQ(ierr); 1492e68589bSMark F. Adams 150*c8b0795cSMark F. Adams if( pc_gamg->verbose > 1 ) { 1512e68589bSMark F. Adams PetscPrintf(PETSC_COMM_WORLD,"[%d]%s done\n",0,__FUNCT__); 1522e68589bSMark F. Adams } 1532e68589bSMark F. Adams 1542e68589bSMark F. Adams PetscFunctionReturn(0); 1552e68589bSMark F. Adams } 1562e68589bSMark F. Adams 1572e68589bSMark F. Adams /* -------------------------------------------------------------------------- */ 1582e68589bSMark F. Adams /* 1592e68589bSMark F. Adams PCDestroy_AGG 1602e68589bSMark F. Adams 1612e68589bSMark F. Adams Input Parameter: 1622e68589bSMark F. Adams . pc - 1632e68589bSMark F. Adams */ 1642e68589bSMark F. Adams #undef __FUNCT__ 1652e68589bSMark F. Adams #define __FUNCT__ "PCDestroy_AGG" 1662e68589bSMark F. Adams PetscErrorCode PCDestroy_AGG( PC pc ) 1672e68589bSMark F. Adams { 1682e68589bSMark F. Adams PetscErrorCode ierr; 1692e68589bSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 1702e68589bSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 171*c8b0795cSMark F. Adams PC_GAMG_AGG *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx; 1722e68589bSMark F. Adams 1732e68589bSMark F. Adams PetscFunctionBegin; 174*c8b0795cSMark F. Adams if( pc_gamg_agg ) { 175*c8b0795cSMark F. Adams ierr = PetscFree(pc_gamg_agg);CHKERRQ(ierr); 176*c8b0795cSMark F. Adams pc_gamg_agg = 0; 1772e68589bSMark F. Adams } 1782e68589bSMark F. Adams 1792e68589bSMark F. Adams /* call base class */ 1802e68589bSMark F. Adams ierr = PCDestroy_GAMG( pc );CHKERRQ(ierr); 1812e68589bSMark F. Adams 1822e68589bSMark F. Adams PetscFunctionReturn(0); 1832e68589bSMark F. Adams } 1842e68589bSMark F. Adams 1852e68589bSMark F. Adams /* -------------------------------------------------------------------------- */ 1862e68589bSMark F. Adams /* 1872e68589bSMark F. Adams PCSetCoordinates_AGG 1882e68589bSMark F. Adams 1892e68589bSMark F. Adams Input Parameter: 1902e68589bSMark F. Adams . pc - the preconditioner context 1912e68589bSMark F. Adams */ 1922e68589bSMark F. Adams EXTERN_C_BEGIN 1932e68589bSMark F. Adams #undef __FUNCT__ 1942e68589bSMark F. Adams #define __FUNCT__ "PCSetCoordinates_AGG" 1952e68589bSMark F. Adams PetscErrorCode PCSetCoordinates_AGG( PC pc, PetscInt ndm, PetscReal *coords ) 1962e68589bSMark F. Adams { 1972e68589bSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 1982e68589bSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 1992e68589bSMark F. Adams PetscErrorCode ierr; 2002e68589bSMark F. Adams PetscInt arrsz,bs,my0,kk,ii,jj,nloc,Iend; 2012e68589bSMark F. Adams Mat Amat = pc->pmat; 2022e68589bSMark F. Adams 2032e68589bSMark F. Adams PetscFunctionBegin; 2042e68589bSMark F. Adams PetscValidHeaderSpecific( Amat, MAT_CLASSID, 1 ); 2052e68589bSMark F. Adams ierr = MatGetBlockSize( Amat, &bs ); CHKERRQ( ierr ); 2062e68589bSMark F. Adams ierr = MatGetOwnershipRange( Amat, &my0, &Iend ); CHKERRQ(ierr); 2072e68589bSMark F. Adams nloc = (Iend-my0)/bs; 2082e68589bSMark F. Adams if((Iend-my0)%bs!=0) SETERRQ1(((PetscObject)Amat)->comm,PETSC_ERR_ARG_WRONG, "Bad local size %d.",nloc); 2092e68589bSMark F. Adams 2102e68589bSMark F. Adams /* SA: null space vectors */ 211*c8b0795cSMark F. Adams if( coords && bs==1 ) pc_gamg->data_cell_cols = 1; /* scalar w/ coords and SA (not needed) */ 212*c8b0795cSMark F. Adams else if( coords ) pc_gamg->data_cell_cols = (ndm==2 ? 3 : 6); /* elasticity */ 213*c8b0795cSMark F. Adams else pc_gamg->data_cell_cols = bs; /* no data, force SA with constant null space vectors */ 214*c8b0795cSMark F. Adams pc_gamg->data_cell_rows = bs; 2152e68589bSMark F. Adams 216*c8b0795cSMark F. Adams arrsz = nloc*pc_gamg->data_cell_rows*pc_gamg->data_cell_cols; 2172e68589bSMark F. Adams 2182e68589bSMark F. Adams /* create data - syntactic sugar that should be refactored at some point */ 2192e68589bSMark F. Adams if (pc_gamg->data==0 || (pc_gamg->data_sz != arrsz)) { 2202e68589bSMark F. Adams ierr = PetscFree( pc_gamg->data ); CHKERRQ(ierr); 221*c8b0795cSMark F. Adams ierr = PetscMalloc(arrsz*sizeof(PetscReal), &pc_gamg->data ); CHKERRQ(ierr); 2222e68589bSMark F. Adams } 2232e68589bSMark F. Adams /* copy data in - column oriented */ 2242e68589bSMark F. Adams for(kk=0;kk<nloc;kk++){ 2252e68589bSMark F. Adams const PetscInt M = Iend - my0; 2262e68589bSMark F. Adams PetscReal *data = &pc_gamg->data[kk*bs]; 227*c8b0795cSMark F. Adams if( pc_gamg->data_cell_cols==1 ) *data = 1.0; 2282e68589bSMark F. Adams else { 2292e68589bSMark F. Adams for(ii=0;ii<bs;ii++) 2302e68589bSMark F. Adams for(jj=0;jj<bs;jj++) 2312e68589bSMark F. Adams if(ii==jj)data[ii*M + jj] = 1.0; /* translational modes */ 2322e68589bSMark F. Adams else data[ii*M + jj] = 0.0; 2332e68589bSMark F. Adams if( coords ) { 2342e68589bSMark F. Adams if( ndm == 2 ){ /* rotational modes */ 2352e68589bSMark F. Adams data += 2*M; 2362e68589bSMark F. Adams data[0] = -coords[2*kk+1]; 2372e68589bSMark F. Adams data[1] = coords[2*kk]; 2382e68589bSMark F. Adams } 2392e68589bSMark F. Adams else { 2402e68589bSMark F. Adams data += 3*M; 2412e68589bSMark F. Adams data[0] = 0.0; data[M+0] = coords[3*kk+2]; data[2*M+0] = -coords[3*kk+1]; 2422e68589bSMark F. Adams data[1] = -coords[3*kk+2]; data[M+1] = 0.0; data[2*M+1] = coords[3*kk]; 2432e68589bSMark F. Adams data[2] = coords[3*kk+1]; data[M+2] = -coords[3*kk]; data[2*M+2] = 0.0; 2442e68589bSMark F. Adams } 2452e68589bSMark F. Adams } 2462e68589bSMark F. Adams } 2472e68589bSMark F. Adams } 2482e68589bSMark F. Adams 2492e68589bSMark F. Adams pc_gamg->data_sz = arrsz; 2502e68589bSMark F. Adams 2512e68589bSMark F. Adams PetscFunctionReturn(0); 2522e68589bSMark F. Adams } 2532e68589bSMark F. Adams EXTERN_C_END 2542e68589bSMark F. Adams 255*c8b0795cSMark F. Adams /* -------------------------------------------------------------------------- */ 256*c8b0795cSMark F. Adams /* 257*c8b0795cSMark F. Adams smoothAggs - greedy grab of with G1 (unsquared graph) -- AIJ specific!!! 258*c8b0795cSMark F. Adams 259*c8b0795cSMark F. Adams Input Parameter: 260*c8b0795cSMark F. Adams . Gmat_2 - glabal matrix of graph (data not defined) 261*c8b0795cSMark F. Adams . Gmat_1 - base graph to grab with 262*c8b0795cSMark F. Adams . selected_2 - 263*c8b0795cSMark F. Adams Input/Output Parameter: 264*c8b0795cSMark F. Adams . llist_aggs_2 - linked list of aggs, ghost lids are based on Gmat_2 (squared graph) 265*c8b0795cSMark F. Adams */ 266*c8b0795cSMark F. Adams #undef __FUNCT__ 267*c8b0795cSMark F. Adams #define __FUNCT__ "smoothAggs" 268*c8b0795cSMark F. Adams PetscErrorCode smoothAggs( const Mat Gmat_2, /* base (squared) graph */ 269*c8b0795cSMark F. Adams const Mat Gmat_1, /* base graph, could be unsymmetic */ 270*c8b0795cSMark F. Adams const IS selected_2, /* [nselected total] selected vertices */ 271*c8b0795cSMark F. Adams IS llist_aggs_2 /* [nloc_nghost] global ID of aggregate */ 272*c8b0795cSMark F. Adams ) 273*c8b0795cSMark F. Adams { 274*c8b0795cSMark F. Adams PetscErrorCode ierr; 275*c8b0795cSMark F. Adams PetscBool isMPI; 276*c8b0795cSMark F. Adams Mat_SeqAIJ *matA_1, *matB_1=0, *matA_2, *matB_2=0; 277*c8b0795cSMark F. Adams MPI_Comm wcomm = ((PetscObject)Gmat_2)->comm; 278*c8b0795cSMark F. Adams PetscMPIInt mype; 279*c8b0795cSMark F. Adams PetscInt lid,*ii,*idx,ix,Iend,my0,nSelected,nnodes_2,kk,n,j; 280*c8b0795cSMark F. Adams Mat_MPIAIJ *mpimat_2 = 0, *mpimat_1=0; 281*c8b0795cSMark F. Adams const PetscInt nloc = Gmat_2->rmap->n; 282*c8b0795cSMark F. Adams PetscScalar *cpcol_1_state,*cpcol_2_state,*deleted_parent_gid; 283*c8b0795cSMark F. Adams PetscInt *lid_cprowID_1,*id_llist_2,*lid_cprowID_2; 284*c8b0795cSMark F. Adams NState *lid_state; 285*c8b0795cSMark F. Adams 286*c8b0795cSMark F. Adams PetscFunctionBegin; 287*c8b0795cSMark F. Adams ierr = MPI_Comm_rank( wcomm, &mype ); CHKERRQ(ierr); 288*c8b0795cSMark F. Adams ierr = MatGetOwnershipRange(Gmat_1,&my0,&Iend); CHKERRQ(ierr); 289*c8b0795cSMark F. Adams 290*c8b0795cSMark F. Adams if( !PETSC_TRUE ) { 291*c8b0795cSMark F. Adams PetscViewer viewer; char fname[32]; static int llev=0; 292*c8b0795cSMark F. Adams sprintf(fname,"Gmat2_%d.m",llev++); 293*c8b0795cSMark F. Adams PetscViewerASCIIOpen(wcomm,fname,&viewer); 294*c8b0795cSMark F. Adams ierr = PetscViewerSetFormat( viewer, PETSC_VIEWER_ASCII_MATLAB); CHKERRQ(ierr); 295*c8b0795cSMark F. Adams ierr = MatView(Gmat_2, viewer ); CHKERRQ(ierr); 296*c8b0795cSMark F. Adams ierr = PetscViewerDestroy( &viewer ); 297*c8b0795cSMark F. Adams } 298*c8b0795cSMark F. Adams 299*c8b0795cSMark F. Adams { /* copy linked list into temp buffer - should not work directly on pointer */ 300*c8b0795cSMark F. Adams const PetscInt *llist_idx; 301*c8b0795cSMark F. Adams ierr = ISGetSize( llist_aggs_2, &nnodes_2 ); CHKERRQ(ierr); 302*c8b0795cSMark F. Adams ierr = PetscMalloc( nnodes_2*sizeof(PetscInt), &id_llist_2 ); CHKERRQ(ierr); 303*c8b0795cSMark F. Adams ierr = ISGetIndices( llist_aggs_2, &llist_idx ); CHKERRQ(ierr); 304*c8b0795cSMark F. Adams for(lid=0;lid<nnodes_2;lid++) id_llist_2[lid] = llist_idx[lid]; 305*c8b0795cSMark F. Adams ierr = ISRestoreIndices( llist_aggs_2, &llist_idx ); CHKERRQ(ierr); 306*c8b0795cSMark F. Adams } 307*c8b0795cSMark F. Adams 308*c8b0795cSMark F. Adams /* get submatrices */ 309*c8b0795cSMark F. Adams ierr = PetscTypeCompare( (PetscObject)Gmat_1, MATMPIAIJ, &isMPI ); CHKERRQ(ierr); 310*c8b0795cSMark F. Adams if(isMPI) { 311*c8b0795cSMark F. Adams /* grab matrix objects */ 312*c8b0795cSMark F. Adams mpimat_2 = (Mat_MPIAIJ*)Gmat_2->data; 313*c8b0795cSMark F. Adams mpimat_1 = (Mat_MPIAIJ*)Gmat_1->data; 314*c8b0795cSMark F. Adams matA_1 = (Mat_SeqAIJ*)mpimat_1->A->data; 315*c8b0795cSMark F. Adams matB_1 = (Mat_SeqAIJ*)mpimat_1->B->data; 316*c8b0795cSMark F. Adams matA_2 = (Mat_SeqAIJ*)mpimat_2->A->data; 317*c8b0795cSMark F. Adams matB_2 = (Mat_SeqAIJ*)mpimat_2->B->data; 318*c8b0795cSMark F. Adams 319*c8b0795cSMark F. Adams /* force compressed row storage for B matrix in AuxMat */ 320*c8b0795cSMark F. Adams matB_1->compressedrow.check = PETSC_TRUE; 321*c8b0795cSMark F. Adams ierr = MatCheckCompressedRow(mpimat_1->B,&matB_1->compressedrow,matB_1->i,Gmat_1->rmap->n,-1.0); 322*c8b0795cSMark F. Adams CHKERRQ(ierr); 323*c8b0795cSMark F. Adams 324*c8b0795cSMark F. Adams ierr = PetscMalloc( nloc*sizeof(PetscInt), &lid_cprowID_2 ); CHKERRQ(ierr); 325*c8b0795cSMark F. Adams ierr = PetscMalloc( nloc*sizeof(PetscInt), &lid_cprowID_1 ); CHKERRQ(ierr); 326*c8b0795cSMark F. Adams for(lid=0;lid<nloc;lid++) lid_cprowID_1[lid] = lid_cprowID_2[lid] = -1; 327*c8b0795cSMark F. Adams for (ix=0; ix<matB_1->compressedrow.nrows; ix++) { 328*c8b0795cSMark F. Adams PetscInt lid = matB_1->compressedrow.rindex[ix]; 329*c8b0795cSMark F. Adams lid_cprowID_1[lid] = ix; 330*c8b0795cSMark F. Adams } 331*c8b0795cSMark F. Adams for (ix=0; ix<matB_2->compressedrow.nrows; ix++) { 332*c8b0795cSMark F. Adams PetscInt lid = matB_2->compressedrow.rindex[ix]; 333*c8b0795cSMark F. Adams lid_cprowID_2[lid] = ix; 334*c8b0795cSMark F. Adams } 335*c8b0795cSMark F. Adams } 336*c8b0795cSMark F. Adams else { 337*c8b0795cSMark F. Adams matA_1 = (Mat_SeqAIJ*)Gmat_1->data; 338*c8b0795cSMark F. Adams matA_2 = (Mat_SeqAIJ*)Gmat_2->data; 339*c8b0795cSMark F. Adams lid_cprowID_2 = lid_cprowID_1 = 0; 340*c8b0795cSMark F. Adams } 341*c8b0795cSMark F. Adams assert( matA_1 && !matA_1->compressedrow.use ); 342*c8b0795cSMark F. Adams assert( matB_1==0 || matB_1->compressedrow.use ); 343*c8b0795cSMark F. Adams assert( matA_2 && !matA_2->compressedrow.use ); 344*c8b0795cSMark F. Adams assert( matB_2==0 || matB_2->compressedrow.use ); 345*c8b0795cSMark F. Adams 346*c8b0795cSMark F. Adams /* get state of locals and selected gid for deleted */ 347*c8b0795cSMark F. Adams ierr = PetscMalloc( nloc*sizeof(NState), &lid_state ); CHKERRQ(ierr); 348*c8b0795cSMark F. Adams ierr = PetscMalloc( nloc*sizeof(PetscScalar), &deleted_parent_gid ); CHKERRQ(ierr); 349*c8b0795cSMark F. Adams for( lid = 0 ; lid < nloc ; lid++ ) { 350*c8b0795cSMark F. Adams deleted_parent_gid[lid] = -1.0; 351*c8b0795cSMark F. Adams lid_state[lid] = DELETED; 352*c8b0795cSMark F. Adams ii = matA_2->i; n = ii[lid+1] - ii[lid]; 353*c8b0795cSMark F. Adams if( n < 2 ) { 354*c8b0795cSMark F. Adams if(!lid_cprowID_2 || (ix=lid_cprowID_2[lid])==-1 || (matB_2->compressedrow.i[ix+1]-matB_2->compressedrow.i[ix])==0){ 355*c8b0795cSMark F. Adams lid_state[lid] = REMOVED; 356*c8b0795cSMark F. Adams } 357*c8b0795cSMark F. Adams } 358*c8b0795cSMark F. Adams } 359*c8b0795cSMark F. Adams /* set index into compressed row 'lid_cprowID', not -1 means its a boundary node */ 360*c8b0795cSMark F. Adams { 361*c8b0795cSMark F. Adams const PetscInt *selected_idx; 362*c8b0795cSMark F. Adams /* set local selected */ 363*c8b0795cSMark F. Adams ierr = ISGetSize( selected_2, &nSelected ); CHKERRQ(ierr); 364*c8b0795cSMark F. Adams ierr = ISGetIndices( selected_2, &selected_idx ); CHKERRQ(ierr); 365*c8b0795cSMark F. Adams for(kk=0;kk<nSelected;kk++){ 366*c8b0795cSMark F. Adams PetscInt lid = selected_idx[kk]; 367*c8b0795cSMark F. Adams if(lid<nloc) lid_state[lid] = (NState)(lid+my0); /* selected flag */ 368*c8b0795cSMark F. Adams else break; 369*c8b0795cSMark F. Adams } 370*c8b0795cSMark F. Adams ierr = ISRestoreIndices( selected_2, &selected_idx ); CHKERRQ(ierr); 371*c8b0795cSMark F. Adams } 372*c8b0795cSMark F. Adams /* map local to selected local, -1 means a ghost owns it */ 373*c8b0795cSMark F. Adams for(lid=kk=0;lid<nloc;lid++){ 374*c8b0795cSMark F. Adams NState state = lid_state[lid]; 375*c8b0795cSMark F. Adams if( IS_SELECTED(state) ){ 376*c8b0795cSMark F. Adams PetscInt flid = lid; 377*c8b0795cSMark F. Adams do{ 378*c8b0795cSMark F. Adams if(flid<nloc){ 379*c8b0795cSMark F. Adams deleted_parent_gid[flid] = (PetscScalar)(lid + my0); 380*c8b0795cSMark F. Adams } 381*c8b0795cSMark F. Adams kk++; 382*c8b0795cSMark F. Adams } while( (flid=id_llist_2[flid]) != -1 ); 383*c8b0795cSMark F. Adams } 384*c8b0795cSMark F. Adams } 385*c8b0795cSMark F. Adams /* get 'cpcol_1_state', 'cpcol_2_state' - uses mpimat_1->lvec & mpimat_2->lvec for temp space */ 386*c8b0795cSMark F. Adams if (isMPI) { 387*c8b0795cSMark F. Adams Vec tempVec; 388*c8b0795cSMark F. Adams 389*c8b0795cSMark F. Adams /* get 'cpcol_1_state' */ 390*c8b0795cSMark F. Adams ierr = MatGetVecs( Gmat_1, &tempVec, 0 ); CHKERRQ(ierr); 391*c8b0795cSMark F. Adams for(kk=0,j=my0;kk<nloc;kk++,j++){ 392*c8b0795cSMark F. Adams PetscScalar v = (PetscScalar)lid_state[kk]; 393*c8b0795cSMark F. Adams ierr = VecSetValues( tempVec, 1, &j, &v, INSERT_VALUES ); CHKERRQ(ierr); 394*c8b0795cSMark F. Adams } 395*c8b0795cSMark F. Adams ierr = VecAssemblyBegin( tempVec ); CHKERRQ(ierr); 396*c8b0795cSMark F. Adams ierr = VecAssemblyEnd( tempVec ); CHKERRQ(ierr); 397*c8b0795cSMark F. Adams ierr = VecScatterBegin(mpimat_1->Mvctx,tempVec, mpimat_1->lvec,INSERT_VALUES,SCATTER_FORWARD); 398*c8b0795cSMark F. Adams CHKERRQ(ierr); 399*c8b0795cSMark F. Adams ierr = VecScatterEnd(mpimat_1->Mvctx,tempVec, mpimat_1->lvec,INSERT_VALUES,SCATTER_FORWARD); 400*c8b0795cSMark F. Adams CHKERRQ(ierr); 401*c8b0795cSMark F. Adams ierr = VecGetArray( mpimat_1->lvec, &cpcol_1_state ); CHKERRQ(ierr); 402*c8b0795cSMark F. Adams ierr = VecDestroy( &tempVec ); CHKERRQ(ierr); 403*c8b0795cSMark F. Adams 404*c8b0795cSMark F. Adams /* get 'cpcol_2_state' */ 405*c8b0795cSMark F. Adams ierr = MatGetVecs( Gmat_2, &tempVec, 0 ); CHKERRQ(ierr); 406*c8b0795cSMark F. Adams for(kk=0,j=my0;kk<nloc;kk++,j++){ 407*c8b0795cSMark F. Adams PetscScalar v = (PetscScalar)lid_state[kk]; 408*c8b0795cSMark F. Adams ierr = VecSetValues( tempVec, 1, &j, &v, INSERT_VALUES ); CHKERRQ(ierr); 409*c8b0795cSMark F. Adams } 410*c8b0795cSMark F. Adams ierr = VecAssemblyBegin( tempVec ); CHKERRQ(ierr); 411*c8b0795cSMark F. Adams ierr = VecAssemblyEnd( tempVec ); CHKERRQ(ierr); 412*c8b0795cSMark F. Adams ierr = VecScatterBegin(mpimat_2->Mvctx,tempVec, mpimat_2->lvec,INSERT_VALUES,SCATTER_FORWARD); 413*c8b0795cSMark F. Adams CHKERRQ(ierr); 414*c8b0795cSMark F. Adams ierr = VecScatterEnd(mpimat_2->Mvctx,tempVec, mpimat_2->lvec,INSERT_VALUES,SCATTER_FORWARD); 415*c8b0795cSMark F. Adams CHKERRQ(ierr); 416*c8b0795cSMark F. Adams ierr = VecGetArray( mpimat_2->lvec, &cpcol_2_state ); CHKERRQ(ierr); 417*c8b0795cSMark F. Adams ierr = VecDestroy( &tempVec ); CHKERRQ(ierr); 418*c8b0795cSMark F. Adams } /* ismpi */ 419*c8b0795cSMark F. Adams 420*c8b0795cSMark F. Adams /* doit */ 421*c8b0795cSMark F. Adams for(lid=0;lid<nloc;lid++){ 422*c8b0795cSMark F. Adams NState state = lid_state[lid]; 423*c8b0795cSMark F. Adams if( IS_SELECTED(state) ) { /* steal locals */ 424*c8b0795cSMark F. Adams ii = matA_1->i; n = ii[lid+1] - ii[lid]; 425*c8b0795cSMark F. Adams idx = matA_1->j + ii[lid]; 426*c8b0795cSMark F. Adams for (j=0; j<n; j++) { 427*c8b0795cSMark F. Adams PetscInt flid, lidj = idx[j], sgid; 428*c8b0795cSMark F. Adams NState statej = lid_state[lidj]; 429*c8b0795cSMark F. Adams if( statej==DELETED && (sgid=deleted_parent_gid[lidj]) != (PetscScalar)(lid+my0) ){ /* steal local */ 430*c8b0795cSMark F. Adams deleted_parent_gid[lidj] = (PetscScalar)(lid+my0); /* send this with _2 */ 431*c8b0795cSMark F. Adams if( sgid >= my0 && sgid < my0+nloc ){ /* I'm stealing this local from a local */ 432*c8b0795cSMark F. Adams PetscInt hav=0, flid2=sgid-my0, lastid; 433*c8b0795cSMark F. Adams /* looking for local from local so id_llist_2 works */ 434*c8b0795cSMark F. Adams for( lastid=flid2, flid=id_llist_2[flid2] ; flid!=-1 ; flid=id_llist_2[flid] ) { 435*c8b0795cSMark F. Adams if( flid == lidj ) { 436*c8b0795cSMark F. Adams id_llist_2[lastid] = id_llist_2[flid]; /* remove lidj from list */ 437*c8b0795cSMark F. Adams id_llist_2[flid] = id_llist_2[lid]; id_llist_2[lid] = flid; /* insert 'lidj' into head of llist */ 438*c8b0795cSMark F. Adams hav++; 439*c8b0795cSMark F. Adams break; 440*c8b0795cSMark F. Adams } 441*c8b0795cSMark F. Adams lastid = flid; 442*c8b0795cSMark F. Adams } 443*c8b0795cSMark F. Adams if(hav!=1){ 444*c8b0795cSMark F. Adams if(hav==0)SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"failed to find adj in 'selected' lists - structurally unsymmetric matrix"); 445*c8b0795cSMark F. Adams SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"found node %d times???",hav); 446*c8b0795cSMark F. Adams } 447*c8b0795cSMark F. Adams } 448*c8b0795cSMark F. Adams else{ /* I'm stealing this local, owned by a ghost - ok to use _2, local */ 449*c8b0795cSMark F. Adams assert(sgid==-1); 450*c8b0795cSMark F. Adams id_llist_2[lidj] = id_llist_2[lid]; id_llist_2[lid] = lidj; /* insert 'lidj' into head of llist */ 451*c8b0795cSMark F. Adams /* local remove at end, off add/rm at end */ 452*c8b0795cSMark F. Adams } 453*c8b0795cSMark F. Adams } 454*c8b0795cSMark F. Adams } 455*c8b0795cSMark F. Adams } 456*c8b0795cSMark F. Adams else if( state == DELETED && lid_cprowID_1 ) { 457*c8b0795cSMark F. Adams PetscInt sgidold = (PetscInt)deleted_parent_gid[lid]; 458*c8b0795cSMark F. Adams /* see if I have a selected ghost neighbor that will steal me */ 459*c8b0795cSMark F. Adams if( (ix=lid_cprowID_1[lid]) != -1 ){ 460*c8b0795cSMark F. Adams ii = matB_1->compressedrow.i; n = ii[ix+1] - ii[ix]; 461*c8b0795cSMark F. Adams idx = matB_1->j + ii[ix]; 462*c8b0795cSMark F. Adams for( j=0 ; j<n ; j++ ) { 463*c8b0795cSMark F. Adams PetscInt cpid = idx[j]; 464*c8b0795cSMark F. Adams NState statej = (NState)PetscRealPart(cpcol_1_state[cpid]); 465*c8b0795cSMark F. Adams if( IS_SELECTED(statej) && sgidold != (PetscInt)statej ) { /* ghost will steal this, remove from my list */ 466*c8b0795cSMark F. Adams deleted_parent_gid[lid] = (PetscScalar)statej; /* send who selected with _2 */ 467*c8b0795cSMark F. Adams if( sgidold>=my0 && sgidold<(my0+nloc) ) { /* this was mine */ 468*c8b0795cSMark F. Adams PetscInt lastid,hav=0,flid,oldslidj=sgidold-my0; 469*c8b0795cSMark F. Adams /* remove from 'oldslidj' list, local so _2 is OK */ 470*c8b0795cSMark F. Adams for( lastid=oldslidj, flid=id_llist_2[oldslidj] ; flid != -1 ; flid=id_llist_2[flid] ) { 471*c8b0795cSMark F. Adams if( flid == lid ) { 472*c8b0795cSMark F. Adams id_llist_2[lastid] = id_llist_2[flid]; /* remove lid from oldslidj list */ 473*c8b0795cSMark F. Adams hav++; 474*c8b0795cSMark F. Adams break; 475*c8b0795cSMark F. Adams } 476*c8b0795cSMark F. Adams lastid = flid; 477*c8b0795cSMark F. Adams } 478*c8b0795cSMark F. Adams if(hav!=1){ 479*c8b0795cSMark F. Adams if(hav==0)SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"failed to find adj in 'selected' lists - structurally unsymmetric matrix"); 480*c8b0795cSMark F. Adams SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"found node %d times???",hav); 481*c8b0795cSMark F. Adams } 482*c8b0795cSMark F. Adams id_llist_2[lid] = -1; /* terminate linked list - needed? */ 483*c8b0795cSMark F. Adams } 484*c8b0795cSMark F. Adams else assert(id_llist_2[lid] == -1); 485*c8b0795cSMark F. Adams } 486*c8b0795cSMark F. Adams } 487*c8b0795cSMark F. Adams } 488*c8b0795cSMark F. Adams } /* selected/deleted */ 489*c8b0795cSMark F. Adams else assert(state == REMOVED || !lid_cprowID_1); 490*c8b0795cSMark F. Adams } /* node loop */ 491*c8b0795cSMark F. Adams 492*c8b0795cSMark F. Adams if( isMPI ) { 493*c8b0795cSMark F. Adams PetscScalar *cpcol_2_sel_gid; 494*c8b0795cSMark F. Adams Vec tempVec; 495*c8b0795cSMark F. Adams PetscInt cpid; 496*c8b0795cSMark F. Adams 497*c8b0795cSMark F. Adams ierr = VecRestoreArray( mpimat_1->lvec, &cpcol_1_state ); CHKERRQ(ierr); 498*c8b0795cSMark F. Adams ierr = VecRestoreArray( mpimat_2->lvec, &cpcol_2_state ); CHKERRQ(ierr); 499*c8b0795cSMark F. Adams 500*c8b0795cSMark F. Adams /* get 'cpcol_2_sel_gid' */ 501*c8b0795cSMark F. Adams ierr = MatGetVecs( Gmat_2, &tempVec, 0 ); CHKERRQ(ierr); 502*c8b0795cSMark F. Adams for(kk=0,j=my0;kk<nloc;kk++,j++){ 503*c8b0795cSMark F. Adams ierr = VecSetValues( tempVec, 1, &j, &deleted_parent_gid[kk], INSERT_VALUES ); CHKERRQ(ierr); 504*c8b0795cSMark F. Adams } 505*c8b0795cSMark F. Adams ierr = VecAssemblyBegin( tempVec ); CHKERRQ(ierr); 506*c8b0795cSMark F. Adams ierr = VecAssemblyEnd( tempVec ); CHKERRQ(ierr); 507*c8b0795cSMark F. Adams ierr = VecScatterBegin(mpimat_2->Mvctx,tempVec, mpimat_2->lvec,INSERT_VALUES,SCATTER_FORWARD); 508*c8b0795cSMark F. Adams CHKERRQ(ierr); 509*c8b0795cSMark F. Adams ierr = VecScatterEnd(mpimat_2->Mvctx,tempVec, mpimat_2->lvec,INSERT_VALUES,SCATTER_FORWARD); 510*c8b0795cSMark F. Adams CHKERRQ(ierr); 511*c8b0795cSMark F. Adams ierr = VecDestroy( &tempVec ); CHKERRQ(ierr); 512*c8b0795cSMark F. Adams 513*c8b0795cSMark F. Adams ierr = VecGetArray( mpimat_2->lvec, &cpcol_2_sel_gid ); CHKERRQ(ierr); 514*c8b0795cSMark F. Adams 515*c8b0795cSMark F. Adams /* look for deleted ghosts and see if they moved */ 516*c8b0795cSMark F. Adams for(lid=0;lid<nloc;lid++){ 517*c8b0795cSMark F. Adams NState state = lid_state[lid]; 518*c8b0795cSMark F. Adams if( IS_SELECTED(state) ){ 519*c8b0795cSMark F. Adams PetscInt flid,lastid,old_sgid=lid+my0; 520*c8b0795cSMark F. Adams /* look for deleted ghosts and see if they moved */ 521*c8b0795cSMark F. Adams for( lastid=lid, flid=id_llist_2[lid] ; flid!=-1 ; flid=id_llist_2[flid] ) { 522*c8b0795cSMark F. Adams if( flid>=nloc ) { 523*c8b0795cSMark F. Adams PetscInt cpid = flid-nloc, sgid_new = cpcol_2_sel_gid[cpid]; 524*c8b0795cSMark F. Adams if( sgid_new != old_sgid && sgid_new != -1 ) { 525*c8b0795cSMark F. Adams id_llist_2[lastid] = id_llist_2[flid]; /* remove 'flid' from list */ 526*c8b0795cSMark F. Adams id_llist_2[flid] = -1; 527*c8b0795cSMark F. Adams flid = lastid; 528*c8b0795cSMark F. Adams } /* if it changed parents */ 529*c8b0795cSMark F. Adams else lastid = flid; 530*c8b0795cSMark F. Adams } /* for ghost nodes */ 531*c8b0795cSMark F. Adams else lastid = flid; 532*c8b0795cSMark F. Adams } /* loop over list of deleted */ 533*c8b0795cSMark F. Adams } /* selected */ 534*c8b0795cSMark F. Adams } 535*c8b0795cSMark F. Adams 536*c8b0795cSMark F. Adams /* look at ghosts, see if they changed, and moved here */ 537*c8b0795cSMark F. Adams for(cpid=0;cpid<nnodes_2-nloc;cpid++){ 538*c8b0795cSMark F. Adams PetscInt sgid_new = cpcol_2_sel_gid[cpid]; 539*c8b0795cSMark F. Adams if( sgid_new>=my0 && sgid_new<(my0+nloc) ) { /* this is mine */ 540*c8b0795cSMark F. Adams PetscInt lastid,flid,slid_new=sgid_new-my0,flidj=nloc+cpid,hav=0; 541*c8b0795cSMark F. Adams for( lastid=slid_new, flid=id_llist_2[slid_new] ; flid != -1 ; flid=id_llist_2[flid] ) { 542*c8b0795cSMark F. Adams if( flid == flidj ) { 543*c8b0795cSMark F. Adams hav++; 544*c8b0795cSMark F. Adams break; 545*c8b0795cSMark F. Adams } 546*c8b0795cSMark F. Adams lastid = flid; 547*c8b0795cSMark F. Adams } 548*c8b0795cSMark F. Adams if( hav != 1 ){ 549*c8b0795cSMark F. Adams assert(id_llist_2[flidj] == -1); 550*c8b0795cSMark F. Adams id_llist_2[flidj] = id_llist_2[slid_new]; id_llist_2[slid_new] = flidj; /* insert 'flidj' into head of llist */ 551*c8b0795cSMark F. Adams } 552*c8b0795cSMark F. Adams } 553*c8b0795cSMark F. Adams } 554*c8b0795cSMark F. Adams 555*c8b0795cSMark F. Adams ierr = VecRestoreArray( mpimat_2->lvec, &cpcol_2_sel_gid ); CHKERRQ(ierr); 556*c8b0795cSMark F. Adams ierr = PetscFree( lid_cprowID_1 ); CHKERRQ(ierr); 557*c8b0795cSMark F. Adams ierr = PetscFree( lid_cprowID_2 ); CHKERRQ(ierr); 558*c8b0795cSMark F. Adams } 559*c8b0795cSMark F. Adams 560*c8b0795cSMark F. Adams /* copy out new aggs */ 561*c8b0795cSMark F. Adams ierr = ISGeneralSetIndices(llist_aggs_2, nnodes_2, id_llist_2, PETSC_COPY_VALUES ); CHKERRQ(ierr); 562*c8b0795cSMark F. Adams 563*c8b0795cSMark F. Adams ierr = PetscFree( id_llist_2 ); CHKERRQ(ierr); 564*c8b0795cSMark F. Adams ierr = PetscFree( deleted_parent_gid ); CHKERRQ(ierr); 565*c8b0795cSMark F. Adams ierr = PetscFree( lid_state ); CHKERRQ(ierr); 566*c8b0795cSMark F. Adams 567*c8b0795cSMark F. Adams PetscFunctionReturn(0); 568*c8b0795cSMark F. Adams } 5692e68589bSMark F. Adams 5702e68589bSMark F. Adams /* -------------------------------------------------------------------------- */ 5712e68589bSMark F. Adams /* 5722e68589bSMark F. Adams PCSetData_AGG 5732e68589bSMark F. Adams 5742e68589bSMark F. Adams Input Parameter: 5752e68589bSMark F. Adams . pc - 5762e68589bSMark F. Adams */ 5772e68589bSMark F. Adams #undef __FUNCT__ 5782e68589bSMark F. Adams #define __FUNCT__ "PCSetData_AGG" 5792e68589bSMark F. Adams PetscErrorCode PCSetData_AGG( PC pc ) 5802e68589bSMark F. Adams { 5812e68589bSMark F. Adams PetscErrorCode ierr; 5822e68589bSMark F. Adams PetscFunctionBegin; 5832e68589bSMark F. Adams ierr = PCSetCoordinates_AGG( pc, -1, PETSC_NULL ); CHKERRQ(ierr); 5842e68589bSMark F. Adams PetscFunctionReturn(0); 5852e68589bSMark F. Adams } 5862e68589bSMark F. Adams 5872e68589bSMark F. Adams /* -------------------------------------------------------------------------- */ 5882e68589bSMark F. Adams /* 5892e68589bSMark F. Adams formProl0 5902e68589bSMark F. Adams 5912e68589bSMark F. Adams Input Parameter: 5922e68589bSMark F. Adams . selected - list of selected local ID, includes selected ghosts 5932e68589bSMark F. Adams . locals_llist - linked list with aggregates 5942e68589bSMark F. Adams . bs - block size 5952e68589bSMark F. Adams . nSAvec - num columns of new P 5962e68589bSMark F. Adams . my0crs - global index of locals 5972e68589bSMark F. Adams . data_stride - bs*(nloc nodes + ghost nodes) 5982e68589bSMark F. Adams . data_in[data_stride*nSAvec] - local data on fine grid 5992e68589bSMark F. Adams . flid_fgid[data_stride/bs] - make local to global IDs, includes ghosts in 'locals_llist' 6002e68589bSMark F. Adams Output Parameter: 6012e68589bSMark F. Adams . a_data_out - in with fine grid data (w/ghosts), out with coarse grid data 6022e68589bSMark F. Adams . a_Prol - prolongation operator 6032e68589bSMark F. Adams */ 6042e68589bSMark F. Adams #undef __FUNCT__ 6052e68589bSMark F. Adams #define __FUNCT__ "formProl0" 6062e68589bSMark F. Adams PetscErrorCode formProl0( IS selected, /* list of selected local ID, includes selected ghosts */ 6072e68589bSMark F. Adams IS locals_llist, /* linked list from selected vertices of aggregate unselected vertices */ 6082e68589bSMark F. Adams const PetscInt bs, 6092e68589bSMark F. Adams const PetscInt nSAvec, 6102e68589bSMark F. Adams const PetscInt my0crs, 6112e68589bSMark F. Adams const PetscInt data_stride, 6122e68589bSMark F. Adams PetscReal data_in[], 6132e68589bSMark F. Adams const PetscInt flid_fgid[], 6142e68589bSMark F. Adams PetscReal **a_data_out, 6152e68589bSMark F. Adams Mat a_Prol /* prolongation operator (output)*/ 6162e68589bSMark F. Adams ) 6172e68589bSMark F. Adams { 6182e68589bSMark F. Adams PetscErrorCode ierr; 619*c8b0795cSMark F. Adams PetscInt Istart,Iend,nFineLoc,clid,flid,aggID,kk,jj,ii,nLocalSelected,ndone,nSelected,minsz; 6202e68589bSMark F. Adams MPI_Comm wcomm = ((PetscObject)a_Prol)->comm; 6212e68589bSMark F. Adams PetscMPIInt mype, npe; 6222e68589bSMark F. Adams const PetscInt *selected_idx,*llist_idx; 6232e68589bSMark F. Adams PetscReal *out_data; 6242e68589bSMark F. Adams 6252e68589bSMark F. Adams PetscFunctionBegin; 6262e68589bSMark F. Adams ierr = MPI_Comm_rank(wcomm,&mype);CHKERRQ(ierr); 6272e68589bSMark F. Adams ierr = MPI_Comm_size(wcomm,&npe);CHKERRQ(ierr); 6282e68589bSMark F. Adams ierr = MatGetOwnershipRange( a_Prol, &Istart, &Iend ); CHKERRQ(ierr); 6292e68589bSMark F. Adams nFineLoc = (Iend-Istart)/bs; assert((Iend-Istart)%bs==0); 6302e68589bSMark F. Adams 631*c8b0795cSMark F. Adams ierr = ISGetSize( selected, &nSelected ); CHKERRQ(ierr); 6322e68589bSMark F. Adams ierr = ISGetIndices( selected, &selected_idx ); CHKERRQ(ierr); 6332e68589bSMark F. Adams for(kk=0,nLocalSelected=0;kk<nSelected;kk++){ 6342e68589bSMark F. Adams PetscInt lid = selected_idx[kk]; 6352e68589bSMark F. Adams if(lid<nFineLoc) nLocalSelected++; 6362e68589bSMark F. Adams } 6372e68589bSMark F. Adams 6382e68589bSMark F. Adams /* aloc space for coarse point data (output) */ 6392e68589bSMark F. Adams #define DATA_OUT_STRIDE (nLocalSelected*nSAvec) 640*c8b0795cSMark F. Adams ierr = PetscMalloc( DATA_OUT_STRIDE*nSAvec*sizeof(PetscReal), &out_data ); CHKERRQ(ierr); 641*c8b0795cSMark F. Adams for(ii=0;ii<DATA_OUT_STRIDE*nSAvec;ii++) out_data[ii]=1.e300; 6422e68589bSMark F. Adams *a_data_out = out_data; /* output - stride nLocalSelected*nSAvec */ 6432e68589bSMark F. Adams 6442e68589bSMark F. Adams /* find points and set prolongation */ 645*c8b0795cSMark F. Adams minsz = 100; 6462e68589bSMark F. Adams ndone = 0; 6472e68589bSMark F. Adams ierr = ISGetIndices( locals_llist, &llist_idx ); CHKERRQ(ierr); 6482e68589bSMark F. Adams for( clid = 0 ; clid < nLocalSelected ; clid++ ){ 6492e68589bSMark F. Adams PetscInt cgid = my0crs + clid, cids[100]; 6502e68589bSMark F. Adams 6512e68589bSMark F. Adams /* count agg */ 6522e68589bSMark F. Adams aggID = 0; 6532e68589bSMark F. Adams flid = selected_idx[clid]; assert(flid != -1); 6542e68589bSMark F. Adams do{ 6552e68589bSMark F. Adams aggID++; 6562e68589bSMark F. Adams } while( (flid=llist_idx[flid]) != -1 ); 657*c8b0795cSMark F. Adams if( aggID<minsz ) minsz = aggID; 6582e68589bSMark F. Adams 6592e68589bSMark F. Adams /* get block */ 6602e68589bSMark F. Adams { 6612e68589bSMark F. Adams PetscBLASInt asz=aggID,M=asz*bs,N=nSAvec,INFO; 6622e68589bSMark F. Adams PetscBLASInt Mdata=M+((N-M>0)?N-M:0),LDA=Mdata,LWORK=N*bs; 6632e68589bSMark F. Adams PetscScalar *qqc,*qqr,*TAU,*WORK; 6642e68589bSMark F. Adams PetscInt *fids; 6652e68589bSMark F. Adams 6662e68589bSMark F. Adams ierr = PetscMalloc( (Mdata*N)*sizeof(PetscScalar), &qqc ); CHKERRQ(ierr); 6672e68589bSMark F. Adams ierr = PetscMalloc( (M*N)*sizeof(PetscScalar), &qqr ); CHKERRQ(ierr); 6682e68589bSMark F. Adams ierr = PetscMalloc( N*sizeof(PetscScalar), &TAU ); CHKERRQ(ierr); 6692e68589bSMark F. Adams ierr = PetscMalloc( LWORK*sizeof(PetscScalar), &WORK ); CHKERRQ(ierr); 6702e68589bSMark F. Adams ierr = PetscMalloc( M*sizeof(PetscInt), &fids ); CHKERRQ(ierr); 6712e68589bSMark F. Adams 6722e68589bSMark F. Adams flid = selected_idx[clid]; 6732e68589bSMark F. Adams aggID = 0; 6742e68589bSMark F. Adams do{ 6752e68589bSMark F. Adams /* copy in B_i matrix - column oriented */ 6762e68589bSMark F. Adams PetscReal *data = &data_in[flid*bs]; 6772e68589bSMark F. Adams for( kk = ii = 0; ii < bs ; ii++ ) { 6782e68589bSMark F. Adams for( jj = 0; jj < N ; jj++ ) { 6792e68589bSMark F. Adams qqc[jj*Mdata + aggID*bs + ii] = data[jj*data_stride + ii]; 6802e68589bSMark F. Adams } 6812e68589bSMark F. Adams } 6822e68589bSMark F. Adams 6832e68589bSMark F. Adams /* set fine IDs */ 6842e68589bSMark F. Adams for(kk=0;kk<bs;kk++) fids[aggID*bs + kk] = flid_fgid[flid]*bs + kk; 6852e68589bSMark F. Adams 6862e68589bSMark F. Adams aggID++; 6872e68589bSMark F. Adams }while( (flid=llist_idx[flid]) != -1 ); 6882e68589bSMark F. Adams 6892e68589bSMark F. Adams /* pad with zeros */ 6902e68589bSMark F. Adams for( ii = asz*bs; ii < Mdata ; ii++ ) { 6912e68589bSMark F. Adams for( jj = 0; jj < N ; jj++, kk++ ) { 6922e68589bSMark F. Adams qqc[jj*Mdata + ii] = .0; 6932e68589bSMark F. Adams } 6942e68589bSMark F. Adams } 6952e68589bSMark F. Adams 6962e68589bSMark F. Adams ndone += aggID; 6972e68589bSMark F. Adams /* QR */ 6982e68589bSMark F. Adams LAPACKgeqrf_( &Mdata, &N, qqc, &LDA, TAU, WORK, &LWORK, &INFO ); 6992e68589bSMark F. Adams if( INFO != 0 ) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"xGEQRS error"); 7002e68589bSMark F. Adams /* get R - column oriented - output B_{i+1} */ 7012e68589bSMark F. Adams { 7022e68589bSMark F. Adams PetscReal *data = &out_data[clid*nSAvec]; 7032e68589bSMark F. Adams for( jj = 0; jj < nSAvec ; jj++ ) { 7042e68589bSMark F. Adams for( ii = 0; ii < nSAvec ; ii++ ) { 7052e68589bSMark F. Adams assert(data[jj*DATA_OUT_STRIDE + ii] == 1.e300); 7062e68589bSMark F. Adams if( ii <= jj ) data[jj*DATA_OUT_STRIDE + ii] = PetscRealPart(qqc[jj*Mdata + ii]); 7072e68589bSMark F. Adams else data[jj*DATA_OUT_STRIDE + ii] = 0.; 7082e68589bSMark F. Adams } 7092e68589bSMark F. Adams } 7102e68589bSMark F. Adams } 7112e68589bSMark F. Adams 7122e68589bSMark F. Adams /* get Q - row oriented */ 7132e68589bSMark F. Adams LAPACKungqr_( &Mdata, &N, &N, qqc, &LDA, TAU, WORK, &LWORK, &INFO ); 7142e68589bSMark F. Adams if( INFO != 0 ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"xORGQR error arg %d",-INFO); 7152e68589bSMark F. Adams 7162e68589bSMark F. Adams for( ii = 0 ; ii < M ; ii++ ){ 7172e68589bSMark F. Adams for( jj = 0 ; jj < N ; jj++ ) { 7182e68589bSMark F. Adams qqr[N*ii + jj] = qqc[jj*Mdata + ii]; 7192e68589bSMark F. Adams } 7202e68589bSMark F. Adams } 7212e68589bSMark F. Adams 7222e68589bSMark F. Adams /* add diagonal block of P0 */ 723*c8b0795cSMark F. Adams for(kk=0;kk<N;kk++) { 724*c8b0795cSMark F. Adams cids[kk] = N*cgid + kk; /* global col IDs in P0 */ 725*c8b0795cSMark F. Adams } 7262e68589bSMark F. Adams ierr = MatSetValues(a_Prol,M,fids,N,cids,qqr,INSERT_VALUES); CHKERRQ(ierr); 7272e68589bSMark F. Adams 7282e68589bSMark F. Adams ierr = PetscFree( qqc ); CHKERRQ(ierr); 7292e68589bSMark F. Adams ierr = PetscFree( qqr ); CHKERRQ(ierr); 7302e68589bSMark F. Adams ierr = PetscFree( TAU ); CHKERRQ(ierr); 7312e68589bSMark F. Adams ierr = PetscFree( WORK ); CHKERRQ(ierr); 7322e68589bSMark F. Adams ierr = PetscFree( fids ); CHKERRQ(ierr); 7332e68589bSMark F. Adams } /* scoping */ 7342e68589bSMark F. Adams } /* for all coarse nodes */ 7352e68589bSMark F. Adams 736*c8b0795cSMark F. Adams /* ierr = MPI_Allreduce( &ndone, &ii, 1, MPIU_INT, MPIU_SUM, wcomm ); */ 7372e68589bSMark F. Adams /* MatGetSize( a_Prol, &kk, &jj ); */ 738*c8b0795cSMark F. Adams /* ierr = MPI_Allreduce( &minsz, &jj, 1, MPIU_INT, MPIU_MIN, wcomm ); */ 739*c8b0795cSMark F. Adams /* PetscPrintf(PETSC_COMM_WORLD," **** [%d]%s %d total done, N=%d (%d local done), min agg. size = %d\n",mype,__FUNCT__,ii,kk/bs,ndone,jj); */ 7402e68589bSMark F. Adams 7412e68589bSMark F. Adams ierr = ISRestoreIndices( selected, &selected_idx ); CHKERRQ(ierr); 7422e68589bSMark F. Adams ierr = ISRestoreIndices( locals_llist, &llist_idx ); CHKERRQ(ierr); 7432e68589bSMark F. Adams ierr = MatAssemblyBegin(a_Prol,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 7442e68589bSMark F. Adams ierr = MatAssemblyEnd(a_Prol,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 7452e68589bSMark F. Adams 7462e68589bSMark F. Adams PetscFunctionReturn(0); 7472e68589bSMark F. Adams } 7482e68589bSMark F. Adams 7492e68589bSMark F. Adams /* -------------------------------------------------------------------------- */ 7502e68589bSMark F. Adams /* 751*c8b0795cSMark F. Adams PCGAMGgraph_AGG 7522e68589bSMark F. Adams 7532e68589bSMark F. Adams Input Parameter: 7542e68589bSMark F. Adams . pc - this 7552e68589bSMark F. Adams . Amat - matrix on this fine level 7562e68589bSMark F. Adams Output Parameter: 757*c8b0795cSMark F. Adams . a_Gmat - 7582e68589bSMark F. Adams */ 7592e68589bSMark F. Adams #undef __FUNCT__ 760*c8b0795cSMark F. Adams #define __FUNCT__ "PCGAMGgraph_AGG" 761*c8b0795cSMark F. Adams PetscErrorCode PCGAMGgraph_AGG( PC pc, 7622e68589bSMark F. Adams const Mat Amat, 763*c8b0795cSMark F. Adams Mat *a_Gmat 764*c8b0795cSMark F. Adams ) 765*c8b0795cSMark F. Adams { 766*c8b0795cSMark F. Adams PetscErrorCode ierr; 767*c8b0795cSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 768*c8b0795cSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 769*c8b0795cSMark F. Adams const PetscInt verbose = pc_gamg->verbose; 770*c8b0795cSMark F. Adams const PetscReal vfilter = pc_gamg->threshold; 771*c8b0795cSMark F. Adams PC_GAMG_AGG *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx; 772*c8b0795cSMark F. Adams PetscMPIInt mype,npe; 773*c8b0795cSMark F. Adams Mat Gmat, Gmat2; 774*c8b0795cSMark F. Adams MPI_Comm wcomm = ((PetscObject)Amat)->comm; 775*c8b0795cSMark F. Adams 776*c8b0795cSMark F. Adams PetscFunctionBegin; 777*c8b0795cSMark F. Adams ierr = MPI_Comm_rank( wcomm, &mype); CHKERRQ(ierr); 778*c8b0795cSMark F. Adams ierr = MPI_Comm_size( wcomm, &npe); CHKERRQ(ierr); 779*c8b0795cSMark F. Adams 780*c8b0795cSMark F. Adams ierr = createSimpleGraph( Amat, &Gmat ); CHKERRQ( ierr ); 781*c8b0795cSMark F. Adams 782*c8b0795cSMark F. Adams ierr = scaleFilterGraph( &Gmat, vfilter, pc_gamg_agg->sym_graph, verbose ); CHKERRQ( ierr ); 783*c8b0795cSMark F. Adams 784*c8b0795cSMark F. Adams ierr = MatTransposeMatMult( Gmat, Gmat, MAT_INITIAL_MATRIX, PETSC_DEFAULT, &Gmat2 ); 785*c8b0795cSMark F. Adams CHKERRQ(ierr); 786*c8b0795cSMark F. Adams 787*c8b0795cSMark F. Adams /* attach auxilary matrix */ 788*c8b0795cSMark F. Adams pc_gamg_agg->aux_mat = Gmat; 789*c8b0795cSMark F. Adams 790*c8b0795cSMark F. Adams *a_Gmat = Gmat2; 791*c8b0795cSMark F. Adams 792*c8b0795cSMark F. Adams PetscFunctionReturn(0); 793*c8b0795cSMark F. Adams } 794*c8b0795cSMark F. Adams 795*c8b0795cSMark F. Adams /* -------------------------------------------------------------------------- */ 796*c8b0795cSMark F. Adams /* 797*c8b0795cSMark F. Adams PCGAMGcoarsen_AGG 798*c8b0795cSMark F. Adams 799*c8b0795cSMark F. Adams Input Parameter: 800*c8b0795cSMark F. Adams . pc - this 801*c8b0795cSMark F. Adams . Gmat2 - matrix on this fine level 802*c8b0795cSMark F. Adams Output Parameter: 803*c8b0795cSMark F. Adams . a_selected - prolongation operator to the next level 804*c8b0795cSMark F. Adams . a_llist_parent - data of coarse grid points (num local columns in 'a_P_out') 805*c8b0795cSMark F. Adams */ 806*c8b0795cSMark F. Adams #undef __FUNCT__ 807*c8b0795cSMark F. Adams #define __FUNCT__ "PCGAMGcoarsen_AGG" 808*c8b0795cSMark F. Adams PetscErrorCode PCGAMGcoarsen_AGG( PC pc, 809*c8b0795cSMark F. Adams const Mat Gmat2, 810*c8b0795cSMark F. Adams IS *a_selected, 811*c8b0795cSMark F. Adams IS *a_llist_parent 812*c8b0795cSMark F. Adams ) 813*c8b0795cSMark F. Adams { 814*c8b0795cSMark F. Adams PetscErrorCode ierr; 815*c8b0795cSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 816*c8b0795cSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 817*c8b0795cSMark F. Adams PC_GAMG_AGG *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx; 818*c8b0795cSMark F. Adams Mat Gmat1; /* unsquared graph (not symetrized!) */ 819*c8b0795cSMark F. Adams IS perm, selected, llist_parent; 820*c8b0795cSMark F. Adams PetscInt Ii,nloc,bs,n,m; 821*c8b0795cSMark F. Adams PetscInt *permute; 822*c8b0795cSMark F. Adams PetscBool *bIndexSet; 823*c8b0795cSMark F. Adams /* MPI_Comm wcomm = ((PetscObject)Gmat2)->comm; */ 824*c8b0795cSMark F. Adams /* PetscMPIInt mype,npe; */ 825*c8b0795cSMark F. Adams 826*c8b0795cSMark F. Adams PetscFunctionBegin; 827*c8b0795cSMark F. Adams /* ierr = MPI_Comm_rank( wcomm, &mype); CHKERRQ(ierr); */ 828*c8b0795cSMark F. Adams /* ierr = MPI_Comm_size( wcomm, &npe); CHKERRQ(ierr); */ 829*c8b0795cSMark F. Adams ierr = MatGetLocalSize( Gmat2, &n, &m ); CHKERRQ(ierr); 830*c8b0795cSMark F. Adams ierr = MatGetBlockSize( Gmat2, &bs ); CHKERRQ(ierr); assert(bs==1); 831*c8b0795cSMark F. Adams nloc = n/bs; 832*c8b0795cSMark F. Adams 833*c8b0795cSMark F. Adams /* get unsquared graph */ 834*c8b0795cSMark F. Adams Gmat1 = pc_gamg_agg->aux_mat; pc_gamg_agg->aux_mat = 0; 835*c8b0795cSMark F. Adams 836*c8b0795cSMark F. Adams /* get MIS aggs */ 837*c8b0795cSMark F. Adams /* randomize */ 838*c8b0795cSMark F. Adams ierr = PetscMalloc( nloc*sizeof(PetscInt), &permute ); CHKERRQ(ierr); 839*c8b0795cSMark F. Adams ierr = PetscMalloc( nloc*sizeof(PetscBool), &bIndexSet ); CHKERRQ(ierr); 840*c8b0795cSMark F. Adams for ( Ii = 0; Ii < nloc ; Ii++ ){ 841*c8b0795cSMark F. Adams bIndexSet[Ii] = PETSC_FALSE; 842*c8b0795cSMark F. Adams permute[Ii] = Ii; 843*c8b0795cSMark F. Adams } 844*c8b0795cSMark F. Adams srand(1); /* make deterministic */ 845*c8b0795cSMark F. Adams for ( Ii = 0; Ii < nloc ; Ii++ ) { 846*c8b0795cSMark F. Adams PetscInt iSwapIndex = rand()%nloc; 847*c8b0795cSMark F. Adams if (!bIndexSet[iSwapIndex] && iSwapIndex != Ii) { 848*c8b0795cSMark F. Adams PetscInt iTemp = permute[iSwapIndex]; 849*c8b0795cSMark F. Adams permute[iSwapIndex] = permute[Ii]; 850*c8b0795cSMark F. Adams permute[Ii] = iTemp; 851*c8b0795cSMark F. Adams bIndexSet[iSwapIndex] = PETSC_TRUE; 852*c8b0795cSMark F. Adams } 853*c8b0795cSMark F. Adams } 854*c8b0795cSMark F. Adams ierr = PetscFree( bIndexSet ); CHKERRQ(ierr); 855*c8b0795cSMark F. Adams 856*c8b0795cSMark F. Adams ierr = ISCreateGeneral(PETSC_COMM_SELF, nloc, permute, PETSC_USE_POINTER, &perm); 857*c8b0795cSMark F. Adams CHKERRQ(ierr); 858*c8b0795cSMark F. Adams 859*c8b0795cSMark F. Adams ierr = maxIndSetAgg( perm, Gmat2, PETSC_TRUE, pc_gamg->verbose, &selected, &llist_parent ); CHKERRQ(ierr); 860*c8b0795cSMark F. Adams ierr = ISDestroy( &perm ); CHKERRQ(ierr); 861*c8b0795cSMark F. Adams ierr = PetscFree( permute ); CHKERRQ(ierr); 862*c8b0795cSMark F. Adams 863*c8b0795cSMark F. Adams /* smooth aggs */ 864*c8b0795cSMark F. Adams ierr = smoothAggs( Gmat2, Gmat1, selected, llist_parent ); CHKERRQ(ierr); 865*c8b0795cSMark F. Adams 866*c8b0795cSMark F. Adams ierr = MatDestroy( &Gmat1 ); CHKERRQ(ierr); 867*c8b0795cSMark F. Adams 868*c8b0795cSMark F. Adams *a_selected = selected; 869*c8b0795cSMark F. Adams *a_llist_parent = llist_parent; 870*c8b0795cSMark F. Adams 871*c8b0795cSMark F. Adams PetscFunctionReturn(0); 872*c8b0795cSMark F. Adams } 873*c8b0795cSMark F. Adams 874*c8b0795cSMark F. Adams /* -------------------------------------------------------------------------- */ 875*c8b0795cSMark F. Adams /* 876*c8b0795cSMark F. Adams PCGAMGprolongator_AGG 877*c8b0795cSMark F. Adams 878*c8b0795cSMark F. Adams Input Parameter: 879*c8b0795cSMark F. Adams . pc - this 880*c8b0795cSMark F. Adams . Amat - matrix on this fine level 881*c8b0795cSMark F. Adams . Graph - used to get ghost data for nodes in 882*c8b0795cSMark F. Adams . selected - [nselected inc. chosts] 883*c8b0795cSMark F. Adams . llist_parent - [nloc + Gmat.nghost] linked list 884*c8b0795cSMark F. Adams Output Parameter: 885*c8b0795cSMark F. Adams . a_P_out - prolongation operator to the next level 886*c8b0795cSMark F. Adams */ 887*c8b0795cSMark F. Adams #undef __FUNCT__ 888*c8b0795cSMark F. Adams #define __FUNCT__ "PCGAMGprolongator_AGG" 889*c8b0795cSMark F. Adams PetscErrorCode PCGAMGprolongator_AGG( PC pc, 890*c8b0795cSMark F. Adams const Mat Amat, 891*c8b0795cSMark F. Adams const Mat Gmat, 892*c8b0795cSMark F. Adams IS selected, 893*c8b0795cSMark F. Adams IS llist_parent, 894*c8b0795cSMark F. Adams Mat *a_P_out 8952e68589bSMark F. Adams ) 8962e68589bSMark F. Adams { 8972e68589bSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 8982e68589bSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 8992e68589bSMark F. Adams const PetscInt verbose = pc_gamg->verbose; 900*c8b0795cSMark F. Adams const PetscInt data_cols = pc_gamg->data_cell_cols; 9012e68589bSMark F. Adams PetscErrorCode ierr; 902*c8b0795cSMark F. Adams PetscInt Istart,Iend,nloc,ii,jj,kk,my0,nLocalSelected,bs; 903*c8b0795cSMark F. Adams Mat Prol; 9042e68589bSMark F. Adams PetscMPIInt mype, npe; 9052e68589bSMark F. Adams MPI_Comm wcomm = ((PetscObject)Amat)->comm; 9062e68589bSMark F. Adams const PetscInt *selected_idx,col_bs=data_cols; 907*c8b0795cSMark F. Adams PetscReal *data_w_ghost; 908*c8b0795cSMark F. Adams PetscInt myCrs0, nbnodes=0, *flid_fgid; 9092e68589bSMark F. Adams 9102e68589bSMark F. Adams PetscFunctionBegin; 9112e68589bSMark F. Adams ierr = MPI_Comm_rank( wcomm, &mype); CHKERRQ(ierr); 9122e68589bSMark F. Adams ierr = MPI_Comm_size( wcomm, &npe); CHKERRQ(ierr); 9132e68589bSMark F. Adams ierr = MatGetOwnershipRange( Amat, &Istart, &Iend ); CHKERRQ(ierr); 914*c8b0795cSMark F. Adams ierr = MatGetBlockSize( Amat, &bs ); CHKERRQ( ierr ); 915*c8b0795cSMark F. Adams nloc = (Iend-Istart)/bs; my0 = Istart/bs; assert((Iend-Istart)%bs==0); 9162e68589bSMark F. Adams 9172e68589bSMark F. Adams /* get 'nLocalSelected' */ 918*c8b0795cSMark F. Adams ierr = ISGetSize( selected, &kk ); CHKERRQ(ierr); 919*c8b0795cSMark F. Adams ierr = ISGetIndices( selected, &selected_idx ); CHKERRQ(ierr); 920*c8b0795cSMark F. Adams for(ii=0,nLocalSelected=0;ii<kk;ii++){ 921*c8b0795cSMark F. Adams PetscInt lid = selected_idx[ii]; 9222e68589bSMark F. Adams if(lid<nloc) nLocalSelected++; 9232e68589bSMark F. Adams } 924*c8b0795cSMark F. Adams ierr = ISRestoreIndices( selected, &selected_idx ); CHKERRQ(ierr); 9252e68589bSMark F. Adams 9262e68589bSMark F. Adams /* create prolongator, create P matrix */ 9272e68589bSMark F. Adams ierr = MatCreateMPIAIJ(wcomm, 928*c8b0795cSMark F. Adams nloc*bs, nLocalSelected*col_bs, 9292e68589bSMark F. Adams PETSC_DETERMINE, PETSC_DETERMINE, 9302e68589bSMark F. Adams data_cols, PETSC_NULL, data_cols, PETSC_NULL, 9312e68589bSMark F. Adams &Prol ); 9322e68589bSMark F. Adams CHKERRQ(ierr); 9332e68589bSMark F. Adams 9342e68589bSMark F. Adams /* can get all points "removed" */ 935*c8b0795cSMark F. Adams ierr = MatGetSize( Prol, &kk, &ii ); CHKERRQ(ierr); 936*c8b0795cSMark F. Adams if( ii==0 ) { 9372e68589bSMark F. Adams if( verbose ) { 938*c8b0795cSMark F. Adams PetscPrintf(wcomm,"[%d]%s no selected points on coarse grid\n",mype,__FUNCT__); 9392e68589bSMark F. Adams } 9402e68589bSMark F. Adams ierr = MatDestroy( &Prol ); CHKERRQ(ierr); 9412e68589bSMark F. Adams *a_P_out = PETSC_NULL; /* out */ 9422e68589bSMark F. Adams PetscFunctionReturn(0); 9432e68589bSMark F. Adams } 944*c8b0795cSMark F. Adams if( verbose ) { 945*c8b0795cSMark F. Adams PetscPrintf(PETSC_COMM_WORLD,"\t\t[%d]%s New grid %d nodes\n",mype,__FUNCT__,ii/bs); 946*c8b0795cSMark F. Adams } 947*c8b0795cSMark F. Adams ierr = MatGetOwnershipRangeColumn( Prol, &myCrs0, &kk ); CHKERRQ(ierr); 948*c8b0795cSMark F. Adams myCrs0 = myCrs0/col_bs; 9492e68589bSMark F. Adams 9502e68589bSMark F. Adams /* create global vector of data in 'data_w_ghost' */ 9512e68589bSMark F. Adams #if defined PETSC_USE_LOG 9522e68589bSMark F. Adams ierr = PetscLogEventBegin(gamg_setup_events[SET7],0,0,0,0);CHKERRQ(ierr); 9532e68589bSMark F. Adams #endif 954*c8b0795cSMark F. Adams if (npe > 1) { /* */ 9552e68589bSMark F. Adams PetscReal *tmp_gdata,*tmp_ldata,*tp2; 9562e68589bSMark F. Adams ierr = PetscMalloc( nloc*sizeof(PetscReal), &tmp_ldata ); CHKERRQ(ierr); 9572e68589bSMark F. Adams for( jj = 0 ; jj < data_cols ; jj++ ){ 958*c8b0795cSMark F. Adams for( kk = 0 ; kk < bs ; kk++) { 9592e68589bSMark F. Adams PetscInt ii,nnodes; 960*c8b0795cSMark F. Adams const PetscReal *tp = pc_gamg->data + jj*bs*nloc + kk; 961*c8b0795cSMark F. Adams for( ii = 0 ; ii < nloc ; ii++, tp += bs ){ 9622e68589bSMark F. Adams tmp_ldata[ii] = *tp; 9632e68589bSMark F. Adams } 9642e68589bSMark F. Adams ierr = getDataWithGhosts( Gmat, 1, tmp_ldata, &nnodes, &tmp_gdata ); 9652e68589bSMark F. Adams CHKERRQ(ierr); 9662e68589bSMark F. Adams if(jj==0 && kk==0) { /* now I know how many todal nodes - allocate */ 967*c8b0795cSMark F. Adams ierr = PetscMalloc( nnodes*bs*data_cols*sizeof(PetscReal), &data_w_ghost ); CHKERRQ(ierr); 968*c8b0795cSMark F. Adams nbnodes = bs*nnodes; 9692e68589bSMark F. Adams } 970*c8b0795cSMark F. Adams tp2 = data_w_ghost + jj*bs*nnodes + kk; 971*c8b0795cSMark F. Adams for( ii = 0 ; ii < nnodes ; ii++, tp2 += bs ){ 9722e68589bSMark F. Adams *tp2 = tmp_gdata[ii]; 9732e68589bSMark F. Adams } 9742e68589bSMark F. Adams ierr = PetscFree( tmp_gdata ); CHKERRQ(ierr); 9752e68589bSMark F. Adams } 9762e68589bSMark F. Adams } 9772e68589bSMark F. Adams ierr = PetscFree( tmp_ldata ); CHKERRQ(ierr); 9782e68589bSMark F. Adams } 9792e68589bSMark F. Adams else { 980*c8b0795cSMark F. Adams nbnodes = bs*nloc; 981*c8b0795cSMark F. Adams data_w_ghost = (PetscReal*)pc_gamg->data; 9822e68589bSMark F. Adams } 9832e68589bSMark F. Adams 9842e68589bSMark F. Adams /* get P0 */ 9852e68589bSMark F. Adams if( npe > 1 ){ 9862e68589bSMark F. Adams PetscReal *fid_glid_loc,*fiddata; 9872e68589bSMark F. Adams PetscInt nnodes; 9882e68589bSMark F. Adams 9892e68589bSMark F. Adams ierr = PetscMalloc( nloc*sizeof(PetscReal), &fid_glid_loc ); CHKERRQ(ierr); 9902e68589bSMark F. Adams for(kk=0;kk<nloc;kk++) fid_glid_loc[kk] = (PetscReal)(my0+kk); 9912e68589bSMark F. Adams ierr = getDataWithGhosts(Gmat, 1, fid_glid_loc, &nnodes, &fiddata); 9922e68589bSMark F. Adams CHKERRQ(ierr); 9932e68589bSMark F. Adams ierr = PetscMalloc( nnodes*sizeof(PetscInt), &flid_fgid ); CHKERRQ(ierr); 9942e68589bSMark F. Adams for(kk=0;kk<nnodes;kk++) flid_fgid[kk] = (PetscInt)fiddata[kk]; 9952e68589bSMark F. Adams ierr = PetscFree( fiddata ); CHKERRQ(ierr); 996*c8b0795cSMark F. Adams assert(nnodes==nbnodes/bs); 9972e68589bSMark F. Adams ierr = PetscFree( fid_glid_loc ); CHKERRQ(ierr); 9982e68589bSMark F. Adams } 9992e68589bSMark F. Adams else { 10002e68589bSMark F. Adams ierr = PetscMalloc( nloc*sizeof(PetscInt), &flid_fgid ); CHKERRQ(ierr); 10012e68589bSMark F. Adams for(kk=0;kk<nloc;kk++) flid_fgid[kk] = my0 + kk; 10022e68589bSMark F. Adams } 10032e68589bSMark F. Adams #if defined PETSC_USE_LOG 10042e68589bSMark F. Adams ierr = PetscLogEventEnd(gamg_setup_events[SET7],0,0,0,0);CHKERRQ(ierr); 1005*c8b0795cSMark F. Adams ierr = PetscLogEventBegin(gamg_setup_events[SET8],0,0,0,0);CHKERRQ(ierr); 10062e68589bSMark F. Adams #endif 1007*c8b0795cSMark F. Adams { 1008*c8b0795cSMark F. Adams PetscReal *data_out; 1009*c8b0795cSMark F. Adams ierr = formProl0( selected, llist_parent, bs, data_cols, myCrs0, nbnodes, 1010*c8b0795cSMark F. Adams data_w_ghost, flid_fgid, &data_out, Prol ); 10112e68589bSMark F. Adams CHKERRQ(ierr); 1012*c8b0795cSMark F. Adams ierr = PetscFree( pc_gamg->data ); CHKERRQ( ierr ); 1013*c8b0795cSMark F. Adams pc_gamg->data = data_out; 1014*c8b0795cSMark F. Adams pc_gamg->data_cell_rows = data_cols; 1015*c8b0795cSMark F. Adams pc_gamg->data_sz = data_cols*data_cols*nLocalSelected; 1016*c8b0795cSMark F. Adams } 1017*c8b0795cSMark F. Adams #if defined PETSC_USE_LOG 1018*c8b0795cSMark F. Adams ierr = PetscLogEventEnd(gamg_setup_events[SET8],0,0,0,0);CHKERRQ(ierr); 1019*c8b0795cSMark F. Adams #endif 10202e68589bSMark F. Adams if (npe > 1) ierr = PetscFree( data_w_ghost ); CHKERRQ(ierr); 10212e68589bSMark F. Adams ierr = PetscFree( flid_fgid ); CHKERRQ(ierr); 10222e68589bSMark F. Adams 1023*c8b0795cSMark F. Adams /* attach block size of columns */ 1024*c8b0795cSMark F. Adams if( pc_gamg->col_bs_id == -1 ) { 1025*c8b0795cSMark F. Adams ierr = PetscObjectComposedDataRegister( &pc_gamg->col_bs_id ); assert(pc_gamg->col_bs_id != -1 ); 1026*c8b0795cSMark F. Adams } 1027*c8b0795cSMark F. Adams ierr = PetscObjectComposedDataSetInt( (PetscObject)Prol, pc_gamg->col_bs_id, data_cols ); CHKERRQ(ierr); 1028*c8b0795cSMark F. Adams 1029*c8b0795cSMark F. Adams *a_P_out = Prol; /* out */ 1030*c8b0795cSMark F. Adams 1031*c8b0795cSMark F. Adams PetscFunctionReturn(0); 1032*c8b0795cSMark F. Adams } 1033*c8b0795cSMark F. Adams 1034*c8b0795cSMark F. Adams /* -------------------------------------------------------------------------- */ 1035*c8b0795cSMark F. Adams /* 1036*c8b0795cSMark F. Adams PCGAMGoptprol_AGG 1037*c8b0795cSMark F. Adams 1038*c8b0795cSMark F. Adams Input Parameter: 1039*c8b0795cSMark F. Adams . pc - this 1040*c8b0795cSMark F. Adams . Amat - matrix on this fine level 1041*c8b0795cSMark F. Adams In/Output Parameter: 1042*c8b0795cSMark F. Adams . a_P_out - prolongation operator to the next level 1043*c8b0795cSMark F. Adams */ 1044*c8b0795cSMark F. Adams #undef __FUNCT__ 1045*c8b0795cSMark F. Adams #define __FUNCT__ "PCGAMGoptprol_AGG" 1046*c8b0795cSMark F. Adams PetscErrorCode PCGAMGoptprol_AGG( PC pc, 1047*c8b0795cSMark F. Adams const Mat Amat, 1048*c8b0795cSMark F. Adams Mat *a_P 1049*c8b0795cSMark F. Adams ) 1050*c8b0795cSMark F. Adams { 1051*c8b0795cSMark F. Adams PetscErrorCode ierr; 1052*c8b0795cSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 1053*c8b0795cSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 1054*c8b0795cSMark F. Adams const PetscInt verbose = pc_gamg->verbose; 1055*c8b0795cSMark F. Adams PC_GAMG_AGG *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx; 1056*c8b0795cSMark F. Adams PetscInt jj; 1057*c8b0795cSMark F. Adams PetscMPIInt mype,npe; 1058*c8b0795cSMark F. Adams Mat Prol = *a_P; 1059*c8b0795cSMark F. Adams MPI_Comm wcomm = ((PetscObject)Amat)->comm; 1060*c8b0795cSMark F. Adams 1061*c8b0795cSMark F. Adams PetscFunctionBegin; 1062*c8b0795cSMark F. Adams ierr = MPI_Comm_rank( wcomm, &mype); CHKERRQ(ierr); 1063*c8b0795cSMark F. Adams ierr = MPI_Comm_size( wcomm, &npe); CHKERRQ(ierr); 1064*c8b0795cSMark F. Adams 10652e68589bSMark F. Adams /* smooth P0 */ 1066*c8b0795cSMark F. Adams for( jj = 0 ; jj < pc_gamg_agg->nsmooths ; jj++ ){ 10672e68589bSMark F. Adams Mat tMat; 10682e68589bSMark F. Adams Vec diag; 10692e68589bSMark F. Adams PetscReal alpha, emax, emin; 10702e68589bSMark F. Adams #if defined PETSC_USE_LOG 10712e68589bSMark F. Adams ierr = PetscLogEventBegin(gamg_setup_events[SET9],0,0,0,0);CHKERRQ(ierr); 10722e68589bSMark F. Adams #endif 10732e68589bSMark F. Adams if( jj == 0 ) { 10742e68589bSMark F. Adams KSP eksp; 10752e68589bSMark F. Adams Vec bb, xx; 10762e68589bSMark F. Adams PC pc; 10772e68589bSMark F. Adams ierr = MatGetVecs( Amat, &bb, 0 ); CHKERRQ(ierr); 10782e68589bSMark F. Adams ierr = MatGetVecs( Amat, &xx, 0 ); CHKERRQ(ierr); 10792e68589bSMark F. Adams { 10802e68589bSMark F. Adams PetscRandom rctx; 10812e68589bSMark F. Adams ierr = PetscRandomCreate(wcomm,&rctx);CHKERRQ(ierr); 10822e68589bSMark F. Adams ierr = PetscRandomSetFromOptions(rctx);CHKERRQ(ierr); 10832e68589bSMark F. Adams ierr = VecSetRandom(bb,rctx);CHKERRQ(ierr); 10842e68589bSMark F. Adams ierr = PetscRandomDestroy( &rctx ); CHKERRQ(ierr); 10852e68589bSMark F. Adams } 10862e68589bSMark F. Adams ierr = KSPCreate(wcomm,&eksp); CHKERRQ(ierr); 10872e68589bSMark F. Adams ierr = KSPAppendOptionsPrefix( eksp, "est_"); CHKERRQ(ierr); 10882e68589bSMark F. Adams ierr = KSPSetFromOptions( eksp ); CHKERRQ(ierr); 10892e68589bSMark F. Adams ierr = KSPSetInitialGuessNonzero( eksp, PETSC_FALSE ); CHKERRQ(ierr); 10902e68589bSMark F. Adams ierr = KSPSetOperators( eksp, Amat, Amat, SAME_NONZERO_PATTERN ); 10912e68589bSMark F. Adams CHKERRQ( ierr ); 10922e68589bSMark F. Adams ierr = KSPGetPC( eksp, &pc ); CHKERRQ( ierr ); 10932e68589bSMark F. Adams ierr = PCSetType( pc, PCJACOBI ); CHKERRQ(ierr); /* smoother */ 10942e68589bSMark F. Adams ierr = KSPSetTolerances(eksp,PETSC_DEFAULT,PETSC_DEFAULT,PETSC_DEFAULT,10); 10952e68589bSMark F. Adams CHKERRQ(ierr); 10962e68589bSMark F. Adams ierr = KSPSetNormType( eksp, KSP_NORM_NONE ); CHKERRQ(ierr); 10972e68589bSMark F. Adams ierr = KSPSetComputeSingularValues( eksp,PETSC_TRUE ); CHKERRQ(ierr); 10982e68589bSMark F. Adams 10992e68589bSMark F. Adams /* solve - keep stuff out of logging */ 11002e68589bSMark F. Adams ierr = PetscLogEventDeactivate(KSP_Solve);CHKERRQ(ierr); 11012e68589bSMark F. Adams ierr = PetscLogEventDeactivate(PC_Apply);CHKERRQ(ierr); 11022e68589bSMark F. Adams ierr = KSPSolve( eksp, bb, xx ); CHKERRQ(ierr); 11032e68589bSMark F. Adams ierr = PetscLogEventActivate(KSP_Solve);CHKERRQ(ierr); 11042e68589bSMark F. Adams ierr = PetscLogEventActivate(PC_Apply);CHKERRQ(ierr); 11052e68589bSMark F. Adams 11062e68589bSMark F. Adams ierr = KSPComputeExtremeSingularValues( eksp, &emax, &emin ); CHKERRQ(ierr); 11072e68589bSMark F. Adams if( verbose ) { 1108*c8b0795cSMark F. Adams PetscPrintf(wcomm,"\t\t\t%s smooth P0: max eigen=%e min=%e PC=%s\n", 11092e68589bSMark F. Adams __FUNCT__,emax,emin,PCJACOBI); 11102e68589bSMark F. Adams } 11112e68589bSMark F. Adams ierr = VecDestroy( &xx ); CHKERRQ(ierr); 11122e68589bSMark F. Adams ierr = VecDestroy( &bb ); CHKERRQ(ierr); 11132e68589bSMark F. Adams ierr = KSPDestroy( &eksp ); CHKERRQ(ierr); 11142e68589bSMark F. Adams 11152e68589bSMark F. Adams if( pc_gamg->emax_id == -1 ) { 11162e68589bSMark F. Adams ierr = PetscObjectComposedDataRegister( &pc_gamg->emax_id ); 11172e68589bSMark F. Adams assert(pc_gamg->emax_id != -1 ); 11182e68589bSMark F. Adams } 11192e68589bSMark F. Adams ierr = PetscObjectComposedDataSetScalar( (PetscObject)Amat, pc_gamg->emax_id, emax ); CHKERRQ(ierr); 11202e68589bSMark F. Adams } 11212e68589bSMark F. Adams 11222e68589bSMark F. Adams /* smooth P1 := (I - omega/lam D^{-1}A)P0 */ 11232e68589bSMark F. Adams ierr = MatMatMult( Amat, Prol, MAT_INITIAL_MATRIX, PETSC_DEFAULT, &tMat ); CHKERRQ(ierr); 11242e68589bSMark F. Adams ierr = MatGetVecs( Amat, &diag, 0 ); CHKERRQ(ierr); 11252e68589bSMark F. Adams ierr = MatGetDiagonal( Amat, diag ); CHKERRQ(ierr); /* effectively PCJACOBI */ 11262e68589bSMark F. Adams ierr = VecReciprocal( diag ); CHKERRQ(ierr); 11272e68589bSMark F. Adams ierr = MatDiagonalScale( tMat, diag, 0 ); CHKERRQ(ierr); 11282e68589bSMark F. Adams ierr = VecDestroy( &diag ); CHKERRQ(ierr); 11292e68589bSMark F. Adams alpha = -1.5/emax; 11302e68589bSMark F. Adams ierr = MatAYPX( tMat, alpha, Prol, SUBSET_NONZERO_PATTERN ); CHKERRQ(ierr); 11312e68589bSMark F. Adams ierr = MatDestroy( &Prol ); CHKERRQ(ierr); 11322e68589bSMark F. Adams Prol = tMat; 11332e68589bSMark F. Adams #if defined PETSC_USE_LOG 11342e68589bSMark F. Adams ierr = PetscLogEventEnd(gamg_setup_events[SET9],0,0,0,0);CHKERRQ(ierr); 11352e68589bSMark F. Adams #endif 11362e68589bSMark F. Adams } 11372e68589bSMark F. Adams 1138*c8b0795cSMark F. Adams *a_P = Prol; 1139*c8b0795cSMark F. Adams 1140*c8b0795cSMark F. Adams PetscFunctionReturn(0); 11412e68589bSMark F. Adams } 11422e68589bSMark F. Adams 1143*c8b0795cSMark F. Adams /* -------------------------------------------------------------------------- */ 1144*c8b0795cSMark F. Adams /* 1145*c8b0795cSMark F. Adams PCCreateGAMG_AGG 11462e68589bSMark F. Adams 1147*c8b0795cSMark F. Adams Input Parameter: 1148*c8b0795cSMark F. Adams . pc - 1149*c8b0795cSMark F. Adams */ 1150*c8b0795cSMark F. Adams #undef __FUNCT__ 1151*c8b0795cSMark F. Adams #define __FUNCT__ "PCCreateGAMG_AGG" 1152*c8b0795cSMark F. Adams PetscErrorCode PCCreateGAMG_AGG( PC pc ) 1153*c8b0795cSMark F. Adams { 1154*c8b0795cSMark F. Adams PetscErrorCode ierr; 1155*c8b0795cSMark F. Adams PC_MG *mg = (PC_MG*)pc->data; 1156*c8b0795cSMark F. Adams PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 1157*c8b0795cSMark F. Adams PC_GAMG_AGG *pc_gamg_agg; 11582e68589bSMark F. Adams 1159*c8b0795cSMark F. Adams PetscFunctionBegin; 1160*c8b0795cSMark F. Adams /* create sub context for SA */ 1161*c8b0795cSMark F. Adams ierr = PetscNewLog( pc, PC_GAMG_AGG, &pc_gamg_agg ); CHKERRQ(ierr); 1162*c8b0795cSMark F. Adams assert(!pc_gamg->subctx); 1163*c8b0795cSMark F. Adams pc_gamg->subctx = pc_gamg_agg; 1164*c8b0795cSMark F. Adams 1165*c8b0795cSMark F. Adams pc->ops->setfromoptions = PCSetFromOptions_GAMG_AGG; 1166*c8b0795cSMark F. Adams pc->ops->destroy = PCDestroy_AGG; 1167*c8b0795cSMark F. Adams /* reset does not do anything; setup not virtual */ 1168*c8b0795cSMark F. Adams 1169*c8b0795cSMark F. Adams /* set internal function pointers */ 1170*c8b0795cSMark F. Adams pc_gamg->graph = PCGAMGgraph_AGG; 1171*c8b0795cSMark F. Adams pc_gamg->coarsen = PCGAMGcoarsen_AGG; 1172*c8b0795cSMark F. Adams pc_gamg->prolongator = PCGAMGprolongator_AGG; 1173*c8b0795cSMark F. Adams pc_gamg->optprol = PCGAMGoptprol_AGG; 1174*c8b0795cSMark F. Adams 1175*c8b0795cSMark F. Adams pc_gamg->createdefaultdata = PCSetData_AGG; 1176*c8b0795cSMark F. Adams 1177*c8b0795cSMark F. Adams ierr = PetscObjectComposeFunctionDynamic( (PetscObject)pc, 1178*c8b0795cSMark F. Adams "PCSetCoordinates_C", 1179*c8b0795cSMark F. Adams "PCSetCoordinates_AGG", 1180*c8b0795cSMark F. Adams PCSetCoordinates_AGG); 11812e68589bSMark F. Adams PetscFunctionReturn(0); 11822e68589bSMark F. Adams } 1183