18e6d0c30SPeter Brune #include <../src/ksp/pc/impls/gamg/gamg.h> /*I "petscpc.h" I*/ 28e6d0c30SPeter Brune #include <petsc-private/kspimpl.h> 38e6d0c30SPeter Brune 48e6d0c30SPeter Brune typedef struct { 58e6d0c30SPeter Brune PetscReal dummy; /* empty struct; save for later */ 68e6d0c30SPeter Brune } PC_GAMG_Classical; 78e6d0c30SPeter Brune 88e6d0c30SPeter Brune 98e6d0c30SPeter Brune #undef __FUNCT__ 10bfde193fSPeter Brune #define __FUNCT__ "PCGAMGClassicalCreateGhostVector_Private" 11bfde193fSPeter Brune PetscErrorCode PCGAMGClassicalCreateGhostVector_Private(Mat G,Vec *gvec,PetscInt **global) 128e6d0c30SPeter Brune { 138e6d0c30SPeter Brune Mat_MPIAIJ *aij = (Mat_MPIAIJ*)G->data; 148e6d0c30SPeter Brune PetscErrorCode ierr; 158e6d0c30SPeter Brune PetscBool isMPIAIJ; 168e6d0c30SPeter Brune 178e6d0c30SPeter Brune PetscFunctionBegin; 188e6d0c30SPeter Brune ierr = PetscObjectTypeCompare((PetscObject)G, MATMPIAIJ, &isMPIAIJ); CHKERRQ(ierr); 198e6d0c30SPeter Brune if (isMPIAIJ) { 208e6d0c30SPeter Brune if (gvec)ierr = VecDuplicate(aij->lvec,gvec);CHKERRQ(ierr); 218e6d0c30SPeter Brune if (global)*global = aij->garray; 228e6d0c30SPeter Brune } else { 238e6d0c30SPeter Brune /* no off-processor nodes */ 248e6d0c30SPeter Brune if (gvec)*gvec = NULL; 258e6d0c30SPeter Brune if (global)*global = NULL; 268e6d0c30SPeter Brune } 278e6d0c30SPeter Brune PetscFunctionReturn(0); 288e6d0c30SPeter Brune } 298e6d0c30SPeter Brune 308e6d0c30SPeter Brune #undef __FUNCT__ 31bfde193fSPeter Brune #define __FUNCT__ "PCGAMGClassicalGraphSplitting_Private" 328e6d0c30SPeter Brune /* 338e6d0c30SPeter Brune Split the relevant graph into diagonal and off-diagonal parts in local numbering; for now this 348e6d0c30SPeter Brune a roundabout private interface to the mats' internal diag and offdiag mats. 
358e6d0c30SPeter Brune */ 36bfde193fSPeter Brune PetscErrorCode PCGAMGClassicalGraphSplitting_Private(Mat G,Mat *Gd, Mat *Go) 378e6d0c30SPeter Brune { 388e6d0c30SPeter Brune Mat_MPIAIJ *aij = (Mat_MPIAIJ*)G->data; 398e6d0c30SPeter Brune PetscErrorCode ierr; 408e6d0c30SPeter Brune PetscBool isMPIAIJ; 418e6d0c30SPeter Brune PetscFunctionBegin; 428e6d0c30SPeter Brune ierr = PetscObjectTypeCompare((PetscObject)G, MATMPIAIJ, &isMPIAIJ ); CHKERRQ(ierr); 438e6d0c30SPeter Brune if (isMPIAIJ) { 448e6d0c30SPeter Brune *Gd = aij->A; 458e6d0c30SPeter Brune *Go = aij->B; 468e6d0c30SPeter Brune } else { 478e6d0c30SPeter Brune *Gd = G; 488e6d0c30SPeter Brune *Go = NULL; 498e6d0c30SPeter Brune } 508e6d0c30SPeter Brune PetscFunctionReturn(0); 518e6d0c30SPeter Brune } 528e6d0c30SPeter Brune 538e6d0c30SPeter Brune #undef __FUNCT__ 548e6d0c30SPeter Brune #define __FUNCT__ "PCGAMGGraph_Classical" 5565b3d5b6SPeter Brune PetscErrorCode PCGAMGGraph_Classical(PC pc,const Mat A,Mat *G) 568e6d0c30SPeter Brune { 57550383edSPeter Brune PetscInt s,f,n,idx,lidx,gidx; 58e5a0faa4SPeter Brune PetscInt r,c,ncols; 598e6d0c30SPeter Brune const PetscInt *rcol; 608e6d0c30SPeter Brune const PetscScalar *rval; 61e5a0faa4SPeter Brune PetscInt *gcol; 628e6d0c30SPeter Brune PetscScalar *gval; 63e5a0faa4SPeter Brune PetscReal rmax; 64550383edSPeter Brune PetscInt cmax = 0; 658e6d0c30SPeter Brune PC_MG *mg; 668e6d0c30SPeter Brune PC_GAMG *gamg; 678e6d0c30SPeter Brune PetscErrorCode ierr; 688e6d0c30SPeter Brune PetscInt *gsparse,*lsparse; 69e5a0faa4SPeter Brune PetscScalar *Amax; 708e6d0c30SPeter Brune MatType mtype; 718e6d0c30SPeter Brune 728e6d0c30SPeter Brune PetscFunctionBegin; 738e6d0c30SPeter Brune mg = (PC_MG *)pc->data; 748e6d0c30SPeter Brune gamg = (PC_GAMG *)mg->innerctx; 758e6d0c30SPeter Brune 768e6d0c30SPeter Brune ierr = MatGetOwnershipRange(A,&s,&f);CHKERRQ(ierr); 77550383edSPeter Brune n=f-s; 78550383edSPeter Brune ierr = PetscMalloc(sizeof(PetscInt)*n,&lsparse);CHKERRQ(ierr); 79550383edSPeter 
Brune ierr = PetscMalloc(sizeof(PetscInt)*n,&gsparse);CHKERRQ(ierr); 80550383edSPeter Brune ierr = PetscMalloc(sizeof(PetscScalar)*n,&Amax);CHKERRQ(ierr); 818e6d0c30SPeter Brune 82550383edSPeter Brune for (r = 0;r < n;r++) { 838e6d0c30SPeter Brune lsparse[r] = 0; 84550383edSPeter Brune gsparse[r] = 0; 858e6d0c30SPeter Brune } 868e6d0c30SPeter Brune 87550383edSPeter Brune for (r = s;r < f;r++) { 88e5a0faa4SPeter Brune /* determine the maximum off-diagonal in each row */ 89e5a0faa4SPeter Brune rmax = 0.; 90550383edSPeter Brune ierr = MatGetRow(A,r,&ncols,&rcol,&rval);CHKERRQ(ierr); 91e5a0faa4SPeter Brune for (c = 0; c < ncols; c++) { 921ce39c63SPeter Brune if (PetscRealPart(-rval[c]) > rmax && rcol[c] != r) { 931ce39c63SPeter Brune rmax = PetscRealPart(-rval[c]); 94e5a0faa4SPeter Brune } 95e5a0faa4SPeter Brune } 96550383edSPeter Brune Amax[r-s] = rmax; 97550383edSPeter Brune if (ncols > cmax) cmax = ncols; 98550383edSPeter Brune lidx = 0; 99550383edSPeter Brune gidx = 0; 100e5a0faa4SPeter Brune /* create the local and global sparsity patterns */ 1018e6d0c30SPeter Brune for (c = 0; c < ncols; c++) { 1021ce39c63SPeter Brune if (PetscRealPart(-rval[c]) > gamg->threshold*PetscRealPart(Amax[r-s])) { 103550383edSPeter Brune if (rcol[c] < f && rcol[c] >= s) { 104550383edSPeter Brune lidx++; 105550383edSPeter Brune } else { 106550383edSPeter Brune gidx++; 1078e6d0c30SPeter Brune } 1088e6d0c30SPeter Brune } 1098e6d0c30SPeter Brune } 110550383edSPeter Brune ierr = MatRestoreRow(A,r,&ncols,&rcol,&rval);CHKERRQ(ierr); 111550383edSPeter Brune lsparse[r-s] = lidx; 112550383edSPeter Brune gsparse[r-s] = gidx; 1138e6d0c30SPeter Brune } 114e5a0faa4SPeter Brune ierr = PetscMalloc(sizeof(PetscScalar)*cmax,&gval);CHKERRQ(ierr); 115e5a0faa4SPeter Brune ierr = PetscMalloc(sizeof(PetscInt)*cmax,&gcol);CHKERRQ(ierr); 116e5a0faa4SPeter Brune 1178e6d0c30SPeter Brune ierr = MatCreate(PetscObjectComm((PetscObject)A),G); CHKERRQ(ierr); 1188e6d0c30SPeter Brune ierr = 
MatGetType(A,&mtype);CHKERRQ(ierr); 1198e6d0c30SPeter Brune ierr = MatSetType(*G,mtype);CHKERRQ(ierr); 120550383edSPeter Brune ierr = MatSetSizes(*G,n,n,PETSC_DETERMINE,PETSC_DETERMINE);CHKERRQ(ierr); 1218e6d0c30SPeter Brune ierr = MatMPIAIJSetPreallocation(*G,0,lsparse,0,gsparse);CHKERRQ(ierr); 1228e6d0c30SPeter Brune ierr = MatSeqAIJSetPreallocation(*G,0,lsparse);CHKERRQ(ierr); 1238e6d0c30SPeter Brune for (r = s;r < f;r++) { 1248e6d0c30SPeter Brune ierr = MatGetRow(A,r,&ncols,&rcol,&rval);CHKERRQ(ierr); 1258e6d0c30SPeter Brune idx = 0; 1268e6d0c30SPeter Brune for (c = 0; c < ncols; c++) { 1278e6d0c30SPeter Brune /* classical strength of connection */ 1281ce39c63SPeter Brune if (PetscRealPart(-rval[c]) > gamg->threshold*PetscRealPart(Amax[r-s])) { 1298e6d0c30SPeter Brune gcol[idx] = rcol[c]; 1308e6d0c30SPeter Brune gval[idx] = rval[c]; 1318e6d0c30SPeter Brune idx++; 1328e6d0c30SPeter Brune } 1338e6d0c30SPeter Brune } 1348e6d0c30SPeter Brune ierr = MatSetValues(*G,1,&r,idx,gcol,gval,INSERT_VALUES);CHKERRQ(ierr); 1358e6d0c30SPeter Brune ierr = MatRestoreRow(A,r,&ncols,&rcol,&rval);CHKERRQ(ierr); 1368e6d0c30SPeter Brune } 1378e6d0c30SPeter Brune ierr = MatAssemblyBegin(*G, MAT_FINAL_ASSEMBLY); CHKERRQ(ierr); 1388e6d0c30SPeter Brune ierr = MatAssemblyEnd(*G, MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1398e6d0c30SPeter Brune 1408e6d0c30SPeter Brune ierr = PetscFree(gval);CHKERRQ(ierr); 1418e6d0c30SPeter Brune ierr = PetscFree(gcol);CHKERRQ(ierr); 1428e6d0c30SPeter Brune ierr = PetscFree(lsparse);CHKERRQ(ierr); 1438e6d0c30SPeter Brune ierr = PetscFree(gsparse);CHKERRQ(ierr); 144e5a0faa4SPeter Brune ierr = PetscFree(Amax);CHKERRQ(ierr); 1458e6d0c30SPeter Brune PetscFunctionReturn(0); 1468e6d0c30SPeter Brune } 1478e6d0c30SPeter Brune 1488e6d0c30SPeter Brune 1498e6d0c30SPeter Brune #undef __FUNCT__ 1508e6d0c30SPeter Brune #define __FUNCT__ "PCGAMGCoarsen_Classical" 1518e6d0c30SPeter Brune PetscErrorCode PCGAMGCoarsen_Classical(PC pc,Mat *G,PetscCoarsenData **agg_lists) 
1528e6d0c30SPeter Brune { 1538e6d0c30SPeter Brune PetscErrorCode ierr; 1548e6d0c30SPeter Brune MatCoarsen crs; 1558e6d0c30SPeter Brune MPI_Comm fcomm = ((PetscObject)pc)->comm; 1568e6d0c30SPeter Brune 1578e6d0c30SPeter Brune PetscFunctionBegin; 1588e6d0c30SPeter Brune 1598e6d0c30SPeter Brune 1608e6d0c30SPeter Brune /* construct the graph if necessary */ 1618e6d0c30SPeter Brune if (!G) { 1628e6d0c30SPeter Brune SETERRQ(fcomm,PETSC_ERR_ARG_WRONGSTATE,"Must set Graph in PC in PCGAMG before coarsening"); 1638e6d0c30SPeter Brune } 1648e6d0c30SPeter Brune 1658e6d0c30SPeter Brune ierr = MatCoarsenCreate(fcomm,&crs);CHKERRQ(ierr); 1668e6d0c30SPeter Brune ierr = MatCoarsenSetFromOptions(crs);CHKERRQ(ierr); 1678e6d0c30SPeter Brune ierr = MatCoarsenSetAdjacency(crs,*G);CHKERRQ(ierr); 1688e6d0c30SPeter Brune ierr = MatCoarsenSetStrictAggs(crs,PETSC_TRUE);CHKERRQ(ierr); 1698e6d0c30SPeter Brune ierr = MatCoarsenApply(crs);CHKERRQ(ierr); 1708e6d0c30SPeter Brune ierr = MatCoarsenGetData(crs,agg_lists);CHKERRQ(ierr); 1718e6d0c30SPeter Brune ierr = MatCoarsenDestroy(&crs);CHKERRQ(ierr); 1728e6d0c30SPeter Brune 1738e6d0c30SPeter Brune PetscFunctionReturn(0); 1748e6d0c30SPeter Brune } 1758e6d0c30SPeter Brune 1768e6d0c30SPeter Brune #undef __FUNCT__ 177bfde193fSPeter Brune #define __FUNCT__ "PCGAMGClassicalGhost_Private" 1788e6d0c30SPeter Brune /* 1798e6d0c30SPeter Brune Find all ghost nodes that are coarse and output the fine/coarse splitting for those as well 1808e6d0c30SPeter Brune 1818e6d0c30SPeter Brune Input: 1828e6d0c30SPeter Brune G - graph; 1838e6d0c30SPeter Brune gvec - Global Vector 1848e6d0c30SPeter Brune avec - Local part of the scattered vec 1858e6d0c30SPeter Brune bvec - Global part of the scattered vec 1868e6d0c30SPeter Brune 1878e6d0c30SPeter Brune Output: 1888e6d0c30SPeter Brune findx - indirection t 1898e6d0c30SPeter Brune 1908e6d0c30SPeter Brune */ 191bfde193fSPeter Brune PetscErrorCode PCGAMGClassicalGhost_Private(Mat G,Vec v,Vec gv) 1928e6d0c30SPeter Brune { 
1938e6d0c30SPeter Brune PetscErrorCode ierr; 1948e6d0c30SPeter Brune Mat_MPIAIJ *aij = (Mat_MPIAIJ*)G->data; 1958e6d0c30SPeter Brune PetscBool isMPIAIJ; 1968e6d0c30SPeter Brune 1978e6d0c30SPeter Brune PetscFunctionBegin; 1988e6d0c30SPeter Brune ierr = PetscObjectTypeCompare((PetscObject)G, MATMPIAIJ, &isMPIAIJ ); CHKERRQ(ierr); 1998e6d0c30SPeter Brune if (isMPIAIJ) { 2008e6d0c30SPeter Brune ierr = VecScatterBegin(aij->Mvctx,v,gv,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 2018e6d0c30SPeter Brune ierr = VecScatterEnd(aij->Mvctx,v,gv,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 2028e6d0c30SPeter Brune } 2038e6d0c30SPeter Brune PetscFunctionReturn(0); 2048e6d0c30SPeter Brune } 2058e6d0c30SPeter Brune 2068e6d0c30SPeter Brune #undef __FUNCT__ 2078e6d0c30SPeter Brune #define __FUNCT__ "PCGAMGProlongator_Classical" 20865b3d5b6SPeter Brune PetscErrorCode PCGAMGProlongator_Classical(PC pc, const Mat A, const Mat G, PetscCoarsenData *agg_lists,Mat *P) 2098e6d0c30SPeter Brune { 2108e6d0c30SPeter Brune PetscErrorCode ierr; 2118e6d0c30SPeter Brune MPI_Comm comm; 2121ce39c63SPeter Brune PetscReal *Amax_pos,*Amax_neg; 2131ce39c63SPeter Brune Mat lA,gA; /* on and off diagonal matrices */ 2148e6d0c30SPeter Brune PetscInt fn; /* fine local blocked sizes */ 2158e6d0c30SPeter Brune PetscInt cn; /* coarse local blocked sizes */ 2168e6d0c30SPeter Brune PetscInt gn; /* size of the off-diagonal fine vector */ 2178e6d0c30SPeter Brune PetscInt fs,fe; /* fine (row) ownership range*/ 2188e6d0c30SPeter Brune PetscInt cs,ce; /* coarse (column) ownership range */ 2191ce39c63SPeter Brune PetscInt i,j; /* indices! 
*/ 2208e6d0c30SPeter Brune PetscBool iscoarse; /* flag for determining if a node is coarse */ 2218e6d0c30SPeter Brune PetscInt *lcid,*gcid; /* on and off-processor coarse unknown IDs */ 2228e6d0c30SPeter Brune PetscInt *lsparse,*gsparse; /* on and off-processor sparsity patterns for prolongator */ 2238e6d0c30SPeter Brune PetscScalar pij; 2248e6d0c30SPeter Brune const PetscScalar *rval; 2258e6d0c30SPeter Brune const PetscInt *rcol; 2268e6d0c30SPeter Brune PetscScalar g_pos,g_neg,a_pos,a_neg,diag,invdiag,alpha,beta; 2278e6d0c30SPeter Brune Vec F; /* vec of coarse size */ 2288e6d0c30SPeter Brune Vec C; /* vec of fine size */ 2298e6d0c30SPeter Brune Vec gF; /* vec of off-diagonal fine size */ 2308e6d0c30SPeter Brune MatType mtype; 2318e6d0c30SPeter Brune PetscInt c_indx; 2328e6d0c30SPeter Brune PetscScalar c_scalar; 2338e6d0c30SPeter Brune PetscInt ncols,col; 2348e6d0c30SPeter Brune PetscInt row_f,row_c; 2351ce39c63SPeter Brune PetscInt cmax=0,idx; 2368e6d0c30SPeter Brune PetscScalar *pvals; 2378e6d0c30SPeter Brune PetscInt *pcols; 2381ce39c63SPeter Brune PC_MG *mg = (PC_MG*)pc->data; 2391ce39c63SPeter Brune PC_GAMG *gamg = (PC_GAMG*)mg->innerctx; 2408e6d0c30SPeter Brune 2418e6d0c30SPeter Brune PetscFunctionBegin; 2428e6d0c30SPeter Brune comm = ((PetscObject)pc)->comm; 2438e6d0c30SPeter Brune ierr = MatGetOwnershipRange(A,&fs,&fe); CHKERRQ(ierr); 2448e6d0c30SPeter Brune fn = (fe - fs); 2458e6d0c30SPeter Brune 2468e6d0c30SPeter Brune ierr = MatGetVecs(A,&F,NULL);CHKERRQ(ierr); 2478e6d0c30SPeter Brune 2488e6d0c30SPeter Brune /* get the number of local unknowns and the indices of the local unknowns */ 2498e6d0c30SPeter Brune 2508e6d0c30SPeter Brune ierr = PetscMalloc(sizeof(PetscInt)*fn,&lsparse);CHKERRQ(ierr); 2518e6d0c30SPeter Brune ierr = PetscMalloc(sizeof(PetscInt)*fn,&gsparse);CHKERRQ(ierr); 2528e6d0c30SPeter Brune ierr = PetscMalloc(sizeof(PetscInt)*fn,&lcid);CHKERRQ(ierr); 2531ce39c63SPeter Brune ierr = PetscMalloc(sizeof(PetscReal)*fn,&Amax_pos);CHKERRQ(ierr); 
2541ce39c63SPeter Brune ierr = PetscMalloc(sizeof(PetscReal)*fn,&Amax_neg);CHKERRQ(ierr); 2558e6d0c30SPeter Brune 2568e6d0c30SPeter Brune /* count the number of coarse unknowns */ 2578e6d0c30SPeter Brune cn = 0; 2588e6d0c30SPeter Brune for (i=0;i<fn;i++) { 2598e6d0c30SPeter Brune /* filter out singletons */ 2608e6d0c30SPeter Brune ierr = PetscCDEmptyAt(agg_lists,i,&iscoarse); CHKERRQ(ierr); 2618e6d0c30SPeter Brune lcid[i] = -1; 2628e6d0c30SPeter Brune if (!iscoarse) { 2638e6d0c30SPeter Brune cn++; 2648e6d0c30SPeter Brune } 2658e6d0c30SPeter Brune } 2668e6d0c30SPeter Brune 2678e6d0c30SPeter Brune /* create the coarse vector */ 2688e6d0c30SPeter Brune ierr = VecCreateMPI(comm,cn,PETSC_DECIDE,&C);CHKERRQ(ierr); 2698e6d0c30SPeter Brune ierr = VecGetOwnershipRange(C,&cs,&ce);CHKERRQ(ierr); 2708e6d0c30SPeter Brune 2718e6d0c30SPeter Brune /* construct a global vector indicating the global indices of the coarse unknowns */ 2728e6d0c30SPeter Brune cn = 0; 2738e6d0c30SPeter Brune for (i=0;i<fn;i++) { 2748e6d0c30SPeter Brune ierr = PetscCDEmptyAt(agg_lists,i,&iscoarse); CHKERRQ(ierr); 2758e6d0c30SPeter Brune if (!iscoarse) { 2768e6d0c30SPeter Brune lcid[i] = cs+cn; 2778e6d0c30SPeter Brune cn++; 2788e6d0c30SPeter Brune } else { 2798e6d0c30SPeter Brune lcid[i] = -1; 2808e6d0c30SPeter Brune } 281167fb786SPeter Brune *((PetscInt *)&c_scalar) = lcid[i]; 2828e6d0c30SPeter Brune c_indx = fs+i; 2838e6d0c30SPeter Brune ierr = VecSetValues(F,1,&c_indx,&c_scalar,INSERT_VALUES);CHKERRQ(ierr); 2848e6d0c30SPeter Brune } 2858e6d0c30SPeter Brune 2868e6d0c30SPeter Brune ierr = VecAssemblyBegin(F);CHKERRQ(ierr); 2878e6d0c30SPeter Brune ierr = VecAssemblyEnd(F);CHKERRQ(ierr); 2888e6d0c30SPeter Brune 2891ce39c63SPeter Brune /* determine the biggest off-diagonal entries in each row */ 2901ce39c63SPeter Brune for (i=fs;i<fe;i++) { 2911ce39c63SPeter Brune Amax_pos[i-fs] = 0.; 2921ce39c63SPeter Brune Amax_neg[i-fs] = 0.; 2931ce39c63SPeter Brune ierr = MatGetRow(A,i,&ncols,&rcol,&rval);CHKERRQ(ierr); 
2941ce39c63SPeter Brune for(j=0;j<ncols;j++){ 2951ce39c63SPeter Brune if ((PetscRealPart(-rval[j]) > Amax_neg[i-fs]) && i != rcol[j]) Amax_neg[i-fs] = PetscAbsScalar(rval[j]); 2961ce39c63SPeter Brune if ((PetscRealPart(rval[j]) > Amax_pos[i-fs]) && i != rcol[j]) Amax_pos[i-fs] = PetscAbsScalar(rval[j]); 2971ce39c63SPeter Brune } 2981ce39c63SPeter Brune if (ncols > cmax) cmax = ncols; 2991ce39c63SPeter Brune ierr = MatRestoreRow(A,i,&ncols,&rcol,&rval);CHKERRQ(ierr); 3001ce39c63SPeter Brune } 3011ce39c63SPeter Brune ierr = PetscMalloc(sizeof(PetscInt)*cmax,&pcols);CHKERRQ(ierr); 3021ce39c63SPeter Brune ierr = PetscMalloc(sizeof(PetscScalar)*cmax,&pvals);CHKERRQ(ierr); 3031ce39c63SPeter Brune 304167fb786SPeter Brune /* split the operator into two */ 305bfde193fSPeter Brune ierr = PCGAMGClassicalGraphSplitting_Private(A,&lA,&gA);CHKERRQ(ierr); 3068e6d0c30SPeter Brune 3078e6d0c30SPeter Brune /* scatter to the ghost vector */ 3081ce39c63SPeter Brune ierr = PCGAMGClassicalCreateGhostVector_Private(A,&gF,NULL);CHKERRQ(ierr); 3091ce39c63SPeter Brune ierr = PCGAMGClassicalGhost_Private(A,F,gF);CHKERRQ(ierr); 3108e6d0c30SPeter Brune 3111ce39c63SPeter Brune if (gA) { 3128e6d0c30SPeter Brune ierr = VecGetSize(gF,&gn);CHKERRQ(ierr); 3138e6d0c30SPeter Brune ierr = PetscMalloc(sizeof(PetscInt)*gn,&gcid);CHKERRQ(ierr); 3148e6d0c30SPeter Brune for (i=0;i<gn;i++) { 3158e6d0c30SPeter Brune ierr = VecGetValues(gF,1,&i,&c_scalar);CHKERRQ(ierr); 316167fb786SPeter Brune gcid[i] = *((PetscInt *)&c_scalar); 3178e6d0c30SPeter Brune } 3188e6d0c30SPeter Brune } 3198e6d0c30SPeter Brune 3208e6d0c30SPeter Brune ierr = VecDestroy(&F);CHKERRQ(ierr); 3218e6d0c30SPeter Brune ierr = VecDestroy(&gF);CHKERRQ(ierr); 3228e6d0c30SPeter Brune ierr = VecDestroy(&C);CHKERRQ(ierr); 3238e6d0c30SPeter Brune 3248e6d0c30SPeter Brune /* count the on and off processor sparsity patterns for the prolongator */ 3258e6d0c30SPeter Brune for (i=0;i<fn;i++) { 3268e6d0c30SPeter Brune /* on */ 3278e6d0c30SPeter Brune 
lsparse[i] = 0; 328e5a0faa4SPeter Brune gsparse[i] = 0; 3298e6d0c30SPeter Brune if (lcid[i] >= 0) { 3308e6d0c30SPeter Brune lsparse[i] = 1; 3318e6d0c30SPeter Brune gsparse[i] = 0; 3328e6d0c30SPeter Brune } else { 3331ce39c63SPeter Brune ierr = MatGetRow(lA,i,&ncols,&rcol,&rval);CHKERRQ(ierr); 3348e6d0c30SPeter Brune for (j = 0;j < ncols;j++) { 3351ce39c63SPeter Brune col = rcol[j]; 3361ce39c63SPeter Brune if (lcid[col] >= 0 && (PetscRealPart(rval[j]) > gamg->threshold*Amax_pos[i] || PetscRealPart(-rval[j]) > gamg->threshold*Amax_neg[i])) { 3378e6d0c30SPeter Brune lsparse[i] += 1; 3388e6d0c30SPeter Brune } 3398e6d0c30SPeter Brune } 3401ce39c63SPeter Brune ierr = MatRestoreRow(lA,i,&ncols,&rcol,&rval);CHKERRQ(ierr); 3418e6d0c30SPeter Brune /* off */ 3421ce39c63SPeter Brune if (gA) { 3431ce39c63SPeter Brune ierr = MatGetRow(gA,i,&ncols,&rcol,&rval);CHKERRQ(ierr); 3448e6d0c30SPeter Brune for (j = 0; j < ncols; j++) { 3451ce39c63SPeter Brune col = rcol[j]; 3461ce39c63SPeter Brune if (gcid[col] >= 0 && (PetscRealPart(rval[j]) > gamg->threshold*Amax_pos[i] || PetscRealPart(-rval[j]) > gamg->threshold*Amax_neg[i])) { 3478e6d0c30SPeter Brune gsparse[i] += 1; 3488e6d0c30SPeter Brune } 3498e6d0c30SPeter Brune } 3501ce39c63SPeter Brune ierr = MatRestoreRow(gA,i,&ncols,&rcol,&rval);CHKERRQ(ierr); 3518e6d0c30SPeter Brune } 3528e6d0c30SPeter Brune } 3531ce39c63SPeter Brune } 3548e6d0c30SPeter Brune 3558e6d0c30SPeter Brune /* preallocate and create the prolongator */ 3568e6d0c30SPeter Brune ierr = MatCreate(comm,P); CHKERRQ(ierr); 3578e6d0c30SPeter Brune ierr = MatGetType(G,&mtype);CHKERRQ(ierr); 3588e6d0c30SPeter Brune ierr = MatSetType(*P,mtype);CHKERRQ(ierr); 3598e6d0c30SPeter Brune 3608e6d0c30SPeter Brune ierr = MatSetSizes(*P,fn,cn,PETSC_DETERMINE,PETSC_DETERMINE);CHKERRQ(ierr); 3618e6d0c30SPeter Brune ierr = MatMPIAIJSetPreallocation(*P,0,lsparse,0,gsparse);CHKERRQ(ierr); 3628e6d0c30SPeter Brune ierr = MatSeqAIJSetPreallocation(*P,0,lsparse);CHKERRQ(ierr); 3638e6d0c30SPeter 
Brune 3648e6d0c30SPeter Brune /* loop over local fine nodes -- get the diagonal, the sum of positive and negative strong and weak weights, and set up the row */ 3658e6d0c30SPeter Brune for (i = 0;i < fn;i++) { 3668e6d0c30SPeter Brune /* determine on or off */ 3678e6d0c30SPeter Brune row_f = i + fs; 3688e6d0c30SPeter Brune row_c = lcid[i]; 3698e6d0c30SPeter Brune if (row_c >= 0) { 3708e6d0c30SPeter Brune pij = 1.; 3718e6d0c30SPeter Brune ierr = MatSetValues(*P,1,&row_f,1,&row_c,&pij,INSERT_VALUES);CHKERRQ(ierr); 3728e6d0c30SPeter Brune } else { 3738e6d0c30SPeter Brune g_pos = 0.; 3748e6d0c30SPeter Brune g_neg = 0.; 3758e6d0c30SPeter Brune a_pos = 0.; 3768e6d0c30SPeter Brune a_neg = 0.; 3778e6d0c30SPeter Brune diag = 0.; 3788e6d0c30SPeter Brune 3791ce39c63SPeter Brune /* local connections */ 3808e6d0c30SPeter Brune ierr = MatGetRow(lA,i,&ncols,&rcol,&rval);CHKERRQ(ierr); 3811ce39c63SPeter Brune for (j = 0; j < ncols; j++) { 3821ce39c63SPeter Brune col = rcol[j]; 3831ce39c63SPeter Brune if (lcid[col] >= 0 && (PetscRealPart(rval[j]) > gamg->threshold*Amax_pos[i] || PetscRealPart(-rval[j]) > gamg->threshold*Amax_neg[i])) { 3841ce39c63SPeter Brune if (PetscRealPart(rval[j]) > 0.) { 3851ce39c63SPeter Brune g_pos += rval[j]; 3868e6d0c30SPeter Brune } else { 3871ce39c63SPeter Brune g_neg += rval[j]; 3888e6d0c30SPeter Brune } 3891ce39c63SPeter Brune } 3901ce39c63SPeter Brune if (col != i) { 3911ce39c63SPeter Brune if (PetscRealPart(rval[j]) > 0.) 
{ 3921ce39c63SPeter Brune a_pos += rval[j]; 3931ce39c63SPeter Brune } else { 3941ce39c63SPeter Brune a_neg += rval[j]; 3951ce39c63SPeter Brune } 3961ce39c63SPeter Brune } else { 3971ce39c63SPeter Brune diag = rval[j]; 3981ce39c63SPeter Brune } 3998e6d0c30SPeter Brune } 4008e6d0c30SPeter Brune ierr = MatRestoreRow(lA,i,&ncols,&rcol,&rval);CHKERRQ(ierr); 4018e6d0c30SPeter Brune 4021ce39c63SPeter Brune /* ghosted connections */ 4038e6d0c30SPeter Brune if (gA) { 4048e6d0c30SPeter Brune ierr = MatGetRow(gA,i,&ncols,&rcol,&rval);CHKERRQ(ierr); 4051ce39c63SPeter Brune for (j = 0; j < ncols; j++) { 4061ce39c63SPeter Brune col = rcol[j]; 4071ce39c63SPeter Brune if (gcid[col] >= 0 && (PetscRealPart(rval[j]) > gamg->threshold*Amax_pos[i] || PetscRealPart(-rval[j]) > gamg->threshold*Amax_neg[i])) { 4081ce39c63SPeter Brune if (PetscRealPart(rval[j]) > 0.) { 4091ce39c63SPeter Brune g_pos += rval[j]; 4108e6d0c30SPeter Brune } else { 4111ce39c63SPeter Brune g_neg += rval[j]; 4128e6d0c30SPeter Brune } 4131ce39c63SPeter Brune } 4141ce39c63SPeter Brune if (PetscRealPart(rval[j]) > 0.) { 4151ce39c63SPeter Brune a_pos += rval[j]; 4161ce39c63SPeter Brune } else { 4171ce39c63SPeter Brune a_neg += rval[j]; 4181ce39c63SPeter Brune } 4198e6d0c30SPeter Brune } 4208e6d0c30SPeter Brune ierr = MatRestoreRow(gA,i,&ncols,&rcol,&rval);CHKERRQ(ierr); 4218e6d0c30SPeter Brune } 4228e6d0c30SPeter Brune 4238e6d0c30SPeter Brune if (g_neg == 0.) { 4248e6d0c30SPeter Brune alpha = 0.; 4258e6d0c30SPeter Brune } else { 4268e6d0c30SPeter Brune alpha = -a_neg/g_neg; 4278e6d0c30SPeter Brune } 4288e6d0c30SPeter Brune 4298e6d0c30SPeter Brune if (g_pos == 0.) { 4308e6d0c30SPeter Brune diag += a_pos; 4318e6d0c30SPeter Brune beta = 0.; 4328e6d0c30SPeter Brune } else { 4338e6d0c30SPeter Brune beta = -a_pos/g_pos; 4348e6d0c30SPeter Brune } 435e5a0faa4SPeter Brune if (diag == 0.) { 436e5a0faa4SPeter Brune invdiag = 0.; 437e5a0faa4SPeter Brune } else invdiag = 1. 
/ diag; 4388e6d0c30SPeter Brune /* on */ 4391ce39c63SPeter Brune ierr = MatGetRow(lA,i,&ncols,&rcol,&rval);CHKERRQ(ierr); 4408e6d0c30SPeter Brune idx = 0; 4418e6d0c30SPeter Brune for (j = 0;j < ncols;j++) { 4421ce39c63SPeter Brune col = rcol[j]; 4431ce39c63SPeter Brune if (lcid[col] >= 0 && (PetscRealPart(rval[j]) > gamg->threshold*Amax_pos[i] || PetscRealPart(-rval[j]) > gamg->threshold*Amax_neg[i])) { 4448e6d0c30SPeter Brune row_f = i + fs; 4458e6d0c30SPeter Brune row_c = lcid[col]; 4468e6d0c30SPeter Brune /* set the values for on-processor ones */ 4471ce39c63SPeter Brune if (PetscRealPart(rval[j]) < 0.) { 4481ce39c63SPeter Brune pij = rval[j]*alpha*invdiag; 4498e6d0c30SPeter Brune } else { 4501ce39c63SPeter Brune pij = rval[j]*beta*invdiag; 4518e6d0c30SPeter Brune } 4528e6d0c30SPeter Brune if (PetscAbsScalar(pij) != 0.) { 4538e6d0c30SPeter Brune pvals[idx] = pij; 4548e6d0c30SPeter Brune pcols[idx] = row_c; 4558e6d0c30SPeter Brune idx++; 4568e6d0c30SPeter Brune } 4578e6d0c30SPeter Brune } 4588e6d0c30SPeter Brune } 4591ce39c63SPeter Brune ierr = MatRestoreRow(lA,i,&ncols,&rcol,&rval);CHKERRQ(ierr); 4608e6d0c30SPeter Brune /* off */ 4611ce39c63SPeter Brune if (gA) { 4621ce39c63SPeter Brune ierr = MatGetRow(gA,i,&ncols,&rcol,&rval);CHKERRQ(ierr); 4638e6d0c30SPeter Brune for (j = 0; j < ncols; j++) { 4641ce39c63SPeter Brune col = rcol[j]; 4651ce39c63SPeter Brune if (gcid[col] >= 0 && (PetscRealPart(rval[j]) > gamg->threshold*Amax_pos[i] || PetscRealPart(-rval[j]) > gamg->threshold*Amax_neg[i])) { 4668e6d0c30SPeter Brune row_f = i + fs; 4678e6d0c30SPeter Brune row_c = gcid[col]; 4688e6d0c30SPeter Brune /* set the values for on-processor ones */ 4691ce39c63SPeter Brune if (PetscRealPart(rval[j]) < 0.) { 4701ce39c63SPeter Brune pij = rval[j]*alpha*invdiag; 4718e6d0c30SPeter Brune } else { 4721ce39c63SPeter Brune pij = rval[j]*beta*invdiag; 4738e6d0c30SPeter Brune } 4748e6d0c30SPeter Brune if (PetscAbsScalar(pij) != 0.) 
{ 4758e6d0c30SPeter Brune pvals[idx] = pij; 4768e6d0c30SPeter Brune pcols[idx] = row_c; 4778e6d0c30SPeter Brune idx++; 4788e6d0c30SPeter Brune } 4798e6d0c30SPeter Brune } 4808e6d0c30SPeter Brune } 4811ce39c63SPeter Brune ierr = MatRestoreRow(gA,i,&ncols,&rcol,&rval);CHKERRQ(ierr); 4823c9ab2c3SPeter Brune } 4838e6d0c30SPeter Brune ierr = MatSetValues(*P,1,&row_f,idx,pcols,pvals,INSERT_VALUES);CHKERRQ(ierr); 4848e6d0c30SPeter Brune } 4858e6d0c30SPeter Brune } 4863c9ab2c3SPeter Brune 4878e6d0c30SPeter Brune ierr = MatAssemblyBegin(*P, MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 4888e6d0c30SPeter Brune ierr = MatAssemblyEnd(*P, MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 4898e6d0c30SPeter Brune 4908e6d0c30SPeter Brune ierr = PetscFree(lsparse);CHKERRQ(ierr); 4918e6d0c30SPeter Brune ierr = PetscFree(gsparse);CHKERRQ(ierr); 4928e6d0c30SPeter Brune ierr = PetscFree(pcols);CHKERRQ(ierr); 4938e6d0c30SPeter Brune ierr = PetscFree(pvals);CHKERRQ(ierr); 4941ce39c63SPeter Brune ierr = PetscFree(Amax_pos);CHKERRQ(ierr); 4951ce39c63SPeter Brune ierr = PetscFree(Amax_neg);CHKERRQ(ierr); 4968e6d0c30SPeter Brune ierr = PetscFree(lcid);CHKERRQ(ierr); 4971ce39c63SPeter Brune if (gA) {ierr = PetscFree(gcid);CHKERRQ(ierr);} 4988e6d0c30SPeter Brune 4998e6d0c30SPeter Brune PetscFunctionReturn(0); 5008e6d0c30SPeter Brune } 5018e6d0c30SPeter Brune 5028e6d0c30SPeter Brune #undef __FUNCT__ 503*f9a65ec8SPeter Brune #define __FUNCT__ "PCGAMGProlongator_Standard_Classical" 504*f9a65ec8SPeter Brune PetscErrorCode PCGAMGProlongator_Standard_Classical(PC pc, const Mat A, const Mat G, PetscCoarsenData *agg_lists,Mat *P) 505*f9a65ec8SPeter Brune { 506*f9a65ec8SPeter Brune PetscErrorCode ierr; 507*f9a65ec8SPeter Brune Mat *lA; 508*f9a65ec8SPeter Brune Vec lv,v,cv; 509*f9a65ec8SPeter Brune PetscScalar *lcid; 510*f9a65ec8SPeter Brune IS lis; 511*f9a65ec8SPeter Brune PetscInt fs,fe,cs,ce,nl,i,j,k,li,lni,ci; 512*f9a65ec8SPeter Brune VecScatter lscat; 513*f9a65ec8SPeter Brune PetscInt fn,cn,cid,c_indx; 514*f9a65ec8SPeter 
Brune PetscBool iscoarse; 515*f9a65ec8SPeter Brune PetscScalar c_scalar; 516*f9a65ec8SPeter Brune const PetscScalar *vcol; 517*f9a65ec8SPeter Brune const PetscInt *icol; 518*f9a65ec8SPeter Brune const PetscInt *gidx; 519*f9a65ec8SPeter Brune PetscInt ncols; 520*f9a65ec8SPeter Brune PetscInt *lsparse,*gsparse; 521*f9a65ec8SPeter Brune MatType mtype; 522*f9a65ec8SPeter Brune PetscInt maxcols; 523*f9a65ec8SPeter Brune PetscReal g_pos,g_neg,a_pos,a_neg,diag,invdiag,alpha,beta; 524*f9a65ec8SPeter Brune /* PetscReal jdiag,invjdiag; */ 525*f9a65ec8SPeter Brune PetscReal *amax_pos,*amax_neg; 526*f9a65ec8SPeter Brune PetscScalar *pvcol,vi; 527*f9a65ec8SPeter Brune PetscInt *picol; 528*f9a65ec8SPeter Brune PetscInt pncols; 529*f9a65ec8SPeter Brune PetscScalar *pcontrib,pentry; 530*f9a65ec8SPeter Brune PC_MG *mg = (PC_MG*)pc->data; 531*f9a65ec8SPeter Brune PC_GAMG *gamg = (PC_GAMG*)mg->innerctx; 532*f9a65ec8SPeter Brune 533*f9a65ec8SPeter Brune PetscFunctionBegin; 534*f9a65ec8SPeter Brune 535*f9a65ec8SPeter Brune ierr = MatGetOwnershipRange(A,&fs,&fe);CHKERRQ(ierr); 536*f9a65ec8SPeter Brune fn = fe-fs; 537*f9a65ec8SPeter Brune ierr = MatGetVecs(A,NULL,&v);CHKERRQ(ierr); 538*f9a65ec8SPeter Brune ierr = ISCreateStride(PETSC_COMM_SELF,fe-fs,fs,1,&lis);CHKERRQ(ierr); 539*f9a65ec8SPeter Brune /* increase the overlap by two to get neighbors of neighbors */ 540*f9a65ec8SPeter Brune ierr = MatIncreaseOverlap(A,1,&lis,2);CHKERRQ(ierr); 541*f9a65ec8SPeter Brune ierr = ISSort(lis);CHKERRQ(ierr); 542*f9a65ec8SPeter Brune /* get the local part of A */ 543*f9a65ec8SPeter Brune ierr = MatGetSubMatrices(A,1,&lis,&lis,MAT_INITIAL_MATRIX,&lA);CHKERRQ(ierr); 544*f9a65ec8SPeter Brune /* build the scatter out of it */ 545*f9a65ec8SPeter Brune ierr = ISGetLocalSize(lis,&nl);CHKERRQ(ierr); 546*f9a65ec8SPeter Brune ierr = VecCreateSeq(PETSC_COMM_SELF,nl,&lv);CHKERRQ(ierr); 547*f9a65ec8SPeter Brune ierr = VecScatterCreate(v,lis,lv,NULL,&lscat);CHKERRQ(ierr); 548*f9a65ec8SPeter Brune 
549*f9a65ec8SPeter Brune ierr = PetscMalloc(sizeof(PetscInt)*fn,&lsparse);CHKERRQ(ierr); 550*f9a65ec8SPeter Brune ierr = PetscMalloc(sizeof(PetscInt)*fn,&gsparse);CHKERRQ(ierr); 551*f9a65ec8SPeter Brune ierr = PetscMalloc(sizeof(PetscScalar)*nl,&amax_pos);CHKERRQ(ierr); 552*f9a65ec8SPeter Brune ierr = PetscMalloc(sizeof(PetscScalar)*nl,&amax_neg);CHKERRQ(ierr); 553*f9a65ec8SPeter Brune ierr = PetscMalloc(sizeof(PetscScalar)*nl,&pcontrib);CHKERRQ(ierr); 554*f9a65ec8SPeter Brune 555*f9a65ec8SPeter Brune /* create coarse vector */ 556*f9a65ec8SPeter Brune cn = 0; 557*f9a65ec8SPeter Brune for (i=0;i<fn;i++) { 558*f9a65ec8SPeter Brune ierr = PetscCDEmptyAt(agg_lists,i,&iscoarse);CHKERRQ(ierr); 559*f9a65ec8SPeter Brune if (!iscoarse) { 560*f9a65ec8SPeter Brune cn++; 561*f9a65ec8SPeter Brune } 562*f9a65ec8SPeter Brune } 563*f9a65ec8SPeter Brune ierr = VecCreateMPI(PetscObjectComm((PetscObject)A),cn,PETSC_DECIDE,&cv);CHKERRQ(ierr); 564*f9a65ec8SPeter Brune ierr = VecGetOwnershipRange(cv,&cs,&ce);CHKERRQ(ierr); 565*f9a65ec8SPeter Brune cn = 0; 566*f9a65ec8SPeter Brune for (i=0;i<fn;i++) { 567*f9a65ec8SPeter Brune ierr = PetscCDEmptyAt(agg_lists,i,&iscoarse); CHKERRQ(ierr); 568*f9a65ec8SPeter Brune if (!iscoarse) { 569*f9a65ec8SPeter Brune cid = cs+cn; 570*f9a65ec8SPeter Brune cn++; 571*f9a65ec8SPeter Brune } else { 572*f9a65ec8SPeter Brune cid = -1; 573*f9a65ec8SPeter Brune } 574*f9a65ec8SPeter Brune c_scalar = (PetscScalar)cid; 575*f9a65ec8SPeter Brune c_indx = fs+i; 576*f9a65ec8SPeter Brune ierr = VecSetValues(v,1,&c_indx,&c_scalar,INSERT_VALUES);CHKERRQ(ierr); 577*f9a65ec8SPeter Brune } 578*f9a65ec8SPeter Brune ierr = VecScatterBegin(lscat,v,lv,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 579*f9a65ec8SPeter Brune ierr = VecScatterEnd(lscat,v,lv,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 580*f9a65ec8SPeter Brune /* count to preallocate the prolongator */ 581*f9a65ec8SPeter Brune ierr = ISGetIndices(lis,&gidx);CHKERRQ(ierr); 582*f9a65ec8SPeter Brune ierr = 
VecGetArray(lv,&lcid);CHKERRQ(ierr); 583*f9a65ec8SPeter Brune maxcols = 0; 584*f9a65ec8SPeter Brune for (i=0;i<nl;i++) { 585*f9a65ec8SPeter Brune amax_pos[i] = 0.; 586*f9a65ec8SPeter Brune amax_neg[i] = 0.; 587*f9a65ec8SPeter Brune pcontrib[i] = 0.; 588*f9a65ec8SPeter Brune ierr = MatGetRow(lA[0],i,&ncols,&icol,&vcol);CHKERRQ(ierr); 589*f9a65ec8SPeter Brune for (j=0;j<ncols;j++) { 590*f9a65ec8SPeter Brune if (i != icol[j]) { 591*f9a65ec8SPeter Brune if (PetscRealPart(vcol[j]) > 0.) { 592*f9a65ec8SPeter Brune if (amax_pos[i] < PetscAbsScalar(vcol[j])) amax_pos[i] = PetscAbsScalar(vcol[j]); 593*f9a65ec8SPeter Brune } else { 594*f9a65ec8SPeter Brune if (amax_neg[i] < PetscAbsScalar(vcol[j])) amax_neg[i] = PetscAbsScalar(vcol[j]); 595*f9a65ec8SPeter Brune } 596*f9a65ec8SPeter Brune } 597*f9a65ec8SPeter Brune } 598*f9a65ec8SPeter Brune ierr = MatRestoreRow(lA[0],i,&ncols,&icol,&vcol);CHKERRQ(ierr); 599*f9a65ec8SPeter Brune } 600*f9a65ec8SPeter Brune /* count the number of unique contributing coarse cells for each fine */ 601*f9a65ec8SPeter Brune for (i=0;i<nl;i++) { 602*f9a65ec8SPeter Brune if (gidx[i] >= fs && gidx[i] < fe) { 603*f9a65ec8SPeter Brune li = gidx[i] - fs; 604*f9a65ec8SPeter Brune lsparse[li] = 0; 605*f9a65ec8SPeter Brune gsparse[li] = 0; 606*f9a65ec8SPeter Brune cid = (PetscInt)lcid[i]; 607*f9a65ec8SPeter Brune if (cid >= 0) { 608*f9a65ec8SPeter Brune lsparse[li] = 1; 609*f9a65ec8SPeter Brune } else { 610*f9a65ec8SPeter Brune ierr = MatGetRow(lA[0],i,&ncols,&icol,&vcol);CHKERRQ(ierr); 611*f9a65ec8SPeter Brune for (j=0;j<ncols;j++) { 612*f9a65ec8SPeter Brune } 613*f9a65ec8SPeter Brune for (j=0;j<ncols;j++) { 614*f9a65ec8SPeter Brune if ((PetscInt)lcid[icol[j]] >= 0) { 615*f9a65ec8SPeter Brune pcontrib[icol[j]] = 1.; 616*f9a65ec8SPeter Brune } else { 617*f9a65ec8SPeter Brune ci = icol[j]; 618*f9a65ec8SPeter Brune ierr = MatRestoreRow(lA[0],i,&ncols,&icol,&vcol);CHKERRQ(ierr); 619*f9a65ec8SPeter Brune ierr = 
MatGetRow(lA[0],ci,&ncols,&icol,&vcol);CHKERRQ(ierr); 620*f9a65ec8SPeter Brune for (k=0;k<ncols;k++) { 621*f9a65ec8SPeter Brune if ((PetscInt)lcid[icol[k]] >= 0) { 622*f9a65ec8SPeter Brune pcontrib[icol[k]] = 1.; 623*f9a65ec8SPeter Brune } 624*f9a65ec8SPeter Brune } 625*f9a65ec8SPeter Brune ierr = MatRestoreRow(lA[0],ci,&ncols,&icol,&vcol);CHKERRQ(ierr); 626*f9a65ec8SPeter Brune ierr = MatGetRow(lA[0],i,&ncols,&icol,&vcol);CHKERRQ(ierr); 627*f9a65ec8SPeter Brune } 628*f9a65ec8SPeter Brune } 629*f9a65ec8SPeter Brune for (j=0;j<ncols;j++) { 630*f9a65ec8SPeter Brune if (lcid[icol[j]] >= 0 && pcontrib[icol[j]] != 0.) { 631*f9a65ec8SPeter Brune /* the neighbor is a coarse node */ 632*f9a65ec8SPeter Brune lni = (PetscInt)lcid[icol[j]]; 633*f9a65ec8SPeter Brune if (lni >= cs && lni < ce) { 634*f9a65ec8SPeter Brune lsparse[li]++; 635*f9a65ec8SPeter Brune } else { 636*f9a65ec8SPeter Brune gsparse[li]++; 637*f9a65ec8SPeter Brune } 638*f9a65ec8SPeter Brune pcontrib[icol[j]] = 0.; 639*f9a65ec8SPeter Brune } else { 640*f9a65ec8SPeter Brune /* the neighbor is a strongly connected fine node */ 641*f9a65ec8SPeter Brune ci = icol[j]; 642*f9a65ec8SPeter Brune ierr = MatRestoreRow(lA[0],i,&ncols,&icol,&vcol);CHKERRQ(ierr); 643*f9a65ec8SPeter Brune ierr = MatGetRow(lA[0],ci,&ncols,&icol,&vcol);CHKERRQ(ierr); 644*f9a65ec8SPeter Brune for (k=0;k<ncols;k++) { 645*f9a65ec8SPeter Brune if (lcid[icol[k]] >= 0 && pcontrib[icol[k]] != 0.) 
{ 646*f9a65ec8SPeter Brune lni = (PetscInt)lcid[icol[k]]; 647*f9a65ec8SPeter Brune if (lni >= cs && lni < ce) { 648*f9a65ec8SPeter Brune lsparse[li]++; 649*f9a65ec8SPeter Brune } else { 650*f9a65ec8SPeter Brune gsparse[li]++; 651*f9a65ec8SPeter Brune } 652*f9a65ec8SPeter Brune pcontrib[icol[k]] = 0.; 653*f9a65ec8SPeter Brune } 654*f9a65ec8SPeter Brune } 655*f9a65ec8SPeter Brune ierr = MatRestoreRow(lA[0],ci,&ncols,&icol,&vcol);CHKERRQ(ierr); 656*f9a65ec8SPeter Brune ierr = MatGetRow(lA[0],i,&ncols,&icol,&vcol);CHKERRQ(ierr); 657*f9a65ec8SPeter Brune } 658*f9a65ec8SPeter Brune } 659*f9a65ec8SPeter Brune if (lsparse[li] + gsparse[li] > maxcols) maxcols = lsparse[li] + gsparse[li]; 660*f9a65ec8SPeter Brune ierr = MatRestoreRow(lA[0],i,&ncols,&icol,&vcol);CHKERRQ(ierr); 661*f9a65ec8SPeter Brune } 662*f9a65ec8SPeter Brune } 663*f9a65ec8SPeter Brune } 664*f9a65ec8SPeter Brune ierr = PetscMalloc(sizeof(PetscInt)*maxcols,&picol);CHKERRQ(ierr); 665*f9a65ec8SPeter Brune ierr = PetscMalloc(sizeof(PetscScalar)*maxcols,&pvcol);CHKERRQ(ierr); 666*f9a65ec8SPeter Brune ierr = MatCreate(PetscObjectComm((PetscObject)A),P);CHKERRQ(ierr); 667*f9a65ec8SPeter Brune ierr = MatGetType(A,&mtype);CHKERRQ(ierr); 668*f9a65ec8SPeter Brune ierr = MatSetType(*P,mtype);CHKERRQ(ierr); 669*f9a65ec8SPeter Brune 670*f9a65ec8SPeter Brune ierr = MatSetSizes(*P,fn,cn,PETSC_DETERMINE,PETSC_DETERMINE);CHKERRQ(ierr); 671*f9a65ec8SPeter Brune ierr = MatMPIAIJSetPreallocation(*P,0,lsparse,0,gsparse);CHKERRQ(ierr); 672*f9a65ec8SPeter Brune ierr = MatSeqAIJSetPreallocation(*P,0,lsparse);CHKERRQ(ierr); 673*f9a65ec8SPeter Brune for (i=0;i<nl;i++) { 674*f9a65ec8SPeter Brune if (gidx[i] >= fs && gidx[i] < fe) { 675*f9a65ec8SPeter Brune a_pos = 0.; 676*f9a65ec8SPeter Brune a_neg = 0.; 677*f9a65ec8SPeter Brune g_pos = 0.; 678*f9a65ec8SPeter Brune g_neg = 0.; 679*f9a65ec8SPeter Brune li = gidx[i] - fs; 680*f9a65ec8SPeter Brune pncols=0; 681*f9a65ec8SPeter Brune cid = (PetscInt)lcid[i]; 682*f9a65ec8SPeter Brune if 
(cid >= 0) { 683*f9a65ec8SPeter Brune pncols = 1; 684*f9a65ec8SPeter Brune picol[0] = cid; 685*f9a65ec8SPeter Brune pvcol[0] = 1.; 686*f9a65ec8SPeter Brune } else { 687*f9a65ec8SPeter Brune ierr = MatGetRow(lA[0],i,&ncols,&icol,&vcol);CHKERRQ(ierr); 688*f9a65ec8SPeter Brune for (j=0;j<ncols;j++) { 689*f9a65ec8SPeter Brune if (icol[j] == i) { 690*f9a65ec8SPeter Brune diag = vcol[j]; 691*f9a65ec8SPeter Brune } else { 692*f9a65ec8SPeter Brune if ((PetscInt)lcid[icol[j]] >= 0 && (PetscRealPart(vcol[j]) > gamg->threshold*amax_pos[i] || PetscRealPart(-vcol[j]) > gamg->threshold*amax_neg[i])) { 693*f9a65ec8SPeter Brune if (PetscRealPart(vcol[j]) > 0.) { 694*f9a65ec8SPeter Brune g_pos += vcol[j]; 695*f9a65ec8SPeter Brune } else { 696*f9a65ec8SPeter Brune g_neg += vcol[j]; 697*f9a65ec8SPeter Brune } 698*f9a65ec8SPeter Brune } 699*f9a65ec8SPeter Brune if (PetscRealPart(vcol[j]) > 0.) { 700*f9a65ec8SPeter Brune a_pos += vcol[j]; 701*f9a65ec8SPeter Brune } else { 702*f9a65ec8SPeter Brune a_neg += vcol[j]; 703*f9a65ec8SPeter Brune } 704*f9a65ec8SPeter Brune } 705*f9a65ec8SPeter Brune } 706*f9a65ec8SPeter Brune if (g_neg == 0.) { 707*f9a65ec8SPeter Brune alpha = 0.; 708*f9a65ec8SPeter Brune } else { 709*f9a65ec8SPeter Brune alpha = a_neg/g_neg; 710*f9a65ec8SPeter Brune } 711*f9a65ec8SPeter Brune if (g_pos == 0.) { 712*f9a65ec8SPeter Brune diag += a_pos; 713*f9a65ec8SPeter Brune beta = 0.; 714*f9a65ec8SPeter Brune } else { 715*f9a65ec8SPeter Brune beta = a_pos/g_pos; 716*f9a65ec8SPeter Brune } 717*f9a65ec8SPeter Brune invdiag = 0; 718*f9a65ec8SPeter Brune if (diag != 0.) { 719*f9a65ec8SPeter Brune invdiag = 1./diag; 720*f9a65ec8SPeter Brune } 721*f9a65ec8SPeter Brune for (j=0;j<ncols;j++) { 722*f9a65ec8SPeter Brune if (PetscRealPart(vcol[j]) > gamg->threshold*amax_pos[i] || PetscRealPart(-vcol[j]) > gamg->threshold*amax_neg[i]) { 723*f9a65ec8SPeter Brune if (PetscRealPart(vcol[j]) < 0.) 
{ 724*f9a65ec8SPeter Brune pentry = -vcol[j]*invdiag*alpha; 725*f9a65ec8SPeter Brune } else { 726*f9a65ec8SPeter Brune pentry = -vcol[j]*invdiag*beta; 727*f9a65ec8SPeter Brune } 728*f9a65ec8SPeter Brune if ((PetscInt)lcid[icol[j]] >= 0) { 729*f9a65ec8SPeter Brune /* coarse neighbor */ 730*f9a65ec8SPeter Brune pcontrib[icol[j]] = pentry; 731*f9a65ec8SPeter Brune } else { 732*f9a65ec8SPeter Brune /* the neighbor is a strongly connected fine node */ 733*f9a65ec8SPeter Brune ci = icol[j]; 734*f9a65ec8SPeter Brune vi = vcol[j]; 735*f9a65ec8SPeter Brune ierr = MatRestoreRow(lA[0],i,&ncols,&icol,&vcol);CHKERRQ(ierr); 736*f9a65ec8SPeter Brune ierr = MatGetRow(lA[0],ci,&ncols,&icol,&vcol);CHKERRQ(ierr); 737*f9a65ec8SPeter Brune jdiag = 0.; 738*f9a65ec8SPeter Brune invjdiag = 0.; 739*f9a65ec8SPeter Brune for (k=0;k<ncols;k++) { 740*f9a65ec8SPeter Brune if (ci == icol[k]) jdiag = PetscRealPart(vcol[k]); 741*f9a65ec8SPeter Brune } 742*f9a65ec8SPeter Brune if (jdiag != 0) { 743*f9a65ec8SPeter Brune invjdiag = 1. / jdiag; 744*f9a65ec8SPeter Brune } 745*f9a65ec8SPeter Brune for (k=0;k<ncols;k++) { 746*f9a65ec8SPeter Brune if ((PetscInt)lcid[icol[k]] >= 0 && (PetscAbsScalar(vcol[k]) > gamg->threshold*amax_pos[ci] || PetscRealPart(vcol[k]) < gamg->threshold*amax_neg[ci])) { 747*f9a65ec8SPeter Brune /* pcontrib[icol[k]] += -pentry*vcol[k]*invjdiag; */ 748*f9a65ec8SPeter Brune } 749*f9a65ec8SPeter Brune } 750*f9a65ec8SPeter Brune ierr = MatRestoreRow(lA[0],ci,&ncols,&icol,&vcol);CHKERRQ(ierr); 751*f9a65ec8SPeter Brune ierr = MatGetRow(lA[0],i,&ncols,&icol,&vcol);CHKERRQ(ierr); 752*f9a65ec8SPeter Brune } 753*f9a65ec8SPeter Brune } 754*f9a65ec8SPeter Brune } 755*f9a65ec8SPeter Brune for (j=0;j<ncols;j++) { 756*f9a65ec8SPeter Brune if (lcid[icol[j]] >= 0 && pcontrib[icol[j]] != 0.) 
{ 757*f9a65ec8SPeter Brune /* the neighbor is a coarse node */ 758*f9a65ec8SPeter Brune lni = (PetscInt)lcid[icol[j]]; 759*f9a65ec8SPeter Brune pvcol[pncols] = pcontrib[icol[j]]; 760*f9a65ec8SPeter Brune picol[pncols] = lni; 761*f9a65ec8SPeter Brune pcontrib[icol[j]] = 0.; 762*f9a65ec8SPeter Brune pncols++; 763*f9a65ec8SPeter Brune } else { 764*f9a65ec8SPeter Brune /* the neighbor is a strongly connected fine node */ 765*f9a65ec8SPeter Brune ci = icol[j]; 766*f9a65ec8SPeter Brune ierr = MatRestoreRow(lA[0],i,&ncols,&icol,&vcol);CHKERRQ(ierr); 767*f9a65ec8SPeter Brune ierr = MatGetRow(lA[0],ci,&ncols,&icol,&vcol);CHKERRQ(ierr); 768*f9a65ec8SPeter Brune for (k=0;k<ncols;k++) { 769*f9a65ec8SPeter Brune if (lcid[icol[k]] >= 0 && pcontrib[icol[k]] != 0.) { 770*f9a65ec8SPeter Brune lni = (PetscInt)lcid[icol[k]]; 771*f9a65ec8SPeter Brune pvcol[pncols] = pcontrib[icol[k]]; 772*f9a65ec8SPeter Brune picol[pncols] = lni; 773*f9a65ec8SPeter Brune pcontrib[icol[k]] = 0.; 774*f9a65ec8SPeter Brune pncols++; 775*f9a65ec8SPeter Brune } 776*f9a65ec8SPeter Brune } 777*f9a65ec8SPeter Brune ierr = MatRestoreRow(lA[0],ci,&ncols,&icol,&vcol);CHKERRQ(ierr); 778*f9a65ec8SPeter Brune ierr = MatGetRow(lA[0],i,&ncols,&icol,&vcol);CHKERRQ(ierr); 779*f9a65ec8SPeter Brune } 780*f9a65ec8SPeter Brune } 781*f9a65ec8SPeter Brune ierr = MatRestoreRow(lA[0],i,&ncols,&icol,&vcol);CHKERRQ(ierr); 782*f9a65ec8SPeter Brune } 783*f9a65ec8SPeter Brune ci = gidx[i]; 784*f9a65ec8SPeter Brune li = gidx[i] - fs; 785*f9a65ec8SPeter Brune if (pncols > 0) { 786*f9a65ec8SPeter Brune ierr = MatSetValues(*P,1,&ci,pncols,picol,pvcol,INSERT_VALUES);CHKERRQ(ierr); 787*f9a65ec8SPeter Brune } 788*f9a65ec8SPeter Brune } 789*f9a65ec8SPeter Brune } 790*f9a65ec8SPeter Brune 791*f9a65ec8SPeter Brune ierr = ISRestoreIndices(lis,&gidx);CHKERRQ(ierr); 792*f9a65ec8SPeter Brune ierr = VecRestoreArray(lv,&lcid);CHKERRQ(ierr); 793*f9a65ec8SPeter Brune 794*f9a65ec8SPeter Brune ierr = PetscFree(amax_pos);CHKERRQ(ierr); 
795*f9a65ec8SPeter Brune ierr = PetscFree(amax_neg);CHKERRQ(ierr); 796*f9a65ec8SPeter Brune ierr = PetscFree(pcontrib);CHKERRQ(ierr); 797*f9a65ec8SPeter Brune ierr = PetscFree(picol);CHKERRQ(ierr); 798*f9a65ec8SPeter Brune ierr = PetscFree(pvcol);CHKERRQ(ierr); 799*f9a65ec8SPeter Brune ierr = PetscFree(lsparse);CHKERRQ(ierr); 800*f9a65ec8SPeter Brune ierr = PetscFree(gsparse);CHKERRQ(ierr); 801*f9a65ec8SPeter Brune ierr = ISDestroy(&lis);CHKERRQ(ierr); 802*f9a65ec8SPeter Brune ierr = MatDestroyMatrices(1,&lA);CHKERRQ(ierr); 803*f9a65ec8SPeter Brune ierr = VecDestroy(&lv);CHKERRQ(ierr); 804*f9a65ec8SPeter Brune ierr = VecDestroy(&cv);CHKERRQ(ierr); 805*f9a65ec8SPeter Brune ierr = VecDestroy(&v);CHKERRQ(ierr); 806*f9a65ec8SPeter Brune ierr = VecScatterDestroy(&lscat);CHKERRQ(ierr); 807*f9a65ec8SPeter Brune 808*f9a65ec8SPeter Brune ierr = MatAssemblyBegin(*P, MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 809*f9a65ec8SPeter Brune ierr = MatAssemblyEnd(*P, MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 810*f9a65ec8SPeter Brune 811*f9a65ec8SPeter Brune /* 812*f9a65ec8SPeter Brune Mat Pold; 813*f9a65ec8SPeter Brune ierr = PCGAMGProlongator_Classical(pc,A,G,agg_lists,&Pold);CHKERRQ(ierr); 814*f9a65ec8SPeter Brune ierr = MatView(Pold,PETSC_VIEWER_STDOUT_WORLD);CHKERRQ(ierr); 815*f9a65ec8SPeter Brune ierr = MatView(*P,PETSC_VIEWER_STDOUT_WORLD);CHKERRQ(ierr); 816*f9a65ec8SPeter Brune ierr = MatDestroy(&Pold);CHKERRQ(ierr); 817*f9a65ec8SPeter Brune */ 818*f9a65ec8SPeter Brune 819*f9a65ec8SPeter Brune PetscFunctionReturn(0); 820*f9a65ec8SPeter Brune } 821*f9a65ec8SPeter Brune 822*f9a65ec8SPeter Brune #undef __FUNCT__ 8238e6d0c30SPeter Brune #define __FUNCT__ "PCGAMGDestroy_Classical" 8248e6d0c30SPeter Brune /* PCGAMGDestroy_Classical - frees the sub-context stored in pc_gamg->subctx, where pc_gamg is the PC_GAMG reached through pc->data (a PC_MG) and its innerctx field. The PetscFree() result is checked with CHKERRQ and the routine finishes with PetscFunctionReturn(0). */ PetscErrorCode PCGAMGDestroy_Classical(PC pc) 8258e6d0c30SPeter Brune { 8268e6d0c30SPeter Brune PetscErrorCode ierr; 8278e6d0c30SPeter Brune PC_MG *mg = (PC_MG*)pc->data; 8288e6d0c30SPeter Brune PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 8298e6d0c30SPeter Brune 8308e6d0c30SPeter Brune
PetscFunctionBegin; 8318e6d0c30SPeter Brune ierr = PetscFree(pc_gamg->subctx);CHKERRQ(ierr); 8328e6d0c30SPeter Brune PetscFunctionReturn(0); 8338e6d0c30SPeter Brune } 8348e6d0c30SPeter Brune 8358e6d0c30SPeter Brune #undef __FUNCT__ 8368e6d0c30SPeter Brune #define __FUNCT__ "PCGAMGSetFromOptions_Classical" 8378e6d0c30SPeter Brune /* PCGAMGSetFromOptions_Classical - currently a no-op: the body consists only of PetscFunctionBegin and PetscFunctionReturn(0), and pc is not read. */ PetscErrorCode PCGAMGSetFromOptions_Classical(PC pc) 8388e6d0c30SPeter Brune { 8398e6d0c30SPeter Brune PetscFunctionBegin; 8408e6d0c30SPeter Brune PetscFunctionReturn(0); 8418e6d0c30SPeter Brune } 8428e6d0c30SPeter Brune 8438e6d0c30SPeter Brune #undef __FUNCT__ 8448e6d0c30SPeter Brune #define __FUNCT__ "PCGAMGSetData_Classical" 8458e6d0c30SPeter Brune /* PCGAMGSetData_Classical - clears the data fields of the PC_GAMG context reached through pc->data and innerctx: data is set to NULL, and data_cell_cols, data_cell_rows and data_sz are set to 0. The Mat argument A is not referenced in the body. Always ends with PetscFunctionReturn(0). */ PetscErrorCode PCGAMGSetData_Classical(PC pc, Mat A) 8468e6d0c30SPeter Brune { 8478e6d0c30SPeter Brune PC_MG *mg = (PC_MG*)pc->data; 8488e6d0c30SPeter Brune PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 8498e6d0c30SPeter Brune 8508e6d0c30SPeter Brune PetscFunctionBegin; 8518e6d0c30SPeter Brune /* no data for classical AMG */ 8528e6d0c30SPeter Brune pc_gamg->data = NULL; 853d2050638SMark Adams pc_gamg->data_cell_cols = 0; 854d2050638SMark Adams pc_gamg->data_cell_rows = 0; 8558e6d0c30SPeter Brune pc_gamg->data_sz = 0; 8568e6d0c30SPeter Brune PetscFunctionReturn(0); 8578e6d0c30SPeter Brune } 8588e6d0c30SPeter Brune 8598e6d0c30SPeter Brune /* -------------------------------------------------------------------------- */ 8608e6d0c30SPeter Brune /* 8618e6d0c30SPeter Brune PCCreateGAMG_Classical - installs the classical variant on the PC_GAMG context reached through pc->data and innerctx: allocates a PC_GAMG_Classical with PetscNewLog() and stores it in subctx, sets pc->ops->setfromoptions, and fills the pc_gamg->ops table (destroy, graph, coarsen, prolongator, createdefaultdata; optprol is set to NULL). If subctx is already non-NULL on entry, PCDestroy_GAMG(pc) is called first. 8628e6d0c30SPeter Brune 8638e6d0c30SPeter Brune */ 8648e6d0c30SPeter Brune #undef __FUNCT__ 8658e6d0c30SPeter Brune #define __FUNCT__ "PCCreateGAMG_Classical" 8668e6d0c30SPeter Brune PetscErrorCode PCCreateGAMG_Classical(PC pc) 8678e6d0c30SPeter Brune { 8688e6d0c30SPeter Brune PetscErrorCode ierr; 8698e6d0c30SPeter Brune PC_MG *mg = (PC_MG*)pc->data; 8708e6d0c30SPeter Brune PC_GAMG *pc_gamg = (PC_GAMG*)mg->innerctx; 8718e6d0c30SPeter Brune PC_GAMG_Classical *pc_gamg_classical; 8728e6d0c30SPeter Brune
8738e6d0c30SPeter Brune PetscFunctionBegin; 8748e6d0c30SPeter Brune if (pc_gamg->subctx) { 8758e6d0c30SPeter Brune /* call base class */ /* NOTE(review): mg and pc_gamg were read from pc before this call and are dereferenced again below; confirm that PCDestroy_GAMG leaves pc->data and its innerctx valid */ 8768e6d0c30SPeter Brune ierr = PCDestroy_GAMG(pc);CHKERRQ(ierr); 8778e6d0c30SPeter Brune } 8788e6d0c30SPeter Brune 8798e6d0c30SPeter Brune /* create sub context for classical AMG (a PC_GAMG_Classical) */ 8808e6d0c30SPeter Brune ierr = PetscNewLog(pc, PC_GAMG_Classical, &pc_gamg_classical);CHKERRQ(ierr); 8818e6d0c30SPeter Brune pc_gamg->subctx = pc_gamg_classical; 8828e6d0c30SPeter Brune pc->ops->setfromoptions = PCGAMGSetFromOptions_Classical; 8838e6d0c30SPeter Brune /* reset does not do anything; setup not virtual */ 8848e6d0c30SPeter Brune 8858e6d0c30SPeter Brune /* set internal function pointers */ 8868e6d0c30SPeter Brune pc_gamg->ops->destroy = PCGAMGDestroy_Classical; 8878e6d0c30SPeter Brune pc_gamg->ops->graph = PCGAMGGraph_Classical; 8888e6d0c30SPeter Brune pc_gamg->ops->coarsen = PCGAMGCoarsen_Classical; 889*f9a65ec8SPeter Brune pc_gamg->ops->prolongator = PCGAMGProlongator_Standard_Classical; 8908e6d0c30SPeter Brune pc_gamg->ops->optprol = NULL; 8918e6d0c30SPeter Brune 8928e6d0c30SPeter Brune pc_gamg->ops->createdefaultdata = PCGAMGSetData_Classical; 8938e6d0c30SPeter Brune PetscFunctionReturn(0); 8948e6d0c30SPeter Brune } 895