xref: /petsc/src/ksp/pc/impls/gamg/util.c (revision ffc4695bcb29f4b022f59a5fd6bc99fc280ff6d8)
16618991cSMark Adams /*
26618991cSMark Adams  GAMG geometric-algebric multigrid PC - Mark Adams 2011
36618991cSMark Adams  */
46618991cSMark Adams #include <petsc/private/matimpl.h>
56618991cSMark Adams #include <../src/ksp/pc/impls/gamg/gamg.h>           /*I "petscpc.h" I*/
66618991cSMark Adams 
76618991cSMark Adams /*
86618991cSMark Adams    Produces a set of block column indices of the matrix row, one for each block represented in the original row
96618991cSMark Adams 
106618991cSMark Adams    n - the number of block indices in cc[]
116618991cSMark Adams    cc - the block indices (must be large enough to contain the indices)
126618991cSMark Adams */
136618991cSMark Adams PETSC_STATIC_INLINE PetscErrorCode MatCollapseRow(Mat Amat,PetscInt row,PetscInt bs,PetscInt *n,PetscInt *cc)
146618991cSMark Adams {
156618991cSMark Adams   PetscInt       cnt = -1,nidx,j;
166618991cSMark Adams   const PetscInt *idx;
176618991cSMark Adams   PetscErrorCode ierr;
186618991cSMark Adams 
196618991cSMark Adams   PetscFunctionBegin;
206618991cSMark Adams   ierr = MatGetRow(Amat,row,&nidx,&idx,NULL);CHKERRQ(ierr);
216618991cSMark Adams   if (nidx) {
226618991cSMark Adams     cnt = 0;
236618991cSMark Adams     cc[cnt] = idx[0]/bs;
246618991cSMark Adams     for (j=1; j<nidx; j++) {
256618991cSMark Adams       if (cc[cnt] < idx[j]/bs) cc[++cnt] = idx[j]/bs;
266618991cSMark Adams     }
276618991cSMark Adams   }
286618991cSMark Adams   ierr = MatRestoreRow(Amat,row,&nidx,&idx,NULL);CHKERRQ(ierr);
296618991cSMark Adams   *n = cnt+1;
306618991cSMark Adams   PetscFunctionReturn(0);
316618991cSMark Adams }
326618991cSMark Adams 
336618991cSMark Adams /*
346618991cSMark Adams     Produces a set of block column indices of the matrix block row, one for each block represented in the original set of rows
356618991cSMark Adams 
366618991cSMark Adams     ncollapsed - the number of block indices
376618991cSMark Adams     collapsed - the block indices (must be large enough to contain the indices)
386618991cSMark Adams */
396618991cSMark Adams PETSC_STATIC_INLINE PetscErrorCode MatCollapseRows(Mat Amat,PetscInt start,PetscInt bs,PetscInt *w0,PetscInt *w1,PetscInt *w2,PetscInt *ncollapsed,PetscInt **collapsed)
406618991cSMark Adams {
416618991cSMark Adams   PetscInt       i,nprev,*cprev = w0,ncur = 0,*ccur = w1,*merged = w2,*cprevtmp;
426618991cSMark Adams   PetscErrorCode ierr;
436618991cSMark Adams 
446618991cSMark Adams   PetscFunctionBegin;
456618991cSMark Adams   ierr = MatCollapseRow(Amat,start,bs,&nprev,cprev);CHKERRQ(ierr);
466618991cSMark Adams   for (i=start+1; i<start+bs; i++) {
476618991cSMark Adams     ierr  = MatCollapseRow(Amat,i,bs,&ncur,ccur);CHKERRQ(ierr);
486618991cSMark Adams     ierr  = PetscMergeIntArray(nprev,cprev,ncur,ccur,&nprev,&merged);CHKERRQ(ierr);
496618991cSMark Adams     cprevtmp = cprev; cprev = merged; merged = cprevtmp;
506618991cSMark Adams   }
516618991cSMark Adams   *ncollapsed = nprev;
526618991cSMark Adams   if (collapsed) *collapsed  = cprev;
536618991cSMark Adams   PetscFunctionReturn(0);
546618991cSMark Adams }
556618991cSMark Adams 
566618991cSMark Adams 
576618991cSMark Adams /* -------------------------------------------------------------------------- */
586618991cSMark Adams /*
596618991cSMark Adams    PCGAMGCreateGraph - create simple scaled scalar graph from matrix
606618991cSMark Adams 
616618991cSMark Adams  Input Parameter:
626618991cSMark Adams  . Amat - matrix
636618991cSMark Adams  Output Parameter:
646618991cSMark Adams  . a_Gmaat - eoutput scalar graph (symmetric?)
656618991cSMark Adams  */
666618991cSMark Adams PetscErrorCode PCGAMGCreateGraph(Mat Amat, Mat *a_Gmat)
676618991cSMark Adams {
686618991cSMark Adams   PetscErrorCode ierr;
69f42dcbb3SMark Adams   PetscInt       Istart,Iend,Ii,jj,kk,ncols,nloc,NN,MM,bs;
706618991cSMark Adams   MPI_Comm       comm;
716618991cSMark Adams   Mat            Gmat;
726618991cSMark Adams 
736618991cSMark Adams   PetscFunctionBegin;
746618991cSMark Adams   ierr = PetscObjectGetComm((PetscObject)Amat,&comm);CHKERRQ(ierr);
756618991cSMark Adams   ierr = MatGetOwnershipRange(Amat, &Istart, &Iend);CHKERRQ(ierr);
766618991cSMark Adams   ierr = MatGetSize(Amat, &MM, &NN);CHKERRQ(ierr);
776618991cSMark Adams   ierr = MatGetBlockSize(Amat, &bs);CHKERRQ(ierr);
786618991cSMark Adams   nloc = (Iend-Istart)/bs;
796618991cSMark Adams 
806618991cSMark Adams #if defined PETSC_GAMG_USE_LOG
816618991cSMark Adams   ierr = PetscLogEventBegin(petsc_gamg_setup_events[GRAPH],0,0,0,0);CHKERRQ(ierr);
826618991cSMark Adams #endif
836618991cSMark Adams 
846618991cSMark Adams   if (bs > 1) {
856618991cSMark Adams     const PetscScalar *vals;
866618991cSMark Adams     const PetscInt    *idx;
87f42dcbb3SMark Adams     PetscInt          *d_nnz, *o_nnz,*w0,*w1,*w2;
886618991cSMark Adams     PetscBool         ismpiaij,isseqaij;
896618991cSMark Adams 
906618991cSMark Adams     /*
916618991cSMark Adams        Determine the preallocation needed for the scalar matrix derived from the vector matrix.
926618991cSMark Adams     */
936618991cSMark Adams 
944099cc6bSBarry Smith     ierr = PetscObjectBaseTypeCompare((PetscObject)Amat,MATSEQAIJ,&isseqaij);CHKERRQ(ierr);
954099cc6bSBarry Smith     ierr = PetscObjectBaseTypeCompare((PetscObject)Amat,MATMPIAIJ,&ismpiaij);CHKERRQ(ierr);
966618991cSMark Adams     ierr = PetscMalloc2(nloc, &d_nnz,isseqaij ? 0 : nloc, &o_nnz);CHKERRQ(ierr);
976618991cSMark Adams 
986618991cSMark Adams     if (isseqaij) {
996618991cSMark Adams       PetscInt max_d_nnz;
1006618991cSMark Adams 
1016618991cSMark Adams       /*
1026618991cSMark Adams           Determine exact preallocation count for (sequential) scalar matrix
1036618991cSMark Adams       */
1046618991cSMark Adams       ierr = MatSeqAIJGetMaxRowNonzeros(Amat,&max_d_nnz);CHKERRQ(ierr);
1056618991cSMark Adams       max_d_nnz = PetscMin(nloc,bs*max_d_nnz);CHKERRQ(ierr);
1066618991cSMark Adams       ierr = PetscMalloc3(max_d_nnz, &w0,max_d_nnz, &w1,max_d_nnz, &w2);CHKERRQ(ierr);
1076618991cSMark Adams       for (Ii = 0, jj = 0; Ii < Iend; Ii += bs, jj++) {
1086618991cSMark Adams         ierr = MatCollapseRows(Amat,Ii,bs,w0,w1,w2,&d_nnz[jj],NULL);CHKERRQ(ierr);
1096618991cSMark Adams       }
1106618991cSMark Adams       ierr = PetscFree3(w0,w1,w2);CHKERRQ(ierr);
1116618991cSMark Adams 
1126618991cSMark Adams     } else if (ismpiaij) {
1136618991cSMark Adams       Mat            Daij,Oaij;
1146618991cSMark Adams       const PetscInt *garray;
1156618991cSMark Adams       PetscInt       max_d_nnz;
1166618991cSMark Adams 
1176618991cSMark Adams       ierr = MatMPIAIJGetSeqAIJ(Amat,&Daij,&Oaij,&garray);CHKERRQ(ierr);
1186618991cSMark Adams 
1196618991cSMark Adams       /*
1206618991cSMark Adams           Determine exact preallocation count for diagonal block portion of scalar matrix
1216618991cSMark Adams       */
1226618991cSMark Adams       ierr = MatSeqAIJGetMaxRowNonzeros(Daij,&max_d_nnz);CHKERRQ(ierr);
1236618991cSMark Adams       max_d_nnz = PetscMin(nloc,bs*max_d_nnz);CHKERRQ(ierr);
1246618991cSMark Adams       ierr = PetscMalloc3(max_d_nnz, &w0,max_d_nnz, &w1,max_d_nnz, &w2);CHKERRQ(ierr);
1256618991cSMark Adams       for (Ii = 0, jj = 0; Ii < Iend - Istart; Ii += bs, jj++) {
1266618991cSMark Adams         ierr = MatCollapseRows(Daij,Ii,bs,w0,w1,w2,&d_nnz[jj],NULL);CHKERRQ(ierr);
1276618991cSMark Adams       }
1286618991cSMark Adams       ierr = PetscFree3(w0,w1,w2);CHKERRQ(ierr);
1296618991cSMark Adams 
1306618991cSMark Adams       /*
1316618991cSMark Adams          Over estimate (usually grossly over), preallocation count for off-diagonal portion of scalar matrix
1326618991cSMark Adams       */
1336618991cSMark Adams       for (Ii = 0, jj = 0; Ii < Iend - Istart; Ii += bs, jj++) {
1346618991cSMark Adams         o_nnz[jj] = 0;
1356618991cSMark Adams         for (kk=0; kk<bs; kk++) { /* rows that get collapsed to a single row */
1360a545947SLisandro Dalcin           ierr = MatGetRow(Oaij,Ii+kk,&ncols,NULL,NULL);CHKERRQ(ierr);
1376618991cSMark Adams           o_nnz[jj] += ncols;
1380a545947SLisandro Dalcin           ierr = MatRestoreRow(Oaij,Ii+kk,&ncols,NULL,NULL);CHKERRQ(ierr);
1396618991cSMark Adams         }
1406618991cSMark Adams         if (o_nnz[jj] > (NN/bs-nloc)) o_nnz[jj] = NN/bs-nloc;
1416618991cSMark Adams       }
1426618991cSMark Adams 
143b817416eSBarry Smith     } else SETERRQ(PETSC_COMM_WORLD,PETSC_ERR_USER,"Require AIJ matrix type");
1446618991cSMark Adams 
145359038b3SMark Adams     /* get scalar copy (norms) of matrix */
1466618991cSMark Adams     ierr = MatCreate(comm, &Gmat);CHKERRQ(ierr);
1476618991cSMark Adams     ierr = MatSetSizes(Gmat,nloc,nloc,PETSC_DETERMINE,PETSC_DETERMINE);CHKERRQ(ierr);
1486618991cSMark Adams     ierr = MatSetBlockSizes(Gmat, 1, 1);CHKERRQ(ierr);
1490e263c94SMark     ierr = MatSetType(Gmat, MATAIJ);CHKERRQ(ierr);
1506618991cSMark Adams     ierr = MatSeqAIJSetPreallocation(Gmat,0,d_nnz);CHKERRQ(ierr);
1516618991cSMark Adams     ierr = MatMPIAIJSetPreallocation(Gmat,0,d_nnz,0,o_nnz);CHKERRQ(ierr);
1526618991cSMark Adams     ierr = PetscFree2(d_nnz,o_nnz);CHKERRQ(ierr);
1536618991cSMark Adams 
1546618991cSMark Adams     for (Ii = Istart; Ii < Iend; Ii++) {
1556618991cSMark Adams       PetscInt dest_row = Ii/bs;
1566618991cSMark Adams       ierr = MatGetRow(Amat,Ii,&ncols,&idx,&vals);CHKERRQ(ierr);
1576618991cSMark Adams       for (jj=0; jj<ncols; jj++) {
1586618991cSMark Adams         PetscInt    dest_col = idx[jj]/bs;
1596618991cSMark Adams         PetscScalar sv       = PetscAbs(PetscRealPart(vals[jj]));
1606618991cSMark Adams         ierr = MatSetValues(Gmat,1,&dest_row,1,&dest_col,&sv,ADD_VALUES);CHKERRQ(ierr);
1616618991cSMark Adams       }
1626618991cSMark Adams       ierr = MatRestoreRow(Amat,Ii,&ncols,&idx,&vals);CHKERRQ(ierr);
1636618991cSMark Adams     }
1646618991cSMark Adams     ierr = MatAssemblyBegin(Gmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1656618991cSMark Adams     ierr = MatAssemblyEnd(Gmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1666618991cSMark Adams   } else {
1676618991cSMark Adams     /* just copy scalar matrix - abs() not taken here but scaled later */
1686618991cSMark Adams     ierr = MatDuplicate(Amat, MAT_COPY_VALUES, &Gmat);CHKERRQ(ierr);
1696618991cSMark Adams   }
17036c1b609SStefano Zampini   ierr = MatPropagateSymmetryOptions(Amat, Gmat);CHKERRQ(ierr);
1716618991cSMark Adams 
1726618991cSMark Adams #if defined PETSC_GAMG_USE_LOG
1736618991cSMark Adams   ierr = PetscLogEventEnd(petsc_gamg_setup_events[GRAPH],0,0,0,0);CHKERRQ(ierr);
1746618991cSMark Adams #endif
1756618991cSMark Adams 
1766618991cSMark Adams   *a_Gmat = Gmat;
1776618991cSMark Adams   PetscFunctionReturn(0);
1786618991cSMark Adams }
1796618991cSMark Adams 
1806618991cSMark Adams /* -------------------------------------------------------------------------- */
181a37438d7SBarry Smith /*@C
182a37438d7SBarry Smith    PCGAMGFilterGraph - filter (remove zero and possibly small values from the) graph and make it symmetric if requested
183a37438d7SBarry Smith 
184a37438d7SBarry Smith    Collective on Mat
1856618991cSMark Adams 
1866618991cSMark Adams    Input Parameter:
187a37438d7SBarry Smith +   a_Gmat - the graph
188fd292e60Sprj- .   vfilter - threshold parameter [0,1)
189a37438d7SBarry Smith -   symm - make the result symmetric
190a37438d7SBarry Smith 
191a37438d7SBarry Smith    Level: developer
192a37438d7SBarry Smith 
19395452b02SPatrick Sanan    Notes:
19495452b02SPatrick Sanan     This is called before graph coarsers are called.
195a37438d7SBarry Smith 
196a37438d7SBarry Smith .seealso: PCGAMGSetThreshold()
197a37438d7SBarry Smith @*/
1986618991cSMark Adams PetscErrorCode PCGAMGFilterGraph(Mat *a_Gmat,PetscReal vfilter,PetscBool symm)
1996618991cSMark Adams {
2006618991cSMark Adams   PetscErrorCode    ierr;
2016618991cSMark Adams   PetscInt          Istart,Iend,Ii,jj,ncols,nnz0,nnz1, NN, MM, nloc;
2026618991cSMark Adams   PetscMPIInt       rank;
2036618991cSMark Adams   Mat               Gmat  = *a_Gmat, tGmat, matTrans;
2046618991cSMark Adams   MPI_Comm          comm;
2056618991cSMark Adams   const PetscScalar *vals;
2066618991cSMark Adams   const PetscInt    *idx;
2076618991cSMark Adams   PetscInt          *d_nnz, *o_nnz;
2086618991cSMark Adams   Vec               diag;
2096618991cSMark Adams 
2106618991cSMark Adams   PetscFunctionBegin;
2116618991cSMark Adams #if defined PETSC_GAMG_USE_LOG
2126618991cSMark Adams   ierr = PetscLogEventBegin(petsc_gamg_setup_events[GRAPH],0,0,0,0);CHKERRQ(ierr);
2136618991cSMark Adams #endif
2146618991cSMark Adams   /* scale Gmat for all values between -1 and 1 */
2150a545947SLisandro Dalcin   ierr = MatCreateVecs(Gmat, &diag, NULL);CHKERRQ(ierr);
2166618991cSMark Adams   ierr = MatGetDiagonal(Gmat, diag);CHKERRQ(ierr);
2176618991cSMark Adams   ierr = VecReciprocal(diag);CHKERRQ(ierr);
2186618991cSMark Adams   ierr = VecSqrtAbs(diag);CHKERRQ(ierr);
2196618991cSMark Adams   ierr = MatDiagonalScale(Gmat, diag, diag);CHKERRQ(ierr);
2206618991cSMark Adams   ierr = VecDestroy(&diag);CHKERRQ(ierr);
2216618991cSMark Adams 
2226618991cSMark Adams   if (vfilter < 0.0 && !symm) {
2236618991cSMark Adams     /* Just use the provided matrix as the graph but make all values positive */
2246618991cSMark Adams     MatInfo     info;
2256618991cSMark Adams     PetscScalar *avals;
226359038b3SMark Adams     PetscBool isaij,ismpiaij;
2274099cc6bSBarry Smith     ierr = PetscObjectBaseTypeCompare((PetscObject)Gmat,MATSEQAIJ,&isaij);CHKERRQ(ierr);
2284099cc6bSBarry Smith     ierr = PetscObjectBaseTypeCompare((PetscObject)Gmat,MATMPIAIJ,&ismpiaij);CHKERRQ(ierr);
229359038b3SMark Adams     if (!isaij && !ismpiaij) SETERRQ(PETSC_COMM_WORLD,PETSC_ERR_USER,"Require (MPI)AIJ matrix type");
230359038b3SMark Adams     if (isaij) {
2316618991cSMark Adams       ierr = MatGetInfo(Gmat,MAT_LOCAL,&info);CHKERRQ(ierr);
2326618991cSMark Adams       ierr = MatSeqAIJGetArray(Gmat,&avals);CHKERRQ(ierr);
2336618991cSMark Adams       for (jj = 0; jj<info.nz_used; jj++) avals[jj] = PetscAbsScalar(avals[jj]);
2346618991cSMark Adams       ierr = MatSeqAIJRestoreArray(Gmat,&avals);CHKERRQ(ierr);
2356618991cSMark Adams     } else {
236359038b3SMark Adams       Mat_MPIAIJ  *aij = (Mat_MPIAIJ*)Gmat->data;
2376618991cSMark Adams       ierr = MatGetInfo(aij->A,MAT_LOCAL,&info);CHKERRQ(ierr);
2386618991cSMark Adams       ierr = MatSeqAIJGetArray(aij->A,&avals);CHKERRQ(ierr);
2396618991cSMark Adams       for (jj = 0; jj<info.nz_used; jj++) avals[jj] = PetscAbsScalar(avals[jj]);
2406618991cSMark Adams       ierr = MatSeqAIJRestoreArray(aij->A,&avals);CHKERRQ(ierr);
2416618991cSMark Adams       ierr = MatGetInfo(aij->B,MAT_LOCAL,&info);CHKERRQ(ierr);
2426618991cSMark Adams       ierr = MatSeqAIJGetArray(aij->B,&avals);CHKERRQ(ierr);
2436618991cSMark Adams       for (jj = 0; jj<info.nz_used; jj++) avals[jj] = PetscAbsScalar(avals[jj]);
2446618991cSMark Adams       ierr = MatSeqAIJRestoreArray(aij->B,&avals);CHKERRQ(ierr);
2456618991cSMark Adams     }
2466618991cSMark Adams #if defined PETSC_GAMG_USE_LOG
2476618991cSMark Adams     ierr = PetscLogEventEnd(petsc_gamg_setup_events[GRAPH],0,0,0,0);CHKERRQ(ierr);
2486618991cSMark Adams #endif
2496618991cSMark Adams     PetscFunctionReturn(0);
2506618991cSMark Adams   }
2516618991cSMark Adams 
2526618991cSMark Adams   ierr = PetscObjectGetComm((PetscObject)Gmat,&comm);CHKERRQ(ierr);
253*ffc4695bSBarry Smith   ierr = MPI_Comm_rank(comm,&rank);CHKERRMPI(ierr);
2546618991cSMark Adams   ierr = MatGetOwnershipRange(Gmat, &Istart, &Iend);CHKERRQ(ierr);
2556618991cSMark Adams   nloc = Iend - Istart;
2566618991cSMark Adams   ierr = MatGetSize(Gmat, &MM, &NN);CHKERRQ(ierr);
2576618991cSMark Adams 
2586618991cSMark Adams   if (symm) {
2596618991cSMark Adams     ierr = MatTranspose(Gmat, MAT_INITIAL_MATRIX, &matTrans);CHKERRQ(ierr);
2606618991cSMark Adams   }
2616618991cSMark Adams 
2626618991cSMark Adams   /* Determine upper bound on nonzeros needed in new filtered matrix */
2636618991cSMark Adams   ierr = PetscMalloc2(nloc, &d_nnz,nloc, &o_nnz);CHKERRQ(ierr);
2646618991cSMark Adams   for (Ii = Istart, jj = 0; Ii < Iend; Ii++, jj++) {
2656618991cSMark Adams     ierr      = MatGetRow(Gmat,Ii,&ncols,NULL,NULL);CHKERRQ(ierr);
2666618991cSMark Adams     d_nnz[jj] = ncols;
2676618991cSMark Adams     o_nnz[jj] = ncols;
2686618991cSMark Adams     ierr      = MatRestoreRow(Gmat,Ii,&ncols,NULL,NULL);CHKERRQ(ierr);
2696618991cSMark Adams     if (symm) {
2706618991cSMark Adams       ierr       = MatGetRow(matTrans,Ii,&ncols,NULL,NULL);CHKERRQ(ierr);
2716618991cSMark Adams       d_nnz[jj] += ncols;
2726618991cSMark Adams       o_nnz[jj] += ncols;
2736618991cSMark Adams       ierr       = MatRestoreRow(matTrans,Ii,&ncols,NULL,NULL);CHKERRQ(ierr);
2746618991cSMark Adams     }
2756618991cSMark Adams     if (d_nnz[jj] > nloc) d_nnz[jj] = nloc;
2766618991cSMark Adams     if (o_nnz[jj] > (MM-nloc)) o_nnz[jj] = MM - nloc;
2776618991cSMark Adams   }
2786618991cSMark Adams   ierr = MatCreate(comm, &tGmat);CHKERRQ(ierr);
2796618991cSMark Adams   ierr = MatSetSizes(tGmat,nloc,nloc,MM,MM);CHKERRQ(ierr);
2806618991cSMark Adams   ierr = MatSetBlockSizes(tGmat, 1, 1);CHKERRQ(ierr);
2810e263c94SMark   ierr = MatSetType(tGmat, MATAIJ);CHKERRQ(ierr);
2826618991cSMark Adams   ierr = MatSeqAIJSetPreallocation(tGmat,0,d_nnz);CHKERRQ(ierr);
2836618991cSMark Adams   ierr = MatMPIAIJSetPreallocation(tGmat,0,d_nnz,0,o_nnz);CHKERRQ(ierr);
2846618991cSMark Adams   ierr = PetscFree2(d_nnz,o_nnz);CHKERRQ(ierr);
2856618991cSMark Adams   if (symm) {
2866618991cSMark Adams     ierr = MatDestroy(&matTrans);CHKERRQ(ierr);
2876618991cSMark Adams   } else {
2886618991cSMark Adams     /* all entries are generated locally so MatAssembly will be slightly faster for large process counts */
2896618991cSMark Adams     ierr = MatSetOption(tGmat,MAT_NO_OFF_PROC_ENTRIES,PETSC_TRUE);CHKERRQ(ierr);
2906618991cSMark Adams   }
2916618991cSMark Adams 
2926618991cSMark Adams   for (Ii = Istart, nnz0 = nnz1 = 0; Ii < Iend; Ii++) {
2936618991cSMark Adams     ierr = MatGetRow(Gmat,Ii,&ncols,&idx,&vals);CHKERRQ(ierr);
2946618991cSMark Adams     for (jj=0; jj<ncols; jj++,nnz0++) {
2956618991cSMark Adams       PetscScalar sv = PetscAbs(PetscRealPart(vals[jj]));
2966618991cSMark Adams       if (PetscRealPart(sv) > vfilter) {
2976618991cSMark Adams         nnz1++;
2986618991cSMark Adams         if (symm) {
2996618991cSMark Adams           sv  *= 0.5;
3006618991cSMark Adams           ierr = MatSetValues(tGmat,1,&Ii,1,&idx[jj],&sv,ADD_VALUES);CHKERRQ(ierr);
3016618991cSMark Adams           ierr = MatSetValues(tGmat,1,&idx[jj],1,&Ii,&sv,ADD_VALUES);CHKERRQ(ierr);
3026618991cSMark Adams         } else {
3036618991cSMark Adams           ierr = MatSetValues(tGmat,1,&Ii,1,&idx[jj],&sv,ADD_VALUES);CHKERRQ(ierr);
3046618991cSMark Adams         }
3056618991cSMark Adams       }
3066618991cSMark Adams     }
3076618991cSMark Adams     ierr = MatRestoreRow(Gmat,Ii,&ncols,&idx,&vals);CHKERRQ(ierr);
3086618991cSMark Adams   }
3096618991cSMark Adams   ierr = MatAssemblyBegin(tGmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
3106618991cSMark Adams   ierr = MatAssemblyEnd(tGmat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
31136c1b609SStefano Zampini   if (symm) {
31236c1b609SStefano Zampini     ierr = MatSetOption(tGmat,MAT_SYMMETRIC,PETSC_TRUE);CHKERRQ(ierr);
31336c1b609SStefano Zampini   } else {
31436c1b609SStefano Zampini     ierr = MatPropagateSymmetryOptions(Gmat,tGmat);CHKERRQ(ierr);
31536c1b609SStefano Zampini   }
3166618991cSMark Adams #if defined PETSC_GAMG_USE_LOG
3176618991cSMark Adams   ierr = PetscLogEventEnd(petsc_gamg_setup_events[GRAPH],0,0,0,0);CHKERRQ(ierr);
3186618991cSMark Adams #endif
3196618991cSMark Adams 
3206618991cSMark Adams #if defined(PETSC_USE_INFO)
3216618991cSMark Adams   {
3226618991cSMark Adams     double t1 = (!nnz0) ? 1. : 100.*(double)nnz1/(double)nnz0, t2 = (!nloc) ? 1. : (double)nnz0/(double)nloc;
3236618991cSMark Adams     ierr = PetscInfo4(*a_Gmat,"\t %g%% nnz after filtering, with threshold %g, %g nnz ave. (N=%D)\n",t1,vfilter,t2,MM);CHKERRQ(ierr);
3246618991cSMark Adams   }
3256618991cSMark Adams #endif
3266618991cSMark Adams   ierr    = MatDestroy(&Gmat);CHKERRQ(ierr);
3276618991cSMark Adams   *a_Gmat = tGmat;
3286618991cSMark Adams   PetscFunctionReturn(0);
3296618991cSMark Adams }
3306618991cSMark Adams 
3316618991cSMark Adams /* -------------------------------------------------------------------------- */
3326618991cSMark Adams /*
333b817416eSBarry Smith    PCGAMGGetDataWithGhosts - hacks into Mat MPIAIJ so this must have size > 1
3346618991cSMark Adams 
3356618991cSMark Adams    Input Parameter:
3366618991cSMark Adams    . Gmat - MPIAIJ matrix for scattters
3376618991cSMark Adams    . data_sz - number of data terms per node (# cols in output)
3386618991cSMark Adams    . data_in[nloc*data_sz] - column oriented data
3396618991cSMark Adams    Output Parameter:
3406618991cSMark Adams    . a_stride - numbrt of rows of output
3416618991cSMark Adams    . a_data_out[stride*data_sz] - output data with ghosts
3426618991cSMark Adams */
3436618991cSMark Adams PetscErrorCode PCGAMGGetDataWithGhosts(Mat Gmat,PetscInt data_sz,PetscReal data_in[],PetscInt *a_stride,PetscReal **a_data_out)
3446618991cSMark Adams {
3456618991cSMark Adams   PetscErrorCode ierr;
3466618991cSMark Adams   Vec            tmp_crds;
3476618991cSMark Adams   Mat_MPIAIJ     *mpimat = (Mat_MPIAIJ*)Gmat->data;
3486618991cSMark Adams   PetscInt       nnodes,num_ghosts,dir,kk,jj,my0,Iend,nloc;
3496618991cSMark Adams   PetscScalar    *data_arr;
3506618991cSMark Adams   PetscReal      *datas;
3516618991cSMark Adams   PetscBool      isMPIAIJ;
3526618991cSMark Adams 
3536618991cSMark Adams   PetscFunctionBegin;
3544099cc6bSBarry Smith   ierr      = PetscObjectBaseTypeCompare((PetscObject)Gmat, MATMPIAIJ, &isMPIAIJ);CHKERRQ(ierr);
3556618991cSMark Adams   ierr      = MatGetOwnershipRange(Gmat, &my0, &Iend);CHKERRQ(ierr);
3566618991cSMark Adams   nloc      = Iend - my0;
3576618991cSMark Adams   ierr      = VecGetLocalSize(mpimat->lvec, &num_ghosts);CHKERRQ(ierr);
3586618991cSMark Adams   nnodes    = num_ghosts + nloc;
3596618991cSMark Adams   *a_stride = nnodes;
3600a545947SLisandro Dalcin   ierr      = MatCreateVecs(Gmat, &tmp_crds, NULL);CHKERRQ(ierr);
3616618991cSMark Adams 
3626618991cSMark Adams   ierr = PetscMalloc1(data_sz*nnodes, &datas);CHKERRQ(ierr);
3636618991cSMark Adams   for (dir=0; dir<data_sz; dir++) {
3646618991cSMark Adams     /* set local, and global */
3656618991cSMark Adams     for (kk=0; kk<nloc; kk++) {
3666618991cSMark Adams       PetscInt    gid = my0 + kk;
3676618991cSMark Adams       PetscScalar crd = (PetscScalar)data_in[dir*nloc + kk]; /* col oriented */
3686618991cSMark Adams       datas[dir*nnodes + kk] = PetscRealPart(crd);
3696618991cSMark Adams 
3706618991cSMark Adams       ierr = VecSetValues(tmp_crds, 1, &gid, &crd, INSERT_VALUES);CHKERRQ(ierr);
3716618991cSMark Adams     }
3726618991cSMark Adams     ierr = VecAssemblyBegin(tmp_crds);CHKERRQ(ierr);
3736618991cSMark Adams     ierr = VecAssemblyEnd(tmp_crds);CHKERRQ(ierr);
3746618991cSMark Adams     /* get ghost datas */
3756618991cSMark Adams     ierr = VecScatterBegin(mpimat->Mvctx,tmp_crds,mpimat->lvec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3766618991cSMark Adams     ierr = VecScatterEnd(mpimat->Mvctx,tmp_crds,mpimat->lvec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3776618991cSMark Adams     ierr = VecGetArray(mpimat->lvec, &data_arr);CHKERRQ(ierr);
3786618991cSMark Adams     for (kk=nloc,jj=0;jj<num_ghosts;kk++,jj++) datas[dir*nnodes + kk] = PetscRealPart(data_arr[jj]);
3796618991cSMark Adams     ierr = VecRestoreArray(mpimat->lvec, &data_arr);CHKERRQ(ierr);
3806618991cSMark Adams   }
3816618991cSMark Adams   ierr        = VecDestroy(&tmp_crds);CHKERRQ(ierr);
3826618991cSMark Adams   *a_data_out = datas;
3836618991cSMark Adams   PetscFunctionReturn(0);
3846618991cSMark Adams }
3856618991cSMark Adams 
3861943db53SBarry Smith PetscErrorCode PCGAMGHashTableCreate(PetscInt a_size, PCGAMGHashTable *a_tab)
3876618991cSMark Adams {
3886618991cSMark Adams   PetscErrorCode ierr;
3896618991cSMark Adams   PetscInt       kk;
3906618991cSMark Adams 
3916618991cSMark Adams   PetscFunctionBegin;
3926618991cSMark Adams   a_tab->size = a_size;
3938f3cd775SBarry Smith   ierr = PetscMalloc2(a_size, &a_tab->table,a_size, &a_tab->data);CHKERRQ(ierr);
3946618991cSMark Adams   for (kk=0; kk<a_size; kk++) a_tab->table[kk] = -1;
3956618991cSMark Adams   PetscFunctionReturn(0);
3966618991cSMark Adams }
3976618991cSMark Adams 
3981943db53SBarry Smith PetscErrorCode PCGAMGHashTableDestroy(PCGAMGHashTable *a_tab)
3996618991cSMark Adams {
4006618991cSMark Adams   PetscErrorCode ierr;
4016618991cSMark Adams 
4026618991cSMark Adams   PetscFunctionBegin;
4038f3cd775SBarry Smith   ierr = PetscFree2(a_tab->table,a_tab->data);CHKERRQ(ierr);
4046618991cSMark Adams   PetscFunctionReturn(0);
4056618991cSMark Adams }
4066618991cSMark Adams 
4071943db53SBarry Smith PetscErrorCode PCGAMGHashTableAdd(PCGAMGHashTable *a_tab, PetscInt a_key, PetscInt a_data)
4086618991cSMark Adams {
4096618991cSMark Adams   PetscInt kk,idx;
4106618991cSMark Adams 
4116618991cSMark Adams   PetscFunctionBegin;
4128f3cd775SBarry Smith   if (a_key<0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"Negative key %D.",a_key);
4138f3cd775SBarry Smith   for (kk = 0, idx = GAMG_HASH(a_key); kk < a_tab->size; kk++, idx = (idx==(a_tab->size-1)) ? 0 : idx + 1) {
4146618991cSMark Adams     if (a_tab->table[idx] == a_key) {
4156618991cSMark Adams       /* exists */
4166618991cSMark Adams       a_tab->data[idx] = a_data;
4176618991cSMark Adams       break;
4186618991cSMark Adams     } else if (a_tab->table[idx] == -1) {
4196618991cSMark Adams       /* add */
4206618991cSMark Adams       a_tab->table[idx] = a_key;
4216618991cSMark Adams       a_tab->data[idx]  = a_data;
4226618991cSMark Adams       break;
4236618991cSMark Adams     }
4246618991cSMark Adams   }
4256618991cSMark Adams   if (kk==a_tab->size) {
4266618991cSMark Adams     /* this is not to efficient, waiting until completely full */
4276618991cSMark Adams     PetscInt       oldsize = a_tab->size, new_size = 2*a_tab->size + 5, *oldtable = a_tab->table, *olddata = a_tab->data;
4286618991cSMark Adams     PetscErrorCode ierr;
4296618991cSMark Adams 
4306618991cSMark Adams     a_tab->size = new_size;
4318f3cd775SBarry Smith     ierr = PetscMalloc2(a_tab->size, &a_tab->table,a_tab->size, &a_tab->data);CHKERRQ(ierr);
4326618991cSMark Adams     for (kk=0;kk<a_tab->size;kk++) a_tab->table[kk] = -1;
4336618991cSMark Adams     for (kk=0;kk<oldsize;kk++) {
4346618991cSMark Adams       if (oldtable[kk] != -1) {
4351943db53SBarry Smith         ierr = PCGAMGHashTableAdd(a_tab, oldtable[kk], olddata[kk]);CHKERRQ(ierr);
4366618991cSMark Adams        }
4376618991cSMark Adams     }
4388f3cd775SBarry Smith     ierr = PetscFree2(oldtable,olddata);CHKERRQ(ierr);
4391943db53SBarry Smith     ierr = PCGAMGHashTableAdd(a_tab, a_key, a_data);CHKERRQ(ierr);
4406618991cSMark Adams   }
4416618991cSMark Adams   PetscFunctionReturn(0);
4426618991cSMark Adams }
443