xref: /petsc/src/ksp/pc/impls/gamg/gamg.c (revision 1de875819d4354bbe1bdfd24631e58d57ffbd69a)
15b89ad90SMark F. Adams /*
 GAMG geometric-algebraic multigrid PC - Mark Adams 2011
35b89ad90SMark F. Adams  */
45ef31b24SMark F. Adams #include <../src/ksp/pc/impls/gamg/gamg.h>
5f96513f1SMatthew G Knepley 
6f96513f1SMatthew G Knepley PetscLogEvent gamg_setup_stages[NUM_SET];
7f96513f1SMatthew G Knepley 
85b89ad90SMark F. Adams /* Private context for the GAMG preconditioner */
95b89ad90SMark F. Adams typedef struct gamg_TAG {
105b89ad90SMark F. Adams   PetscInt       m_dim;
115b89ad90SMark F. Adams   PetscInt       m_Nlevels;
125b89ad90SMark F. Adams   PetscInt       m_data_sz;
13d3d6bff4SMark F. Adams   PetscInt       m_data_rows;
14d3d6bff4SMark F. Adams   PetscInt       m_data_cols;
15d3d6bff4SMark F. Adams   PetscBool      m_useSA;
165b89ad90SMark F. Adams   PetscReal     *m_data; /* blocked vector of vertex data on fine grid (coordinates) */
175b89ad90SMark F. Adams } PC_GAMG;
185b89ad90SMark F. Adams 
195b89ad90SMark F. Adams /* -------------------------------------------------------------------------- */
205b89ad90SMark F. Adams /*
215b89ad90SMark F. Adams    PCSetCoordinates_GAMG
225b89ad90SMark F. Adams 
235b89ad90SMark F. Adams    Input Parameter:
245b89ad90SMark F. Adams    .  pc - the preconditioner context
255b89ad90SMark F. Adams */
26a92563c5SMark F. Adams EXTERN_C_BEGIN
275b89ad90SMark F. Adams #undef __FUNCT__
285b89ad90SMark F. Adams #define __FUNCT__ "PCSetCoordinates_GAMG"
29eb07cef2SMark F. Adams PetscErrorCode PCSetCoordinates_GAMG( PC a_pc, PetscInt a_ndm, PetscReal *a_coords )
305b89ad90SMark F. Adams {
31eb07cef2SMark F. Adams   PC_MG          *mg = (PC_MG*)a_pc->data;
325b89ad90SMark F. Adams   PC_GAMG        *pc_gamg = (PC_GAMG*)mg->innerctx;
336c237d78SBarry Smith   PetscErrorCode ierr;
34d3d6bff4SMark F. Adams   PetscInt       arrsz,bs,my0,kk,ii,jj,nloc,Iend;
35038e3b61SMark F. Adams   Mat            Amat = a_pc->pmat;
36d3d6bff4SMark F. Adams   PetscBool      flag;
37eb07cef2SMark F. Adams   char           str[16];
385b89ad90SMark F. Adams 
395b89ad90SMark F. Adams   PetscFunctionBegin;
40038e3b61SMark F. Adams   ierr  = MatGetBlockSize( Amat, &bs );               CHKERRQ( ierr );
41d3d6bff4SMark F. Adams   ierr  = MatGetOwnershipRange( Amat, &my0, &Iend ); CHKERRQ(ierr);
42d3d6bff4SMark F. Adams   nloc = (Iend-my0)/bs;
43d3d6bff4SMark F. Adams   if((Iend-my0)%bs!=0) SETERRQ1(((PetscObject)Amat)->comm,PETSC_ERR_ARG_WRONG, "Bad local size %d.",nloc);
44038e3b61SMark F. Adams 
45eb07cef2SMark F. Adams   ierr  = PetscOptionsGetString(PETSC_NULL,"-pc_gamg_type",str,16,&flag);    CHKERRQ( ierr );
46d3d6bff4SMark F. Adams   pc_gamg->m_useSA = (PetscBool)(flag && strcmp(str,"sa") == 0);
47038e3b61SMark F. Adams 
48d3d6bff4SMark F. Adams   pc_gamg->m_data_rows = 1;
49d3d6bff4SMark F. Adams   if(a_coords == 0) pc_gamg->m_useSA = PETSC_TRUE; /* use SA if no data */
50d3d6bff4SMark F. Adams   if( !pc_gamg->m_useSA ) pc_gamg->m_data_cols = a_ndm; /* coordinates */
51038e3b61SMark F. Adams   else{ /* SA: null space vectors */
52d3d6bff4SMark F. Adams     if(a_coords != 0 && bs==1 ) pc_gamg->m_data_cols = 1; /* scalar w/ coords and SA (not needed) */
53d3d6bff4SMark F. Adams     else if(a_coords != 0) pc_gamg->m_data_cols = (a_ndm==2 ? 3 : 6); /* elasticity */
54d3d6bff4SMark F. Adams     else pc_gamg->m_data_cols = bs; /* no data, force SA with constant null space vectors */
55d3d6bff4SMark F. Adams     pc_gamg->m_data_rows = bs;
56038e3b61SMark F. Adams   }
57d3d6bff4SMark F. Adams   arrsz = nloc*pc_gamg->m_data_rows*pc_gamg->m_data_cols;
585b89ad90SMark F. Adams 
59038e3b61SMark F. Adams   /* create data - syntactic sugar that should be refactored at some point */
606c237d78SBarry Smith   if (!pc_gamg->m_data || (pc_gamg->m_data_sz != arrsz)) {
615b89ad90SMark F. Adams     ierr = PetscFree( pc_gamg->m_data );  CHKERRQ(ierr);
62eb07cef2SMark F. Adams     ierr = PetscMalloc((arrsz+1)*sizeof(double), &pc_gamg->m_data ); CHKERRQ(ierr);
635b89ad90SMark F. Adams   }
64038e3b61SMark F. Adams   for(kk=0;kk<arrsz;kk++)pc_gamg->m_data[kk] = -999.;
65eb07cef2SMark F. Adams   pc_gamg->m_data[arrsz] = -99.;
66038e3b61SMark F. Adams   /* copy data in - column oriented */
67d3d6bff4SMark F. Adams   if( pc_gamg->m_useSA ) {
68d3d6bff4SMark F. Adams     const PetscInt M = Iend - my0;
69038e3b61SMark F. Adams     for(kk=0;kk<nloc;kk++){
70038e3b61SMark F. Adams       PetscReal *data = &pc_gamg->m_data[kk*bs];
71d3d6bff4SMark F. Adams       if( pc_gamg->m_data_cols==1 ) *data = 1.0;
72038e3b61SMark F. Adams       else {
73038e3b61SMark F. Adams         for(ii=0;ii<bs;ii++)
74038e3b61SMark F. Adams 	  for(jj=0;jj<bs;jj++)
75038e3b61SMark F. Adams 	    if(ii==jj)data[ii*M + jj] = 1.0; /* translational modes */
76038e3b61SMark F. Adams 	    else data[ii*M + jj] = 0.0;
77eb07cef2SMark F. Adams         if( a_coords != 0 ) {
78038e3b61SMark F. Adams           if( a_ndm == 2 ){ /* rotational modes */
79038e3b61SMark F. Adams             data += 2*M;
80038e3b61SMark F. Adams             data[0] = -a_coords[2*kk+1];
81038e3b61SMark F. Adams             data[1] =  a_coords[2*kk];
825b89ad90SMark F. Adams           }
83eb07cef2SMark F. Adams           else {
84038e3b61SMark F. Adams             data += 3*M;
85038e3b61SMark F. Adams             data[0] = 0.0;               data[M+0] =  a_coords[3*kk+2]; data[2*M+0] = -a_coords[3*kk+1];
86038e3b61SMark F. Adams             data[1] = -a_coords[3*kk+2]; data[M+1] = 0.0;               data[2*M+1] =  a_coords[3*kk];
87038e3b61SMark F. Adams             data[2] =  a_coords[3*kk+1]; data[M+2] = -a_coords[3*kk];   data[2*M+2] = 0.0;
88038e3b61SMark F. Adams           }
89eb07cef2SMark F. Adams         }
90eb07cef2SMark F. Adams       }
91eb07cef2SMark F. Adams     }
92eb07cef2SMark F. Adams   }
93eb07cef2SMark F. Adams   else {
94038e3b61SMark F. Adams     for( kk = 0 ; kk < nloc ; kk++ ){
95038e3b61SMark F. Adams       for( ii = 0 ; ii < a_ndm ; ii++ ) {
96038e3b61SMark F. Adams         pc_gamg->m_data[ii*nloc + kk] =  a_coords[kk*a_ndm + ii];
97eb07cef2SMark F. Adams       }
98eb07cef2SMark F. Adams     }
99038e3b61SMark F. Adams   }
100038e3b61SMark F. Adams 
101eb07cef2SMark F. Adams   assert(pc_gamg->m_data[arrsz] == -99.);
102d3d6bff4SMark F. Adams   for(kk=0;kk<arrsz;kk++) assert(pc_gamg->m_data[kk] != -999.); // debug
103038e3b61SMark F. Adams 
1045b89ad90SMark F. Adams   pc_gamg->m_data_sz = arrsz;
105eb07cef2SMark F. Adams   pc_gamg->m_dim = a_ndm;
1065b89ad90SMark F. Adams 
1075b89ad90SMark F. Adams   PetscFunctionReturn(0);
1085b89ad90SMark F. Adams }
109a92563c5SMark F. Adams EXTERN_C_END
1105b89ad90SMark F. Adams 
111d3d6bff4SMark F. Adams 
112d3d6bff4SMark F. Adams /* -----------------------------------------------------------------------------*/
113d3d6bff4SMark F. Adams #undef __FUNCT__
114d3d6bff4SMark F. Adams #define __FUNCT__ "PCReset_GAMG"
115d3d6bff4SMark F. Adams PetscErrorCode PCReset_GAMG(PC pc)
116d3d6bff4SMark F. Adams {
117d3d6bff4SMark F. Adams   PetscErrorCode  ierr;
118d3d6bff4SMark F. Adams   PC_MG           *mg = (PC_MG*)pc->data;
119d3d6bff4SMark F. Adams   PC_GAMG         *pc_gamg = (PC_GAMG*)mg->innerctx;
120d3d6bff4SMark F. Adams 
121d3d6bff4SMark F. Adams   PetscFunctionBegin;
122d3d6bff4SMark F. Adams   ierr = PetscFree(pc_gamg->m_data);CHKERRQ(ierr);
123d3d6bff4SMark F. Adams   pc_gamg->m_data = 0; pc_gamg->m_data_sz = 0;
124d3d6bff4SMark F. Adams   PetscFunctionReturn(0);
125d3d6bff4SMark F. Adams }
126d3d6bff4SMark F. Adams 
1275b89ad90SMark F. Adams /* -------------------------------------------------------------------------- */
1285b89ad90SMark F. Adams /*
12911e60469SMark F. Adams    partitionLevel
1305b89ad90SMark F. Adams 
1315b89ad90SMark F. Adams    Input Parameter:
1323530afc2SMark F. Adams    . a_Amat_fine - matrix on this fine (k) level
133d3d6bff4SMark F. Adams    . a_ndata_rows - size of data to move (coarse grid)
134d3d6bff4SMark F. Adams    . a_ndata_cols - size of data to move (coarse grid)
1353530afc2SMark F. Adams    In/Output Parameter:
1363530afc2SMark F. Adams    . a_P_inout - prolongation operator to the next level (k-1)
137eb07cef2SMark F. Adams    . a_coarse_data - data that need to be moved
1383530afc2SMark F. Adams    . a_active_proc - number of active procs
13911e60469SMark F. Adams    Output Parameter:
1403530afc2SMark F. Adams    . a_Amat_crs - coarse matrix that is created (k-1)
1415b89ad90SMark F. Adams */
1425cb416c2SMark F. Adams 
1435b89ad90SMark F. Adams #undef __FUNCT__
14411e60469SMark F. Adams #define __FUNCT__ "partitionLevel"
1453530afc2SMark F. Adams PetscErrorCode partitionLevel( Mat a_Amat_fine,
146d3d6bff4SMark F. Adams                                PetscInt a_ndata_rows,
147d3d6bff4SMark F. Adams                                PetscInt a_ndata_cols,
148038e3b61SMark F. Adams 			       PetscInt a_cbs,
1493530afc2SMark F. Adams                                Mat *a_P_inout,
150eb07cef2SMark F. Adams                                PetscReal **a_coarse_data,
1513530afc2SMark F. Adams                                PetscMPIInt *a_active_proc,
1523530afc2SMark F. Adams                                Mat *a_Amat_crs
15311e60469SMark F. Adams                                )
1545b89ad90SMark F. Adams {
1555b89ad90SMark F. Adams   PetscErrorCode   ierr;
156038e3b61SMark F. Adams   Mat              Cmat,Pnew,Pold=*a_P_inout;
15711e60469SMark F. Adams   IS               new_indices,isnum;
1583530afc2SMark F. Adams   MPI_Comm         wcomm = ((PetscObject)a_Amat_fine)->comm;
1595ef31b24SMark F. Adams   PetscMPIInt      nactive_procs,mype,npe;
160038e3b61SMark F. Adams   PetscInt         Istart,Iend,Istart0,Iend0,ncrs0,ncrs_new,fbs;
161a6828334SMark F. Adams   PetscInt         neq,NN;
162e33ef3b1SMark F. Adams   PetscMPIInt      new_npe,targ_npe;
1635b89ad90SMark F. Adams 
1645b89ad90SMark F. Adams   PetscFunctionBegin;
16511e60469SMark F. Adams   ierr = MPI_Comm_rank( wcomm, &mype ); CHKERRQ(ierr);
16611e60469SMark F. Adams   ierr = MPI_Comm_size( wcomm, &npe );  CHKERRQ(ierr);
167038e3b61SMark F. Adams   ierr = MatGetBlockSize( a_Amat_fine, &fbs ); CHKERRQ(ierr);
16811e60469SMark F. Adams   /* RAP */
169038e3b61SMark F. Adams   ierr = MatPtAP( a_Amat_fine, Pold, MAT_INITIAL_MATRIX, 2.0, &Cmat ); CHKERRQ(ierr);
170038e3b61SMark F. Adams   ierr = MatSetBlockSize( Cmat, a_cbs );      CHKERRQ(ierr);
171acadaa72SMark F. Adams 
172038e3b61SMark F. Adams   ierr = MatGetOwnershipRange( Cmat, &Istart0, &Iend0 ); CHKERRQ(ierr);
173038e3b61SMark F. Adams   ncrs0 = (Iend0-Istart0)/a_cbs; assert((Iend0-Istart0)%a_cbs == 0);
174038e3b61SMark F. Adams 
175038e3b61SMark F. Adams   /* Repartition Cmat_{k} and move colums of P^{k}_{k-1} and coordinates accordingly */
176038e3b61SMark F. Adams   ierr = MatGetSize( Cmat, &neq, &NN );CHKERRQ(ierr);
177*1de87581SMark F. Adams #define MIN_EQ_PROC 200
1785ef31b24SMark F. Adams   nactive_procs = *a_active_proc;
1793530afc2SMark F. Adams   targ_npe = neq/MIN_EQ_PROC; /* hardwire min. number of eq/proc */
180*1de87581SMark F. Adams #define TOP_GRID_LIM 1000
1815ef31b24SMark F. Adams   if( targ_npe == 0 || neq < TOP_GRID_LIM ) new_npe = 1; /* chop coarsest grid */
1825ef31b24SMark F. Adams   else if (targ_npe >= nactive_procs ) new_npe = nactive_procs; /* no change */
1833530afc2SMark F. Adams   else {
1845ef31b24SMark F. Adams     PetscMPIInt factstart,fact;
1853530afc2SMark F. Adams     new_npe = -9999;
1865ef31b24SMark F. Adams     factstart = nactive_procs;
1873530afc2SMark F. Adams     for(fact=factstart;fact>0;fact--){ /* try to find a better number of procs */
1885ef31b24SMark F. Adams       if( nactive_procs%fact==0 && neq/(nactive_procs/fact) > MIN_EQ_PROC ) {
1895ef31b24SMark F. Adams         new_npe = nactive_procs/fact;
1903530afc2SMark F. Adams       }
1913530afc2SMark F. Adams     }
192038e3b61SMark F. Adams     if(new_npe == -9999) new_npe = nactive_procs;
1933530afc2SMark F. Adams   }
194e33ef3b1SMark F. Adams 
195e33ef3b1SMark F. Adams   if( PETSC_TRUE ) { /* partition: get 'isnewproc' */
19611e60469SMark F. Adams     MatPartitioning  mpart;
1975ef31b24SMark F. Adams     Mat              adj;
1985ef31b24SMark F. Adams     const PetscInt  *is_idx;
199d3d6bff4SMark F. Adams     PetscInt         is_sz,kk,jj,ii,old_fact=(npe/nactive_procs), *isnewproc_idx;
200c9a0b8beSMark F. Adams     /* create sub communicator  */
201c9a0b8beSMark F. Adams     MPI_Comm         cm,new_comm;
202d3d6bff4SMark F. Adams     PetscInt         membershipKey = mype%old_fact, new_fact=(npe/new_npe),counts[npe];
203e33ef3b1SMark F. Adams     IS               isnewproc;
204e33ef3b1SMark F. Adams 
205d3d6bff4SMark F. Adams     *a_active_proc = new_npe; /* output for next level */
206c9a0b8beSMark F. Adams     ierr = MPI_Comm_split(wcomm, membershipKey, mype, &cm); CHKERRQ(ierr);
207c9a0b8beSMark F. Adams     ierr = PetscCommDuplicate( cm, &new_comm, PETSC_NULL ); CHKERRQ(ierr);
208c9a0b8beSMark F. Adams     ierr = MPI_Comm_free( &cm );                            CHKERRQ(ierr);
209c9a0b8beSMark F. Adams 
2105ef31b24SMark F. Adams     /* MatPartitioningApply call MatConvert, which is collective */
211038e3b61SMark F. Adams     if( a_cbs==1) {
212038e3b61SMark F. Adams       ierr = MatConvert( Cmat, MATMPIADJ, MAT_INITIAL_MATRIX, &adj );   CHKERRQ(ierr);
213eb07cef2SMark F. Adams     }
214eb07cef2SMark F. Adams     else {
215038e3b61SMark F. Adams       /* make a scalar matrix to partition */
216eb07cef2SMark F. Adams       Mat tMat;
217eb07cef2SMark F. Adams       PetscInt Ii,ncols; const PetscScalar *vals; const PetscInt *idx;
218eb07cef2SMark F. Adams       ierr = MatCreateMPIAIJ( wcomm, ncrs0, ncrs0,
219eb07cef2SMark F. Adams                               PETSC_DETERMINE, PETSC_DETERMINE,
220eb07cef2SMark F. Adams                               25, PETSC_NULL, 10, PETSC_NULL,
221eb07cef2SMark F. Adams                               &tMat );
222eb07cef2SMark F. Adams 
223eb07cef2SMark F. Adams       for ( Ii = Istart0; Ii < Iend0; Ii++ ) {
224038e3b61SMark F. Adams         PetscInt dest_row = Ii/a_cbs;
225038e3b61SMark F. Adams         ierr = MatGetRow(Cmat,Ii,&ncols,&idx,&vals); CHKERRQ(ierr);
226eb07cef2SMark F. Adams         for( jj = 0 ; jj < ncols ; jj++ ){
227038e3b61SMark F. Adams           PetscInt dest_col = idx[jj]/a_cbs;
228eb07cef2SMark F. Adams           PetscScalar v = 1.0;
229eb07cef2SMark F. Adams           ierr = MatSetValues(tMat,1,&dest_row,1,&dest_col,&v,ADD_VALUES); CHKERRQ(ierr);
230eb07cef2SMark F. Adams         }
231038e3b61SMark F. Adams         ierr = MatRestoreRow(Cmat,Ii,&ncols,&idx,&vals); CHKERRQ(ierr);
232eb07cef2SMark F. Adams       }
233eb07cef2SMark F. Adams       ierr = MatAssemblyBegin(tMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
234eb07cef2SMark F. Adams       ierr = MatAssemblyEnd(tMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
235eb07cef2SMark F. Adams 
236eb07cef2SMark F. Adams       ierr = MatConvert( tMat, MATMPIADJ, MAT_INITIAL_MATRIX, &adj );   CHKERRQ(ierr);
237eb07cef2SMark F. Adams 
238eb07cef2SMark F. Adams       ierr = MatDestroy( &tMat );  CHKERRQ(ierr);
239eb07cef2SMark F. Adams     }
2405ef31b24SMark F. Adams     if( membershipKey == 0 ) {
241038e3b61SMark F. Adams       if(ncrs0==0)SETERRQ(wcomm,PETSC_ERR_LIB,"zero local nodes -- increase min");
2425ef31b24SMark F. Adams       /* hack to fix global data that pmetis.c uses in 'adj' */
2435ef31b24SMark F. Adams       for( kk=0 , jj=0 ; kk<=npe ; jj++, kk += old_fact ) {
2445ef31b24SMark F. Adams         adj->rmap->range[jj] = adj->rmap->range[kk];
2455ef31b24SMark F. Adams       }
2465ef31b24SMark F. Adams       ierr = MatPartitioningCreate( new_comm, &mpart ); CHKERRQ(ierr);
2475ef31b24SMark F. Adams       ierr = MatPartitioningSetAdjacency( mpart, adj ); CHKERRQ(ierr);
24811e60469SMark F. Adams       ierr = MatPartitioningSetFromOptions( mpart ); CHKERRQ(ierr);
2495ef31b24SMark F. Adams       ierr = MatPartitioningSetNParts( mpart, new_npe ); CHKERRQ(ierr);
25011e60469SMark F. Adams       ierr = MatPartitioningApply( mpart, &isnewproc ); CHKERRQ(ierr);
25111e60469SMark F. Adams       ierr = MatPartitioningDestroy( &mpart ); CHKERRQ(ierr);
2525ef31b24SMark F. Adams       /* collect IS info */
2535ef31b24SMark F. Adams       ierr = ISGetLocalSize( isnewproc, &is_sz );        CHKERRQ(ierr);
254038e3b61SMark F. Adams       ierr = PetscMalloc( a_cbs*is_sz*sizeof(PetscInt), &isnewproc_idx ); CHKERRQ(ierr);
2555ef31b24SMark F. Adams       ierr = ISGetIndices( isnewproc, &is_idx );     CHKERRQ(ierr);
256eb07cef2SMark F. Adams       /* spread partitioning across machine - probably the right thing to do but machine spec. */
257eb07cef2SMark F. Adams       for(kk=0,jj=0;kk<is_sz;kk++){
258038e3b61SMark F. Adams         for(ii=0 ; ii<a_cbs ; ii++, jj++ ) { /* expand for equation level by 'bs' */
259eb07cef2SMark F. Adams           isnewproc_idx[jj] = is_idx[kk] * new_fact;
260eb07cef2SMark F. Adams         }
2615ef31b24SMark F. Adams       }
2625ef31b24SMark F. Adams       ierr = ISRestoreIndices( isnewproc, &is_idx );     CHKERRQ(ierr);
2635ef31b24SMark F. Adams       ierr = ISDestroy( &isnewproc );                    CHKERRQ(ierr);
264038e3b61SMark F. Adams       is_sz *= a_cbs;
2655ef31b24SMark F. Adams     }
2665ef31b24SMark F. Adams     else {
2675ef31b24SMark F. Adams       isnewproc_idx = 0;
2685ef31b24SMark F. Adams       is_sz = 0;
2695ef31b24SMark F. Adams     }
2705ef31b24SMark F. Adams     ierr = MatDestroy( &adj );                       CHKERRQ(ierr);
2715ef31b24SMark F. Adams     ierr = MPI_Comm_free( &new_comm );    CHKERRQ(ierr);
2725ef31b24SMark F. Adams     ierr = ISCreateGeneral( wcomm, is_sz, isnewproc_idx, PETSC_COPY_VALUES, &isnewproc );
2735ef31b24SMark F. Adams     if( membershipKey == 0 ) {
2745ef31b24SMark F. Adams       ierr = PetscFree( isnewproc_idx );  CHKERRQ(ierr);
2755ef31b24SMark F. Adams     }
276e33ef3b1SMark F. Adams 
27711e60469SMark F. Adams     /*
27811e60469SMark F. Adams      Create an index set from the isnewproc index set to indicate the mapping TO
27911e60469SMark F. Adams      */
28011e60469SMark F. Adams     ierr = ISPartitioningToNumbering( isnewproc, &isnum ); CHKERRQ(ierr);
28111e60469SMark F. Adams     /*
28211e60469SMark F. Adams      Determine how many elements are assigned to each processor
28311e60469SMark F. Adams      */
28411e60469SMark F. Adams     ierr = ISPartitioningCount( isnewproc, npe, counts ); CHKERRQ(ierr);
28511e60469SMark F. Adams     ierr = ISDestroy( &isnewproc );                       CHKERRQ(ierr);
286038e3b61SMark F. Adams     ncrs_new = counts[mype]/a_cbs;
2875ef31b24SMark F. Adams 
28811e60469SMark F. Adams     { /* Create a vector to contain the newly ordered element information */
289d3d6bff4SMark F. Adams       const PetscInt *idx, data_sz=a_ndata_rows*a_ndata_cols;
290d3d6bff4SMark F. Adams       const PetscInt  stride0=ncrs0*a_ndata_rows,strideNew=ncrs_new*a_ndata_rows;
291038e3b61SMark F. Adams       PetscInt        ii,jj,kk;
29211e60469SMark F. Adams       IS              isscat;
29311e60469SMark F. Adams       PetscScalar    *array;
29411e60469SMark F. Adams       Vec             src_crd, dest_crd;
295eb07cef2SMark F. Adams       PetscReal      *data = *a_coarse_data;
29611e60469SMark F. Adams       VecScatter      vecscat;
297d3d6bff4SMark F. Adams       PetscInt        tidx[ncrs0*data_sz];
298acadaa72SMark F. Adams 
29911e60469SMark F. Adams       ierr = VecCreate( wcomm, &dest_crd );
300d3d6bff4SMark F. Adams       ierr = VecSetSizes( dest_crd, data_sz*ncrs_new, PETSC_DECIDE ); CHKERRQ(ierr);
30111e60469SMark F. Adams       ierr = VecSetFromOptions( dest_crd ); CHKERRQ(ierr); /*funny vector-get global options?*/
30211e60469SMark F. Adams       /*
303d3d6bff4SMark F. Adams        There are 'a_ndata_rows*a_ndata_cols' data items per node, (one can think of the vectors of having
304d3d6bff4SMark F. Adams        a block size of ...).  Note, ISs are expanded into equation space by 'a_cbs'.
30511e60469SMark F. Adams        */
30611e60469SMark F. Adams       ierr = ISGetIndices( isnum, &idx ); CHKERRQ(ierr);
307038e3b61SMark F. Adams       for(ii=0,jj=0; ii<ncrs0 ; ii++) {
308d3d6bff4SMark F. Adams         PetscInt id = idx[ii*a_cbs]/a_cbs; /* get node back */
309d3d6bff4SMark F. Adams         for( kk=0; kk<data_sz ; kk++, jj++) tidx[jj] = id*data_sz + kk;
31011e60469SMark F. Adams       }
311038e3b61SMark F. Adams       ierr = ISRestoreIndices( isnum, &idx ); CHKERRQ(ierr);
312d3d6bff4SMark F. Adams       ierr = ISCreateGeneral( wcomm, data_sz*ncrs0, tidx, PETSC_COPY_VALUES, &isscat );
31311e60469SMark F. Adams       CHKERRQ(ierr);
31411e60469SMark F. Adams       /*
31511e60469SMark F. Adams        Create a vector to contain the original vertex information for each element
31611e60469SMark F. Adams        */
317d3d6bff4SMark F. Adams       ierr = VecCreateSeq( PETSC_COMM_SELF, data_sz*ncrs0, &src_crd ); CHKERRQ(ierr);
318d3d6bff4SMark F. Adams       for( jj=0; jj<a_ndata_cols ; jj++ ) {
319d3d6bff4SMark F. Adams         for( ii=0 ; ii<ncrs0 ; ii++) {
320d3d6bff4SMark F. Adams           for( kk=0; kk<a_ndata_rows ; kk++ ) {
321d3d6bff4SMark F. Adams             PetscInt ix = ii*a_ndata_rows + kk + jj*stride0, jx = ii*data_sz + kk*a_ndata_cols + jj;
322d3d6bff4SMark F. Adams             ierr = VecSetValues( src_crd, 1, &jx, &data[ix], INSERT_VALUES );  CHKERRQ(ierr);
323d3d6bff4SMark F. Adams           }
324038e3b61SMark F. Adams         }
325eb07cef2SMark F. Adams       }
326eb07cef2SMark F. Adams       ierr = VecAssemblyBegin(src_crd); CHKERRQ(ierr);
327eb07cef2SMark F. Adams       ierr = VecAssemblyEnd(src_crd); CHKERRQ(ierr);
32811e60469SMark F. Adams       /*
32911e60469SMark F. Adams        Scatter the element vertex information (still in the original vertex ordering)
33011e60469SMark F. Adams        to the correct processor
33111e60469SMark F. Adams        */
33211e60469SMark F. Adams       ierr = VecScatterCreate( src_crd, PETSC_NULL, dest_crd, isscat, &vecscat);
33311e60469SMark F. Adams       CHKERRQ(ierr);
33411e60469SMark F. Adams       ierr = ISDestroy( &isscat );       CHKERRQ(ierr);
33511e60469SMark F. Adams       ierr = VecScatterBegin(vecscat,src_crd,dest_crd,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
33611e60469SMark F. Adams       ierr = VecScatterEnd(vecscat,src_crd,dest_crd,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
33711e60469SMark F. Adams       ierr = VecScatterDestroy( &vecscat );       CHKERRQ(ierr);
33811e60469SMark F. Adams       ierr = VecDestroy( &src_crd );       CHKERRQ(ierr);
33911e60469SMark F. Adams       /*
34011e60469SMark F. Adams        Put the element vertex data into a new allocation of the gdata->ele
34111e60469SMark F. Adams        */
342eb07cef2SMark F. Adams       ierr = PetscFree( *a_coarse_data );    CHKERRQ(ierr);
343d3d6bff4SMark F. Adams       ierr = PetscMalloc( data_sz*ncrs_new*sizeof(PetscReal), a_coarse_data );    CHKERRQ(ierr);
344eb07cef2SMark F. Adams 
34511e60469SMark F. Adams       ierr = VecGetArray( dest_crd, &array );    CHKERRQ(ierr);
346eb07cef2SMark F. Adams       data = *a_coarse_data;
347d3d6bff4SMark F. Adams       for( jj=0; jj<a_ndata_cols ; jj++ ) {
348d3d6bff4SMark F. Adams         for( ii=0 ; ii<ncrs_new ; ii++) {
349d3d6bff4SMark F. Adams           for( kk=0; kk<a_ndata_rows ; kk++ ) {
350d3d6bff4SMark F. Adams             PetscInt ix = ii*a_ndata_rows + kk + jj*strideNew, jx = ii*data_sz + kk*a_ndata_cols + jj;
351d3d6bff4SMark F. Adams             data[ix] = PetscRealPart(array[jx]);
352d3d6bff4SMark F. Adams             array[jx] = 1.e300;
353d3d6bff4SMark F. Adams           }
354038e3b61SMark F. Adams         }
355038e3b61SMark F. Adams       }
35611e60469SMark F. Adams       ierr = VecRestoreArray( dest_crd, &array );    CHKERRQ(ierr);
35711e60469SMark F. Adams       ierr = VecDestroy( &dest_crd );    CHKERRQ(ierr);
35811e60469SMark F. Adams     }
35911e60469SMark F. Adams     /*
36011e60469SMark F. Adams      Invert for MatGetSubMatrix
36111e60469SMark F. Adams      */
362038e3b61SMark F. Adams     ierr = ISInvertPermutation( isnum, ncrs_new*a_cbs, &new_indices ); CHKERRQ(ierr);
36311e60469SMark F. Adams     ierr = ISSort( new_indices ); CHKERRQ(ierr); /* is this needed? */
36411e60469SMark F. Adams     ierr = ISDestroy( &isnum ); CHKERRQ(ierr);
36511e60469SMark F. Adams     /* A_crs output */
366038e3b61SMark F. Adams     ierr = MatGetSubMatrix( Cmat, new_indices, new_indices, MAT_INITIAL_MATRIX, a_Amat_crs );
36711e60469SMark F. Adams     CHKERRQ(ierr);
368eb07cef2SMark F. Adams 
369038e3b61SMark F. Adams     ierr = MatDestroy( &Cmat ); CHKERRQ(ierr);
370e33ef3b1SMark F. Adams     Cmat = *a_Amat_crs; /* output */
371038e3b61SMark F. Adams     ierr = MatSetBlockSize( Cmat, a_cbs );      CHKERRQ(ierr);
372eb07cef2SMark F. Adams 
37311e60469SMark F. Adams     /* prolongator */
37411e60469SMark F. Adams     ierr = MatGetOwnershipRange( Pold, &Istart, &Iend );    CHKERRQ(ierr);
37511e60469SMark F. Adams     {
37611e60469SMark F. Adams       IS findices;
37711e60469SMark F. Adams       ierr = ISCreateStride(wcomm,Iend-Istart,Istart,1,&findices);   CHKERRQ(ierr);
37811e60469SMark F. Adams       ierr = MatGetSubMatrix( Pold, findices, new_indices, MAT_INITIAL_MATRIX, &Pnew );
37911e60469SMark F. Adams       CHKERRQ(ierr);
38011e60469SMark F. Adams       ierr = ISDestroy( &findices ); CHKERRQ(ierr);
38111e60469SMark F. Adams     }
3823530afc2SMark F. Adams     ierr = MatDestroy( a_P_inout ); CHKERRQ(ierr);
3833530afc2SMark F. Adams     *a_P_inout = Pnew; /* output */
38411e60469SMark F. Adams     ierr = ISDestroy( &new_indices ); CHKERRQ(ierr);
385e33ef3b1SMark F. Adams   }
386e33ef3b1SMark F. Adams   else {
387e33ef3b1SMark F. Adams     *a_Amat_crs = Cmat; /* output */
388e33ef3b1SMark F. Adams   }
3895b89ad90SMark F. Adams 
3905b89ad90SMark F. Adams   PetscFunctionReturn(0);
3915b89ad90SMark F. Adams }
3925b89ad90SMark F. Adams 
/* Upper bound on the number of multigrid levels GAMG will build. */
#define GAMG_MAXLEVELS 30
#if defined(PETSC_USE_LOG)
/* One logging stage per level. Sized by GAMG_MAXLEVELS rather than a separate
   hard-wired 20, so a per-level index can never run past the end.
   NOTE(review): assumes the array is indexed by level - confirm against its users. */
PetscLogStage  gamg_stages[GAMG_MAXLEVELS];
#endif
3975b89ad90SMark F. Adams /* -------------------------------------------------------------------------- */
3985b89ad90SMark F. Adams /*
3995b89ad90SMark F. Adams    PCSetUp_GAMG - Prepares for the use of the GAMG preconditioner
4005b89ad90SMark F. Adams                     by setting data structures and options.
4015b89ad90SMark F. Adams 
4025b89ad90SMark F. Adams    Input Parameter:
4035b89ad90SMark F. Adams .  pc - the preconditioner context
4045b89ad90SMark F. Adams 
4055b89ad90SMark F. Adams    Application Interface Routine: PCSetUp()
4065b89ad90SMark F. Adams 
4075b89ad90SMark F. Adams    Notes:
4085b89ad90SMark F. Adams    The interface routine PCSetUp() is not usually called directly by
4095b89ad90SMark F. Adams    the user, but instead is called by PCApply() if necessary.
4105b89ad90SMark F. Adams */
4115b89ad90SMark F. Adams #undef __FUNCT__
4125b89ad90SMark F. Adams #define __FUNCT__ "PCSetUp_GAMG"
413eb07cef2SMark F. Adams PetscErrorCode PCSetUp_GAMG( PC a_pc )
4145b89ad90SMark F. Adams {
4155b89ad90SMark F. Adams   PetscErrorCode  ierr;
416eb07cef2SMark F. Adams   PC_MG           *mg = (PC_MG*)a_pc->data;
4175b89ad90SMark F. Adams   PC_GAMG         *pc_gamg = (PC_GAMG*)mg->innerctx;
418eb07cef2SMark F. Adams   Mat              Amat = a_pc->mat, Pmat = a_pc->pmat;
419d3d6bff4SMark F. Adams   PetscInt         fine_level, level, level1, M, N, bs, nloc, lidx, Istart, Iend;
420eb07cef2SMark F. Adams   MPI_Comm         wcomm = ((PetscObject)a_pc)->comm;
4213530afc2SMark F. Adams   PetscMPIInt      mype,npe,nactivepe;
422038e3b61SMark F. Adams   PetscBool        isOK;
423587fa25dSMark F. Adams   Mat              Aarr[GAMG_MAXLEVELS], Parr[GAMG_MAXLEVELS];
424587fa25dSMark F. Adams   PetscReal       *coarse_data = 0, *data, emaxs[GAMG_MAXLEVELS];
4255ef31b24SMark F. Adams 
4265b89ad90SMark F. Adams   PetscFunctionBegin;
427eb07cef2SMark F. Adams   if( a_pc->setupcalled ) {
428eb07cef2SMark F. Adams     /* no state data in GAMG to destroy */
429eb07cef2SMark F. Adams     ierr = PCReset_MG( a_pc ); CHKERRQ(ierr);
430eb07cef2SMark F. Adams   }
431baa4e9faSMark F. Adams   ierr = MPI_Comm_rank(wcomm,&mype);CHKERRQ(ierr);
432baa4e9faSMark F. Adams   ierr = MPI_Comm_size(wcomm,&npe);CHKERRQ(ierr);
4335b89ad90SMark F. Adams   /* GAMG requires input of fine-grid matrix. It determines nlevels. */
4345b89ad90SMark F. Adams   ierr = MatGetBlockSize( Amat, &bs ); CHKERRQ(ierr);
4353530afc2SMark F. Adams   ierr = MatGetSize( Amat, &M, &N );CHKERRQ(ierr);
436eb07cef2SMark F. Adams   ierr = MatGetOwnershipRange( Amat, &Istart, &Iend ); CHKERRQ(ierr);
437eb07cef2SMark F. Adams   nloc = (Iend-Istart)/bs; assert((Iend-Istart)%bs == 0);
438eb07cef2SMark F. Adams 
439038e3b61SMark F. Adams   /* get data of not around */
440038e3b61SMark F. Adams   if( pc_gamg->m_data == 0 && nloc > 0 ) {
441038e3b61SMark F. Adams     ierr  = PCSetCoordinates_GAMG( a_pc, -1, 0 );    CHKERRQ( ierr );
442eb07cef2SMark F. Adams   }
443eb07cef2SMark F. Adams   data = pc_gamg->m_data;
444038e3b61SMark F. Adams 
445eb07cef2SMark F. Adams   /* Get A_i and R_i */
446d3d6bff4SMark F. Adams PetscPrintf(PETSC_COMM_WORLD,"\t[%d]%s level %d N=%d, n data rows=%d, n data cols=%d, nloc=%d, np=%d\n",0,__FUNCT__,0,N,pc_gamg->m_data_rows,pc_gamg->m_data_cols,nloc,npe);
4478f4b7eb5SMark F. Adams   for ( level=0, Aarr[0] = Pmat, nactivepe = npe; /* hard wired stopping logic */
448eb07cef2SMark F. Adams         level < GAMG_MAXLEVELS-1 && (level==0 || M/bs>TOP_GRID_LIM) && (npe==1 || nactivepe>1);
4490205a208SMark F. Adams         level++ ) {
4505b89ad90SMark F. Adams     level1 = level + 1;
4515ef31b24SMark F. Adams     ierr = PetscLogEventBegin(gamg_setup_stages[SET1],0,0,0,0);CHKERRQ(ierr);
452d3d6bff4SMark F. Adams     ierr = createProlongation(Aarr[level], data, pc_gamg->m_dim, pc_gamg->m_data_cols, pc_gamg->m_useSA,
453d3d6bff4SMark F. Adams                               &bs, &Parr[level1], &coarse_data, &isOK, &emaxs[level] );
4545b89ad90SMark F. Adams     CHKERRQ(ierr);
455d3d6bff4SMark F. Adams     ierr = PetscFree( data ); CHKERRQ( ierr );
4565ef31b24SMark F. Adams     ierr = PetscLogEventEnd(gamg_setup_stages[SET1],0,0,0,0);CHKERRQ(ierr);
4575ef31b24SMark F. Adams 
458baa4e9faSMark F. Adams     if(level==0) Aarr[0] = Amat; /* use Pmat for finest level setup, but use mat for solver */
459d3d6bff4SMark F. Adams 
460baa4e9faSMark F. Adams     if( isOK ) {
4615ef31b24SMark F. Adams       ierr = PetscLogEventBegin(gamg_setup_stages[SET2],0,0,0,0);CHKERRQ(ierr);
462d3d6bff4SMark F. Adams       ierr = partitionLevel( Aarr[level], pc_gamg->m_useSA ? bs : 1, pc_gamg->m_data_cols, bs,
463eb07cef2SMark F. Adams                              &Parr[level1], &coarse_data, &nactivepe, &Aarr[level1] );
4643530afc2SMark F. Adams       CHKERRQ(ierr);
4655ef31b24SMark F. Adams       ierr = PetscLogEventEnd(gamg_setup_stages[SET2],0,0,0,0);CHKERRQ(ierr);
4663530afc2SMark F. Adams       ierr = MatGetSize( Aarr[level1], &M, &N );CHKERRQ(ierr);
467d3d6bff4SMark F. Adams PetscPrintf(PETSC_COMM_WORLD,"\t\t[%d]%s %d) N=%d, bs=%d, n data cols=%d, %d active pes\n",0,__FUNCT__,level1,N,bs,pc_gamg->m_data_cols,nactivepe);
468e33ef3b1SMark F. Adams       /* coarse grids with SA can have zero row/cols from singleton aggregates */
469e33ef3b1SMark F. Adams       /* aggregation method can probably gaurrentee this does not happen! - be safe for now */
470e33ef3b1SMark F. Adams       if( PETSC_TRUE ){
471e33ef3b1SMark F. Adams         Vec diag; PetscScalar *data_arr,v; PetscInt Istart,Iend,kk,nloc,id;
472e33ef3b1SMark F. Adams         ierr = MatGetOwnershipRange(Aarr[level1], &Istart, &Iend); CHKERRQ(ierr);
473e33ef3b1SMark F. Adams         nloc = Iend-Istart;
474e33ef3b1SMark F. Adams         ierr = MatGetVecs( Aarr[level1], &diag, 0 );    CHKERRQ(ierr);
475e33ef3b1SMark F. Adams         ierr = MatGetDiagonal( Aarr[level1], diag );    CHKERRQ(ierr);
476e33ef3b1SMark F. Adams         ierr = VecGetArray( diag, &data_arr );   CHKERRQ(ierr);
477e33ef3b1SMark F. Adams         for(kk=0;kk<nloc;kk++){
478e33ef3b1SMark F. Adams           if(data_arr[kk]==0.0) {
479d3d6bff4SMark F. Adams             id = kk + Istart; v = 1.e-1;
480e33ef3b1SMark F. Adams             ierr = MatSetValues(Aarr[level1],1,&id,1,&id,&v,INSERT_VALUES);
481e33ef3b1SMark F. Adams             CHKERRQ(ierr);
482d3d6bff4SMark F. Adams             /* PetscPrintf(PETSC_COMM_SELF,"[%d]%s warning: added diag to zero (%d) on level %d \n",mype,__FUNCT__,id,level); */
483e33ef3b1SMark F. Adams           }
484e33ef3b1SMark F. Adams         }
485e33ef3b1SMark F. Adams         ierr = VecRestoreArray( diag, &data_arr ); CHKERRQ(ierr);
486e33ef3b1SMark F. Adams         ierr = VecDestroy( &diag );                CHKERRQ(ierr);
487e33ef3b1SMark F. Adams         ierr = MatAssemblyBegin(Aarr[level1],MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
488e33ef3b1SMark F. Adams         ierr = MatAssemblyEnd(Aarr[level1],MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
489e33ef3b1SMark F. Adams       }
490baa4e9faSMark F. Adams     }
491baa4e9faSMark F. Adams     else{
492baa4e9faSMark F. Adams       break;
493baa4e9faSMark F. Adams     }
494eb07cef2SMark F. Adams     data = coarse_data;
4955b89ad90SMark F. Adams   }
496eb07cef2SMark F. Adams   ierr = PetscFree( coarse_data ); CHKERRQ( ierr );
497baa4e9faSMark F. Adams PetscPrintf(PETSC_COMM_WORLD,"\t[%d]%s %d levels\n",0,__FUNCT__,level + 1);
4985b89ad90SMark F. Adams   pc_gamg->m_data = 0; /* destroyed coordinate data */
4995b89ad90SMark F. Adams   pc_gamg->m_Nlevels = level + 1;
5005b89ad90SMark F. Adams   fine_level = level;
501eb07cef2SMark F. Adams   ierr = PCMGSetLevels(a_pc,pc_gamg->m_Nlevels,PETSC_NULL);CHKERRQ(ierr);
5025b89ad90SMark F. Adams 
503fc4362bfSMark F. Adams   /* set default smoothers */
504587fa25dSMark F. Adams   for ( lidx=1, level = pc_gamg->m_Nlevels-2;
505587fa25dSMark F. Adams         lidx <= fine_level;
506587fa25dSMark F. Adams         lidx++, level--) {
5075745e0f5SMark F. Adams     PetscReal emax, emin;
5085b89ad90SMark F. Adams     KSP smoother; PC subpc;
509587fa25dSMark F. Adams     ierr = PCMGGetSmoother( a_pc, lidx, &smoother ); CHKERRQ(ierr);
5105b89ad90SMark F. Adams     ierr = KSPSetType( smoother, KSPCHEBYCHEV );CHKERRQ(ierr);
511038e3b61SMark F. Adams     if( emaxs[level] > 0.0 ) emax = emaxs[level];
512587fa25dSMark F. Adams     else{ /* eigen estimate 'emax' */
513587fa25dSMark F. Adams       KSP eksp; Mat Lmat = Aarr[level];
514fc4362bfSMark F. Adams       Vec bb, xx; PC pc;
515038e3b61SMark F. Adams 
5165745e0f5SMark F. Adams       ierr = MatGetVecs( Lmat, &bb, 0 );         CHKERRQ(ierr);
5175745e0f5SMark F. Adams       ierr = MatGetVecs( Lmat, &xx, 0 );         CHKERRQ(ierr);
518fc4362bfSMark F. Adams       {
519fc4362bfSMark F. Adams 	PetscRandom    rctx;
520fc4362bfSMark F. Adams 	ierr = PetscRandomCreate(wcomm,&rctx);CHKERRQ(ierr);
521fc4362bfSMark F. Adams 	ierr = PetscRandomSetFromOptions(rctx);CHKERRQ(ierr);
522fc4362bfSMark F. Adams 	ierr = VecSetRandom(bb,rctx);CHKERRQ(ierr);
523fc4362bfSMark F. Adams 	ierr = PetscRandomDestroy( &rctx ); CHKERRQ(ierr);
5245b89ad90SMark F. Adams       }
525fc4362bfSMark F. Adams       ierr = KSPCreate(wcomm,&eksp);CHKERRQ(ierr);
526e33ef3b1SMark F. Adams       ierr = KSPSetType( eksp, KSPCG );                      CHKERRQ(ierr);
527fc4362bfSMark F. Adams       ierr = KSPSetInitialGuessNonzero( eksp, PETSC_FALSE ); CHKERRQ(ierr);
5285745e0f5SMark F. Adams       ierr = KSPSetOperators( eksp, Lmat, Lmat, DIFFERENT_NONZERO_PATTERN ); CHKERRQ( ierr );
529fc4362bfSMark F. Adams       ierr = KSPGetPC( eksp, &pc );CHKERRQ( ierr );
530e33ef3b1SMark F. Adams       ierr = PCSetType( pc, PETSC_GAMG_SMOOTHER ); CHKERRQ(ierr); /* should be same as above */
531038e3b61SMark F. Adams       ierr = KSPSetTolerances( eksp, PETSC_DEFAULT, PETSC_DEFAULT, PETSC_DEFAULT, 10 );
532fc4362bfSMark F. Adams       CHKERRQ(ierr);
533e33ef3b1SMark F. Adams       //ierr = KSPSetConvergenceTest( eksp, KSPSkipConverged, 0, 0 ); CHKERRQ(ierr);
534fc4362bfSMark F. Adams       ierr = KSPSetNormType( eksp, KSP_NORM_NONE );                 CHKERRQ(ierr);
535fc4362bfSMark F. Adams 
536fc4362bfSMark F. Adams       ierr = KSPSetComputeSingularValues( eksp,PETSC_TRUE ); CHKERRQ(ierr);
537fc4362bfSMark F. Adams       ierr = KSPSolve( eksp, bb, xx ); CHKERRQ(ierr);
538fc4362bfSMark F. Adams       ierr = KSPComputeExtremeSingularValues( eksp, &emax, &emin ); CHKERRQ(ierr);
539fc4362bfSMark F. Adams       ierr = VecDestroy( &xx );       CHKERRQ(ierr);
540fc4362bfSMark F. Adams       ierr = VecDestroy( &bb );       CHKERRQ(ierr);
541fc4362bfSMark F. Adams       ierr = KSPDestroy( &eksp );       CHKERRQ(ierr);
542e33ef3b1SMark F. Adams       PetscPrintf(PETSC_COMM_WORLD,"%s max eigen = %e min = %e\n",__FUNCT__,emax,emin);
543fc4362bfSMark F. Adams     }
544038e3b61SMark F. Adams     {
545038e3b61SMark F. Adams       PetscInt N1, N0, tt;
546038e3b61SMark F. Adams       ierr = MatGetSize( Aarr[level], &N1, &tt );         CHKERRQ(ierr);
547038e3b61SMark F. Adams       ierr = MatGetSize( Aarr[level+1], &N0, &tt );       CHKERRQ(ierr);
548e33ef3b1SMark F. Adams       emin = .5*emax/((PetscReal)N1/(PetscReal)N0); /* this should be about the coarsening rate */
549038e3b61SMark F. Adams       emax *= 1.05;
550038e3b61SMark F. Adams     }
551038e3b61SMark F. Adams 
552587fa25dSMark F. Adams     ierr = KSPSetOperators( smoother, Aarr[level], Aarr[level], DIFFERENT_NONZERO_PATTERN );
553fc4362bfSMark F. Adams     ierr = KSPChebychevSetEigenvalues( smoother, emax, emin );CHKERRQ(ierr);
554e33ef3b1SMark F. Adams     ierr = KSPSetTolerances(smoother,PETSC_DEFAULT,PETSC_DEFAULT,PETSC_DEFAULT,2); CHKERRQ(ierr);
5555745e0f5SMark F. Adams     ierr = KSPGetPC( smoother, &subpc ); CHKERRQ(ierr);
556e33ef3b1SMark F. Adams     ierr = PCSetType( subpc, PETSC_GAMG_SMOOTHER ); CHKERRQ(ierr);
5575745e0f5SMark F. Adams     ierr = KSPSetNormType( smoother, KSP_NORM_NONE ); CHKERRQ(ierr);
5585745e0f5SMark F. Adams   }
5595745e0f5SMark F. Adams   {
5605745e0f5SMark F. Adams     KSP smoother; /* coarse grid */
5615745e0f5SMark F. Adams     Mat Lmat = Aarr[pc_gamg->m_Nlevels-1];
562eb07cef2SMark F. Adams     ierr = PCMGGetSmoother( a_pc, 0, &smoother ); CHKERRQ(ierr);
5635745e0f5SMark F. Adams     ierr = KSPSetOperators( smoother, Lmat, Lmat, DIFFERENT_NONZERO_PATTERN );
5645745e0f5SMark F. Adams     CHKERRQ(ierr);
5655745e0f5SMark F. Adams     ierr = KSPSetNormType( smoother, KSP_NORM_NONE ); CHKERRQ(ierr);
566fc4362bfSMark F. Adams   }
567fc4362bfSMark F. Adams   /* should be called in PCSetFromOptions_GAMG(), but cannot be called prior to PCMGSetLevels() */
568eb07cef2SMark F. Adams   ierr = PCSetFromOptions_MG(a_pc); CHKERRQ(ierr);
5695b89ad90SMark F. Adams   {
5705b89ad90SMark F. Adams     PetscBool galerkin;
571eb07cef2SMark F. Adams     ierr = PCMGGetGalerkin( a_pc,  &galerkin); CHKERRQ(ierr);
5725b89ad90SMark F. Adams     if(galerkin){
5735b89ad90SMark F. Adams       SETERRQ(wcomm,PETSC_ERR_ARG_WRONG, "GAMG does galerkin manually so it must not be used in PC_MG.");
5745b89ad90SMark F. Adams     }
5755b89ad90SMark F. Adams   }
5765745e0f5SMark F. Adams 
5775745e0f5SMark F. Adams   /* set interpolation between the levels, create timer stages, clean up */
5788f4b7eb5SMark F. Adams   if( PETSC_FALSE ) {
5795ef31b24SMark F. Adams     char str[32];
5805ef31b24SMark F. Adams     sprintf(str,"MG Level %d (%d)",0,pc_gamg->m_Nlevels-1);
5815ef31b24SMark F. Adams     PetscLogStageRegister(str, &gamg_stages[fine_level]);
5825ef31b24SMark F. Adams   }
583587fa25dSMark F. Adams   for (lidx=0,level=pc_gamg->m_Nlevels-1;
584587fa25dSMark F. Adams        lidx<fine_level;
585587fa25dSMark F. Adams        lidx++, level--){
586587fa25dSMark F. Adams     ierr = PCMGSetInterpolation( a_pc, lidx+1, Parr[level] );CHKERRQ(ierr);
5876c237d78SBarry Smith     if( !PETSC_TRUE ) {
58811e60469SMark F. Adams       PetscViewer viewer; char fname[32];
589038e3b61SMark F. Adams       sprintf(fname,"Pmat_%d.m",level);
59011e60469SMark F. Adams       ierr = PetscViewerASCIIOpen( wcomm, fname, &viewer );  CHKERRQ(ierr);
5915b89ad90SMark F. Adams       ierr = PetscViewerSetFormat( viewer, PETSC_VIEWER_ASCII_MATLAB);  CHKERRQ(ierr);
592038e3b61SMark F. Adams       ierr = MatView( Parr[level], viewer ); CHKERRQ(ierr);
5935b89ad90SMark F. Adams       ierr = PetscViewerDestroy( &viewer );
594e33ef3b1SMark F. Adams       sprintf(fname,"Amat_%d.m",level);
595e33ef3b1SMark F. Adams       ierr = PetscViewerASCIIOpen( wcomm, fname, &viewer );  CHKERRQ(ierr);
596e33ef3b1SMark F. Adams       ierr = PetscViewerSetFormat( viewer, PETSC_VIEWER_ASCII_MATLAB);  CHKERRQ(ierr);
597e33ef3b1SMark F. Adams       ierr = MatView( Aarr[level], viewer ); CHKERRQ(ierr);
598e33ef3b1SMark F. Adams       ierr = PetscViewerDestroy( &viewer );
5995b89ad90SMark F. Adams     }
600587fa25dSMark F. Adams     ierr = MatDestroy( &Parr[level] );  CHKERRQ(ierr);
601587fa25dSMark F. Adams     ierr = MatDestroy( &Aarr[level] );  CHKERRQ(ierr);
6028f4b7eb5SMark F. Adams     if( PETSC_FALSE ) {
6035ef31b24SMark F. Adams       char str[32];
604587fa25dSMark F. Adams       sprintf(str,"MG Level %d (%d)",lidx+1,level-1);
605587fa25dSMark F. Adams       PetscLogStageRegister(str, &gamg_stages[level-1]);
606a92563c5SMark F. Adams     }
6075b89ad90SMark F. Adams   }
6085745e0f5SMark F. Adams 
6095b89ad90SMark F. Adams   /* setupcalled is set to 0 so that MG is setup from scratch */
610eb07cef2SMark F. Adams   a_pc->setupcalled = 0;
611eb07cef2SMark F. Adams   ierr = PCSetUp_MG(a_pc);CHKERRQ(ierr);
612e33ef3b1SMark F. Adams 
6135b89ad90SMark F. Adams   PetscFunctionReturn(0);
6145b89ad90SMark F. Adams }
6155b89ad90SMark F. Adams 
616eb07cef2SMark F. Adams /* ------------------------------------------------------------------------- */
6175b89ad90SMark F. Adams /*
6185b89ad90SMark F. Adams    PCDestroy_GAMG - Destroys the private context for the GAMG preconditioner
6195b89ad90SMark F. Adams    that was created with PCCreate_GAMG().
6205b89ad90SMark F. Adams 
6215b89ad90SMark F. Adams    Input Parameter:
6225b89ad90SMark F. Adams .  pc - the preconditioner context
6235b89ad90SMark F. Adams 
6245b89ad90SMark F. Adams    Application Interface Routine: PCDestroy()
6255b89ad90SMark F. Adams */
6265b89ad90SMark F. Adams #undef __FUNCT__
6275b89ad90SMark F. Adams #define __FUNCT__ "PCDestroy_GAMG"
6285b89ad90SMark F. Adams PetscErrorCode PCDestroy_GAMG(PC pc)
6295b89ad90SMark F. Adams {
6305b89ad90SMark F. Adams   PetscErrorCode  ierr;
6315b89ad90SMark F. Adams   PC_MG           *mg = (PC_MG*)pc->data;
6325b89ad90SMark F. Adams   PC_GAMG         *pc_gamg= (PC_GAMG*)mg->innerctx;
6335b89ad90SMark F. Adams 
6345b89ad90SMark F. Adams   PetscFunctionBegin;
6355b89ad90SMark F. Adams   ierr = PCReset_GAMG(pc);CHKERRQ(ierr);
6365b89ad90SMark F. Adams   ierr = PetscFree(pc_gamg);CHKERRQ(ierr);
6375b89ad90SMark F. Adams   ierr = PCDestroy_MG(pc);CHKERRQ(ierr);
6385b89ad90SMark F. Adams   PetscFunctionReturn(0);
6395b89ad90SMark F. Adams }
6405b89ad90SMark F. Adams 
6415b89ad90SMark F. Adams #undef __FUNCT__
6425b89ad90SMark F. Adams #define __FUNCT__ "PCSetFromOptions_GAMG"
6435b89ad90SMark F. Adams PetscErrorCode PCSetFromOptions_GAMG(PC pc)
6445b89ad90SMark F. Adams {
6455b89ad90SMark F. Adams   /* PetscErrorCode  ierr; */
6465b89ad90SMark F. Adams   /* PC_MG           *mg = (PC_MG*)pc->data; */
6475b89ad90SMark F. Adams   /* PC_GAMG         *pc_gamg = (PC_GAMG*)mg->innerctx; */
6485b89ad90SMark F. Adams   /* MPI_Comm        comm = ((PetscObject)pc)->comm; */
6495b89ad90SMark F. Adams 
6505b89ad90SMark F. Adams   PetscFunctionBegin;
6515b89ad90SMark F. Adams   PetscFunctionReturn(0);
6525b89ad90SMark F. Adams }
6535b89ad90SMark F. Adams 
6545b89ad90SMark F. Adams /* -------------------------------------------------------------------------- */
6555b89ad90SMark F. Adams /*
6565b89ad90SMark F. Adams  PCCreate_GAMG - Creates a GAMG preconditioner context, PC_GAMG
6575b89ad90SMark F. Adams 
6585b89ad90SMark F. Adams    Input Parameter:
6595b89ad90SMark F. Adams .  pc - the preconditioner context
6605b89ad90SMark F. Adams 
6615b89ad90SMark F. Adams    Application Interface Routine: PCCreate()
6625b89ad90SMark F. Adams 
6635b89ad90SMark F. Adams   */
6645b89ad90SMark F. Adams  /* MC
6655b89ad90SMark F. Adams      PCGAMG - Use algebraic multigrid preconditioning. This preconditioner requires you provide
6665b89ad90SMark F. Adams        fine grid discretization matrix and coordinates on the fine grid.
6675b89ad90SMark F. Adams 
6685b89ad90SMark F. Adams    Options Database Key:
6695b89ad90SMark F. Adams    Multigrid options(inherited)
6705b89ad90SMark F. Adams +  -pc_mg_cycles <1>: 1 for V cycle, 2 for W-cycle (MGSetCycles)
6715b89ad90SMark F. Adams .  -pc_mg_smoothup <1>: Number of post-smoothing steps (MGSetNumberSmoothUp)
6725b89ad90SMark F. Adams .  -pc_mg_smoothdown <1>: Number of pre-smoothing steps (MGSetNumberSmoothDown)
6735b89ad90SMark F. Adams    -pc_mg_type <multiplicative>: (one of) additive multiplicative full cascade kascade
6745b89ad90SMark F. Adams    GAMG options:
6755b89ad90SMark F. Adams 
6765b89ad90SMark F. Adams    Level: intermediate
6775b89ad90SMark F. Adams   Concepts: multigrid
6785b89ad90SMark F. Adams 
6795b89ad90SMark F. Adams .seealso:  PCCreate(), PCSetType(), PCType (for list of available types), PC, PCMGType,
6805b89ad90SMark F. Adams            PCMGSetLevels(), PCMGGetLevels(), PCMGSetType(), MPSetCycles(), PCMGSetNumberSmoothDown(),
6815b89ad90SMark F. Adams            PCMGSetNumberSmoothUp(), PCMGGetCoarseSolve(), PCMGSetResidual(), PCMGSetInterpolation(),
6825b89ad90SMark F. Adams            PCMGSetRestriction(), PCMGGetSmoother(), PCMGGetSmootherUp(), PCMGGetSmootherDown(),
6835b89ad90SMark F. Adams            PCMGSetCyclesOnLevel(), PCMGSetRhs(), PCMGSetX(), PCMGSetR()
6845b89ad90SMark F. Adams M */
6855b89ad90SMark F. Adams 
6865b89ad90SMark F. Adams EXTERN_C_BEGIN
6875b89ad90SMark F. Adams #undef __FUNCT__
6885b89ad90SMark F. Adams #define __FUNCT__ "PCCreate_GAMG"
6895b89ad90SMark F. Adams PetscErrorCode  PCCreate_GAMG(PC pc)
6905b89ad90SMark F. Adams {
6915b89ad90SMark F. Adams   PetscErrorCode  ierr;
6925b89ad90SMark F. Adams   PC_GAMG         *pc_gamg;
6935b89ad90SMark F. Adams   PC_MG           *mg;
6945ef31b24SMark F. Adams   PetscClassId     cookie;
6955b89ad90SMark F. Adams 
6965b89ad90SMark F. Adams   PetscFunctionBegin;
6975b89ad90SMark F. Adams   /* PCGAMG is an inherited class of PCMG. Initialize pc as PCMG */
6985b89ad90SMark F. Adams   ierr = PCSetType(pc,PCMG);CHKERRQ(ierr); /* calls PCCreate_MG() and MGCreate_Private() */
6995b89ad90SMark F. Adams   ierr = PetscObjectChangeTypeName((PetscObject)pc,PCGAMG);CHKERRQ(ierr);
7005b89ad90SMark F. Adams 
7015b89ad90SMark F. Adams   /* create a supporting struct and attach it to pc */
7025b89ad90SMark F. Adams   ierr = PetscNewLog(pc,PC_GAMG,&pc_gamg);CHKERRQ(ierr);
7035b89ad90SMark F. Adams   mg = (PC_MG*)pc->data;
7045b89ad90SMark F. Adams   mg->innerctx = pc_gamg;
7055b89ad90SMark F. Adams 
7065b89ad90SMark F. Adams   pc_gamg->m_Nlevels    = -1;
7075b89ad90SMark F. Adams 
7085b89ad90SMark F. Adams   /* overwrite the pointers of PCMG by the functions of PCGAMG */
7095b89ad90SMark F. Adams   pc->ops->setfromoptions = PCSetFromOptions_GAMG;
7105b89ad90SMark F. Adams   pc->ops->setup          = PCSetUp_GAMG;
7115b89ad90SMark F. Adams   pc->ops->reset          = PCReset_GAMG;
7125b89ad90SMark F. Adams   pc->ops->destroy        = PCDestroy_GAMG;
7135b89ad90SMark F. Adams 
7145b89ad90SMark F. Adams   ierr = PetscObjectComposeFunctionDynamic( (PetscObject)pc,
7155b89ad90SMark F. Adams 					    "PCSetCoordinates_C",
7165b89ad90SMark F. Adams 					    "PCSetCoordinates_GAMG",
7175b89ad90SMark F. Adams 					    PCSetCoordinates_GAMG);CHKERRQ(ierr);
7185ef31b24SMark F. Adams 
7195ef31b24SMark F. Adams   PetscClassIdRegister("GAMG Setup",&cookie);
7205ef31b24SMark F. Adams   PetscLogEventRegister("GAMG-createProl", cookie, &gamg_setup_stages[SET1]);
7215ef31b24SMark F. Adams   PetscLogEventRegister("GAMG-partLevel", cookie, &gamg_setup_stages[SET2]);
7225ef31b24SMark F. Adams   PetscLogEventRegister("GAMG-MIS Graph", cookie, &gamg_setup_stages[SET3]);
7235ef31b24SMark F. Adams   PetscLogEventRegister("GAMG-MIS-Agg", cookie, &gamg_setup_stages[SET4]);
7245ef31b24SMark F. Adams   PetscLogEventRegister("GAMG-growSupp", cookie, &gamg_setup_stages[SET5]);
7255ef31b24SMark F. Adams   PetscLogEventRegister("GAMG-tri-Prol", cookie, &gamg_setup_stages[SET6]);
726e33ef3b1SMark F. Adams   PetscLogEventRegister("GAMG-sa-init", cookie, &gamg_setup_stages[SET7]);
727e33ef3b1SMark F. Adams   PetscLogEventRegister("GAMG-sa-frmProl0", cookie, &gamg_setup_stages[SET8]);
728e33ef3b1SMark F. Adams   PetscLogEventRegister("GAMG-sa-smooth", cookie, &gamg_setup_stages[SET9]);
7295ef31b24SMark F. Adams 
7305b89ad90SMark F. Adams   PetscFunctionReturn(0);
7315b89ad90SMark F. Adams }
7325b89ad90SMark F. Adams EXTERN_C_END
733