xref: /petsc/src/ksp/pc/impls/gamg/gamg.c (revision afc97cdc41892d7ef3be7129261ff8c2fb735c52)
/*
 GAMG geometric-algebraic multigrid PC - Mark Adams 2011
 */
45ef31b24SMark F. Adams #include <../src/ksp/pc/impls/gamg/gamg.h>
5f96513f1SMatthew G Knepley 
6f96513f1SMatthew G Knepley PetscLogEvent gamg_setup_stages[NUM_SET];
7f96513f1SMatthew G Knepley 
85b89ad90SMark F. Adams /* Private context for the GAMG preconditioner */
95b89ad90SMark F. Adams typedef struct gamg_TAG {
105b89ad90SMark F. Adams   PetscInt       m_dim;
115b89ad90SMark F. Adams   PetscInt       m_Nlevels;
125b89ad90SMark F. Adams   PetscInt       m_data_sz;
13d3d6bff4SMark F. Adams   PetscInt       m_data_rows;
14d3d6bff4SMark F. Adams   PetscInt       m_data_cols;
15d3d6bff4SMark F. Adams   PetscBool      m_useSA;
165b89ad90SMark F. Adams   PetscReal     *m_data; /* blocked vector of vertex data on fine grid (coordinates) */
175b89ad90SMark F. Adams } PC_GAMG;
185b89ad90SMark F. Adams 
195b89ad90SMark F. Adams /* -------------------------------------------------------------------------- */
205b89ad90SMark F. Adams /*
215b89ad90SMark F. Adams    PCSetCoordinates_GAMG
225b89ad90SMark F. Adams 
235b89ad90SMark F. Adams    Input Parameter:
245b89ad90SMark F. Adams    .  pc - the preconditioner context
255b89ad90SMark F. Adams */
26a92563c5SMark F. Adams EXTERN_C_BEGIN
275b89ad90SMark F. Adams #undef __FUNCT__
285b89ad90SMark F. Adams #define __FUNCT__ "PCSetCoordinates_GAMG"
29eb07cef2SMark F. Adams PetscErrorCode PCSetCoordinates_GAMG( PC a_pc, PetscInt a_ndm, PetscReal *a_coords )
305b89ad90SMark F. Adams {
31eb07cef2SMark F. Adams   PC_MG          *mg = (PC_MG*)a_pc->data;
325b89ad90SMark F. Adams   PC_GAMG        *pc_gamg = (PC_GAMG*)mg->innerctx;
336c237d78SBarry Smith   PetscErrorCode ierr;
34d3d6bff4SMark F. Adams   PetscInt       arrsz,bs,my0,kk,ii,jj,nloc,Iend;
35038e3b61SMark F. Adams   Mat            Amat = a_pc->pmat;
36d3d6bff4SMark F. Adams   PetscBool      flag;
37785cba28SMark F. Adams   char           str[64];
385b89ad90SMark F. Adams 
395b89ad90SMark F. Adams   PetscFunctionBegin;
40038e3b61SMark F. Adams   ierr  = MatGetBlockSize( Amat, &bs );               CHKERRQ( ierr );
41d3d6bff4SMark F. Adams   ierr  = MatGetOwnershipRange( Amat, &my0, &Iend ); CHKERRQ(ierr);
42d3d6bff4SMark F. Adams   nloc = (Iend-my0)/bs;
43d3d6bff4SMark F. Adams   if((Iend-my0)%bs!=0) SETERRQ1(((PetscObject)Amat)->comm,PETSC_ERR_ARG_WRONG, "Bad local size %d.",nloc);
44038e3b61SMark F. Adams 
45785cba28SMark F. Adams   ierr  = PetscOptionsGetString(PETSC_NULL,"-pc_gamg_type",str,64,&flag);    CHKERRQ( ierr );
46d3d6bff4SMark F. Adams   pc_gamg->m_useSA = (PetscBool)(flag && strcmp(str,"sa") == 0);
47038e3b61SMark F. Adams 
48d3d6bff4SMark F. Adams   pc_gamg->m_data_rows = 1;
49d3d6bff4SMark F. Adams   if(a_coords == 0) pc_gamg->m_useSA = PETSC_TRUE; /* use SA if no data */
50d3d6bff4SMark F. Adams   if( !pc_gamg->m_useSA ) pc_gamg->m_data_cols = a_ndm; /* coordinates */
51038e3b61SMark F. Adams   else{ /* SA: null space vectors */
52d3d6bff4SMark F. Adams     if(a_coords != 0 && bs==1 ) pc_gamg->m_data_cols = 1; /* scalar w/ coords and SA (not needed) */
53d3d6bff4SMark F. Adams     else if(a_coords != 0) pc_gamg->m_data_cols = (a_ndm==2 ? 3 : 6); /* elasticity */
54d3d6bff4SMark F. Adams     else pc_gamg->m_data_cols = bs; /* no data, force SA with constant null space vectors */
55d3d6bff4SMark F. Adams     pc_gamg->m_data_rows = bs;
56038e3b61SMark F. Adams   }
57d3d6bff4SMark F. Adams   arrsz = nloc*pc_gamg->m_data_rows*pc_gamg->m_data_cols;
585b89ad90SMark F. Adams 
59038e3b61SMark F. Adams   /* create data - syntactic sugar that should be refactored at some point */
606c237d78SBarry Smith   if (!pc_gamg->m_data || (pc_gamg->m_data_sz != arrsz)) {
615b89ad90SMark F. Adams     ierr = PetscFree( pc_gamg->m_data );  CHKERRQ(ierr);
62eb07cef2SMark F. Adams     ierr = PetscMalloc((arrsz+1)*sizeof(double), &pc_gamg->m_data ); CHKERRQ(ierr);
635b89ad90SMark F. Adams   }
64038e3b61SMark F. Adams   for(kk=0;kk<arrsz;kk++)pc_gamg->m_data[kk] = -999.;
65eb07cef2SMark F. Adams   pc_gamg->m_data[arrsz] = -99.;
66038e3b61SMark F. Adams   /* copy data in - column oriented */
67d3d6bff4SMark F. Adams   if( pc_gamg->m_useSA ) {
68d3d6bff4SMark F. Adams     const PetscInt M = Iend - my0;
69038e3b61SMark F. Adams     for(kk=0;kk<nloc;kk++){
70038e3b61SMark F. Adams       PetscReal *data = &pc_gamg->m_data[kk*bs];
71d3d6bff4SMark F. Adams       if( pc_gamg->m_data_cols==1 ) *data = 1.0;
72038e3b61SMark F. Adams       else {
73038e3b61SMark F. Adams         for(ii=0;ii<bs;ii++)
74038e3b61SMark F. Adams 	  for(jj=0;jj<bs;jj++)
75038e3b61SMark F. Adams 	    if(ii==jj)data[ii*M + jj] = 1.0; /* translational modes */
76038e3b61SMark F. Adams 	    else data[ii*M + jj] = 0.0;
77eb07cef2SMark F. Adams         if( a_coords != 0 ) {
78038e3b61SMark F. Adams           if( a_ndm == 2 ){ /* rotational modes */
79038e3b61SMark F. Adams             data += 2*M;
80038e3b61SMark F. Adams             data[0] = -a_coords[2*kk+1];
81038e3b61SMark F. Adams             data[1] =  a_coords[2*kk];
825b89ad90SMark F. Adams           }
83eb07cef2SMark F. Adams           else {
84038e3b61SMark F. Adams             data += 3*M;
85038e3b61SMark F. Adams             data[0] = 0.0;               data[M+0] =  a_coords[3*kk+2]; data[2*M+0] = -a_coords[3*kk+1];
86038e3b61SMark F. Adams             data[1] = -a_coords[3*kk+2]; data[M+1] = 0.0;               data[2*M+1] =  a_coords[3*kk];
87038e3b61SMark F. Adams             data[2] =  a_coords[3*kk+1]; data[M+2] = -a_coords[3*kk];   data[2*M+2] = 0.0;
88038e3b61SMark F. Adams           }
89eb07cef2SMark F. Adams         }
90eb07cef2SMark F. Adams       }
91eb07cef2SMark F. Adams     }
92eb07cef2SMark F. Adams   }
93eb07cef2SMark F. Adams   else {
94038e3b61SMark F. Adams     for( kk = 0 ; kk < nloc ; kk++ ){
95038e3b61SMark F. Adams       for( ii = 0 ; ii < a_ndm ; ii++ ) {
96038e3b61SMark F. Adams         pc_gamg->m_data[ii*nloc + kk] =  a_coords[kk*a_ndm + ii];
97eb07cef2SMark F. Adams       }
98eb07cef2SMark F. Adams     }
99038e3b61SMark F. Adams   }
100eb07cef2SMark F. Adams   assert(pc_gamg->m_data[arrsz] == -99.);
101038e3b61SMark F. Adams 
1025b89ad90SMark F. Adams   pc_gamg->m_data_sz = arrsz;
103eb07cef2SMark F. Adams   pc_gamg->m_dim = a_ndm;
1045b89ad90SMark F. Adams 
1055b89ad90SMark F. Adams   PetscFunctionReturn(0);
1065b89ad90SMark F. Adams }
107a92563c5SMark F. Adams EXTERN_C_END
1085b89ad90SMark F. Adams 
109d3d6bff4SMark F. Adams 
110d3d6bff4SMark F. Adams /* -----------------------------------------------------------------------------*/
111d3d6bff4SMark F. Adams #undef __FUNCT__
112d3d6bff4SMark F. Adams #define __FUNCT__ "PCReset_GAMG"
113d3d6bff4SMark F. Adams PetscErrorCode PCReset_GAMG(PC pc)
114d3d6bff4SMark F. Adams {
115d3d6bff4SMark F. Adams   PetscErrorCode  ierr;
116d3d6bff4SMark F. Adams   PC_MG           *mg = (PC_MG*)pc->data;
117d3d6bff4SMark F. Adams   PC_GAMG         *pc_gamg = (PC_GAMG*)mg->innerctx;
118d3d6bff4SMark F. Adams 
119d3d6bff4SMark F. Adams   PetscFunctionBegin;
120d3d6bff4SMark F. Adams   ierr = PetscFree(pc_gamg->m_data);CHKERRQ(ierr);
121d3d6bff4SMark F. Adams   pc_gamg->m_data = 0; pc_gamg->m_data_sz = 0;
122d3d6bff4SMark F. Adams   PetscFunctionReturn(0);
123d3d6bff4SMark F. Adams }
124d3d6bff4SMark F. Adams 
1255b89ad90SMark F. Adams /* -------------------------------------------------------------------------- */
1265b89ad90SMark F. Adams /*
12711e60469SMark F. Adams    partitionLevel
1285b89ad90SMark F. Adams 
1295b89ad90SMark F. Adams    Input Parameter:
1303530afc2SMark F. Adams    . a_Amat_fine - matrix on this fine (k) level
131d3d6bff4SMark F. Adams    . a_ndata_rows - size of data to move (coarse grid)
132d3d6bff4SMark F. Adams    . a_ndata_cols - size of data to move (coarse grid)
1333530afc2SMark F. Adams    In/Output Parameter:
1343530afc2SMark F. Adams    . a_P_inout - prolongation operator to the next level (k-1)
135eb07cef2SMark F. Adams    . a_coarse_data - data that need to be moved
136*afc97cdcSMark F. Adams    . a_nactive_proc - number of active procs
13711e60469SMark F. Adams    Output Parameter:
1383530afc2SMark F. Adams    . a_Amat_crs - coarse matrix that is created (k-1)
1395b89ad90SMark F. Adams */
1405cb416c2SMark F. Adams 
1415b89ad90SMark F. Adams #undef __FUNCT__
14211e60469SMark F. Adams #define __FUNCT__ "partitionLevel"
1433530afc2SMark F. Adams PetscErrorCode partitionLevel( Mat a_Amat_fine,
144d3d6bff4SMark F. Adams                                PetscInt a_ndata_rows,
145d3d6bff4SMark F. Adams                                PetscInt a_ndata_cols,
146038e3b61SMark F. Adams 			       PetscInt a_cbs,
1473530afc2SMark F. Adams                                Mat *a_P_inout,
148eb07cef2SMark F. Adams                                PetscReal **a_coarse_data,
149*afc97cdcSMark F. Adams                                PetscMPIInt *a_nactive_proc,
1503530afc2SMark F. Adams                                Mat *a_Amat_crs
15111e60469SMark F. Adams                                )
1525b89ad90SMark F. Adams {
1535b89ad90SMark F. Adams   PetscErrorCode   ierr;
154038e3b61SMark F. Adams   Mat              Cmat,Pnew,Pold=*a_P_inout;
15511e60469SMark F. Adams   IS               new_indices,isnum;
1563530afc2SMark F. Adams   MPI_Comm         wcomm = ((PetscObject)a_Amat_fine)->comm;
157*afc97cdcSMark F. Adams   PetscMPIInt      mype,npe;
158*afc97cdcSMark F. Adams   PetscInt         neq,NN,Istart,Iend,Istart0,Iend0,ncrs0,ncrs_new,fbs;
159e33ef3b1SMark F. Adams   PetscMPIInt      new_npe,targ_npe;
160737a81a9SMark F. Adams   PetscBool        flag = PETSC_FALSE;
1615b89ad90SMark F. Adams 
1625b89ad90SMark F. Adams   PetscFunctionBegin;
16311e60469SMark F. Adams   ierr = MPI_Comm_rank( wcomm, &mype ); CHKERRQ(ierr);
16411e60469SMark F. Adams   ierr = MPI_Comm_size( wcomm, &npe );  CHKERRQ(ierr);
165038e3b61SMark F. Adams   ierr = MatGetBlockSize( a_Amat_fine, &fbs ); CHKERRQ(ierr);
16611e60469SMark F. Adams   /* RAP */
167038e3b61SMark F. Adams   ierr = MatPtAP( a_Amat_fine, Pold, MAT_INITIAL_MATRIX, 2.0, &Cmat ); CHKERRQ(ierr);
168737a81a9SMark F. Adams 
169038e3b61SMark F. Adams   ierr = MatSetBlockSize( Cmat, a_cbs );      CHKERRQ(ierr);
170acadaa72SMark F. Adams 
171038e3b61SMark F. Adams   ierr = MatGetOwnershipRange( Cmat, &Istart0, &Iend0 ); CHKERRQ(ierr);
172038e3b61SMark F. Adams   ncrs0 = (Iend0-Istart0)/a_cbs; assert((Iend0-Istart0)%a_cbs == 0);
173038e3b61SMark F. Adams 
174038e3b61SMark F. Adams   /* Repartition Cmat_{k} and move colums of P^{k}_{k-1} and coordinates accordingly */
175038e3b61SMark F. Adams   ierr = MatGetSize( Cmat, &neq, &NN );CHKERRQ(ierr);
176*afc97cdcSMark F. Adams #define MIN_EQ_PROC 100
1773530afc2SMark F. Adams   targ_npe = neq/MIN_EQ_PROC; /* hardwire min. number of eq/proc */
178*afc97cdcSMark F. Adams #define TOP_GRID_LIM 1000
179*afc97cdcSMark F. Adams   if( targ_npe == 0 || neq < TOP_GRID_LIM ) {
180*afc97cdcSMark F. Adams     new_npe = 1; /* output for next level */
181*afc97cdcSMark F. Adams   }
182*afc97cdcSMark F. Adams   else if (targ_npe >= *a_nactive_proc ) new_npe = *a_nactive_proc; /* no change */
1833530afc2SMark F. Adams   else{
184*afc97cdcSMark F. Adams     PetscMPIInt factstart,fact,nactivepe=*a_nactive_proc;
185*afc97cdcSMark F. Adams     factstart = nactivepe;
186*afc97cdcSMark F. Adams     new_npe = -9999; /*???*/
1873530afc2SMark F. Adams     for(fact=factstart;fact>0;fact--){ /* try to find a better number of procs */
188*afc97cdcSMark F. Adams       if( nactivepe%fact==0 && neq/(nactivepe/fact) > MIN_EQ_PROC ) {
189*afc97cdcSMark F. Adams 	new_npe = nactivepe/fact;
1903530afc2SMark F. Adams       }
1913530afc2SMark F. Adams     }
192*afc97cdcSMark F. Adams     if( new_npe == -9999 ){
193*afc97cdcSMark F. Adams       new_npe = *a_nactive_proc; /*???*/
194*afc97cdcSMark F. Adams       PetscPrintf(PETSC_COMM_WORLD,"[%d]%s warning: failed to find reduced PE number, targ_npe=%d\n",mype,__FUNCT__,targ_npe);
1953530afc2SMark F. Adams     }
196*afc97cdcSMark F. Adams   }
197*afc97cdcSMark F. Adams   *a_nactive_proc = new_npe; /* this is a nominal value -- output */
198*afc97cdcSMark F. Adams   PetscPrintf(PETSC_COMM_WORLD,"[%d]%s new_npe=%d neq=%d\n",mype,__FUNCT__,new_npe,neq);
199737a81a9SMark F. Adams   ierr  = PetscOptionsHasName(PETSC_NULL,"-pc_gamg_avoid_repartitioning",&flag);
200737a81a9SMark F. Adams   CHKERRQ( ierr );
201737a81a9SMark F. Adams   if( !flag ) { /* re-partition */
20211e60469SMark F. Adams     MatPartitioning  mpart;
2035ef31b24SMark F. Adams     Mat              adj;
2045ef31b24SMark F. Adams     const PetscInt  *is_idx;
205*afc97cdcSMark F. Adams     PetscInt         is_sz,kk,jj,ii, *isnewproc_idx;
206c9a0b8beSMark F. Adams     /* create sub communicator  */
207c9a0b8beSMark F. Adams     MPI_Comm         cm,new_comm;
208e33ef3b1SMark F. Adams     IS               isnewproc;
209*afc97cdcSMark F. Adams     MPI_Group        wg, g2;
210*afc97cdcSMark F. Adams     PetscMPIInt      ranks[npe],counts[npe],nc=ncrs0;
211e33ef3b1SMark F. Adams 
212*afc97cdcSMark F. Adams     /* if( ncrs0 == 0 ) { */
213*afc97cdcSMark F. Adams /*       if(mype==0) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"zero local nodes on root -- increase min"); */
214*afc97cdcSMark F. Adams /*     } */
215*afc97cdcSMark F. Adams     ierr = MPI_Allgather( &nc, 1, MPI_INT, counts, 1, MPI_INT, wcomm ); CHKERRQ(ierr);
216*afc97cdcSMark F. Adams     assert(counts[mype]==ncrs0);
217*afc97cdcSMark F. Adams     /* count real active pes */
218*afc97cdcSMark F. Adams     for( new_npe = jj = 0 ; jj < npe ; jj++) {
219*afc97cdcSMark F. Adams       if( counts[jj] != 0 ) {
220*afc97cdcSMark F. Adams 	ranks[new_npe++] = jj;
221*afc97cdcSMark F. Adams       }
222*afc97cdcSMark F. Adams     }
223*afc97cdcSMark F. Adams     ierr = MPI_Comm_group( wcomm, &wg ); CHKERRQ(ierr);
224*afc97cdcSMark F. Adams     ierr = MPI_Group_incl( wg, new_npe, ranks, &g2 ); CHKERRQ(ierr);
225*afc97cdcSMark F. Adams     ierr = MPI_Comm_create( wcomm, g2, &cm ); CHKERRQ(ierr);
226*afc97cdcSMark F. Adams     if( cm != MPI_COMM_NULL ) {
227c9a0b8beSMark F. Adams       ierr = PetscCommDuplicate( cm, &new_comm, PETSC_NULL ); CHKERRQ(ierr);
228c9a0b8beSMark F. Adams       ierr = MPI_Comm_free( &cm );                             CHKERRQ(ierr);
229*afc97cdcSMark F. Adams     }
230*afc97cdcSMark F. Adams     ierr = MPI_Group_free( &wg );                            CHKERRQ(ierr);
231*afc97cdcSMark F. Adams     ierr = MPI_Group_free( &g2 );                            CHKERRQ(ierr);
232c9a0b8beSMark F. Adams 
2335ef31b24SMark F. Adams     /* MatPartitioningApply call MatConvert, which is collective */
234737a81a9SMark F. Adams     ierr = PetscLogEventBegin(gamg_setup_stages[SET12],0,0,0,0);CHKERRQ(ierr);
235038e3b61SMark F. Adams     if( a_cbs == 1) {
236038e3b61SMark F. Adams       ierr = MatConvert( Cmat, MATMPIADJ, MAT_INITIAL_MATRIX, &adj );   CHKERRQ(ierr);
237eb07cef2SMark F. Adams     }
238eb07cef2SMark F. Adams     else{
239038e3b61SMark F. Adams       /* make a scalar matrix to partition */
240eb07cef2SMark F. Adams       Mat tMat;
241eb07cef2SMark F. Adams       PetscInt Ii,ncols; const PetscScalar *vals; const PetscInt *idx;
2426876a03eSMark F. Adams       MatInfo info;
2436876a03eSMark F. Adams       ierr = MatGetInfo(Cmat,MAT_LOCAL,&info); CHKERRQ(ierr);
24455ea7f60SMark F. Adams       ncols = (PetscInt)info.nz_used/((ncrs0+1)*a_cbs*a_cbs)+1;
2456876a03eSMark F. Adams 
246eb07cef2SMark F. Adams       ierr = MatCreateMPIAIJ( wcomm, ncrs0, ncrs0,
247eb07cef2SMark F. Adams                               PETSC_DETERMINE, PETSC_DETERMINE,
2486876a03eSMark F. Adams                               2*ncols, PETSC_NULL, ncols, PETSC_NULL,
249eb07cef2SMark F. Adams                               &tMat );
2506876a03eSMark F. Adams       CHKERRQ(ierr);
251eb07cef2SMark F. Adams 
252eb07cef2SMark F. Adams       for ( Ii = Istart0; Ii < Iend0; Ii++ ) {
253038e3b61SMark F. Adams         PetscInt dest_row = Ii/a_cbs;
254038e3b61SMark F. Adams         ierr = MatGetRow(Cmat,Ii,&ncols,&idx,&vals); CHKERRQ(ierr);
255eb07cef2SMark F. Adams         for( jj = 0 ; jj < ncols ; jj++ ){
256038e3b61SMark F. Adams           PetscInt dest_col = idx[jj]/a_cbs;
257eb07cef2SMark F. Adams           PetscScalar v = 1.0;
258eb07cef2SMark F. Adams           ierr = MatSetValues(tMat,1,&dest_row,1,&dest_col,&v,ADD_VALUES); CHKERRQ(ierr);
259eb07cef2SMark F. Adams         }
260038e3b61SMark F. Adams         ierr = MatRestoreRow(Cmat,Ii,&ncols,&idx,&vals); CHKERRQ(ierr);
261eb07cef2SMark F. Adams       }
262eb07cef2SMark F. Adams       ierr = MatAssemblyBegin(tMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
263eb07cef2SMark F. Adams       ierr = MatAssemblyEnd(tMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
264eb07cef2SMark F. Adams 
265eb07cef2SMark F. Adams       ierr = MatConvert( tMat, MATMPIADJ, MAT_INITIAL_MATRIX, &adj );   CHKERRQ(ierr);
266eb07cef2SMark F. Adams 
267eb07cef2SMark F. Adams       ierr = MatDestroy( &tMat );  CHKERRQ(ierr);
268eb07cef2SMark F. Adams     }
269*afc97cdcSMark F. Adams     if( ncrs0 != 0 ){
270*afc97cdcSMark F. Adams       if(new_comm==MPI_COMM_NULL)SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"new_comm == MPI_COMM_NULL");
271*afc97cdcSMark F. Adams       /* if(ncrs0==0)SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"zero local nodes -- increase min"); */
2725ef31b24SMark F. Adams       /* hack to fix global data that pmetis.c uses in 'adj' */
273*afc97cdcSMark F. Adams       for(new_npe=jj=0 ; jj<npe ; jj++) {
274*afc97cdcSMark F. Adams 	if( counts[jj] != 0 ) {
275*afc97cdcSMark F. Adams 	  adj->rmap->range[new_npe++] = adj->rmap->range[jj];
276*afc97cdcSMark F. Adams 	}
2775ef31b24SMark F. Adams       }
2785ef31b24SMark F. Adams       ierr = MatPartitioningCreate( new_comm, &mpart ); CHKERRQ(ierr);
2795ef31b24SMark F. Adams       ierr = MatPartitioningSetAdjacency( mpart, adj ); CHKERRQ(ierr);
28011e60469SMark F. Adams       ierr = MatPartitioningSetFromOptions( mpart ); CHKERRQ(ierr);
2815ef31b24SMark F. Adams       ierr = MatPartitioningSetNParts( mpart, new_npe ); CHKERRQ(ierr);
28211e60469SMark F. Adams       ierr = MatPartitioningApply( mpart, &isnewproc ); CHKERRQ(ierr);
28311e60469SMark F. Adams       ierr = MatPartitioningDestroy( &mpart ); CHKERRQ(ierr);
2845ef31b24SMark F. Adams       /* collect IS info */
2855ef31b24SMark F. Adams       ierr = ISGetLocalSize( isnewproc, &is_sz );        CHKERRQ(ierr);
286038e3b61SMark F. Adams       ierr = PetscMalloc( a_cbs*is_sz*sizeof(PetscInt), &isnewproc_idx ); CHKERRQ(ierr);
2875ef31b24SMark F. Adams       ierr = ISGetIndices( isnewproc, &is_idx );     CHKERRQ(ierr);
288eb07cef2SMark F. Adams       /* spread partitioning across machine - probably the right thing to do but machine spec. */
289eb07cef2SMark F. Adams       for(kk=0,jj=0;kk<is_sz;kk++){
290*afc97cdcSMark F. Adams         for(ii=0 ; ii<a_cbs ; ii++, jj++ ) {
291*afc97cdcSMark F. Adams           isnewproc_idx[jj] = is_idx[kk]; /* distribution */
292eb07cef2SMark F. Adams         }
2935ef31b24SMark F. Adams       }
2945ef31b24SMark F. Adams       ierr = ISRestoreIndices( isnewproc, &is_idx );     CHKERRQ(ierr);
2955ef31b24SMark F. Adams       ierr = ISDestroy( &isnewproc );                    CHKERRQ(ierr);
296038e3b61SMark F. Adams       is_sz *= a_cbs;
297*afc97cdcSMark F. Adams 
298*afc97cdcSMark F. Adams       ierr = MPI_Comm_free( &new_comm );    CHKERRQ(ierr);
2995ef31b24SMark F. Adams     }
3005ef31b24SMark F. Adams     else{
3015ef31b24SMark F. Adams       isnewproc_idx = 0;
3025ef31b24SMark F. Adams       is_sz = 0;
3035ef31b24SMark F. Adams     }
3045ef31b24SMark F. Adams     ierr = MatDestroy( &adj );                       CHKERRQ(ierr);
3055ef31b24SMark F. Adams     ierr = ISCreateGeneral( wcomm, is_sz, isnewproc_idx, PETSC_COPY_VALUES, &isnewproc );
306*afc97cdcSMark F. Adams     if( isnewproc_idx != 0 ) {
3075ef31b24SMark F. Adams       ierr = PetscFree( isnewproc_idx );  CHKERRQ(ierr);
3085ef31b24SMark F. Adams     }
309e33ef3b1SMark F. Adams 
31011e60469SMark F. Adams     /*
31111e60469SMark F. Adams      Create an index set from the isnewproc index set to indicate the mapping TO
31211e60469SMark F. Adams      */
31311e60469SMark F. Adams     ierr = ISPartitioningToNumbering( isnewproc, &isnum ); CHKERRQ(ierr);
31411e60469SMark F. Adams     /*
31511e60469SMark F. Adams      Determine how many elements are assigned to each processor
31611e60469SMark F. Adams      */
31711e60469SMark F. Adams     ierr = ISPartitioningCount( isnewproc, npe, counts ); CHKERRQ(ierr);
31811e60469SMark F. Adams     ierr = ISDestroy( &isnewproc );                       CHKERRQ(ierr);
319038e3b61SMark F. Adams     ncrs_new = counts[mype]/a_cbs;
320737a81a9SMark F. Adams     ierr = PetscLogEventEnd(gamg_setup_stages[SET12],0,0,0,0);   CHKERRQ(ierr);
3215ef31b24SMark F. Adams 
32211e60469SMark F. Adams     { /* Create a vector to contain the newly ordered element information */
323d3d6bff4SMark F. Adams       const PetscInt *idx, data_sz=a_ndata_rows*a_ndata_cols;
324d3d6bff4SMark F. Adams       const PetscInt  stride0=ncrs0*a_ndata_rows,strideNew=ncrs_new*a_ndata_rows;
325038e3b61SMark F. Adams       PetscInt        ii,jj,kk;
32611e60469SMark F. Adams       IS              isscat;
32711e60469SMark F. Adams       PetscScalar    *array;
32811e60469SMark F. Adams       Vec             src_crd, dest_crd;
329eb07cef2SMark F. Adams       PetscReal      *data = *a_coarse_data;
33011e60469SMark F. Adams       VecScatter      vecscat;
331d3d6bff4SMark F. Adams       PetscInt        tidx[ncrs0*data_sz];
332acadaa72SMark F. Adams 
33311e60469SMark F. Adams       ierr = VecCreate( wcomm, &dest_crd );
334d3d6bff4SMark F. Adams       ierr = VecSetSizes( dest_crd, data_sz*ncrs_new, PETSC_DECIDE ); CHKERRQ(ierr);
33511e60469SMark F. Adams       ierr = VecSetFromOptions( dest_crd ); CHKERRQ(ierr); /*funny vector-get global options?*/
33611e60469SMark F. Adams       /*
337d3d6bff4SMark F. Adams        There are 'a_ndata_rows*a_ndata_cols' data items per node, (one can think of the vectors of having
338d3d6bff4SMark F. Adams        a block size of ...).  Note, ISs are expanded into equation space by 'a_cbs'.
33911e60469SMark F. Adams        */
34011e60469SMark F. Adams       ierr = ISGetIndices( isnum, &idx ); CHKERRQ(ierr);
341038e3b61SMark F. Adams       for(ii=0,jj=0; ii<ncrs0 ; ii++) {
342d3d6bff4SMark F. Adams         PetscInt id = idx[ii*a_cbs]/a_cbs; /* get node back */
343d3d6bff4SMark F. Adams         for( kk=0; kk<data_sz ; kk++, jj++) tidx[jj] = id*data_sz + kk;
34411e60469SMark F. Adams       }
345038e3b61SMark F. Adams       ierr = ISRestoreIndices( isnum, &idx ); CHKERRQ(ierr);
346d3d6bff4SMark F. Adams       ierr = ISCreateGeneral( wcomm, data_sz*ncrs0, tidx, PETSC_COPY_VALUES, &isscat );
34711e60469SMark F. Adams       CHKERRQ(ierr);
34811e60469SMark F. Adams       /*
34911e60469SMark F. Adams        Create a vector to contain the original vertex information for each element
35011e60469SMark F. Adams        */
351d3d6bff4SMark F. Adams       ierr = VecCreateSeq( PETSC_COMM_SELF, data_sz*ncrs0, &src_crd ); CHKERRQ(ierr);
352d3d6bff4SMark F. Adams       for( jj=0; jj<a_ndata_cols ; jj++ ) {
353d3d6bff4SMark F. Adams         for( ii=0 ; ii<ncrs0 ; ii++) {
354d3d6bff4SMark F. Adams           for( kk=0; kk<a_ndata_rows ; kk++ ) {
355d3d6bff4SMark F. Adams             PetscInt ix = ii*a_ndata_rows + kk + jj*stride0, jx = ii*data_sz + kk*a_ndata_cols + jj;
356d3d6bff4SMark F. Adams             ierr = VecSetValues( src_crd, 1, &jx, &data[ix], INSERT_VALUES );  CHKERRQ(ierr);
357d3d6bff4SMark F. Adams           }
358038e3b61SMark F. Adams         }
359eb07cef2SMark F. Adams       }
360eb07cef2SMark F. Adams       ierr = VecAssemblyBegin(src_crd); CHKERRQ(ierr);
361eb07cef2SMark F. Adams       ierr = VecAssemblyEnd(src_crd); CHKERRQ(ierr);
36211e60469SMark F. Adams       /*
36311e60469SMark F. Adams 	Scatter the element vertex information (still in the original vertex ordering)
36411e60469SMark F. Adams 	to the correct processor
36511e60469SMark F. Adams        */
36611e60469SMark F. Adams       ierr = VecScatterCreate( src_crd, PETSC_NULL, dest_crd, isscat, &vecscat);
36711e60469SMark F. Adams       CHKERRQ(ierr);
36811e60469SMark F. Adams       ierr = ISDestroy( &isscat );       CHKERRQ(ierr);
36911e60469SMark F. Adams       ierr = VecScatterBegin(vecscat,src_crd,dest_crd,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
37011e60469SMark F. Adams       ierr = VecScatterEnd(vecscat,src_crd,dest_crd,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
37111e60469SMark F. Adams       ierr = VecScatterDestroy( &vecscat );       CHKERRQ(ierr);
37211e60469SMark F. Adams       ierr = VecDestroy( &src_crd );       CHKERRQ(ierr);
37311e60469SMark F. Adams       /*
37411e60469SMark F. Adams 	Put the element vertex data into a new allocation of the gdata->ele
37511e60469SMark F. Adams       */
376eb07cef2SMark F. Adams       ierr = PetscFree( *a_coarse_data );    CHKERRQ(ierr);
377d3d6bff4SMark F. Adams       ierr = PetscMalloc( data_sz*ncrs_new*sizeof(PetscReal), a_coarse_data );    CHKERRQ(ierr);
378eb07cef2SMark F. Adams 
37911e60469SMark F. Adams       ierr = VecGetArray( dest_crd, &array );    CHKERRQ(ierr);
380eb07cef2SMark F. Adams       data = *a_coarse_data;
381d3d6bff4SMark F. Adams       for( jj=0; jj<a_ndata_cols ; jj++ ) {
382d3d6bff4SMark F. Adams         for( ii=0 ; ii<ncrs_new ; ii++) {
383d3d6bff4SMark F. Adams           for( kk=0; kk<a_ndata_rows ; kk++ ) {
384d3d6bff4SMark F. Adams             PetscInt ix = ii*a_ndata_rows + kk + jj*strideNew, jx = ii*data_sz + kk*a_ndata_cols + jj;
385d3d6bff4SMark F. Adams             data[ix] = PetscRealPart(array[jx]);
386d3d6bff4SMark F. Adams             array[jx] = 1.e300;
387d3d6bff4SMark F. Adams           }
388038e3b61SMark F. Adams         }
389038e3b61SMark F. Adams       }
39011e60469SMark F. Adams       ierr = VecRestoreArray( dest_crd, &array );    CHKERRQ(ierr);
39111e60469SMark F. Adams       ierr = VecDestroy( &dest_crd );    CHKERRQ(ierr);
39211e60469SMark F. Adams     }
393737a81a9SMark F. Adams 
39411e60469SMark F. Adams     /*
39511e60469SMark F. Adams       Invert for MatGetSubMatrix
39611e60469SMark F. Adams     */
397038e3b61SMark F. Adams     ierr = ISInvertPermutation( isnum, ncrs_new*a_cbs, &new_indices ); CHKERRQ(ierr);
39811e60469SMark F. Adams     ierr = ISSort( new_indices ); CHKERRQ(ierr); /* is this needed? */
39911e60469SMark F. Adams     ierr = ISDestroy( &isnum ); CHKERRQ(ierr);
40011e60469SMark F. Adams     /* A_crs output */
401038e3b61SMark F. Adams     ierr = MatGetSubMatrix( Cmat, new_indices, new_indices, MAT_INITIAL_MATRIX, a_Amat_crs );
40211e60469SMark F. Adams     CHKERRQ(ierr);
403eb07cef2SMark F. Adams 
404038e3b61SMark F. Adams     ierr = MatDestroy( &Cmat ); CHKERRQ(ierr);
405e33ef3b1SMark F. Adams     Cmat = *a_Amat_crs; /* output */
406038e3b61SMark F. Adams     ierr = MatSetBlockSize( Cmat, a_cbs );      CHKERRQ(ierr);
407eb07cef2SMark F. Adams 
40811e60469SMark F. Adams     /* prolongator */
40911e60469SMark F. Adams     ierr = MatGetOwnershipRange( Pold, &Istart, &Iend );    CHKERRQ(ierr);
41011e60469SMark F. Adams     {
41111e60469SMark F. Adams       IS findices;
41211e60469SMark F. Adams       ierr = ISCreateStride(wcomm,Iend-Istart,Istart,1,&findices);   CHKERRQ(ierr);
41311e60469SMark F. Adams       ierr = MatGetSubMatrix( Pold, findices, new_indices, MAT_INITIAL_MATRIX, &Pnew );
41411e60469SMark F. Adams       CHKERRQ(ierr);
41511e60469SMark F. Adams       ierr = ISDestroy( &findices ); CHKERRQ(ierr);
41611e60469SMark F. Adams     }
4173530afc2SMark F. Adams     ierr = MatDestroy( a_P_inout ); CHKERRQ(ierr);
4183530afc2SMark F. Adams     *a_P_inout = Pnew; /* output */
41911e60469SMark F. Adams     ierr = ISDestroy( &new_indices ); CHKERRQ(ierr);
420*afc97cdcSMark F. Adams 
421*afc97cdcSMark F. Adams     ierr = MatGetOwnershipRange(Cmat, &neq, &NN ); CHKERRQ(ierr);
422e33ef3b1SMark F. Adams   }
423e33ef3b1SMark F. Adams   else {
424e33ef3b1SMark F. Adams     *a_Amat_crs = Cmat; /* output */
425e33ef3b1SMark F. Adams   }
4265b89ad90SMark F. Adams 
4275b89ad90SMark F. Adams   PetscFunctionReturn(0);
4285b89ad90SMark F. Adams }
4295b89ad90SMark F. Adams 
/* Upper bound on the number of multigrid levels; sizes the per-level arrays
   and bounds the level loop in PCSetUp_GAMG */
#define GAMG_MAXLEVELS 30
#if defined(PETSC_USE_LOG)
/* log stages, only present when PETSc logging is compiled in */
PetscLogStage  gamg_stages[20];
#endif
4345b89ad90SMark F. Adams /* -------------------------------------------------------------------------- */
4355b89ad90SMark F. Adams /*
4365b89ad90SMark F. Adams    PCSetUp_GAMG - Prepares for the use of the GAMG preconditioner
4375b89ad90SMark F. Adams                     by setting data structures and options.
4385b89ad90SMark F. Adams 
4395b89ad90SMark F. Adams    Input Parameter:
4405b89ad90SMark F. Adams .  pc - the preconditioner context
4415b89ad90SMark F. Adams 
4425b89ad90SMark F. Adams    Application Interface Routine: PCSetUp()
4435b89ad90SMark F. Adams 
4445b89ad90SMark F. Adams    Notes:
4455b89ad90SMark F. Adams    The interface routine PCSetUp() is not usually called directly by
4465b89ad90SMark F. Adams    the user, but instead is called by PCApply() if necessary.
4475b89ad90SMark F. Adams */
4485b89ad90SMark F. Adams #undef __FUNCT__
4495b89ad90SMark F. Adams #define __FUNCT__ "PCSetUp_GAMG"
450eb07cef2SMark F. Adams PetscErrorCode PCSetUp_GAMG( PC a_pc )
4515b89ad90SMark F. Adams {
4525b89ad90SMark F. Adams   PetscErrorCode  ierr;
453eb07cef2SMark F. Adams   PC_MG           *mg = (PC_MG*)a_pc->data;
4545b89ad90SMark F. Adams   PC_GAMG         *pc_gamg = (PC_GAMG*)mg->innerctx;
455eb07cef2SMark F. Adams   Mat              Amat = a_pc->mat, Pmat = a_pc->pmat;
456d3d6bff4SMark F. Adams   PetscInt         fine_level, level, level1, M, N, bs, nloc, lidx, Istart, Iend;
457eb07cef2SMark F. Adams   MPI_Comm         wcomm = ((PetscObject)a_pc)->comm;
4583530afc2SMark F. Adams   PetscMPIInt      mype,npe,nactivepe;
459038e3b61SMark F. Adams   PetscBool        isOK;
460587fa25dSMark F. Adams   Mat              Aarr[GAMG_MAXLEVELS], Parr[GAMG_MAXLEVELS];
461587fa25dSMark F. Adams   PetscReal       *coarse_data = 0, *data, emaxs[GAMG_MAXLEVELS];
462737a81a9SMark F. Adams   MatInfo          info;
4635ef31b24SMark F. Adams 
4645b89ad90SMark F. Adams   PetscFunctionBegin;
465eb07cef2SMark F. Adams   if( a_pc->setupcalled ) {
466eb07cef2SMark F. Adams     /* no state data in GAMG to destroy */
467eb07cef2SMark F. Adams     ierr = PCReset_MG( a_pc ); CHKERRQ(ierr);
468eb07cef2SMark F. Adams   }
469baa4e9faSMark F. Adams   ierr = MPI_Comm_rank(wcomm,&mype);CHKERRQ(ierr);
470baa4e9faSMark F. Adams   ierr = MPI_Comm_size(wcomm,&npe);CHKERRQ(ierr);
4715b89ad90SMark F. Adams   /* GAMG requires input of fine-grid matrix. It determines nlevels. */
4725b89ad90SMark F. Adams   ierr = MatGetBlockSize( Amat, &bs ); CHKERRQ(ierr);
4733530afc2SMark F. Adams   ierr = MatGetSize( Amat, &M, &N );CHKERRQ(ierr);
474eb07cef2SMark F. Adams   ierr = MatGetOwnershipRange( Amat, &Istart, &Iend ); CHKERRQ(ierr);
475eb07cef2SMark F. Adams   nloc = (Iend-Istart)/bs; assert((Iend-Istart)%bs == 0);
476eb07cef2SMark F. Adams 
477038e3b61SMark F. Adams   /* get data of not around */
478038e3b61SMark F. Adams   if( pc_gamg->m_data == 0 && nloc > 0 ) {
479038e3b61SMark F. Adams     ierr  = PCSetCoordinates_GAMG( a_pc, -1, 0 );    CHKERRQ( ierr );
480eb07cef2SMark F. Adams   }
481eb07cef2SMark F. Adams   data = pc_gamg->m_data;
482038e3b61SMark F. Adams 
483eb07cef2SMark F. Adams   /* Get A_i and R_i */
484737a81a9SMark F. Adams   ierr = MatGetInfo(Amat,MAT_GLOBAL_SUM,&info); CHKERRQ(ierr);
485737a81a9SMark F. Adams   PetscPrintf(PETSC_COMM_WORLD,"\t[%d]%s level %d N=%d, n data rows=%d, n data cols=%d, nnz/row (ave)=%d, np=%d\n",
48604afdd00SMark F. Adams 	      mype,__FUNCT__,0,N,pc_gamg->m_data_rows,pc_gamg->m_data_cols,(PetscInt)(info.nz_used/(PetscReal)N),npe);
4878f4b7eb5SMark F. Adams   for ( level=0, Aarr[0] = Pmat, nactivepe = npe; /* hard wired stopping logic */
488785cba28SMark F. Adams         level < GAMG_MAXLEVELS-1 && (level==0 || M>TOP_GRID_LIM) && (npe==1 || nactivepe>1);
4890205a208SMark F. Adams         level++ ){
4905b89ad90SMark F. Adams     level1 = level + 1;
4915ef31b24SMark F. Adams     ierr = PetscLogEventBegin(gamg_setup_stages[SET1],0,0,0,0);CHKERRQ(ierr);
492d3d6bff4SMark F. Adams     ierr = createProlongation(Aarr[level], data, pc_gamg->m_dim, pc_gamg->m_data_cols, pc_gamg->m_useSA,
493785cba28SMark F. Adams                               level, &bs, &Parr[level1], &coarse_data, &isOK, &emaxs[level] );
4945b89ad90SMark F. Adams     CHKERRQ(ierr);
495d3d6bff4SMark F. Adams     ierr = PetscFree( data ); CHKERRQ( ierr );
4965ef31b24SMark F. Adams     ierr = PetscLogEventEnd(gamg_setup_stages[SET1],0,0,0,0);CHKERRQ(ierr);
4975ef31b24SMark F. Adams 
498baa4e9faSMark F. Adams     if(level==0) Aarr[0] = Amat; /* use Pmat for finest level setup, but use mat for solver */
499d3d6bff4SMark F. Adams 
500baa4e9faSMark F. Adams     if( isOK ) {
5015ef31b24SMark F. Adams       ierr = PetscLogEventBegin(gamg_setup_stages[SET2],0,0,0,0);CHKERRQ(ierr);
502d3d6bff4SMark F. Adams       ierr = partitionLevel( Aarr[level], pc_gamg->m_useSA ? bs : 1, pc_gamg->m_data_cols, bs,
503eb07cef2SMark F. Adams                              &Parr[level1], &coarse_data, &nactivepe, &Aarr[level1] );
5043530afc2SMark F. Adams       CHKERRQ(ierr);
5055ef31b24SMark F. Adams       ierr = PetscLogEventEnd(gamg_setup_stages[SET2],0,0,0,0);CHKERRQ(ierr);
5063530afc2SMark F. Adams       ierr = MatGetSize( Aarr[level1], &M, &N );CHKERRQ(ierr);
507737a81a9SMark F. Adams       ierr = MatGetInfo(Aarr[level1],MAT_GLOBAL_SUM,&info); CHKERRQ(ierr);
508737a81a9SMark F. Adams       PetscPrintf(PETSC_COMM_WORLD,"\t\t[%d]%s %d) N=%d, bs=%d, n data cols=%d, nnz/row (ave)=%d, %d active pes\n",
50904afdd00SMark F. Adams 		  mype,__FUNCT__,level1,N,bs,pc_gamg->m_data_cols,(PetscInt)(info.nz_used/(PetscReal)N),nactivepe);
510e33ef3b1SMark F. Adams       /* coarse grids with SA can have zero row/cols from singleton aggregates */
511e33ef3b1SMark F. Adams       /* aggregation method can probably gaurrentee this does not happen! - be safe for now */
512737a81a9SMark F. Adams 
513e33ef3b1SMark F. Adams       if( PETSC_TRUE ){
514785cba28SMark F. Adams         Vec diag; PetscScalar *data_arr,v; PetscInt Istart,Iend,kk,nloceq,id;
515785cba28SMark F. Adams         v = 1.e-10; /* LU factor has hard wired numbers for small diags so this needs to match (yuk) */
516e33ef3b1SMark F. Adams         ierr = MatGetOwnershipRange(Aarr[level1], &Istart, &Iend); CHKERRQ(ierr);
517785cba28SMark F. Adams         nloceq = Iend-Istart;
518e33ef3b1SMark F. Adams         ierr = MatGetVecs( Aarr[level1], &diag, 0 );    CHKERRQ(ierr);
519e33ef3b1SMark F. Adams         ierr = MatGetDiagonal( Aarr[level1], diag );    CHKERRQ(ierr);
520e33ef3b1SMark F. Adams         ierr = VecGetArray( diag, &data_arr );   CHKERRQ(ierr);
521785cba28SMark F. Adams         for(kk=0;kk<nloceq;kk++){
522e33ef3b1SMark F. Adams           if(data_arr[kk]==0.0) {
523785cba28SMark F. Adams             id = kk + Istart;
524e33ef3b1SMark F. Adams             ierr = MatSetValues(Aarr[level1],1,&id,1,&id,&v,INSERT_VALUES);
525e33ef3b1SMark F. Adams             CHKERRQ(ierr);
526785cba28SMark F. Adams             PetscPrintf(PETSC_COMM_SELF,"\t[%d]%s warning: added diag to zero (%d) on level %d \n",mype,__FUNCT__,id,level);
527e33ef3b1SMark F. Adams           }
528e33ef3b1SMark F. Adams         }
529e33ef3b1SMark F. Adams         ierr = VecRestoreArray( diag, &data_arr ); CHKERRQ(ierr);
530e33ef3b1SMark F. Adams         ierr = VecDestroy( &diag );                CHKERRQ(ierr);
531e33ef3b1SMark F. Adams         ierr = MatAssemblyBegin(Aarr[level1],MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
532e33ef3b1SMark F. Adams         ierr = MatAssemblyEnd(Aarr[level1],MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
533e33ef3b1SMark F. Adams       }
534baa4e9faSMark F. Adams     }
535baa4e9faSMark F. Adams     else{
536be544d3cSMark F. Adams       coarse_data = 0;
537baa4e9faSMark F. Adams       break;
538baa4e9faSMark F. Adams     }
539eb07cef2SMark F. Adams     data = coarse_data;
5405b89ad90SMark F. Adams   }
541be544d3cSMark F. Adams   if( coarse_data ) {
542eb07cef2SMark F. Adams     ierr = PetscFree( coarse_data ); CHKERRQ( ierr );
543be544d3cSMark F. Adams   }
544baa4e9faSMark F. Adams   PetscPrintf(PETSC_COMM_WORLD,"\t[%d]%s %d levels\n",0,__FUNCT__,level + 1);
5455b89ad90SMark F. Adams   pc_gamg->m_data = 0; /* destroyed coordinate data */
5465b89ad90SMark F. Adams   pc_gamg->m_Nlevels = level + 1;
5475b89ad90SMark F. Adams   fine_level = level;
548eb07cef2SMark F. Adams   ierr = PCMGSetLevels(a_pc,pc_gamg->m_Nlevels,PETSC_NULL);CHKERRQ(ierr);
5495b89ad90SMark F. Adams 
550fc4362bfSMark F. Adams   /* set default smoothers */
551587fa25dSMark F. Adams   for ( lidx=1, level = pc_gamg->m_Nlevels-2;
552587fa25dSMark F. Adams         lidx <= fine_level;
553587fa25dSMark F. Adams         lidx++, level--) {
5545745e0f5SMark F. Adams     PetscReal emax, emin;
5555b89ad90SMark F. Adams     KSP smoother; PC subpc;
556587fa25dSMark F. Adams     ierr = PCMGGetSmoother( a_pc, lidx, &smoother ); CHKERRQ(ierr);
5575b89ad90SMark F. Adams     ierr = KSPSetType( smoother, KSPCHEBYCHEV );CHKERRQ(ierr);
558038e3b61SMark F. Adams     if( emaxs[level] > 0.0 ) emax=emaxs[level];
559587fa25dSMark F. Adams     else{ /* eigen estimate 'emax' */
560587fa25dSMark F. Adams       KSP eksp; Mat Lmat = Aarr[level];
561fc4362bfSMark F. Adams       Vec bb, xx; PC pc;
562038e3b61SMark F. Adams 
5635745e0f5SMark F. Adams       ierr = MatGetVecs( Lmat, &bb, 0 );         CHKERRQ(ierr);
5645745e0f5SMark F. Adams       ierr = MatGetVecs( Lmat, &xx, 0 );         CHKERRQ(ierr);
565fc4362bfSMark F. Adams       {
566fc4362bfSMark F. Adams 	PetscRandom    rctx;
567fc4362bfSMark F. Adams 	ierr = PetscRandomCreate(wcomm,&rctx);CHKERRQ(ierr);
568fc4362bfSMark F. Adams 	ierr = PetscRandomSetFromOptions(rctx);CHKERRQ(ierr);
569fc4362bfSMark F. Adams 	ierr = VecSetRandom(bb,rctx);CHKERRQ(ierr);
570fc4362bfSMark F. Adams 	ierr = PetscRandomDestroy( &rctx ); CHKERRQ(ierr);
5715b89ad90SMark F. Adams       }
572fc4362bfSMark F. Adams       ierr = KSPCreate(wcomm,&eksp);CHKERRQ(ierr);
573e33ef3b1SMark F. Adams       ierr = KSPSetType( eksp, KSPCG );                      CHKERRQ(ierr);
574fc4362bfSMark F. Adams       ierr = KSPSetInitialGuessNonzero( eksp, PETSC_FALSE ); CHKERRQ(ierr);
5755745e0f5SMark F. Adams       ierr = KSPSetOperators( eksp, Lmat, Lmat, DIFFERENT_NONZERO_PATTERN ); CHKERRQ( ierr );
576fc4362bfSMark F. Adams       ierr = KSPGetPC( eksp, &pc );CHKERRQ( ierr );
5771fddbf69SMark F. Adams       ierr = PCSetType( pc, PCPBJACOBI ); CHKERRQ(ierr); /* should be same as above */
578038e3b61SMark F. Adams       ierr = KSPSetTolerances( eksp, PETSC_DEFAULT, PETSC_DEFAULT, PETSC_DEFAULT, 10 );
579fc4362bfSMark F. Adams       CHKERRQ(ierr);
580e33ef3b1SMark F. Adams       //ierr = KSPSetConvergenceTest( eksp, KSPSkipConverged, 0, 0 ); CHKERRQ(ierr);
581fc4362bfSMark F. Adams       ierr = KSPSetNormType( eksp, KSP_NORM_NONE );                 CHKERRQ(ierr);
582fc4362bfSMark F. Adams 
583fc4362bfSMark F. Adams       ierr = KSPSetComputeSingularValues( eksp,PETSC_TRUE ); CHKERRQ(ierr);
584fc4362bfSMark F. Adams       ierr = KSPSolve( eksp, bb, xx ); CHKERRQ(ierr);
585fc4362bfSMark F. Adams       ierr = KSPComputeExtremeSingularValues( eksp, &emax, &emin ); CHKERRQ(ierr);
586fc4362bfSMark F. Adams       ierr = VecDestroy( &xx );       CHKERRQ(ierr);
587fc4362bfSMark F. Adams       ierr = VecDestroy( &bb );       CHKERRQ(ierr);
588fc4362bfSMark F. Adams       ierr = KSPDestroy( &eksp );       CHKERRQ(ierr);
5891fddbf69SMark F. Adams       PetscPrintf(PETSC_COMM_WORLD,"\t\t\t%s max eigen=%e min=%e PC=%s\n",__FUNCT__,emax,emin,PETSC_GAMG_SMOOTHER);
590fc4362bfSMark F. Adams     }
591038e3b61SMark F. Adams     {
592038e3b61SMark F. Adams       PetscInt N1, N0, tt;
593038e3b61SMark F. Adams       ierr = MatGetSize( Aarr[level], &N1, &tt );         CHKERRQ(ierr);
594038e3b61SMark F. Adams       ierr = MatGetSize( Aarr[level+1], &N0, &tt );       CHKERRQ(ierr);
595785cba28SMark F. Adams       emin = 1.*emax/((PetscReal)N1/(PetscReal)N0); /* this should be about the coarsening rate */
596038e3b61SMark F. Adams       emax *= 1.05;
5971fddbf69SMark F. Adams 
598038e3b61SMark F. Adams     }
599038e3b61SMark F. Adams 
600587fa25dSMark F. Adams     ierr = KSPSetOperators( smoother, Aarr[level], Aarr[level], DIFFERENT_NONZERO_PATTERN );
601fc4362bfSMark F. Adams     ierr = KSPChebychevSetEigenvalues( smoother, emax, emin );CHKERRQ(ierr);
6020e1b4bd6SMark F. Adams     /*ierr = KSPSetTolerances(smoother,PETSC_DEFAULT,PETSC_DEFAULT,PETSC_DEFAULT,2); CHKERRQ(ierr);*/
6035745e0f5SMark F. Adams     ierr = KSPGetPC( smoother, &subpc ); CHKERRQ(ierr);
604e33ef3b1SMark F. Adams     ierr = PCSetType( subpc, PETSC_GAMG_SMOOTHER ); CHKERRQ(ierr);
6055745e0f5SMark F. Adams     ierr = KSPSetNormType( smoother, KSP_NORM_NONE ); CHKERRQ(ierr);
6065745e0f5SMark F. Adams   }
6075745e0f5SMark F. Adams   {
6085745e0f5SMark F. Adams     KSP smoother; /* coarse grid */
6095745e0f5SMark F. Adams     Mat Lmat = Aarr[pc_gamg->m_Nlevels-1];
610eb07cef2SMark F. Adams     ierr = PCMGGetSmoother( a_pc, 0, &smoother ); CHKERRQ(ierr);
6115745e0f5SMark F. Adams     ierr = KSPSetOperators( smoother, Lmat, Lmat, DIFFERENT_NONZERO_PATTERN );
6125745e0f5SMark F. Adams     CHKERRQ(ierr);
6135745e0f5SMark F. Adams     ierr = KSPSetNormType( smoother, KSP_NORM_NONE ); CHKERRQ(ierr);
614fc4362bfSMark F. Adams   }
615737a81a9SMark F. Adams 
616fc4362bfSMark F. Adams   /* should be called in PCSetFromOptions_GAMG(), but cannot be called prior to PCMGSetLevels() */
617eb07cef2SMark F. Adams   ierr = PCSetFromOptions_MG(a_pc); CHKERRQ(ierr);
6185b89ad90SMark F. Adams   {
6195b89ad90SMark F. Adams     PetscBool galerkin;
620eb07cef2SMark F. Adams     ierr = PCMGGetGalerkin( a_pc,  &galerkin); CHKERRQ(ierr);
6215b89ad90SMark F. Adams     if(galerkin){
6225b89ad90SMark F. Adams       SETERRQ(wcomm,PETSC_ERR_ARG_WRONG, "GAMG does galerkin manually so it must not be used in PC_MG.");
6235b89ad90SMark F. Adams     }
6245b89ad90SMark F. Adams   }
6255745e0f5SMark F. Adams 
6265745e0f5SMark F. Adams   /* set interpolation between the levels, create timer stages, clean up */
6278f4b7eb5SMark F. Adams   if( PETSC_FALSE ) {
6285ef31b24SMark F. Adams     char str[32];
6295ef31b24SMark F. Adams     sprintf(str,"MG Level %d (%d)",0,pc_gamg->m_Nlevels-1);
6305ef31b24SMark F. Adams     PetscLogStageRegister(str, &gamg_stages[fine_level]);
6315ef31b24SMark F. Adams   }
632587fa25dSMark F. Adams   for (lidx=0,level=pc_gamg->m_Nlevels-1;
633587fa25dSMark F. Adams        lidx<fine_level;
634587fa25dSMark F. Adams        lidx++, level--){
635587fa25dSMark F. Adams     ierr = PCMGSetInterpolation( a_pc, lidx+1, Parr[level] );CHKERRQ(ierr);
6366c237d78SBarry Smith     if( !PETSC_TRUE ) {
63711e60469SMark F. Adams       PetscViewer viewer; char fname[32];
638038e3b61SMark F. Adams       sprintf(fname,"Pmat_%d.m",level);
63911e60469SMark F. Adams       ierr = PetscViewerASCIIOpen( wcomm, fname, &viewer );  CHKERRQ(ierr);
6405b89ad90SMark F. Adams       ierr = PetscViewerSetFormat( viewer, PETSC_VIEWER_ASCII_MATLAB);  CHKERRQ(ierr);
641038e3b61SMark F. Adams       ierr = MatView( Parr[level], viewer ); CHKERRQ(ierr);
6425b89ad90SMark F. Adams       ierr = PetscViewerDestroy( &viewer );
643e33ef3b1SMark F. Adams       sprintf(fname,"Amat_%d.m",level);
644e33ef3b1SMark F. Adams       ierr = PetscViewerASCIIOpen( wcomm, fname, &viewer );  CHKERRQ(ierr);
645e33ef3b1SMark F. Adams       ierr = PetscViewerSetFormat( viewer, PETSC_VIEWER_ASCII_MATLAB);  CHKERRQ(ierr);
646e33ef3b1SMark F. Adams       ierr = MatView( Aarr[level], viewer ); CHKERRQ(ierr);
647e33ef3b1SMark F. Adams       ierr = PetscViewerDestroy( &viewer );
6485b89ad90SMark F. Adams     }
649587fa25dSMark F. Adams     ierr = MatDestroy( &Parr[level] );  CHKERRQ(ierr);
650587fa25dSMark F. Adams     ierr = MatDestroy( &Aarr[level] );  CHKERRQ(ierr);
6518f4b7eb5SMark F. Adams     if( PETSC_FALSE ) {
6525ef31b24SMark F. Adams       char str[32];
653587fa25dSMark F. Adams       sprintf(str,"MG Level %d (%d)",lidx+1,level-1);
654587fa25dSMark F. Adams       PetscLogStageRegister(str, &gamg_stages[level-1]);
655a92563c5SMark F. Adams     }
6565b89ad90SMark F. Adams   }
6575745e0f5SMark F. Adams 
6585b89ad90SMark F. Adams   /* setupcalled is set to 0 so that MG is setup from scratch */
659eb07cef2SMark F. Adams   a_pc->setupcalled = 0;
660eb07cef2SMark F. Adams   ierr = PCSetUp_MG(a_pc);CHKERRQ(ierr);
661e33ef3b1SMark F. Adams 
6625b89ad90SMark F. Adams   PetscFunctionReturn(0);
6635b89ad90SMark F. Adams }
6645b89ad90SMark F. Adams 
665eb07cef2SMark F. Adams /* ------------------------------------------------------------------------- */
6665b89ad90SMark F. Adams /*
6675b89ad90SMark F. Adams    PCDestroy_GAMG - Destroys the private context for the GAMG preconditioner
6685b89ad90SMark F. Adams    that was created with PCCreate_GAMG().
6695b89ad90SMark F. Adams 
6705b89ad90SMark F. Adams    Input Parameter:
6715b89ad90SMark F. Adams .  pc - the preconditioner context
6725b89ad90SMark F. Adams 
6735b89ad90SMark F. Adams    Application Interface Routine: PCDestroy()
6745b89ad90SMark F. Adams */
6755b89ad90SMark F. Adams #undef __FUNCT__
6765b89ad90SMark F. Adams #define __FUNCT__ "PCDestroy_GAMG"
6775b89ad90SMark F. Adams PetscErrorCode PCDestroy_GAMG(PC pc)
6785b89ad90SMark F. Adams {
6795b89ad90SMark F. Adams   PetscErrorCode  ierr;
6805b89ad90SMark F. Adams   PC_MG           *mg = (PC_MG*)pc->data;
6815b89ad90SMark F. Adams   PC_GAMG         *pc_gamg= (PC_GAMG*)mg->innerctx;
6825b89ad90SMark F. Adams 
6835b89ad90SMark F. Adams   PetscFunctionBegin;
6845b89ad90SMark F. Adams   ierr = PCReset_GAMG(pc);CHKERRQ(ierr);
6855b89ad90SMark F. Adams   ierr = PetscFree(pc_gamg);CHKERRQ(ierr);
6865b89ad90SMark F. Adams   ierr = PCDestroy_MG(pc);CHKERRQ(ierr);
6875b89ad90SMark F. Adams   PetscFunctionReturn(0);
6885b89ad90SMark F. Adams }
6895b89ad90SMark F. Adams 
6905b89ad90SMark F. Adams #undef __FUNCT__
6915b89ad90SMark F. Adams #define __FUNCT__ "PCSetFromOptions_GAMG"
6925b89ad90SMark F. Adams PetscErrorCode PCSetFromOptions_GAMG(PC pc)
6935b89ad90SMark F. Adams {
6945b89ad90SMark F. Adams   /* PetscErrorCode  ierr; */
6955b89ad90SMark F. Adams   /* PC_MG           *mg = (PC_MG*)pc->data; */
6965b89ad90SMark F. Adams   /* PC_GAMG         *pc_gamg = (PC_GAMG*)mg->innerctx; */
6975b89ad90SMark F. Adams   /* MPI_Comm        comm = ((PetscObject)pc)->comm; */
6985b89ad90SMark F. Adams 
6995b89ad90SMark F. Adams   PetscFunctionBegin;
7005b89ad90SMark F. Adams   PetscFunctionReturn(0);
7015b89ad90SMark F. Adams }
7025b89ad90SMark F. Adams 
7035b89ad90SMark F. Adams /* -------------------------------------------------------------------------- */
7045b89ad90SMark F. Adams /*
7055b89ad90SMark F. Adams  PCCreate_GAMG - Creates a GAMG preconditioner context, PC_GAMG
7065b89ad90SMark F. Adams 
7075b89ad90SMark F. Adams    Input Parameter:
7085b89ad90SMark F. Adams .  pc - the preconditioner context
7095b89ad90SMark F. Adams 
7105b89ad90SMark F. Adams    Application Interface Routine: PCCreate()
7115b89ad90SMark F. Adams 
7125b89ad90SMark F. Adams   */
7135b89ad90SMark F. Adams  /* MC
7145b89ad90SMark F. Adams      PCGAMG - Use algebraic multigrid preconditioning. This preconditioner requires you provide
7155b89ad90SMark F. Adams        fine grid discretization matrix and coordinates on the fine grid.
7165b89ad90SMark F. Adams 
7175b89ad90SMark F. Adams    Options Database Key:
7185b89ad90SMark F. Adams    Multigrid options(inherited)
7195b89ad90SMark F. Adams +  -pc_mg_cycles <1>: 1 for V cycle, 2 for W-cycle (MGSetCycles)
7205b89ad90SMark F. Adams .  -pc_mg_smoothup <1>: Number of post-smoothing steps (MGSetNumberSmoothUp)
7215b89ad90SMark F. Adams .  -pc_mg_smoothdown <1>: Number of pre-smoothing steps (MGSetNumberSmoothDown)
7225b89ad90SMark F. Adams    -pc_mg_type <multiplicative>: (one of) additive multiplicative full cascade kascade
7235b89ad90SMark F. Adams    GAMG options:
7245b89ad90SMark F. Adams 
7255b89ad90SMark F. Adams    Level: intermediate
7265b89ad90SMark F. Adams   Concepts: multigrid
7275b89ad90SMark F. Adams 
7285b89ad90SMark F. Adams .seealso:  PCCreate(), PCSetType(), PCType (for list of available types), PC, PCMGType,
7295b89ad90SMark F. Adams            PCMGSetLevels(), PCMGGetLevels(), PCMGSetType(), MPSetCycles(), PCMGSetNumberSmoothDown(),
7305b89ad90SMark F. Adams            PCMGSetNumberSmoothUp(), PCMGGetCoarseSolve(), PCMGSetResidual(), PCMGSetInterpolation(),
7315b89ad90SMark F. Adams            PCMGSetRestriction(), PCMGGetSmoother(), PCMGGetSmootherUp(), PCMGGetSmootherDown(),
7325b89ad90SMark F. Adams            PCMGSetCyclesOnLevel(), PCMGSetRhs(), PCMGSetX(), PCMGSetR()
7335b89ad90SMark F. Adams M */
7345b89ad90SMark F. Adams 
7355b89ad90SMark F. Adams EXTERN_C_BEGIN
7365b89ad90SMark F. Adams #undef __FUNCT__
7375b89ad90SMark F. Adams #define __FUNCT__ "PCCreate_GAMG"
7385b89ad90SMark F. Adams PetscErrorCode  PCCreate_GAMG(PC pc)
7395b89ad90SMark F. Adams {
7405b89ad90SMark F. Adams   PetscErrorCode  ierr;
7415b89ad90SMark F. Adams   PC_GAMG         *pc_gamg;
7425b89ad90SMark F. Adams   PC_MG           *mg;
7435ef31b24SMark F. Adams   PetscClassId     cookie;
7445b89ad90SMark F. Adams 
7455b89ad90SMark F. Adams   PetscFunctionBegin;
7465b89ad90SMark F. Adams   /* PCGAMG is an inherited class of PCMG. Initialize pc as PCMG */
7475b89ad90SMark F. Adams   ierr = PCSetType(pc,PCMG);CHKERRQ(ierr); /* calls PCCreate_MG() and MGCreate_Private() */
7485b89ad90SMark F. Adams   ierr = PetscObjectChangeTypeName((PetscObject)pc,PCGAMG);CHKERRQ(ierr);
7495b89ad90SMark F. Adams 
7505b89ad90SMark F. Adams   /* create a supporting struct and attach it to pc */
7515b89ad90SMark F. Adams   ierr = PetscNewLog(pc,PC_GAMG,&pc_gamg);CHKERRQ(ierr);
7525b89ad90SMark F. Adams   mg = (PC_MG*)pc->data;
7535b89ad90SMark F. Adams   mg->innerctx = pc_gamg;
7545b89ad90SMark F. Adams 
7555b89ad90SMark F. Adams   pc_gamg->m_Nlevels    = -1;
7565b89ad90SMark F. Adams 
7575b89ad90SMark F. Adams   /* overwrite the pointers of PCMG by the functions of PCGAMG */
7585b89ad90SMark F. Adams   pc->ops->setfromoptions = PCSetFromOptions_GAMG;
7595b89ad90SMark F. Adams   pc->ops->setup          = PCSetUp_GAMG;
7605b89ad90SMark F. Adams   pc->ops->reset          = PCReset_GAMG;
7615b89ad90SMark F. Adams   pc->ops->destroy        = PCDestroy_GAMG;
7625b89ad90SMark F. Adams 
7635b89ad90SMark F. Adams   ierr = PetscObjectComposeFunctionDynamic( (PetscObject)pc,
7645b89ad90SMark F. Adams 					    "PCSetCoordinates_C",
7655b89ad90SMark F. Adams 					    "PCSetCoordinates_GAMG",
7665b89ad90SMark F. Adams 					    PCSetCoordinates_GAMG);CHKERRQ(ierr);
767785cba28SMark F. Adams   static int count = 0;
768785cba28SMark F. Adams   if( count++ == 0 ) {
7695ef31b24SMark F. Adams     PetscClassIdRegister("GAMG Setup",&cookie);
770737a81a9SMark F. Adams     PetscLogEventRegister("GAMG: createProl", cookie, &gamg_setup_stages[SET1]);
771737a81a9SMark F. Adams     PetscLogEventRegister(" make graph", cookie, &gamg_setup_stages[SET3]);
772737a81a9SMark F. Adams     PetscLogEventRegister(" MIS/Agg", cookie, &gamg_setup_stages[SET4]);
773737a81a9SMark F. Adams     PetscLogEventRegister("  geo: growSupp", cookie, &gamg_setup_stages[SET5]);
774737a81a9SMark F. Adams     PetscLogEventRegister("  geo: triangle", cookie, &gamg_setup_stages[SET6]);
775737a81a9SMark F. Adams     PetscLogEventRegister("   search & set", cookie, &gamg_setup_stages[FIND_V]);
776737a81a9SMark F. Adams     PetscLogEventRegister("  SA: init", cookie, &gamg_setup_stages[SET7]);
777737a81a9SMark F. Adams     /* PetscLogEventRegister("  SA: frmProl0", cookie, &gamg_setup_stages[SET8]); */
778737a81a9SMark F. Adams     PetscLogEventRegister("  SA: smooth", cookie, &gamg_setup_stages[SET9]);
779737a81a9SMark F. Adams     PetscLogEventRegister("GAMG: partLevel", cookie, &gamg_setup_stages[SET2]);
780737a81a9SMark F. Adams     PetscLogEventRegister(" PL repartition", cookie, &gamg_setup_stages[SET12]);
781737a81a9SMark F. Adams     /* PetscLogEventRegister(" PL move data", cookie, &gamg_setup_stages[SET13]); */
782737a81a9SMark F. Adams     /* PetscLogEventRegister("GAMG: fix", cookie, &gamg_setup_stages[SET10]); */
783737a81a9SMark F. Adams     /* PetscLogEventRegister("GAMG: set levels", cookie, &gamg_setup_stages[SET11]); */
784785cba28SMark F. Adams   }
7855ef31b24SMark F. Adams 
7865b89ad90SMark F. Adams   PetscFunctionReturn(0);
7875b89ad90SMark F. Adams }
7885b89ad90SMark F. Adams EXTERN_C_END
789