xref: /petsc/src/ksp/pc/impls/gamg/agg.c (revision 581a99e3f4ff70cb489fbf1cb9c9b1531374fc72)
12e68589bSMark F. Adams /*
22e68589bSMark F. Adams  GAMG geometric-algebric multiogrid PC - Mark Adams 2011
32e68589bSMark F. Adams  */
42e68589bSMark F. Adams 
52e68589bSMark F. Adams #include <../src/ksp/pc/impls/gamg/gamg.h>        /*I "petscpc.h" I*/
62e68589bSMark F. Adams #include <private/kspimpl.h>
72e68589bSMark F. Adams 
82e68589bSMark F. Adams #include <assert.h>
92e68589bSMark F. Adams #include <petscblaslapack.h>
102e68589bSMark F. Adams 
112e68589bSMark F. Adams typedef struct {
12c8b0795cSMark F. Adams   PetscInt nsmooths;
13c8b0795cSMark F. Adams   Mat aux_mat;
14c8b0795cSMark F. Adams   PetscBool sym_graph;
15ef4ad70eSMark F. Adams   PetscBool square_graph;
162e68589bSMark F. Adams }PC_GAMG_AGG;
172e68589bSMark F. Adams 
182e68589bSMark F. Adams #undef __FUNCT__
192e68589bSMark F. Adams #define __FUNCT__ "PCGAMGSetNSmooths"
202e68589bSMark F. Adams /*@
212e68589bSMark F. Adams    PCGAMGSetNSmooths - Set number of smoothing steps (1 is typical)
222e68589bSMark F. Adams 
232e68589bSMark F. Adams    Not Collective on PC
242e68589bSMark F. Adams 
252e68589bSMark F. Adams    Input Parameters:
262e68589bSMark F. Adams .  pc - the preconditioner context
272e68589bSMark F. Adams 
282e68589bSMark F. Adams    Options Database Key:
292e68589bSMark F. Adams .  -pc_gamg_agg_nsmooths
302e68589bSMark F. Adams 
312e68589bSMark F. Adams    Level: intermediate
322e68589bSMark F. Adams 
332e68589bSMark F. Adams    Concepts: Aggregation AMG preconditioner
342e68589bSMark F. Adams 
352e68589bSMark F. Adams .seealso: ()
362e68589bSMark F. Adams @*/
372e68589bSMark F. Adams PetscErrorCode PCGAMGSetNSmooths(PC pc, PetscInt n)
382e68589bSMark F. Adams {
392e68589bSMark F. Adams   PetscErrorCode ierr;
402e68589bSMark F. Adams 
412e68589bSMark F. Adams   PetscFunctionBegin;
422e68589bSMark F. Adams   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
432e68589bSMark F. Adams   ierr = PetscTryMethod(pc,"PCGAMGSetNSmooths_C",(PC,PetscInt),(pc,n));CHKERRQ(ierr);
442e68589bSMark F. Adams   PetscFunctionReturn(0);
452e68589bSMark F. Adams }
462e68589bSMark F. Adams 
472e68589bSMark F. Adams EXTERN_C_BEGIN
482e68589bSMark F. Adams #undef __FUNCT__
492e68589bSMark F. Adams #define __FUNCT__ "PCGAMGSetNSmooths_GAMG"
502e68589bSMark F. Adams PetscErrorCode PCGAMGSetNSmooths_GAMG(PC pc, PetscInt n)
512e68589bSMark F. Adams {
522e68589bSMark F. Adams   PC_MG           *mg = (PC_MG*)pc->data;
532e68589bSMark F. Adams   PC_GAMG         *pc_gamg = (PC_GAMG*)mg->innerctx;
54c8b0795cSMark F. Adams   PC_GAMG_AGG      *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx;
552e68589bSMark F. Adams 
562e68589bSMark F. Adams   PetscFunctionBegin;
57c8b0795cSMark F. Adams   pc_gamg_agg->nsmooths = n;
58c8b0795cSMark F. Adams   PetscFunctionReturn(0);
59c8b0795cSMark F. Adams }
60c8b0795cSMark F. Adams EXTERN_C_END
61c8b0795cSMark F. Adams 
62c8b0795cSMark F. Adams #undef __FUNCT__
63c8b0795cSMark F. Adams #define __FUNCT__ "PCGAMGSetSymGraph"
64c8b0795cSMark F. Adams /*@
65c8b0795cSMark F. Adams    PCGAMGSetSymGraph -
66c8b0795cSMark F. Adams 
67c8b0795cSMark F. Adams    Not Collective on PC
68c8b0795cSMark F. Adams 
69c8b0795cSMark F. Adams    Input Parameters:
70c8b0795cSMark F. Adams .  pc - the preconditioner context
71c8b0795cSMark F. Adams 
72c8b0795cSMark F. Adams    Options Database Key:
73c8b0795cSMark F. Adams .  -pc_gamg_sym_graph
74c8b0795cSMark F. Adams 
75c8b0795cSMark F. Adams    Level: intermediate
76c8b0795cSMark F. Adams 
77c8b0795cSMark F. Adams    Concepts: Aggregation AMG preconditioner
78c8b0795cSMark F. Adams 
79c8b0795cSMark F. Adams .seealso: ()
80c8b0795cSMark F. Adams @*/
81c8b0795cSMark F. Adams PetscErrorCode PCGAMGSetSymGraph(PC pc, PetscBool n)
82c8b0795cSMark F. Adams {
83c8b0795cSMark F. Adams   PetscErrorCode ierr;
84c8b0795cSMark F. Adams 
85c8b0795cSMark F. Adams   PetscFunctionBegin;
86c8b0795cSMark F. Adams   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
87c8b0795cSMark F. Adams   ierr = PetscTryMethod(pc,"PCGAMGSetSymGraph_C",(PC,PetscBool),(pc,n));CHKERRQ(ierr);
88c8b0795cSMark F. Adams   PetscFunctionReturn(0);
89c8b0795cSMark F. Adams }
90c8b0795cSMark F. Adams 
91c8b0795cSMark F. Adams EXTERN_C_BEGIN
92c8b0795cSMark F. Adams #undef __FUNCT__
93c8b0795cSMark F. Adams #define __FUNCT__ "PCGAMGSetSymGraph_GAMG"
94c8b0795cSMark F. Adams PetscErrorCode PCGAMGSetSymGraph_GAMG(PC pc, PetscBool n)
95c8b0795cSMark F. Adams {
96c8b0795cSMark F. Adams   PC_MG           *mg = (PC_MG*)pc->data;
97c8b0795cSMark F. Adams   PC_GAMG         *pc_gamg = (PC_GAMG*)mg->innerctx;
98c8b0795cSMark F. Adams   PC_GAMG_AGG      *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx;
99c8b0795cSMark F. Adams 
100c8b0795cSMark F. Adams   PetscFunctionBegin;
101c8b0795cSMark F. Adams   pc_gamg_agg->sym_graph = n;
1022e68589bSMark F. Adams   PetscFunctionReturn(0);
1032e68589bSMark F. Adams }
1042e68589bSMark F. Adams EXTERN_C_END
1052e68589bSMark F. Adams 
106ef4ad70eSMark F. Adams #undef __FUNCT__
107ef4ad70eSMark F. Adams #define __FUNCT__ "PCGAMGSetSquareGraph"
108ef4ad70eSMark F. Adams /*@
109ef4ad70eSMark F. Adams    PCGAMGSetSquareGraph -
110ef4ad70eSMark F. Adams 
111ef4ad70eSMark F. Adams    Not Collective on PC
112ef4ad70eSMark F. Adams 
113ef4ad70eSMark F. Adams    Input Parameters:
114ef4ad70eSMark F. Adams .  pc - the preconditioner context
115ef4ad70eSMark F. Adams 
116ef4ad70eSMark F. Adams    Options Database Key:
117ef4ad70eSMark F. Adams .  -pc_gamg_square_graph
118ef4ad70eSMark F. Adams 
119ef4ad70eSMark F. Adams    Level: intermediate
120ef4ad70eSMark F. Adams 
121ef4ad70eSMark F. Adams    Concepts: Aggregation AMG preconditioner
122ef4ad70eSMark F. Adams 
123ef4ad70eSMark F. Adams .seealso: ()
124ef4ad70eSMark F. Adams @*/
125ef4ad70eSMark F. Adams PetscErrorCode PCGAMGSetSquareGraph(PC pc, PetscBool n)
126ef4ad70eSMark F. Adams {
127ef4ad70eSMark F. Adams   PetscErrorCode ierr;
128ef4ad70eSMark F. Adams 
129ef4ad70eSMark F. Adams   PetscFunctionBegin;
130ef4ad70eSMark F. Adams   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
131ef4ad70eSMark F. Adams   ierr = PetscTryMethod(pc,"PCGAMGSetSquareGraph_C",(PC,PetscBool),(pc,n));CHKERRQ(ierr);
132ef4ad70eSMark F. Adams   PetscFunctionReturn(0);
133ef4ad70eSMark F. Adams }
134ef4ad70eSMark F. Adams 
135ef4ad70eSMark F. Adams EXTERN_C_BEGIN
136ef4ad70eSMark F. Adams #undef __FUNCT__
137ef4ad70eSMark F. Adams #define __FUNCT__ "PCGAMGSetSquareGraph_GAMG"
138ef4ad70eSMark F. Adams PetscErrorCode PCGAMGSetSquareGraph_GAMG(PC pc, PetscBool n)
139ef4ad70eSMark F. Adams {
140ef4ad70eSMark F. Adams   PC_MG           *mg = (PC_MG*)pc->data;
141ef4ad70eSMark F. Adams   PC_GAMG         *pc_gamg = (PC_GAMG*)mg->innerctx;
142ef4ad70eSMark F. Adams   PC_GAMG_AGG      *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx;
143ef4ad70eSMark F. Adams 
144ef4ad70eSMark F. Adams   PetscFunctionBegin;
145ef4ad70eSMark F. Adams   pc_gamg_agg->square_graph = n;
146ef4ad70eSMark F. Adams   PetscFunctionReturn(0);
147ef4ad70eSMark F. Adams }
148ef4ad70eSMark F. Adams EXTERN_C_END
149ef4ad70eSMark F. Adams 
1502e68589bSMark F. Adams /* -------------------------------------------------------------------------- */
1512e68589bSMark F. Adams /*
1522e68589bSMark F. Adams    PCSetFromOptions_GAMG_AGG
1532e68589bSMark F. Adams 
1542e68589bSMark F. Adams   Input Parameter:
1552e68589bSMark F. Adams    . pc -
1562e68589bSMark F. Adams */
1572e68589bSMark F. Adams #undef __FUNCT__
1582e68589bSMark F. Adams #define __FUNCT__ "PCSetFromOptions_GAMG_AGG"
1592e68589bSMark F. Adams PetscErrorCode PCSetFromOptions_GAMG_AGG( PC pc )
1602e68589bSMark F. Adams {
1612e68589bSMark F. Adams   PetscErrorCode  ierr;
1622e68589bSMark F. Adams   PC_MG           *mg = (PC_MG*)pc->data;
1632e68589bSMark F. Adams   PC_GAMG         *pc_gamg = (PC_GAMG*)mg->innerctx;
164c8b0795cSMark F. Adams   PC_GAMG_AGG      *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx;
1652e68589bSMark F. Adams   PetscBool        flag;
1662e68589bSMark F. Adams 
1672e68589bSMark F. Adams   PetscFunctionBegin;
1682e68589bSMark F. Adams   /* call base class */
1692e68589bSMark F. Adams   ierr = PCSetFromOptions_GAMG( pc ); CHKERRQ(ierr);
1702e68589bSMark F. Adams 
1712e68589bSMark F. Adams   ierr = PetscOptionsHead("GAMG-AGG options"); CHKERRQ(ierr);
1722e68589bSMark F. Adams   {
1732e68589bSMark F. Adams     /* -pc_gamg_agg_nsmooths */
174c8b0795cSMark F. Adams     pc_gamg_agg->nsmooths = 0;
1752e68589bSMark F. Adams     ierr = PetscOptionsInt("-pc_gamg_agg_nsmooths",
1762e68589bSMark F. Adams                            "smoothing steps for smoothed aggregation, usually 1 (0)",
1772e68589bSMark F. Adams                            "PCGAMGSetNSmooths",
178c8b0795cSMark F. Adams                            pc_gamg_agg->nsmooths,
179c8b0795cSMark F. Adams                            &pc_gamg_agg->nsmooths,
180c8b0795cSMark F. Adams                            &flag);
181c8b0795cSMark F. Adams     CHKERRQ(ierr);
182c8b0795cSMark F. Adams 
183c8b0795cSMark F. Adams     /* -pc_gamg_sym_graph */
184c8b0795cSMark F. Adams     pc_gamg_agg->sym_graph = PETSC_FALSE;
185c8b0795cSMark F. Adams     ierr = PetscOptionsBool("-pc_gamg_sym_graph",
186*581a99e3SJed Brown                             "Set for asymmetric matrices",
187c8b0795cSMark F. Adams                             "PCGAMGSetSymGraph",
188c8b0795cSMark F. Adams                             pc_gamg_agg->sym_graph,
189c8b0795cSMark F. Adams                             &pc_gamg_agg->sym_graph,
1902e68589bSMark F. Adams                             &flag);
1912e68589bSMark F. Adams     CHKERRQ(ierr);
192ef4ad70eSMark F. Adams 
193ef4ad70eSMark F. Adams     /* -pc_gamg_square_graph */
194ef4ad70eSMark F. Adams     pc_gamg_agg->square_graph = PETSC_TRUE;
195ef4ad70eSMark F. Adams     ierr = PetscOptionsBool("-pc_gamg_square_graph",
196*581a99e3SJed Brown                             "Set for asymmetric matrices",
197ef4ad70eSMark F. Adams                             "PCGAMGSetSquareGraph",
198ef4ad70eSMark F. Adams                             pc_gamg_agg->square_graph,
199ef4ad70eSMark F. Adams                             &pc_gamg_agg->square_graph,
200ef4ad70eSMark F. Adams                             &flag);
201ef4ad70eSMark F. Adams     CHKERRQ(ierr);
2022e68589bSMark F. Adams   }
2032e68589bSMark F. Adams   ierr = PetscOptionsTail();CHKERRQ(ierr);
2042e68589bSMark F. Adams 
2052e68589bSMark F. Adams   PetscFunctionReturn(0);
2062e68589bSMark F. Adams }
2072e68589bSMark F. Adams 
2082e68589bSMark F. Adams /* -------------------------------------------------------------------------- */
2092e68589bSMark F. Adams /*
2102e68589bSMark F. Adams    PCDestroy_AGG
2112e68589bSMark F. Adams 
2122e68589bSMark F. Adams   Input Parameter:
2132e68589bSMark F. Adams    . pc -
2142e68589bSMark F. Adams */
2152e68589bSMark F. Adams #undef __FUNCT__
2162e68589bSMark F. Adams #define __FUNCT__ "PCDestroy_AGG"
2172e68589bSMark F. Adams PetscErrorCode PCDestroy_AGG( PC pc )
2182e68589bSMark F. Adams {
2192e68589bSMark F. Adams   PetscErrorCode  ierr;
2202e68589bSMark F. Adams   PC_MG           *mg = (PC_MG*)pc->data;
2212e68589bSMark F. Adams   PC_GAMG         *pc_gamg = (PC_GAMG*)mg->innerctx;
222c8b0795cSMark F. Adams   PC_GAMG_AGG      *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx;
2232e68589bSMark F. Adams 
2242e68589bSMark F. Adams   PetscFunctionBegin;
225c8b0795cSMark F. Adams   if( pc_gamg_agg ) {
226c8b0795cSMark F. Adams     ierr = PetscFree(pc_gamg_agg);CHKERRQ(ierr);
227c8b0795cSMark F. Adams     pc_gamg_agg = 0;
2282e68589bSMark F. Adams   }
2292e68589bSMark F. Adams 
2302e68589bSMark F. Adams   /* call base class */
2312e68589bSMark F. Adams   ierr = PCDestroy_GAMG( pc );CHKERRQ(ierr);
2322e68589bSMark F. Adams 
2332e68589bSMark F. Adams   PetscFunctionReturn(0);
2342e68589bSMark F. Adams }
2352e68589bSMark F. Adams 
2362e68589bSMark F. Adams /* -------------------------------------------------------------------------- */
2372e68589bSMark F. Adams /*
2382e68589bSMark F. Adams    PCSetCoordinates_AGG
2392e68589bSMark F. Adams 
2402e68589bSMark F. Adams    Input Parameter:
2412e68589bSMark F. Adams    .  pc - the preconditioner context
2422e68589bSMark F. Adams */
2432e68589bSMark F. Adams EXTERN_C_BEGIN
2442e68589bSMark F. Adams #undef __FUNCT__
2452e68589bSMark F. Adams #define __FUNCT__ "PCSetCoordinates_AGG"
2462e68589bSMark F. Adams PetscErrorCode PCSetCoordinates_AGG( PC pc, PetscInt ndm, PetscReal *coords )
2472e68589bSMark F. Adams {
2482e68589bSMark F. Adams   PC_MG          *mg = (PC_MG*)pc->data;
2492e68589bSMark F. Adams   PC_GAMG        *pc_gamg = (PC_GAMG*)mg->innerctx;
2502e68589bSMark F. Adams   PetscErrorCode ierr;
2512e68589bSMark F. Adams   PetscInt       arrsz,bs,my0,kk,ii,jj,nloc,Iend;
2522e68589bSMark F. Adams   Mat            Amat = pc->pmat;
2532e68589bSMark F. Adams 
2542e68589bSMark F. Adams   PetscFunctionBegin;
2552e68589bSMark F. Adams   PetscValidHeaderSpecific( Amat, MAT_CLASSID, 1 );
2562e68589bSMark F. Adams   ierr  = MatGetBlockSize( Amat, &bs );               CHKERRQ( ierr );
2572e68589bSMark F. Adams   ierr  = MatGetOwnershipRange( Amat, &my0, &Iend ); CHKERRQ(ierr);
2582e68589bSMark F. Adams   nloc = (Iend-my0)/bs;
2592e68589bSMark F. Adams   if((Iend-my0)%bs!=0) SETERRQ1(((PetscObject)Amat)->comm,PETSC_ERR_ARG_WRONG, "Bad local size %d.",nloc);
2602e68589bSMark F. Adams 
2612e68589bSMark F. Adams   /* SA: null space vectors */
262c8b0795cSMark F. Adams   if( coords && bs==1 ) pc_gamg->data_cell_cols = 1; /* scalar w/ coords and SA (not needed) */
263c8b0795cSMark F. Adams   else if( coords ) pc_gamg->data_cell_cols = (ndm==2 ? 3 : 6); /* elasticity */
264c8b0795cSMark F. Adams   else pc_gamg->data_cell_cols = bs; /* no data, force SA with constant null space vectors */
265c8b0795cSMark F. Adams   pc_gamg->data_cell_rows = bs;
2662e68589bSMark F. Adams 
267c8b0795cSMark F. Adams   arrsz = nloc*pc_gamg->data_cell_rows*pc_gamg->data_cell_cols;
2682e68589bSMark F. Adams 
2692e68589bSMark F. Adams   /* create data - syntactic sugar that should be refactored at some point */
2702e68589bSMark F. Adams   if (pc_gamg->data==0 || (pc_gamg->data_sz != arrsz)) {
2712e68589bSMark F. Adams     ierr = PetscFree( pc_gamg->data );  CHKERRQ(ierr);
272c8b0795cSMark F. Adams     ierr = PetscMalloc(arrsz*sizeof(PetscReal), &pc_gamg->data ); CHKERRQ(ierr);
2732e68589bSMark F. Adams   }
2742e68589bSMark F. Adams   /* copy data in - column oriented */
2752e68589bSMark F. Adams   for(kk=0;kk<nloc;kk++){
2762e68589bSMark F. Adams     const PetscInt M = Iend - my0;
2772e68589bSMark F. Adams     PetscReal *data = &pc_gamg->data[kk*bs];
278c8b0795cSMark F. Adams     if( pc_gamg->data_cell_cols==1 ) *data = 1.0;
2792e68589bSMark F. Adams     else {
2802e68589bSMark F. Adams       for(ii=0;ii<bs;ii++)
2812e68589bSMark F. Adams         for(jj=0;jj<bs;jj++)
2822e68589bSMark F. Adams           if(ii==jj)data[ii*M + jj] = 1.0; /* translational modes */
2832e68589bSMark F. Adams           else data[ii*M + jj] = 0.0;
2842e68589bSMark F. Adams       if( coords ) {
2852e68589bSMark F. Adams         if( ndm == 2 ){ /* rotational modes */
2862e68589bSMark F. Adams           data += 2*M;
2872e68589bSMark F. Adams           data[0] = -coords[2*kk+1];
2882e68589bSMark F. Adams           data[1] =  coords[2*kk];
2892e68589bSMark F. Adams         }
2902e68589bSMark F. Adams         else {
2912e68589bSMark F. Adams           data += 3*M;
2922e68589bSMark F. Adams           data[0] = 0.0;               data[M+0] =  coords[3*kk+2]; data[2*M+0] = -coords[3*kk+1];
2932e68589bSMark F. Adams           data[1] = -coords[3*kk+2]; data[M+1] = 0.0;               data[2*M+1] =  coords[3*kk];
2942e68589bSMark F. Adams           data[2] =  coords[3*kk+1]; data[M+2] = -coords[3*kk];   data[2*M+2] = 0.0;
2952e68589bSMark F. Adams         }
2962e68589bSMark F. Adams       }
2972e68589bSMark F. Adams     }
2982e68589bSMark F. Adams   }
2992e68589bSMark F. Adams 
3002e68589bSMark F. Adams   pc_gamg->data_sz = arrsz;
3012e68589bSMark F. Adams 
3022e68589bSMark F. Adams   PetscFunctionReturn(0);
3032e68589bSMark F. Adams }
3042e68589bSMark F. Adams EXTERN_C_END
3052e68589bSMark F. Adams 
306b43b03e9SMark F. Adams typedef PetscInt NState;
307b43b03e9SMark F. Adams static const NState NOT_DONE=-2;
308b43b03e9SMark F. Adams static const NState DELETED=-1;
309b43b03e9SMark F. Adams static const NState REMOVED=-3;
310b43b03e9SMark F. Adams #define IS_SELECTED(s) (s!=DELETED && s!=NOT_DONE && s!=REMOVED)
311b43b03e9SMark F. Adams 
312c8b0795cSMark F. Adams /* -------------------------------------------------------------------------- */
313c8b0795cSMark F. Adams /*
314b43b03e9SMark F. Adams    smoothAggs - greedy grab of with G1 (unsquared graph) -- AIJ specific
315b43b03e9SMark F. Adams      - AGG-MG specific: clears singletons out of 'selected_2'
316c8b0795cSMark F. Adams 
317c8b0795cSMark F. Adams    Input Parameter:
318c8b0795cSMark F. Adams    . Gmat_2 - glabal matrix of graph (data not defined)
319c8b0795cSMark F. Adams    . Gmat_1 - base graph to grab with
320c8b0795cSMark F. Adams    . selected_2 -
321c8b0795cSMark F. Adams    Input/Output Parameter:
322c8b0795cSMark F. Adams    . llist_aggs_2 - linked list of aggs, ghost lids are based on Gmat_2 (squared graph)
323c8b0795cSMark F. Adams */
324c8b0795cSMark F. Adams #undef __FUNCT__
325c8b0795cSMark F. Adams #define __FUNCT__ "smoothAggs"
326c8b0795cSMark F. Adams PetscErrorCode smoothAggs( const Mat Gmat_2, /* base (squared) graph */
327c8b0795cSMark F. Adams                            const Mat Gmat_1, /* base graph, could be unsymmetic */
328c8b0795cSMark F. Adams                            const IS selected_2, /* [nselected total] selected vertices */
329c8b0795cSMark F. Adams                            IS llist_aggs_2 /* [nloc_nghost] global ID of aggregate */
330c8b0795cSMark F. Adams                            )
331c8b0795cSMark F. Adams {
332c8b0795cSMark F. Adams   PetscErrorCode ierr;
333c8b0795cSMark F. Adams   PetscBool      isMPI;
334c8b0795cSMark F. Adams   Mat_SeqAIJ    *matA_1, *matB_1=0, *matA_2, *matB_2=0;
335c8b0795cSMark F. Adams   MPI_Comm       wcomm = ((PetscObject)Gmat_2)->comm;
336c8b0795cSMark F. Adams   PetscMPIInt    mype;
337b43b03e9SMark F. Adams   PetscInt       lid,*ii,*idx,ix,Iend,my0,nnodes_2,kk,n,j;
338c8b0795cSMark F. Adams   Mat_MPIAIJ    *mpimat_2 = 0, *mpimat_1=0;
339c8b0795cSMark F. Adams   const PetscInt nloc = Gmat_2->rmap->n;
340c8b0795cSMark F. Adams   PetscScalar   *cpcol_1_state,*cpcol_2_state,*deleted_parent_gid;
341c8b0795cSMark F. Adams   PetscInt      *lid_cprowID_1,*id_llist_2,*lid_cprowID_2;
342c8b0795cSMark F. Adams   NState        *lid_state;
343c8b0795cSMark F. Adams 
344c8b0795cSMark F. Adams   PetscFunctionBegin;
345c8b0795cSMark F. Adams   ierr = MPI_Comm_rank( wcomm, &mype );   CHKERRQ(ierr);
346c8b0795cSMark F. Adams   ierr = MatGetOwnershipRange(Gmat_1,&my0,&Iend);  CHKERRQ(ierr);
347c8b0795cSMark F. Adams 
348c8b0795cSMark F. Adams   if( !PETSC_TRUE ) {
349c8b0795cSMark F. Adams     PetscViewer viewer; char fname[32]; static int llev=0;
350c8b0795cSMark F. Adams     sprintf(fname,"Gmat2_%d.m",llev++);
351c8b0795cSMark F. Adams     PetscViewerASCIIOpen(wcomm,fname,&viewer);
352c8b0795cSMark F. Adams     ierr = PetscViewerSetFormat( viewer, PETSC_VIEWER_ASCII_MATLAB);  CHKERRQ(ierr);
353c8b0795cSMark F. Adams     ierr = MatView(Gmat_2, viewer ); CHKERRQ(ierr);
354c8b0795cSMark F. Adams     ierr = PetscViewerDestroy( &viewer );
355c8b0795cSMark F. Adams   }
356c8b0795cSMark F. Adams 
357c8b0795cSMark F. Adams   { /* copy linked list into temp buffer - should not work directly on pointer */
358c8b0795cSMark F. Adams     const PetscInt *llist_idx;
359c8b0795cSMark F. Adams     ierr = ISGetSize( llist_aggs_2, &nnodes_2 );        CHKERRQ(ierr);
360c8b0795cSMark F. Adams     ierr = PetscMalloc( nnodes_2*sizeof(PetscInt), &id_llist_2 ); CHKERRQ(ierr);
361c8b0795cSMark F. Adams     ierr = ISGetIndices( llist_aggs_2, &llist_idx );       CHKERRQ(ierr);
362c8b0795cSMark F. Adams     for(lid=0;lid<nnodes_2;lid++) id_llist_2[lid] = llist_idx[lid];
363c8b0795cSMark F. Adams     ierr = ISRestoreIndices( llist_aggs_2, &llist_idx );     CHKERRQ(ierr);
364c8b0795cSMark F. Adams   }
365c8b0795cSMark F. Adams 
366c8b0795cSMark F. Adams   /* get submatrices */
367c8b0795cSMark F. Adams   ierr = PetscTypeCompare( (PetscObject)Gmat_1, MATMPIAIJ, &isMPI ); CHKERRQ(ierr);
368c8b0795cSMark F. Adams   if(isMPI) {
369c8b0795cSMark F. Adams     /* grab matrix objects */
370c8b0795cSMark F. Adams     mpimat_2 = (Mat_MPIAIJ*)Gmat_2->data;
371c8b0795cSMark F. Adams     mpimat_1 = (Mat_MPIAIJ*)Gmat_1->data;
372c8b0795cSMark F. Adams     matA_1 = (Mat_SeqAIJ*)mpimat_1->A->data;
373c8b0795cSMark F. Adams     matB_1 = (Mat_SeqAIJ*)mpimat_1->B->data;
374c8b0795cSMark F. Adams     matA_2 = (Mat_SeqAIJ*)mpimat_2->A->data;
375c8b0795cSMark F. Adams     matB_2 = (Mat_SeqAIJ*)mpimat_2->B->data;
376c8b0795cSMark F. Adams 
377c8b0795cSMark F. Adams     /* force compressed row storage for B matrix in AuxMat */
378c8b0795cSMark F. Adams     matB_1->compressedrow.check = PETSC_TRUE;
379c8b0795cSMark F. Adams     ierr = MatCheckCompressedRow(mpimat_1->B,&matB_1->compressedrow,matB_1->i,Gmat_1->rmap->n,-1.0);
380c8b0795cSMark F. Adams     CHKERRQ(ierr);
381c8b0795cSMark F. Adams 
382c8b0795cSMark F. Adams     ierr = PetscMalloc( nloc*sizeof(PetscInt), &lid_cprowID_2 ); CHKERRQ(ierr);
383c8b0795cSMark F. Adams     ierr = PetscMalloc( nloc*sizeof(PetscInt), &lid_cprowID_1 ); CHKERRQ(ierr);
384c8b0795cSMark F. Adams     for(lid=0;lid<nloc;lid++) lid_cprowID_1[lid] = lid_cprowID_2[lid] = -1;
385c8b0795cSMark F. Adams     for (ix=0; ix<matB_1->compressedrow.nrows; ix++) {
386c8b0795cSMark F. Adams       PetscInt lid = matB_1->compressedrow.rindex[ix];
387c8b0795cSMark F. Adams       lid_cprowID_1[lid] = ix;
388c8b0795cSMark F. Adams     }
389c8b0795cSMark F. Adams     for (ix=0; ix<matB_2->compressedrow.nrows; ix++) {
390c8b0795cSMark F. Adams       PetscInt lid = matB_2->compressedrow.rindex[ix];
391c8b0795cSMark F. Adams       lid_cprowID_2[lid] = ix;
392c8b0795cSMark F. Adams     }
393c8b0795cSMark F. Adams   }
394c8b0795cSMark F. Adams   else {
395c8b0795cSMark F. Adams     matA_1 = (Mat_SeqAIJ*)Gmat_1->data;
396c8b0795cSMark F. Adams     matA_2 = (Mat_SeqAIJ*)Gmat_2->data;
397c8b0795cSMark F. Adams     lid_cprowID_2 = lid_cprowID_1 = 0;
398c8b0795cSMark F. Adams   }
399c8b0795cSMark F. Adams   assert( matA_1 && !matA_1->compressedrow.use );
400c8b0795cSMark F. Adams   assert( matB_1==0 || matB_1->compressedrow.use );
401c8b0795cSMark F. Adams   assert( matA_2 && !matA_2->compressedrow.use );
402c8b0795cSMark F. Adams   assert( matB_2==0 || matB_2->compressedrow.use );
403c8b0795cSMark F. Adams 
404c8b0795cSMark F. Adams   /* get state of locals and selected gid for deleted */
405c8b0795cSMark F. Adams   ierr = PetscMalloc( nloc*sizeof(NState), &lid_state ); CHKERRQ(ierr);
406c8b0795cSMark F. Adams   ierr = PetscMalloc( nloc*sizeof(PetscScalar), &deleted_parent_gid ); CHKERRQ(ierr);
407c8b0795cSMark F. Adams   for( lid = 0 ; lid < nloc ; lid++ ) {
408c8b0795cSMark F. Adams     deleted_parent_gid[lid] = -1.0;
409c8b0795cSMark F. Adams     lid_state[lid] = DELETED;
410c8b0795cSMark F. Adams   }
411c8b0795cSMark F. Adams   /* set index into compressed row 'lid_cprowID', not -1 means its a boundary node */
412c8b0795cSMark F. Adams   {
413b43b03e9SMark F. Adams     PetscInt nSelected;
414c8b0795cSMark F. Adams     const PetscInt *selected_idx;
415c8b0795cSMark F. Adams     /* set local selected */
416c8b0795cSMark F. Adams     ierr = ISGetSize( selected_2, &nSelected );        CHKERRQ(ierr);
417c8b0795cSMark F. Adams     ierr = ISGetIndices( selected_2, &selected_idx );       CHKERRQ(ierr);
418c8b0795cSMark F. Adams     for(kk=0;kk<nSelected;kk++){
419c8b0795cSMark F. Adams       PetscInt lid = selected_idx[kk];
420c8b0795cSMark F. Adams       if(lid<nloc) lid_state[lid] = (NState)(lid+my0); /* selected flag */
421c8b0795cSMark F. Adams       else break;
422b43b03e9SMark F. Adams       /* remove singletons */
423b43b03e9SMark F. Adams       ii = matA_2->i; n = ii[lid+1] - ii[lid];
424b43b03e9SMark F. Adams       if( n < 2 ) {
425b43b03e9SMark F. Adams         if(!lid_cprowID_2 || (ix=lid_cprowID_2[lid])==-1 || (matB_2->compressedrow.i[ix+1]-matB_2->compressedrow.i[ix])==0){
426b43b03e9SMark F. Adams           lid_state[lid] = REMOVED;
427b43b03e9SMark F. Adams         }
428b43b03e9SMark F. Adams       }
429c8b0795cSMark F. Adams     }
430c8b0795cSMark F. Adams     ierr = ISRestoreIndices( selected_2, &selected_idx );     CHKERRQ(ierr);
431c8b0795cSMark F. Adams   }
432c8b0795cSMark F. Adams   /* map local to selected local, -1 means a ghost owns it */
433c8b0795cSMark F. Adams   for(lid=kk=0;lid<nloc;lid++){
434c8b0795cSMark F. Adams     NState state = lid_state[lid];
435c8b0795cSMark F. Adams     if( IS_SELECTED(state) ){
436c8b0795cSMark F. Adams       PetscInt flid = lid;
437c8b0795cSMark F. Adams       do{
438c8b0795cSMark F. Adams         if(flid<nloc){
439c8b0795cSMark F. Adams           deleted_parent_gid[flid] = (PetscScalar)(lid + my0);
440c8b0795cSMark F. Adams         }
441c8b0795cSMark F. Adams         kk++;
442c8b0795cSMark F. Adams       } while( (flid=id_llist_2[flid]) != -1 );
443c8b0795cSMark F. Adams     }
444c8b0795cSMark F. Adams   }
445c8b0795cSMark F. Adams   /* get 'cpcol_1_state', 'cpcol_2_state' - uses mpimat_1->lvec & mpimat_2->lvec for temp space */
446c8b0795cSMark F. Adams   if (isMPI) {
447c8b0795cSMark F. Adams     Vec          tempVec;
448c8b0795cSMark F. Adams 
449c8b0795cSMark F. Adams     /* get 'cpcol_1_state' */
450c8b0795cSMark F. Adams     ierr = MatGetVecs( Gmat_1, &tempVec, 0 );         CHKERRQ(ierr);
451c8b0795cSMark F. Adams     for(kk=0,j=my0;kk<nloc;kk++,j++){
452c8b0795cSMark F. Adams       PetscScalar v = (PetscScalar)lid_state[kk];
453c8b0795cSMark F. Adams       ierr = VecSetValues( tempVec, 1, &j, &v, INSERT_VALUES );  CHKERRQ(ierr);
454c8b0795cSMark F. Adams     }
455c8b0795cSMark F. Adams     ierr = VecAssemblyBegin( tempVec ); CHKERRQ(ierr);
456c8b0795cSMark F. Adams     ierr = VecAssemblyEnd( tempVec ); CHKERRQ(ierr);
457c8b0795cSMark F. Adams     ierr = VecScatterBegin(mpimat_1->Mvctx,tempVec, mpimat_1->lvec,INSERT_VALUES,SCATTER_FORWARD);
458c8b0795cSMark F. Adams     CHKERRQ(ierr);
459c8b0795cSMark F. Adams     ierr =   VecScatterEnd(mpimat_1->Mvctx,tempVec, mpimat_1->lvec,INSERT_VALUES,SCATTER_FORWARD);
460c8b0795cSMark F. Adams     CHKERRQ(ierr);
461c8b0795cSMark F. Adams     ierr = VecGetArray( mpimat_1->lvec, &cpcol_1_state ); CHKERRQ(ierr);
462c8b0795cSMark F. Adams     ierr = VecDestroy( &tempVec ); CHKERRQ(ierr);
463c8b0795cSMark F. Adams 
464c8b0795cSMark F. Adams     /* get 'cpcol_2_state' */
465c8b0795cSMark F. Adams     ierr = MatGetVecs( Gmat_2, &tempVec, 0 );         CHKERRQ(ierr);
466c8b0795cSMark F. Adams     for(kk=0,j=my0;kk<nloc;kk++,j++){
467c8b0795cSMark F. Adams       PetscScalar v = (PetscScalar)lid_state[kk];
468c8b0795cSMark F. Adams       ierr = VecSetValues( tempVec, 1, &j, &v, INSERT_VALUES );  CHKERRQ(ierr);
469c8b0795cSMark F. Adams     }
470c8b0795cSMark F. Adams     ierr = VecAssemblyBegin( tempVec ); CHKERRQ(ierr);
471c8b0795cSMark F. Adams     ierr = VecAssemblyEnd( tempVec ); CHKERRQ(ierr);
472c8b0795cSMark F. Adams     ierr = VecScatterBegin(mpimat_2->Mvctx,tempVec, mpimat_2->lvec,INSERT_VALUES,SCATTER_FORWARD);
473c8b0795cSMark F. Adams     CHKERRQ(ierr);
474c8b0795cSMark F. Adams     ierr =   VecScatterEnd(mpimat_2->Mvctx,tempVec, mpimat_2->lvec,INSERT_VALUES,SCATTER_FORWARD);
475c8b0795cSMark F. Adams     CHKERRQ(ierr);
476c8b0795cSMark F. Adams     ierr = VecGetArray( mpimat_2->lvec, &cpcol_2_state ); CHKERRQ(ierr);
477c8b0795cSMark F. Adams     ierr = VecDestroy( &tempVec ); CHKERRQ(ierr);
478c8b0795cSMark F. Adams   } /* ismpi */
479c8b0795cSMark F. Adams 
480c8b0795cSMark F. Adams   /* doit */
481c8b0795cSMark F. Adams   for(lid=0;lid<nloc;lid++){
482c8b0795cSMark F. Adams     NState state = lid_state[lid];
483c8b0795cSMark F. Adams     if( IS_SELECTED(state) ) {      /* steal locals */
484c8b0795cSMark F. Adams       ii = matA_1->i; n = ii[lid+1] - ii[lid];
485c8b0795cSMark F. Adams       idx = matA_1->j + ii[lid];
486c8b0795cSMark F. Adams       for (j=0; j<n; j++) {
487c8b0795cSMark F. Adams         PetscInt flid, lidj = idx[j], sgid;
488c8b0795cSMark F. Adams         NState statej = lid_state[lidj];
48974778d6cSJed Brown         if (statej==DELETED && (sgid=(PetscInt)PetscRealPart(deleted_parent_gid[lidj])) != lid+my0) { /* steal local */
490c8b0795cSMark F. Adams           deleted_parent_gid[lidj] = (PetscScalar)(lid+my0); /* send this with _2 */
491c8b0795cSMark F. Adams           if( sgid >= my0 && sgid < my0+nloc ){       /* I'm stealing this local from a local */
492c8b0795cSMark F. Adams             PetscInt hav=0, flid2=sgid-my0, lastid;
493c8b0795cSMark F. Adams             /* looking for local from local so id_llist_2 works */
494c8b0795cSMark F. Adams             for( lastid=flid2, flid=id_llist_2[flid2] ; flid!=-1 ; flid=id_llist_2[flid] ) {
495c8b0795cSMark F. Adams               if( flid == lidj ) {
496c8b0795cSMark F. Adams                 id_llist_2[lastid] = id_llist_2[flid];                    /* remove lidj from list */
497c8b0795cSMark F. Adams                 id_llist_2[flid] = id_llist_2[lid]; id_llist_2[lid] = flid; /* insert 'lidj' into head of llist */
498c8b0795cSMark F. Adams                 hav++;
499c8b0795cSMark F. Adams                 break;
500c8b0795cSMark F. Adams               }
501c8b0795cSMark F. Adams               lastid = flid;
502c8b0795cSMark F. Adams             }
503c8b0795cSMark F. Adams             if(hav!=1){
504c8b0795cSMark F. Adams               if(hav==0)SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"failed to find adj in 'selected' lists - structurally unsymmetric matrix");
505c8b0795cSMark F. Adams               SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"found node %d times???",hav);
506c8b0795cSMark F. Adams             }
507c8b0795cSMark F. Adams           }
508c8b0795cSMark F. Adams           else{            /* I'm stealing this local, owned by a ghost - ok to use _2, local */
509c8b0795cSMark F. Adams             assert(sgid==-1);
510c8b0795cSMark F. Adams             id_llist_2[lidj] = id_llist_2[lid]; id_llist_2[lid] = lidj; /* insert 'lidj' into head of llist */
511c8b0795cSMark F. Adams             /* local remove at end, off add/rm at end */
512c8b0795cSMark F. Adams           }
513c8b0795cSMark F. Adams         }
514c8b0795cSMark F. Adams       }
515c8b0795cSMark F. Adams     }
516c8b0795cSMark F. Adams     else if( state == DELETED && lid_cprowID_1 ) {
51774778d6cSJed Brown       PetscInt sgidold = (PetscInt)PetscRealPart(deleted_parent_gid[lid]);
518c8b0795cSMark F. Adams       /* see if I have a selected ghost neighbor that will steal me */
519c8b0795cSMark F. Adams       if( (ix=lid_cprowID_1[lid]) != -1 ){
520c8b0795cSMark F. Adams         ii = matB_1->compressedrow.i; n = ii[ix+1] - ii[ix];
521c8b0795cSMark F. Adams         idx = matB_1->j + ii[ix];
522c8b0795cSMark F. Adams         for( j=0 ; j<n ; j++ ) {
523c8b0795cSMark F. Adams           PetscInt cpid = idx[j];
524c8b0795cSMark F. Adams           NState statej = (NState)PetscRealPart(cpcol_1_state[cpid]);
525c8b0795cSMark F. Adams           if( IS_SELECTED(statej) && sgidold != (PetscInt)statej ) { /* ghost will steal this, remove from my list */
526c8b0795cSMark F. Adams             deleted_parent_gid[lid] = (PetscScalar)statej; /* send who selected with _2 */
527c8b0795cSMark F. Adams             if( sgidold>=my0 && sgidold<(my0+nloc) ) { /* this was mine */
528c8b0795cSMark F. Adams               PetscInt lastid,hav=0,flid,oldslidj=sgidold-my0;
529c8b0795cSMark F. Adams               /* remove from 'oldslidj' list, local so _2 is OK */
530c8b0795cSMark F. Adams               for( lastid=oldslidj, flid=id_llist_2[oldslidj] ; flid != -1 ; flid=id_llist_2[flid] ) {
531c8b0795cSMark F. Adams                 if( flid == lid ) {
532c8b0795cSMark F. Adams                   id_llist_2[lastid] = id_llist_2[flid];   /* remove lid from oldslidj list */
533c8b0795cSMark F. Adams                   hav++;
534c8b0795cSMark F. Adams                   break;
535c8b0795cSMark F. Adams                 }
536c8b0795cSMark F. Adams                 lastid = flid;
537c8b0795cSMark F. Adams               }
538c8b0795cSMark F. Adams               if(hav!=1){
539c8b0795cSMark F. Adams                 if(hav==0)SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"failed to find adj in 'selected' lists - structurally unsymmetric matrix");
540c8b0795cSMark F. Adams                 SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"found node %d times???",hav);
541c8b0795cSMark F. Adams               }
542c8b0795cSMark F. Adams               id_llist_2[lid] = -1; /* terminate linked list - needed? */
543c8b0795cSMark F. Adams             }
544c8b0795cSMark F. Adams             else assert(id_llist_2[lid] == -1);
545c8b0795cSMark F. Adams           }
546c8b0795cSMark F. Adams         }
547c8b0795cSMark F. Adams       }
548c8b0795cSMark F. Adams     } /* selected/deleted */
549c8b0795cSMark F. Adams     else assert(state == REMOVED || !lid_cprowID_1);
550c8b0795cSMark F. Adams   } /* node loop */
551c8b0795cSMark F. Adams 
552c8b0795cSMark F. Adams   if( isMPI ) {
553c8b0795cSMark F. Adams     PetscScalar *cpcol_2_sel_gid;
554c8b0795cSMark F. Adams     Vec          tempVec;
555c8b0795cSMark F. Adams     PetscInt     cpid;
556c8b0795cSMark F. Adams 
557c8b0795cSMark F. Adams     ierr = VecRestoreArray( mpimat_1->lvec, &cpcol_1_state ); CHKERRQ(ierr);
558c8b0795cSMark F. Adams     ierr = VecRestoreArray( mpimat_2->lvec, &cpcol_2_state ); CHKERRQ(ierr);
559c8b0795cSMark F. Adams 
560c8b0795cSMark F. Adams     /* get 'cpcol_2_sel_gid' */
561c8b0795cSMark F. Adams     ierr = MatGetVecs( Gmat_2, &tempVec, 0 );         CHKERRQ(ierr);
562c8b0795cSMark F. Adams     for(kk=0,j=my0;kk<nloc;kk++,j++){
563c8b0795cSMark F. Adams       ierr = VecSetValues( tempVec, 1, &j, &deleted_parent_gid[kk], INSERT_VALUES );  CHKERRQ(ierr);
564c8b0795cSMark F. Adams     }
565c8b0795cSMark F. Adams     ierr = VecAssemblyBegin( tempVec ); CHKERRQ(ierr);
566c8b0795cSMark F. Adams     ierr = VecAssemblyEnd( tempVec ); CHKERRQ(ierr);
567c8b0795cSMark F. Adams     ierr = VecScatterBegin(mpimat_2->Mvctx,tempVec, mpimat_2->lvec,INSERT_VALUES,SCATTER_FORWARD);
568c8b0795cSMark F. Adams     CHKERRQ(ierr);
569c8b0795cSMark F. Adams     ierr =   VecScatterEnd(mpimat_2->Mvctx,tempVec, mpimat_2->lvec,INSERT_VALUES,SCATTER_FORWARD);
570c8b0795cSMark F. Adams     CHKERRQ(ierr);
571c8b0795cSMark F. Adams     ierr = VecDestroy( &tempVec ); CHKERRQ(ierr);
572c8b0795cSMark F. Adams 
573c8b0795cSMark F. Adams     ierr = VecGetArray( mpimat_2->lvec, &cpcol_2_sel_gid ); CHKERRQ(ierr);
574c8b0795cSMark F. Adams 
575c8b0795cSMark F. Adams     /* look for deleted ghosts and see if they moved */
576c8b0795cSMark F. Adams     for(lid=0;lid<nloc;lid++){
577c8b0795cSMark F. Adams       NState state = lid_state[lid];
578c8b0795cSMark F. Adams       if( IS_SELECTED(state) ){
579c8b0795cSMark F. Adams         PetscInt flid,lastid,old_sgid=lid+my0;
580c8b0795cSMark F. Adams         /* look for deleted ghosts and see if they moved */
581c8b0795cSMark F. Adams         for( lastid=lid, flid=id_llist_2[lid] ; flid!=-1 ; flid=id_llist_2[flid] ) {
582c8b0795cSMark F. Adams           if( flid>=nloc ) {
58374778d6cSJed Brown             PetscInt cpid = flid-nloc, sgid_new = (PetscInt)PetscRealPart(cpcol_2_sel_gid[cpid]);
584c8b0795cSMark F. Adams             if( sgid_new != old_sgid && sgid_new != -1 ) {
585c8b0795cSMark F. Adams               id_llist_2[lastid] = id_llist_2[flid];                    /* remove 'flid' from list */
586c8b0795cSMark F. Adams               id_llist_2[flid] = -1;
587c8b0795cSMark F. Adams               flid = lastid;
588c8b0795cSMark F. Adams             } /* if it changed parents */
589c8b0795cSMark F. Adams             else lastid = flid;
590c8b0795cSMark F. Adams           } /* for ghost nodes */
591c8b0795cSMark F. Adams           else lastid = flid;
592c8b0795cSMark F. Adams         } /* loop over list of deleted */
593c8b0795cSMark F. Adams       } /* selected */
594c8b0795cSMark F. Adams     }
595c8b0795cSMark F. Adams 
596c8b0795cSMark F. Adams     /* look at ghosts, see if they changed, and moved here */
597c8b0795cSMark F. Adams     for(cpid=0;cpid<nnodes_2-nloc;cpid++){
59874778d6cSJed Brown       PetscInt sgid_new = (PetscInt)PetscRealPart(cpcol_2_sel_gid[cpid]);
599c8b0795cSMark F. Adams       if( sgid_new>=my0 && sgid_new<(my0+nloc) ) { /* this is mine */
600c8b0795cSMark F. Adams         PetscInt lastid,flid,slid_new=sgid_new-my0,flidj=nloc+cpid,hav=0;
601c8b0795cSMark F. Adams         for( lastid=slid_new, flid=id_llist_2[slid_new] ; flid != -1 ; flid=id_llist_2[flid] ) {
602c8b0795cSMark F. Adams           if( flid == flidj ) {
603c8b0795cSMark F. Adams             hav++;
604c8b0795cSMark F. Adams             break;
605c8b0795cSMark F. Adams           }
606c8b0795cSMark F. Adams           lastid = flid;
607c8b0795cSMark F. Adams         }
608c8b0795cSMark F. Adams         if( hav != 1 ){
609c8b0795cSMark F. Adams           assert(id_llist_2[flidj] == -1);
610c8b0795cSMark F. Adams           id_llist_2[flidj] = id_llist_2[slid_new]; id_llist_2[slid_new] = flidj; /* insert 'flidj' into head of llist */
611c8b0795cSMark F. Adams         }
612c8b0795cSMark F. Adams       }
613c8b0795cSMark F. Adams     }
614c8b0795cSMark F. Adams 
615c8b0795cSMark F. Adams     ierr = VecRestoreArray( mpimat_2->lvec, &cpcol_2_sel_gid ); CHKERRQ(ierr);
616c8b0795cSMark F. Adams     ierr = PetscFree( lid_cprowID_1 );  CHKERRQ(ierr);
617c8b0795cSMark F. Adams     ierr = PetscFree( lid_cprowID_2 );  CHKERRQ(ierr);
618c8b0795cSMark F. Adams   }
619c8b0795cSMark F. Adams 
620c8b0795cSMark F. Adams   /* copy out new aggs */
621c8b0795cSMark F. Adams   ierr = ISGeneralSetIndices(llist_aggs_2, nnodes_2, id_llist_2, PETSC_COPY_VALUES ); CHKERRQ(ierr);
622c8b0795cSMark F. Adams 
623c8b0795cSMark F. Adams   ierr = PetscFree( id_llist_2 );  CHKERRQ(ierr);
624c8b0795cSMark F. Adams   ierr = PetscFree( deleted_parent_gid );  CHKERRQ(ierr);
625c8b0795cSMark F. Adams   ierr = PetscFree( lid_state );  CHKERRQ(ierr);
626c8b0795cSMark F. Adams 
627c8b0795cSMark F. Adams   PetscFunctionReturn(0);
628c8b0795cSMark F. Adams }
6292e68589bSMark F. Adams 
6302e68589bSMark F. Adams /* -------------------------------------------------------------------------- */
6312e68589bSMark F. Adams /*
6322e68589bSMark F. Adams    PCSetData_AGG
6332e68589bSMark F. Adams 
6342e68589bSMark F. Adams   Input Parameter:
6352e68589bSMark F. Adams    . pc -
6362e68589bSMark F. Adams */
6372e68589bSMark F. Adams #undef __FUNCT__
6382e68589bSMark F. Adams #define __FUNCT__ "PCSetData_AGG"
6392e68589bSMark F. Adams PetscErrorCode PCSetData_AGG( PC pc )
6402e68589bSMark F. Adams {
6412e68589bSMark F. Adams   PetscErrorCode  ierr;
6422e68589bSMark F. Adams   PetscFunctionBegin;
6432e68589bSMark F. Adams   ierr = PCSetCoordinates_AGG( pc, -1, PETSC_NULL ); CHKERRQ(ierr);
6442e68589bSMark F. Adams   PetscFunctionReturn(0);
6452e68589bSMark F. Adams }
6462e68589bSMark F. Adams 
6472e68589bSMark F. Adams /* -------------------------------------------------------------------------- */
6482e68589bSMark F. Adams /*
6492e68589bSMark F. Adams  formProl0
6502e68589bSMark F. Adams 
6512e68589bSMark F. Adams    Input Parameter:
6522e68589bSMark F. Adams    . selected - list of selected local ID, includes selected ghosts
6532e68589bSMark F. Adams    . locals_llist - linked list with aggregates
6542e68589bSMark F. Adams    . bs - block size
6552e68589bSMark F. Adams    . nSAvec - num columns of new P
6562e68589bSMark F. Adams    . my0crs - global index of locals
6572e68589bSMark F. Adams    . data_stride - bs*(nloc nodes + ghost nodes)
6582e68589bSMark F. Adams    . data_in[data_stride*nSAvec] - local data on fine grid
6592e68589bSMark F. Adams    . flid_fgid[data_stride/bs] - make local to global IDs, includes ghosts in 'locals_llist'
6602e68589bSMark F. Adams   Output Parameter:
6612e68589bSMark F. Adams    . a_data_out - in with fine grid data (w/ghosts), out with coarse grid data
6622e68589bSMark F. Adams    . a_Prol - prolongation operator
6632e68589bSMark F. Adams */
6642e68589bSMark F. Adams #undef __FUNCT__
6652e68589bSMark F. Adams #define __FUNCT__ "formProl0"
6662e68589bSMark F. Adams PetscErrorCode formProl0( IS selected, /* list of selected local ID, includes selected ghosts */
6672e68589bSMark F. Adams                           IS locals_llist, /* linked list from selected vertices of aggregate unselected vertices */
6682e68589bSMark F. Adams                           const PetscInt bs,
6692e68589bSMark F. Adams                           const PetscInt nSAvec,
6702e68589bSMark F. Adams                           const PetscInt my0crs,
6712e68589bSMark F. Adams                           const PetscInt data_stride,
6722e68589bSMark F. Adams                           PetscReal data_in[],
6732e68589bSMark F. Adams                           const PetscInt flid_fgid[],
6742e68589bSMark F. Adams                           PetscReal **a_data_out,
6752e68589bSMark F. Adams                           Mat a_Prol /* prolongation operator (output)*/
6762e68589bSMark F. Adams                           )
6772e68589bSMark F. Adams {
6782e68589bSMark F. Adams   PetscErrorCode ierr;
679b43b03e9SMark F. Adams   PetscInt  Istart,Iend,nFineLoc,clid,flid,aggID,kk,jj,ii,mm,nLocalSelected,ndone,nSelected,minsz;
6802e68589bSMark F. Adams   MPI_Comm       wcomm = ((PetscObject)a_Prol)->comm;
6812e68589bSMark F. Adams   PetscMPIInt    mype, npe;
6822e68589bSMark F. Adams   const PetscInt *selected_idx,*llist_idx;
6832e68589bSMark F. Adams   PetscReal      *out_data;
6842adcac29SMark F. Adams /* #define OUT_AGGS */
6859057884aSMark F. Adams #ifdef OUT_AGGS
6869057884aSMark F. Adams   static PetscInt llev = 0; char fname[32]; FILE *file;
6879057884aSMark F. Adams   sprintf(fname,"aggs_%d.m",llev++);
688b2a4f308SMark F. Adams   if(llev==1) {
6899057884aSMark F. Adams     file = fopen(fname,"w");
6909057884aSMark F. Adams     fprintf(file,"figure,\n");
691b2a4f308SMark F. Adams   }
6929057884aSMark F. Adams #endif
6932e68589bSMark F. Adams 
6942e68589bSMark F. Adams   PetscFunctionBegin;
6952e68589bSMark F. Adams   ierr = MPI_Comm_rank(wcomm,&mype);CHKERRQ(ierr);
6962e68589bSMark F. Adams   ierr = MPI_Comm_size(wcomm,&npe);CHKERRQ(ierr);
6972e68589bSMark F. Adams   ierr = MatGetOwnershipRange( a_Prol, &Istart, &Iend );    CHKERRQ(ierr);
6982e68589bSMark F. Adams   nFineLoc = (Iend-Istart)/bs; assert((Iend-Istart)%bs==0);
6992e68589bSMark F. Adams 
700c8b0795cSMark F. Adams   ierr = ISGetSize( selected, &nSelected );        CHKERRQ(ierr);
7012e68589bSMark F. Adams   ierr = ISGetIndices( selected, &selected_idx );       CHKERRQ(ierr);
702b43b03e9SMark F. Adams   ierr = ISGetIndices( locals_llist, &llist_idx );      CHKERRQ(ierr);
7032e68589bSMark F. Adams   for(kk=0,nLocalSelected=0;kk<nSelected;kk++){
7042e68589bSMark F. Adams     PetscInt lid = selected_idx[kk];
705b43b03e9SMark F. Adams     if( lid<nFineLoc && llist_idx[lid] != -1 ) nLocalSelected++;
7062e68589bSMark F. Adams   }
7072e68589bSMark F. Adams 
7082e68589bSMark F. Adams   /* aloc space for coarse point data (output) */
7092e68589bSMark F. Adams #define DATA_OUT_STRIDE (nLocalSelected*nSAvec)
710c8b0795cSMark F. Adams   ierr = PetscMalloc( DATA_OUT_STRIDE*nSAvec*sizeof(PetscReal), &out_data ); CHKERRQ(ierr);
711c8b0795cSMark F. Adams   for(ii=0;ii<DATA_OUT_STRIDE*nSAvec;ii++) out_data[ii]=1.e300;
7122e68589bSMark F. Adams   *a_data_out = out_data; /* output - stride nLocalSelected*nSAvec */
7132e68589bSMark F. Adams 
7142e68589bSMark F. Adams   /* find points and set prolongation */
715c8b0795cSMark F. Adams   minsz = 100;
7162e68589bSMark F. Adams   ndone = 0;
717b43b03e9SMark F. Adams   for( mm = clid = 0 ; mm < nSelected ; mm++ ){
718b43b03e9SMark F. Adams     PetscInt lid = selected_idx[mm];
7192e68589bSMark F. Adams     PetscInt cgid = my0crs + clid, cids[100];
720b43b03e9SMark F. Adams     if( lid>=nFineLoc || llist_idx[lid]==-1 ) continue; /* skip ghost or singleton */
721b43b03e9SMark F. Adams 
7222e68589bSMark F. Adams     /* count agg */
7232e68589bSMark F. Adams     aggID = 0;
724b43b03e9SMark F. Adams     flid = selected_idx[mm]; assert(flid != -1);
7252e68589bSMark F. Adams     do{
7262e68589bSMark F. Adams       aggID++;
7272e68589bSMark F. Adams     } while( (flid=llist_idx[flid]) != -1 );
728c8b0795cSMark F. Adams     if( aggID<minsz ) minsz = aggID;
7292e68589bSMark F. Adams 
7302e68589bSMark F. Adams     /* get block */
7312e68589bSMark F. Adams     {
7322e68589bSMark F. Adams       PetscBLASInt   asz=aggID,M=asz*bs,N=nSAvec,INFO;
7332e68589bSMark F. Adams       PetscBLASInt   Mdata=M+((N-M>0)?N-M:0),LDA=Mdata,LWORK=N*bs;
7342e68589bSMark F. Adams       PetscScalar    *qqc,*qqr,*TAU,*WORK;
7352e68589bSMark F. Adams       PetscInt       *fids;
7362e68589bSMark F. Adams 
7372e68589bSMark F. Adams       ierr = PetscMalloc( (Mdata*N)*sizeof(PetscScalar), &qqc ); CHKERRQ(ierr);
7382e68589bSMark F. Adams       ierr = PetscMalloc( (M*N)*sizeof(PetscScalar), &qqr ); CHKERRQ(ierr);
7392e68589bSMark F. Adams       ierr = PetscMalloc( N*sizeof(PetscScalar), &TAU ); CHKERRQ(ierr);
7402e68589bSMark F. Adams       ierr = PetscMalloc( LWORK*sizeof(PetscScalar), &WORK ); CHKERRQ(ierr);
7412e68589bSMark F. Adams       ierr = PetscMalloc( M*sizeof(PetscInt), &fids ); CHKERRQ(ierr);
7422e68589bSMark F. Adams 
743b43b03e9SMark F. Adams       flid = selected_idx[mm];
7442e68589bSMark F. Adams       aggID = 0;
7452e68589bSMark F. Adams       do{
7462e68589bSMark F. Adams         /* copy in B_i matrix - column oriented */
7472e68589bSMark F. Adams         PetscReal *data = &data_in[flid*bs];
7482e68589bSMark F. Adams         for( kk = ii = 0; ii < bs ; ii++ ) {
7492e68589bSMark F. Adams           for( jj = 0; jj < N ; jj++ ) {
7502e68589bSMark F. Adams             qqc[jj*Mdata + aggID*bs + ii] = data[jj*data_stride + ii];
7512e68589bSMark F. Adams           }
7522e68589bSMark F. Adams         }
7539057884aSMark F. Adams #ifdef OUT_AGGS
754b2a4f308SMark F. Adams         if(llev==1) {
7559057884aSMark F. Adams           char str[] = "plot(%e,%e,'r*'), hold on,\n", col[] = "rgbkmc", sim[] = "*os+h>d<vx^";
756b2a4f308SMark F. Adams           PetscInt M,pi,pj,gid=Istart+flid;
7579057884aSMark F. Adams           str[12] = col[clid%6]; str[13] = sim[(clid/6)%11];
758b2a4f308SMark F. Adams           M = (PetscInt)(PetscSqrtScalar((PetscScalar)nFineLoc*npe));
759b2a4f308SMark F. Adams           pj = gid/M; pi = gid%M;
760b2a4f308SMark F. Adams           fprintf(file,str,(double)pi,(double)pj);
761b2a4f308SMark F. Adams           /* fprintf(file,str,data[2*data_stride+1],-data[2*data_stride]); */
7629057884aSMark F. Adams         }
7639057884aSMark F. Adams #endif
7642e68589bSMark F. Adams         /* set fine IDs */
7652e68589bSMark F. Adams         for(kk=0;kk<bs;kk++) fids[aggID*bs + kk] = flid_fgid[flid]*bs + kk;
7662e68589bSMark F. Adams 
7672e68589bSMark F. Adams         aggID++;
7682e68589bSMark F. Adams       }while( (flid=llist_idx[flid]) != -1 );
7692e68589bSMark F. Adams 
7702e68589bSMark F. Adams       /* pad with zeros */
7712e68589bSMark F. Adams       for( ii = asz*bs; ii < Mdata ; ii++ ) {
7722e68589bSMark F. Adams 	for( jj = 0; jj < N ; jj++, kk++ ) {
7732e68589bSMark F. Adams 	  qqc[jj*Mdata + ii] = .0;
7742e68589bSMark F. Adams 	}
7752e68589bSMark F. Adams       }
7762e68589bSMark F. Adams 
7772e68589bSMark F. Adams       ndone += aggID;
7782e68589bSMark F. Adams       /* QR */
7792e68589bSMark F. Adams       LAPACKgeqrf_( &Mdata, &N, qqc, &LDA, TAU, WORK, &LWORK, &INFO );
7802e68589bSMark F. Adams       if( INFO != 0 ) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"xGEQRS error");
7812e68589bSMark F. Adams       /* get R - column oriented - output B_{i+1} */
7822e68589bSMark F. Adams       {
7832e68589bSMark F. Adams         PetscReal *data = &out_data[clid*nSAvec];
7842e68589bSMark F. Adams         for( jj = 0; jj < nSAvec ; jj++ ) {
7852e68589bSMark F. Adams           for( ii = 0; ii < nSAvec ; ii++ ) {
7862e68589bSMark F. Adams             assert(data[jj*DATA_OUT_STRIDE + ii] == 1.e300);
7872e68589bSMark F. Adams             if( ii <= jj ) data[jj*DATA_OUT_STRIDE + ii] = PetscRealPart(qqc[jj*Mdata + ii]);
7882e68589bSMark F. Adams 	    else data[jj*DATA_OUT_STRIDE + ii] = 0.;
7892e68589bSMark F. Adams           }
7902e68589bSMark F. Adams         }
7912e68589bSMark F. Adams       }
7922e68589bSMark F. Adams 
7932e68589bSMark F. Adams       /* get Q - row oriented */
7942e68589bSMark F. Adams       LAPACKungqr_( &Mdata, &N, &N, qqc, &LDA, TAU, WORK, &LWORK, &INFO );
7952e68589bSMark F. Adams       if( INFO != 0 ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"xORGQR error arg %d",-INFO);
7962e68589bSMark F. Adams 
7972e68589bSMark F. Adams       for( ii = 0 ; ii < M ; ii++ ){
7982e68589bSMark F. Adams         for( jj = 0 ; jj < N ; jj++ ) {
7992e68589bSMark F. Adams           qqr[N*ii + jj] = qqc[jj*Mdata + ii];
8002e68589bSMark F. Adams         }
8012e68589bSMark F. Adams       }
8022e68589bSMark F. Adams 
8032e68589bSMark F. Adams       /* add diagonal block of P0 */
804c8b0795cSMark F. Adams       for(kk=0;kk<N;kk++) {
805c8b0795cSMark F. Adams         cids[kk] = N*cgid + kk; /* global col IDs in P0 */
806c8b0795cSMark F. Adams       }
8072e68589bSMark F. Adams       ierr = MatSetValues(a_Prol,M,fids,N,cids,qqr,INSERT_VALUES); CHKERRQ(ierr);
8082e68589bSMark F. Adams 
8092e68589bSMark F. Adams       ierr = PetscFree( qqc );  CHKERRQ(ierr);
8102e68589bSMark F. Adams       ierr = PetscFree( qqr );  CHKERRQ(ierr);
8112e68589bSMark F. Adams       ierr = PetscFree( TAU );  CHKERRQ(ierr);
8122e68589bSMark F. Adams       ierr = PetscFree( WORK );  CHKERRQ(ierr);
8132e68589bSMark F. Adams       ierr = PetscFree( fids );  CHKERRQ(ierr);
8142e68589bSMark F. Adams     } /* scoping */
815b43b03e9SMark F. Adams     clid++;
8162e68589bSMark F. Adams   } /* for all coarse nodes */
8172e68589bSMark F. Adams 
818c8b0795cSMark F. Adams /* ierr = MPI_Allreduce( &ndone, &ii, 1, MPIU_INT, MPIU_SUM, wcomm ); */
8192e68589bSMark F. Adams /* MatGetSize( a_Prol, &kk, &jj ); */
820c8b0795cSMark F. Adams /* ierr = MPI_Allreduce( &minsz, &jj, 1, MPIU_INT, MPIU_MIN, wcomm ); */
821ef4ad70eSMark F. Adams /* PetscPrintf(PETSC_COMM_WORLD," **** [%d]%s %d total done, %d nodes (%d local done), min agg. size = %d\n",mype,__FUNCT__,ii,kk/bs,ndone,jj); */
8222e68589bSMark F. Adams 
8239057884aSMark F. Adams #ifdef OUT_AGGS
824b2a4f308SMark F. Adams   if(llev==1) fclose(file);
8259057884aSMark F. Adams #endif
8262e68589bSMark F. Adams   ierr = ISRestoreIndices( selected, &selected_idx );     CHKERRQ(ierr);
8272e68589bSMark F. Adams   ierr = ISRestoreIndices( locals_llist, &llist_idx );     CHKERRQ(ierr);
8282e68589bSMark F. Adams   ierr = MatAssemblyBegin(a_Prol,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
8292e68589bSMark F. Adams   ierr = MatAssemblyEnd(a_Prol,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
8302e68589bSMark F. Adams 
8312e68589bSMark F. Adams   PetscFunctionReturn(0);
8322e68589bSMark F. Adams }
8332e68589bSMark F. Adams 
8342e68589bSMark F. Adams /* -------------------------------------------------------------------------- */
8352e68589bSMark F. Adams /*
836c8b0795cSMark F. Adams    PCGAMGgraph_AGG
8372e68589bSMark F. Adams 
8382e68589bSMark F. Adams   Input Parameter:
8392e68589bSMark F. Adams    . pc - this
8402e68589bSMark F. Adams    . Amat - matrix on this fine level
8412e68589bSMark F. Adams   Output Parameter:
842c8b0795cSMark F. Adams    . a_Gmat -
8432e68589bSMark F. Adams */
8442e68589bSMark F. Adams #undef __FUNCT__
845c8b0795cSMark F. Adams #define __FUNCT__ "PCGAMGgraph_AGG"
846c8b0795cSMark F. Adams PetscErrorCode PCGAMGgraph_AGG( PC pc,
8472e68589bSMark F. Adams                                 const Mat Amat,
848c8b0795cSMark F. Adams                                 Mat *a_Gmat
849c8b0795cSMark F. Adams                                 )
850c8b0795cSMark F. Adams {
851c8b0795cSMark F. Adams   PetscErrorCode ierr;
852c8b0795cSMark F. Adams   PC_MG          *mg = (PC_MG*)pc->data;
853c8b0795cSMark F. Adams   PC_GAMG        *pc_gamg = (PC_GAMG*)mg->innerctx;
854c8b0795cSMark F. Adams   const PetscInt verbose = pc_gamg->verbose;
855c8b0795cSMark F. Adams   const PetscReal vfilter = pc_gamg->threshold;
856c8b0795cSMark F. Adams   PC_GAMG_AGG    *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx;
857c8b0795cSMark F. Adams   PetscMPIInt    mype,npe;
858c8b0795cSMark F. Adams   Mat            Gmat, Gmat2;
859c8b0795cSMark F. Adams   MPI_Comm       wcomm = ((PetscObject)Amat)->comm;
860c8b0795cSMark F. Adams 
861c8b0795cSMark F. Adams   PetscFunctionBegin;
862c8b0795cSMark F. Adams   ierr = MPI_Comm_rank( wcomm, &mype);  CHKERRQ(ierr);
863c8b0795cSMark F. Adams   ierr = MPI_Comm_size( wcomm, &npe);   CHKERRQ(ierr);
864c8b0795cSMark F. Adams 
865c8b0795cSMark F. Adams   ierr  = createSimpleGraph( Amat, &Gmat ); CHKERRQ( ierr );
866c8b0795cSMark F. Adams   ierr  = scaleFilterGraph( &Gmat, vfilter, pc_gamg_agg->sym_graph, verbose ); CHKERRQ( ierr );
867c8b0795cSMark F. Adams 
868ef4ad70eSMark F. Adams   if( pc_gamg_agg->square_graph ) {
869c8b0795cSMark F. Adams     ierr = MatTransposeMatMult( Gmat, Gmat, MAT_INITIAL_MATRIX, PETSC_DEFAULT, &Gmat2 );
870c8b0795cSMark F. Adams     CHKERRQ(ierr);
871c8b0795cSMark F. Adams     /* attach auxilary matrix */
872c8b0795cSMark F. Adams     pc_gamg_agg->aux_mat = Gmat;
873c8b0795cSMark F. Adams     *a_Gmat = Gmat2;
874ef4ad70eSMark F. Adams   }
875ef4ad70eSMark F. Adams   else {
876ef4ad70eSMark F. Adams     *a_Gmat = Gmat;       assert(pc_gamg_agg->aux_mat == 0);
877ef4ad70eSMark F. Adams   }
878c8b0795cSMark F. Adams 
879c8b0795cSMark F. Adams   PetscFunctionReturn(0);
880c8b0795cSMark F. Adams }
881c8b0795cSMark F. Adams 
882c8b0795cSMark F. Adams /* -------------------------------------------------------------------------- */
883c8b0795cSMark F. Adams /*
884b43b03e9SMark F. Adams    PCGAMGCoarsen_AGG
885c8b0795cSMark F. Adams 
886c8b0795cSMark F. Adams   Input Parameter:
887c8b0795cSMark F. Adams    . pc - this
888c8b0795cSMark F. Adams    . Gmat2 - matrix on this fine level
889c8b0795cSMark F. Adams   Output Parameter:
890c8b0795cSMark F. Adams    . a_selected - prolongation operator to the next level
891c8b0795cSMark F. Adams    . a_llist_parent - data of coarse grid points (num local columns in 'a_P_out')
892c8b0795cSMark F. Adams */
893c8b0795cSMark F. Adams #undef __FUNCT__
894b43b03e9SMark F. Adams #define __FUNCT__ "PCGAMGCoarsen_AGG"
895b43b03e9SMark F. Adams PetscErrorCode PCGAMGCoarsen_AGG( PC pc,
896c8b0795cSMark F. Adams                                   const Mat Gmat2,
897c8b0795cSMark F. Adams                                   IS *a_selected,
898c8b0795cSMark F. Adams                                   IS *a_llist_parent
899c8b0795cSMark F. Adams                                   )
900c8b0795cSMark F. Adams {
901c8b0795cSMark F. Adams   PetscErrorCode ierr;
902c8b0795cSMark F. Adams   PC_MG          *mg = (PC_MG*)pc->data;
903c8b0795cSMark F. Adams   PC_GAMG        *pc_gamg = (PC_GAMG*)mg->innerctx;
904c8b0795cSMark F. Adams   PC_GAMG_AGG    *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx;
905c8b0795cSMark F. Adams   Mat             Gmat1; /* unsquared graph (not symetrized!) */
906c8b0795cSMark F. Adams   IS              perm, selected, llist_parent;
907c8b0795cSMark F. Adams   PetscInt        Ii,nloc,bs,n,m;
908c8b0795cSMark F. Adams   PetscInt *permute;
909c8b0795cSMark F. Adams   PetscBool *bIndexSet;
910b43b03e9SMark F. Adams   MatCoarsen crs;
911b43b03e9SMark F. Adams   MPI_Comm        wcomm = ((PetscObject)Gmat2)->comm;
912c8b0795cSMark F. Adams   /* PetscMPIInt     mype,npe; */
913c8b0795cSMark F. Adams 
914c8b0795cSMark F. Adams   PetscFunctionBegin;
915c8b0795cSMark F. Adams   /* ierr = MPI_Comm_rank( wcomm, &mype);  CHKERRQ(ierr); */
916c8b0795cSMark F. Adams   /* ierr = MPI_Comm_size( wcomm, &npe);   CHKERRQ(ierr); */
917c8b0795cSMark F. Adams   ierr = MatGetLocalSize( Gmat2, &n, &m ); CHKERRQ(ierr);
918c8b0795cSMark F. Adams   ierr = MatGetBlockSize( Gmat2, &bs ); CHKERRQ(ierr); assert(bs==1);
919c8b0795cSMark F. Adams   nloc = n/bs;
920c8b0795cSMark F. Adams 
921c8b0795cSMark F. Adams   /* get unsquared graph */
922c8b0795cSMark F. Adams   Gmat1 = pc_gamg_agg->aux_mat; pc_gamg_agg->aux_mat = 0;
923c8b0795cSMark F. Adams 
924c8b0795cSMark F. Adams   /* get MIS aggs */
925c8b0795cSMark F. Adams   /* randomize */
926c8b0795cSMark F. Adams   ierr = PetscMalloc( nloc*sizeof(PetscInt), &permute ); CHKERRQ(ierr);
927c8b0795cSMark F. Adams   ierr = PetscMalloc( nloc*sizeof(PetscBool), &bIndexSet ); CHKERRQ(ierr);
928c8b0795cSMark F. Adams   for ( Ii = 0; Ii < nloc ; Ii++ ){
929c8b0795cSMark F. Adams     bIndexSet[Ii] = PETSC_FALSE;
930c8b0795cSMark F. Adams     permute[Ii] = Ii;
931c8b0795cSMark F. Adams   }
932c8b0795cSMark F. Adams   srand(1); /* make deterministic */
933c8b0795cSMark F. Adams   for ( Ii = 0; Ii < nloc ; Ii++ ) {
934c8b0795cSMark F. Adams     PetscInt iSwapIndex = rand()%nloc;
935c8b0795cSMark F. Adams     if (!bIndexSet[iSwapIndex] && iSwapIndex != Ii) {
936c8b0795cSMark F. Adams       PetscInt iTemp = permute[iSwapIndex];
937c8b0795cSMark F. Adams       permute[iSwapIndex] = permute[Ii];
938c8b0795cSMark F. Adams       permute[Ii] = iTemp;
939c8b0795cSMark F. Adams       bIndexSet[iSwapIndex] = PETSC_TRUE;
940c8b0795cSMark F. Adams     }
941c8b0795cSMark F. Adams   }
942c8b0795cSMark F. Adams   ierr = PetscFree( bIndexSet );  CHKERRQ(ierr);
943c8b0795cSMark F. Adams 
944c8b0795cSMark F. Adams   ierr = ISCreateGeneral(PETSC_COMM_SELF, nloc, permute, PETSC_USE_POINTER, &perm);
945c8b0795cSMark F. Adams   CHKERRQ(ierr);
946b43b03e9SMark F. Adams #if defined PETSC_USE_LOG
947b43b03e9SMark F. Adams   ierr = PetscLogEventBegin(gamg_setup_events[SET4],0,0,0,0);CHKERRQ(ierr);
948b43b03e9SMark F. Adams #endif
949b43b03e9SMark F. Adams   ierr = MatCoarsenCreate( wcomm, &crs ); CHKERRQ(ierr);
9509057884aSMark F. Adams   /* ierr = MatCoarsenSetType( crs, MATCOARSENMIS ); CHKERRQ(ierr); */
9519057884aSMark F. Adams   ierr = MatCoarsenSetFromOptions( crs ); CHKERRQ(ierr);
952b43b03e9SMark F. Adams   ierr = MatCoarsenSetGreedyOrdering( crs, perm ); CHKERRQ(ierr);
953b43b03e9SMark F. Adams   ierr = MatCoarsenSetAdjacency( crs, Gmat2 ); CHKERRQ(ierr);
954b43b03e9SMark F. Adams   ierr = MatCoarsenSetVerbose( crs, pc_gamg->verbose ); CHKERRQ(ierr);
955b43b03e9SMark F. Adams   ierr = MatCoarsenSetStrictAggs( crs, PETSC_TRUE ); CHKERRQ(ierr);
956b43b03e9SMark F. Adams   ierr = MatCoarsenApply( crs ); CHKERRQ(ierr);
957b43b03e9SMark F. Adams   ierr = MatCoarsenGetMISAggLists( crs, &selected, &llist_parent ); CHKERRQ(ierr);
958b43b03e9SMark F. Adams   ierr = MatCoarsenDestroy( &crs ); CHKERRQ(ierr);
959b43b03e9SMark F. Adams 
960c8b0795cSMark F. Adams   ierr = ISDestroy( &perm );                    CHKERRQ(ierr);
961c8b0795cSMark F. Adams   ierr = PetscFree( permute );  CHKERRQ(ierr);
962b43b03e9SMark F. Adams #if defined PETSC_USE_LOG
963b43b03e9SMark F. Adams   ierr = PetscLogEventEnd(gamg_setup_events[SET4],0,0,0,0);CHKERRQ(ierr);
964b43b03e9SMark F. Adams #endif
965c8b0795cSMark F. Adams   /* smooth aggs */
966ef4ad70eSMark F. Adams   if( Gmat1 ) {
967c8b0795cSMark F. Adams     ierr = smoothAggs( Gmat2, Gmat1, selected, llist_parent ); CHKERRQ(ierr);
968c8b0795cSMark F. Adams     ierr = MatDestroy( &Gmat1 );  CHKERRQ(ierr);
969ef4ad70eSMark F. Adams   }
970c8b0795cSMark F. Adams 
971c8b0795cSMark F. Adams   *a_selected = selected;
972c8b0795cSMark F. Adams   *a_llist_parent = llist_parent;
973c8b0795cSMark F. Adams 
974c8b0795cSMark F. Adams   PetscFunctionReturn(0);
975c8b0795cSMark F. Adams }
976c8b0795cSMark F. Adams 
977c8b0795cSMark F. Adams /* -------------------------------------------------------------------------- */
978c8b0795cSMark F. Adams /*
979c8b0795cSMark F. Adams  PCGAMGprolongator_AGG
980c8b0795cSMark F. Adams 
981c8b0795cSMark F. Adams  Input Parameter:
982c8b0795cSMark F. Adams  . pc - this
983c8b0795cSMark F. Adams  . Amat - matrix on this fine level
984c8b0795cSMark F. Adams  . Graph - used to get ghost data for nodes in
985c8b0795cSMark F. Adams  . selected - [nselected inc. chosts]
986c8b0795cSMark F. Adams  . llist_parent - [nloc + Gmat.nghost] linked list
987c8b0795cSMark F. Adams  Output Parameter:
988c8b0795cSMark F. Adams  . a_P_out - prolongation operator to the next level
989c8b0795cSMark F. Adams  */
990c8b0795cSMark F. Adams #undef __FUNCT__
991c8b0795cSMark F. Adams #define __FUNCT__ "PCGAMGprolongator_AGG"
992c8b0795cSMark F. Adams PetscErrorCode PCGAMGprolongator_AGG( PC pc,
993c8b0795cSMark F. Adams                                      const Mat Amat,
994c8b0795cSMark F. Adams                                      const Mat Gmat,
995c8b0795cSMark F. Adams                                      IS selected,
996c8b0795cSMark F. Adams                                      IS llist_parent,
997c8b0795cSMark F. Adams                                      Mat *a_P_out
9982e68589bSMark F. Adams                                      )
9992e68589bSMark F. Adams {
10002e68589bSMark F. Adams   PC_MG          *mg = (PC_MG*)pc->data;
10012e68589bSMark F. Adams   PC_GAMG        *pc_gamg = (PC_GAMG*)mg->innerctx;
10022e68589bSMark F. Adams   const PetscInt verbose = pc_gamg->verbose;
1003c8b0795cSMark F. Adams   const PetscInt data_cols = pc_gamg->data_cell_cols;
10042e68589bSMark F. Adams   PetscErrorCode ierr;
1005c8b0795cSMark F. Adams   PetscInt       Istart,Iend,nloc,ii,jj,kk,my0,nLocalSelected,bs;
1006c8b0795cSMark F. Adams   Mat            Prol;
10072e68589bSMark F. Adams   PetscMPIInt    mype, npe;
10082e68589bSMark F. Adams   MPI_Comm       wcomm = ((PetscObject)Amat)->comm;
1009b43b03e9SMark F. Adams   const PetscInt *selected_idx,*llist_idx,col_bs=data_cols;
1010c8b0795cSMark F. Adams   PetscReal      *data_w_ghost;
1011c8b0795cSMark F. Adams   PetscInt       myCrs0, nbnodes=0, *flid_fgid;
10122e68589bSMark F. Adams 
10132e68589bSMark F. Adams   PetscFunctionBegin;
10142e68589bSMark F. Adams   ierr = MPI_Comm_rank( wcomm, &mype);  CHKERRQ(ierr);
10152e68589bSMark F. Adams   ierr = MPI_Comm_size( wcomm, &npe);   CHKERRQ(ierr);
10162e68589bSMark F. Adams   ierr = MatGetOwnershipRange( Amat, &Istart, &Iend ); CHKERRQ(ierr);
1017c8b0795cSMark F. Adams   ierr  = MatGetBlockSize( Amat, &bs ); CHKERRQ( ierr );
1018c8b0795cSMark F. Adams   nloc = (Iend-Istart)/bs; my0 = Istart/bs; assert((Iend-Istart)%bs==0);
10192e68589bSMark F. Adams 
10202e68589bSMark F. Adams   /* get 'nLocalSelected' */
1021c8b0795cSMark F. Adams   ierr = ISGetSize( selected, &kk );        CHKERRQ(ierr);
1022c8b0795cSMark F. Adams   ierr = ISGetIndices( selected, &selected_idx );     CHKERRQ(ierr);
1023b43b03e9SMark F. Adams   ierr = ISGetIndices( llist_parent, &llist_idx );     CHKERRQ(ierr);
1024c8b0795cSMark F. Adams   for(ii=0,nLocalSelected=0;ii<kk;ii++){
1025c8b0795cSMark F. Adams     PetscInt lid = selected_idx[ii];
1026b43b03e9SMark F. Adams     /* filter out singletons */
1027b43b03e9SMark F. Adams     if( lid<nloc && llist_idx[lid] != -1) nLocalSelected++;
10282e68589bSMark F. Adams   }
1029c8b0795cSMark F. Adams   ierr = ISRestoreIndices( selected, &selected_idx );     CHKERRQ(ierr);
1030b43b03e9SMark F. Adams   ierr = ISRestoreIndices( llist_parent, &llist_idx );     CHKERRQ(ierr);
10312e68589bSMark F. Adams 
10322e68589bSMark F. Adams   /* create prolongator, create P matrix */
103369b1f4b7SBarry Smith   ierr = MatCreateAIJ( wcomm,
1034c8b0795cSMark F. Adams                        nloc*bs, nLocalSelected*col_bs,
10352e68589bSMark F. Adams                        PETSC_DETERMINE, PETSC_DETERMINE,
10362e68589bSMark F. Adams                        data_cols, PETSC_NULL, data_cols, PETSC_NULL,
10372e68589bSMark F. Adams                        &Prol );
10382e68589bSMark F. Adams   CHKERRQ(ierr);
10392e68589bSMark F. Adams 
10402e68589bSMark F. Adams   /* can get all points "removed" */
1041c8b0795cSMark F. Adams   ierr =  MatGetSize( Prol, &kk, &ii ); CHKERRQ(ierr);
1042c8b0795cSMark F. Adams   if( ii==0 ) {
10432e68589bSMark F. Adams     if( verbose ) {
1044c8b0795cSMark F. Adams       PetscPrintf(wcomm,"[%d]%s no selected points on coarse grid\n",mype,__FUNCT__);
10452e68589bSMark F. Adams     }
10462e68589bSMark F. Adams     ierr = MatDestroy( &Prol );  CHKERRQ(ierr);
10472e68589bSMark F. Adams     *a_P_out = PETSC_NULL;  /* out */
10482e68589bSMark F. Adams     PetscFunctionReturn(0);
10492e68589bSMark F. Adams   }
1050c8b0795cSMark F. Adams   if( verbose ) {
1051ef4ad70eSMark F. Adams     PetscPrintf(PETSC_COMM_WORLD,"\t\t[%d]%s New grid %d nodes\n",mype,__FUNCT__,ii/col_bs);
1052c8b0795cSMark F. Adams   }
1053c8b0795cSMark F. Adams   ierr = MatGetOwnershipRangeColumn( Prol, &myCrs0, &kk ); CHKERRQ(ierr);
1054c8b0795cSMark F. Adams   myCrs0 = myCrs0/col_bs;
10552e68589bSMark F. Adams 
10562e68589bSMark F. Adams   /* create global vector of data in 'data_w_ghost' */
10572e68589bSMark F. Adams #if defined PETSC_USE_LOG
10582e68589bSMark F. Adams   ierr = PetscLogEventBegin(gamg_setup_events[SET7],0,0,0,0);CHKERRQ(ierr);
10592e68589bSMark F. Adams #endif
1060c8b0795cSMark F. Adams   if (npe > 1) { /*  */
10612e68589bSMark F. Adams     PetscReal *tmp_gdata,*tmp_ldata,*tp2;
10622e68589bSMark F. Adams     ierr = PetscMalloc( nloc*sizeof(PetscReal), &tmp_ldata ); CHKERRQ(ierr);
10632e68589bSMark F. Adams     for( jj = 0 ; jj < data_cols ; jj++ ){
1064c8b0795cSMark F. Adams       for( kk = 0 ; kk < bs ; kk++) {
10652e68589bSMark F. Adams         PetscInt ii,nnodes;
1066c8b0795cSMark F. Adams         const PetscReal *tp = pc_gamg->data + jj*bs*nloc + kk;
1067c8b0795cSMark F. Adams         for( ii = 0 ; ii < nloc ; ii++, tp += bs ){
10682e68589bSMark F. Adams           tmp_ldata[ii] = *tp;
10692e68589bSMark F. Adams         }
10702e68589bSMark F. Adams         ierr = getDataWithGhosts( Gmat, 1, tmp_ldata, &nnodes, &tmp_gdata );
10712e68589bSMark F. Adams         CHKERRQ(ierr);
10722e68589bSMark F. Adams         if(jj==0 && kk==0) { /* now I know how many todal nodes - allocate */
1073c8b0795cSMark F. Adams           ierr = PetscMalloc( nnodes*bs*data_cols*sizeof(PetscReal), &data_w_ghost ); CHKERRQ(ierr);
1074c8b0795cSMark F. Adams           nbnodes = bs*nnodes;
10752e68589bSMark F. Adams         }
1076c8b0795cSMark F. Adams         tp2 = data_w_ghost + jj*bs*nnodes + kk;
1077c8b0795cSMark F. Adams         for( ii = 0 ; ii < nnodes ; ii++, tp2 += bs ){
10782e68589bSMark F. Adams           *tp2 = tmp_gdata[ii];
10792e68589bSMark F. Adams         }
10802e68589bSMark F. Adams         ierr = PetscFree( tmp_gdata ); CHKERRQ(ierr);
10812e68589bSMark F. Adams       }
10822e68589bSMark F. Adams     }
10832e68589bSMark F. Adams     ierr = PetscFree( tmp_ldata ); CHKERRQ(ierr);
10842e68589bSMark F. Adams   }
10852e68589bSMark F. Adams   else {
1086c8b0795cSMark F. Adams     nbnodes = bs*nloc;
1087c8b0795cSMark F. Adams     data_w_ghost = (PetscReal*)pc_gamg->data;
10882e68589bSMark F. Adams   }
10892e68589bSMark F. Adams 
10902e68589bSMark F. Adams   /* get P0 */
10912e68589bSMark F. Adams   if( npe > 1 ){
10922e68589bSMark F. Adams     PetscReal *fid_glid_loc,*fiddata;
10932e68589bSMark F. Adams     PetscInt nnodes;
10942e68589bSMark F. Adams 
10952e68589bSMark F. Adams     ierr = PetscMalloc( nloc*sizeof(PetscReal), &fid_glid_loc ); CHKERRQ(ierr);
10962e68589bSMark F. Adams     for(kk=0;kk<nloc;kk++) fid_glid_loc[kk] = (PetscReal)(my0+kk);
10972e68589bSMark F. Adams     ierr = getDataWithGhosts( Gmat, 1, fid_glid_loc, &nnodes, &fiddata );
10982e68589bSMark F. Adams     CHKERRQ(ierr);
10992e68589bSMark F. Adams     ierr = PetscMalloc( nnodes*sizeof(PetscInt), &flid_fgid ); CHKERRQ(ierr);
11002e68589bSMark F. Adams     for(kk=0;kk<nnodes;kk++) flid_fgid[kk] = (PetscInt)fiddata[kk];
11012e68589bSMark F. Adams     ierr = PetscFree( fiddata ); CHKERRQ(ierr);
1102c8b0795cSMark F. Adams     assert(nnodes==nbnodes/bs);
11032e68589bSMark F. Adams     ierr = PetscFree( fid_glid_loc ); CHKERRQ(ierr);
11042e68589bSMark F. Adams   }
11052e68589bSMark F. Adams   else {
11062e68589bSMark F. Adams     ierr = PetscMalloc( nloc*sizeof(PetscInt), &flid_fgid ); CHKERRQ(ierr);
11072e68589bSMark F. Adams     for(kk=0;kk<nloc;kk++) flid_fgid[kk] = my0 + kk;
11082e68589bSMark F. Adams   }
11092e68589bSMark F. Adams #if defined PETSC_USE_LOG
11102e68589bSMark F. Adams   ierr = PetscLogEventEnd(gamg_setup_events[SET7],0,0,0,0);CHKERRQ(ierr);
1111c8b0795cSMark F. Adams   ierr = PetscLogEventBegin(gamg_setup_events[SET8],0,0,0,0);CHKERRQ(ierr);
11122e68589bSMark F. Adams #endif
1113c8b0795cSMark F. Adams   {
1114c8b0795cSMark F. Adams     PetscReal *data_out;
1115c8b0795cSMark F. Adams     ierr = formProl0( selected, llist_parent, bs, data_cols, myCrs0, nbnodes,
1116c8b0795cSMark F. Adams                       data_w_ghost, flid_fgid, &data_out, Prol );
11172e68589bSMark F. Adams     CHKERRQ(ierr);
1118c8b0795cSMark F. Adams     ierr = PetscFree( pc_gamg->data ); CHKERRQ( ierr );
1119c8b0795cSMark F. Adams     pc_gamg->data = data_out;
1120c8b0795cSMark F. Adams     pc_gamg->data_cell_rows = data_cols;
1121c8b0795cSMark F. Adams     pc_gamg->data_sz = data_cols*data_cols*nLocalSelected;
1122c8b0795cSMark F. Adams   }
1123c8b0795cSMark F. Adams  #if defined PETSC_USE_LOG
1124c8b0795cSMark F. Adams   ierr = PetscLogEventEnd(gamg_setup_events[SET8],0,0,0,0);CHKERRQ(ierr);
1125c8b0795cSMark F. Adams #endif
11262e68589bSMark F. Adams   if (npe > 1) ierr = PetscFree( data_w_ghost );      CHKERRQ(ierr);
11272e68589bSMark F. Adams   ierr = PetscFree( flid_fgid ); CHKERRQ(ierr);
11282e68589bSMark F. Adams 
1129c8b0795cSMark F. Adams   /* attach block size of columns */
1130c8b0795cSMark F. Adams   if( pc_gamg->col_bs_id == -1 ) {
1131c8b0795cSMark F. Adams     ierr = PetscObjectComposedDataRegister( &pc_gamg->col_bs_id ); assert(pc_gamg->col_bs_id != -1 );
1132c8b0795cSMark F. Adams   }
1133c8b0795cSMark F. Adams   ierr = PetscObjectComposedDataSetInt( (PetscObject)Prol, pc_gamg->col_bs_id, data_cols ); CHKERRQ(ierr);
1134c8b0795cSMark F. Adams 
1135c8b0795cSMark F. Adams   *a_P_out = Prol;  /* out */
1136c8b0795cSMark F. Adams 
1137c8b0795cSMark F. Adams   PetscFunctionReturn(0);
1138c8b0795cSMark F. Adams }
1139c8b0795cSMark F. Adams 
1140c8b0795cSMark F. Adams /* -------------------------------------------------------------------------- */
1141c8b0795cSMark F. Adams /*
1142c8b0795cSMark F. Adams    PCGAMGoptprol_AGG
1143c8b0795cSMark F. Adams 
1144c8b0795cSMark F. Adams   Input Parameter:
1145c8b0795cSMark F. Adams    . pc - this
1146c8b0795cSMark F. Adams    . Amat - matrix on this fine level
1147c8b0795cSMark F. Adams  In/Output Parameter:
1148c8b0795cSMark F. Adams    . a_P_out - prolongation operator to the next level
1149c8b0795cSMark F. Adams */
1150c8b0795cSMark F. Adams #undef __FUNCT__
1151c8b0795cSMark F. Adams #define __FUNCT__ "PCGAMGoptprol_AGG"
1152c8b0795cSMark F. Adams PetscErrorCode PCGAMGoptprol_AGG( PC pc,
1153c8b0795cSMark F. Adams                                   const Mat Amat,
1154c8b0795cSMark F. Adams                                   Mat *a_P
1155c8b0795cSMark F. Adams                                   )
1156c8b0795cSMark F. Adams {
1157c8b0795cSMark F. Adams   PetscErrorCode ierr;
1158c8b0795cSMark F. Adams   PC_MG          *mg = (PC_MG*)pc->data;
1159c8b0795cSMark F. Adams   PC_GAMG        *pc_gamg = (PC_GAMG*)mg->innerctx;
1160c8b0795cSMark F. Adams   const PetscInt verbose = pc_gamg->verbose;
1161c8b0795cSMark F. Adams   PC_GAMG_AGG    *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx;
1162c8b0795cSMark F. Adams   PetscInt       jj;
1163c8b0795cSMark F. Adams   PetscMPIInt    mype,npe;
1164c8b0795cSMark F. Adams   Mat            Prol = *a_P;
1165c8b0795cSMark F. Adams   MPI_Comm       wcomm = ((PetscObject)Amat)->comm;
1166c8b0795cSMark F. Adams 
1167c8b0795cSMark F. Adams   PetscFunctionBegin;
1168c8b0795cSMark F. Adams   ierr = MPI_Comm_rank( wcomm, &mype);  CHKERRQ(ierr);
1169c8b0795cSMark F. Adams   ierr = MPI_Comm_size( wcomm, &npe);   CHKERRQ(ierr);
1170c8b0795cSMark F. Adams 
11712e68589bSMark F. Adams   /* smooth P0 */
1172c8b0795cSMark F. Adams   for( jj = 0 ; jj < pc_gamg_agg->nsmooths ; jj++ ){
11732e68589bSMark F. Adams     Mat tMat;
11742e68589bSMark F. Adams     Vec diag;
11752e68589bSMark F. Adams     PetscReal alpha, emax, emin;
11762e68589bSMark F. Adams #if defined PETSC_USE_LOG
11772e68589bSMark F. Adams     ierr = PetscLogEventBegin(gamg_setup_events[SET9],0,0,0,0);CHKERRQ(ierr);
11782e68589bSMark F. Adams #endif
11792e68589bSMark F. Adams     if( jj == 0 ) {
11802e68589bSMark F. Adams       KSP eksp;
11812e68589bSMark F. Adams       Vec bb, xx;
11822e68589bSMark F. Adams       PC pc;
11832e68589bSMark F. Adams       ierr = MatGetVecs( Amat, &bb, 0 );         CHKERRQ(ierr);
11842e68589bSMark F. Adams       ierr = MatGetVecs( Amat, &xx, 0 );         CHKERRQ(ierr);
11852e68589bSMark F. Adams       {
11862e68589bSMark F. Adams         PetscRandom    rctx;
11872e68589bSMark F. Adams         ierr = PetscRandomCreate(wcomm,&rctx);CHKERRQ(ierr);
11882e68589bSMark F. Adams         ierr = PetscRandomSetFromOptions(rctx);CHKERRQ(ierr);
11892e68589bSMark F. Adams         ierr = VecSetRandom(bb,rctx);CHKERRQ(ierr);
11902e68589bSMark F. Adams         ierr = PetscRandomDestroy( &rctx ); CHKERRQ(ierr);
11912e68589bSMark F. Adams       }
11922e68589bSMark F. Adams       ierr = KSPCreate(wcomm,&eksp);                            CHKERRQ(ierr);
11932e68589bSMark F. Adams       ierr = KSPAppendOptionsPrefix( eksp, "est_");         CHKERRQ(ierr);
11942e68589bSMark F. Adams       ierr = KSPSetFromOptions( eksp );    CHKERRQ(ierr);
11952e68589bSMark F. Adams       ierr = KSPSetInitialGuessNonzero( eksp, PETSC_FALSE );    CHKERRQ(ierr);
11962e68589bSMark F. Adams       ierr = KSPSetOperators( eksp, Amat, Amat, SAME_NONZERO_PATTERN );
11972e68589bSMark F. Adams       CHKERRQ( ierr );
11982e68589bSMark F. Adams       ierr = KSPGetPC( eksp, &pc );                              CHKERRQ( ierr );
11992e68589bSMark F. Adams       ierr = PCSetType( pc, PCJACOBI ); CHKERRQ(ierr);  /* smoother */
12002e68589bSMark F. Adams       ierr = KSPSetTolerances(eksp,PETSC_DEFAULT,PETSC_DEFAULT,PETSC_DEFAULT,10);
12012e68589bSMark F. Adams       CHKERRQ(ierr);
12022e68589bSMark F. Adams       ierr = KSPSetNormType( eksp, KSP_NORM_NONE );                 CHKERRQ(ierr);
12032e68589bSMark F. Adams       ierr = KSPSetComputeSingularValues( eksp,PETSC_TRUE );        CHKERRQ(ierr);
12042e68589bSMark F. Adams 
12052e68589bSMark F. Adams       /* solve - keep stuff out of logging */
12062e68589bSMark F. Adams       ierr = PetscLogEventDeactivate(KSP_Solve);CHKERRQ(ierr);
12072e68589bSMark F. Adams       ierr = PetscLogEventDeactivate(PC_Apply);CHKERRQ(ierr);
12082e68589bSMark F. Adams       ierr = KSPSolve( eksp, bb, xx );                              CHKERRQ(ierr);
12092e68589bSMark F. Adams       ierr = PetscLogEventActivate(KSP_Solve);CHKERRQ(ierr);
12102e68589bSMark F. Adams       ierr = PetscLogEventActivate(PC_Apply);CHKERRQ(ierr);
12112e68589bSMark F. Adams 
12122e68589bSMark F. Adams       ierr = KSPComputeExtremeSingularValues( eksp, &emax, &emin ); CHKERRQ(ierr);
12132e68589bSMark F. Adams       if( verbose ) {
1214c8b0795cSMark F. Adams         PetscPrintf(wcomm,"\t\t\t%s smooth P0: max eigen=%e min=%e PC=%s\n",
12152e68589bSMark F. Adams                     __FUNCT__,emax,emin,PCJACOBI);
12162e68589bSMark F. Adams       }
12172e68589bSMark F. Adams       ierr = VecDestroy( &xx );       CHKERRQ(ierr);
12182e68589bSMark F. Adams       ierr = VecDestroy( &bb );       CHKERRQ(ierr);
12192e68589bSMark F. Adams       ierr = KSPDestroy( &eksp );     CHKERRQ(ierr);
12202e68589bSMark F. Adams 
12212e68589bSMark F. Adams       if( pc_gamg->emax_id == -1 ) {
12222e68589bSMark F. Adams         ierr = PetscObjectComposedDataRegister( &pc_gamg->emax_id );
12232e68589bSMark F. Adams         assert(pc_gamg->emax_id != -1 );
12242e68589bSMark F. Adams       }
12252e68589bSMark F. Adams       ierr = PetscObjectComposedDataSetScalar( (PetscObject)Amat, pc_gamg->emax_id, emax ); CHKERRQ(ierr);
12262e68589bSMark F. Adams     }
12272e68589bSMark F. Adams 
12282e68589bSMark F. Adams     /* smooth P1 := (I - omega/lam D^{-1}A)P0 */
12292e68589bSMark F. Adams     ierr = MatMatMult( Amat, Prol, MAT_INITIAL_MATRIX, PETSC_DEFAULT, &tMat );   CHKERRQ(ierr);
12302e68589bSMark F. Adams     ierr = MatGetVecs( Amat, &diag, 0 );    CHKERRQ(ierr);
12312e68589bSMark F. Adams     ierr = MatGetDiagonal( Amat, diag );    CHKERRQ(ierr); /* effectively PCJACOBI */
12322e68589bSMark F. Adams     ierr = VecReciprocal( diag );         CHKERRQ(ierr);
12332e68589bSMark F. Adams     ierr = MatDiagonalScale( tMat, diag, 0 ); CHKERRQ(ierr);
12342e68589bSMark F. Adams     ierr = VecDestroy( &diag );           CHKERRQ(ierr);
12352e68589bSMark F. Adams     alpha = -1.5/emax;
12362e68589bSMark F. Adams     ierr = MatAYPX( tMat, alpha, Prol, SUBSET_NONZERO_PATTERN );           CHKERRQ(ierr);
12372e68589bSMark F. Adams     ierr = MatDestroy( &Prol );  CHKERRQ(ierr);
12382e68589bSMark F. Adams     Prol = tMat;
12392e68589bSMark F. Adams #if defined PETSC_USE_LOG
12402e68589bSMark F. Adams     ierr = PetscLogEventEnd(gamg_setup_events[SET9],0,0,0,0);CHKERRQ(ierr);
12412e68589bSMark F. Adams #endif
12422e68589bSMark F. Adams   }
12432e68589bSMark F. Adams 
1244c8b0795cSMark F. Adams   *a_P = Prol;
1245c8b0795cSMark F. Adams 
1246c8b0795cSMark F. Adams   PetscFunctionReturn(0);
12472e68589bSMark F. Adams }
12482e68589bSMark F. Adams 
1249c8b0795cSMark F. Adams /* -------------------------------------------------------------------------- */
1250c8b0795cSMark F. Adams /*
1251c8b0795cSMark F. Adams    PCCreateGAMG_AGG
12522e68589bSMark F. Adams 
1253c8b0795cSMark F. Adams   Input Parameter:
1254c8b0795cSMark F. Adams    . pc -
1255c8b0795cSMark F. Adams */
1256c8b0795cSMark F. Adams #undef __FUNCT__
1257c8b0795cSMark F. Adams #define __FUNCT__ "PCCreateGAMG_AGG"
1258c8b0795cSMark F. Adams PetscErrorCode  PCCreateGAMG_AGG( PC pc )
1259c8b0795cSMark F. Adams {
1260c8b0795cSMark F. Adams   PetscErrorCode  ierr;
1261c8b0795cSMark F. Adams   PC_MG           *mg = (PC_MG*)pc->data;
1262c8b0795cSMark F. Adams   PC_GAMG         *pc_gamg = (PC_GAMG*)mg->innerctx;
1263c8b0795cSMark F. Adams   PC_GAMG_AGG      *pc_gamg_agg;
12642e68589bSMark F. Adams 
1265c8b0795cSMark F. Adams   PetscFunctionBegin;
1266c8b0795cSMark F. Adams   /* create sub context for SA */
1267c8b0795cSMark F. Adams   ierr = PetscNewLog( pc, PC_GAMG_AGG, &pc_gamg_agg ); CHKERRQ(ierr);
1268c8b0795cSMark F. Adams   assert(!pc_gamg->subctx);
1269c8b0795cSMark F. Adams   pc_gamg->subctx = pc_gamg_agg;
1270c8b0795cSMark F. Adams 
1271c8b0795cSMark F. Adams   pc->ops->setfromoptions = PCSetFromOptions_GAMG_AGG;
1272c8b0795cSMark F. Adams   pc->ops->destroy        = PCDestroy_AGG;
1273c8b0795cSMark F. Adams   /* reset does not do anything; setup not virtual */
1274c8b0795cSMark F. Adams 
1275c8b0795cSMark F. Adams   /* set internal function pointers */
1276c8b0795cSMark F. Adams   pc_gamg->graph = PCGAMGgraph_AGG;
1277b43b03e9SMark F. Adams   pc_gamg->coarsen = PCGAMGCoarsen_AGG;
1278c8b0795cSMark F. Adams   pc_gamg->prolongator = PCGAMGprolongator_AGG;
1279c8b0795cSMark F. Adams   pc_gamg->optprol = PCGAMGoptprol_AGG;
1280c8b0795cSMark F. Adams 
1281c8b0795cSMark F. Adams   pc_gamg->createdefaultdata = PCSetData_AGG;
1282c8b0795cSMark F. Adams 
1283c8b0795cSMark F. Adams   ierr = PetscObjectComposeFunctionDynamic( (PetscObject)pc,
1284c8b0795cSMark F. Adams                                             "PCSetCoordinates_C",
1285c8b0795cSMark F. Adams                                             "PCSetCoordinates_AGG",
1286c8b0795cSMark F. Adams                                             PCSetCoordinates_AGG);
12872e68589bSMark F. Adams   PetscFunctionReturn(0);
12882e68589bSMark F. Adams }
1289