xref: /petsc/src/ksp/pc/impls/gamg/agg.c (revision a2f3521de2a9d7869700f4c17e26c23fcfeaa6f6)
/*
 GAMG geometric-algebraic multigrid PC - Mark Adams 2011
 */
42e68589bSMark F. Adams 
52e68589bSMark F. Adams #include <../src/ksp/pc/impls/gamg/gamg.h>        /*I "petscpc.h" I*/
6b45d2f2cSJed Brown #include <petsc-private/kspimpl.h>
72e68589bSMark F. Adams 
82e68589bSMark F. Adams #include <assert.h>
92e68589bSMark F. Adams #include <petscblaslapack.h>
102e68589bSMark F. Adams 
112e68589bSMark F. Adams typedef struct {
12c8b0795cSMark F. Adams   PetscInt nsmooths;
13c8b0795cSMark F. Adams   PetscBool sym_graph;
14ef4ad70eSMark F. Adams   PetscBool square_graph;
152e68589bSMark F. Adams }PC_GAMG_AGG;
162e68589bSMark F. Adams 
172e68589bSMark F. Adams #undef __FUNCT__
182e68589bSMark F. Adams #define __FUNCT__ "PCGAMGSetNSmooths"
192e68589bSMark F. Adams /*@
202e68589bSMark F. Adams    PCGAMGSetNSmooths - Set number of smoothing steps (1 is typical)
212e68589bSMark F. Adams 
222e68589bSMark F. Adams    Not Collective on PC
232e68589bSMark F. Adams 
242e68589bSMark F. Adams    Input Parameters:
252e68589bSMark F. Adams .  pc - the preconditioner context
262e68589bSMark F. Adams 
272e68589bSMark F. Adams    Options Database Key:
282e68589bSMark F. Adams .  -pc_gamg_agg_nsmooths
292e68589bSMark F. Adams 
302e68589bSMark F. Adams    Level: intermediate
312e68589bSMark F. Adams 
322e68589bSMark F. Adams    Concepts: Aggregation AMG preconditioner
332e68589bSMark F. Adams 
342e68589bSMark F. Adams .seealso: ()
352e68589bSMark F. Adams @*/
362e68589bSMark F. Adams PetscErrorCode PCGAMGSetNSmooths(PC pc, PetscInt n)
372e68589bSMark F. Adams {
382e68589bSMark F. Adams   PetscErrorCode ierr;
392e68589bSMark F. Adams 
402e68589bSMark F. Adams   PetscFunctionBegin;
412e68589bSMark F. Adams   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
422e68589bSMark F. Adams   ierr = PetscTryMethod(pc,"PCGAMGSetNSmooths_C",(PC,PetscInt),(pc,n));CHKERRQ(ierr);
432e68589bSMark F. Adams   PetscFunctionReturn(0);
442e68589bSMark F. Adams }
452e68589bSMark F. Adams 
462e68589bSMark F. Adams EXTERN_C_BEGIN
472e68589bSMark F. Adams #undef __FUNCT__
482e68589bSMark F. Adams #define __FUNCT__ "PCGAMGSetNSmooths_GAMG"
492e68589bSMark F. Adams PetscErrorCode PCGAMGSetNSmooths_GAMG(PC pc, PetscInt n)
502e68589bSMark F. Adams {
512e68589bSMark F. Adams   PC_MG           *mg = (PC_MG*)pc->data;
522e68589bSMark F. Adams   PC_GAMG         *pc_gamg = (PC_GAMG*)mg->innerctx;
53c8b0795cSMark F. Adams   PC_GAMG_AGG     *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx;
542e68589bSMark F. Adams 
552e68589bSMark F. Adams   PetscFunctionBegin;
56c8b0795cSMark F. Adams   pc_gamg_agg->nsmooths = n;
57c8b0795cSMark F. Adams   PetscFunctionReturn(0);
58c8b0795cSMark F. Adams }
59c8b0795cSMark F. Adams EXTERN_C_END
60c8b0795cSMark F. Adams 
61c8b0795cSMark F. Adams #undef __FUNCT__
62c8b0795cSMark F. Adams #define __FUNCT__ "PCGAMGSetSymGraph"
63c8b0795cSMark F. Adams /*@
64c8b0795cSMark F. Adams    PCGAMGSetSymGraph -
65c8b0795cSMark F. Adams 
66c8b0795cSMark F. Adams    Not Collective on PC
67c8b0795cSMark F. Adams 
68c8b0795cSMark F. Adams    Input Parameters:
69c8b0795cSMark F. Adams .  pc - the preconditioner context
70c8b0795cSMark F. Adams 
71c8b0795cSMark F. Adams    Options Database Key:
72c8b0795cSMark F. Adams .  -pc_gamg_sym_graph
73c8b0795cSMark F. Adams 
74c8b0795cSMark F. Adams    Level: intermediate
75c8b0795cSMark F. Adams 
76c8b0795cSMark F. Adams    Concepts: Aggregation AMG preconditioner
77c8b0795cSMark F. Adams 
78c8b0795cSMark F. Adams .seealso: ()
79c8b0795cSMark F. Adams @*/
80c8b0795cSMark F. Adams PetscErrorCode PCGAMGSetSymGraph(PC pc, PetscBool n)
81c8b0795cSMark F. Adams {
82c8b0795cSMark F. Adams   PetscErrorCode ierr;
83c8b0795cSMark F. Adams 
84c8b0795cSMark F. Adams   PetscFunctionBegin;
85c8b0795cSMark F. Adams   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
86c8b0795cSMark F. Adams   ierr = PetscTryMethod(pc,"PCGAMGSetSymGraph_C",(PC,PetscBool),(pc,n));CHKERRQ(ierr);
87c8b0795cSMark F. Adams   PetscFunctionReturn(0);
88c8b0795cSMark F. Adams }
89c8b0795cSMark F. Adams 
90c8b0795cSMark F. Adams EXTERN_C_BEGIN
91c8b0795cSMark F. Adams #undef __FUNCT__
92c8b0795cSMark F. Adams #define __FUNCT__ "PCGAMGSetSymGraph_GAMG"
93c8b0795cSMark F. Adams PetscErrorCode PCGAMGSetSymGraph_GAMG(PC pc, PetscBool n)
94c8b0795cSMark F. Adams {
95c8b0795cSMark F. Adams   PC_MG           *mg = (PC_MG*)pc->data;
96c8b0795cSMark F. Adams   PC_GAMG         *pc_gamg = (PC_GAMG*)mg->innerctx;
97c8b0795cSMark F. Adams   PC_GAMG_AGG      *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx;
98c8b0795cSMark F. Adams 
99c8b0795cSMark F. Adams   PetscFunctionBegin;
100c8b0795cSMark F. Adams   pc_gamg_agg->sym_graph = n;
1012e68589bSMark F. Adams   PetscFunctionReturn(0);
1022e68589bSMark F. Adams }
1032e68589bSMark F. Adams EXTERN_C_END
1042e68589bSMark F. Adams 
105ef4ad70eSMark F. Adams #undef __FUNCT__
106ef4ad70eSMark F. Adams #define __FUNCT__ "PCGAMGSetSquareGraph"
107ef4ad70eSMark F. Adams /*@
108ef4ad70eSMark F. Adams    PCGAMGSetSquareGraph -
109ef4ad70eSMark F. Adams 
110ef4ad70eSMark F. Adams    Not Collective on PC
111ef4ad70eSMark F. Adams 
112ef4ad70eSMark F. Adams    Input Parameters:
113ef4ad70eSMark F. Adams .  pc - the preconditioner context
114ef4ad70eSMark F. Adams 
115ef4ad70eSMark F. Adams    Options Database Key:
116ef4ad70eSMark F. Adams .  -pc_gamg_square_graph
117ef4ad70eSMark F. Adams 
118ef4ad70eSMark F. Adams    Level: intermediate
119ef4ad70eSMark F. Adams 
120ef4ad70eSMark F. Adams    Concepts: Aggregation AMG preconditioner
121ef4ad70eSMark F. Adams 
122ef4ad70eSMark F. Adams .seealso: ()
123ef4ad70eSMark F. Adams @*/
124ef4ad70eSMark F. Adams PetscErrorCode PCGAMGSetSquareGraph(PC pc, PetscBool n)
125ef4ad70eSMark F. Adams {
126ef4ad70eSMark F. Adams   PetscErrorCode ierr;
127ef4ad70eSMark F. Adams 
128ef4ad70eSMark F. Adams   PetscFunctionBegin;
129ef4ad70eSMark F. Adams   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
130ef4ad70eSMark F. Adams   ierr = PetscTryMethod(pc,"PCGAMGSetSquareGraph_C",(PC,PetscBool),(pc,n));CHKERRQ(ierr);
131ef4ad70eSMark F. Adams   PetscFunctionReturn(0);
132ef4ad70eSMark F. Adams }
133ef4ad70eSMark F. Adams 
134ef4ad70eSMark F. Adams EXTERN_C_BEGIN
135ef4ad70eSMark F. Adams #undef __FUNCT__
136ef4ad70eSMark F. Adams #define __FUNCT__ "PCGAMGSetSquareGraph_GAMG"
137ef4ad70eSMark F. Adams PetscErrorCode PCGAMGSetSquareGraph_GAMG(PC pc, PetscBool n)
138ef4ad70eSMark F. Adams {
139ef4ad70eSMark F. Adams   PC_MG           *mg = (PC_MG*)pc->data;
140ef4ad70eSMark F. Adams   PC_GAMG         *pc_gamg = (PC_GAMG*)mg->innerctx;
141ef4ad70eSMark F. Adams   PC_GAMG_AGG      *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx;
142ef4ad70eSMark F. Adams 
143ef4ad70eSMark F. Adams   PetscFunctionBegin;
144ef4ad70eSMark F. Adams   pc_gamg_agg->square_graph = n;
145ef4ad70eSMark F. Adams   PetscFunctionReturn(0);
146ef4ad70eSMark F. Adams }
147ef4ad70eSMark F. Adams EXTERN_C_END
148ef4ad70eSMark F. Adams 
1492e68589bSMark F. Adams /* -------------------------------------------------------------------------- */
1502e68589bSMark F. Adams /*
1512e68589bSMark F. Adams    PCSetFromOptions_GAMG_AGG
1522e68589bSMark F. Adams 
1532e68589bSMark F. Adams   Input Parameter:
1542e68589bSMark F. Adams    . pc -
1552e68589bSMark F. Adams */
1562e68589bSMark F. Adams #undef __FUNCT__
1572e68589bSMark F. Adams #define __FUNCT__ "PCSetFromOptions_GAMG_AGG"
1582e68589bSMark F. Adams PetscErrorCode PCSetFromOptions_GAMG_AGG( PC pc )
1592e68589bSMark F. Adams {
1602e68589bSMark F. Adams   PetscErrorCode  ierr;
1612e68589bSMark F. Adams   PC_MG           *mg = (PC_MG*)pc->data;
1622e68589bSMark F. Adams   PC_GAMG         *pc_gamg = (PC_GAMG*)mg->innerctx;
163c8b0795cSMark F. Adams   PC_GAMG_AGG      *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx;
1642e68589bSMark F. Adams   PetscBool        flag;
1652e68589bSMark F. Adams 
1662e68589bSMark F. Adams   PetscFunctionBegin;
1672e68589bSMark F. Adams   /* call base class */
1682e68589bSMark F. Adams   ierr = PCSetFromOptions_GAMG( pc ); CHKERRQ(ierr);
1692e68589bSMark F. Adams 
1702e68589bSMark F. Adams   ierr = PetscOptionsHead("GAMG-AGG options"); CHKERRQ(ierr);
1712e68589bSMark F. Adams   {
1722e68589bSMark F. Adams     /* -pc_gamg_agg_nsmooths */
173c8b0795cSMark F. Adams     pc_gamg_agg->nsmooths = 0;
1742e68589bSMark F. Adams     ierr = PetscOptionsInt("-pc_gamg_agg_nsmooths",
1752e68589bSMark F. Adams                            "smoothing steps for smoothed aggregation, usually 1 (0)",
1762e68589bSMark F. Adams                            "PCGAMGSetNSmooths",
177c8b0795cSMark F. Adams                            pc_gamg_agg->nsmooths,
178c8b0795cSMark F. Adams                            &pc_gamg_agg->nsmooths,
179c8b0795cSMark F. Adams                            &flag);
180c8b0795cSMark F. Adams     CHKERRQ(ierr);
181c8b0795cSMark F. Adams 
182c8b0795cSMark F. Adams     /* -pc_gamg_sym_graph */
183c8b0795cSMark F. Adams     pc_gamg_agg->sym_graph = PETSC_FALSE;
184c8b0795cSMark F. Adams     ierr = PetscOptionsBool("-pc_gamg_sym_graph",
185581a99e3SJed Brown                             "Set for asymmetric matrices",
186c8b0795cSMark F. Adams                             "PCGAMGSetSymGraph",
187c8b0795cSMark F. Adams                             pc_gamg_agg->sym_graph,
188c8b0795cSMark F. Adams                             &pc_gamg_agg->sym_graph,
1892e68589bSMark F. Adams                             &flag);
1902e68589bSMark F. Adams     CHKERRQ(ierr);
191ef4ad70eSMark F. Adams 
192ef4ad70eSMark F. Adams     /* -pc_gamg_square_graph */
193ef4ad70eSMark F. Adams     pc_gamg_agg->square_graph = PETSC_TRUE;
194ef4ad70eSMark F. Adams     ierr = PetscOptionsBool("-pc_gamg_square_graph",
1950cbbd2e1SMark F. Adams                             "For faster coarsening and lower coarse grid complexity",
196ef4ad70eSMark F. Adams                             "PCGAMGSetSquareGraph",
197ef4ad70eSMark F. Adams                             pc_gamg_agg->square_graph,
198ef4ad70eSMark F. Adams                             &pc_gamg_agg->square_graph,
199ef4ad70eSMark F. Adams                             &flag);
200ef4ad70eSMark F. Adams     CHKERRQ(ierr);
2012e68589bSMark F. Adams   }
2022e68589bSMark F. Adams   ierr = PetscOptionsTail();CHKERRQ(ierr);
2032e68589bSMark F. Adams 
2042e68589bSMark F. Adams   PetscFunctionReturn(0);
2052e68589bSMark F. Adams }
2062e68589bSMark F. Adams 
2072e68589bSMark F. Adams /* -------------------------------------------------------------------------- */
2082e68589bSMark F. Adams /*
2092e68589bSMark F. Adams    PCDestroy_AGG
2102e68589bSMark F. Adams 
2112e68589bSMark F. Adams   Input Parameter:
2122e68589bSMark F. Adams    . pc -
2132e68589bSMark F. Adams */
2142e68589bSMark F. Adams #undef __FUNCT__
2152e68589bSMark F. Adams #define __FUNCT__ "PCDestroy_AGG"
2162e68589bSMark F. Adams PetscErrorCode PCDestroy_AGG( PC pc )
2172e68589bSMark F. Adams {
2182e68589bSMark F. Adams   PetscErrorCode  ierr;
2192e68589bSMark F. Adams   PC_MG           *mg = (PC_MG*)pc->data;
2202e68589bSMark F. Adams   PC_GAMG         *pc_gamg = (PC_GAMG*)mg->innerctx;
221c8b0795cSMark F. Adams   PC_GAMG_AGG      *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx;
2222e68589bSMark F. Adams 
2232e68589bSMark F. Adams   PetscFunctionBegin;
224c8b0795cSMark F. Adams   if( pc_gamg_agg ) {
225c8b0795cSMark F. Adams     ierr = PetscFree(pc_gamg_agg);CHKERRQ(ierr);
226c8b0795cSMark F. Adams     pc_gamg_agg = 0;
2272e68589bSMark F. Adams   }
2282e68589bSMark F. Adams 
2292e68589bSMark F. Adams   /* call base class */
2302e68589bSMark F. Adams   ierr = PCDestroy_GAMG( pc );CHKERRQ(ierr);
2312e68589bSMark F. Adams 
2322e68589bSMark F. Adams   PetscFunctionReturn(0);
2332e68589bSMark F. Adams }
2342e68589bSMark F. Adams 
2352e68589bSMark F. Adams /* -------------------------------------------------------------------------- */
2362e68589bSMark F. Adams /*
2372e68589bSMark F. Adams    PCSetCoordinates_AGG
238302f38e8SMark F. Adams      - collective
2392e68589bSMark F. Adams 
2402e68589bSMark F. Adams    Input Parameter:
2412e68589bSMark F. Adams    . pc - the preconditioner context
242*a2f3521dSMark F. Adams    . ndm - dimesion of data (used for dof/vertex for Stokes)
243302f38e8SMark F. Adams    . a_nloc - number of vertices local
244302f38e8SMark F. Adams    . coords - [a_nloc][ndm] - interleaved coordinate data: {x_0, y_0, z_0, x_1, y_1, ...}
2452e68589bSMark F. Adams */
2462e68589bSMark F. Adams EXTERN_C_BEGIN
2472e68589bSMark F. Adams #undef __FUNCT__
2482e68589bSMark F. Adams #define __FUNCT__ "PCSetCoordinates_AGG"
249302f38e8SMark F. Adams PetscErrorCode PCSetCoordinates_AGG( PC pc, PetscInt ndm, PetscInt a_nloc, PetscReal *coords )
2502e68589bSMark F. Adams {
2512e68589bSMark F. Adams   PC_MG          *mg = (PC_MG*)pc->data;
2522e68589bSMark F. Adams   PC_GAMG        *pc_gamg = (PC_GAMG*)mg->innerctx;
2532e68589bSMark F. Adams   PetscErrorCode ierr;
254*a2f3521dSMark F. Adams   PetscInt       arrsz,kk,ii,jj,nloc,ndatarows,bs;
255*a2f3521dSMark F. Adams   Mat            mat = pc->pmat;
256*a2f3521dSMark F. Adams   /* MPI_Comm       wcomm = ((PetscObject)pc)->comm; */
2572e68589bSMark F. Adams 
2582e68589bSMark F. Adams   PetscFunctionBegin;
259*a2f3521dSMark F. Adams   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
260*a2f3521dSMark F. Adams   PetscValidHeaderSpecific(mat,MAT_CLASSID,1);
261302f38e8SMark F. Adams   nloc = a_nloc;
2622e68589bSMark F. Adams 
2632e68589bSMark F. Adams   /* SA: null space vectors */
264*a2f3521dSMark F. Adams   ierr = MatGetBlockSize( mat, &bs ); CHKERRQ( ierr ); /* this does not work for Stokes */
265c8b0795cSMark F. Adams   if( coords && bs==1 ) pc_gamg->data_cell_cols = 1; /* scalar w/ coords and SA (not needed) */
266*a2f3521dSMark F. Adams   else if( coords ) {
267*a2f3521dSMark F. Adams     if(ndm > bs) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_LIB,"degrees of motion %d > block size %d",ndm,bs);
268*a2f3521dSMark F. Adams     pc_gamg->data_cell_cols = (ndm==2 ? (bs+1) : (bs+3)); /* elasticity */
269*a2f3521dSMark F. Adams   }
270c8b0795cSMark F. Adams   else pc_gamg->data_cell_cols = bs; /* no data, force SA with constant null space vectors */
271*a2f3521dSMark F. Adams   pc_gamg->data_cell_rows = ndatarows = bs;
272*a2f3521dSMark F. Adams   assert(pc_gamg->data_cell_cols>0);
273c8b0795cSMark F. Adams   arrsz = nloc*pc_gamg->data_cell_rows*pc_gamg->data_cell_cols;
2742e68589bSMark F. Adams 
2752e68589bSMark F. Adams   /* create data - syntactic sugar that should be refactored at some point */
2762e68589bSMark F. Adams   if (pc_gamg->data==0 || (pc_gamg->data_sz != arrsz)) {
2772e68589bSMark F. Adams     ierr = PetscFree( pc_gamg->data );  CHKERRQ(ierr);
278302f38e8SMark F. Adams     ierr = PetscMalloc((arrsz+1)*sizeof(PetscReal), &pc_gamg->data ); CHKERRQ(ierr);
279*a2f3521dSMark F. Adams     /* pc_gamg->data != null if nloc==0: flag for called */
2802e68589bSMark F. Adams   }
2812e68589bSMark F. Adams   /* copy data in - column oriented */
2822e68589bSMark F. Adams   for(kk=0;kk<nloc;kk++){
283302f38e8SMark F. Adams     const PetscInt M = nloc*pc_gamg->data_cell_rows;
284*a2f3521dSMark F. Adams     PetscReal *data = &pc_gamg->data[kk*ndatarows];
285c8b0795cSMark F. Adams     if( pc_gamg->data_cell_cols==1 ) *data = 1.0;
2862e68589bSMark F. Adams     else {
287*a2f3521dSMark F. Adams       for(ii=0;ii<ndatarows;ii++)
288*a2f3521dSMark F. Adams         for(jj=0;jj<ndatarows;jj++)
2892e68589bSMark F. Adams           if(ii==jj)data[ii*M + jj] = 1.0; /* translational modes */
2902e68589bSMark F. Adams           else data[ii*M + jj] = 0.0;
2912e68589bSMark F. Adams       if( coords ) {
2922e68589bSMark F. Adams         if( ndm == 2 ){ /* rotational modes */
2932e68589bSMark F. Adams           data += 2*M;
2942e68589bSMark F. Adams           data[0] = -coords[2*kk+1];
2952e68589bSMark F. Adams           data[1] =  coords[2*kk];
2962e68589bSMark F. Adams         }
2972e68589bSMark F. Adams         else {
2982e68589bSMark F. Adams           data += 3*M;
2992e68589bSMark F. Adams           data[0] = 0.0;             data[M+0] =  coords[3*kk+2]; data[2*M+0] = -coords[3*kk+1];
3002e68589bSMark F. Adams           data[1] = -coords[3*kk+2]; data[M+1] = 0.0;             data[2*M+1] =  coords[3*kk];
3012e68589bSMark F. Adams           data[2] =  coords[3*kk+1]; data[M+2] = -coords[3*kk];   data[2*M+2] = 0.0;
3022e68589bSMark F. Adams         }
3032e68589bSMark F. Adams       }
3042e68589bSMark F. Adams     }
3052e68589bSMark F. Adams   }
3062e68589bSMark F. Adams 
3072e68589bSMark F. Adams   pc_gamg->data_sz = arrsz;
3082e68589bSMark F. Adams 
3092e68589bSMark F. Adams   PetscFunctionReturn(0);
3102e68589bSMark F. Adams }
3112e68589bSMark F. Adams EXTERN_C_END
3122e68589bSMark F. Adams 
313b43b03e9SMark F. Adams typedef PetscInt NState;
314b43b03e9SMark F. Adams static const NState NOT_DONE=-2;
315b43b03e9SMark F. Adams static const NState DELETED=-1;
316b43b03e9SMark F. Adams static const NState REMOVED=-3;
317b43b03e9SMark F. Adams #define IS_SELECTED(s) (s!=DELETED && s!=NOT_DONE && s!=REMOVED)
318b43b03e9SMark F. Adams 
/* -------------------------------------------------------------------------- */
/*
   smoothAggs - greedy grab with G1 (unsquared graph) -- AIJ specific
     - AGG-MG specific: clears singletons out of 'selected_2'

   Input Parameter:
   . Gmat_2 - global matrix of graph (data not defined)
   . Gmat_1 - base graph to grab with
   Input/Output Parameter:
   . aggs_2 - linked list of aggs with gids
*/
330c8b0795cSMark F. Adams #undef __FUNCT__
331c8b0795cSMark F. Adams #define __FUNCT__ "smoothAggs"
3320cbbd2e1SMark F. Adams static PetscErrorCode smoothAggs( const Mat Gmat_2, /* base (squared) graph */
3330cbbd2e1SMark F. Adams                                   const Mat Gmat_1, /* base graph */
3340cbbd2e1SMark F. Adams                                   /* const IS selected_2, [nselected local] selected vertices */
3350cbbd2e1SMark F. Adams                                   PetscCoarsenData *aggs_2 /* [nselected local] global ID of aggregate */
336c8b0795cSMark F. Adams                                   )
337c8b0795cSMark F. Adams {
338c8b0795cSMark F. Adams   PetscErrorCode ierr;
339c8b0795cSMark F. Adams   PetscBool      isMPI;
340c8b0795cSMark F. Adams   Mat_SeqAIJ    *matA_1, *matB_1=0, *matA_2, *matB_2=0;
341c8b0795cSMark F. Adams   MPI_Comm       wcomm = ((PetscObject)Gmat_2)->comm;
3420cbbd2e1SMark F. Adams   PetscMPIInt    mype,npe;
3430cbbd2e1SMark F. Adams   PetscInt       lid,*ii,*idx,ix,Iend,my0,kk,n,j;
344c8b0795cSMark F. Adams   Mat_MPIAIJ    *mpimat_2 = 0, *mpimat_1=0;
345c8b0795cSMark F. Adams   const PetscInt nloc = Gmat_2->rmap->n;
3460cbbd2e1SMark F. Adams   PetscScalar   *cpcol_1_state,*cpcol_2_state,*cpcol_2_par_orig,*lid_parent_gid;
3470cbbd2e1SMark F. Adams   PetscInt      *lid_cprowID_1;
348c8b0795cSMark F. Adams   NState        *lid_state;
3490cbbd2e1SMark F. Adams   Vec            ghost_par_orig2;
350c8b0795cSMark F. Adams 
351c8b0795cSMark F. Adams   PetscFunctionBegin;
352c8b0795cSMark F. Adams   ierr = MPI_Comm_rank( wcomm, &mype );   CHKERRQ(ierr);
3530cbbd2e1SMark F. Adams   ierr = MPI_Comm_size( wcomm, &npe );   CHKERRQ(ierr);
354c8b0795cSMark F. Adams   ierr = MatGetOwnershipRange(Gmat_1,&my0,&Iend);  CHKERRQ(ierr);
355c8b0795cSMark F. Adams 
3560cbbd2e1SMark F. Adams   if( PETSC_FALSE ) {
357c8b0795cSMark F. Adams     PetscViewer viewer; char fname[32]; static int llev=0;
358c8b0795cSMark F. Adams     sprintf(fname,"Gmat2_%d.m",llev++);
359c8b0795cSMark F. Adams     PetscViewerASCIIOpen(wcomm,fname,&viewer);
360c8b0795cSMark F. Adams     ierr = PetscViewerSetFormat( viewer, PETSC_VIEWER_ASCII_MATLAB);  CHKERRQ(ierr);
361c8b0795cSMark F. Adams     ierr = MatView(Gmat_2, viewer ); CHKERRQ(ierr);
362c8b0795cSMark F. Adams     ierr = PetscViewerDestroy( &viewer );
363c8b0795cSMark F. Adams   }
364c8b0795cSMark F. Adams 
365c8b0795cSMark F. Adams   /* get submatrices */
366251f4c67SDmitry Karpeev   ierr = PetscObjectTypeCompare( (PetscObject)Gmat_1, MATMPIAIJ, &isMPI ); CHKERRQ(ierr);
367c8b0795cSMark F. Adams   if(isMPI) {
368c8b0795cSMark F. Adams     /* grab matrix objects */
369c8b0795cSMark F. Adams     mpimat_2 = (Mat_MPIAIJ*)Gmat_2->data;
370c8b0795cSMark F. Adams     mpimat_1 = (Mat_MPIAIJ*)Gmat_1->data;
371c8b0795cSMark F. Adams     matA_1 = (Mat_SeqAIJ*)mpimat_1->A->data;
372c8b0795cSMark F. Adams     matB_1 = (Mat_SeqAIJ*)mpimat_1->B->data;
373c8b0795cSMark F. Adams     matA_2 = (Mat_SeqAIJ*)mpimat_2->A->data;
374c8b0795cSMark F. Adams     matB_2 = (Mat_SeqAIJ*)mpimat_2->B->data;
375c8b0795cSMark F. Adams 
376c8b0795cSMark F. Adams     /* force compressed row storage for B matrix in AuxMat */
377c8b0795cSMark F. Adams     matB_1->compressedrow.check = PETSC_TRUE;
378c8b0795cSMark F. Adams     ierr = MatCheckCompressedRow(mpimat_1->B,&matB_1->compressedrow,matB_1->i,Gmat_1->rmap->n,-1.0);
379c8b0795cSMark F. Adams     CHKERRQ(ierr);
380c8b0795cSMark F. Adams 
381c8b0795cSMark F. Adams     ierr = PetscMalloc( nloc*sizeof(PetscInt), &lid_cprowID_1 ); CHKERRQ(ierr);
3820cbbd2e1SMark F. Adams     for( lid = 0 ; lid < nloc ; lid++ ) lid_cprowID_1[lid] = -1;
383c8b0795cSMark F. Adams     for (ix=0; ix<matB_1->compressedrow.nrows; ix++) {
384c8b0795cSMark F. Adams       PetscInt lid = matB_1->compressedrow.rindex[ix];
385c8b0795cSMark F. Adams       lid_cprowID_1[lid] = ix;
386c8b0795cSMark F. Adams     }
387c8b0795cSMark F. Adams   }
388c8b0795cSMark F. Adams   else {
389c8b0795cSMark F. Adams     matA_1 = (Mat_SeqAIJ*)Gmat_1->data;
390c8b0795cSMark F. Adams     matA_2 = (Mat_SeqAIJ*)Gmat_2->data;
3910cbbd2e1SMark F. Adams     lid_cprowID_1 = PETSC_NULL;
392c8b0795cSMark F. Adams   }
393c8b0795cSMark F. Adams   assert( matA_1 && !matA_1->compressedrow.use );
394c8b0795cSMark F. Adams   assert( matB_1==0 || matB_1->compressedrow.use );
395c8b0795cSMark F. Adams   assert( matA_2 && !matA_2->compressedrow.use );
396c8b0795cSMark F. Adams   assert( matB_2==0 || matB_2->compressedrow.use );
397c8b0795cSMark F. Adams 
398c8b0795cSMark F. Adams   /* get state of locals and selected gid for deleted */
399c8b0795cSMark F. Adams   ierr = PetscMalloc( nloc*sizeof(NState), &lid_state ); CHKERRQ(ierr);
4000cbbd2e1SMark F. Adams   ierr = PetscMalloc( nloc*sizeof(PetscScalar), &lid_parent_gid ); CHKERRQ(ierr);
401c8b0795cSMark F. Adams   for( lid = 0 ; lid < nloc ; lid++ ) {
4020cbbd2e1SMark F. Adams     lid_parent_gid[lid] = -1.0;
403c8b0795cSMark F. Adams     lid_state[lid] = DELETED;
404c8b0795cSMark F. Adams   }
4050cbbd2e1SMark F. Adams 
4060cbbd2e1SMark F. Adams   /* set lid_state */
4070cbbd2e1SMark F. Adams   for( lid = 0 ; lid < nloc ; lid++ ) {
40841b27cdeSMark F. Adams     PetscCDPos pos;
409e78576d6SMark F. Adams     ierr = PetscCDGetHeadPos(aggs_2,lid,&pos); CHKERRQ(ierr);
410e78576d6SMark F. Adams     if( pos ) {
411e78576d6SMark F. Adams       PetscInt gid1;
412ffc955d6SMark F. Adams       ierr = PetscLLNGetID( pos, &gid1 ); CHKERRQ(ierr); assert(gid1==lid+my0);
4130cbbd2e1SMark F. Adams       lid_state[lid] = gid1;
414b43b03e9SMark F. Adams     }
415b43b03e9SMark F. Adams   }
4160cbbd2e1SMark F. Adams 
4170cbbd2e1SMark F. Adams   /* map local to selected local, DELETED means a ghost owns it */
418c8b0795cSMark F. Adams   for(lid=kk=0;lid<nloc;lid++){
419c8b0795cSMark F. Adams     NState state = lid_state[lid];
420c8b0795cSMark F. Adams     if( IS_SELECTED(state) ){
42141b27cdeSMark F. Adams       PetscCDPos pos;
422e78576d6SMark F. Adams       ierr = PetscCDGetHeadPos(aggs_2,lid,&pos); CHKERRQ(ierr);
423e78576d6SMark F. Adams       while(pos){
424e78576d6SMark F. Adams         PetscInt gid1;
425ffc955d6SMark F. Adams         ierr = PetscLLNGetID( pos, &gid1 ); CHKERRQ(ierr);
426e78576d6SMark F. Adams         ierr = PetscCDGetNextPos(aggs_2,lid,&pos); CHKERRQ(ierr);
427e78576d6SMark F. Adams 
4280cbbd2e1SMark F. Adams         if( gid1 >= my0 && gid1 < Iend ){
4290cbbd2e1SMark F. Adams           lid_parent_gid[gid1-my0] = (PetscScalar)(lid + my0);
430c8b0795cSMark F. Adams         }
431c8b0795cSMark F. Adams       }
4320cbbd2e1SMark F. Adams     }
4330cbbd2e1SMark F. Adams   }
4340cbbd2e1SMark F. Adams   /* get 'cpcol_1/2_state' & cpcol_2_par_orig - uses mpimat_1/2->lvec for temp space */
435c8b0795cSMark F. Adams   if (isMPI) {
436c8b0795cSMark F. Adams     Vec          tempVec;
437c8b0795cSMark F. Adams     /* get 'cpcol_1_state' */
438c8b0795cSMark F. Adams     ierr = MatGetVecs( Gmat_1, &tempVec, 0 );         CHKERRQ(ierr);
439c8b0795cSMark F. Adams     for(kk=0,j=my0;kk<nloc;kk++,j++){
440c8b0795cSMark F. Adams       PetscScalar v = (PetscScalar)lid_state[kk];
441c8b0795cSMark F. Adams       ierr = VecSetValues( tempVec, 1, &j, &v, INSERT_VALUES );  CHKERRQ(ierr);
442c8b0795cSMark F. Adams     }
443c8b0795cSMark F. Adams     ierr = VecAssemblyBegin( tempVec ); CHKERRQ(ierr);
444c8b0795cSMark F. Adams     ierr = VecAssemblyEnd( tempVec ); CHKERRQ(ierr);
445c8b0795cSMark F. Adams     ierr = VecScatterBegin(mpimat_1->Mvctx,tempVec, mpimat_1->lvec,INSERT_VALUES,SCATTER_FORWARD);
446c8b0795cSMark F. Adams     CHKERRQ(ierr);
447c8b0795cSMark F. Adams     ierr =   VecScatterEnd(mpimat_1->Mvctx,tempVec, mpimat_1->lvec,INSERT_VALUES,SCATTER_FORWARD);
448c8b0795cSMark F. Adams     CHKERRQ(ierr);
449c8b0795cSMark F. Adams     ierr = VecGetArray( mpimat_1->lvec, &cpcol_1_state ); CHKERRQ(ierr);
450c8b0795cSMark F. Adams     /* get 'cpcol_2_state' */
451c8b0795cSMark F. Adams     ierr = VecScatterBegin(mpimat_2->Mvctx,tempVec, mpimat_2->lvec,INSERT_VALUES,SCATTER_FORWARD);
452c8b0795cSMark F. Adams     CHKERRQ(ierr);
453c8b0795cSMark F. Adams     ierr =   VecScatterEnd(mpimat_2->Mvctx,tempVec, mpimat_2->lvec,INSERT_VALUES,SCATTER_FORWARD);
454c8b0795cSMark F. Adams     CHKERRQ(ierr);
455c8b0795cSMark F. Adams     ierr = VecGetArray( mpimat_2->lvec, &cpcol_2_state ); CHKERRQ(ierr);
4560cbbd2e1SMark F. Adams     /* get 'cpcol_2_par_orig' */
4570cbbd2e1SMark F. Adams     for(kk=0,j=my0;kk<nloc;kk++,j++){
4580cbbd2e1SMark F. Adams       PetscScalar v = (PetscScalar)lid_parent_gid[kk];
4590cbbd2e1SMark F. Adams       ierr = VecSetValues( tempVec, 1, &j, &v, INSERT_VALUES );  CHKERRQ(ierr);
4600cbbd2e1SMark F. Adams     }
4610cbbd2e1SMark F. Adams     ierr = VecAssemblyBegin( tempVec ); CHKERRQ(ierr);
4620cbbd2e1SMark F. Adams     ierr = VecAssemblyEnd( tempVec ); CHKERRQ(ierr);
4630cbbd2e1SMark F. Adams     ierr = VecDuplicate( mpimat_2->lvec, &ghost_par_orig2 ); CHKERRQ(ierr);
4640cbbd2e1SMark F. Adams     ierr = VecScatterBegin(mpimat_2->Mvctx,tempVec, ghost_par_orig2,INSERT_VALUES,SCATTER_FORWARD);
4650cbbd2e1SMark F. Adams     CHKERRQ(ierr);
4660cbbd2e1SMark F. Adams     ierr =   VecScatterEnd(mpimat_2->Mvctx,tempVec, ghost_par_orig2,INSERT_VALUES,SCATTER_FORWARD);
4670cbbd2e1SMark F. Adams     CHKERRQ(ierr);
4680cbbd2e1SMark F. Adams     ierr = VecGetArray( ghost_par_orig2, &cpcol_2_par_orig ); CHKERRQ(ierr);
4690cbbd2e1SMark F. Adams 
470c8b0795cSMark F. Adams     ierr = VecDestroy( &tempVec ); CHKERRQ(ierr);
471c8b0795cSMark F. Adams   } /* ismpi */
472c8b0795cSMark F. Adams 
473c8b0795cSMark F. Adams   /* doit */
474c8b0795cSMark F. Adams   for(lid=0;lid<nloc;lid++){
475c8b0795cSMark F. Adams     NState state = lid_state[lid];
4760cbbd2e1SMark F. Adams     if( IS_SELECTED(state) ) {
4770cbbd2e1SMark F. Adams       /* steal locals */
478c8b0795cSMark F. Adams       ii = matA_1->i; n = ii[lid+1] - ii[lid];
479c8b0795cSMark F. Adams       idx = matA_1->j + ii[lid];
480c8b0795cSMark F. Adams       for (j=0; j<n; j++) {
4810cbbd2e1SMark F. Adams         PetscInt lidj = idx[j], sgid;
482c8b0795cSMark F. Adams         NState statej = lid_state[lidj];
4830cbbd2e1SMark F. Adams         if (statej==DELETED && (sgid=(PetscInt)PetscRealPart(lid_parent_gid[lidj])) != lid+my0) { /* steal local */
4840cbbd2e1SMark F. Adams           lid_parent_gid[lidj] = (PetscScalar)(lid+my0); /* send this if sgid is not local */
4850cbbd2e1SMark F. Adams           if( sgid >= my0 && sgid < Iend ){       /* I'm stealing this local from a local sgid */
4860cbbd2e1SMark F. Adams             PetscInt hav=0,slid=sgid-my0,gidj=lidj+my0;
48741b27cdeSMark F. Adams             PetscCDPos pos,last=PETSC_NULL;
488c8b0795cSMark F. Adams             /* looking for local from local so id_llist_2 works */
489e78576d6SMark F. Adams             ierr = PetscCDGetHeadPos(aggs_2,slid,&pos); CHKERRQ(ierr);
490e78576d6SMark F. Adams             while(pos){
491e78576d6SMark F. Adams               PetscInt gid;
492ffc955d6SMark F. Adams               ierr = PetscLLNGetID( pos, &gid ); CHKERRQ(ierr);
4930cbbd2e1SMark F. Adams               if( gid == gidj ) {
4940cbbd2e1SMark F. Adams                 assert(last);
49541b27cdeSMark F. Adams                 ierr = PetscCDRemoveNextNode( aggs_2, slid, last ); CHKERRQ(ierr);
49641b27cdeSMark F. Adams                 ierr = PetscCDAppendNode( aggs_2, lid, pos );       CHKERRQ(ierr);
4970cbbd2e1SMark F. Adams                 hav = 1;
498c8b0795cSMark F. Adams                 break;
499c8b0795cSMark F. Adams               }
5000cbbd2e1SMark F. Adams               else last = pos;
501e78576d6SMark F. Adams 
502e78576d6SMark F. Adams               ierr = PetscCDGetNextPos(aggs_2,slid,&pos); CHKERRQ(ierr);
503c8b0795cSMark F. Adams             }
504c8b0795cSMark F. Adams             if(hav!=1){
505c8b0795cSMark F. Adams               if(hav==0)SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"failed to find adj in 'selected' lists - structurally unsymmetric matrix");
506c8b0795cSMark F. Adams               SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"found node %d times???",hav);
507c8b0795cSMark F. Adams             }
508c8b0795cSMark F. Adams           }
5090cbbd2e1SMark F. Adams           else{            /* I'm stealing this local, owned by a ghost */
510c8b0795cSMark F. Adams             assert(sgid==-1);
51141b27cdeSMark F. Adams             ierr = PetscCDAppendID( aggs_2, lid, lidj+my0 );      CHKERRQ(ierr);
512c8b0795cSMark F. Adams           }
513c8b0795cSMark F. Adams         }
5140cbbd2e1SMark F. Adams       } /* local neighbors */
515c8b0795cSMark F. Adams     }
516c8b0795cSMark F. Adams     else if( state == DELETED && lid_cprowID_1 ) {
5170cbbd2e1SMark F. Adams       PetscInt sgidold = (PetscInt)PetscRealPart(lid_parent_gid[lid]);
518c8b0795cSMark F. Adams       /* see if I have a selected ghost neighbor that will steal me */
519c8b0795cSMark F. Adams       if( (ix=lid_cprowID_1[lid]) != -1 ){
520c8b0795cSMark F. Adams         ii = matB_1->compressedrow.i; n = ii[ix+1] - ii[ix];
521c8b0795cSMark F. Adams         idx = matB_1->j + ii[ix];
522c8b0795cSMark F. Adams         for( j=0 ; j<n ; j++ ) {
523c8b0795cSMark F. Adams           PetscInt cpid = idx[j];
524c8b0795cSMark F. Adams           NState statej = (NState)PetscRealPart(cpcol_1_state[cpid]);
525c8b0795cSMark F. Adams           if( IS_SELECTED(statej) && sgidold != (PetscInt)statej ) { /* ghost will steal this, remove from my list */
5260cbbd2e1SMark F. Adams             lid_parent_gid[lid] = (PetscScalar)statej; /* send who selected */
5270cbbd2e1SMark F. Adams             if( sgidold>=my0 && sgidold<Iend ) { /* this was mine */
5280cbbd2e1SMark F. Adams               PetscInt hav=0,oldslidj=sgidold-my0;
52941b27cdeSMark F. Adams               PetscCDPos pos,last=PETSC_NULL;
5300cbbd2e1SMark F. Adams               /* remove from 'oldslidj' list */
531e78576d6SMark F. Adams               ierr = PetscCDGetHeadPos(aggs_2,oldslidj,&pos); CHKERRQ(ierr);
532e78576d6SMark F. Adams               while( pos ) {
533e78576d6SMark F. Adams                 PetscInt gid;
534ffc955d6SMark F. Adams                 ierr = PetscLLNGetID( pos, &gid ); CHKERRQ(ierr);
5350cbbd2e1SMark F. Adams                 if( lid+my0 == gid ) {
5360cbbd2e1SMark F. Adams                   /* id_llist_2[lastid] = id_llist_2[flid];   /\* remove lid from oldslidj list *\/ */
5370cbbd2e1SMark F. Adams                   assert(last);
53841b27cdeSMark F. Adams                   ierr = PetscCDRemoveNextNode( aggs_2, oldslidj, last ); CHKERRQ(ierr);
5390cbbd2e1SMark F. Adams                   /* ghost (PetscScalar)statej will add this later */
5400cbbd2e1SMark F. Adams                   hav = 1;
541c8b0795cSMark F. Adams                   break;
542c8b0795cSMark F. Adams                 }
5430cbbd2e1SMark F. Adams                 else last = pos;
544e78576d6SMark F. Adams 
545e78576d6SMark F. Adams                 ierr = PetscCDGetNextPos(aggs_2,oldslidj,&pos); CHKERRQ(ierr);
546c8b0795cSMark F. Adams               }
547c8b0795cSMark F. Adams               if(hav!=1){
548c8b0795cSMark F. Adams                 if(hav==0)SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"failed to find adj in 'selected' lists - structurally unsymmetric matrix");
549c8b0795cSMark F. Adams                 SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"found node %d times???",hav);
550c8b0795cSMark F. Adams               }
551c8b0795cSMark F. Adams             }
5520cbbd2e1SMark F. Adams             else {
5530cbbd2e1SMark F. Adams               /* ghosts remove this later */
5540cbbd2e1SMark F. Adams             }
555c8b0795cSMark F. Adams           }
556c8b0795cSMark F. Adams         }
557c8b0795cSMark F. Adams       }
558c8b0795cSMark F. Adams     } /* selected/deleted */
559c8b0795cSMark F. Adams   } /* node loop */
560c8b0795cSMark F. Adams 
561c8b0795cSMark F. Adams   if( isMPI ) {
5620cbbd2e1SMark F. Adams     PetscScalar *cpcol_2_parent,*cpcol_2_gid;
5630cbbd2e1SMark F. Adams     Vec          tempVec,ghostgids2,ghostparents2;
5640cbbd2e1SMark F. Adams     PetscInt     cpid,nghost_2;
5650cbbd2e1SMark F. Adams     GAMGHashTable gid_cpid;
566c8b0795cSMark F. Adams 
5670cbbd2e1SMark F. Adams     ierr = VecGetSize( mpimat_2->lvec, &nghost_2 );   CHKERRQ(ierr);
568c8b0795cSMark F. Adams     ierr = MatGetVecs( Gmat_2, &tempVec, 0 );         CHKERRQ(ierr);
5690cbbd2e1SMark F. Adams 
5700cbbd2e1SMark F. Adams     /* get 'cpcol_2_parent' */
571c8b0795cSMark F. Adams     for(kk=0,j=my0;kk<nloc;kk++,j++){
5720cbbd2e1SMark F. Adams       ierr = VecSetValues( tempVec, 1, &j, &lid_parent_gid[kk], INSERT_VALUES );  CHKERRQ(ierr);
573c8b0795cSMark F. Adams     }
574c8b0795cSMark F. Adams     ierr = VecAssemblyBegin( tempVec ); CHKERRQ(ierr);
575c8b0795cSMark F. Adams     ierr = VecAssemblyEnd( tempVec ); CHKERRQ(ierr);
5760cbbd2e1SMark F. Adams     ierr = VecDuplicate( mpimat_2->lvec, &ghostparents2 ); CHKERRQ(ierr);
5770cbbd2e1SMark F. Adams     ierr = VecScatterBegin(mpimat_2->Mvctx,tempVec, ghostparents2,INSERT_VALUES,SCATTER_FORWARD);
578c8b0795cSMark F. Adams     CHKERRQ(ierr);
5790cbbd2e1SMark F. Adams     ierr =   VecScatterEnd(mpimat_2->Mvctx,tempVec, ghostparents2,INSERT_VALUES,SCATTER_FORWARD);
580c8b0795cSMark F. Adams     CHKERRQ(ierr);
5810cbbd2e1SMark F. Adams     ierr = VecGetArray( ghostparents2, &cpcol_2_parent ); CHKERRQ(ierr);
5820cbbd2e1SMark F. Adams 
5830cbbd2e1SMark F. Adams     /* get 'cpcol_2_gid' */
5840cbbd2e1SMark F. Adams     for(kk=0,j=my0;kk<nloc;kk++,j++){
5850cbbd2e1SMark F. Adams       PetscScalar v = (PetscScalar)j;
5860cbbd2e1SMark F. Adams       ierr = VecSetValues( tempVec, 1, &j, &v, INSERT_VALUES );  CHKERRQ(ierr);
5870cbbd2e1SMark F. Adams     }
5880cbbd2e1SMark F. Adams     ierr = VecAssemblyBegin( tempVec ); CHKERRQ(ierr);
5890cbbd2e1SMark F. Adams     ierr = VecAssemblyEnd( tempVec ); CHKERRQ(ierr);
5900cbbd2e1SMark F. Adams     ierr = VecDuplicate( mpimat_2->lvec, &ghostgids2 ); CHKERRQ(ierr);
5910cbbd2e1SMark F. Adams     ierr = VecScatterBegin(mpimat_2->Mvctx,tempVec, ghostgids2,INSERT_VALUES,SCATTER_FORWARD);
5920cbbd2e1SMark F. Adams     CHKERRQ(ierr);
5930cbbd2e1SMark F. Adams     ierr =   VecScatterEnd(mpimat_2->Mvctx,tempVec, ghostgids2,INSERT_VALUES,SCATTER_FORWARD);
5940cbbd2e1SMark F. Adams     CHKERRQ(ierr);
5950cbbd2e1SMark F. Adams     ierr = VecGetArray( ghostgids2, &cpcol_2_gid ); CHKERRQ(ierr);
5960cbbd2e1SMark F. Adams 
597c8b0795cSMark F. Adams     ierr = VecDestroy( &tempVec ); CHKERRQ(ierr);
598c8b0795cSMark F. Adams 
5990cbbd2e1SMark F. Adams     /* look for deleted ghosts and add to table */
6000cbbd2e1SMark F. Adams     ierr = GAMGTableCreate( 2*nghost_2, &gid_cpid ); CHKERRQ(ierr);
6010cbbd2e1SMark F. Adams     for( cpid = 0 ; cpid < nghost_2 ; cpid++ ) {
6020cbbd2e1SMark F. Adams       NState state = (NState)PetscRealPart(cpcol_2_state[cpid]);
6030cbbd2e1SMark F. Adams       if( state==DELETED ) {
6040cbbd2e1SMark F. Adams         PetscInt sgid_new = (PetscInt)PetscRealPart(cpcol_2_parent[cpid]);
6050cbbd2e1SMark F. Adams         PetscInt sgid_old = (PetscInt)PetscRealPart(cpcol_2_par_orig[cpid]);
6060cbbd2e1SMark F. Adams         if( sgid_old == -1 && sgid_new != -1 ) {
6070cbbd2e1SMark F. Adams           PetscInt gid = (PetscInt)PetscRealPart(cpcol_2_gid[cpid]);
6080cbbd2e1SMark F. Adams           ierr = GAMGTableAdd( &gid_cpid, gid, cpid ); CHKERRQ(ierr);
6090cbbd2e1SMark F. Adams         }
6100cbbd2e1SMark F. Adams       }
6110cbbd2e1SMark F. Adams     }
612c8b0795cSMark F. Adams 
6130cbbd2e1SMark F. Adams     /* look for deleted ghosts and see if they moved - remove it */
614c8b0795cSMark F. Adams     for(lid=0;lid<nloc;lid++){
615c8b0795cSMark F. Adams       NState state = lid_state[lid];
616c8b0795cSMark F. Adams       if( IS_SELECTED(state) ){
61741b27cdeSMark F. Adams         PetscCDPos pos,last=PETSC_NULL;
618c8b0795cSMark F. Adams         /* look for deleted ghosts and see if they moved */
619e78576d6SMark F. Adams         ierr = PetscCDGetHeadPos(aggs_2,lid,&pos); CHKERRQ(ierr);
620e78576d6SMark F. Adams         while(pos){
621e78576d6SMark F. Adams           PetscInt gid;
622ffc955d6SMark F. Adams           ierr = PetscLLNGetID( pos, &gid ); CHKERRQ(ierr);
623e78576d6SMark F. Adams 
6240cbbd2e1SMark F. Adams           if( gid < my0 || gid >= Iend ) {
6250cbbd2e1SMark F. Adams             ierr = GAMGTableFind( &gid_cpid, gid, &cpid ); CHKERRQ(ierr);
6260cbbd2e1SMark F. Adams             if( cpid != -1 ) {
6270cbbd2e1SMark F. Adams               /* a moved ghost - */
6280cbbd2e1SMark F. Adams               /* id_llist_2[lastid] = id_llist_2[flid];    /\* remove 'flid' from list *\/ */
62941b27cdeSMark F. Adams               ierr = PetscCDRemoveNextNode( aggs_2, lid, last ); CHKERRQ(ierr);
6300cbbd2e1SMark F. Adams             }
6310cbbd2e1SMark F. Adams             else last = pos;
6320cbbd2e1SMark F. Adams           }
6330cbbd2e1SMark F. Adams           else last = pos;
634e78576d6SMark F. Adams 
635e78576d6SMark F. Adams           ierr = PetscCDGetNextPos(aggs_2,lid,&pos); CHKERRQ(ierr);
636c8b0795cSMark F. Adams         } /* loop over list of deleted */
637c8b0795cSMark F. Adams       } /* selected */
638c8b0795cSMark F. Adams     }
6390cbbd2e1SMark F. Adams     ierr = GAMGTableDestroy( &gid_cpid ); CHKERRQ(ierr);
640c8b0795cSMark F. Adams 
6410cbbd2e1SMark F. Adams     /* look at ghosts, see if they changed - and it */
6420cbbd2e1SMark F. Adams     for( cpid = 0 ; cpid < nghost_2 ; cpid++ ){
6430cbbd2e1SMark F. Adams       PetscInt sgid_new = (PetscInt)PetscRealPart(cpcol_2_parent[cpid]);
6440cbbd2e1SMark F. Adams       if( sgid_new >= my0 && sgid_new < Iend ) { /* this is mine */
6450cbbd2e1SMark F. Adams         PetscInt gid = (PetscInt)PetscRealPart(cpcol_2_gid[cpid]);
6460cbbd2e1SMark F. Adams         PetscInt slid_new=sgid_new-my0,hav=0;
64741b27cdeSMark F. Adams         PetscCDPos pos;
6480cbbd2e1SMark F. Adams         /* search for this gid to see if I have it */
649e78576d6SMark F. Adams         ierr = PetscCDGetHeadPos(aggs_2,slid_new,&pos); CHKERRQ(ierr);
650e78576d6SMark F. Adams         while(pos){
651e78576d6SMark F. Adams           PetscInt gidj;
652ffc955d6SMark F. Adams           ierr = PetscLLNGetID( pos, &gidj ); CHKERRQ(ierr);
653e78576d6SMark F. Adams           ierr = PetscCDGetNextPos(aggs_2,slid_new,&pos); CHKERRQ(ierr);
654e78576d6SMark F. Adams 
6550cbbd2e1SMark F. Adams           if( gidj == gid ) { hav = 1; break; }
656c8b0795cSMark F. Adams         }
657c8b0795cSMark F. Adams         if( hav != 1 ){
658ffc955d6SMark F. Adams           /* insert 'flidj' into head of llist */
65941b27cdeSMark F. Adams           ierr = PetscCDAppendID( aggs_2, slid_new, gid );      CHKERRQ(ierr);
660c8b0795cSMark F. Adams         }
661c8b0795cSMark F. Adams       }
662c8b0795cSMark F. Adams     }
663c8b0795cSMark F. Adams 
6640cbbd2e1SMark F. Adams     ierr = VecRestoreArray( mpimat_1->lvec, &cpcol_1_state ); CHKERRQ(ierr);
6650cbbd2e1SMark F. Adams     ierr = VecRestoreArray( mpimat_2->lvec, &cpcol_2_state ); CHKERRQ(ierr);
6660cbbd2e1SMark F. Adams     ierr = VecRestoreArray( ghostparents2, &cpcol_2_parent ); CHKERRQ(ierr);
6670cbbd2e1SMark F. Adams     ierr = VecRestoreArray( ghostgids2, &cpcol_2_gid ); CHKERRQ(ierr);
668c8b0795cSMark F. Adams     ierr = PetscFree( lid_cprowID_1 );  CHKERRQ(ierr);
6690cbbd2e1SMark F. Adams     ierr = VecDestroy( &ghostgids2 ); CHKERRQ(ierr);
6700cbbd2e1SMark F. Adams     ierr = VecDestroy( &ghostparents2 ); CHKERRQ(ierr);
6710cbbd2e1SMark F. Adams     ierr = VecDestroy( &ghost_par_orig2 ); CHKERRQ(ierr);
672c8b0795cSMark F. Adams   }
673c8b0795cSMark F. Adams 
6740cbbd2e1SMark F. Adams   ierr = PetscFree( lid_parent_gid );  CHKERRQ(ierr);
675c8b0795cSMark F. Adams   ierr = PetscFree( lid_state );  CHKERRQ(ierr);
676c8b0795cSMark F. Adams 
677c8b0795cSMark F. Adams   PetscFunctionReturn(0);
678c8b0795cSMark F. Adams }
6792e68589bSMark F. Adams 
6802e68589bSMark F. Adams /* -------------------------------------------------------------------------- */
6812e68589bSMark F. Adams /*
682*a2f3521dSMark F. Adams    PCSetData_AGG - called if data is not set with PCSetCoordinates.
683*a2f3521dSMark F. Adams       Looks in Mat for near null space.
684*a2f3521dSMark F. Adams       Does not work for Stokes
6852e68589bSMark F. Adams 
6862e68589bSMark F. Adams   Input Parameter:
6872e68589bSMark F. Adams    . pc -
688*a2f3521dSMark F. Adams    . a_A - matrix to get (near) null space out of.
6892e68589bSMark F. Adams */
6902e68589bSMark F. Adams #undef __FUNCT__
6912e68589bSMark F. Adams #define __FUNCT__ "PCSetData_AGG"
692b8cd405aSMark F. Adams PetscErrorCode PCSetData_AGG( PC pc, Mat a_A )
6932e68589bSMark F. Adams {
6942e68589bSMark F. Adams   PetscErrorCode  ierr;
695b8cd405aSMark F. Adams   PC_MG          *mg = (PC_MG*)pc->data;
696b8cd405aSMark F. Adams   PC_GAMG        *pc_gamg = (PC_GAMG*)mg->innerctx;
697b8cd405aSMark F. Adams   MatNullSpace mnull;
698b8cd405aSMark F. Adams 
6992e68589bSMark F. Adams   PetscFunctionBegin;
700b8cd405aSMark F. Adams   ierr = MatGetNearNullSpace( a_A, &mnull ); CHKERRQ(ierr);
701b8cd405aSMark F. Adams   if( !mnull ) {
702*a2f3521dSMark F. Adams     PetscInt bs,NN,MM;
703*a2f3521dSMark F. Adams     ierr = MatGetBlockSize( a_A, &bs ); CHKERRQ( ierr ); /* this does not work for Stokes */
704*a2f3521dSMark F. Adams     ierr = MatGetLocalSize( a_A, &MM, &NN ); CHKERRQ( ierr );
705*a2f3521dSMark F. Adams     /* this does not work for Stokes */
706*a2f3521dSMark F. Adams     ierr = PCSetCoordinates_AGG( pc, bs, MM/bs, PETSC_NULL ); CHKERRQ(ierr);
707b8cd405aSMark F. Adams   }
708b8cd405aSMark F. Adams   else {
709b8cd405aSMark F. Adams     PetscReal *nullvec;
710b8cd405aSMark F. Adams     PetscBool has_const;
711b8cd405aSMark F. Adams     PetscInt i,j,mlocal,nvec,bs;
712b8cd405aSMark F. Adams     const Vec *vecs; const PetscScalar *v;
713b8cd405aSMark F. Adams     ierr = MatGetLocalSize(a_A,&mlocal,PETSC_NULL);CHKERRQ(ierr);
714b8cd405aSMark F. Adams     ierr = MatNullSpaceGetVecs( mnull, &has_const, &nvec, &vecs ); CHKERRQ(ierr);
715b8cd405aSMark F. Adams     ierr = PetscMalloc((nvec+!!has_const)*mlocal*sizeof *nullvec,&nullvec);CHKERRQ(ierr);
716b8cd405aSMark F. Adams     if (has_const) for (i=0; i<mlocal; i++) nullvec[i] = 1.0;
717b8cd405aSMark F. Adams     for (i=0; i<nvec; i++) {
718b8cd405aSMark F. Adams       ierr = VecGetArrayRead(vecs[i],&v);CHKERRQ(ierr);
719b8cd405aSMark F. Adams       for (j=0; j<mlocal; j++) nullvec[(i+!!has_const)*mlocal + j] = PetscRealPart(v[j]);
720b8cd405aSMark F. Adams       ierr = VecRestoreArrayRead(vecs[i],&v);CHKERRQ(ierr);
721b8cd405aSMark F. Adams     }
722b8cd405aSMark F. Adams     pc_gamg->data = nullvec;
723b8cd405aSMark F. Adams     pc_gamg->data_cell_cols = (nvec+!!has_const);
724*a2f3521dSMark F. Adams     ierr = MatGetBlockSize( a_A, &bs ); CHKERRQ( ierr ); /* this does not work for Stokes */
725b8cd405aSMark F. Adams     pc_gamg->data_cell_rows = bs;
726b8cd405aSMark F. Adams   }
7272e68589bSMark F. Adams   PetscFunctionReturn(0);
7282e68589bSMark F. Adams }
7292e68589bSMark F. Adams 
7302e68589bSMark F. Adams /* -------------------------------------------------------------------------- */
7312e68589bSMark F. Adams /*
7322e68589bSMark F. Adams  formProl0
7332e68589bSMark F. Adams 
7342e68589bSMark F. Adams    Input Parameter:
7350cbbd2e1SMark F. Adams    . agg_llists - list of arrays with aggregates
7362e68589bSMark F. Adams    . bs - block size
7370cbbd2e1SMark F. Adams    . nSAvec - column bs of new P
7380cbbd2e1SMark F. Adams    . my0crs - global index of start of locals
7392e68589bSMark F. Adams    . data_stride - bs*(nloc nodes + ghost nodes)
7402e68589bSMark F. Adams    . data_in[data_stride*nSAvec] - local data on fine grid
7412e68589bSMark F. Adams    . flid_fgid[data_stride/bs] - make local to global IDs, includes ghosts in 'locals_llist'
7422e68589bSMark F. Adams   Output Parameter:
7432e68589bSMark F. Adams    . a_data_out - in with fine grid data (w/ghosts), out with coarse grid data
7442e68589bSMark F. Adams    . a_Prol - prolongation operator
7452e68589bSMark F. Adams */
7462e68589bSMark F. Adams #undef __FUNCT__
7472e68589bSMark F. Adams #define __FUNCT__ "formProl0"
7480cbbd2e1SMark F. Adams static PetscErrorCode formProl0(const PetscCoarsenData *agg_llists,/* list from selected vertices of aggregate unselected vertices */
7490cbbd2e1SMark F. Adams                                 const PetscInt bs,          /* (row) block size */
7500cbbd2e1SMark F. Adams                                 const PetscInt nSAvec,      /* column bs */
7510cbbd2e1SMark F. Adams                                 const PetscInt my0crs,      /* global index of start of locals */
7520cbbd2e1SMark F. Adams                                 const PetscInt data_stride, /* (nloc+nghost)*bs */
7530cbbd2e1SMark F. Adams                                 PetscReal      data_in[],   /* [data_stride][nSAvec] */
7540cbbd2e1SMark F. Adams                                 const PetscInt flid_fgid[], /* [data_stride/bs] */
7552e68589bSMark F. Adams                                 PetscReal **a_data_out,
7562e68589bSMark F. Adams                                 Mat a_Prol /* prolongation operator (output)*/
7572e68589bSMark F. Adams                                 )
7582e68589bSMark F. Adams {
7592e68589bSMark F. Adams   PetscErrorCode ierr;
7600cbbd2e1SMark F. Adams   PetscInt  Istart,my0,Iend,nloc,clid,flid,aggID,kk,jj,ii,mm,ndone,nSelected,minsz,nghosts,out_data_stride;
7612e68589bSMark F. Adams   MPI_Comm       wcomm = ((PetscObject)a_Prol)->comm;
7622e68589bSMark F. Adams   PetscMPIInt    mype, npe;
7632e68589bSMark F. Adams   PetscReal      *out_data;
76441b27cdeSMark F. Adams   PetscCDPos         pos;
7650cbbd2e1SMark F. Adams   GAMGHashTable  fgid_flid;
7660cbbd2e1SMark F. Adams 
767797e13b7SMark F. Adams /* #define OUT_AGGS */
7689057884aSMark F. Adams #ifdef OUT_AGGS
769f7620de1SMatthew G Knepley   static PetscInt llev = 0; char fname[32]; FILE *file = PETSC_NULL; PetscInt pM;
7709057884aSMark F. Adams #endif
7712e68589bSMark F. Adams 
7722e68589bSMark F. Adams   PetscFunctionBegin;
7732e68589bSMark F. Adams   ierr = MPI_Comm_rank(wcomm,&mype);CHKERRQ(ierr);
7742e68589bSMark F. Adams   ierr = MPI_Comm_size(wcomm,&npe);CHKERRQ(ierr);
7752e68589bSMark F. Adams   ierr = MatGetOwnershipRange( a_Prol, &Istart, &Iend );    CHKERRQ(ierr);
7760cbbd2e1SMark F. Adams   nloc = (Iend-Istart)/bs; my0 = Istart/bs; assert((Iend-Istart)%bs==0);
7770cbbd2e1SMark F. Adams   Iend /= bs;
7780cbbd2e1SMark F. Adams   nghosts = data_stride/bs - nloc;
7792e68589bSMark F. Adams 
7800cbbd2e1SMark F. Adams   ierr = GAMGTableCreate( 2*nghosts, &fgid_flid ); CHKERRQ(ierr);
7810cbbd2e1SMark F. Adams   for(kk=0;kk<nghosts;kk++) {
7820cbbd2e1SMark F. Adams     ierr = GAMGTableAdd( &fgid_flid, flid_fgid[nloc+kk], nloc+kk ); CHKERRQ(ierr);
7832e68589bSMark F. Adams   }
7842e68589bSMark F. Adams 
7850cbbd2e1SMark F. Adams #ifdef OUT_AGGS
7860cbbd2e1SMark F. Adams   sprintf(fname,"aggs_%d_%d.m",llev++,mype);
7870cbbd2e1SMark F. Adams   if(llev==1) {
7880cbbd2e1SMark F. Adams     file = fopen(fname,"w");
7890cbbd2e1SMark F. Adams   }
7900cbbd2e1SMark F. Adams   MatGetSize( a_Prol, &pM, &jj );
7910cbbd2e1SMark F. Adams #endif
7920cbbd2e1SMark F. Adams 
7930cbbd2e1SMark F. Adams   /* count selected -- same as number of cols of P */
7940cbbd2e1SMark F. Adams   for(nSelected=mm=0;mm<nloc;mm++) {
795e78576d6SMark F. Adams     PetscBool ise;
796e78576d6SMark F. Adams     ierr = PetscCDEmptyAt( agg_llists, mm, &ise ); CHKERRQ(ierr);
797e78576d6SMark F. Adams     if( !ise ) nSelected++;
7980cbbd2e1SMark F. Adams   }
7990cbbd2e1SMark F. Adams   ierr = MatGetOwnershipRangeColumn( a_Prol, &ii, &jj ); CHKERRQ(ierr);
8000cbbd2e1SMark F. Adams   assert((ii/nSAvec)==my0crs); assert(nSelected==(jj-ii)/nSAvec);
8010cbbd2e1SMark F. Adams 
8022e68589bSMark F. Adams   /* aloc space for coarse point data (output) */
8030cbbd2e1SMark F. Adams   out_data_stride = nSelected*nSAvec;
8040cbbd2e1SMark F. Adams   ierr = PetscMalloc( out_data_stride*nSAvec*sizeof(PetscReal), &out_data ); CHKERRQ(ierr);
8050cbbd2e1SMark F. Adams   for(ii=0;ii<out_data_stride*nSAvec;ii++) {
8060cbbd2e1SMark F. Adams     out_data[ii]=1.e300;
8070cbbd2e1SMark F. Adams   }
8080cbbd2e1SMark F. Adams   *a_data_out = out_data; /* output - stride nSelected*nSAvec */
8092e68589bSMark F. Adams 
8102e68589bSMark F. Adams   /* find points and set prolongation */
811c8b0795cSMark F. Adams   minsz = 100;
8122e68589bSMark F. Adams   ndone = 0;
8130cbbd2e1SMark F. Adams   for( mm = clid = 0 ; mm < nloc ; mm++ ){
814e78576d6SMark F. Adams     ierr = PetscCDSizeAt( agg_llists, mm, &jj ); CHKERRQ(ierr);
815e78576d6SMark F. Adams     if( jj > 0 ) {
8160cbbd2e1SMark F. Adams       const PetscInt lid = mm, cgid = my0crs + clid;
8170cbbd2e1SMark F. Adams       PetscInt cids[100]; /* max bs */
8180cbbd2e1SMark F. Adams       PetscBLASInt asz=jj,M=asz*bs,N=nSAvec,INFO;
8192e68589bSMark F. Adams       PetscBLASInt   Mdata=M+((N-M>0)?N-M:0),LDA=Mdata,LWORK=N*bs;
8202e68589bSMark F. Adams       PetscScalar    *qqc,*qqr,*TAU,*WORK;
8212e68589bSMark F. Adams       PetscInt       *fids;
82265d7b583SSatish Balay       PetscReal      *data;
8230cbbd2e1SMark F. Adams       /* count agg */
8240cbbd2e1SMark F. Adams       if( asz<minsz ) minsz = asz;
8250cbbd2e1SMark F. Adams 
8260cbbd2e1SMark F. Adams       /* get block */
8272e68589bSMark F. Adams       ierr = PetscMalloc( (Mdata*N)*sizeof(PetscScalar), &qqc ); CHKERRQ(ierr);
8282e68589bSMark F. Adams       ierr = PetscMalloc( (M*N)*sizeof(PetscScalar), &qqr ); CHKERRQ(ierr);
8292e68589bSMark F. Adams       ierr = PetscMalloc( N*sizeof(PetscScalar), &TAU ); CHKERRQ(ierr);
8302e68589bSMark F. Adams       ierr = PetscMalloc( LWORK*sizeof(PetscScalar), &WORK ); CHKERRQ(ierr);
8312e68589bSMark F. Adams       ierr = PetscMalloc( M*sizeof(PetscInt), &fids ); CHKERRQ(ierr);
8322e68589bSMark F. Adams 
8332e68589bSMark F. Adams       aggID = 0;
834e78576d6SMark F. Adams       ierr = PetscCDGetHeadPos(agg_llists,lid,&pos); CHKERRQ(ierr);
835e78576d6SMark F. Adams       while(pos){
836e78576d6SMark F. Adams         PetscInt gid1;
837ffc955d6SMark F. Adams         ierr = PetscLLNGetID( pos, &gid1 ); CHKERRQ(ierr);
838e78576d6SMark F. Adams         ierr = PetscCDGetNextPos(agg_llists,lid,&pos); CHKERRQ(ierr);
839e78576d6SMark F. Adams 
8400cbbd2e1SMark F. Adams         if( gid1 >= my0 && gid1 < Iend ) flid = gid1 - my0;
8410cbbd2e1SMark F. Adams         else {
8420cbbd2e1SMark F. Adams           ierr = GAMGTableFind( &fgid_flid, gid1, &flid ); CHKERRQ(ierr);
8430cbbd2e1SMark F. Adams           assert(flid>=0);
8440cbbd2e1SMark F. Adams         }
8452e68589bSMark F. Adams         /* copy in B_i matrix - column oriented */
84665d7b583SSatish Balay         data = &data_in[flid*bs];
8472e68589bSMark F. Adams         for( kk = ii = 0; ii < bs ; ii++ ) {
8482e68589bSMark F. Adams           for( jj = 0; jj < N ; jj++ ) {
8490cbbd2e1SMark F. Adams             PetscReal d = data[jj*data_stride + ii];
8500cbbd2e1SMark F. Adams             qqc[jj*Mdata + aggID*bs + ii] = d;
8512e68589bSMark F. Adams           }
8522e68589bSMark F. Adams         }
8539057884aSMark F. Adams #ifdef OUT_AGGS
854b2a4f308SMark F. Adams         if(llev==1) {
8559057884aSMark F. Adams           char str[] = "plot(%e,%e,'r*'), hold on,\n", col[] = "rgbkmc", sim[] = "*os+h>d<vx^";
8560cbbd2e1SMark F. Adams           PetscInt MM,pi,pj;
8570cbbd2e1SMark F. Adams           str[12] = col[(clid+17*mype)%6]; str[13] = sim[(clid+17*mype)%11];
858f7620de1SMatthew G Knepley           MM = (PetscInt)(PetscSqrtReal((PetscReal)pM));
8590cbbd2e1SMark F. Adams           pj = gid1/MM; pi = gid1%MM;
860b2a4f308SMark F. Adams           fprintf(file,str,(double)pi,(double)pj);
861b2a4f308SMark F. Adams           /* fprintf(file,str,data[2*data_stride+1],-data[2*data_stride]); */
8629057884aSMark F. Adams         }
8639057884aSMark F. Adams #endif
8642e68589bSMark F. Adams         /* set fine IDs */
8652e68589bSMark F. Adams         for(kk=0;kk<bs;kk++) fids[aggID*bs + kk] = flid_fgid[flid]*bs + kk;
8662e68589bSMark F. Adams 
8672e68589bSMark F. Adams         aggID++;
8680cbbd2e1SMark F. Adams       }
8692e68589bSMark F. Adams 
8702e68589bSMark F. Adams       /* pad with zeros */
8712e68589bSMark F. Adams       for( ii = asz*bs; ii < Mdata ; ii++ ) {
8722e68589bSMark F. Adams 	for( jj = 0; jj < N ; jj++, kk++ ) {
8732e68589bSMark F. Adams 	  qqc[jj*Mdata + ii] = .0;
8742e68589bSMark F. Adams 	}
8752e68589bSMark F. Adams       }
8762e68589bSMark F. Adams 
8772e68589bSMark F. Adams       ndone += aggID;
8782e68589bSMark F. Adams       /* QR */
8792e68589bSMark F. Adams       LAPACKgeqrf_( &Mdata, &N, qqc, &LDA, TAU, WORK, &LWORK, &INFO );
8802e68589bSMark F. Adams       if( INFO != 0 ) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_LIB,"xGEQRS error");
8812e68589bSMark F. Adams       /* get R - column oriented - output B_{i+1} */
8822e68589bSMark F. Adams       {
8832e68589bSMark F. Adams         PetscReal *data = &out_data[clid*nSAvec];
8842e68589bSMark F. Adams         for( jj = 0; jj < nSAvec ; jj++ ) {
8852e68589bSMark F. Adams           for( ii = 0; ii < nSAvec ; ii++ ) {
8860cbbd2e1SMark F. Adams             assert(data[jj*out_data_stride + ii] == 1.e300);
8870cbbd2e1SMark F. Adams             if( ii <= jj ) data[jj*out_data_stride + ii] = PetscRealPart(qqc[jj*Mdata + ii]);
8880cbbd2e1SMark F. Adams 	    else data[jj*out_data_stride + ii] = 0.;
8892e68589bSMark F. Adams           }
8902e68589bSMark F. Adams         }
8912e68589bSMark F. Adams       }
8922e68589bSMark F. Adams 
8932e68589bSMark F. Adams       /* get Q - row oriented */
8942e68589bSMark F. Adams       LAPACKungqr_( &Mdata, &N, &N, qqc, &LDA, TAU, WORK, &LWORK, &INFO );
8952e68589bSMark F. Adams       if( INFO != 0 ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"xORGQR error arg %d",-INFO);
8962e68589bSMark F. Adams 
8972e68589bSMark F. Adams       for( ii = 0 ; ii < M ; ii++ ){
8982e68589bSMark F. Adams         for( jj = 0 ; jj < N ; jj++ ) {
8992e68589bSMark F. Adams           qqr[N*ii + jj] = qqc[jj*Mdata + ii];
9002e68589bSMark F. Adams         }
9012e68589bSMark F. Adams       }
9022e68589bSMark F. Adams 
9032e68589bSMark F. Adams       /* add diagonal block of P0 */
904c8b0795cSMark F. Adams       for(kk=0;kk<N;kk++) {
905c8b0795cSMark F. Adams         cids[kk] = N*cgid + kk; /* global col IDs in P0 */
906c8b0795cSMark F. Adams       }
9072e68589bSMark F. Adams       ierr = MatSetValues(a_Prol,M,fids,N,cids,qqr,INSERT_VALUES); CHKERRQ(ierr);
9082e68589bSMark F. Adams 
9092e68589bSMark F. Adams       ierr = PetscFree( qqc );  CHKERRQ(ierr);
9102e68589bSMark F. Adams       ierr = PetscFree( qqr );  CHKERRQ(ierr);
9112e68589bSMark F. Adams       ierr = PetscFree( TAU );  CHKERRQ(ierr);
9122e68589bSMark F. Adams       ierr = PetscFree( WORK );  CHKERRQ(ierr);
9132e68589bSMark F. Adams       ierr = PetscFree( fids );  CHKERRQ(ierr);
914b43b03e9SMark F. Adams       clid++;
9150cbbd2e1SMark F. Adams     } /* coarse agg */
9160cbbd2e1SMark F. Adams   } /* for all fine nodes */
9170cbbd2e1SMark F. Adams   ierr = MatAssemblyBegin(a_Prol,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
9180cbbd2e1SMark F. Adams   ierr = MatAssemblyEnd(a_Prol,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
9192e68589bSMark F. Adams 
920c8b0795cSMark F. Adams /* ierr = MPI_Allreduce( &ndone, &ii, 1, MPIU_INT, MPIU_SUM, wcomm ); */
9212e68589bSMark F. Adams /* MatGetSize( a_Prol, &kk, &jj ); */
922c8b0795cSMark F. Adams /* ierr = MPI_Allreduce( &minsz, &jj, 1, MPIU_INT, MPIU_MIN, wcomm ); */
923e78576d6SMark F. Adams /* PetscPrintf(wcomm," **** [%d]%s %d total done, %d nodes (%d local done), min agg. size = %d\n",mype,__FUNCT__,ii,kk/bs,ndone,jj); */
9242e68589bSMark F. Adams 
9259057884aSMark F. Adams #ifdef OUT_AGGS
926b2a4f308SMark F. Adams   if(llev==1) fclose(file);
9279057884aSMark F. Adams #endif
9280cbbd2e1SMark F. Adams   ierr = GAMGTableDestroy( &fgid_flid ); CHKERRQ(ierr);
9292e68589bSMark F. Adams 
9302e68589bSMark F. Adams   PetscFunctionReturn(0);
9312e68589bSMark F. Adams }
9322e68589bSMark F. Adams 
9332e68589bSMark F. Adams /* -------------------------------------------------------------------------- */
9342e68589bSMark F. Adams /*
935c8b0795cSMark F. Adams    PCGAMGgraph_AGG
9362e68589bSMark F. Adams 
9372e68589bSMark F. Adams   Input Parameter:
9382e68589bSMark F. Adams    . pc - this
9392e68589bSMark F. Adams    . Amat - matrix on this fine level
9402e68589bSMark F. Adams   Output Parameter:
941c8b0795cSMark F. Adams    . a_Gmat -
9422e68589bSMark F. Adams */
9432e68589bSMark F. Adams #undef __FUNCT__
944c8b0795cSMark F. Adams #define __FUNCT__ "PCGAMGgraph_AGG"
945c8b0795cSMark F. Adams PetscErrorCode PCGAMGgraph_AGG( PC pc,
9462e68589bSMark F. Adams                                 const Mat Amat,
947c8b0795cSMark F. Adams                                 Mat *a_Gmat
948c8b0795cSMark F. Adams                                 )
949c8b0795cSMark F. Adams {
950c8b0795cSMark F. Adams   PetscErrorCode ierr;
951c8b0795cSMark F. Adams   PC_MG          *mg = (PC_MG*)pc->data;
952c8b0795cSMark F. Adams   PC_GAMG        *pc_gamg = (PC_GAMG*)mg->innerctx;
953c8b0795cSMark F. Adams   const PetscInt verbose = pc_gamg->verbose;
954c8b0795cSMark F. Adams   const PetscReal vfilter = pc_gamg->threshold;
955c8b0795cSMark F. Adams   PC_GAMG_AGG    *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx;
956c8b0795cSMark F. Adams   PetscMPIInt    mype,npe;
957e0940f08SMark F. Adams   Mat            Gmat;
958c8b0795cSMark F. Adams   MPI_Comm       wcomm = ((PetscObject)Amat)->comm;
9590cbbd2e1SMark F. Adams   PetscBool  set,flg,symm;
960c8b0795cSMark F. Adams 
961c8b0795cSMark F. Adams   PetscFunctionBegin;
9620cbbd2e1SMark F. Adams #if defined PETSC_USE_LOG
9630cbbd2e1SMark F. Adams   ierr = PetscLogEventBegin(PC_GAMGGgraph_AGG,0,0,0,0);CHKERRQ(ierr);
9640cbbd2e1SMark F. Adams #endif
965c8b0795cSMark F. Adams   ierr = MPI_Comm_rank( wcomm, &mype);  CHKERRQ(ierr);
966c8b0795cSMark F. Adams   ierr = MPI_Comm_size( wcomm, &npe);   CHKERRQ(ierr);
967c8b0795cSMark F. Adams 
9680cbbd2e1SMark F. Adams   ierr = MatIsSymmetricKnown(Amat, &set, &flg);        CHKERRQ(ierr);
969263489e9SJed Brown   symm = (PetscBool)(pc_gamg_agg->sym_graph || !(set && flg));
9700cbbd2e1SMark F. Adams 
9712d7fac45SMark F. Adams   ierr  = PCGAMGCreateGraph( Amat, &Gmat ); CHKERRQ( ierr );
9722d7fac45SMark F. Adams   ierr  = PCGAMGFilterGraph( &Gmat, vfilter, symm, verbose ); CHKERRQ( ierr );
973c8b0795cSMark F. Adams 
974e0940f08SMark F. Adams   *a_Gmat = Gmat;
975c8b0795cSMark F. Adams 
9760cbbd2e1SMark F. Adams #if defined PETSC_USE_LOG
9770cbbd2e1SMark F. Adams   ierr = PetscLogEventEnd(PC_GAMGGgraph_AGG,0,0,0,0);CHKERRQ(ierr);
9780cbbd2e1SMark F. Adams #endif
979c8b0795cSMark F. Adams   PetscFunctionReturn(0);
980c8b0795cSMark F. Adams }
981c8b0795cSMark F. Adams 
982c8b0795cSMark F. Adams /* -------------------------------------------------------------------------- */
983c8b0795cSMark F. Adams /*
984b43b03e9SMark F. Adams    PCGAMGCoarsen_AGG
985c8b0795cSMark F. Adams 
986c8b0795cSMark F. Adams   Input Parameter:
987e0940f08SMark F. Adams    . a_pc - this
988e0940f08SMark F. Adams   Input/Output Parameter:
9890cbbd2e1SMark F. Adams    . a_Gmat1 - graph on this fine level - coarsening can change this (squares it)
990c8b0795cSMark F. Adams   Output Parameter:
9910cbbd2e1SMark F. Adams    . agg_lists - list of aggregates
992c8b0795cSMark F. Adams */
993c8b0795cSMark F. Adams #undef __FUNCT__
994b43b03e9SMark F. Adams #define __FUNCT__ "PCGAMGCoarsen_AGG"
995e0940f08SMark F. Adams PetscErrorCode PCGAMGCoarsen_AGG( PC a_pc,
996e0940f08SMark F. Adams                                   Mat *a_Gmat1,
9970cbbd2e1SMark F. Adams                                   PetscCoarsenData **agg_lists
998c8b0795cSMark F. Adams                                   )
999c8b0795cSMark F. Adams {
1000c8b0795cSMark F. Adams   PetscErrorCode ierr;
1001e0940f08SMark F. Adams   PC_MG          *mg = (PC_MG*)a_pc->data;
1002c8b0795cSMark F. Adams   PC_GAMG        *pc_gamg = (PC_GAMG*)mg->innerctx;
1003c8b0795cSMark F. Adams   PC_GAMG_AGG    *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx;
10040cbbd2e1SMark F. Adams   Mat             mat,Gmat2, Gmat1 = *a_Gmat1; /* squared graph */
10050cbbd2e1SMark F. Adams   IS              perm;
1006c8b0795cSMark F. Adams   PetscInt        Ii,nloc,bs,n,m;
1007c8b0795cSMark F. Adams   PetscInt *permute;
1008c8b0795cSMark F. Adams   PetscBool *bIndexSet;
1009b43b03e9SMark F. Adams   MatCoarsen crs;
1010e0940f08SMark F. Adams   MPI_Comm        wcomm = ((PetscObject)Gmat1)->comm;
10110cbbd2e1SMark F. Adams   PetscMPIInt     mype,npe;
1012c8b0795cSMark F. Adams 
1013c8b0795cSMark F. Adams   PetscFunctionBegin;
10140cbbd2e1SMark F. Adams #if defined PETSC_USE_LOG
10150cbbd2e1SMark F. Adams   ierr = PetscLogEventBegin(PC_GAMGCoarsen_AGG,0,0,0,0);CHKERRQ(ierr);
10160cbbd2e1SMark F. Adams #endif
10170cbbd2e1SMark F. Adams   ierr = MPI_Comm_rank( wcomm, &mype);  CHKERRQ(ierr);
10180cbbd2e1SMark F. Adams   ierr = MPI_Comm_size( wcomm, &npe);   CHKERRQ(ierr);
1019e0940f08SMark F. Adams   ierr = MatGetLocalSize( Gmat1, &n, &m ); CHKERRQ(ierr);
1020e0940f08SMark F. Adams   ierr = MatGetBlockSize( Gmat1, &bs ); CHKERRQ(ierr); assert(bs==1);
1021c8b0795cSMark F. Adams   nloc = n/bs;
1022c8b0795cSMark F. Adams 
1023e0940f08SMark F. Adams   if( pc_gamg_agg->square_graph ) {
1024e0940f08SMark F. Adams     ierr = MatTransposeMatMult( Gmat1, Gmat1, MAT_INITIAL_MATRIX, PETSC_DEFAULT, &Gmat2 );
1025e0940f08SMark F. Adams     CHKERRQ(ierr);
1026e0940f08SMark F. Adams   }
1027e0940f08SMark F. Adams   else Gmat2 = Gmat1;
1028c8b0795cSMark F. Adams 
1029c8b0795cSMark F. Adams   /* get MIS aggs */
1030c8b0795cSMark F. Adams   /* randomize */
1031c8b0795cSMark F. Adams   ierr = PetscMalloc( nloc*sizeof(PetscInt), &permute ); CHKERRQ(ierr);
1032c8b0795cSMark F. Adams   ierr = PetscMalloc( nloc*sizeof(PetscBool), &bIndexSet ); CHKERRQ(ierr);
1033c8b0795cSMark F. Adams   for ( Ii = 0; Ii < nloc ; Ii++ ){
1034c8b0795cSMark F. Adams     bIndexSet[Ii] = PETSC_FALSE;
1035c8b0795cSMark F. Adams     permute[Ii] = Ii;
1036c8b0795cSMark F. Adams   }
1037c8b0795cSMark F. Adams   srand(1); /* make deterministic */
1038c8b0795cSMark F. Adams   for ( Ii = 0; Ii < nloc ; Ii++ ) {
1039c8b0795cSMark F. Adams     PetscInt iSwapIndex = rand()%nloc;
1040c8b0795cSMark F. Adams     if (!bIndexSet[iSwapIndex] && iSwapIndex != Ii) {
1041c8b0795cSMark F. Adams       PetscInt iTemp = permute[iSwapIndex];
1042c8b0795cSMark F. Adams       permute[iSwapIndex] = permute[Ii];
1043c8b0795cSMark F. Adams       permute[Ii] = iTemp;
1044c8b0795cSMark F. Adams       bIndexSet[iSwapIndex] = PETSC_TRUE;
1045c8b0795cSMark F. Adams     }
1046c8b0795cSMark F. Adams   }
1047c8b0795cSMark F. Adams   ierr = PetscFree( bIndexSet );  CHKERRQ(ierr);
1048c8b0795cSMark F. Adams 
1049c8b0795cSMark F. Adams   ierr = ISCreateGeneral(PETSC_COMM_SELF, nloc, permute, PETSC_USE_POINTER, &perm);
1050c8b0795cSMark F. Adams   CHKERRQ(ierr);
10510cbbd2e1SMark F. Adams #if defined PETSC_GAMG_USE_LOG
10520cbbd2e1SMark F. Adams   ierr = PetscLogEventBegin(petsc_gamg_setup_events[SET4],0,0,0,0);CHKERRQ(ierr);
1053b43b03e9SMark F. Adams #endif
1054b43b03e9SMark F. Adams   ierr = MatCoarsenCreate( wcomm, &crs ); CHKERRQ(ierr);
10559057884aSMark F. Adams   /* ierr = MatCoarsenSetType( crs, MATCOARSENMIS ); CHKERRQ(ierr); */
10569057884aSMark F. Adams   ierr = MatCoarsenSetFromOptions( crs ); CHKERRQ(ierr);
1057b43b03e9SMark F. Adams   ierr = MatCoarsenSetGreedyOrdering( crs, perm ); CHKERRQ(ierr);
1058b43b03e9SMark F. Adams   ierr = MatCoarsenSetAdjacency( crs, Gmat2 ); CHKERRQ(ierr);
1059b43b03e9SMark F. Adams   ierr = MatCoarsenSetVerbose( crs, pc_gamg->verbose ); CHKERRQ(ierr);
1060b43b03e9SMark F. Adams   ierr = MatCoarsenSetStrictAggs( crs, PETSC_TRUE ); CHKERRQ(ierr);
1061b43b03e9SMark F. Adams   ierr = MatCoarsenApply( crs ); CHKERRQ(ierr);
10620cbbd2e1SMark F. Adams   ierr = MatCoarsenGetData( crs, agg_lists ); CHKERRQ(ierr); /* output */
1063b43b03e9SMark F. Adams   ierr = MatCoarsenDestroy( &crs ); CHKERRQ(ierr);
1064b43b03e9SMark F. Adams 
1065c8b0795cSMark F. Adams   ierr = ISDestroy( &perm );                    CHKERRQ(ierr);
1066c8b0795cSMark F. Adams   ierr = PetscFree( permute );  CHKERRQ(ierr);
10670cbbd2e1SMark F. Adams #if defined PETSC_GAMG_USE_LOG
10680cbbd2e1SMark F. Adams   ierr = PetscLogEventEnd(petsc_gamg_setup_events[SET4],0,0,0,0);CHKERRQ(ierr);
1069b43b03e9SMark F. Adams #endif
1070c8b0795cSMark F. Adams   /* smooth aggs */
1071e0940f08SMark F. Adams   if( Gmat2 != Gmat1 ) {
10720cbbd2e1SMark F. Adams     const PetscCoarsenData *llist = *agg_lists;
10730cbbd2e1SMark F. Adams     ierr = smoothAggs( Gmat2, Gmat1, *agg_lists ); CHKERRQ(ierr);
1074c8b0795cSMark F. Adams     ierr = MatDestroy( &Gmat1 );  CHKERRQ(ierr);
1075e0940f08SMark F. Adams     *a_Gmat1 = Gmat2; /* output */
107641b27cdeSMark F. Adams     ierr = PetscCDGetMat( llist, &mat );  CHKERRQ(ierr);
10770cbbd2e1SMark F. Adams     if(mat) SETERRQ(wcomm,PETSC_ERR_ARG_WRONG, "Auxilary matrix with squared graph????");
1078ef4ad70eSMark F. Adams   }
10790cbbd2e1SMark F. Adams   else {
10800cbbd2e1SMark F. Adams     const PetscCoarsenData *llist = *agg_lists;
10810cbbd2e1SMark F. Adams     /* see if we have a matrix that takes pecedence (returned from MatCoarsenAppply) */
108241b27cdeSMark F. Adams     ierr = PetscCDGetMat( llist, &mat );   CHKERRQ(ierr);
10830cbbd2e1SMark F. Adams     if( mat ) {
10840cbbd2e1SMark F. Adams       ierr = MatDestroy( &Gmat1 );  CHKERRQ(ierr);
10850cbbd2e1SMark F. Adams       *a_Gmat1 = mat; /* output */
10860cbbd2e1SMark F. Adams     }
10870cbbd2e1SMark F. Adams   }
10880cbbd2e1SMark F. Adams #if defined PETSC_USE_LOG
10890cbbd2e1SMark F. Adams   ierr = PetscLogEventEnd(PC_GAMGCoarsen_AGG,0,0,0,0);CHKERRQ(ierr);
10900cbbd2e1SMark F. Adams #endif
1091c8b0795cSMark F. Adams   PetscFunctionReturn(0);
1092c8b0795cSMark F. Adams }
1093c8b0795cSMark F. Adams 
1094c8b0795cSMark F. Adams /* -------------------------------------------------------------------------- */
1095c8b0795cSMark F. Adams /*
10960cbbd2e1SMark F. Adams  PCGAMGProlongator_AGG
1097c8b0795cSMark F. Adams 
1098c8b0795cSMark F. Adams  Input Parameter:
1099c8b0795cSMark F. Adams  . pc - this
1100c8b0795cSMark F. Adams  . Amat - matrix on this fine level
1101c8b0795cSMark F. Adams  . Graph - used to get ghost data for nodes in
11020cbbd2e1SMark F. Adams  . agg_lists - list of aggregates
1103c8b0795cSMark F. Adams  Output Parameter:
1104c8b0795cSMark F. Adams  . a_P_out - prolongation operator to the next level
1105c8b0795cSMark F. Adams  */
1106c8b0795cSMark F. Adams #undef __FUNCT__
11070cbbd2e1SMark F. Adams #define __FUNCT__ "PCGAMGProlongator_AGG"
11080cbbd2e1SMark F. Adams PetscErrorCode PCGAMGProlongator_AGG( PC pc,
1109c8b0795cSMark F. Adams                                       const Mat Amat,
1110c8b0795cSMark F. Adams                                       const Mat Gmat,
11110cbbd2e1SMark F. Adams                                       PetscCoarsenData *agg_lists,
1112c8b0795cSMark F. Adams                                       Mat *a_P_out
11132e68589bSMark F. Adams                                       )
11142e68589bSMark F. Adams {
11152e68589bSMark F. Adams   PC_MG          *mg = (PC_MG*)pc->data;
11162e68589bSMark F. Adams   PC_GAMG        *pc_gamg = (PC_GAMG*)mg->innerctx;
11172e68589bSMark F. Adams   const PetscInt verbose = pc_gamg->verbose;
1118c8b0795cSMark F. Adams   const PetscInt data_cols = pc_gamg->data_cell_cols;
11192e68589bSMark F. Adams   PetscErrorCode ierr;
1120c8b0795cSMark F. Adams   PetscInt       Istart,Iend,nloc,ii,jj,kk,my0,nLocalSelected,bs;
1121c8b0795cSMark F. Adams   Mat            Prol;
11222e68589bSMark F. Adams   PetscMPIInt    mype, npe;
11232e68589bSMark F. Adams   MPI_Comm       wcomm = ((PetscObject)Amat)->comm;
11240cbbd2e1SMark F. Adams   const PetscInt col_bs = data_cols;
1125c8b0795cSMark F. Adams   PetscReal      *data_w_ghost;
1126c8b0795cSMark F. Adams   PetscInt       myCrs0, nbnodes=0, *flid_fgid;
11272e68589bSMark F. Adams 
11282e68589bSMark F. Adams   PetscFunctionBegin;
11290cbbd2e1SMark F. Adams #if defined PETSC_USE_LOG
11300cbbd2e1SMark F. Adams   ierr = PetscLogEventBegin(PC_GAMGProlongator_AGG,0,0,0,0);CHKERRQ(ierr);
11310cbbd2e1SMark F. Adams #endif
11322e68589bSMark F. Adams   ierr = MPI_Comm_rank( wcomm, &mype);  CHKERRQ(ierr);
11332e68589bSMark F. Adams   ierr = MPI_Comm_size( wcomm, &npe);   CHKERRQ(ierr);
11342e68589bSMark F. Adams   ierr = MatGetOwnershipRange( Amat, &Istart, &Iend ); CHKERRQ(ierr);
1135c8b0795cSMark F. Adams   ierr  = MatGetBlockSize( Amat, &bs ); CHKERRQ( ierr );
1136c8b0795cSMark F. Adams   nloc = (Iend-Istart)/bs; my0 = Istart/bs; assert((Iend-Istart)%bs==0);
11372e68589bSMark F. Adams 
11382e68589bSMark F. Adams   /* get 'nLocalSelected' */
11390cbbd2e1SMark F. Adams   for( ii=0, nLocalSelected = 0 ; ii < nloc ; ii++ ){
1140e78576d6SMark F. Adams     PetscBool ise;
11410cbbd2e1SMark F. Adams     /* filter out singletons 0 or 1? */
1142e78576d6SMark F. Adams     ierr = PetscCDEmptyAt( agg_lists, ii, &ise ); CHKERRQ(ierr);
1143e78576d6SMark F. Adams     if( !ise ) nLocalSelected++;
11442e68589bSMark F. Adams   }
11452e68589bSMark F. Adams 
11462e68589bSMark F. Adams   /* create prolongator, create P matrix */
1147*a2f3521dSMark F. Adams   ierr = MatCreate( wcomm, &Prol ); CHKERRQ(ierr);
1148*a2f3521dSMark F. Adams   ierr = MatSetSizes(Prol,nloc*bs,nLocalSelected*col_bs,PETSC_DETERMINE,PETSC_DETERMINE);
11492e68589bSMark F. Adams   CHKERRQ(ierr);
1150*a2f3521dSMark F. Adams   ierr = MatSetBlockSizes( Prol, bs, col_bs ); CHKERRQ(ierr);
1151*a2f3521dSMark F. Adams   ierr = MatSetType( Prol, MATAIJ );   CHKERRQ(ierr);
1152*a2f3521dSMark F. Adams   ierr = MatSeqAIJSetPreallocation( Prol, data_cols, PETSC_NULL);  CHKERRQ(ierr);
1153*a2f3521dSMark F. Adams   ierr = MatMPIAIJSetPreallocation(Prol,data_cols, PETSC_NULL,data_cols, PETSC_NULL);CHKERRQ(ierr);
1154*a2f3521dSMark F. Adams   /* nloc*bs, nLocalSelected*col_bs, */
1155*a2f3521dSMark F. Adams   /* PETSC_DETERMINE, PETSC_DETERMINE, */
1156*a2f3521dSMark F. Adams   /* data_cols, PETSC_NULL, data_cols, PETSC_NULL, */
1157*a2f3521dSMark F. Adams   /* &Prol ); */
11582e68589bSMark F. Adams 
11592e68589bSMark F. Adams   /* can get all points "removed" */
1160c8b0795cSMark F. Adams   ierr =  MatGetSize( Prol, &kk, &ii ); CHKERRQ(ierr);
1161c8b0795cSMark F. Adams   if( ii==0 ) {
11622e68589bSMark F. Adams     if( verbose ) {
1163c8b0795cSMark F. Adams       PetscPrintf(wcomm,"[%d]%s no selected points on coarse grid\n",mype,__FUNCT__);
11642e68589bSMark F. Adams     }
11652e68589bSMark F. Adams     ierr = MatDestroy( &Prol );  CHKERRQ(ierr);
11662e68589bSMark F. Adams     *a_P_out = PETSC_NULL;  /* out */
11672e68589bSMark F. Adams     PetscFunctionReturn(0);
11682e68589bSMark F. Adams   }
1169c8b0795cSMark F. Adams   if( verbose ) {
1170e78576d6SMark F. Adams     PetscPrintf(wcomm,"\t\t[%d]%s New grid %d nodes\n",mype,__FUNCT__,ii/col_bs);
1171c8b0795cSMark F. Adams   }
1172c8b0795cSMark F. Adams   ierr = MatGetOwnershipRangeColumn( Prol, &myCrs0, &kk ); CHKERRQ(ierr);
11730cbbd2e1SMark F. Adams 
11740cbbd2e1SMark F. Adams   assert((kk-myCrs0)%col_bs==0);
1175c8b0795cSMark F. Adams   myCrs0 = myCrs0/col_bs;
11760cbbd2e1SMark F. Adams   assert((kk/col_bs-myCrs0)==nLocalSelected);
11772e68589bSMark F. Adams 
11782e68589bSMark F. Adams   /* create global vector of data in 'data_w_ghost' */
11790cbbd2e1SMark F. Adams #if defined PETSC_GAMG_USE_LOG
11800cbbd2e1SMark F. Adams   ierr = PetscLogEventBegin(petsc_gamg_setup_events[SET7],0,0,0,0);CHKERRQ(ierr);
11812e68589bSMark F. Adams #endif
1182c8b0795cSMark F. Adams   if (npe > 1) { /*  */
11832e68589bSMark F. Adams     PetscReal *tmp_gdata,*tmp_ldata,*tp2;
11842e68589bSMark F. Adams     ierr = PetscMalloc( nloc*sizeof(PetscReal), &tmp_ldata ); CHKERRQ(ierr);
11852e68589bSMark F. Adams     for( jj = 0 ; jj < data_cols ; jj++ ){
1186c8b0795cSMark F. Adams       for( kk = 0 ; kk < bs ; kk++) {
1187*a2f3521dSMark F. Adams         PetscInt ii,stride;
1188c8b0795cSMark F. Adams         const PetscReal *tp = pc_gamg->data + jj*bs*nloc + kk;
1189c8b0795cSMark F. Adams         for( ii = 0 ; ii < nloc ; ii++, tp += bs ){
11902e68589bSMark F. Adams           tmp_ldata[ii] = *tp;
11912e68589bSMark F. Adams         }
1192*a2f3521dSMark F. Adams         ierr = PCGAMGGetDataWithGhosts( Gmat, 1, tmp_ldata, &stride, &tmp_gdata );
11932e68589bSMark F. Adams         CHKERRQ(ierr);
1194*a2f3521dSMark F. Adams 
11952e68589bSMark F. Adams         if(jj==0 && kk==0) { /* now I know how many todal nodes - allocate */
1196*a2f3521dSMark F. Adams           ierr = PetscMalloc( stride*bs*data_cols*sizeof(PetscReal), &data_w_ghost ); CHKERRQ(ierr);
1197*a2f3521dSMark F. Adams           nbnodes = bs*stride;
11982e68589bSMark F. Adams         }
1199*a2f3521dSMark F. Adams         tp2 = data_w_ghost + jj*bs*stride + kk;
1200*a2f3521dSMark F. Adams         for( ii = 0 ; ii < stride ; ii++, tp2 += bs ){
12012e68589bSMark F. Adams           *tp2 = tmp_gdata[ii];
12022e68589bSMark F. Adams         }
12032e68589bSMark F. Adams         ierr = PetscFree( tmp_gdata ); CHKERRQ(ierr);
12042e68589bSMark F. Adams       }
12052e68589bSMark F. Adams     }
12062e68589bSMark F. Adams     ierr = PetscFree( tmp_ldata ); CHKERRQ(ierr);
12072e68589bSMark F. Adams   }
12082e68589bSMark F. Adams   else {
1209c8b0795cSMark F. Adams     nbnodes = bs*nloc;
1210c8b0795cSMark F. Adams     data_w_ghost = (PetscReal*)pc_gamg->data;
12112e68589bSMark F. Adams   }
12122e68589bSMark F. Adams 
12132e68589bSMark F. Adams   /* get P0 */
12142e68589bSMark F. Adams   if( npe > 1 ){
12152e68589bSMark F. Adams     PetscReal *fid_glid_loc,*fiddata;
1216*a2f3521dSMark F. Adams     PetscInt stride;
12172e68589bSMark F. Adams 
12182e68589bSMark F. Adams     ierr = PetscMalloc( nloc*sizeof(PetscReal), &fid_glid_loc ); CHKERRQ(ierr);
12192e68589bSMark F. Adams     for(kk=0;kk<nloc;kk++) fid_glid_loc[kk] = (PetscReal)(my0+kk);
1220*a2f3521dSMark F. Adams     ierr = PCGAMGGetDataWithGhosts( Gmat, 1, fid_glid_loc, &stride, &fiddata );
12212e68589bSMark F. Adams     CHKERRQ(ierr);
1222*a2f3521dSMark F. Adams     ierr = PetscMalloc( stride*sizeof(PetscInt), &flid_fgid ); CHKERRQ(ierr);
1223*a2f3521dSMark F. Adams     for(kk=0;kk<stride;kk++) flid_fgid[kk] = (PetscInt)fiddata[kk];
12242e68589bSMark F. Adams     ierr = PetscFree( fiddata ); CHKERRQ(ierr);
1225*a2f3521dSMark F. Adams 
1226*a2f3521dSMark F. Adams     assert(stride==nbnodes/bs);
12272e68589bSMark F. Adams     ierr = PetscFree( fid_glid_loc ); CHKERRQ(ierr);
12282e68589bSMark F. Adams   }
12292e68589bSMark F. Adams   else {
12302e68589bSMark F. Adams     ierr = PetscMalloc( nloc*sizeof(PetscInt), &flid_fgid ); CHKERRQ(ierr);
12312e68589bSMark F. Adams     for(kk=0;kk<nloc;kk++) flid_fgid[kk] = my0 + kk;
12322e68589bSMark F. Adams   }
12330cbbd2e1SMark F. Adams #if defined PETSC_GAMG_USE_LOG
12340cbbd2e1SMark F. Adams   ierr = PetscLogEventEnd(petsc_gamg_setup_events[SET7],0,0,0,0);CHKERRQ(ierr);
12350cbbd2e1SMark F. Adams   ierr = PetscLogEventBegin(petsc_gamg_setup_events[SET8],0,0,0,0);CHKERRQ(ierr);
12362e68589bSMark F. Adams #endif
1237c8b0795cSMark F. Adams   {
1238ffc955d6SMark F. Adams     PetscReal *data_out = PETSC_NULL;
12390cbbd2e1SMark F. Adams     ierr = formProl0( agg_lists, bs, data_cols, myCrs0, nbnodes,
1240c8b0795cSMark F. Adams                       data_w_ghost, flid_fgid, &data_out, Prol );
12412e68589bSMark F. Adams     CHKERRQ(ierr);
1242c8b0795cSMark F. Adams     ierr = PetscFree( pc_gamg->data ); CHKERRQ( ierr );
1243c8b0795cSMark F. Adams     pc_gamg->data = data_out;
1244c8b0795cSMark F. Adams     pc_gamg->data_cell_rows = data_cols;
1245c8b0795cSMark F. Adams     pc_gamg->data_sz = data_cols*data_cols*nLocalSelected;
1246c8b0795cSMark F. Adams   }
12470cbbd2e1SMark F. Adams #if defined PETSC_GAMG_USE_LOG
12480cbbd2e1SMark F. Adams   ierr = PetscLogEventEnd(petsc_gamg_setup_events[SET8],0,0,0,0);CHKERRQ(ierr);
1249c8b0795cSMark F. Adams #endif
12502e68589bSMark F. Adams   if (npe > 1) ierr = PetscFree( data_w_ghost );      CHKERRQ(ierr);
12512e68589bSMark F. Adams   ierr = PetscFree( flid_fgid ); CHKERRQ(ierr);
12522e68589bSMark F. Adams 
1253c8b0795cSMark F. Adams   /* attach block size of columns */
1254c8b0795cSMark F. Adams   if( pc_gamg->col_bs_id == -1 ) {
1255c8b0795cSMark F. Adams     ierr = PetscObjectComposedDataRegister( &pc_gamg->col_bs_id ); assert(pc_gamg->col_bs_id != -1 );
1256c8b0795cSMark F. Adams   }
1257c8b0795cSMark F. Adams   ierr = PetscObjectComposedDataSetInt( (PetscObject)Prol, pc_gamg->col_bs_id, data_cols ); CHKERRQ(ierr);
1258c8b0795cSMark F. Adams 
1259c8b0795cSMark F. Adams   *a_P_out = Prol;  /* out */
12600cbbd2e1SMark F. Adams #if defined PETSC_USE_LOG
12610cbbd2e1SMark F. Adams   ierr = PetscLogEventEnd(PC_GAMGProlongator_AGG,0,0,0,0);CHKERRQ(ierr);
12620cbbd2e1SMark F. Adams #endif
1263c8b0795cSMark F. Adams   PetscFunctionReturn(0);
1264c8b0795cSMark F. Adams }
1265c8b0795cSMark F. Adams 
1266c8b0795cSMark F. Adams /* -------------------------------------------------------------------------- */
1267c8b0795cSMark F. Adams /*
12680cbbd2e1SMark F. Adams    PCGAMGOptprol_AGG
1269c8b0795cSMark F. Adams 
1270c8b0795cSMark F. Adams   Input Parameter:
1271c8b0795cSMark F. Adams    . pc - this
1272c8b0795cSMark F. Adams    . Amat - matrix on this fine level
1273c8b0795cSMark F. Adams  In/Output Parameter:
1274c8b0795cSMark F. Adams    . a_P_out - prolongation operator to the next level
1275c8b0795cSMark F. Adams */
1276c8b0795cSMark F. Adams #undef __FUNCT__
12770cbbd2e1SMark F. Adams #define __FUNCT__ "PCGAMGOptprol_AGG"
12780cbbd2e1SMark F. Adams PetscErrorCode PCGAMGOptprol_AGG( PC pc,
1279c8b0795cSMark F. Adams                                   const Mat Amat,
1280c8b0795cSMark F. Adams                                   Mat *a_P
1281c8b0795cSMark F. Adams                                   )
1282c8b0795cSMark F. Adams {
1283c8b0795cSMark F. Adams   PetscErrorCode ierr;
1284c8b0795cSMark F. Adams   PC_MG          *mg = (PC_MG*)pc->data;
1285c8b0795cSMark F. Adams   PC_GAMG        *pc_gamg = (PC_GAMG*)mg->innerctx;
1286c8b0795cSMark F. Adams   const PetscInt verbose = pc_gamg->verbose;
1287c8b0795cSMark F. Adams   PC_GAMG_AGG    *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx;
1288c8b0795cSMark F. Adams   PetscInt       jj;
1289c8b0795cSMark F. Adams   PetscMPIInt    mype,npe;
1290c8b0795cSMark F. Adams   Mat            Prol = *a_P;
1291c8b0795cSMark F. Adams   MPI_Comm       wcomm = ((PetscObject)Amat)->comm;
1292c8b0795cSMark F. Adams 
1293c8b0795cSMark F. Adams   PetscFunctionBegin;
12940cbbd2e1SMark F. Adams #if defined PETSC_USE_LOG
12950cbbd2e1SMark F. Adams   ierr = PetscLogEventBegin(PC_GAMGOptprol_AGG,0,0,0,0);CHKERRQ(ierr);
12960cbbd2e1SMark F. Adams #endif
1297c8b0795cSMark F. Adams   ierr = MPI_Comm_rank( wcomm, &mype);  CHKERRQ(ierr);
1298c8b0795cSMark F. Adams   ierr = MPI_Comm_size( wcomm, &npe);   CHKERRQ(ierr);
1299c8b0795cSMark F. Adams 
13002e68589bSMark F. Adams   /* smooth P0 */
1301c8b0795cSMark F. Adams   for( jj = 0 ; jj < pc_gamg_agg->nsmooths ; jj++ ){
13022e68589bSMark F. Adams     Mat tMat;
13032e68589bSMark F. Adams     Vec diag;
13042e68589bSMark F. Adams     PetscReal alpha, emax, emin;
13050cbbd2e1SMark F. Adams #if defined PETSC_GAMG_USE_LOG
13060cbbd2e1SMark F. Adams     ierr = PetscLogEventBegin(petsc_gamg_setup_events[SET9],0,0,0,0);CHKERRQ(ierr);
13072e68589bSMark F. Adams #endif
13082e68589bSMark F. Adams     if( jj == 0 ) {
13092e68589bSMark F. Adams       KSP eksp;
13102e68589bSMark F. Adams       Vec bb, xx;
13112e68589bSMark F. Adams       PC pc;
13122e68589bSMark F. Adams       ierr = MatGetVecs( Amat, &bb, 0 );         CHKERRQ(ierr);
13132e68589bSMark F. Adams       ierr = MatGetVecs( Amat, &xx, 0 );         CHKERRQ(ierr);
13142e68589bSMark F. Adams       {
13152e68589bSMark F. Adams         PetscRandom    rctx;
13162e68589bSMark F. Adams         ierr = PetscRandomCreate(wcomm,&rctx);CHKERRQ(ierr);
13172e68589bSMark F. Adams         ierr = PetscRandomSetFromOptions(rctx);CHKERRQ(ierr);
13182e68589bSMark F. Adams         ierr = VecSetRandom(bb,rctx);CHKERRQ(ierr);
13192e68589bSMark F. Adams         ierr = PetscRandomDestroy( &rctx ); CHKERRQ(ierr);
13202e68589bSMark F. Adams       }
13212e68589bSMark F. Adams       ierr = KSPCreate(wcomm,&eksp);                            CHKERRQ(ierr);
1322db36e5aeSMark F. Adams       ierr = KSPAppendOptionsPrefix( eksp, "gamg_est_");         CHKERRQ(ierr);
13232e68589bSMark F. Adams       ierr = KSPSetFromOptions( eksp );    CHKERRQ(ierr);
13242e68589bSMark F. Adams       ierr = KSPSetInitialGuessNonzero( eksp, PETSC_FALSE );    CHKERRQ(ierr);
13252e68589bSMark F. Adams       ierr = KSPSetOperators( eksp, Amat, Amat, SAME_NONZERO_PATTERN );
13262e68589bSMark F. Adams       CHKERRQ( ierr );
13272e68589bSMark F. Adams       ierr = KSPGetPC( eksp, &pc );                              CHKERRQ( ierr );
13282e68589bSMark F. Adams       ierr = PCSetType( pc, PCJACOBI ); CHKERRQ(ierr);  /* smoother */
13292e68589bSMark F. Adams       ierr = KSPSetTolerances(eksp,PETSC_DEFAULT,PETSC_DEFAULT,PETSC_DEFAULT,10);
13302e68589bSMark F. Adams       CHKERRQ(ierr);
13312e68589bSMark F. Adams       ierr = KSPSetNormType( eksp, KSP_NORM_NONE );                 CHKERRQ(ierr);
13322e68589bSMark F. Adams       ierr = KSPSetComputeSingularValues( eksp,PETSC_TRUE );        CHKERRQ(ierr);
13332e68589bSMark F. Adams 
13342e68589bSMark F. Adams       /* solve - keep stuff out of logging */
13352e68589bSMark F. Adams       ierr = PetscLogEventDeactivate(KSP_Solve);CHKERRQ(ierr);
13362e68589bSMark F. Adams       ierr = PetscLogEventDeactivate(PC_Apply);CHKERRQ(ierr);
13372e68589bSMark F. Adams       ierr = KSPSolve( eksp, bb, xx );                              CHKERRQ(ierr);
13382e68589bSMark F. Adams       ierr = PetscLogEventActivate(KSP_Solve);CHKERRQ(ierr);
13392e68589bSMark F. Adams       ierr = PetscLogEventActivate(PC_Apply);CHKERRQ(ierr);
13402e68589bSMark F. Adams 
13412e68589bSMark F. Adams       ierr = KSPComputeExtremeSingularValues( eksp, &emax, &emin ); CHKERRQ(ierr);
13422e68589bSMark F. Adams       if( verbose ) {
1343c8b0795cSMark F. Adams         PetscPrintf(wcomm,"\t\t\t%s smooth P0: max eigen=%e min=%e PC=%s\n",
13442e68589bSMark F. Adams                     __FUNCT__,emax,emin,PCJACOBI);
13452e68589bSMark F. Adams       }
13462e68589bSMark F. Adams       ierr = VecDestroy( &xx );       CHKERRQ(ierr);
13472e68589bSMark F. Adams       ierr = VecDestroy( &bb );       CHKERRQ(ierr);
13482e68589bSMark F. Adams       ierr = KSPDestroy( &eksp );     CHKERRQ(ierr);
13492e68589bSMark F. Adams 
13502e68589bSMark F. Adams       if( pc_gamg->emax_id == -1 ) {
13512e68589bSMark F. Adams         ierr = PetscObjectComposedDataRegister( &pc_gamg->emax_id );
13522e68589bSMark F. Adams         assert(pc_gamg->emax_id != -1 );
13532e68589bSMark F. Adams       }
13542e68589bSMark F. Adams       ierr = PetscObjectComposedDataSetScalar( (PetscObject)Amat, pc_gamg->emax_id, emax ); CHKERRQ(ierr);
13552e68589bSMark F. Adams     }
13562e68589bSMark F. Adams 
13572e68589bSMark F. Adams     /* smooth P1 := (I - omega/lam D^{-1}A)P0 */
13582e68589bSMark F. Adams     ierr = MatMatMult( Amat, Prol, MAT_INITIAL_MATRIX, PETSC_DEFAULT, &tMat );   CHKERRQ(ierr);
13592e68589bSMark F. Adams     ierr = MatGetVecs( Amat, &diag, 0 );    CHKERRQ(ierr);
13602e68589bSMark F. Adams     ierr = MatGetDiagonal( Amat, diag );    CHKERRQ(ierr); /* effectively PCJACOBI */
13612e68589bSMark F. Adams     ierr = VecReciprocal( diag );         CHKERRQ(ierr);
13622e68589bSMark F. Adams     ierr = MatDiagonalScale( tMat, diag, 0 ); CHKERRQ(ierr);
13632e68589bSMark F. Adams     ierr = VecDestroy( &diag );           CHKERRQ(ierr);
13642e68589bSMark F. Adams     alpha = -1.5/emax;
13652e68589bSMark F. Adams     ierr = MatAYPX( tMat, alpha, Prol, SUBSET_NONZERO_PATTERN );           CHKERRQ(ierr);
13662e68589bSMark F. Adams     ierr = MatDestroy( &Prol );  CHKERRQ(ierr);
13672e68589bSMark F. Adams     Prol = tMat;
13680cbbd2e1SMark F. Adams #if defined PETSC_GAMG_USE_LOG
13690cbbd2e1SMark F. Adams     ierr = PetscLogEventEnd(petsc_gamg_setup_events[SET9],0,0,0,0);CHKERRQ(ierr);
13702e68589bSMark F. Adams #endif
13712e68589bSMark F. Adams   }
13720cbbd2e1SMark F. Adams #if defined PETSC_USE_LOG
13730cbbd2e1SMark F. Adams   ierr = PetscLogEventEnd(PC_GAMGOptprol_AGG,0,0,0,0);CHKERRQ(ierr);
13740cbbd2e1SMark F. Adams #endif
1375c8b0795cSMark F. Adams   *a_P = Prol;
1376c8b0795cSMark F. Adams 
1377c8b0795cSMark F. Adams   PetscFunctionReturn(0);
13782e68589bSMark F. Adams }
13792e68589bSMark F. Adams 
1380c8b0795cSMark F. Adams /* -------------------------------------------------------------------------- */
1381c8b0795cSMark F. Adams /*
1382*a2f3521dSMark F. Adams    PCGAMGKKTProl_AGG
1383*a2f3521dSMark F. Adams 
1384*a2f3521dSMark F. Adams   Input Parameter:
1385*a2f3521dSMark F. Adams    . pc - this
1386*a2f3521dSMark F. Adams    . Prol11 - matrix on this fine level
1387*a2f3521dSMark F. Adams    . A21 - matrix on this fine level
1388*a2f3521dSMark F. Adams  In/Output Parameter:
1389*a2f3521dSMark F. Adams    . a_P22 - prolongation operator to the next level
1390*a2f3521dSMark F. Adams */
1391*a2f3521dSMark F. Adams #undef __FUNCT__
1392*a2f3521dSMark F. Adams #define __FUNCT__ "PCGAMGKKTProl_AGG"
1393*a2f3521dSMark F. Adams PetscErrorCode PCGAMGKKTProl_AGG( PC pc,
1394*a2f3521dSMark F. Adams                                   const Mat Prol11,
1395*a2f3521dSMark F. Adams                                   const Mat A21,
1396*a2f3521dSMark F. Adams                                   Mat *a_P22
1397*a2f3521dSMark F. Adams                                   )
1398*a2f3521dSMark F. Adams {
1399*a2f3521dSMark F. Adams   PetscErrorCode ierr;
1400*a2f3521dSMark F. Adams   PC_MG          *mg = (PC_MG*)pc->data;
1401*a2f3521dSMark F. Adams   PC_GAMG        *pc_gamg = (PC_GAMG*)mg->innerctx;
1402*a2f3521dSMark F. Adams   const PetscInt verbose = pc_gamg->verbose;
1403*a2f3521dSMark F. Adams   /* PC_GAMG_AGG    *pc_gamg_agg = (PC_GAMG_AGG*)pc_gamg->subctx;  */
1404*a2f3521dSMark F. Adams   PetscMPIInt    mype,npe;
1405*a2f3521dSMark F. Adams   Mat            Prol22,Tmat,Gmat;
1406*a2f3521dSMark F. Adams   MPI_Comm       wcomm = ((PetscObject)pc)->comm;
1407*a2f3521dSMark F. Adams   PetscCoarsenData *agg_lists;
1408*a2f3521dSMark F. Adams 
1409*a2f3521dSMark F. Adams   PetscFunctionBegin;
1410*a2f3521dSMark F. Adams #if defined PETSC_USE_LOG
1411*a2f3521dSMark F. Adams   ierr = PetscLogEventBegin(PC_GAMGKKTProl_AGG,0,0,0,0); CHKERRQ(ierr);
1412*a2f3521dSMark F. Adams #endif
1413*a2f3521dSMark F. Adams   ierr = MPI_Comm_rank( wcomm, &mype);  CHKERRQ(ierr);
1414*a2f3521dSMark F. Adams   ierr = MPI_Comm_size( wcomm, &npe);   CHKERRQ(ierr);
1415*a2f3521dSMark F. Adams 
1416*a2f3521dSMark F. Adams   /* form C graph */
1417*a2f3521dSMark F. Adams   ierr = MatMatMult( A21, Prol11, MAT_INITIAL_MATRIX, PETSC_DEFAULT, &Tmat);   CHKERRQ(ierr);
1418*a2f3521dSMark F. Adams   ierr = MatMatTransposeMult(Tmat, Tmat, MAT_INITIAL_MATRIX, PETSC_DEFAULT, &Gmat ); CHKERRQ(ierr);
1419*a2f3521dSMark F. Adams   ierr = MatDestroy(&Tmat);      CHKERRQ(ierr);
1420*a2f3521dSMark F. Adams   ierr  = PCGAMGFilterGraph(&Gmat, 0.0, PETSC_FALSE, verbose); CHKERRQ(ierr);
1421*a2f3521dSMark F. Adams 
1422*a2f3521dSMark F. Adams   /* coarsen constraints */
1423*a2f3521dSMark F. Adams   {
1424*a2f3521dSMark F. Adams     MatCoarsen crs;
1425*a2f3521dSMark F. Adams     ierr = MatCoarsenCreate( wcomm, &crs ); CHKERRQ(ierr);
1426*a2f3521dSMark F. Adams     ierr = MatCoarsenSetType( crs, MATCOARSENMIS ); CHKERRQ(ierr);
1427*a2f3521dSMark F. Adams     ierr = MatCoarsenSetAdjacency( crs, Gmat ); CHKERRQ(ierr);
1428*a2f3521dSMark F. Adams     ierr = MatCoarsenSetVerbose( crs, verbose ); CHKERRQ(ierr);
1429*a2f3521dSMark F. Adams     ierr = MatCoarsenSetStrictAggs( crs, PETSC_TRUE ); CHKERRQ(ierr);
1430*a2f3521dSMark F. Adams     ierr = MatCoarsenApply( crs ); CHKERRQ(ierr);
1431*a2f3521dSMark F. Adams     ierr = MatCoarsenGetData( crs, &agg_lists ); CHKERRQ(ierr);
1432*a2f3521dSMark F. Adams     ierr = MatCoarsenDestroy( &crs ); CHKERRQ(ierr);
1433*a2f3521dSMark F. Adams   }
1434*a2f3521dSMark F. Adams 
1435*a2f3521dSMark F. Adams   /* form simple prolongation 'Prol22' */
1436*a2f3521dSMark F. Adams   {
1437*a2f3521dSMark F. Adams     PetscInt ii,mm,clid,my0,nloc,nLocalSelected;
1438*a2f3521dSMark F. Adams     PetscScalar val = 1.0;
1439*a2f3521dSMark F. Adams     /* get 'nLocalSelected' */
1440*a2f3521dSMark F. Adams     ierr = MatGetLocalSize( Gmat, &nloc, &ii ); CHKERRQ(ierr);
1441*a2f3521dSMark F. Adams     for( ii=0, nLocalSelected = 0 ; ii < nloc ; ii++ ){
1442*a2f3521dSMark F. Adams       PetscBool ise;
1443*a2f3521dSMark F. Adams       /* filter out singletons 0 or 1? */
1444*a2f3521dSMark F. Adams       ierr = PetscCDEmptyAt( agg_lists, ii, &ise ); CHKERRQ(ierr);
1445*a2f3521dSMark F. Adams       if( !ise ) nLocalSelected++;
1446*a2f3521dSMark F. Adams     }
1447*a2f3521dSMark F. Adams 
1448*a2f3521dSMark F. Adams     ierr = MatCreate(wcomm,&Prol22);CHKERRQ(ierr);
1449*a2f3521dSMark F. Adams     ierr = MatSetSizes( Prol22,nloc, nLocalSelected,
1450*a2f3521dSMark F. Adams                         PETSC_DETERMINE, PETSC_DETERMINE);
1451*a2f3521dSMark F. Adams     CHKERRQ(ierr);
1452*a2f3521dSMark F. Adams     ierr = MatSetType( Prol22, MATAIJ );       CHKERRQ(ierr);
1453*a2f3521dSMark F. Adams     ierr = MatSeqAIJSetPreallocation(Prol22,1,PETSC_NULL); CHKERRQ(ierr);
1454*a2f3521dSMark F. Adams     ierr = MatMPIAIJSetPreallocation(Prol22,1,PETSC_NULL,1,PETSC_NULL);
1455*a2f3521dSMark F. Adams     CHKERRQ(ierr);
1456*a2f3521dSMark F. Adams     /* ierr = MatCreateAIJ( wcomm, */
1457*a2f3521dSMark F. Adams     /*                      nloc, nLocalSelected, */
1458*a2f3521dSMark F. Adams     /*                      PETSC_DETERMINE, PETSC_DETERMINE, */
1459*a2f3521dSMark F. Adams     /*                      1, PETSC_NULL, 1, PETSC_NULL, */
1460*a2f3521dSMark F. Adams     /*                      &Prol22 ); */
1461*a2f3521dSMark F. Adams 
1462*a2f3521dSMark F. Adams     ierr = MatGetOwnershipRange( Prol22, &my0, &ii );    CHKERRQ(ierr);
1463*a2f3521dSMark F. Adams     nloc = ii - my0;
1464*a2f3521dSMark F. Adams 
1465*a2f3521dSMark F. Adams     /* make aggregates */
1466*a2f3521dSMark F. Adams     for( mm = clid = 0 ; mm < nloc ; mm++ ){
1467*a2f3521dSMark F. Adams       ierr = PetscCDSizeAt( agg_lists, mm, &ii ); CHKERRQ(ierr);
1468*a2f3521dSMark F. Adams       if( ii > 0 ) {
1469*a2f3521dSMark F. Adams         PetscInt asz=ii,cgid=my0+clid,rids[1000];
1470*a2f3521dSMark F. Adams         PetscCDPos pos;
1471*a2f3521dSMark F. Adams         if(asz>1000)SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Very large aggregate: %d",asz);
1472*a2f3521dSMark F. Adams         ii = 0;
1473*a2f3521dSMark F. Adams         ierr = PetscCDGetHeadPos(agg_lists,mm,&pos); CHKERRQ(ierr);
1474*a2f3521dSMark F. Adams         while(pos){
1475*a2f3521dSMark F. Adams           PetscInt gid1;
1476*a2f3521dSMark F. Adams           ierr = PetscLLNGetID( pos, &gid1 ); CHKERRQ(ierr);
1477*a2f3521dSMark F. Adams           ierr = PetscCDGetNextPos(agg_lists,mm,&pos); CHKERRQ(ierr);
1478*a2f3521dSMark F. Adams 
1479*a2f3521dSMark F. Adams           rids[ii++] = gid1;
1480*a2f3521dSMark F. Adams         }
1481*a2f3521dSMark F. Adams         assert(ii==asz);
1482*a2f3521dSMark F. Adams         /* add diagonal block of P0 */
1483*a2f3521dSMark F. Adams         ierr = MatSetValues(Prol22,asz,rids,1,&cgid,&val,INSERT_VALUES); CHKERRQ(ierr);
1484*a2f3521dSMark F. Adams 
1485*a2f3521dSMark F. Adams         clid++;
1486*a2f3521dSMark F. Adams       } /* coarse agg */
1487*a2f3521dSMark F. Adams     } /* for all fine nodes */
1488*a2f3521dSMark F. Adams     ierr = MatAssemblyBegin(Prol22,MAT_FINAL_ASSEMBLY);  CHKERRQ(ierr);
1489*a2f3521dSMark F. Adams     ierr = MatAssemblyEnd(Prol22,MAT_FINAL_ASSEMBLY);    CHKERRQ(ierr);
1490*a2f3521dSMark F. Adams   }
1491*a2f3521dSMark F. Adams 
1492*a2f3521dSMark F. Adams   /* clean up */
1493*a2f3521dSMark F. Adams   ierr = MatDestroy( &Gmat );      CHKERRQ(ierr);
1494*a2f3521dSMark F. Adams   ierr = PetscCDDestroy( agg_lists );  CHKERRQ(ierr);
1495*a2f3521dSMark F. Adams #if defined PETSC_USE_LOG
1496*a2f3521dSMark F. Adams   ierr = PetscLogEventEnd(PC_GAMGKKTProl_AGG,0,0,0,0);CHKERRQ(ierr);
1497*a2f3521dSMark F. Adams #endif
1498*a2f3521dSMark F. Adams   *a_P22 = Prol22;
1499*a2f3521dSMark F. Adams 
1500*a2f3521dSMark F. Adams   PetscFunctionReturn(0);
1501*a2f3521dSMark F. Adams }
1502*a2f3521dSMark F. Adams 
1503*a2f3521dSMark F. Adams /* -------------------------------------------------------------------------- */
1504*a2f3521dSMark F. Adams /*
1505c8b0795cSMark F. Adams    PCCreateGAMG_AGG
15062e68589bSMark F. Adams 
1507c8b0795cSMark F. Adams   Input Parameter:
1508c8b0795cSMark F. Adams    . pc -
1509c8b0795cSMark F. Adams */
1510c8b0795cSMark F. Adams #undef __FUNCT__
1511c8b0795cSMark F. Adams #define __FUNCT__ "PCCreateGAMG_AGG"
1512c8b0795cSMark F. Adams PetscErrorCode  PCCreateGAMG_AGG( PC pc )
1513c8b0795cSMark F. Adams {
1514c8b0795cSMark F. Adams   PetscErrorCode  ierr;
1515c8b0795cSMark F. Adams   PC_MG           *mg = (PC_MG*)pc->data;
1516c8b0795cSMark F. Adams   PC_GAMG         *pc_gamg = (PC_GAMG*)mg->innerctx;
1517c8b0795cSMark F. Adams   PC_GAMG_AGG      *pc_gamg_agg;
15182e68589bSMark F. Adams 
1519c8b0795cSMark F. Adams   PetscFunctionBegin;
1520c8b0795cSMark F. Adams   /* create sub context for SA */
1521c8b0795cSMark F. Adams   ierr = PetscNewLog( pc, PC_GAMG_AGG, &pc_gamg_agg ); CHKERRQ(ierr);
1522c8b0795cSMark F. Adams   assert(!pc_gamg->subctx);
1523c8b0795cSMark F. Adams   pc_gamg->subctx = pc_gamg_agg;
1524c8b0795cSMark F. Adams 
1525c8b0795cSMark F. Adams   pc->ops->setfromoptions = PCSetFromOptions_GAMG_AGG;
1526c8b0795cSMark F. Adams   pc->ops->destroy        = PCDestroy_AGG;
1527c8b0795cSMark F. Adams   /* reset does not do anything; setup not virtual */
1528c8b0795cSMark F. Adams 
1529c8b0795cSMark F. Adams   /* set internal function pointers */
1530c8b0795cSMark F. Adams   pc_gamg->graph = PCGAMGgraph_AGG;
1531b43b03e9SMark F. Adams   pc_gamg->coarsen = PCGAMGCoarsen_AGG;
15320cbbd2e1SMark F. Adams   pc_gamg->prolongator = PCGAMGProlongator_AGG;
15330cbbd2e1SMark F. Adams   pc_gamg->optprol = PCGAMGOptprol_AGG;
1534*a2f3521dSMark F. Adams   pc_gamg->formkktprol = PCGAMGKKTProl_AGG;
1535c8b0795cSMark F. Adams 
1536c8b0795cSMark F. Adams   pc_gamg->createdefaultdata = PCSetData_AGG;
1537c8b0795cSMark F. Adams 
1538c8b0795cSMark F. Adams   ierr = PetscObjectComposeFunctionDynamic( (PetscObject)pc,
1539c8b0795cSMark F. Adams                                             "PCSetCoordinates_C",
1540c8b0795cSMark F. Adams                                             "PCSetCoordinates_AGG",
1541c8b0795cSMark F. Adams                                             PCSetCoordinates_AGG);
15422e68589bSMark F. Adams   PetscFunctionReturn(0);
15432e68589bSMark F. Adams }
1544