xref: /petsc/src/ksp/pc/impls/bddc/bddc.c (revision 142dfd88fad70709bea34a03392fddd5b04e20f1)
/* TODOLIST
   DofSplitting and DM attached to pc?
   Change SetNeumannBoundaries to SetNeumannBoundariesLocal and provide new SetNeumannBoundaries (same for Dirichlet)
     - change prec_type to switch_inexact_prec_type
   Inexact solvers: global preconditioner application is ready; ask the developers (Jed?) how to best implement Dohrmann's approach (PCSHELL?)
   change how to deal with the coarse problem (PCBDDCSetCoarseEnvironment):
     - simplify coarse problem structure -> PCBDDC or PCREDUNDANT, nothing else -> same comm for all levels?
     - remove coarse enums and allow use of PCBDDCGetCoarseKSP
     - remove metis dependency -> use MatPartitioning for multilevel -> Assemble serial adjacency in ManageLocalBoundaries?
     - Add levels' slot to bddc data structure and associated Set/Get functions
   code refactoring:
     - pick better names for static functions
   change options structure:
     - insert BDDC into MG framework?
   provide other ops? Ask the developers
   remove all unused printf
   man pages
*/
190c7d97c5SJed Brown 
2053cdbc3dSStefano Zampini /* ----------------------------------------------------------------------------------------------------------------------------------------------
210c7d97c5SJed Brown    Implementation of BDDC preconditioner based on:
220c7d97c5SJed Brown    C. Dohrmann "An approximate BDDC preconditioner", Numerical Linear Algebra with Applications Volume 14, Issue 2, pages 149-168, March 2007
2353cdbc3dSStefano Zampini    ---------------------------------------------------------------------------------------------------------------------------------------------- */
2453cdbc3dSStefano Zampini 
2553cdbc3dSStefano Zampini #include "bddc.h" /*I "petscpc.h" I*/  /* includes for fortran wrappers */
263b03a366Sstefano_zampini #include <petscblaslapack.h>
270c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
280c7d97c5SJed Brown #undef __FUNCT__
290c7d97c5SJed Brown #define __FUNCT__ "PCSetFromOptions_BDDC"
300c7d97c5SJed Brown PetscErrorCode PCSetFromOptions_BDDC(PC pc)
310c7d97c5SJed Brown {
320c7d97c5SJed Brown   PC_BDDC         *pcbddc = (PC_BDDC*)pc->data;
330c7d97c5SJed Brown   PetscErrorCode ierr;
340c7d97c5SJed Brown 
350c7d97c5SJed Brown   PetscFunctionBegin;
360c7d97c5SJed Brown   ierr = PetscOptionsHead("BDDC options");CHKERRQ(ierr);
370c7d97c5SJed Brown   /* Verbose debugging of main data structures */
38e269702eSStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_check_all"       ,"Verbose (debugging) output for PCBDDC"                       ,"none",pcbddc->dbg_flag      ,&pcbddc->dbg_flag      ,PETSC_NULL);CHKERRQ(ierr);
390c7d97c5SJed Brown   /* Some customization for default primal space */
40da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_vertices_only"   ,"Use only vertices in coarse space (i.e. discard constraints)","none",pcbddc->vertices_flag   ,&pcbddc->vertices_flag   ,PETSC_NULL);CHKERRQ(ierr);
41da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_constraints_only","Use only constraints in coarse space (i.e. discard vertices)","none",pcbddc->constraints_flag,&pcbddc->constraints_flag,PETSC_NULL);CHKERRQ(ierr);
42da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_faces_only"      ,"Use only faces among constraints of coarse space (i.e. discard edges)"         ,"none",pcbddc->faces_flag      ,&pcbddc->faces_flag      ,PETSC_NULL);CHKERRQ(ierr);
43da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_edges_only"      ,"Use only edges among constraints of coarse space (i.e. discard faces)"         ,"none",pcbddc->edges_flag      ,&pcbddc->edges_flag      ,PETSC_NULL);CHKERRQ(ierr);
440c7d97c5SJed Brown   /* Coarse solver context */
456c667b0aSStefano Zampini   static const char * const avail_coarse_problems[] = {"sequential","replicated","parallel","multilevel","CoarseProblemType","PC_BDDC_",0}; /*order of choiches depends on ENUM defined in bddc.h */
460c7d97c5SJed Brown   ierr = PetscOptionsEnum("-pc_bddc_coarse_problem_type","Set coarse problem type","none",avail_coarse_problems,(PetscEnum)pcbddc->coarse_problem_type,(PetscEnum*)&pcbddc->coarse_problem_type,PETSC_NULL);CHKERRQ(ierr);
470c7d97c5SJed Brown   /* Two different application of BDDC to the whole set of dofs, internal and interface */
480c7d97c5SJed Brown   ierr = PetscOptionsBool("-pc_bddc_switch_preconditioning_type","Switch between M_2 (default) and M_3 preconditioners (as defined by Dohrmann)","none",pcbddc->prec_type,&pcbddc->prec_type,PETSC_NULL);CHKERRQ(ierr);
49534831adSStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_use_change_of_basis","Use change of basis approach for primal space","none",pcbddc->usechangeofbasis,&pcbddc->usechangeofbasis,PETSC_NULL);CHKERRQ(ierr);
50534831adSStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_use_change_on_faces","Use change of basis approach for face constraints","none",pcbddc->usechangeonfaces,&pcbddc->usechangeonfaces,PETSC_NULL);CHKERRQ(ierr);
51534831adSStefano Zampini   pcbddc->usechangeonfaces = pcbddc->usechangeonfaces && pcbddc->usechangeofbasis;
520c7d97c5SJed Brown   ierr = PetscOptionsInt("-pc_bddc_coarsening_ratio","Set coarsening ratio used in multilevel coarsening","none",pcbddc->coarsening_ratio,&pcbddc->coarsening_ratio,PETSC_NULL);CHKERRQ(ierr);
530c7d97c5SJed Brown   ierr = PetscOptionsTail();CHKERRQ(ierr);
540c7d97c5SJed Brown   PetscFunctionReturn(0);
550c7d97c5SJed Brown }
560c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
570c7d97c5SJed Brown EXTERN_C_BEGIN
580c7d97c5SJed Brown #undef __FUNCT__
590c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetCoarseProblemType_BDDC"
6053cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetCoarseProblemType_BDDC(PC pc, CoarseProblemType CPT)
610c7d97c5SJed Brown {
620c7d97c5SJed Brown   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
630c7d97c5SJed Brown 
640c7d97c5SJed Brown   PetscFunctionBegin;
650c7d97c5SJed Brown   pcbddc->coarse_problem_type = CPT;
660c7d97c5SJed Brown   PetscFunctionReturn(0);
670c7d97c5SJed Brown }
680c7d97c5SJed Brown EXTERN_C_END
690c7d97c5SJed Brown #undef __FUNCT__
700c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetCoarseProblemType"
7153cdbc3dSStefano Zampini /*@
729c0446d6SStefano Zampini  PCBDDCSetCoarseProblemType - Set coarse problem type in PCBDDC.
7353cdbc3dSStefano Zampini 
749c0446d6SStefano Zampini    Not collective
7553cdbc3dSStefano Zampini 
7653cdbc3dSStefano Zampini    Input Parameters:
7753cdbc3dSStefano Zampini +  pc - the preconditioning context
7853cdbc3dSStefano Zampini -  CoarseProblemType - pick a better name and explain what this is
7953cdbc3dSStefano Zampini 
8053cdbc3dSStefano Zampini    Level: intermediate
8153cdbc3dSStefano Zampini 
8253cdbc3dSStefano Zampini    Notes:
83da1bb401SStefano Zampini    Not collective but all procs must call with same arguments.
8453cdbc3dSStefano Zampini 
8553cdbc3dSStefano Zampini .seealso: PCBDDC
8653cdbc3dSStefano Zampini @*/
870c7d97c5SJed Brown PetscErrorCode PCBDDCSetCoarseProblemType(PC pc, CoarseProblemType CPT)
880c7d97c5SJed Brown {
890c7d97c5SJed Brown   PetscErrorCode ierr;
900c7d97c5SJed Brown 
910c7d97c5SJed Brown   PetscFunctionBegin;
920c7d97c5SJed Brown   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
930c7d97c5SJed Brown   ierr = PetscTryMethod(pc,"PCBDDCSetCoarseProblemType_C",(PC,CoarseProblemType),(pc,CPT));CHKERRQ(ierr);
940c7d97c5SJed Brown   PetscFunctionReturn(0);
950c7d97c5SJed Brown }
960c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
970c7d97c5SJed Brown EXTERN_C_BEGIN
980c7d97c5SJed Brown #undef __FUNCT__
993b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCSetDirichletBoundaries_BDDC"
1003b03a366Sstefano_zampini static PetscErrorCode PCBDDCSetDirichletBoundaries_BDDC(PC pc,IS DirichletBoundaries)
1013b03a366Sstefano_zampini {
1023b03a366Sstefano_zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
1033b03a366Sstefano_zampini   PetscErrorCode ierr;
1043b03a366Sstefano_zampini 
1053b03a366Sstefano_zampini   PetscFunctionBegin;
1063b03a366Sstefano_zampini   ierr = ISDestroy(&pcbddc->DirichletBoundaries);CHKERRQ(ierr);
10736e030ebSStefano Zampini   ierr = PetscObjectReference((PetscObject)DirichletBoundaries);CHKERRQ(ierr);
10836e030ebSStefano Zampini   pcbddc->DirichletBoundaries=DirichletBoundaries;
1093b03a366Sstefano_zampini   PetscFunctionReturn(0);
1103b03a366Sstefano_zampini }
1113b03a366Sstefano_zampini EXTERN_C_END
1123b03a366Sstefano_zampini #undef __FUNCT__
1133b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCSetDirichletBoundaries"
1143b03a366Sstefano_zampini /*@
115da1bb401SStefano Zampini  PCBDDCSetDirichletBoundaries - Set index set defining subdomain part (in local ordering)
116da1bb401SStefano Zampini                               of Dirichlet boundaries for the global problem.
1173b03a366Sstefano_zampini 
1183b03a366Sstefano_zampini    Not collective
1193b03a366Sstefano_zampini 
1203b03a366Sstefano_zampini    Input Parameters:
1213b03a366Sstefano_zampini +  pc - the preconditioning context
1223b03a366Sstefano_zampini -  DirichletBoundaries - sequential index set defining the subdomain part of Dirichlet boundaries (can be PETSC_NULL)
1233b03a366Sstefano_zampini 
1243b03a366Sstefano_zampini    Level: intermediate
1253b03a366Sstefano_zampini 
1263b03a366Sstefano_zampini    Notes:
1273b03a366Sstefano_zampini 
1283b03a366Sstefano_zampini .seealso: PCBDDC
1293b03a366Sstefano_zampini @*/
1303b03a366Sstefano_zampini PetscErrorCode PCBDDCSetDirichletBoundaries(PC pc,IS DirichletBoundaries)
1313b03a366Sstefano_zampini {
1323b03a366Sstefano_zampini   PetscErrorCode ierr;
1333b03a366Sstefano_zampini 
1343b03a366Sstefano_zampini   PetscFunctionBegin;
1353b03a366Sstefano_zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
1363b03a366Sstefano_zampini   ierr = PetscTryMethod(pc,"PCBDDCSetDirichletBoundaries_C",(PC,IS),(pc,DirichletBoundaries));CHKERRQ(ierr);
1373b03a366Sstefano_zampini   PetscFunctionReturn(0);
1383b03a366Sstefano_zampini }
1393b03a366Sstefano_zampini /* -------------------------------------------------------------------------- */
1403b03a366Sstefano_zampini EXTERN_C_BEGIN
1413b03a366Sstefano_zampini #undef __FUNCT__
1420c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetNeumannBoundaries_BDDC"
14353cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetNeumannBoundaries_BDDC(PC pc,IS NeumannBoundaries)
1440c7d97c5SJed Brown {
1450c7d97c5SJed Brown   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
14653cdbc3dSStefano Zampini   PetscErrorCode ierr;
1470c7d97c5SJed Brown 
1480c7d97c5SJed Brown   PetscFunctionBegin;
14953cdbc3dSStefano Zampini   ierr = ISDestroy(&pcbddc->NeumannBoundaries);CHKERRQ(ierr);
15036e030ebSStefano Zampini   ierr = PetscObjectReference((PetscObject)NeumannBoundaries);CHKERRQ(ierr);
15136e030ebSStefano Zampini   pcbddc->NeumannBoundaries=NeumannBoundaries;
1520c7d97c5SJed Brown   PetscFunctionReturn(0);
1530c7d97c5SJed Brown }
1540c7d97c5SJed Brown EXTERN_C_END
1550c7d97c5SJed Brown #undef __FUNCT__
1560c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetNeumannBoundaries"
15757527edcSJed Brown /*@
158da1bb401SStefano Zampini  PCBDDCSetNeumannBoundaries - Set index set defining subdomain part (in local ordering)
159da1bb401SStefano Zampini                               of Neumann boundaries for the global problem.
16057527edcSJed Brown 
1619c0446d6SStefano Zampini    Not collective
16257527edcSJed Brown 
16357527edcSJed Brown    Input Parameters:
16457527edcSJed Brown +  pc - the preconditioning context
1659c0446d6SStefano Zampini -  NeumannBoundaries - sequential index set defining the subdomain part of Neumann boundaries (can be PETSC_NULL)
16657527edcSJed Brown 
16757527edcSJed Brown    Level: intermediate
16857527edcSJed Brown 
16957527edcSJed Brown    Notes:
17057527edcSJed Brown 
17157527edcSJed Brown .seealso: PCBDDC
17257527edcSJed Brown @*/
17353cdbc3dSStefano Zampini PetscErrorCode PCBDDCSetNeumannBoundaries(PC pc,IS NeumannBoundaries)
1740c7d97c5SJed Brown {
1750c7d97c5SJed Brown   PetscErrorCode ierr;
1760c7d97c5SJed Brown 
1770c7d97c5SJed Brown   PetscFunctionBegin;
1780c7d97c5SJed Brown   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
17953cdbc3dSStefano Zampini   ierr = PetscTryMethod(pc,"PCBDDCSetNeumannBoundaries_C",(PC,IS),(pc,NeumannBoundaries));CHKERRQ(ierr);
18053cdbc3dSStefano Zampini   PetscFunctionReturn(0);
18153cdbc3dSStefano Zampini }
18253cdbc3dSStefano Zampini /* -------------------------------------------------------------------------- */
18353cdbc3dSStefano Zampini EXTERN_C_BEGIN
18453cdbc3dSStefano Zampini #undef __FUNCT__
185da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCGetDirichletBoundaries_BDDC"
186da1bb401SStefano Zampini static PetscErrorCode PCBDDCGetDirichletBoundaries_BDDC(PC pc,IS *DirichletBoundaries)
187da1bb401SStefano Zampini {
188da1bb401SStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
189da1bb401SStefano Zampini 
190da1bb401SStefano Zampini   PetscFunctionBegin;
191da1bb401SStefano Zampini   *DirichletBoundaries = pcbddc->DirichletBoundaries;
192da1bb401SStefano Zampini   PetscFunctionReturn(0);
193da1bb401SStefano Zampini }
194da1bb401SStefano Zampini EXTERN_C_END
195da1bb401SStefano Zampini #undef __FUNCT__
196da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCGetDirichletBoundaries"
197da1bb401SStefano Zampini /*@
198da1bb401SStefano Zampini  PCBDDCGetDirichletBoundaries - Get index set defining subdomain part (in local ordering)
199da1bb401SStefano Zampini                                 of Dirichlet boundaries for the global problem.
200da1bb401SStefano Zampini 
201da1bb401SStefano Zampini    Not collective
202da1bb401SStefano Zampini 
203da1bb401SStefano Zampini    Input Parameters:
204da1bb401SStefano Zampini +  pc - the preconditioning context
205da1bb401SStefano Zampini 
206da1bb401SStefano Zampini    Output Parameters:
207da1bb401SStefano Zampini +  DirichletBoundaries - index set defining the subdomain part of Dirichlet boundaries
208da1bb401SStefano Zampini 
209da1bb401SStefano Zampini    Level: intermediate
210da1bb401SStefano Zampini 
211da1bb401SStefano Zampini    Notes:
212da1bb401SStefano Zampini 
213da1bb401SStefano Zampini .seealso: PCBDDC
214da1bb401SStefano Zampini @*/
215da1bb401SStefano Zampini PetscErrorCode PCBDDCGetDirichletBoundaries(PC pc,IS *DirichletBoundaries)
216da1bb401SStefano Zampini {
217da1bb401SStefano Zampini   PetscErrorCode ierr;
218da1bb401SStefano Zampini 
219da1bb401SStefano Zampini   PetscFunctionBegin;
220da1bb401SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
221da1bb401SStefano Zampini   ierr = PetscUseMethod(pc,"PCBDDCGetDirichletBoundaries_C",(PC,IS*),(pc,DirichletBoundaries));CHKERRQ(ierr);
222da1bb401SStefano Zampini   PetscFunctionReturn(0);
223da1bb401SStefano Zampini }
224da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
225da1bb401SStefano Zampini EXTERN_C_BEGIN
226da1bb401SStefano Zampini #undef __FUNCT__
22753cdbc3dSStefano Zampini #define __FUNCT__ "PCBDDCGetNeumannBoundaries_BDDC"
22853cdbc3dSStefano Zampini static PetscErrorCode PCBDDCGetNeumannBoundaries_BDDC(PC pc,IS *NeumannBoundaries)
22953cdbc3dSStefano Zampini {
23053cdbc3dSStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
23153cdbc3dSStefano Zampini 
23253cdbc3dSStefano Zampini   PetscFunctionBegin;
23353cdbc3dSStefano Zampini   *NeumannBoundaries = pcbddc->NeumannBoundaries;
23453cdbc3dSStefano Zampini   PetscFunctionReturn(0);
23553cdbc3dSStefano Zampini }
23653cdbc3dSStefano Zampini EXTERN_C_END
23753cdbc3dSStefano Zampini #undef __FUNCT__
23853cdbc3dSStefano Zampini #define __FUNCT__ "PCBDDCGetNeumannBoundaries"
23953cdbc3dSStefano Zampini /*@
240da1bb401SStefano Zampini  PCBDDCGetNeumannBoundaries - Get index set defining subdomain part (in local ordering)
241da1bb401SStefano Zampini                               of Neumann boundaries for the global problem.
24253cdbc3dSStefano Zampini 
2439c0446d6SStefano Zampini    Not collective
24453cdbc3dSStefano Zampini 
24553cdbc3dSStefano Zampini    Input Parameters:
24653cdbc3dSStefano Zampini +  pc - the preconditioning context
24753cdbc3dSStefano Zampini 
24853cdbc3dSStefano Zampini    Output Parameters:
24953cdbc3dSStefano Zampini +  NeumannBoundaries - index set defining the subdomain part of Neumann boundaries
25053cdbc3dSStefano Zampini 
25153cdbc3dSStefano Zampini    Level: intermediate
25253cdbc3dSStefano Zampini 
25353cdbc3dSStefano Zampini    Notes:
25453cdbc3dSStefano Zampini 
25553cdbc3dSStefano Zampini .seealso: PCBDDC
25653cdbc3dSStefano Zampini @*/
25753cdbc3dSStefano Zampini PetscErrorCode PCBDDCGetNeumannBoundaries(PC pc,IS *NeumannBoundaries)
25853cdbc3dSStefano Zampini {
25953cdbc3dSStefano Zampini   PetscErrorCode ierr;
26053cdbc3dSStefano Zampini 
26153cdbc3dSStefano Zampini   PetscFunctionBegin;
26253cdbc3dSStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
26353cdbc3dSStefano Zampini   ierr = PetscUseMethod(pc,"PCBDDCGetNeumannBoundaries_C",(PC,IS*),(pc,NeumannBoundaries));CHKERRQ(ierr);
2640c7d97c5SJed Brown   PetscFunctionReturn(0);
2650c7d97c5SJed Brown }
26636e030ebSStefano Zampini /* -------------------------------------------------------------------------- */
26736e030ebSStefano Zampini EXTERN_C_BEGIN
26836e030ebSStefano Zampini #undef __FUNCT__
269da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetLocalAdjacencyGraph_BDDC"
270da1bb401SStefano Zampini static PetscErrorCode PCBDDCSetLocalAdjacencyGraph_BDDC(PC pc, PetscInt nvtxs, PetscInt xadj[], PetscInt adjncy[], PetscCopyMode copymode)
27136e030ebSStefano Zampini {
27236e030ebSStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
273da1bb401SStefano Zampini   PCBDDCGraph    mat_graph=pcbddc->mat_graph;
274da1bb401SStefano Zampini   PetscErrorCode ierr;
27536e030ebSStefano Zampini 
27636e030ebSStefano Zampini   PetscFunctionBegin;
277da1bb401SStefano Zampini   mat_graph->nvtxs=nvtxs;
278da1bb401SStefano Zampini   ierr = PetscFree(mat_graph->xadj);CHKERRQ(ierr);
279da1bb401SStefano Zampini   ierr = PetscFree(mat_graph->adjncy);CHKERRQ(ierr);
280da1bb401SStefano Zampini   if(copymode == PETSC_COPY_VALUES) {
281da1bb401SStefano Zampini     ierr = PetscMalloc((mat_graph->nvtxs+1)*sizeof(PetscInt),&mat_graph->xadj);CHKERRQ(ierr);
282da1bb401SStefano Zampini     ierr = PetscMalloc(xadj[mat_graph->nvtxs]*sizeof(PetscInt),&mat_graph->adjncy);CHKERRQ(ierr);
283da1bb401SStefano Zampini     ierr = PetscMemcpy(mat_graph->xadj,xadj,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr);
284da1bb401SStefano Zampini     ierr = PetscMemcpy(mat_graph->adjncy,adjncy,xadj[mat_graph->nvtxs]*sizeof(PetscInt));CHKERRQ(ierr);
285da1bb401SStefano Zampini   } else if(copymode == PETSC_OWN_POINTER) {
286da1bb401SStefano Zampini     mat_graph->xadj=xadj;
287da1bb401SStefano Zampini     mat_graph->adjncy=adjncy;
288da1bb401SStefano Zampini   } else {
289da1bb401SStefano Zampini     SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_SUP,"Unsupported copy mode %d in %s\n",copymode,__FUNCT__);
290da1bb401SStefano Zampini   }
29136e030ebSStefano Zampini   PetscFunctionReturn(0);
29236e030ebSStefano Zampini }
29336e030ebSStefano Zampini EXTERN_C_END
29436e030ebSStefano Zampini #undef __FUNCT__
295da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetLocalAdjacencyGraph"
29636e030ebSStefano Zampini /*@
297da1bb401SStefano Zampini  PCBDDCSetLocalAdjacencyGraph - Set CSR graph of local matrix for use of PCBDDC.
29836e030ebSStefano Zampini 
29936e030ebSStefano Zampini    Not collective
30036e030ebSStefano Zampini 
30136e030ebSStefano Zampini    Input Parameters:
30236e030ebSStefano Zampini +  pc - the preconditioning context
303da1bb401SStefano Zampini -  nvtxs - number of local vertices of the graph
304da1bb401SStefano Zampini -  xadj, adjncy - the CSR graph
305da1bb401SStefano Zampini -  copymode - either PETSC_COPY_VALUES or PETSC_OWN_POINTER. In the former case the user must free the array passed in;
306da1bb401SStefano Zampini                                                              in the latter case, memory must be obtained with PetscMalloc.
30736e030ebSStefano Zampini 
30836e030ebSStefano Zampini    Level: intermediate
30936e030ebSStefano Zampini 
31036e030ebSStefano Zampini    Notes:
31136e030ebSStefano Zampini 
31236e030ebSStefano Zampini .seealso: PCBDDC
31336e030ebSStefano Zampini @*/
314da1bb401SStefano Zampini PetscErrorCode PCBDDCSetLocalAdjacencyGraph(PC pc,PetscInt nvtxs,PetscInt xadj[],PetscInt adjncy[], PetscCopyMode copymode)
31536e030ebSStefano Zampini {
316da1bb401SStefano Zampini   PetscInt       nrows,ncols;
317da1bb401SStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
31836e030ebSStefano Zampini   PetscErrorCode ierr;
31936e030ebSStefano Zampini 
32036e030ebSStefano Zampini   PetscFunctionBegin;
32136e030ebSStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
322da1bb401SStefano Zampini   ierr = MatGetSize(matis->A,&nrows,&ncols);CHKERRQ(ierr);
323da1bb401SStefano Zampini   if(nvtxs != nrows) {
324da1bb401SStefano Zampini     SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Local adjacency size %d passed in %s differs from local problem size %d!\n",nvtxs,__FUNCT__,nrows);
325da1bb401SStefano Zampini   } else {
326da1bb401SStefano Zampini     ierr = PetscTryMethod(pc,"PCBDDCSetLocalAdjacencyGraph_C",(PC,PetscInt,PetscInt[],PetscInt[],PetscCopyMode),(pc,nvtxs,xadj,adjncy,copymode));CHKERRQ(ierr);
327da1bb401SStefano Zampini   }
32836e030ebSStefano Zampini   PetscFunctionReturn(0);
32936e030ebSStefano Zampini }
3309c0446d6SStefano Zampini /* -------------------------------------------------------------------------- */
3319c0446d6SStefano Zampini EXTERN_C_BEGIN
3329c0446d6SStefano Zampini #undef __FUNCT__
3339c0446d6SStefano Zampini #define __FUNCT__ "PCBDDCSetDofsSplitting_BDDC"
3349c0446d6SStefano Zampini static PetscErrorCode PCBDDCSetDofsSplitting_BDDC(PC pc,PetscInt n_is, IS ISForDofs[])
3359c0446d6SStefano Zampini {
3369c0446d6SStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
3379c0446d6SStefano Zampini   PetscInt i;
3389c0446d6SStefano Zampini   PetscErrorCode ierr;
3399c0446d6SStefano Zampini 
3409c0446d6SStefano Zampini   PetscFunctionBegin;
341da1bb401SStefano Zampini   /* Destroy ISes if they were already set */
3429c0446d6SStefano Zampini   for(i=0;i<pcbddc->n_ISForDofs;i++) {
3439c0446d6SStefano Zampini     ierr = ISDestroy(&pcbddc->ISForDofs[i]);CHKERRQ(ierr);
3449c0446d6SStefano Zampini   }
345d11ae9bbSstefano_zampini   ierr = PetscFree(pcbddc->ISForDofs);CHKERRQ(ierr);
346da1bb401SStefano Zampini   /* allocate space then set */
3479c0446d6SStefano Zampini   ierr = PetscMalloc(n_is*sizeof(IS),&pcbddc->ISForDofs);CHKERRQ(ierr);
3489c0446d6SStefano Zampini   for(i=0;i<n_is;i++) {
349da1bb401SStefano Zampini     ierr = PetscObjectReference((PetscObject)ISForDofs[i]);CHKERRQ(ierr);
350da1bb401SStefano Zampini     pcbddc->ISForDofs[i]=ISForDofs[i];
3519c0446d6SStefano Zampini   }
3529c0446d6SStefano Zampini   pcbddc->n_ISForDofs=n_is;
3539c0446d6SStefano Zampini   PetscFunctionReturn(0);
3549c0446d6SStefano Zampini }
3559c0446d6SStefano Zampini EXTERN_C_END
3569c0446d6SStefano Zampini #undef __FUNCT__
3579c0446d6SStefano Zampini #define __FUNCT__ "PCBDDCSetDofsSplitting"
3589c0446d6SStefano Zampini /*@
359da1bb401SStefano Zampini  PCBDDCSetDofsSplitting - Set index sets defining fields of local mat.
3609c0446d6SStefano Zampini 
3619c0446d6SStefano Zampini    Not collective
3629c0446d6SStefano Zampini 
3639c0446d6SStefano Zampini    Input Parameters:
3649c0446d6SStefano Zampini +  pc - the preconditioning context
365da1bb401SStefano Zampini -  n - number of index sets defining the fields
366da1bb401SStefano Zampini -  IS[] - array of IS describing the fields
3679c0446d6SStefano Zampini 
3689c0446d6SStefano Zampini    Level: intermediate
3699c0446d6SStefano Zampini 
3709c0446d6SStefano Zampini    Notes:
3719c0446d6SStefano Zampini 
3729c0446d6SStefano Zampini .seealso: PCBDDC
3739c0446d6SStefano Zampini @*/
3749c0446d6SStefano Zampini PetscErrorCode PCBDDCSetDofsSplitting(PC pc,PetscInt n_is, IS ISForDofs[])
3759c0446d6SStefano Zampini {
3769c0446d6SStefano Zampini   PetscErrorCode ierr;
3779c0446d6SStefano Zampini 
3789c0446d6SStefano Zampini   PetscFunctionBegin;
3799c0446d6SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
3809c0446d6SStefano Zampini   ierr = PetscTryMethod(pc,"PCBDDCSetDofsSplitting_C",(PC,PetscInt,IS[]),(pc,n_is,ISForDofs));CHKERRQ(ierr);
3819c0446d6SStefano Zampini   PetscFunctionReturn(0);
3829c0446d6SStefano Zampini }
383da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
384534831adSStefano Zampini #undef __FUNCT__
385534831adSStefano Zampini #define __FUNCT__ "PCPreSolve_BDDC"
386534831adSStefano Zampini /* -------------------------------------------------------------------------- */
387534831adSStefano Zampini /*
388534831adSStefano Zampini    PCPreSolve_BDDC - Changes the right hand side and (if necessary) the initial
389534831adSStefano Zampini                      guess if a transformation of basis approach has been selected.
3909c0446d6SStefano Zampini 
391534831adSStefano Zampini    Input Parameter:
392534831adSStefano Zampini +  pc - the preconditioner contex
393534831adSStefano Zampini 
394534831adSStefano Zampini    Application Interface Routine: PCPreSolve()
395534831adSStefano Zampini 
396534831adSStefano Zampini    Notes:
397534831adSStefano Zampini    The interface routine PCPreSolve() is not usually called directly by
398534831adSStefano Zampini    the user, but instead is called by KSPSolve().
399534831adSStefano Zampini */
400534831adSStefano Zampini static PetscErrorCode PCPreSolve_BDDC(PC pc, KSP ksp, Vec rhs, Vec x)
401534831adSStefano Zampini {
402534831adSStefano Zampini   PetscErrorCode ierr;
403534831adSStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
404534831adSStefano Zampini   PC_IS          *pcis = (PC_IS*)(pc->data);
405534831adSStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
406534831adSStefano Zampini   Mat            temp_mat;
4073972b0daSStefano Zampini   IS             dirIS;
4083972b0daSStefano Zampini   PetscInt       dirsize,i,*is_indices;
4093972b0daSStefano Zampini   PetscScalar    *array_x,*array_diagonal;
4103972b0daSStefano Zampini   Vec            used_vec;
4113972b0daSStefano Zampini   PetscBool      guess_nonzero;
412534831adSStefano Zampini 
413534831adSStefano Zampini   PetscFunctionBegin;
4143972b0daSStefano Zampini   if(x) {
4153972b0daSStefano Zampini     ierr = PetscObjectReference((PetscObject)x);CHKERRQ(ierr);
4163972b0daSStefano Zampini     used_vec = x;
4173972b0daSStefano Zampini   } else {
4183972b0daSStefano Zampini     ierr = PetscObjectReference((PetscObject)pcbddc->temp_solution);CHKERRQ(ierr);
4193972b0daSStefano Zampini     used_vec = pcbddc->temp_solution;
4203972b0daSStefano Zampini     ierr = VecSet(used_vec,0.0);CHKERRQ(ierr);
4213972b0daSStefano Zampini   }
4223972b0daSStefano Zampini   /* hack into ksp data structure PCPreSolve comes earlier in src/ksp/ksp/interface/itfunc.c */
4233972b0daSStefano Zampini   if (ksp) {
4243972b0daSStefano Zampini     ierr = KSPGetInitialGuessNonzero(ksp,&guess_nonzero);CHKERRQ(ierr);
4253972b0daSStefano Zampini     if( !guess_nonzero ) {
4263972b0daSStefano Zampini       ierr = VecSet(used_vec,0.0);CHKERRQ(ierr);
4273972b0daSStefano Zampini     }
4283972b0daSStefano Zampini   }
4293972b0daSStefano Zampini   /* store the original rhs */
4303972b0daSStefano Zampini   ierr = VecCopy(rhs,pcbddc->original_rhs);CHKERRQ(ierr);
4313972b0daSStefano Zampini 
4323972b0daSStefano Zampini   /* Take into account zeroed rows -> change rhs and store solution removed */
4333972b0daSStefano Zampini   ierr = MatGetDiagonal(pc->pmat,pcis->vec1_global);CHKERRQ(ierr);
4343972b0daSStefano Zampini   ierr = VecPointwiseDivide(pcis->vec1_global,rhs,pcis->vec1_global);CHKERRQ(ierr);
4353972b0daSStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4363972b0daSStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4373972b0daSStefano Zampini   ierr = VecScatterBegin(matis->ctx,used_vec,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4383972b0daSStefano Zampini   ierr = VecScatterEnd  (matis->ctx,used_vec,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4393972b0daSStefano Zampini   ierr = PCBDDCGetDirichletBoundaries(pc,&dirIS);CHKERRQ(ierr);
4403972b0daSStefano Zampini   if(dirIS) {
4413972b0daSStefano Zampini     ierr = ISGetSize(dirIS,&dirsize);CHKERRQ(ierr);
4423972b0daSStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array_x);CHKERRQ(ierr);
4433972b0daSStefano Zampini     ierr = VecGetArray(pcis->vec2_N,&array_diagonal);CHKERRQ(ierr);
4443972b0daSStefano Zampini     ierr = ISGetIndices(dirIS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
4453972b0daSStefano Zampini     for(i=0;i<dirsize;i++) {
4463972b0daSStefano Zampini       array_x[is_indices[i]]=array_diagonal[is_indices[i]];
4473972b0daSStefano Zampini     }
4483972b0daSStefano Zampini     ierr = ISRestoreIndices(dirIS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
4493972b0daSStefano Zampini     ierr = VecRestoreArray(pcis->vec2_N,&array_diagonal);CHKERRQ(ierr);
4503972b0daSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array_x);CHKERRQ(ierr);
4513972b0daSStefano Zampini   }
4523972b0daSStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4533972b0daSStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
454b76ba322SStefano Zampini 
4553972b0daSStefano Zampini   /* remove the computed solution from the rhs */
4563972b0daSStefano Zampini   ierr = VecScale(used_vec,-1.0);CHKERRQ(ierr);
4573972b0daSStefano Zampini   ierr = MatMultAdd(pc->pmat,used_vec,rhs,rhs);CHKERRQ(ierr);
4583972b0daSStefano Zampini   ierr = VecScale(used_vec,-1.0);CHKERRQ(ierr);
459b76ba322SStefano Zampini 
460b76ba322SStefano Zampini   /* store partially computed solution and set initial guess */
4613972b0daSStefano Zampini   if(x) {
4623972b0daSStefano Zampini     ierr = VecCopy(used_vec,pcbddc->temp_solution);CHKERRQ(ierr);
4633972b0daSStefano Zampini     ierr = VecSet(used_vec,0.0);CHKERRQ(ierr);
464b76ba322SStefano Zampini     if(pcbddc->use_exact_dirichlet) {
465b76ba322SStefano Zampini       ierr = VecScatterBegin(pcis->global_to_D,rhs,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
466b76ba322SStefano Zampini       ierr = VecScatterEnd  (pcis->global_to_D,rhs,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
467b76ba322SStefano Zampini       ierr = KSPSolve(pcbddc->ksp_D,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
468b76ba322SStefano Zampini       ierr = VecScatterBegin(pcis->global_to_D,pcis->vec2_D,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
469b76ba322SStefano Zampini       ierr = VecScatterEnd  (pcis->global_to_D,pcis->vec2_D,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
470b76ba322SStefano Zampini       if(ksp) {
471b76ba322SStefano Zampini         ierr = KSPSetInitialGuessNonzero(ksp,PETSC_TRUE);CHKERRQ(ierr);
472b76ba322SStefano Zampini       }
473b76ba322SStefano Zampini     }
4743972b0daSStefano Zampini   }
4753972b0daSStefano Zampini   ierr = VecDestroy(&used_vec);CHKERRQ(ierr);
476b76ba322SStefano Zampini 
477b76ba322SStefano Zampini   /* rhs change of basis */
478b76ba322SStefano Zampini   if(pcbddc->usechangeofbasis) {
479b76ba322SStefano Zampini     /* swap pointers for local matrices */
480b76ba322SStefano Zampini     temp_mat = matis->A;
481b76ba322SStefano Zampini     matis->A = pcbddc->local_mat;
482b76ba322SStefano Zampini     pcbddc->local_mat = temp_mat;
483b76ba322SStefano Zampini     /* Get local rhs and apply transformation of basis */
484b76ba322SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,rhs,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
485b76ba322SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,rhs,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
486b76ba322SStefano Zampini     /* from original basis to modified basis */
487b76ba322SStefano Zampini     ierr = MatMultTranspose(pcbddc->ChangeOfBasisMatrix,pcis->vec1_B,pcis->vec2_B);CHKERRQ(ierr);
488b76ba322SStefano Zampini     /* put back modified values into the global vec using INSERT_VALUES copy mode */
489b76ba322SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec2_B,rhs,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
490b76ba322SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec2_B,rhs,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
491b76ba322SStefano Zampini   }
492534831adSStefano Zampini   PetscFunctionReturn(0);
493534831adSStefano Zampini }
494534831adSStefano Zampini /* -------------------------------------------------------------------------- */
495534831adSStefano Zampini #undef __FUNCT__
496534831adSStefano Zampini #define __FUNCT__ "PCPostSolve_BDDC"
497534831adSStefano Zampini /* -------------------------------------------------------------------------- */
498534831adSStefano Zampini /*
499534831adSStefano Zampini    PCPostSolve_BDDC - Changes the computed solution if a transformation of basis
500534831adSStefano Zampini                      approach has been selected. Also, restores rhs to its original state.
501534831adSStefano Zampini 
502534831adSStefano Zampini    Input Parameter:
503534831adSStefano Zampini +  pc - the preconditioner contex
504534831adSStefano Zampini 
505534831adSStefano Zampini    Application Interface Routine: PCPostSolve()
506534831adSStefano Zampini 
507534831adSStefano Zampini    Notes:
508534831adSStefano Zampini    The interface routine PCPostSolve() is not usually called directly by
509534831adSStefano Zampini    the user, but instead is called by KSPSolve().
510534831adSStefano Zampini */
511534831adSStefano Zampini static PetscErrorCode PCPostSolve_BDDC(PC pc, KSP ksp, Vec rhs, Vec x)
512534831adSStefano Zampini {
513534831adSStefano Zampini   PetscErrorCode ierr;
514534831adSStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
515534831adSStefano Zampini   PC_IS          *pcis = (PC_IS*)(pc->data);
516534831adSStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
517534831adSStefano Zampini   Mat            temp_mat;
518534831adSStefano Zampini 
519534831adSStefano Zampini   PetscFunctionBegin;
520534831adSStefano Zampini   if(pcbddc->usechangeofbasis) {
521534831adSStefano Zampini     /* swap pointers for local matrices */
522534831adSStefano Zampini     temp_mat = matis->A;
523534831adSStefano Zampini     matis->A = pcbddc->local_mat;
524534831adSStefano Zampini     pcbddc->local_mat = temp_mat;
525534831adSStefano Zampini     /* restore rhs to its original state */
5263425bc38SStefano Zampini     if(rhs) {
5273425bc38SStefano Zampini       ierr = VecCopy(pcbddc->original_rhs,rhs);CHKERRQ(ierr);
5283425bc38SStefano Zampini     }
529534831adSStefano Zampini     /* Get Local boundary and apply transformation of basis to solution vector */
530534831adSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,x,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
531534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,x,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
532534831adSStefano Zampini     /* from modified basis to original basis */
533534831adSStefano Zampini     ierr = MatMult(pcbddc->ChangeOfBasisMatrix,pcis->vec1_B,pcis->vec2_B);CHKERRQ(ierr);
534534831adSStefano Zampini     /* put back modified values into the global vec using INSERT_VALUES copy mode */
535534831adSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec2_B,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
536534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec2_B,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
537534831adSStefano Zampini   }
5383972b0daSStefano Zampini   /* add solution removed in presolve */
5393425bc38SStefano Zampini   if(x) {
5403425bc38SStefano Zampini     ierr = VecAXPY(x,1.0,pcbddc->temp_solution);CHKERRQ(ierr);
5413425bc38SStefano Zampini   }
542534831adSStefano Zampini   PetscFunctionReturn(0);
543534831adSStefano Zampini }
544534831adSStefano Zampini /* -------------------------------------------------------------------------- */
54553cdbc3dSStefano Zampini #undef __FUNCT__
54653cdbc3dSStefano Zampini #define __FUNCT__ "PCSetUp_BDDC"
5470c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
5480c7d97c5SJed Brown /*
5490c7d97c5SJed Brown    PCSetUp_BDDC - Prepares for the use of the BDDC preconditioner
5500c7d97c5SJed Brown                   by setting data structures and options.
5510c7d97c5SJed Brown 
5520c7d97c5SJed Brown    Input Parameter:
55353cdbc3dSStefano Zampini +  pc - the preconditioner context
5540c7d97c5SJed Brown 
5550c7d97c5SJed Brown    Application Interface Routine: PCSetUp()
5560c7d97c5SJed Brown 
5570c7d97c5SJed Brown    Notes:
5580c7d97c5SJed Brown    The interface routine PCSetUp() is not usually called directly by
5590c7d97c5SJed Brown    the user, but instead is called by PCApply() if necessary.
5600c7d97c5SJed Brown */
56153cdbc3dSStefano Zampini PetscErrorCode PCSetUp_BDDC(PC pc)
5620c7d97c5SJed Brown {
5630c7d97c5SJed Brown   PetscErrorCode ierr;
5640c7d97c5SJed Brown   PC_BDDC*       pcbddc   = (PC_BDDC*)pc->data;
5650c7d97c5SJed Brown 
5660c7d97c5SJed Brown   PetscFunctionBegin;
5670c7d97c5SJed Brown   if (!pc->setupcalled) {
5683b03a366Sstefano_zampini     /* For BDDC we need to define a local "Neumann" problem different to that defined in PCISSetup
5699c0446d6SStefano Zampini        So, we set to pcnone the Neumann problem of pcis in order to avoid unneeded computation
5700c7d97c5SJed Brown        Also, we decide to directly build the (same) Dirichlet problem */
5710c7d97c5SJed Brown     ierr = PetscOptionsSetValue("-is_localN_pc_type","none");CHKERRQ(ierr);
5720c7d97c5SJed Brown     ierr = PetscOptionsSetValue("-is_localD_pc_type","none");CHKERRQ(ierr);
5730c7d97c5SJed Brown     /* Set up all the "iterative substructuring" common block */
5740c7d97c5SJed Brown     ierr = PCISSetUp(pc);CHKERRQ(ierr);
5753b03a366Sstefano_zampini     /* Get stdout for dbg */
576e269702eSStefano Zampini     if(pcbddc->dbg_flag) {
577e269702eSStefano Zampini       ierr = PetscViewerASCIIGetStdout(((PetscObject)pc)->comm,&pcbddc->dbg_viewer);CHKERRQ(ierr);
578e269702eSStefano Zampini       ierr = PetscViewerASCIISynchronizedAllow(pcbddc->dbg_viewer,PETSC_TRUE);CHKERRQ(ierr);
579e269702eSStefano Zampini     }
5803b03a366Sstefano_zampini     /* Analyze local interface */
5810c7d97c5SJed Brown     ierr = PCBDDCManageLocalBoundaries(pc);CHKERRQ(ierr);
5823b03a366Sstefano_zampini     /* Set up local constraint matrix */
5833b03a366Sstefano_zampini     ierr = PCBDDCCreateConstraintMatrix(pc);CHKERRQ(ierr);
5840c7d97c5SJed Brown     /* Create coarse and local stuffs used for evaluating action of preconditioner */
5850c7d97c5SJed Brown     ierr = PCBDDCCoarseSetUp(pc);CHKERRQ(ierr);
5860c7d97c5SJed Brown   }
5870c7d97c5SJed Brown   PetscFunctionReturn(0);
5880c7d97c5SJed Brown }
5890c7d97c5SJed Brown 
5900c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
5910c7d97c5SJed Brown /*
5920c7d97c5SJed Brown    PCApply_BDDC - Applies the BDDC preconditioner to a vector.
5930c7d97c5SJed Brown 
5940c7d97c5SJed Brown    Input Parameters:
5950c7d97c5SJed Brown .  pc - the preconditioner context
5960c7d97c5SJed Brown .  r - input vector (global)
5970c7d97c5SJed Brown 
5980c7d97c5SJed Brown    Output Parameter:
5990c7d97c5SJed Brown .  z - output vector (global)
6000c7d97c5SJed Brown 
6010c7d97c5SJed Brown    Application Interface Routine: PCApply()
6020c7d97c5SJed Brown  */
6030c7d97c5SJed Brown #undef __FUNCT__
6040c7d97c5SJed Brown #define __FUNCT__ "PCApply_BDDC"
60553cdbc3dSStefano Zampini PetscErrorCode PCApply_BDDC(PC pc,Vec r,Vec z)
6060c7d97c5SJed Brown {
6070c7d97c5SJed Brown   PC_IS             *pcis = (PC_IS*)(pc->data);
6080c7d97c5SJed Brown   PC_BDDC           *pcbddc = (PC_BDDC*)(pc->data);
6090c7d97c5SJed Brown   PetscErrorCode    ierr;
6103b03a366Sstefano_zampini   const PetscScalar one = 1.0;
6113b03a366Sstefano_zampini   const PetscScalar m_one = -1.0;
6122617d88aSStefano Zampini   const PetscScalar zero = 0.0;
6130c7d97c5SJed Brown 
6140c7d97c5SJed Brown /* This code is similar to that provided in nn.c for PCNN
6150c7d97c5SJed Brown    NN interface preconditioner changed to BDDC
6160c7d97c5SJed Brown    Added support for M_3 preconditioenr in the reference article (code is active if pcbddc->prec_type = PETSC_TRUE) */
6170c7d97c5SJed Brown 
6180c7d97c5SJed Brown   PetscFunctionBegin;
619b76ba322SStefano Zampini   if(!pcbddc->use_exact_dirichlet) {
6200c7d97c5SJed Brown     /* First Dirichlet solve */
6210c7d97c5SJed Brown     ierr = VecScatterBegin(pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
6220c7d97c5SJed Brown     ierr = VecScatterEnd  (pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
62353cdbc3dSStefano Zampini     ierr = KSPSolve(pcbddc->ksp_D,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
6240c7d97c5SJed Brown     /*
6250c7d97c5SJed Brown       Assembling right hand side for BDDC operator
6260c7d97c5SJed Brown       - vec1_D for the Dirichlet part (if needed, i.e. prec_flag=PETSC_TRUE)
6270c7d97c5SJed Brown       - the interface part of the global vector z
6280c7d97c5SJed Brown     */
6290c7d97c5SJed Brown     ierr = VecScale(pcis->vec2_D,m_one);CHKERRQ(ierr);
6300c7d97c5SJed Brown     ierr = MatMult(pcis->A_BI,pcis->vec2_D,pcis->vec1_B);CHKERRQ(ierr);
6310c7d97c5SJed Brown     if(pcbddc->prec_type) { ierr = MatMultAdd(pcis->A_II,pcis->vec2_D,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); }
6320c7d97c5SJed Brown     ierr = VecScale(pcis->vec2_D,m_one);CHKERRQ(ierr);
6330c7d97c5SJed Brown     ierr = VecCopy(r,z);CHKERRQ(ierr);
6340c7d97c5SJed Brown     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
6350c7d97c5SJed Brown     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
6362617d88aSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
6372617d88aSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
638b76ba322SStefano Zampini   } else {
639b76ba322SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,r,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
640b76ba322SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,r,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
641b76ba322SStefano Zampini     ierr = VecSet(pcis->vec2_D,zero);CHKERRQ(ierr);
642b76ba322SStefano Zampini   }
643b76ba322SStefano Zampini 
644b76ba322SStefano Zampini   /* Apply partition of unity */
6452617d88aSStefano Zampini   ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr);
6462617d88aSStefano Zampini 
6472617d88aSStefano Zampini   /* Apply interface preconditioner
6482617d88aSStefano Zampini      input/output vecs: pcis->vec1_B and pcis->vec1_D */
6492617d88aSStefano Zampini   ierr = PCBDDCApplyInterfacePreconditioner(pc);CHKERRQ(ierr);
6502617d88aSStefano Zampini 
6512617d88aSStefano Zampini   /* Apply partition of unity and sum boundary values */
6522617d88aSStefano Zampini   ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr);
6532617d88aSStefano Zampini   ierr = VecSet(z,zero);CHKERRQ(ierr);
6542617d88aSStefano Zampini   ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
6552617d88aSStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
6560c7d97c5SJed Brown 
6573b03a366Sstefano_zampini   /* Second Dirichlet solve and assembling of output */
6580c7d97c5SJed Brown   ierr = VecScatterBegin(pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
6590c7d97c5SJed Brown   ierr = VecScatterEnd  (pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
6600c7d97c5SJed Brown   ierr = MatMult(pcis->A_IB,pcis->vec1_B,pcis->vec3_D);CHKERRQ(ierr);
6610c7d97c5SJed Brown   if(pcbddc->prec_type) { ierr = MatMultAdd(pcis->A_II,pcis->vec1_D,pcis->vec3_D,pcis->vec3_D);CHKERRQ(ierr); }
66253cdbc3dSStefano Zampini   ierr = KSPSolve(pcbddc->ksp_D,pcis->vec3_D,pcbddc->vec4_D);CHKERRQ(ierr);
6630c7d97c5SJed Brown   ierr = VecScale(pcbddc->vec4_D,m_one);CHKERRQ(ierr);
6640c7d97c5SJed Brown   if(pcbddc->prec_type) { ierr = VecAXPY (pcbddc->vec4_D,one,pcis->vec1_D);CHKERRQ(ierr); }
6650c7d97c5SJed Brown   ierr = VecAXPY (pcis->vec2_D,one,pcbddc->vec4_D);CHKERRQ(ierr);
6660c7d97c5SJed Brown   ierr = VecScatterBegin(pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
6670c7d97c5SJed Brown   ierr = VecScatterEnd  (pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
6680c7d97c5SJed Brown   PetscFunctionReturn(0);
6690c7d97c5SJed Brown 
6700c7d97c5SJed Brown }
671da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
672da1bb401SStefano Zampini #undef __FUNCT__
673da1bb401SStefano Zampini #define __FUNCT__ "PCDestroy_BDDC"
674da1bb401SStefano Zampini PetscErrorCode PCDestroy_BDDC(PC pc)
675da1bb401SStefano Zampini {
676da1bb401SStefano Zampini   PC_BDDC          *pcbddc = (PC_BDDC*)pc->data;
677da1bb401SStefano Zampini   PetscErrorCode ierr;
678da1bb401SStefano Zampini 
679da1bb401SStefano Zampini   PetscFunctionBegin;
680da1bb401SStefano Zampini   /* free data created by PCIS */
681da1bb401SStefano Zampini   ierr = PCISDestroy(pc);CHKERRQ(ierr);
682da1bb401SStefano Zampini   /* free BDDC data  */
6833972b0daSStefano Zampini   ierr = VecDestroy(&pcbddc->temp_solution);CHKERRQ(ierr);
684534831adSStefano Zampini   ierr = VecDestroy(&pcbddc->original_rhs);CHKERRQ(ierr);
685534831adSStefano Zampini   ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr);
686534831adSStefano Zampini   ierr = MatDestroy(&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr);
687da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->coarse_vec);CHKERRQ(ierr);
688da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->coarse_rhs);CHKERRQ(ierr);
689da1bb401SStefano Zampini   ierr = KSPDestroy(&pcbddc->coarse_ksp);CHKERRQ(ierr);
690da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->coarse_mat);CHKERRQ(ierr);
691da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->coarse_phi_B);CHKERRQ(ierr);
692da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->coarse_phi_D);CHKERRQ(ierr);
693da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec1_P);CHKERRQ(ierr);
694da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec1_C);CHKERRQ(ierr);
695da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->local_auxmat1);CHKERRQ(ierr);
696da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->local_auxmat2);CHKERRQ(ierr);
697da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec1_R);CHKERRQ(ierr);
698da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec2_R);CHKERRQ(ierr);
699da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec4_D);CHKERRQ(ierr);
700da1bb401SStefano Zampini   ierr = VecScatterDestroy(&pcbddc->R_to_B);CHKERRQ(ierr);
701da1bb401SStefano Zampini   ierr = VecScatterDestroy(&pcbddc->R_to_D);CHKERRQ(ierr);
702da1bb401SStefano Zampini   ierr = VecScatterDestroy(&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr);
703da1bb401SStefano Zampini   ierr = KSPDestroy(&pcbddc->ksp_D);CHKERRQ(ierr);
704da1bb401SStefano Zampini   ierr = KSPDestroy(&pcbddc->ksp_R);CHKERRQ(ierr);
705da1bb401SStefano Zampini   ierr = ISDestroy(&pcbddc->NeumannBoundaries);CHKERRQ(ierr);
706da1bb401SStefano Zampini   ierr = ISDestroy(&pcbddc->DirichletBoundaries);CHKERRQ(ierr);
707da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->ConstraintMatrix);CHKERRQ(ierr);
708da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->local_primal_indices);CHKERRQ(ierr);
709da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->replicated_local_primal_indices);CHKERRQ(ierr);
710da1bb401SStefano Zampini   if (pcbddc->replicated_local_primal_values)    { free(pcbddc->replicated_local_primal_values); }
711da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->local_primal_displacements);CHKERRQ(ierr);
712da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->local_primal_sizes);CHKERRQ(ierr);
713da1bb401SStefano Zampini   PetscInt i;
714da1bb401SStefano Zampini   for(i=0;i<pcbddc->n_ISForDofs;i++) { ierr = ISDestroy(&pcbddc->ISForDofs[i]);CHKERRQ(ierr); }
715da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->ISForDofs);CHKERRQ(ierr);
716da1bb401SStefano Zampini   for(i=0;i<pcbddc->n_ISForFaces;i++) { ierr = ISDestroy(&pcbddc->ISForFaces[i]);CHKERRQ(ierr); }
717da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->ISForFaces);CHKERRQ(ierr);
718da1bb401SStefano Zampini   for(i=0;i<pcbddc->n_ISForEdges;i++) { ierr = ISDestroy(&pcbddc->ISForEdges[i]);CHKERRQ(ierr); }
719da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->ISForEdges);CHKERRQ(ierr);
720da1bb401SStefano Zampini   ierr = ISDestroy(&pcbddc->ISForVertices);CHKERRQ(ierr);
7213972b0daSStefano Zampini   /* Free graph structure */
722da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->xadj);CHKERRQ(ierr);
723da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->adjncy);CHKERRQ(ierr);
724*142dfd88SStefano Zampini   if(pcbddc->mat_graph->nvtxs) {
725da1bb401SStefano Zampini     ierr = PetscFree(pcbddc->mat_graph->neighbours_set[0]);CHKERRQ(ierr);
726*142dfd88SStefano Zampini   }
727da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->neighbours_set);CHKERRQ(ierr);
7283972b0daSStefano Zampini   ierr = PetscFree4(pcbddc->mat_graph->where,pcbddc->mat_graph->count,pcbddc->mat_graph->cptr,pcbddc->mat_graph->queue);CHKERRQ(ierr);
7293972b0daSStefano Zampini   ierr = PetscFree2(pcbddc->mat_graph->which_dof,pcbddc->mat_graph->touched);CHKERRQ(ierr);
7303972b0daSStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->where_ncmps);CHKERRQ(ierr);
731da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph);CHKERRQ(ierr);
7323425bc38SStefano Zampini   /* remove functions */
7333425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDirichletBoundaries_C","",PETSC_NULL);CHKERRQ(ierr);
7343425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNeumannBoundaries_C","",PETSC_NULL);CHKERRQ(ierr);
7353425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetDirichletBoundaries_C","",PETSC_NULL);CHKERRQ(ierr);
7363425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetNeumannBoundaries_C","",PETSC_NULL);CHKERRQ(ierr);
7373425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseProblemType_C","",PETSC_NULL);CHKERRQ(ierr);
7383425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDofsSplitting_C","",PETSC_NULL);CHKERRQ(ierr);
7393425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetLocalAdjacencyGraph_C","",PETSC_NULL);CHKERRQ(ierr);
7403425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPreSolve_C","",PETSC_NULL);CHKERRQ(ierr);
7413425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPostSolve_C","",PETSC_NULL);CHKERRQ(ierr);
7423425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCCreateFETIDPOperators_C","",PETSC_NULL);CHKERRQ(ierr);
7433425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetRHS_C","",PETSC_NULL);CHKERRQ(ierr);
7443425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetSolution_C","",PETSC_NULL);CHKERRQ(ierr);
745da1bb401SStefano Zampini   /* Free the private data structure that was hanging off the PC */
746da1bb401SStefano Zampini   ierr = PetscFree(pcbddc);CHKERRQ(ierr);
747da1bb401SStefano Zampini   PetscFunctionReturn(0);
748da1bb401SStefano Zampini }
7493425bc38SStefano Zampini /* -------------------------------------------------------------------------- */
7503425bc38SStefano Zampini EXTERN_C_BEGIN
7513425bc38SStefano Zampini #undef __FUNCT__
7523425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetRHS_BDDC"
7533425bc38SStefano Zampini static PetscErrorCode PCBDDCMatFETIDPGetRHS_BDDC(Mat fetidp_mat, Vec standard_rhs, Vec fetidp_flux_rhs)
7543425bc38SStefano Zampini {
7553425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
7563425bc38SStefano Zampini   PC_IS*         pcis;
7573425bc38SStefano Zampini   PC_BDDC*       pcbddc;
7583425bc38SStefano Zampini   Mat_IS*        matis;
7593425bc38SStefano Zampini   PetscErrorCode ierr;
7600c7d97c5SJed Brown 
7613425bc38SStefano Zampini   PetscFunctionBegin;
7623425bc38SStefano Zampini   ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr);
7633425bc38SStefano Zampini   pcis = (PC_IS*)mat_ctx->pc->data;
7643425bc38SStefano Zampini   pcbddc = (PC_BDDC*)mat_ctx->pc->data;
7653425bc38SStefano Zampini   matis = (Mat_IS*)mat_ctx->pc->pmat->data;
7663425bc38SStefano Zampini 
7673425bc38SStefano Zampini   /* change of basis for physical rhs if needed
7683425bc38SStefano Zampini      It also changes the rhs in case of dirichlet boundaries */
7693425bc38SStefano Zampini   (*mat_ctx->pc->ops->presolve)(mat_ctx->pc,PETSC_NULL,standard_rhs,PETSC_NULL);
7703425bc38SStefano Zampini   /* store vectors for computation of fetidp final solution */
7713425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->global_to_D,standard_rhs,mat_ctx->temp_solution_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7723425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_D,standard_rhs,mat_ctx->temp_solution_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7733425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7743425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7753425bc38SStefano Zampini   /* scale rhs since it should be unassembled */
7763425bc38SStefano Zampini   ierr = VecPointwiseMult(mat_ctx->temp_solution_B,pcis->D,mat_ctx->temp_solution_B);CHKERRQ(ierr);
7773425bc38SStefano Zampini   if(!pcbddc->prec_type) {
7783425bc38SStefano Zampini     /* compute partially subassembled Schur complement right-hand side */
7793425bc38SStefano Zampini     ierr = KSPSolve(pcbddc->ksp_D,mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr);
7803425bc38SStefano Zampini     ierr = MatMult(pcis->A_BI,pcis->vec1_D,pcis->vec1_B);CHKERRQ(ierr);
7813425bc38SStefano Zampini     ierr = VecAXPY(mat_ctx->temp_solution_B,-1.0,pcis->vec1_B);CHKERRQ(ierr);
7823425bc38SStefano Zampini     ierr = VecSet(standard_rhs,0.0);CHKERRQ(ierr);
7833425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,mat_ctx->temp_solution_B,standard_rhs,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
7843425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,mat_ctx->temp_solution_B,standard_rhs,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
7853425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7863425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7873425bc38SStefano Zampini     ierr = VecPointwiseMult(mat_ctx->temp_solution_B,pcis->D,mat_ctx->temp_solution_B);CHKERRQ(ierr);
7883425bc38SStefano Zampini   }
7893425bc38SStefano Zampini   /* BDDC rhs */
7903425bc38SStefano Zampini   ierr = VecCopy(mat_ctx->temp_solution_B,pcis->vec1_B);CHKERRQ(ierr);
7913425bc38SStefano Zampini   if(pcbddc->prec_type) {
7923425bc38SStefano Zampini     ierr = VecCopy(mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr);
7933425bc38SStefano Zampini   }
7943425bc38SStefano Zampini   /* apply BDDC */
7953425bc38SStefano Zampini   ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr);
7963425bc38SStefano Zampini   /* Application of B_delta and assembling of rhs for fetidp fluxes */
7973425bc38SStefano Zampini   ierr = VecSet(fetidp_flux_rhs,0.0);CHKERRQ(ierr);
7983425bc38SStefano Zampini   ierr = MatMult(mat_ctx->B_delta,pcis->vec1_B,mat_ctx->lambda_local);CHKERRQ(ierr);
7993425bc38SStefano Zampini   ierr = VecScatterBegin(mat_ctx->l2g_lambda,mat_ctx->lambda_local,fetidp_flux_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
8003425bc38SStefano Zampini   ierr = VecScatterEnd  (mat_ctx->l2g_lambda,mat_ctx->lambda_local,fetidp_flux_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
8013425bc38SStefano Zampini   /* restore original rhs */
8023425bc38SStefano Zampini   ierr = VecCopy(pcbddc->original_rhs,standard_rhs);CHKERRQ(ierr);
8033425bc38SStefano Zampini   PetscFunctionReturn(0);
8043425bc38SStefano Zampini }
8053425bc38SStefano Zampini EXTERN_C_END
8063425bc38SStefano Zampini #undef __FUNCT__
8073425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetRHS"
8083425bc38SStefano Zampini /*@
8093425bc38SStefano Zampini  PCBDDCMatFETIDPGetRHS - Get rhs for FETIDP linear system.
8103425bc38SStefano Zampini 
8113425bc38SStefano Zampini    Collective
8123425bc38SStefano Zampini 
8133425bc38SStefano Zampini    Input Parameters:
8143425bc38SStefano Zampini +  fetidp_mat   - the FETIDP mat obtained by a call to PCBDDCCreateFETIDPOperators
8153425bc38SStefano Zampini +  standard_rhs - the rhs of your linear system
8163425bc38SStefano Zampini 
8173425bc38SStefano Zampini    Output Parameters:
8183425bc38SStefano Zampini +  fetidp_flux_rhs   - the rhs of the FETIDP linear system
8193425bc38SStefano Zampini 
8203425bc38SStefano Zampini    Level: developer
8213425bc38SStefano Zampini 
8223425bc38SStefano Zampini    Notes:
8233425bc38SStefano Zampini 
8243425bc38SStefano Zampini .seealso: PCBDDC
8253425bc38SStefano Zampini @*/
8263425bc38SStefano Zampini PetscErrorCode PCBDDCMatFETIDPGetRHS(Mat fetidp_mat, Vec standard_rhs, Vec fetidp_flux_rhs)
8273425bc38SStefano Zampini {
8283425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
8293425bc38SStefano Zampini   PetscErrorCode ierr;
8303425bc38SStefano Zampini 
8313425bc38SStefano Zampini   PetscFunctionBegin;
8323425bc38SStefano Zampini   ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr);
8333425bc38SStefano Zampini   ierr = PetscTryMethod(mat_ctx->pc,"PCBDDCMatFETIDPGetRHS_C",(Mat,Vec,Vec),(fetidp_mat,standard_rhs,fetidp_flux_rhs));CHKERRQ(ierr);
8343425bc38SStefano Zampini   PetscFunctionReturn(0);
8353425bc38SStefano Zampini }
8363425bc38SStefano Zampini /* -------------------------------------------------------------------------- */
8373425bc38SStefano Zampini EXTERN_C_BEGIN
8383425bc38SStefano Zampini #undef __FUNCT__
8393425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetSolution_BDDC"
8403425bc38SStefano Zampini static PetscErrorCode PCBDDCMatFETIDPGetSolution_BDDC(Mat fetidp_mat, Vec fetidp_flux_sol, Vec standard_sol)
8413425bc38SStefano Zampini {
8423425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
8433425bc38SStefano Zampini   PC_IS*         pcis;
8443425bc38SStefano Zampini   PC_BDDC*       pcbddc;
8453425bc38SStefano Zampini   Mat_IS*        matis;
8463425bc38SStefano Zampini   PetscErrorCode ierr;
8473425bc38SStefano Zampini 
8483425bc38SStefano Zampini   PetscFunctionBegin;
8493425bc38SStefano Zampini   ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr);
8503425bc38SStefano Zampini   pcis = (PC_IS*)mat_ctx->pc->data;
8513425bc38SStefano Zampini   pcbddc = (PC_BDDC*)mat_ctx->pc->data;
8523425bc38SStefano Zampini   matis = (Mat_IS*)mat_ctx->pc->pmat->data;
8533425bc38SStefano Zampini 
8543425bc38SStefano Zampini   /* apply B_delta^T */
8553425bc38SStefano Zampini   ierr = VecScatterBegin(mat_ctx->l2g_lambda,fetidp_flux_sol,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8563425bc38SStefano Zampini   ierr = VecScatterEnd  (mat_ctx->l2g_lambda,fetidp_flux_sol,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8573425bc38SStefano Zampini   ierr = MatMultTranspose(mat_ctx->B_delta,mat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
8583425bc38SStefano Zampini   /* compute rhs for BDDC application */
8593425bc38SStefano Zampini   ierr = VecAYPX(pcis->vec1_B,-1.0,mat_ctx->temp_solution_B);CHKERRQ(ierr);
8603425bc38SStefano Zampini   if(pcbddc->prec_type) {
8613425bc38SStefano Zampini     ierr = VecCopy(mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr);
8623425bc38SStefano Zampini   }
8633425bc38SStefano Zampini   /* apply BDDC */
8643425bc38SStefano Zampini   ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr);
8653425bc38SStefano Zampini   /* put values into standard global vector */
8663425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8673425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8683425bc38SStefano Zampini   if(!pcbddc->prec_type) {
8693425bc38SStefano Zampini     /* compute values into the interior if solved for the partially subassembled Schur complement */
8703425bc38SStefano Zampini     ierr = MatMult(pcis->A_IB,pcis->vec1_B,pcis->vec1_D);CHKERRQ(ierr);
8713425bc38SStefano Zampini     ierr = VecAXPY(mat_ctx->temp_solution_D,-1.0,pcis->vec1_D);CHKERRQ(ierr);
8723425bc38SStefano Zampini     ierr = KSPSolve(pcbddc->ksp_D,mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr);
8733425bc38SStefano Zampini   }
8743425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->global_to_D,pcis->vec1_D,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8753425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_D,pcis->vec1_D,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8763425bc38SStefano Zampini   /* final change of basis if needed
8773425bc38SStefano Zampini      Is also sums the dirichlet part removed during RHS assembling */
8783425bc38SStefano Zampini   (*mat_ctx->pc->ops->postsolve)(mat_ctx->pc,PETSC_NULL,PETSC_NULL,standard_sol);
8793425bc38SStefano Zampini   PetscFunctionReturn(0);
8803425bc38SStefano Zampini 
8813425bc38SStefano Zampini }
8823425bc38SStefano Zampini EXTERN_C_END
8833425bc38SStefano Zampini #undef __FUNCT__
8843425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetSolution"
8853425bc38SStefano Zampini /*@
8863425bc38SStefano Zampini  PCBDDCMatFETIDPGetSolution - Get Solution for FETIDP linear system.
8873425bc38SStefano Zampini 
8883425bc38SStefano Zampini    Collective
8893425bc38SStefano Zampini 
8903425bc38SStefano Zampini    Input Parameters:
8913425bc38SStefano Zampini +  fetidp_mat        - the FETIDP mat obtained by a call to PCBDDCCreateFETIDPOperators
8923425bc38SStefano Zampini +  fetidp_flux_sol - the solution of the FETIDP linear system
8933425bc38SStefano Zampini 
8943425bc38SStefano Zampini    Output Parameters:
8953425bc38SStefano Zampini +  standard_sol      - the solution on the global domain
8963425bc38SStefano Zampini 
8973425bc38SStefano Zampini    Level: developer
8983425bc38SStefano Zampini 
8993425bc38SStefano Zampini    Notes:
9003425bc38SStefano Zampini 
9013425bc38SStefano Zampini .seealso: PCBDDC
9023425bc38SStefano Zampini @*/
9033425bc38SStefano Zampini PetscErrorCode PCBDDCMatFETIDPGetSolution(Mat fetidp_mat, Vec fetidp_flux_sol, Vec standard_sol)
9043425bc38SStefano Zampini {
9053425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
9063425bc38SStefano Zampini   PetscErrorCode ierr;
9073425bc38SStefano Zampini 
9083425bc38SStefano Zampini   PetscFunctionBegin;
9093425bc38SStefano Zampini   ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr);
9103425bc38SStefano Zampini   ierr = PetscTryMethod(mat_ctx->pc,"PCBDDCMatFETIDPGetSolution_C",(Mat,Vec,Vec),(fetidp_mat,fetidp_flux_sol,standard_sol));CHKERRQ(ierr);
9113425bc38SStefano Zampini   PetscFunctionReturn(0);
9123425bc38SStefano Zampini }
9133425bc38SStefano Zampini /* -------------------------------------------------------------------------- */
9143425bc38SStefano Zampini EXTERN_C_BEGIN
9153425bc38SStefano Zampini #undef __FUNCT__
9163425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPOperators_BDDC"
9173425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPOperators_BDDC(PC pc, Mat *fetidp_mat, PC *fetidp_pc)
9183425bc38SStefano Zampini {
9193425bc38SStefano Zampini   PETSC_EXTERN PetscErrorCode FETIDPMatMult(Mat,Vec,Vec);
9203425bc38SStefano Zampini   PETSC_EXTERN PetscErrorCode PCBDDCDestroyFETIDPMat(Mat);
9213425bc38SStefano Zampini   PETSC_EXTERN PetscErrorCode FETIDPPCApply(PC,Vec,Vec);
9223425bc38SStefano Zampini   PETSC_EXTERN PetscErrorCode PCBDDCDestroyFETIDPPC(PC);
9233425bc38SStefano Zampini 
9243425bc38SStefano Zampini   FETIDPMat_ctx  *fetidpmat_ctx;
9253425bc38SStefano Zampini   Mat            newmat;
9263425bc38SStefano Zampini   FETIDPPC_ctx  *fetidppc_ctx;
9273425bc38SStefano Zampini   PC             newpc;
9283425bc38SStefano Zampini   MPI_Comm       comm = ((PetscObject)pc)->comm;
9293425bc38SStefano Zampini   PetscErrorCode ierr;
9303425bc38SStefano Zampini 
9313425bc38SStefano Zampini   PetscFunctionBegin;
9323425bc38SStefano Zampini   /* FETIDP linear matrix */
9333425bc38SStefano Zampini   ierr = PCBDDCCreateFETIDPMatContext(pc, &fetidpmat_ctx);CHKERRQ(ierr);
9343425bc38SStefano Zampini   ierr = PCBDDCSetupFETIDPMatContext(fetidpmat_ctx);CHKERRQ(ierr);
9353425bc38SStefano Zampini   ierr = MatCreateShell(comm,PETSC_DECIDE,PETSC_DECIDE,fetidpmat_ctx->n_lambda,fetidpmat_ctx->n_lambda,fetidpmat_ctx,&newmat);CHKERRQ(ierr);
9363425bc38SStefano Zampini   ierr = MatShellSetOperation(newmat,MATOP_MULT,(void (*)(void))FETIDPMatMult);CHKERRQ(ierr);
9373425bc38SStefano Zampini   ierr = MatShellSetOperation(newmat,MATOP_DESTROY,(void (*)(void))PCBDDCDestroyFETIDPMat);CHKERRQ(ierr);
9383425bc38SStefano Zampini   ierr = MatSetUp(newmat);CHKERRQ(ierr);
9393425bc38SStefano Zampini   /* FETIDP preconditioner */
9403425bc38SStefano Zampini   ierr = PCBDDCCreateFETIDPPCContext(pc, &fetidppc_ctx);CHKERRQ(ierr);
9413425bc38SStefano Zampini   ierr = PCBDDCSetupFETIDPPCContext(newmat,fetidppc_ctx);CHKERRQ(ierr);
9423425bc38SStefano Zampini   ierr = PCCreate(comm,&newpc);CHKERRQ(ierr);
9433425bc38SStefano Zampini   ierr = PCSetType(newpc,PCSHELL);CHKERRQ(ierr);
9443425bc38SStefano Zampini   ierr = PCShellSetContext(newpc,fetidppc_ctx);CHKERRQ(ierr);
9453425bc38SStefano Zampini   ierr = PCShellSetApply(newpc,FETIDPPCApply);CHKERRQ(ierr);
9463425bc38SStefano Zampini   ierr = PCShellSetDestroy(newpc,PCBDDCDestroyFETIDPPC);CHKERRQ(ierr);
9473425bc38SStefano Zampini   ierr = PCSetOperators(newpc,newmat,newmat,SAME_PRECONDITIONER);CHKERRQ(ierr);
9483425bc38SStefano Zampini   ierr = PCSetUp(newpc);CHKERRQ(ierr);
9493425bc38SStefano Zampini   /* return pointers for objects created */
9503425bc38SStefano Zampini   *fetidp_mat=newmat;
9513425bc38SStefano Zampini   *fetidp_pc=newpc;
9523425bc38SStefano Zampini 
9533425bc38SStefano Zampini   PetscFunctionReturn(0);
9543425bc38SStefano Zampini }
9553425bc38SStefano Zampini EXTERN_C_END
9563425bc38SStefano Zampini #undef __FUNCT__
9573425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPOperators"
9583425bc38SStefano Zampini /*@
9593425bc38SStefano Zampini  PCBDDCCreateFETIDPOperators - Create operators for FETIDP.
9603425bc38SStefano Zampini 
9613425bc38SStefano Zampini    Collective
9623425bc38SStefano Zampini 
9633425bc38SStefano Zampini    Input Parameters:
9643425bc38SStefano Zampini +  pc - the BDDC preconditioning context (setup must be already called)
9653425bc38SStefano Zampini 
9663425bc38SStefano Zampini    Level: developer
9673425bc38SStefano Zampini 
9683425bc38SStefano Zampini    Notes:
9693425bc38SStefano Zampini 
9703425bc38SStefano Zampini .seealso: PCBDDC
9713425bc38SStefano Zampini @*/
9723425bc38SStefano Zampini PetscErrorCode PCBDDCCreateFETIDPOperators(PC pc, Mat *fetidp_mat, PC *fetidp_pc)
9733425bc38SStefano Zampini {
9743425bc38SStefano Zampini   PetscErrorCode ierr;
9753425bc38SStefano Zampini 
9763425bc38SStefano Zampini   PetscFunctionBegin;
9773425bc38SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
9783425bc38SStefano Zampini   if (pc->setupcalled) {
9793425bc38SStefano Zampini     ierr = PetscTryMethod(pc,"PCBDDCCreateFETIDPOperators_C",(PC,Mat*,PC*),(pc,fetidp_mat,fetidp_pc));CHKERRQ(ierr);
9803425bc38SStefano Zampini   } else {
9813425bc38SStefano Zampini     SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"You must call PCSetup_BDDC before calling %s\n",__FUNCT__);
9823425bc38SStefano Zampini   }
9833425bc38SStefano Zampini   PetscFunctionReturn(0);
9843425bc38SStefano Zampini }
9850c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
986da1bb401SStefano Zampini /*MC
987da1bb401SStefano Zampini    PCBDDC - Balancing Domain Decomposition by Constraints.
9880c7d97c5SJed Brown 
989da1bb401SStefano Zampini    Options Database Keys:
990da1bb401SStefano Zampini .    -pcbddc ??? -
991da1bb401SStefano Zampini 
992da1bb401SStefano Zampini    Level: intermediate
993da1bb401SStefano Zampini 
994da1bb401SStefano Zampini    Notes: The matrix used with this preconditioner must be of type MATIS
995da1bb401SStefano Zampini 
996da1bb401SStefano Zampini           Unlike more 'conventional' interface preconditioners, this iterates over ALL the
997da1bb401SStefano Zampini           degrees of freedom, NOT just those on the interface (this allows the use of approximate solvers
998da1bb401SStefano Zampini           on the subdomains).
999da1bb401SStefano Zampini 
1000da1bb401SStefano Zampini           Options for the coarse grid preconditioner can be set with -
1001da1bb401SStefano Zampini           Options for the Dirichlet subproblem can be set with -
1002da1bb401SStefano Zampini           Options for the Neumann subproblem can be set with -
1003da1bb401SStefano Zampini 
1004da1bb401SStefano Zampini    Contributed by Stefano Zampini
1005da1bb401SStefano Zampini 
1006da1bb401SStefano Zampini .seealso:  PCCreate(), PCSetType(), PCType (for list of available types), PC,  MATIS
1007da1bb401SStefano Zampini M*/
1008da1bb401SStefano Zampini EXTERN_C_BEGIN
1009da1bb401SStefano Zampini #undef __FUNCT__
1010da1bb401SStefano Zampini #define __FUNCT__ "PCCreate_BDDC"
1011da1bb401SStefano Zampini PetscErrorCode PCCreate_BDDC(PC pc)
1012da1bb401SStefano Zampini {
1013da1bb401SStefano Zampini   PetscErrorCode ierr;
1014da1bb401SStefano Zampini   PC_BDDC        *pcbddc;
1015da1bb401SStefano Zampini   PCBDDCGraph    mat_graph;
1016da1bb401SStefano Zampini 
1017da1bb401SStefano Zampini   PetscFunctionBegin;
1018da1bb401SStefano Zampini   /* Creates the private data structure for this preconditioner and attach it to the PC object. */
1019da1bb401SStefano Zampini   ierr      = PetscNewLog(pc,PC_BDDC,&pcbddc);CHKERRQ(ierr);
1020da1bb401SStefano Zampini   pc->data  = (void*)pcbddc;
1021da1bb401SStefano Zampini 
1022da1bb401SStefano Zampini   /* create PCIS data structure */
1023da1bb401SStefano Zampini   ierr = PCISCreate(pc);CHKERRQ(ierr);
1024da1bb401SStefano Zampini 
1025da1bb401SStefano Zampini   /* BDDC specific */
10263972b0daSStefano Zampini   pcbddc->temp_solution              = 0;
1027534831adSStefano Zampini   pcbddc->original_rhs               = 0;
1028534831adSStefano Zampini   pcbddc->local_mat                  = 0;
1029534831adSStefano Zampini   pcbddc->ChangeOfBasisMatrix        = 0;
1030534831adSStefano Zampini   pcbddc->usechangeofbasis           = PETSC_TRUE;
1031534831adSStefano Zampini   pcbddc->usechangeonfaces           = PETSC_FALSE;
1032da1bb401SStefano Zampini   pcbddc->coarse_vec                 = 0;
1033da1bb401SStefano Zampini   pcbddc->coarse_rhs                 = 0;
1034da1bb401SStefano Zampini   pcbddc->coarse_ksp                 = 0;
1035da1bb401SStefano Zampini   pcbddc->coarse_phi_B               = 0;
1036da1bb401SStefano Zampini   pcbddc->coarse_phi_D               = 0;
1037da1bb401SStefano Zampini   pcbddc->vec1_P                     = 0;
1038da1bb401SStefano Zampini   pcbddc->vec1_R                     = 0;
1039da1bb401SStefano Zampini   pcbddc->vec2_R                     = 0;
1040da1bb401SStefano Zampini   pcbddc->local_auxmat1              = 0;
1041da1bb401SStefano Zampini   pcbddc->local_auxmat2              = 0;
1042da1bb401SStefano Zampini   pcbddc->R_to_B                     = 0;
1043da1bb401SStefano Zampini   pcbddc->R_to_D                     = 0;
1044da1bb401SStefano Zampini   pcbddc->ksp_D                      = 0;
1045da1bb401SStefano Zampini   pcbddc->ksp_R                      = 0;
1046da1bb401SStefano Zampini   pcbddc->local_primal_indices       = 0;
1047da1bb401SStefano Zampini   pcbddc->prec_type                  = PETSC_FALSE;
1048da1bb401SStefano Zampini   pcbddc->NeumannBoundaries          = 0;
1049da1bb401SStefano Zampini   pcbddc->ISForDofs                  = 0;
1050da1bb401SStefano Zampini   pcbddc->ISForVertices              = 0;
1051da1bb401SStefano Zampini   pcbddc->n_ISForFaces               = 0;
1052da1bb401SStefano Zampini   pcbddc->n_ISForEdges               = 0;
1053da1bb401SStefano Zampini   pcbddc->ConstraintMatrix           = 0;
1054da1bb401SStefano Zampini   pcbddc->use_nnsp_true              = PETSC_FALSE;
1055da1bb401SStefano Zampini   pcbddc->local_primal_sizes         = 0;
1056da1bb401SStefano Zampini   pcbddc->local_primal_displacements = 0;
1057da1bb401SStefano Zampini   pcbddc->replicated_local_primal_indices = 0;
1058da1bb401SStefano Zampini   pcbddc->replicated_local_primal_values  = 0;
1059da1bb401SStefano Zampini   pcbddc->coarse_loc_to_glob         = 0;
1060da1bb401SStefano Zampini   pcbddc->dbg_flag                   = PETSC_FALSE;
1061da1bb401SStefano Zampini   pcbddc->coarsening_ratio           = 8;
1062b76ba322SStefano Zampini   pcbddc->use_exact_dirichlet        = PETSC_TRUE;
1063da1bb401SStefano Zampini 
1064da1bb401SStefano Zampini   /* allocate and initialize needed graph structure */
1065da1bb401SStefano Zampini   ierr = PetscMalloc(sizeof(*mat_graph),&pcbddc->mat_graph);CHKERRQ(ierr);
1066da1bb401SStefano Zampini   pcbddc->mat_graph->xadj            = 0;
1067da1bb401SStefano Zampini   pcbddc->mat_graph->adjncy          = 0;
1068da1bb401SStefano Zampini 
1069da1bb401SStefano Zampini   /* function pointers */
1070da1bb401SStefano Zampini   pc->ops->apply               = PCApply_BDDC;
1071da1bb401SStefano Zampini   pc->ops->applytranspose      = 0;
1072da1bb401SStefano Zampini   pc->ops->setup               = PCSetUp_BDDC;
1073da1bb401SStefano Zampini   pc->ops->destroy             = PCDestroy_BDDC;
1074da1bb401SStefano Zampini   pc->ops->setfromoptions      = PCSetFromOptions_BDDC;
1075da1bb401SStefano Zampini   pc->ops->view                = 0;
1076da1bb401SStefano Zampini   pc->ops->applyrichardson     = 0;
1077da1bb401SStefano Zampini   pc->ops->applysymmetricleft  = 0;
1078da1bb401SStefano Zampini   pc->ops->applysymmetricright = 0;
1079534831adSStefano Zampini   pc->ops->presolve            = PCPreSolve_BDDC;
1080534831adSStefano Zampini   pc->ops->postsolve           = PCPostSolve_BDDC;
1081da1bb401SStefano Zampini 
1082da1bb401SStefano Zampini   /* composing function */
1083da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDirichletBoundaries_C","PCBDDCSetDirichletBoundaries_BDDC",
1084da1bb401SStefano Zampini                     PCBDDCSetDirichletBoundaries_BDDC);CHKERRQ(ierr);
1085da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNeumannBoundaries_C","PCBDDCSetNeumannBoundaries_BDDC",
1086da1bb401SStefano Zampini                     PCBDDCSetNeumannBoundaries_BDDC);CHKERRQ(ierr);
1087da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetDirichletBoundaries_C","PCBDDCGetDirichletBoundaries_BDDC",
1088da1bb401SStefano Zampini                     PCBDDCGetDirichletBoundaries_BDDC);CHKERRQ(ierr);
1089da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetNeumannBoundaries_C","PCBDDCGetNeumannBoundaries_BDDC",
1090da1bb401SStefano Zampini                     PCBDDCGetNeumannBoundaries_BDDC);CHKERRQ(ierr);
1091da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseProblemType_C","PCBDDCSetCoarseProblemType_BDDC",
1092da1bb401SStefano Zampini                     PCBDDCSetCoarseProblemType_BDDC);CHKERRQ(ierr);
1093da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDofsSplitting_C","PCBDDCSetDofsSplitting_BDDC",
1094da1bb401SStefano Zampini                     PCBDDCSetDofsSplitting_BDDC);CHKERRQ(ierr);
1095da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetLocalAdjacencyGraph_C","PCBDDCSetLocalAdjacencyGraph_BDDC",
1096da1bb401SStefano Zampini                     PCBDDCSetLocalAdjacencyGraph_BDDC);CHKERRQ(ierr);
1097534831adSStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPreSolve_C","PCPreSolve_BDDC",
1098534831adSStefano Zampini                     PCPreSolve_BDDC);CHKERRQ(ierr);
1099534831adSStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPostSolve_C","PCPostSolve_BDDC",
1100534831adSStefano Zampini                     PCPostSolve_BDDC);CHKERRQ(ierr);
11013425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCCreateFETIDPOperators_C","PCBDDCCreateFETIDPOperators_BDDC",
11023425bc38SStefano Zampini                     PCBDDCCreateFETIDPOperators_BDDC);CHKERRQ(ierr);
11033425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetRHS_C","PCBDDCMatFETIDPGetRHS_BDDC",
11043425bc38SStefano Zampini                     PCBDDCMatFETIDPGetRHS_BDDC);CHKERRQ(ierr);
11053425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetSolution_C","PCBDDCMatFETIDPGetSolution_BDDC",
11063425bc38SStefano Zampini                     PCBDDCMatFETIDPGetSolution_BDDC);CHKERRQ(ierr);
1107da1bb401SStefano Zampini   PetscFunctionReturn(0);
1108da1bb401SStefano Zampini }
1109da1bb401SStefano Zampini EXTERN_C_END
11103425bc38SStefano Zampini 
1111da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
1112da1bb401SStefano Zampini /* All static functions from now on                                           */
1113da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
11143425bc38SStefano Zampini 
11153425bc38SStefano Zampini #undef __FUNCT__
11163425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPMatContext"
11173425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPMatContext(PC pc, FETIDPMat_ctx **fetidpmat_ctx)
11183425bc38SStefano Zampini {
11193425bc38SStefano Zampini   FETIDPMat_ctx  *newctx;
11203425bc38SStefano Zampini   PetscErrorCode ierr;
11213425bc38SStefano Zampini 
11223425bc38SStefano Zampini   PetscFunctionBegin;
11233425bc38SStefano Zampini   ierr = PetscMalloc(sizeof(*newctx),&newctx);CHKERRQ(ierr);
11243425bc38SStefano Zampini   newctx->lambda_local    = 0;
11253425bc38SStefano Zampini   newctx->temp_solution_B = 0;
11263425bc38SStefano Zampini   newctx->temp_solution_D = 0;
11273425bc38SStefano Zampini   newctx->B_delta         = 0;
11283425bc38SStefano Zampini   newctx->B_Ddelta        = 0; /* theoretically belongs to the FETIDP preconditioner */
11293425bc38SStefano Zampini   newctx->l2g_lambda      = 0;
11303425bc38SStefano Zampini   /* increase the reference count for BDDC preconditioner */
11313425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)pc);CHKERRQ(ierr);
11323425bc38SStefano Zampini   newctx->pc              = pc;
11333425bc38SStefano Zampini   *fetidpmat_ctx          = newctx;
11343425bc38SStefano Zampini   PetscFunctionReturn(0);
11353425bc38SStefano Zampini }
11363425bc38SStefano Zampini 
11373425bc38SStefano Zampini #undef __FUNCT__
11383425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPPCContext"
11393425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPPCContext(PC pc, FETIDPPC_ctx **fetidppc_ctx)
11403425bc38SStefano Zampini {
11413425bc38SStefano Zampini   FETIDPPC_ctx  *newctx;
11423425bc38SStefano Zampini   PetscErrorCode ierr;
11433425bc38SStefano Zampini 
11443425bc38SStefano Zampini   PetscFunctionBegin;
11453425bc38SStefano Zampini   ierr = PetscMalloc(sizeof(*newctx),&newctx);CHKERRQ(ierr);
11463425bc38SStefano Zampini   newctx->lambda_local    = 0;
11473425bc38SStefano Zampini   newctx->B_Ddelta        = 0;
11483425bc38SStefano Zampini   newctx->l2g_lambda      = 0;
11493425bc38SStefano Zampini   /* increase the reference count for BDDC preconditioner */
11503425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)pc);CHKERRQ(ierr);
11513425bc38SStefano Zampini   newctx->pc              = pc;
11523425bc38SStefano Zampini   *fetidppc_ctx           = newctx;
11533425bc38SStefano Zampini   PetscFunctionReturn(0);
11543425bc38SStefano Zampini }
11553425bc38SStefano Zampini 
11563425bc38SStefano Zampini #undef __FUNCT__
11573425bc38SStefano Zampini #define __FUNCT__ "PCBDDCDestroyFETIDPMat"
11583425bc38SStefano Zampini static PetscErrorCode PCBDDCDestroyFETIDPMat(Mat A)
11593425bc38SStefano Zampini {
11603425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
11613425bc38SStefano Zampini   PetscErrorCode ierr;
11623425bc38SStefano Zampini 
11633425bc38SStefano Zampini   PetscFunctionBegin;
11643425bc38SStefano Zampini   ierr = MatShellGetContext(A,(void**)&mat_ctx);CHKERRQ(ierr);
11653425bc38SStefano Zampini   ierr = VecDestroy(&mat_ctx->lambda_local);CHKERRQ(ierr);
11663425bc38SStefano Zampini   ierr = VecDestroy(&mat_ctx->temp_solution_D);CHKERRQ(ierr);
11673425bc38SStefano Zampini   ierr = VecDestroy(&mat_ctx->temp_solution_B);CHKERRQ(ierr);
11683425bc38SStefano Zampini   ierr = MatDestroy(&mat_ctx->B_delta);CHKERRQ(ierr);
11693425bc38SStefano Zampini   ierr = MatDestroy(&mat_ctx->B_Ddelta);CHKERRQ(ierr);
11703425bc38SStefano Zampini   ierr = VecScatterDestroy(&mat_ctx->l2g_lambda);CHKERRQ(ierr);
11713425bc38SStefano Zampini   ierr = PCDestroy(&mat_ctx->pc);CHKERRQ(ierr); /* actually it does not destroy BDDC, only decrease its reference count */
11723425bc38SStefano Zampini   ierr = PetscFree(mat_ctx);CHKERRQ(ierr);
11733425bc38SStefano Zampini   PetscFunctionReturn(0);
11743425bc38SStefano Zampini }
11753425bc38SStefano Zampini 
11763425bc38SStefano Zampini #undef __FUNCT__
11773425bc38SStefano Zampini #define __FUNCT__ "PCBDDCDestroyFETIDPPC"
11783425bc38SStefano Zampini static PetscErrorCode PCBDDCDestroyFETIDPPC(PC pc)
11793425bc38SStefano Zampini {
11803425bc38SStefano Zampini   FETIDPPC_ctx  *pc_ctx;
11813425bc38SStefano Zampini   PetscErrorCode ierr;
11823425bc38SStefano Zampini 
11833425bc38SStefano Zampini   PetscFunctionBegin;
11843425bc38SStefano Zampini   ierr = PCShellGetContext(pc,(void**)&pc_ctx);CHKERRQ(ierr);
11853425bc38SStefano Zampini   ierr = VecDestroy(&pc_ctx->lambda_local);CHKERRQ(ierr);
11863425bc38SStefano Zampini   ierr = MatDestroy(&pc_ctx->B_Ddelta);CHKERRQ(ierr);
11873425bc38SStefano Zampini   ierr = VecScatterDestroy(&pc_ctx->l2g_lambda);CHKERRQ(ierr);
11883425bc38SStefano Zampini   ierr = PCDestroy(&pc_ctx->pc);CHKERRQ(ierr); /* actually it does not destroy BDDC, only decrease its reference count */
11893425bc38SStefano Zampini   ierr = PetscFree(pc_ctx);CHKERRQ(ierr);
11903425bc38SStefano Zampini   PetscFunctionReturn(0);
11913425bc38SStefano Zampini }
11923425bc38SStefano Zampini 
11933425bc38SStefano Zampini #undef __FUNCT__
11943425bc38SStefano Zampini #define __FUNCT__ "PCBDDCSetupFETIDPMatContext"
11953425bc38SStefano Zampini static PetscErrorCode PCBDDCSetupFETIDPMatContext(FETIDPMat_ctx *fetidpmat_ctx )
11963425bc38SStefano Zampini {
11973425bc38SStefano Zampini   PetscErrorCode ierr;
11983425bc38SStefano Zampini   PC_IS          *pcis=(PC_IS*)fetidpmat_ctx->pc->data;
11993425bc38SStefano Zampini   PC_BDDC        *pcbddc=(PC_BDDC*)fetidpmat_ctx->pc->data;
12003425bc38SStefano Zampini   PCBDDCGraph    mat_graph=pcbddc->mat_graph;
12013425bc38SStefano Zampini   Mat_IS         *matis  = (Mat_IS*)fetidpmat_ctx->pc->pmat->data;
12023425bc38SStefano Zampini   MPI_Comm       comm = ((PetscObject)(fetidpmat_ctx->pc))->comm;
12033425bc38SStefano Zampini 
12043425bc38SStefano Zampini   Mat            ScalingMat;
12053425bc38SStefano Zampini   Vec            lambda_global;
12063425bc38SStefano Zampini   IS             IS_l2g_lambda;
12073425bc38SStefano Zampini 
12083425bc38SStefano Zampini   PetscBool      skip_node,fully_redundant;
12093425bc38SStefano Zampini   PetscInt       i,j,k,s,n_boundary_dofs,sum_dof_sizes,n_global_lambda,n_vertices;
12103425bc38SStefano Zampini   PetscInt       n_local_lambda,n_lambda_for_dof,dual_size,n_neg_values,n_pos_values;
12113425bc38SStefano Zampini   PetscMPIInt    rank,nprocs,partial_sum;
12123425bc38SStefano Zampini   PetscScalar    scalar_value;
12133425bc38SStefano Zampini 
12143425bc38SStefano Zampini   PetscInt       *vertex_indices,*temp_indices;
12153425bc38SStefano Zampini   PetscInt       *dual_dofs_boundary_indices,*aux_local_numbering_1,*aux_global_numbering;
12163425bc38SStefano Zampini   PetscInt       *aux_sums,*cols_B_delta,*l2g_indices;
12173425bc38SStefano Zampini   PetscMPIInt    *aux_local_numbering_2,*aux_global_numbering_mpi,*dof_sizes,*dof_displs;
12183425bc38SStefano Zampini   PetscMPIInt    *all_aux_global_numbering_mpi_1,*all_aux_global_numbering_mpi_2,*global_dofs_numbering;
12193425bc38SStefano Zampini   PetscScalar    *array,*scaling_factors,*vals_B_delta;
12203425bc38SStefano Zampini 
12213425bc38SStefano Zampini   /* For communication of scaling factors */
12223425bc38SStefano Zampini   PetscInt       *ptrs_buffer,neigh_position;
12233425bc38SStefano Zampini   PetscScalar    **all_factors,*send_buffer,*recv_buffer;
12243425bc38SStefano Zampini   MPI_Request    *send_reqs,*recv_reqs;
12253425bc38SStefano Zampini 
12263425bc38SStefano Zampini   /* tests */
12273425bc38SStefano Zampini   Vec            test_vec;
12283425bc38SStefano Zampini   PetscBool      test_fetidp;
12293425bc38SStefano Zampini   PetscViewer    viewer;
12303425bc38SStefano Zampini 
12313425bc38SStefano Zampini   PetscFunctionBegin;
12323425bc38SStefano Zampini   ierr = MPI_Comm_rank(comm,&rank);CHKERRQ(ierr);
12333425bc38SStefano Zampini   ierr = MPI_Comm_size(comm,&nprocs);CHKERRQ(ierr);
12343425bc38SStefano Zampini 
12353425bc38SStefano Zampini   /* Default type of lagrange multipliers is non-redundant */
12363425bc38SStefano Zampini   fully_redundant = PETSC_FALSE;
12373425bc38SStefano Zampini   ierr = PetscOptionsGetBool(PETSC_NULL,"-fetidp_fullyredundant",&fully_redundant,PETSC_NULL);CHKERRQ(ierr);
12383425bc38SStefano Zampini 
12393425bc38SStefano Zampini   /* Evaluate local and global number of lagrange multipliers */
12403425bc38SStefano Zampini   ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
12413425bc38SStefano Zampini   n_local_lambda = 0;
12423425bc38SStefano Zampini   partial_sum = 0;
12433425bc38SStefano Zampini   n_boundary_dofs = 0;
12443425bc38SStefano Zampini   s = 0;
12453425bc38SStefano Zampini   n_vertices = 0;
12463425bc38SStefano Zampini   /* Get Vertices used to define the BDDC */
12473425bc38SStefano Zampini   ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(*vertex_indices),&vertex_indices);CHKERRQ(ierr);
12483425bc38SStefano Zampini   for(i=0;i<pcbddc->local_primal_size;i++) {
12493425bc38SStefano Zampini     ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&j,(const PetscInt**)&temp_indices,PETSC_NULL);CHKERRQ(ierr);
12503425bc38SStefano Zampini     if(j == 1) {
12513425bc38SStefano Zampini       vertex_indices[n_vertices]=temp_indices[0];
12523425bc38SStefano Zampini       n_vertices++;
12533425bc38SStefano Zampini     }
12543425bc38SStefano Zampini     ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&j,(const PetscInt**)&temp_indices,PETSC_NULL);CHKERRQ(ierr);
12553425bc38SStefano Zampini   }
12563425bc38SStefano Zampini   dual_size = pcis->n_B-n_vertices;
12573425bc38SStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*dual_dofs_boundary_indices),&dual_dofs_boundary_indices);CHKERRQ(ierr);
12583425bc38SStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*aux_local_numbering_1),&aux_local_numbering_1);CHKERRQ(ierr);
12593425bc38SStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*aux_local_numbering_2),&aux_local_numbering_2);CHKERRQ(ierr);
12603425bc38SStefano Zampini 
12613425bc38SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
12623425bc38SStefano Zampini   for(i=0;i<pcis->n;i++){
12633425bc38SStefano Zampini     j = mat_graph->count[i]; /* RECALL: mat_graph->count[i] does not count myself */
1264c6582918SStefano Zampini     k = 0;
1265c6582918SStefano Zampini     if(j > 0) {
12663425bc38SStefano Zampini       k = (mat_graph->neighbours_set[i][0] == -1 ?  1 : 0);
1267c6582918SStefano Zampini     }
12683425bc38SStefano Zampini     j = j - k ;
12693425bc38SStefano Zampini     if( j > 0 ) { n_boundary_dofs++; }
12703425bc38SStefano Zampini 
12713425bc38SStefano Zampini     skip_node = PETSC_FALSE;
1272c6582918SStefano Zampini     if( s < n_vertices && vertex_indices[s]==i) { /* it works for a sorted set of vertices */
12733425bc38SStefano Zampini       skip_node = PETSC_TRUE;
12743425bc38SStefano Zampini       s++;
12753425bc38SStefano Zampini     }
12763425bc38SStefano Zampini     if(j < 1) {skip_node = PETSC_TRUE;}
12773425bc38SStefano Zampini     if( !skip_node ) {
12783425bc38SStefano Zampini       if(fully_redundant) {
12793425bc38SStefano Zampini         /* fully redundant set of lagrange multipliers */
12803425bc38SStefano Zampini         n_lambda_for_dof = (j*(j+1))/2;
12813425bc38SStefano Zampini       } else {
12823425bc38SStefano Zampini         n_lambda_for_dof = j;
12833425bc38SStefano Zampini       }
12843425bc38SStefano Zampini       n_local_lambda += j;
12853425bc38SStefano Zampini       /* needed to evaluate global number of lagrange multipliers */
12863425bc38SStefano Zampini       array[i]=(1.0*n_lambda_for_dof)/(j+1.0); /* already scaled for the next global sum */
12873425bc38SStefano Zampini       /* store some data needed */
12883425bc38SStefano Zampini       dual_dofs_boundary_indices[partial_sum] = n_boundary_dofs-1;
12893425bc38SStefano Zampini       aux_local_numbering_1[partial_sum] = i;
12903425bc38SStefano Zampini       aux_local_numbering_2[partial_sum] = (PetscMPIInt)n_lambda_for_dof;
12913425bc38SStefano Zampini       partial_sum++;
12923425bc38SStefano Zampini     }
12933425bc38SStefano Zampini   }
12943425bc38SStefano Zampini   /*printf("I found %d local lambda dofs\n",n_local_lambda);
12953425bc38SStefano Zampini   printf("I found %d boundary dofs (should be %d)\n",n_boundary_dofs,pcis->n_B);
12963425bc38SStefano Zampini   printf("Partial sum %d should be %d\n",partial_sum,dual_size);*/
12973425bc38SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
12983425bc38SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
12993425bc38SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
13003425bc38SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
13013425bc38SStefano Zampini   ierr = VecSum(pcis->vec1_global,&scalar_value);CHKERRQ(ierr);
13023425bc38SStefano Zampini   fetidpmat_ctx->n_lambda = (PetscInt) scalar_value;
13033425bc38SStefano Zampini   /* printf("I found %d global multipliers (%f)\n",fetidpmat_ctx->n_lambda,scalar_value); */
13043425bc38SStefano Zampini   ierr = VecCreate(PETSC_COMM_SELF,&fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
13053425bc38SStefano Zampini   ierr = VecSetSizes(fetidpmat_ctx->lambda_local,n_local_lambda,n_local_lambda);CHKERRQ(ierr);
13063425bc38SStefano Zampini   ierr = VecSetType(fetidpmat_ctx->lambda_local,VECSEQ);CHKERRQ(ierr);
13073425bc38SStefano Zampini   ierr = VecCreate(comm,&lambda_global);CHKERRQ(ierr);
13083425bc38SStefano Zampini   ierr = VecSetSizes(lambda_global,PETSC_DECIDE,fetidpmat_ctx->n_lambda);CHKERRQ(ierr);
13093425bc38SStefano Zampini   ierr = VecSetType(lambda_global,VECMPI);CHKERRQ(ierr);
13103425bc38SStefano Zampini 
13113425bc38SStefano Zampini   /* compute global ordering of lagrange multipliers and associate l2g map */
13123425bc38SStefano Zampini 
13133425bc38SStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*aux_global_numbering),&aux_global_numbering);CHKERRQ(ierr);
13143425bc38SStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*aux_global_numbering_mpi),&aux_global_numbering_mpi);CHKERRQ(ierr);
13153425bc38SStefano Zampini   j = (rank == 0 ? nprocs : 0);
13163425bc38SStefano Zampini   ierr = PetscMalloc(j*sizeof(*dof_sizes),&dof_sizes);CHKERRQ(ierr);
13173425bc38SStefano Zampini   ierr = PetscMalloc(j*sizeof(*dof_displs),&dof_displs);CHKERRQ(ierr);
13183425bc38SStefano Zampini   ierr = ISLocalToGlobalMappingApply(matis->mapping,dual_size,aux_local_numbering_1,aux_global_numbering);CHKERRQ(ierr);
13193425bc38SStefano Zampini   ierr = MPI_Gather(&dual_size,1,MPIU_INT,dof_sizes,1,MPIU_INT,0,comm);CHKERRQ(ierr);
13203425bc38SStefano Zampini   sum_dof_sizes=0;
13213425bc38SStefano Zampini   if ( rank == 0 ) {
13223425bc38SStefano Zampini     dof_displs[0]=0;
13233425bc38SStefano Zampini     sum_dof_sizes=dual_size;
13243425bc38SStefano Zampini     for(i=1;i<nprocs;i++) {
13253425bc38SStefano Zampini       dof_displs[i] = dof_displs[i-1]+dof_sizes[i-1];
13263425bc38SStefano Zampini       sum_dof_sizes += dof_sizes[i];
13273425bc38SStefano Zampini     }
13283425bc38SStefano Zampini   }
13293425bc38SStefano Zampini   for(i=0;i<dual_size;i++) {
13303425bc38SStefano Zampini     aux_global_numbering_mpi[i]=(PetscMPIInt)aux_global_numbering[i];
13313425bc38SStefano Zampini   }
13323425bc38SStefano Zampini   ierr = PetscMalloc(sum_dof_sizes*sizeof(*all_aux_global_numbering_mpi_1),&all_aux_global_numbering_mpi_1);CHKERRQ(ierr);
13333425bc38SStefano Zampini   ierr = PetscMalloc(sum_dof_sizes*sizeof(*all_aux_global_numbering_mpi_2),&all_aux_global_numbering_mpi_2);CHKERRQ(ierr);
13343425bc38SStefano Zampini   ierr = MPI_Gatherv(aux_global_numbering_mpi,dual_size,MPIU_INT,all_aux_global_numbering_mpi_1,dof_sizes,dof_displs,MPIU_INT,0,comm);CHKERRQ(ierr);
13353425bc38SStefano Zampini   ierr = MPI_Gatherv(aux_local_numbering_2,dual_size,MPIU_INT,all_aux_global_numbering_mpi_2,dof_sizes,dof_displs,MPIU_INT,0,comm);CHKERRQ(ierr);
13363425bc38SStefano Zampini 
13373425bc38SStefano Zampini   ierr = PetscMalloc(fetidpmat_ctx->n_lambda*sizeof(*global_dofs_numbering),&global_dofs_numbering);CHKERRQ(ierr);
13383425bc38SStefano Zampini   if( rank == 0 ) {
13393425bc38SStefano Zampini     ierr = PetscSortMPIIntWithArray(sum_dof_sizes,all_aux_global_numbering_mpi_1,all_aux_global_numbering_mpi_2);CHKERRQ(ierr);
13403425bc38SStefano Zampini     j=-1;
13413425bc38SStefano Zampini     partial_sum = 0;
13423425bc38SStefano Zampini     for(i=0;i<sum_dof_sizes;i++) {
13433425bc38SStefano Zampini       if(j != all_aux_global_numbering_mpi_1[i] ) {
13443425bc38SStefano Zampini         j=all_aux_global_numbering_mpi_1[i];
13453425bc38SStefano Zampini         for(k=0;k<all_aux_global_numbering_mpi_2[i];k++) {
13463425bc38SStefano Zampini           global_dofs_numbering[partial_sum+k]=all_aux_global_numbering_mpi_1[i];
13473425bc38SStefano Zampini         }
13483425bc38SStefano Zampini         partial_sum += all_aux_global_numbering_mpi_2[i];
13493425bc38SStefano Zampini       }
13503425bc38SStefano Zampini     }
13513425bc38SStefano Zampini     /* printf("Partial sum for global dofs %d should be %d\n",partial_sum,fetidpmat_ctx->n_lambda); */
13523425bc38SStefano Zampini   }
13533425bc38SStefano Zampini   ierr = MPI_Bcast(global_dofs_numbering,fetidpmat_ctx->n_lambda,MPIU_INT,0,comm);CHKERRQ(ierr);
13543425bc38SStefano Zampini 
13553425bc38SStefano Zampini   /* init data for scaling factors exchange */
13563425bc38SStefano Zampini   partial_sum = 0;
13573425bc38SStefano Zampini   j = 0;
13583425bc38SStefano Zampini   ierr = PetscMalloc( pcis->n_neigh*sizeof(PetscInt),&ptrs_buffer);CHKERRQ(ierr);
13593425bc38SStefano Zampini   ierr = PetscMalloc( (pcis->n_neigh-1)*sizeof(MPI_Request),&send_reqs);CHKERRQ(ierr);
13603425bc38SStefano Zampini   ierr = PetscMalloc( (pcis->n_neigh-1)*sizeof(MPI_Request),&recv_reqs);CHKERRQ(ierr);
13613425bc38SStefano Zampini   ierr = PetscMalloc( pcis->n*sizeof(PetscScalar*),&all_factors);CHKERRQ(ierr);
13623425bc38SStefano Zampini   ptrs_buffer[0]=0;
13633425bc38SStefano Zampini   for(i=1;i<pcis->n_neigh;i++) {
13643425bc38SStefano Zampini     partial_sum += pcis->n_shared[i];
13653425bc38SStefano Zampini     ptrs_buffer[i] = ptrs_buffer[i-1]+pcis->n_shared[i];
13663425bc38SStefano Zampini   }
13673425bc38SStefano Zampini   ierr = PetscMalloc( partial_sum*sizeof(PetscScalar),&send_buffer);CHKERRQ(ierr);
13683425bc38SStefano Zampini   ierr = PetscMalloc( partial_sum*sizeof(PetscScalar),&recv_buffer);CHKERRQ(ierr);
13693425bc38SStefano Zampini   ierr = PetscMalloc( partial_sum*sizeof(PetscScalar),&all_factors[0]);CHKERRQ(ierr);
13703425bc38SStefano Zampini   for(i=0;i<pcis->n-1;i++) {
13713425bc38SStefano Zampini     j = mat_graph->count[i];
13723425bc38SStefano Zampini     if(j>0) {
13733425bc38SStefano Zampini       k = (mat_graph->neighbours_set[i][0] == -1 ?  1 : 0);
13743425bc38SStefano Zampini       j = j - k;
13753425bc38SStefano Zampini     }
13763425bc38SStefano Zampini     all_factors[i+1]=all_factors[i]+j;
13773425bc38SStefano Zampini   }
13783425bc38SStefano Zampini   /* scatter B scaling to N vec */
13793425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->N_to_B,pcis->D,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
13803425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->N_to_B,pcis->D,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
13813425bc38SStefano Zampini   /* communications */
13823425bc38SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
13833425bc38SStefano Zampini   for(i=1;i<pcis->n_neigh;i++) {
13843425bc38SStefano Zampini     for(j=0;j<pcis->n_shared[i];j++) {
13853425bc38SStefano Zampini       send_buffer[ptrs_buffer[i-1]+j]=array[pcis->shared[i][j]];
13863425bc38SStefano Zampini     }
13873425bc38SStefano Zampini     j = ptrs_buffer[i]-ptrs_buffer[i-1];
1388ea7e1babSStefano Zampini     ierr = MPI_Isend(&send_buffer[ptrs_buffer[i-1]],j,MPIU_SCALAR,pcis->neigh[i],0,comm,&send_reqs[i-1]);CHKERRQ(ierr);
1389ea7e1babSStefano Zampini     ierr = MPI_Irecv(&recv_buffer[ptrs_buffer[i-1]],j,MPIU_SCALAR,pcis->neigh[i],0,comm,&recv_reqs[i-1]);CHKERRQ(ierr);
13903425bc38SStefano Zampini   }
13913425bc38SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1392ea7e1babSStefano Zampini   ierr = MPI_Waitall((pcis->n_neigh-1),recv_reqs,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
13933425bc38SStefano Zampini   /* put values in correct places */
13943425bc38SStefano Zampini   for(i=1;i<pcis->n_neigh;i++) {
13953425bc38SStefano Zampini     for(j=0;j<pcis->n_shared[i];j++) {
13963425bc38SStefano Zampini       k = pcis->shared[i][j];
13973425bc38SStefano Zampini       neigh_position = 0;
13983425bc38SStefano Zampini       while(mat_graph->neighbours_set[k][neigh_position] != pcis->neigh[i]) {neigh_position++;}
13993425bc38SStefano Zampini       s = (mat_graph->neighbours_set[k][0] == -1 ?  1 : 0);
14003425bc38SStefano Zampini       neigh_position = neigh_position - s;
14013425bc38SStefano Zampini       all_factors[k][neigh_position]=recv_buffer[ptrs_buffer[i-1]+j];
14023425bc38SStefano Zampini     }
14033425bc38SStefano Zampini   }
1404ea7e1babSStefano Zampini   ierr = MPI_Waitall((pcis->n_neigh-1),send_reqs,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
14053425bc38SStefano Zampini   ierr = PetscFree(send_reqs);CHKERRQ(ierr);
14063425bc38SStefano Zampini   ierr = PetscFree(recv_reqs);CHKERRQ(ierr);
14073425bc38SStefano Zampini   ierr = PetscFree(send_buffer);CHKERRQ(ierr);
14083425bc38SStefano Zampini   ierr = PetscFree(recv_buffer);CHKERRQ(ierr);
14093425bc38SStefano Zampini   ierr = PetscFree(ptrs_buffer);CHKERRQ(ierr);
14103425bc38SStefano Zampini 
14113425bc38SStefano Zampini   /* Compute B and B_delta (local actions) */
14123425bc38SStefano Zampini   ierr = PetscMalloc(pcis->n_neigh*sizeof(*aux_sums),&aux_sums);CHKERRQ(ierr);
14133425bc38SStefano Zampini   ierr = PetscMalloc(n_local_lambda*sizeof(*l2g_indices),&l2g_indices);CHKERRQ(ierr);
14143425bc38SStefano Zampini   ierr = PetscMalloc(n_local_lambda*sizeof(*vals_B_delta),&vals_B_delta);CHKERRQ(ierr);
14153425bc38SStefano Zampini   ierr = PetscMalloc(n_local_lambda*sizeof(*cols_B_delta),&cols_B_delta);CHKERRQ(ierr);
14163425bc38SStefano Zampini   ierr = PetscMalloc(n_local_lambda*sizeof(*scaling_factors),&scaling_factors);CHKERRQ(ierr);
14173425bc38SStefano Zampini   n_global_lambda=0;
14183425bc38SStefano Zampini   partial_sum=0;
14193425bc38SStefano Zampini   for(i=0;i<dual_size;i++) {
14203425bc38SStefano Zampini     while( global_dofs_numbering[n_global_lambda] != aux_global_numbering_mpi[i] ) { n_global_lambda++; }
14213425bc38SStefano Zampini     j = mat_graph->count[aux_local_numbering_1[i]];
14223425bc38SStefano Zampini     k = (mat_graph->neighbours_set[aux_local_numbering_1[i]][0] == -1 ?  1 : 0);
14233425bc38SStefano Zampini     j = j - k;
14243425bc38SStefano Zampini     aux_sums[0]=0;
14253425bc38SStefano Zampini     for(s=1;s<j;s++) {
14263425bc38SStefano Zampini       aux_sums[s]=aux_sums[s-1]+j-s+1;
14273425bc38SStefano Zampini     }
14283425bc38SStefano Zampini     array = all_factors[aux_local_numbering_1[i]];
14293425bc38SStefano Zampini     n_neg_values = 0;
14303425bc38SStefano Zampini     while(n_neg_values < j && mat_graph->neighbours_set[aux_local_numbering_1[i]][n_neg_values+k] < rank) {n_neg_values++;}
14313425bc38SStefano Zampini     n_pos_values = j - n_neg_values;
14323425bc38SStefano Zampini     if(fully_redundant) {
14333425bc38SStefano Zampini       for(s=0;s<n_neg_values;s++) {
14343425bc38SStefano Zampini         l2g_indices    [partial_sum+s]=aux_sums[s]+n_neg_values-s-1+n_global_lambda;
14353425bc38SStefano Zampini         cols_B_delta   [partial_sum+s]=dual_dofs_boundary_indices[i];
14363425bc38SStefano Zampini         vals_B_delta   [partial_sum+s]=-1.0;
14373425bc38SStefano Zampini         scaling_factors[partial_sum+s]=array[s];
14383425bc38SStefano Zampini       }
14393425bc38SStefano Zampini       for(s=0;s<n_pos_values;s++) {
14403425bc38SStefano Zampini         l2g_indices    [partial_sum+s+n_neg_values]=aux_sums[n_neg_values]+s+n_global_lambda;
14413425bc38SStefano Zampini         cols_B_delta   [partial_sum+s+n_neg_values]=dual_dofs_boundary_indices[i];
14423425bc38SStefano Zampini         vals_B_delta   [partial_sum+s+n_neg_values]=1.0;
14433425bc38SStefano Zampini         scaling_factors[partial_sum+s+n_neg_values]=array[s+n_neg_values];
14443425bc38SStefano Zampini       }
14453425bc38SStefano Zampini       partial_sum += j;
14463425bc38SStefano Zampini     } else {
14473425bc38SStefano Zampini       /* l2g_indices and default cols and vals of B_delta */
14483425bc38SStefano Zampini       for(s=0;s<j;s++) {
14493425bc38SStefano Zampini         l2g_indices    [partial_sum+s]=n_global_lambda+s;
14503425bc38SStefano Zampini         cols_B_delta   [partial_sum+s]=dual_dofs_boundary_indices[i];
14513425bc38SStefano Zampini         vals_B_delta   [partial_sum+s]=0.0;
14523425bc38SStefano Zampini       }
14533425bc38SStefano Zampini       /* B_delta */
14543425bc38SStefano Zampini       if( n_neg_values > 0 ) { /* there's a rank next to me to the left */
14553425bc38SStefano Zampini         vals_B_delta   [partial_sum+n_neg_values-1]=-1.0;
14563425bc38SStefano Zampini       }
14573425bc38SStefano Zampini       if ( n_neg_values < j ) { /* there's a rank next to me to the right */
14583425bc38SStefano Zampini         vals_B_delta   [partial_sum+n_neg_values]=1.0;
14593425bc38SStefano Zampini       }
14603425bc38SStefano Zampini       /* scaling as in Klawonn-Widlund 1999*/
14613425bc38SStefano Zampini       for(s=0;s<n_neg_values;s++) {
14623425bc38SStefano Zampini         scalar_value = 0.0;
14633425bc38SStefano Zampini         for(k=0;k<s+1;k++) {
14643425bc38SStefano Zampini           scalar_value += array[k];
14653425bc38SStefano Zampini         }
14663425bc38SStefano Zampini         scalar_value = -scalar_value;
14673425bc38SStefano Zampini         scaling_factors[partial_sum+s] = scalar_value;
14683425bc38SStefano Zampini       }
14693425bc38SStefano Zampini       for(s=0;s<n_pos_values;s++) {
14703425bc38SStefano Zampini         scalar_value = 0.0;
14713425bc38SStefano Zampini         for(k=s+n_neg_values;k<j;k++) {
14723425bc38SStefano Zampini           scalar_value += array[k];
14733425bc38SStefano Zampini         }
14743425bc38SStefano Zampini         scaling_factors[partial_sum+s+n_neg_values] = scalar_value;
14753425bc38SStefano Zampini       }
14763425bc38SStefano Zampini       partial_sum += j;
14773425bc38SStefano Zampini     }
14783425bc38SStefano Zampini   }
14793425bc38SStefano Zampini   ierr = PetscFree(all_factors[0]);CHKERRQ(ierr);
14803425bc38SStefano Zampini   ierr = PetscFree(all_factors);CHKERRQ(ierr);
14813425bc38SStefano Zampini   /* printf("I found %d local lambda dofs when numbering them (should be %d)\n",partial_sum,n_local_lambda); */
14823425bc38SStefano Zampini   ierr = ISCreateGeneral(comm,n_local_lambda,l2g_indices,PETSC_OWN_POINTER,&IS_l2g_lambda);CHKERRQ(ierr);
14833425bc38SStefano Zampini   ierr = VecScatterCreate(fetidpmat_ctx->lambda_local,(IS)0,lambda_global,IS_l2g_lambda,&fetidpmat_ctx->l2g_lambda);CHKERRQ(ierr);
14843425bc38SStefano Zampini 
14853425bc38SStefano Zampini   /* Create local part of B_delta */
14863425bc38SStefano Zampini   ierr = MatCreate(PETSC_COMM_SELF,&fetidpmat_ctx->B_delta);
14873425bc38SStefano Zampini   ierr = MatSetSizes(fetidpmat_ctx->B_delta,n_local_lambda,pcis->n_B,n_local_lambda,pcis->n_B);CHKERRQ(ierr);
14883425bc38SStefano Zampini   ierr = MatSetType(fetidpmat_ctx->B_delta,MATSEQAIJ);CHKERRQ(ierr);
14893425bc38SStefano Zampini   ierr = MatSeqAIJSetPreallocation(fetidpmat_ctx->B_delta,1,PETSC_NULL);CHKERRQ(ierr);
14903425bc38SStefano Zampini   ierr = MatSetOption(fetidpmat_ctx->B_delta,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr);
14913425bc38SStefano Zampini   for(i=0;i<n_local_lambda;i++) {
14923425bc38SStefano Zampini     ierr = MatSetValue(fetidpmat_ctx->B_delta,i,cols_B_delta[i],vals_B_delta[i],INSERT_VALUES);CHKERRQ(ierr);
14933425bc38SStefano Zampini   }
14943425bc38SStefano Zampini   ierr = MatAssemblyBegin(fetidpmat_ctx->B_delta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
14953425bc38SStefano Zampini   ierr = MatAssemblyEnd  (fetidpmat_ctx->B_delta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
14963425bc38SStefano Zampini 
14973425bc38SStefano Zampini   if(fully_redundant) {
14983425bc38SStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&ScalingMat);
14993425bc38SStefano Zampini     ierr = MatSetSizes(ScalingMat,n_local_lambda,n_local_lambda,n_local_lambda,n_local_lambda);CHKERRQ(ierr);
15003425bc38SStefano Zampini     ierr = MatSetType(ScalingMat,MATSEQAIJ);CHKERRQ(ierr);
15013425bc38SStefano Zampini     ierr = MatSeqAIJSetPreallocation(ScalingMat,1,PETSC_NULL);CHKERRQ(ierr);
15023425bc38SStefano Zampini     for(i=0;i<n_local_lambda;i++) {
15033425bc38SStefano Zampini       ierr = MatSetValue(ScalingMat,i,i,scaling_factors[i],INSERT_VALUES);CHKERRQ(ierr);
15043425bc38SStefano Zampini     }
15053425bc38SStefano Zampini     ierr = MatAssemblyBegin(ScalingMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
15063425bc38SStefano Zampini     ierr = MatAssemblyEnd  (ScalingMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
15073425bc38SStefano Zampini     ierr = MatMatMult(ScalingMat,fetidpmat_ctx->B_delta,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&fetidpmat_ctx->B_Ddelta);CHKERRQ(ierr);
15083425bc38SStefano Zampini     ierr = MatDestroy(&ScalingMat);CHKERRQ(ierr);
15093425bc38SStefano Zampini   } else {
15103425bc38SStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&fetidpmat_ctx->B_Ddelta);
15113425bc38SStefano Zampini     ierr = MatSetSizes(fetidpmat_ctx->B_Ddelta,n_local_lambda,pcis->n_B,n_local_lambda,pcis->n_B);CHKERRQ(ierr);
15123425bc38SStefano Zampini     ierr = MatSetType(fetidpmat_ctx->B_Ddelta,MATSEQAIJ);CHKERRQ(ierr);
15133425bc38SStefano Zampini     ierr = MatSeqAIJSetPreallocation(fetidpmat_ctx->B_Ddelta,1,PETSC_NULL);CHKERRQ(ierr);
15143425bc38SStefano Zampini     for(i=0;i<n_local_lambda;i++) {
15153425bc38SStefano Zampini       ierr = MatSetValue(fetidpmat_ctx->B_Ddelta,i,cols_B_delta[i],scaling_factors[i],INSERT_VALUES);CHKERRQ(ierr);
15163425bc38SStefano Zampini     }
15173425bc38SStefano Zampini     ierr = MatAssemblyBegin(fetidpmat_ctx->B_Ddelta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
15183425bc38SStefano Zampini     ierr = MatAssemblyEnd  (fetidpmat_ctx->B_Ddelta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
15193425bc38SStefano Zampini   }
15203425bc38SStefano Zampini 
15213425bc38SStefano Zampini   /* Create some vectors needed by fetidp */
15223425bc38SStefano Zampini   ierr = VecDuplicate(pcis->vec1_B,&fetidpmat_ctx->temp_solution_B);CHKERRQ(ierr);
15233425bc38SStefano Zampini   ierr = VecDuplicate(pcis->vec1_D,&fetidpmat_ctx->temp_solution_D);CHKERRQ(ierr);
15243425bc38SStefano Zampini 
15253425bc38SStefano Zampini   test_fetidp = PETSC_FALSE;
15263425bc38SStefano Zampini   ierr = PetscOptionsGetBool(PETSC_NULL,"-fetidp_check",&test_fetidp,PETSC_NULL);CHKERRQ(ierr);
15273425bc38SStefano Zampini 
15283425bc38SStefano Zampini   if(test_fetidp) {
15293425bc38SStefano Zampini 
15303425bc38SStefano Zampini     ierr = PetscViewerASCIIGetStdout(((PetscObject)(fetidpmat_ctx->pc))->comm,&viewer);CHKERRQ(ierr);
15313425bc38SStefano Zampini     ierr = PetscViewerASCIISynchronizedAllow(viewer,PETSC_TRUE);CHKERRQ(ierr);
15323425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"----------FETI_DP TESTS--------------\n");CHKERRQ(ierr);
15333425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"All tests should return zero!\n");CHKERRQ(ierr);
15343425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"FETIDP MAT context in the ");CHKERRQ(ierr);
15353425bc38SStefano Zampini     if(fully_redundant) {
15363425bc38SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"fully redundant case for lagrange multipliers.\n");CHKERRQ(ierr);
15373425bc38SStefano Zampini     } else {
15383425bc38SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Non-fully redundant case for lagrange multiplier.\n");CHKERRQ(ierr);
15393425bc38SStefano Zampini     }
15403425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
15413425bc38SStefano Zampini 
15423425bc38SStefano Zampini     /******************************************************************/
15433425bc38SStefano Zampini     /* TEST A/B: Test numbering of global lambda dofs             */
15443425bc38SStefano Zampini     /******************************************************************/
15453425bc38SStefano Zampini 
15463425bc38SStefano Zampini     ierr = VecDuplicate(fetidpmat_ctx->lambda_local,&test_vec);CHKERRQ(ierr);
15473425bc38SStefano Zampini     ierr = VecSet(lambda_global,1.0);CHKERRQ(ierr);
15483425bc38SStefano Zampini     ierr = VecSet(test_vec,1.0);CHKERRQ(ierr);
15493425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
15503425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
15513425bc38SStefano Zampini     scalar_value = -1.0;
15523425bc38SStefano Zampini     ierr = VecAXPY(test_vec,scalar_value,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
15533425bc38SStefano Zampini     ierr = VecNorm(test_vec,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
15543425bc38SStefano Zampini     ierr = VecDestroy(&test_vec);CHKERRQ(ierr);
15553425bc38SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"A[%04d]: CHECK glob to loc: % 1.14e\n",rank,scalar_value);CHKERRQ(ierr);
15563425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
15573425bc38SStefano Zampini     if(fully_redundant) {
15583425bc38SStefano Zampini       ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr);
15593425bc38SStefano Zampini       ierr = VecSet(fetidpmat_ctx->lambda_local,0.5);CHKERRQ(ierr);
15603425bc38SStefano Zampini       ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
15613425bc38SStefano Zampini       ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
15623425bc38SStefano Zampini       ierr = VecSum(lambda_global,&scalar_value);CHKERRQ(ierr);
15633425bc38SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"B[%04d]: CHECK loc to glob: % 1.14e\n",rank,scalar_value-fetidpmat_ctx->n_lambda);CHKERRQ(ierr);
15643425bc38SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
15653425bc38SStefano Zampini     }
15663425bc38SStefano Zampini 
15673425bc38SStefano Zampini     /******************************************************************/
15683425bc38SStefano Zampini     /* TEST C: It should hold B_delta*w=0, w\in\widehat{W}            */
15693425bc38SStefano Zampini     /* This is the meaning of the B matrix                            */
15703425bc38SStefano Zampini     /******************************************************************/
15713425bc38SStefano Zampini 
15723425bc38SStefano Zampini     ierr = VecSetRandom(pcis->vec1_N,PETSC_NULL);CHKERRQ(ierr);
15733425bc38SStefano Zampini     ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
15743425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
15753425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
15763425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
15773425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
15783425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
15793425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
15803425bc38SStefano Zampini     /* Action of B_delta */
15813425bc38SStefano Zampini     ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
15823425bc38SStefano Zampini     ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr);
15833425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
15843425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
15853425bc38SStefano Zampini     ierr = VecNorm(lambda_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
15863425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"C[coll]: CHECK infty norm of B_delta*w (w continuous): % 1.14e\n",scalar_value);CHKERRQ(ierr);
15873425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
15883425bc38SStefano Zampini 
15893425bc38SStefano Zampini     /******************************************************************/
15903425bc38SStefano Zampini     /* TEST D: It should hold E_Dw = w - P_Dw, w\in\widetilde{W}     */
15913425bc38SStefano Zampini     /* E_D = R_D^TR                                                   */
15923425bc38SStefano Zampini     /* P_D = B_{D,delta}^T B_{delta}                                  */
15933425bc38SStefano Zampini     /* eq.44 Mandel Tezaur and Dohrmann 2005                          */
15943425bc38SStefano Zampini     /******************************************************************/
15953425bc38SStefano Zampini 
15963425bc38SStefano Zampini     /* compute a random vector in \widetilde{W} */
15973425bc38SStefano Zampini     ierr = VecSetRandom(pcis->vec1_N,PETSC_NULL);CHKERRQ(ierr);
15983425bc38SStefano Zampini     scalar_value = 0.0;  /* set zero at vertices */
15993425bc38SStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
16003425bc38SStefano Zampini     for(i=0;i<n_vertices;i++) { array[vertex_indices[i]]=scalar_value; }
16013425bc38SStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
16023425bc38SStefano Zampini     /* store w for final comparison */
16033425bc38SStefano Zampini     ierr = VecDuplicate(pcis->vec1_B,&test_vec);CHKERRQ(ierr);
16043425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,test_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
16053425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,test_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
16063425bc38SStefano Zampini 
16073425bc38SStefano Zampini     /* Jump operator P_D : results stored in pcis->vec1_B */
16083425bc38SStefano Zampini 
16093425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
16103425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
16113425bc38SStefano Zampini     /* Action of B_delta */
16123425bc38SStefano Zampini     ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
16133425bc38SStefano Zampini     ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr);
16143425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
16153425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
16163425bc38SStefano Zampini     /* Action of B_Ddelta^T */
16173425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
16183425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
16193425bc38SStefano Zampini     ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
16203425bc38SStefano Zampini 
16213425bc38SStefano Zampini     /* Average operator E_D : results stored in pcis->vec2_B */
16223425bc38SStefano Zampini 
16233425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
16243425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
16253425bc38SStefano Zampini     ierr = VecPointwiseMult(pcis->vec2_B,pcis->D,pcis->vec2_B);CHKERRQ(ierr);
16263425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec2_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
16273425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec2_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
16283425bc38SStefano Zampini     ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
16293425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
16303425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
16313425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
16323425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
16333425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
16343425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
16353425bc38SStefano Zampini 
16363425bc38SStefano Zampini     /* test E_D=I-P_D */
16373425bc38SStefano Zampini     scalar_value = 1.0;
16383425bc38SStefano Zampini     ierr = VecAXPY(pcis->vec1_B,scalar_value,pcis->vec2_B);CHKERRQ(ierr);
16393425bc38SStefano Zampini     scalar_value = -1.0;
16403425bc38SStefano Zampini     ierr = VecAXPY(pcis->vec1_B,scalar_value,test_vec);CHKERRQ(ierr);
16413425bc38SStefano Zampini     ierr = VecNorm(pcis->vec1_B,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
16423425bc38SStefano Zampini     ierr = VecDestroy(&test_vec);CHKERRQ(ierr);
16433425bc38SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"D[%04d] CHECK infty norm of E_D + P_D - I: % 1.14e\n",rank,scalar_value);CHKERRQ(ierr);
16443425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
16453425bc38SStefano Zampini 
16463425bc38SStefano Zampini     /******************************************************************/
16473425bc38SStefano Zampini     /* TEST E: It should hold R_D^TP_Dw=0, w\in\widetilde{W}          */
16483425bc38SStefano Zampini     /* eq.48 Mandel Tezaur and Dohrmann 2005                          */
16493425bc38SStefano Zampini     /******************************************************************/
16503425bc38SStefano Zampini 
16513425bc38SStefano Zampini     ierr = VecSetRandom(pcis->vec1_N,PETSC_NULL);CHKERRQ(ierr);
16523425bc38SStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
16533425bc38SStefano Zampini     scalar_value = 0.0;  /* set zero at vertices */
16543425bc38SStefano Zampini     for(i=0;i<n_vertices;i++) { array[vertex_indices[i]]=scalar_value; }
16553425bc38SStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
16563425bc38SStefano Zampini 
16573425bc38SStefano Zampini     /* Jump operator P_D : results stored in pcis->vec1_B */
16583425bc38SStefano Zampini 
16593425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
16603425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
16613425bc38SStefano Zampini     /* Action of B_delta */
16623425bc38SStefano Zampini     ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
16633425bc38SStefano Zampini     ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr);
16643425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
16653425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
16663425bc38SStefano Zampini     /* Action of B_Ddelta^T */
16673425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
16683425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
16693425bc38SStefano Zampini     ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
16703425bc38SStefano Zampini     /* diagonal scaling */
16713425bc38SStefano Zampini     ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr);
16723425bc38SStefano Zampini     /* sum on the interface */
16733425bc38SStefano Zampini     ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
16743425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
16753425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
16763425bc38SStefano Zampini     ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
16773425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
16783425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
16793425bc38SStefano Zampini     ierr = VecNorm(pcis->vec1_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
16803425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"E[coll]: CHECK infty norm of R^T_D P_D: % 1.14e\n",scalar_value);CHKERRQ(ierr);
16813425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
16823425bc38SStefano Zampini 
16833425bc38SStefano Zampini     if(!fully_redundant) {
16843425bc38SStefano Zampini       /******************************************************************/
16853425bc38SStefano Zampini       /* TEST F: It should hold B_{delta}B^T_{D,delta}=I                */
16863425bc38SStefano Zampini       /* Corollary thm 14 Mandel Tezaur and Dohrmann 2005               */
16873425bc38SStefano Zampini       /******************************************************************/
16883425bc38SStefano Zampini       ierr = VecDuplicate(lambda_global,&test_vec);CHKERRQ(ierr);
16893425bc38SStefano Zampini       ierr = VecSetRandom(lambda_global,PETSC_NULL);CHKERRQ(ierr);
16903425bc38SStefano Zampini       /* Action of B_Ddelta^T */
16913425bc38SStefano Zampini       ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
16923425bc38SStefano Zampini       ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
16933425bc38SStefano Zampini       ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
16943425bc38SStefano Zampini       /* Action of B_delta */
16953425bc38SStefano Zampini       ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
16963425bc38SStefano Zampini       ierr = VecSet(test_vec,0.0);CHKERRQ(ierr);
16973425bc38SStefano Zampini       ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,test_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
16983425bc38SStefano Zampini       ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,test_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
16993425bc38SStefano Zampini       scalar_value = -1.0;
17003425bc38SStefano Zampini       ierr = VecAXPY(lambda_global,scalar_value,test_vec);CHKERRQ(ierr);
17013425bc38SStefano Zampini       ierr = VecNorm(lambda_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
17023425bc38SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"E[coll]: CHECK infty norm of P^T_D - I: % 1.14e\n",scalar_value);CHKERRQ(ierr);
17033425bc38SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
17043425bc38SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
17053425bc38SStefano Zampini       ierr = VecDestroy(&test_vec);CHKERRQ(ierr);
17063425bc38SStefano Zampini     }
17073425bc38SStefano Zampini   }
17083425bc38SStefano Zampini   /* final cleanup */
17093425bc38SStefano Zampini   ierr = PetscFree(dual_dofs_boundary_indices);CHKERRQ(ierr);
17103425bc38SStefano Zampini   ierr = PetscFree(vertex_indices);CHKERRQ(ierr);
17113425bc38SStefano Zampini   ierr = PetscFree(aux_local_numbering_1);CHKERRQ(ierr);
17123425bc38SStefano Zampini   ierr = PetscFree(aux_local_numbering_2);CHKERRQ(ierr);
17133425bc38SStefano Zampini   ierr = PetscFree(aux_global_numbering);CHKERRQ(ierr);
17143425bc38SStefano Zampini   ierr = PetscFree(aux_global_numbering_mpi);CHKERRQ(ierr);
17153425bc38SStefano Zampini   ierr = PetscFree(dof_sizes);CHKERRQ(ierr);
17163425bc38SStefano Zampini   ierr = PetscFree(dof_displs);CHKERRQ(ierr);
17173425bc38SStefano Zampini   ierr = PetscFree(all_aux_global_numbering_mpi_1);CHKERRQ(ierr);
17183425bc38SStefano Zampini   ierr = PetscFree(all_aux_global_numbering_mpi_2);CHKERRQ(ierr);
17193425bc38SStefano Zampini   ierr = PetscFree(global_dofs_numbering);CHKERRQ(ierr);
17203425bc38SStefano Zampini   ierr = PetscFree(aux_sums);CHKERRQ(ierr);
17213425bc38SStefano Zampini   ierr = PetscFree(cols_B_delta);CHKERRQ(ierr);
17223425bc38SStefano Zampini   ierr = PetscFree(vals_B_delta);CHKERRQ(ierr);
17233425bc38SStefano Zampini   ierr = PetscFree(scaling_factors);CHKERRQ(ierr);
17243425bc38SStefano Zampini   ierr = VecDestroy(&lambda_global);CHKERRQ(ierr);
17253425bc38SStefano Zampini   ierr = ISDestroy(&IS_l2g_lambda);CHKERRQ(ierr);
17263425bc38SStefano Zampini 
17273425bc38SStefano Zampini   PetscFunctionReturn(0);
17283425bc38SStefano Zampini }
17293425bc38SStefano Zampini 
17303425bc38SStefano Zampini #undef __FUNCT__
17313425bc38SStefano Zampini #define __FUNCT__ "PCBDDCSetupFETIDPPCContext"
17323425bc38SStefano Zampini static PetscErrorCode PCBDDCSetupFETIDPPCContext(Mat fetimat, FETIDPPC_ctx *fetidppc_ctx)
17333425bc38SStefano Zampini {
17343425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
17353425bc38SStefano Zampini   PetscErrorCode ierr;
17363425bc38SStefano Zampini 
17373425bc38SStefano Zampini   PetscFunctionBegin;
17383425bc38SStefano Zampini   ierr = MatShellGetContext(fetimat,&mat_ctx);CHKERRQ(ierr);
17393425bc38SStefano Zampini   /* get references from objects created when setting up feti mat context */
17403425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)mat_ctx->lambda_local);CHKERRQ(ierr);
17413425bc38SStefano Zampini   fetidppc_ctx->lambda_local = mat_ctx->lambda_local;
17423425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)mat_ctx->B_Ddelta);CHKERRQ(ierr);
17433425bc38SStefano Zampini   fetidppc_ctx->B_Ddelta = mat_ctx->B_Ddelta;
17443425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)mat_ctx->l2g_lambda);CHKERRQ(ierr);
17453425bc38SStefano Zampini   fetidppc_ctx->l2g_lambda = mat_ctx->l2g_lambda;
17463425bc38SStefano Zampini   PetscFunctionReturn(0);
17473425bc38SStefano Zampini }
17483425bc38SStefano Zampini 
17493425bc38SStefano Zampini #undef __FUNCT__
17503425bc38SStefano Zampini #define __FUNCT__ "FETIDPMatMult"
17513425bc38SStefano Zampini static PetscErrorCode FETIDPMatMult(Mat fetimat, Vec x, Vec y)
17523425bc38SStefano Zampini {
17533425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
17543425bc38SStefano Zampini   PC_IS          *pcis;
17553425bc38SStefano Zampini   PetscErrorCode ierr;
17563425bc38SStefano Zampini 
17573425bc38SStefano Zampini   PetscFunctionBegin;
17583425bc38SStefano Zampini   ierr = MatShellGetContext(fetimat,&mat_ctx);CHKERRQ(ierr);
17593425bc38SStefano Zampini   pcis = (PC_IS*)mat_ctx->pc->data;
17603425bc38SStefano Zampini   /* Application of B_delta^T */
17613425bc38SStefano Zampini   ierr = VecScatterBegin(mat_ctx->l2g_lambda,x,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
17623425bc38SStefano Zampini   ierr = VecScatterEnd(mat_ctx->l2g_lambda,x,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
17633425bc38SStefano Zampini   ierr = MatMultTranspose(mat_ctx->B_delta,mat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
17643425bc38SStefano Zampini   /* Application of \widetilde{S}^-1 */
17653425bc38SStefano Zampini   ierr = VecSet(pcis->vec1_D,0.0);CHKERRQ(ierr);
17663425bc38SStefano Zampini   ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr);
17673425bc38SStefano Zampini   /* Application of B_delta */
17683425bc38SStefano Zampini   ierr = MatMult(mat_ctx->B_delta,pcis->vec1_B,mat_ctx->lambda_local);CHKERRQ(ierr);
17693425bc38SStefano Zampini   ierr = VecSet(y,0.0);CHKERRQ(ierr);
17703425bc38SStefano Zampini   ierr = VecScatterBegin(mat_ctx->l2g_lambda,mat_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
17713425bc38SStefano Zampini   ierr = VecScatterEnd(mat_ctx->l2g_lambda,mat_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
17723425bc38SStefano Zampini   PetscFunctionReturn(0);
17733425bc38SStefano Zampini }
17743425bc38SStefano Zampini 
17753425bc38SStefano Zampini #undef __FUNCT__
17763425bc38SStefano Zampini #define __FUNCT__ "FETIDPPCApply"
17773425bc38SStefano Zampini static PetscErrorCode FETIDPPCApply(PC fetipc, Vec x, Vec y)
17783425bc38SStefano Zampini {
17793425bc38SStefano Zampini   FETIDPPC_ctx   *pc_ctx;
17803425bc38SStefano Zampini   PC_IS          *pcis;
17813425bc38SStefano Zampini   PetscErrorCode ierr;
17823425bc38SStefano Zampini 
17833425bc38SStefano Zampini   PetscFunctionBegin;
17843425bc38SStefano Zampini   ierr = PCShellGetContext(fetipc,(void**)&pc_ctx);
17853425bc38SStefano Zampini   pcis = (PC_IS*)pc_ctx->pc->data;
17863425bc38SStefano Zampini   /* Application of B_Ddelta^T */
17873425bc38SStefano Zampini   ierr = VecScatterBegin(pc_ctx->l2g_lambda,x,pc_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
17883425bc38SStefano Zampini   ierr = VecScatterEnd(pc_ctx->l2g_lambda,x,pc_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
17893425bc38SStefano Zampini   ierr = VecSet(pcis->vec2_B,0.0);CHKERRQ(ierr);
17903425bc38SStefano Zampini   ierr = MatMultTranspose(pc_ctx->B_Ddelta,pc_ctx->lambda_local,pcis->vec2_B);CHKERRQ(ierr);
17913425bc38SStefano Zampini   /* Application of S */
17923425bc38SStefano Zampini   ierr = PCISApplySchur(pc_ctx->pc,pcis->vec2_B,pcis->vec1_B,(Vec)0,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
17933425bc38SStefano Zampini   /* Application of B_Ddelta */
17943425bc38SStefano Zampini   ierr = MatMult(pc_ctx->B_Ddelta,pcis->vec1_B,pc_ctx->lambda_local);CHKERRQ(ierr);
17953425bc38SStefano Zampini   ierr = VecSet(y,0.0);CHKERRQ(ierr);
17963425bc38SStefano Zampini   ierr = VecScatterBegin(pc_ctx->l2g_lambda,pc_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
17973425bc38SStefano Zampini   ierr = VecScatterEnd(pc_ctx->l2g_lambda,pc_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
17983425bc38SStefano Zampini   PetscFunctionReturn(0);
17993425bc38SStefano Zampini }
18003425bc38SStefano Zampini 
1801da1bb401SStefano Zampini #undef __FUNCT__
1802da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetupLocalAdjacencyGraph"
1803da1bb401SStefano Zampini static PetscErrorCode PCBDDCSetupLocalAdjacencyGraph(PC pc)
1804da1bb401SStefano Zampini {
1805da1bb401SStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
1806da1bb401SStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
1807da1bb401SStefano Zampini   PetscInt       nvtxs,*xadj,*adjncy;
1808da1bb401SStefano Zampini   Mat            mat_adj;
1809da1bb401SStefano Zampini   PetscBool      symmetrize_rowij=PETSC_TRUE,compressed_rowij=PETSC_FALSE,flg_row=PETSC_TRUE;
1810da1bb401SStefano Zampini   PCBDDCGraph    mat_graph=pcbddc->mat_graph;
1811da1bb401SStefano Zampini   PetscErrorCode ierr;
1812da1bb401SStefano Zampini 
1813da1bb401SStefano Zampini   PetscFunctionBegin;
1814da1bb401SStefano Zampini   /* get CSR adjacency from local matrix if user has not yet provided local graph using PCBDDCSetLocalAdjacencyGraph function */
1815da1bb401SStefano Zampini   if(!mat_graph->xadj) {
1816da1bb401SStefano Zampini     ierr = MatConvert(matis->A,MATMPIADJ,MAT_INITIAL_MATRIX,&mat_adj);CHKERRQ(ierr);
1817da1bb401SStefano Zampini     ierr = MatGetRowIJ(mat_adj,0,symmetrize_rowij,compressed_rowij,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr);
1818da1bb401SStefano Zampini     if(!flg_row) {
1819da1bb401SStefano Zampini       SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in MatGetRowIJ called in %s\n",__FUNCT__);
1820da1bb401SStefano Zampini     }
1821da1bb401SStefano Zampini     /* Get adjacency into BDDC workspace */
1822da1bb401SStefano Zampini     ierr = PCBDDCSetLocalAdjacencyGraph(pc,nvtxs,xadj,adjncy,PETSC_COPY_VALUES);CHKERRQ(ierr);
1823da1bb401SStefano Zampini     ierr = MatRestoreRowIJ(mat_adj,0,symmetrize_rowij,compressed_rowij,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr);
1824da1bb401SStefano Zampini     if(!flg_row) {
1825da1bb401SStefano Zampini       SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in MatRestoreRowIJ called in %s\n",__FUNCT__);
1826da1bb401SStefano Zampini     }
1827da1bb401SStefano Zampini     ierr = MatDestroy(&mat_adj);CHKERRQ(ierr);
1828da1bb401SStefano Zampini   }
1829da1bb401SStefano Zampini   PetscFunctionReturn(0);
1830da1bb401SStefano Zampini }
1831da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
18320c7d97c5SJed Brown #undef __FUNCT__
18330c7d97c5SJed Brown #define __FUNCT__ "PCBDDCApplyInterfacePreconditioner"
18342617d88aSStefano Zampini static PetscErrorCode  PCBDDCApplyInterfacePreconditioner(PC pc)
18350c7d97c5SJed Brown {
18360c7d97c5SJed Brown   PetscErrorCode ierr;
18370c7d97c5SJed Brown   PC_BDDC*        pcbddc = (PC_BDDC*)(pc->data);
18380c7d97c5SJed Brown   PC_IS*            pcis = (PC_IS*)  (pc->data);
18393b03a366Sstefano_zampini   const PetscScalar zero = 0.0;
18400c7d97c5SJed Brown 
18410c7d97c5SJed Brown   PetscFunctionBegin;
18420c7d97c5SJed Brown   /* Application of PHI^T  */
18430c7d97c5SJed Brown   ierr = MatMultTranspose(pcbddc->coarse_phi_B,pcis->vec1_B,pcbddc->vec1_P);CHKERRQ(ierr);
18440c7d97c5SJed Brown   if(pcbddc->prec_type) { ierr = MatMultTransposeAdd(pcbddc->coarse_phi_D,pcis->vec1_D,pcbddc->vec1_P,pcbddc->vec1_P);CHKERRQ(ierr); }
18450c7d97c5SJed Brown 
18460c7d97c5SJed Brown   /* Scatter data of coarse_rhs */
1847*142dfd88SStefano Zampini   if(pcbddc->coarse_rhs) { ierr = VecSet(pcbddc->coarse_rhs,zero);CHKERRQ(ierr); }
18480c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->vec1_P,pcbddc->coarse_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18490c7d97c5SJed Brown 
18500c7d97c5SJed Brown   /* Local solution on R nodes */
18510c7d97c5SJed Brown   ierr = VecSet(pcbddc->vec1_R,zero);CHKERRQ(ierr);
18520c7d97c5SJed Brown   ierr = VecScatterBegin(pcbddc->R_to_B,pcis->vec1_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18530c7d97c5SJed Brown   ierr = VecScatterEnd  (pcbddc->R_to_B,pcis->vec1_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18540c7d97c5SJed Brown   if(pcbddc->prec_type) {
18550c7d97c5SJed Brown     ierr = VecScatterBegin(pcbddc->R_to_D,pcis->vec1_D,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18560c7d97c5SJed Brown     ierr = VecScatterEnd  (pcbddc->R_to_D,pcis->vec1_D,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18570c7d97c5SJed Brown   }
18580c7d97c5SJed Brown   ierr = PCBDDCSolveSaddlePoint(pc);CHKERRQ(ierr);
18590c7d97c5SJed Brown   ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr);
18600c7d97c5SJed Brown   ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec2_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18610c7d97c5SJed Brown   ierr = VecScatterEnd  (pcbddc->R_to_B,pcbddc->vec2_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18620c7d97c5SJed Brown   if(pcbddc->prec_type) {
18630c7d97c5SJed Brown     ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec2_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18640c7d97c5SJed Brown     ierr = VecScatterEnd  (pcbddc->R_to_D,pcbddc->vec2_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18650c7d97c5SJed Brown   }
18660c7d97c5SJed Brown 
18670c7d97c5SJed Brown   /* Coarse solution */
18680c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataEnd(pc,pcbddc->vec1_P,pcbddc->coarse_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1869*142dfd88SStefano Zampini   if(pcbddc->coarse_rhs) { ierr = KSPSolve(pcbddc->coarse_ksp,pcbddc->coarse_rhs,pcbddc->coarse_vec);CHKERRQ(ierr); }
18700c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18710c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataEnd  (pc,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18720c7d97c5SJed Brown 
18730c7d97c5SJed Brown   /* Sum contributions from two levels */
18740c7d97c5SJed Brown   ierr = MatMultAdd(pcbddc->coarse_phi_B,pcbddc->vec1_P,pcis->vec1_B,pcis->vec1_B);CHKERRQ(ierr);
18750c7d97c5SJed Brown   if(pcbddc->prec_type) { ierr = MatMultAdd(pcbddc->coarse_phi_D,pcbddc->vec1_P,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); }
18760c7d97c5SJed Brown   PetscFunctionReturn(0);
18770c7d97c5SJed Brown }
18780c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
18790c7d97c5SJed Brown #undef __FUNCT__
18800c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSolveSaddlePoint"
188153cdbc3dSStefano Zampini static PetscErrorCode  PCBDDCSolveSaddlePoint(PC pc)
18820c7d97c5SJed Brown {
18830c7d97c5SJed Brown   PetscErrorCode ierr;
18840c7d97c5SJed Brown   PC_BDDC*       pcbddc = (PC_BDDC*)(pc->data);
18850c7d97c5SJed Brown 
18860c7d97c5SJed Brown   PetscFunctionBegin;
188753cdbc3dSStefano Zampini   ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
1888534831adSStefano Zampini   if(pcbddc->local_auxmat1) {
18890c7d97c5SJed Brown     ierr = MatMult(pcbddc->local_auxmat1,pcbddc->vec2_R,pcbddc->vec1_C);CHKERRQ(ierr);
18900c7d97c5SJed Brown     ierr = MatMultAdd(pcbddc->local_auxmat2,pcbddc->vec1_C,pcbddc->vec2_R,pcbddc->vec2_R);CHKERRQ(ierr);
18910c7d97c5SJed Brown   }
18920c7d97c5SJed Brown   PetscFunctionReturn(0);
18930c7d97c5SJed Brown }
18940c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
18950c7d97c5SJed Brown #undef __FUNCT__
18960c7d97c5SJed Brown #define __FUNCT__ "PCBDDCScatterCoarseDataBegin"
189753cdbc3dSStefano Zampini static PetscErrorCode  PCBDDCScatterCoarseDataBegin(PC pc,Vec vec_from, Vec vec_to, InsertMode imode, ScatterMode smode)
18980c7d97c5SJed Brown {
18990c7d97c5SJed Brown   PetscErrorCode ierr;
19000c7d97c5SJed Brown   PC_BDDC*       pcbddc = (PC_BDDC*)(pc->data);
19010c7d97c5SJed Brown 
19020c7d97c5SJed Brown   PetscFunctionBegin;
19030c7d97c5SJed Brown   switch(pcbddc->coarse_communications_type){
19040c7d97c5SJed Brown     case SCATTERS_BDDC:
19050c7d97c5SJed Brown       ierr = VecScatterBegin(pcbddc->coarse_loc_to_glob,vec_from,vec_to,imode,smode);CHKERRQ(ierr);
19060c7d97c5SJed Brown       break;
19070c7d97c5SJed Brown     case GATHERS_BDDC:
19080c7d97c5SJed Brown       break;
19090c7d97c5SJed Brown   }
19100c7d97c5SJed Brown   PetscFunctionReturn(0);
19110c7d97c5SJed Brown }
19120c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
19130c7d97c5SJed Brown #undef __FUNCT__
19140c7d97c5SJed Brown #define __FUNCT__ "PCBDDCScatterCoarseDataEnd"
191553cdbc3dSStefano Zampini static PetscErrorCode  PCBDDCScatterCoarseDataEnd(PC pc,Vec vec_from, Vec vec_to, InsertMode imode, ScatterMode smode)
19160c7d97c5SJed Brown {
19170c7d97c5SJed Brown   PetscErrorCode ierr;
19180c7d97c5SJed Brown   PC_BDDC*       pcbddc = (PC_BDDC*)(pc->data);
19190c7d97c5SJed Brown   PetscScalar*   array_to;
19200c7d97c5SJed Brown   PetscScalar*   array_from;
19210c7d97c5SJed Brown   MPI_Comm       comm=((PetscObject)pc)->comm;
19220c7d97c5SJed Brown   PetscInt i;
19230c7d97c5SJed Brown 
19240c7d97c5SJed Brown   PetscFunctionBegin;
19250c7d97c5SJed Brown 
19260c7d97c5SJed Brown   switch(pcbddc->coarse_communications_type){
19270c7d97c5SJed Brown     case SCATTERS_BDDC:
19280c7d97c5SJed Brown       ierr = VecScatterEnd(pcbddc->coarse_loc_to_glob,vec_from,vec_to,imode,smode);CHKERRQ(ierr);
19290c7d97c5SJed Brown       break;
19300c7d97c5SJed Brown     case GATHERS_BDDC:
19310c7d97c5SJed Brown       if(vec_from) VecGetArray(vec_from,&array_from);
19320c7d97c5SJed Brown       if(vec_to)   VecGetArray(vec_to,&array_to);
19330c7d97c5SJed Brown       switch(pcbddc->coarse_problem_type){
19340c7d97c5SJed Brown         case SEQUENTIAL_BDDC:
19350c7d97c5SJed Brown           if(smode == SCATTER_FORWARD) {
193653cdbc3dSStefano Zampini             ierr = MPI_Gatherv(&array_from[0],pcbddc->local_primal_size,MPIU_SCALAR,&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,0,comm);CHKERRQ(ierr);
19370c7d97c5SJed Brown             if(vec_to) {
19380c7d97c5SJed Brown               for(i=0;i<pcbddc->replicated_primal_size;i++)
19390c7d97c5SJed Brown                 array_to[pcbddc->replicated_local_primal_indices[i]]+=pcbddc->replicated_local_primal_values[i];
19400c7d97c5SJed Brown             }
19410c7d97c5SJed Brown           } else {
19420c7d97c5SJed Brown             if(vec_from)
19430c7d97c5SJed Brown               for(i=0;i<pcbddc->replicated_primal_size;i++)
19440c7d97c5SJed Brown                 pcbddc->replicated_local_primal_values[i]=array_from[pcbddc->replicated_local_primal_indices[i]];
194553cdbc3dSStefano Zampini             ierr = MPI_Scatterv(&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,&array_to[0],pcbddc->local_primal_size,MPIU_SCALAR,0,comm);CHKERRQ(ierr);
19460c7d97c5SJed Brown           }
19470c7d97c5SJed Brown           break;
19480c7d97c5SJed Brown         case REPLICATED_BDDC:
19490c7d97c5SJed Brown           if(smode == SCATTER_FORWARD) {
195053cdbc3dSStefano Zampini             ierr = MPI_Allgatherv(&array_from[0],pcbddc->local_primal_size,MPIU_SCALAR,&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,comm);CHKERRQ(ierr);
19510c7d97c5SJed Brown             for(i=0;i<pcbddc->replicated_primal_size;i++)
19520c7d97c5SJed Brown               array_to[pcbddc->replicated_local_primal_indices[i]]+=pcbddc->replicated_local_primal_values[i];
19530c7d97c5SJed Brown           } else { /* no communications needed for SCATTER_REVERSE since needed data is already present */
19540c7d97c5SJed Brown             for(i=0;i<pcbddc->local_primal_size;i++)
19550c7d97c5SJed Brown               array_to[i]=array_from[pcbddc->local_primal_indices[i]];
19560c7d97c5SJed Brown           }
19570c7d97c5SJed Brown           break;
195853cdbc3dSStefano Zampini         case MULTILEVEL_BDDC:
195953cdbc3dSStefano Zampini           break;
196053cdbc3dSStefano Zampini         case PARALLEL_BDDC:
196153cdbc3dSStefano Zampini           break;
19620c7d97c5SJed Brown       }
19630c7d97c5SJed Brown       if(vec_from) VecRestoreArray(vec_from,&array_from);
19640c7d97c5SJed Brown       if(vec_to)   VecRestoreArray(vec_to,&array_to);
19650c7d97c5SJed Brown       break;
19660c7d97c5SJed Brown   }
19670c7d97c5SJed Brown   PetscFunctionReturn(0);
19680c7d97c5SJed Brown }
19690c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
19703b03a366Sstefano_zampini #undef __FUNCT__
19713b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCCreateConstraintMatrix"
19723b03a366Sstefano_zampini static PetscErrorCode PCBDDCCreateConstraintMatrix(PC pc)
19733b03a366Sstefano_zampini {
19743b03a366Sstefano_zampini   PetscErrorCode ierr;
19753b03a366Sstefano_zampini   PC_IS*         pcis = (PC_IS*)(pc->data);
19763b03a366Sstefano_zampini   PC_BDDC*       pcbddc = (PC_BDDC*)pc->data;
19773b03a366Sstefano_zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
197823d4d1a5SStefano Zampini   PetscInt       *nnz,*is_indices;
19793b03a366Sstefano_zampini   PetscScalar    *temp_quadrature_constraint;
1980534831adSStefano Zampini   PetscInt       *temp_indices,*temp_indices_to_constraint,*temp_indices_to_constraint_B,*local_to_B;
19813b03a366Sstefano_zampini   PetscInt       local_primal_size,i,j,k,total_counts,max_size_of_constraint;
19823b03a366Sstefano_zampini   PetscInt       n_constraints,n_vertices,size_of_constraint;
1983534831adSStefano Zampini   PetscScalar    quad_value;
19843b03a366Sstefano_zampini   PetscBool      nnsp_has_cnst=PETSC_FALSE,use_nnsp_true=pcbddc->use_nnsp_true;
19853b03a366Sstefano_zampini   PetscInt       nnsp_size=0,nnsp_addone=0,temp_constraints,temp_start_ptr;
19863b03a366Sstefano_zampini   IS             *used_IS;
19873b03a366Sstefano_zampini   const MatType  impMatType=MATSEQAIJ;
19883b03a366Sstefano_zampini   PetscBLASInt   Bs,Bt,lwork,lierr;
19893b03a366Sstefano_zampini   PetscReal      tol=1.0e-8;
1990fcda91b4SJed Brown   MatNullSpace   nearnullsp;
1991fcda91b4SJed Brown   const Vec      *nearnullvecs;
19923b03a366Sstefano_zampini   Vec            *localnearnullsp;
19933b03a366Sstefano_zampini   PetscScalar    *work,*temp_basis,*array_vector,*correlation_mat;
19943b03a366Sstefano_zampini   PetscReal      *rwork,*singular_vals;
1995534831adSStefano Zampini   PetscBLASInt   Bone=1,*ipiv;
1996534831adSStefano Zampini   Vec            temp_vec;
1997534831adSStefano Zampini   Mat            temp_mat;
1998534831adSStefano Zampini   KSP            temp_ksp;
1999ffe5efe1SStefano Zampini   PC             temp_pc;
2000534831adSStefano Zampini   PetscInt       s,start_constraint,dual_dofs;
2001534831adSStefano Zampini   PetscBool      compute_submatrix,useksp=PETSC_FALSE;
2002534831adSStefano Zampini   PetscInt       *aux_primal_permutation,*aux_primal_numbering;
2003534831adSStefano Zampini   PetscBool      boolforface,*change_basis;
2004de534f79Sstefano_zampini /* some ugly conditional declarations */
20053b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
20063b03a366Sstefano_zampini   PetscScalar    dot_result;
20073b03a366Sstefano_zampini   PetscScalar    one=1.0,zero=0.0;
20083b03a366Sstefano_zampini   PetscInt       ii;
20093425bc38SStefano Zampini   PetscScalar    *singular_vectors;
20103425bc38SStefano Zampini   PetscBLASInt   *iwork,*ifail;
20113425bc38SStefano Zampini   PetscReal      dummy_real,abs_tol;
20123425bc38SStefano Zampini   PetscBLASInt   eigs_found;
20133b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
20143b03a366Sstefano_zampini   PetscScalar    val1,val2;
20153b03a366Sstefano_zampini #endif
20163425bc38SStefano Zampini #endif
20173b03a366Sstefano_zampini   PetscBLASInt   dummy_int;
20183b03a366Sstefano_zampini   PetscScalar    dummy_scalar;
20193b03a366Sstefano_zampini 
20203b03a366Sstefano_zampini   PetscFunctionBegin;
20213b03a366Sstefano_zampini   /* check if near null space is attached to global mat */
2022fcda91b4SJed Brown   ierr = MatGetNearNullSpace(pc->pmat,&nearnullsp);CHKERRQ(ierr);
2023fcda91b4SJed Brown   if (nearnullsp) {
2024fcda91b4SJed Brown     ierr = MatNullSpaceGetVecs(nearnullsp,&nnsp_has_cnst,&nnsp_size,&nearnullvecs);CHKERRQ(ierr);
20253b03a366Sstefano_zampini   } else { /* if near null space is not provided it uses constants */
20263b03a366Sstefano_zampini     nnsp_has_cnst = PETSC_TRUE;
20273b03a366Sstefano_zampini     use_nnsp_true = PETSC_TRUE;
20283b03a366Sstefano_zampini   }
20293b03a366Sstefano_zampini   if(nnsp_has_cnst) {
20303b03a366Sstefano_zampini     nnsp_addone = 1;
20313b03a366Sstefano_zampini   }
20323b03a366Sstefano_zampini   /*
20333b03a366Sstefano_zampini        Evaluate maximum storage size needed by the procedure
20343b03a366Sstefano_zampini        - temp_indices will contain start index of each constraint stored as follows
20353b03a366Sstefano_zampini        - temp_indices_to_constraint  [temp_indices[i],...,temp[indices[i+1]-1] will contain the indices (in local numbering) on which the constraint acts
2036534831adSStefano Zampini        - temp_indices_to_constraint_B[temp_indices[i],...,temp[indices[i+1]-1] will contain the indices (in boundary numbering) on which the constraint acts
20373b03a366Sstefano_zampini        - temp_quadrature_constraint  [temp_indices[i],...,temp[indices[i+1]-1] will contain the scalars representing the constraint itself
20383b03a366Sstefano_zampini                                                                                                                                                          */
2039da1bb401SStefano Zampini 
20403b03a366Sstefano_zampini   total_counts = pcbddc->n_ISForFaces+pcbddc->n_ISForEdges;
20413b03a366Sstefano_zampini   total_counts *= (nnsp_addone+nnsp_size);
2042da1bb401SStefano Zampini   ierr = ISGetSize(pcbddc->ISForVertices,&n_vertices);CHKERRQ(ierr);
2043da1bb401SStefano Zampini   total_counts += n_vertices;
20443b03a366Sstefano_zampini   ierr = PetscMalloc((total_counts+1)*sizeof(PetscInt),&temp_indices);CHKERRQ(ierr);
2045534831adSStefano Zampini   ierr = PetscMalloc((total_counts+1)*sizeof(PetscBool),&change_basis);CHKERRQ(ierr);
20463b03a366Sstefano_zampini   total_counts = 0;
20473b03a366Sstefano_zampini   max_size_of_constraint = 0;
20483b03a366Sstefano_zampini   for(i=0;i<pcbddc->n_ISForEdges+pcbddc->n_ISForFaces;i++){
20493b03a366Sstefano_zampini     if(i<pcbddc->n_ISForEdges){
20503b03a366Sstefano_zampini       used_IS = &pcbddc->ISForEdges[i];
20513b03a366Sstefano_zampini     } else {
20523b03a366Sstefano_zampini       used_IS = &pcbddc->ISForFaces[i-pcbddc->n_ISForEdges];
20533b03a366Sstefano_zampini     }
20543b03a366Sstefano_zampini     ierr = ISGetSize(*used_IS,&j);CHKERRQ(ierr);
20553b03a366Sstefano_zampini     total_counts += j;
20563b03a366Sstefano_zampini     if(j>max_size_of_constraint) max_size_of_constraint=j;
20573b03a366Sstefano_zampini   }
20583b03a366Sstefano_zampini   total_counts *= (nnsp_addone+nnsp_size);
2059da1bb401SStefano Zampini   total_counts += n_vertices;
20603b03a366Sstefano_zampini   ierr = PetscMalloc(total_counts*sizeof(PetscScalar),&temp_quadrature_constraint);CHKERRQ(ierr);
20613b03a366Sstefano_zampini   ierr = PetscMalloc(total_counts*sizeof(PetscInt),&temp_indices_to_constraint);CHKERRQ(ierr);
2062534831adSStefano Zampini   ierr = PetscMalloc(total_counts*sizeof(PetscInt),&temp_indices_to_constraint_B);CHKERRQ(ierr);
2063534831adSStefano Zampini   ierr = PetscMalloc(pcis->n*sizeof(PetscInt),&local_to_B);CHKERRQ(ierr);
2064534831adSStefano Zampini   ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2065534831adSStefano Zampini   for(i=0;i<pcis->n;i++) {
2066534831adSStefano Zampini     local_to_B[i]=-1;
2067534831adSStefano Zampini   }
2068534831adSStefano Zampini   for(i=0;i<pcis->n_B;i++) {
2069534831adSStefano Zampini     local_to_B[is_indices[i]]=i;
2070534831adSStefano Zampini   }
2071534831adSStefano Zampini   ierr = ISRestoreIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2072534831adSStefano Zampini 
20733b03a366Sstefano_zampini   /* First we issue queries to allocate optimal workspace for LAPACKgesvd or LAPACKsyev/LAPACKheev */
20743b03a366Sstefano_zampini   rwork = 0;
20753b03a366Sstefano_zampini   work = 0;
20763b03a366Sstefano_zampini   singular_vals = 0;
20773b03a366Sstefano_zampini   temp_basis = 0;
20783b03a366Sstefano_zampini   correlation_mat = 0;
20793b03a366Sstefano_zampini   if(!pcbddc->use_nnsp_true) {
20803b03a366Sstefano_zampini     PetscScalar temp_work;
20813b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
20823b03a366Sstefano_zampini     /* POD */
20833b03a366Sstefano_zampini     PetscInt max_n;
20843b03a366Sstefano_zampini     max_n = nnsp_addone+nnsp_size;
20853b03a366Sstefano_zampini     /* using some techniques borrowed from Proper Orthogonal Decomposition */
20863b03a366Sstefano_zampini     ierr = PetscMalloc(max_n*max_n*sizeof(PetscScalar),&correlation_mat);CHKERRQ(ierr);
20873425bc38SStefano Zampini     ierr = PetscMalloc(max_n*max_n*sizeof(PetscScalar),&singular_vectors);CHKERRQ(ierr);
20883b03a366Sstefano_zampini     ierr = PetscMalloc(max_n*sizeof(PetscReal),&singular_vals);CHKERRQ(ierr);
20893b03a366Sstefano_zampini     ierr = PetscMalloc(max_size_of_constraint*(nnsp_addone+nnsp_size)*sizeof(PetscScalar),&temp_basis);CHKERRQ(ierr);
20903b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
20913b03a366Sstefano_zampini     ierr = PetscMalloc(3*max_n*sizeof(PetscReal),&rwork);CHKERRQ(ierr);
20923b03a366Sstefano_zampini #endif
20933425bc38SStefano Zampini     ierr = PetscMalloc(5*max_n*sizeof(PetscBLASInt),&iwork);CHKERRQ(ierr);
20943425bc38SStefano Zampini     ierr = PetscMalloc(max_n*sizeof(PetscBLASInt),&ifail);CHKERRQ(ierr);
20953b03a366Sstefano_zampini     /* now we evaluate the optimal workspace using query with lwork=-1 */
20963b03a366Sstefano_zampini     Bt = PetscBLASIntCast(max_n);
20973b03a366Sstefano_zampini     lwork=-1;
20983425bc38SStefano Zampini     ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
20993b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
21003425bc38SStefano Zampini     abs_tol=1.e-8;
21013425bc38SStefano Zampini /*    LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,&temp_work,&lwork,&lierr); */
21023425bc38SStefano Zampini     LAPACKsyevx_("V","A","U",&Bt,correlation_mat,&Bt,&dummy_real,&dummy_real,&dummy_int,&dummy_int,
21033425bc38SStefano Zampini                  &abs_tol,&eigs_found,singular_vals,singular_vectors,&Bt,&temp_work,&lwork,iwork,ifail,&lierr);
21043b03a366Sstefano_zampini #else
21053425bc38SStefano Zampini /*    LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,&temp_work,&lwork,rwork,&lierr); */
21063425bc38SStefano Zampini /*  LAPACK call is missing here! TODO */
21073425bc38SStefano Zampini     SETERRQ(((PetscObject) pc)->comm, PETSC_ERR_SUP, "Not yet implemented for complexes when PETSC_MISSING_GESVD = 1");
21083b03a366Sstefano_zampini #endif
21093425bc38SStefano Zampini     if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SYEVX Lapack routine %d",(int)lierr);
21103425bc38SStefano Zampini     ierr = PetscFPTrapPop();CHKERRQ(ierr);
21113b03a366Sstefano_zampini #else /* on missing GESVD */
21123b03a366Sstefano_zampini     /* SVD */
21133b03a366Sstefano_zampini     PetscInt max_n,min_n;
21143b03a366Sstefano_zampini     max_n = max_size_of_constraint;
21153b03a366Sstefano_zampini     min_n = nnsp_addone+nnsp_size;
21163b03a366Sstefano_zampini     if(max_size_of_constraint < ( nnsp_addone+nnsp_size ) ) {
21173b03a366Sstefano_zampini       min_n = max_size_of_constraint;
21183b03a366Sstefano_zampini       max_n = nnsp_addone+nnsp_size;
21193b03a366Sstefano_zampini     }
21203b03a366Sstefano_zampini     ierr = PetscMalloc(min_n*sizeof(PetscReal),&singular_vals);CHKERRQ(ierr);
21213b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
21223b03a366Sstefano_zampini     ierr = PetscMalloc(5*min_n*sizeof(PetscReal),&rwork);CHKERRQ(ierr);
21233b03a366Sstefano_zampini #endif
21243b03a366Sstefano_zampini     /* now we evaluate the optimal workspace using query with lwork=-1 */
21253b03a366Sstefano_zampini     lwork=-1;
21263b03a366Sstefano_zampini     Bs = PetscBLASIntCast(max_n);
21273b03a366Sstefano_zampini     Bt = PetscBLASIntCast(min_n);
21283b03a366Sstefano_zampini     dummy_int = Bs;
2129670f3ff9SJed Brown     ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
21303b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
21313b03a366Sstefano_zampini     LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[0],&Bs,singular_vals,
21323b03a366Sstefano_zampini                  &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,&temp_work,&lwork,&lierr);
21333b03a366Sstefano_zampini #else
21343b03a366Sstefano_zampini     LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[0],&Bs,singular_vals,
21353b03a366Sstefano_zampini                  &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,&temp_work,&lwork,rwork,&lierr);
21363b03a366Sstefano_zampini #endif
21373b03a366Sstefano_zampini     if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SVD Lapack routine %d",(int)lierr);
2138670f3ff9SJed Brown     ierr = PetscFPTrapPop();CHKERRQ(ierr);
21393b03a366Sstefano_zampini #endif
21403b03a366Sstefano_zampini     /* Allocate optimal workspace */
21413b03a366Sstefano_zampini     lwork = PetscBLASIntCast((PetscInt)PetscRealPart(temp_work));
21423b03a366Sstefano_zampini     total_counts = (PetscInt)lwork;
21433b03a366Sstefano_zampini     ierr = PetscMalloc(total_counts*sizeof(PetscScalar),&work);CHKERRQ(ierr);
21443b03a366Sstefano_zampini   }
21453b03a366Sstefano_zampini   /* get local part of global near null space vectors */
21463b03a366Sstefano_zampini   ierr = PetscMalloc(nnsp_size*sizeof(Vec),&localnearnullsp);CHKERRQ(ierr);
21473b03a366Sstefano_zampini   for(k=0;k<nnsp_size;k++) {
21483b03a366Sstefano_zampini     ierr = VecDuplicate(pcis->vec1_N,&localnearnullsp[k]);CHKERRQ(ierr);
2149fcda91b4SJed Brown     ierr = VecScatterBegin(matis->ctx,nearnullvecs[k],localnearnullsp[k],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
2150fcda91b4SJed Brown     ierr = VecScatterEnd  (matis->ctx,nearnullvecs[k],localnearnullsp[k],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21513b03a366Sstefano_zampini   }
21523b03a366Sstefano_zampini   /* Now we can loop on constraining sets */
21533b03a366Sstefano_zampini   total_counts=0;
21543b03a366Sstefano_zampini   temp_indices[0]=0;
2155da1bb401SStefano Zampini   /* vertices */
2156da1bb401SStefano Zampini   PetscBool used_vertex;
2157da1bb401SStefano Zampini   ierr = ISGetIndices(pcbddc->ISForVertices,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2158da1bb401SStefano Zampini   if(nnsp_has_cnst) { /* consider all vertices */
2159da1bb401SStefano Zampini     for(i=0;i<n_vertices;i++) {
2160da1bb401SStefano Zampini       temp_indices_to_constraint[temp_indices[total_counts]]=is_indices[i];
2161534831adSStefano Zampini       temp_indices_to_constraint_B[temp_indices[total_counts]]=local_to_B[is_indices[i]];
2162da1bb401SStefano Zampini       temp_quadrature_constraint[temp_indices[total_counts]]=1.0;
2163da1bb401SStefano Zampini       temp_indices[total_counts+1]=temp_indices[total_counts]+1;
2164534831adSStefano Zampini       change_basis[total_counts]=PETSC_FALSE;
2165da1bb401SStefano Zampini       total_counts++;
2166da1bb401SStefano Zampini     }
2167da1bb401SStefano Zampini   } else { /* consider vertices for which exist at least a localnearnullsp which is not null there */
2168da1bb401SStefano Zampini     for(i=0;i<n_vertices;i++) {
2169da1bb401SStefano Zampini       used_vertex=PETSC_FALSE;
2170da1bb401SStefano Zampini       k=0;
2171da1bb401SStefano Zampini       while(!used_vertex && k<nnsp_size) {
2172da1bb401SStefano Zampini         ierr = VecGetArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
2173da1bb401SStefano Zampini         if(PetscAbsScalar(array_vector[is_indices[i]])>0.0) {
2174da1bb401SStefano Zampini           temp_indices_to_constraint[temp_indices[total_counts]]=is_indices[i];
2175534831adSStefano Zampini           temp_indices_to_constraint_B[temp_indices[total_counts]]=local_to_B[is_indices[i]];
2176da1bb401SStefano Zampini           temp_quadrature_constraint[temp_indices[total_counts]]=1.0;
2177da1bb401SStefano Zampini           temp_indices[total_counts+1]=temp_indices[total_counts]+1;
2178534831adSStefano Zampini           change_basis[total_counts]=PETSC_FALSE;
2179da1bb401SStefano Zampini           total_counts++;
2180da1bb401SStefano Zampini           used_vertex=PETSC_TRUE;
2181da1bb401SStefano Zampini         }
2182da1bb401SStefano Zampini         ierr = VecRestoreArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
2183da1bb401SStefano Zampini         k++;
2184da1bb401SStefano Zampini       }
2185da1bb401SStefano Zampini     }
2186da1bb401SStefano Zampini   }
2187da1bb401SStefano Zampini   ierr = ISRestoreIndices(pcbddc->ISForVertices,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2188da1bb401SStefano Zampini   n_vertices=total_counts;
2189da1bb401SStefano Zampini   /* edges and faces */
21903b03a366Sstefano_zampini   for(i=0;i<pcbddc->n_ISForEdges+pcbddc->n_ISForFaces;i++){
21913b03a366Sstefano_zampini     if(i<pcbddc->n_ISForEdges){
21923b03a366Sstefano_zampini       used_IS = &pcbddc->ISForEdges[i];
2193534831adSStefano Zampini       boolforface = pcbddc->usechangeofbasis;
21943b03a366Sstefano_zampini     } else {
21953b03a366Sstefano_zampini       used_IS = &pcbddc->ISForFaces[i-pcbddc->n_ISForEdges];
2196534831adSStefano Zampini       boolforface = pcbddc->usechangeonfaces;
21973b03a366Sstefano_zampini     }
21983b03a366Sstefano_zampini     temp_constraints = 0;          /* zero the number of constraints I have on this conn comp */
21993b03a366Sstefano_zampini     temp_start_ptr = total_counts; /* need to know the starting index of constraints stored */
22003b03a366Sstefano_zampini     ierr = ISGetSize(*used_IS,&size_of_constraint);CHKERRQ(ierr);
22013b03a366Sstefano_zampini     ierr = ISGetIndices(*used_IS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
22023b03a366Sstefano_zampini     if(nnsp_has_cnst) {
22033b03a366Sstefano_zampini       temp_constraints++;
2204534831adSStefano Zampini       quad_value = (PetscScalar) (1.0/PetscSqrtReal((PetscReal)size_of_constraint));
22053b03a366Sstefano_zampini       for(j=0;j<size_of_constraint;j++) {
22063b03a366Sstefano_zampini         temp_indices_to_constraint[temp_indices[total_counts]+j]=is_indices[j];
2207534831adSStefano Zampini         temp_indices_to_constraint_B[temp_indices[total_counts]+j]=local_to_B[is_indices[j]];
22083b03a366Sstefano_zampini         temp_quadrature_constraint[temp_indices[total_counts]+j]=quad_value;
22093b03a366Sstefano_zampini       }
22103b03a366Sstefano_zampini       temp_indices[total_counts+1]=temp_indices[total_counts]+size_of_constraint;  /* store new starting point */
2211534831adSStefano Zampini       change_basis[total_counts]=boolforface;
22123b03a366Sstefano_zampini       total_counts++;
22133b03a366Sstefano_zampini     }
22143b03a366Sstefano_zampini     for(k=0;k<nnsp_size;k++) {
22153b03a366Sstefano_zampini       ierr = VecGetArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
22163b03a366Sstefano_zampini       for(j=0;j<size_of_constraint;j++) {
22173b03a366Sstefano_zampini         temp_indices_to_constraint[temp_indices[total_counts]+j]=is_indices[j];
2218534831adSStefano Zampini         temp_indices_to_constraint_B[temp_indices[total_counts]+j]=local_to_B[is_indices[j]];
22193b03a366Sstefano_zampini         temp_quadrature_constraint[temp_indices[total_counts]+j]=array_vector[is_indices[j]];
22203b03a366Sstefano_zampini       }
22213b03a366Sstefano_zampini       ierr = VecRestoreArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
2222de534f79Sstefano_zampini       quad_value = 1.0;
2223de534f79Sstefano_zampini       if( use_nnsp_true ) { /* check if array is null on the connected component in case use_nnsp_true has been requested */
2224de534f79Sstefano_zampini         Bs = PetscBLASIntCast(size_of_constraint);
2225de534f79Sstefano_zampini         quad_value = BLASasum_(&Bs,&temp_quadrature_constraint[temp_indices[total_counts]],&Bone);
2226de534f79Sstefano_zampini       }
2227de534f79Sstefano_zampini       if ( quad_value > 0.0 ) { /* keep indices and values */
2228de534f79Sstefano_zampini         temp_constraints++;
22293b03a366Sstefano_zampini         temp_indices[total_counts+1]=temp_indices[total_counts]+size_of_constraint;  /* store new starting point */
2230534831adSStefano Zampini         change_basis[total_counts]=boolforface;
22313b03a366Sstefano_zampini         total_counts++;
22323b03a366Sstefano_zampini       }
2233de534f79Sstefano_zampini     }
22343b03a366Sstefano_zampini     ierr = ISRestoreIndices(*used_IS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2235de534f79Sstefano_zampini     /* perform SVD on the constraint if use_nnsp_true has not been requested by the user */
22363b03a366Sstefano_zampini     if(!use_nnsp_true) {
2237de534f79Sstefano_zampini 
22383b03a366Sstefano_zampini       Bs = PetscBLASIntCast(size_of_constraint);
22393b03a366Sstefano_zampini       Bt = PetscBLASIntCast(temp_constraints);
2240de534f79Sstefano_zampini 
22413b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
22423b03a366Sstefano_zampini       ierr = PetscMemzero(correlation_mat,Bt*Bt*sizeof(PetscScalar));CHKERRQ(ierr);
22433b03a366Sstefano_zampini       /* Store upper triangular part of correlation matrix */
22443b03a366Sstefano_zampini       for(j=0;j<temp_constraints;j++) {
22453b03a366Sstefano_zampini         for(k=0;k<j+1;k++) {
22463b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
22473425bc38SStefano Zampini           /* hand made complex dot product -> replace */
22483b03a366Sstefano_zampini           dot_result = 0.0;
22493b03a366Sstefano_zampini           for (ii=0; ii<size_of_constraint; ii++) {
22503b03a366Sstefano_zampini             val1 = temp_quadrature_constraint[temp_indices[temp_start_ptr+j]+ii];
22513b03a366Sstefano_zampini             val2 = temp_quadrature_constraint[temp_indices[temp_start_ptr+k]+ii];
22523b03a366Sstefano_zampini             dot_result += val1*PetscConj(val2);
22533b03a366Sstefano_zampini           }
22543b03a366Sstefano_zampini #else
22553b03a366Sstefano_zampini           dot_result = BLASdot_(&Bs,&temp_quadrature_constraint[temp_indices[temp_start_ptr+j]],&Bone,
22563b03a366Sstefano_zampini                                     &temp_quadrature_constraint[temp_indices[temp_start_ptr+k]],&Bone);
22573b03a366Sstefano_zampini #endif
22583b03a366Sstefano_zampini           correlation_mat[j*temp_constraints+k]=dot_result;
22593b03a366Sstefano_zampini         }
22603b03a366Sstefano_zampini       }
22613425bc38SStefano Zampini       ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
22623b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
22633425bc38SStefano Zampini /*      LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,work,&lwork,&lierr); */
22643425bc38SStefano Zampini       LAPACKsyevx_("V","A","U",&Bt,correlation_mat,&Bt,&dummy_real,&dummy_real,&dummy_int,&dummy_int,
22653425bc38SStefano Zampini                  &abs_tol,&eigs_found,singular_vals,singular_vectors,&Bt,work,&lwork,iwork,ifail,&lierr);
22663b03a366Sstefano_zampini #else
22673425bc38SStefano Zampini /*  LAPACK call is missing here! TODO */
22683425bc38SStefano Zampini       SETERRQ(((PetscObject) pc)->comm, PETSC_ERR_SUP, "Not yet implemented for complexes when PETSC_MISSING_GESVD = 1");
22693b03a366Sstefano_zampini #endif
22703425bc38SStefano Zampini       if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYEVX Lapack routine %d",(int)lierr);
22713425bc38SStefano Zampini       ierr = PetscFPTrapPop();CHKERRQ(ierr);
22723b03a366Sstefano_zampini       /* retain eigenvalues greater than tol: note that lapack SYEV gives eigs in ascending order */
22733b03a366Sstefano_zampini       j=0;
22743b03a366Sstefano_zampini       while( j < Bt && singular_vals[j] < tol) j++;
22753b03a366Sstefano_zampini       total_counts=total_counts-j;
22763b03a366Sstefano_zampini       if(j<temp_constraints) {
22773b03a366Sstefano_zampini         for(k=j;k<Bt;k++) { singular_vals[k]=1.0/PetscSqrtReal(singular_vals[k]); }
22783425bc38SStefano Zampini         ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
22793b03a366Sstefano_zampini         BLASgemm_("N","N",&Bs,&Bt,&Bt,&one,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,correlation_mat,&Bt,&zero,temp_basis,&Bs);
22803425bc38SStefano Zampini         ierr = PetscFPTrapPop();CHKERRQ(ierr);
22813b03a366Sstefano_zampini         /* copy POD basis into used quadrature memory */
22823b03a366Sstefano_zampini         for(k=0;k<Bt-j;k++) {
22833b03a366Sstefano_zampini           for(ii=0;ii<size_of_constraint;ii++) {
22843b03a366Sstefano_zampini             temp_quadrature_constraint[temp_indices[temp_start_ptr+k]+ii]=singular_vals[Bt-1-k]*temp_basis[(Bt-1-k)*size_of_constraint+ii];
22853b03a366Sstefano_zampini           }
22863b03a366Sstefano_zampini         }
22873b03a366Sstefano_zampini       }
2288de534f79Sstefano_zampini 
22893b03a366Sstefano_zampini #else  /* on missing GESVD */
22903b03a366Sstefano_zampini       PetscInt min_n = temp_constraints;
22913b03a366Sstefano_zampini       if(min_n > size_of_constraint) min_n = size_of_constraint;
22923b03a366Sstefano_zampini       dummy_int = Bs;
2293670f3ff9SJed Brown       ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
22943b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
22953b03a366Sstefano_zampini       LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,singular_vals,
22963b03a366Sstefano_zampini                    &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,work,&lwork,&lierr);
22973b03a366Sstefano_zampini #else
22983b03a366Sstefano_zampini       LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,singular_vals,
22993b03a366Sstefano_zampini                    &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,work,&lwork,rwork,&lierr);
23003b03a366Sstefano_zampini #endif
23013b03a366Sstefano_zampini       if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SVD Lapack routine %d",(int)lierr);
2302670f3ff9SJed Brown       ierr = PetscFPTrapPop();CHKERRQ(ierr);
23033b03a366Sstefano_zampini       /* retain eigenvalues greater than tol: note that lapack SVD gives eigs in descending order */
23043b03a366Sstefano_zampini       j=0;
23053b03a366Sstefano_zampini       while( j < min_n && singular_vals[min_n-j-1] < tol) j++;
23063b03a366Sstefano_zampini       total_counts = total_counts-(PetscInt)Bt+(min_n-j);
23073b03a366Sstefano_zampini #endif
23083b03a366Sstefano_zampini     }
23093b03a366Sstefano_zampini   }
2310534831adSStefano Zampini 
2311da1bb401SStefano Zampini   n_constraints=total_counts-n_vertices;
2312da1bb401SStefano Zampini   local_primal_size = total_counts;
23133b03a366Sstefano_zampini   /* set quantities in pcbddc data structure */
23143b03a366Sstefano_zampini   pcbddc->n_vertices = n_vertices;
23153b03a366Sstefano_zampini   pcbddc->n_constraints = n_constraints;
2316da1bb401SStefano Zampini   pcbddc->local_primal_size = local_primal_size;
2317534831adSStefano Zampini 
2318534831adSStefano Zampini   /* Create constraint matrix */
2319534831adSStefano Zampini   /* The constraint matrix is used to compute the l2g map of primal dofs */
2320534831adSStefano Zampini   /* so we need to set it up properly either with or without change of basis */
2321534831adSStefano Zampini   ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->ConstraintMatrix);CHKERRQ(ierr);
2322534831adSStefano Zampini   ierr = MatSetType(pcbddc->ConstraintMatrix,impMatType);CHKERRQ(ierr);
2323534831adSStefano Zampini   ierr = MatSetSizes(pcbddc->ConstraintMatrix,local_primal_size,pcis->n,local_primal_size,pcis->n);CHKERRQ(ierr);
2324534831adSStefano Zampini   /* compute a local numbering of constraints : vertices first then constraints */
2325534831adSStefano Zampini   ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
2326534831adSStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array_vector);CHKERRQ(ierr);
2327534831adSStefano Zampini   ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&aux_primal_numbering);CHKERRQ(ierr);
2328534831adSStefano Zampini   ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&aux_primal_permutation);CHKERRQ(ierr);
2329534831adSStefano Zampini   total_counts=0;
2330534831adSStefano Zampini   /* find vertices: subdomain corners plus dofs with basis changed */
2331534831adSStefano Zampini   for(i=0;i<local_primal_size;i++) {
2332534831adSStefano Zampini     size_of_constraint=temp_indices[i+1]-temp_indices[i];
2333534831adSStefano Zampini     if(change_basis[i] || size_of_constraint == 1) {
2334534831adSStefano Zampini       k=0;
2335534831adSStefano Zampini       while(k < size_of_constraint && array_vector[temp_indices_to_constraint[temp_indices[i]+size_of_constraint-k-1]] != 0.0) {
2336534831adSStefano Zampini         k=k+1;
2337534831adSStefano Zampini       }
2338534831adSStefano Zampini       j=temp_indices_to_constraint[temp_indices[i]+size_of_constraint-k-1];
2339534831adSStefano Zampini       array_vector[j] = 1.0;
2340534831adSStefano Zampini       aux_primal_numbering[total_counts]=j;
2341534831adSStefano Zampini       aux_primal_permutation[total_counts]=total_counts;
2342534831adSStefano Zampini       total_counts++;
2343534831adSStefano Zampini     }
2344534831adSStefano Zampini   }
2345534831adSStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array_vector);CHKERRQ(ierr);
2346534831adSStefano Zampini   /* permute indices in order to have a sorted set of vertices */
2347534831adSStefano Zampini   ierr = PetscSortIntWithPermutation(total_counts,aux_primal_numbering,aux_primal_permutation);
2348534831adSStefano Zampini   /* nonzero structure */
2349534831adSStefano Zampini   ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
2350534831adSStefano Zampini   for(i=0;i<total_counts;i++) {
2351534831adSStefano Zampini     nnz[i]=1;
2352534831adSStefano Zampini   }
2353534831adSStefano Zampini   j=total_counts;
2354534831adSStefano Zampini   for(i=n_vertices;i<local_primal_size;i++) {
2355534831adSStefano Zampini     if(!change_basis[i]) {
2356534831adSStefano Zampini       nnz[j]=temp_indices[i+1]-temp_indices[i];
2357534831adSStefano Zampini       j++;
2358534831adSStefano Zampini     }
2359534831adSStefano Zampini   }
2360534831adSStefano Zampini   ierr = MatSeqAIJSetPreallocation(pcbddc->ConstraintMatrix,0,nnz);CHKERRQ(ierr);
2361534831adSStefano Zampini   ierr = PetscFree(nnz);CHKERRQ(ierr);
2362534831adSStefano Zampini   /* set values in constraint matrix */
2363534831adSStefano Zampini   for(i=0;i<total_counts;i++) {
2364534831adSStefano Zampini     j = aux_primal_permutation[i];
2365534831adSStefano Zampini     k = aux_primal_numbering[j];
2366534831adSStefano Zampini     ierr = MatSetValue(pcbddc->ConstraintMatrix,i,k,1.0,INSERT_VALUES);CHKERRQ(ierr);
2367534831adSStefano Zampini   }
2368534831adSStefano Zampini   for(i=n_vertices;i<local_primal_size;i++) {
2369534831adSStefano Zampini     if(!change_basis[i]) {
2370534831adSStefano Zampini       size_of_constraint=temp_indices[i+1]-temp_indices[i];
2371534831adSStefano Zampini       ierr = MatSetValues(pcbddc->ConstraintMatrix,1,&total_counts,size_of_constraint,&temp_indices_to_constraint[temp_indices[i]],&temp_quadrature_constraint[temp_indices[i]],INSERT_VALUES);CHKERRQ(ierr);
2372534831adSStefano Zampini       total_counts++;
2373534831adSStefano Zampini     }
2374534831adSStefano Zampini   }
2375534831adSStefano Zampini   ierr = PetscFree(aux_primal_numbering);CHKERRQ(ierr);
2376534831adSStefano Zampini   ierr = PetscFree(aux_primal_permutation);CHKERRQ(ierr);
2377534831adSStefano Zampini   /* assembling */
2378534831adSStefano Zampini   ierr = MatAssemblyBegin(pcbddc->ConstraintMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2379534831adSStefano Zampini   ierr = MatAssemblyEnd(pcbddc->ConstraintMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2380534831adSStefano Zampini 
2381534831adSStefano Zampini   /* Create matrix for change of basis. We don't need it in case pcbddc->usechangeofbasis is FALSE */
2382534831adSStefano Zampini   if(pcbddc->usechangeofbasis) {
2383534831adSStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr);
2384534831adSStefano Zampini     ierr = MatSetType(pcbddc->ChangeOfBasisMatrix,impMatType);CHKERRQ(ierr);
2385534831adSStefano Zampini     ierr = MatSetSizes(pcbddc->ChangeOfBasisMatrix,pcis->n_B,pcis->n_B,pcis->n_B,pcis->n_B);CHKERRQ(ierr);
2386534831adSStefano Zampini     /* work arrays */
2387534831adSStefano Zampini     /* we need to reuse these arrays, so we free them */
2388534831adSStefano Zampini     ierr = PetscFree(temp_basis);CHKERRQ(ierr);
2389534831adSStefano Zampini     ierr = PetscFree(work);CHKERRQ(ierr);
2390534831adSStefano Zampini     ierr = PetscMalloc(pcis->n_B*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
2391534831adSStefano Zampini     ierr = PetscMalloc((nnsp_addone+nnsp_size)*(nnsp_addone+nnsp_size)*sizeof(PetscScalar),&temp_basis);CHKERRQ(ierr);
2392534831adSStefano Zampini     ierr = PetscMalloc((nnsp_addone+nnsp_size)*sizeof(PetscScalar),&work);CHKERRQ(ierr);
2393534831adSStefano Zampini     ierr = PetscMalloc((nnsp_addone+nnsp_size)*sizeof(PetscBLASInt),&ipiv);CHKERRQ(ierr);
2394534831adSStefano Zampini     for(i=0;i<pcis->n_B;i++) {
2395534831adSStefano Zampini       nnz[i]=1;
2396534831adSStefano Zampini     }
2397534831adSStefano Zampini     /* Overestimated nonzeros per row */
2398534831adSStefano Zampini     k=1;
2399534831adSStefano Zampini     for(i=pcbddc->n_vertices;i<local_primal_size;i++) {
2400534831adSStefano Zampini       if(change_basis[i]) {
2401534831adSStefano Zampini         size_of_constraint = temp_indices[i+1]-temp_indices[i];
2402534831adSStefano Zampini         if(k < size_of_constraint) {
2403534831adSStefano Zampini           k = size_of_constraint;
2404534831adSStefano Zampini         }
2405534831adSStefano Zampini         for(j=0;j<size_of_constraint;j++) {
2406534831adSStefano Zampini           nnz[temp_indices_to_constraint_B[temp_indices[i]+j]] = size_of_constraint;
2407534831adSStefano Zampini         }
2408534831adSStefano Zampini       }
2409534831adSStefano Zampini     }
2410534831adSStefano Zampini     ierr = MatSeqAIJSetPreallocation(pcbddc->ChangeOfBasisMatrix,0,nnz);CHKERRQ(ierr);
2411534831adSStefano Zampini     ierr = PetscFree(nnz);CHKERRQ(ierr);
2412534831adSStefano Zampini     /* Temporary array to store indices */
2413534831adSStefano Zampini     ierr = PetscMalloc(k*sizeof(PetscInt),&is_indices);CHKERRQ(ierr);
2414534831adSStefano Zampini     /* Set initial identity in the matrix */
2415534831adSStefano Zampini     for(i=0;i<pcis->n_B;i++) {
2416534831adSStefano Zampini       ierr = MatSetValue(pcbddc->ChangeOfBasisMatrix,i,i,1.0,INSERT_VALUES);CHKERRQ(ierr);
2417534831adSStefano Zampini     }
2418534831adSStefano Zampini     /* Now we loop on the constraints which need a change of basis */
2419534831adSStefano Zampini     /* Change of basis matrix is evaluated as the FIRST APPROACH in */
2420534831adSStefano Zampini     /* Klawonn and Widlund, Dual-primal FETI-DP methods for linear elasticity, (6.2.1) */
2421534831adSStefano Zampini     temp_constraints = 0;
242293dc3b60SStefano Zampini     if(pcbddc->n_vertices < local_primal_size) {
2423534831adSStefano Zampini       temp_start_ptr = temp_indices_to_constraint_B[temp_indices[pcbddc->n_vertices]];
242493dc3b60SStefano Zampini     }
2425534831adSStefano Zampini     for(i=pcbddc->n_vertices;i<local_primal_size;i++) {
2426534831adSStefano Zampini       if(change_basis[i]) {
2427534831adSStefano Zampini         compute_submatrix = PETSC_FALSE;
2428534831adSStefano Zampini         useksp = PETSC_FALSE;
2429534831adSStefano Zampini         if(temp_start_ptr == temp_indices_to_constraint_B[temp_indices[i]]) {
2430534831adSStefano Zampini           temp_constraints++;
243104eaf177SStefano Zampini           if(i == local_primal_size -1 ||  temp_start_ptr != temp_indices_to_constraint_B[temp_indices[i+1]]) {
2432534831adSStefano Zampini             compute_submatrix = PETSC_TRUE;
2433534831adSStefano Zampini           }
2434534831adSStefano Zampini         }
2435534831adSStefano Zampini         if(compute_submatrix) {
2436534831adSStefano Zampini           if(temp_constraints > 1 || pcbddc->use_nnsp_true) {
2437534831adSStefano Zampini             useksp = PETSC_TRUE;
2438534831adSStefano Zampini           }
2439534831adSStefano Zampini           size_of_constraint = temp_indices[i+1]-temp_indices[i];
2440534831adSStefano Zampini           if(useksp) { /* experimental */
2441534831adSStefano Zampini             ierr = MatCreate(PETSC_COMM_SELF,&temp_mat);CHKERRQ(ierr);
2442534831adSStefano Zampini             ierr = MatSetType(temp_mat,impMatType);CHKERRQ(ierr);
2443534831adSStefano Zampini             ierr = MatSetSizes(temp_mat,size_of_constraint,size_of_constraint,size_of_constraint,size_of_constraint);CHKERRQ(ierr);
2444534831adSStefano Zampini             ierr = MatSeqAIJSetPreallocation(temp_mat,size_of_constraint,PETSC_NULL);CHKERRQ(ierr);
2445534831adSStefano Zampini           }
2446534831adSStefano Zampini           /* First _size_of_constraint-temp_constraints_ columns */
2447534831adSStefano Zampini           dual_dofs = size_of_constraint-temp_constraints;
2448534831adSStefano Zampini           start_constraint = i+1-temp_constraints;
2449534831adSStefano Zampini           for(s=0;s<dual_dofs;s++) {
2450534831adSStefano Zampini             is_indices[0] = s;
2451534831adSStefano Zampini             for(j=0;j<temp_constraints;j++) {
2452534831adSStefano Zampini               for(k=0;k<temp_constraints;k++) {
2453534831adSStefano Zampini                 temp_basis[j*temp_constraints+k]=temp_quadrature_constraint[temp_indices[start_constraint+k]+s+j+1];
2454534831adSStefano Zampini               }
2455534831adSStefano Zampini               work[j]=-temp_quadrature_constraint[temp_indices[start_constraint+j]+s];
2456534831adSStefano Zampini               is_indices[j+1]=s+j+1;
2457534831adSStefano Zampini             }
2458534831adSStefano Zampini             Bt = temp_constraints;
2459534831adSStefano Zampini             ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
2460534831adSStefano Zampini             LAPACKgesv_(&Bt,&Bone,temp_basis,&Bt,ipiv,work,&Bt,&lierr);
2461534831adSStefano Zampini             if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GESV Lapack routine %d",(int)lierr);
2462534831adSStefano Zampini             ierr = PetscFPTrapPop();CHKERRQ(ierr);
2463534831adSStefano Zampini             j = temp_indices_to_constraint_B[temp_indices[start_constraint]+s];
2464534831adSStefano Zampini             ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,temp_constraints,&temp_indices_to_constraint_B[temp_indices[start_constraint]+s+1],1,&j,work,INSERT_VALUES);CHKERRQ(ierr);
2465534831adSStefano Zampini             if(useksp) {
2466534831adSStefano Zampini               /* temp mat with transposed rows and columns */
2467534831adSStefano Zampini               ierr = MatSetValues(temp_mat,1,&s,temp_constraints,&is_indices[1],work,INSERT_VALUES);CHKERRQ(ierr);
2468534831adSStefano Zampini               ierr = MatSetValue(temp_mat,is_indices[0],is_indices[0],1.0,INSERT_VALUES);CHKERRQ(ierr);
2469534831adSStefano Zampini             }
2470534831adSStefano Zampini           }
2471534831adSStefano Zampini           if(useksp) {
2472534831adSStefano Zampini             /* last rows of temp_mat */
2473534831adSStefano Zampini             for(j=0;j<size_of_constraint;j++) {
2474534831adSStefano Zampini               is_indices[j] = j;
2475534831adSStefano Zampini             }
2476534831adSStefano Zampini             for(s=0;s<temp_constraints;s++) {
2477534831adSStefano Zampini               k = s + dual_dofs;
2478534831adSStefano Zampini               ierr = MatSetValues(temp_mat,1,&k,size_of_constraint,is_indices,&temp_quadrature_constraint[temp_indices[start_constraint+s]],INSERT_VALUES);CHKERRQ(ierr);
2479534831adSStefano Zampini             }
2480534831adSStefano Zampini             ierr = MatAssemblyBegin(temp_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2481534831adSStefano Zampini             ierr = MatAssemblyEnd(temp_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2482534831adSStefano Zampini             ierr = MatGetVecs(temp_mat,&temp_vec,PETSC_NULL);CHKERRQ(ierr);
2483534831adSStefano Zampini             ierr = KSPCreate(PETSC_COMM_SELF,&temp_ksp);CHKERRQ(ierr);
2484534831adSStefano Zampini             ierr = KSPSetOperators(temp_ksp,temp_mat,temp_mat,SAME_PRECONDITIONER);CHKERRQ(ierr);
2485534831adSStefano Zampini             ierr = KSPSetType(temp_ksp,KSPPREONLY);CHKERRQ(ierr);
2486ffe5efe1SStefano Zampini             ierr = KSPGetPC(temp_ksp,&temp_pc);CHKERRQ(ierr);
2487ffe5efe1SStefano Zampini             ierr = PCSetType(temp_pc,PCLU);CHKERRQ(ierr);
2488534831adSStefano Zampini             ierr = KSPSetUp(temp_ksp);CHKERRQ(ierr);
2489534831adSStefano Zampini             for(s=0;s<temp_constraints;s++) {
2490534831adSStefano Zampini               ierr = VecSet(temp_vec,0.0);CHKERRQ(ierr);
2491534831adSStefano Zampini               ierr = VecSetValue(temp_vec,s+dual_dofs,1.0,INSERT_VALUES);CHKERRQ(ierr);
2492534831adSStefano Zampini               ierr = VecAssemblyBegin(temp_vec);CHKERRQ(ierr);
2493534831adSStefano Zampini               ierr = VecAssemblyEnd(temp_vec);CHKERRQ(ierr);
2494534831adSStefano Zampini               ierr = KSPSolve(temp_ksp,temp_vec,temp_vec);CHKERRQ(ierr);
2495534831adSStefano Zampini               ierr = VecGetArray(temp_vec,&array_vector);CHKERRQ(ierr);
2496534831adSStefano Zampini               j = temp_indices_to_constraint_B[temp_indices[start_constraint+s]+size_of_constraint-s-1];
2497534831adSStefano Zampini               /* last columns of change of basis matrix associated to new primal dofs */
2498534831adSStefano Zampini               ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,size_of_constraint,&temp_indices_to_constraint_B[temp_indices[start_constraint+s]],1,&j,array_vector,INSERT_VALUES);CHKERRQ(ierr);
2499534831adSStefano Zampini               ierr = VecRestoreArray(temp_vec,&array_vector);CHKERRQ(ierr);
2500534831adSStefano Zampini             }
2501534831adSStefano Zampini             ierr = MatDestroy(&temp_mat);CHKERRQ(ierr);
2502534831adSStefano Zampini             ierr = KSPDestroy(&temp_ksp);CHKERRQ(ierr);
2503534831adSStefano Zampini             ierr = VecDestroy(&temp_vec);CHKERRQ(ierr);
2504534831adSStefano Zampini           } else {
2505534831adSStefano Zampini             /* last columns of change of basis matrix associated to new primal dofs */
2506534831adSStefano Zampini             for(s=0;s<temp_constraints;s++) {
2507534831adSStefano Zampini               j = temp_indices_to_constraint_B[temp_indices[start_constraint+s]+size_of_constraint-s-1];
2508534831adSStefano Zampini               ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,size_of_constraint,&temp_indices_to_constraint_B[temp_indices[start_constraint+s]],1,&j,&temp_quadrature_constraint[temp_indices[start_constraint+s]],INSERT_VALUES);CHKERRQ(ierr);
2509534831adSStefano Zampini             }
2510534831adSStefano Zampini           }
2511534831adSStefano Zampini           /* prepare for the next cycle */
2512534831adSStefano Zampini           temp_constraints = 0;
251304eaf177SStefano Zampini           if(i != local_primal_size -1 ) {
2514534831adSStefano Zampini             temp_start_ptr = temp_indices_to_constraint_B[temp_indices[i+1]];
2515534831adSStefano Zampini           }
2516534831adSStefano Zampini         }
2517534831adSStefano Zampini       }
251804eaf177SStefano Zampini     }
2519534831adSStefano Zampini     /* assembling */
2520534831adSStefano Zampini     ierr = MatAssemblyBegin(pcbddc->ChangeOfBasisMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2521534831adSStefano Zampini     ierr = MatAssemblyEnd(pcbddc->ChangeOfBasisMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2522534831adSStefano Zampini     ierr = PetscFree(ipiv);CHKERRQ(ierr);
2523534831adSStefano Zampini     ierr = PetscFree(is_indices);CHKERRQ(ierr);
2524534831adSStefano Zampini   }
25253b03a366Sstefano_zampini   /* free workspace no longer needed */
25263b03a366Sstefano_zampini   ierr = PetscFree(rwork);CHKERRQ(ierr);
25273b03a366Sstefano_zampini   ierr = PetscFree(work);CHKERRQ(ierr);
25283b03a366Sstefano_zampini   ierr = PetscFree(temp_basis);CHKERRQ(ierr);
25293b03a366Sstefano_zampini   ierr = PetscFree(singular_vals);CHKERRQ(ierr);
25303b03a366Sstefano_zampini   ierr = PetscFree(correlation_mat);CHKERRQ(ierr);
25313b03a366Sstefano_zampini   ierr = PetscFree(temp_indices);CHKERRQ(ierr);
2532534831adSStefano Zampini   ierr = PetscFree(change_basis);CHKERRQ(ierr);
25333b03a366Sstefano_zampini   ierr = PetscFree(temp_indices_to_constraint);CHKERRQ(ierr);
2534534831adSStefano Zampini   ierr = PetscFree(temp_indices_to_constraint_B);CHKERRQ(ierr);
2535534831adSStefano Zampini   ierr = PetscFree(local_to_B);CHKERRQ(ierr);
25363b03a366Sstefano_zampini   ierr = PetscFree(temp_quadrature_constraint);CHKERRQ(ierr);
25373425bc38SStefano Zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
25383425bc38SStefano Zampini   ierr = PetscFree(iwork);CHKERRQ(ierr);
25393425bc38SStefano Zampini   ierr = PetscFree(ifail);CHKERRQ(ierr);
25403425bc38SStefano Zampini   ierr = PetscFree(singular_vectors);CHKERRQ(ierr);
25413425bc38SStefano Zampini #endif
2542da1bb401SStefano Zampini   for(k=0;k<nnsp_size;k++) {
2543da1bb401SStefano Zampini     ierr = VecDestroy(&localnearnullsp[k]);CHKERRQ(ierr);
2544da1bb401SStefano Zampini   }
25453b03a366Sstefano_zampini   ierr = PetscFree(localnearnullsp);CHKERRQ(ierr);
25463b03a366Sstefano_zampini   PetscFunctionReturn(0);
25473b03a366Sstefano_zampini }
25483b03a366Sstefano_zampini /* -------------------------------------------------------------------------- */
25490c7d97c5SJed Brown #undef __FUNCT__
25500c7d97c5SJed Brown #define __FUNCT__ "PCBDDCCoarseSetUp"
255153cdbc3dSStefano Zampini static PetscErrorCode PCBDDCCoarseSetUp(PC pc)
25520c7d97c5SJed Brown {
25530c7d97c5SJed Brown   PetscErrorCode  ierr;
25540c7d97c5SJed Brown 
25550c7d97c5SJed Brown   PC_IS*            pcis = (PC_IS*)(pc->data);
25560c7d97c5SJed Brown   PC_BDDC*          pcbddc = (PC_BDDC*)pc->data;
25570c7d97c5SJed Brown   Mat_IS            *matis = (Mat_IS*)pc->pmat->data;
2558534831adSStefano Zampini   Mat               change_mat_all;
25590c7d97c5SJed Brown   IS                is_R_local;
25600c7d97c5SJed Brown   IS                is_V_local;
25610c7d97c5SJed Brown   IS                is_C_local;
25620c7d97c5SJed Brown   IS                is_aux1;
25630c7d97c5SJed Brown   IS                is_aux2;
25640c7d97c5SJed Brown   const VecType     impVecType;
25650c7d97c5SJed Brown   const MatType     impMatType;
25660c7d97c5SJed Brown   PetscInt          n_R=0;
25670c7d97c5SJed Brown   PetscInt          n_D=0;
25680c7d97c5SJed Brown   PetscInt          n_B=0;
25690c7d97c5SJed Brown   PetscScalar       zero=0.0;
25700c7d97c5SJed Brown   PetscScalar       one=1.0;
25710c7d97c5SJed Brown   PetscScalar       m_one=-1.0;
25720c7d97c5SJed Brown   PetscScalar*      array;
25730c7d97c5SJed Brown   PetscScalar       *coarse_submat_vals;
25740c7d97c5SJed Brown   PetscInt          *idx_R_local;
25750c7d97c5SJed Brown   PetscInt          *idx_V_B;
25760c7d97c5SJed Brown   PetscScalar       *coarsefunctions_errors;
25770c7d97c5SJed Brown   PetscScalar       *constraints_errors;
25780c7d97c5SJed Brown   /* auxiliary indices */
2579534831adSStefano Zampini   PetscInt i,j,k;
2580e269702eSStefano Zampini   /* for verbose output of bddc */
2581e269702eSStefano Zampini   PetscViewer       viewer=pcbddc->dbg_viewer;
2582e269702eSStefano Zampini   PetscBool         dbg_flag=pcbddc->dbg_flag;
2583a0ba757dSStefano Zampini   /* for counting coarse dofs */
2584534831adSStefano Zampini   PetscInt          n_vertices,n_constraints;
25853b03a366Sstefano_zampini   PetscInt          size_of_constraint;
25863b03a366Sstefano_zampini   PetscInt          *row_cmat_indices;
25873b03a366Sstefano_zampini   PetscScalar       *row_cmat_values;
2588534831adSStefano Zampini   PetscInt          *vertices,*nnz,*is_indices,*temp_indices;
25890c7d97c5SJed Brown 
25900c7d97c5SJed Brown   PetscFunctionBegin;
25910c7d97c5SJed Brown   /* Set Non-overlapping dimensions */
25920c7d97c5SJed Brown   n_B = pcis->n_B; n_D = pcis->n - n_B;
2593534831adSStefano Zampini   /* Set types for local objects needed by BDDC preconditioner */
2594534831adSStefano Zampini   impMatType = MATSEQDENSE;
2595534831adSStefano Zampini   impVecType = VECSEQ;
2596da1bb401SStefano Zampini   /* get vertex indices from constraint matrix */
2597534831adSStefano Zampini   ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscInt),&vertices);CHKERRQ(ierr);
2598534831adSStefano Zampini   n_vertices=0;
2599da1bb401SStefano Zampini   for(i=0;i<pcbddc->local_primal_size;i++) {
2600da1bb401SStefano Zampini     ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
2601da1bb401SStefano Zampini     if(size_of_constraint == 1) {
2602534831adSStefano Zampini       vertices[n_vertices]=row_cmat_indices[0];
2603534831adSStefano Zampini       n_vertices++;
2604a0ba757dSStefano Zampini     }
2605da1bb401SStefano Zampini     ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
2606a0ba757dSStefano Zampini   }
2607534831adSStefano Zampini   /* Set number of constraints */
2608534831adSStefano Zampini   n_constraints = pcbddc->local_primal_size-n_vertices;
2609534831adSStefano Zampini 
2610534831adSStefano Zampini   /* vertices in boundary numbering */
2611534831adSStefano Zampini   if(n_vertices) {
2612534831adSStefano Zampini     ierr = VecSet(pcis->vec1_N,m_one);CHKERRQ(ierr);
2613534831adSStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2614534831adSStefano Zampini     for (i=0; i<n_vertices; i++) { array[ vertices[i] ] = i; }
2615534831adSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2616534831adSStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
2617534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
2618534831adSStefano Zampini     ierr = PetscMalloc(n_vertices*sizeof(PetscInt),&idx_V_B);CHKERRQ(ierr);
2619534831adSStefano Zampini     ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
2620534831adSStefano Zampini     for (i=0; i<n_vertices; i++) {
2621534831adSStefano Zampini       j=0;
2622534831adSStefano Zampini       while (array[j] != i ) {j++;}
2623534831adSStefano Zampini       idx_V_B[i]=j;
2624534831adSStefano Zampini     }
2625534831adSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
2626534831adSStefano Zampini   }
2627534831adSStefano Zampini 
2628534831adSStefano Zampini   /* transform local matrices if needed */
2629534831adSStefano Zampini   if(pcbddc->usechangeofbasis) {
2630534831adSStefano Zampini     ierr = PetscMalloc(pcis->n*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
2631534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2632534831adSStefano Zampini     for(i=0;i<n_D;i++) {
2633534831adSStefano Zampini       nnz[is_indices[i]]=1;
2634534831adSStefano Zampini     }
2635534831adSStefano Zampini     ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2636534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2637534831adSStefano Zampini     k=1;
2638534831adSStefano Zampini     for(i=0;i<n_B;i++) {
2639534831adSStefano Zampini       ierr = MatGetRow(pcbddc->ChangeOfBasisMatrix,i,&j,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr);
2640534831adSStefano Zampini       nnz[is_indices[i]]=j;
2641534831adSStefano Zampini       if( k < j) {
2642534831adSStefano Zampini         k = j;
2643534831adSStefano Zampini       }
2644534831adSStefano Zampini       ierr = MatRestoreRow(pcbddc->ChangeOfBasisMatrix,i,&j,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr);
2645534831adSStefano Zampini     }
2646534831adSStefano Zampini     ierr = ISRestoreIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2647534831adSStefano Zampini     /* assemble change of basis matrix on the whole set of local dofs */
2648534831adSStefano Zampini     ierr = PetscMalloc(k*sizeof(PetscInt),&temp_indices);CHKERRQ(ierr);
2649534831adSStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&change_mat_all);CHKERRQ(ierr);
2650534831adSStefano Zampini     ierr = MatSetSizes(change_mat_all,pcis->n,pcis->n,pcis->n,pcis->n);CHKERRQ(ierr);
2651534831adSStefano Zampini     ierr = MatSetType(change_mat_all,MATSEQAIJ);CHKERRQ(ierr);
2652534831adSStefano Zampini     ierr = MatSeqAIJSetPreallocation(change_mat_all,0,nnz);CHKERRQ(ierr);
2653534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2654534831adSStefano Zampini     for(i=0;i<n_D;i++) {
2655534831adSStefano Zampini       ierr = MatSetValue(change_mat_all,is_indices[i],is_indices[i],1.0,INSERT_VALUES);CHKERRQ(ierr);
2656534831adSStefano Zampini     }
2657534831adSStefano Zampini     ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2658534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2659534831adSStefano Zampini     for(i=0;i<n_B;i++) {
2660534831adSStefano Zampini       ierr = MatGetRow(pcbddc->ChangeOfBasisMatrix,i,&j,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
2661534831adSStefano Zampini       for(k=0;k<j;k++) {
2662534831adSStefano Zampini         temp_indices[k]=is_indices[row_cmat_indices[k]];
2663534831adSStefano Zampini       }
2664534831adSStefano Zampini       ierr = MatSetValues(change_mat_all,1,&is_indices[i],j,temp_indices,row_cmat_values,INSERT_VALUES);CHKERRQ(ierr);
2665534831adSStefano Zampini       ierr = MatRestoreRow(pcbddc->ChangeOfBasisMatrix,i,&j,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
2666534831adSStefano Zampini     }
2667534831adSStefano Zampini     ierr = MatAssemblyBegin(change_mat_all,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2668534831adSStefano Zampini     ierr = MatAssemblyEnd(change_mat_all,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2669534831adSStefano Zampini     ierr = MatPtAP(matis->A,change_mat_all,MAT_INITIAL_MATRIX,1.0,&pcbddc->local_mat);CHKERRQ(ierr);
2670534831adSStefano Zampini     ierr = MatDestroy(&pcis->A_IB);CHKERRQ(ierr);
2671534831adSStefano Zampini     ierr = MatDestroy(&pcis->A_BI);CHKERRQ(ierr);
2672534831adSStefano Zampini     ierr = MatDestroy(&pcis->A_BB);CHKERRQ(ierr);
2673534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_I_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&pcis->A_IB);CHKERRQ(ierr);
2674534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_B_local,pcis->is_I_local,MAT_INITIAL_MATRIX,&pcis->A_BI);CHKERRQ(ierr);
2675534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_B_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&pcis->A_BB);CHKERRQ(ierr);
2676534831adSStefano Zampini     ierr = MatDestroy(&change_mat_all);CHKERRQ(ierr);
2677534831adSStefano Zampini     ierr = PetscFree(nnz);CHKERRQ(ierr);
2678534831adSStefano Zampini     ierr = PetscFree(temp_indices);CHKERRQ(ierr);
2679534831adSStefano Zampini   } else {
2680534831adSStefano Zampini     /* without change of basis, the local matrix is unchanged */
2681534831adSStefano Zampini     ierr = PetscObjectReference((PetscObject)matis->A);CHKERRQ(ierr);
2682534831adSStefano Zampini     pcbddc->local_mat = matis->A;
2683534831adSStefano Zampini   }
2684a0ba757dSStefano Zampini 
26850c7d97c5SJed Brown   /* Dohrmann's notation: dofs are split into R (Remaining: all dofs but the vertices) and V (Vertices) */
26860c7d97c5SJed Brown   ierr = VecSet(pcis->vec1_N,one);CHKERRQ(ierr);
26870c7d97c5SJed Brown   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
26883b03a366Sstefano_zampini   for (i=0;i<n_vertices;i++) { array[ vertices[i] ] = zero; }
26893b03a366Sstefano_zampini   ierr = PetscMalloc(( pcis->n - n_vertices )*sizeof(PetscInt),&idx_R_local);CHKERRQ(ierr);
26900c7d97c5SJed Brown   for (i=0, n_R=0; i<pcis->n; i++) { if (array[i] == one) { idx_R_local[n_R] = i; n_R++; } }
26910c7d97c5SJed Brown   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2692e269702eSStefano Zampini   if(dbg_flag) {
26930c7d97c5SJed Brown     ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
26940c7d97c5SJed Brown     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
26950c7d97c5SJed Brown     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d local dimensions\n",PetscGlobalRank);CHKERRQ(ierr);
26960c7d97c5SJed Brown     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local_size = %d, dirichlet_size = %d, boundary_size = %d\n",pcis->n,n_D,n_B);CHKERRQ(ierr);
26973b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"r_size = %d, v_size = %d, constraints = %d, local_primal_size = %d\n",n_R,n_vertices,n_constraints,pcbddc->local_primal_size);CHKERRQ(ierr);
2698534831adSStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"pcbddc->n_vertices = %d, pcbddc->n_constraints = %d\n",pcbddc->n_vertices,pcbddc->n_constraints);CHKERRQ(ierr);
26990c7d97c5SJed Brown     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
27000c7d97c5SJed Brown   }
2701534831adSStefano Zampini 
27020c7d97c5SJed Brown   /* Allocate needed vectors */
2703534831adSStefano Zampini   ierr = VecDuplicate(pcis->vec1_global,&pcbddc->original_rhs);CHKERRQ(ierr);
27043972b0daSStefano Zampini   ierr = VecDuplicate(pcis->vec1_global,&pcbddc->temp_solution);CHKERRQ(ierr);
27050c7d97c5SJed Brown   ierr = VecDuplicate(pcis->vec1_D,&pcbddc->vec4_D);CHKERRQ(ierr);
27060c7d97c5SJed Brown   ierr = VecCreate(PETSC_COMM_SELF,&pcbddc->vec1_R);CHKERRQ(ierr);
27070c7d97c5SJed Brown   ierr = VecSetSizes(pcbddc->vec1_R,n_R,n_R);CHKERRQ(ierr);
27080c7d97c5SJed Brown   ierr = VecSetType(pcbddc->vec1_R,impVecType);CHKERRQ(ierr);
2709d49ef151SStefano Zampini   ierr = VecDuplicate(pcbddc->vec1_R,&pcbddc->vec2_R);CHKERRQ(ierr);
27100c7d97c5SJed Brown   ierr = VecCreate(PETSC_COMM_SELF,&pcbddc->vec1_P);CHKERRQ(ierr);
27110c7d97c5SJed Brown   ierr = VecSetSizes(pcbddc->vec1_P,pcbddc->local_primal_size,pcbddc->local_primal_size);CHKERRQ(ierr);
27120c7d97c5SJed Brown   ierr = VecSetType(pcbddc->vec1_P,impVecType);CHKERRQ(ierr);
27130c7d97c5SJed Brown 
27140c7d97c5SJed Brown   /* Creating some index sets needed  */
27150c7d97c5SJed Brown   /* For submatrices */
2716da1bb401SStefano Zampini   ierr = ISCreateGeneral(PETSC_COMM_SELF,n_R,idx_R_local,PETSC_OWN_POINTER,&is_R_local);CHKERRQ(ierr);
27173b03a366Sstefano_zampini   if(n_vertices)    {
2718da1bb401SStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,n_vertices,vertices,PETSC_OWN_POINTER,&is_V_local);CHKERRQ(ierr);
27193b03a366Sstefano_zampini   }
2720da1bb401SStefano Zampini   if(n_constraints) {
2721da1bb401SStefano Zampini     ierr = ISCreateStride(PETSC_COMM_SELF,n_constraints,n_vertices,1,&is_C_local);CHKERRQ(ierr);
2722da1bb401SStefano Zampini   }
2723da1bb401SStefano Zampini 
27240c7d97c5SJed Brown   /* For VecScatters pcbddc->R_to_B and (optionally) pcbddc->R_to_D */
27250c7d97c5SJed Brown   {
27260c7d97c5SJed Brown     PetscInt   *aux_array1;
27270c7d97c5SJed Brown     PetscInt   *aux_array2;
27280c7d97c5SJed Brown 
27293b03a366Sstefano_zampini     ierr = PetscMalloc( (pcis->n_B-n_vertices)*sizeof(PetscInt),&aux_array1);CHKERRQ(ierr);
27303b03a366Sstefano_zampini     ierr = PetscMalloc( (pcis->n_B-n_vertices)*sizeof(PetscInt),&aux_array2);CHKERRQ(ierr);
27310c7d97c5SJed Brown 
2732d49ef151SStefano Zampini     ierr = VecSet(pcis->vec1_global,zero);CHKERRQ(ierr);
27330c7d97c5SJed Brown     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
27340c7d97c5SJed Brown     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
27350c7d97c5SJed Brown     ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
27360c7d97c5SJed Brown     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
27370c7d97c5SJed Brown     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
27380c7d97c5SJed Brown     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
27390c7d97c5SJed Brown     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2740da1bb401SStefano Zampini     for (i=0, j=0; i<n_R; i++) { if (array[idx_R_local[i]] > one) { aux_array1[j] = i; j++; } }
27410c7d97c5SJed Brown     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2742da1bb401SStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_COPY_VALUES,&is_aux1);CHKERRQ(ierr);
27430c7d97c5SJed Brown     ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
2744da1bb401SStefano Zampini     for (i=0, j=0; i<n_B; i++) { if (array[i] > one) { aux_array2[j] = i; j++; } }
27453828260eSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
2746da1bb401SStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array2,PETSC_COPY_VALUES,&is_aux2);CHKERRQ(ierr);
27470c7d97c5SJed Brown     ierr = VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_B,is_aux2,&pcbddc->R_to_B);CHKERRQ(ierr);
27480c7d97c5SJed Brown     ierr = PetscFree(aux_array1);CHKERRQ(ierr);
27490c7d97c5SJed Brown     ierr = PetscFree(aux_array2);CHKERRQ(ierr);
27500c7d97c5SJed Brown     ierr = ISDestroy(&is_aux1);CHKERRQ(ierr);
27510c7d97c5SJed Brown     ierr = ISDestroy(&is_aux2);CHKERRQ(ierr);
27520c7d97c5SJed Brown 
2753e269702eSStefano Zampini     if(pcbddc->prec_type || dbg_flag ) {
27540c7d97c5SJed Brown       ierr = PetscMalloc(n_D*sizeof(PetscInt),&aux_array1);CHKERRQ(ierr);
27550c7d97c5SJed Brown       ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2756da1bb401SStefano Zampini       for (i=0, j=0; i<n_R; i++) { if (array[idx_R_local[i]] == one) { aux_array1[j] = i; j++; } }
27570c7d97c5SJed Brown       ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2758da1bb401SStefano Zampini       ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_COPY_VALUES,&is_aux1);CHKERRQ(ierr);
27590c7d97c5SJed Brown       ierr = VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_D,(IS)0,&pcbddc->R_to_D);CHKERRQ(ierr);
27600c7d97c5SJed Brown       ierr = PetscFree(aux_array1);CHKERRQ(ierr);
27610c7d97c5SJed Brown       ierr = ISDestroy(&is_aux1);CHKERRQ(ierr);
27620c7d97c5SJed Brown     }
27630c7d97c5SJed Brown   }
27640c7d97c5SJed Brown 
27650c7d97c5SJed Brown   /* Creating PC contexts for local Dirichlet and Neumann problems */
27660c7d97c5SJed Brown   {
27670c7d97c5SJed Brown     Mat  A_RR;
276853cdbc3dSStefano Zampini     PC   pc_temp;
27690c7d97c5SJed Brown     /* Matrix for Dirichlet problem is A_II -> we already have it from pcis.c code */
277053cdbc3dSStefano Zampini     ierr = KSPCreate(PETSC_COMM_SELF,&pcbddc->ksp_D);CHKERRQ(ierr);
277153cdbc3dSStefano Zampini     ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->ksp_D,(PetscObject)pc,1);CHKERRQ(ierr);
277253cdbc3dSStefano Zampini     ierr = KSPSetOperators(pcbddc->ksp_D,pcis->A_II,pcis->A_II,SAME_PRECONDITIONER);CHKERRQ(ierr);
277353cdbc3dSStefano Zampini     ierr = KSPSetType(pcbddc->ksp_D,KSPPREONLY);CHKERRQ(ierr);
2774da1bb401SStefano Zampini     ierr = KSPSetOptionsPrefix(pcbddc->ksp_D,"dirichlet_");CHKERRQ(ierr);
27750c7d97c5SJed Brown     /* default */
277653cdbc3dSStefano Zampini     ierr = KSPGetPC(pcbddc->ksp_D,&pc_temp);CHKERRQ(ierr);
277753cdbc3dSStefano Zampini     ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr);
27780c7d97c5SJed Brown     /* Allow user's customization */
277953cdbc3dSStefano Zampini     ierr = KSPSetFromOptions(pcbddc->ksp_D);CHKERRQ(ierr);
278053cdbc3dSStefano Zampini     /* Set Up KSP for Dirichlet problem of BDDC */
278153cdbc3dSStefano Zampini     ierr = KSPSetUp(pcbddc->ksp_D);CHKERRQ(ierr);
27823972b0daSStefano Zampini     /* set ksp_D into pcis data */
27833972b0daSStefano Zampini     ierr = KSPDestroy(&pcis->ksp_D);CHKERRQ(ierr);
27843972b0daSStefano Zampini     ierr = PetscObjectReference((PetscObject)pcbddc->ksp_D);CHKERRQ(ierr);
27853972b0daSStefano Zampini     pcis->ksp_D = pcbddc->ksp_D;
27860c7d97c5SJed Brown     /* Matrix for Neumann problem is A_RR -> we need to create it */
2787534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,is_R_local,is_R_local,MAT_INITIAL_MATRIX,&A_RR);CHKERRQ(ierr);
278853cdbc3dSStefano Zampini     ierr = KSPCreate(PETSC_COMM_SELF,&pcbddc->ksp_R);CHKERRQ(ierr);
278953cdbc3dSStefano Zampini     ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->ksp_R,(PetscObject)pc,1);CHKERRQ(ierr);
279053cdbc3dSStefano Zampini     ierr = KSPSetOperators(pcbddc->ksp_R,A_RR,A_RR,SAME_PRECONDITIONER);CHKERRQ(ierr);
279153cdbc3dSStefano Zampini     ierr = KSPSetType(pcbddc->ksp_R,KSPPREONLY);CHKERRQ(ierr);
2792da1bb401SStefano Zampini     ierr = KSPSetOptionsPrefix(pcbddc->ksp_R,"neumann_");CHKERRQ(ierr);
27930c7d97c5SJed Brown     /* default */
279453cdbc3dSStefano Zampini     ierr = KSPGetPC(pcbddc->ksp_R,&pc_temp);CHKERRQ(ierr);
279553cdbc3dSStefano Zampini     ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr);
27960c7d97c5SJed Brown     /* Allow user's customization */
279753cdbc3dSStefano Zampini     ierr = KSPSetFromOptions(pcbddc->ksp_R);CHKERRQ(ierr);
279853cdbc3dSStefano Zampini     /* Set Up KSP for Neumann problem of BDDC */
279953cdbc3dSStefano Zampini     ierr = KSPSetUp(pcbddc->ksp_R);CHKERRQ(ierr);
2800a0ba757dSStefano Zampini     /* check Dirichlet and Neumann solvers */
2801b76ba322SStefano Zampini     {
28020c7d97c5SJed Brown       Vec         temp_vec;
2803b76ba322SStefano Zampini       PetscReal   value;
2804b76ba322SStefano Zampini       PetscMPIInt use_exact,use_exact_reduced;
28050c7d97c5SJed Brown 
2806a0ba757dSStefano Zampini       ierr = VecDuplicate(pcis->vec1_D,&temp_vec);CHKERRQ(ierr);
2807a0ba757dSStefano Zampini       ierr = VecSetRandom(pcis->vec1_D,PETSC_NULL);CHKERRQ(ierr);
2808a0ba757dSStefano Zampini       ierr = MatMult(pcis->A_II,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
2809a0ba757dSStefano Zampini       ierr = KSPSolve(pcbddc->ksp_D,pcis->vec2_D,temp_vec);CHKERRQ(ierr);
2810a0ba757dSStefano Zampini       ierr = VecAXPY(temp_vec,m_one,pcis->vec1_D);CHKERRQ(ierr);
2811a0ba757dSStefano Zampini       ierr = VecNorm(temp_vec,NORM_INFINITY,&value);CHKERRQ(ierr);
2812b76ba322SStefano Zampini       use_exact = 1;
2813b76ba322SStefano Zampini       if(PetscAbsReal(value) > 1.e-4) {
2814b76ba322SStefano Zampini         use_exact = 0;
2815b76ba322SStefano Zampini       }
2816b76ba322SStefano Zampini       ierr = MPI_Allreduce(&use_exact,&use_exact_reduced,1,MPIU_INT,MPI_LAND,((PetscObject)pc)->comm);CHKERRQ(ierr);
2817b76ba322SStefano Zampini       pcbddc->use_exact_dirichlet = (PetscBool) use_exact_reduced;
2818a0ba757dSStefano Zampini       ierr = VecDestroy(&temp_vec);CHKERRQ(ierr);
2819b76ba322SStefano Zampini       if(dbg_flag) {
2820a0ba757dSStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
2821a0ba757dSStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
2822a0ba757dSStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"Checking solution of Dirichlet and Neumann problems\n");CHKERRQ(ierr);
2823a0ba757dSStefano Zampini         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d infinity error for Dirichlet solve = % 1.14e \n",PetscGlobalRank,value);CHKERRQ(ierr);
2824d49ef151SStefano Zampini         ierr = VecDuplicate(pcbddc->vec1_R,&temp_vec);CHKERRQ(ierr);
2825d49ef151SStefano Zampini         ierr = VecSetRandom(pcbddc->vec1_R,PETSC_NULL);CHKERRQ(ierr);
2826d49ef151SStefano Zampini         ierr = MatMult(A_RR,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
2827d49ef151SStefano Zampini         ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec2_R,temp_vec);CHKERRQ(ierr);
2828d49ef151SStefano Zampini         ierr = VecAXPY(temp_vec,m_one,pcbddc->vec1_R);CHKERRQ(ierr);
2829d49ef151SStefano Zampini         ierr = VecNorm(temp_vec,NORM_INFINITY,&value);CHKERRQ(ierr);
2830e269702eSStefano Zampini         ierr = VecDestroy(&temp_vec);CHKERRQ(ierr);
28310c7d97c5SJed Brown         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d infinity error for  Neumann  solve = % 1.14e \n",PetscGlobalRank,value);CHKERRQ(ierr);
2832d49ef151SStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
28330c7d97c5SJed Brown       }
2834b76ba322SStefano Zampini     }
28350c7d97c5SJed Brown     /* free Neumann problem's matrix */
28360c7d97c5SJed Brown     ierr = MatDestroy(&A_RR);CHKERRQ(ierr);
28370c7d97c5SJed Brown   }
28380c7d97c5SJed Brown 
28390c7d97c5SJed Brown   /* Assemble all remaining stuff needed to apply BDDC  */
28400c7d97c5SJed Brown   {
28410c7d97c5SJed Brown     Mat          A_RV,A_VR,A_VV;
28420c7d97c5SJed Brown     Mat          M1,M2;
28430c7d97c5SJed Brown     Mat          C_CR;
28443b03a366Sstefano_zampini     Mat          AUXMAT;
28450c7d97c5SJed Brown     Vec          vec1_C;
28460c7d97c5SJed Brown     Vec          vec2_C;
28470c7d97c5SJed Brown     Vec          vec1_V;
28480c7d97c5SJed Brown     Vec          vec2_V;
28490c7d97c5SJed Brown     PetscInt     *nnz;
28500c7d97c5SJed Brown     PetscInt     *auxindices;
285153cdbc3dSStefano Zampini     PetscInt     index;
28520c7d97c5SJed Brown     PetscScalar* array2;
28530c7d97c5SJed Brown     MatFactorInfo matinfo;
28540c7d97c5SJed Brown 
28550c7d97c5SJed Brown     /* Allocating some extra storage just to be safe */
28560c7d97c5SJed Brown     ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
28570c7d97c5SJed Brown     ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&auxindices);CHKERRQ(ierr);
28580c7d97c5SJed Brown     for(i=0;i<pcis->n;i++) {auxindices[i]=i;}
28590c7d97c5SJed Brown 
28600c7d97c5SJed Brown     /* some work vectors on vertices and/or constraints */
28613b03a366Sstefano_zampini     if(n_vertices) {
28620c7d97c5SJed Brown       ierr = VecCreate(PETSC_COMM_SELF,&vec1_V);CHKERRQ(ierr);
28633b03a366Sstefano_zampini       ierr = VecSetSizes(vec1_V,n_vertices,n_vertices);CHKERRQ(ierr);
28640c7d97c5SJed Brown       ierr = VecSetType(vec1_V,impVecType);CHKERRQ(ierr);
28650c7d97c5SJed Brown       ierr = VecDuplicate(vec1_V,&vec2_V);CHKERRQ(ierr);
28660c7d97c5SJed Brown     }
2867534831adSStefano Zampini     if(n_constraints) {
28680c7d97c5SJed Brown       ierr = VecCreate(PETSC_COMM_SELF,&vec1_C);CHKERRQ(ierr);
2869534831adSStefano Zampini       ierr = VecSetSizes(vec1_C,n_constraints,n_constraints);CHKERRQ(ierr);
28700c7d97c5SJed Brown       ierr = VecSetType(vec1_C,impVecType);CHKERRQ(ierr);
28710c7d97c5SJed Brown       ierr = VecDuplicate(vec1_C,&vec2_C);CHKERRQ(ierr);
28720c7d97c5SJed Brown       ierr = VecDuplicate(vec1_C,&pcbddc->vec1_C);CHKERRQ(ierr);
28730c7d97c5SJed Brown     }
28740c7d97c5SJed Brown     /* Precompute data needed for preprocessing and application of BDDC */
28753b03a366Sstefano_zampini     if(n_constraints) {
28760c7d97c5SJed Brown       ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->local_auxmat2);CHKERRQ(ierr);
28773b03a366Sstefano_zampini       ierr = MatSetSizes(pcbddc->local_auxmat2,n_R,n_constraints,n_R,n_constraints);CHKERRQ(ierr);
28780c7d97c5SJed Brown       ierr = MatSetType(pcbddc->local_auxmat2,impMatType);CHKERRQ(ierr);
28793b03a366Sstefano_zampini       ierr = MatSeqDenseSetPreallocation(pcbddc->local_auxmat2,PETSC_NULL);CHKERRQ(ierr);
28800c7d97c5SJed Brown 
288157a90decSStefano Zampini       /* Create Constraint matrix on R nodes: C_{CR}  */
288257a90decSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->ConstraintMatrix,is_C_local,is_R_local,MAT_INITIAL_MATRIX,&C_CR);CHKERRQ(ierr);
288357a90decSStefano Zampini       ierr = ISDestroy(&is_C_local);CHKERRQ(ierr);
288457a90decSStefano Zampini 
28850c7d97c5SJed Brown       /* Assemble local_auxmat2 = - A_{RR}^{-1} C^T_{CR} needed by BDDC application */
28863b03a366Sstefano_zampini       for(i=0;i<n_constraints;i++) {
28873b03a366Sstefano_zampini         ierr = VecSet(pcbddc->vec1_R,zero);CHKERRQ(ierr);
28883b03a366Sstefano_zampini         /* Get row of constraint matrix in R numbering */
288957a90decSStefano Zampini         ierr = VecGetArray(pcbddc->vec1_R,&array);CHKERRQ(ierr);
289057a90decSStefano Zampini         ierr = MatGetRow(C_CR,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
28913b03a366Sstefano_zampini         for(j=0;j<size_of_constraint;j++) { array[ row_cmat_indices[j] ] = - row_cmat_values[j]; }
289257a90decSStefano Zampini         ierr = MatRestoreRow(C_CR,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
289357a90decSStefano Zampini         ierr = VecRestoreArray(pcbddc->vec1_R,&array);CHKERRQ(ierr);
28943b03a366Sstefano_zampini         /* Solve for row of constraint matrix in R numbering */
289553cdbc3dSStefano Zampini         ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
28963b03a366Sstefano_zampini         /* Set values */
28970c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec2_R,&array);CHKERRQ(ierr);
28983b03a366Sstefano_zampini         ierr = MatSetValues(pcbddc->local_auxmat2,n_R,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
28990c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec2_R,&array);CHKERRQ(ierr);
29000c7d97c5SJed Brown       }
29010c7d97c5SJed Brown       ierr = MatAssemblyBegin(pcbddc->local_auxmat2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
29020c7d97c5SJed Brown       ierr = MatAssemblyEnd(pcbddc->local_auxmat2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
29030c7d97c5SJed Brown 
29040c7d97c5SJed Brown       /* Assemble AUXMAT = ( LUFactor )( -C_{CR} A_{RR}^{-1} C^T_{CR} )^{-1} */
29050c7d97c5SJed Brown       ierr = MatMatMult(C_CR,pcbddc->local_auxmat2,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&AUXMAT);CHKERRQ(ierr);
2906d49ef151SStefano Zampini       ierr = MatFactorInfoInitialize(&matinfo);CHKERRQ(ierr);
29073b03a366Sstefano_zampini       ierr = ISCreateStride(PETSC_COMM_SELF,n_constraints,0,1,&is_aux1);CHKERRQ(ierr);
29080c7d97c5SJed Brown       ierr = MatLUFactor(AUXMAT,is_aux1,is_aux1,&matinfo);CHKERRQ(ierr);
29090c7d97c5SJed Brown       ierr = ISDestroy(&is_aux1);CHKERRQ(ierr);
29100c7d97c5SJed Brown 
29113b03a366Sstefano_zampini       /* Assemble explicitly M1 = ( C_{CR} A_{RR}^{-1} C^T_{CR} )^{-1} needed in preproc  */
2912d49ef151SStefano Zampini       ierr = MatCreate(PETSC_COMM_SELF,&M1);CHKERRQ(ierr);
29133b03a366Sstefano_zampini       ierr = MatSetSizes(M1,n_constraints,n_constraints,n_constraints,n_constraints);CHKERRQ(ierr);
29140c7d97c5SJed Brown       ierr = MatSetType(M1,impMatType);CHKERRQ(ierr);
29153b03a366Sstefano_zampini       ierr = MatSeqDenseSetPreallocation(M1,PETSC_NULL);CHKERRQ(ierr);
29163b03a366Sstefano_zampini       for(i=0;i<n_constraints;i++) {
29170c7d97c5SJed Brown         ierr = VecSet(vec1_C,zero);CHKERRQ(ierr);
29180c7d97c5SJed Brown         ierr = VecSetValue(vec1_C,i,one,INSERT_VALUES);CHKERRQ(ierr);
29190c7d97c5SJed Brown         ierr = VecAssemblyBegin(vec1_C);CHKERRQ(ierr);
29200c7d97c5SJed Brown         ierr = VecAssemblyEnd(vec1_C);CHKERRQ(ierr);
29210c7d97c5SJed Brown         ierr = MatSolve(AUXMAT,vec1_C,vec2_C);CHKERRQ(ierr);
29220c7d97c5SJed Brown         ierr = VecScale(vec2_C,m_one);CHKERRQ(ierr);
29230c7d97c5SJed Brown         ierr = VecGetArray(vec2_C,&array);CHKERRQ(ierr);
29243b03a366Sstefano_zampini         ierr = MatSetValues(M1,n_constraints,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
29250c7d97c5SJed Brown         ierr = VecRestoreArray(vec2_C,&array);CHKERRQ(ierr);
29260c7d97c5SJed Brown       }
29270c7d97c5SJed Brown       ierr = MatAssemblyBegin(M1,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
29280c7d97c5SJed Brown       ierr = MatAssemblyEnd(M1,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
29290c7d97c5SJed Brown       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
29300c7d97c5SJed Brown       /* Assemble local_auxmat1 = M1*C_{CR} needed by BDDC application in KSP and in preproc */
29310c7d97c5SJed Brown       ierr = MatMatMult(M1,C_CR,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&pcbddc->local_auxmat1);CHKERRQ(ierr);
29320c7d97c5SJed Brown 
29330c7d97c5SJed Brown     }
29340c7d97c5SJed Brown 
29350c7d97c5SJed Brown     /* Get submatrices from subdomain matrix */
29363b03a366Sstefano_zampini     if(n_vertices){
2937534831adSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->local_mat,is_R_local,is_V_local,MAT_INITIAL_MATRIX,&A_RV);CHKERRQ(ierr);
2938534831adSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->local_mat,is_V_local,is_R_local,MAT_INITIAL_MATRIX,&A_VR);CHKERRQ(ierr);
2939534831adSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->local_mat,is_V_local,is_V_local,MAT_INITIAL_MATRIX,&A_VV);CHKERRQ(ierr);
29400c7d97c5SJed Brown       /* Assemble M2 = A_RR^{-1}A_RV */
2941d49ef151SStefano Zampini       ierr = MatCreate(PETSC_COMM_SELF,&M2);CHKERRQ(ierr);
29423b03a366Sstefano_zampini       ierr = MatSetSizes(M2,n_R,n_vertices,n_R,n_vertices);CHKERRQ(ierr);
29430c7d97c5SJed Brown       ierr = MatSetType(M2,impMatType);CHKERRQ(ierr);
29443b03a366Sstefano_zampini       ierr = MatSeqDenseSetPreallocation(M2,PETSC_NULL);CHKERRQ(ierr);
29453b03a366Sstefano_zampini       for(i=0;i<n_vertices;i++) {
29460c7d97c5SJed Brown         ierr = VecSet(vec1_V,zero);CHKERRQ(ierr);
29470c7d97c5SJed Brown         ierr = VecSetValue(vec1_V,i,one,INSERT_VALUES);CHKERRQ(ierr);
29480c7d97c5SJed Brown         ierr = VecAssemblyBegin(vec1_V);CHKERRQ(ierr);
29490c7d97c5SJed Brown         ierr = VecAssemblyEnd(vec1_V);CHKERRQ(ierr);
29500c7d97c5SJed Brown         ierr = MatMult(A_RV,vec1_V,pcbddc->vec1_R);CHKERRQ(ierr);
295153cdbc3dSStefano Zampini         ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
29520c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec2_R,&array);CHKERRQ(ierr);
29533b03a366Sstefano_zampini         ierr = MatSetValues(M2,n_R,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
29540c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec2_R,&array);CHKERRQ(ierr);
29550c7d97c5SJed Brown       }
29560c7d97c5SJed Brown       ierr = MatAssemblyBegin(M2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
29570c7d97c5SJed Brown       ierr = MatAssemblyEnd(M2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
29580c7d97c5SJed Brown     }
29590c7d97c5SJed Brown 
29600c7d97c5SJed Brown     /* Matrix of coarse basis functions (local) */
2961d49ef151SStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->coarse_phi_B);CHKERRQ(ierr);
29620c7d97c5SJed Brown     ierr = MatSetSizes(pcbddc->coarse_phi_B,n_B,pcbddc->local_primal_size,n_B,pcbddc->local_primal_size);CHKERRQ(ierr);
29630c7d97c5SJed Brown     ierr = MatSetType(pcbddc->coarse_phi_B,impMatType);CHKERRQ(ierr);
29643b03a366Sstefano_zampini     ierr = MatSeqDenseSetPreallocation(pcbddc->coarse_phi_B,PETSC_NULL);CHKERRQ(ierr);
2965e269702eSStefano Zampini     if(pcbddc->prec_type || dbg_flag ) {
2966d49ef151SStefano Zampini       ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->coarse_phi_D);CHKERRQ(ierr);
29670c7d97c5SJed Brown       ierr = MatSetSizes(pcbddc->coarse_phi_D,n_D,pcbddc->local_primal_size,n_D,pcbddc->local_primal_size);CHKERRQ(ierr);
29680c7d97c5SJed Brown       ierr = MatSetType(pcbddc->coarse_phi_D,impMatType);CHKERRQ(ierr);
29693b03a366Sstefano_zampini       ierr = MatSeqDenseSetPreallocation(pcbddc->coarse_phi_D,PETSC_NULL);CHKERRQ(ierr);
29700c7d97c5SJed Brown     }
29710c7d97c5SJed Brown 
2972e269702eSStefano Zampini     if(dbg_flag) {
29730c7d97c5SJed Brown       ierr = PetscMalloc( pcbddc->local_primal_size*sizeof(PetscScalar),&coarsefunctions_errors);CHKERRQ(ierr);
29740c7d97c5SJed Brown       ierr = PetscMalloc( pcbddc->local_primal_size*sizeof(PetscScalar),&constraints_errors);CHKERRQ(ierr);
29750c7d97c5SJed Brown     }
29763b03a366Sstefano_zampini     /* Subdomain contribution (Non-overlapping) to coarse matrix  */
29770c7d97c5SJed Brown     ierr = PetscMalloc ((pcbddc->local_primal_size)*(pcbddc->local_primal_size)*sizeof(PetscScalar),&coarse_submat_vals);CHKERRQ(ierr);
29780c7d97c5SJed Brown 
29790c7d97c5SJed Brown     /* We are now ready to evaluate coarse basis functions and subdomain contribution to coarse problem */
29803b03a366Sstefano_zampini     for(i=0;i<n_vertices;i++){
29810c7d97c5SJed Brown       ierr = VecSet(vec1_V,zero);CHKERRQ(ierr);
29820c7d97c5SJed Brown       ierr = VecSetValue(vec1_V,i,one,INSERT_VALUES);CHKERRQ(ierr);
29830c7d97c5SJed Brown       ierr = VecAssemblyBegin(vec1_V);CHKERRQ(ierr);
29840c7d97c5SJed Brown       ierr = VecAssemblyEnd(vec1_V);CHKERRQ(ierr);
29850c7d97c5SJed Brown       /* solution of saddle point problem */
29860c7d97c5SJed Brown       ierr = MatMult(M2,vec1_V,pcbddc->vec1_R);CHKERRQ(ierr);
29870c7d97c5SJed Brown       ierr = VecScale(pcbddc->vec1_R,m_one);CHKERRQ(ierr);
29883b03a366Sstefano_zampini       if(n_constraints) {
29890c7d97c5SJed Brown         ierr = MatMult(pcbddc->local_auxmat1,pcbddc->vec1_R,vec1_C);CHKERRQ(ierr);
29900c7d97c5SJed Brown         ierr = MatMultAdd(pcbddc->local_auxmat2,vec1_C,pcbddc->vec1_R,pcbddc->vec1_R);CHKERRQ(ierr);
29910c7d97c5SJed Brown         ierr = VecScale(vec1_C,m_one);CHKERRQ(ierr);
29920c7d97c5SJed Brown       }
29930c7d97c5SJed Brown       ierr = MatMult(A_VR,pcbddc->vec1_R,vec2_V);CHKERRQ(ierr);
29940c7d97c5SJed Brown       ierr = MatMultAdd(A_VV,vec1_V,vec2_V,vec2_V);CHKERRQ(ierr);
29950c7d97c5SJed Brown 
29960c7d97c5SJed Brown       /* Set values in coarse basis function and subdomain part of coarse_mat */
29970c7d97c5SJed Brown       /* coarse basis functions */
29980c7d97c5SJed Brown       ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr);
29990c7d97c5SJed Brown       ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
30000c7d97c5SJed Brown       ierr = VecScatterEnd  (pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
30010c7d97c5SJed Brown       ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
30023b03a366Sstefano_zampini       ierr = MatSetValues(pcbddc->coarse_phi_B,n_B,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
30030c7d97c5SJed Brown       ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
30040c7d97c5SJed Brown       ierr = MatSetValue(pcbddc->coarse_phi_B,idx_V_B[i],i,one,INSERT_VALUES);CHKERRQ(ierr);
3005e269702eSStefano Zampini       if( pcbddc->prec_type || dbg_flag  ) {
30060c7d97c5SJed Brown         ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
30070c7d97c5SJed Brown         ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
30080c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_D,&array);CHKERRQ(ierr);
30093b03a366Sstefano_zampini         ierr = MatSetValues(pcbddc->coarse_phi_D,n_D,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
30100c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_D,&array);CHKERRQ(ierr);
30110c7d97c5SJed Brown       }
30120c7d97c5SJed Brown       /* subdomain contribution to coarse matrix */
30130c7d97c5SJed Brown       ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
3014da1bb401SStefano Zampini       for(j=0;j<n_vertices;j++) { coarse_submat_vals[i*pcbddc->local_primal_size+j] = array[j]; } /* WARNING -> column major ordering */
30150c7d97c5SJed Brown       ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
30163b03a366Sstefano_zampini       if(n_constraints) {
30170c7d97c5SJed Brown         ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
3018da1bb401SStefano Zampini         for(j=0;j<n_constraints;j++) { coarse_submat_vals[i*pcbddc->local_primal_size+j+n_vertices] = array[j]; } /* WARNING -> column major ordering */
30190c7d97c5SJed Brown         ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
30200c7d97c5SJed Brown       }
30210c7d97c5SJed Brown 
3022e269702eSStefano Zampini       if( dbg_flag ) {
30230c7d97c5SJed Brown         /* assemble subdomain vector on nodes */
3024d49ef151SStefano Zampini         ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr);
30250c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
30260c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
30270c7d97c5SJed Brown         for(j=0;j<n_R;j++) { array[idx_R_local[j]] = array2[j]; }
30283b03a366Sstefano_zampini         array[ vertices[i] ] = one;
30290c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
30300c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
30310c7d97c5SJed Brown         /* assemble subdomain vector of lagrange multipliers (i.e. primal nodes) */
3032d49ef151SStefano Zampini         ierr = VecSet(pcbddc->vec1_P,zero);CHKERRQ(ierr);
30330c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
30340c7d97c5SJed Brown         ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
30353b03a366Sstefano_zampini         for(j=0;j<n_vertices;j++) { array2[j]=array[j]; }
30360c7d97c5SJed Brown         ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
30373b03a366Sstefano_zampini         if(n_constraints) {
30380c7d97c5SJed Brown           ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
30393b03a366Sstefano_zampini           for(j=0;j<n_constraints;j++) { array2[j+n_vertices]=array[j]; }
30400c7d97c5SJed Brown           ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
30410c7d97c5SJed Brown         }
30420c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
30430c7d97c5SJed Brown         ierr = VecScale(pcbddc->vec1_P,m_one);CHKERRQ(ierr);
30440c7d97c5SJed Brown         /* check saddle point solution */
3045534831adSStefano Zampini         ierr = MatMult(pcbddc->local_mat,pcis->vec1_N,pcis->vec2_N);CHKERRQ(ierr);
30463b03a366Sstefano_zampini         ierr = MatMultTransposeAdd(pcbddc->ConstraintMatrix,pcbddc->vec1_P,pcis->vec2_N,pcis->vec2_N);CHKERRQ(ierr);
30473b03a366Sstefano_zampini         ierr = VecNorm(pcis->vec2_N,NORM_INFINITY,&coarsefunctions_errors[i]);CHKERRQ(ierr);
30483b03a366Sstefano_zampini         ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr);
30490c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
30503b03a366Sstefano_zampini         array[i]=array[i]+m_one;  /* shift by the identity matrix */
30510c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
30523b03a366Sstefano_zampini         ierr = VecNorm(pcbddc->vec1_P,NORM_INFINITY,&constraints_errors[i]);CHKERRQ(ierr);
30530c7d97c5SJed Brown       }
30540c7d97c5SJed Brown     }
30550c7d97c5SJed Brown 
30563b03a366Sstefano_zampini     for(i=0;i<n_constraints;i++){
3057d49ef151SStefano Zampini       ierr = VecSet(vec2_C,zero);CHKERRQ(ierr);
30580c7d97c5SJed Brown       ierr = VecSetValue(vec2_C,i,m_one,INSERT_VALUES);CHKERRQ(ierr);
30590c7d97c5SJed Brown       ierr = VecAssemblyBegin(vec2_C);CHKERRQ(ierr);
30600c7d97c5SJed Brown       ierr = VecAssemblyEnd(vec2_C);CHKERRQ(ierr);
30610c7d97c5SJed Brown       /* solution of saddle point problem */
30620c7d97c5SJed Brown       ierr = MatMult(M1,vec2_C,vec1_C);CHKERRQ(ierr);
30630c7d97c5SJed Brown       ierr = MatMult(pcbddc->local_auxmat2,vec1_C,pcbddc->vec1_R);CHKERRQ(ierr);
30640c7d97c5SJed Brown       ierr = VecScale(vec1_C,m_one);CHKERRQ(ierr);
30653b03a366Sstefano_zampini       if(n_vertices) { ierr = MatMult(A_VR,pcbddc->vec1_R,vec2_V);CHKERRQ(ierr); }
30660c7d97c5SJed Brown       /* Set values in coarse basis function and subdomain part of coarse_mat */
30670c7d97c5SJed Brown       /* coarse basis functions */
30683b03a366Sstefano_zampini       index=i+n_vertices;
30690c7d97c5SJed Brown       ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr);
30700c7d97c5SJed Brown       ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
30710c7d97c5SJed Brown       ierr = VecScatterEnd  (pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
30720c7d97c5SJed Brown       ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
307353cdbc3dSStefano Zampini       ierr = MatSetValues(pcbddc->coarse_phi_B,n_B,auxindices,1,&index,array,INSERT_VALUES);CHKERRQ(ierr);
30740c7d97c5SJed Brown       ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
3075e269702eSStefano Zampini       if( pcbddc->prec_type || dbg_flag ) {
30760c7d97c5SJed Brown         ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
30770c7d97c5SJed Brown         ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
30780c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_D,&array);CHKERRQ(ierr);
307953cdbc3dSStefano Zampini         ierr = MatSetValues(pcbddc->coarse_phi_D,n_D,auxindices,1,&index,array,INSERT_VALUES);CHKERRQ(ierr);
30800c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_D,&array);CHKERRQ(ierr);
30810c7d97c5SJed Brown       }
30820c7d97c5SJed Brown       /* subdomain contribution to coarse matrix */
30833b03a366Sstefano_zampini       if(n_vertices) {
30840c7d97c5SJed Brown         ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
3085da1bb401SStefano Zampini         for(j=0;j<n_vertices;j++) {coarse_submat_vals[index*pcbddc->local_primal_size+j]=array[j];} /* WARNING -> column major ordering */
30860c7d97c5SJed Brown         ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
30870c7d97c5SJed Brown       }
30880c7d97c5SJed Brown       ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
3089da1bb401SStefano Zampini       for(j=0;j<n_constraints;j++) {coarse_submat_vals[index*pcbddc->local_primal_size+j+n_vertices]=array[j];} /* WARNING -> column major ordering */
30900c7d97c5SJed Brown       ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
30910c7d97c5SJed Brown 
3092e269702eSStefano Zampini       if( dbg_flag ) {
30930c7d97c5SJed Brown         /* assemble subdomain vector on nodes */
309453cdbc3dSStefano Zampini         ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr);
30950c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
30960c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
30970c7d97c5SJed Brown         for(j=0;j<n_R;j++){ array[ idx_R_local[j] ] = array2[j]; }
30980c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
30990c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
31000c7d97c5SJed Brown         /* assemble subdomain vector of lagrange multipliers */
310153cdbc3dSStefano Zampini         ierr = VecSet(pcbddc->vec1_P,zero);CHKERRQ(ierr);
31020c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
31033b03a366Sstefano_zampini         if( n_vertices) {
31040c7d97c5SJed Brown           ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
31053b03a366Sstefano_zampini           for(j=0;j<n_vertices;j++) {array2[j]=-array[j];}
31060c7d97c5SJed Brown           ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
31070c7d97c5SJed Brown         }
31080c7d97c5SJed Brown         ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
31093b03a366Sstefano_zampini         for(j=0;j<n_constraints;j++) {array2[j+n_vertices]=-array[j];}
31100c7d97c5SJed Brown         ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
31110c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
31123972b0daSStefano Zampini         /* check saddle point solution */
3113534831adSStefano Zampini         ierr = MatMult(pcbddc->local_mat,pcis->vec1_N,pcis->vec2_N);CHKERRQ(ierr);
31143b03a366Sstefano_zampini         ierr = MatMultTransposeAdd(pcbddc->ConstraintMatrix,pcbddc->vec1_P,pcis->vec2_N,pcis->vec2_N);CHKERRQ(ierr);
311553cdbc3dSStefano Zampini         ierr = VecNorm(pcis->vec2_N,NORM_INFINITY,&coarsefunctions_errors[index]);CHKERRQ(ierr);
31163b03a366Sstefano_zampini         ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr);
31170c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
311853cdbc3dSStefano Zampini         array[index]=array[index]+m_one; /* shift by the identity matrix */
31190c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
312053cdbc3dSStefano Zampini         ierr = VecNorm(pcbddc->vec1_P,NORM_INFINITY,&constraints_errors[index]);CHKERRQ(ierr);
31210c7d97c5SJed Brown       }
31220c7d97c5SJed Brown     }
31230c7d97c5SJed Brown     ierr = MatAssemblyBegin(pcbddc->coarse_phi_B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
31240c7d97c5SJed Brown     ierr = MatAssemblyEnd  (pcbddc->coarse_phi_B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
3125e269702eSStefano Zampini     if( pcbddc->prec_type || dbg_flag ) {
31260c7d97c5SJed Brown       ierr = MatAssemblyBegin(pcbddc->coarse_phi_D,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
31270c7d97c5SJed Brown       ierr = MatAssemblyEnd  (pcbddc->coarse_phi_D,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
31280c7d97c5SJed Brown     }
31290c7d97c5SJed Brown     /* Checking coarse_sub_mat and coarse basis functions */
31300c7d97c5SJed Brown     /* It should be \Phi^{(j)^T} A^{(j)} \Phi^{(j)}=coarse_sub_mat */
31319d2fce94SStefano Zampini     if(dbg_flag) {
31320c7d97c5SJed Brown 
31330c7d97c5SJed Brown       Mat coarse_sub_mat;
31340c7d97c5SJed Brown       Mat TM1,TM2,TM3,TM4;
31350c7d97c5SJed Brown       Mat coarse_phi_D,coarse_phi_B,A_II,A_BB,A_IB,A_BI;
3136a0ba757dSStefano Zampini       const MatType checkmattype=MATSEQAIJ;
31370c7d97c5SJed Brown       PetscScalar      value;
31380c7d97c5SJed Brown 
3139c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_II,checkmattype,MAT_INITIAL_MATRIX,&A_II);CHKERRQ(ierr);
3140c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_IB,checkmattype,MAT_INITIAL_MATRIX,&A_IB);CHKERRQ(ierr);
3141c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_BI,checkmattype,MAT_INITIAL_MATRIX,&A_BI);CHKERRQ(ierr);
3142c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_BB,checkmattype,MAT_INITIAL_MATRIX,&A_BB);CHKERRQ(ierr);
3143c042a7c3SStefano Zampini       ierr = MatConvert(pcbddc->coarse_phi_D,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_D);CHKERRQ(ierr);
3144c042a7c3SStefano Zampini       ierr = MatConvert(pcbddc->coarse_phi_B,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_B);CHKERRQ(ierr);
3145c042a7c3SStefano Zampini       ierr = MatCreateSeqDense(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_size,coarse_submat_vals,&coarse_sub_mat);CHKERRQ(ierr);
3146c042a7c3SStefano Zampini       ierr = MatConvert(coarse_sub_mat,checkmattype,MAT_REUSE_MATRIX,&coarse_sub_mat);CHKERRQ(ierr);
31470c7d97c5SJed Brown 
3148da1bb401SStefano Zampini       /*PetscViewer view_out;
3149da1bb401SStefano Zampini       PetscMPIInt myrank;
3150da1bb401SStefano Zampini       char filename[256];
3151da1bb401SStefano Zampini       MPI_Comm_rank(((PetscObject)pc)->comm,&myrank);
3152da1bb401SStefano Zampini       sprintf(filename,"coarsesubmat_%04d.m",myrank);
3153da1bb401SStefano Zampini       ierr = PetscViewerASCIIOpen(PETSC_COMM_SELF,filename,&view_out);CHKERRQ(ierr);
3154da1bb401SStefano Zampini       ierr = PetscViewerSetFormat(view_out,PETSC_VIEWER_ASCII_MATLAB);CHKERRQ(ierr);
3155da1bb401SStefano Zampini       ierr = MatView(coarse_sub_mat,view_out);CHKERRQ(ierr);
3156da1bb401SStefano Zampini       ierr = PetscViewerDestroy(&view_out);CHKERRQ(ierr);*/
3157da1bb401SStefano Zampini 
31580c7d97c5SJed Brown       ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
31590c7d97c5SJed Brown       ierr = PetscViewerASCIIPrintf(viewer,"Check coarse sub mat and local basis functions\n");CHKERRQ(ierr);
31600c7d97c5SJed Brown       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
316153cdbc3dSStefano Zampini       ierr = MatPtAP(A_II,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&TM1);CHKERRQ(ierr);
316253cdbc3dSStefano Zampini       ierr = MatPtAP(A_BB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&TM2);CHKERRQ(ierr);
316353cdbc3dSStefano Zampini       ierr = MatMatMult(A_IB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr);
3164c042a7c3SStefano Zampini       ierr = MatTransposeMatMult(coarse_phi_D,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM3);CHKERRQ(ierr);
316553cdbc3dSStefano Zampini       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
316653cdbc3dSStefano Zampini       ierr = MatMatMult(A_BI,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr);
3167c042a7c3SStefano Zampini       ierr = MatTransposeMatMult(coarse_phi_B,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM4);CHKERRQ(ierr);
316853cdbc3dSStefano Zampini       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
316953cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,one,TM2,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
317053cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,one,TM3,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
317153cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,one,TM4,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
317253cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,m_one,coarse_sub_mat,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
317353cdbc3dSStefano Zampini       ierr = MatNorm(TM1,NORM_INFINITY,&value);CHKERRQ(ierr);
31740c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"----------------------------------\n");CHKERRQ(ierr);
31750c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d \n",PetscGlobalRank);CHKERRQ(ierr);
31760c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"matrix error = % 1.14e\n",value);CHKERRQ(ierr);
31770c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"coarse functions errors\n");CHKERRQ(ierr);
317853cdbc3dSStefano Zampini       for(i=0;i<pcbddc->local_primal_size;i++) { ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local %02d-th function error = % 1.14e\n",i,coarsefunctions_errors[i]);CHKERRQ(ierr); }
31790c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"constraints errors\n");CHKERRQ(ierr);
318053cdbc3dSStefano Zampini       for(i=0;i<pcbddc->local_primal_size;i++) { ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local %02d-th function error = % 1.14e\n",i,constraints_errors[i]);CHKERRQ(ierr); }
31810c7d97c5SJed Brown       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
318253cdbc3dSStefano Zampini       ierr = MatDestroy(&A_II);CHKERRQ(ierr);
318353cdbc3dSStefano Zampini       ierr = MatDestroy(&A_BB);CHKERRQ(ierr);
318453cdbc3dSStefano Zampini       ierr = MatDestroy(&A_IB);CHKERRQ(ierr);
318553cdbc3dSStefano Zampini       ierr = MatDestroy(&A_BI);CHKERRQ(ierr);
318653cdbc3dSStefano Zampini       ierr = MatDestroy(&TM1);CHKERRQ(ierr);
318753cdbc3dSStefano Zampini       ierr = MatDestroy(&TM2);CHKERRQ(ierr);
318853cdbc3dSStefano Zampini       ierr = MatDestroy(&TM3);CHKERRQ(ierr);
318953cdbc3dSStefano Zampini       ierr = MatDestroy(&TM4);CHKERRQ(ierr);
319053cdbc3dSStefano Zampini       ierr = MatDestroy(&coarse_phi_D);CHKERRQ(ierr);
319153cdbc3dSStefano Zampini       ierr = MatDestroy(&coarse_sub_mat);CHKERRQ(ierr);
319253cdbc3dSStefano Zampini       ierr = MatDestroy(&coarse_phi_B);CHKERRQ(ierr);
31930c7d97c5SJed Brown       ierr = PetscFree(coarsefunctions_errors);CHKERRQ(ierr);
31940c7d97c5SJed Brown       ierr = PetscFree(constraints_errors);CHKERRQ(ierr);
31950c7d97c5SJed Brown     }
31960c7d97c5SJed Brown 
31970c7d97c5SJed Brown     /* create coarse matrix and data structures for message passing associated with the actual choice of coarse problem type */
31980c7d97c5SJed Brown     ierr = PCBDDCSetupCoarseEnvironment(pc,coarse_submat_vals);CHKERRQ(ierr);
31990c7d97c5SJed Brown     /* free memory */
32000c7d97c5SJed Brown     ierr = PetscFree(coarse_submat_vals);CHKERRQ(ierr);
32010c7d97c5SJed Brown     ierr = PetscFree(auxindices);CHKERRQ(ierr);
32020c7d97c5SJed Brown     ierr = PetscFree(nnz);CHKERRQ(ierr);
32033b03a366Sstefano_zampini     if(n_vertices) {
32040c7d97c5SJed Brown       ierr = VecDestroy(&vec1_V);CHKERRQ(ierr);
32050c7d97c5SJed Brown       ierr = VecDestroy(&vec2_V);CHKERRQ(ierr);
32060c7d97c5SJed Brown       ierr = MatDestroy(&M2);CHKERRQ(ierr);
32070c7d97c5SJed Brown       ierr = MatDestroy(&A_RV);CHKERRQ(ierr);
32080c7d97c5SJed Brown       ierr = MatDestroy(&A_VR);CHKERRQ(ierr);
32090c7d97c5SJed Brown       ierr = MatDestroy(&A_VV);CHKERRQ(ierr);
32100c7d97c5SJed Brown     }
3211534831adSStefano Zampini     if(n_constraints) {
32120c7d97c5SJed Brown       ierr = VecDestroy(&vec1_C);CHKERRQ(ierr);
32130c7d97c5SJed Brown       ierr = VecDestroy(&vec2_C);CHKERRQ(ierr);
32140c7d97c5SJed Brown       ierr = MatDestroy(&M1);CHKERRQ(ierr);
32150c7d97c5SJed Brown       ierr = MatDestroy(&C_CR);CHKERRQ(ierr);
32160c7d97c5SJed Brown     }
32170c7d97c5SJed Brown   }
32180c7d97c5SJed Brown   /* free memory */
32193b03a366Sstefano_zampini   if(n_vertices) {
32200c7d97c5SJed Brown     ierr = PetscFree(idx_V_B);CHKERRQ(ierr);
32210c7d97c5SJed Brown     ierr = ISDestroy(&is_V_local);CHKERRQ(ierr);
32220c7d97c5SJed Brown   }
32230c7d97c5SJed Brown   ierr = ISDestroy(&is_R_local);CHKERRQ(ierr);
32240c7d97c5SJed Brown 
32250c7d97c5SJed Brown   PetscFunctionReturn(0);
32260c7d97c5SJed Brown }
32270c7d97c5SJed Brown 
32280c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
32290c7d97c5SJed Brown 
32300c7d97c5SJed Brown #undef __FUNCT__
32310c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetupCoarseEnvironment"
323253cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetupCoarseEnvironment(PC pc,PetscScalar* coarse_submat_vals)
32330c7d97c5SJed Brown {
32340c7d97c5SJed Brown 
32350c7d97c5SJed Brown 
32360c7d97c5SJed Brown   Mat_IS    *matis    = (Mat_IS*)pc->pmat->data;
32370c7d97c5SJed Brown   PC_BDDC   *pcbddc   = (PC_BDDC*)pc->data;
32380c7d97c5SJed Brown   PC_IS     *pcis     = (PC_IS*)pc->data;
32390c7d97c5SJed Brown   MPI_Comm  prec_comm = ((PetscObject)pc)->comm;
32400c7d97c5SJed Brown   MPI_Comm  coarse_comm;
32410c7d97c5SJed Brown 
32420c7d97c5SJed Brown   /* common to all choices */
32430c7d97c5SJed Brown   PetscScalar *temp_coarse_mat_vals;
32440c7d97c5SJed Brown   PetscScalar *ins_coarse_mat_vals;
32450c7d97c5SJed Brown   PetscInt    *ins_local_primal_indices;
32460c7d97c5SJed Brown   PetscMPIInt *localsizes2,*localdispl2;
32470c7d97c5SJed Brown   PetscMPIInt size_prec_comm;
32480c7d97c5SJed Brown   PetscMPIInt rank_prec_comm;
32490c7d97c5SJed Brown   PetscMPIInt active_rank=MPI_PROC_NULL;
32500c7d97c5SJed Brown   PetscMPIInt master_proc=0;
32510c7d97c5SJed Brown   PetscInt    ins_local_primal_size;
32520c7d97c5SJed Brown   /* specific to MULTILEVEL_BDDC */
32530c7d97c5SJed Brown   PetscMPIInt *ranks_recv;
32540c7d97c5SJed Brown   PetscMPIInt count_recv=0;
32550c7d97c5SJed Brown   PetscMPIInt rank_coarse_proc_send_to;
32560c7d97c5SJed Brown   PetscMPIInt coarse_color = MPI_UNDEFINED;
32570c7d97c5SJed Brown   ISLocalToGlobalMapping coarse_ISLG;
32580c7d97c5SJed Brown   /* some other variables */
32590c7d97c5SJed Brown   PetscErrorCode ierr;
32600c7d97c5SJed Brown   const MatType coarse_mat_type;
32610c7d97c5SJed Brown   const PCType  coarse_pc_type;
326253cdbc3dSStefano Zampini   const KSPType coarse_ksp_type;
326353cdbc3dSStefano Zampini   PC pc_temp;
32640c7d97c5SJed Brown   PetscInt i,j,k,bs;
32653b03a366Sstefano_zampini   PetscInt max_it_coarse_ksp=1;  /* don't increase this value */
3266e269702eSStefano Zampini   /* verbose output viewer */
3267e269702eSStefano Zampini   PetscViewer viewer=pcbddc->dbg_viewer;
3268e269702eSStefano Zampini   PetscBool   dbg_flag=pcbddc->dbg_flag;
3269*142dfd88SStefano Zampini 
3270ea7e1babSStefano Zampini   PetscInt      offset,offset2;
3271*142dfd88SStefano Zampini   PetscMPIInt   im_active=0;
3272*142dfd88SStefano Zampini   PetscMPIInt   *auxglobal_primal;
3273*142dfd88SStefano Zampini 
3274*142dfd88SStefano Zampini   PetscBool     setsym,issym=PETSC_FALSE;
32750c7d97c5SJed Brown 
32760c7d97c5SJed Brown   PetscFunctionBegin;
32770c7d97c5SJed Brown   ins_local_primal_indices = 0;
32780c7d97c5SJed Brown   ins_coarse_mat_vals      = 0;
32790c7d97c5SJed Brown   localsizes2              = 0;
32800c7d97c5SJed Brown   localdispl2              = 0;
32810c7d97c5SJed Brown   temp_coarse_mat_vals     = 0;
32820c7d97c5SJed Brown   coarse_ISLG              = 0;
32830c7d97c5SJed Brown 
328453cdbc3dSStefano Zampini   ierr = MPI_Comm_size(prec_comm,&size_prec_comm);CHKERRQ(ierr);
328553cdbc3dSStefano Zampini   ierr = MPI_Comm_rank(prec_comm,&rank_prec_comm);CHKERRQ(ierr);
32860c7d97c5SJed Brown   ierr = MatGetBlockSize(matis->A,&bs);CHKERRQ(ierr);
3287*142dfd88SStefano Zampini   ierr = MatIsSymmetricKnown(pc->pmat,&setsym,&issym);CHKERRQ(ierr);
3288*142dfd88SStefano Zampini 
3289*142dfd88SStefano Zampini   if(pcis->n) { im_active = 1; }
3290*142dfd88SStefano Zampini   ierr = MPI_Allreduce(&im_active,&pcbddc->active_procs,1,MPIU_INT,MPI_SUM,prec_comm);CHKERRQ(ierr);
32910c7d97c5SJed Brown 
3292ffe5efe1SStefano Zampini   /* adapt coarse problem type */
3293*142dfd88SStefano Zampini   if(pcbddc->coarse_problem_type == MULTILEVEL_BDDC && (pcbddc->active_procs/pcbddc->coarsening_ratio) < 2 ) {
3294*142dfd88SStefano Zampini     if(dbg_flag) {
3295*142dfd88SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Not enough active processes on level. Parallel direct solve\n");CHKERRQ(ierr);
3296*142dfd88SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
3297*142dfd88SStefano Zampini     }
3298ffe5efe1SStefano Zampini     pcbddc->coarse_problem_type = PARALLEL_BDDC;
3299*142dfd88SStefano Zampini   }
3300ffe5efe1SStefano Zampini 
3301beed3852SStefano Zampini   /* Assign global numbering to coarse dofs */
3302beed3852SStefano Zampini   {
3303a0ba757dSStefano Zampini     PetscScalar    one=1.,zero=0.;
3304beed3852SStefano Zampini     PetscScalar    *array;
3305beed3852SStefano Zampini     PetscMPIInt    *auxlocal_primal;
3306beed3852SStefano Zampini     PetscMPIInt    *all_auxglobal_primal;
3307beed3852SStefano Zampini     PetscMPIInt    mpi_local_primal_size = (PetscMPIInt)pcbddc->local_primal_size;
3308da1bb401SStefano Zampini     PetscInt       *row_cmat_indices;
33093b03a366Sstefano_zampini     PetscInt       size_of_constraint;
3310da1bb401SStefano Zampini     PetscScalar    coarsesum;
3311beed3852SStefano Zampini 
3312beed3852SStefano Zampini     /* Construct needed data structures for message passing */
3313beed3852SStefano Zampini     ierr = PetscMalloc(mpi_local_primal_size*sizeof(PetscMPIInt),&pcbddc->local_primal_indices);CHKERRQ(ierr);
3314ffe5efe1SStefano Zampini     j = 0;
3315*142dfd88SStefano Zampini     if(rank_prec_comm == 0 || pcbddc->coarse_problem_type == REPLICATED_BDDC || pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
3316ffe5efe1SStefano Zampini       j = size_prec_comm;
3317ffe5efe1SStefano Zampini     }
3318ffe5efe1SStefano Zampini     ierr = PetscMalloc(j*sizeof(PetscMPIInt),&pcbddc->local_primal_sizes);CHKERRQ(ierr);
3319ffe5efe1SStefano Zampini     ierr = PetscMalloc(j*sizeof(PetscMPIInt),&pcbddc->local_primal_displacements);CHKERRQ(ierr);
3320beed3852SStefano Zampini     /* Gather local_primal_size information for all processes  */
3321*142dfd88SStefano Zampini     if(pcbddc->coarse_problem_type == REPLICATED_BDDC || pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
33225619798eSStefano Zampini       ierr = MPI_Allgather(&mpi_local_primal_size,1,MPIU_INT,&pcbddc->local_primal_sizes[0],1,MPIU_INT,prec_comm);CHKERRQ(ierr);
3323ffe5efe1SStefano Zampini     } else {
3324ffe5efe1SStefano Zampini       ierr = MPI_Gather(&mpi_local_primal_size,1,MPIU_INT,&pcbddc->local_primal_sizes[0],1,MPIU_INT,0,prec_comm);CHKERRQ(ierr);
3325ffe5efe1SStefano Zampini     }
3326beed3852SStefano Zampini     pcbddc->replicated_primal_size = 0;
3327ffe5efe1SStefano Zampini     for (i=0; i<j; i++) {
3328beed3852SStefano Zampini       pcbddc->local_primal_displacements[i] = pcbddc->replicated_primal_size ;
3329beed3852SStefano Zampini       pcbddc->replicated_primal_size += pcbddc->local_primal_sizes[i];
3330beed3852SStefano Zampini     }
33315619798eSStefano Zampini     if(rank_prec_comm == 0) {
3332beed3852SStefano Zampini       /* allocate some auxiliary space */
3333beed3852SStefano Zampini       ierr = PetscMalloc(pcbddc->replicated_primal_size*sizeof(*all_auxglobal_primal),&all_auxglobal_primal);CHKERRQ(ierr);
3334beed3852SStefano Zampini     }
3335beed3852SStefano Zampini     ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscMPIInt),&auxlocal_primal);CHKERRQ(ierr);
3336beed3852SStefano Zampini     ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscMPIInt),&auxglobal_primal);CHKERRQ(ierr);
3337beed3852SStefano Zampini 
3338da1bb401SStefano Zampini     /* First let's count coarse dofs.
3339beed3852SStefano Zampini        This code fragment assumes that the number of local constraints per connected component
3340beed3852SStefano Zampini        is not greater than the number of nodes defined for the connected component
3341beed3852SStefano Zampini        (otherwise we will surely have linear dependence between constraints and thus a singular coarse problem) */
33423b03a366Sstefano_zampini     /* auxlocal_primal      : primal indices in local nodes numbering (internal and interface) with complete queue sorted by global ordering */
3343beed3852SStefano Zampini     ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr);
3344beed3852SStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3345da1bb401SStefano Zampini     for(i=0;i<pcbddc->local_primal_size;i++) {
3346da1bb401SStefano Zampini       ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
33473b03a366Sstefano_zampini       for (j=0; j<size_of_constraint; j++) {
33483b03a366Sstefano_zampini         k = row_cmat_indices[j];
3349beed3852SStefano Zampini         if( array[k] == zero ) {
3350beed3852SStefano Zampini           array[k] = one;
3351da1bb401SStefano Zampini           auxlocal_primal[i] = k;
3352beed3852SStefano Zampini           break;
3353beed3852SStefano Zampini         }
3354beed3852SStefano Zampini       }
3355da1bb401SStefano Zampini       ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
3356beed3852SStefano Zampini     }
3357beed3852SStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3358da1bb401SStefano Zampini     ierr = VecSet(pcis->vec1_global,zero);CHKERRQ(ierr);
3359da1bb401SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3360da1bb401SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3361da1bb401SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3362da1bb401SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3363da1bb401SStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3364*142dfd88SStefano Zampini     for(i=0;i<pcis->n;i++) { if( PetscAbsScalar(array[i]) > zero) array[i] = one/array[i]; }
3365da1bb401SStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3366da1bb401SStefano Zampini     ierr = VecSet(pcis->vec1_global,zero);CHKERRQ(ierr);
3367da1bb401SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3368da1bb401SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3369da1bb401SStefano Zampini     ierr = VecSum(pcis->vec1_global,&coarsesum);CHKERRQ(ierr);
3370da1bb401SStefano Zampini     pcbddc->coarse_size = (PetscInt) coarsesum;
3371a0ba757dSStefano Zampini 
3372beed3852SStefano Zampini     /* Now assign them a global numbering */
3373beed3852SStefano Zampini     /* auxglobal_primal contains indices in global nodes numbering (internal and interface) */
3374beed3852SStefano Zampini     ierr = ISLocalToGlobalMappingApply(matis->mapping,pcbddc->local_primal_size,auxlocal_primal,auxglobal_primal);CHKERRQ(ierr);
3375*142dfd88SStefano Zampini     ierr = PetscFree(auxlocal_primal);CHKERRQ(ierr);
3376beed3852SStefano Zampini     /* all_auxglobal_primal contains all primal nodes indices in global nodes numbering (internal and interface) */
3377beed3852SStefano Zampini     ierr = MPI_Gatherv(&auxglobal_primal[0],pcbddc->local_primal_size,MPIU_INT,&all_auxglobal_primal[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,0,prec_comm);CHKERRQ(ierr);
3378*142dfd88SStefano Zampini     ierr = PetscFree(auxglobal_primal);CHKERRQ(ierr);
3379beed3852SStefano Zampini 
3380beed3852SStefano Zampini     /* After this block all_auxglobal_primal should contain one copy of each primal node's indices in global nodes numbering */
3381beed3852SStefano Zampini     if(rank_prec_comm==0) {
338217d7d925SStefano Zampini       j=pcbddc->replicated_primal_size;
3383*142dfd88SStefano Zampini       ierr = PetscMalloc(j*sizeof(PetscMPIInt),&auxglobal_primal);CHKERRQ(ierr);
3384*142dfd88SStefano Zampini       ierr = PetscMemcpy(auxglobal_primal,all_auxglobal_primal,j*sizeof(PetscMPIInt));CHKERRQ(ierr);
338517d7d925SStefano Zampini       ierr = PetscSortRemoveDupsMPIInt(&j,all_auxglobal_primal);CHKERRQ(ierr);
3386*142dfd88SStefano Zampini       for(j=0;j<size_prec_comm;j++) {
3387*142dfd88SStefano Zampini         for(i=0;i<pcbddc->local_primal_sizes[j];i++) {
3388beed3852SStefano Zampini           k=0;
3389*142dfd88SStefano Zampini           while( all_auxglobal_primal[k] != auxglobal_primal[i+pcbddc->local_primal_displacements[j]] ) { k++;}
3390*142dfd88SStefano Zampini           auxglobal_primal[i+pcbddc->local_primal_displacements[j]]=k;
3391beed3852SStefano Zampini         }
3392e269702eSStefano Zampini       }
3393beed3852SStefano Zampini       ierr = PetscFree(all_auxglobal_primal);CHKERRQ(ierr);
3394e269702eSStefano Zampini     }
3395*142dfd88SStefano Zampini     ierr = MPI_Scatterv(auxglobal_primal,pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,
3396*142dfd88SStefano Zampini                         pcbddc->local_primal_indices,pcbddc->local_primal_size,MPIU_INT,0,prec_comm);
3397*142dfd88SStefano Zampini   }
3398beed3852SStefano Zampini 
33990c7d97c5SJed Brown   switch(pcbddc->coarse_problem_type){
34000c7d97c5SJed Brown 
3401da1bb401SStefano Zampini     case(MULTILEVEL_BDDC):   /* we define a coarse mesh where subdomains are elements */
34020c7d97c5SJed Brown     {
34030c7d97c5SJed Brown       /* we need additional variables */
34040c7d97c5SJed Brown       MetisInt   n_subdomains,n_parts,objval,ncon,faces_nvtxs;
34050c7d97c5SJed Brown       MetisInt   *metis_coarse_subdivision;
34060c7d97c5SJed Brown       MetisInt   options[METIS_NOPTIONS];
34070c7d97c5SJed Brown       PetscMPIInt size_coarse_comm,rank_coarse_comm;
34080c7d97c5SJed Brown       PetscMPIInt procs_jumps_coarse_comm;
34090c7d97c5SJed Brown       PetscMPIInt *coarse_subdivision;
34100c7d97c5SJed Brown       PetscMPIInt *total_count_recv;
34110c7d97c5SJed Brown       PetscMPIInt *total_ranks_recv;
34120c7d97c5SJed Brown       PetscMPIInt *displacements_recv;
34130c7d97c5SJed Brown       PetscMPIInt *my_faces_connectivity;
34140c7d97c5SJed Brown       PetscMPIInt *petsc_faces_adjncy;
34150c7d97c5SJed Brown       MetisInt    *faces_adjncy;
34160c7d97c5SJed Brown       MetisInt    *faces_xadj;
34170c7d97c5SJed Brown       PetscMPIInt *number_of_faces;
34180c7d97c5SJed Brown       PetscMPIInt *faces_displacements;
34190c7d97c5SJed Brown       PetscInt    *array_int;
34200c7d97c5SJed Brown       PetscMPIInt my_faces=0;
34210c7d97c5SJed Brown       PetscMPIInt total_faces=0;
34223828260eSStefano Zampini       PetscInt    ranks_stretching_ratio;
34230c7d97c5SJed Brown 
34240c7d97c5SJed Brown       /* define some quantities */
34250c7d97c5SJed Brown       pcbddc->coarse_communications_type = SCATTERS_BDDC;
34260c7d97c5SJed Brown       coarse_mat_type = MATIS;
34270c7d97c5SJed Brown       coarse_pc_type  = PCBDDC;
3428*142dfd88SStefano Zampini       coarse_ksp_type = KSPRICHARDSON;
34290c7d97c5SJed Brown 
34300c7d97c5SJed Brown       /* details of coarse decomposition */
34310c7d97c5SJed Brown       n_subdomains = pcbddc->active_procs;
34320c7d97c5SJed Brown       n_parts      = n_subdomains/pcbddc->coarsening_ratio;
34333828260eSStefano Zampini       ranks_stretching_ratio = size_prec_comm/pcbddc->active_procs;
34343828260eSStefano Zampini       procs_jumps_coarse_comm = pcbddc->coarsening_ratio*ranks_stretching_ratio;
34353828260eSStefano Zampini 
3436da1bb401SStefano Zampini       /*printf("Coarse algorithm details: \n");
3437da1bb401SStefano Zampini       printf("n_subdomains %d, n_parts %d\nstretch %d,jumps %d,coarse_ratio %d\nlevel should be log_%d(%d)\n",n_subdomains,n_parts,ranks_stretching_ratio,procs_jumps_coarse_comm,pcbddc->coarsening_ratio,pcbddc->coarsening_ratio,(ranks_stretching_ratio/pcbddc->coarsening_ratio+1));*/
34380c7d97c5SJed Brown 
34390c7d97c5SJed Brown       /* build CSR graph of subdomains' connectivity through faces */
34400c7d97c5SJed Brown       ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&array_int);CHKERRQ(ierr);
34413828260eSStefano Zampini       ierr = PetscMemzero(array_int,pcis->n*sizeof(PetscInt));CHKERRQ(ierr);
34420c7d97c5SJed Brown       for(i=1;i<pcis->n_neigh;i++){/* i=1 so I don't count myself -> faces nodes counts to 1 */
34430c7d97c5SJed Brown         for(j=0;j<pcis->n_shared[i];j++){
34440c7d97c5SJed Brown           array_int[ pcis->shared[i][j] ]+=1;
34450c7d97c5SJed Brown         }
34460c7d97c5SJed Brown       }
34470c7d97c5SJed Brown       for(i=1;i<pcis->n_neigh;i++){
34480c7d97c5SJed Brown         for(j=0;j<pcis->n_shared[i];j++){
34490c7d97c5SJed Brown           if(array_int[ pcis->shared[i][j] ] == 1 ){
34500c7d97c5SJed Brown             my_faces++;
34510c7d97c5SJed Brown             break;
34520c7d97c5SJed Brown           }
34530c7d97c5SJed Brown         }
34540c7d97c5SJed Brown       }
34550c7d97c5SJed Brown 
345653cdbc3dSStefano Zampini       ierr = MPI_Reduce(&my_faces,&total_faces,1,MPIU_INT,MPI_SUM,master_proc,prec_comm);CHKERRQ(ierr);
34570c7d97c5SJed Brown       ierr = PetscMalloc (my_faces*sizeof(PetscInt),&my_faces_connectivity);CHKERRQ(ierr);
34580c7d97c5SJed Brown       my_faces=0;
34590c7d97c5SJed Brown       for(i=1;i<pcis->n_neigh;i++){
34600c7d97c5SJed Brown         for(j=0;j<pcis->n_shared[i];j++){
34610c7d97c5SJed Brown           if(array_int[ pcis->shared[i][j] ] == 1 ){
34620c7d97c5SJed Brown             my_faces_connectivity[my_faces]=pcis->neigh[i];
34630c7d97c5SJed Brown             my_faces++;
34640c7d97c5SJed Brown             break;
34650c7d97c5SJed Brown           }
34660c7d97c5SJed Brown         }
34670c7d97c5SJed Brown       }
34680c7d97c5SJed Brown       if(rank_prec_comm == master_proc) {
34690c7d97c5SJed Brown         ierr = PetscMalloc (total_faces*sizeof(PetscMPIInt),&petsc_faces_adjncy);CHKERRQ(ierr);
34700c7d97c5SJed Brown         ierr = PetscMalloc (size_prec_comm*sizeof(PetscMPIInt),&number_of_faces);CHKERRQ(ierr);
34710c7d97c5SJed Brown         ierr = PetscMalloc (total_faces*sizeof(MetisInt),&faces_adjncy);CHKERRQ(ierr);
34720c7d97c5SJed Brown         ierr = PetscMalloc ((n_subdomains+1)*sizeof(MetisInt),&faces_xadj);CHKERRQ(ierr);
34730c7d97c5SJed Brown         ierr = PetscMalloc ((size_prec_comm+1)*sizeof(PetscMPIInt),&faces_displacements);CHKERRQ(ierr);
34740c7d97c5SJed Brown       }
347553cdbc3dSStefano Zampini       ierr = MPI_Gather(&my_faces,1,MPIU_INT,&number_of_faces[0],1,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
34760c7d97c5SJed Brown       if(rank_prec_comm == master_proc) {
34770c7d97c5SJed Brown         faces_xadj[0]=0;
34780c7d97c5SJed Brown         faces_displacements[0]=0;
34790c7d97c5SJed Brown         j=0;
34800c7d97c5SJed Brown         for(i=1;i<size_prec_comm+1;i++) {
34810c7d97c5SJed Brown           faces_displacements[i]=faces_displacements[i-1]+number_of_faces[i-1];
34820c7d97c5SJed Brown           if(number_of_faces[i-1]) {
34830c7d97c5SJed Brown             j++;
34840c7d97c5SJed Brown             faces_xadj[j]=faces_xadj[j-1]+number_of_faces[i-1];
34850c7d97c5SJed Brown           }
34860c7d97c5SJed Brown         }
3487da1bb401SStefano Zampini         /*printf("The J I count is %d and should be %d\n",j,n_subdomains);
3488da1bb401SStefano Zampini         printf("Total faces seem %d and should be %d\n",faces_xadj[j],total_faces);*/
34890c7d97c5SJed Brown       }
349053cdbc3dSStefano Zampini       ierr = MPI_Gatherv(&my_faces_connectivity[0],my_faces,MPIU_INT,&petsc_faces_adjncy[0],number_of_faces,faces_displacements,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
34910c7d97c5SJed Brown       ierr = PetscFree(my_faces_connectivity);CHKERRQ(ierr);
34920c7d97c5SJed Brown       ierr = PetscFree(array_int);CHKERRQ(ierr);
34930c7d97c5SJed Brown       if(rank_prec_comm == master_proc) {
34943828260eSStefano Zampini         for(i=0;i<total_faces;i++) faces_adjncy[i]=(MetisInt)(petsc_faces_adjncy[i]/ranks_stretching_ratio); /* cast to MetisInt */
3495da1bb401SStefano Zampini         /*printf("This is the face connectivity (actual ranks)\n");
34960c7d97c5SJed Brown         for(i=0;i<n_subdomains;i++){
34970c7d97c5SJed Brown           printf("proc %d is connected with \n",i);
34980c7d97c5SJed Brown           for(j=faces_xadj[i];j<faces_xadj[i+1];j++)
34990c7d97c5SJed Brown             printf("%d ",faces_adjncy[j]);
35000c7d97c5SJed Brown           printf("\n");
3501da1bb401SStefano Zampini         }*/
35020c7d97c5SJed Brown         ierr = PetscFree(faces_displacements);CHKERRQ(ierr);
35030c7d97c5SJed Brown         ierr = PetscFree(number_of_faces);CHKERRQ(ierr);
35040c7d97c5SJed Brown         ierr = PetscFree(petsc_faces_adjncy);CHKERRQ(ierr);
35050c7d97c5SJed Brown       }
35060c7d97c5SJed Brown 
35070c7d97c5SJed Brown       if( rank_prec_comm == master_proc ) {
35080c7d97c5SJed Brown 
35093828260eSStefano Zampini         PetscInt heuristic_for_metis=3;
35103828260eSStefano Zampini 
35110c7d97c5SJed Brown         ncon=1;
35120c7d97c5SJed Brown         faces_nvtxs=n_subdomains;
35130c7d97c5SJed Brown         /* partition graph induced by face connectivity */
35140c7d97c5SJed Brown         ierr = PetscMalloc (n_subdomains*sizeof(MetisInt),&metis_coarse_subdivision);CHKERRQ(ierr);
35150c7d97c5SJed Brown         ierr = METIS_SetDefaultOptions(options);
35160c7d97c5SJed Brown         /* we need a contiguous partition of the coarse mesh */
35170c7d97c5SJed Brown         options[METIS_OPTION_CONTIG]=1;
35180c7d97c5SJed Brown         options[METIS_OPTION_NITER]=30;
35193828260eSStefano Zampini         if(n_subdomains>n_parts*heuristic_for_metis) {
35203828260eSStefano Zampini           options[METIS_OPTION_IPTYPE]=METIS_IPTYPE_EDGE;
35213828260eSStefano Zampini           options[METIS_OPTION_OBJTYPE]=METIS_OBJTYPE_CUT;
35220c7d97c5SJed Brown           ierr = METIS_PartGraphKway(&faces_nvtxs,&ncon,faces_xadj,faces_adjncy,NULL,NULL,NULL,&n_parts,NULL,NULL,options,&objval,metis_coarse_subdivision);
3523*142dfd88SStefano Zampini           if(ierr != METIS_OK) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in METIS_PartGraphKway (metis error code %D) called from PCBDDCSetupCoarseEnvironment\n",ierr);
35243828260eSStefano Zampini         } else {
35253828260eSStefano Zampini           ierr = METIS_PartGraphRecursive(&faces_nvtxs,&ncon,faces_xadj,faces_adjncy,NULL,NULL,NULL,&n_parts,NULL,NULL,options,&objval,metis_coarse_subdivision);
3526*142dfd88SStefano Zampini           if(ierr != METIS_OK) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in METIS_PartGraphRecursive (metis error code %D) called from PCBDDCSetupCoarseEnvironment\n",ierr);
35273828260eSStefano Zampini         }
35280c7d97c5SJed Brown         ierr = PetscFree(faces_xadj);CHKERRQ(ierr);
35290c7d97c5SJed Brown         ierr = PetscFree(faces_adjncy);CHKERRQ(ierr);
35300c7d97c5SJed Brown         coarse_subdivision = (PetscMPIInt*)calloc(size_prec_comm,sizeof(PetscMPIInt)); /* calloc for contiguous memory since we need to scatter these values later */
35310c7d97c5SJed Brown         /* copy/cast values avoiding possible type conflicts between PETSc, MPI and METIS */
35323828260eSStefano Zampini         for(i=0;i<size_prec_comm;i++) coarse_subdivision[i]=MPI_PROC_NULL;
35333828260eSStefano Zampini         for(i=0;i<n_subdomains;i++)   coarse_subdivision[ranks_stretching_ratio*i]=(PetscInt)(metis_coarse_subdivision[i]);
35340c7d97c5SJed Brown         ierr = PetscFree(metis_coarse_subdivision);CHKERRQ(ierr);
35350c7d97c5SJed Brown       }
35360c7d97c5SJed Brown 
35370c7d97c5SJed Brown       /* Create new communicator for coarse problem splitting the old one */
35380c7d97c5SJed Brown       if( !(rank_prec_comm%procs_jumps_coarse_comm) && rank_prec_comm < procs_jumps_coarse_comm*n_parts ){
3539da1bb401SStefano Zampini         coarse_color=0;              /* for communicator splitting */
3540da1bb401SStefano Zampini         active_rank=rank_prec_comm;  /* for insertion of matrix values */
35410c7d97c5SJed Brown       }
3542da1bb401SStefano Zampini       /* procs with coarse_color = MPI_UNDEFINED will have coarse_comm = MPI_COMM_NULL (from mpi standards)
3543da1bb401SStefano Zampini          key = rank_prec_comm -> keep same ordering of ranks from the old to the new communicator */
354453cdbc3dSStefano Zampini       ierr = MPI_Comm_split(prec_comm,coarse_color,rank_prec_comm,&coarse_comm);CHKERRQ(ierr);
35450c7d97c5SJed Brown 
35460c7d97c5SJed Brown       if( coarse_color == 0 ) {
354753cdbc3dSStefano Zampini         ierr = MPI_Comm_size(coarse_comm,&size_coarse_comm);CHKERRQ(ierr);
354853cdbc3dSStefano Zampini         ierr = MPI_Comm_rank(coarse_comm,&rank_coarse_comm);CHKERRQ(ierr);
3549da1bb401SStefano Zampini         /*printf("Details of coarse comm\n");
35503828260eSStefano Zampini         printf("size = %d, myrank = %d\n",size_coarse_comm,rank_coarse_comm);
3551da1bb401SStefano Zampini         printf("jumps = %d, coarse_color = %d, n_parts = %d\n",procs_jumps_coarse_comm,coarse_color,n_parts);*/
35520c7d97c5SJed Brown       } else {
35530c7d97c5SJed Brown         rank_coarse_comm = MPI_PROC_NULL;
35540c7d97c5SJed Brown       }
35550c7d97c5SJed Brown 
35560c7d97c5SJed Brown       /* master proc takes care of arranging and distributing coarse information */
35570c7d97c5SJed Brown       if(rank_coarse_comm == master_proc) {
35580c7d97c5SJed Brown         ierr = PetscMalloc (size_coarse_comm*sizeof(PetscMPIInt),&displacements_recv);CHKERRQ(ierr);
3559da1bb401SStefano Zampini         /*ierr = PetscMalloc (size_coarse_comm*sizeof(PetscMPIInt),&total_count_recv);CHKERRQ(ierr);
3560da1bb401SStefano Zampini           ierr = PetscMalloc (n_subdomains*sizeof(PetscMPIInt),&total_ranks_recv);CHKERRQ(ierr);*/
35610c7d97c5SJed Brown         total_count_recv = (PetscMPIInt*)calloc(size_prec_comm,sizeof(PetscMPIInt));
35620c7d97c5SJed Brown         total_ranks_recv = (PetscMPIInt*)calloc(n_subdomains,sizeof(PetscMPIInt));
35630c7d97c5SJed Brown         /* some initializations */
35640c7d97c5SJed Brown         displacements_recv[0]=0;
3565da1bb401SStefano Zampini         /* PetscMemzero(total_count_recv,size_coarse_comm*sizeof(PetscMPIInt)); not needed -> calloc initializes to zero */
35660c7d97c5SJed Brown         /* count from how many processes the j-th process of the coarse decomposition will receive data */
35670c7d97c5SJed Brown         for(j=0;j<size_coarse_comm;j++)
35683828260eSStefano Zampini           for(i=0;i<size_prec_comm;i++)
35690c7d97c5SJed Brown             if(coarse_subdivision[i]==j)
35700c7d97c5SJed Brown               total_count_recv[j]++;
35710c7d97c5SJed Brown         /* displacements needed for scatterv of total_ranks_recv */
35720c7d97c5SJed Brown         for(i=1;i<size_coarse_comm;i++) displacements_recv[i]=displacements_recv[i-1]+total_count_recv[i-1];
35730c7d97c5SJed Brown         /* Now fill properly total_ranks_recv -> each coarse process will receive the ranks (in prec_comm communicator) of its friend (sending) processes */
35740c7d97c5SJed Brown         ierr = PetscMemzero(total_count_recv,size_coarse_comm*sizeof(PetscMPIInt));CHKERRQ(ierr);
35750c7d97c5SJed Brown         for(j=0;j<size_coarse_comm;j++) {
35763828260eSStefano Zampini           for(i=0;i<size_prec_comm;i++) {
35770c7d97c5SJed Brown             if(coarse_subdivision[i]==j) {
35780c7d97c5SJed Brown               total_ranks_recv[displacements_recv[j]+total_count_recv[j]]=i;
35793828260eSStefano Zampini               total_count_recv[j]+=1;
35800c7d97c5SJed Brown             }
35810c7d97c5SJed Brown           }
35820c7d97c5SJed Brown         }
3583da1bb401SStefano Zampini         /*for(j=0;j<size_coarse_comm;j++) {
35843828260eSStefano Zampini           printf("process %d in new rank will receive from %d processes (original ranks follows)\n",j,total_count_recv[j]);
35853828260eSStefano Zampini           for(i=0;i<total_count_recv[j];i++) {
35863828260eSStefano Zampini             printf("%d ",total_ranks_recv[displacements_recv[j]+i]);
35873828260eSStefano Zampini           }
35883828260eSStefano Zampini           printf("\n");
3589da1bb401SStefano Zampini         }*/
35900c7d97c5SJed Brown 
35910c7d97c5SJed Brown         /* identify new decomposition in terms of ranks in the old communicator */
35923828260eSStefano Zampini         for(i=0;i<n_subdomains;i++) coarse_subdivision[ranks_stretching_ratio*i]=coarse_subdivision[ranks_stretching_ratio*i]*procs_jumps_coarse_comm;
3593da1bb401SStefano Zampini         /*printf("coarse_subdivision in old end new ranks\n");
35940c7d97c5SJed Brown         for(i=0;i<size_prec_comm;i++)
35953828260eSStefano Zampini           if(coarse_subdivision[i]!=MPI_PROC_NULL) {
35963828260eSStefano Zampini             printf("%d=(%d %d), ",i,coarse_subdivision[i],coarse_subdivision[i]/procs_jumps_coarse_comm);
35973828260eSStefano Zampini           } else {
35983828260eSStefano Zampini             printf("%d=(%d %d), ",i,coarse_subdivision[i],coarse_subdivision[i]);
35993828260eSStefano Zampini           }
3600da1bb401SStefano Zampini         printf("\n");*/
36010c7d97c5SJed Brown       }
36020c7d97c5SJed Brown 
36030c7d97c5SJed Brown       /* Scatter new decomposition for send details */
360453cdbc3dSStefano Zampini       ierr = MPI_Scatter(&coarse_subdivision[0],1,MPIU_INT,&rank_coarse_proc_send_to,1,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
36050c7d97c5SJed Brown       /* Scatter receiving details to members of coarse decomposition */
36060c7d97c5SJed Brown       if( coarse_color == 0) {
360753cdbc3dSStefano Zampini         ierr = MPI_Scatter(&total_count_recv[0],1,MPIU_INT,&count_recv,1,MPIU_INT,master_proc,coarse_comm);CHKERRQ(ierr);
36080c7d97c5SJed Brown         ierr = PetscMalloc (count_recv*sizeof(PetscMPIInt),&ranks_recv);CHKERRQ(ierr);
360953cdbc3dSStefano Zampini         ierr = MPI_Scatterv(&total_ranks_recv[0],total_count_recv,displacements_recv,MPIU_INT,&ranks_recv[0],count_recv,MPIU_INT,master_proc,coarse_comm);CHKERRQ(ierr);
36100c7d97c5SJed Brown       }
36110c7d97c5SJed Brown 
3612da1bb401SStefano Zampini       /*printf("I will send my matrix data to proc  %d\n",rank_coarse_proc_send_to);
3613da1bb401SStefano Zampini       if(coarse_color == 0) {
3614da1bb401SStefano Zampini         printf("I will receive some matrix data from %d processes (ranks follows)\n",count_recv);
3615da1bb401SStefano Zampini         for(i=0;i<count_recv;i++)
3616da1bb401SStefano Zampini           printf("%d ",ranks_recv[i]);
3617da1bb401SStefano Zampini         printf("\n");
3618da1bb401SStefano Zampini       }*/
36190c7d97c5SJed Brown 
36200c7d97c5SJed Brown       if(rank_prec_comm == master_proc) {
3621da1bb401SStefano Zampini         /*ierr = PetscFree(coarse_subdivision);CHKERRQ(ierr);
3622da1bb401SStefano Zampini         ierr = PetscFree(total_count_recv);CHKERRQ(ierr);
3623da1bb401SStefano Zampini         ierr = PetscFree(total_ranks_recv);CHKERRQ(ierr);*/
36240c7d97c5SJed Brown         free(coarse_subdivision);
36250c7d97c5SJed Brown         free(total_count_recv);
36260c7d97c5SJed Brown         free(total_ranks_recv);
36270c7d97c5SJed Brown         ierr = PetscFree(displacements_recv);CHKERRQ(ierr);
36280c7d97c5SJed Brown       }
36290c7d97c5SJed Brown       break;
36300c7d97c5SJed Brown     }
36310c7d97c5SJed Brown 
36320c7d97c5SJed Brown     case(REPLICATED_BDDC):
36330c7d97c5SJed Brown 
36340c7d97c5SJed Brown       pcbddc->coarse_communications_type = GATHERS_BDDC;
36350c7d97c5SJed Brown       coarse_mat_type = MATSEQAIJ;
36360c7d97c5SJed Brown       coarse_pc_type  = PCLU;
363753cdbc3dSStefano Zampini       coarse_ksp_type  = KSPPREONLY;
36380c7d97c5SJed Brown       coarse_comm = PETSC_COMM_SELF;
36390c7d97c5SJed Brown       active_rank = rank_prec_comm;
36400c7d97c5SJed Brown       break;
36410c7d97c5SJed Brown 
36420c7d97c5SJed Brown     case(PARALLEL_BDDC):
36430c7d97c5SJed Brown 
36440c7d97c5SJed Brown       pcbddc->coarse_communications_type = SCATTERS_BDDC;
36450c7d97c5SJed Brown       coarse_mat_type = MATMPIAIJ;
36460c7d97c5SJed Brown       coarse_pc_type  = PCREDUNDANT;
364753cdbc3dSStefano Zampini       coarse_ksp_type  = KSPPREONLY;
36480c7d97c5SJed Brown       coarse_comm = prec_comm;
36490c7d97c5SJed Brown       active_rank = rank_prec_comm;
36500c7d97c5SJed Brown       break;
36510c7d97c5SJed Brown 
36520c7d97c5SJed Brown     case(SEQUENTIAL_BDDC):
36530c7d97c5SJed Brown       pcbddc->coarse_communications_type = GATHERS_BDDC;
36540c7d97c5SJed Brown       coarse_mat_type = MATSEQAIJ;
36550c7d97c5SJed Brown       coarse_pc_type = PCLU;
365653cdbc3dSStefano Zampini       coarse_ksp_type  = KSPPREONLY;
36570c7d97c5SJed Brown       coarse_comm = PETSC_COMM_SELF;
36580c7d97c5SJed Brown       active_rank = master_proc;
36590c7d97c5SJed Brown       break;
36600c7d97c5SJed Brown   }
36610c7d97c5SJed Brown 
36620c7d97c5SJed Brown   switch(pcbddc->coarse_communications_type){
36630c7d97c5SJed Brown 
36640c7d97c5SJed Brown     case(SCATTERS_BDDC):
36650c7d97c5SJed Brown       {
36660c7d97c5SJed Brown         if(pcbddc->coarse_problem_type==MULTILEVEL_BDDC) {
36670c7d97c5SJed Brown 
36680c7d97c5SJed Brown           PetscMPIInt send_size;
36690c7d97c5SJed Brown           PetscInt    *aux_ins_indices;
36700c7d97c5SJed Brown           PetscInt    ii,jj;
36710c7d97c5SJed Brown           MPI_Request *requests;
36720c7d97c5SJed Brown 
36730c7d97c5SJed Brown           /* allocate auxiliary space */
36745619798eSStefano Zampini           ierr = PetscMalloc (pcbddc->replicated_primal_size*sizeof(PetscMPIInt),&pcbddc->replicated_local_primal_indices);CHKERRQ(ierr);
36755619798eSStefano Zampini           ierr = MPI_Allgatherv(&pcbddc->local_primal_indices[0],pcbddc->local_primal_size,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,prec_comm);CHKERRQ(ierr);
36760c7d97c5SJed Brown           ierr = PetscMalloc ( pcbddc->coarse_size*sizeof(PetscInt),&aux_ins_indices);CHKERRQ(ierr);
36770c7d97c5SJed Brown           ierr = PetscMemzero(aux_ins_indices,pcbddc->coarse_size*sizeof(PetscInt));CHKERRQ(ierr);
36780c7d97c5SJed Brown           /* allocate stuff for message passing */
36790c7d97c5SJed Brown           ierr = PetscMalloc ( (count_recv+1)*sizeof(MPI_Request),&requests);CHKERRQ(ierr);
36800c7d97c5SJed Brown           for(i=0;i<count_recv+1;i++) requests[i]=MPI_REQUEST_NULL;
36810c7d97c5SJed Brown           ierr = PetscMalloc ( count_recv*sizeof(PetscMPIInt),&localsizes2);CHKERRQ(ierr);
36820c7d97c5SJed Brown           ierr = PetscMalloc ( count_recv*sizeof(PetscMPIInt),&localdispl2);CHKERRQ(ierr);
36830c7d97c5SJed Brown           /* fill up quantities */
36840c7d97c5SJed Brown           j=0;
36850c7d97c5SJed Brown           for(i=0;i<count_recv;i++){
36860c7d97c5SJed Brown             ii = ranks_recv[i];
36870c7d97c5SJed Brown             localsizes2[i]=pcbddc->local_primal_sizes[ii]*pcbddc->local_primal_sizes[ii];
36880c7d97c5SJed Brown             localdispl2[i]=j;
36890c7d97c5SJed Brown             j+=localsizes2[i];
36900c7d97c5SJed Brown             jj = pcbddc->local_primal_displacements[ii];
3691da1bb401SStefano Zampini             for(k=0;k<pcbddc->local_primal_sizes[ii];k++) aux_ins_indices[pcbddc->replicated_local_primal_indices[jj+k]]+=1;  /* it counts the coarse subdomains sharing the coarse node */
36920c7d97c5SJed Brown           }
3693da1bb401SStefano Zampini           /*printf("aux_ins_indices 1\n");
3694da1bb401SStefano Zampini           for(i=0;i<pcbddc->coarse_size;i++)
3695da1bb401SStefano Zampini             printf("%d ",aux_ins_indices[i]);
3696da1bb401SStefano Zampini           printf("\n");*/
36970c7d97c5SJed Brown           /* temp_coarse_mat_vals used to store temporarily received matrix values */
36980c7d97c5SJed Brown           ierr = PetscMalloc ( j*sizeof(PetscScalar),&temp_coarse_mat_vals);CHKERRQ(ierr);
36990c7d97c5SJed Brown           /* evaluate how many values I will insert in coarse mat */
37000c7d97c5SJed Brown           ins_local_primal_size=0;
3701ea7e1babSStefano Zampini           for(i=0;i<pcbddc->coarse_size;i++){
3702ea7e1babSStefano Zampini             if(aux_ins_indices[i]){
37030c7d97c5SJed Brown               ins_local_primal_size++;
3704ea7e1babSStefano Zampini             }
3705ea7e1babSStefano Zampini           }
37060c7d97c5SJed Brown           /* evaluate indices I will insert in coarse mat */
37070c7d97c5SJed Brown           ierr = PetscMalloc ( ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr);
37080c7d97c5SJed Brown           j=0;
3709ea7e1babSStefano Zampini           for(i=0;i<pcbddc->coarse_size;i++){
3710ea7e1babSStefano Zampini             if(aux_ins_indices[i]){
37110c7d97c5SJed Brown               ins_local_primal_indices[j++]=i;
3712ea7e1babSStefano Zampini             }
3713ea7e1babSStefano Zampini           }
37140c7d97c5SJed Brown           /* use aux_ins_indices to realize a global to local mapping */
37150c7d97c5SJed Brown           j=0;
37160c7d97c5SJed Brown           for(i=0;i<pcbddc->coarse_size;i++){
37170c7d97c5SJed Brown             if(aux_ins_indices[i]==0){
37180c7d97c5SJed Brown               aux_ins_indices[i]=-1;
37190c7d97c5SJed Brown             } else {
37200c7d97c5SJed Brown               aux_ins_indices[i]=j;
37210c7d97c5SJed Brown               j++;
37220c7d97c5SJed Brown             }
37230c7d97c5SJed Brown           }
37240c7d97c5SJed Brown 
3725da1bb401SStefano Zampini           /*printf("New details localsizes2 localdispl2\n");
3726da1bb401SStefano Zampini           for(i=0;i<count_recv;i++)
3727da1bb401SStefano Zampini             printf("(%d %d) ",localsizes2[i],localdispl2[i]);
3728da1bb401SStefano Zampini           printf("\n");
3729da1bb401SStefano Zampini           printf("aux_ins_indices 2\n");
3730da1bb401SStefano Zampini           for(i=0;i<pcbddc->coarse_size;i++)
3731da1bb401SStefano Zampini             printf("%d ",aux_ins_indices[i]);
3732da1bb401SStefano Zampini           printf("\n");
3733da1bb401SStefano Zampini           printf("ins_local_primal_indices\n");
3734da1bb401SStefano Zampini           for(i=0;i<ins_local_primal_size;i++)
3735da1bb401SStefano Zampini             printf("%d ",ins_local_primal_indices[i]);
3736da1bb401SStefano Zampini           printf("\n");
3737da1bb401SStefano Zampini           printf("coarse_submat_vals\n");
3738da1bb401SStefano Zampini           for(i=0;i<pcbddc->local_primal_size;i++)
3739da1bb401SStefano Zampini             for(j=0;j<pcbddc->local_primal_size;j++)
3740da1bb401SStefano Zampini               printf("(%lf %d %d)\n",coarse_submat_vals[j*pcbddc->local_primal_size+i],pcbddc->local_primal_indices[i],pcbddc->local_primal_indices[j]);
3741da1bb401SStefano Zampini           printf("\n");*/
37420c7d97c5SJed Brown 
37430c7d97c5SJed Brown           /* processes participating in coarse problem receive matrix data from their friends */
374453cdbc3dSStefano Zampini           for(i=0;i<count_recv;i++) ierr = MPI_Irecv(&temp_coarse_mat_vals[localdispl2[i]],localsizes2[i],MPIU_SCALAR,ranks_recv[i],666,prec_comm,&requests[i]);CHKERRQ(ierr);
37450c7d97c5SJed Brown           if(rank_coarse_proc_send_to != MPI_PROC_NULL ) {
37460c7d97c5SJed Brown             send_size=pcbddc->local_primal_size*pcbddc->local_primal_size;
374753cdbc3dSStefano Zampini             ierr = MPI_Isend(&coarse_submat_vals[0],send_size,MPIU_SCALAR,rank_coarse_proc_send_to,666,prec_comm,&requests[count_recv]);CHKERRQ(ierr);
37480c7d97c5SJed Brown           }
374953cdbc3dSStefano Zampini           ierr = MPI_Waitall(count_recv+1,requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
37500c7d97c5SJed Brown 
3751da1bb401SStefano Zampini           /*if(coarse_color == 0) {
3752da1bb401SStefano Zampini             printf("temp_coarse_mat_vals\n");
3753da1bb401SStefano Zampini             for(k=0;k<count_recv;k++){
3754da1bb401SStefano Zampini               printf("---- %d ----\n",ranks_recv[k]);
3755da1bb401SStefano Zampini               for(i=0;i<pcbddc->local_primal_sizes[ranks_recv[k]];i++)
3756da1bb401SStefano Zampini                 for(j=0;j<pcbddc->local_primal_sizes[ranks_recv[k]];j++)
3757da1bb401SStefano Zampini                   printf("(%lf %d %d)\n",temp_coarse_mat_vals[localdispl2[k]+j*pcbddc->local_primal_sizes[ranks_recv[k]]+i],pcbddc->replicated_local_primal_indices[pcbddc->local_primal_displacements[ranks_recv[k]]+i],pcbddc->replicated_local_primal_indices[pcbddc->local_primal_displacements[ranks_recv[k]]+j]);
3758da1bb401SStefano Zampini               printf("\n");
3759da1bb401SStefano Zampini             }
3760da1bb401SStefano Zampini           }*/
37610c7d97c5SJed Brown           /* calculate data to insert in coarse mat */
37620c7d97c5SJed Brown           ierr = PetscMalloc ( ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar),&ins_coarse_mat_vals);CHKERRQ(ierr);
37630c7d97c5SJed Brown           PetscMemzero(ins_coarse_mat_vals,ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar));
37640c7d97c5SJed Brown 
37650c7d97c5SJed Brown           PetscMPIInt rr,kk,lps,lpd;
37660c7d97c5SJed Brown           PetscInt row_ind,col_ind;
37670c7d97c5SJed Brown           for(k=0;k<count_recv;k++){
37680c7d97c5SJed Brown             rr = ranks_recv[k];
37690c7d97c5SJed Brown             kk = localdispl2[k];
37700c7d97c5SJed Brown             lps = pcbddc->local_primal_sizes[rr];
37710c7d97c5SJed Brown             lpd = pcbddc->local_primal_displacements[rr];
3772da1bb401SStefano Zampini             /*printf("Inserting the following indices (received from %d)\n",rr);*/
37730c7d97c5SJed Brown             for(j=0;j<lps;j++){
37740c7d97c5SJed Brown               col_ind=aux_ins_indices[pcbddc->replicated_local_primal_indices[lpd+j]];
37750c7d97c5SJed Brown               for(i=0;i<lps;i++){
37760c7d97c5SJed Brown                 row_ind=aux_ins_indices[pcbddc->replicated_local_primal_indices[lpd+i]];
3777da1bb401SStefano Zampini                 /*printf("%d %d\n",row_ind,col_ind);*/
37780c7d97c5SJed Brown                 ins_coarse_mat_vals[col_ind*ins_local_primal_size+row_ind]+=temp_coarse_mat_vals[kk+j*lps+i];
37790c7d97c5SJed Brown               }
37800c7d97c5SJed Brown             }
37810c7d97c5SJed Brown           }
37820c7d97c5SJed Brown           ierr = PetscFree(requests);CHKERRQ(ierr);
37830c7d97c5SJed Brown           ierr = PetscFree(aux_ins_indices);CHKERRQ(ierr);
37840c7d97c5SJed Brown           ierr = PetscFree(temp_coarse_mat_vals);CHKERRQ(ierr);
37850c7d97c5SJed Brown           if(coarse_color == 0) { ierr = PetscFree(ranks_recv);CHKERRQ(ierr); }
37860c7d97c5SJed Brown 
37870c7d97c5SJed Brown           /* create local to global mapping needed by coarse MATIS */
37880c7d97c5SJed Brown           {
37890c7d97c5SJed Brown             IS coarse_IS;
3790*142dfd88SStefano Zampini             if(coarse_comm != MPI_COMM_NULL ) {ierr = MPI_Comm_free(&coarse_comm);CHKERRQ(ierr);}
37910c7d97c5SJed Brown             coarse_comm = prec_comm;
37920c7d97c5SJed Brown             active_rank=rank_prec_comm;
37930c7d97c5SJed Brown             ierr = ISCreateGeneral(coarse_comm,ins_local_primal_size,ins_local_primal_indices,PETSC_COPY_VALUES,&coarse_IS);CHKERRQ(ierr);
37940c7d97c5SJed Brown             ierr = ISLocalToGlobalMappingCreateIS(coarse_IS,&coarse_ISLG);CHKERRQ(ierr);
37950c7d97c5SJed Brown             ierr = ISDestroy(&coarse_IS);CHKERRQ(ierr);
37960c7d97c5SJed Brown           }
37970c7d97c5SJed Brown         }
37980c7d97c5SJed Brown         if(pcbddc->coarse_problem_type==PARALLEL_BDDC) {
37990c7d97c5SJed Brown           /* arrays for values insertion */
38000c7d97c5SJed Brown           ins_local_primal_size = pcbddc->local_primal_size;
38010c7d97c5SJed Brown           ierr = PetscMalloc ( ins_local_primal_size*sizeof(PetscMPIInt),&ins_local_primal_indices);CHKERRQ(ierr);
38020c7d97c5SJed Brown           ierr = PetscMalloc ( ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar),&ins_coarse_mat_vals);CHKERRQ(ierr);
38030c7d97c5SJed Brown           for(j=0;j<ins_local_primal_size;j++){
38040c7d97c5SJed Brown             ins_local_primal_indices[j]=pcbddc->local_primal_indices[j];
38050c7d97c5SJed Brown             for(i=0;i<ins_local_primal_size;i++) ins_coarse_mat_vals[j*ins_local_primal_size+i]=coarse_submat_vals[j*ins_local_primal_size+i];
38060c7d97c5SJed Brown           }
38070c7d97c5SJed Brown         }
38080c7d97c5SJed Brown         break;
38090c7d97c5SJed Brown 
38100c7d97c5SJed Brown     }
38110c7d97c5SJed Brown 
38120c7d97c5SJed Brown     case(GATHERS_BDDC):
38130c7d97c5SJed Brown       {
38140c7d97c5SJed Brown 
38150c7d97c5SJed Brown         PetscMPIInt mysize,mysize2;
38160c7d97c5SJed Brown 
38170c7d97c5SJed Brown         if(rank_prec_comm==active_rank) {
38180c7d97c5SJed Brown           ierr = PetscMalloc ( pcbddc->replicated_primal_size*sizeof(PetscMPIInt),&pcbddc->replicated_local_primal_indices);CHKERRQ(ierr);
38190c7d97c5SJed Brown           pcbddc->replicated_local_primal_values = (PetscScalar*)calloc(pcbddc->replicated_primal_size,sizeof(PetscScalar));
38200c7d97c5SJed Brown           ierr = PetscMalloc ( size_prec_comm*sizeof(PetscMPIInt),&localsizes2);CHKERRQ(ierr);
38210c7d97c5SJed Brown           ierr = PetscMalloc ( size_prec_comm*sizeof(PetscMPIInt),&localdispl2);CHKERRQ(ierr);
38220c7d97c5SJed Brown           /* arrays for values insertion */
38230c7d97c5SJed Brown           for(i=0;i<size_prec_comm;i++) localsizes2[i]=pcbddc->local_primal_sizes[i]*pcbddc->local_primal_sizes[i];
38240c7d97c5SJed Brown           localdispl2[0]=0;
38250c7d97c5SJed Brown           for(i=1;i<size_prec_comm;i++) localdispl2[i]=localsizes2[i-1]+localdispl2[i-1];
38260c7d97c5SJed Brown           j=0;
38270c7d97c5SJed Brown           for(i=0;i<size_prec_comm;i++) j+=localsizes2[i];
38280c7d97c5SJed Brown           ierr = PetscMalloc ( j*sizeof(PetscScalar),&temp_coarse_mat_vals);CHKERRQ(ierr);
38290c7d97c5SJed Brown         }
38300c7d97c5SJed Brown 
38310c7d97c5SJed Brown         mysize=pcbddc->local_primal_size;
38320c7d97c5SJed Brown         mysize2=pcbddc->local_primal_size*pcbddc->local_primal_size;
38330c7d97c5SJed Brown         if(pcbddc->coarse_problem_type == SEQUENTIAL_BDDC){
383453cdbc3dSStefano Zampini           ierr = MPI_Gatherv(&pcbddc->local_primal_indices[0],mysize,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
383553cdbc3dSStefano Zampini           ierr = MPI_Gatherv(&coarse_submat_vals[0],mysize2,MPIU_SCALAR,&temp_coarse_mat_vals[0],localsizes2,localdispl2,MPIU_SCALAR,master_proc,prec_comm);CHKERRQ(ierr);
38360c7d97c5SJed Brown         } else {
383753cdbc3dSStefano Zampini           ierr = MPI_Allgatherv(&pcbddc->local_primal_indices[0],mysize,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,prec_comm);CHKERRQ(ierr);
383853cdbc3dSStefano Zampini           ierr = MPI_Allgatherv(&coarse_submat_vals[0],mysize2,MPIU_SCALAR,&temp_coarse_mat_vals[0],localsizes2,localdispl2,MPIU_SCALAR,prec_comm);CHKERRQ(ierr);
38390c7d97c5SJed Brown         }
38400c7d97c5SJed Brown         break;
3841da1bb401SStefano Zampini       }/* switch on coarse problem and communications associated with finished */
38420c7d97c5SJed Brown   }
38430c7d97c5SJed Brown 
38440c7d97c5SJed Brown   /* Now create and fill up coarse matrix */
38450c7d97c5SJed Brown   if( rank_prec_comm == active_rank ) {
3846*142dfd88SStefano Zampini 
3847*142dfd88SStefano Zampini     Mat matis_coarse_local_mat;
3848*142dfd88SStefano Zampini 
38490c7d97c5SJed Brown     if(pcbddc->coarse_problem_type != MULTILEVEL_BDDC) {
38500c7d97c5SJed Brown       ierr = MatCreate(coarse_comm,&pcbddc->coarse_mat);CHKERRQ(ierr);
38510c7d97c5SJed Brown       ierr = MatSetSizes(pcbddc->coarse_mat,PETSC_DECIDE,PETSC_DECIDE,pcbddc->coarse_size,pcbddc->coarse_size);CHKERRQ(ierr);
38520c7d97c5SJed Brown       ierr = MatSetType(pcbddc->coarse_mat,coarse_mat_type);CHKERRQ(ierr);
38533b03a366Sstefano_zampini       ierr = MatSetUp(pcbddc->coarse_mat);CHKERRQ(ierr);
3854da1bb401SStefano Zampini       ierr = MatSetOption(pcbddc->coarse_mat,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr); /* local values stored in column major */
38553b03a366Sstefano_zampini       ierr = MatSetOption(pcbddc->coarse_mat,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr);
38560c7d97c5SJed Brown     } else {
3857d3ee2243SStefano Zampini       /* remind bs */
3858d3ee2243SStefano Zampini       ierr = MatCreateIS(coarse_comm,bs,PETSC_DECIDE,PETSC_DECIDE,pcbddc->coarse_size,pcbddc->coarse_size,coarse_ISLG,&pcbddc->coarse_mat);CHKERRQ(ierr);
38593b03a366Sstefano_zampini       ierr = MatSetUp(pcbddc->coarse_mat);CHKERRQ(ierr);
38600c7d97c5SJed Brown       ierr = MatISGetLocalMat(pcbddc->coarse_mat,&matis_coarse_local_mat);CHKERRQ(ierr);
38613b03a366Sstefano_zampini       ierr = MatSetUp(matis_coarse_local_mat);CHKERRQ(ierr);
3862da1bb401SStefano Zampini       ierr = MatSetOption(matis_coarse_local_mat,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr); /* local values stored in column major */
3863a0ba757dSStefano Zampini       ierr = MatSetOption(matis_coarse_local_mat,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr);
38640c7d97c5SJed Brown     }
3865*142dfd88SStefano Zampini     /* preallocation */
3866*142dfd88SStefano Zampini     if(pcbddc->coarse_problem_type != MULTILEVEL_BDDC) {
3867*142dfd88SStefano Zampini       PetscInt *dnz,*onz;
3868*142dfd88SStefano Zampini       PetscInt lrows,lcols;
3869*142dfd88SStefano Zampini       ierr = MatGetLocalSize(pcbddc->coarse_mat,&lrows,&lcols);CHKERRQ(ierr);
3870*142dfd88SStefano Zampini       ierr = MatPreallocateInitialize(coarse_comm,lrows,lcols,dnz,onz);CHKERRQ(ierr);
3871*142dfd88SStefano Zampini       if(pcbddc->coarse_problem_type == PARALLEL_BDDC) {
3872*142dfd88SStefano Zampini         PetscInt coarse_index_row,coarse_index_col,start_row,owner;
3873*142dfd88SStefano Zampini         PetscMPIInt *auxpreall_displs;
3874*142dfd88SStefano Zampini         PetscMPIInt *auxpreall_sizes;
3875*142dfd88SStefano Zampini         PetscMPIInt *auxpreall_dnz;
3876*142dfd88SStefano Zampini         PetscMPIInt *auxpreall_onz;
3877*142dfd88SStefano Zampini         PetscInt    *auxpreall_ownership;
3878*142dfd88SStefano Zampini         if(rank_prec_comm == 0) {
3879*142dfd88SStefano Zampini           ierr = PetscMalloc((size_prec_comm+1)*sizeof(PetscMPIInt),&auxpreall_displs);CHKERRQ(ierr);
3880*142dfd88SStefano Zampini           auxpreall_displs[size_prec_comm]=pcbddc->coarse_size;
3881*142dfd88SStefano Zampini           ierr = PetscMalloc(size_prec_comm*sizeof(PetscMPIInt),&auxpreall_sizes);CHKERRQ(ierr);
3882*142dfd88SStefano Zampini           ierr = PetscMalloc(pcbddc->coarse_size*sizeof(PetscMPIInt),&auxpreall_dnz);CHKERRQ(ierr);
3883*142dfd88SStefano Zampini           ierr = PetscMemzero(auxpreall_dnz,pcbddc->coarse_size*sizeof(PetscMPIInt));CHKERRQ(ierr);
3884*142dfd88SStefano Zampini           ierr = PetscMalloc(pcbddc->coarse_size*sizeof(PetscMPIInt),&auxpreall_onz);CHKERRQ(ierr);
3885*142dfd88SStefano Zampini           ierr = PetscMemzero(auxpreall_onz,pcbddc->coarse_size*sizeof(PetscMPIInt));CHKERRQ(ierr);
3886*142dfd88SStefano Zampini           ierr = PetscMalloc(pcbddc->coarse_size*sizeof(PetscInt),&auxpreall_ownership);CHKERRQ(ierr);
3887*142dfd88SStefano Zampini         }
3888*142dfd88SStefano Zampini         ierr = MatGetOwnershipRange(pcbddc->coarse_mat,&start_row,PETSC_NULL);CHKERRQ(ierr);
3889*142dfd88SStefano Zampini         ierr = MPI_Gather(&start_row,1,MPIU_INT,auxpreall_displs,1,MPIU_INT,0,prec_comm);CHKERRQ(ierr);
3890*142dfd88SStefano Zampini         if(rank_prec_comm == 0) {
3891*142dfd88SStefano Zampini           k=0;
3892*142dfd88SStefano Zampini           for(i=0;i<size_prec_comm;i++) {
3893*142dfd88SStefano Zampini             auxpreall_sizes[i]=auxpreall_displs[i+1]-auxpreall_displs[i];
3894*142dfd88SStefano Zampini             for(j=0;j<auxpreall_sizes[i];j++) {
3895*142dfd88SStefano Zampini               auxpreall_ownership[auxpreall_displs[i]+j]=i;
3896*142dfd88SStefano Zampini             }
3897*142dfd88SStefano Zampini           }
3898*142dfd88SStefano Zampini           for(i=0;i<size_prec_comm;i++) {
3899*142dfd88SStefano Zampini             for(j=0;j<pcbddc->local_primal_sizes[i];j++) {
3900*142dfd88SStefano Zampini               coarse_index_row=auxglobal_primal[j+pcbddc->local_primal_displacements[i]];
3901*142dfd88SStefano Zampini               for(k=j;k<pcbddc->local_primal_sizes[i];k++) {
3902*142dfd88SStefano Zampini                 coarse_index_col=auxglobal_primal[k+pcbddc->local_primal_displacements[i]];
3903*142dfd88SStefano Zampini                 owner = auxpreall_ownership[coarse_index_row];
3904*142dfd88SStefano Zampini                 if(coarse_index_col>auxpreall_displs[owner]-1 && coarse_index_col < auxpreall_displs[owner]+auxpreall_sizes[owner]) {
3905*142dfd88SStefano Zampini                   auxpreall_dnz[coarse_index_row]++;
3906*142dfd88SStefano Zampini                 } else {
3907*142dfd88SStefano Zampini                   auxpreall_onz[coarse_index_row]++;
3908*142dfd88SStefano Zampini                 }
3909*142dfd88SStefano Zampini                 if(k != j) {
3910*142dfd88SStefano Zampini                   owner = auxpreall_ownership[coarse_index_col];
3911*142dfd88SStefano Zampini                   if(coarse_index_row>auxpreall_displs[owner]-1 && coarse_index_row < auxpreall_displs[owner]+auxpreall_sizes[owner]) {
3912*142dfd88SStefano Zampini                     auxpreall_dnz[coarse_index_col]++;
3913*142dfd88SStefano Zampini                   } else {
3914*142dfd88SStefano Zampini                     auxpreall_onz[coarse_index_col]++;
3915*142dfd88SStefano Zampini                   }
3916*142dfd88SStefano Zampini                 }
3917*142dfd88SStefano Zampini               }
3918*142dfd88SStefano Zampini             }
3919*142dfd88SStefano Zampini           }
3920*142dfd88SStefano Zampini         }
3921*142dfd88SStefano Zampini         ierr = MPI_Scatterv(auxpreall_dnz,auxpreall_sizes,auxpreall_displs,MPIU_INT,
3922*142dfd88SStefano Zampini                             dnz,lrows,MPIU_INT,0,prec_comm);
3923*142dfd88SStefano Zampini         ierr = MPI_Scatterv(auxpreall_onz,auxpreall_sizes,auxpreall_displs,MPIU_INT,
3924*142dfd88SStefano Zampini                             onz,lrows,MPIU_INT,0,prec_comm);
3925*142dfd88SStefano Zampini         if(rank_prec_comm == 0) {
3926*142dfd88SStefano Zampini           ierr = PetscFree(auxpreall_displs);CHKERRQ(ierr);
3927*142dfd88SStefano Zampini           ierr = PetscFree(auxpreall_sizes);CHKERRQ(ierr);
3928*142dfd88SStefano Zampini           ierr = PetscFree(auxpreall_dnz);CHKERRQ(ierr);
3929*142dfd88SStefano Zampini           ierr = PetscFree(auxpreall_onz);CHKERRQ(ierr);
3930*142dfd88SStefano Zampini           ierr = PetscFree(auxpreall_ownership);CHKERRQ(ierr);
3931*142dfd88SStefano Zampini         }
3932*142dfd88SStefano Zampini       } else {
3933*142dfd88SStefano Zampini         for(k=0;k<size_prec_comm;k++){
3934*142dfd88SStefano Zampini           offset=pcbddc->local_primal_displacements[k];
3935*142dfd88SStefano Zampini           offset2=localdispl2[k];
3936*142dfd88SStefano Zampini           ins_local_primal_size = pcbddc->local_primal_sizes[k];
3937*142dfd88SStefano Zampini           ins_local_primal_indices = &pcbddc->replicated_local_primal_indices[offset];
3938*142dfd88SStefano Zampini           for(j=0;j<ins_local_primal_size;j++) {
3939*142dfd88SStefano Zampini             ierr = MatPreallocateSet(ins_local_primal_indices[j],ins_local_primal_size,ins_local_primal_indices,dnz,onz);CHKERRQ(ierr);
3940*142dfd88SStefano Zampini           }
3941*142dfd88SStefano Zampini         }
3942*142dfd88SStefano Zampini       }
3943*142dfd88SStefano Zampini       /* check */
3944*142dfd88SStefano Zampini       for(i=0;i<lrows;i++) {
3945*142dfd88SStefano Zampini         if(dnz[i]>lcols) {
3946*142dfd88SStefano Zampini           dnz[i]=lcols;
3947*142dfd88SStefano Zampini         }
3948*142dfd88SStefano Zampini         if(onz[i]>pcbddc->coarse_size-lcols) {
3949*142dfd88SStefano Zampini           onz[i]=pcbddc->coarse_size-lcols;
3950*142dfd88SStefano Zampini         }
3951*142dfd88SStefano Zampini       }
3952*142dfd88SStefano Zampini       ierr = MatSeqAIJSetPreallocation(pcbddc->coarse_mat,PETSC_NULL,dnz);CHKERRQ(ierr);
3953*142dfd88SStefano Zampini       ierr = MatMPIAIJSetPreallocation(pcbddc->coarse_mat,PETSC_NULL,dnz,PETSC_NULL,onz);CHKERRQ(ierr);
3954*142dfd88SStefano Zampini       ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr);
3955*142dfd88SStefano Zampini     } else {
3956*142dfd88SStefano Zampini       ierr = MatSeqAIJSetPreallocation(matis_coarse_local_mat,ins_local_primal_size,PETSC_NULL);CHKERRQ(ierr);
3957*142dfd88SStefano Zampini     }
3958*142dfd88SStefano Zampini     if(rank_prec_comm == 0) { ierr = PetscFree(auxglobal_primal);CHKERRQ(ierr); }
3959*142dfd88SStefano Zampini     /* insert values */
3960ea7e1babSStefano Zampini     if(pcbddc->coarse_communications_type != GATHERS_BDDC) {
39610c7d97c5SJed Brown       ierr = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,ADD_VALUES);CHKERRQ(ierr);
3962ea7e1babSStefano Zampini     } else {
3963ea7e1babSStefano Zampini       for(k=0;k<size_prec_comm;k++){
3964ea7e1babSStefano Zampini         offset=pcbddc->local_primal_displacements[k];
3965ea7e1babSStefano Zampini         offset2=localdispl2[k];
3966ea7e1babSStefano Zampini         ins_local_primal_size = pcbddc->local_primal_sizes[k];
3967ea7e1babSStefano Zampini         ins_local_primal_indices = &pcbddc->replicated_local_primal_indices[offset];
3968ea7e1babSStefano Zampini         ins_coarse_mat_vals = &temp_coarse_mat_vals[offset2];
3969ea7e1babSStefano Zampini         ierr = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,ADD_VALUES);CHKERRQ(ierr);
3970ea7e1babSStefano Zampini       }
3971ea7e1babSStefano Zampini       ins_local_primal_indices = 0;
3972ea7e1babSStefano Zampini       ins_coarse_mat_vals = 0;
3973ea7e1babSStefano Zampini     }
39740c7d97c5SJed Brown     ierr = MatAssemblyBegin(pcbddc->coarse_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
39750c7d97c5SJed Brown     ierr = MatAssemblyEnd(pcbddc->coarse_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
3976*142dfd88SStefano Zampini     /* symmetry of coarse matrix */
3977*142dfd88SStefano Zampini     if(issym) {
3978*142dfd88SStefano Zampini       ierr = MatSetOption(pcbddc->coarse_mat,MAT_SYMMETRIC,PETSC_TRUE);CHKERRQ(ierr);
3979*142dfd88SStefano Zampini     }
39800c7d97c5SJed Brown     ierr = MatGetVecs(pcbddc->coarse_mat,&pcbddc->coarse_vec,&pcbddc->coarse_rhs);CHKERRQ(ierr);
39810c7d97c5SJed Brown     /* Preconditioner for coarse problem */
398253cdbc3dSStefano Zampini     ierr = KSPCreate(coarse_comm,&pcbddc->coarse_ksp);CHKERRQ(ierr);
398353cdbc3dSStefano Zampini     ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->coarse_ksp,(PetscObject)pc,1);CHKERRQ(ierr);
398453cdbc3dSStefano Zampini     ierr = KSPSetOperators(pcbddc->coarse_ksp,pcbddc->coarse_mat,pcbddc->coarse_mat,SAME_PRECONDITIONER);CHKERRQ(ierr);
39853b03a366Sstefano_zampini     ierr = KSPSetTolerances(pcbddc->coarse_ksp,PETSC_DEFAULT,PETSC_DEFAULT,PETSC_DEFAULT,max_it_coarse_ksp);CHKERRQ(ierr);
398653cdbc3dSStefano Zampini     ierr = KSPSetType(pcbddc->coarse_ksp,coarse_ksp_type);CHKERRQ(ierr);
3987*142dfd88SStefano Zampini     ierr = KSPSetInitialGuessNonzero(pcbddc->coarse_ksp,PETSC_FALSE);CHKERRQ(ierr);
398853cdbc3dSStefano Zampini     ierr = KSPGetPC(pcbddc->coarse_ksp,&pc_temp);CHKERRQ(ierr);
398953cdbc3dSStefano Zampini     ierr = PCSetType(pc_temp,coarse_pc_type);CHKERRQ(ierr);
39900c7d97c5SJed Brown     /* Allow user's customization */
3991da1bb401SStefano Zampini     ierr = KSPSetOptionsPrefix(pcbddc->coarse_ksp,"coarse_");CHKERRQ(ierr);
399253cdbc3dSStefano Zampini     ierr = KSPSetFromOptions(pcbddc->coarse_ksp);CHKERRQ(ierr);
39930c7d97c5SJed Brown     /* Set Up PC for coarse problem BDDC */
399453cdbc3dSStefano Zampini     if(pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
3995e269702eSStefano Zampini       if(dbg_flag) {
3996e269702eSStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"----------------Setting up a new level---------------\n");CHKERRQ(ierr);
3997e269702eSStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
3998e269702eSStefano Zampini       }
399953cdbc3dSStefano Zampini       ierr = PCBDDCSetCoarseProblemType(pc_temp,MULTILEVEL_BDDC);CHKERRQ(ierr);
400053cdbc3dSStefano Zampini     }
400153cdbc3dSStefano Zampini     ierr = KSPSetUp(pcbddc->coarse_ksp);CHKERRQ(ierr);
4002*142dfd88SStefano Zampini 
4003*142dfd88SStefano Zampini     { /* TODO: this is a hack! need to be solved! */
4004*142dfd88SStefano Zampini       PC_BDDC     *coarse_pcbddc = (PC_BDDC*)pc_temp->data;
4005*142dfd88SStefano Zampini       coarse_pcbddc->use_exact_dirichlet = PETSC_FALSE;
4006*142dfd88SStefano Zampini     }
4007*142dfd88SStefano Zampini 
40085619798eSStefano Zampini     if(pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
40095619798eSStefano Zampini       if(dbg_flag) {
40105619798eSStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"----------------New level set------------------------\n");CHKERRQ(ierr);
40115619798eSStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
40125619798eSStefano Zampini       }
40135619798eSStefano Zampini     }
40140c7d97c5SJed Brown   }
40150c7d97c5SJed Brown   if(pcbddc->coarse_communications_type == SCATTERS_BDDC) {
40160c7d97c5SJed Brown      IS local_IS,global_IS;
40170c7d97c5SJed Brown      ierr = ISCreateStride(PETSC_COMM_SELF,pcbddc->local_primal_size,0,1,&local_IS);CHKERRQ(ierr);
40180c7d97c5SJed Brown      ierr = ISCreateGeneral(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_indices,PETSC_COPY_VALUES,&global_IS);CHKERRQ(ierr);
40190c7d97c5SJed Brown      ierr = VecScatterCreate(pcbddc->vec1_P,local_IS,pcbddc->coarse_vec,global_IS,&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr);
40200c7d97c5SJed Brown      ierr = ISDestroy(&local_IS);CHKERRQ(ierr);
40210c7d97c5SJed Brown      ierr = ISDestroy(&global_IS);CHKERRQ(ierr);
40220c7d97c5SJed Brown   }
40233b03a366Sstefano_zampini   /* Evaluate condition number of coarse problem for cheby (and verbose output if requested) */
4024*142dfd88SStefano Zampini   if( dbg_flag && rank_prec_comm == active_rank ) {
4025*142dfd88SStefano Zampini     KSP check_ksp;
4026*142dfd88SStefano Zampini     PC  check_pc;
4027*142dfd88SStefano Zampini     Vec check_vec;
4028*142dfd88SStefano Zampini     PetscReal   abs_infty_error,infty_error,lambda_min,lambda_max;
4029*142dfd88SStefano Zampini     const KSPType check_ksp_type;
40300c7d97c5SJed Brown 
4031*142dfd88SStefano Zampini     /* Create ksp object suitable for extreme eigenvalues' estimation */
4032*142dfd88SStefano Zampini     ierr = KSPCreate(coarse_comm,&check_ksp);CHKERRQ(ierr);
4033*142dfd88SStefano Zampini     ierr = KSPSetOperators(check_ksp,pcbddc->coarse_mat,pcbddc->coarse_mat,SAME_PRECONDITIONER);CHKERRQ(ierr);
4034*142dfd88SStefano Zampini     ierr = KSPSetTolerances(check_ksp,1.e-8,1.e-8,PETSC_DEFAULT,pcbddc->coarse_size);CHKERRQ(ierr);
4035*142dfd88SStefano Zampini     if(pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
4036*142dfd88SStefano Zampini       if(issym) {
4037*142dfd88SStefano Zampini         check_ksp_type = KSPCG;
4038*142dfd88SStefano Zampini       } else {
4039*142dfd88SStefano Zampini         check_ksp_type = KSPGMRES;
4040*142dfd88SStefano Zampini       }
4041*142dfd88SStefano Zampini       ierr = KSPSetComputeSingularValues(check_ksp,PETSC_TRUE);CHKERRQ(ierr);
4042*142dfd88SStefano Zampini     } else {
4043*142dfd88SStefano Zampini       check_ksp_type = KSPPREONLY;
4044*142dfd88SStefano Zampini     }
4045*142dfd88SStefano Zampini     ierr = KSPSetType(check_ksp,check_ksp_type);CHKERRQ(ierr);
4046*142dfd88SStefano Zampini     ierr = KSPGetPC(pcbddc->coarse_ksp,&check_pc);CHKERRQ(ierr);
4047*142dfd88SStefano Zampini     ierr = KSPSetPC(check_ksp,check_pc);CHKERRQ(ierr);
4048*142dfd88SStefano Zampini     ierr = KSPSetUp(check_ksp);CHKERRQ(ierr);
4049*142dfd88SStefano Zampini     /* create random vec */
4050*142dfd88SStefano Zampini     ierr = VecDuplicate(pcbddc->coarse_vec,&check_vec);CHKERRQ(ierr);
4051*142dfd88SStefano Zampini     ierr = VecSetRandom(check_vec,PETSC_NULL);CHKERRQ(ierr);
4052*142dfd88SStefano Zampini     ierr = MatMult(pcbddc->coarse_mat,check_vec,pcbddc->coarse_rhs);CHKERRQ(ierr);
4053*142dfd88SStefano Zampini     /* solve coarse problem */
4054*142dfd88SStefano Zampini     ierr = KSPSolve(check_ksp,pcbddc->coarse_rhs,pcbddc->coarse_vec);CHKERRQ(ierr);
4055*142dfd88SStefano Zampini     /* check coarse problem residual error */
4056*142dfd88SStefano Zampini     ierr = VecAXPY(check_vec,-1.0,pcbddc->coarse_vec);CHKERRQ(ierr);
4057*142dfd88SStefano Zampini     ierr = VecNorm(check_vec,NORM_INFINITY,&infty_error);CHKERRQ(ierr);
4058*142dfd88SStefano Zampini     ierr = MatMult(pcbddc->coarse_mat,check_vec,pcbddc->coarse_rhs);CHKERRQ(ierr);
4059*142dfd88SStefano Zampini     ierr = VecNorm(pcbddc->coarse_rhs,NORM_INFINITY,&abs_infty_error);CHKERRQ(ierr);
4060*142dfd88SStefano Zampini     ierr = VecDestroy(&check_vec);CHKERRQ(ierr);
4061*142dfd88SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"Size of coarse problem %d\n",pcbddc->coarse_size);CHKERRQ(ierr);
4062*142dfd88SStefano Zampini     /* get eigenvalue estimation if inexact */
4063*142dfd88SStefano Zampini     if(pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
4064*142dfd88SStefano Zampini       ierr = KSPComputeExtremeSingularValues(check_ksp,&lambda_max,&lambda_min);CHKERRQ(ierr);
4065*142dfd88SStefano Zampini       ierr = KSPGetIterationNumber(check_ksp,&k);CHKERRQ(ierr);
4066*142dfd88SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem eigenvalues estimated with %d iterations of %s.\n",k,check_ksp_type);CHKERRQ(ierr);
4067e269702eSStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem eigenvalues: % 1.14e %1.14e\n",lambda_min,lambda_max);CHKERRQ(ierr);
40683b03a366Sstefano_zampini     }
4069*142dfd88SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem exact infty_error   : %1.14e\n",infty_error);CHKERRQ(ierr);
4070*142dfd88SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem residual infty_error: %1.14e\n",abs_infty_error);CHKERRQ(ierr);
4071*142dfd88SStefano Zampini     ierr = KSPDestroy(&check_ksp);CHKERRQ(ierr);
407253cdbc3dSStefano Zampini   }
4073*142dfd88SStefano Zampini   if(dbg_flag) { ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); }
40740c7d97c5SJed Brown   /* free data structures no longer needed */
40750c7d97c5SJed Brown   if(coarse_ISLG)                { ierr = ISLocalToGlobalMappingDestroy(&coarse_ISLG);CHKERRQ(ierr); }
40760c7d97c5SJed Brown   if(ins_local_primal_indices)   { ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr);  }
40770c7d97c5SJed Brown   if(ins_coarse_mat_vals)        { ierr = PetscFree(ins_coarse_mat_vals);CHKERRQ(ierr);}
40780c7d97c5SJed Brown   if(localsizes2)                { ierr = PetscFree(localsizes2);CHKERRQ(ierr);}
40790c7d97c5SJed Brown   if(localdispl2)                { ierr = PetscFree(localdispl2);CHKERRQ(ierr);}
40800c7d97c5SJed Brown   if(temp_coarse_mat_vals)       { ierr = PetscFree(temp_coarse_mat_vals);CHKERRQ(ierr);}
40810c7d97c5SJed Brown 
40820c7d97c5SJed Brown   PetscFunctionReturn(0);
40830c7d97c5SJed Brown }
40840c7d97c5SJed Brown 
40850c7d97c5SJed Brown #undef __FUNCT__
40860c7d97c5SJed Brown #define __FUNCT__ "PCBDDCManageLocalBoundaries"
408753cdbc3dSStefano Zampini static PetscErrorCode PCBDDCManageLocalBoundaries(PC pc)
40880c7d97c5SJed Brown {
40890c7d97c5SJed Brown 
40900c7d97c5SJed Brown   PC_BDDC     *pcbddc = (PC_BDDC*)pc->data;
40910c7d97c5SJed Brown   PC_IS         *pcis = (PC_IS*)pc->data;
40920c7d97c5SJed Brown   Mat_IS      *matis  = (Mat_IS*)pc->pmat->data;
4093da1bb401SStefano Zampini   PCBDDCGraph mat_graph=pcbddc->mat_graph;
40943972b0daSStefano Zampini   PetscInt    *queue_in_global_numbering,*is_indices,*auxis;
40953b03a366Sstefano_zampini   PetscInt    bs,ierr,i,j,s,k,iindex,neumann_bsize,dirichlet_bsize;
4096da1bb401SStefano Zampini   PetscInt    total_counts,nodes_touched,where_values=1,vertex_size;
4097534831adSStefano Zampini   PetscMPIInt adapt_interface=0,adapt_interface_reduced=0,NEUMANNCNT=0;
4098da1bb401SStefano Zampini   PetscBool   same_set;
4099a0ba757dSStefano Zampini   MPI_Comm    interface_comm=((PetscObject)pc)->comm;
41003b03a366Sstefano_zampini   PetscBool   use_faces=PETSC_FALSE,use_edges=PETSC_FALSE;
41013b03a366Sstefano_zampini   const PetscInt *neumann_nodes;
41023b03a366Sstefano_zampini   const PetscInt *dirichlet_nodes;
4103a81d60d8SStefano Zampini   IS          used_IS,*custom_ISForDofs;
4104da1bb401SStefano Zampini   PetscScalar *array;
4105da1bb401SStefano Zampini   PetscScalar *array2;
4106da1bb401SStefano Zampini   PetscViewer viewer=pcbddc->dbg_viewer;
41070c7d97c5SJed Brown 
41080c7d97c5SJed Brown   PetscFunctionBegin;
4109da1bb401SStefano Zampini   /* Setup local adjacency graph */
4110da1bb401SStefano Zampini   mat_graph->nvtxs=pcis->n;
4111534831adSStefano Zampini   if(!mat_graph->xadj) { NEUMANNCNT = 1; }
4112da1bb401SStefano Zampini   ierr = PCBDDCSetupLocalAdjacencyGraph(pc);CHKERRQ(ierr);
4113a0ba757dSStefano Zampini   i = mat_graph->nvtxs;
4114a0ba757dSStefano Zampini   ierr = PetscMalloc4(i,PetscInt,&mat_graph->where,i,PetscInt,&mat_graph->count,i+1,PetscInt,&mat_graph->cptr,i,PetscInt,&mat_graph->queue);CHKERRQ(ierr);
41153972b0daSStefano Zampini   ierr = PetscMalloc2(i,PetscInt,&mat_graph->which_dof,i,PetscBool,&mat_graph->touched);CHKERRQ(ierr);
41163972b0daSStefano Zampini   ierr = PetscMalloc(i*sizeof(PetscInt),&queue_in_global_numbering);CHKERRQ(ierr);
4117a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->where,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
4118a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->count,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
4119a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->which_dof,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
4120a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->queue,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
41213828260eSStefano Zampini   ierr = PetscMemzero(mat_graph->cptr,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr);
4122a0ba757dSStefano Zampini 
4123a81d60d8SStefano Zampini   /* Setting dofs splitting in mat_graph->which_dof
4124a81d60d8SStefano Zampini      Get information about dofs' splitting if provided by the user
4125a81d60d8SStefano Zampini      Otherwise it assumes a constant block size */
4126a81d60d8SStefano Zampini   vertex_size=0;
4127a81d60d8SStefano Zampini   if(!pcbddc->n_ISForDofs) {
4128a81d60d8SStefano Zampini     ierr = MatGetBlockSize(matis->A,&bs);CHKERRQ(ierr);
4129a81d60d8SStefano Zampini     ierr = PetscMalloc(bs*sizeof(IS),&custom_ISForDofs);CHKERRQ(ierr);
4130a81d60d8SStefano Zampini     for(i=0;i<bs;i++) {
4131a81d60d8SStefano Zampini       ierr = ISCreateStride(PETSC_COMM_SELF,pcis->n/bs,i,bs,&custom_ISForDofs[i]);CHKERRQ(ierr);
4132a81d60d8SStefano Zampini     }
4133a81d60d8SStefano Zampini     ierr = PCBDDCSetDofsSplitting(pc,bs,custom_ISForDofs);CHKERRQ(ierr);
4134a81d60d8SStefano Zampini     vertex_size=1;
4135a81d60d8SStefano Zampini     /* remove my references to IS objects */
4136a81d60d8SStefano Zampini     for(i=0;i<bs;i++) {
4137a81d60d8SStefano Zampini       ierr = ISDestroy(&custom_ISForDofs[i]);CHKERRQ(ierr);
4138a81d60d8SStefano Zampini     }
4139a81d60d8SStefano Zampini     ierr = PetscFree(custom_ISForDofs);CHKERRQ(ierr);
4140a81d60d8SStefano Zampini   }
41419c0446d6SStefano Zampini   for(i=0;i<pcbddc->n_ISForDofs;i++) {
4142a81d60d8SStefano Zampini     ierr = ISGetSize(pcbddc->ISForDofs[i],&k);CHKERRQ(ierr);
41439c0446d6SStefano Zampini     ierr = ISGetIndices(pcbddc->ISForDofs[i],(const PetscInt**)&is_indices);CHKERRQ(ierr);
4144a81d60d8SStefano Zampini     for(j=0;j<k;j++) {
41459c0446d6SStefano Zampini       mat_graph->which_dof[is_indices[j]]=i;
41469c0446d6SStefano Zampini     }
41479c0446d6SStefano Zampini     ierr = ISRestoreIndices(pcbddc->ISForDofs[i],(const PetscInt**)&is_indices);CHKERRQ(ierr);
41489c0446d6SStefano Zampini   }
4149a81d60d8SStefano Zampini   /* use mat block size as vertex size if it has not yet been set */
4150a81d60d8SStefano Zampini   if(!vertex_size) {
41513b03a366Sstefano_zampini     ierr = MatGetBlockSize(matis->A,&vertex_size);CHKERRQ(ierr);
41520c7d97c5SJed Brown   }
4153a81d60d8SStefano Zampini 
41543b03a366Sstefano_zampini   /* count number of neigh per node */
41550c7d97c5SJed Brown   total_counts=0;
41563b03a366Sstefano_zampini   for(i=1;i<pcis->n_neigh;i++){
41570c7d97c5SJed Brown     s=pcis->n_shared[i];
41580c7d97c5SJed Brown     total_counts+=s;
415953cdbc3dSStefano Zampini     for(j=0;j<s;j++){
41600c7d97c5SJed Brown       mat_graph->count[pcis->shared[i][j]] += 1;
41610c7d97c5SJed Brown     }
41620c7d97c5SJed Brown   }
4163534831adSStefano Zampini   /* Take into account Neumann data -> it increments number of sharing subdomains for nodes lying on the interface */
416436e030ebSStefano Zampini   ierr = PCBDDCGetNeumannBoundaries(pc,&used_IS);CHKERRQ(ierr);
4165da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
4166da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
416736e030ebSStefano Zampini   if(used_IS) {
416836e030ebSStefano Zampini     ierr = ISGetSize(used_IS,&neumann_bsize);CHKERRQ(ierr);
416936e030ebSStefano Zampini     ierr = ISGetIndices(used_IS,&neumann_nodes);CHKERRQ(ierr);
417053cdbc3dSStefano Zampini     for(i=0;i<neumann_bsize;i++){
417153cdbc3dSStefano Zampini       iindex = neumann_nodes[i];
4172534831adSStefano Zampini       if(mat_graph->count[iindex] > NEUMANNCNT && array[iindex]==0.0){
417353cdbc3dSStefano Zampini         mat_graph->count[iindex]+=1;
41740c7d97c5SJed Brown         total_counts++;
4175da1bb401SStefano Zampini         array[iindex]=array[iindex]+1.0;
4176da1bb401SStefano Zampini       } else if(array[iindex]>0.0) {
4177da1bb401SStefano Zampini         SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"Error for neumann nodes provided to BDDC! They must be uniquely listed! Found duplicate node %d\n",iindex);
41780c7d97c5SJed Brown       }
41790c7d97c5SJed Brown     }
41800c7d97c5SJed Brown   }
4181da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4182da1bb401SStefano Zampini   /* allocate space for storing the set of neighbours for each node */
4183da1bb401SStefano Zampini   ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt*),&mat_graph->neighbours_set);CHKERRQ(ierr);
4184da1bb401SStefano Zampini   if(mat_graph->nvtxs) { ierr = PetscMalloc(total_counts*sizeof(PetscInt),&mat_graph->neighbours_set[0]);CHKERRQ(ierr); }
4185da1bb401SStefano Zampini   for(i=1;i<mat_graph->nvtxs;i++) mat_graph->neighbours_set[i]=mat_graph->neighbours_set[i-1]+mat_graph->count[i-1];
4186a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->count,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
41873b03a366Sstefano_zampini   for(i=1;i<pcis->n_neigh;i++){
41880c7d97c5SJed Brown     s=pcis->n_shared[i];
41890c7d97c5SJed Brown     for(j=0;j<s;j++) {
41900c7d97c5SJed Brown       k=pcis->shared[i][j];
4191da1bb401SStefano Zampini       mat_graph->neighbours_set[k][mat_graph->count[k]] = pcis->neigh[i];
41920c7d97c5SJed Brown       mat_graph->count[k]+=1;
41930c7d97c5SJed Brown     }
41940c7d97c5SJed Brown   }
4195da1bb401SStefano Zampini   /* Check consistency of Neumann nodes */
4196da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
4197da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4198da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4199da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4200da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4201da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
42023b03a366Sstefano_zampini   /* set -1 fake neighbour to mimic Neumann boundary */
420336e030ebSStefano Zampini   if(used_IS) {
420453cdbc3dSStefano Zampini     for(i=0;i<neumann_bsize;i++){
420553cdbc3dSStefano Zampini       iindex = neumann_nodes[i];
4206534831adSStefano Zampini       if(mat_graph->count[iindex] > NEUMANNCNT){
4207da1bb401SStefano Zampini         if(mat_graph->count[iindex]+1 != (PetscInt)array[iindex]) {
4208da1bb401SStefano Zampini           SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_USER,"Neumann nodes provided to BDDC must be consistent among neighbours!\nNode %d: number of sharing subdomains %d != number of subdomains for which it is a neumann node %d\n",iindex,mat_graph->count[iindex]+1,(PetscInt)array[iindex]);
4209da1bb401SStefano Zampini         }
4210da1bb401SStefano Zampini         mat_graph->neighbours_set[iindex][mat_graph->count[iindex]] = -1;
421153cdbc3dSStefano Zampini         mat_graph->count[iindex]+=1;
42120c7d97c5SJed Brown       }
42130c7d97c5SJed Brown     }
421436e030ebSStefano Zampini     ierr = ISRestoreIndices(used_IS,&neumann_nodes);CHKERRQ(ierr);
42150c7d97c5SJed Brown   }
4216da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4217da1bb401SStefano Zampini   /* sort set of sharing subdomains */
4218da1bb401SStefano Zampini   for(i=0;i<mat_graph->nvtxs;i++) { ierr = PetscSortInt(mat_graph->count[i],mat_graph->neighbours_set[i]);CHKERRQ(ierr); }
42193b03a366Sstefano_zampini   /* remove interior nodes and dirichlet boundary nodes from the next search into the graph */
4220da1bb401SStefano Zampini   for(i=0;i<mat_graph->nvtxs;i++){mat_graph->touched[i]=PETSC_FALSE;}
4221da1bb401SStefano Zampini   nodes_touched=0;
422236e030ebSStefano Zampini   ierr = PCBDDCGetDirichletBoundaries(pc,&used_IS);CHKERRQ(ierr);
4223da1bb401SStefano Zampini   ierr = VecSet(pcis->vec2_N,0.0);CHKERRQ(ierr);
4224da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4225da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
4226da1bb401SStefano Zampini   if(used_IS) {
4227da1bb401SStefano Zampini     ierr = ISGetSize(used_IS,&dirichlet_bsize);CHKERRQ(ierr);
4228da1bb401SStefano Zampini     if(dirichlet_bsize && matis->pure_neumann) {
4229da1bb401SStefano Zampini       SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"Dirichlet boundaries are intended to be used with matrices with zeroed rows!\n");
4230da1bb401SStefano Zampini     }
4231da1bb401SStefano Zampini     ierr = ISGetIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
4232da1bb401SStefano Zampini     for(i=0;i<dirichlet_bsize;i++){
4233da1bb401SStefano Zampini       iindex=dirichlet_nodes[i];
4234da1bb401SStefano Zampini       if(mat_graph->count[iindex] && !mat_graph->touched[iindex]) {
4235da1bb401SStefano Zampini         if(array[iindex]>0.0) {
4236da1bb401SStefano Zampini           SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"BDDC cannot have nodes which are marked as Neumann and Dirichlet at the same time! Wrong node %d\n",iindex);
4237da1bb401SStefano Zampini         }
4238da1bb401SStefano Zampini         mat_graph->touched[iindex]=PETSC_TRUE;
4239da1bb401SStefano Zampini         mat_graph->where[iindex]=0;
4240da1bb401SStefano Zampini         nodes_touched++;
4241da1bb401SStefano Zampini         array2[iindex]=array2[iindex]+1.0;
4242da1bb401SStefano Zampini       }
4243da1bb401SStefano Zampini     }
4244da1bb401SStefano Zampini     ierr = ISRestoreIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
4245da1bb401SStefano Zampini   }
4246da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4247da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
4248da1bb401SStefano Zampini   /* Check consistency of Dirichlet nodes */
4249da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_N,1.0);CHKERRQ(ierr);
4250da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
4251da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4252da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4253da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4254da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4255da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
4256da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec2_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4257da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec2_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4258da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4259da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4260da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4261da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
426236e030ebSStefano Zampini   if(used_IS) {
426336e030ebSStefano Zampini     ierr = ISGetSize(used_IS,&dirichlet_bsize);CHKERRQ(ierr);
426436e030ebSStefano Zampini     ierr = ISGetIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
42653b03a366Sstefano_zampini     for(i=0;i<dirichlet_bsize;i++){
4266da1bb401SStefano Zampini       iindex=dirichlet_nodes[i];
4267da1bb401SStefano Zampini       if(array[iindex]>1.0 && array[iindex]!=array2[iindex] ) {
4268da1bb401SStefano Zampini          SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_USER,"Dirichlet nodes provided to BDDC must be consistent among neighbours!\nNode %d: number of sharing subdomains %d != number of subdomains for which it is a neumann node %d\n",iindex,(PetscInt)array[iindex],(PetscInt)array2[iindex]);
4269da1bb401SStefano Zampini       }
42703b03a366Sstefano_zampini     }
427136e030ebSStefano Zampini     ierr = ISRestoreIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
42723b03a366Sstefano_zampini   }
4273da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4274da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
4275da1bb401SStefano Zampini 
42760c7d97c5SJed Brown   for(i=0;i<mat_graph->nvtxs;i++){
42773b03a366Sstefano_zampini     if(!mat_graph->count[i]){  /* interior nodes */
42780c7d97c5SJed Brown       mat_graph->touched[i]=PETSC_TRUE;
42790c7d97c5SJed Brown       mat_graph->where[i]=0;
42800c7d97c5SJed Brown       nodes_touched++;
42810c7d97c5SJed Brown     }
42820c7d97c5SJed Brown   }
42830c7d97c5SJed Brown   mat_graph->ncmps = 0;
4284da1bb401SStefano Zampini   i=0;
42850c7d97c5SJed Brown   while(nodes_touched<mat_graph->nvtxs) {
4286a0ba757dSStefano Zampini     /*  find first untouched node in local ordering */
42870c7d97c5SJed Brown     while(mat_graph->touched[i]) i++;
42880c7d97c5SJed Brown     mat_graph->touched[i]=PETSC_TRUE;
4289a0ba757dSStefano Zampini     mat_graph->where[i]=where_values;
42900c7d97c5SJed Brown     nodes_touched++;
4291a0ba757dSStefano Zampini     /* now find all other nodes having the same set of sharing subdomains */
42920c7d97c5SJed Brown     for(j=i+1;j<mat_graph->nvtxs;j++){
4293a0ba757dSStefano Zampini       /* check for same number of sharing subdomains and dof number */
4294da1bb401SStefano Zampini       if(!mat_graph->touched[j] && mat_graph->count[i]==mat_graph->count[j] && mat_graph->which_dof[i] == mat_graph->which_dof[j] ){
4295a0ba757dSStefano Zampini         /* check for same set of sharing subdomains */
42960c7d97c5SJed Brown         same_set=PETSC_TRUE;
42970c7d97c5SJed Brown         for(k=0;k<mat_graph->count[j];k++){
4298da1bb401SStefano Zampini           if(mat_graph->neighbours_set[i][k]!=mat_graph->neighbours_set[j][k]) {
42990c7d97c5SJed Brown             same_set=PETSC_FALSE;
43000c7d97c5SJed Brown           }
43010c7d97c5SJed Brown         }
4302a0ba757dSStefano Zampini         /* I found a friend of mine */
43030c7d97c5SJed Brown         if(same_set) {
4304a0ba757dSStefano Zampini           mat_graph->where[j]=where_values;
43050c7d97c5SJed Brown           mat_graph->touched[j]=PETSC_TRUE;
43060c7d97c5SJed Brown           nodes_touched++;
43070c7d97c5SJed Brown         }
43080c7d97c5SJed Brown       }
43090c7d97c5SJed Brown     }
4310a0ba757dSStefano Zampini     where_values++;
43110c7d97c5SJed Brown   }
4312a0ba757dSStefano Zampini   where_values--; if(where_values<0) where_values=0;
4313a0ba757dSStefano Zampini   ierr = PetscMalloc(where_values*sizeof(PetscMPIInt),&mat_graph->where_ncmps);CHKERRQ(ierr);
4314a0ba757dSStefano Zampini   /* Find connected components defined on the shared interface */
4315a0ba757dSStefano Zampini   if(where_values) {
4316a0ba757dSStefano Zampini     ierr = PCBDDCFindConnectedComponents(mat_graph, where_values);
43173b03a366Sstefano_zampini     /* For consistency among neighbouring procs, I need to sort (by global ordering) each connected component */
4318a0ba757dSStefano Zampini     for(i=0;i<mat_graph->ncmps;i++) {
4319a0ba757dSStefano Zampini       ierr = ISLocalToGlobalMappingApply(matis->mapping,mat_graph->cptr[i+1]-mat_graph->cptr[i],&mat_graph->queue[mat_graph->cptr[i]],&queue_in_global_numbering[mat_graph->cptr[i]]);CHKERRQ(ierr);
4320a0ba757dSStefano Zampini       ierr = PetscSortIntWithArray(mat_graph->cptr[i+1]-mat_graph->cptr[i],&queue_in_global_numbering[mat_graph->cptr[i]],&mat_graph->queue[mat_graph->cptr[i]]);CHKERRQ(ierr);
4321a0ba757dSStefano Zampini     }
4322a0ba757dSStefano Zampini   }
4323a0ba757dSStefano Zampini   /* check consistency of connected components among neighbouring subdomains -> adapt them if needed */
4324a0ba757dSStefano Zampini   for(i=0;i<where_values;i++) {
43253b03a366Sstefano_zampini     /* We are not sure that two connected components will be the same among subdomains sharing a subset of local interface */
43263b03a366Sstefano_zampini     if(mat_graph->where_ncmps[i]>1) {
4327a0ba757dSStefano Zampini       adapt_interface=1;
4328a0ba757dSStefano Zampini       break;
4329a0ba757dSStefano Zampini     }
4330a0ba757dSStefano Zampini   }
4331a0ba757dSStefano Zampini   ierr = MPI_Allreduce(&adapt_interface,&adapt_interface_reduced,1,MPIU_INT,MPI_LOR,interface_comm);CHKERRQ(ierr);
4332da1bb401SStefano Zampini   if(pcbddc->dbg_flag && adapt_interface_reduced) {
4333d8923723SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"Adapting interface\n");CHKERRQ(ierr);
4334da1bb401SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
4335da1bb401SStefano Zampini   }
4336a0ba757dSStefano Zampini   if(where_values && adapt_interface_reduced) {
43370c7d97c5SJed Brown 
4338a0ba757dSStefano Zampini     PetscInt sum_requests=0,my_rank;
4339a0ba757dSStefano Zampini     PetscInt buffer_size,start_of_recv,size_of_recv,start_of_send;
4340a0ba757dSStefano Zampini     PetscInt temp_buffer_size,ins_val,global_where_counter;
4341a0ba757dSStefano Zampini     PetscInt *cum_recv_counts;
4342a0ba757dSStefano Zampini     PetscInt *where_to_nodes_indices;
4343a0ba757dSStefano Zampini     PetscInt *petsc_buffer;
4344a0ba757dSStefano Zampini     PetscMPIInt *recv_buffer;
4345a0ba757dSStefano Zampini     PetscMPIInt *recv_buffer_where;
4346a0ba757dSStefano Zampini     PetscMPIInt *send_buffer;
4347a0ba757dSStefano Zampini     PetscMPIInt size_of_send;
4348a0ba757dSStefano Zampini     PetscInt *sizes_of_sends;
4349a0ba757dSStefano Zampini     MPI_Request *send_requests;
4350a0ba757dSStefano Zampini     MPI_Request *recv_requests;
4351a0ba757dSStefano Zampini     PetscInt *where_cc_adapt;
4352a0ba757dSStefano Zampini     PetscInt **temp_buffer;
4353a0ba757dSStefano Zampini     PetscInt *nodes_to_temp_buffer_indices;
4354a0ba757dSStefano Zampini     PetscInt *add_to_where;
4355a0ba757dSStefano Zampini 
4356a0ba757dSStefano Zampini     ierr = MPI_Comm_rank(interface_comm,&my_rank);CHKERRQ(ierr);
4357a0ba757dSStefano Zampini     ierr = PetscMalloc((where_values+1)*sizeof(PetscInt),&cum_recv_counts);CHKERRQ(ierr);
4358a0ba757dSStefano Zampini     ierr = PetscMemzero(cum_recv_counts,(where_values+1)*sizeof(PetscInt));CHKERRQ(ierr);
4359a0ba757dSStefano Zampini     ierr = PetscMalloc(where_values*sizeof(PetscInt),&where_to_nodes_indices);CHKERRQ(ierr);
4360a0ba757dSStefano Zampini     /* first count how many neighbours per connected component I will receive from */
4361a0ba757dSStefano Zampini     cum_recv_counts[0]=0;
4362a0ba757dSStefano Zampini     for(i=1;i<where_values+1;i++){
4363a0ba757dSStefano Zampini       j=0;
4364d8923723SStefano Zampini       while(mat_graph->where[j] != i) { j++; }
4365a0ba757dSStefano Zampini       where_to_nodes_indices[i-1]=j;
4366da1bb401SStefano Zampini       if(mat_graph->neighbours_set[j][0]!=-1) { cum_recv_counts[i]=cum_recv_counts[i-1]+mat_graph->count[j]; } /* We don't want sends/recvs_to/from_self -> here I don't count myself  */
43673b03a366Sstefano_zampini       else { cum_recv_counts[i]=cum_recv_counts[i-1]+mat_graph->count[j]-1; }
4368a0ba757dSStefano Zampini     }
4369a0ba757dSStefano Zampini     ierr = PetscMalloc(2*cum_recv_counts[where_values]*sizeof(PetscMPIInt),&recv_buffer_where);CHKERRQ(ierr);
4370a0ba757dSStefano Zampini     ierr = PetscMalloc(cum_recv_counts[where_values]*sizeof(MPI_Request),&send_requests);CHKERRQ(ierr);
4371a0ba757dSStefano Zampini     ierr = PetscMalloc(cum_recv_counts[where_values]*sizeof(MPI_Request),&recv_requests);CHKERRQ(ierr);
4372a0ba757dSStefano Zampini     for(i=0;i<cum_recv_counts[where_values];i++) {
4373a0ba757dSStefano Zampini       send_requests[i]=MPI_REQUEST_NULL;
4374a0ba757dSStefano Zampini       recv_requests[i]=MPI_REQUEST_NULL;
4375a0ba757dSStefano Zampini     }
4376a0ba757dSStefano Zampini     /* exchange with my neighbours the number of my connected components on the shared interface */
4377a0ba757dSStefano Zampini     for(i=0;i<where_values;i++){
4378a0ba757dSStefano Zampini       j=where_to_nodes_indices[i];
4379da1bb401SStefano Zampini       k = (mat_graph->neighbours_set[j][0] == -1 ?  1 : 0);
4380a0ba757dSStefano Zampini       for(;k<mat_graph->count[j];k++){
4381da1bb401SStefano Zampini         ierr = MPI_Isend(&mat_graph->where_ncmps[i],1,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr);
4382da1bb401SStefano Zampini         ierr = MPI_Irecv(&recv_buffer_where[sum_requests],1,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr);
4383a0ba757dSStefano Zampini         sum_requests++;
4384a0ba757dSStefano Zampini       }
4385a0ba757dSStefano Zampini     }
4386a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4387a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4388a0ba757dSStefano Zampini     /* determine the connected component I need to adapt */
4389a0ba757dSStefano Zampini     ierr = PetscMalloc(where_values*sizeof(PetscInt),&where_cc_adapt);CHKERRQ(ierr);
4390a0ba757dSStefano Zampini     ierr = PetscMemzero(where_cc_adapt,where_values*sizeof(PetscInt));CHKERRQ(ierr);
4391a0ba757dSStefano Zampini     for(i=0;i<where_values;i++){
4392a0ba757dSStefano Zampini       for(j=cum_recv_counts[i];j<cum_recv_counts[i+1];j++){
43933b03a366Sstefano_zampini         /* The first condition is natural (i.e someone has a different number of cc than me), the second one is just to be safe */
43943b03a366Sstefano_zampini         if( mat_graph->where_ncmps[i]!=recv_buffer_where[j] || mat_graph->where_ncmps[i] > 1 ) {
4395a0ba757dSStefano Zampini           where_cc_adapt[i]=PETSC_TRUE;
4396a0ba757dSStefano Zampini           break;
4397a0ba757dSStefano Zampini         }
4398a0ba757dSStefano Zampini       }
4399a0ba757dSStefano Zampini     }
4400d8923723SStefano Zampini     buffer_size = 0;
4401d8923723SStefano Zampini     for(i=0;i<where_values;i++) {
4402d8923723SStefano Zampini       if(where_cc_adapt[i]) {
4403d8923723SStefano Zampini         for(j=i;j<mat_graph->ncmps;j++) {
4404d8923723SStefano Zampini           if(mat_graph->where[mat_graph->queue[mat_graph->cptr[j]]] == i+1) { /* WARNING -> where values goes from 1 to where_values included */
4405d8923723SStefano Zampini             buffer_size += 1 + mat_graph->cptr[j+1]-mat_graph->cptr[j];
4406d8923723SStefano Zampini           }
4407d8923723SStefano Zampini         }
4408d8923723SStefano Zampini       }
4409d8923723SStefano Zampini     }
4410d8923723SStefano Zampini     ierr = PetscMalloc(buffer_size*sizeof(PetscMPIInt),&send_buffer);CHKERRQ(ierr);
4411a0ba757dSStefano Zampini     /* now get from neighbours their ccs (in global numbering) and adapt them (in case it is needed) */
4412a0ba757dSStefano Zampini     /* first determine how much data to send (size of each queue plus the global indices) and communicate it to neighbours */
4413a0ba757dSStefano Zampini     ierr = PetscMalloc(where_values*sizeof(PetscInt),&sizes_of_sends);CHKERRQ(ierr);
4414a0ba757dSStefano Zampini     ierr = PetscMemzero(sizes_of_sends,where_values*sizeof(PetscInt));CHKERRQ(ierr);
4415a0ba757dSStefano Zampini     sum_requests=0;
4416a0ba757dSStefano Zampini     start_of_send=0;
4417a0ba757dSStefano Zampini     start_of_recv=cum_recv_counts[where_values];
4418a0ba757dSStefano Zampini     for(i=0;i<where_values;i++) {
4419a0ba757dSStefano Zampini       if(where_cc_adapt[i]) {
4420a0ba757dSStefano Zampini         size_of_send=0;
4421a0ba757dSStefano Zampini         for(j=i;j<mat_graph->ncmps;j++) {
4422a0ba757dSStefano Zampini           if(mat_graph->where[mat_graph->queue[mat_graph->cptr[j]]] == i+1) { /* WARNING -> where values goes from 1 to where_values included */
4423a0ba757dSStefano Zampini             send_buffer[start_of_send+size_of_send]=mat_graph->cptr[j+1]-mat_graph->cptr[j];
4424a0ba757dSStefano Zampini             size_of_send+=1;
4425a0ba757dSStefano Zampini             for(k=0;k<mat_graph->cptr[j+1]-mat_graph->cptr[j];k++) {
4426a0ba757dSStefano Zampini               send_buffer[start_of_send+size_of_send+k]=queue_in_global_numbering[mat_graph->cptr[j]+k];
4427a0ba757dSStefano Zampini             }
4428a0ba757dSStefano Zampini             size_of_send=size_of_send+mat_graph->cptr[j+1]-mat_graph->cptr[j];
4429a0ba757dSStefano Zampini           }
4430a0ba757dSStefano Zampini         }
4431a0ba757dSStefano Zampini         j = where_to_nodes_indices[i];
4432da1bb401SStefano Zampini         k = (mat_graph->neighbours_set[j][0] == -1 ?  1 : 0);
443311d8f4c2SStefano Zampini         sizes_of_sends[i]=size_of_send;
4434a0ba757dSStefano Zampini         for(;k<mat_graph->count[j];k++){
443511d8f4c2SStefano Zampini           ierr = MPI_Isend(&sizes_of_sends[i],1,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr);
4436da1bb401SStefano Zampini           ierr = MPI_Irecv(&recv_buffer_where[sum_requests+start_of_recv],1,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr);
4437a0ba757dSStefano Zampini           sum_requests++;
4438a0ba757dSStefano Zampini         }
4439a0ba757dSStefano Zampini         start_of_send+=size_of_send;
4440a0ba757dSStefano Zampini       }
4441a0ba757dSStefano Zampini     }
4442a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4443a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4444a0ba757dSStefano Zampini     buffer_size=0;
4445a0ba757dSStefano Zampini     for(k=0;k<sum_requests;k++) { buffer_size+=recv_buffer_where[start_of_recv+k]; }
4446a0ba757dSStefano Zampini     ierr = PetscMalloc(buffer_size*sizeof(PetscMPIInt),&recv_buffer);CHKERRQ(ierr);
4447a0ba757dSStefano Zampini     /* now exchange the data */
4448a0ba757dSStefano Zampini     start_of_recv=0;
4449a0ba757dSStefano Zampini     start_of_send=0;
4450a0ba757dSStefano Zampini     sum_requests=0;
4451a0ba757dSStefano Zampini     for(i=0;i<where_values;i++) {
4452a0ba757dSStefano Zampini       if(where_cc_adapt[i]) {
4453a0ba757dSStefano Zampini         size_of_send = sizes_of_sends[i];
4454a0ba757dSStefano Zampini         j = where_to_nodes_indices[i];
4455da1bb401SStefano Zampini         k = (mat_graph->neighbours_set[j][0] == -1 ?  1 : 0);
4456a0ba757dSStefano Zampini         for(;k<mat_graph->count[j];k++){
4457da1bb401SStefano Zampini           ierr = MPI_Isend(&send_buffer[start_of_send],size_of_send,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr);
4458a0ba757dSStefano Zampini           size_of_recv=recv_buffer_where[cum_recv_counts[where_values]+sum_requests];
4459da1bb401SStefano Zampini           ierr = MPI_Irecv(&recv_buffer[start_of_recv],size_of_recv,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr);
4460a0ba757dSStefano Zampini           start_of_recv+=size_of_recv;
4461a0ba757dSStefano Zampini           sum_requests++;
4462a0ba757dSStefano Zampini         }
4463a0ba757dSStefano Zampini         start_of_send+=size_of_send;
4464a0ba757dSStefano Zampini       }
4465a0ba757dSStefano Zampini     }
4466a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4467a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4468a0ba757dSStefano Zampini     ierr = PetscMalloc(buffer_size*sizeof(PetscInt),&petsc_buffer);CHKERRQ(ierr);
4469a0ba757dSStefano Zampini     for(k=0;k<start_of_recv;k++) { petsc_buffer[k]=(PetscInt)recv_buffer[k]; }
4470a0ba757dSStefano Zampini     for(j=0;j<buffer_size;) {
4471a0ba757dSStefano Zampini        ierr = ISGlobalToLocalMappingApply(matis->mapping,IS_GTOLM_MASK,petsc_buffer[j],&petsc_buffer[j+1],&petsc_buffer[j],&petsc_buffer[j+1]);CHKERRQ(ierr);
4472a0ba757dSStefano Zampini        k=petsc_buffer[j]+1;
4473a0ba757dSStefano Zampini        j+=k;
4474a0ba757dSStefano Zampini     }
4475a0ba757dSStefano Zampini     sum_requests=cum_recv_counts[where_values];
4476a0ba757dSStefano Zampini     start_of_recv=0;
4477a0ba757dSStefano Zampini     ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt),&nodes_to_temp_buffer_indices);CHKERRQ(ierr);
4478a0ba757dSStefano Zampini     global_where_counter=0;
4479a0ba757dSStefano Zampini     for(i=0;i<where_values;i++){
4480a0ba757dSStefano Zampini       if(where_cc_adapt[i]){
4481a0ba757dSStefano Zampini         temp_buffer_size=0;
4482a0ba757dSStefano Zampini         /* find nodes on the shared interface we need to adapt */
4483a0ba757dSStefano Zampini         for(j=0;j<mat_graph->nvtxs;j++){
4484a0ba757dSStefano Zampini           if(mat_graph->where[j]==i+1) {
4485a0ba757dSStefano Zampini             nodes_to_temp_buffer_indices[j]=temp_buffer_size;
4486a0ba757dSStefano Zampini             temp_buffer_size++;
4487a0ba757dSStefano Zampini           } else {
4488a0ba757dSStefano Zampini             nodes_to_temp_buffer_indices[j]=-1;
4489a0ba757dSStefano Zampini           }
4490a0ba757dSStefano Zampini         }
4491a0ba757dSStefano Zampini         /* allocate some temporary space */
4492a0ba757dSStefano Zampini         ierr = PetscMalloc(temp_buffer_size*sizeof(PetscInt*),&temp_buffer);CHKERRQ(ierr);
4493a0ba757dSStefano Zampini         ierr = PetscMalloc(temp_buffer_size*(cum_recv_counts[i+1]-cum_recv_counts[i])*sizeof(PetscInt),&temp_buffer[0]);CHKERRQ(ierr);
4494a0ba757dSStefano Zampini         ierr = PetscMemzero(temp_buffer[0],temp_buffer_size*(cum_recv_counts[i+1]-cum_recv_counts[i])*sizeof(PetscInt));CHKERRQ(ierr);
4495a0ba757dSStefano Zampini         for(j=1;j<temp_buffer_size;j++){
4496a0ba757dSStefano Zampini           temp_buffer[j]=temp_buffer[j-1]+cum_recv_counts[i+1]-cum_recv_counts[i];
4497a0ba757dSStefano Zampini         }
4498a0ba757dSStefano Zampini         /* analyze contributions from neighbouring subdomains for i-th conn comp
4499a0ba757dSStefano Zampini            temp buffer structure:
4500a0ba757dSStefano Zampini            supposing part of the interface has dimension 5 (global nodes 0,1,2,3,4)
4501a0ba757dSStefano Zampini            3 neighs procs with structured connected components:
4502a0ba757dSStefano Zampini              neigh 0: [0 1 4], [2 3];  (2 connected components)
4503a0ba757dSStefano Zampini              neigh 1: [0 1], [2 3 4];  (2 connected components)
4504a0ba757dSStefano Zampini              neigh 2: [0 4], [1], [2 3]; (3 connected components)
4505a0ba757dSStefano Zampini            tempbuffer (row-oriented) should be filled as:
4506a0ba757dSStefano Zampini              [ 0, 0, 0;
4507a0ba757dSStefano Zampini                0, 0, 1;
4508a0ba757dSStefano Zampini                1, 1, 2;
4509a0ba757dSStefano Zampini                1, 1, 2;
4510a0ba757dSStefano Zampini                0, 1, 0; ];
4511a0ba757dSStefano Zampini            This way we can simply recover the resulting structure account for possible intersections of ccs among neighs.
4512a0ba757dSStefano Zampini            The mat_graph->where array will be modified to reproduce the following 4 connected components [0], [1], [2 3], [4];
4513a0ba757dSStefano Zampini                                                                                                                                    */
4514a0ba757dSStefano Zampini         for(j=0;j<cum_recv_counts[i+1]-cum_recv_counts[i];j++) {
4515a0ba757dSStefano Zampini           ins_val=0;
4516a0ba757dSStefano Zampini           size_of_recv=recv_buffer_where[sum_requests];  /* total size of recv from neighs */
4517a0ba757dSStefano Zampini           for(buffer_size=0;buffer_size<size_of_recv;) {  /* loop until all data from neighs has been taken into account */
4518a0ba757dSStefano Zampini             for(k=1;k<petsc_buffer[buffer_size+start_of_recv]+1;k++) { /* filling properly temp_buffer using data from a single recv */
4519a0ba757dSStefano Zampini               temp_buffer[ nodes_to_temp_buffer_indices[ petsc_buffer[ start_of_recv+buffer_size+k ] ] ][j]=ins_val;
4520a0ba757dSStefano Zampini             }
4521a0ba757dSStefano Zampini             buffer_size+=k;
4522a0ba757dSStefano Zampini             ins_val++;
4523a0ba757dSStefano Zampini           }
4524a0ba757dSStefano Zampini           start_of_recv+=size_of_recv;
4525a0ba757dSStefano Zampini           sum_requests++;
4526a0ba757dSStefano Zampini         }
4527a0ba757dSStefano Zampini         ierr = PetscMalloc(temp_buffer_size*sizeof(PetscInt),&add_to_where);CHKERRQ(ierr);
4528a0ba757dSStefano Zampini         ierr = PetscMemzero(add_to_where,temp_buffer_size*sizeof(PetscInt));CHKERRQ(ierr);
4529a0ba757dSStefano Zampini         for(j=0;j<temp_buffer_size;j++){
4530a0ba757dSStefano Zampini           if(!add_to_where[j]){ /* found a new cc  */
4531a0ba757dSStefano Zampini             global_where_counter++;
4532a0ba757dSStefano Zampini             add_to_where[j]=global_where_counter;
4533a0ba757dSStefano Zampini             for(k=j+1;k<temp_buffer_size;k++){ /* check for other nodes in new cc */
4534a0ba757dSStefano Zampini               same_set=PETSC_TRUE;
4535a0ba757dSStefano Zampini               for(s=0;s<cum_recv_counts[i+1]-cum_recv_counts[i];s++){
4536a0ba757dSStefano Zampini                 if(temp_buffer[j][s]!=temp_buffer[k][s]) {
4537a0ba757dSStefano Zampini                   same_set=PETSC_FALSE;
4538a0ba757dSStefano Zampini                   break;
4539a0ba757dSStefano Zampini                 }
4540a0ba757dSStefano Zampini               }
4541a0ba757dSStefano Zampini               if(same_set) add_to_where[k]=global_where_counter;
4542a0ba757dSStefano Zampini             }
4543a0ba757dSStefano Zampini           }
4544a0ba757dSStefano Zampini         }
4545a0ba757dSStefano Zampini         /* insert new data in where array */
4546a0ba757dSStefano Zampini         temp_buffer_size=0;
4547a0ba757dSStefano Zampini         for(j=0;j<mat_graph->nvtxs;j++){
4548a0ba757dSStefano Zampini           if(mat_graph->where[j]==i+1) {
4549a0ba757dSStefano Zampini             mat_graph->where[j]=where_values+add_to_where[temp_buffer_size];
4550a0ba757dSStefano Zampini             temp_buffer_size++;
4551a0ba757dSStefano Zampini           }
4552a0ba757dSStefano Zampini         }
4553a0ba757dSStefano Zampini         ierr = PetscFree(temp_buffer[0]);CHKERRQ(ierr);
4554a0ba757dSStefano Zampini         ierr = PetscFree(temp_buffer);CHKERRQ(ierr);
4555a0ba757dSStefano Zampini         ierr = PetscFree(add_to_where);CHKERRQ(ierr);
4556a0ba757dSStefano Zampini       }
4557a0ba757dSStefano Zampini     }
4558a0ba757dSStefano Zampini     ierr = PetscFree(nodes_to_temp_buffer_indices);CHKERRQ(ierr);
4559a0ba757dSStefano Zampini     ierr = PetscFree(sizes_of_sends);CHKERRQ(ierr);
4560a0ba757dSStefano Zampini     ierr = PetscFree(send_requests);CHKERRQ(ierr);
4561a0ba757dSStefano Zampini     ierr = PetscFree(recv_requests);CHKERRQ(ierr);
4562a0ba757dSStefano Zampini     ierr = PetscFree(petsc_buffer);CHKERRQ(ierr);
4563a0ba757dSStefano Zampini     ierr = PetscFree(recv_buffer);CHKERRQ(ierr);
4564a0ba757dSStefano Zampini     ierr = PetscFree(recv_buffer_where);CHKERRQ(ierr);
4565a0ba757dSStefano Zampini     ierr = PetscFree(send_buffer);CHKERRQ(ierr);
4566a0ba757dSStefano Zampini     ierr = PetscFree(cum_recv_counts);CHKERRQ(ierr);
4567a0ba757dSStefano Zampini     ierr = PetscFree(where_to_nodes_indices);CHKERRQ(ierr);
456823d4d1a5SStefano Zampini     ierr = PetscFree(where_cc_adapt);CHKERRQ(ierr);
4569a0ba757dSStefano Zampini     /* We are ready to evaluate consistent connected components on each part of the shared interface */
4570a0ba757dSStefano Zampini     if(global_where_counter) {
4571a0ba757dSStefano Zampini       for(i=0;i<mat_graph->nvtxs;i++){ mat_graph->touched[i]=PETSC_FALSE; }
4572a0ba757dSStefano Zampini       global_where_counter=0;
4573a0ba757dSStefano Zampini       for(i=0;i<mat_graph->nvtxs;i++){
4574a0ba757dSStefano Zampini         if(mat_graph->where[i] && !mat_graph->touched[i]) {
4575a0ba757dSStefano Zampini           global_where_counter++;
4576a0ba757dSStefano Zampini           for(j=i+1;j<mat_graph->nvtxs;j++){
4577a0ba757dSStefano Zampini             if(!mat_graph->touched[j] && mat_graph->where[j]==mat_graph->where[i]) {
4578a0ba757dSStefano Zampini               mat_graph->where[j]=global_where_counter;
4579a0ba757dSStefano Zampini               mat_graph->touched[j]=PETSC_TRUE;
4580a0ba757dSStefano Zampini             }
4581a0ba757dSStefano Zampini           }
4582a0ba757dSStefano Zampini           mat_graph->where[i]=global_where_counter;
4583a0ba757dSStefano Zampini           mat_graph->touched[i]=PETSC_TRUE;
4584a0ba757dSStefano Zampini         }
4585a0ba757dSStefano Zampini       }
4586a0ba757dSStefano Zampini       where_values=global_where_counter;
4587a0ba757dSStefano Zampini     }
4588a0ba757dSStefano Zampini     if(global_where_counter) {
4589a0ba757dSStefano Zampini       ierr = PetscMemzero(mat_graph->cptr,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr);
4590a0ba757dSStefano Zampini       ierr = PetscMemzero(mat_graph->queue,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
4591a0ba757dSStefano Zampini       ierr = PetscFree(mat_graph->where_ncmps);CHKERRQ(ierr);
4592a0ba757dSStefano Zampini       ierr = PetscMalloc(where_values*sizeof(PetscMPIInt),&mat_graph->where_ncmps);CHKERRQ(ierr);
4593a0ba757dSStefano Zampini       ierr = PCBDDCFindConnectedComponents(mat_graph, where_values);
4594a0ba757dSStefano Zampini       for(i=0;i<mat_graph->ncmps;i++) {
4595a0ba757dSStefano Zampini         ierr = ISLocalToGlobalMappingApply(matis->mapping,mat_graph->cptr[i+1]-mat_graph->cptr[i],&mat_graph->queue[mat_graph->cptr[i]],&queue_in_global_numbering[mat_graph->cptr[i]]);CHKERRQ(ierr);
4596a0ba757dSStefano Zampini         ierr = PetscSortIntWithArray(mat_graph->cptr[i+1]-mat_graph->cptr[i],&queue_in_global_numbering[mat_graph->cptr[i]],&mat_graph->queue[mat_graph->cptr[i]]);CHKERRQ(ierr);
4597a0ba757dSStefano Zampini       }
4598a0ba757dSStefano Zampini     }
45993b03a366Sstefano_zampini   } /* Finished adapting interface */
46000c7d97c5SJed Brown   PetscInt nfc=0;
46010c7d97c5SJed Brown   PetscInt nec=0;
46020c7d97c5SJed Brown   PetscInt nvc=0;
46033b03a366Sstefano_zampini   PetscBool twodim_flag=PETSC_FALSE;
46040c7d97c5SJed Brown   for (i=0; i<mat_graph->ncmps; i++) {
46053b03a366Sstefano_zampini     if( mat_graph->cptr[i+1]-mat_graph->cptr[i] > vertex_size ){
4606534831adSStefano Zampini       if(mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]==1){ /* 1 neigh Neumann fake included */
46070c7d97c5SJed Brown         nfc++;
46083b03a366Sstefano_zampini       } else { /* note that nec will be zero in 2d */
46093b03a366Sstefano_zampini         nec++;
46103b03a366Sstefano_zampini       }
46110c7d97c5SJed Brown     } else {
46123b03a366Sstefano_zampini       nvc+=mat_graph->cptr[i+1]-mat_graph->cptr[i];
46133b03a366Sstefano_zampini     }
46143b03a366Sstefano_zampini   }
46153b03a366Sstefano_zampini 
46163b03a366Sstefano_zampini   if(!nec) { /* we are in a 2d case -> no faces, only edges */
46173b03a366Sstefano_zampini     nec = nfc;
46183b03a366Sstefano_zampini     nfc = 0;
46193b03a366Sstefano_zampini     twodim_flag = PETSC_TRUE;
46203b03a366Sstefano_zampini   }
46213972b0daSStefano Zampini   /* allocate IS arrays for faces, edges. Vertices need a single index set. */
46223972b0daSStefano Zampini   k=0;
46233972b0daSStefano Zampini   for (i=0; i<mat_graph->ncmps; i++) {
46243972b0daSStefano Zampini     j=mat_graph->cptr[i+1]-mat_graph->cptr[i];
46253972b0daSStefano Zampini     if( j > k) {
46263972b0daSStefano Zampini       k=j;
46273972b0daSStefano Zampini     }
4628ba1573a8SStefano Zampini     if(j<=vertex_size) {
4629ba1573a8SStefano Zampini       k+=vertex_size;
4630ba1573a8SStefano Zampini     }
46313972b0daSStefano Zampini   }
46323972b0daSStefano Zampini   ierr = PetscMalloc(k*sizeof(PetscInt),&auxis);CHKERRQ(ierr);
46333972b0daSStefano Zampini 
46343b03a366Sstefano_zampini   if(!pcbddc->vertices_flag && !pcbddc->edges_flag) {
46353b03a366Sstefano_zampini     ierr = PetscMalloc(nfc*sizeof(IS),&pcbddc->ISForFaces);CHKERRQ(ierr);
46363b03a366Sstefano_zampini     use_faces=PETSC_TRUE;
46373b03a366Sstefano_zampini   }
46383b03a366Sstefano_zampini   if(!pcbddc->vertices_flag && !pcbddc->faces_flag) {
46393b03a366Sstefano_zampini     ierr = PetscMalloc(nec*sizeof(IS),&pcbddc->ISForEdges);CHKERRQ(ierr);
46403b03a366Sstefano_zampini     use_edges=PETSC_TRUE;
46413b03a366Sstefano_zampini   }
46423b03a366Sstefano_zampini   nfc=0;
46433b03a366Sstefano_zampini   nec=0;
46443b03a366Sstefano_zampini   for (i=0; i<mat_graph->ncmps; i++) {
46453b03a366Sstefano_zampini     if( mat_graph->cptr[i+1]-mat_graph->cptr[i] > vertex_size ){
46463b03a366Sstefano_zampini       for(j=0;j<mat_graph->cptr[i+1]-mat_graph->cptr[i];j++) {
46473972b0daSStefano Zampini         auxis[j]=mat_graph->queue[mat_graph->cptr[i]+j];
46483b03a366Sstefano_zampini       }
46493b03a366Sstefano_zampini       if(mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]==1){
46503b03a366Sstefano_zampini         if(twodim_flag) {
46513b03a366Sstefano_zampini           if(use_edges) {
46523972b0daSStefano Zampini             ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForEdges[nec]);CHKERRQ(ierr);
46533b03a366Sstefano_zampini             nec++;
46543b03a366Sstefano_zampini           }
46553b03a366Sstefano_zampini         } else {
46563b03a366Sstefano_zampini           if(use_faces) {
46573972b0daSStefano Zampini             ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForFaces[nfc]);CHKERRQ(ierr);
46583b03a366Sstefano_zampini             nfc++;
46593b03a366Sstefano_zampini           }
46603b03a366Sstefano_zampini         }
46613b03a366Sstefano_zampini       } else {
46623b03a366Sstefano_zampini         if(use_edges) {
46633972b0daSStefano Zampini           ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForEdges[nec]);CHKERRQ(ierr);
46640c7d97c5SJed Brown           nec++;
46650c7d97c5SJed Brown         }
46660c7d97c5SJed Brown       }
46670c7d97c5SJed Brown     }
46683b03a366Sstefano_zampini   }
46693b03a366Sstefano_zampini   pcbddc->n_ISForFaces=nfc;
46703b03a366Sstefano_zampini   pcbddc->n_ISForEdges=nec;
46713b03a366Sstefano_zampini   nvc=0;
46720c7d97c5SJed Brown   if( !pcbddc->constraints_flag ) {
46733b03a366Sstefano_zampini     for (i=0; i<mat_graph->ncmps; i++) {
46743b03a366Sstefano_zampini       if( mat_graph->cptr[i+1]-mat_graph->cptr[i] <= vertex_size ){
46753b03a366Sstefano_zampini         for( j=mat_graph->cptr[i];j<mat_graph->cptr[i+1];j++) {
46763972b0daSStefano Zampini           auxis[nvc]=mat_graph->queue[j];
46770c7d97c5SJed Brown           nvc++;
46780c7d97c5SJed Brown         }
46790c7d97c5SJed Brown       }
46800c7d97c5SJed Brown     }
46810c7d97c5SJed Brown   }
4682a0ba757dSStefano Zampini   /* sort vertex set (by local ordering) */
46833972b0daSStefano Zampini   ierr = PetscSortInt(nvc,auxis);CHKERRQ(ierr);
46843972b0daSStefano Zampini   ierr = ISCreateGeneral(PETSC_COMM_SELF,nvc,auxis,PETSC_COPY_VALUES,&pcbddc->ISForVertices);CHKERRQ(ierr);
46850c7d97c5SJed Brown 
4686e269702eSStefano Zampini   if(pcbddc->dbg_flag) {
4687e269702eSStefano Zampini 
4688d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr);
4689d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Details from PCBDDCManageLocalBoundaries for subdomain %04d\n",PetscGlobalRank);CHKERRQ(ierr);
4690d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr);
4691a0ba757dSStefano Zampini /*    ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Graph (adjacency structure) of local Neumann mat\n");CHKERRQ(ierr);
4692a0ba757dSStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr);
4693e269702eSStefano Zampini     for(i=0;i<mat_graph->nvtxs;i++) {
4694a0ba757dSStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Nodes connected to node number %d are %d\n",i,mat_graph->xadj[i+1]-mat_graph->xadj[i]);CHKERRQ(ierr);
4695e269702eSStefano Zampini       for(j=mat_graph->xadj[i];j<mat_graph->xadj[i+1];j++){
4696a0ba757dSStefano Zampini         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d ",mat_graph->adjncy[j]);CHKERRQ(ierr);
4697e269702eSStefano Zampini       }
4698a0ba757dSStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n--------------------------------------------------------------\n");CHKERRQ(ierr);
4699da1bb401SStefano Zampini     }*/
4700d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Matrix graph has %d connected components", mat_graph->ncmps);CHKERRQ(ierr);
47010c7d97c5SJed Brown     for(i=0;i<mat_graph->ncmps;i++) {
47023b03a366Sstefano_zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\nDetails for connected component number %02d: size %04d, count %01d. Nodes follow.\n",
47033b03a366Sstefano_zampini              i,mat_graph->cptr[i+1]-mat_graph->cptr[i],mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]);CHKERRQ(ierr);
4704da1bb401SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"subdomains: ");
4705da1bb401SStefano Zampini       for (j=0;j<mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]; j++) {
4706da1bb401SStefano Zampini         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d ",mat_graph->neighbours_set[mat_graph->queue[mat_graph->cptr[i]]][j]);
4707da1bb401SStefano Zampini       }
4708da1bb401SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n");
47090c7d97c5SJed Brown       for (j=mat_graph->cptr[i]; j<mat_graph->cptr[i+1]; j++){
4710da1bb401SStefano Zampini         /* ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d (%d), ",queue_in_global_numbering[j],mat_graph->queue[j]);CHKERRQ(ierr); */
4711da1bb401SStefano Zampini         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d, ",mat_graph->queue[j]);CHKERRQ(ierr);
47120c7d97c5SJed Brown       }
47130c7d97c5SJed Brown     }
4714da1bb401SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n--------------------------------------------------------------\n");CHKERRQ(ierr);
47153b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local vertices\n",PetscGlobalRank,nvc);CHKERRQ(ierr);
47163b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local faces\n",PetscGlobalRank,nfc);CHKERRQ(ierr);
47173b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local edges\n",PetscGlobalRank,nec);CHKERRQ(ierr);
4718d49ef151SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
47190c7d97c5SJed Brown   }
47200c7d97c5SJed Brown 
47213972b0daSStefano Zampini   ierr = PetscFree(queue_in_global_numbering);CHKERRQ(ierr);
47223972b0daSStefano Zampini   ierr = PetscFree(auxis);CHKERRQ(ierr);
47230c7d97c5SJed Brown   PetscFunctionReturn(0);
47240c7d97c5SJed Brown 
47250c7d97c5SJed Brown }
47260c7d97c5SJed Brown 
47270c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
47280c7d97c5SJed Brown 
47290c7d97c5SJed Brown /* The following code has been adapted from function IsConnectedSubdomain contained
4730da1bb401SStefano Zampini    in source file contig.c of METIS library (version 5.0.1)
4731da1bb401SStefano Zampini    It finds connected components of each partition labeled from 1 to n_dist  */
47320c7d97c5SJed Brown 
47330c7d97c5SJed Brown #undef __FUNCT__
47340c7d97c5SJed Brown #define __FUNCT__ "PCBDDCFindConnectedComponents"
47359c0446d6SStefano Zampini static PetscErrorCode PCBDDCFindConnectedComponents(PCBDDCGraph graph, PetscInt n_dist )
47360c7d97c5SJed Brown {
47370c7d97c5SJed Brown   PetscInt i, j, k, nvtxs, first, last, nleft, ncmps,pid,cum_queue,n,ncmps_pid;
47380c7d97c5SJed Brown   PetscInt *xadj, *adjncy, *where, *queue;
47390c7d97c5SJed Brown   PetscInt *cptr;
47400c7d97c5SJed Brown   PetscBool *touched;
47410c7d97c5SJed Brown 
47420c7d97c5SJed Brown   PetscFunctionBegin;
47430c7d97c5SJed Brown 
47440c7d97c5SJed Brown   nvtxs   = graph->nvtxs;
47450c7d97c5SJed Brown   xadj    = graph->xadj;
47460c7d97c5SJed Brown   adjncy  = graph->adjncy;
47470c7d97c5SJed Brown   where   = graph->where;
47480c7d97c5SJed Brown   touched = graph->touched;
47490c7d97c5SJed Brown   queue   = graph->queue;
47500c7d97c5SJed Brown   cptr    = graph->cptr;
47510c7d97c5SJed Brown 
47520c7d97c5SJed Brown   for (i=0; i<nvtxs; i++)
47530c7d97c5SJed Brown     touched[i] = PETSC_FALSE;
47540c7d97c5SJed Brown 
47550c7d97c5SJed Brown   cum_queue=0;
47560c7d97c5SJed Brown   ncmps=0;
47570c7d97c5SJed Brown 
47580c7d97c5SJed Brown   for(n=0; n<n_dist; n++) {
4759da1bb401SStefano Zampini     pid = n+1;  /* partition labeled by 0 is discarded */
47600c7d97c5SJed Brown     nleft = 0;
47610c7d97c5SJed Brown     for (i=0; i<nvtxs; i++) {
47620c7d97c5SJed Brown       if (where[i] == pid)
47630c7d97c5SJed Brown         nleft++;
47640c7d97c5SJed Brown     }
47650c7d97c5SJed Brown     for (i=0; i<nvtxs; i++) {
47660c7d97c5SJed Brown       if (where[i] == pid)
47670c7d97c5SJed Brown         break;
47680c7d97c5SJed Brown     }
47690c7d97c5SJed Brown     touched[i] = PETSC_TRUE;
47700c7d97c5SJed Brown     queue[cum_queue] = i;
47710c7d97c5SJed Brown     first = 0; last = 1;
47720c7d97c5SJed Brown     cptr[ncmps] = cum_queue;  /* This actually points to queue */
47730c7d97c5SJed Brown     ncmps_pid = 0;
47740c7d97c5SJed Brown     while (first != nleft) {
47750c7d97c5SJed Brown       if (first == last) { /* Find another starting vertex */
47760c7d97c5SJed Brown         cptr[++ncmps] = first+cum_queue;
47770c7d97c5SJed Brown         ncmps_pid++;
47780c7d97c5SJed Brown         for (i=0; i<nvtxs; i++) {
47790c7d97c5SJed Brown           if (where[i] == pid && !touched[i])
47800c7d97c5SJed Brown             break;
47810c7d97c5SJed Brown         }
47820c7d97c5SJed Brown         queue[cum_queue+last] = i;
47830c7d97c5SJed Brown         last++;
47840c7d97c5SJed Brown         touched[i] = PETSC_TRUE;
47850c7d97c5SJed Brown       }
47860c7d97c5SJed Brown       i = queue[cum_queue+first];
47870c7d97c5SJed Brown       first++;
47880c7d97c5SJed Brown       for (j=xadj[i]; j<xadj[i+1]; j++) {
47890c7d97c5SJed Brown         k = adjncy[j];
47900c7d97c5SJed Brown         if (where[k] == pid && !touched[k]) {
47910c7d97c5SJed Brown           queue[cum_queue+last] = k;
47920c7d97c5SJed Brown           last++;
47930c7d97c5SJed Brown           touched[k] = PETSC_TRUE;
47940c7d97c5SJed Brown         }
47950c7d97c5SJed Brown       }
47960c7d97c5SJed Brown     }
47970c7d97c5SJed Brown     cptr[++ncmps] = first+cum_queue;
47980c7d97c5SJed Brown     ncmps_pid++;
47990c7d97c5SJed Brown     cum_queue=cptr[ncmps];
4800a0ba757dSStefano Zampini     graph->where_ncmps[n] = ncmps_pid;
48010c7d97c5SJed Brown   }
48020c7d97c5SJed Brown   graph->ncmps = ncmps;
48030c7d97c5SJed Brown 
48040c7d97c5SJed Brown   PetscFunctionReturn(0);
48050c7d97c5SJed Brown }
4806