xref: /petsc/src/ksp/pc/impls/bddc/bddc.c (revision 0bdf917e49196d1b82a9235c97597536d20d8387)
/* TODOLIST
   DofSplitting and DM attached to pc?
   Change SetNeumannBoundaries to SetNeumannBoundariesLocal and provide new SetNeumannBoundaries (same for Dirichlet)
     - change prec_type to switch_inexact_prec_type
   Inexact solvers: global preconditioner application is ready, ask the developers (Jed?) how to best implement Dohrmann's approach (PCSHELL?)
   change how to deal with the coarse problem (PCBDDCSetCoarseEnvironment):
     - simplify coarse problem structure -> PCBDDC or PCREDUNDANT, nothing else -> same comm for all levels?
     - remove coarse enums and allow use of PCBDDCGetCoarseKSP
     - remove metis dependency -> use MatPartitioning for multilevel -> Assemble serial adjacency in ManageLocalBoundaries?
     - Add levels' slot to bddc data structure and associated Set/Get functions
   code refactoring:
     - pick better names for static functions
   change options structure:
     - insert BDDC into MG framework?
   provide other ops? Ask the developers
   remove all unused printf
   man pages
*/
190c7d97c5SJed Brown 
2053cdbc3dSStefano Zampini /* ----------------------------------------------------------------------------------------------------------------------------------------------
210c7d97c5SJed Brown    Implementation of BDDC preconditioner based on:
220c7d97c5SJed Brown    C. Dohrmann "An approximate BDDC preconditioner", Numerical Linear Algebra with Applications Volume 14, Issue 2, pages 149-168, March 2007
2353cdbc3dSStefano Zampini    ---------------------------------------------------------------------------------------------------------------------------------------------- */
2453cdbc3dSStefano Zampini 
2553cdbc3dSStefano Zampini #include "bddc.h" /*I "petscpc.h" I*/  /* includes for fortran wrappers */
263b03a366Sstefano_zampini #include <petscblaslapack.h>
270c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
280c7d97c5SJed Brown #undef __FUNCT__
290c7d97c5SJed Brown #define __FUNCT__ "PCSetFromOptions_BDDC"
300c7d97c5SJed Brown PetscErrorCode PCSetFromOptions_BDDC(PC pc)
310c7d97c5SJed Brown {
320c7d97c5SJed Brown   PC_BDDC         *pcbddc = (PC_BDDC*)pc->data;
330c7d97c5SJed Brown   PetscErrorCode ierr;
340c7d97c5SJed Brown 
350c7d97c5SJed Brown   PetscFunctionBegin;
360c7d97c5SJed Brown   ierr = PetscOptionsHead("BDDC options");CHKERRQ(ierr);
370c7d97c5SJed Brown   /* Verbose debugging of main data structures */
38e269702eSStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_check_all"       ,"Verbose (debugging) output for PCBDDC"                       ,"none",pcbddc->dbg_flag      ,&pcbddc->dbg_flag      ,PETSC_NULL);CHKERRQ(ierr);
390c7d97c5SJed Brown   /* Some customization for default primal space */
40da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_vertices_only"   ,"Use only vertices in coarse space (i.e. discard constraints)","none",pcbddc->vertices_flag   ,&pcbddc->vertices_flag   ,PETSC_NULL);CHKERRQ(ierr);
41da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_constraints_only","Use only constraints in coarse space (i.e. discard vertices)","none",pcbddc->constraints_flag,&pcbddc->constraints_flag,PETSC_NULL);CHKERRQ(ierr);
42da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_faces_only"      ,"Use only faces among constraints of coarse space (i.e. discard edges)"         ,"none",pcbddc->faces_flag      ,&pcbddc->faces_flag      ,PETSC_NULL);CHKERRQ(ierr);
43da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_edges_only"      ,"Use only edges among constraints of coarse space (i.e. discard faces)"         ,"none",pcbddc->edges_flag      ,&pcbddc->edges_flag      ,PETSC_NULL);CHKERRQ(ierr);
440c7d97c5SJed Brown   /* Coarse solver context */
456c667b0aSStefano Zampini   static const char * const avail_coarse_problems[] = {"sequential","replicated","parallel","multilevel","CoarseProblemType","PC_BDDC_",0}; /*order of choiches depends on ENUM defined in bddc.h */
460c7d97c5SJed Brown   ierr = PetscOptionsEnum("-pc_bddc_coarse_problem_type","Set coarse problem type","none",avail_coarse_problems,(PetscEnum)pcbddc->coarse_problem_type,(PetscEnum*)&pcbddc->coarse_problem_type,PETSC_NULL);CHKERRQ(ierr);
470c7d97c5SJed Brown   /* Two different application of BDDC to the whole set of dofs, internal and interface */
480c7d97c5SJed Brown   ierr = PetscOptionsBool("-pc_bddc_switch_preconditioning_type","Switch between M_2 (default) and M_3 preconditioners (as defined by Dohrmann)","none",pcbddc->prec_type,&pcbddc->prec_type,PETSC_NULL);CHKERRQ(ierr);
49534831adSStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_use_change_of_basis","Use change of basis approach for primal space","none",pcbddc->usechangeofbasis,&pcbddc->usechangeofbasis,PETSC_NULL);CHKERRQ(ierr);
50534831adSStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_use_change_on_faces","Use change of basis approach for face constraints","none",pcbddc->usechangeonfaces,&pcbddc->usechangeonfaces,PETSC_NULL);CHKERRQ(ierr);
51534831adSStefano Zampini   pcbddc->usechangeonfaces = pcbddc->usechangeonfaces && pcbddc->usechangeofbasis;
520c7d97c5SJed Brown   ierr = PetscOptionsInt("-pc_bddc_coarsening_ratio","Set coarsening ratio used in multilevel coarsening","none",pcbddc->coarsening_ratio,&pcbddc->coarsening_ratio,PETSC_NULL);CHKERRQ(ierr);
530c7d97c5SJed Brown   ierr = PetscOptionsTail();CHKERRQ(ierr);
540c7d97c5SJed Brown   PetscFunctionReturn(0);
550c7d97c5SJed Brown }
560c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
570c7d97c5SJed Brown EXTERN_C_BEGIN
580c7d97c5SJed Brown #undef __FUNCT__
590c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetCoarseProblemType_BDDC"
6053cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetCoarseProblemType_BDDC(PC pc, CoarseProblemType CPT)
610c7d97c5SJed Brown {
620c7d97c5SJed Brown   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
630c7d97c5SJed Brown 
640c7d97c5SJed Brown   PetscFunctionBegin;
650c7d97c5SJed Brown   pcbddc->coarse_problem_type = CPT;
660c7d97c5SJed Brown   PetscFunctionReturn(0);
670c7d97c5SJed Brown }
680c7d97c5SJed Brown EXTERN_C_END
690c7d97c5SJed Brown #undef __FUNCT__
700c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetCoarseProblemType"
7153cdbc3dSStefano Zampini /*@
729c0446d6SStefano Zampini  PCBDDCSetCoarseProblemType - Set coarse problem type in PCBDDC.
7353cdbc3dSStefano Zampini 
749c0446d6SStefano Zampini    Not collective
7553cdbc3dSStefano Zampini 
7653cdbc3dSStefano Zampini    Input Parameters:
7753cdbc3dSStefano Zampini +  pc - the preconditioning context
7853cdbc3dSStefano Zampini -  CoarseProblemType - pick a better name and explain what this is
7953cdbc3dSStefano Zampini 
8053cdbc3dSStefano Zampini    Level: intermediate
8153cdbc3dSStefano Zampini 
8253cdbc3dSStefano Zampini    Notes:
83da1bb401SStefano Zampini    Not collective but all procs must call with same arguments.
8453cdbc3dSStefano Zampini 
8553cdbc3dSStefano Zampini .seealso: PCBDDC
8653cdbc3dSStefano Zampini @*/
870c7d97c5SJed Brown PetscErrorCode PCBDDCSetCoarseProblemType(PC pc, CoarseProblemType CPT)
880c7d97c5SJed Brown {
890c7d97c5SJed Brown   PetscErrorCode ierr;
900c7d97c5SJed Brown 
910c7d97c5SJed Brown   PetscFunctionBegin;
920c7d97c5SJed Brown   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
930c7d97c5SJed Brown   ierr = PetscTryMethod(pc,"PCBDDCSetCoarseProblemType_C",(PC,CoarseProblemType),(pc,CPT));CHKERRQ(ierr);
940c7d97c5SJed Brown   PetscFunctionReturn(0);
950c7d97c5SJed Brown }
960c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
970c7d97c5SJed Brown EXTERN_C_BEGIN
980c7d97c5SJed Brown #undef __FUNCT__
99*0bdf917eSStefano Zampini #define __FUNCT__ "PCBDDCSetNullSpace_BDDC"
100*0bdf917eSStefano Zampini static PetscErrorCode PCBDDCSetNullSpace_BDDC(PC pc,MatNullSpace NullSpace)
101*0bdf917eSStefano Zampini {
102*0bdf917eSStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
103*0bdf917eSStefano Zampini   PetscErrorCode ierr;
104*0bdf917eSStefano Zampini 
105*0bdf917eSStefano Zampini   PetscFunctionBegin;
106*0bdf917eSStefano Zampini   ierr = PetscObjectReference((PetscObject)NullSpace);CHKERRQ(ierr);
107*0bdf917eSStefano Zampini   ierr = MatNullSpaceDestroy(&pcbddc->NullSpace);CHKERRQ(ierr);
108*0bdf917eSStefano Zampini   pcbddc->NullSpace=NullSpace;
109*0bdf917eSStefano Zampini   PetscFunctionReturn(0);
110*0bdf917eSStefano Zampini }
111*0bdf917eSStefano Zampini EXTERN_C_END
112*0bdf917eSStefano Zampini #undef __FUNCT__
113*0bdf917eSStefano Zampini #define __FUNCT__ "PCBDDCSetNullSpace"
114*0bdf917eSStefano Zampini /*@
115*0bdf917eSStefano Zampini  PCBDDCSetNullSpace - Set NullSpace of global operator of BDDC preconditioned mat.
116*0bdf917eSStefano Zampini 
117*0bdf917eSStefano Zampini    Logically collective on PC and MatNullSpace
118*0bdf917eSStefano Zampini 
119*0bdf917eSStefano Zampini    Input Parameters:
120*0bdf917eSStefano Zampini +  pc - the preconditioning context
121*0bdf917eSStefano Zampini -  NullSpace - Null space of the linear operator to be preconditioned.
122*0bdf917eSStefano Zampini 
123*0bdf917eSStefano Zampini    Level: intermediate
124*0bdf917eSStefano Zampini 
125*0bdf917eSStefano Zampini    Notes:
126*0bdf917eSStefano Zampini 
127*0bdf917eSStefano Zampini .seealso: PCBDDC
128*0bdf917eSStefano Zampini @*/
129*0bdf917eSStefano Zampini PetscErrorCode PCBDDCSetNullSpace(PC pc,MatNullSpace NullSpace)
130*0bdf917eSStefano Zampini {
131*0bdf917eSStefano Zampini   PetscErrorCode ierr;
132*0bdf917eSStefano Zampini 
133*0bdf917eSStefano Zampini   PetscFunctionBegin;
134*0bdf917eSStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
135*0bdf917eSStefano Zampini   ierr = PetscTryMethod(pc,"PCBDDCSetNullSpace_C",(PC,MatNullSpace),(pc,NullSpace));CHKERRQ(ierr);
136*0bdf917eSStefano Zampini   PetscFunctionReturn(0);
137*0bdf917eSStefano Zampini }
138*0bdf917eSStefano Zampini /* -------------------------------------------------------------------------- */
139*0bdf917eSStefano Zampini EXTERN_C_BEGIN
140*0bdf917eSStefano Zampini #undef __FUNCT__
1413b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCSetDirichletBoundaries_BDDC"
1423b03a366Sstefano_zampini static PetscErrorCode PCBDDCSetDirichletBoundaries_BDDC(PC pc,IS DirichletBoundaries)
1433b03a366Sstefano_zampini {
1443b03a366Sstefano_zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
1453b03a366Sstefano_zampini   PetscErrorCode ierr;
1463b03a366Sstefano_zampini 
1473b03a366Sstefano_zampini   PetscFunctionBegin;
1483b03a366Sstefano_zampini   ierr = ISDestroy(&pcbddc->DirichletBoundaries);CHKERRQ(ierr);
14936e030ebSStefano Zampini   ierr = PetscObjectReference((PetscObject)DirichletBoundaries);CHKERRQ(ierr);
15036e030ebSStefano Zampini   pcbddc->DirichletBoundaries=DirichletBoundaries;
1513b03a366Sstefano_zampini   PetscFunctionReturn(0);
1523b03a366Sstefano_zampini }
1533b03a366Sstefano_zampini EXTERN_C_END
1543b03a366Sstefano_zampini #undef __FUNCT__
1553b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCSetDirichletBoundaries"
1563b03a366Sstefano_zampini /*@
157da1bb401SStefano Zampini  PCBDDCSetDirichletBoundaries - Set index set defining subdomain part (in local ordering)
158da1bb401SStefano Zampini                               of Dirichlet boundaries for the global problem.
1593b03a366Sstefano_zampini 
1603b03a366Sstefano_zampini    Not collective
1613b03a366Sstefano_zampini 
1623b03a366Sstefano_zampini    Input Parameters:
1633b03a366Sstefano_zampini +  pc - the preconditioning context
1643b03a366Sstefano_zampini -  DirichletBoundaries - sequential index set defining the subdomain part of Dirichlet boundaries (can be PETSC_NULL)
1653b03a366Sstefano_zampini 
1663b03a366Sstefano_zampini    Level: intermediate
1673b03a366Sstefano_zampini 
1683b03a366Sstefano_zampini    Notes:
1693b03a366Sstefano_zampini 
1703b03a366Sstefano_zampini .seealso: PCBDDC
1713b03a366Sstefano_zampini @*/
1723b03a366Sstefano_zampini PetscErrorCode PCBDDCSetDirichletBoundaries(PC pc,IS DirichletBoundaries)
1733b03a366Sstefano_zampini {
1743b03a366Sstefano_zampini   PetscErrorCode ierr;
1753b03a366Sstefano_zampini 
1763b03a366Sstefano_zampini   PetscFunctionBegin;
1773b03a366Sstefano_zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
1783b03a366Sstefano_zampini   ierr = PetscTryMethod(pc,"PCBDDCSetDirichletBoundaries_C",(PC,IS),(pc,DirichletBoundaries));CHKERRQ(ierr);
1793b03a366Sstefano_zampini   PetscFunctionReturn(0);
1803b03a366Sstefano_zampini }
1813b03a366Sstefano_zampini /* -------------------------------------------------------------------------- */
1823b03a366Sstefano_zampini EXTERN_C_BEGIN
1833b03a366Sstefano_zampini #undef __FUNCT__
1840c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetNeumannBoundaries_BDDC"
18553cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetNeumannBoundaries_BDDC(PC pc,IS NeumannBoundaries)
1860c7d97c5SJed Brown {
1870c7d97c5SJed Brown   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
18853cdbc3dSStefano Zampini   PetscErrorCode ierr;
1890c7d97c5SJed Brown 
1900c7d97c5SJed Brown   PetscFunctionBegin;
19153cdbc3dSStefano Zampini   ierr = ISDestroy(&pcbddc->NeumannBoundaries);CHKERRQ(ierr);
19236e030ebSStefano Zampini   ierr = PetscObjectReference((PetscObject)NeumannBoundaries);CHKERRQ(ierr);
19336e030ebSStefano Zampini   pcbddc->NeumannBoundaries=NeumannBoundaries;
1940c7d97c5SJed Brown   PetscFunctionReturn(0);
1950c7d97c5SJed Brown }
1960c7d97c5SJed Brown EXTERN_C_END
1970c7d97c5SJed Brown #undef __FUNCT__
1980c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetNeumannBoundaries"
19957527edcSJed Brown /*@
200da1bb401SStefano Zampini  PCBDDCSetNeumannBoundaries - Set index set defining subdomain part (in local ordering)
201da1bb401SStefano Zampini                               of Neumann boundaries for the global problem.
20257527edcSJed Brown 
2039c0446d6SStefano Zampini    Not collective
20457527edcSJed Brown 
20557527edcSJed Brown    Input Parameters:
20657527edcSJed Brown +  pc - the preconditioning context
2079c0446d6SStefano Zampini -  NeumannBoundaries - sequential index set defining the subdomain part of Neumann boundaries (can be PETSC_NULL)
20857527edcSJed Brown 
20957527edcSJed Brown    Level: intermediate
21057527edcSJed Brown 
21157527edcSJed Brown    Notes:
21257527edcSJed Brown 
21357527edcSJed Brown .seealso: PCBDDC
21457527edcSJed Brown @*/
21553cdbc3dSStefano Zampini PetscErrorCode PCBDDCSetNeumannBoundaries(PC pc,IS NeumannBoundaries)
2160c7d97c5SJed Brown {
2170c7d97c5SJed Brown   PetscErrorCode ierr;
2180c7d97c5SJed Brown 
2190c7d97c5SJed Brown   PetscFunctionBegin;
2200c7d97c5SJed Brown   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
22153cdbc3dSStefano Zampini   ierr = PetscTryMethod(pc,"PCBDDCSetNeumannBoundaries_C",(PC,IS),(pc,NeumannBoundaries));CHKERRQ(ierr);
22253cdbc3dSStefano Zampini   PetscFunctionReturn(0);
22353cdbc3dSStefano Zampini }
22453cdbc3dSStefano Zampini /* -------------------------------------------------------------------------- */
22553cdbc3dSStefano Zampini EXTERN_C_BEGIN
22653cdbc3dSStefano Zampini #undef __FUNCT__
227da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCGetDirichletBoundaries_BDDC"
228da1bb401SStefano Zampini static PetscErrorCode PCBDDCGetDirichletBoundaries_BDDC(PC pc,IS *DirichletBoundaries)
229da1bb401SStefano Zampini {
230da1bb401SStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
231da1bb401SStefano Zampini 
232da1bb401SStefano Zampini   PetscFunctionBegin;
233da1bb401SStefano Zampini   *DirichletBoundaries = pcbddc->DirichletBoundaries;
234da1bb401SStefano Zampini   PetscFunctionReturn(0);
235da1bb401SStefano Zampini }
236da1bb401SStefano Zampini EXTERN_C_END
237da1bb401SStefano Zampini #undef __FUNCT__
238da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCGetDirichletBoundaries"
239da1bb401SStefano Zampini /*@
240da1bb401SStefano Zampini  PCBDDCGetDirichletBoundaries - Get index set defining subdomain part (in local ordering)
241da1bb401SStefano Zampini                                 of Dirichlet boundaries for the global problem.
242da1bb401SStefano Zampini 
243da1bb401SStefano Zampini    Not collective
244da1bb401SStefano Zampini 
245da1bb401SStefano Zampini    Input Parameters:
246da1bb401SStefano Zampini +  pc - the preconditioning context
247da1bb401SStefano Zampini 
248da1bb401SStefano Zampini    Output Parameters:
249da1bb401SStefano Zampini +  DirichletBoundaries - index set defining the subdomain part of Dirichlet boundaries
250da1bb401SStefano Zampini 
251da1bb401SStefano Zampini    Level: intermediate
252da1bb401SStefano Zampini 
253da1bb401SStefano Zampini    Notes:
254da1bb401SStefano Zampini 
255da1bb401SStefano Zampini .seealso: PCBDDC
256da1bb401SStefano Zampini @*/
257da1bb401SStefano Zampini PetscErrorCode PCBDDCGetDirichletBoundaries(PC pc,IS *DirichletBoundaries)
258da1bb401SStefano Zampini {
259da1bb401SStefano Zampini   PetscErrorCode ierr;
260da1bb401SStefano Zampini 
261da1bb401SStefano Zampini   PetscFunctionBegin;
262da1bb401SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
263da1bb401SStefano Zampini   ierr = PetscUseMethod(pc,"PCBDDCGetDirichletBoundaries_C",(PC,IS*),(pc,DirichletBoundaries));CHKERRQ(ierr);
264da1bb401SStefano Zampini   PetscFunctionReturn(0);
265da1bb401SStefano Zampini }
266da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
267da1bb401SStefano Zampini EXTERN_C_BEGIN
268da1bb401SStefano Zampini #undef __FUNCT__
26953cdbc3dSStefano Zampini #define __FUNCT__ "PCBDDCGetNeumannBoundaries_BDDC"
27053cdbc3dSStefano Zampini static PetscErrorCode PCBDDCGetNeumannBoundaries_BDDC(PC pc,IS *NeumannBoundaries)
27153cdbc3dSStefano Zampini {
27253cdbc3dSStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
27353cdbc3dSStefano Zampini 
27453cdbc3dSStefano Zampini   PetscFunctionBegin;
27553cdbc3dSStefano Zampini   *NeumannBoundaries = pcbddc->NeumannBoundaries;
27653cdbc3dSStefano Zampini   PetscFunctionReturn(0);
27753cdbc3dSStefano Zampini }
27853cdbc3dSStefano Zampini EXTERN_C_END
27953cdbc3dSStefano Zampini #undef __FUNCT__
28053cdbc3dSStefano Zampini #define __FUNCT__ "PCBDDCGetNeumannBoundaries"
28153cdbc3dSStefano Zampini /*@
282da1bb401SStefano Zampini  PCBDDCGetNeumannBoundaries - Get index set defining subdomain part (in local ordering)
283da1bb401SStefano Zampini                               of Neumann boundaries for the global problem.
28453cdbc3dSStefano Zampini 
2859c0446d6SStefano Zampini    Not collective
28653cdbc3dSStefano Zampini 
28753cdbc3dSStefano Zampini    Input Parameters:
28853cdbc3dSStefano Zampini +  pc - the preconditioning context
28953cdbc3dSStefano Zampini 
29053cdbc3dSStefano Zampini    Output Parameters:
29153cdbc3dSStefano Zampini +  NeumannBoundaries - index set defining the subdomain part of Neumann boundaries
29253cdbc3dSStefano Zampini 
29353cdbc3dSStefano Zampini    Level: intermediate
29453cdbc3dSStefano Zampini 
29553cdbc3dSStefano Zampini    Notes:
29653cdbc3dSStefano Zampini 
29753cdbc3dSStefano Zampini .seealso: PCBDDC
29853cdbc3dSStefano Zampini @*/
29953cdbc3dSStefano Zampini PetscErrorCode PCBDDCGetNeumannBoundaries(PC pc,IS *NeumannBoundaries)
30053cdbc3dSStefano Zampini {
30153cdbc3dSStefano Zampini   PetscErrorCode ierr;
30253cdbc3dSStefano Zampini 
30353cdbc3dSStefano Zampini   PetscFunctionBegin;
30453cdbc3dSStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
30553cdbc3dSStefano Zampini   ierr = PetscUseMethod(pc,"PCBDDCGetNeumannBoundaries_C",(PC,IS*),(pc,NeumannBoundaries));CHKERRQ(ierr);
3060c7d97c5SJed Brown   PetscFunctionReturn(0);
3070c7d97c5SJed Brown }
30836e030ebSStefano Zampini /* -------------------------------------------------------------------------- */
30936e030ebSStefano Zampini EXTERN_C_BEGIN
31036e030ebSStefano Zampini #undef __FUNCT__
311da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetLocalAdjacencyGraph_BDDC"
312da1bb401SStefano Zampini static PetscErrorCode PCBDDCSetLocalAdjacencyGraph_BDDC(PC pc, PetscInt nvtxs, PetscInt xadj[], PetscInt adjncy[], PetscCopyMode copymode)
31336e030ebSStefano Zampini {
31436e030ebSStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
315da1bb401SStefano Zampini   PCBDDCGraph    mat_graph=pcbddc->mat_graph;
316da1bb401SStefano Zampini   PetscErrorCode ierr;
31736e030ebSStefano Zampini 
31836e030ebSStefano Zampini   PetscFunctionBegin;
319da1bb401SStefano Zampini   mat_graph->nvtxs=nvtxs;
320da1bb401SStefano Zampini   ierr = PetscFree(mat_graph->xadj);CHKERRQ(ierr);
321da1bb401SStefano Zampini   ierr = PetscFree(mat_graph->adjncy);CHKERRQ(ierr);
322da1bb401SStefano Zampini   if (copymode == PETSC_COPY_VALUES) {
323da1bb401SStefano Zampini     ierr = PetscMalloc((mat_graph->nvtxs+1)*sizeof(PetscInt),&mat_graph->xadj);CHKERRQ(ierr);
324da1bb401SStefano Zampini     ierr = PetscMalloc(xadj[mat_graph->nvtxs]*sizeof(PetscInt),&mat_graph->adjncy);CHKERRQ(ierr);
325da1bb401SStefano Zampini     ierr = PetscMemcpy(mat_graph->xadj,xadj,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr);
326da1bb401SStefano Zampini     ierr = PetscMemcpy(mat_graph->adjncy,adjncy,xadj[mat_graph->nvtxs]*sizeof(PetscInt));CHKERRQ(ierr);
327da1bb401SStefano Zampini   } else if (copymode == PETSC_OWN_POINTER) {
328da1bb401SStefano Zampini     mat_graph->xadj=xadj;
329da1bb401SStefano Zampini     mat_graph->adjncy=adjncy;
330da1bb401SStefano Zampini   } else {
331da1bb401SStefano Zampini     SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_SUP,"Unsupported copy mode %d in %s\n",copymode,__FUNCT__);
332da1bb401SStefano Zampini   }
33336e030ebSStefano Zampini   PetscFunctionReturn(0);
33436e030ebSStefano Zampini }
33536e030ebSStefano Zampini EXTERN_C_END
33636e030ebSStefano Zampini #undef __FUNCT__
337da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetLocalAdjacencyGraph"
33836e030ebSStefano Zampini /*@
339da1bb401SStefano Zampini  PCBDDCSetLocalAdjacencyGraph - Set CSR graph of local matrix for use of PCBDDC.
34036e030ebSStefano Zampini 
34136e030ebSStefano Zampini    Not collective
34236e030ebSStefano Zampini 
34336e030ebSStefano Zampini    Input Parameters:
34436e030ebSStefano Zampini +  pc - the preconditioning context
345da1bb401SStefano Zampini -  nvtxs - number of local vertices of the graph
346da1bb401SStefano Zampini -  xadj, adjncy - the CSR graph
347da1bb401SStefano Zampini -  copymode - either PETSC_COPY_VALUES or PETSC_OWN_POINTER. In the former case the user must free the array passed in;
348da1bb401SStefano Zampini                                                              in the latter case, memory must be obtained with PetscMalloc.
34936e030ebSStefano Zampini 
35036e030ebSStefano Zampini    Level: intermediate
35136e030ebSStefano Zampini 
35236e030ebSStefano Zampini    Notes:
35336e030ebSStefano Zampini 
35436e030ebSStefano Zampini .seealso: PCBDDC
35536e030ebSStefano Zampini @*/
356da1bb401SStefano Zampini PetscErrorCode PCBDDCSetLocalAdjacencyGraph(PC pc,PetscInt nvtxs,PetscInt xadj[],PetscInt adjncy[], PetscCopyMode copymode)
35736e030ebSStefano Zampini {
358da1bb401SStefano Zampini   PetscInt       nrows,ncols;
359da1bb401SStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
36036e030ebSStefano Zampini   PetscErrorCode ierr;
36136e030ebSStefano Zampini 
36236e030ebSStefano Zampini   PetscFunctionBegin;
36336e030ebSStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
364da1bb401SStefano Zampini   ierr = MatGetSize(matis->A,&nrows,&ncols);CHKERRQ(ierr);
365da1bb401SStefano Zampini   if (nvtxs != nrows) {
366da1bb401SStefano Zampini     SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Local adjacency size %d passed in %s differs from local problem size %d!\n",nvtxs,__FUNCT__,nrows);
367da1bb401SStefano Zampini   } else {
368da1bb401SStefano Zampini     ierr = PetscTryMethod(pc,"PCBDDCSetLocalAdjacencyGraph_C",(PC,PetscInt,PetscInt[],PetscInt[],PetscCopyMode),(pc,nvtxs,xadj,adjncy,copymode));CHKERRQ(ierr);
369da1bb401SStefano Zampini   }
37036e030ebSStefano Zampini   PetscFunctionReturn(0);
37136e030ebSStefano Zampini }
3729c0446d6SStefano Zampini /* -------------------------------------------------------------------------- */
3739c0446d6SStefano Zampini EXTERN_C_BEGIN
3749c0446d6SStefano Zampini #undef __FUNCT__
3759c0446d6SStefano Zampini #define __FUNCT__ "PCBDDCSetDofsSplitting_BDDC"
3769c0446d6SStefano Zampini static PetscErrorCode PCBDDCSetDofsSplitting_BDDC(PC pc,PetscInt n_is, IS ISForDofs[])
3779c0446d6SStefano Zampini {
3789c0446d6SStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
3799c0446d6SStefano Zampini   PetscInt i;
3809c0446d6SStefano Zampini   PetscErrorCode ierr;
3819c0446d6SStefano Zampini 
3829c0446d6SStefano Zampini   PetscFunctionBegin;
383da1bb401SStefano Zampini   /* Destroy ISes if they were already set */
3849c0446d6SStefano Zampini   for (i=0;i<pcbddc->n_ISForDofs;i++) {
3859c0446d6SStefano Zampini     ierr = ISDestroy(&pcbddc->ISForDofs[i]);CHKERRQ(ierr);
3869c0446d6SStefano Zampini   }
387d11ae9bbSstefano_zampini   ierr = PetscFree(pcbddc->ISForDofs);CHKERRQ(ierr);
388da1bb401SStefano Zampini   /* allocate space then set */
3899c0446d6SStefano Zampini   ierr = PetscMalloc(n_is*sizeof(IS),&pcbddc->ISForDofs);CHKERRQ(ierr);
3909c0446d6SStefano Zampini   for (i=0;i<n_is;i++) {
391da1bb401SStefano Zampini     ierr = PetscObjectReference((PetscObject)ISForDofs[i]);CHKERRQ(ierr);
392da1bb401SStefano Zampini     pcbddc->ISForDofs[i]=ISForDofs[i];
3939c0446d6SStefano Zampini   }
3949c0446d6SStefano Zampini   pcbddc->n_ISForDofs=n_is;
3959c0446d6SStefano Zampini   PetscFunctionReturn(0);
3969c0446d6SStefano Zampini }
3979c0446d6SStefano Zampini EXTERN_C_END
3989c0446d6SStefano Zampini #undef __FUNCT__
3999c0446d6SStefano Zampini #define __FUNCT__ "PCBDDCSetDofsSplitting"
4009c0446d6SStefano Zampini /*@
401da1bb401SStefano Zampini  PCBDDCSetDofsSplitting - Set index sets defining fields of local mat.
4029c0446d6SStefano Zampini 
4039c0446d6SStefano Zampini    Not collective
4049c0446d6SStefano Zampini 
4059c0446d6SStefano Zampini    Input Parameters:
4069c0446d6SStefano Zampini +  pc - the preconditioning context
407da1bb401SStefano Zampini -  n - number of index sets defining the fields
408da1bb401SStefano Zampini -  IS[] - array of IS describing the fields
4099c0446d6SStefano Zampini 
4109c0446d6SStefano Zampini    Level: intermediate
4119c0446d6SStefano Zampini 
4129c0446d6SStefano Zampini    Notes:
4139c0446d6SStefano Zampini 
4149c0446d6SStefano Zampini .seealso: PCBDDC
4159c0446d6SStefano Zampini @*/
4169c0446d6SStefano Zampini PetscErrorCode PCBDDCSetDofsSplitting(PC pc,PetscInt n_is, IS ISForDofs[])
4179c0446d6SStefano Zampini {
4189c0446d6SStefano Zampini   PetscErrorCode ierr;
4199c0446d6SStefano Zampini 
4209c0446d6SStefano Zampini   PetscFunctionBegin;
4219c0446d6SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
4229c0446d6SStefano Zampini   ierr = PetscTryMethod(pc,"PCBDDCSetDofsSplitting_C",(PC,PetscInt,IS[]),(pc,n_is,ISForDofs));CHKERRQ(ierr);
4239c0446d6SStefano Zampini   PetscFunctionReturn(0);
4249c0446d6SStefano Zampini }
425da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
426534831adSStefano Zampini #undef __FUNCT__
427534831adSStefano Zampini #define __FUNCT__ "PCPreSolve_BDDC"
428534831adSStefano Zampini /* -------------------------------------------------------------------------- */
429534831adSStefano Zampini /*
430534831adSStefano Zampini    PCPreSolve_BDDC - Changes the right hand side and (if necessary) the initial
431534831adSStefano Zampini                      guess if a transformation of basis approach has been selected.
4329c0446d6SStefano Zampini 
433534831adSStefano Zampini    Input Parameter:
+  pc - the preconditioner context
435534831adSStefano Zampini 
436534831adSStefano Zampini    Application Interface Routine: PCPreSolve()
437534831adSStefano Zampini 
438534831adSStefano Zampini    Notes:
439534831adSStefano Zampini    The interface routine PCPreSolve() is not usually called directly by
440534831adSStefano Zampini    the user, but instead is called by KSPSolve().
441534831adSStefano Zampini */
442534831adSStefano Zampini static PetscErrorCode PCPreSolve_BDDC(PC pc, KSP ksp, Vec rhs, Vec x)
443534831adSStefano Zampini {
444534831adSStefano Zampini   PetscErrorCode ierr;
445534831adSStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
446534831adSStefano Zampini   PC_IS          *pcis = (PC_IS*)(pc->data);
447534831adSStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
448534831adSStefano Zampini   Mat            temp_mat;
4493972b0daSStefano Zampini   IS             dirIS;
4503972b0daSStefano Zampini   PetscInt       dirsize,i,*is_indices;
4513972b0daSStefano Zampini   PetscScalar    *array_x,*array_diagonal;
4523972b0daSStefano Zampini   Vec            used_vec;
4533972b0daSStefano Zampini   PetscBool      guess_nonzero;
454534831adSStefano Zampini 
455534831adSStefano Zampini   PetscFunctionBegin;
4563972b0daSStefano Zampini   if (x) {
4573972b0daSStefano Zampini     ierr = PetscObjectReference((PetscObject)x);CHKERRQ(ierr);
4583972b0daSStefano Zampini     used_vec = x;
4593972b0daSStefano Zampini   } else {
4603972b0daSStefano Zampini     ierr = PetscObjectReference((PetscObject)pcbddc->temp_solution);CHKERRQ(ierr);
4613972b0daSStefano Zampini     used_vec = pcbddc->temp_solution;
4623972b0daSStefano Zampini     ierr = VecSet(used_vec,0.0);CHKERRQ(ierr);
4633972b0daSStefano Zampini   }
4643972b0daSStefano Zampini   /* hack into ksp data structure PCPreSolve comes earlier in src/ksp/ksp/interface/itfunc.c */
4653972b0daSStefano Zampini   if (ksp) {
4663972b0daSStefano Zampini     ierr = KSPGetInitialGuessNonzero(ksp,&guess_nonzero);CHKERRQ(ierr);
4673972b0daSStefano Zampini     if ( !guess_nonzero ) {
4683972b0daSStefano Zampini       ierr = VecSet(used_vec,0.0);CHKERRQ(ierr);
4693972b0daSStefano Zampini     }
4703972b0daSStefano Zampini   }
4713972b0daSStefano Zampini   /* store the original rhs */
4723972b0daSStefano Zampini   ierr = VecCopy(rhs,pcbddc->original_rhs);CHKERRQ(ierr);
4733972b0daSStefano Zampini 
4743972b0daSStefano Zampini   /* Take into account zeroed rows -> change rhs and store solution removed */
4753972b0daSStefano Zampini   ierr = MatGetDiagonal(pc->pmat,pcis->vec1_global);CHKERRQ(ierr);
4763972b0daSStefano Zampini   ierr = VecPointwiseDivide(pcis->vec1_global,rhs,pcis->vec1_global);CHKERRQ(ierr);
4773972b0daSStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4783972b0daSStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4793972b0daSStefano Zampini   ierr = VecScatterBegin(matis->ctx,used_vec,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4803972b0daSStefano Zampini   ierr = VecScatterEnd  (matis->ctx,used_vec,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4813972b0daSStefano Zampini   ierr = PCBDDCGetDirichletBoundaries(pc,&dirIS);CHKERRQ(ierr);
4823972b0daSStefano Zampini   if (dirIS) {
4833972b0daSStefano Zampini     ierr = ISGetSize(dirIS,&dirsize);CHKERRQ(ierr);
4843972b0daSStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array_x);CHKERRQ(ierr);
4853972b0daSStefano Zampini     ierr = VecGetArray(pcis->vec2_N,&array_diagonal);CHKERRQ(ierr);
4863972b0daSStefano Zampini     ierr = ISGetIndices(dirIS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
4873972b0daSStefano Zampini     for (i=0;i<dirsize;i++) {
4883972b0daSStefano Zampini       array_x[is_indices[i]]=array_diagonal[is_indices[i]];
4893972b0daSStefano Zampini     }
4903972b0daSStefano Zampini     ierr = ISRestoreIndices(dirIS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
4913972b0daSStefano Zampini     ierr = VecRestoreArray(pcis->vec2_N,&array_diagonal);CHKERRQ(ierr);
4923972b0daSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array_x);CHKERRQ(ierr);
4933972b0daSStefano Zampini   }
4943972b0daSStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4953972b0daSStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
496b76ba322SStefano Zampini 
4973972b0daSStefano Zampini   /* remove the computed solution from the rhs */
4983972b0daSStefano Zampini   ierr = VecScale(used_vec,-1.0);CHKERRQ(ierr);
4993972b0daSStefano Zampini   ierr = MatMultAdd(pc->pmat,used_vec,rhs,rhs);CHKERRQ(ierr);
5003972b0daSStefano Zampini   ierr = VecScale(used_vec,-1.0);CHKERRQ(ierr);
501b76ba322SStefano Zampini 
502b76ba322SStefano Zampini   /* store partially computed solution and set initial guess */
5033972b0daSStefano Zampini   if (x) {
5043972b0daSStefano Zampini     ierr = VecCopy(used_vec,pcbddc->temp_solution);CHKERRQ(ierr);
5053972b0daSStefano Zampini     ierr = VecSet(used_vec,0.0);CHKERRQ(ierr);
506b76ba322SStefano Zampini     if (pcbddc->use_exact_dirichlet) {
507b76ba322SStefano Zampini       ierr = VecScatterBegin(pcis->global_to_D,rhs,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
508b76ba322SStefano Zampini       ierr = VecScatterEnd  (pcis->global_to_D,rhs,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
509b76ba322SStefano Zampini       ierr = KSPSolve(pcbddc->ksp_D,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
510b76ba322SStefano Zampini       ierr = VecScatterBegin(pcis->global_to_D,pcis->vec2_D,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
511b76ba322SStefano Zampini       ierr = VecScatterEnd  (pcis->global_to_D,pcis->vec2_D,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
512b76ba322SStefano Zampini       if (ksp) {
513b76ba322SStefano Zampini         ierr = KSPSetInitialGuessNonzero(ksp,PETSC_TRUE);CHKERRQ(ierr);
514b76ba322SStefano Zampini       }
515b76ba322SStefano Zampini     }
5163972b0daSStefano Zampini   }
517b76ba322SStefano Zampini 
518b76ba322SStefano Zampini   /* rhs change of basis */
519b76ba322SStefano Zampini   if (pcbddc->usechangeofbasis) {
520b76ba322SStefano Zampini     /* swap pointers for local matrices */
521b76ba322SStefano Zampini     temp_mat = matis->A;
522b76ba322SStefano Zampini     matis->A = pcbddc->local_mat;
523b76ba322SStefano Zampini     pcbddc->local_mat = temp_mat;
524b76ba322SStefano Zampini     /* Get local rhs and apply transformation of basis */
525b76ba322SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,rhs,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
526b76ba322SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,rhs,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
527b76ba322SStefano Zampini     /* from original basis to modified basis */
528b76ba322SStefano Zampini     ierr = MatMultTranspose(pcbddc->ChangeOfBasisMatrix,pcis->vec1_B,pcis->vec2_B);CHKERRQ(ierr);
529b76ba322SStefano Zampini     /* put back modified values into the global vec using INSERT_VALUES copy mode */
530b76ba322SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec2_B,rhs,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
531b76ba322SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec2_B,rhs,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
532*0bdf917eSStefano Zampini     if (ksp && pcbddc->NullSpace) {
533*0bdf917eSStefano Zampini       ierr = MatNullSpaceRemove(pcbddc->NullSpace,used_vec,PETSC_NULL);CHKERRQ(ierr);
534*0bdf917eSStefano Zampini       ierr = MatNullSpaceRemove(pcbddc->NullSpace,rhs,PETSC_NULL);CHKERRQ(ierr);
535b76ba322SStefano Zampini     }
536*0bdf917eSStefano Zampini   }
537*0bdf917eSStefano Zampini   ierr = VecDestroy(&used_vec);CHKERRQ(ierr);
538534831adSStefano Zampini   PetscFunctionReturn(0);
539534831adSStefano Zampini }
540534831adSStefano Zampini /* -------------------------------------------------------------------------- */
541534831adSStefano Zampini #undef __FUNCT__
542534831adSStefano Zampini #define __FUNCT__ "PCPostSolve_BDDC"
543534831adSStefano Zampini /* -------------------------------------------------------------------------- */
544534831adSStefano Zampini /*
545534831adSStefano Zampini    PCPostSolve_BDDC - Changes the computed solution if a transformation of basis
546534831adSStefano Zampini                      approach has been selected. Also, restores rhs to its original state.
547534831adSStefano Zampini 
548534831adSStefano Zampini    Input Parameter:
549534831adSStefano Zampini +  pc - the preconditioner contex
550534831adSStefano Zampini 
551534831adSStefano Zampini    Application Interface Routine: PCPostSolve()
552534831adSStefano Zampini 
553534831adSStefano Zampini    Notes:
554534831adSStefano Zampini    The interface routine PCPostSolve() is not usually called directly by
555534831adSStefano Zampini    the user, but instead is called by KSPSolve().
556534831adSStefano Zampini */
557534831adSStefano Zampini static PetscErrorCode PCPostSolve_BDDC(PC pc, KSP ksp, Vec rhs, Vec x)
558534831adSStefano Zampini {
559534831adSStefano Zampini   PetscErrorCode ierr;
560534831adSStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
561534831adSStefano Zampini   PC_IS          *pcis = (PC_IS*)(pc->data);
562534831adSStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
563534831adSStefano Zampini   Mat            temp_mat;
564534831adSStefano Zampini 
565534831adSStefano Zampini   PetscFunctionBegin;
566534831adSStefano Zampini   if (pcbddc->usechangeofbasis) {
567534831adSStefano Zampini     /* swap pointers for local matrices */
568534831adSStefano Zampini     temp_mat = matis->A;
569534831adSStefano Zampini     matis->A = pcbddc->local_mat;
570534831adSStefano Zampini     pcbddc->local_mat = temp_mat;
571534831adSStefano Zampini     /* restore rhs to its original state */
5723425bc38SStefano Zampini     if (rhs) {
5733425bc38SStefano Zampini       ierr = VecCopy(pcbddc->original_rhs,rhs);CHKERRQ(ierr);
5743425bc38SStefano Zampini     }
575534831adSStefano Zampini     /* Get Local boundary and apply transformation of basis to solution vector */
576534831adSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,x,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
577534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,x,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
578534831adSStefano Zampini     /* from modified basis to original basis */
579534831adSStefano Zampini     ierr = MatMult(pcbddc->ChangeOfBasisMatrix,pcis->vec1_B,pcis->vec2_B);CHKERRQ(ierr);
580534831adSStefano Zampini     /* put back modified values into the global vec using INSERT_VALUES copy mode */
581534831adSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec2_B,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
582534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec2_B,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
583534831adSStefano Zampini   }
5843972b0daSStefano Zampini   /* add solution removed in presolve */
5853425bc38SStefano Zampini   if (x) {
5863425bc38SStefano Zampini     ierr = VecAXPY(x,1.0,pcbddc->temp_solution);CHKERRQ(ierr);
5873425bc38SStefano Zampini   }
588534831adSStefano Zampini   PetscFunctionReturn(0);
589534831adSStefano Zampini }
590534831adSStefano Zampini /* -------------------------------------------------------------------------- */
59153cdbc3dSStefano Zampini #undef __FUNCT__
59253cdbc3dSStefano Zampini #define __FUNCT__ "PCSetUp_BDDC"
5930c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
5940c7d97c5SJed Brown /*
5950c7d97c5SJed Brown    PCSetUp_BDDC - Prepares for the use of the BDDC preconditioner
5960c7d97c5SJed Brown                   by setting data structures and options.
5970c7d97c5SJed Brown 
5980c7d97c5SJed Brown    Input Parameter:
59953cdbc3dSStefano Zampini +  pc - the preconditioner context
6000c7d97c5SJed Brown 
6010c7d97c5SJed Brown    Application Interface Routine: PCSetUp()
6020c7d97c5SJed Brown 
6030c7d97c5SJed Brown    Notes:
6040c7d97c5SJed Brown    The interface routine PCSetUp() is not usually called directly by
6050c7d97c5SJed Brown    the user, but instead is called by PCApply() if necessary.
6060c7d97c5SJed Brown */
60753cdbc3dSStefano Zampini PetscErrorCode PCSetUp_BDDC(PC pc)
6080c7d97c5SJed Brown {
6090c7d97c5SJed Brown   PetscErrorCode ierr;
6100c7d97c5SJed Brown   PC_BDDC*       pcbddc   = (PC_BDDC*)pc->data;
6110c7d97c5SJed Brown 
6120c7d97c5SJed Brown   PetscFunctionBegin;
6130c7d97c5SJed Brown   if (!pc->setupcalled) {
6143b03a366Sstefano_zampini     /* For BDDC we need to define a local "Neumann" problem different to that defined in PCISSetup
6159c0446d6SStefano Zampini        So, we set to pcnone the Neumann problem of pcis in order to avoid unneeded computation
6160c7d97c5SJed Brown        Also, we decide to directly build the (same) Dirichlet problem */
6170c7d97c5SJed Brown     ierr = PetscOptionsSetValue("-is_localN_pc_type","none");CHKERRQ(ierr);
6180c7d97c5SJed Brown     ierr = PetscOptionsSetValue("-is_localD_pc_type","none");CHKERRQ(ierr);
6190c7d97c5SJed Brown     /* Set up all the "iterative substructuring" common block */
620*0bdf917eSStefano Zampini 
6210c7d97c5SJed Brown     ierr = PCISSetUp(pc);CHKERRQ(ierr);
6223b03a366Sstefano_zampini     /* Get stdout for dbg */
623e269702eSStefano Zampini     if (pcbddc->dbg_flag) {
624e269702eSStefano Zampini       ierr = PetscViewerASCIIGetStdout(((PetscObject)pc)->comm,&pcbddc->dbg_viewer);CHKERRQ(ierr);
625e269702eSStefano Zampini       ierr = PetscViewerASCIISynchronizedAllow(pcbddc->dbg_viewer,PETSC_TRUE);CHKERRQ(ierr);
626e269702eSStefano Zampini     }
6273b03a366Sstefano_zampini     /* Analyze local interface */
6280c7d97c5SJed Brown     ierr = PCBDDCManageLocalBoundaries(pc);CHKERRQ(ierr);
6293b03a366Sstefano_zampini     /* Set up local constraint matrix */
6303b03a366Sstefano_zampini     ierr = PCBDDCCreateConstraintMatrix(pc);CHKERRQ(ierr);
6310c7d97c5SJed Brown     /* Create coarse and local stuffs used for evaluating action of preconditioner */
6320c7d97c5SJed Brown     ierr = PCBDDCCoarseSetUp(pc);CHKERRQ(ierr);
6330c7d97c5SJed Brown   }
6340c7d97c5SJed Brown   PetscFunctionReturn(0);
6350c7d97c5SJed Brown }
6360c7d97c5SJed Brown 
6370c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
6380c7d97c5SJed Brown /*
6390c7d97c5SJed Brown    PCApply_BDDC - Applies the BDDC preconditioner to a vector.
6400c7d97c5SJed Brown 
6410c7d97c5SJed Brown    Input Parameters:
6420c7d97c5SJed Brown .  pc - the preconditioner context
6430c7d97c5SJed Brown .  r - input vector (global)
6440c7d97c5SJed Brown 
6450c7d97c5SJed Brown    Output Parameter:
6460c7d97c5SJed Brown .  z - output vector (global)
6470c7d97c5SJed Brown 
6480c7d97c5SJed Brown    Application Interface Routine: PCApply()
6490c7d97c5SJed Brown  */
6500c7d97c5SJed Brown #undef __FUNCT__
6510c7d97c5SJed Brown #define __FUNCT__ "PCApply_BDDC"
65253cdbc3dSStefano Zampini PetscErrorCode PCApply_BDDC(PC pc,Vec r,Vec z)
6530c7d97c5SJed Brown {
6540c7d97c5SJed Brown   PC_IS             *pcis = (PC_IS*)(pc->data);
6550c7d97c5SJed Brown   PC_BDDC           *pcbddc = (PC_BDDC*)(pc->data);
6560c7d97c5SJed Brown   PetscErrorCode    ierr;
6573b03a366Sstefano_zampini   const PetscScalar one = 1.0;
6583b03a366Sstefano_zampini   const PetscScalar m_one = -1.0;
6592617d88aSStefano Zampini   const PetscScalar zero = 0.0;
6600c7d97c5SJed Brown 
6610c7d97c5SJed Brown /* This code is similar to that provided in nn.c for PCNN
6620c7d97c5SJed Brown    NN interface preconditioner changed to BDDC
6630c7d97c5SJed Brown    Added support for M_3 preconditioenr in the reference article (code is active if pcbddc->prec_type = PETSC_TRUE) */
6640c7d97c5SJed Brown 
6650c7d97c5SJed Brown   PetscFunctionBegin;
666b76ba322SStefano Zampini   if (!pcbddc->use_exact_dirichlet) {
6670c7d97c5SJed Brown     /* First Dirichlet solve */
6680c7d97c5SJed Brown     ierr = VecScatterBegin(pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
6690c7d97c5SJed Brown     ierr = VecScatterEnd  (pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
67053cdbc3dSStefano Zampini     ierr = KSPSolve(pcbddc->ksp_D,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
6710c7d97c5SJed Brown     /*
6720c7d97c5SJed Brown       Assembling right hand side for BDDC operator
6730c7d97c5SJed Brown       - vec1_D for the Dirichlet part (if needed, i.e. prec_flag=PETSC_TRUE)
6740c7d97c5SJed Brown       - the interface part of the global vector z
6750c7d97c5SJed Brown     */
6760c7d97c5SJed Brown     ierr = VecScale(pcis->vec2_D,m_one);CHKERRQ(ierr);
6770c7d97c5SJed Brown     ierr = MatMult(pcis->A_BI,pcis->vec2_D,pcis->vec1_B);CHKERRQ(ierr);
6780c7d97c5SJed Brown     if (pcbddc->prec_type) { ierr = MatMultAdd(pcis->A_II,pcis->vec2_D,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); }
6790c7d97c5SJed Brown     ierr = VecScale(pcis->vec2_D,m_one);CHKERRQ(ierr);
6800c7d97c5SJed Brown     ierr = VecCopy(r,z);CHKERRQ(ierr);
6810c7d97c5SJed Brown     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
6820c7d97c5SJed Brown     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
6832617d88aSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
6842617d88aSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
685b76ba322SStefano Zampini   } else {
686b76ba322SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,r,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
687b76ba322SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,r,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
688*0bdf917eSStefano Zampini     ierr = VecSet(pcis->vec1_D,zero);CHKERRQ(ierr);
689b76ba322SStefano Zampini     ierr = VecSet(pcis->vec2_D,zero);CHKERRQ(ierr);
690b76ba322SStefano Zampini   }
691b76ba322SStefano Zampini 
692b76ba322SStefano Zampini   /* Apply partition of unity */
6932617d88aSStefano Zampini   ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr);
6942617d88aSStefano Zampini 
6952617d88aSStefano Zampini   /* Apply interface preconditioner
6962617d88aSStefano Zampini      input/output vecs: pcis->vec1_B and pcis->vec1_D */
6972617d88aSStefano Zampini   ierr = PCBDDCApplyInterfacePreconditioner(pc);CHKERRQ(ierr);
6982617d88aSStefano Zampini 
6992617d88aSStefano Zampini   /* Apply partition of unity and sum boundary values */
7002617d88aSStefano Zampini   ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr);
7012617d88aSStefano Zampini   ierr = VecSet(z,zero);CHKERRQ(ierr);
7022617d88aSStefano Zampini   ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
7032617d88aSStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
7040c7d97c5SJed Brown 
7053b03a366Sstefano_zampini   /* Second Dirichlet solve and assembling of output */
7060c7d97c5SJed Brown   ierr = VecScatterBegin(pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7070c7d97c5SJed Brown   ierr = VecScatterEnd  (pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7080c7d97c5SJed Brown   ierr = MatMult(pcis->A_IB,pcis->vec1_B,pcis->vec3_D);CHKERRQ(ierr);
7090c7d97c5SJed Brown   if (pcbddc->prec_type) { ierr = MatMultAdd(pcis->A_II,pcis->vec1_D,pcis->vec3_D,pcis->vec3_D);CHKERRQ(ierr); }
71053cdbc3dSStefano Zampini   ierr = KSPSolve(pcbddc->ksp_D,pcis->vec3_D,pcbddc->vec4_D);CHKERRQ(ierr);
7110c7d97c5SJed Brown   ierr = VecScale(pcbddc->vec4_D,m_one);CHKERRQ(ierr);
7120c7d97c5SJed Brown   if (pcbddc->prec_type) { ierr = VecAXPY (pcbddc->vec4_D,one,pcis->vec1_D);CHKERRQ(ierr); }
7130c7d97c5SJed Brown   ierr = VecAXPY (pcis->vec2_D,one,pcbddc->vec4_D);CHKERRQ(ierr);
7140c7d97c5SJed Brown   ierr = VecScatterBegin(pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
7150c7d97c5SJed Brown   ierr = VecScatterEnd  (pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
7160c7d97c5SJed Brown   PetscFunctionReturn(0);
7170c7d97c5SJed Brown 
7180c7d97c5SJed Brown }
719da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
720da1bb401SStefano Zampini #undef __FUNCT__
721da1bb401SStefano Zampini #define __FUNCT__ "PCDestroy_BDDC"
722da1bb401SStefano Zampini PetscErrorCode PCDestroy_BDDC(PC pc)
723da1bb401SStefano Zampini {
724da1bb401SStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
725*0bdf917eSStefano Zampini   PetscInt       i;
726da1bb401SStefano Zampini   PetscErrorCode ierr;
727da1bb401SStefano Zampini 
728da1bb401SStefano Zampini   PetscFunctionBegin;
729da1bb401SStefano Zampini   /* free data created by PCIS */
730da1bb401SStefano Zampini   ierr = PCISDestroy(pc);CHKERRQ(ierr);
731da1bb401SStefano Zampini   /* free BDDC data  */
732*0bdf917eSStefano Zampini   ierr = MatNullSpaceDestroy(&pcbddc->CoarseNullSpace);CHKERRQ(ierr);
733*0bdf917eSStefano Zampini   ierr = MatNullSpaceDestroy(&pcbddc->NullSpace);CHKERRQ(ierr);
7343972b0daSStefano Zampini   ierr = VecDestroy(&pcbddc->temp_solution);CHKERRQ(ierr);
735534831adSStefano Zampini   ierr = VecDestroy(&pcbddc->original_rhs);CHKERRQ(ierr);
736534831adSStefano Zampini   ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr);
737534831adSStefano Zampini   ierr = MatDestroy(&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr);
738da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->coarse_vec);CHKERRQ(ierr);
739da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->coarse_rhs);CHKERRQ(ierr);
740da1bb401SStefano Zampini   ierr = KSPDestroy(&pcbddc->coarse_ksp);CHKERRQ(ierr);
741da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->coarse_mat);CHKERRQ(ierr);
742da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->coarse_phi_B);CHKERRQ(ierr);
743da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->coarse_phi_D);CHKERRQ(ierr);
744da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec1_P);CHKERRQ(ierr);
745da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec1_C);CHKERRQ(ierr);
746da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->local_auxmat1);CHKERRQ(ierr);
747da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->local_auxmat2);CHKERRQ(ierr);
748da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec1_R);CHKERRQ(ierr);
749da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec2_R);CHKERRQ(ierr);
750da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec4_D);CHKERRQ(ierr);
751da1bb401SStefano Zampini   ierr = VecScatterDestroy(&pcbddc->R_to_B);CHKERRQ(ierr);
752da1bb401SStefano Zampini   ierr = VecScatterDestroy(&pcbddc->R_to_D);CHKERRQ(ierr);
753da1bb401SStefano Zampini   ierr = VecScatterDestroy(&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr);
754da1bb401SStefano Zampini   ierr = KSPDestroy(&pcbddc->ksp_D);CHKERRQ(ierr);
755da1bb401SStefano Zampini   ierr = KSPDestroy(&pcbddc->ksp_R);CHKERRQ(ierr);
756da1bb401SStefano Zampini   ierr = ISDestroy(&pcbddc->NeumannBoundaries);CHKERRQ(ierr);
757da1bb401SStefano Zampini   ierr = ISDestroy(&pcbddc->DirichletBoundaries);CHKERRQ(ierr);
758da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->ConstraintMatrix);CHKERRQ(ierr);
759da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->local_primal_indices);CHKERRQ(ierr);
760da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->replicated_local_primal_indices);CHKERRQ(ierr);
761*0bdf917eSStefano Zampini   ierr = PetscFree(pcbddc->replicated_local_primal_values);CHKERRQ(ierr);
762da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->local_primal_displacements);CHKERRQ(ierr);
763da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->local_primal_sizes);CHKERRQ(ierr);
764da1bb401SStefano Zampini   for (i=0;i<pcbddc->n_ISForDofs;i++) { ierr = ISDestroy(&pcbddc->ISForDofs[i]);CHKERRQ(ierr); }
765da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->ISForDofs);CHKERRQ(ierr);
766da1bb401SStefano Zampini   for (i=0;i<pcbddc->n_ISForFaces;i++) { ierr = ISDestroy(&pcbddc->ISForFaces[i]);CHKERRQ(ierr); }
767da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->ISForFaces);CHKERRQ(ierr);
768da1bb401SStefano Zampini   for (i=0;i<pcbddc->n_ISForEdges;i++) { ierr = ISDestroy(&pcbddc->ISForEdges[i]);CHKERRQ(ierr); }
769da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->ISForEdges);CHKERRQ(ierr);
770da1bb401SStefano Zampini   ierr = ISDestroy(&pcbddc->ISForVertices);CHKERRQ(ierr);
7713972b0daSStefano Zampini   /* Free graph structure */
772da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->xadj);CHKERRQ(ierr);
773da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->adjncy);CHKERRQ(ierr);
774142dfd88SStefano Zampini   if (pcbddc->mat_graph->nvtxs) {
775da1bb401SStefano Zampini     ierr = PetscFree(pcbddc->mat_graph->neighbours_set[0]);CHKERRQ(ierr);
776142dfd88SStefano Zampini   }
777da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->neighbours_set);CHKERRQ(ierr);
7783972b0daSStefano Zampini   ierr = PetscFree4(pcbddc->mat_graph->where,pcbddc->mat_graph->count,pcbddc->mat_graph->cptr,pcbddc->mat_graph->queue);CHKERRQ(ierr);
7793972b0daSStefano Zampini   ierr = PetscFree2(pcbddc->mat_graph->which_dof,pcbddc->mat_graph->touched);CHKERRQ(ierr);
7803972b0daSStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->where_ncmps);CHKERRQ(ierr);
781da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph);CHKERRQ(ierr);
7823425bc38SStefano Zampini   /* remove functions */
783*0bdf917eSStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNullSpace_C","",PETSC_NULL);CHKERRQ(ierr);
7843425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDirichletBoundaries_C","",PETSC_NULL);CHKERRQ(ierr);
7853425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNeumannBoundaries_C","",PETSC_NULL);CHKERRQ(ierr);
7863425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetDirichletBoundaries_C","",PETSC_NULL);CHKERRQ(ierr);
7873425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetNeumannBoundaries_C","",PETSC_NULL);CHKERRQ(ierr);
7883425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseProblemType_C","",PETSC_NULL);CHKERRQ(ierr);
7893425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDofsSplitting_C","",PETSC_NULL);CHKERRQ(ierr);
7903425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetLocalAdjacencyGraph_C","",PETSC_NULL);CHKERRQ(ierr);
7913425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPreSolve_C","",PETSC_NULL);CHKERRQ(ierr);
7923425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPostSolve_C","",PETSC_NULL);CHKERRQ(ierr);
7933425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCCreateFETIDPOperators_C","",PETSC_NULL);CHKERRQ(ierr);
7943425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetRHS_C","",PETSC_NULL);CHKERRQ(ierr);
7953425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetSolution_C","",PETSC_NULL);CHKERRQ(ierr);
796da1bb401SStefano Zampini   /* Free the private data structure that was hanging off the PC */
797da1bb401SStefano Zampini   ierr = PetscFree(pcbddc);CHKERRQ(ierr);
798da1bb401SStefano Zampini   PetscFunctionReturn(0);
799da1bb401SStefano Zampini }
8003425bc38SStefano Zampini /* -------------------------------------------------------------------------- */
8013425bc38SStefano Zampini EXTERN_C_BEGIN
8023425bc38SStefano Zampini #undef __FUNCT__
8033425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetRHS_BDDC"
8043425bc38SStefano Zampini static PetscErrorCode PCBDDCMatFETIDPGetRHS_BDDC(Mat fetidp_mat, Vec standard_rhs, Vec fetidp_flux_rhs)
8053425bc38SStefano Zampini {
8063425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
8073425bc38SStefano Zampini   PC_IS*         pcis;
8083425bc38SStefano Zampini   PC_BDDC*       pcbddc;
8093425bc38SStefano Zampini   Mat_IS*        matis;
8103425bc38SStefano Zampini   PetscErrorCode ierr;
8110c7d97c5SJed Brown 
8123425bc38SStefano Zampini   PetscFunctionBegin;
8133425bc38SStefano Zampini   ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr);
8143425bc38SStefano Zampini   pcis = (PC_IS*)mat_ctx->pc->data;
8153425bc38SStefano Zampini   pcbddc = (PC_BDDC*)mat_ctx->pc->data;
8163425bc38SStefano Zampini   matis = (Mat_IS*)mat_ctx->pc->pmat->data;
8173425bc38SStefano Zampini 
8183425bc38SStefano Zampini   /* change of basis for physical rhs if needed
8193425bc38SStefano Zampini      It also changes the rhs in case of dirichlet boundaries */
8203425bc38SStefano Zampini   (*mat_ctx->pc->ops->presolve)(mat_ctx->pc,PETSC_NULL,standard_rhs,PETSC_NULL);
8213425bc38SStefano Zampini   /* store vectors for computation of fetidp final solution */
8223425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->global_to_D,standard_rhs,mat_ctx->temp_solution_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
8233425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_D,standard_rhs,mat_ctx->temp_solution_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
8243425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
8253425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
8263425bc38SStefano Zampini   /* scale rhs since it should be unassembled */
8273425bc38SStefano Zampini   ierr = VecPointwiseMult(mat_ctx->temp_solution_B,pcis->D,mat_ctx->temp_solution_B);CHKERRQ(ierr);
8283425bc38SStefano Zampini   if (!pcbddc->prec_type) {
8293425bc38SStefano Zampini     /* compute partially subassembled Schur complement right-hand side */
8303425bc38SStefano Zampini     ierr = KSPSolve(pcbddc->ksp_D,mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr);
8313425bc38SStefano Zampini     ierr = MatMult(pcis->A_BI,pcis->vec1_D,pcis->vec1_B);CHKERRQ(ierr);
8323425bc38SStefano Zampini     ierr = VecAXPY(mat_ctx->temp_solution_B,-1.0,pcis->vec1_B);CHKERRQ(ierr);
8333425bc38SStefano Zampini     ierr = VecSet(standard_rhs,0.0);CHKERRQ(ierr);
8343425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,mat_ctx->temp_solution_B,standard_rhs,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8353425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,mat_ctx->temp_solution_B,standard_rhs,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8363425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
8373425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
8383425bc38SStefano Zampini     ierr = VecPointwiseMult(mat_ctx->temp_solution_B,pcis->D,mat_ctx->temp_solution_B);CHKERRQ(ierr);
8393425bc38SStefano Zampini   }
8403425bc38SStefano Zampini   /* BDDC rhs */
8413425bc38SStefano Zampini   ierr = VecCopy(mat_ctx->temp_solution_B,pcis->vec1_B);CHKERRQ(ierr);
8423425bc38SStefano Zampini   if (pcbddc->prec_type) {
8433425bc38SStefano Zampini     ierr = VecCopy(mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr);
8443425bc38SStefano Zampini   }
8453425bc38SStefano Zampini   /* apply BDDC */
8463425bc38SStefano Zampini   ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr);
8473425bc38SStefano Zampini   /* Application of B_delta and assembling of rhs for fetidp fluxes */
8483425bc38SStefano Zampini   ierr = VecSet(fetidp_flux_rhs,0.0);CHKERRQ(ierr);
8493425bc38SStefano Zampini   ierr = MatMult(mat_ctx->B_delta,pcis->vec1_B,mat_ctx->lambda_local);CHKERRQ(ierr);
8503425bc38SStefano Zampini   ierr = VecScatterBegin(mat_ctx->l2g_lambda,mat_ctx->lambda_local,fetidp_flux_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
8513425bc38SStefano Zampini   ierr = VecScatterEnd  (mat_ctx->l2g_lambda,mat_ctx->lambda_local,fetidp_flux_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
8523425bc38SStefano Zampini   /* restore original rhs */
8533425bc38SStefano Zampini   ierr = VecCopy(pcbddc->original_rhs,standard_rhs);CHKERRQ(ierr);
8543425bc38SStefano Zampini   PetscFunctionReturn(0);
8553425bc38SStefano Zampini }
8563425bc38SStefano Zampini EXTERN_C_END
8573425bc38SStefano Zampini #undef __FUNCT__
8583425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetRHS"
8593425bc38SStefano Zampini /*@
8603425bc38SStefano Zampini  PCBDDCMatFETIDPGetRHS - Get rhs for FETIDP linear system.
8613425bc38SStefano Zampini 
8623425bc38SStefano Zampini    Collective
8633425bc38SStefano Zampini 
8643425bc38SStefano Zampini    Input Parameters:
8653425bc38SStefano Zampini +  fetidp_mat   - the FETIDP mat obtained by a call to PCBDDCCreateFETIDPOperators
8663425bc38SStefano Zampini +  standard_rhs - the rhs of your linear system
8673425bc38SStefano Zampini 
8683425bc38SStefano Zampini    Output Parameters:
8693425bc38SStefano Zampini +  fetidp_flux_rhs   - the rhs of the FETIDP linear system
8703425bc38SStefano Zampini 
8713425bc38SStefano Zampini    Level: developer
8723425bc38SStefano Zampini 
8733425bc38SStefano Zampini    Notes:
8743425bc38SStefano Zampini 
8753425bc38SStefano Zampini .seealso: PCBDDC
8763425bc38SStefano Zampini @*/
8773425bc38SStefano Zampini PetscErrorCode PCBDDCMatFETIDPGetRHS(Mat fetidp_mat, Vec standard_rhs, Vec fetidp_flux_rhs)
8783425bc38SStefano Zampini {
8793425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
8803425bc38SStefano Zampini   PetscErrorCode ierr;
8813425bc38SStefano Zampini 
8823425bc38SStefano Zampini   PetscFunctionBegin;
8833425bc38SStefano Zampini   ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr);
8843425bc38SStefano Zampini   ierr = PetscTryMethod(mat_ctx->pc,"PCBDDCMatFETIDPGetRHS_C",(Mat,Vec,Vec),(fetidp_mat,standard_rhs,fetidp_flux_rhs));CHKERRQ(ierr);
8853425bc38SStefano Zampini   PetscFunctionReturn(0);
8863425bc38SStefano Zampini }
8873425bc38SStefano Zampini /* -------------------------------------------------------------------------- */
8883425bc38SStefano Zampini EXTERN_C_BEGIN
8893425bc38SStefano Zampini #undef __FUNCT__
8903425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetSolution_BDDC"
8913425bc38SStefano Zampini static PetscErrorCode PCBDDCMatFETIDPGetSolution_BDDC(Mat fetidp_mat, Vec fetidp_flux_sol, Vec standard_sol)
8923425bc38SStefano Zampini {
8933425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
8943425bc38SStefano Zampini   PC_IS*         pcis;
8953425bc38SStefano Zampini   PC_BDDC*       pcbddc;
8963425bc38SStefano Zampini   Mat_IS*        matis;
8973425bc38SStefano Zampini   PetscErrorCode ierr;
8983425bc38SStefano Zampini 
8993425bc38SStefano Zampini   PetscFunctionBegin;
9003425bc38SStefano Zampini   ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr);
9013425bc38SStefano Zampini   pcis = (PC_IS*)mat_ctx->pc->data;
9023425bc38SStefano Zampini   pcbddc = (PC_BDDC*)mat_ctx->pc->data;
9033425bc38SStefano Zampini   matis = (Mat_IS*)mat_ctx->pc->pmat->data;
9043425bc38SStefano Zampini 
9053425bc38SStefano Zampini   /* apply B_delta^T */
9063425bc38SStefano Zampini   ierr = VecScatterBegin(mat_ctx->l2g_lambda,fetidp_flux_sol,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
9073425bc38SStefano Zampini   ierr = VecScatterEnd  (mat_ctx->l2g_lambda,fetidp_flux_sol,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
9083425bc38SStefano Zampini   ierr = MatMultTranspose(mat_ctx->B_delta,mat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
9093425bc38SStefano Zampini   /* compute rhs for BDDC application */
9103425bc38SStefano Zampini   ierr = VecAYPX(pcis->vec1_B,-1.0,mat_ctx->temp_solution_B);CHKERRQ(ierr);
9113425bc38SStefano Zampini   if (pcbddc->prec_type) {
9123425bc38SStefano Zampini     ierr = VecCopy(mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr);
9133425bc38SStefano Zampini   }
9143425bc38SStefano Zampini   /* apply BDDC */
9153425bc38SStefano Zampini   ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr);
9163425bc38SStefano Zampini   /* put values into standard global vector */
9173425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
9183425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
9193425bc38SStefano Zampini   if (!pcbddc->prec_type) {
9203425bc38SStefano Zampini     /* compute values into the interior if solved for the partially subassembled Schur complement */
9213425bc38SStefano Zampini     ierr = MatMult(pcis->A_IB,pcis->vec1_B,pcis->vec1_D);CHKERRQ(ierr);
9223425bc38SStefano Zampini     ierr = VecAXPY(mat_ctx->temp_solution_D,-1.0,pcis->vec1_D);CHKERRQ(ierr);
9233425bc38SStefano Zampini     ierr = KSPSolve(pcbddc->ksp_D,mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr);
9243425bc38SStefano Zampini   }
9253425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->global_to_D,pcis->vec1_D,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
9263425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_D,pcis->vec1_D,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
9273425bc38SStefano Zampini   /* final change of basis if needed
9283425bc38SStefano Zampini      Is also sums the dirichlet part removed during RHS assembling */
9293425bc38SStefano Zampini   (*mat_ctx->pc->ops->postsolve)(mat_ctx->pc,PETSC_NULL,PETSC_NULL,standard_sol);
9303425bc38SStefano Zampini   PetscFunctionReturn(0);
9313425bc38SStefano Zampini 
9323425bc38SStefano Zampini }
9333425bc38SStefano Zampini EXTERN_C_END
9343425bc38SStefano Zampini #undef __FUNCT__
9353425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetSolution"
9363425bc38SStefano Zampini /*@
9373425bc38SStefano Zampini  PCBDDCMatFETIDPGetSolution - Get Solution for FETIDP linear system.
9383425bc38SStefano Zampini 
9393425bc38SStefano Zampini    Collective
9403425bc38SStefano Zampini 
9413425bc38SStefano Zampini    Input Parameters:
9423425bc38SStefano Zampini +  fetidp_mat        - the FETIDP mat obtained by a call to PCBDDCCreateFETIDPOperators
9433425bc38SStefano Zampini +  fetidp_flux_sol - the solution of the FETIDP linear system
9443425bc38SStefano Zampini 
9453425bc38SStefano Zampini    Output Parameters:
9463425bc38SStefano Zampini +  standard_sol      - the solution on the global domain
9473425bc38SStefano Zampini 
9483425bc38SStefano Zampini    Level: developer
9493425bc38SStefano Zampini 
9503425bc38SStefano Zampini    Notes:
9513425bc38SStefano Zampini 
9523425bc38SStefano Zampini .seealso: PCBDDC
9533425bc38SStefano Zampini @*/
9543425bc38SStefano Zampini PetscErrorCode PCBDDCMatFETIDPGetSolution(Mat fetidp_mat, Vec fetidp_flux_sol, Vec standard_sol)
9553425bc38SStefano Zampini {
9563425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
9573425bc38SStefano Zampini   PetscErrorCode ierr;
9583425bc38SStefano Zampini 
9593425bc38SStefano Zampini   PetscFunctionBegin;
9603425bc38SStefano Zampini   ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr);
9613425bc38SStefano Zampini   ierr = PetscTryMethod(mat_ctx->pc,"PCBDDCMatFETIDPGetSolution_C",(Mat,Vec,Vec),(fetidp_mat,fetidp_flux_sol,standard_sol));CHKERRQ(ierr);
9623425bc38SStefano Zampini   PetscFunctionReturn(0);
9633425bc38SStefano Zampini }
9643425bc38SStefano Zampini /* -------------------------------------------------------------------------- */
9653425bc38SStefano Zampini EXTERN_C_BEGIN
9663425bc38SStefano Zampini #undef __FUNCT__
9673425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPOperators_BDDC"
9683425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPOperators_BDDC(PC pc, Mat *fetidp_mat, PC *fetidp_pc)
9693425bc38SStefano Zampini {
9703425bc38SStefano Zampini   PETSC_EXTERN PetscErrorCode FETIDPMatMult(Mat,Vec,Vec);
9713425bc38SStefano Zampini   PETSC_EXTERN PetscErrorCode PCBDDCDestroyFETIDPMat(Mat);
9723425bc38SStefano Zampini   PETSC_EXTERN PetscErrorCode FETIDPPCApply(PC,Vec,Vec);
9733425bc38SStefano Zampini   PETSC_EXTERN PetscErrorCode PCBDDCDestroyFETIDPPC(PC);
9743425bc38SStefano Zampini 
9753425bc38SStefano Zampini   FETIDPMat_ctx  *fetidpmat_ctx;
9763425bc38SStefano Zampini   Mat            newmat;
9773425bc38SStefano Zampini   FETIDPPC_ctx  *fetidppc_ctx;
9783425bc38SStefano Zampini   PC             newpc;
9793425bc38SStefano Zampini   MPI_Comm       comm = ((PetscObject)pc)->comm;
9803425bc38SStefano Zampini   PetscErrorCode ierr;
9813425bc38SStefano Zampini 
9823425bc38SStefano Zampini   PetscFunctionBegin;
9833425bc38SStefano Zampini   /* FETIDP linear matrix */
9843425bc38SStefano Zampini   ierr = PCBDDCCreateFETIDPMatContext(pc, &fetidpmat_ctx);CHKERRQ(ierr);
9853425bc38SStefano Zampini   ierr = PCBDDCSetupFETIDPMatContext(fetidpmat_ctx);CHKERRQ(ierr);
9863425bc38SStefano Zampini   ierr = MatCreateShell(comm,PETSC_DECIDE,PETSC_DECIDE,fetidpmat_ctx->n_lambda,fetidpmat_ctx->n_lambda,fetidpmat_ctx,&newmat);CHKERRQ(ierr);
9873425bc38SStefano Zampini   ierr = MatShellSetOperation(newmat,MATOP_MULT,(void (*)(void))FETIDPMatMult);CHKERRQ(ierr);
9883425bc38SStefano Zampini   ierr = MatShellSetOperation(newmat,MATOP_DESTROY,(void (*)(void))PCBDDCDestroyFETIDPMat);CHKERRQ(ierr);
9893425bc38SStefano Zampini   ierr = MatSetUp(newmat);CHKERRQ(ierr);
9903425bc38SStefano Zampini   /* FETIDP preconditioner */
9913425bc38SStefano Zampini   ierr = PCBDDCCreateFETIDPPCContext(pc, &fetidppc_ctx);CHKERRQ(ierr);
9923425bc38SStefano Zampini   ierr = PCBDDCSetupFETIDPPCContext(newmat,fetidppc_ctx);CHKERRQ(ierr);
9933425bc38SStefano Zampini   ierr = PCCreate(comm,&newpc);CHKERRQ(ierr);
9943425bc38SStefano Zampini   ierr = PCSetType(newpc,PCSHELL);CHKERRQ(ierr);
9953425bc38SStefano Zampini   ierr = PCShellSetContext(newpc,fetidppc_ctx);CHKERRQ(ierr);
9963425bc38SStefano Zampini   ierr = PCShellSetApply(newpc,FETIDPPCApply);CHKERRQ(ierr);
9973425bc38SStefano Zampini   ierr = PCShellSetDestroy(newpc,PCBDDCDestroyFETIDPPC);CHKERRQ(ierr);
9983425bc38SStefano Zampini   ierr = PCSetOperators(newpc,newmat,newmat,SAME_PRECONDITIONER);CHKERRQ(ierr);
9993425bc38SStefano Zampini   ierr = PCSetUp(newpc);CHKERRQ(ierr);
10003425bc38SStefano Zampini   /* return pointers for objects created */
10013425bc38SStefano Zampini   *fetidp_mat=newmat;
10023425bc38SStefano Zampini   *fetidp_pc=newpc;
10033425bc38SStefano Zampini 
10043425bc38SStefano Zampini   PetscFunctionReturn(0);
10053425bc38SStefano Zampini }
10063425bc38SStefano Zampini EXTERN_C_END
10073425bc38SStefano Zampini #undef __FUNCT__
10083425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPOperators"
10093425bc38SStefano Zampini /*@
10103425bc38SStefano Zampini  PCBDDCCreateFETIDPOperators - Create operators for FETIDP.
10113425bc38SStefano Zampini 
10123425bc38SStefano Zampini    Collective
10133425bc38SStefano Zampini 
10143425bc38SStefano Zampini    Input Parameters:
10153425bc38SStefano Zampini +  pc - the BDDC preconditioning context (setup must be already called)
10163425bc38SStefano Zampini 
10173425bc38SStefano Zampini    Level: developer
10183425bc38SStefano Zampini 
10193425bc38SStefano Zampini    Notes:
10203425bc38SStefano Zampini 
10213425bc38SStefano Zampini .seealso: PCBDDC
10223425bc38SStefano Zampini @*/
10233425bc38SStefano Zampini PetscErrorCode PCBDDCCreateFETIDPOperators(PC pc, Mat *fetidp_mat, PC *fetidp_pc)
10243425bc38SStefano Zampini {
10253425bc38SStefano Zampini   PetscErrorCode ierr;
10263425bc38SStefano Zampini 
10273425bc38SStefano Zampini   PetscFunctionBegin;
10283425bc38SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
10293425bc38SStefano Zampini   if (pc->setupcalled) {
10303425bc38SStefano Zampini     ierr = PetscTryMethod(pc,"PCBDDCCreateFETIDPOperators_C",(PC,Mat*,PC*),(pc,fetidp_mat,fetidp_pc));CHKERRQ(ierr);
10313425bc38SStefano Zampini   } else {
10323425bc38SStefano Zampini     SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"You must call PCSetup_BDDC before calling %s\n",__FUNCT__);
10333425bc38SStefano Zampini   }
10343425bc38SStefano Zampini   PetscFunctionReturn(0);
10353425bc38SStefano Zampini }
10360c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
1037da1bb401SStefano Zampini /*MC
1038da1bb401SStefano Zampini    PCBDDC - Balancing Domain Decomposition by Constraints.
10390c7d97c5SJed Brown 
1040da1bb401SStefano Zampini    Options Database Keys:
1041da1bb401SStefano Zampini .    -pcbddc ??? -
1042da1bb401SStefano Zampini 
1043da1bb401SStefano Zampini    Level: intermediate
1044da1bb401SStefano Zampini 
1045da1bb401SStefano Zampini    Notes: The matrix used with this preconditioner must be of type MATIS
1046da1bb401SStefano Zampini 
1047da1bb401SStefano Zampini           Unlike more 'conventional' interface preconditioners, this iterates over ALL the
1048da1bb401SStefano Zampini           degrees of freedom, NOT just those on the interface (this allows the use of approximate solvers
1049da1bb401SStefano Zampini           on the subdomains).
1050da1bb401SStefano Zampini 
1051da1bb401SStefano Zampini           Options for the coarse grid preconditioner can be set with -
1052da1bb401SStefano Zampini           Options for the Dirichlet subproblem can be set with -
1053da1bb401SStefano Zampini           Options for the Neumann subproblem can be set with -
1054da1bb401SStefano Zampini 
1055da1bb401SStefano Zampini    Contributed by Stefano Zampini
1056da1bb401SStefano Zampini 
1057da1bb401SStefano Zampini .seealso:  PCCreate(), PCSetType(), PCType (for list of available types), PC,  MATIS
1058da1bb401SStefano Zampini M*/
1059da1bb401SStefano Zampini EXTERN_C_BEGIN
1060da1bb401SStefano Zampini #undef __FUNCT__
1061da1bb401SStefano Zampini #define __FUNCT__ "PCCreate_BDDC"
1062da1bb401SStefano Zampini PetscErrorCode PCCreate_BDDC(PC pc)
1063da1bb401SStefano Zampini {
1064da1bb401SStefano Zampini   PetscErrorCode ierr;
1065da1bb401SStefano Zampini   PC_BDDC        *pcbddc;
1066da1bb401SStefano Zampini   PCBDDCGraph    mat_graph;
1067da1bb401SStefano Zampini 
1068da1bb401SStefano Zampini   PetscFunctionBegin;
1069da1bb401SStefano Zampini   /* Creates the private data structure for this preconditioner and attach it to the PC object. */
1070da1bb401SStefano Zampini   ierr      = PetscNewLog(pc,PC_BDDC,&pcbddc);CHKERRQ(ierr);
1071da1bb401SStefano Zampini   pc->data  = (void*)pcbddc;
1072da1bb401SStefano Zampini 
1073da1bb401SStefano Zampini   /* create PCIS data structure */
1074da1bb401SStefano Zampini   ierr = PCISCreate(pc);CHKERRQ(ierr);
1075da1bb401SStefano Zampini 
1076da1bb401SStefano Zampini   /* BDDC specific */
1077*0bdf917eSStefano Zampini   pcbddc->CoarseNullSpace            = 0;
1078*0bdf917eSStefano Zampini   pcbddc->NullSpace                  = 0;
10793972b0daSStefano Zampini   pcbddc->temp_solution              = 0;
1080534831adSStefano Zampini   pcbddc->original_rhs               = 0;
1081534831adSStefano Zampini   pcbddc->local_mat                  = 0;
1082534831adSStefano Zampini   pcbddc->ChangeOfBasisMatrix        = 0;
1083534831adSStefano Zampini   pcbddc->usechangeofbasis           = PETSC_TRUE;
1084534831adSStefano Zampini   pcbddc->usechangeonfaces           = PETSC_FALSE;
1085da1bb401SStefano Zampini   pcbddc->coarse_vec                 = 0;
1086da1bb401SStefano Zampini   pcbddc->coarse_rhs                 = 0;
1087da1bb401SStefano Zampini   pcbddc->coarse_ksp                 = 0;
1088da1bb401SStefano Zampini   pcbddc->coarse_phi_B               = 0;
1089da1bb401SStefano Zampini   pcbddc->coarse_phi_D               = 0;
1090da1bb401SStefano Zampini   pcbddc->vec1_P                     = 0;
1091da1bb401SStefano Zampini   pcbddc->vec1_R                     = 0;
1092da1bb401SStefano Zampini   pcbddc->vec2_R                     = 0;
1093da1bb401SStefano Zampini   pcbddc->local_auxmat1              = 0;
1094da1bb401SStefano Zampini   pcbddc->local_auxmat2              = 0;
1095da1bb401SStefano Zampini   pcbddc->R_to_B                     = 0;
1096da1bb401SStefano Zampini   pcbddc->R_to_D                     = 0;
1097da1bb401SStefano Zampini   pcbddc->ksp_D                      = 0;
1098da1bb401SStefano Zampini   pcbddc->ksp_R                      = 0;
1099da1bb401SStefano Zampini   pcbddc->local_primal_indices       = 0;
1100da1bb401SStefano Zampini   pcbddc->prec_type                  = PETSC_FALSE;
1101da1bb401SStefano Zampini   pcbddc->NeumannBoundaries          = 0;
1102da1bb401SStefano Zampini   pcbddc->ISForDofs                  = 0;
1103da1bb401SStefano Zampini   pcbddc->ISForVertices              = 0;
1104da1bb401SStefano Zampini   pcbddc->n_ISForFaces               = 0;
1105da1bb401SStefano Zampini   pcbddc->n_ISForEdges               = 0;
1106da1bb401SStefano Zampini   pcbddc->ConstraintMatrix           = 0;
1107da1bb401SStefano Zampini   pcbddc->use_nnsp_true              = PETSC_FALSE;
1108da1bb401SStefano Zampini   pcbddc->local_primal_sizes         = 0;
1109da1bb401SStefano Zampini   pcbddc->local_primal_displacements = 0;
1110da1bb401SStefano Zampini   pcbddc->replicated_local_primal_indices = 0;
1111da1bb401SStefano Zampini   pcbddc->replicated_local_primal_values  = 0;
1112da1bb401SStefano Zampini   pcbddc->coarse_loc_to_glob         = 0;
1113da1bb401SStefano Zampini   pcbddc->dbg_flag                   = PETSC_FALSE;
1114da1bb401SStefano Zampini   pcbddc->coarsening_ratio           = 8;
1115b76ba322SStefano Zampini   pcbddc->use_exact_dirichlet        = PETSC_TRUE;
1116da1bb401SStefano Zampini 
1117da1bb401SStefano Zampini   /* allocate and initialize needed graph structure */
1118da1bb401SStefano Zampini   ierr = PetscMalloc(sizeof(*mat_graph),&pcbddc->mat_graph);CHKERRQ(ierr);
1119da1bb401SStefano Zampini   pcbddc->mat_graph->xadj            = 0;
1120da1bb401SStefano Zampini   pcbddc->mat_graph->adjncy          = 0;
1121da1bb401SStefano Zampini 
1122da1bb401SStefano Zampini   /* function pointers */
1123da1bb401SStefano Zampini   pc->ops->apply               = PCApply_BDDC;
1124da1bb401SStefano Zampini   pc->ops->applytranspose      = 0;
1125da1bb401SStefano Zampini   pc->ops->setup               = PCSetUp_BDDC;
1126da1bb401SStefano Zampini   pc->ops->destroy             = PCDestroy_BDDC;
1127da1bb401SStefano Zampini   pc->ops->setfromoptions      = PCSetFromOptions_BDDC;
1128da1bb401SStefano Zampini   pc->ops->view                = 0;
1129da1bb401SStefano Zampini   pc->ops->applyrichardson     = 0;
1130da1bb401SStefano Zampini   pc->ops->applysymmetricleft  = 0;
1131da1bb401SStefano Zampini   pc->ops->applysymmetricright = 0;
1132534831adSStefano Zampini   pc->ops->presolve            = PCPreSolve_BDDC;
1133534831adSStefano Zampini   pc->ops->postsolve           = PCPostSolve_BDDC;
1134da1bb401SStefano Zampini 
1135da1bb401SStefano Zampini   /* composing function */
1136*0bdf917eSStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNullSpace_C","PCBDDCSetNullSpace_BDDC",
1137*0bdf917eSStefano Zampini                     PCBDDCSetNullSpace_BDDC);CHKERRQ(ierr);
1138da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDirichletBoundaries_C","PCBDDCSetDirichletBoundaries_BDDC",
1139da1bb401SStefano Zampini                     PCBDDCSetDirichletBoundaries_BDDC);CHKERRQ(ierr);
1140da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNeumannBoundaries_C","PCBDDCSetNeumannBoundaries_BDDC",
1141da1bb401SStefano Zampini                     PCBDDCSetNeumannBoundaries_BDDC);CHKERRQ(ierr);
1142da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetDirichletBoundaries_C","PCBDDCGetDirichletBoundaries_BDDC",
1143da1bb401SStefano Zampini                     PCBDDCGetDirichletBoundaries_BDDC);CHKERRQ(ierr);
1144da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetNeumannBoundaries_C","PCBDDCGetNeumannBoundaries_BDDC",
1145da1bb401SStefano Zampini                     PCBDDCGetNeumannBoundaries_BDDC);CHKERRQ(ierr);
1146da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseProblemType_C","PCBDDCSetCoarseProblemType_BDDC",
1147da1bb401SStefano Zampini                     PCBDDCSetCoarseProblemType_BDDC);CHKERRQ(ierr);
1148da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDofsSplitting_C","PCBDDCSetDofsSplitting_BDDC",
1149da1bb401SStefano Zampini                     PCBDDCSetDofsSplitting_BDDC);CHKERRQ(ierr);
1150da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetLocalAdjacencyGraph_C","PCBDDCSetLocalAdjacencyGraph_BDDC",
1151da1bb401SStefano Zampini                     PCBDDCSetLocalAdjacencyGraph_BDDC);CHKERRQ(ierr);
1152534831adSStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPreSolve_C","PCPreSolve_BDDC",
1153534831adSStefano Zampini                     PCPreSolve_BDDC);CHKERRQ(ierr);
1154534831adSStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPostSolve_C","PCPostSolve_BDDC",
1155534831adSStefano Zampini                     PCPostSolve_BDDC);CHKERRQ(ierr);
11563425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCCreateFETIDPOperators_C","PCBDDCCreateFETIDPOperators_BDDC",
11573425bc38SStefano Zampini                     PCBDDCCreateFETIDPOperators_BDDC);CHKERRQ(ierr);
11583425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetRHS_C","PCBDDCMatFETIDPGetRHS_BDDC",
11593425bc38SStefano Zampini                     PCBDDCMatFETIDPGetRHS_BDDC);CHKERRQ(ierr);
11603425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetSolution_C","PCBDDCMatFETIDPGetSolution_BDDC",
11613425bc38SStefano Zampini                     PCBDDCMatFETIDPGetSolution_BDDC);CHKERRQ(ierr);
1162da1bb401SStefano Zampini   PetscFunctionReturn(0);
1163da1bb401SStefano Zampini }
1164da1bb401SStefano Zampini EXTERN_C_END
11653425bc38SStefano Zampini 
1166da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
1167da1bb401SStefano Zampini /* All static functions from now on                                           */
1168da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
11693425bc38SStefano Zampini 
11703425bc38SStefano Zampini #undef __FUNCT__
1171*0bdf917eSStefano Zampini #define __FUNCT__ "PCBDDCAdaptNullSpace"
1172*0bdf917eSStefano Zampini static PetscErrorCode PCBDDCAdaptNullSpace(PC pc)
1173*0bdf917eSStefano Zampini {
1174*0bdf917eSStefano Zampini   PC_IS*         pcis = (PC_IS*)  (pc->data);
1175*0bdf917eSStefano Zampini   PC_BDDC*       pcbddc = (PC_BDDC*)(pc->data);
1176*0bdf917eSStefano Zampini   KSP            inv_change;
1177*0bdf917eSStefano Zampini   PC             pc_change;
1178*0bdf917eSStefano Zampini   const Vec      *nsp_vecs;
1179*0bdf917eSStefano Zampini   Vec            *new_nsp_vecs;
1180*0bdf917eSStefano Zampini   PetscInt       i,nsp_size,new_nsp_size,start_new;
1181*0bdf917eSStefano Zampini   PetscBool      nsp_has_cnst;
1182*0bdf917eSStefano Zampini   MatNullSpace   new_nsp;
1183*0bdf917eSStefano Zampini   PetscErrorCode ierr;
1184*0bdf917eSStefano Zampini 
1185*0bdf917eSStefano Zampini   PetscFunctionBegin;
1186*0bdf917eSStefano Zampini   ierr = MatNullSpaceGetVecs(pcbddc->NullSpace,&nsp_has_cnst,&nsp_size,&nsp_vecs);CHKERRQ(ierr);
1187*0bdf917eSStefano Zampini   ierr = KSPCreate(PETSC_COMM_SELF,&inv_change);CHKERRQ(ierr);
1188*0bdf917eSStefano Zampini   ierr = KSPSetOperators(inv_change,pcbddc->ChangeOfBasisMatrix,pcbddc->ChangeOfBasisMatrix,SAME_PRECONDITIONER);CHKERRQ(ierr);
1189*0bdf917eSStefano Zampini   ierr = KSPSetType(inv_change,KSPPREONLY);CHKERRQ(ierr);
1190*0bdf917eSStefano Zampini   ierr = KSPGetPC(inv_change,&pc_change);CHKERRQ(ierr);
1191*0bdf917eSStefano Zampini   ierr = PCSetType(pc_change,PCLU);CHKERRQ(ierr);
1192*0bdf917eSStefano Zampini   ierr = KSPSetUp(inv_change);CHKERRQ(ierr);
1193*0bdf917eSStefano Zampini   new_nsp_size = nsp_size;
1194*0bdf917eSStefano Zampini   if (nsp_has_cnst) { new_nsp_size++; }
1195*0bdf917eSStefano Zampini   ierr = PetscMalloc(new_nsp_size*sizeof(Vec),&new_nsp_vecs);CHKERRQ(ierr);
1196*0bdf917eSStefano Zampini   for (i=0;i<new_nsp_size;i++) { ierr = VecDuplicate(pcis->vec1_global,&new_nsp_vecs[i]);CHKERRQ(ierr); }
1197*0bdf917eSStefano Zampini   start_new = 0;
1198*0bdf917eSStefano Zampini   if (nsp_has_cnst) {
1199*0bdf917eSStefano Zampini     start_new = 1;
1200*0bdf917eSStefano Zampini     ierr = VecSet(new_nsp_vecs[0],1.0);CHKERRQ(ierr);
1201*0bdf917eSStefano Zampini     ierr = VecSet(pcis->vec1_B,1.0);CHKERRQ(ierr);
1202*0bdf917eSStefano Zampini     ierr = KSPSolve(inv_change,pcis->vec1_B,pcis->vec1_B);
1203*0bdf917eSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,new_nsp_vecs[0],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
1204*0bdf917eSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,new_nsp_vecs[0],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
1205*0bdf917eSStefano Zampini   }
1206*0bdf917eSStefano Zampini   for (i=0;i<nsp_size;i++) {
1207*0bdf917eSStefano Zampini     ierr = VecCopy(nsp_vecs[i],new_nsp_vecs[i+start_new]);CHKERRQ(ierr);
1208*0bdf917eSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,nsp_vecs[i],pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1209*0bdf917eSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,nsp_vecs[i],pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1210*0bdf917eSStefano Zampini     ierr = KSPSolve(inv_change,pcis->vec1_B,pcis->vec1_B);
1211*0bdf917eSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,new_nsp_vecs[i+start_new],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
1212*0bdf917eSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,new_nsp_vecs[i+start_new],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
1213*0bdf917eSStefano Zampini   }
1214*0bdf917eSStefano Zampini   ierr = VecNormalize(new_nsp_vecs[0],PETSC_NULL);CHKERRQ(ierr);
1215*0bdf917eSStefano Zampini   /* TODO : Orthonormalize vecs when new_nsp_size > 0! */
1216*0bdf917eSStefano Zampini 
1217*0bdf917eSStefano Zampini   /*PetscBool nsp_t=PETSC_FALSE;
1218*0bdf917eSStefano Zampini   ierr = MatNullSpaceTest(pcbddc->NullSpace,pc->pmat,&nsp_t);CHKERRQ(ierr);
1219*0bdf917eSStefano Zampini   printf("Original Null Space test: %d\n",nsp_t);
1220*0bdf917eSStefano Zampini   Mat temp_mat;
1221*0bdf917eSStefano Zampini   Mat_IS* matis = (Mat_IS*)pc->pmat->data;
1222*0bdf917eSStefano Zampini     temp_mat = matis->A;
1223*0bdf917eSStefano Zampini     matis->A = pcbddc->local_mat;
1224*0bdf917eSStefano Zampini     pcbddc->local_mat = temp_mat;
1225*0bdf917eSStefano Zampini   ierr = MatNullSpaceTest(pcbddc->NullSpace,pc->pmat,&nsp_t);CHKERRQ(ierr);
1226*0bdf917eSStefano Zampini   printf("Original Null Space, mat changed test: %d\n",nsp_t);
1227*0bdf917eSStefano Zampini   {
1228*0bdf917eSStefano Zampini     PetscReal test_norm;
1229*0bdf917eSStefano Zampini     for (i=0;i<new_nsp_size;i++) {
1230*0bdf917eSStefano Zampini       ierr = MatMult(pc->pmat,new_nsp_vecs[i],pcis->vec1_global);CHKERRQ(ierr);
1231*0bdf917eSStefano Zampini       ierr = VecNorm(pcis->vec1_global,NORM_2,&test_norm);CHKERRQ(ierr);
1232*0bdf917eSStefano Zampini       if (test_norm > 1.e-12) {
1233*0bdf917eSStefano Zampini         printf("------------ERROR VEC %d------------------\n",i);
1234*0bdf917eSStefano Zampini         ierr = VecView(pcis->vec1_global,PETSC_VIEWER_STDOUT_WORLD);
1235*0bdf917eSStefano Zampini         printf("------------------------------------------\n");
1236*0bdf917eSStefano Zampini       }
1237*0bdf917eSStefano Zampini     }
1238*0bdf917eSStefano Zampini   }*/
1239*0bdf917eSStefano Zampini 
1240*0bdf917eSStefano Zampini   ierr = KSPDestroy(&inv_change);CHKERRQ(ierr);
1241*0bdf917eSStefano Zampini   ierr = MatNullSpaceCreate(((PetscObject)pc)->comm,PETSC_FALSE,new_nsp_size,new_nsp_vecs,&new_nsp);CHKERRQ(ierr);
1242*0bdf917eSStefano Zampini   ierr = PCBDDCSetNullSpace(pc,new_nsp);CHKERRQ(ierr);
1243*0bdf917eSStefano Zampini   ierr = MatNullSpaceDestroy(&new_nsp);CHKERRQ(ierr);
1244*0bdf917eSStefano Zampini   /*
1245*0bdf917eSStefano Zampini   ierr = MatNullSpaceTest(pcbddc->NullSpace,pc->pmat,&nsp_t);CHKERRQ(ierr);
1246*0bdf917eSStefano Zampini   printf("New Null Space, mat changed: %d\n",nsp_t);
1247*0bdf917eSStefano Zampini     temp_mat = matis->A;
1248*0bdf917eSStefano Zampini     matis->A = pcbddc->local_mat;
1249*0bdf917eSStefano Zampini     pcbddc->local_mat = temp_mat;
1250*0bdf917eSStefano Zampini   ierr = MatNullSpaceTest(pcbddc->NullSpace,pc->pmat,&nsp_t);CHKERRQ(ierr);
1251*0bdf917eSStefano Zampini   printf("New Null Space, mat original: %d\n",nsp_t);*/
1252*0bdf917eSStefano Zampini 
1253*0bdf917eSStefano Zampini   for (i=0;i<new_nsp_size;i++) { ierr = VecDestroy(&new_nsp_vecs[i]);CHKERRQ(ierr); }
1254*0bdf917eSStefano Zampini   ierr = PetscFree(new_nsp_vecs);CHKERRQ(ierr);
1255*0bdf917eSStefano Zampini   PetscFunctionReturn(0);
1256*0bdf917eSStefano Zampini }
1257*0bdf917eSStefano Zampini 
1258*0bdf917eSStefano Zampini 
1259*0bdf917eSStefano Zampini 
1260*0bdf917eSStefano Zampini #undef __FUNCT__
12613425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPMatContext"
12623425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPMatContext(PC pc, FETIDPMat_ctx **fetidpmat_ctx)
12633425bc38SStefano Zampini {
12643425bc38SStefano Zampini   FETIDPMat_ctx  *newctx;
12653425bc38SStefano Zampini   PetscErrorCode ierr;
12663425bc38SStefano Zampini 
12673425bc38SStefano Zampini   PetscFunctionBegin;
12683425bc38SStefano Zampini   ierr = PetscMalloc(sizeof(*newctx),&newctx);CHKERRQ(ierr);
12693425bc38SStefano Zampini   newctx->lambda_local    = 0;
12703425bc38SStefano Zampini   newctx->temp_solution_B = 0;
12713425bc38SStefano Zampini   newctx->temp_solution_D = 0;
12723425bc38SStefano Zampini   newctx->B_delta         = 0;
12733425bc38SStefano Zampini   newctx->B_Ddelta        = 0; /* theoretically belongs to the FETIDP preconditioner */
12743425bc38SStefano Zampini   newctx->l2g_lambda      = 0;
12753425bc38SStefano Zampini   /* increase the reference count for BDDC preconditioner */
12763425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)pc);CHKERRQ(ierr);
12773425bc38SStefano Zampini   newctx->pc              = pc;
12783425bc38SStefano Zampini   *fetidpmat_ctx          = newctx;
12793425bc38SStefano Zampini   PetscFunctionReturn(0);
12803425bc38SStefano Zampini }
12813425bc38SStefano Zampini 
12823425bc38SStefano Zampini #undef __FUNCT__
12833425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPPCContext"
12843425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPPCContext(PC pc, FETIDPPC_ctx **fetidppc_ctx)
12853425bc38SStefano Zampini {
12863425bc38SStefano Zampini   FETIDPPC_ctx  *newctx;
12873425bc38SStefano Zampini   PetscErrorCode ierr;
12883425bc38SStefano Zampini 
12893425bc38SStefano Zampini   PetscFunctionBegin;
12903425bc38SStefano Zampini   ierr = PetscMalloc(sizeof(*newctx),&newctx);CHKERRQ(ierr);
12913425bc38SStefano Zampini   newctx->lambda_local    = 0;
12923425bc38SStefano Zampini   newctx->B_Ddelta        = 0;
12933425bc38SStefano Zampini   newctx->l2g_lambda      = 0;
12943425bc38SStefano Zampini   /* increase the reference count for BDDC preconditioner */
12953425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)pc);CHKERRQ(ierr);
12963425bc38SStefano Zampini   newctx->pc              = pc;
12973425bc38SStefano Zampini   *fetidppc_ctx           = newctx;
12983425bc38SStefano Zampini   PetscFunctionReturn(0);
12993425bc38SStefano Zampini }
13003425bc38SStefano Zampini 
13013425bc38SStefano Zampini #undef __FUNCT__
13023425bc38SStefano Zampini #define __FUNCT__ "PCBDDCDestroyFETIDPMat"
13033425bc38SStefano Zampini static PetscErrorCode PCBDDCDestroyFETIDPMat(Mat A)
13043425bc38SStefano Zampini {
13053425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
13063425bc38SStefano Zampini   PetscErrorCode ierr;
13073425bc38SStefano Zampini 
13083425bc38SStefano Zampini   PetscFunctionBegin;
13093425bc38SStefano Zampini   ierr = MatShellGetContext(A,(void**)&mat_ctx);CHKERRQ(ierr);
13103425bc38SStefano Zampini   ierr = VecDestroy(&mat_ctx->lambda_local);CHKERRQ(ierr);
13113425bc38SStefano Zampini   ierr = VecDestroy(&mat_ctx->temp_solution_D);CHKERRQ(ierr);
13123425bc38SStefano Zampini   ierr = VecDestroy(&mat_ctx->temp_solution_B);CHKERRQ(ierr);
13133425bc38SStefano Zampini   ierr = MatDestroy(&mat_ctx->B_delta);CHKERRQ(ierr);
13143425bc38SStefano Zampini   ierr = MatDestroy(&mat_ctx->B_Ddelta);CHKERRQ(ierr);
13153425bc38SStefano Zampini   ierr = VecScatterDestroy(&mat_ctx->l2g_lambda);CHKERRQ(ierr);
13163425bc38SStefano Zampini   ierr = PCDestroy(&mat_ctx->pc);CHKERRQ(ierr); /* actually it does not destroy BDDC, only decrease its reference count */
13173425bc38SStefano Zampini   ierr = PetscFree(mat_ctx);CHKERRQ(ierr);
13183425bc38SStefano Zampini   PetscFunctionReturn(0);
13193425bc38SStefano Zampini }
13203425bc38SStefano Zampini 
13213425bc38SStefano Zampini #undef __FUNCT__
13223425bc38SStefano Zampini #define __FUNCT__ "PCBDDCDestroyFETIDPPC"
13233425bc38SStefano Zampini static PetscErrorCode PCBDDCDestroyFETIDPPC(PC pc)
13243425bc38SStefano Zampini {
13253425bc38SStefano Zampini   FETIDPPC_ctx  *pc_ctx;
13263425bc38SStefano Zampini   PetscErrorCode ierr;
13273425bc38SStefano Zampini 
13283425bc38SStefano Zampini   PetscFunctionBegin;
13293425bc38SStefano Zampini   ierr = PCShellGetContext(pc,(void**)&pc_ctx);CHKERRQ(ierr);
13303425bc38SStefano Zampini   ierr = VecDestroy(&pc_ctx->lambda_local);CHKERRQ(ierr);
13313425bc38SStefano Zampini   ierr = MatDestroy(&pc_ctx->B_Ddelta);CHKERRQ(ierr);
13323425bc38SStefano Zampini   ierr = VecScatterDestroy(&pc_ctx->l2g_lambda);CHKERRQ(ierr);
13333425bc38SStefano Zampini   ierr = PCDestroy(&pc_ctx->pc);CHKERRQ(ierr); /* actually it does not destroy BDDC, only decrease its reference count */
13343425bc38SStefano Zampini   ierr = PetscFree(pc_ctx);CHKERRQ(ierr);
13353425bc38SStefano Zampini   PetscFunctionReturn(0);
13363425bc38SStefano Zampini }
13373425bc38SStefano Zampini 
13383425bc38SStefano Zampini #undef __FUNCT__
13393425bc38SStefano Zampini #define __FUNCT__ "PCBDDCSetupFETIDPMatContext"
13403425bc38SStefano Zampini static PetscErrorCode PCBDDCSetupFETIDPMatContext(FETIDPMat_ctx *fetidpmat_ctx )
13413425bc38SStefano Zampini {
13423425bc38SStefano Zampini   PetscErrorCode ierr;
13433425bc38SStefano Zampini   PC_IS          *pcis=(PC_IS*)fetidpmat_ctx->pc->data;
13443425bc38SStefano Zampini   PC_BDDC        *pcbddc=(PC_BDDC*)fetidpmat_ctx->pc->data;
13453425bc38SStefano Zampini   PCBDDCGraph    mat_graph=pcbddc->mat_graph;
13463425bc38SStefano Zampini   Mat_IS         *matis  = (Mat_IS*)fetidpmat_ctx->pc->pmat->data;
13473425bc38SStefano Zampini   MPI_Comm       comm = ((PetscObject)(fetidpmat_ctx->pc))->comm;
13483425bc38SStefano Zampini 
13493425bc38SStefano Zampini   Mat            ScalingMat;
13503425bc38SStefano Zampini   Vec            lambda_global;
13513425bc38SStefano Zampini   IS             IS_l2g_lambda;
13523425bc38SStefano Zampini 
13533425bc38SStefano Zampini   PetscBool      skip_node,fully_redundant;
13543425bc38SStefano Zampini   PetscInt       i,j,k,s,n_boundary_dofs,sum_dof_sizes,n_global_lambda,n_vertices;
13553425bc38SStefano Zampini   PetscInt       n_local_lambda,n_lambda_for_dof,dual_size,n_neg_values,n_pos_values;
13563425bc38SStefano Zampini   PetscMPIInt    rank,nprocs,partial_sum;
13573425bc38SStefano Zampini   PetscScalar    scalar_value;
13583425bc38SStefano Zampini 
13593425bc38SStefano Zampini   PetscInt       *vertex_indices,*temp_indices;
13603425bc38SStefano Zampini   PetscInt       *dual_dofs_boundary_indices,*aux_local_numbering_1,*aux_global_numbering;
13613425bc38SStefano Zampini   PetscInt       *aux_sums,*cols_B_delta,*l2g_indices;
13623425bc38SStefano Zampini   PetscMPIInt    *aux_local_numbering_2,*aux_global_numbering_mpi,*dof_sizes,*dof_displs;
13633425bc38SStefano Zampini   PetscMPIInt    *all_aux_global_numbering_mpi_1,*all_aux_global_numbering_mpi_2,*global_dofs_numbering;
13643425bc38SStefano Zampini   PetscScalar    *array,*scaling_factors,*vals_B_delta;
13653425bc38SStefano Zampini 
13663425bc38SStefano Zampini   /* For communication of scaling factors */
13673425bc38SStefano Zampini   PetscInt       *ptrs_buffer,neigh_position;
13683425bc38SStefano Zampini   PetscScalar    **all_factors,*send_buffer,*recv_buffer;
13693425bc38SStefano Zampini   MPI_Request    *send_reqs,*recv_reqs;
13703425bc38SStefano Zampini 
13713425bc38SStefano Zampini   /* tests */
13723425bc38SStefano Zampini   Vec            test_vec;
13733425bc38SStefano Zampini   PetscBool      test_fetidp;
13743425bc38SStefano Zampini   PetscViewer    viewer;
13753425bc38SStefano Zampini 
13763425bc38SStefano Zampini   PetscFunctionBegin;
13773425bc38SStefano Zampini   ierr = MPI_Comm_rank(comm,&rank);CHKERRQ(ierr);
13783425bc38SStefano Zampini   ierr = MPI_Comm_size(comm,&nprocs);CHKERRQ(ierr);
13793425bc38SStefano Zampini 
13803425bc38SStefano Zampini   /* Default type of lagrange multipliers is non-redundant */
13813425bc38SStefano Zampini   fully_redundant = PETSC_FALSE;
13823425bc38SStefano Zampini   ierr = PetscOptionsGetBool(PETSC_NULL,"-fetidp_fullyredundant",&fully_redundant,PETSC_NULL);CHKERRQ(ierr);
13833425bc38SStefano Zampini 
13843425bc38SStefano Zampini   /* Evaluate local and global number of lagrange multipliers */
13853425bc38SStefano Zampini   ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
13863425bc38SStefano Zampini   n_local_lambda = 0;
13873425bc38SStefano Zampini   partial_sum = 0;
13883425bc38SStefano Zampini   n_boundary_dofs = 0;
13893425bc38SStefano Zampini   s = 0;
13903425bc38SStefano Zampini   n_vertices = 0;
13913425bc38SStefano Zampini   /* Get Vertices used to define the BDDC */
13923425bc38SStefano Zampini   ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(*vertex_indices),&vertex_indices);CHKERRQ(ierr);
13933425bc38SStefano Zampini   for (i=0;i<pcbddc->local_primal_size;i++) {
13943425bc38SStefano Zampini     ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&j,(const PetscInt**)&temp_indices,PETSC_NULL);CHKERRQ(ierr);
13953425bc38SStefano Zampini     if (j == 1) {
13963425bc38SStefano Zampini       vertex_indices[n_vertices]=temp_indices[0];
13973425bc38SStefano Zampini       n_vertices++;
13983425bc38SStefano Zampini     }
13993425bc38SStefano Zampini     ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&j,(const PetscInt**)&temp_indices,PETSC_NULL);CHKERRQ(ierr);
14003425bc38SStefano Zampini   }
14013425bc38SStefano Zampini   dual_size = pcis->n_B-n_vertices;
14023425bc38SStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*dual_dofs_boundary_indices),&dual_dofs_boundary_indices);CHKERRQ(ierr);
14033425bc38SStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*aux_local_numbering_1),&aux_local_numbering_1);CHKERRQ(ierr);
14043425bc38SStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*aux_local_numbering_2),&aux_local_numbering_2);CHKERRQ(ierr);
14053425bc38SStefano Zampini 
14063425bc38SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
14073425bc38SStefano Zampini   for (i=0;i<pcis->n;i++){
14083425bc38SStefano Zampini     j = mat_graph->count[i]; /* RECALL: mat_graph->count[i] does not count myself */
1409c6582918SStefano Zampini     k = 0;
1410c6582918SStefano Zampini     if (j > 0) {
14113425bc38SStefano Zampini       k = (mat_graph->neighbours_set[i][0] == -1 ?  1 : 0);
1412c6582918SStefano Zampini     }
14133425bc38SStefano Zampini     j = j - k ;
14143425bc38SStefano Zampini     if ( j > 0 ) { n_boundary_dofs++; }
14153425bc38SStefano Zampini 
14163425bc38SStefano Zampini     skip_node = PETSC_FALSE;
1417c6582918SStefano Zampini     if ( s < n_vertices && vertex_indices[s]==i) { /* it works for a sorted set of vertices */
14183425bc38SStefano Zampini       skip_node = PETSC_TRUE;
14193425bc38SStefano Zampini       s++;
14203425bc38SStefano Zampini     }
14213425bc38SStefano Zampini     if (j < 1) {skip_node = PETSC_TRUE;}
14223425bc38SStefano Zampini     if ( !skip_node ) {
14233425bc38SStefano Zampini       if (fully_redundant) {
14243425bc38SStefano Zampini         /* fully redundant set of lagrange multipliers */
14253425bc38SStefano Zampini         n_lambda_for_dof = (j*(j+1))/2;
14263425bc38SStefano Zampini       } else {
14273425bc38SStefano Zampini         n_lambda_for_dof = j;
14283425bc38SStefano Zampini       }
14293425bc38SStefano Zampini       n_local_lambda += j;
14303425bc38SStefano Zampini       /* needed to evaluate global number of lagrange multipliers */
14313425bc38SStefano Zampini       array[i]=(1.0*n_lambda_for_dof)/(j+1.0); /* already scaled for the next global sum */
14323425bc38SStefano Zampini       /* store some data needed */
14333425bc38SStefano Zampini       dual_dofs_boundary_indices[partial_sum] = n_boundary_dofs-1;
14343425bc38SStefano Zampini       aux_local_numbering_1[partial_sum] = i;
14353425bc38SStefano Zampini       aux_local_numbering_2[partial_sum] = (PetscMPIInt)n_lambda_for_dof;
14363425bc38SStefano Zampini       partial_sum++;
14373425bc38SStefano Zampini     }
14383425bc38SStefano Zampini   }
14393425bc38SStefano Zampini   /*printf("I found %d local lambda dofs\n",n_local_lambda);
14403425bc38SStefano Zampini   printf("I found %d boundary dofs (should be %d)\n",n_boundary_dofs,pcis->n_B);
14413425bc38SStefano Zampini   printf("Partial sum %d should be %d\n",partial_sum,dual_size);*/
14423425bc38SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
14433425bc38SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
14443425bc38SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
14453425bc38SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
14463425bc38SStefano Zampini   ierr = VecSum(pcis->vec1_global,&scalar_value);CHKERRQ(ierr);
14473425bc38SStefano Zampini   fetidpmat_ctx->n_lambda = (PetscInt) scalar_value;
14483425bc38SStefano Zampini   /* printf("I found %d global multipliers (%f)\n",fetidpmat_ctx->n_lambda,scalar_value); */
14493425bc38SStefano Zampini   ierr = VecCreate(PETSC_COMM_SELF,&fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
14503425bc38SStefano Zampini   ierr = VecSetSizes(fetidpmat_ctx->lambda_local,n_local_lambda,n_local_lambda);CHKERRQ(ierr);
14513425bc38SStefano Zampini   ierr = VecSetType(fetidpmat_ctx->lambda_local,VECSEQ);CHKERRQ(ierr);
14523425bc38SStefano Zampini   ierr = VecCreate(comm,&lambda_global);CHKERRQ(ierr);
14533425bc38SStefano Zampini   ierr = VecSetSizes(lambda_global,PETSC_DECIDE,fetidpmat_ctx->n_lambda);CHKERRQ(ierr);
14543425bc38SStefano Zampini   ierr = VecSetType(lambda_global,VECMPI);CHKERRQ(ierr);
14553425bc38SStefano Zampini 
14563425bc38SStefano Zampini   /* compute global ordering of lagrange multipliers and associate l2g map */
14573425bc38SStefano Zampini 
14583425bc38SStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*aux_global_numbering),&aux_global_numbering);CHKERRQ(ierr);
14593425bc38SStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*aux_global_numbering_mpi),&aux_global_numbering_mpi);CHKERRQ(ierr);
14603425bc38SStefano Zampini   j = (rank == 0 ? nprocs : 0);
14613425bc38SStefano Zampini   ierr = PetscMalloc(j*sizeof(*dof_sizes),&dof_sizes);CHKERRQ(ierr);
14623425bc38SStefano Zampini   ierr = PetscMalloc(j*sizeof(*dof_displs),&dof_displs);CHKERRQ(ierr);
14633425bc38SStefano Zampini   ierr = ISLocalToGlobalMappingApply(matis->mapping,dual_size,aux_local_numbering_1,aux_global_numbering);CHKERRQ(ierr);
14643425bc38SStefano Zampini   ierr = MPI_Gather(&dual_size,1,MPIU_INT,dof_sizes,1,MPIU_INT,0,comm);CHKERRQ(ierr);
14653425bc38SStefano Zampini   sum_dof_sizes=0;
14663425bc38SStefano Zampini   if ( rank == 0 ) {
14673425bc38SStefano Zampini     dof_displs[0]=0;
14683425bc38SStefano Zampini     sum_dof_sizes=dual_size;
14693425bc38SStefano Zampini     for (i=1;i<nprocs;i++) {
14703425bc38SStefano Zampini       dof_displs[i] = dof_displs[i-1]+dof_sizes[i-1];
14713425bc38SStefano Zampini       sum_dof_sizes += dof_sizes[i];
14723425bc38SStefano Zampini     }
14733425bc38SStefano Zampini   }
14743425bc38SStefano Zampini   for (i=0;i<dual_size;i++) {
14753425bc38SStefano Zampini     aux_global_numbering_mpi[i]=(PetscMPIInt)aux_global_numbering[i];
14763425bc38SStefano Zampini   }
14773425bc38SStefano Zampini   ierr = PetscMalloc(sum_dof_sizes*sizeof(*all_aux_global_numbering_mpi_1),&all_aux_global_numbering_mpi_1);CHKERRQ(ierr);
14783425bc38SStefano Zampini   ierr = PetscMalloc(sum_dof_sizes*sizeof(*all_aux_global_numbering_mpi_2),&all_aux_global_numbering_mpi_2);CHKERRQ(ierr);
14793425bc38SStefano Zampini   ierr = MPI_Gatherv(aux_global_numbering_mpi,dual_size,MPIU_INT,all_aux_global_numbering_mpi_1,dof_sizes,dof_displs,MPIU_INT,0,comm);CHKERRQ(ierr);
14803425bc38SStefano Zampini   ierr = MPI_Gatherv(aux_local_numbering_2,dual_size,MPIU_INT,all_aux_global_numbering_mpi_2,dof_sizes,dof_displs,MPIU_INT,0,comm);CHKERRQ(ierr);
14813425bc38SStefano Zampini 
14823425bc38SStefano Zampini   ierr = PetscMalloc(fetidpmat_ctx->n_lambda*sizeof(*global_dofs_numbering),&global_dofs_numbering);CHKERRQ(ierr);
14833425bc38SStefano Zampini   if ( rank == 0 ) {
14843425bc38SStefano Zampini     ierr = PetscSortMPIIntWithArray(sum_dof_sizes,all_aux_global_numbering_mpi_1,all_aux_global_numbering_mpi_2);CHKERRQ(ierr);
14853425bc38SStefano Zampini     j=-1;
14863425bc38SStefano Zampini     partial_sum = 0;
14873425bc38SStefano Zampini     for (i=0;i<sum_dof_sizes;i++) {
14883425bc38SStefano Zampini       if (j != all_aux_global_numbering_mpi_1[i] ) {
14893425bc38SStefano Zampini         j=all_aux_global_numbering_mpi_1[i];
14903425bc38SStefano Zampini         for (k=0;k<all_aux_global_numbering_mpi_2[i];k++) {
14913425bc38SStefano Zampini           global_dofs_numbering[partial_sum+k]=all_aux_global_numbering_mpi_1[i];
14923425bc38SStefano Zampini         }
14933425bc38SStefano Zampini         partial_sum += all_aux_global_numbering_mpi_2[i];
14943425bc38SStefano Zampini       }
14953425bc38SStefano Zampini     }
14963425bc38SStefano Zampini     /* printf("Partial sum for global dofs %d should be %d\n",partial_sum,fetidpmat_ctx->n_lambda); */
14973425bc38SStefano Zampini   }
14983425bc38SStefano Zampini   ierr = MPI_Bcast(global_dofs_numbering,fetidpmat_ctx->n_lambda,MPIU_INT,0,comm);CHKERRQ(ierr);
14993425bc38SStefano Zampini 
15003425bc38SStefano Zampini   /* init data for scaling factors exchange */
15013425bc38SStefano Zampini   partial_sum = 0;
15023425bc38SStefano Zampini   j = 0;
15033425bc38SStefano Zampini   ierr = PetscMalloc( pcis->n_neigh*sizeof(PetscInt),&ptrs_buffer);CHKERRQ(ierr);
15043425bc38SStefano Zampini   ierr = PetscMalloc( (pcis->n_neigh-1)*sizeof(MPI_Request),&send_reqs);CHKERRQ(ierr);
15053425bc38SStefano Zampini   ierr = PetscMalloc( (pcis->n_neigh-1)*sizeof(MPI_Request),&recv_reqs);CHKERRQ(ierr);
15063425bc38SStefano Zampini   ierr = PetscMalloc( pcis->n*sizeof(PetscScalar*),&all_factors);CHKERRQ(ierr);
15073425bc38SStefano Zampini   ptrs_buffer[0]=0;
15083425bc38SStefano Zampini   for (i=1;i<pcis->n_neigh;i++) {
15093425bc38SStefano Zampini     partial_sum += pcis->n_shared[i];
15103425bc38SStefano Zampini     ptrs_buffer[i] = ptrs_buffer[i-1]+pcis->n_shared[i];
15113425bc38SStefano Zampini   }
15123425bc38SStefano Zampini   ierr = PetscMalloc( partial_sum*sizeof(PetscScalar),&send_buffer);CHKERRQ(ierr);
15133425bc38SStefano Zampini   ierr = PetscMalloc( partial_sum*sizeof(PetscScalar),&recv_buffer);CHKERRQ(ierr);
15143425bc38SStefano Zampini   ierr = PetscMalloc( partial_sum*sizeof(PetscScalar),&all_factors[0]);CHKERRQ(ierr);
15153425bc38SStefano Zampini   for (i=0;i<pcis->n-1;i++) {
15163425bc38SStefano Zampini     j = mat_graph->count[i];
15173425bc38SStefano Zampini     if (j>0) {
15183425bc38SStefano Zampini       k = (mat_graph->neighbours_set[i][0] == -1 ?  1 : 0);
15193425bc38SStefano Zampini       j = j - k;
15203425bc38SStefano Zampini     }
15213425bc38SStefano Zampini     all_factors[i+1]=all_factors[i]+j;
15223425bc38SStefano Zampini   }
15233425bc38SStefano Zampini   /* scatter B scaling to N vec */
15243425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->N_to_B,pcis->D,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
15253425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->N_to_B,pcis->D,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
15263425bc38SStefano Zampini   /* communications */
15273425bc38SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
15283425bc38SStefano Zampini   for (i=1;i<pcis->n_neigh;i++) {
15293425bc38SStefano Zampini     for (j=0;j<pcis->n_shared[i];j++) {
15303425bc38SStefano Zampini       send_buffer[ptrs_buffer[i-1]+j]=array[pcis->shared[i][j]];
15313425bc38SStefano Zampini     }
15323425bc38SStefano Zampini     j = ptrs_buffer[i]-ptrs_buffer[i-1];
1533ea7e1babSStefano Zampini     ierr = MPI_Isend(&send_buffer[ptrs_buffer[i-1]],j,MPIU_SCALAR,pcis->neigh[i],0,comm,&send_reqs[i-1]);CHKERRQ(ierr);
1534ea7e1babSStefano Zampini     ierr = MPI_Irecv(&recv_buffer[ptrs_buffer[i-1]],j,MPIU_SCALAR,pcis->neigh[i],0,comm,&recv_reqs[i-1]);CHKERRQ(ierr);
15353425bc38SStefano Zampini   }
15363425bc38SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1537ea7e1babSStefano Zampini   ierr = MPI_Waitall((pcis->n_neigh-1),recv_reqs,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
15383425bc38SStefano Zampini   /* put values in correct places */
15393425bc38SStefano Zampini   for (i=1;i<pcis->n_neigh;i++) {
15403425bc38SStefano Zampini     for (j=0;j<pcis->n_shared[i];j++) {
15413425bc38SStefano Zampini       k = pcis->shared[i][j];
15423425bc38SStefano Zampini       neigh_position = 0;
15433425bc38SStefano Zampini       while(mat_graph->neighbours_set[k][neigh_position] != pcis->neigh[i]) {neigh_position++;}
15443425bc38SStefano Zampini       s = (mat_graph->neighbours_set[k][0] == -1 ?  1 : 0);
15453425bc38SStefano Zampini       neigh_position = neigh_position - s;
15463425bc38SStefano Zampini       all_factors[k][neigh_position]=recv_buffer[ptrs_buffer[i-1]+j];
15473425bc38SStefano Zampini     }
15483425bc38SStefano Zampini   }
1549ea7e1babSStefano Zampini   ierr = MPI_Waitall((pcis->n_neigh-1),send_reqs,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
15503425bc38SStefano Zampini   ierr = PetscFree(send_reqs);CHKERRQ(ierr);
15513425bc38SStefano Zampini   ierr = PetscFree(recv_reqs);CHKERRQ(ierr);
15523425bc38SStefano Zampini   ierr = PetscFree(send_buffer);CHKERRQ(ierr);
15533425bc38SStefano Zampini   ierr = PetscFree(recv_buffer);CHKERRQ(ierr);
15543425bc38SStefano Zampini   ierr = PetscFree(ptrs_buffer);CHKERRQ(ierr);
15553425bc38SStefano Zampini 
15563425bc38SStefano Zampini   /* Compute B and B_delta (local actions) */
15573425bc38SStefano Zampini   ierr = PetscMalloc(pcis->n_neigh*sizeof(*aux_sums),&aux_sums);CHKERRQ(ierr);
15583425bc38SStefano Zampini   ierr = PetscMalloc(n_local_lambda*sizeof(*l2g_indices),&l2g_indices);CHKERRQ(ierr);
15593425bc38SStefano Zampini   ierr = PetscMalloc(n_local_lambda*sizeof(*vals_B_delta),&vals_B_delta);CHKERRQ(ierr);
15603425bc38SStefano Zampini   ierr = PetscMalloc(n_local_lambda*sizeof(*cols_B_delta),&cols_B_delta);CHKERRQ(ierr);
15613425bc38SStefano Zampini   ierr = PetscMalloc(n_local_lambda*sizeof(*scaling_factors),&scaling_factors);CHKERRQ(ierr);
15623425bc38SStefano Zampini   n_global_lambda=0;
15633425bc38SStefano Zampini   partial_sum=0;
15643425bc38SStefano Zampini   for (i=0;i<dual_size;i++) {
15653425bc38SStefano Zampini     while( global_dofs_numbering[n_global_lambda] != aux_global_numbering_mpi[i] ) { n_global_lambda++; }
15663425bc38SStefano Zampini     j = mat_graph->count[aux_local_numbering_1[i]];
15673425bc38SStefano Zampini     k = (mat_graph->neighbours_set[aux_local_numbering_1[i]][0] == -1 ?  1 : 0);
15683425bc38SStefano Zampini     j = j - k;
15693425bc38SStefano Zampini     aux_sums[0]=0;
15703425bc38SStefano Zampini     for (s=1;s<j;s++) {
15713425bc38SStefano Zampini       aux_sums[s]=aux_sums[s-1]+j-s+1;
15723425bc38SStefano Zampini     }
15733425bc38SStefano Zampini     array = all_factors[aux_local_numbering_1[i]];
15743425bc38SStefano Zampini     n_neg_values = 0;
15753425bc38SStefano Zampini     while(n_neg_values < j && mat_graph->neighbours_set[aux_local_numbering_1[i]][n_neg_values+k] < rank) {n_neg_values++;}
15763425bc38SStefano Zampini     n_pos_values = j - n_neg_values;
15773425bc38SStefano Zampini     if (fully_redundant) {
15783425bc38SStefano Zampini       for (s=0;s<n_neg_values;s++) {
15793425bc38SStefano Zampini         l2g_indices    [partial_sum+s]=aux_sums[s]+n_neg_values-s-1+n_global_lambda;
15803425bc38SStefano Zampini         cols_B_delta   [partial_sum+s]=dual_dofs_boundary_indices[i];
15813425bc38SStefano Zampini         vals_B_delta   [partial_sum+s]=-1.0;
15823425bc38SStefano Zampini         scaling_factors[partial_sum+s]=array[s];
15833425bc38SStefano Zampini       }
15843425bc38SStefano Zampini       for (s=0;s<n_pos_values;s++) {
15853425bc38SStefano Zampini         l2g_indices    [partial_sum+s+n_neg_values]=aux_sums[n_neg_values]+s+n_global_lambda;
15863425bc38SStefano Zampini         cols_B_delta   [partial_sum+s+n_neg_values]=dual_dofs_boundary_indices[i];
15873425bc38SStefano Zampini         vals_B_delta   [partial_sum+s+n_neg_values]=1.0;
15883425bc38SStefano Zampini         scaling_factors[partial_sum+s+n_neg_values]=array[s+n_neg_values];
15893425bc38SStefano Zampini       }
15903425bc38SStefano Zampini       partial_sum += j;
15913425bc38SStefano Zampini     } else {
15923425bc38SStefano Zampini       /* l2g_indices and default cols and vals of B_delta */
15933425bc38SStefano Zampini       for (s=0;s<j;s++) {
15943425bc38SStefano Zampini         l2g_indices    [partial_sum+s]=n_global_lambda+s;
15953425bc38SStefano Zampini         cols_B_delta   [partial_sum+s]=dual_dofs_boundary_indices[i];
15963425bc38SStefano Zampini         vals_B_delta   [partial_sum+s]=0.0;
15973425bc38SStefano Zampini       }
15983425bc38SStefano Zampini       /* B_delta */
15993425bc38SStefano Zampini       if ( n_neg_values > 0 ) { /* there's a rank next to me to the left */
16003425bc38SStefano Zampini         vals_B_delta   [partial_sum+n_neg_values-1]=-1.0;
16013425bc38SStefano Zampini       }
16023425bc38SStefano Zampini       if ( n_neg_values < j ) { /* there's a rank next to me to the right */
16033425bc38SStefano Zampini         vals_B_delta   [partial_sum+n_neg_values]=1.0;
16043425bc38SStefano Zampini       }
16053425bc38SStefano Zampini       /* scaling as in Klawonn-Widlund 1999*/
16063425bc38SStefano Zampini       for (s=0;s<n_neg_values;s++) {
16073425bc38SStefano Zampini         scalar_value = 0.0;
16083425bc38SStefano Zampini         for (k=0;k<s+1;k++) {
16093425bc38SStefano Zampini           scalar_value += array[k];
16103425bc38SStefano Zampini         }
16113425bc38SStefano Zampini         scalar_value = -scalar_value;
16123425bc38SStefano Zampini         scaling_factors[partial_sum+s] = scalar_value;
16133425bc38SStefano Zampini       }
16143425bc38SStefano Zampini       for (s=0;s<n_pos_values;s++) {
16153425bc38SStefano Zampini         scalar_value = 0.0;
16163425bc38SStefano Zampini         for (k=s+n_neg_values;k<j;k++) {
16173425bc38SStefano Zampini           scalar_value += array[k];
16183425bc38SStefano Zampini         }
16193425bc38SStefano Zampini         scaling_factors[partial_sum+s+n_neg_values] = scalar_value;
16203425bc38SStefano Zampini       }
16213425bc38SStefano Zampini       partial_sum += j;
16223425bc38SStefano Zampini     }
16233425bc38SStefano Zampini   }
16243425bc38SStefano Zampini   ierr = PetscFree(all_factors[0]);CHKERRQ(ierr);
16253425bc38SStefano Zampini   ierr = PetscFree(all_factors);CHKERRQ(ierr);
16263425bc38SStefano Zampini   /* printf("I found %d local lambda dofs when numbering them (should be %d)\n",partial_sum,n_local_lambda); */
16273425bc38SStefano Zampini   ierr = ISCreateGeneral(comm,n_local_lambda,l2g_indices,PETSC_OWN_POINTER,&IS_l2g_lambda);CHKERRQ(ierr);
16283425bc38SStefano Zampini   ierr = VecScatterCreate(fetidpmat_ctx->lambda_local,(IS)0,lambda_global,IS_l2g_lambda,&fetidpmat_ctx->l2g_lambda);CHKERRQ(ierr);
16293425bc38SStefano Zampini 
16303425bc38SStefano Zampini   /* Create local part of B_delta */
16313425bc38SStefano Zampini   ierr = MatCreate(PETSC_COMM_SELF,&fetidpmat_ctx->B_delta);
16323425bc38SStefano Zampini   ierr = MatSetSizes(fetidpmat_ctx->B_delta,n_local_lambda,pcis->n_B,n_local_lambda,pcis->n_B);CHKERRQ(ierr);
16333425bc38SStefano Zampini   ierr = MatSetType(fetidpmat_ctx->B_delta,MATSEQAIJ);CHKERRQ(ierr);
16343425bc38SStefano Zampini   ierr = MatSeqAIJSetPreallocation(fetidpmat_ctx->B_delta,1,PETSC_NULL);CHKERRQ(ierr);
16353425bc38SStefano Zampini   ierr = MatSetOption(fetidpmat_ctx->B_delta,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr);
16363425bc38SStefano Zampini   for (i=0;i<n_local_lambda;i++) {
16373425bc38SStefano Zampini     ierr = MatSetValue(fetidpmat_ctx->B_delta,i,cols_B_delta[i],vals_B_delta[i],INSERT_VALUES);CHKERRQ(ierr);
16383425bc38SStefano Zampini   }
16393425bc38SStefano Zampini   ierr = MatAssemblyBegin(fetidpmat_ctx->B_delta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
16403425bc38SStefano Zampini   ierr = MatAssemblyEnd  (fetidpmat_ctx->B_delta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
16413425bc38SStefano Zampini 
16423425bc38SStefano Zampini   if (fully_redundant) {
16433425bc38SStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&ScalingMat);
16443425bc38SStefano Zampini     ierr = MatSetSizes(ScalingMat,n_local_lambda,n_local_lambda,n_local_lambda,n_local_lambda);CHKERRQ(ierr);
16453425bc38SStefano Zampini     ierr = MatSetType(ScalingMat,MATSEQAIJ);CHKERRQ(ierr);
16463425bc38SStefano Zampini     ierr = MatSeqAIJSetPreallocation(ScalingMat,1,PETSC_NULL);CHKERRQ(ierr);
16473425bc38SStefano Zampini     for (i=0;i<n_local_lambda;i++) {
16483425bc38SStefano Zampini       ierr = MatSetValue(ScalingMat,i,i,scaling_factors[i],INSERT_VALUES);CHKERRQ(ierr);
16493425bc38SStefano Zampini     }
16503425bc38SStefano Zampini     ierr = MatAssemblyBegin(ScalingMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
16513425bc38SStefano Zampini     ierr = MatAssemblyEnd  (ScalingMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
16523425bc38SStefano Zampini     ierr = MatMatMult(ScalingMat,fetidpmat_ctx->B_delta,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&fetidpmat_ctx->B_Ddelta);CHKERRQ(ierr);
16533425bc38SStefano Zampini     ierr = MatDestroy(&ScalingMat);CHKERRQ(ierr);
16543425bc38SStefano Zampini   } else {
16553425bc38SStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&fetidpmat_ctx->B_Ddelta);
16563425bc38SStefano Zampini     ierr = MatSetSizes(fetidpmat_ctx->B_Ddelta,n_local_lambda,pcis->n_B,n_local_lambda,pcis->n_B);CHKERRQ(ierr);
16573425bc38SStefano Zampini     ierr = MatSetType(fetidpmat_ctx->B_Ddelta,MATSEQAIJ);CHKERRQ(ierr);
16583425bc38SStefano Zampini     ierr = MatSeqAIJSetPreallocation(fetidpmat_ctx->B_Ddelta,1,PETSC_NULL);CHKERRQ(ierr);
16593425bc38SStefano Zampini     for (i=0;i<n_local_lambda;i++) {
16603425bc38SStefano Zampini       ierr = MatSetValue(fetidpmat_ctx->B_Ddelta,i,cols_B_delta[i],scaling_factors[i],INSERT_VALUES);CHKERRQ(ierr);
16613425bc38SStefano Zampini     }
16623425bc38SStefano Zampini     ierr = MatAssemblyBegin(fetidpmat_ctx->B_Ddelta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
16633425bc38SStefano Zampini     ierr = MatAssemblyEnd  (fetidpmat_ctx->B_Ddelta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
16643425bc38SStefano Zampini   }
16653425bc38SStefano Zampini 
16663425bc38SStefano Zampini   /* Create some vectors needed by fetidp */
16673425bc38SStefano Zampini   ierr = VecDuplicate(pcis->vec1_B,&fetidpmat_ctx->temp_solution_B);CHKERRQ(ierr);
16683425bc38SStefano Zampini   ierr = VecDuplicate(pcis->vec1_D,&fetidpmat_ctx->temp_solution_D);CHKERRQ(ierr);
16693425bc38SStefano Zampini 
16703425bc38SStefano Zampini   test_fetidp = PETSC_FALSE;
16713425bc38SStefano Zampini   ierr = PetscOptionsGetBool(PETSC_NULL,"-fetidp_check",&test_fetidp,PETSC_NULL);CHKERRQ(ierr);
16723425bc38SStefano Zampini 
16733425bc38SStefano Zampini   if (test_fetidp) {
16743425bc38SStefano Zampini 
16753425bc38SStefano Zampini     ierr = PetscViewerASCIIGetStdout(((PetscObject)(fetidpmat_ctx->pc))->comm,&viewer);CHKERRQ(ierr);
16763425bc38SStefano Zampini     ierr = PetscViewerASCIISynchronizedAllow(viewer,PETSC_TRUE);CHKERRQ(ierr);
16773425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"----------FETI_DP TESTS--------------\n");CHKERRQ(ierr);
16783425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"All tests should return zero!\n");CHKERRQ(ierr);
16793425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"FETIDP MAT context in the ");CHKERRQ(ierr);
16803425bc38SStefano Zampini     if (fully_redundant) {
16813425bc38SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"fully redundant case for lagrange multipliers.\n");CHKERRQ(ierr);
16823425bc38SStefano Zampini     } else {
16833425bc38SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Non-fully redundant case for lagrange multiplier.\n");CHKERRQ(ierr);
16843425bc38SStefano Zampini     }
16853425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
16863425bc38SStefano Zampini 
16873425bc38SStefano Zampini     /******************************************************************/
16883425bc38SStefano Zampini     /* TEST A/B: Test numbering of global lambda dofs             */
16893425bc38SStefano Zampini     /******************************************************************/
16903425bc38SStefano Zampini 
16913425bc38SStefano Zampini     ierr = VecDuplicate(fetidpmat_ctx->lambda_local,&test_vec);CHKERRQ(ierr);
16923425bc38SStefano Zampini     ierr = VecSet(lambda_global,1.0);CHKERRQ(ierr);
16933425bc38SStefano Zampini     ierr = VecSet(test_vec,1.0);CHKERRQ(ierr);
16943425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
16953425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
16963425bc38SStefano Zampini     scalar_value = -1.0;
16973425bc38SStefano Zampini     ierr = VecAXPY(test_vec,scalar_value,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
16983425bc38SStefano Zampini     ierr = VecNorm(test_vec,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
16993425bc38SStefano Zampini     ierr = VecDestroy(&test_vec);CHKERRQ(ierr);
17003425bc38SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"A[%04d]: CHECK glob to loc: % 1.14e\n",rank,scalar_value);CHKERRQ(ierr);
17013425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
17023425bc38SStefano Zampini     if (fully_redundant) {
17033425bc38SStefano Zampini       ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr);
17043425bc38SStefano Zampini       ierr = VecSet(fetidpmat_ctx->lambda_local,0.5);CHKERRQ(ierr);
17053425bc38SStefano Zampini       ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
17063425bc38SStefano Zampini       ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
17073425bc38SStefano Zampini       ierr = VecSum(lambda_global,&scalar_value);CHKERRQ(ierr);
17083425bc38SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"B[%04d]: CHECK loc to glob: % 1.14e\n",rank,scalar_value-fetidpmat_ctx->n_lambda);CHKERRQ(ierr);
17093425bc38SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
17103425bc38SStefano Zampini     }
17113425bc38SStefano Zampini 
17123425bc38SStefano Zampini     /******************************************************************/
17133425bc38SStefano Zampini     /* TEST C: It should holds B_delta*w=0, w\in\widehat{W}           */
17143425bc38SStefano Zampini     /* This is the meaning of the B matrix                            */
17153425bc38SStefano Zampini     /******************************************************************/
17163425bc38SStefano Zampini 
17173425bc38SStefano Zampini     ierr = VecSetRandom(pcis->vec1_N,PETSC_NULL);CHKERRQ(ierr);
17183425bc38SStefano Zampini     ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
17193425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
17203425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
17213425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
17223425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
17233425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
17243425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
17253425bc38SStefano Zampini     /* Action of B_delta */
17263425bc38SStefano Zampini     ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
17273425bc38SStefano Zampini     ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr);
17283425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
17293425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
17303425bc38SStefano Zampini     ierr = VecNorm(lambda_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
17313425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"C[coll]: CHECK infty norm of B_delta*w (w continuous): % 1.14e\n",scalar_value);CHKERRQ(ierr);
17323425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
17333425bc38SStefano Zampini 
17343425bc38SStefano Zampini     /******************************************************************/
17353425bc38SStefano Zampini     /* TEST D: It should holds E_Dw = w - P_Dw w\in\widetilde{W}     */
17363425bc38SStefano Zampini     /* E_D = R_D^TR                                                   */
17373425bc38SStefano Zampini     /* P_D = B_{D,delta}^T B_{delta}                                  */
17383425bc38SStefano Zampini     /* eq.44 Mandel Tezaur and Dohrmann 2005                          */
17393425bc38SStefano Zampini     /******************************************************************/
17403425bc38SStefano Zampini 
17413425bc38SStefano Zampini     /* compute a random vector in \widetilde{W} */
17423425bc38SStefano Zampini     ierr = VecSetRandom(pcis->vec1_N,PETSC_NULL);CHKERRQ(ierr);
17433425bc38SStefano Zampini     scalar_value = 0.0;  /* set zero at vertices */
17443425bc38SStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
17453425bc38SStefano Zampini     for (i=0;i<n_vertices;i++) { array[vertex_indices[i]]=scalar_value; }
17463425bc38SStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
17473425bc38SStefano Zampini     /* store w for final comparison */
17483425bc38SStefano Zampini     ierr = VecDuplicate(pcis->vec1_B,&test_vec);CHKERRQ(ierr);
17493425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,test_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
17503425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,test_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
17513425bc38SStefano Zampini 
17523425bc38SStefano Zampini     /* Jump operator P_D : results stored in pcis->vec1_B */
17533425bc38SStefano Zampini 
17543425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
17553425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
17563425bc38SStefano Zampini     /* Action of B_delta */
17573425bc38SStefano Zampini     ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
17583425bc38SStefano Zampini     ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr);
17593425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
17603425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
17613425bc38SStefano Zampini     /* Action of B_Ddelta^T */
17623425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
17633425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
17643425bc38SStefano Zampini     ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
17653425bc38SStefano Zampini 
17663425bc38SStefano Zampini     /* Average operator E_D : results stored in pcis->vec2_B */
17673425bc38SStefano Zampini 
17683425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
17693425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
17703425bc38SStefano Zampini     ierr = VecPointwiseMult(pcis->vec2_B,pcis->D,pcis->vec2_B);CHKERRQ(ierr);
17713425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec2_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
17723425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec2_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
17733425bc38SStefano Zampini     ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
17743425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
17753425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
17763425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
17773425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
17783425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
17793425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
17803425bc38SStefano Zampini 
17813425bc38SStefano Zampini     /* test E_D=I-P_D */
17823425bc38SStefano Zampini     scalar_value = 1.0;
17833425bc38SStefano Zampini     ierr = VecAXPY(pcis->vec1_B,scalar_value,pcis->vec2_B);CHKERRQ(ierr);
17843425bc38SStefano Zampini     scalar_value = -1.0;
17853425bc38SStefano Zampini     ierr = VecAXPY(pcis->vec1_B,scalar_value,test_vec);CHKERRQ(ierr);
17863425bc38SStefano Zampini     ierr = VecNorm(pcis->vec1_B,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
17873425bc38SStefano Zampini     ierr = VecDestroy(&test_vec);CHKERRQ(ierr);
17883425bc38SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"D[%04d] CHECK infty norm of E_D + P_D - I: % 1.14e\n",rank,scalar_value);CHKERRQ(ierr);
17893425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
17903425bc38SStefano Zampini 
17913425bc38SStefano Zampini     /******************************************************************/
17923425bc38SStefano Zampini     /* TEST E: It should holds R_D^TP_Dw=0 w\in\widetilde{W}          */
17933425bc38SStefano Zampini     /* eq.48 Mandel Tezaur and Dohrmann 2005                          */
17943425bc38SStefano Zampini     /******************************************************************/
17953425bc38SStefano Zampini 
17963425bc38SStefano Zampini     ierr = VecSetRandom(pcis->vec1_N,PETSC_NULL);CHKERRQ(ierr);
17973425bc38SStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
17983425bc38SStefano Zampini     scalar_value = 0.0;  /* set zero at vertices */
17993425bc38SStefano Zampini     for (i=0;i<n_vertices;i++) { array[vertex_indices[i]]=scalar_value; }
18003425bc38SStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
18013425bc38SStefano Zampini 
18023425bc38SStefano Zampini     /* Jump operator P_D : results stored in pcis->vec1_B */
18033425bc38SStefano Zampini 
18043425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18053425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18063425bc38SStefano Zampini     /* Action of B_delta */
18073425bc38SStefano Zampini     ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
18083425bc38SStefano Zampini     ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr);
18093425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18103425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18113425bc38SStefano Zampini     /* Action of B_Ddelta^T */
18123425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18133425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18143425bc38SStefano Zampini     ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
18153425bc38SStefano Zampini     /* diagonal scaling */
18163425bc38SStefano Zampini     ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr);
18173425bc38SStefano Zampini     /* sum on the interface */
18183425bc38SStefano Zampini     ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
18193425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18203425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18213425bc38SStefano Zampini     ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
18223425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18233425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18243425bc38SStefano Zampini     ierr = VecNorm(pcis->vec1_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
18253425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"E[coll]: CHECK infty norm of R^T_D P_D: % 1.14e\n",scalar_value);CHKERRQ(ierr);
18263425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
18273425bc38SStefano Zampini 
18283425bc38SStefano Zampini     if (!fully_redundant) {
18293425bc38SStefano Zampini       /******************************************************************/
18303425bc38SStefano Zampini       /* TEST F: It should holds B_{delta}B^T_{D,delta}=I               */
18313425bc38SStefano Zampini       /* Corollary thm 14 Mandel Tezaur and Dohrmann 2005               */
18323425bc38SStefano Zampini       /******************************************************************/
18333425bc38SStefano Zampini       ierr = VecDuplicate(lambda_global,&test_vec);CHKERRQ(ierr);
18343425bc38SStefano Zampini       ierr = VecSetRandom(lambda_global,PETSC_NULL);CHKERRQ(ierr);
18353425bc38SStefano Zampini       /* Action of B_Ddelta^T */
18363425bc38SStefano Zampini       ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18373425bc38SStefano Zampini       ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18383425bc38SStefano Zampini       ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
18393425bc38SStefano Zampini       /* Action of B_delta */
18403425bc38SStefano Zampini       ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
18413425bc38SStefano Zampini       ierr = VecSet(test_vec,0.0);CHKERRQ(ierr);
18423425bc38SStefano Zampini       ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,test_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18433425bc38SStefano Zampini       ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,test_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18443425bc38SStefano Zampini       scalar_value = -1.0;
18453425bc38SStefano Zampini       ierr = VecAXPY(lambda_global,scalar_value,test_vec);CHKERRQ(ierr);
18463425bc38SStefano Zampini       ierr = VecNorm(lambda_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
18473425bc38SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"E[coll]: CHECK infty norm of P^T_D - I: % 1.14e\n",scalar_value);CHKERRQ(ierr);
18483425bc38SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
18493425bc38SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
18503425bc38SStefano Zampini       ierr = VecDestroy(&test_vec);CHKERRQ(ierr);
18513425bc38SStefano Zampini     }
18523425bc38SStefano Zampini   }
18533425bc38SStefano Zampini   /* final cleanup */
18543425bc38SStefano Zampini   ierr = PetscFree(dual_dofs_boundary_indices);CHKERRQ(ierr);
18553425bc38SStefano Zampini   ierr = PetscFree(vertex_indices);CHKERRQ(ierr);
18563425bc38SStefano Zampini   ierr = PetscFree(aux_local_numbering_1);CHKERRQ(ierr);
18573425bc38SStefano Zampini   ierr = PetscFree(aux_local_numbering_2);CHKERRQ(ierr);
18583425bc38SStefano Zampini   ierr = PetscFree(aux_global_numbering);CHKERRQ(ierr);
18593425bc38SStefano Zampini   ierr = PetscFree(aux_global_numbering_mpi);CHKERRQ(ierr);
18603425bc38SStefano Zampini   ierr = PetscFree(dof_sizes);CHKERRQ(ierr);
18613425bc38SStefano Zampini   ierr = PetscFree(dof_displs);CHKERRQ(ierr);
18623425bc38SStefano Zampini   ierr = PetscFree(all_aux_global_numbering_mpi_1);CHKERRQ(ierr);
18633425bc38SStefano Zampini   ierr = PetscFree(all_aux_global_numbering_mpi_2);CHKERRQ(ierr);
18643425bc38SStefano Zampini   ierr = PetscFree(global_dofs_numbering);CHKERRQ(ierr);
18653425bc38SStefano Zampini   ierr = PetscFree(aux_sums);CHKERRQ(ierr);
18663425bc38SStefano Zampini   ierr = PetscFree(cols_B_delta);CHKERRQ(ierr);
18673425bc38SStefano Zampini   ierr = PetscFree(vals_B_delta);CHKERRQ(ierr);
18683425bc38SStefano Zampini   ierr = PetscFree(scaling_factors);CHKERRQ(ierr);
18693425bc38SStefano Zampini   ierr = VecDestroy(&lambda_global);CHKERRQ(ierr);
18703425bc38SStefano Zampini   ierr = ISDestroy(&IS_l2g_lambda);CHKERRQ(ierr);
18713425bc38SStefano Zampini 
18723425bc38SStefano Zampini   PetscFunctionReturn(0);
18733425bc38SStefano Zampini }
18743425bc38SStefano Zampini 
18753425bc38SStefano Zampini #undef __FUNCT__
18763425bc38SStefano Zampini #define __FUNCT__ "PCBDDCSetupFETIDPPCContext"
18773425bc38SStefano Zampini static PetscErrorCode PCBDDCSetupFETIDPPCContext(Mat fetimat, FETIDPPC_ctx *fetidppc_ctx)
18783425bc38SStefano Zampini {
18793425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
18803425bc38SStefano Zampini   PetscErrorCode ierr;
18813425bc38SStefano Zampini 
18823425bc38SStefano Zampini   PetscFunctionBegin;
18833425bc38SStefano Zampini   ierr = MatShellGetContext(fetimat,&mat_ctx);CHKERRQ(ierr);
18843425bc38SStefano Zampini   /* get references from objects created when setting up feti mat context */
18853425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)mat_ctx->lambda_local);CHKERRQ(ierr);
18863425bc38SStefano Zampini   fetidppc_ctx->lambda_local = mat_ctx->lambda_local;
18873425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)mat_ctx->B_Ddelta);CHKERRQ(ierr);
18883425bc38SStefano Zampini   fetidppc_ctx->B_Ddelta = mat_ctx->B_Ddelta;
18893425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)mat_ctx->l2g_lambda);CHKERRQ(ierr);
18903425bc38SStefano Zampini   fetidppc_ctx->l2g_lambda = mat_ctx->l2g_lambda;
18913425bc38SStefano Zampini   PetscFunctionReturn(0);
18923425bc38SStefano Zampini }
18933425bc38SStefano Zampini 
18943425bc38SStefano Zampini #undef __FUNCT__
18953425bc38SStefano Zampini #define __FUNCT__ "FETIDPMatMult"
18963425bc38SStefano Zampini static PetscErrorCode FETIDPMatMult(Mat fetimat, Vec x, Vec y)
18973425bc38SStefano Zampini {
18983425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
18993425bc38SStefano Zampini   PC_IS          *pcis;
19003425bc38SStefano Zampini   PetscErrorCode ierr;
19013425bc38SStefano Zampini 
19023425bc38SStefano Zampini   PetscFunctionBegin;
19033425bc38SStefano Zampini   ierr = MatShellGetContext(fetimat,&mat_ctx);CHKERRQ(ierr);
19043425bc38SStefano Zampini   pcis = (PC_IS*)mat_ctx->pc->data;
19053425bc38SStefano Zampini   /* Application of B_delta^T */
19063425bc38SStefano Zampini   ierr = VecScatterBegin(mat_ctx->l2g_lambda,x,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
19073425bc38SStefano Zampini   ierr = VecScatterEnd(mat_ctx->l2g_lambda,x,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
19083425bc38SStefano Zampini   ierr = MatMultTranspose(mat_ctx->B_delta,mat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
19093425bc38SStefano Zampini   /* Application of \widetilde{S}^-1 */
19103425bc38SStefano Zampini   ierr = VecSet(pcis->vec1_D,0.0);CHKERRQ(ierr);
19113425bc38SStefano Zampini   ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr);
19123425bc38SStefano Zampini   /* Application of B_delta */
19133425bc38SStefano Zampini   ierr = MatMult(mat_ctx->B_delta,pcis->vec1_B,mat_ctx->lambda_local);CHKERRQ(ierr);
19143425bc38SStefano Zampini   ierr = VecSet(y,0.0);CHKERRQ(ierr);
19153425bc38SStefano Zampini   ierr = VecScatterBegin(mat_ctx->l2g_lambda,mat_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
19163425bc38SStefano Zampini   ierr = VecScatterEnd(mat_ctx->l2g_lambda,mat_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
19173425bc38SStefano Zampini   PetscFunctionReturn(0);
19183425bc38SStefano Zampini }
19193425bc38SStefano Zampini 
19203425bc38SStefano Zampini #undef __FUNCT__
19213425bc38SStefano Zampini #define __FUNCT__ "FETIDPPCApply"
19223425bc38SStefano Zampini static PetscErrorCode FETIDPPCApply(PC fetipc, Vec x, Vec y)
19233425bc38SStefano Zampini {
19243425bc38SStefano Zampini   FETIDPPC_ctx   *pc_ctx;
19253425bc38SStefano Zampini   PC_IS          *pcis;
19263425bc38SStefano Zampini   PetscErrorCode ierr;
19273425bc38SStefano Zampini 
19283425bc38SStefano Zampini   PetscFunctionBegin;
19293425bc38SStefano Zampini   ierr = PCShellGetContext(fetipc,(void**)&pc_ctx);
19303425bc38SStefano Zampini   pcis = (PC_IS*)pc_ctx->pc->data;
19313425bc38SStefano Zampini   /* Application of B_Ddelta^T */
19323425bc38SStefano Zampini   ierr = VecScatterBegin(pc_ctx->l2g_lambda,x,pc_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
19333425bc38SStefano Zampini   ierr = VecScatterEnd(pc_ctx->l2g_lambda,x,pc_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
19343425bc38SStefano Zampini   ierr = VecSet(pcis->vec2_B,0.0);CHKERRQ(ierr);
19353425bc38SStefano Zampini   ierr = MatMultTranspose(pc_ctx->B_Ddelta,pc_ctx->lambda_local,pcis->vec2_B);CHKERRQ(ierr);
19363425bc38SStefano Zampini   /* Application of S */
19373425bc38SStefano Zampini   ierr = PCISApplySchur(pc_ctx->pc,pcis->vec2_B,pcis->vec1_B,(Vec)0,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
19383425bc38SStefano Zampini   /* Application of B_Ddelta */
19393425bc38SStefano Zampini   ierr = MatMult(pc_ctx->B_Ddelta,pcis->vec1_B,pc_ctx->lambda_local);CHKERRQ(ierr);
19403425bc38SStefano Zampini   ierr = VecSet(y,0.0);CHKERRQ(ierr);
19413425bc38SStefano Zampini   ierr = VecScatterBegin(pc_ctx->l2g_lambda,pc_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
19423425bc38SStefano Zampini   ierr = VecScatterEnd(pc_ctx->l2g_lambda,pc_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
19433425bc38SStefano Zampini   PetscFunctionReturn(0);
19443425bc38SStefano Zampini }
19453425bc38SStefano Zampini 
1946da1bb401SStefano Zampini #undef __FUNCT__
1947da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetupLocalAdjacencyGraph"
1948da1bb401SStefano Zampini static PetscErrorCode PCBDDCSetupLocalAdjacencyGraph(PC pc)
1949da1bb401SStefano Zampini {
1950da1bb401SStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
1951da1bb401SStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
1952da1bb401SStefano Zampini   PetscInt       nvtxs,*xadj,*adjncy;
1953da1bb401SStefano Zampini   Mat            mat_adj;
1954da1bb401SStefano Zampini   PetscBool      symmetrize_rowij=PETSC_TRUE,compressed_rowij=PETSC_FALSE,flg_row=PETSC_TRUE;
1955da1bb401SStefano Zampini   PCBDDCGraph    mat_graph=pcbddc->mat_graph;
1956da1bb401SStefano Zampini   PetscErrorCode ierr;
1957da1bb401SStefano Zampini 
1958da1bb401SStefano Zampini   PetscFunctionBegin;
1959da1bb401SStefano Zampini   /* get CSR adjacency from local matrix if user has not yet provided local graph using PCBDDCSetLocalAdjacencyGraph function */
1960da1bb401SStefano Zampini   if (!mat_graph->xadj) {
1961da1bb401SStefano Zampini     ierr = MatConvert(matis->A,MATMPIADJ,MAT_INITIAL_MATRIX,&mat_adj);CHKERRQ(ierr);
1962da1bb401SStefano Zampini     ierr = MatGetRowIJ(mat_adj,0,symmetrize_rowij,compressed_rowij,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr);
1963da1bb401SStefano Zampini     if (!flg_row) {
1964da1bb401SStefano Zampini       SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in MatGetRowIJ called in %s\n",__FUNCT__);
1965da1bb401SStefano Zampini     }
1966da1bb401SStefano Zampini     /* Get adjacency into BDDC workspace */
1967da1bb401SStefano Zampini     ierr = PCBDDCSetLocalAdjacencyGraph(pc,nvtxs,xadj,adjncy,PETSC_COPY_VALUES);CHKERRQ(ierr);
1968da1bb401SStefano Zampini     ierr = MatRestoreRowIJ(mat_adj,0,symmetrize_rowij,compressed_rowij,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr);
1969da1bb401SStefano Zampini     if (!flg_row) {
1970da1bb401SStefano Zampini       SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in MatRestoreRowIJ called in %s\n",__FUNCT__);
1971da1bb401SStefano Zampini     }
1972da1bb401SStefano Zampini     ierr = MatDestroy(&mat_adj);CHKERRQ(ierr);
1973da1bb401SStefano Zampini   }
1974da1bb401SStefano Zampini   PetscFunctionReturn(0);
1975da1bb401SStefano Zampini }
1976da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
19770c7d97c5SJed Brown #undef __FUNCT__
19780c7d97c5SJed Brown #define __FUNCT__ "PCBDDCApplyInterfacePreconditioner"
19792617d88aSStefano Zampini static PetscErrorCode  PCBDDCApplyInterfacePreconditioner(PC pc)
19800c7d97c5SJed Brown {
19810c7d97c5SJed Brown   PetscErrorCode ierr;
19820c7d97c5SJed Brown   PC_BDDC*        pcbddc = (PC_BDDC*)(pc->data);
19830c7d97c5SJed Brown   PC_IS*            pcis = (PC_IS*)  (pc->data);
19843b03a366Sstefano_zampini   const PetscScalar zero = 0.0;
19850c7d97c5SJed Brown 
19860c7d97c5SJed Brown   PetscFunctionBegin;
19870c7d97c5SJed Brown   /* Application of PHI^T  */
19880c7d97c5SJed Brown   ierr = MatMultTranspose(pcbddc->coarse_phi_B,pcis->vec1_B,pcbddc->vec1_P);CHKERRQ(ierr);
19890c7d97c5SJed Brown   if (pcbddc->prec_type) { ierr = MatMultTransposeAdd(pcbddc->coarse_phi_D,pcis->vec1_D,pcbddc->vec1_P,pcbddc->vec1_P);CHKERRQ(ierr); }
19900c7d97c5SJed Brown 
19910c7d97c5SJed Brown   /* Scatter data of coarse_rhs */
1992142dfd88SStefano Zampini   if (pcbddc->coarse_rhs) { ierr = VecSet(pcbddc->coarse_rhs,zero);CHKERRQ(ierr); }
19930c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->vec1_P,pcbddc->coarse_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
19940c7d97c5SJed Brown 
19950c7d97c5SJed Brown   /* Local solution on R nodes */
19960c7d97c5SJed Brown   ierr = VecSet(pcbddc->vec1_R,zero);CHKERRQ(ierr);
19970c7d97c5SJed Brown   ierr = VecScatterBegin(pcbddc->R_to_B,pcis->vec1_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
19980c7d97c5SJed Brown   ierr = VecScatterEnd  (pcbddc->R_to_B,pcis->vec1_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
19990c7d97c5SJed Brown   if (pcbddc->prec_type) {
20000c7d97c5SJed Brown     ierr = VecScatterBegin(pcbddc->R_to_D,pcis->vec1_D,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
20010c7d97c5SJed Brown     ierr = VecScatterEnd  (pcbddc->R_to_D,pcis->vec1_D,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
20020c7d97c5SJed Brown   }
20030c7d97c5SJed Brown   ierr = PCBDDCSolveSaddlePoint(pc);CHKERRQ(ierr);
20040c7d97c5SJed Brown   ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr);
20050c7d97c5SJed Brown   ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec2_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20060c7d97c5SJed Brown   ierr = VecScatterEnd  (pcbddc->R_to_B,pcbddc->vec2_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20070c7d97c5SJed Brown   if (pcbddc->prec_type) {
20080c7d97c5SJed Brown     ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec2_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20090c7d97c5SJed Brown     ierr = VecScatterEnd  (pcbddc->R_to_D,pcbddc->vec2_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20100c7d97c5SJed Brown   }
20110c7d97c5SJed Brown 
20120c7d97c5SJed Brown   /* Coarse solution */
20130c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataEnd(pc,pcbddc->vec1_P,pcbddc->coarse_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
2014*0bdf917eSStefano Zampini   if (pcbddc->coarse_rhs) {
2015*0bdf917eSStefano Zampini     if (pcbddc->CoarseNullSpace) {
2016*0bdf917eSStefano Zampini       ierr = MatNullSpaceRemove(pcbddc->CoarseNullSpace,pcbddc->coarse_rhs,PETSC_NULL);CHKERRQ(ierr);
2017*0bdf917eSStefano Zampini     }
2018*0bdf917eSStefano Zampini     ierr = KSPSolve(pcbddc->coarse_ksp,pcbddc->coarse_rhs,pcbddc->coarse_vec);CHKERRQ(ierr);
2019*0bdf917eSStefano Zampini     if (pcbddc->CoarseNullSpace) {
2020*0bdf917eSStefano Zampini       ierr = MatNullSpaceRemove(pcbddc->CoarseNullSpace,pcbddc->coarse_vec,PETSC_NULL);CHKERRQ(ierr);
2021*0bdf917eSStefano Zampini     }
2022*0bdf917eSStefano Zampini   }
20230c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
20240c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataEnd  (pc,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
20250c7d97c5SJed Brown 
20260c7d97c5SJed Brown   /* Sum contributions from two levels */
20270c7d97c5SJed Brown   ierr = MatMultAdd(pcbddc->coarse_phi_B,pcbddc->vec1_P,pcis->vec1_B,pcis->vec1_B);CHKERRQ(ierr);
20280c7d97c5SJed Brown   if (pcbddc->prec_type) { ierr = MatMultAdd(pcbddc->coarse_phi_D,pcbddc->vec1_P,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); }
20290c7d97c5SJed Brown   PetscFunctionReturn(0);
20300c7d97c5SJed Brown }
20310c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
20320c7d97c5SJed Brown #undef __FUNCT__
20330c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSolveSaddlePoint"
203453cdbc3dSStefano Zampini static PetscErrorCode  PCBDDCSolveSaddlePoint(PC pc)
20350c7d97c5SJed Brown {
20360c7d97c5SJed Brown   PetscErrorCode ierr;
20370c7d97c5SJed Brown   PC_BDDC*       pcbddc = (PC_BDDC*)(pc->data);
20380c7d97c5SJed Brown 
20390c7d97c5SJed Brown   PetscFunctionBegin;
204053cdbc3dSStefano Zampini   ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
2041534831adSStefano Zampini   if (pcbddc->local_auxmat1) {
20420c7d97c5SJed Brown     ierr = MatMult(pcbddc->local_auxmat1,pcbddc->vec2_R,pcbddc->vec1_C);CHKERRQ(ierr);
20430c7d97c5SJed Brown     ierr = MatMultAdd(pcbddc->local_auxmat2,pcbddc->vec1_C,pcbddc->vec2_R,pcbddc->vec2_R);CHKERRQ(ierr);
20440c7d97c5SJed Brown   }
20450c7d97c5SJed Brown   PetscFunctionReturn(0);
20460c7d97c5SJed Brown }
20470c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
20480c7d97c5SJed Brown #undef __FUNCT__
20490c7d97c5SJed Brown #define __FUNCT__ "PCBDDCScatterCoarseDataBegin"
205053cdbc3dSStefano Zampini static PetscErrorCode  PCBDDCScatterCoarseDataBegin(PC pc,Vec vec_from, Vec vec_to, InsertMode imode, ScatterMode smode)
20510c7d97c5SJed Brown {
20520c7d97c5SJed Brown   PetscErrorCode ierr;
20530c7d97c5SJed Brown   PC_BDDC*       pcbddc = (PC_BDDC*)(pc->data);
20540c7d97c5SJed Brown 
20550c7d97c5SJed Brown   PetscFunctionBegin;
20560c7d97c5SJed Brown   switch(pcbddc->coarse_communications_type){
20570c7d97c5SJed Brown     case SCATTERS_BDDC:
20580c7d97c5SJed Brown       ierr = VecScatterBegin(pcbddc->coarse_loc_to_glob,vec_from,vec_to,imode,smode);CHKERRQ(ierr);
20590c7d97c5SJed Brown       break;
20600c7d97c5SJed Brown     case GATHERS_BDDC:
20610c7d97c5SJed Brown       break;
20620c7d97c5SJed Brown   }
20630c7d97c5SJed Brown   PetscFunctionReturn(0);
20640c7d97c5SJed Brown }
20650c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
20660c7d97c5SJed Brown #undef __FUNCT__
20670c7d97c5SJed Brown #define __FUNCT__ "PCBDDCScatterCoarseDataEnd"
206853cdbc3dSStefano Zampini static PetscErrorCode  PCBDDCScatterCoarseDataEnd(PC pc,Vec vec_from, Vec vec_to, InsertMode imode, ScatterMode smode)
20690c7d97c5SJed Brown {
20700c7d97c5SJed Brown   PetscErrorCode ierr;
20710c7d97c5SJed Brown   PC_BDDC*       pcbddc = (PC_BDDC*)(pc->data);
20720c7d97c5SJed Brown   PetscScalar*   array_to;
20730c7d97c5SJed Brown   PetscScalar*   array_from;
20740c7d97c5SJed Brown   MPI_Comm       comm=((PetscObject)pc)->comm;
20750c7d97c5SJed Brown   PetscInt i;
20760c7d97c5SJed Brown 
20770c7d97c5SJed Brown   PetscFunctionBegin;
20780c7d97c5SJed Brown 
20790c7d97c5SJed Brown   switch(pcbddc->coarse_communications_type){
20800c7d97c5SJed Brown     case SCATTERS_BDDC:
20810c7d97c5SJed Brown       ierr = VecScatterEnd(pcbddc->coarse_loc_to_glob,vec_from,vec_to,imode,smode);CHKERRQ(ierr);
20820c7d97c5SJed Brown       break;
20830c7d97c5SJed Brown     case GATHERS_BDDC:
20840c7d97c5SJed Brown       if (vec_from) VecGetArray(vec_from,&array_from);
20850c7d97c5SJed Brown       if (vec_to)   VecGetArray(vec_to,&array_to);
20860c7d97c5SJed Brown       switch(pcbddc->coarse_problem_type){
20870c7d97c5SJed Brown         case SEQUENTIAL_BDDC:
20880c7d97c5SJed Brown           if (smode == SCATTER_FORWARD) {
208953cdbc3dSStefano Zampini             ierr = MPI_Gatherv(&array_from[0],pcbddc->local_primal_size,MPIU_SCALAR,&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,0,comm);CHKERRQ(ierr);
20900c7d97c5SJed Brown             if (vec_to) {
2091*0bdf917eSStefano Zampini               if (imode == ADD_VALUES) {
2092*0bdf917eSStefano Zampini                 for (i=0;i<pcbddc->replicated_primal_size;i++) {
20930c7d97c5SJed Brown                   array_to[pcbddc->replicated_local_primal_indices[i]]+=pcbddc->replicated_local_primal_values[i];
20940c7d97c5SJed Brown                 }
20950c7d97c5SJed Brown               } else {
2096*0bdf917eSStefano Zampini                 for (i=0;i<pcbddc->replicated_primal_size;i++) {
2097*0bdf917eSStefano Zampini                   array_to[pcbddc->replicated_local_primal_indices[i]]=pcbddc->replicated_local_primal_values[i];
2098*0bdf917eSStefano Zampini                 }
2099*0bdf917eSStefano Zampini               }
2100*0bdf917eSStefano Zampini             }
2101*0bdf917eSStefano Zampini           } else {
2102*0bdf917eSStefano Zampini             if (vec_from) {
2103*0bdf917eSStefano Zampini               if (imode == ADD_VALUES) {
2104*0bdf917eSStefano Zampini                 printf("Scatter mode %d, insert mode %d for case %d not implemented!\n",smode,imode,pcbddc->coarse_problem_type);
2105*0bdf917eSStefano Zampini               }
2106*0bdf917eSStefano Zampini               for (i=0;i<pcbddc->replicated_primal_size;i++) {
21070c7d97c5SJed Brown                 pcbddc->replicated_local_primal_values[i]=array_from[pcbddc->replicated_local_primal_indices[i]];
2108*0bdf917eSStefano Zampini               }
2109*0bdf917eSStefano Zampini             }
211053cdbc3dSStefano Zampini             ierr = MPI_Scatterv(&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,&array_to[0],pcbddc->local_primal_size,MPIU_SCALAR,0,comm);CHKERRQ(ierr);
21110c7d97c5SJed Brown           }
21120c7d97c5SJed Brown           break;
21130c7d97c5SJed Brown         case REPLICATED_BDDC:
21140c7d97c5SJed Brown           if (smode == SCATTER_FORWARD) {
211553cdbc3dSStefano Zampini             ierr = MPI_Allgatherv(&array_from[0],pcbddc->local_primal_size,MPIU_SCALAR,&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,comm);CHKERRQ(ierr);
2116*0bdf917eSStefano Zampini             if (imode == ADD_VALUES) {
2117*0bdf917eSStefano Zampini               for (i=0;i<pcbddc->replicated_primal_size;i++) {
21180c7d97c5SJed Brown                 array_to[pcbddc->replicated_local_primal_indices[i]]+=pcbddc->replicated_local_primal_values[i];
2119*0bdf917eSStefano Zampini               }
2120*0bdf917eSStefano Zampini             } else {
2121*0bdf917eSStefano Zampini               for (i=0;i<pcbddc->replicated_primal_size;i++) {
2122*0bdf917eSStefano Zampini                 array_to[pcbddc->replicated_local_primal_indices[i]]=pcbddc->replicated_local_primal_values[i];
2123*0bdf917eSStefano Zampini               }
2124*0bdf917eSStefano Zampini             }
21250c7d97c5SJed Brown           } else { /* no communications needed for SCATTER_REVERSE since needed data is already present */
2126*0bdf917eSStefano Zampini             if (imode == ADD_VALUES) {
2127*0bdf917eSStefano Zampini               for (i=0;i<pcbddc->local_primal_size;i++) {
2128*0bdf917eSStefano Zampini                 array_to[i]+=array_from[pcbddc->local_primal_indices[i]];
2129*0bdf917eSStefano Zampini               }
2130*0bdf917eSStefano Zampini             } else {
2131*0bdf917eSStefano Zampini               for (i=0;i<pcbddc->local_primal_size;i++) {
21320c7d97c5SJed Brown                 array_to[i]=array_from[pcbddc->local_primal_indices[i]];
21330c7d97c5SJed Brown               }
2134*0bdf917eSStefano Zampini             }
2135*0bdf917eSStefano Zampini           }
21360c7d97c5SJed Brown           break;
213753cdbc3dSStefano Zampini         case MULTILEVEL_BDDC:
213853cdbc3dSStefano Zampini           break;
213953cdbc3dSStefano Zampini         case PARALLEL_BDDC:
214053cdbc3dSStefano Zampini           break;
21410c7d97c5SJed Brown       }
21420c7d97c5SJed Brown       if (vec_from) VecRestoreArray(vec_from,&array_from);
21430c7d97c5SJed Brown       if (vec_to)   VecRestoreArray(vec_to,&array_to);
21440c7d97c5SJed Brown       break;
21450c7d97c5SJed Brown   }
21460c7d97c5SJed Brown   PetscFunctionReturn(0);
21470c7d97c5SJed Brown }
21480c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
21493b03a366Sstefano_zampini #undef __FUNCT__
21503b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCCreateConstraintMatrix"
21513b03a366Sstefano_zampini static PetscErrorCode PCBDDCCreateConstraintMatrix(PC pc)
21523b03a366Sstefano_zampini {
21533b03a366Sstefano_zampini   PetscErrorCode ierr;
21543b03a366Sstefano_zampini   PC_IS*         pcis = (PC_IS*)(pc->data);
21553b03a366Sstefano_zampini   PC_BDDC*       pcbddc = (PC_BDDC*)pc->data;
21563b03a366Sstefano_zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
215723d4d1a5SStefano Zampini   PetscInt       *nnz,*is_indices;
21583b03a366Sstefano_zampini   PetscScalar    *temp_quadrature_constraint;
2159534831adSStefano Zampini   PetscInt       *temp_indices,*temp_indices_to_constraint,*temp_indices_to_constraint_B,*local_to_B;
21603b03a366Sstefano_zampini   PetscInt       local_primal_size,i,j,k,total_counts,max_size_of_constraint;
21613b03a366Sstefano_zampini   PetscInt       n_constraints,n_vertices,size_of_constraint;
2162534831adSStefano Zampini   PetscScalar    quad_value;
21633b03a366Sstefano_zampini   PetscBool      nnsp_has_cnst=PETSC_FALSE,use_nnsp_true=pcbddc->use_nnsp_true;
21643b03a366Sstefano_zampini   PetscInt       nnsp_size=0,nnsp_addone=0,temp_constraints,temp_start_ptr;
21653b03a366Sstefano_zampini   IS             *used_IS;
21663b03a366Sstefano_zampini   const MatType  impMatType=MATSEQAIJ;
21673b03a366Sstefano_zampini   PetscBLASInt   Bs,Bt,lwork,lierr;
21683b03a366Sstefano_zampini   PetscReal      tol=1.0e-8;
2169fcda91b4SJed Brown   MatNullSpace   nearnullsp;
2170fcda91b4SJed Brown   const Vec      *nearnullvecs;
21713b03a366Sstefano_zampini   Vec            *localnearnullsp;
21723b03a366Sstefano_zampini   PetscScalar    *work,*temp_basis,*array_vector,*correlation_mat;
21733b03a366Sstefano_zampini   PetscReal      *rwork,*singular_vals;
2174534831adSStefano Zampini   PetscBLASInt   Bone=1,*ipiv;
2175534831adSStefano Zampini   Vec            temp_vec;
2176534831adSStefano Zampini   Mat            temp_mat;
2177534831adSStefano Zampini   KSP            temp_ksp;
2178ffe5efe1SStefano Zampini   PC             temp_pc;
2179534831adSStefano Zampini   PetscInt       s,start_constraint,dual_dofs;
2180534831adSStefano Zampini   PetscBool      compute_submatrix,useksp=PETSC_FALSE;
2181534831adSStefano Zampini   PetscInt       *aux_primal_permutation,*aux_primal_numbering;
2182534831adSStefano Zampini   PetscBool      boolforface,*change_basis;
2183de534f79Sstefano_zampini /* some ugly conditional declarations */
21843b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
21853b03a366Sstefano_zampini   PetscScalar    dot_result;
21863b03a366Sstefano_zampini   PetscScalar    one=1.0,zero=0.0;
21873b03a366Sstefano_zampini   PetscInt       ii;
21883425bc38SStefano Zampini   PetscScalar    *singular_vectors;
21893425bc38SStefano Zampini   PetscBLASInt   *iwork,*ifail;
21903425bc38SStefano Zampini   PetscReal      dummy_real,abs_tol;
21913425bc38SStefano Zampini   PetscBLASInt   eigs_found;
21923b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
21933b03a366Sstefano_zampini   PetscScalar    val1,val2;
21943b03a366Sstefano_zampini #endif
21953425bc38SStefano Zampini #endif
21963b03a366Sstefano_zampini   PetscBLASInt   dummy_int;
21973b03a366Sstefano_zampini   PetscScalar    dummy_scalar;
21983b03a366Sstefano_zampini 
21993b03a366Sstefano_zampini   PetscFunctionBegin;
22003b03a366Sstefano_zampini   /* check if near null space is attached to global mat */
2201fcda91b4SJed Brown   ierr = MatGetNearNullSpace(pc->pmat,&nearnullsp);CHKERRQ(ierr);
2202fcda91b4SJed Brown   if (nearnullsp) {
2203fcda91b4SJed Brown     ierr = MatNullSpaceGetVecs(nearnullsp,&nnsp_has_cnst,&nnsp_size,&nearnullvecs);CHKERRQ(ierr);
22043b03a366Sstefano_zampini   } else { /* if near null space is not provided it uses constants */
22053b03a366Sstefano_zampini     nnsp_has_cnst = PETSC_TRUE;
22063b03a366Sstefano_zampini     use_nnsp_true = PETSC_TRUE;
22073b03a366Sstefano_zampini   }
22083b03a366Sstefano_zampini   if (nnsp_has_cnst) {
22093b03a366Sstefano_zampini     nnsp_addone = 1;
22103b03a366Sstefano_zampini   }
22113b03a366Sstefano_zampini   /*
22123b03a366Sstefano_zampini        Evaluate maximum storage size needed by the procedure
22133b03a366Sstefano_zampini        - temp_indices will contain start index of each constraint stored as follows
22143b03a366Sstefano_zampini        - temp_indices_to_constraint  [temp_indices[i],...,temp_indices[i+1]-1] will contain the indices (in local numbering) on which the constraint acts
2215534831adSStefano Zampini        - temp_indices_to_constraint_B[temp_indices[i],...,temp_indices[i+1]-1] will contain the indices (in boundary numbering) on which the constraint acts
22163b03a366Sstefano_zampini        - temp_quadrature_constraint  [temp_indices[i],...,temp_indices[i+1]-1] will contain the scalars representing the constraint itself
22173b03a366Sstefano_zampini                                                                                                                                                          */
2218da1bb401SStefano Zampini 
22193b03a366Sstefano_zampini   total_counts = pcbddc->n_ISForFaces+pcbddc->n_ISForEdges;
22203b03a366Sstefano_zampini   total_counts *= (nnsp_addone+nnsp_size);
2221da1bb401SStefano Zampini   ierr = ISGetSize(pcbddc->ISForVertices,&n_vertices);CHKERRQ(ierr);
2222da1bb401SStefano Zampini   total_counts += n_vertices;
22233b03a366Sstefano_zampini   ierr = PetscMalloc((total_counts+1)*sizeof(PetscInt),&temp_indices);CHKERRQ(ierr);
2224534831adSStefano Zampini   ierr = PetscMalloc((total_counts+1)*sizeof(PetscBool),&change_basis);CHKERRQ(ierr);
22253b03a366Sstefano_zampini   total_counts = 0;
22263b03a366Sstefano_zampini   max_size_of_constraint = 0;
22273b03a366Sstefano_zampini   for (i=0;i<pcbddc->n_ISForEdges+pcbddc->n_ISForFaces;i++){
22283b03a366Sstefano_zampini     if (i<pcbddc->n_ISForEdges){
22293b03a366Sstefano_zampini       used_IS = &pcbddc->ISForEdges[i];
22303b03a366Sstefano_zampini     } else {
22313b03a366Sstefano_zampini       used_IS = &pcbddc->ISForFaces[i-pcbddc->n_ISForEdges];
22323b03a366Sstefano_zampini     }
22333b03a366Sstefano_zampini     ierr = ISGetSize(*used_IS,&j);CHKERRQ(ierr);
22343b03a366Sstefano_zampini     total_counts += j;
22353b03a366Sstefano_zampini     if (j>max_size_of_constraint) max_size_of_constraint=j;
22363b03a366Sstefano_zampini   }
22373b03a366Sstefano_zampini   total_counts *= (nnsp_addone+nnsp_size);
2238da1bb401SStefano Zampini   total_counts += n_vertices;
22393b03a366Sstefano_zampini   ierr = PetscMalloc(total_counts*sizeof(PetscScalar),&temp_quadrature_constraint);CHKERRQ(ierr);
22403b03a366Sstefano_zampini   ierr = PetscMalloc(total_counts*sizeof(PetscInt),&temp_indices_to_constraint);CHKERRQ(ierr);
2241534831adSStefano Zampini   ierr = PetscMalloc(total_counts*sizeof(PetscInt),&temp_indices_to_constraint_B);CHKERRQ(ierr);
2242534831adSStefano Zampini   ierr = PetscMalloc(pcis->n*sizeof(PetscInt),&local_to_B);CHKERRQ(ierr);
2243534831adSStefano Zampini   ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2244534831adSStefano Zampini   for (i=0;i<pcis->n;i++) {
2245534831adSStefano Zampini     local_to_B[i]=-1;
2246534831adSStefano Zampini   }
2247534831adSStefano Zampini   for (i=0;i<pcis->n_B;i++) {
2248534831adSStefano Zampini     local_to_B[is_indices[i]]=i;
2249534831adSStefano Zampini   }
2250534831adSStefano Zampini   ierr = ISRestoreIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2251534831adSStefano Zampini 
22523b03a366Sstefano_zampini   /* First we issue queries to allocate optimal workspace for LAPACKgesvd or LAPACKsyev/LAPACKheev */
22533b03a366Sstefano_zampini   rwork = 0;
22543b03a366Sstefano_zampini   work = 0;
22553b03a366Sstefano_zampini   singular_vals = 0;
22563b03a366Sstefano_zampini   temp_basis = 0;
22573b03a366Sstefano_zampini   correlation_mat = 0;
22583b03a366Sstefano_zampini   if (!pcbddc->use_nnsp_true) {
22593b03a366Sstefano_zampini     PetscScalar temp_work;
22603b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
22613b03a366Sstefano_zampini     /* POD */
22623b03a366Sstefano_zampini     PetscInt max_n;
22633b03a366Sstefano_zampini     max_n = nnsp_addone+nnsp_size;
22643b03a366Sstefano_zampini     /* using some techniques borrowed from Proper Orthogonal Decomposition */
22653b03a366Sstefano_zampini     ierr = PetscMalloc(max_n*max_n*sizeof(PetscScalar),&correlation_mat);CHKERRQ(ierr);
22663425bc38SStefano Zampini     ierr = PetscMalloc(max_n*max_n*sizeof(PetscScalar),&singular_vectors);CHKERRQ(ierr);
22673b03a366Sstefano_zampini     ierr = PetscMalloc(max_n*sizeof(PetscReal),&singular_vals);CHKERRQ(ierr);
22683b03a366Sstefano_zampini     ierr = PetscMalloc(max_size_of_constraint*(nnsp_addone+nnsp_size)*sizeof(PetscScalar),&temp_basis);CHKERRQ(ierr);
22693b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
22703b03a366Sstefano_zampini     ierr = PetscMalloc(3*max_n*sizeof(PetscReal),&rwork);CHKERRQ(ierr);
22713b03a366Sstefano_zampini #endif
22723425bc38SStefano Zampini     ierr = PetscMalloc(5*max_n*sizeof(PetscBLASInt),&iwork);CHKERRQ(ierr);
22733425bc38SStefano Zampini     ierr = PetscMalloc(max_n*sizeof(PetscBLASInt),&ifail);CHKERRQ(ierr);
22743b03a366Sstefano_zampini     /* now we evaluate the optimal workspace using query with lwork=-1 */
22753b03a366Sstefano_zampini     Bt = PetscBLASIntCast(max_n);
22763b03a366Sstefano_zampini     lwork=-1;
22773425bc38SStefano Zampini     ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
22783b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
22793425bc38SStefano Zampini     abs_tol=1.e-8;
22803425bc38SStefano Zampini /*    LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,&temp_work,&lwork,&lierr); */
22813425bc38SStefano Zampini     LAPACKsyevx_("V","A","U",&Bt,correlation_mat,&Bt,&dummy_real,&dummy_real,&dummy_int,&dummy_int,
22823425bc38SStefano Zampini                  &abs_tol,&eigs_found,singular_vals,singular_vectors,&Bt,&temp_work,&lwork,iwork,ifail,&lierr);
22833b03a366Sstefano_zampini #else
22843425bc38SStefano Zampini /*    LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,&temp_work,&lwork,rwork,&lierr); */
22853425bc38SStefano Zampini /*  LAPACK call is missing here! TODO */
22863425bc38SStefano Zampini     SETERRQ(((PetscObject) pc)->comm, PETSC_ERR_SUP, "Not yet implemented for complexes when PETSC_MISSING_GESVD = 1");
22873b03a366Sstefano_zampini #endif
22883425bc38SStefano Zampini     if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SYEVX Lapack routine %d",(int)lierr);
22893425bc38SStefano Zampini     ierr = PetscFPTrapPop();CHKERRQ(ierr);
22903b03a366Sstefano_zampini #else /* on missing GESVD */
22913b03a366Sstefano_zampini     /* SVD */
22923b03a366Sstefano_zampini     PetscInt max_n,min_n;
22933b03a366Sstefano_zampini     max_n = max_size_of_constraint;
22943b03a366Sstefano_zampini     min_n = nnsp_addone+nnsp_size;
22953b03a366Sstefano_zampini     if (max_size_of_constraint < ( nnsp_addone+nnsp_size ) ) {
22963b03a366Sstefano_zampini       min_n = max_size_of_constraint;
22973b03a366Sstefano_zampini       max_n = nnsp_addone+nnsp_size;
22983b03a366Sstefano_zampini     }
22993b03a366Sstefano_zampini     ierr = PetscMalloc(min_n*sizeof(PetscReal),&singular_vals);CHKERRQ(ierr);
23003b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
23013b03a366Sstefano_zampini     ierr = PetscMalloc(5*min_n*sizeof(PetscReal),&rwork);CHKERRQ(ierr);
23023b03a366Sstefano_zampini #endif
23033b03a366Sstefano_zampini     /* now we evaluate the optimal workspace using query with lwork=-1 */
23043b03a366Sstefano_zampini     lwork=-1;
23053b03a366Sstefano_zampini     Bs = PetscBLASIntCast(max_n);
23063b03a366Sstefano_zampini     Bt = PetscBLASIntCast(min_n);
23073b03a366Sstefano_zampini     dummy_int = Bs;
2308670f3ff9SJed Brown     ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
23093b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
23103b03a366Sstefano_zampini     LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[0],&Bs,singular_vals,
23113b03a366Sstefano_zampini                  &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,&temp_work,&lwork,&lierr);
23123b03a366Sstefano_zampini #else
23133b03a366Sstefano_zampini     LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[0],&Bs,singular_vals,
23143b03a366Sstefano_zampini                  &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,&temp_work,&lwork,rwork,&lierr);
23153b03a366Sstefano_zampini #endif
23163b03a366Sstefano_zampini     if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SVD Lapack routine %d",(int)lierr);
2317670f3ff9SJed Brown     ierr = PetscFPTrapPop();CHKERRQ(ierr);
23183b03a366Sstefano_zampini #endif
23193b03a366Sstefano_zampini     /* Allocate optimal workspace */
23203b03a366Sstefano_zampini     lwork = PetscBLASIntCast((PetscInt)PetscRealPart(temp_work));
23213b03a366Sstefano_zampini     total_counts = (PetscInt)lwork;
23223b03a366Sstefano_zampini     ierr = PetscMalloc(total_counts*sizeof(PetscScalar),&work);CHKERRQ(ierr);
23233b03a366Sstefano_zampini   }
23243b03a366Sstefano_zampini   /* get local part of global near null space vectors */
23253b03a366Sstefano_zampini   ierr = PetscMalloc(nnsp_size*sizeof(Vec),&localnearnullsp);CHKERRQ(ierr);
23263b03a366Sstefano_zampini   for (k=0;k<nnsp_size;k++) {
23273b03a366Sstefano_zampini     ierr = VecDuplicate(pcis->vec1_N,&localnearnullsp[k]);CHKERRQ(ierr);
2328fcda91b4SJed Brown     ierr = VecScatterBegin(matis->ctx,nearnullvecs[k],localnearnullsp[k],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
2329fcda91b4SJed Brown     ierr = VecScatterEnd  (matis->ctx,nearnullvecs[k],localnearnullsp[k],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
23303b03a366Sstefano_zampini   }
23313b03a366Sstefano_zampini   /* Now we can loop on constraining sets */
23323b03a366Sstefano_zampini   total_counts=0;
23333b03a366Sstefano_zampini   temp_indices[0]=0;
2334da1bb401SStefano Zampini   /* vertices */
2335da1bb401SStefano Zampini   PetscBool used_vertex;
2336da1bb401SStefano Zampini   ierr = ISGetIndices(pcbddc->ISForVertices,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2337da1bb401SStefano Zampini   if (nnsp_has_cnst) { /* consider all vertices */
2338da1bb401SStefano Zampini     for (i=0;i<n_vertices;i++) {
2339da1bb401SStefano Zampini       temp_indices_to_constraint[temp_indices[total_counts]]=is_indices[i];
2340534831adSStefano Zampini       temp_indices_to_constraint_B[temp_indices[total_counts]]=local_to_B[is_indices[i]];
2341da1bb401SStefano Zampini       temp_quadrature_constraint[temp_indices[total_counts]]=1.0;
2342da1bb401SStefano Zampini       temp_indices[total_counts+1]=temp_indices[total_counts]+1;
2343534831adSStefano Zampini       change_basis[total_counts]=PETSC_FALSE;
2344da1bb401SStefano Zampini       total_counts++;
2345da1bb401SStefano Zampini     }
2346da1bb401SStefano Zampini   } else { /* consider vertices for which exist at least a localnearnullsp which is not null there */
2347da1bb401SStefano Zampini     for (i=0;i<n_vertices;i++) {
2348da1bb401SStefano Zampini       used_vertex=PETSC_FALSE;
2349da1bb401SStefano Zampini       k=0;
2350da1bb401SStefano Zampini       while(!used_vertex && k<nnsp_size) {
2351da1bb401SStefano Zampini         ierr = VecGetArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
2352da1bb401SStefano Zampini         if (PetscAbsScalar(array_vector[is_indices[i]])>0.0) {
2353da1bb401SStefano Zampini           temp_indices_to_constraint[temp_indices[total_counts]]=is_indices[i];
2354534831adSStefano Zampini           temp_indices_to_constraint_B[temp_indices[total_counts]]=local_to_B[is_indices[i]];
2355da1bb401SStefano Zampini           temp_quadrature_constraint[temp_indices[total_counts]]=1.0;
2356da1bb401SStefano Zampini           temp_indices[total_counts+1]=temp_indices[total_counts]+1;
2357534831adSStefano Zampini           change_basis[total_counts]=PETSC_FALSE;
2358da1bb401SStefano Zampini           total_counts++;
2359da1bb401SStefano Zampini           used_vertex=PETSC_TRUE;
2360da1bb401SStefano Zampini         }
2361da1bb401SStefano Zampini         ierr = VecRestoreArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
2362da1bb401SStefano Zampini         k++;
2363da1bb401SStefano Zampini       }
2364da1bb401SStefano Zampini     }
2365da1bb401SStefano Zampini   }
2366da1bb401SStefano Zampini   ierr = ISRestoreIndices(pcbddc->ISForVertices,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2367da1bb401SStefano Zampini   n_vertices=total_counts;
2368da1bb401SStefano Zampini   /* edges and faces */
23693b03a366Sstefano_zampini   for (i=0;i<pcbddc->n_ISForEdges+pcbddc->n_ISForFaces;i++){
23703b03a366Sstefano_zampini     if (i<pcbddc->n_ISForEdges){
23713b03a366Sstefano_zampini       used_IS = &pcbddc->ISForEdges[i];
2372534831adSStefano Zampini       boolforface = pcbddc->usechangeofbasis;
23733b03a366Sstefano_zampini     } else {
23743b03a366Sstefano_zampini       used_IS = &pcbddc->ISForFaces[i-pcbddc->n_ISForEdges];
2375534831adSStefano Zampini       boolforface = pcbddc->usechangeonfaces;
23763b03a366Sstefano_zampini     }
23773b03a366Sstefano_zampini     temp_constraints = 0;          /* zero the number of constraints I have on this conn comp */
23783b03a366Sstefano_zampini     temp_start_ptr = total_counts; /* need to know the starting index of constraints stored */
23793b03a366Sstefano_zampini     ierr = ISGetSize(*used_IS,&size_of_constraint);CHKERRQ(ierr);
23803b03a366Sstefano_zampini     ierr = ISGetIndices(*used_IS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
23813b03a366Sstefano_zampini     if (nnsp_has_cnst) {
23823b03a366Sstefano_zampini       temp_constraints++;
2383534831adSStefano Zampini       quad_value = (PetscScalar) (1.0/PetscSqrtReal((PetscReal)size_of_constraint));
23843b03a366Sstefano_zampini       for (j=0;j<size_of_constraint;j++) {
23853b03a366Sstefano_zampini         temp_indices_to_constraint[temp_indices[total_counts]+j]=is_indices[j];
2386534831adSStefano Zampini         temp_indices_to_constraint_B[temp_indices[total_counts]+j]=local_to_B[is_indices[j]];
23873b03a366Sstefano_zampini         temp_quadrature_constraint[temp_indices[total_counts]+j]=quad_value;
23883b03a366Sstefano_zampini       }
23893b03a366Sstefano_zampini       temp_indices[total_counts+1]=temp_indices[total_counts]+size_of_constraint;  /* store new starting point */
2390534831adSStefano Zampini       change_basis[total_counts]=boolforface;
23913b03a366Sstefano_zampini       total_counts++;
23923b03a366Sstefano_zampini     }
23933b03a366Sstefano_zampini     for (k=0;k<nnsp_size;k++) {
23943b03a366Sstefano_zampini       ierr = VecGetArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
23953b03a366Sstefano_zampini       for (j=0;j<size_of_constraint;j++) {
23963b03a366Sstefano_zampini         temp_indices_to_constraint[temp_indices[total_counts]+j]=is_indices[j];
2397534831adSStefano Zampini         temp_indices_to_constraint_B[temp_indices[total_counts]+j]=local_to_B[is_indices[j]];
23983b03a366Sstefano_zampini         temp_quadrature_constraint[temp_indices[total_counts]+j]=array_vector[is_indices[j]];
23993b03a366Sstefano_zampini       }
24003b03a366Sstefano_zampini       ierr = VecRestoreArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
2401de534f79Sstefano_zampini       quad_value = 1.0;
2402de534f79Sstefano_zampini       if ( use_nnsp_true ) { /* check if array is null on the connected component in case use_nnsp_true has been requested */
2403de534f79Sstefano_zampini         Bs = PetscBLASIntCast(size_of_constraint);
2404de534f79Sstefano_zampini         quad_value = BLASasum_(&Bs,&temp_quadrature_constraint[temp_indices[total_counts]],&Bone);
2405de534f79Sstefano_zampini       }
2406de534f79Sstefano_zampini       if ( quad_value > 0.0 ) { /* keep indices and values */
2407de534f79Sstefano_zampini         temp_constraints++;
24083b03a366Sstefano_zampini         temp_indices[total_counts+1]=temp_indices[total_counts]+size_of_constraint;  /* store new starting point */
2409534831adSStefano Zampini         change_basis[total_counts]=boolforface;
24103b03a366Sstefano_zampini         total_counts++;
24113b03a366Sstefano_zampini       }
2412de534f79Sstefano_zampini     }
24133b03a366Sstefano_zampini     ierr = ISRestoreIndices(*used_IS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2414de534f79Sstefano_zampini     /* perform SVD on the constraint if use_nnsp_true has not been requested by the user */
24153b03a366Sstefano_zampini     if (!use_nnsp_true) {
2416de534f79Sstefano_zampini 
24173b03a366Sstefano_zampini       Bs = PetscBLASIntCast(size_of_constraint);
24183b03a366Sstefano_zampini       Bt = PetscBLASIntCast(temp_constraints);
2419de534f79Sstefano_zampini 
24203b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
24213b03a366Sstefano_zampini       ierr = PetscMemzero(correlation_mat,Bt*Bt*sizeof(PetscScalar));CHKERRQ(ierr);
24223b03a366Sstefano_zampini       /* Store upper triangular part of correlation matrix */
24233b03a366Sstefano_zampini       for (j=0;j<temp_constraints;j++) {
24243b03a366Sstefano_zampini         for (k=0;k<j+1;k++) {
24253b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
24263425bc38SStefano Zampini           /* hand made complex dot product -> replace */
24273b03a366Sstefano_zampini           dot_result = 0.0;
24283b03a366Sstefano_zampini           for (ii=0; ii<size_of_constraint; ii++) {
24293b03a366Sstefano_zampini             val1 = temp_quadrature_constraint[temp_indices[temp_start_ptr+j]+ii];
24303b03a366Sstefano_zampini             val2 = temp_quadrature_constraint[temp_indices[temp_start_ptr+k]+ii];
24313b03a366Sstefano_zampini             dot_result += val1*PetscConj(val2);
24323b03a366Sstefano_zampini           }
24333b03a366Sstefano_zampini #else
24343b03a366Sstefano_zampini           dot_result = BLASdot_(&Bs,&temp_quadrature_constraint[temp_indices[temp_start_ptr+j]],&Bone,
24353b03a366Sstefano_zampini                                     &temp_quadrature_constraint[temp_indices[temp_start_ptr+k]],&Bone);
24363b03a366Sstefano_zampini #endif
24373b03a366Sstefano_zampini           correlation_mat[j*temp_constraints+k]=dot_result;
24383b03a366Sstefano_zampini         }
24393b03a366Sstefano_zampini       }
24403425bc38SStefano Zampini       ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
24413b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
24423425bc38SStefano Zampini /*      LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,work,&lwork,&lierr); */
24433425bc38SStefano Zampini       LAPACKsyevx_("V","A","U",&Bt,correlation_mat,&Bt,&dummy_real,&dummy_real,&dummy_int,&dummy_int,
24443425bc38SStefano Zampini                  &abs_tol,&eigs_found,singular_vals,singular_vectors,&Bt,work,&lwork,iwork,ifail,&lierr);
24453b03a366Sstefano_zampini #else
24463425bc38SStefano Zampini /*  LAPACK call is missing here! TODO */
24473425bc38SStefano Zampini       SETERRQ(((PetscObject) pc)->comm, PETSC_ERR_SUP, "Not yet implemented for complexes when PETSC_MISSING_GESVD = 1");
24483b03a366Sstefano_zampini #endif
24493425bc38SStefano Zampini       if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYEVX Lapack routine %d",(int)lierr);
24503425bc38SStefano Zampini       ierr = PetscFPTrapPop();CHKERRQ(ierr);
24513b03a366Sstefano_zampini       /* retain eigenvalues greater than tol: note that lapack SYEV gives eigs in ascending order */
24523b03a366Sstefano_zampini       j=0;
24533b03a366Sstefano_zampini       while( j < Bt && singular_vals[j] < tol) j++;
24543b03a366Sstefano_zampini       total_counts=total_counts-j;
24553b03a366Sstefano_zampini       if (j<temp_constraints) {
24563b03a366Sstefano_zampini         for (k=j;k<Bt;k++) { singular_vals[k]=1.0/PetscSqrtReal(singular_vals[k]); }
24573425bc38SStefano Zampini         ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
24583b03a366Sstefano_zampini         BLASgemm_("N","N",&Bs,&Bt,&Bt,&one,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,correlation_mat,&Bt,&zero,temp_basis,&Bs);
24593425bc38SStefano Zampini         ierr = PetscFPTrapPop();CHKERRQ(ierr);
24603b03a366Sstefano_zampini         /* copy POD basis into used quadrature memory */
24613b03a366Sstefano_zampini         for (k=0;k<Bt-j;k++) {
24623b03a366Sstefano_zampini           for (ii=0;ii<size_of_constraint;ii++) {
24633b03a366Sstefano_zampini             temp_quadrature_constraint[temp_indices[temp_start_ptr+k]+ii]=singular_vals[Bt-1-k]*temp_basis[(Bt-1-k)*size_of_constraint+ii];
24643b03a366Sstefano_zampini           }
24653b03a366Sstefano_zampini         }
24663b03a366Sstefano_zampini       }
2467de534f79Sstefano_zampini 
24683b03a366Sstefano_zampini #else  /* on missing GESVD */
24693b03a366Sstefano_zampini       PetscInt min_n = temp_constraints;
24703b03a366Sstefano_zampini       if (min_n > size_of_constraint) min_n = size_of_constraint;
24713b03a366Sstefano_zampini       dummy_int = Bs;
2472670f3ff9SJed Brown       ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
24733b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
24743b03a366Sstefano_zampini       LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,singular_vals,
24753b03a366Sstefano_zampini                    &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,work,&lwork,&lierr);
24763b03a366Sstefano_zampini #else
24773b03a366Sstefano_zampini       LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,singular_vals,
24783b03a366Sstefano_zampini                    &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,work,&lwork,rwork,&lierr);
24793b03a366Sstefano_zampini #endif
24803b03a366Sstefano_zampini       if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SVD Lapack routine %d",(int)lierr);
2481670f3ff9SJed Brown       ierr = PetscFPTrapPop();CHKERRQ(ierr);
24823b03a366Sstefano_zampini       /* retain eigenvalues greater than tol: note that lapack SVD gives eigs in descending order */
24833b03a366Sstefano_zampini       j=0;
24843b03a366Sstefano_zampini       while( j < min_n && singular_vals[min_n-j-1] < tol) j++;
24853b03a366Sstefano_zampini       total_counts = total_counts-(PetscInt)Bt+(min_n-j);
24863b03a366Sstefano_zampini #endif
24873b03a366Sstefano_zampini     }
24883b03a366Sstefano_zampini   }
2489534831adSStefano Zampini 
2490da1bb401SStefano Zampini   n_constraints=total_counts-n_vertices;
2491da1bb401SStefano Zampini   local_primal_size = total_counts;
24923b03a366Sstefano_zampini   /* set quantities in pcbddc data structure */
24933b03a366Sstefano_zampini   pcbddc->n_vertices = n_vertices;
24943b03a366Sstefano_zampini   pcbddc->n_constraints = n_constraints;
2495da1bb401SStefano Zampini   pcbddc->local_primal_size = local_primal_size;
2496534831adSStefano Zampini 
2497534831adSStefano Zampini   /* Create constraint matrix */
2498534831adSStefano Zampini   /* The constraint matrix is used to compute the l2g map of primal dofs */
2499534831adSStefano Zampini   /* so we need to set it up properly either with or without change of basis */
2500534831adSStefano Zampini   ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->ConstraintMatrix);CHKERRQ(ierr);
2501534831adSStefano Zampini   ierr = MatSetType(pcbddc->ConstraintMatrix,impMatType);CHKERRQ(ierr);
2502534831adSStefano Zampini   ierr = MatSetSizes(pcbddc->ConstraintMatrix,local_primal_size,pcis->n,local_primal_size,pcis->n);CHKERRQ(ierr);
2503534831adSStefano Zampini   /* compute a local numbering of constraints : vertices first then constraints */
2504534831adSStefano Zampini   ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
2505534831adSStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array_vector);CHKERRQ(ierr);
2506534831adSStefano Zampini   ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&aux_primal_numbering);CHKERRQ(ierr);
2507534831adSStefano Zampini   ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&aux_primal_permutation);CHKERRQ(ierr);
2508534831adSStefano Zampini   total_counts=0;
2509534831adSStefano Zampini   /* find vertices: subdomain corners plus dofs with basis changed */
2510534831adSStefano Zampini   for (i=0;i<local_primal_size;i++) {
2511534831adSStefano Zampini     size_of_constraint=temp_indices[i+1]-temp_indices[i];
2512534831adSStefano Zampini     if (change_basis[i] || size_of_constraint == 1) {
2513534831adSStefano Zampini       k=0;
2514534831adSStefano Zampini       while(k < size_of_constraint && array_vector[temp_indices_to_constraint[temp_indices[i]+size_of_constraint-k-1]] != 0.0) {
2515534831adSStefano Zampini         k=k+1;
2516534831adSStefano Zampini       }
2517534831adSStefano Zampini       j=temp_indices_to_constraint[temp_indices[i]+size_of_constraint-k-1];
2518534831adSStefano Zampini       array_vector[j] = 1.0;
2519534831adSStefano Zampini       aux_primal_numbering[total_counts]=j;
2520534831adSStefano Zampini       aux_primal_permutation[total_counts]=total_counts;
2521534831adSStefano Zampini       total_counts++;
2522534831adSStefano Zampini     }
2523534831adSStefano Zampini   }
2524534831adSStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array_vector);CHKERRQ(ierr);
2525534831adSStefano Zampini   /* permute indices in order to have a sorted set of vertices */
2526534831adSStefano Zampini   ierr = PetscSortIntWithPermutation(total_counts,aux_primal_numbering,aux_primal_permutation);
2527534831adSStefano Zampini   /* nonzero structure */
2528534831adSStefano Zampini   ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
2529534831adSStefano Zampini   for (i=0;i<total_counts;i++) {
2530534831adSStefano Zampini     nnz[i]=1;
2531534831adSStefano Zampini   }
2532534831adSStefano Zampini   j=total_counts;
2533534831adSStefano Zampini   for (i=n_vertices;i<local_primal_size;i++) {
2534534831adSStefano Zampini     if (!change_basis[i]) {
2535534831adSStefano Zampini       nnz[j]=temp_indices[i+1]-temp_indices[i];
2536534831adSStefano Zampini       j++;
2537534831adSStefano Zampini     }
2538534831adSStefano Zampini   }
2539534831adSStefano Zampini   ierr = MatSeqAIJSetPreallocation(pcbddc->ConstraintMatrix,0,nnz);CHKERRQ(ierr);
2540534831adSStefano Zampini   ierr = PetscFree(nnz);CHKERRQ(ierr);
2541534831adSStefano Zampini   /* set values in constraint matrix */
2542534831adSStefano Zampini   for (i=0;i<total_counts;i++) {
2543534831adSStefano Zampini     j = aux_primal_permutation[i];
2544534831adSStefano Zampini     k = aux_primal_numbering[j];
2545534831adSStefano Zampini     ierr = MatSetValue(pcbddc->ConstraintMatrix,i,k,1.0,INSERT_VALUES);CHKERRQ(ierr);
2546534831adSStefano Zampini   }
2547534831adSStefano Zampini   for (i=n_vertices;i<local_primal_size;i++) {
2548534831adSStefano Zampini     if (!change_basis[i]) {
2549534831adSStefano Zampini       size_of_constraint=temp_indices[i+1]-temp_indices[i];
2550534831adSStefano Zampini       ierr = MatSetValues(pcbddc->ConstraintMatrix,1,&total_counts,size_of_constraint,&temp_indices_to_constraint[temp_indices[i]],&temp_quadrature_constraint[temp_indices[i]],INSERT_VALUES);CHKERRQ(ierr);
2551534831adSStefano Zampini       total_counts++;
2552534831adSStefano Zampini     }
2553534831adSStefano Zampini   }
2554534831adSStefano Zampini   ierr = PetscFree(aux_primal_numbering);CHKERRQ(ierr);
2555534831adSStefano Zampini   ierr = PetscFree(aux_primal_permutation);CHKERRQ(ierr);
2556534831adSStefano Zampini   /* assembling */
2557534831adSStefano Zampini   ierr = MatAssemblyBegin(pcbddc->ConstraintMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2558534831adSStefano Zampini   ierr = MatAssemblyEnd(pcbddc->ConstraintMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2559534831adSStefano Zampini 
2560534831adSStefano Zampini   /* Create matrix for change of basis. We don't need it in case pcbddc->usechangeofbasis is FALSE */
2561534831adSStefano Zampini   if (pcbddc->usechangeofbasis) {
2562534831adSStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr);
2563534831adSStefano Zampini     ierr = MatSetType(pcbddc->ChangeOfBasisMatrix,impMatType);CHKERRQ(ierr);
2564534831adSStefano Zampini     ierr = MatSetSizes(pcbddc->ChangeOfBasisMatrix,pcis->n_B,pcis->n_B,pcis->n_B,pcis->n_B);CHKERRQ(ierr);
2565534831adSStefano Zampini     /* work arrays */
2566534831adSStefano Zampini     /* we need to reuse these arrays, so we free them */
2567534831adSStefano Zampini     ierr = PetscFree(temp_basis);CHKERRQ(ierr);
2568534831adSStefano Zampini     ierr = PetscFree(work);CHKERRQ(ierr);
2569534831adSStefano Zampini     ierr = PetscMalloc(pcis->n_B*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
2570534831adSStefano Zampini     ierr = PetscMalloc((nnsp_addone+nnsp_size)*(nnsp_addone+nnsp_size)*sizeof(PetscScalar),&temp_basis);CHKERRQ(ierr);
2571534831adSStefano Zampini     ierr = PetscMalloc((nnsp_addone+nnsp_size)*sizeof(PetscScalar),&work);CHKERRQ(ierr);
2572534831adSStefano Zampini     ierr = PetscMalloc((nnsp_addone+nnsp_size)*sizeof(PetscBLASInt),&ipiv);CHKERRQ(ierr);
2573534831adSStefano Zampini     for (i=0;i<pcis->n_B;i++) {
2574534831adSStefano Zampini       nnz[i]=1;
2575534831adSStefano Zampini     }
2576534831adSStefano Zampini     /* Overestimated nonzeros per row */
2577534831adSStefano Zampini     k=1;
2578534831adSStefano Zampini     for (i=pcbddc->n_vertices;i<local_primal_size;i++) {
2579534831adSStefano Zampini       if (change_basis[i]) {
2580534831adSStefano Zampini         size_of_constraint = temp_indices[i+1]-temp_indices[i];
2581534831adSStefano Zampini         if (k < size_of_constraint) {
2582534831adSStefano Zampini           k = size_of_constraint;
2583534831adSStefano Zampini         }
2584534831adSStefano Zampini         for (j=0;j<size_of_constraint;j++) {
2585534831adSStefano Zampini           nnz[temp_indices_to_constraint_B[temp_indices[i]+j]] = size_of_constraint;
2586534831adSStefano Zampini         }
2587534831adSStefano Zampini       }
2588534831adSStefano Zampini     }
2589534831adSStefano Zampini     ierr = MatSeqAIJSetPreallocation(pcbddc->ChangeOfBasisMatrix,0,nnz);CHKERRQ(ierr);
2590534831adSStefano Zampini     ierr = PetscFree(nnz);CHKERRQ(ierr);
2591534831adSStefano Zampini     /* Temporary array to store indices */
2592534831adSStefano Zampini     ierr = PetscMalloc(k*sizeof(PetscInt),&is_indices);CHKERRQ(ierr);
2593534831adSStefano Zampini     /* Set initial identity in the matrix */
2594534831adSStefano Zampini     for (i=0;i<pcis->n_B;i++) {
2595534831adSStefano Zampini       ierr = MatSetValue(pcbddc->ChangeOfBasisMatrix,i,i,1.0,INSERT_VALUES);CHKERRQ(ierr);
2596534831adSStefano Zampini     }
2597534831adSStefano Zampini     /* Now we loop on the constraints which need a change of basis */
2598534831adSStefano Zampini     /* Change of basis matrix is evaluated as the FIRST APPROACH in */
2599534831adSStefano Zampini     /* Klawonn and Widlund, Dual-primal FETI-DP methods for linear elasticity, (6.2.1) */
2600534831adSStefano Zampini     temp_constraints = 0;
260193dc3b60SStefano Zampini     if (pcbddc->n_vertices < local_primal_size) {
2602534831adSStefano Zampini       temp_start_ptr = temp_indices_to_constraint_B[temp_indices[pcbddc->n_vertices]];
260393dc3b60SStefano Zampini     }
2604534831adSStefano Zampini     for (i=pcbddc->n_vertices;i<local_primal_size;i++) {
2605534831adSStefano Zampini       if (change_basis[i]) {
2606534831adSStefano Zampini         compute_submatrix = PETSC_FALSE;
2607534831adSStefano Zampini         useksp = PETSC_FALSE;
2608534831adSStefano Zampini         if (temp_start_ptr == temp_indices_to_constraint_B[temp_indices[i]]) {
2609534831adSStefano Zampini           temp_constraints++;
261004eaf177SStefano Zampini           if (i == local_primal_size -1 ||  temp_start_ptr != temp_indices_to_constraint_B[temp_indices[i+1]]) {
2611534831adSStefano Zampini             compute_submatrix = PETSC_TRUE;
2612534831adSStefano Zampini           }
2613534831adSStefano Zampini         }
2614534831adSStefano Zampini         if (compute_submatrix) {
2615534831adSStefano Zampini           if (temp_constraints > 1 || pcbddc->use_nnsp_true) {
2616534831adSStefano Zampini             useksp = PETSC_TRUE;
2617534831adSStefano Zampini           }
2618534831adSStefano Zampini           size_of_constraint = temp_indices[i+1]-temp_indices[i];
2619534831adSStefano Zampini           if (useksp) { /* experimental */
2620534831adSStefano Zampini             ierr = MatCreate(PETSC_COMM_SELF,&temp_mat);CHKERRQ(ierr);
2621534831adSStefano Zampini             ierr = MatSetType(temp_mat,impMatType);CHKERRQ(ierr);
2622534831adSStefano Zampini             ierr = MatSetSizes(temp_mat,size_of_constraint,size_of_constraint,size_of_constraint,size_of_constraint);CHKERRQ(ierr);
2623534831adSStefano Zampini             ierr = MatSeqAIJSetPreallocation(temp_mat,size_of_constraint,PETSC_NULL);CHKERRQ(ierr);
2624534831adSStefano Zampini           }
2625534831adSStefano Zampini           /* First _size_of_constraint-temp_constraints_ columns */
2626534831adSStefano Zampini           dual_dofs = size_of_constraint-temp_constraints;
2627534831adSStefano Zampini           start_constraint = i+1-temp_constraints;
2628534831adSStefano Zampini           for (s=0;s<dual_dofs;s++) {
2629534831adSStefano Zampini             is_indices[0] = s;
2630534831adSStefano Zampini             for (j=0;j<temp_constraints;j++) {
2631534831adSStefano Zampini               for (k=0;k<temp_constraints;k++) {
2632534831adSStefano Zampini                 temp_basis[j*temp_constraints+k]=temp_quadrature_constraint[temp_indices[start_constraint+k]+s+j+1];
2633534831adSStefano Zampini               }
2634534831adSStefano Zampini               work[j]=-temp_quadrature_constraint[temp_indices[start_constraint+j]+s];
2635534831adSStefano Zampini               is_indices[j+1]=s+j+1;
2636534831adSStefano Zampini             }
2637534831adSStefano Zampini             Bt = temp_constraints;
2638534831adSStefano Zampini             ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
2639534831adSStefano Zampini             LAPACKgesv_(&Bt,&Bone,temp_basis,&Bt,ipiv,work,&Bt,&lierr);
2640534831adSStefano Zampini             if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GESV Lapack routine %d",(int)lierr);
2641534831adSStefano Zampini             ierr = PetscFPTrapPop();CHKERRQ(ierr);
2642534831adSStefano Zampini             j = temp_indices_to_constraint_B[temp_indices[start_constraint]+s];
2643534831adSStefano Zampini             ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,temp_constraints,&temp_indices_to_constraint_B[temp_indices[start_constraint]+s+1],1,&j,work,INSERT_VALUES);CHKERRQ(ierr);
2644534831adSStefano Zampini             if (useksp) {
2645534831adSStefano Zampini               /* temp mat with transposed rows and columns */
2646534831adSStefano Zampini               ierr = MatSetValues(temp_mat,1,&s,temp_constraints,&is_indices[1],work,INSERT_VALUES);CHKERRQ(ierr);
2647534831adSStefano Zampini               ierr = MatSetValue(temp_mat,is_indices[0],is_indices[0],1.0,INSERT_VALUES);CHKERRQ(ierr);
2648534831adSStefano Zampini             }
2649534831adSStefano Zampini           }
2650534831adSStefano Zampini           if (useksp) {
2651534831adSStefano Zampini             /* last rows of temp_mat */
2652534831adSStefano Zampini             for (j=0;j<size_of_constraint;j++) {
2653534831adSStefano Zampini               is_indices[j] = j;
2654534831adSStefano Zampini             }
2655534831adSStefano Zampini             for (s=0;s<temp_constraints;s++) {
2656534831adSStefano Zampini               k = s + dual_dofs;
2657534831adSStefano Zampini               ierr = MatSetValues(temp_mat,1,&k,size_of_constraint,is_indices,&temp_quadrature_constraint[temp_indices[start_constraint+s]],INSERT_VALUES);CHKERRQ(ierr);
2658534831adSStefano Zampini             }
2659534831adSStefano Zampini             ierr = MatAssemblyBegin(temp_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2660534831adSStefano Zampini             ierr = MatAssemblyEnd(temp_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2661534831adSStefano Zampini             ierr = MatGetVecs(temp_mat,&temp_vec,PETSC_NULL);CHKERRQ(ierr);
2662534831adSStefano Zampini             ierr = KSPCreate(PETSC_COMM_SELF,&temp_ksp);CHKERRQ(ierr);
2663534831adSStefano Zampini             ierr = KSPSetOperators(temp_ksp,temp_mat,temp_mat,SAME_PRECONDITIONER);CHKERRQ(ierr);
2664534831adSStefano Zampini             ierr = KSPSetType(temp_ksp,KSPPREONLY);CHKERRQ(ierr);
2665ffe5efe1SStefano Zampini             ierr = KSPGetPC(temp_ksp,&temp_pc);CHKERRQ(ierr);
2666ffe5efe1SStefano Zampini             ierr = PCSetType(temp_pc,PCLU);CHKERRQ(ierr);
2667534831adSStefano Zampini             ierr = KSPSetUp(temp_ksp);CHKERRQ(ierr);
2668534831adSStefano Zampini             for (s=0;s<temp_constraints;s++) {
2669534831adSStefano Zampini               ierr = VecSet(temp_vec,0.0);CHKERRQ(ierr);
2670534831adSStefano Zampini               ierr = VecSetValue(temp_vec,s+dual_dofs,1.0,INSERT_VALUES);CHKERRQ(ierr);
2671534831adSStefano Zampini               ierr = VecAssemblyBegin(temp_vec);CHKERRQ(ierr);
2672534831adSStefano Zampini               ierr = VecAssemblyEnd(temp_vec);CHKERRQ(ierr);
2673534831adSStefano Zampini               ierr = KSPSolve(temp_ksp,temp_vec,temp_vec);CHKERRQ(ierr);
2674534831adSStefano Zampini               ierr = VecGetArray(temp_vec,&array_vector);CHKERRQ(ierr);
2675534831adSStefano Zampini               j = temp_indices_to_constraint_B[temp_indices[start_constraint+s]+size_of_constraint-s-1];
2676534831adSStefano Zampini               /* last columns of change of basis matrix associated to new primal dofs */
2677534831adSStefano Zampini               ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,size_of_constraint,&temp_indices_to_constraint_B[temp_indices[start_constraint+s]],1,&j,array_vector,INSERT_VALUES);CHKERRQ(ierr);
2678534831adSStefano Zampini               ierr = VecRestoreArray(temp_vec,&array_vector);CHKERRQ(ierr);
2679534831adSStefano Zampini             }
2680534831adSStefano Zampini             ierr = MatDestroy(&temp_mat);CHKERRQ(ierr);
2681534831adSStefano Zampini             ierr = KSPDestroy(&temp_ksp);CHKERRQ(ierr);
2682534831adSStefano Zampini             ierr = VecDestroy(&temp_vec);CHKERRQ(ierr);
2683534831adSStefano Zampini           } else {
2684534831adSStefano Zampini             /* last columns of change of basis matrix associated to new primal dofs */
2685534831adSStefano Zampini             for (s=0;s<temp_constraints;s++) {
2686534831adSStefano Zampini               j = temp_indices_to_constraint_B[temp_indices[start_constraint+s]+size_of_constraint-s-1];
2687534831adSStefano Zampini               ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,size_of_constraint,&temp_indices_to_constraint_B[temp_indices[start_constraint+s]],1,&j,&temp_quadrature_constraint[temp_indices[start_constraint+s]],INSERT_VALUES);CHKERRQ(ierr);
2688534831adSStefano Zampini             }
2689534831adSStefano Zampini           }
2690534831adSStefano Zampini           /* prepare for the next cycle */
2691534831adSStefano Zampini           temp_constraints = 0;
269204eaf177SStefano Zampini           if (i != local_primal_size -1 ) {
2693534831adSStefano Zampini             temp_start_ptr = temp_indices_to_constraint_B[temp_indices[i+1]];
2694534831adSStefano Zampini           }
2695534831adSStefano Zampini         }
2696534831adSStefano Zampini       }
269704eaf177SStefano Zampini     }
2698534831adSStefano Zampini     /* assembling */
2699534831adSStefano Zampini     ierr = MatAssemblyBegin(pcbddc->ChangeOfBasisMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2700534831adSStefano Zampini     ierr = MatAssemblyEnd(pcbddc->ChangeOfBasisMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2701534831adSStefano Zampini     ierr = PetscFree(ipiv);CHKERRQ(ierr);
2702534831adSStefano Zampini     ierr = PetscFree(is_indices);CHKERRQ(ierr);
2703534831adSStefano Zampini   }
27043b03a366Sstefano_zampini   /* free workspace no longer needed */
27053b03a366Sstefano_zampini   ierr = PetscFree(rwork);CHKERRQ(ierr);
27063b03a366Sstefano_zampini   ierr = PetscFree(work);CHKERRQ(ierr);
27073b03a366Sstefano_zampini   ierr = PetscFree(temp_basis);CHKERRQ(ierr);
27083b03a366Sstefano_zampini   ierr = PetscFree(singular_vals);CHKERRQ(ierr);
27093b03a366Sstefano_zampini   ierr = PetscFree(correlation_mat);CHKERRQ(ierr);
27103b03a366Sstefano_zampini   ierr = PetscFree(temp_indices);CHKERRQ(ierr);
2711534831adSStefano Zampini   ierr = PetscFree(change_basis);CHKERRQ(ierr);
27123b03a366Sstefano_zampini   ierr = PetscFree(temp_indices_to_constraint);CHKERRQ(ierr);
2713534831adSStefano Zampini   ierr = PetscFree(temp_indices_to_constraint_B);CHKERRQ(ierr);
2714534831adSStefano Zampini   ierr = PetscFree(local_to_B);CHKERRQ(ierr);
27153b03a366Sstefano_zampini   ierr = PetscFree(temp_quadrature_constraint);CHKERRQ(ierr);
27163425bc38SStefano Zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
27173425bc38SStefano Zampini   ierr = PetscFree(iwork);CHKERRQ(ierr);
27183425bc38SStefano Zampini   ierr = PetscFree(ifail);CHKERRQ(ierr);
27193425bc38SStefano Zampini   ierr = PetscFree(singular_vectors);CHKERRQ(ierr);
27203425bc38SStefano Zampini #endif
2721da1bb401SStefano Zampini   for (k=0;k<nnsp_size;k++) {
2722da1bb401SStefano Zampini     ierr = VecDestroy(&localnearnullsp[k]);CHKERRQ(ierr);
2723da1bb401SStefano Zampini   }
27243b03a366Sstefano_zampini   ierr = PetscFree(localnearnullsp);CHKERRQ(ierr);
27253b03a366Sstefano_zampini   PetscFunctionReturn(0);
27263b03a366Sstefano_zampini }
27273b03a366Sstefano_zampini /* -------------------------------------------------------------------------- */
27280c7d97c5SJed Brown #undef __FUNCT__
27290c7d97c5SJed Brown #define __FUNCT__ "PCBDDCCoarseSetUp"
273053cdbc3dSStefano Zampini static PetscErrorCode PCBDDCCoarseSetUp(PC pc)
27310c7d97c5SJed Brown {
27320c7d97c5SJed Brown   PetscErrorCode  ierr;
27330c7d97c5SJed Brown 
27340c7d97c5SJed Brown   PC_IS*            pcis = (PC_IS*)(pc->data);
27350c7d97c5SJed Brown   PC_BDDC*          pcbddc = (PC_BDDC*)pc->data;
27360c7d97c5SJed Brown   Mat_IS            *matis = (Mat_IS*)pc->pmat->data;
2737534831adSStefano Zampini   Mat               change_mat_all;
27380c7d97c5SJed Brown   IS                is_R_local;
27390c7d97c5SJed Brown   IS                is_V_local;
27400c7d97c5SJed Brown   IS                is_C_local;
27410c7d97c5SJed Brown   IS                is_aux1;
27420c7d97c5SJed Brown   IS                is_aux2;
27430c7d97c5SJed Brown   const VecType     impVecType;
27440c7d97c5SJed Brown   const MatType     impMatType;
27450c7d97c5SJed Brown   PetscInt          n_R=0;
27460c7d97c5SJed Brown   PetscInt          n_D=0;
27470c7d97c5SJed Brown   PetscInt          n_B=0;
27480c7d97c5SJed Brown   PetscScalar       zero=0.0;
27490c7d97c5SJed Brown   PetscScalar       one=1.0;
27500c7d97c5SJed Brown   PetscScalar       m_one=-1.0;
27510c7d97c5SJed Brown   PetscScalar*      array;
27520c7d97c5SJed Brown   PetscScalar       *coarse_submat_vals;
27530c7d97c5SJed Brown   PetscInt          *idx_R_local;
27540c7d97c5SJed Brown   PetscInt          *idx_V_B;
27550c7d97c5SJed Brown   PetscScalar       *coarsefunctions_errors;
27560c7d97c5SJed Brown   PetscScalar       *constraints_errors;
27570c7d97c5SJed Brown   /* auxiliary indices */
2758534831adSStefano Zampini   PetscInt i,j,k;
2759e269702eSStefano Zampini   /* for verbose output of bddc */
2760e269702eSStefano Zampini   PetscViewer       viewer=pcbddc->dbg_viewer;
2761e269702eSStefano Zampini   PetscBool         dbg_flag=pcbddc->dbg_flag;
2762a0ba757dSStefano Zampini   /* for counting coarse dofs */
2763534831adSStefano Zampini   PetscInt          n_vertices,n_constraints;
27643b03a366Sstefano_zampini   PetscInt          size_of_constraint;
27653b03a366Sstefano_zampini   PetscInt          *row_cmat_indices;
27663b03a366Sstefano_zampini   PetscScalar       *row_cmat_values;
2767534831adSStefano Zampini   PetscInt          *vertices,*nnz,*is_indices,*temp_indices;
27680c7d97c5SJed Brown 
27690c7d97c5SJed Brown   PetscFunctionBegin;
27700c7d97c5SJed Brown   /* Set Non-overlapping dimensions */
27710c7d97c5SJed Brown   n_B = pcis->n_B; n_D = pcis->n - n_B;
2772534831adSStefano Zampini   /* Set types for local objects needed by BDDC preconditioner */
2773534831adSStefano Zampini   impMatType = MATSEQDENSE;
2774534831adSStefano Zampini   impVecType = VECSEQ;
2775da1bb401SStefano Zampini   /* get vertex indices from constraint matrix */
2776534831adSStefano Zampini   ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscInt),&vertices);CHKERRQ(ierr);
2777534831adSStefano Zampini   n_vertices=0;
2778da1bb401SStefano Zampini   for (i=0;i<pcbddc->local_primal_size;i++) {
2779da1bb401SStefano Zampini     ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
2780da1bb401SStefano Zampini     if (size_of_constraint == 1) {
2781534831adSStefano Zampini       vertices[n_vertices]=row_cmat_indices[0];
2782534831adSStefano Zampini       n_vertices++;
2783a0ba757dSStefano Zampini     }
2784da1bb401SStefano Zampini     ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
2785a0ba757dSStefano Zampini   }
2786534831adSStefano Zampini   /* Set number of constraints */
2787534831adSStefano Zampini   n_constraints = pcbddc->local_primal_size-n_vertices;
2788534831adSStefano Zampini 
2789534831adSStefano Zampini   /* vertices in boundary numbering */
2790534831adSStefano Zampini   if (n_vertices) {
2791534831adSStefano Zampini     ierr = VecSet(pcis->vec1_N,m_one);CHKERRQ(ierr);
2792534831adSStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2793534831adSStefano Zampini     for (i=0; i<n_vertices; i++) { array[ vertices[i] ] = i; }
2794534831adSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2795534831adSStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
2796534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
2797534831adSStefano Zampini     ierr = PetscMalloc(n_vertices*sizeof(PetscInt),&idx_V_B);CHKERRQ(ierr);
2798534831adSStefano Zampini     ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
2799534831adSStefano Zampini     for (i=0; i<n_vertices; i++) {
2800534831adSStefano Zampini       j=0;
2801534831adSStefano Zampini       while (array[j] != i ) {j++;}
2802534831adSStefano Zampini       idx_V_B[i]=j;
2803534831adSStefano Zampini     }
2804534831adSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
2805534831adSStefano Zampini   }
2806534831adSStefano Zampini 
2807534831adSStefano Zampini   /* transform local matrices if needed */
2808534831adSStefano Zampini   if (pcbddc->usechangeofbasis) {
2809534831adSStefano Zampini     ierr = PetscMalloc(pcis->n*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
2810534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2811534831adSStefano Zampini     for (i=0;i<n_D;i++) {
2812534831adSStefano Zampini       nnz[is_indices[i]]=1;
2813534831adSStefano Zampini     }
2814534831adSStefano Zampini     ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2815534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2816534831adSStefano Zampini     k=1;
2817534831adSStefano Zampini     for (i=0;i<n_B;i++) {
2818534831adSStefano Zampini       ierr = MatGetRow(pcbddc->ChangeOfBasisMatrix,i,&j,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr);
2819534831adSStefano Zampini       nnz[is_indices[i]]=j;
2820534831adSStefano Zampini       if ( k < j) {
2821534831adSStefano Zampini         k = j;
2822534831adSStefano Zampini       }
2823534831adSStefano Zampini       ierr = MatRestoreRow(pcbddc->ChangeOfBasisMatrix,i,&j,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr);
2824534831adSStefano Zampini     }
2825534831adSStefano Zampini     ierr = ISRestoreIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2826534831adSStefano Zampini     /* assemble change of basis matrix on the whole set of local dofs */
2827534831adSStefano Zampini     ierr = PetscMalloc(k*sizeof(PetscInt),&temp_indices);CHKERRQ(ierr);
2828534831adSStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&change_mat_all);CHKERRQ(ierr);
2829534831adSStefano Zampini     ierr = MatSetSizes(change_mat_all,pcis->n,pcis->n,pcis->n,pcis->n);CHKERRQ(ierr);
2830534831adSStefano Zampini     ierr = MatSetType(change_mat_all,MATSEQAIJ);CHKERRQ(ierr);
2831534831adSStefano Zampini     ierr = MatSeqAIJSetPreallocation(change_mat_all,0,nnz);CHKERRQ(ierr);
2832534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2833534831adSStefano Zampini     for (i=0;i<n_D;i++) {
2834534831adSStefano Zampini       ierr = MatSetValue(change_mat_all,is_indices[i],is_indices[i],1.0,INSERT_VALUES);CHKERRQ(ierr);
2835534831adSStefano Zampini     }
2836534831adSStefano Zampini     ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2837534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2838534831adSStefano Zampini     for (i=0;i<n_B;i++) {
2839534831adSStefano Zampini       ierr = MatGetRow(pcbddc->ChangeOfBasisMatrix,i,&j,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
2840534831adSStefano Zampini       for (k=0;k<j;k++) {
2841534831adSStefano Zampini         temp_indices[k]=is_indices[row_cmat_indices[k]];
2842534831adSStefano Zampini       }
2843534831adSStefano Zampini       ierr = MatSetValues(change_mat_all,1,&is_indices[i],j,temp_indices,row_cmat_values,INSERT_VALUES);CHKERRQ(ierr);
2844534831adSStefano Zampini       ierr = MatRestoreRow(pcbddc->ChangeOfBasisMatrix,i,&j,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
2845534831adSStefano Zampini     }
2846534831adSStefano Zampini     ierr = MatAssemblyBegin(change_mat_all,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2847534831adSStefano Zampini     ierr = MatAssemblyEnd(change_mat_all,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2848534831adSStefano Zampini     ierr = MatPtAP(matis->A,change_mat_all,MAT_INITIAL_MATRIX,1.0,&pcbddc->local_mat);CHKERRQ(ierr);
2849534831adSStefano Zampini     ierr = MatDestroy(&pcis->A_IB);CHKERRQ(ierr);
2850534831adSStefano Zampini     ierr = MatDestroy(&pcis->A_BI);CHKERRQ(ierr);
2851534831adSStefano Zampini     ierr = MatDestroy(&pcis->A_BB);CHKERRQ(ierr);
2852534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_I_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&pcis->A_IB);CHKERRQ(ierr);
2853534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_B_local,pcis->is_I_local,MAT_INITIAL_MATRIX,&pcis->A_BI);CHKERRQ(ierr);
2854534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_B_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&pcis->A_BB);CHKERRQ(ierr);
2855534831adSStefano Zampini     ierr = MatDestroy(&change_mat_all);CHKERRQ(ierr);
2856534831adSStefano Zampini     ierr = PetscFree(nnz);CHKERRQ(ierr);
2857534831adSStefano Zampini     ierr = PetscFree(temp_indices);CHKERRQ(ierr);
2858534831adSStefano Zampini   } else {
2859534831adSStefano Zampini     /* without change of basis, the local matrix is unchanged */
2860534831adSStefano Zampini     ierr = PetscObjectReference((PetscObject)matis->A);CHKERRQ(ierr);
2861534831adSStefano Zampini     pcbddc->local_mat = matis->A;
2862534831adSStefano Zampini   }
2863*0bdf917eSStefano Zampini   /* Change global null space passed in by the user if change of basis has been performed */
2864*0bdf917eSStefano Zampini   if (pcbddc->NullSpace && pcbddc->usechangeofbasis) {
2865*0bdf917eSStefano Zampini     ierr = PCBDDCAdaptNullSpace(pc);CHKERRQ(ierr);
2866*0bdf917eSStefano Zampini   }
2867a0ba757dSStefano Zampini 
28680c7d97c5SJed Brown   /* Dohrmann's notation: dofs split into R (Remaining: all dofs but the vertices) and V (Vertices) */
28690c7d97c5SJed Brown   ierr = VecSet(pcis->vec1_N,one);CHKERRQ(ierr);
28700c7d97c5SJed Brown   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
28713b03a366Sstefano_zampini   for (i=0;i<n_vertices;i++) { array[ vertices[i] ] = zero; }
28723b03a366Sstefano_zampini   ierr = PetscMalloc(( pcis->n - n_vertices )*sizeof(PetscInt),&idx_R_local);CHKERRQ(ierr);
28730c7d97c5SJed Brown   for (i=0, n_R=0; i<pcis->n; i++) { if (array[i] == one) { idx_R_local[n_R] = i; n_R++; } }
28740c7d97c5SJed Brown   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2875e269702eSStefano Zampini   if (dbg_flag) {
28760c7d97c5SJed Brown     ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
28770c7d97c5SJed Brown     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
28780c7d97c5SJed Brown     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d local dimensions\n",PetscGlobalRank);CHKERRQ(ierr);
28790c7d97c5SJed Brown     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local_size = %d, dirichlet_size = %d, boundary_size = %d\n",pcis->n,n_D,n_B);CHKERRQ(ierr);
28803b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"r_size = %d, v_size = %d, constraints = %d, local_primal_size = %d\n",n_R,n_vertices,n_constraints,pcbddc->local_primal_size);CHKERRQ(ierr);
2881534831adSStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"pcbddc->n_vertices = %d, pcbddc->n_constraints = %d\n",pcbddc->n_vertices,pcbddc->n_constraints);CHKERRQ(ierr);
28820c7d97c5SJed Brown     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
28830c7d97c5SJed Brown   }
2884534831adSStefano Zampini 
28850c7d97c5SJed Brown   /* Allocate needed vectors */
2886534831adSStefano Zampini   ierr = VecDuplicate(pcis->vec1_global,&pcbddc->original_rhs);CHKERRQ(ierr);
28873972b0daSStefano Zampini   ierr = VecDuplicate(pcis->vec1_global,&pcbddc->temp_solution);CHKERRQ(ierr);
28880c7d97c5SJed Brown   ierr = VecDuplicate(pcis->vec1_D,&pcbddc->vec4_D);CHKERRQ(ierr);
28890c7d97c5SJed Brown   ierr = VecCreate(PETSC_COMM_SELF,&pcbddc->vec1_R);CHKERRQ(ierr);
28900c7d97c5SJed Brown   ierr = VecSetSizes(pcbddc->vec1_R,n_R,n_R);CHKERRQ(ierr);
28910c7d97c5SJed Brown   ierr = VecSetType(pcbddc->vec1_R,impVecType);CHKERRQ(ierr);
2892d49ef151SStefano Zampini   ierr = VecDuplicate(pcbddc->vec1_R,&pcbddc->vec2_R);CHKERRQ(ierr);
28930c7d97c5SJed Brown   ierr = VecCreate(PETSC_COMM_SELF,&pcbddc->vec1_P);CHKERRQ(ierr);
28940c7d97c5SJed Brown   ierr = VecSetSizes(pcbddc->vec1_P,pcbddc->local_primal_size,pcbddc->local_primal_size);CHKERRQ(ierr);
28950c7d97c5SJed Brown   ierr = VecSetType(pcbddc->vec1_P,impVecType);CHKERRQ(ierr);
28960c7d97c5SJed Brown 
28970c7d97c5SJed Brown   /* Creating some index sets needed  */
28980c7d97c5SJed Brown   /* For submatrices */
2899da1bb401SStefano Zampini   ierr = ISCreateGeneral(PETSC_COMM_SELF,n_R,idx_R_local,PETSC_OWN_POINTER,&is_R_local);CHKERRQ(ierr);
29003b03a366Sstefano_zampini   if (n_vertices)    {
2901da1bb401SStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,n_vertices,vertices,PETSC_OWN_POINTER,&is_V_local);CHKERRQ(ierr);
29023b03a366Sstefano_zampini   }
2903da1bb401SStefano Zampini   if (n_constraints) {
2904da1bb401SStefano Zampini     ierr = ISCreateStride(PETSC_COMM_SELF,n_constraints,n_vertices,1,&is_C_local);CHKERRQ(ierr);
2905da1bb401SStefano Zampini   }
2906da1bb401SStefano Zampini 
29070c7d97c5SJed Brown   /* For VecScatters pcbddc->R_to_B and (optionally) pcbddc->R_to_D */
29080c7d97c5SJed Brown   {
29090c7d97c5SJed Brown     PetscInt   *aux_array1;
29100c7d97c5SJed Brown     PetscInt   *aux_array2;
29110c7d97c5SJed Brown 
29123b03a366Sstefano_zampini     ierr = PetscMalloc( (pcis->n_B-n_vertices)*sizeof(PetscInt),&aux_array1);CHKERRQ(ierr);
29133b03a366Sstefano_zampini     ierr = PetscMalloc( (pcis->n_B-n_vertices)*sizeof(PetscInt),&aux_array2);CHKERRQ(ierr);
29140c7d97c5SJed Brown 
2915d49ef151SStefano Zampini     ierr = VecSet(pcis->vec1_global,zero);CHKERRQ(ierr);
29160c7d97c5SJed Brown     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
29170c7d97c5SJed Brown     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
29180c7d97c5SJed Brown     ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
29190c7d97c5SJed Brown     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
29200c7d97c5SJed Brown     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
29210c7d97c5SJed Brown     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
29220c7d97c5SJed Brown     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2923da1bb401SStefano Zampini     for (i=0, j=0; i<n_R; i++) { if ( array[idx_R_local[i]] > one ) { aux_array1[j] = i; j++; } }
29240c7d97c5SJed Brown     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2925da1bb401SStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_COPY_VALUES,&is_aux1);CHKERRQ(ierr);
29260c7d97c5SJed Brown     ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
2927da1bb401SStefano Zampini     for (i=0, j=0; i<n_B; i++) { if ( array[i] > one ) { aux_array2[j] = i; j++; } }
29283828260eSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
2929da1bb401SStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array2,PETSC_COPY_VALUES,&is_aux2);CHKERRQ(ierr);
29300c7d97c5SJed Brown     ierr = VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_B,is_aux2,&pcbddc->R_to_B);CHKERRQ(ierr);
29310c7d97c5SJed Brown     ierr = PetscFree(aux_array1);CHKERRQ(ierr);
29320c7d97c5SJed Brown     ierr = PetscFree(aux_array2);CHKERRQ(ierr);
29330c7d97c5SJed Brown     ierr = ISDestroy(&is_aux1);CHKERRQ(ierr);
29340c7d97c5SJed Brown     ierr = ISDestroy(&is_aux2);CHKERRQ(ierr);
29350c7d97c5SJed Brown 
2936e269702eSStefano Zampini     if (pcbddc->prec_type || dbg_flag ) {
29370c7d97c5SJed Brown       ierr = PetscMalloc(n_D*sizeof(PetscInt),&aux_array1);CHKERRQ(ierr);
29380c7d97c5SJed Brown       ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2939da1bb401SStefano Zampini       for (i=0, j=0; i<n_R; i++) { if (array[idx_R_local[i]] == one) { aux_array1[j] = i; j++; } }
29400c7d97c5SJed Brown       ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2941da1bb401SStefano Zampini       ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_COPY_VALUES,&is_aux1);CHKERRQ(ierr);
29420c7d97c5SJed Brown       ierr = VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_D,(IS)0,&pcbddc->R_to_D);CHKERRQ(ierr);
29430c7d97c5SJed Brown       ierr = PetscFree(aux_array1);CHKERRQ(ierr);
29440c7d97c5SJed Brown       ierr = ISDestroy(&is_aux1);CHKERRQ(ierr);
29450c7d97c5SJed Brown     }
29460c7d97c5SJed Brown   }
29470c7d97c5SJed Brown 
29480c7d97c5SJed Brown   /* Creating PC contexts for local Dirichlet and Neumann problems */
29490c7d97c5SJed Brown   {
29500c7d97c5SJed Brown     Mat  A_RR;
295153cdbc3dSStefano Zampini     PC   pc_temp;
29520c7d97c5SJed Brown     /* Matrix for Dirichlet problem is A_II -> we already have it from pcis.c code */
295353cdbc3dSStefano Zampini     ierr = KSPCreate(PETSC_COMM_SELF,&pcbddc->ksp_D);CHKERRQ(ierr);
295453cdbc3dSStefano Zampini     ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->ksp_D,(PetscObject)pc,1);CHKERRQ(ierr);
295553cdbc3dSStefano Zampini     ierr = KSPSetOperators(pcbddc->ksp_D,pcis->A_II,pcis->A_II,SAME_PRECONDITIONER);CHKERRQ(ierr);
295653cdbc3dSStefano Zampini     ierr = KSPSetType(pcbddc->ksp_D,KSPPREONLY);CHKERRQ(ierr);
2957da1bb401SStefano Zampini     ierr = KSPSetOptionsPrefix(pcbddc->ksp_D,"dirichlet_");CHKERRQ(ierr);
29580c7d97c5SJed Brown     /* default */
295953cdbc3dSStefano Zampini     ierr = KSPGetPC(pcbddc->ksp_D,&pc_temp);CHKERRQ(ierr);
296053cdbc3dSStefano Zampini     ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr);
29610c7d97c5SJed Brown     /* Allow user's customization */
296253cdbc3dSStefano Zampini     ierr = KSPSetFromOptions(pcbddc->ksp_D);CHKERRQ(ierr);
296353cdbc3dSStefano Zampini     /* Set Up KSP for Dirichlet problem of BDDC */
296453cdbc3dSStefano Zampini     ierr = KSPSetUp(pcbddc->ksp_D);CHKERRQ(ierr);
29653972b0daSStefano Zampini     /* set ksp_D into pcis data */
29663972b0daSStefano Zampini     ierr = KSPDestroy(&pcis->ksp_D);CHKERRQ(ierr);
29673972b0daSStefano Zampini     ierr = PetscObjectReference((PetscObject)pcbddc->ksp_D);CHKERRQ(ierr);
29683972b0daSStefano Zampini     pcis->ksp_D = pcbddc->ksp_D;
29690c7d97c5SJed Brown     /* Matrix for Neumann problem is A_RR -> we need to create it */
2970534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,is_R_local,is_R_local,MAT_INITIAL_MATRIX,&A_RR);CHKERRQ(ierr);
297153cdbc3dSStefano Zampini     ierr = KSPCreate(PETSC_COMM_SELF,&pcbddc->ksp_R);CHKERRQ(ierr);
297253cdbc3dSStefano Zampini     ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->ksp_R,(PetscObject)pc,1);CHKERRQ(ierr);
297353cdbc3dSStefano Zampini     ierr = KSPSetOperators(pcbddc->ksp_R,A_RR,A_RR,SAME_PRECONDITIONER);CHKERRQ(ierr);
297453cdbc3dSStefano Zampini     ierr = KSPSetType(pcbddc->ksp_R,KSPPREONLY);CHKERRQ(ierr);
2975da1bb401SStefano Zampini     ierr = KSPSetOptionsPrefix(pcbddc->ksp_R,"neumann_");CHKERRQ(ierr);
29760c7d97c5SJed Brown     /* default */
297753cdbc3dSStefano Zampini     ierr = KSPGetPC(pcbddc->ksp_R,&pc_temp);CHKERRQ(ierr);
297853cdbc3dSStefano Zampini     ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr);
29790c7d97c5SJed Brown     /* Allow user's customization */
298053cdbc3dSStefano Zampini     ierr = KSPSetFromOptions(pcbddc->ksp_R);CHKERRQ(ierr);
298153cdbc3dSStefano Zampini     /* Set Up KSP for Neumann problem of BDDC */
298253cdbc3dSStefano Zampini     ierr = KSPSetUp(pcbddc->ksp_R);CHKERRQ(ierr);
2983a0ba757dSStefano Zampini     /* check Dirichlet and Neumann solvers */
2984b76ba322SStefano Zampini     {
29850c7d97c5SJed Brown       Vec         temp_vec;
2986b76ba322SStefano Zampini       PetscReal   value;
2987b76ba322SStefano Zampini       PetscMPIInt use_exact,use_exact_reduced;
29880c7d97c5SJed Brown 
2989a0ba757dSStefano Zampini       ierr = VecDuplicate(pcis->vec1_D,&temp_vec);CHKERRQ(ierr);
2990a0ba757dSStefano Zampini       ierr = VecSetRandom(pcis->vec1_D,PETSC_NULL);CHKERRQ(ierr);
2991a0ba757dSStefano Zampini       ierr = MatMult(pcis->A_II,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
2992a0ba757dSStefano Zampini       ierr = KSPSolve(pcbddc->ksp_D,pcis->vec2_D,temp_vec);CHKERRQ(ierr);
2993a0ba757dSStefano Zampini       ierr = VecAXPY(temp_vec,m_one,pcis->vec1_D);CHKERRQ(ierr);
2994a0ba757dSStefano Zampini       ierr = VecNorm(temp_vec,NORM_INFINITY,&value);CHKERRQ(ierr);
2995b76ba322SStefano Zampini       use_exact = 1;
2996b76ba322SStefano Zampini       if (PetscAbsReal(value) > 1.e-4) {
2997b76ba322SStefano Zampini         use_exact = 0;
2998b76ba322SStefano Zampini       }
2999b76ba322SStefano Zampini       ierr = MPI_Allreduce(&use_exact,&use_exact_reduced,1,MPIU_INT,MPI_LAND,((PetscObject)pc)->comm);CHKERRQ(ierr);
3000b76ba322SStefano Zampini       pcbddc->use_exact_dirichlet = (PetscBool) use_exact_reduced;
3001a0ba757dSStefano Zampini       ierr = VecDestroy(&temp_vec);CHKERRQ(ierr);
3002b76ba322SStefano Zampini       if (dbg_flag) {
3003a0ba757dSStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
3004a0ba757dSStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
3005a0ba757dSStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"Checking solution of Dirichlet and Neumann problems\n");CHKERRQ(ierr);
3006a0ba757dSStefano Zampini         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d infinity error for Dirichlet solve = % 1.14e \n",PetscGlobalRank,value);CHKERRQ(ierr);
3007d49ef151SStefano Zampini         ierr = VecDuplicate(pcbddc->vec1_R,&temp_vec);CHKERRQ(ierr);
3008d49ef151SStefano Zampini         ierr = VecSetRandom(pcbddc->vec1_R,PETSC_NULL);CHKERRQ(ierr);
3009d49ef151SStefano Zampini         ierr = MatMult(A_RR,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
3010d49ef151SStefano Zampini         ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec2_R,temp_vec);CHKERRQ(ierr);
3011d49ef151SStefano Zampini         ierr = VecAXPY(temp_vec,m_one,pcbddc->vec1_R);CHKERRQ(ierr);
3012d49ef151SStefano Zampini         ierr = VecNorm(temp_vec,NORM_INFINITY,&value);CHKERRQ(ierr);
3013e269702eSStefano Zampini         ierr = VecDestroy(&temp_vec);CHKERRQ(ierr);
30140c7d97c5SJed Brown         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d infinity error for  Neumann  solve = % 1.14e \n",PetscGlobalRank,value);CHKERRQ(ierr);
3015d49ef151SStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
30160c7d97c5SJed Brown       }
3017b76ba322SStefano Zampini     }
30180c7d97c5SJed Brown     /* free Neumann problem's matrix */
30190c7d97c5SJed Brown     ierr = MatDestroy(&A_RR);CHKERRQ(ierr);
30200c7d97c5SJed Brown   }
30210c7d97c5SJed Brown 
30220c7d97c5SJed Brown   /* Assemble all remaining stuff needed to apply BDDC  */
30230c7d97c5SJed Brown   {
30240c7d97c5SJed Brown     Mat          A_RV,A_VR,A_VV;
3025*0bdf917eSStefano Zampini     Mat          M1;
30260c7d97c5SJed Brown     Mat          C_CR;
30273b03a366Sstefano_zampini     Mat          AUXMAT;
30280c7d97c5SJed Brown     Vec          vec1_C;
30290c7d97c5SJed Brown     Vec          vec2_C;
30300c7d97c5SJed Brown     Vec          vec1_V;
30310c7d97c5SJed Brown     Vec          vec2_V;
30320c7d97c5SJed Brown     PetscInt     *nnz;
30330c7d97c5SJed Brown     PetscInt     *auxindices;
303453cdbc3dSStefano Zampini     PetscInt     index;
30350c7d97c5SJed Brown     PetscScalar* array2;
30360c7d97c5SJed Brown     MatFactorInfo matinfo;
30370c7d97c5SJed Brown 
30380c7d97c5SJed Brown     /* Allocating some extra storage just to be safe */
30390c7d97c5SJed Brown     ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
30400c7d97c5SJed Brown     ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&auxindices);CHKERRQ(ierr);
30410c7d97c5SJed Brown     for (i=0;i<pcis->n;i++) {auxindices[i]=i;}
30420c7d97c5SJed Brown 
30430c7d97c5SJed Brown     /* some work vectors on vertices and/or constraints */
30443b03a366Sstefano_zampini     if (n_vertices) {
30450c7d97c5SJed Brown       ierr = VecCreate(PETSC_COMM_SELF,&vec1_V);CHKERRQ(ierr);
30463b03a366Sstefano_zampini       ierr = VecSetSizes(vec1_V,n_vertices,n_vertices);CHKERRQ(ierr);
30470c7d97c5SJed Brown       ierr = VecSetType(vec1_V,impVecType);CHKERRQ(ierr);
30480c7d97c5SJed Brown       ierr = VecDuplicate(vec1_V,&vec2_V);CHKERRQ(ierr);
30490c7d97c5SJed Brown     }
3050534831adSStefano Zampini     if (n_constraints) {
30510c7d97c5SJed Brown       ierr = VecCreate(PETSC_COMM_SELF,&vec1_C);CHKERRQ(ierr);
3052534831adSStefano Zampini       ierr = VecSetSizes(vec1_C,n_constraints,n_constraints);CHKERRQ(ierr);
30530c7d97c5SJed Brown       ierr = VecSetType(vec1_C,impVecType);CHKERRQ(ierr);
30540c7d97c5SJed Brown       ierr = VecDuplicate(vec1_C,&vec2_C);CHKERRQ(ierr);
30550c7d97c5SJed Brown       ierr = VecDuplicate(vec1_C,&pcbddc->vec1_C);CHKERRQ(ierr);
30560c7d97c5SJed Brown     }
30570c7d97c5SJed Brown     /* Precompute data needed for preprocessing and application of BDDC */
30583b03a366Sstefano_zampini     if (n_constraints) {
30590c7d97c5SJed Brown       ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->local_auxmat2);CHKERRQ(ierr);
30603b03a366Sstefano_zampini       ierr = MatSetSizes(pcbddc->local_auxmat2,n_R,n_constraints,n_R,n_constraints);CHKERRQ(ierr);
30610c7d97c5SJed Brown       ierr = MatSetType(pcbddc->local_auxmat2,impMatType);CHKERRQ(ierr);
30623b03a366Sstefano_zampini       ierr = MatSeqDenseSetPreallocation(pcbddc->local_auxmat2,PETSC_NULL);CHKERRQ(ierr);
30630c7d97c5SJed Brown 
306457a90decSStefano Zampini       /* Create Constraint matrix on R nodes: C_{CR}  */
306557a90decSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->ConstraintMatrix,is_C_local,is_R_local,MAT_INITIAL_MATRIX,&C_CR);CHKERRQ(ierr);
306657a90decSStefano Zampini       ierr = ISDestroy(&is_C_local);CHKERRQ(ierr);
306757a90decSStefano Zampini 
30680c7d97c5SJed Brown       /* Assemble local_auxmat2 = - A_{RR}^{-1} C^T_{CR} needed by BDDC application */
30693b03a366Sstefano_zampini       for (i=0;i<n_constraints;i++) {
30703b03a366Sstefano_zampini         ierr = VecSet(pcbddc->vec1_R,zero);CHKERRQ(ierr);
30713b03a366Sstefano_zampini         /* Get row of constraint matrix in R numbering */
307257a90decSStefano Zampini         ierr = VecGetArray(pcbddc->vec1_R,&array);CHKERRQ(ierr);
307357a90decSStefano Zampini         ierr = MatGetRow(C_CR,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
30743b03a366Sstefano_zampini         for (j=0;j<size_of_constraint;j++) { array[ row_cmat_indices[j] ] = - row_cmat_values[j]; }
307557a90decSStefano Zampini         ierr = MatRestoreRow(C_CR,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
307657a90decSStefano Zampini         ierr = VecRestoreArray(pcbddc->vec1_R,&array);CHKERRQ(ierr);
30773b03a366Sstefano_zampini         /* Solve for row of constraint matrix in R numbering */
307853cdbc3dSStefano Zampini         ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
30793b03a366Sstefano_zampini         /* Set values */
30800c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec2_R,&array);CHKERRQ(ierr);
30813b03a366Sstefano_zampini         ierr = MatSetValues(pcbddc->local_auxmat2,n_R,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
30820c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec2_R,&array);CHKERRQ(ierr);
30830c7d97c5SJed Brown       }
30840c7d97c5SJed Brown       ierr = MatAssemblyBegin(pcbddc->local_auxmat2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
30850c7d97c5SJed Brown       ierr = MatAssemblyEnd(pcbddc->local_auxmat2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
30860c7d97c5SJed Brown 
30870c7d97c5SJed Brown       /* Assemble AUXMAT = ( LUFactor )( -C_{CR} A_{RR}^{-1} C^T_{CR} )^{-1} */
30880c7d97c5SJed Brown       ierr = MatMatMult(C_CR,pcbddc->local_auxmat2,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&AUXMAT);CHKERRQ(ierr);
3089d49ef151SStefano Zampini       ierr = MatFactorInfoInitialize(&matinfo);CHKERRQ(ierr);
30903b03a366Sstefano_zampini       ierr = ISCreateStride(PETSC_COMM_SELF,n_constraints,0,1,&is_aux1);CHKERRQ(ierr);
30910c7d97c5SJed Brown       ierr = MatLUFactor(AUXMAT,is_aux1,is_aux1,&matinfo);CHKERRQ(ierr);
30920c7d97c5SJed Brown       ierr = ISDestroy(&is_aux1);CHKERRQ(ierr);
30930c7d97c5SJed Brown 
30943b03a366Sstefano_zampini       /* Assemble explicitly M1 = ( C_{CR} A_{RR}^{-1} C^T_{CR} )^{-1} needed in preproc  */
3095d49ef151SStefano Zampini       ierr = MatCreate(PETSC_COMM_SELF,&M1);CHKERRQ(ierr);
30963b03a366Sstefano_zampini       ierr = MatSetSizes(M1,n_constraints,n_constraints,n_constraints,n_constraints);CHKERRQ(ierr);
30970c7d97c5SJed Brown       ierr = MatSetType(M1,impMatType);CHKERRQ(ierr);
30983b03a366Sstefano_zampini       ierr = MatSeqDenseSetPreallocation(M1,PETSC_NULL);CHKERRQ(ierr);
30993b03a366Sstefano_zampini       for (i=0;i<n_constraints;i++) {
31000c7d97c5SJed Brown         ierr = VecSet(vec1_C,zero);CHKERRQ(ierr);
31010c7d97c5SJed Brown         ierr = VecSetValue(vec1_C,i,one,INSERT_VALUES);CHKERRQ(ierr);
31020c7d97c5SJed Brown         ierr = VecAssemblyBegin(vec1_C);CHKERRQ(ierr);
31030c7d97c5SJed Brown         ierr = VecAssemblyEnd(vec1_C);CHKERRQ(ierr);
31040c7d97c5SJed Brown         ierr = MatSolve(AUXMAT,vec1_C,vec2_C);CHKERRQ(ierr);
31050c7d97c5SJed Brown         ierr = VecScale(vec2_C,m_one);CHKERRQ(ierr);
31060c7d97c5SJed Brown         ierr = VecGetArray(vec2_C,&array);CHKERRQ(ierr);
31073b03a366Sstefano_zampini         ierr = MatSetValues(M1,n_constraints,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
31080c7d97c5SJed Brown         ierr = VecRestoreArray(vec2_C,&array);CHKERRQ(ierr);
31090c7d97c5SJed Brown       }
31100c7d97c5SJed Brown       ierr = MatAssemblyBegin(M1,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
31110c7d97c5SJed Brown       ierr = MatAssemblyEnd(M1,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
31120c7d97c5SJed Brown       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
31130c7d97c5SJed Brown       /* Assemble local_auxmat1 = M1*C_{CR} needed by BDDC application in KSP and in preproc */
31140c7d97c5SJed Brown       ierr = MatMatMult(M1,C_CR,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&pcbddc->local_auxmat1);CHKERRQ(ierr);
31150c7d97c5SJed Brown 
31160c7d97c5SJed Brown     }
31170c7d97c5SJed Brown 
31180c7d97c5SJed Brown     /* Get submatrices from subdomain matrix */
31193b03a366Sstefano_zampini     if (n_vertices){
3120534831adSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->local_mat,is_R_local,is_V_local,MAT_INITIAL_MATRIX,&A_RV);CHKERRQ(ierr);
3121534831adSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->local_mat,is_V_local,is_R_local,MAT_INITIAL_MATRIX,&A_VR);CHKERRQ(ierr);
3122534831adSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->local_mat,is_V_local,is_V_local,MAT_INITIAL_MATRIX,&A_VV);CHKERRQ(ierr);
31230c7d97c5SJed Brown     }
31240c7d97c5SJed Brown 
31250c7d97c5SJed Brown     /* Matrix of coarse basis functions (local) */
3126d49ef151SStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->coarse_phi_B);CHKERRQ(ierr);
31270c7d97c5SJed Brown     ierr = MatSetSizes(pcbddc->coarse_phi_B,n_B,pcbddc->local_primal_size,n_B,pcbddc->local_primal_size);CHKERRQ(ierr);
31280c7d97c5SJed Brown     ierr = MatSetType(pcbddc->coarse_phi_B,impMatType);CHKERRQ(ierr);
31293b03a366Sstefano_zampini     ierr = MatSeqDenseSetPreallocation(pcbddc->coarse_phi_B,PETSC_NULL);CHKERRQ(ierr);
3130e269702eSStefano Zampini     if (pcbddc->prec_type || dbg_flag ) {
3131d49ef151SStefano Zampini       ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->coarse_phi_D);CHKERRQ(ierr);
31320c7d97c5SJed Brown       ierr = MatSetSizes(pcbddc->coarse_phi_D,n_D,pcbddc->local_primal_size,n_D,pcbddc->local_primal_size);CHKERRQ(ierr);
31330c7d97c5SJed Brown       ierr = MatSetType(pcbddc->coarse_phi_D,impMatType);CHKERRQ(ierr);
31343b03a366Sstefano_zampini       ierr = MatSeqDenseSetPreallocation(pcbddc->coarse_phi_D,PETSC_NULL);CHKERRQ(ierr);
31350c7d97c5SJed Brown     }
31360c7d97c5SJed Brown 
3137e269702eSStefano Zampini     if (dbg_flag) {
31380c7d97c5SJed Brown       ierr = PetscMalloc( pcbddc->local_primal_size*sizeof(PetscScalar),&coarsefunctions_errors);CHKERRQ(ierr);
31390c7d97c5SJed Brown       ierr = PetscMalloc( pcbddc->local_primal_size*sizeof(PetscScalar),&constraints_errors);CHKERRQ(ierr);
31400c7d97c5SJed Brown     }
31413b03a366Sstefano_zampini     /* Subdomain contribution (Non-overlapping) to coarse matrix  */
31420c7d97c5SJed Brown     ierr = PetscMalloc ((pcbddc->local_primal_size)*(pcbddc->local_primal_size)*sizeof(PetscScalar),&coarse_submat_vals);CHKERRQ(ierr);
31430c7d97c5SJed Brown 
31440c7d97c5SJed Brown     /* We are now ready to evaluate coarse basis functions and subdomain contribution to coarse problem */
31453b03a366Sstefano_zampini     for (i=0;i<n_vertices;i++){
31460c7d97c5SJed Brown       ierr = VecSet(vec1_V,zero);CHKERRQ(ierr);
31470c7d97c5SJed Brown       ierr = VecSetValue(vec1_V,i,one,INSERT_VALUES);CHKERRQ(ierr);
31480c7d97c5SJed Brown       ierr = VecAssemblyBegin(vec1_V);CHKERRQ(ierr);
31490c7d97c5SJed Brown       ierr = VecAssemblyEnd(vec1_V);CHKERRQ(ierr);
31500c7d97c5SJed Brown       /* solution of saddle point problem */
3151*0bdf917eSStefano Zampini       ierr = MatMult(A_RV,vec1_V,pcbddc->vec1_R);CHKERRQ(ierr);
3152*0bdf917eSStefano Zampini       ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec1_R);CHKERRQ(ierr);
31530c7d97c5SJed Brown       ierr = VecScale(pcbddc->vec1_R,m_one);CHKERRQ(ierr);
31543b03a366Sstefano_zampini       if (n_constraints) {
31550c7d97c5SJed Brown         ierr = MatMult(pcbddc->local_auxmat1,pcbddc->vec1_R,vec1_C);CHKERRQ(ierr);
31560c7d97c5SJed Brown         ierr = MatMultAdd(pcbddc->local_auxmat2,vec1_C,pcbddc->vec1_R,pcbddc->vec1_R);CHKERRQ(ierr);
31570c7d97c5SJed Brown         ierr = VecScale(vec1_C,m_one);CHKERRQ(ierr);
31580c7d97c5SJed Brown       }
31590c7d97c5SJed Brown       ierr = MatMult(A_VR,pcbddc->vec1_R,vec2_V);CHKERRQ(ierr);
31600c7d97c5SJed Brown       ierr = MatMultAdd(A_VV,vec1_V,vec2_V,vec2_V);CHKERRQ(ierr);
31610c7d97c5SJed Brown 
31620c7d97c5SJed Brown       /* Set values in coarse basis function and subdomain part of coarse_mat */
31630c7d97c5SJed Brown       /* coarse basis functions */
31640c7d97c5SJed Brown       ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr);
31650c7d97c5SJed Brown       ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
31660c7d97c5SJed Brown       ierr = VecScatterEnd  (pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
31670c7d97c5SJed Brown       ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
31683b03a366Sstefano_zampini       ierr = MatSetValues(pcbddc->coarse_phi_B,n_B,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
31690c7d97c5SJed Brown       ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
31700c7d97c5SJed Brown       ierr = MatSetValue(pcbddc->coarse_phi_B,idx_V_B[i],i,one,INSERT_VALUES);CHKERRQ(ierr);
3171e269702eSStefano Zampini       if ( pcbddc->prec_type || dbg_flag  ) {
31720c7d97c5SJed Brown         ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
31730c7d97c5SJed Brown         ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
31740c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_D,&array);CHKERRQ(ierr);
31753b03a366Sstefano_zampini         ierr = MatSetValues(pcbddc->coarse_phi_D,n_D,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
31760c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_D,&array);CHKERRQ(ierr);
31770c7d97c5SJed Brown       }
31780c7d97c5SJed Brown       /* subdomain contribution to coarse matrix */
31790c7d97c5SJed Brown       ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
3180da1bb401SStefano Zampini       for (j=0;j<n_vertices;j++) { coarse_submat_vals[i*pcbddc->local_primal_size+j] = array[j]; } /* WARNING -> column major ordering */
31810c7d97c5SJed Brown       ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
31823b03a366Sstefano_zampini       if (n_constraints) {
31830c7d97c5SJed Brown         ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
3184da1bb401SStefano Zampini         for (j=0;j<n_constraints;j++) { coarse_submat_vals[i*pcbddc->local_primal_size+j+n_vertices] = array[j]; } /* WARNING -> column major ordering */
31850c7d97c5SJed Brown         ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
31860c7d97c5SJed Brown       }
31870c7d97c5SJed Brown 
3188e269702eSStefano Zampini       if ( dbg_flag ) {
31890c7d97c5SJed Brown         /* assemble subdomain vector on nodes */
3190d49ef151SStefano Zampini         ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr);
31910c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
31920c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
31930c7d97c5SJed Brown         for (j=0;j<n_R;j++) { array[idx_R_local[j]] = array2[j]; }
31943b03a366Sstefano_zampini         array[ vertices[i] ] = one;
31950c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
31960c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
31970c7d97c5SJed Brown         /* assemble subdomain vector of lagrange multipliers (i.e. primal nodes) */
3198d49ef151SStefano Zampini         ierr = VecSet(pcbddc->vec1_P,zero);CHKERRQ(ierr);
31990c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
32000c7d97c5SJed Brown         ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
32013b03a366Sstefano_zampini         for (j=0;j<n_vertices;j++) { array2[j]=array[j]; }
32020c7d97c5SJed Brown         ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
32033b03a366Sstefano_zampini         if (n_constraints) {
32040c7d97c5SJed Brown           ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
32053b03a366Sstefano_zampini           for (j=0;j<n_constraints;j++) { array2[j+n_vertices]=array[j]; }
32060c7d97c5SJed Brown           ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
32070c7d97c5SJed Brown         }
32080c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
32090c7d97c5SJed Brown         ierr = VecScale(pcbddc->vec1_P,m_one);CHKERRQ(ierr);
32100c7d97c5SJed Brown         /* check saddle point solution */
3211534831adSStefano Zampini         ierr = MatMult(pcbddc->local_mat,pcis->vec1_N,pcis->vec2_N);CHKERRQ(ierr);
32123b03a366Sstefano_zampini         ierr = MatMultTransposeAdd(pcbddc->ConstraintMatrix,pcbddc->vec1_P,pcis->vec2_N,pcis->vec2_N);CHKERRQ(ierr);
32133b03a366Sstefano_zampini         ierr = VecNorm(pcis->vec2_N,NORM_INFINITY,&coarsefunctions_errors[i]);CHKERRQ(ierr);
32143b03a366Sstefano_zampini         ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr);
32150c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
32163b03a366Sstefano_zampini         array[i]=array[i]+m_one;  /* shift by the identity matrix */
32170c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
32183b03a366Sstefano_zampini         ierr = VecNorm(pcbddc->vec1_P,NORM_INFINITY,&constraints_errors[i]);CHKERRQ(ierr);
32190c7d97c5SJed Brown       }
32200c7d97c5SJed Brown     }
32210c7d97c5SJed Brown 
32223b03a366Sstefano_zampini     for (i=0;i<n_constraints;i++){
3223d49ef151SStefano Zampini       ierr = VecSet(vec2_C,zero);CHKERRQ(ierr);
32240c7d97c5SJed Brown       ierr = VecSetValue(vec2_C,i,m_one,INSERT_VALUES);CHKERRQ(ierr);
32250c7d97c5SJed Brown       ierr = VecAssemblyBegin(vec2_C);CHKERRQ(ierr);
32260c7d97c5SJed Brown       ierr = VecAssemblyEnd(vec2_C);CHKERRQ(ierr);
32270c7d97c5SJed Brown       /* solution of saddle point problem */
32280c7d97c5SJed Brown       ierr = MatMult(M1,vec2_C,vec1_C);CHKERRQ(ierr);
32290c7d97c5SJed Brown       ierr = MatMult(pcbddc->local_auxmat2,vec1_C,pcbddc->vec1_R);CHKERRQ(ierr);
32300c7d97c5SJed Brown       ierr = VecScale(vec1_C,m_one);CHKERRQ(ierr);
32313b03a366Sstefano_zampini       if (n_vertices) { ierr = MatMult(A_VR,pcbddc->vec1_R,vec2_V);CHKERRQ(ierr); }
32320c7d97c5SJed Brown       /* Set values in coarse basis function and subdomain part of coarse_mat */
32330c7d97c5SJed Brown       /* coarse basis functions */
32343b03a366Sstefano_zampini       index=i+n_vertices;
32350c7d97c5SJed Brown       ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr);
32360c7d97c5SJed Brown       ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
32370c7d97c5SJed Brown       ierr = VecScatterEnd  (pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
32380c7d97c5SJed Brown       ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
323953cdbc3dSStefano Zampini       ierr = MatSetValues(pcbddc->coarse_phi_B,n_B,auxindices,1,&index,array,INSERT_VALUES);CHKERRQ(ierr);
32400c7d97c5SJed Brown       ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
3241e269702eSStefano Zampini       if ( pcbddc->prec_type || dbg_flag ) {
32420c7d97c5SJed Brown         ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
32430c7d97c5SJed Brown         ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
32440c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_D,&array);CHKERRQ(ierr);
324553cdbc3dSStefano Zampini         ierr = MatSetValues(pcbddc->coarse_phi_D,n_D,auxindices,1,&index,array,INSERT_VALUES);CHKERRQ(ierr);
32460c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_D,&array);CHKERRQ(ierr);
32470c7d97c5SJed Brown       }
32480c7d97c5SJed Brown       /* subdomain contribution to coarse matrix */
32493b03a366Sstefano_zampini       if (n_vertices) {
32500c7d97c5SJed Brown         ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
3251da1bb401SStefano Zampini         for (j=0;j<n_vertices;j++) {coarse_submat_vals[index*pcbddc->local_primal_size+j]=array[j];} /* WARNING -> column major ordering */
32520c7d97c5SJed Brown         ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
32530c7d97c5SJed Brown       }
32540c7d97c5SJed Brown       ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
3255da1bb401SStefano Zampini       for (j=0;j<n_constraints;j++) {coarse_submat_vals[index*pcbddc->local_primal_size+j+n_vertices]=array[j];} /* WARNING -> column major ordering */
32560c7d97c5SJed Brown       ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
32570c7d97c5SJed Brown 
3258e269702eSStefano Zampini       if ( dbg_flag ) {
32590c7d97c5SJed Brown         /* assemble subdomain vector on nodes */
326053cdbc3dSStefano Zampini         ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr);
32610c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
32620c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
32630c7d97c5SJed Brown         for (j=0;j<n_R;j++){ array[ idx_R_local[j] ] = array2[j]; }
32640c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
32650c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
32660c7d97c5SJed Brown         /* assemble subdomain vector of lagrange multipliers */
326753cdbc3dSStefano Zampini         ierr = VecSet(pcbddc->vec1_P,zero);CHKERRQ(ierr);
32680c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
32693b03a366Sstefano_zampini         if ( n_vertices) {
32700c7d97c5SJed Brown           ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
32713b03a366Sstefano_zampini           for (j=0;j<n_vertices;j++) {array2[j]=-array[j];}
32720c7d97c5SJed Brown           ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
32730c7d97c5SJed Brown         }
32740c7d97c5SJed Brown         ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
32753b03a366Sstefano_zampini         for (j=0;j<n_constraints;j++) {array2[j+n_vertices]=-array[j];}
32760c7d97c5SJed Brown         ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
32770c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
32783972b0daSStefano Zampini         /* check saddle point solution */
3279534831adSStefano Zampini         ierr = MatMult(pcbddc->local_mat,pcis->vec1_N,pcis->vec2_N);CHKERRQ(ierr);
32803b03a366Sstefano_zampini         ierr = MatMultTransposeAdd(pcbddc->ConstraintMatrix,pcbddc->vec1_P,pcis->vec2_N,pcis->vec2_N);CHKERRQ(ierr);
328153cdbc3dSStefano Zampini         ierr = VecNorm(pcis->vec2_N,NORM_INFINITY,&coarsefunctions_errors[index]);CHKERRQ(ierr);
32823b03a366Sstefano_zampini         ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr);
32830c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
328453cdbc3dSStefano Zampini         array[index]=array[index]+m_one; /* shift by the identity matrix */
32850c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
328653cdbc3dSStefano Zampini         ierr = VecNorm(pcbddc->vec1_P,NORM_INFINITY,&constraints_errors[index]);CHKERRQ(ierr);
32870c7d97c5SJed Brown       }
32880c7d97c5SJed Brown     }
32890c7d97c5SJed Brown     ierr = MatAssemblyBegin(pcbddc->coarse_phi_B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
32900c7d97c5SJed Brown     ierr = MatAssemblyEnd  (pcbddc->coarse_phi_B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
3291e269702eSStefano Zampini     if ( pcbddc->prec_type || dbg_flag ) {
32920c7d97c5SJed Brown       ierr = MatAssemblyBegin(pcbddc->coarse_phi_D,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
32930c7d97c5SJed Brown       ierr = MatAssemblyEnd  (pcbddc->coarse_phi_D,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
32940c7d97c5SJed Brown     }
32950c7d97c5SJed Brown     /* Checking coarse_sub_mat and coarse basis functions */
32960c7d97c5SJed Brown     /* It should be \Phi^{(j)^T} A^{(j)} \Phi^{(j)}=coarse_sub_mat */
32979d2fce94SStefano Zampini     if (dbg_flag) {
32980c7d97c5SJed Brown 
32990c7d97c5SJed Brown       Mat coarse_sub_mat;
33000c7d97c5SJed Brown       Mat TM1,TM2,TM3,TM4;
33010c7d97c5SJed Brown       Mat coarse_phi_D,coarse_phi_B,A_II,A_BB,A_IB,A_BI;
3302a0ba757dSStefano Zampini       const MatType checkmattype=MATSEQAIJ;
33030c7d97c5SJed Brown       PetscScalar      value;
33040c7d97c5SJed Brown 
3305c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_II,checkmattype,MAT_INITIAL_MATRIX,&A_II);CHKERRQ(ierr);
3306c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_IB,checkmattype,MAT_INITIAL_MATRIX,&A_IB);CHKERRQ(ierr);
3307c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_BI,checkmattype,MAT_INITIAL_MATRIX,&A_BI);CHKERRQ(ierr);
3308c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_BB,checkmattype,MAT_INITIAL_MATRIX,&A_BB);CHKERRQ(ierr);
3309c042a7c3SStefano Zampini       ierr = MatConvert(pcbddc->coarse_phi_D,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_D);CHKERRQ(ierr);
3310c042a7c3SStefano Zampini       ierr = MatConvert(pcbddc->coarse_phi_B,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_B);CHKERRQ(ierr);
3311c042a7c3SStefano Zampini       ierr = MatCreateSeqDense(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_size,coarse_submat_vals,&coarse_sub_mat);CHKERRQ(ierr);
3312c042a7c3SStefano Zampini       ierr = MatConvert(coarse_sub_mat,checkmattype,MAT_REUSE_MATRIX,&coarse_sub_mat);CHKERRQ(ierr);
33130c7d97c5SJed Brown 
3314da1bb401SStefano Zampini       /*PetscViewer view_out;
3315da1bb401SStefano Zampini       PetscMPIInt myrank;
3316da1bb401SStefano Zampini       char filename[256];
3317da1bb401SStefano Zampini       MPI_Comm_rank(((PetscObject)pc)->comm,&myrank);
3318da1bb401SStefano Zampini       sprintf(filename,"coarsesubmat_%04d.m",myrank);
3319da1bb401SStefano Zampini       ierr = PetscViewerASCIIOpen(PETSC_COMM_SELF,filename,&view_out);CHKERRQ(ierr);
3320da1bb401SStefano Zampini       ierr = PetscViewerSetFormat(view_out,PETSC_VIEWER_ASCII_MATLAB);CHKERRQ(ierr);
3321da1bb401SStefano Zampini       ierr = MatView(coarse_sub_mat,view_out);CHKERRQ(ierr);
3322da1bb401SStefano Zampini       ierr = PetscViewerDestroy(&view_out);CHKERRQ(ierr);*/
3323da1bb401SStefano Zampini 
33240c7d97c5SJed Brown       ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
33250c7d97c5SJed Brown       ierr = PetscViewerASCIIPrintf(viewer,"Check coarse sub mat and local basis functions\n");CHKERRQ(ierr);
33260c7d97c5SJed Brown       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
332753cdbc3dSStefano Zampini       ierr = MatPtAP(A_II,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&TM1);CHKERRQ(ierr);
332853cdbc3dSStefano Zampini       ierr = MatPtAP(A_BB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&TM2);CHKERRQ(ierr);
332953cdbc3dSStefano Zampini       ierr = MatMatMult(A_IB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr);
3330c042a7c3SStefano Zampini       ierr = MatTransposeMatMult(coarse_phi_D,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM3);CHKERRQ(ierr);
333153cdbc3dSStefano Zampini       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
333253cdbc3dSStefano Zampini       ierr = MatMatMult(A_BI,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr);
3333c042a7c3SStefano Zampini       ierr = MatTransposeMatMult(coarse_phi_B,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM4);CHKERRQ(ierr);
333453cdbc3dSStefano Zampini       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
333553cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,one,TM2,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
333653cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,one,TM3,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
333753cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,one,TM4,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
333853cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,m_one,coarse_sub_mat,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
333953cdbc3dSStefano Zampini       ierr = MatNorm(TM1,NORM_INFINITY,&value);CHKERRQ(ierr);
33400c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"----------------------------------\n");CHKERRQ(ierr);
33410c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d \n",PetscGlobalRank);CHKERRQ(ierr);
33420c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"matrix error = % 1.14e\n",value);CHKERRQ(ierr);
33430c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"coarse functions errors\n");CHKERRQ(ierr);
334453cdbc3dSStefano Zampini       for (i=0;i<pcbddc->local_primal_size;i++) { ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local %02d-th function error = % 1.14e\n",i,coarsefunctions_errors[i]);CHKERRQ(ierr); }
33450c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"constraints errors\n");CHKERRQ(ierr);
334653cdbc3dSStefano Zampini       for (i=0;i<pcbddc->local_primal_size;i++) { ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local %02d-th function error = % 1.14e\n",i,constraints_errors[i]);CHKERRQ(ierr); }
33470c7d97c5SJed Brown       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
334853cdbc3dSStefano Zampini       ierr = MatDestroy(&A_II);CHKERRQ(ierr);
334953cdbc3dSStefano Zampini       ierr = MatDestroy(&A_BB);CHKERRQ(ierr);
335053cdbc3dSStefano Zampini       ierr = MatDestroy(&A_IB);CHKERRQ(ierr);
335153cdbc3dSStefano Zampini       ierr = MatDestroy(&A_BI);CHKERRQ(ierr);
335253cdbc3dSStefano Zampini       ierr = MatDestroy(&TM1);CHKERRQ(ierr);
335353cdbc3dSStefano Zampini       ierr = MatDestroy(&TM2);CHKERRQ(ierr);
335453cdbc3dSStefano Zampini       ierr = MatDestroy(&TM3);CHKERRQ(ierr);
335553cdbc3dSStefano Zampini       ierr = MatDestroy(&TM4);CHKERRQ(ierr);
335653cdbc3dSStefano Zampini       ierr = MatDestroy(&coarse_phi_D);CHKERRQ(ierr);
335753cdbc3dSStefano Zampini       ierr = MatDestroy(&coarse_sub_mat);CHKERRQ(ierr);
335853cdbc3dSStefano Zampini       ierr = MatDestroy(&coarse_phi_B);CHKERRQ(ierr);
33590c7d97c5SJed Brown       ierr = PetscFree(coarsefunctions_errors);CHKERRQ(ierr);
33600c7d97c5SJed Brown       ierr = PetscFree(constraints_errors);CHKERRQ(ierr);
33610c7d97c5SJed Brown     }
33620c7d97c5SJed Brown 
33630c7d97c5SJed Brown     /* create coarse matrix and data structures for message passing associated actual choice of coarse problem type */
33640c7d97c5SJed Brown     ierr = PCBDDCSetupCoarseEnvironment(pc,coarse_submat_vals);CHKERRQ(ierr);
33650c7d97c5SJed Brown     /* free memory */
33660c7d97c5SJed Brown     ierr = PetscFree(coarse_submat_vals);CHKERRQ(ierr);
33670c7d97c5SJed Brown     ierr = PetscFree(auxindices);CHKERRQ(ierr);
33680c7d97c5SJed Brown     ierr = PetscFree(nnz);CHKERRQ(ierr);
33693b03a366Sstefano_zampini     if (n_vertices) {
33700c7d97c5SJed Brown       ierr = VecDestroy(&vec1_V);CHKERRQ(ierr);
33710c7d97c5SJed Brown       ierr = VecDestroy(&vec2_V);CHKERRQ(ierr);
33720c7d97c5SJed Brown       ierr = MatDestroy(&A_RV);CHKERRQ(ierr);
33730c7d97c5SJed Brown       ierr = MatDestroy(&A_VR);CHKERRQ(ierr);
33740c7d97c5SJed Brown       ierr = MatDestroy(&A_VV);CHKERRQ(ierr);
33750c7d97c5SJed Brown     }
3376534831adSStefano Zampini     if (n_constraints) {
33770c7d97c5SJed Brown       ierr = VecDestroy(&vec1_C);CHKERRQ(ierr);
33780c7d97c5SJed Brown       ierr = VecDestroy(&vec2_C);CHKERRQ(ierr);
33790c7d97c5SJed Brown       ierr = MatDestroy(&M1);CHKERRQ(ierr);
33800c7d97c5SJed Brown       ierr = MatDestroy(&C_CR);CHKERRQ(ierr);
33810c7d97c5SJed Brown     }
33820c7d97c5SJed Brown   }
33830c7d97c5SJed Brown   /* free memory */
33843b03a366Sstefano_zampini   if (n_vertices) {
33850c7d97c5SJed Brown     ierr = PetscFree(idx_V_B);CHKERRQ(ierr);
33860c7d97c5SJed Brown     ierr = ISDestroy(&is_V_local);CHKERRQ(ierr);
33870c7d97c5SJed Brown   }
33880c7d97c5SJed Brown   ierr = ISDestroy(&is_R_local);CHKERRQ(ierr);
33890c7d97c5SJed Brown 
33900c7d97c5SJed Brown   PetscFunctionReturn(0);
33910c7d97c5SJed Brown }
33920c7d97c5SJed Brown 
33930c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
33940c7d97c5SJed Brown 
33950c7d97c5SJed Brown #undef __FUNCT__
33960c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetupCoarseEnvironment"
339753cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetupCoarseEnvironment(PC pc,PetscScalar* coarse_submat_vals)
33980c7d97c5SJed Brown {
33990c7d97c5SJed Brown 
34000c7d97c5SJed Brown 
34010c7d97c5SJed Brown   Mat_IS    *matis    = (Mat_IS*)pc->pmat->data;
34020c7d97c5SJed Brown   PC_BDDC   *pcbddc   = (PC_BDDC*)pc->data;
34030c7d97c5SJed Brown   PC_IS     *pcis     = (PC_IS*)pc->data;
34040c7d97c5SJed Brown   MPI_Comm  prec_comm = ((PetscObject)pc)->comm;
34050c7d97c5SJed Brown   MPI_Comm  coarse_comm;
34060c7d97c5SJed Brown 
34070c7d97c5SJed Brown   /* common to all choices */
34080c7d97c5SJed Brown   PetscScalar *temp_coarse_mat_vals;
34090c7d97c5SJed Brown   PetscScalar *ins_coarse_mat_vals;
34100c7d97c5SJed Brown   PetscInt    *ins_local_primal_indices;
34110c7d97c5SJed Brown   PetscMPIInt *localsizes2,*localdispl2;
34120c7d97c5SJed Brown   PetscMPIInt size_prec_comm;
34130c7d97c5SJed Brown   PetscMPIInt rank_prec_comm;
34140c7d97c5SJed Brown   PetscMPIInt active_rank=MPI_PROC_NULL;
34150c7d97c5SJed Brown   PetscMPIInt master_proc=0;
34160c7d97c5SJed Brown   PetscInt    ins_local_primal_size;
34170c7d97c5SJed Brown   /* specific to MULTILEVEL_BDDC */
34180c7d97c5SJed Brown   PetscMPIInt *ranks_recv;
34190c7d97c5SJed Brown   PetscMPIInt count_recv=0;
34200c7d97c5SJed Brown   PetscMPIInt rank_coarse_proc_send_to;
34210c7d97c5SJed Brown   PetscMPIInt coarse_color = MPI_UNDEFINED;
34220c7d97c5SJed Brown   ISLocalToGlobalMapping coarse_ISLG;
34230c7d97c5SJed Brown   /* some other variables */
34240c7d97c5SJed Brown   PetscErrorCode ierr;
34250c7d97c5SJed Brown   const MatType coarse_mat_type;
34260c7d97c5SJed Brown   const PCType  coarse_pc_type;
342753cdbc3dSStefano Zampini   const KSPType coarse_ksp_type;
342853cdbc3dSStefano Zampini   PC pc_temp;
34290c7d97c5SJed Brown   PetscInt i,j,k,bs;
34303b03a366Sstefano_zampini   PetscInt max_it_coarse_ksp=1;  /* don't increase this value */
3431e269702eSStefano Zampini   /* verbose output viewer */
3432e269702eSStefano Zampini   PetscViewer viewer=pcbddc->dbg_viewer;
3433e269702eSStefano Zampini   PetscBool   dbg_flag=pcbddc->dbg_flag;
3434142dfd88SStefano Zampini 
3435ea7e1babSStefano Zampini   PetscInt      offset,offset2;
3436142dfd88SStefano Zampini   PetscMPIInt   im_active=0;
3437142dfd88SStefano Zampini   PetscMPIInt   *auxglobal_primal;
3438142dfd88SStefano Zampini 
3439142dfd88SStefano Zampini   PetscBool     setsym,issym=PETSC_FALSE;
34400c7d97c5SJed Brown 
34410c7d97c5SJed Brown   PetscFunctionBegin;
34420c7d97c5SJed Brown   ins_local_primal_indices = 0;
34430c7d97c5SJed Brown   ins_coarse_mat_vals      = 0;
34440c7d97c5SJed Brown   localsizes2              = 0;
34450c7d97c5SJed Brown   localdispl2              = 0;
34460c7d97c5SJed Brown   temp_coarse_mat_vals     = 0;
34470c7d97c5SJed Brown   coarse_ISLG              = 0;
34480c7d97c5SJed Brown 
344953cdbc3dSStefano Zampini   ierr = MPI_Comm_size(prec_comm,&size_prec_comm);CHKERRQ(ierr);
345053cdbc3dSStefano Zampini   ierr = MPI_Comm_rank(prec_comm,&rank_prec_comm);CHKERRQ(ierr);
34510c7d97c5SJed Brown   ierr = MatGetBlockSize(matis->A,&bs);CHKERRQ(ierr);
3452142dfd88SStefano Zampini   ierr = MatIsSymmetricKnown(pc->pmat,&setsym,&issym);CHKERRQ(ierr);
3453142dfd88SStefano Zampini 
3454beed3852SStefano Zampini   /* Assign global numbering to coarse dofs */
3455beed3852SStefano Zampini   {
3456a0ba757dSStefano Zampini     PetscScalar    one=1.,zero=0.;
3457beed3852SStefano Zampini     PetscScalar    *array;
3458beed3852SStefano Zampini     PetscMPIInt    *auxlocal_primal;
3459beed3852SStefano Zampini     PetscMPIInt    *all_auxglobal_primal;
3460beed3852SStefano Zampini     PetscMPIInt    mpi_local_primal_size = (PetscMPIInt)pcbddc->local_primal_size;
3461da1bb401SStefano Zampini     PetscInt       *row_cmat_indices;
34623b03a366Sstefano_zampini     PetscInt       size_of_constraint;
3463da1bb401SStefano Zampini     PetscScalar    coarsesum;
3464beed3852SStefano Zampini 
3465beed3852SStefano Zampini     /* Construct needed data structures for message passing */
3466beed3852SStefano Zampini     ierr = PetscMalloc(mpi_local_primal_size*sizeof(PetscMPIInt),&pcbddc->local_primal_indices);CHKERRQ(ierr);
3467ffe5efe1SStefano Zampini     j = 0;
3468142dfd88SStefano Zampini     if (rank_prec_comm == 0 || pcbddc->coarse_problem_type == REPLICATED_BDDC || pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
3469ffe5efe1SStefano Zampini       j = size_prec_comm;
3470ffe5efe1SStefano Zampini     }
3471ffe5efe1SStefano Zampini     ierr = PetscMalloc(j*sizeof(PetscMPIInt),&pcbddc->local_primal_sizes);CHKERRQ(ierr);
3472ffe5efe1SStefano Zampini     ierr = PetscMalloc(j*sizeof(PetscMPIInt),&pcbddc->local_primal_displacements);CHKERRQ(ierr);
3473beed3852SStefano Zampini     /* Gather local_primal_size information for all processes  */
3474142dfd88SStefano Zampini     if (pcbddc->coarse_problem_type == REPLICATED_BDDC || pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
34755619798eSStefano Zampini       ierr = MPI_Allgather(&mpi_local_primal_size,1,MPIU_INT,&pcbddc->local_primal_sizes[0],1,MPIU_INT,prec_comm);CHKERRQ(ierr);
3476ffe5efe1SStefano Zampini     } else {
3477ffe5efe1SStefano Zampini       ierr = MPI_Gather(&mpi_local_primal_size,1,MPIU_INT,&pcbddc->local_primal_sizes[0],1,MPIU_INT,0,prec_comm);CHKERRQ(ierr);
3478ffe5efe1SStefano Zampini     }
3479beed3852SStefano Zampini     pcbddc->replicated_primal_size = 0;
3480ffe5efe1SStefano Zampini     for (i=0; i<j; i++) {
3481beed3852SStefano Zampini       pcbddc->local_primal_displacements[i] = pcbddc->replicated_primal_size ;
3482beed3852SStefano Zampini       pcbddc->replicated_primal_size += pcbddc->local_primal_sizes[i];
3483beed3852SStefano Zampini     }
34845619798eSStefano Zampini     if (rank_prec_comm == 0) {
3485beed3852SStefano Zampini       /* allocate some auxiliary space */
3486beed3852SStefano Zampini       ierr = PetscMalloc(pcbddc->replicated_primal_size*sizeof(*all_auxglobal_primal),&all_auxglobal_primal);CHKERRQ(ierr);
3487beed3852SStefano Zampini     }
3488beed3852SStefano Zampini     ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscMPIInt),&auxlocal_primal);CHKERRQ(ierr);
3489beed3852SStefano Zampini     ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscMPIInt),&auxglobal_primal);CHKERRQ(ierr);
3490beed3852SStefano Zampini 
3491da1bb401SStefano Zampini     /* First let's count coarse dofs.
3492beed3852SStefano Zampini        This code fragment assumes that the number of local constraints per connected component
3493beed3852SStefano Zampini        is not greater than the number of nodes defined for the connected component
3494beed3852SStefano Zampini        (otherwise we will surely have linear dependence between constraints and thus a singular coarse problem) */
34953b03a366Sstefano_zampini     /* auxlocal_primal      : primal indices in local nodes numbering (internal and interface) with complete queue sorted by global ordering */
3496beed3852SStefano Zampini     ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr);
3497beed3852SStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3498da1bb401SStefano Zampini     for (i=0;i<pcbddc->local_primal_size;i++) {
3499da1bb401SStefano Zampini       ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
35003b03a366Sstefano_zampini       for (j=0; j<size_of_constraint; j++) {
35013b03a366Sstefano_zampini         k = row_cmat_indices[j];
3502beed3852SStefano Zampini         if ( array[k] == zero ) {
3503beed3852SStefano Zampini           array[k] = one;
3504da1bb401SStefano Zampini           auxlocal_primal[i] = k;
3505beed3852SStefano Zampini           break;
3506beed3852SStefano Zampini         }
3507beed3852SStefano Zampini       }
3508da1bb401SStefano Zampini       ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
3509beed3852SStefano Zampini     }
3510beed3852SStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3511da1bb401SStefano Zampini     ierr = VecSet(pcis->vec1_global,zero);CHKERRQ(ierr);
3512da1bb401SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3513da1bb401SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3514da1bb401SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3515da1bb401SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3516da1bb401SStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3517142dfd88SStefano Zampini     for (i=0;i<pcis->n;i++) { if ( PetscAbsScalar(array[i]) > zero) array[i] = one/array[i]; }
3518da1bb401SStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3519da1bb401SStefano Zampini     ierr = VecSet(pcis->vec1_global,zero);CHKERRQ(ierr);
3520da1bb401SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3521da1bb401SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3522da1bb401SStefano Zampini     ierr = VecSum(pcis->vec1_global,&coarsesum);CHKERRQ(ierr);
3523da1bb401SStefano Zampini     pcbddc->coarse_size = (PetscInt) coarsesum;
3524a0ba757dSStefano Zampini 
3525beed3852SStefano Zampini     /* Now assign them a global numbering */
3526beed3852SStefano Zampini     /* auxglobal_primal contains indices in global nodes numbering (internal and interface) */
3527beed3852SStefano Zampini     ierr = ISLocalToGlobalMappingApply(matis->mapping,pcbddc->local_primal_size,auxlocal_primal,auxglobal_primal);CHKERRQ(ierr);
3528142dfd88SStefano Zampini     ierr = PetscFree(auxlocal_primal);CHKERRQ(ierr);
3529beed3852SStefano Zampini     /* all_auxglobal_primal contains all primal nodes indices in global nodes numbering (internal and interface) */
3530beed3852SStefano Zampini     ierr = MPI_Gatherv(&auxglobal_primal[0],pcbddc->local_primal_size,MPIU_INT,&all_auxglobal_primal[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,0,prec_comm);CHKERRQ(ierr);
3531beed3852SStefano Zampini 
3532beed3852SStefano Zampini     /* After this block all_auxglobal_primal should contain one copy of each primal node's indices in global nodes numbering */
3533beed3852SStefano Zampini     if (rank_prec_comm==0) {
353417d7d925SStefano Zampini       j=pcbddc->replicated_primal_size;
353517d7d925SStefano Zampini       ierr = PetscSortRemoveDupsMPIInt(&j,all_auxglobal_primal);CHKERRQ(ierr);
3536*0bdf917eSStefano Zampini     } else {
3537*0bdf917eSStefano Zampini       ierr = PetscMalloc(pcbddc->coarse_size*sizeof(PetscMPIInt),&all_auxglobal_primal);CHKERRQ(ierr);
3538*0bdf917eSStefano Zampini     }
3539*0bdf917eSStefano Zampini     /* We only need to broadcast the indices from 0 to pcbddc->coarse_size. Remaining elements of array all_auxglobal_primal are garbage. */
3540*0bdf917eSStefano Zampini     ierr = MPI_Bcast(all_auxglobal_primal,pcbddc->coarse_size,MPIU_INT,0,prec_comm);CHKERRQ(ierr);
3541*0bdf917eSStefano Zampini 
3542*0bdf917eSStefano Zampini     /* Now get global coarse numbering of local primal nodes */
3543*0bdf917eSStefano Zampini     for (i=0;i<pcbddc->local_primal_size;i++) {
3544beed3852SStefano Zampini       k=0;
3545*0bdf917eSStefano Zampini       while( all_auxglobal_primal[k] != auxglobal_primal[i] ) { k++;}
3546*0bdf917eSStefano Zampini       pcbddc->local_primal_indices[i]=k;
3547beed3852SStefano Zampini     }
3548*0bdf917eSStefano Zampini     ierr = PetscFree(auxglobal_primal);CHKERRQ(ierr);
3549beed3852SStefano Zampini     ierr = PetscFree(all_auxglobal_primal);CHKERRQ(ierr);
3550*0bdf917eSStefano Zampini     if (rank_prec_comm==0) {
3551*0bdf917eSStefano Zampini       j=pcbddc->replicated_primal_size;
3552*0bdf917eSStefano Zampini       ierr = PetscMalloc(j*sizeof(PetscMPIInt),&auxglobal_primal);CHKERRQ(ierr);
3553e269702eSStefano Zampini     }
3554*0bdf917eSStefano Zampini     ierr = MPI_Gatherv(pcbddc->local_primal_indices,pcbddc->local_primal_size,MPIU_INT,auxglobal_primal,pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,0,prec_comm);CHKERRQ(ierr);
3555*0bdf917eSStefano Zampini   }
3556*0bdf917eSStefano Zampini 
3557*0bdf917eSStefano Zampini   if (pcis->n) { im_active = 1; }
3558*0bdf917eSStefano Zampini   ierr = MPI_Allreduce(&im_active,&pcbddc->active_procs,1,MPIU_INT,MPI_SUM,prec_comm);CHKERRQ(ierr);
3559*0bdf917eSStefano Zampini 
3560*0bdf917eSStefano Zampini   /* adapt coarse problem type */
3561*0bdf917eSStefano Zampini   if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC && (pcbddc->active_procs/pcbddc->coarsening_ratio) < 2 ) {
3562*0bdf917eSStefano Zampini     if (dbg_flag) {
3563*0bdf917eSStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Not enough active processes on level. Parallel direct solve\n");CHKERRQ(ierr);
3564*0bdf917eSStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
3565*0bdf917eSStefano Zampini     }
3566*0bdf917eSStefano Zampini     pcbddc->coarse_problem_type = PARALLEL_BDDC;
3567142dfd88SStefano Zampini   }
3568beed3852SStefano Zampini 
35690c7d97c5SJed Brown   switch(pcbddc->coarse_problem_type){
35700c7d97c5SJed Brown 
3571da1bb401SStefano Zampini     case(MULTILEVEL_BDDC):   /* we define a coarse mesh where subdomains are elements */
35720c7d97c5SJed Brown     {
35730c7d97c5SJed Brown       /* we need additional variables */
35740c7d97c5SJed Brown       MetisInt    n_subdomains,n_parts,objval,ncon,faces_nvtxs;
35750c7d97c5SJed Brown       MetisInt    *metis_coarse_subdivision;
35760c7d97c5SJed Brown       MetisInt    options[METIS_NOPTIONS];
35770c7d97c5SJed Brown       PetscMPIInt size_coarse_comm,rank_coarse_comm;
35780c7d97c5SJed Brown       PetscMPIInt procs_jumps_coarse_comm;
35790c7d97c5SJed Brown       PetscMPIInt *coarse_subdivision;
35800c7d97c5SJed Brown       PetscMPIInt *total_count_recv;
35810c7d97c5SJed Brown       PetscMPIInt *total_ranks_recv;
35820c7d97c5SJed Brown       PetscMPIInt *displacements_recv;
35830c7d97c5SJed Brown       PetscMPIInt *my_faces_connectivity;
35840c7d97c5SJed Brown       PetscMPIInt *petsc_faces_adjncy;
35850c7d97c5SJed Brown       MetisInt    *faces_adjncy;
35860c7d97c5SJed Brown       MetisInt    *faces_xadj;
35870c7d97c5SJed Brown       PetscMPIInt *number_of_faces;
35880c7d97c5SJed Brown       PetscMPIInt *faces_displacements;
35890c7d97c5SJed Brown       PetscInt    *array_int;
35900c7d97c5SJed Brown       PetscMPIInt my_faces=0;
35910c7d97c5SJed Brown       PetscMPIInt total_faces=0;
35923828260eSStefano Zampini       PetscInt    ranks_stretching_ratio;
35930c7d97c5SJed Brown 
35940c7d97c5SJed Brown       /* define some quantities */
35950c7d97c5SJed Brown       pcbddc->coarse_communications_type = SCATTERS_BDDC;
35960c7d97c5SJed Brown       coarse_mat_type = MATIS;
35970c7d97c5SJed Brown       coarse_pc_type  = PCBDDC;
3598142dfd88SStefano Zampini       coarse_ksp_type = KSPRICHARDSON;
35990c7d97c5SJed Brown 
36000c7d97c5SJed Brown       /* details of coarse decomposition */
36010c7d97c5SJed Brown       n_subdomains = pcbddc->active_procs;
36020c7d97c5SJed Brown       n_parts      = n_subdomains/pcbddc->coarsening_ratio;
36033828260eSStefano Zampini       ranks_stretching_ratio = size_prec_comm/pcbddc->active_procs;
36043828260eSStefano Zampini       procs_jumps_coarse_comm = pcbddc->coarsening_ratio*ranks_stretching_ratio;
36053828260eSStefano Zampini 
3606da1bb401SStefano Zampini       /*printf("Coarse algorithm details: \n");
3607da1bb401SStefano Zampini       printf("n_subdomains %d, n_parts %d\nstretch %d,jumps %d,coarse_ratio %d\nlevel should be log_%d(%d)\n",n_subdomains,n_parts,ranks_stretching_ratio,procs_jumps_coarse_comm,pcbddc->coarsening_ratio,pcbddc->coarsening_ratio,(ranks_stretching_ratio/pcbddc->coarsening_ratio+1));*/
36080c7d97c5SJed Brown 
36090c7d97c5SJed Brown       /* build CSR graph of subdomains' connectivity through faces */
36100c7d97c5SJed Brown       ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&array_int);CHKERRQ(ierr);
36113828260eSStefano Zampini       ierr = PetscMemzero(array_int,pcis->n*sizeof(PetscInt));CHKERRQ(ierr);
36120c7d97c5SJed Brown       for (i=1;i<pcis->n_neigh;i++){/* i=1 so I don't count myself -> faces nodes counts to 1 */
36130c7d97c5SJed Brown         for (j=0;j<pcis->n_shared[i];j++){
36140c7d97c5SJed Brown           array_int[ pcis->shared[i][j] ]+=1;
36150c7d97c5SJed Brown         }
36160c7d97c5SJed Brown       }
36170c7d97c5SJed Brown       for (i=1;i<pcis->n_neigh;i++){
36180c7d97c5SJed Brown         for (j=0;j<pcis->n_shared[i];j++){
36190c7d97c5SJed Brown           if (array_int[ pcis->shared[i][j] ] == 1 ){
36200c7d97c5SJed Brown             my_faces++;
36210c7d97c5SJed Brown             break;
36220c7d97c5SJed Brown           }
36230c7d97c5SJed Brown         }
36240c7d97c5SJed Brown       }
36250c7d97c5SJed Brown 
362653cdbc3dSStefano Zampini       ierr = MPI_Reduce(&my_faces,&total_faces,1,MPIU_INT,MPI_SUM,master_proc,prec_comm);CHKERRQ(ierr);
36270c7d97c5SJed Brown       ierr = PetscMalloc (my_faces*sizeof(PetscInt),&my_faces_connectivity);CHKERRQ(ierr);
36280c7d97c5SJed Brown       my_faces=0;
36290c7d97c5SJed Brown       for (i=1;i<pcis->n_neigh;i++){
36300c7d97c5SJed Brown         for (j=0;j<pcis->n_shared[i];j++){
36310c7d97c5SJed Brown           if (array_int[ pcis->shared[i][j] ] == 1 ){
36320c7d97c5SJed Brown             my_faces_connectivity[my_faces]=pcis->neigh[i];
36330c7d97c5SJed Brown             my_faces++;
36340c7d97c5SJed Brown             break;
36350c7d97c5SJed Brown           }
36360c7d97c5SJed Brown         }
36370c7d97c5SJed Brown       }
36380c7d97c5SJed Brown       if (rank_prec_comm == master_proc) {
36390c7d97c5SJed Brown         ierr = PetscMalloc (total_faces*sizeof(PetscMPIInt),&petsc_faces_adjncy);CHKERRQ(ierr);
36400c7d97c5SJed Brown         ierr = PetscMalloc (size_prec_comm*sizeof(PetscMPIInt),&number_of_faces);CHKERRQ(ierr);
36410c7d97c5SJed Brown         ierr = PetscMalloc (total_faces*sizeof(MetisInt),&faces_adjncy);CHKERRQ(ierr);
36420c7d97c5SJed Brown         ierr = PetscMalloc ((n_subdomains+1)*sizeof(MetisInt),&faces_xadj);CHKERRQ(ierr);
36430c7d97c5SJed Brown         ierr = PetscMalloc ((size_prec_comm+1)*sizeof(PetscMPIInt),&faces_displacements);CHKERRQ(ierr);
36440c7d97c5SJed Brown       }
364553cdbc3dSStefano Zampini       ierr = MPI_Gather(&my_faces,1,MPIU_INT,&number_of_faces[0],1,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
36460c7d97c5SJed Brown       if (rank_prec_comm == master_proc) {
36470c7d97c5SJed Brown         faces_xadj[0]=0;
36480c7d97c5SJed Brown         faces_displacements[0]=0;
36490c7d97c5SJed Brown         j=0;
36500c7d97c5SJed Brown         for (i=1;i<size_prec_comm+1;i++) {
36510c7d97c5SJed Brown           faces_displacements[i]=faces_displacements[i-1]+number_of_faces[i-1];
36520c7d97c5SJed Brown           if (number_of_faces[i-1]) {
36530c7d97c5SJed Brown             j++;
36540c7d97c5SJed Brown             faces_xadj[j]=faces_xadj[j-1]+number_of_faces[i-1];
36550c7d97c5SJed Brown           }
36560c7d97c5SJed Brown         }
3657da1bb401SStefano Zampini         /*printf("The J I count is %d and should be %d\n",j,n_subdomains);
3658da1bb401SStefano Zampini         printf("Total faces seem %d and should be %d\n",faces_xadj[j],total_faces);*/
36590c7d97c5SJed Brown       }
366053cdbc3dSStefano Zampini       ierr = MPI_Gatherv(&my_faces_connectivity[0],my_faces,MPIU_INT,&petsc_faces_adjncy[0],number_of_faces,faces_displacements,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
36610c7d97c5SJed Brown       ierr = PetscFree(my_faces_connectivity);CHKERRQ(ierr);
36620c7d97c5SJed Brown       ierr = PetscFree(array_int);CHKERRQ(ierr);
36630c7d97c5SJed Brown       if (rank_prec_comm == master_proc) {
36643828260eSStefano Zampini         for (i=0;i<total_faces;i++) faces_adjncy[i]=(MetisInt)(petsc_faces_adjncy[i]/ranks_stretching_ratio); /* cast to MetisInt */
3665da1bb401SStefano Zampini         /*printf("This is the face connectivity (actual ranks)\n");
36660c7d97c5SJed Brown         for (i=0;i<n_subdomains;i++){
36670c7d97c5SJed Brown           printf("proc %d is connected with \n",i);
36680c7d97c5SJed Brown           for (j=faces_xadj[i];j<faces_xadj[i+1];j++)
36690c7d97c5SJed Brown             printf("%d ",faces_adjncy[j]);
36700c7d97c5SJed Brown           printf("\n");
3671da1bb401SStefano Zampini         }*/
36720c7d97c5SJed Brown         ierr = PetscFree(faces_displacements);CHKERRQ(ierr);
36730c7d97c5SJed Brown         ierr = PetscFree(number_of_faces);CHKERRQ(ierr);
36740c7d97c5SJed Brown         ierr = PetscFree(petsc_faces_adjncy);CHKERRQ(ierr);
36750c7d97c5SJed Brown       }
36760c7d97c5SJed Brown 
36770c7d97c5SJed Brown       if ( rank_prec_comm == master_proc ) {
36780c7d97c5SJed Brown 
36793828260eSStefano Zampini         PetscInt heuristic_for_metis=3;
36803828260eSStefano Zampini 
36810c7d97c5SJed Brown         ncon=1;
36820c7d97c5SJed Brown         faces_nvtxs=n_subdomains;
36830c7d97c5SJed Brown         /* partition graph induced by face connectivity */
36840c7d97c5SJed Brown         ierr = PetscMalloc (n_subdomains*sizeof(MetisInt),&metis_coarse_subdivision);CHKERRQ(ierr);
36850c7d97c5SJed Brown         ierr = METIS_SetDefaultOptions(options);
36860c7d97c5SJed Brown         /* we need a contiguous partition of the coarse mesh */
36870c7d97c5SJed Brown         options[METIS_OPTION_CONTIG]=1;
36880c7d97c5SJed Brown         options[METIS_OPTION_NITER]=30;
36893828260eSStefano Zampini         if (n_subdomains>n_parts*heuristic_for_metis) {
36903828260eSStefano Zampini           options[METIS_OPTION_IPTYPE]=METIS_IPTYPE_EDGE;
36913828260eSStefano Zampini           options[METIS_OPTION_OBJTYPE]=METIS_OBJTYPE_CUT;
36920c7d97c5SJed Brown           ierr = METIS_PartGraphKway(&faces_nvtxs,&ncon,faces_xadj,faces_adjncy,NULL,NULL,NULL,&n_parts,NULL,NULL,options,&objval,metis_coarse_subdivision);
3693142dfd88SStefano Zampini           if (ierr != METIS_OK) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in METIS_PartGraphKway (metis error code %D) called from PCBDDCSetupCoarseEnvironment\n",ierr);
36943828260eSStefano Zampini         } else {
36953828260eSStefano Zampini           ierr = METIS_PartGraphRecursive(&faces_nvtxs,&ncon,faces_xadj,faces_adjncy,NULL,NULL,NULL,&n_parts,NULL,NULL,options,&objval,metis_coarse_subdivision);
3696142dfd88SStefano Zampini           if (ierr != METIS_OK) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in METIS_PartGraphRecursive (metis error code %D) called from PCBDDCSetupCoarseEnvironment\n",ierr);
36973828260eSStefano Zampini         }
36980c7d97c5SJed Brown         ierr = PetscFree(faces_xadj);CHKERRQ(ierr);
36990c7d97c5SJed Brown         ierr = PetscFree(faces_adjncy);CHKERRQ(ierr);
3700*0bdf917eSStefano Zampini         ierr = PetscMalloc(size_prec_comm*sizeof(PetscMPIInt),&coarse_subdivision);CHKERRQ(ierr);
37010c7d97c5SJed Brown         /* copy/cast values avoiding possible type conflicts between PETSc, MPI and METIS */
3702*0bdf917eSStefano Zampini         for (i=0;i<size_prec_comm;i++) { coarse_subdivision[i]=MPI_PROC_NULL; }
3703*0bdf917eSStefano Zampini         for (i=0;i<n_subdomains;i++)   { coarse_subdivision[ranks_stretching_ratio*i]=(PetscInt)(metis_coarse_subdivision[i]); }
37040c7d97c5SJed Brown         ierr = PetscFree(metis_coarse_subdivision);CHKERRQ(ierr);
37050c7d97c5SJed Brown       }
37060c7d97c5SJed Brown 
37070c7d97c5SJed Brown       /* Create new communicator for coarse problem splitting the old one */
37080c7d97c5SJed Brown       if ( !(rank_prec_comm%procs_jumps_coarse_comm) && rank_prec_comm < procs_jumps_coarse_comm*n_parts ){
3709da1bb401SStefano Zampini         coarse_color=0;              /* for communicator splitting */
3710da1bb401SStefano Zampini         active_rank=rank_prec_comm;  /* for insertion of matrix values */
37110c7d97c5SJed Brown       }
3712da1bb401SStefano Zampini       /* procs with coarse_color = MPI_UNDEFINED will have coarse_comm = MPI_COMM_NULL (from mpi standards)
3713da1bb401SStefano Zampini          key = rank_prec_comm -> keep same ordering of ranks from the old to the new communicator */
371453cdbc3dSStefano Zampini       ierr = MPI_Comm_split(prec_comm,coarse_color,rank_prec_comm,&coarse_comm);CHKERRQ(ierr);
37150c7d97c5SJed Brown 
37160c7d97c5SJed Brown       if ( coarse_color == 0 ) {
371753cdbc3dSStefano Zampini         ierr = MPI_Comm_size(coarse_comm,&size_coarse_comm);CHKERRQ(ierr);
371853cdbc3dSStefano Zampini         ierr = MPI_Comm_rank(coarse_comm,&rank_coarse_comm);CHKERRQ(ierr);
3719da1bb401SStefano Zampini         /*printf("Details of coarse comm\n");
37203828260eSStefano Zampini         printf("size = %d, myrank = %d\n",size_coarse_comm,rank_coarse_comm);
3721da1bb401SStefano Zampini         printf("jumps = %d, coarse_color = %d, n_parts = %d\n",procs_jumps_coarse_comm,coarse_color,n_parts);*/
37220c7d97c5SJed Brown       } else {
37230c7d97c5SJed Brown         rank_coarse_comm = MPI_PROC_NULL;
37240c7d97c5SJed Brown       }
37250c7d97c5SJed Brown 
37260c7d97c5SJed Brown       /* master proc takes care of arranging and distributing coarse information */
37270c7d97c5SJed Brown       if (rank_coarse_comm == master_proc) {
37280c7d97c5SJed Brown         ierr = PetscMalloc (size_coarse_comm*sizeof(PetscMPIInt),&displacements_recv);CHKERRQ(ierr);
3729*0bdf917eSStefano Zampini         ierr = PetscMalloc (size_coarse_comm*sizeof(PetscMPIInt),&total_count_recv);CHKERRQ(ierr);
3730*0bdf917eSStefano Zampini         ierr = PetscMalloc (n_subdomains*sizeof(PetscMPIInt),&total_ranks_recv);CHKERRQ(ierr);
37310c7d97c5SJed Brown         /* some initializations */
37320c7d97c5SJed Brown         displacements_recv[0]=0;
3733*0bdf917eSStefano Zampini         ierr = PetscMemzero(total_count_recv,size_coarse_comm*sizeof(PetscMPIInt));CHKERRQ(ierr);
37340c7d97c5SJed Brown         /* count from how many processes the j-th process of the coarse decomposition will receive data */
3735*0bdf917eSStefano Zampini         for (j=0;j<size_coarse_comm;j++) {
3736*0bdf917eSStefano Zampini           for (i=0;i<size_prec_comm;i++) {
3737*0bdf917eSStefano Zampini             if (coarse_subdivision[i]==j) {
37380c7d97c5SJed Brown               total_count_recv[j]++;
3739*0bdf917eSStefano Zampini             }
3740*0bdf917eSStefano Zampini           }
3741*0bdf917eSStefano Zampini         }
37420c7d97c5SJed Brown         /* displacements needed for scatterv of total_ranks_recv */
3743*0bdf917eSStefano Zampini         for (i=1;i<size_coarse_comm;i++) { displacements_recv[i]=displacements_recv[i-1]+total_count_recv[i-1]; }
37440c7d97c5SJed Brown         /* Now fill properly total_ranks_recv -> each coarse process will receive the ranks (in prec_comm communicator) of its friend (sending) processes */
37450c7d97c5SJed Brown         ierr = PetscMemzero(total_count_recv,size_coarse_comm*sizeof(PetscMPIInt));CHKERRQ(ierr);
37460c7d97c5SJed Brown         for (j=0;j<size_coarse_comm;j++) {
37473828260eSStefano Zampini           for (i=0;i<size_prec_comm;i++) {
37480c7d97c5SJed Brown             if (coarse_subdivision[i]==j) {
37490c7d97c5SJed Brown               total_ranks_recv[displacements_recv[j]+total_count_recv[j]]=i;
37503828260eSStefano Zampini               total_count_recv[j]+=1;
37510c7d97c5SJed Brown             }
37520c7d97c5SJed Brown           }
37530c7d97c5SJed Brown         }
3754da1bb401SStefano Zampini         /*for (j=0;j<size_coarse_comm;j++) {
37553828260eSStefano Zampini           printf("process %d in new rank will receive from %d processes (original ranks follows)\n",j,total_count_recv[j]);
37563828260eSStefano Zampini           for (i=0;i<total_count_recv[j];i++) {
37573828260eSStefano Zampini             printf("%d ",total_ranks_recv[displacements_recv[j]+i]);
37583828260eSStefano Zampini           }
37593828260eSStefano Zampini           printf("\n");
3760da1bb401SStefano Zampini         }*/
37610c7d97c5SJed Brown 
37620c7d97c5SJed Brown         /* identify new decomposition in terms of ranks in the old communicator */
3763*0bdf917eSStefano Zampini         for (i=0;i<n_subdomains;i++) {
3764*0bdf917eSStefano Zampini           coarse_subdivision[ranks_stretching_ratio*i]=coarse_subdivision[ranks_stretching_ratio*i]*procs_jumps_coarse_comm;
3765*0bdf917eSStefano Zampini         }
3766da1bb401SStefano Zampini         /*printf("coarse_subdivision in old end new ranks\n");
37670c7d97c5SJed Brown         for (i=0;i<size_prec_comm;i++)
37683828260eSStefano Zampini           if (coarse_subdivision[i]!=MPI_PROC_NULL) {
37693828260eSStefano Zampini             printf("%d=(%d %d), ",i,coarse_subdivision[i],coarse_subdivision[i]/procs_jumps_coarse_comm);
37703828260eSStefano Zampini           } else {
37713828260eSStefano Zampini             printf("%d=(%d %d), ",i,coarse_subdivision[i],coarse_subdivision[i]);
37723828260eSStefano Zampini           }
3773da1bb401SStefano Zampini         printf("\n");*/
37740c7d97c5SJed Brown       }
37750c7d97c5SJed Brown 
37760c7d97c5SJed Brown       /* Scatter new decomposition for send details */
377753cdbc3dSStefano Zampini       ierr = MPI_Scatter(&coarse_subdivision[0],1,MPIU_INT,&rank_coarse_proc_send_to,1,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
37780c7d97c5SJed Brown       /* Scatter receiving details to members of coarse decomposition */
37790c7d97c5SJed Brown       if ( coarse_color == 0) {
378053cdbc3dSStefano Zampini         ierr = MPI_Scatter(&total_count_recv[0],1,MPIU_INT,&count_recv,1,MPIU_INT,master_proc,coarse_comm);CHKERRQ(ierr);
37810c7d97c5SJed Brown         ierr = PetscMalloc (count_recv*sizeof(PetscMPIInt),&ranks_recv);CHKERRQ(ierr);
378253cdbc3dSStefano Zampini         ierr = MPI_Scatterv(&total_ranks_recv[0],total_count_recv,displacements_recv,MPIU_INT,&ranks_recv[0],count_recv,MPIU_INT,master_proc,coarse_comm);CHKERRQ(ierr);
37830c7d97c5SJed Brown       }
37840c7d97c5SJed Brown 
3785da1bb401SStefano Zampini       /*printf("I will send my matrix data to proc  %d\n",rank_coarse_proc_send_to);
3786da1bb401SStefano Zampini       if (coarse_color == 0) {
3787da1bb401SStefano Zampini         printf("I will receive some matrix data from %d processes (ranks follows)\n",count_recv);
3788da1bb401SStefano Zampini         for (i=0;i<count_recv;i++)
3789da1bb401SStefano Zampini           printf("%d ",ranks_recv[i]);
3790da1bb401SStefano Zampini         printf("\n");
3791da1bb401SStefano Zampini       }*/
37920c7d97c5SJed Brown 
37930c7d97c5SJed Brown       if (rank_prec_comm == master_proc) {
3794*0bdf917eSStefano Zampini         ierr = PetscFree(coarse_subdivision);CHKERRQ(ierr);
3795da1bb401SStefano Zampini         ierr = PetscFree(total_count_recv);CHKERRQ(ierr);
3796*0bdf917eSStefano Zampini         ierr = PetscFree(total_ranks_recv);CHKERRQ(ierr);
37970c7d97c5SJed Brown         ierr = PetscFree(displacements_recv);CHKERRQ(ierr);
37980c7d97c5SJed Brown       }
37990c7d97c5SJed Brown       break;
38000c7d97c5SJed Brown     }
38010c7d97c5SJed Brown 
38020c7d97c5SJed Brown     case(REPLICATED_BDDC):
38030c7d97c5SJed Brown 
38040c7d97c5SJed Brown       pcbddc->coarse_communications_type = GATHERS_BDDC;
38050c7d97c5SJed Brown       coarse_mat_type = MATSEQAIJ;
38060c7d97c5SJed Brown       coarse_pc_type  = PCLU;
380753cdbc3dSStefano Zampini       coarse_ksp_type  = KSPPREONLY;
38080c7d97c5SJed Brown       coarse_comm = PETSC_COMM_SELF;
38090c7d97c5SJed Brown       active_rank = rank_prec_comm;
38100c7d97c5SJed Brown       break;
38110c7d97c5SJed Brown 
38120c7d97c5SJed Brown     case(PARALLEL_BDDC):
38130c7d97c5SJed Brown 
38140c7d97c5SJed Brown       pcbddc->coarse_communications_type = SCATTERS_BDDC;
38150c7d97c5SJed Brown       coarse_mat_type = MATMPIAIJ;
38160c7d97c5SJed Brown       coarse_pc_type  = PCREDUNDANT;
381753cdbc3dSStefano Zampini       coarse_ksp_type  = KSPPREONLY;
38180c7d97c5SJed Brown       coarse_comm = prec_comm;
38190c7d97c5SJed Brown       active_rank = rank_prec_comm;
38200c7d97c5SJed Brown       break;
38210c7d97c5SJed Brown 
38220c7d97c5SJed Brown     case(SEQUENTIAL_BDDC):
38230c7d97c5SJed Brown       pcbddc->coarse_communications_type = GATHERS_BDDC;
38240c7d97c5SJed Brown       coarse_mat_type = MATSEQAIJ;
38250c7d97c5SJed Brown       coarse_pc_type = PCLU;
382653cdbc3dSStefano Zampini       coarse_ksp_type  = KSPPREONLY;
38270c7d97c5SJed Brown       coarse_comm = PETSC_COMM_SELF;
38280c7d97c5SJed Brown       active_rank = master_proc;
38290c7d97c5SJed Brown       break;
38300c7d97c5SJed Brown   }
38310c7d97c5SJed Brown 
38320c7d97c5SJed Brown   switch(pcbddc->coarse_communications_type){
38330c7d97c5SJed Brown 
38340c7d97c5SJed Brown     case(SCATTERS_BDDC):
38350c7d97c5SJed Brown       {
38360c7d97c5SJed Brown         if (pcbddc->coarse_problem_type==MULTILEVEL_BDDC) {
38370c7d97c5SJed Brown 
38380c7d97c5SJed Brown           PetscMPIInt send_size;
38390c7d97c5SJed Brown           PetscInt    *aux_ins_indices;
38400c7d97c5SJed Brown           PetscInt    ii,jj;
38410c7d97c5SJed Brown           MPI_Request *requests;
38420c7d97c5SJed Brown 
38430c7d97c5SJed Brown           /* allocate auxiliary space */
38445619798eSStefano Zampini           ierr = PetscMalloc (pcbddc->replicated_primal_size*sizeof(PetscMPIInt),&pcbddc->replicated_local_primal_indices);CHKERRQ(ierr);
38455619798eSStefano Zampini           ierr = MPI_Allgatherv(&pcbddc->local_primal_indices[0],pcbddc->local_primal_size,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,prec_comm);CHKERRQ(ierr);
38460c7d97c5SJed Brown           ierr = PetscMalloc ( pcbddc->coarse_size*sizeof(PetscInt),&aux_ins_indices);CHKERRQ(ierr);
38470c7d97c5SJed Brown           ierr = PetscMemzero(aux_ins_indices,pcbddc->coarse_size*sizeof(PetscInt));CHKERRQ(ierr);
38480c7d97c5SJed Brown           /* allocate storage for message passing */
38490c7d97c5SJed Brown           ierr = PetscMalloc ( (count_recv+1)*sizeof(MPI_Request),&requests);CHKERRQ(ierr);
38500c7d97c5SJed Brown           for (i=0;i<count_recv+1;i++) requests[i]=MPI_REQUEST_NULL;
38510c7d97c5SJed Brown           ierr = PetscMalloc ( count_recv*sizeof(PetscMPIInt),&localsizes2);CHKERRQ(ierr);
38520c7d97c5SJed Brown           ierr = PetscMalloc ( count_recv*sizeof(PetscMPIInt),&localdispl2);CHKERRQ(ierr);
38530c7d97c5SJed Brown           /* fill up quantities */
38540c7d97c5SJed Brown           j=0;
38550c7d97c5SJed Brown           for (i=0;i<count_recv;i++){
38560c7d97c5SJed Brown             ii = ranks_recv[i];
38570c7d97c5SJed Brown             localsizes2[i]=pcbddc->local_primal_sizes[ii]*pcbddc->local_primal_sizes[ii];
38580c7d97c5SJed Brown             localdispl2[i]=j;
38590c7d97c5SJed Brown             j+=localsizes2[i];
38600c7d97c5SJed Brown             jj = pcbddc->local_primal_displacements[ii];
3861da1bb401SStefano Zampini             for (k=0;k<pcbddc->local_primal_sizes[ii];k++) aux_ins_indices[pcbddc->replicated_local_primal_indices[jj+k]]+=1;  /* it counts the coarse subdomains sharing the coarse node */
38620c7d97c5SJed Brown           }
3863da1bb401SStefano Zampini           /*printf("aux_ins_indices 1\n");
3864da1bb401SStefano Zampini           for (i=0;i<pcbddc->coarse_size;i++)
3865da1bb401SStefano Zampini             printf("%d ",aux_ins_indices[i]);
3866da1bb401SStefano Zampini           printf("\n");*/
38670c7d97c5SJed Brown           /* temp_coarse_mat_vals used to store temporarily received matrix values */
38680c7d97c5SJed Brown           ierr = PetscMalloc ( j*sizeof(PetscScalar),&temp_coarse_mat_vals);CHKERRQ(ierr);
38690c7d97c5SJed Brown           /* evaluate how many values I will insert in coarse mat */
38700c7d97c5SJed Brown           ins_local_primal_size=0;
3871ea7e1babSStefano Zampini           for (i=0;i<pcbddc->coarse_size;i++){
3872ea7e1babSStefano Zampini             if (aux_ins_indices[i]){
38730c7d97c5SJed Brown               ins_local_primal_size++;
3874ea7e1babSStefano Zampini             }
3875ea7e1babSStefano Zampini           }
38760c7d97c5SJed Brown           /* evaluate indices I will insert in coarse mat */
38770c7d97c5SJed Brown           ierr = PetscMalloc ( ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr);
38780c7d97c5SJed Brown           j=0;
3879ea7e1babSStefano Zampini           for (i=0;i<pcbddc->coarse_size;i++){
3880ea7e1babSStefano Zampini             if (aux_ins_indices[i]){
38810c7d97c5SJed Brown               ins_local_primal_indices[j++]=i;
3882ea7e1babSStefano Zampini             }
3883ea7e1babSStefano Zampini           }
38840c7d97c5SJed Brown           /* use aux_ins_indices to realize a global to local mapping */
38850c7d97c5SJed Brown           j=0;
38860c7d97c5SJed Brown           for (i=0;i<pcbddc->coarse_size;i++){
38870c7d97c5SJed Brown             if (aux_ins_indices[i]==0){
38880c7d97c5SJed Brown               aux_ins_indices[i]=-1;
38890c7d97c5SJed Brown             } else {
38900c7d97c5SJed Brown               aux_ins_indices[i]=j;
38910c7d97c5SJed Brown               j++;
38920c7d97c5SJed Brown             }
38930c7d97c5SJed Brown           }
38940c7d97c5SJed Brown 
3895da1bb401SStefano Zampini           /*printf("New details localsizes2 localdispl2\n");
3896da1bb401SStefano Zampini           for (i=0;i<count_recv;i++)
3897da1bb401SStefano Zampini             printf("(%d %d) ",localsizes2[i],localdispl2[i]);
3898da1bb401SStefano Zampini           printf("\n");
3899da1bb401SStefano Zampini           printf("aux_ins_indices 2\n");
3900da1bb401SStefano Zampini           for (i=0;i<pcbddc->coarse_size;i++)
3901da1bb401SStefano Zampini             printf("%d ",aux_ins_indices[i]);
3902da1bb401SStefano Zampini           printf("\n");
3903da1bb401SStefano Zampini           printf("ins_local_primal_indices\n");
3904da1bb401SStefano Zampini           for (i=0;i<ins_local_primal_size;i++)
3905da1bb401SStefano Zampini             printf("%d ",ins_local_primal_indices[i]);
3906da1bb401SStefano Zampini           printf("\n");
3907da1bb401SStefano Zampini           printf("coarse_submat_vals\n");
3908da1bb401SStefano Zampini           for (i=0;i<pcbddc->local_primal_size;i++)
3909da1bb401SStefano Zampini             for (j=0;j<pcbddc->local_primal_size;j++)
3910da1bb401SStefano Zampini               printf("(%lf %d %d)\n",coarse_submat_vals[j*pcbddc->local_primal_size+i],pcbddc->local_primal_indices[i],pcbddc->local_primal_indices[j]);
3911da1bb401SStefano Zampini           printf("\n");*/
39120c7d97c5SJed Brown 
39130c7d97c5SJed Brown           /* processes participating in coarse problem receive matrix data from their friends */
391453cdbc3dSStefano Zampini           for (i=0;i<count_recv;i++) ierr = MPI_Irecv(&temp_coarse_mat_vals[localdispl2[i]],localsizes2[i],MPIU_SCALAR,ranks_recv[i],666,prec_comm,&requests[i]);CHKERRQ(ierr);
39150c7d97c5SJed Brown           if (rank_coarse_proc_send_to != MPI_PROC_NULL ) {
39160c7d97c5SJed Brown             send_size=pcbddc->local_primal_size*pcbddc->local_primal_size;
391753cdbc3dSStefano Zampini             ierr = MPI_Isend(&coarse_submat_vals[0],send_size,MPIU_SCALAR,rank_coarse_proc_send_to,666,prec_comm,&requests[count_recv]);CHKERRQ(ierr);
39180c7d97c5SJed Brown           }
391953cdbc3dSStefano Zampini           ierr = MPI_Waitall(count_recv+1,requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
39200c7d97c5SJed Brown 
3921da1bb401SStefano Zampini           /*if (coarse_color == 0) {
3922da1bb401SStefano Zampini             printf("temp_coarse_mat_vals\n");
3923da1bb401SStefano Zampini             for (k=0;k<count_recv;k++){
3924da1bb401SStefano Zampini               printf("---- %d ----\n",ranks_recv[k]);
3925da1bb401SStefano Zampini               for (i=0;i<pcbddc->local_primal_sizes[ranks_recv[k]];i++)
3926da1bb401SStefano Zampini                 for (j=0;j<pcbddc->local_primal_sizes[ranks_recv[k]];j++)
3927da1bb401SStefano Zampini                   printf("(%lf %d %d)\n",temp_coarse_mat_vals[localdispl2[k]+j*pcbddc->local_primal_sizes[ranks_recv[k]]+i],pcbddc->replicated_local_primal_indices[pcbddc->local_primal_displacements[ranks_recv[k]]+i],pcbddc->replicated_local_primal_indices[pcbddc->local_primal_displacements[ranks_recv[k]]+j]);
3928da1bb401SStefano Zampini               printf("\n");
3929da1bb401SStefano Zampini             }
3930da1bb401SStefano Zampini           }*/
39310c7d97c5SJed Brown           /* calculate data to insert in coarse mat */
39320c7d97c5SJed Brown           ierr = PetscMalloc ( ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar),&ins_coarse_mat_vals);CHKERRQ(ierr);
39330c7d97c5SJed Brown           PetscMemzero(ins_coarse_mat_vals,ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar));
39340c7d97c5SJed Brown 
39350c7d97c5SJed Brown           PetscMPIInt rr,kk,lps,lpd;
39360c7d97c5SJed Brown           PetscInt row_ind,col_ind;
39370c7d97c5SJed Brown           for (k=0;k<count_recv;k++){
39380c7d97c5SJed Brown             rr = ranks_recv[k];
39390c7d97c5SJed Brown             kk = localdispl2[k];
39400c7d97c5SJed Brown             lps = pcbddc->local_primal_sizes[rr];
39410c7d97c5SJed Brown             lpd = pcbddc->local_primal_displacements[rr];
3942da1bb401SStefano Zampini             /*printf("Inserting the following indices (received from %d)\n",rr);*/
39430c7d97c5SJed Brown             for (j=0;j<lps;j++){
39440c7d97c5SJed Brown               col_ind=aux_ins_indices[pcbddc->replicated_local_primal_indices[lpd+j]];
39450c7d97c5SJed Brown               for (i=0;i<lps;i++){
39460c7d97c5SJed Brown                 row_ind=aux_ins_indices[pcbddc->replicated_local_primal_indices[lpd+i]];
3947da1bb401SStefano Zampini                 /*printf("%d %d\n",row_ind,col_ind);*/
39480c7d97c5SJed Brown                 ins_coarse_mat_vals[col_ind*ins_local_primal_size+row_ind]+=temp_coarse_mat_vals[kk+j*lps+i];
39490c7d97c5SJed Brown               }
39500c7d97c5SJed Brown             }
39510c7d97c5SJed Brown           }
39520c7d97c5SJed Brown           ierr = PetscFree(requests);CHKERRQ(ierr);
39530c7d97c5SJed Brown           ierr = PetscFree(aux_ins_indices);CHKERRQ(ierr);
39540c7d97c5SJed Brown           ierr = PetscFree(temp_coarse_mat_vals);CHKERRQ(ierr);
39550c7d97c5SJed Brown           if (coarse_color == 0) { ierr = PetscFree(ranks_recv);CHKERRQ(ierr); }
39560c7d97c5SJed Brown 
39570c7d97c5SJed Brown           /* create local to global mapping needed by coarse MATIS */
39580c7d97c5SJed Brown           {
39590c7d97c5SJed Brown             IS coarse_IS;
3960142dfd88SStefano Zampini             if (coarse_comm != MPI_COMM_NULL ) {ierr = MPI_Comm_free(&coarse_comm);CHKERRQ(ierr);}
39610c7d97c5SJed Brown             coarse_comm = prec_comm;
39620c7d97c5SJed Brown             active_rank=rank_prec_comm;
39630c7d97c5SJed Brown             ierr = ISCreateGeneral(coarse_comm,ins_local_primal_size,ins_local_primal_indices,PETSC_COPY_VALUES,&coarse_IS);CHKERRQ(ierr);
39640c7d97c5SJed Brown             ierr = ISLocalToGlobalMappingCreateIS(coarse_IS,&coarse_ISLG);CHKERRQ(ierr);
39650c7d97c5SJed Brown             ierr = ISDestroy(&coarse_IS);CHKERRQ(ierr);
39660c7d97c5SJed Brown           }
39670c7d97c5SJed Brown         }
39680c7d97c5SJed Brown         if (pcbddc->coarse_problem_type==PARALLEL_BDDC) {
39690c7d97c5SJed Brown           /* arrays for values insertion */
39700c7d97c5SJed Brown           ins_local_primal_size = pcbddc->local_primal_size;
39710c7d97c5SJed Brown           ierr = PetscMalloc ( ins_local_primal_size*sizeof(PetscMPIInt),&ins_local_primal_indices);CHKERRQ(ierr);
39720c7d97c5SJed Brown           ierr = PetscMalloc ( ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar),&ins_coarse_mat_vals);CHKERRQ(ierr);
39730c7d97c5SJed Brown           for (j=0;j<ins_local_primal_size;j++){
39740c7d97c5SJed Brown             ins_local_primal_indices[j]=pcbddc->local_primal_indices[j];
39750c7d97c5SJed Brown             for (i=0;i<ins_local_primal_size;i++) ins_coarse_mat_vals[j*ins_local_primal_size+i]=coarse_submat_vals[j*ins_local_primal_size+i];
39760c7d97c5SJed Brown           }
39770c7d97c5SJed Brown         }
39780c7d97c5SJed Brown         break;
39790c7d97c5SJed Brown 
39800c7d97c5SJed Brown     }
39810c7d97c5SJed Brown 
39820c7d97c5SJed Brown     case(GATHERS_BDDC):
39830c7d97c5SJed Brown       {
39840c7d97c5SJed Brown 
39850c7d97c5SJed Brown         PetscMPIInt mysize,mysize2;
39860c7d97c5SJed Brown 
39870c7d97c5SJed Brown         if (rank_prec_comm==active_rank) {
39880c7d97c5SJed Brown           ierr = PetscMalloc ( pcbddc->replicated_primal_size*sizeof(PetscMPIInt),&pcbddc->replicated_local_primal_indices);CHKERRQ(ierr);
3989*0bdf917eSStefano Zampini           ierr = PetscMalloc ( pcbddc->replicated_primal_size*sizeof(PetscScalar),&pcbddc->replicated_local_primal_values);CHKERRQ(ierr);
39900c7d97c5SJed Brown           ierr = PetscMalloc ( size_prec_comm*sizeof(PetscMPIInt),&localsizes2);CHKERRQ(ierr);
39910c7d97c5SJed Brown           ierr = PetscMalloc ( size_prec_comm*sizeof(PetscMPIInt),&localdispl2);CHKERRQ(ierr);
39920c7d97c5SJed Brown           /* arrays for values insertion */
39930c7d97c5SJed Brown           for (i=0;i<size_prec_comm;i++) localsizes2[i]=pcbddc->local_primal_sizes[i]*pcbddc->local_primal_sizes[i];
39940c7d97c5SJed Brown           localdispl2[0]=0;
39950c7d97c5SJed Brown           for (i=1;i<size_prec_comm;i++) localdispl2[i]=localsizes2[i-1]+localdispl2[i-1];
39960c7d97c5SJed Brown           j=0;
39970c7d97c5SJed Brown           for (i=0;i<size_prec_comm;i++) j+=localsizes2[i];
39980c7d97c5SJed Brown           ierr = PetscMalloc ( j*sizeof(PetscScalar),&temp_coarse_mat_vals);CHKERRQ(ierr);
39990c7d97c5SJed Brown         }
40000c7d97c5SJed Brown 
40010c7d97c5SJed Brown         mysize=pcbddc->local_primal_size;
40020c7d97c5SJed Brown         mysize2=pcbddc->local_primal_size*pcbddc->local_primal_size;
40030c7d97c5SJed Brown         if (pcbddc->coarse_problem_type == SEQUENTIAL_BDDC){
400453cdbc3dSStefano Zampini           ierr = MPI_Gatherv(&pcbddc->local_primal_indices[0],mysize,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
400553cdbc3dSStefano Zampini           ierr = MPI_Gatherv(&coarse_submat_vals[0],mysize2,MPIU_SCALAR,&temp_coarse_mat_vals[0],localsizes2,localdispl2,MPIU_SCALAR,master_proc,prec_comm);CHKERRQ(ierr);
40060c7d97c5SJed Brown         } else {
400753cdbc3dSStefano Zampini           ierr = MPI_Allgatherv(&pcbddc->local_primal_indices[0],mysize,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,prec_comm);CHKERRQ(ierr);
400853cdbc3dSStefano Zampini           ierr = MPI_Allgatherv(&coarse_submat_vals[0],mysize2,MPIU_SCALAR,&temp_coarse_mat_vals[0],localsizes2,localdispl2,MPIU_SCALAR,prec_comm);CHKERRQ(ierr);
40090c7d97c5SJed Brown         }
40100c7d97c5SJed Brown         break;
4011da1bb401SStefano Zampini       }/* switch on coarse problem and communications associated with finished */
40120c7d97c5SJed Brown   }
40130c7d97c5SJed Brown 
40140c7d97c5SJed Brown   /* Now create and fill up coarse matrix */
40150c7d97c5SJed Brown   if ( rank_prec_comm == active_rank ) {
4016142dfd88SStefano Zampini 
4017142dfd88SStefano Zampini     Mat matis_coarse_local_mat;
4018142dfd88SStefano Zampini 
40190c7d97c5SJed Brown     if (pcbddc->coarse_problem_type != MULTILEVEL_BDDC) {
40200c7d97c5SJed Brown       ierr = MatCreate(coarse_comm,&pcbddc->coarse_mat);CHKERRQ(ierr);
40210c7d97c5SJed Brown       ierr = MatSetSizes(pcbddc->coarse_mat,PETSC_DECIDE,PETSC_DECIDE,pcbddc->coarse_size,pcbddc->coarse_size);CHKERRQ(ierr);
40220c7d97c5SJed Brown       ierr = MatSetType(pcbddc->coarse_mat,coarse_mat_type);CHKERRQ(ierr);
40233b03a366Sstefano_zampini       ierr = MatSetUp(pcbddc->coarse_mat);CHKERRQ(ierr);
4024da1bb401SStefano Zampini       ierr = MatSetOption(pcbddc->coarse_mat,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr); /* local values stored in column major */
40253b03a366Sstefano_zampini       ierr = MatSetOption(pcbddc->coarse_mat,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr);
40260c7d97c5SJed Brown     } else {
4027d3ee2243SStefano Zampini       /* remind bs */
4028d3ee2243SStefano Zampini       ierr = MatCreateIS(coarse_comm,bs,PETSC_DECIDE,PETSC_DECIDE,pcbddc->coarse_size,pcbddc->coarse_size,coarse_ISLG,&pcbddc->coarse_mat);CHKERRQ(ierr);
40293b03a366Sstefano_zampini       ierr = MatSetUp(pcbddc->coarse_mat);CHKERRQ(ierr);
40300c7d97c5SJed Brown       ierr = MatISGetLocalMat(pcbddc->coarse_mat,&matis_coarse_local_mat);CHKERRQ(ierr);
40313b03a366Sstefano_zampini       ierr = MatSetUp(matis_coarse_local_mat);CHKERRQ(ierr);
4032da1bb401SStefano Zampini       ierr = MatSetOption(matis_coarse_local_mat,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr); /* local values stored in column major */
4033a0ba757dSStefano Zampini       ierr = MatSetOption(matis_coarse_local_mat,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr);
40340c7d97c5SJed Brown     }
4035142dfd88SStefano Zampini     /* preallocation */
4036142dfd88SStefano Zampini     if (pcbddc->coarse_problem_type != MULTILEVEL_BDDC) {
4037142dfd88SStefano Zampini       PetscInt *dnz,*onz;
4038142dfd88SStefano Zampini       PetscInt lrows,lcols;
4039142dfd88SStefano Zampini       ierr = MatGetLocalSize(pcbddc->coarse_mat,&lrows,&lcols);CHKERRQ(ierr);
4040142dfd88SStefano Zampini       ierr = MatPreallocateInitialize(coarse_comm,lrows,lcols,dnz,onz);CHKERRQ(ierr);
4041142dfd88SStefano Zampini       if (pcbddc->coarse_problem_type == PARALLEL_BDDC) {
4042142dfd88SStefano Zampini         PetscInt coarse_index_row,coarse_index_col,start_row,owner;
4043142dfd88SStefano Zampini         PetscMPIInt *auxpreall_displs;
4044142dfd88SStefano Zampini         PetscMPIInt *auxpreall_sizes;
4045142dfd88SStefano Zampini         PetscMPIInt *auxpreall_dnz;
4046142dfd88SStefano Zampini         PetscMPIInt *auxpreall_onz;
4047142dfd88SStefano Zampini         PetscInt    *auxpreall_ownership;
4048142dfd88SStefano Zampini         if (rank_prec_comm == 0) {
4049142dfd88SStefano Zampini           ierr = PetscMalloc((size_prec_comm+1)*sizeof(PetscMPIInt),&auxpreall_displs);CHKERRQ(ierr);
4050142dfd88SStefano Zampini           auxpreall_displs[size_prec_comm]=pcbddc->coarse_size;
4051142dfd88SStefano Zampini           ierr = PetscMalloc(size_prec_comm*sizeof(PetscMPIInt),&auxpreall_sizes);CHKERRQ(ierr);
4052142dfd88SStefano Zampini           ierr = PetscMalloc(pcbddc->coarse_size*sizeof(PetscMPIInt),&auxpreall_dnz);CHKERRQ(ierr);
4053142dfd88SStefano Zampini           ierr = PetscMemzero(auxpreall_dnz,pcbddc->coarse_size*sizeof(PetscMPIInt));CHKERRQ(ierr);
4054142dfd88SStefano Zampini           ierr = PetscMalloc(pcbddc->coarse_size*sizeof(PetscMPIInt),&auxpreall_onz);CHKERRQ(ierr);
4055142dfd88SStefano Zampini           ierr = PetscMemzero(auxpreall_onz,pcbddc->coarse_size*sizeof(PetscMPIInt));CHKERRQ(ierr);
4056142dfd88SStefano Zampini           ierr = PetscMalloc(pcbddc->coarse_size*sizeof(PetscInt),&auxpreall_ownership);CHKERRQ(ierr);
4057142dfd88SStefano Zampini         }
4058142dfd88SStefano Zampini         ierr = MatGetOwnershipRange(pcbddc->coarse_mat,&start_row,PETSC_NULL);CHKERRQ(ierr);
4059142dfd88SStefano Zampini         ierr = MPI_Gather(&start_row,1,MPIU_INT,auxpreall_displs,1,MPIU_INT,0,prec_comm);CHKERRQ(ierr);
4060142dfd88SStefano Zampini         if (rank_prec_comm == 0) {
4061142dfd88SStefano Zampini           k=0;
4062142dfd88SStefano Zampini           for (i=0;i<size_prec_comm;i++) {
4063142dfd88SStefano Zampini             auxpreall_sizes[i]=auxpreall_displs[i+1]-auxpreall_displs[i];
4064142dfd88SStefano Zampini             for (j=0;j<auxpreall_sizes[i];j++) {
4065142dfd88SStefano Zampini               auxpreall_ownership[auxpreall_displs[i]+j]=i;
4066142dfd88SStefano Zampini             }
4067142dfd88SStefano Zampini           }
4068142dfd88SStefano Zampini           for (i=0;i<size_prec_comm;i++) {
4069142dfd88SStefano Zampini             for (j=0;j<pcbddc->local_primal_sizes[i];j++) {
4070142dfd88SStefano Zampini               coarse_index_row=auxglobal_primal[j+pcbddc->local_primal_displacements[i]];
4071142dfd88SStefano Zampini               for (k=j;k<pcbddc->local_primal_sizes[i];k++) {
4072142dfd88SStefano Zampini                 coarse_index_col=auxglobal_primal[k+pcbddc->local_primal_displacements[i]];
4073142dfd88SStefano Zampini                 owner = auxpreall_ownership[coarse_index_row];
4074142dfd88SStefano Zampini                 if (coarse_index_col>auxpreall_displs[owner]-1 && coarse_index_col < auxpreall_displs[owner]+auxpreall_sizes[owner]) {
4075142dfd88SStefano Zampini                   auxpreall_dnz[coarse_index_row]++;
4076142dfd88SStefano Zampini                 } else {
4077142dfd88SStefano Zampini                   auxpreall_onz[coarse_index_row]++;
4078142dfd88SStefano Zampini                 }
4079142dfd88SStefano Zampini                 if (k != j) {
4080142dfd88SStefano Zampini                   owner = auxpreall_ownership[coarse_index_col];
4081142dfd88SStefano Zampini                   if (coarse_index_row>auxpreall_displs[owner]-1 && coarse_index_row < auxpreall_displs[owner]+auxpreall_sizes[owner]) {
4082142dfd88SStefano Zampini                     auxpreall_dnz[coarse_index_col]++;
4083142dfd88SStefano Zampini                   } else {
4084142dfd88SStefano Zampini                     auxpreall_onz[coarse_index_col]++;
4085142dfd88SStefano Zampini                   }
4086142dfd88SStefano Zampini                 }
4087142dfd88SStefano Zampini               }
4088142dfd88SStefano Zampini             }
4089142dfd88SStefano Zampini           }
4090142dfd88SStefano Zampini         }
4091142dfd88SStefano Zampini         ierr = MPI_Scatterv(auxpreall_dnz,auxpreall_sizes,auxpreall_displs,MPIU_INT,
4092142dfd88SStefano Zampini                             dnz,lrows,MPIU_INT,0,prec_comm);
4093142dfd88SStefano Zampini         ierr = MPI_Scatterv(auxpreall_onz,auxpreall_sizes,auxpreall_displs,MPIU_INT,
4094142dfd88SStefano Zampini                             onz,lrows,MPIU_INT,0,prec_comm);
4095142dfd88SStefano Zampini         if (rank_prec_comm == 0) {
4096142dfd88SStefano Zampini           ierr = PetscFree(auxpreall_displs);CHKERRQ(ierr);
4097142dfd88SStefano Zampini           ierr = PetscFree(auxpreall_sizes);CHKERRQ(ierr);
4098142dfd88SStefano Zampini           ierr = PetscFree(auxpreall_dnz);CHKERRQ(ierr);
4099142dfd88SStefano Zampini           ierr = PetscFree(auxpreall_onz);CHKERRQ(ierr);
4100142dfd88SStefano Zampini           ierr = PetscFree(auxpreall_ownership);CHKERRQ(ierr);
4101142dfd88SStefano Zampini         }
4102142dfd88SStefano Zampini       } else {
4103142dfd88SStefano Zampini         for (k=0;k<size_prec_comm;k++){
4104142dfd88SStefano Zampini           offset=pcbddc->local_primal_displacements[k];
4105142dfd88SStefano Zampini           offset2=localdispl2[k];
4106142dfd88SStefano Zampini           ins_local_primal_size = pcbddc->local_primal_sizes[k];
4107142dfd88SStefano Zampini           ins_local_primal_indices = &pcbddc->replicated_local_primal_indices[offset];
4108142dfd88SStefano Zampini           for (j=0;j<ins_local_primal_size;j++) {
4109142dfd88SStefano Zampini             ierr = MatPreallocateSet(ins_local_primal_indices[j],ins_local_primal_size,ins_local_primal_indices,dnz,onz);CHKERRQ(ierr);
4110142dfd88SStefano Zampini           }
4111142dfd88SStefano Zampini         }
4112142dfd88SStefano Zampini       }
4113142dfd88SStefano Zampini       /* check */
4114142dfd88SStefano Zampini       for (i=0;i<lrows;i++) {
4115142dfd88SStefano Zampini         if (dnz[i]>lcols) {
4116142dfd88SStefano Zampini           dnz[i]=lcols;
4117142dfd88SStefano Zampini         }
4118142dfd88SStefano Zampini         if (onz[i]>pcbddc->coarse_size-lcols) {
4119142dfd88SStefano Zampini           onz[i]=pcbddc->coarse_size-lcols;
4120142dfd88SStefano Zampini         }
4121142dfd88SStefano Zampini       }
4122142dfd88SStefano Zampini       ierr = MatSeqAIJSetPreallocation(pcbddc->coarse_mat,PETSC_NULL,dnz);CHKERRQ(ierr);
4123142dfd88SStefano Zampini       ierr = MatMPIAIJSetPreallocation(pcbddc->coarse_mat,PETSC_NULL,dnz,PETSC_NULL,onz);CHKERRQ(ierr);
4124142dfd88SStefano Zampini       ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr);
4125142dfd88SStefano Zampini     } else {
4126142dfd88SStefano Zampini       ierr = MatSeqAIJSetPreallocation(matis_coarse_local_mat,ins_local_primal_size,PETSC_NULL);CHKERRQ(ierr);
4127142dfd88SStefano Zampini     }
4128142dfd88SStefano Zampini     if (rank_prec_comm == 0) { ierr = PetscFree(auxglobal_primal);CHKERRQ(ierr); }
4129142dfd88SStefano Zampini     /* insert values */
4130ea7e1babSStefano Zampini     if (pcbddc->coarse_communications_type != GATHERS_BDDC) {
41310c7d97c5SJed Brown       ierr = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,ADD_VALUES);CHKERRQ(ierr);
4132ea7e1babSStefano Zampini     } else {
4133ea7e1babSStefano Zampini       for (k=0;k<size_prec_comm;k++){
4134ea7e1babSStefano Zampini         offset=pcbddc->local_primal_displacements[k];
4135ea7e1babSStefano Zampini         offset2=localdispl2[k];
4136ea7e1babSStefano Zampini         ins_local_primal_size = pcbddc->local_primal_sizes[k];
4137ea7e1babSStefano Zampini         ins_local_primal_indices = &pcbddc->replicated_local_primal_indices[offset];
4138ea7e1babSStefano Zampini         ins_coarse_mat_vals = &temp_coarse_mat_vals[offset2];
4139ea7e1babSStefano Zampini         ierr = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,ADD_VALUES);CHKERRQ(ierr);
4140ea7e1babSStefano Zampini       }
4141ea7e1babSStefano Zampini       ins_local_primal_indices = 0;
4142ea7e1babSStefano Zampini       ins_coarse_mat_vals = 0;
4143ea7e1babSStefano Zampini     }
41440c7d97c5SJed Brown     ierr = MatAssemblyBegin(pcbddc->coarse_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
41450c7d97c5SJed Brown     ierr = MatAssemblyEnd(pcbddc->coarse_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
4146142dfd88SStefano Zampini     /* symmetry of coarse matrix */
4147142dfd88SStefano Zampini     if (issym) {
4148142dfd88SStefano Zampini       ierr = MatSetOption(pcbddc->coarse_mat,MAT_SYMMETRIC,PETSC_TRUE);CHKERRQ(ierr);
4149142dfd88SStefano Zampini     }
41500c7d97c5SJed Brown     ierr = MatGetVecs(pcbddc->coarse_mat,&pcbddc->coarse_vec,&pcbddc->coarse_rhs);CHKERRQ(ierr);
4151*0bdf917eSStefano Zampini   }
4152*0bdf917eSStefano Zampini 
4153*0bdf917eSStefano Zampini   /* create loc to glob scatters if needed */
4154*0bdf917eSStefano Zampini   if (pcbddc->coarse_communications_type == SCATTERS_BDDC) {
4155*0bdf917eSStefano Zampini      IS local_IS,global_IS;
4156*0bdf917eSStefano Zampini      ierr = ISCreateStride(PETSC_COMM_SELF,pcbddc->local_primal_size,0,1,&local_IS);CHKERRQ(ierr);
4157*0bdf917eSStefano Zampini      ierr = ISCreateGeneral(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_indices,PETSC_COPY_VALUES,&global_IS);CHKERRQ(ierr);
4158*0bdf917eSStefano Zampini      ierr = VecScatterCreate(pcbddc->vec1_P,local_IS,pcbddc->coarse_vec,global_IS,&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr);
4159*0bdf917eSStefano Zampini      ierr = ISDestroy(&local_IS);CHKERRQ(ierr);
4160*0bdf917eSStefano Zampini      ierr = ISDestroy(&global_IS);CHKERRQ(ierr);
4161*0bdf917eSStefano Zampini   }
4162*0bdf917eSStefano Zampini 
4163*0bdf917eSStefano Zampini   /* Eval coarse null space */
4164*0bdf917eSStefano Zampini   if (pcbddc->NullSpace) {
4165*0bdf917eSStefano Zampini     const Vec      *nsp_vecs;
4166*0bdf917eSStefano Zampini     PetscInt       nsp_size,coarse_nsp_size;
4167*0bdf917eSStefano Zampini     PetscBool      nsp_has_cnst;
4168*0bdf917eSStefano Zampini     PetscReal      test_null;
4169*0bdf917eSStefano Zampini     Vec            *coarse_nsp_vecs;
4170*0bdf917eSStefano Zampini 
4171*0bdf917eSStefano Zampini     coarse_nsp_size = 0;
4172*0bdf917eSStefano Zampini     coarse_nsp_vecs = 0;
4173*0bdf917eSStefano Zampini     ierr = MatNullSpaceGetVecs(pcbddc->NullSpace,&nsp_has_cnst,&nsp_size,&nsp_vecs);CHKERRQ(ierr);
4174*0bdf917eSStefano Zampini     if (rank_prec_comm == active_rank) {
4175*0bdf917eSStefano Zampini       ierr = PetscMalloc((nsp_size+1)*sizeof(Vec),&coarse_nsp_vecs);CHKERRQ(ierr);
4176*0bdf917eSStefano Zampini       for (i=0;i<nsp_size+1;i++) {
4177*0bdf917eSStefano Zampini         ierr = VecDuplicate(pcbddc->coarse_vec,&coarse_nsp_vecs[i]);CHKERRQ(ierr);
4178*0bdf917eSStefano Zampini       }
4179*0bdf917eSStefano Zampini     }
4180*0bdf917eSStefano Zampini     if (nsp_has_cnst) {
4181*0bdf917eSStefano Zampini       ierr = VecSet(pcis->vec1_N,1.0);CHKERRQ(ierr);
4182*0bdf917eSStefano Zampini       ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr);
4183*0bdf917eSStefano Zampini       ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->vec1_P,pcbddc->coarse_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4184*0bdf917eSStefano Zampini       ierr = PCBDDCScatterCoarseDataEnd(pc,pcbddc->vec1_P,pcbddc->coarse_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4185*0bdf917eSStefano Zampini       if (rank_prec_comm == active_rank) {
4186*0bdf917eSStefano Zampini         ierr = MatMult(pcbddc->coarse_mat,pcbddc->coarse_vec,pcbddc->coarse_rhs);CHKERRQ(ierr);
4187*0bdf917eSStefano Zampini         ierr = VecNorm(pcbddc->coarse_rhs,NORM_INFINITY,&test_null);CHKERRQ(ierr);
4188*0bdf917eSStefano Zampini         if (test_null > 1.0e-12 && pcbddc->dbg_flag ) {
4189*0bdf917eSStefano Zampini           ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Constant coarse null space error % 1.14e\n",test_null);CHKERRQ(ierr);
4190*0bdf917eSStefano Zampini         }
4191*0bdf917eSStefano Zampini         ierr = VecCopy(pcbddc->coarse_vec,coarse_nsp_vecs[coarse_nsp_size]);CHKERRQ(ierr);
4192*0bdf917eSStefano Zampini         coarse_nsp_size++;
4193*0bdf917eSStefano Zampini       }
4194*0bdf917eSStefano Zampini     }
4195*0bdf917eSStefano Zampini     for (i=0;i<nsp_size;i++)  {
4196*0bdf917eSStefano Zampini       ierr = VecScatterBegin(matis->ctx,nsp_vecs[i],pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4197*0bdf917eSStefano Zampini       ierr = VecScatterEnd  (matis->ctx,nsp_vecs[i],pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4198*0bdf917eSStefano Zampini       ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr);
4199*0bdf917eSStefano Zampini       ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->vec1_P,pcbddc->coarse_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4200*0bdf917eSStefano Zampini       ierr = PCBDDCScatterCoarseDataEnd(pc,pcbddc->vec1_P,pcbddc->coarse_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4201*0bdf917eSStefano Zampini       if (rank_prec_comm == active_rank) {
4202*0bdf917eSStefano Zampini         ierr = MatMult(pcbddc->coarse_mat,pcbddc->coarse_vec,pcbddc->coarse_rhs);CHKERRQ(ierr);
4203*0bdf917eSStefano Zampini         ierr = VecNorm(pcbddc->coarse_rhs,NORM_2,&test_null);CHKERRQ(ierr);
4204*0bdf917eSStefano Zampini         if (test_null > 1.0e-12 && pcbddc->dbg_flag ) {
4205*0bdf917eSStefano Zampini           ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Vec %d coarse null space error % 1.14e\n",i,test_null);CHKERRQ(ierr);
4206*0bdf917eSStefano Zampini         }
4207*0bdf917eSStefano Zampini         ierr = VecCopy(pcbddc->coarse_vec,coarse_nsp_vecs[coarse_nsp_size]);CHKERRQ(ierr);
4208*0bdf917eSStefano Zampini         coarse_nsp_size++;
4209*0bdf917eSStefano Zampini       }
4210*0bdf917eSStefano Zampini     }
4211*0bdf917eSStefano Zampini     if (coarse_nsp_size > 0) {
4212*0bdf917eSStefano Zampini       /* TODO orthonormalize vecs */
4213*0bdf917eSStefano Zampini       ierr = VecNormalize(coarse_nsp_vecs[0],PETSC_NULL);CHKERRQ(ierr);
4214*0bdf917eSStefano Zampini       ierr = MatNullSpaceCreate(coarse_comm,PETSC_FALSE,coarse_nsp_size,coarse_nsp_vecs,&pcbddc->CoarseNullSpace);CHKERRQ(ierr);
4215*0bdf917eSStefano Zampini       for (i=0;i<nsp_size+1;i++) {
4216*0bdf917eSStefano Zampini         ierr = VecDestroy(&coarse_nsp_vecs[i]);CHKERRQ(ierr);
4217*0bdf917eSStefano Zampini       }
4218*0bdf917eSStefano Zampini     }
4219*0bdf917eSStefano Zampini     ierr = PetscFree(coarse_nsp_vecs);CHKERRQ(ierr);
4220*0bdf917eSStefano Zampini   }
4221*0bdf917eSStefano Zampini 
4222*0bdf917eSStefano Zampini   /* KSP for coarse problem */
4223*0bdf917eSStefano Zampini   if (rank_prec_comm == active_rank) {
4224*0bdf917eSStefano Zampini 
422553cdbc3dSStefano Zampini     ierr = KSPCreate(coarse_comm,&pcbddc->coarse_ksp);CHKERRQ(ierr);
422653cdbc3dSStefano Zampini     ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->coarse_ksp,(PetscObject)pc,1);CHKERRQ(ierr);
422753cdbc3dSStefano Zampini     ierr = KSPSetOperators(pcbddc->coarse_ksp,pcbddc->coarse_mat,pcbddc->coarse_mat,SAME_PRECONDITIONER);CHKERRQ(ierr);
42283b03a366Sstefano_zampini     ierr = KSPSetTolerances(pcbddc->coarse_ksp,PETSC_DEFAULT,PETSC_DEFAULT,PETSC_DEFAULT,max_it_coarse_ksp);CHKERRQ(ierr);
422953cdbc3dSStefano Zampini     ierr = KSPSetType(pcbddc->coarse_ksp,coarse_ksp_type);CHKERRQ(ierr);
423053cdbc3dSStefano Zampini     ierr = KSPGetPC(pcbddc->coarse_ksp,&pc_temp);CHKERRQ(ierr);
423153cdbc3dSStefano Zampini     ierr = PCSetType(pc_temp,coarse_pc_type);CHKERRQ(ierr);
42320c7d97c5SJed Brown     /* Allow user's customization */
4233da1bb401SStefano Zampini     ierr = KSPSetOptionsPrefix(pcbddc->coarse_ksp,"coarse_");CHKERRQ(ierr);
423453cdbc3dSStefano Zampini     ierr = KSPSetFromOptions(pcbddc->coarse_ksp);CHKERRQ(ierr);
42350c7d97c5SJed Brown     /* Set Up PC for coarse problem BDDC */
423653cdbc3dSStefano Zampini     if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
4237e269702eSStefano Zampini       if (dbg_flag) {
4238e269702eSStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"----------------Setting up a new level---------------\n");CHKERRQ(ierr);
4239e269702eSStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
4240e269702eSStefano Zampini       }
424153cdbc3dSStefano Zampini       ierr = PCBDDCSetCoarseProblemType(pc_temp,MULTILEVEL_BDDC);CHKERRQ(ierr);
4242*0bdf917eSStefano Zampini       if (pcbddc->CoarseNullSpace) { ierr = PCBDDCSetNullSpace(pc_temp,pcbddc->CoarseNullSpace);CHKERRQ(ierr); }
4243e4886b5aSStefano Zampini       ierr = KSPSetNormType(pcbddc->coarse_ksp,KSP_NORM_NONE);CHKERRQ(ierr);
424453cdbc3dSStefano Zampini     }
424553cdbc3dSStefano Zampini     ierr = KSPSetUp(pcbddc->coarse_ksp);CHKERRQ(ierr);
4246142dfd88SStefano Zampini 
4247*0bdf917eSStefano Zampini     if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
4248*0bdf917eSStefano Zampini       /* TODO: this is a hack! It needs to be solved! */
4249142dfd88SStefano Zampini       PC_BDDC*     coarse_pcbddc = (PC_BDDC*)pc_temp->data;
4250142dfd88SStefano Zampini       coarse_pcbddc->use_exact_dirichlet = PETSC_FALSE;
42515619798eSStefano Zampini       if (dbg_flag) {
42525619798eSStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"----------------New level set------------------------\n");CHKERRQ(ierr);
42535619798eSStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
42545619798eSStefano Zampini       }
42555619798eSStefano Zampini     }
42560c7d97c5SJed Brown   }
42573b03a366Sstefano_zampini   /* Evaluate condition number of coarse problem for cheby (and verbose output if requested) */
4258142dfd88SStefano Zampini   if ( dbg_flag && rank_prec_comm == active_rank ) {
4259142dfd88SStefano Zampini     KSP check_ksp;
4260142dfd88SStefano Zampini     PC  check_pc;
4261142dfd88SStefano Zampini     Vec check_vec;
4262142dfd88SStefano Zampini     PetscReal   abs_infty_error,infty_error,lambda_min,lambda_max;
4263142dfd88SStefano Zampini     const KSPType check_ksp_type;
42640c7d97c5SJed Brown 
4265142dfd88SStefano Zampini     /* Create ksp object suitable for extreme eigenvalues' estimation */
4266142dfd88SStefano Zampini     ierr = KSPCreate(coarse_comm,&check_ksp);CHKERRQ(ierr);
4267142dfd88SStefano Zampini     ierr = KSPSetOperators(check_ksp,pcbddc->coarse_mat,pcbddc->coarse_mat,SAME_PRECONDITIONER);CHKERRQ(ierr);
4268*0bdf917eSStefano Zampini     ierr = KSPSetTolerances(check_ksp,1.e-12,1.e-12,PETSC_DEFAULT,pcbddc->coarse_size);CHKERRQ(ierr);
4269142dfd88SStefano Zampini     if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
4270142dfd88SStefano Zampini       if (issym) {
4271142dfd88SStefano Zampini         check_ksp_type = KSPCG;
4272142dfd88SStefano Zampini       } else {
4273142dfd88SStefano Zampini         check_ksp_type = KSPGMRES;
4274142dfd88SStefano Zampini       }
4275142dfd88SStefano Zampini       ierr = KSPSetComputeSingularValues(check_ksp,PETSC_TRUE);CHKERRQ(ierr);
4276142dfd88SStefano Zampini     } else {
4277142dfd88SStefano Zampini       check_ksp_type = KSPPREONLY;
4278142dfd88SStefano Zampini     }
4279142dfd88SStefano Zampini     ierr = KSPSetType(check_ksp,check_ksp_type);CHKERRQ(ierr);
4280142dfd88SStefano Zampini     ierr = KSPGetPC(pcbddc->coarse_ksp,&check_pc);CHKERRQ(ierr);
4281142dfd88SStefano Zampini     ierr = KSPSetPC(check_ksp,check_pc);CHKERRQ(ierr);
4282142dfd88SStefano Zampini     ierr = KSPSetUp(check_ksp);CHKERRQ(ierr);
4283142dfd88SStefano Zampini     /* create random vec */
4284142dfd88SStefano Zampini     ierr = VecDuplicate(pcbddc->coarse_vec,&check_vec);CHKERRQ(ierr);
4285142dfd88SStefano Zampini     ierr = VecSetRandom(check_vec,PETSC_NULL);CHKERRQ(ierr);
4286*0bdf917eSStefano Zampini     if (pcbddc->CoarseNullSpace) { ierr = MatNullSpaceRemove(pcbddc->CoarseNullSpace,check_vec,PETSC_NULL);CHKERRQ(ierr); }
4287142dfd88SStefano Zampini     ierr = MatMult(pcbddc->coarse_mat,check_vec,pcbddc->coarse_rhs);CHKERRQ(ierr);
4288142dfd88SStefano Zampini     /* solve coarse problem */
4289142dfd88SStefano Zampini     ierr = KSPSolve(check_ksp,pcbddc->coarse_rhs,pcbddc->coarse_vec);CHKERRQ(ierr);
4290*0bdf917eSStefano Zampini     if (pcbddc->CoarseNullSpace) { ierr = MatNullSpaceRemove(pcbddc->CoarseNullSpace,pcbddc->coarse_vec,PETSC_NULL);CHKERRQ(ierr); }
4291142dfd88SStefano Zampini     /* check coarse problem residual error */
4292142dfd88SStefano Zampini     ierr = VecAXPY(check_vec,-1.0,pcbddc->coarse_vec);CHKERRQ(ierr);
4293142dfd88SStefano Zampini     ierr = VecNorm(check_vec,NORM_INFINITY,&infty_error);CHKERRQ(ierr);
4294142dfd88SStefano Zampini     ierr = MatMult(pcbddc->coarse_mat,check_vec,pcbddc->coarse_rhs);CHKERRQ(ierr);
4295142dfd88SStefano Zampini     ierr = VecNorm(pcbddc->coarse_rhs,NORM_INFINITY,&abs_infty_error);CHKERRQ(ierr);
4296142dfd88SStefano Zampini     ierr = VecDestroy(&check_vec);CHKERRQ(ierr);
4297142dfd88SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"Size of coarse problem %d\n",pcbddc->coarse_size);CHKERRQ(ierr);
4298142dfd88SStefano Zampini     /* get eigenvalue estimation if inexact */
4299142dfd88SStefano Zampini     if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
4300142dfd88SStefano Zampini       ierr = KSPComputeExtremeSingularValues(check_ksp,&lambda_max,&lambda_min);CHKERRQ(ierr);
4301142dfd88SStefano Zampini       ierr = KSPGetIterationNumber(check_ksp,&k);CHKERRQ(ierr);
4302142dfd88SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem eigenvalues estimated with %d iterations of %s.\n",k,check_ksp_type);CHKERRQ(ierr);
4303e269702eSStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem eigenvalues: % 1.14e %1.14e\n",lambda_min,lambda_max);CHKERRQ(ierr);
43043b03a366Sstefano_zampini     }
4305142dfd88SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem exact infty_error   : %1.14e\n",infty_error);CHKERRQ(ierr);
4306142dfd88SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem residual infty_error: %1.14e\n",abs_infty_error);CHKERRQ(ierr);
4307142dfd88SStefano Zampini     ierr = KSPDestroy(&check_ksp);CHKERRQ(ierr);
430853cdbc3dSStefano Zampini   }
4309142dfd88SStefano Zampini   if (dbg_flag) { ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); }
43100c7d97c5SJed Brown   /* free data structures no longer needed */
43110c7d97c5SJed Brown   if (coarse_ISLG)                { ierr = ISLocalToGlobalMappingDestroy(&coarse_ISLG);CHKERRQ(ierr); }
43120c7d97c5SJed Brown   if (ins_local_primal_indices)   { ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr);  }
43130c7d97c5SJed Brown   if (ins_coarse_mat_vals)        { ierr = PetscFree(ins_coarse_mat_vals);CHKERRQ(ierr);}
43140c7d97c5SJed Brown   if (localsizes2)                { ierr = PetscFree(localsizes2);CHKERRQ(ierr);}
43150c7d97c5SJed Brown   if (localdispl2)                { ierr = PetscFree(localdispl2);CHKERRQ(ierr);}
43160c7d97c5SJed Brown   if (temp_coarse_mat_vals)       { ierr = PetscFree(temp_coarse_mat_vals);CHKERRQ(ierr);}
43170c7d97c5SJed Brown 
43180c7d97c5SJed Brown   PetscFunctionReturn(0);
43190c7d97c5SJed Brown }
43200c7d97c5SJed Brown 
43210c7d97c5SJed Brown #undef __FUNCT__
43220c7d97c5SJed Brown #define __FUNCT__ "PCBDDCManageLocalBoundaries"
432353cdbc3dSStefano Zampini static PetscErrorCode PCBDDCManageLocalBoundaries(PC pc)
43240c7d97c5SJed Brown {
43250c7d97c5SJed Brown 
43260c7d97c5SJed Brown   PC_BDDC     *pcbddc = (PC_BDDC*)pc->data;
43270c7d97c5SJed Brown   PC_IS         *pcis = (PC_IS*)pc->data;
43280c7d97c5SJed Brown   Mat_IS      *matis  = (Mat_IS*)pc->pmat->data;
4329da1bb401SStefano Zampini   PCBDDCGraph mat_graph=pcbddc->mat_graph;
43303972b0daSStefano Zampini   PetscInt    *queue_in_global_numbering,*is_indices,*auxis;
43313b03a366Sstefano_zampini   PetscInt    bs,ierr,i,j,s,k,iindex,neumann_bsize,dirichlet_bsize;
4332da1bb401SStefano Zampini   PetscInt    total_counts,nodes_touched,where_values=1,vertex_size;
4333534831adSStefano Zampini   PetscMPIInt adapt_interface=0,adapt_interface_reduced=0,NEUMANNCNT=0;
4334da1bb401SStefano Zampini   PetscBool   same_set;
4335a0ba757dSStefano Zampini   MPI_Comm    interface_comm=((PetscObject)pc)->comm;
43363b03a366Sstefano_zampini   PetscBool   use_faces=PETSC_FALSE,use_edges=PETSC_FALSE;
43373b03a366Sstefano_zampini   const PetscInt *neumann_nodes;
43383b03a366Sstefano_zampini   const PetscInt *dirichlet_nodes;
4339a81d60d8SStefano Zampini   IS          used_IS,*custom_ISForDofs;
4340da1bb401SStefano Zampini   PetscScalar *array;
4341da1bb401SStefano Zampini   PetscScalar *array2;
4342da1bb401SStefano Zampini   PetscViewer viewer=pcbddc->dbg_viewer;
43430c7d97c5SJed Brown 
43440c7d97c5SJed Brown   PetscFunctionBegin;
4345da1bb401SStefano Zampini   /* Setup local adjacency graph */
4346da1bb401SStefano Zampini   mat_graph->nvtxs=pcis->n;
4347534831adSStefano Zampini   if (!mat_graph->xadj) { NEUMANNCNT = 1; }
4348da1bb401SStefano Zampini   ierr = PCBDDCSetupLocalAdjacencyGraph(pc);CHKERRQ(ierr);
4349a0ba757dSStefano Zampini   i = mat_graph->nvtxs;
4350a0ba757dSStefano Zampini   ierr = PetscMalloc4(i,PetscInt,&mat_graph->where,i,PetscInt,&mat_graph->count,i+1,PetscInt,&mat_graph->cptr,i,PetscInt,&mat_graph->queue);CHKERRQ(ierr);
43513972b0daSStefano Zampini   ierr = PetscMalloc2(i,PetscInt,&mat_graph->which_dof,i,PetscBool,&mat_graph->touched);CHKERRQ(ierr);
43523972b0daSStefano Zampini   ierr = PetscMalloc(i*sizeof(PetscInt),&queue_in_global_numbering);CHKERRQ(ierr);
4353a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->where,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
4354a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->count,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
4355a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->which_dof,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
4356a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->queue,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
43573828260eSStefano Zampini   ierr = PetscMemzero(mat_graph->cptr,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr);
4358a0ba757dSStefano Zampini 
4359a81d60d8SStefano Zampini   /* Setting dofs splitting in mat_graph->which_dof
4360a81d60d8SStefano Zampini      Get information about dofs' splitting if provided by the user
4361a81d60d8SStefano Zampini      Otherwise it assumes a constant block size */
4362a81d60d8SStefano Zampini   vertex_size=0;
4363a81d60d8SStefano Zampini   if (!pcbddc->n_ISForDofs) {
4364a81d60d8SStefano Zampini     ierr = MatGetBlockSize(matis->A,&bs);CHKERRQ(ierr);
4365a81d60d8SStefano Zampini     ierr = PetscMalloc(bs*sizeof(IS),&custom_ISForDofs);CHKERRQ(ierr);
4366a81d60d8SStefano Zampini     for (i=0;i<bs;i++) {
4367a81d60d8SStefano Zampini       ierr = ISCreateStride(PETSC_COMM_SELF,pcis->n/bs,i,bs,&custom_ISForDofs[i]);CHKERRQ(ierr);
4368a81d60d8SStefano Zampini     }
4369a81d60d8SStefano Zampini     ierr = PCBDDCSetDofsSplitting(pc,bs,custom_ISForDofs);CHKERRQ(ierr);
4370a81d60d8SStefano Zampini     vertex_size=1;
4371a81d60d8SStefano Zampini     /* remove my references to IS objects */
4372a81d60d8SStefano Zampini     for (i=0;i<bs;i++) {
4373a81d60d8SStefano Zampini       ierr = ISDestroy(&custom_ISForDofs[i]);CHKERRQ(ierr);
4374a81d60d8SStefano Zampini     }
4375a81d60d8SStefano Zampini     ierr = PetscFree(custom_ISForDofs);CHKERRQ(ierr);
4376a81d60d8SStefano Zampini   }
43779c0446d6SStefano Zampini   for (i=0;i<pcbddc->n_ISForDofs;i++) {
4378a81d60d8SStefano Zampini     ierr = ISGetSize(pcbddc->ISForDofs[i],&k);CHKERRQ(ierr);
43799c0446d6SStefano Zampini     ierr = ISGetIndices(pcbddc->ISForDofs[i],(const PetscInt**)&is_indices);CHKERRQ(ierr);
4380a81d60d8SStefano Zampini     for (j=0;j<k;j++) {
43819c0446d6SStefano Zampini       mat_graph->which_dof[is_indices[j]]=i;
43829c0446d6SStefano Zampini     }
43839c0446d6SStefano Zampini     ierr = ISRestoreIndices(pcbddc->ISForDofs[i],(const PetscInt**)&is_indices);CHKERRQ(ierr);
43849c0446d6SStefano Zampini   }
4385a81d60d8SStefano Zampini   /* use mat block size as vertex size if it has not yet been set */
4386a81d60d8SStefano Zampini   if (!vertex_size) {
43873b03a366Sstefano_zampini     ierr = MatGetBlockSize(matis->A,&vertex_size);CHKERRQ(ierr);
43880c7d97c5SJed Brown   }
4389a81d60d8SStefano Zampini 
43903b03a366Sstefano_zampini   /* count number of neighbours per node */
43910c7d97c5SJed Brown   total_counts=0;
43923b03a366Sstefano_zampini   for (i=1;i<pcis->n_neigh;i++){
43930c7d97c5SJed Brown     s=pcis->n_shared[i];
43940c7d97c5SJed Brown     total_counts+=s;
439553cdbc3dSStefano Zampini     for (j=0;j<s;j++){
43960c7d97c5SJed Brown       mat_graph->count[pcis->shared[i][j]] += 1;
43970c7d97c5SJed Brown     }
43980c7d97c5SJed Brown   }
4399534831adSStefano Zampini   /* Take into account Neumann data -> it increments number of sharing subdomains for nodes lying on the interface */
440036e030ebSStefano Zampini   ierr = PCBDDCGetNeumannBoundaries(pc,&used_IS);CHKERRQ(ierr);
4401da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
4402da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
440336e030ebSStefano Zampini   if (used_IS) {
440436e030ebSStefano Zampini     ierr = ISGetSize(used_IS,&neumann_bsize);CHKERRQ(ierr);
440536e030ebSStefano Zampini     ierr = ISGetIndices(used_IS,&neumann_nodes);CHKERRQ(ierr);
440653cdbc3dSStefano Zampini     for (i=0;i<neumann_bsize;i++){
440753cdbc3dSStefano Zampini       iindex = neumann_nodes[i];
4408534831adSStefano Zampini       if (mat_graph->count[iindex] > NEUMANNCNT && array[iindex]==0.0){
440953cdbc3dSStefano Zampini         mat_graph->count[iindex]+=1;
44100c7d97c5SJed Brown         total_counts++;
4411da1bb401SStefano Zampini         array[iindex]=array[iindex]+1.0;
4412da1bb401SStefano Zampini       } else if (array[iindex]>0.0) {
4413da1bb401SStefano Zampini         SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"Error for neumann nodes provided to BDDC! They must be uniquely listed! Found duplicate node %d\n",iindex);
44140c7d97c5SJed Brown       }
44150c7d97c5SJed Brown     }
44160c7d97c5SJed Brown   }
4417da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4418da1bb401SStefano Zampini   /* allocate space for storing the set of neighbours for each node */
4419da1bb401SStefano Zampini   ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt*),&mat_graph->neighbours_set);CHKERRQ(ierr);
4420da1bb401SStefano Zampini   if (mat_graph->nvtxs) { ierr = PetscMalloc(total_counts*sizeof(PetscInt),&mat_graph->neighbours_set[0]);CHKERRQ(ierr); }
4421da1bb401SStefano Zampini   for (i=1;i<mat_graph->nvtxs;i++) mat_graph->neighbours_set[i]=mat_graph->neighbours_set[i-1]+mat_graph->count[i-1];
4422a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->count,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
44233b03a366Sstefano_zampini   for (i=1;i<pcis->n_neigh;i++){
44240c7d97c5SJed Brown     s=pcis->n_shared[i];
44250c7d97c5SJed Brown     for (j=0;j<s;j++) {
44260c7d97c5SJed Brown       k=pcis->shared[i][j];
4427da1bb401SStefano Zampini       mat_graph->neighbours_set[k][mat_graph->count[k]] = pcis->neigh[i];
44280c7d97c5SJed Brown       mat_graph->count[k]+=1;
44290c7d97c5SJed Brown     }
44300c7d97c5SJed Brown   }
4431da1bb401SStefano Zampini   /* Check consistency of Neumann nodes */
4432da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
4433da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4434da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4435da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4436da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4437da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
44383b03a366Sstefano_zampini   /* set -1 fake neighbour to mimic Neumann boundary */
443936e030ebSStefano Zampini   if (used_IS) {
444053cdbc3dSStefano Zampini     for (i=0;i<neumann_bsize;i++){
444153cdbc3dSStefano Zampini       iindex = neumann_nodes[i];
4442534831adSStefano Zampini       if (mat_graph->count[iindex] > NEUMANNCNT){
4443da1bb401SStefano Zampini         if (mat_graph->count[iindex]+1 != (PetscInt)array[iindex]) {
4444da1bb401SStefano Zampini           SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_USER,"Neumann nodes provided to BDDC must be consistent among neighbours!\nNode %d: number of sharing subdomains %d != number of subdomains for which it is a neumann node %d\n",iindex,mat_graph->count[iindex]+1,(PetscInt)array[iindex]);
4445da1bb401SStefano Zampini         }
4446da1bb401SStefano Zampini         mat_graph->neighbours_set[iindex][mat_graph->count[iindex]] = -1;
444753cdbc3dSStefano Zampini         mat_graph->count[iindex]+=1;
44480c7d97c5SJed Brown       }
44490c7d97c5SJed Brown     }
445036e030ebSStefano Zampini     ierr = ISRestoreIndices(used_IS,&neumann_nodes);CHKERRQ(ierr);
44510c7d97c5SJed Brown   }
4452da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4453da1bb401SStefano Zampini   /* sort set of sharing subdomains */
4454da1bb401SStefano Zampini   for (i=0;i<mat_graph->nvtxs;i++) { ierr = PetscSortInt(mat_graph->count[i],mat_graph->neighbours_set[i]);CHKERRQ(ierr); }
44553b03a366Sstefano_zampini   /* remove interior nodes and dirichlet boundary nodes from the next search into the graph */
4456da1bb401SStefano Zampini   for (i=0;i<mat_graph->nvtxs;i++){mat_graph->touched[i]=PETSC_FALSE;}
4457da1bb401SStefano Zampini   nodes_touched=0;
445836e030ebSStefano Zampini   ierr = PCBDDCGetDirichletBoundaries(pc,&used_IS);CHKERRQ(ierr);
4459da1bb401SStefano Zampini   ierr = VecSet(pcis->vec2_N,0.0);CHKERRQ(ierr);
4460da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4461da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
4462da1bb401SStefano Zampini   if (used_IS) {
4463da1bb401SStefano Zampini     ierr = ISGetSize(used_IS,&dirichlet_bsize);CHKERRQ(ierr);
4464da1bb401SStefano Zampini     if (dirichlet_bsize && matis->pure_neumann) {
4465da1bb401SStefano Zampini       SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"Dirichlet boundaries are intended to be used with matrices with zeroed rows!\n");
4466da1bb401SStefano Zampini     }
4467da1bb401SStefano Zampini     ierr = ISGetIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
4468da1bb401SStefano Zampini     for (i=0;i<dirichlet_bsize;i++){
4469da1bb401SStefano Zampini       iindex=dirichlet_nodes[i];
4470da1bb401SStefano Zampini       if (mat_graph->count[iindex] && !mat_graph->touched[iindex]) {
4471da1bb401SStefano Zampini         if (array[iindex]>0.0) {
4472da1bb401SStefano Zampini           SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"BDDC cannot have nodes which are marked as Neumann and Dirichlet at the same time! Wrong node %d\n",iindex);
4473da1bb401SStefano Zampini         }
4474da1bb401SStefano Zampini         mat_graph->touched[iindex]=PETSC_TRUE;
4475da1bb401SStefano Zampini         mat_graph->where[iindex]=0;
4476da1bb401SStefano Zampini         nodes_touched++;
4477da1bb401SStefano Zampini         array2[iindex]=array2[iindex]+1.0;
4478da1bb401SStefano Zampini       }
4479da1bb401SStefano Zampini     }
4480da1bb401SStefano Zampini     ierr = ISRestoreIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
4481da1bb401SStefano Zampini   }
4482da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4483da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
4484da1bb401SStefano Zampini   /* Check consistency of Dirichlet nodes */
4485da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_N,1.0);CHKERRQ(ierr);
4486da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
4487da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4488da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4489da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4490da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4491da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
4492da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec2_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4493da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec2_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4494da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4495da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4496da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4497da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
449836e030ebSStefano Zampini   if (used_IS) {
449936e030ebSStefano Zampini     ierr = ISGetSize(used_IS,&dirichlet_bsize);CHKERRQ(ierr);
450036e030ebSStefano Zampini     ierr = ISGetIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
45013b03a366Sstefano_zampini     for (i=0;i<dirichlet_bsize;i++){
4502da1bb401SStefano Zampini       iindex=dirichlet_nodes[i];
4503da1bb401SStefano Zampini       if (array[iindex]>1.0 && array[iindex]!=array2[iindex] ) {
4504da1bb401SStefano Zampini          SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_USER,"Dirichlet nodes provided to BDDC must be consistent among neighbours!\nNode %d: number of sharing subdomains %d != number of subdomains for which it is a neumann node %d\n",iindex,(PetscInt)array[iindex],(PetscInt)array2[iindex]);
4505da1bb401SStefano Zampini       }
45063b03a366Sstefano_zampini     }
450736e030ebSStefano Zampini     ierr = ISRestoreIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
45083b03a366Sstefano_zampini   }
4509da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4510da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
4511da1bb401SStefano Zampini 
45120c7d97c5SJed Brown   for (i=0;i<mat_graph->nvtxs;i++){
45133b03a366Sstefano_zampini     if (!mat_graph->count[i]){  /* interior nodes */
45140c7d97c5SJed Brown       mat_graph->touched[i]=PETSC_TRUE;
45150c7d97c5SJed Brown       mat_graph->where[i]=0;
45160c7d97c5SJed Brown       nodes_touched++;
45170c7d97c5SJed Brown     }
45180c7d97c5SJed Brown   }
45190c7d97c5SJed Brown   mat_graph->ncmps = 0;
4520da1bb401SStefano Zampini   i=0;
45210c7d97c5SJed Brown   while(nodes_touched<mat_graph->nvtxs) {
4522a0ba757dSStefano Zampini     /*  find first untouched node in local ordering */
45230c7d97c5SJed Brown     while(mat_graph->touched[i]) i++;
45240c7d97c5SJed Brown     mat_graph->touched[i]=PETSC_TRUE;
4525a0ba757dSStefano Zampini     mat_graph->where[i]=where_values;
45260c7d97c5SJed Brown     nodes_touched++;
4527a0ba757dSStefano Zampini     /* now find all other nodes having the same set of sharing subdomains */
45280c7d97c5SJed Brown     for (j=i+1;j<mat_graph->nvtxs;j++){
4529a0ba757dSStefano Zampini       /* check for same number of sharing subdomains and dof number */
4530da1bb401SStefano Zampini       if (!mat_graph->touched[j] && mat_graph->count[i]==mat_graph->count[j] && mat_graph->which_dof[i] == mat_graph->which_dof[j] ){
4531a0ba757dSStefano Zampini         /* check for same set of sharing subdomains */
45320c7d97c5SJed Brown         same_set=PETSC_TRUE;
45330c7d97c5SJed Brown         for (k=0;k<mat_graph->count[j];k++){
4534da1bb401SStefano Zampini           if (mat_graph->neighbours_set[i][k]!=mat_graph->neighbours_set[j][k]) {
45350c7d97c5SJed Brown             same_set=PETSC_FALSE;
45360c7d97c5SJed Brown           }
45370c7d97c5SJed Brown         }
4538a0ba757dSStefano Zampini         /* I found a friend of mine */
45390c7d97c5SJed Brown         if (same_set) {
4540a0ba757dSStefano Zampini           mat_graph->where[j]=where_values;
45410c7d97c5SJed Brown           mat_graph->touched[j]=PETSC_TRUE;
45420c7d97c5SJed Brown           nodes_touched++;
45430c7d97c5SJed Brown         }
45440c7d97c5SJed Brown       }
45450c7d97c5SJed Brown     }
4546a0ba757dSStefano Zampini     where_values++;
45470c7d97c5SJed Brown   }
4548a0ba757dSStefano Zampini   where_values--; if (where_values<0) where_values=0;
4549a0ba757dSStefano Zampini   ierr = PetscMalloc(where_values*sizeof(PetscMPIInt),&mat_graph->where_ncmps);CHKERRQ(ierr);
4550a0ba757dSStefano Zampini   /* Find connected components defined on the shared interface */
4551a0ba757dSStefano Zampini   if (where_values) {
4552a0ba757dSStefano Zampini     ierr = PCBDDCFindConnectedComponents(mat_graph, where_values);
45533b03a366Sstefano_zampini     /* For consistency among neughbouring procs, I need to sort (by global ordering) each connected component */
4554a0ba757dSStefano Zampini     for (i=0;i<mat_graph->ncmps;i++) {
4555a0ba757dSStefano Zampini       ierr = ISLocalToGlobalMappingApply(matis->mapping,mat_graph->cptr[i+1]-mat_graph->cptr[i],&mat_graph->queue[mat_graph->cptr[i]],&queue_in_global_numbering[mat_graph->cptr[i]]);CHKERRQ(ierr);
4556a0ba757dSStefano Zampini       ierr = PetscSortIntWithArray(mat_graph->cptr[i+1]-mat_graph->cptr[i],&queue_in_global_numbering[mat_graph->cptr[i]],&mat_graph->queue[mat_graph->cptr[i]]);CHKERRQ(ierr);
4557a0ba757dSStefano Zampini     }
4558a0ba757dSStefano Zampini   }
4559a0ba757dSStefano Zampini   /* check consistency of connected components among neighbouring subdomains -> it adapt them in case it is needed */
4560a0ba757dSStefano Zampini   for (i=0;i<where_values;i++) {
45613b03a366Sstefano_zampini     /* We are not sure that two connected components will be the same among subdomains sharing a subset of local interface */
45623b03a366Sstefano_zampini     if (mat_graph->where_ncmps[i]>1) {
4563a0ba757dSStefano Zampini       adapt_interface=1;
4564a0ba757dSStefano Zampini       break;
4565a0ba757dSStefano Zampini     }
4566a0ba757dSStefano Zampini   }
4567a0ba757dSStefano Zampini   ierr = MPI_Allreduce(&adapt_interface,&adapt_interface_reduced,1,MPIU_INT,MPI_LOR,interface_comm);CHKERRQ(ierr);
4568da1bb401SStefano Zampini   if (pcbddc->dbg_flag && adapt_interface_reduced) {
4569d8923723SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"Adapting interface\n");CHKERRQ(ierr);
4570da1bb401SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
4571da1bb401SStefano Zampini   }
4572a0ba757dSStefano Zampini   if (where_values && adapt_interface_reduced) {
45730c7d97c5SJed Brown 
4574a0ba757dSStefano Zampini     PetscInt sum_requests=0,my_rank;
4575a0ba757dSStefano Zampini     PetscInt buffer_size,start_of_recv,size_of_recv,start_of_send;
4576a0ba757dSStefano Zampini     PetscInt temp_buffer_size,ins_val,global_where_counter;
4577a0ba757dSStefano Zampini     PetscInt *cum_recv_counts;
4578a0ba757dSStefano Zampini     PetscInt *where_to_nodes_indices;
4579a0ba757dSStefano Zampini     PetscInt *petsc_buffer;
4580a0ba757dSStefano Zampini     PetscMPIInt *recv_buffer;
4581a0ba757dSStefano Zampini     PetscMPIInt *recv_buffer_where;
4582a0ba757dSStefano Zampini     PetscMPIInt *send_buffer;
4583a0ba757dSStefano Zampini     PetscMPIInt size_of_send;
4584a0ba757dSStefano Zampini     PetscInt *sizes_of_sends;
4585a0ba757dSStefano Zampini     MPI_Request *send_requests;
4586a0ba757dSStefano Zampini     MPI_Request *recv_requests;
4587a0ba757dSStefano Zampini     PetscInt *where_cc_adapt;
4588a0ba757dSStefano Zampini     PetscInt **temp_buffer;
4589a0ba757dSStefano Zampini     PetscInt *nodes_to_temp_buffer_indices;
4590a0ba757dSStefano Zampini     PetscInt *add_to_where;
4591a0ba757dSStefano Zampini 
4592a0ba757dSStefano Zampini     ierr = MPI_Comm_rank(interface_comm,&my_rank);CHKERRQ(ierr);
4593a0ba757dSStefano Zampini     ierr = PetscMalloc((where_values+1)*sizeof(PetscInt),&cum_recv_counts);CHKERRQ(ierr);
4594a0ba757dSStefano Zampini     ierr = PetscMemzero(cum_recv_counts,(where_values+1)*sizeof(PetscInt));CHKERRQ(ierr);
4595a0ba757dSStefano Zampini     ierr = PetscMalloc(where_values*sizeof(PetscInt),&where_to_nodes_indices);CHKERRQ(ierr);
4596a0ba757dSStefano Zampini     /* first count how many neighbours per connected component I will receive from */
4597a0ba757dSStefano Zampini     cum_recv_counts[0]=0;
4598a0ba757dSStefano Zampini     for (i=1;i<where_values+1;i++){
4599a0ba757dSStefano Zampini       j=0;
4600d8923723SStefano Zampini       while(mat_graph->where[j] != i) { j++; }
4601a0ba757dSStefano Zampini       where_to_nodes_indices[i-1]=j;
4602da1bb401SStefano Zampini       if (mat_graph->neighbours_set[j][0]!=-1) { cum_recv_counts[i]=cum_recv_counts[i-1]+mat_graph->count[j]; } /* We don't want sends/recvs_to/from_self -> here I don't count myself  */
46033b03a366Sstefano_zampini       else { cum_recv_counts[i]=cum_recv_counts[i-1]+mat_graph->count[j]-1; }
4604a0ba757dSStefano Zampini     }
4605a0ba757dSStefano Zampini     ierr = PetscMalloc(2*cum_recv_counts[where_values]*sizeof(PetscMPIInt),&recv_buffer_where);CHKERRQ(ierr);
4606a0ba757dSStefano Zampini     ierr = PetscMalloc(cum_recv_counts[where_values]*sizeof(MPI_Request),&send_requests);CHKERRQ(ierr);
4607a0ba757dSStefano Zampini     ierr = PetscMalloc(cum_recv_counts[where_values]*sizeof(MPI_Request),&recv_requests);CHKERRQ(ierr);
4608a0ba757dSStefano Zampini     for (i=0;i<cum_recv_counts[where_values];i++) {
4609a0ba757dSStefano Zampini       send_requests[i]=MPI_REQUEST_NULL;
4610a0ba757dSStefano Zampini       recv_requests[i]=MPI_REQUEST_NULL;
4611a0ba757dSStefano Zampini     }
4612a0ba757dSStefano Zampini     /* exchange with my neighbours the number of my connected components on the shared interface */
4613a0ba757dSStefano Zampini     for (i=0;i<where_values;i++){
4614a0ba757dSStefano Zampini       j=where_to_nodes_indices[i];
4615da1bb401SStefano Zampini       k = (mat_graph->neighbours_set[j][0] == -1 ?  1 : 0);
4616a0ba757dSStefano Zampini       for (;k<mat_graph->count[j];k++){
4617da1bb401SStefano Zampini         ierr = MPI_Isend(&mat_graph->where_ncmps[i],1,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr);
4618da1bb401SStefano Zampini         ierr = MPI_Irecv(&recv_buffer_where[sum_requests],1,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr);
4619a0ba757dSStefano Zampini         sum_requests++;
4620a0ba757dSStefano Zampini       }
4621a0ba757dSStefano Zampini     }
4622a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4623a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4624a0ba757dSStefano Zampini     /* determine the connected component I need to adapt */
4625a0ba757dSStefano Zampini     ierr = PetscMalloc(where_values*sizeof(PetscInt),&where_cc_adapt);CHKERRQ(ierr);
4626a0ba757dSStefano Zampini     ierr = PetscMemzero(where_cc_adapt,where_values*sizeof(PetscInt));CHKERRQ(ierr);
4627a0ba757dSStefano Zampini     for (i=0;i<where_values;i++){
4628a0ba757dSStefano Zampini       for (j=cum_recv_counts[i];j<cum_recv_counts[i+1];j++){
46293b03a366Sstefano_zampini         /* The first condition is natural (i.e someone has a different number of cc than me), the second one is just to be safe */
46303b03a366Sstefano_zampini         if ( mat_graph->where_ncmps[i]!=recv_buffer_where[j] || mat_graph->where_ncmps[i] > 1 ) {
4631a0ba757dSStefano Zampini           where_cc_adapt[i]=PETSC_TRUE;
4632a0ba757dSStefano Zampini           break;
4633a0ba757dSStefano Zampini         }
4634a0ba757dSStefano Zampini       }
4635a0ba757dSStefano Zampini     }
4636d8923723SStefano Zampini     buffer_size = 0;
4637d8923723SStefano Zampini     for (i=0;i<where_values;i++) {
4638d8923723SStefano Zampini       if (where_cc_adapt[i]) {
4639d8923723SStefano Zampini         for (j=i;j<mat_graph->ncmps;j++) {
4640d8923723SStefano Zampini           if (mat_graph->where[mat_graph->queue[mat_graph->cptr[j]]] == i+1) { /* WARNING -> where values goes from 1 to where_values included */
4641d8923723SStefano Zampini             buffer_size += 1 + mat_graph->cptr[j+1]-mat_graph->cptr[j];
4642d8923723SStefano Zampini           }
4643d8923723SStefano Zampini         }
4644d8923723SStefano Zampini       }
4645d8923723SStefano Zampini     }
4646d8923723SStefano Zampini     ierr = PetscMalloc(buffer_size*sizeof(PetscMPIInt),&send_buffer);CHKERRQ(ierr);
4647a0ba757dSStefano Zampini     /* now get from neighbours their ccs (in global numbering) and adapt them (in case it is needed) */
4648a0ba757dSStefano Zampini     /* first determine how much data to send (size of each queue plus the global indices) and communicate it to neighbours */
4649a0ba757dSStefano Zampini     ierr = PetscMalloc(where_values*sizeof(PetscInt),&sizes_of_sends);CHKERRQ(ierr);
4650a0ba757dSStefano Zampini     ierr = PetscMemzero(sizes_of_sends,where_values*sizeof(PetscInt));CHKERRQ(ierr);
4651a0ba757dSStefano Zampini     sum_requests=0;
4652a0ba757dSStefano Zampini     start_of_send=0;
4653a0ba757dSStefano Zampini     start_of_recv=cum_recv_counts[where_values];
4654a0ba757dSStefano Zampini     for (i=0;i<where_values;i++) {
4655a0ba757dSStefano Zampini       if (where_cc_adapt[i]) {
4656a0ba757dSStefano Zampini         size_of_send=0;
4657a0ba757dSStefano Zampini         for (j=i;j<mat_graph->ncmps;j++) {
4658a0ba757dSStefano Zampini           if (mat_graph->where[mat_graph->queue[mat_graph->cptr[j]]] == i+1) { /* WARNING -> where values goes from 1 to where_values included */
4659a0ba757dSStefano Zampini             send_buffer[start_of_send+size_of_send]=mat_graph->cptr[j+1]-mat_graph->cptr[j];
4660a0ba757dSStefano Zampini             size_of_send+=1;
4661a0ba757dSStefano Zampini             for (k=0;k<mat_graph->cptr[j+1]-mat_graph->cptr[j];k++) {
4662a0ba757dSStefano Zampini               send_buffer[start_of_send+size_of_send+k]=queue_in_global_numbering[mat_graph->cptr[j]+k];
4663a0ba757dSStefano Zampini             }
4664a0ba757dSStefano Zampini             size_of_send=size_of_send+mat_graph->cptr[j+1]-mat_graph->cptr[j];
4665a0ba757dSStefano Zampini           }
4666a0ba757dSStefano Zampini         }
4667a0ba757dSStefano Zampini         j = where_to_nodes_indices[i];
4668da1bb401SStefano Zampini         k = (mat_graph->neighbours_set[j][0] == -1 ?  1 : 0);
466911d8f4c2SStefano Zampini         sizes_of_sends[i]=size_of_send;
4670a0ba757dSStefano Zampini         for (;k<mat_graph->count[j];k++){
467111d8f4c2SStefano Zampini           ierr = MPI_Isend(&sizes_of_sends[i],1,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr);
4672da1bb401SStefano Zampini           ierr = MPI_Irecv(&recv_buffer_where[sum_requests+start_of_recv],1,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr);
4673a0ba757dSStefano Zampini           sum_requests++;
4674a0ba757dSStefano Zampini         }
4675a0ba757dSStefano Zampini         start_of_send+=size_of_send;
4676a0ba757dSStefano Zampini       }
4677a0ba757dSStefano Zampini     }
4678a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4679a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4680a0ba757dSStefano Zampini     buffer_size=0;
4681a0ba757dSStefano Zampini     for (k=0;k<sum_requests;k++) { buffer_size+=recv_buffer_where[start_of_recv+k]; }
4682a0ba757dSStefano Zampini     ierr = PetscMalloc(buffer_size*sizeof(PetscMPIInt),&recv_buffer);CHKERRQ(ierr);
4683a0ba757dSStefano Zampini     /* now exchange the data */
4684a0ba757dSStefano Zampini     start_of_recv=0;
4685a0ba757dSStefano Zampini     start_of_send=0;
4686a0ba757dSStefano Zampini     sum_requests=0;
4687a0ba757dSStefano Zampini     for (i=0;i<where_values;i++) {
4688a0ba757dSStefano Zampini       if (where_cc_adapt[i]) {
4689a0ba757dSStefano Zampini         size_of_send = sizes_of_sends[i];
4690a0ba757dSStefano Zampini         j = where_to_nodes_indices[i];
4691da1bb401SStefano Zampini         k = (mat_graph->neighbours_set[j][0] == -1 ?  1 : 0);
4692a0ba757dSStefano Zampini         for (;k<mat_graph->count[j];k++){
4693da1bb401SStefano Zampini           ierr = MPI_Isend(&send_buffer[start_of_send],size_of_send,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr);
4694a0ba757dSStefano Zampini           size_of_recv=recv_buffer_where[cum_recv_counts[where_values]+sum_requests];
4695da1bb401SStefano Zampini           ierr = MPI_Irecv(&recv_buffer[start_of_recv],size_of_recv,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr);
4696a0ba757dSStefano Zampini           start_of_recv+=size_of_recv;
4697a0ba757dSStefano Zampini           sum_requests++;
4698a0ba757dSStefano Zampini         }
4699a0ba757dSStefano Zampini         start_of_send+=size_of_send;
4700a0ba757dSStefano Zampini       }
4701a0ba757dSStefano Zampini     }
4702a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4703a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4704a0ba757dSStefano Zampini     ierr = PetscMalloc(buffer_size*sizeof(PetscInt),&petsc_buffer);CHKERRQ(ierr);
4705a0ba757dSStefano Zampini     for (k=0;k<start_of_recv;k++) { petsc_buffer[k]=(PetscInt)recv_buffer[k]; }
4706a0ba757dSStefano Zampini     for (j=0;j<buffer_size;) {
4707a0ba757dSStefano Zampini        ierr = ISGlobalToLocalMappingApply(matis->mapping,IS_GTOLM_MASK,petsc_buffer[j],&petsc_buffer[j+1],&petsc_buffer[j],&petsc_buffer[j+1]);CHKERRQ(ierr);
4708a0ba757dSStefano Zampini        k=petsc_buffer[j]+1;
4709a0ba757dSStefano Zampini        j+=k;
4710a0ba757dSStefano Zampini     }
4711a0ba757dSStefano Zampini     sum_requests=cum_recv_counts[where_values];
4712a0ba757dSStefano Zampini     start_of_recv=0;
4713a0ba757dSStefano Zampini     ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt),&nodes_to_temp_buffer_indices);CHKERRQ(ierr);
4714a0ba757dSStefano Zampini     global_where_counter=0;
4715a0ba757dSStefano Zampini     for (i=0;i<where_values;i++){
4716a0ba757dSStefano Zampini       if (where_cc_adapt[i]){
4717a0ba757dSStefano Zampini         temp_buffer_size=0;
4718a0ba757dSStefano Zampini         /* find nodes on the shared interface we need to adapt */
4719a0ba757dSStefano Zampini         for (j=0;j<mat_graph->nvtxs;j++){
4720a0ba757dSStefano Zampini           if (mat_graph->where[j]==i+1) {
4721a0ba757dSStefano Zampini             nodes_to_temp_buffer_indices[j]=temp_buffer_size;
4722a0ba757dSStefano Zampini             temp_buffer_size++;
4723a0ba757dSStefano Zampini           } else {
4724a0ba757dSStefano Zampini             nodes_to_temp_buffer_indices[j]=-1;
4725a0ba757dSStefano Zampini           }
4726a0ba757dSStefano Zampini         }
4727a0ba757dSStefano Zampini         /* allocate some temporary space */
4728a0ba757dSStefano Zampini         ierr = PetscMalloc(temp_buffer_size*sizeof(PetscInt*),&temp_buffer);CHKERRQ(ierr);
4729a0ba757dSStefano Zampini         ierr = PetscMalloc(temp_buffer_size*(cum_recv_counts[i+1]-cum_recv_counts[i])*sizeof(PetscInt),&temp_buffer[0]);CHKERRQ(ierr);
4730a0ba757dSStefano Zampini         ierr = PetscMemzero(temp_buffer[0],temp_buffer_size*(cum_recv_counts[i+1]-cum_recv_counts[i])*sizeof(PetscInt));CHKERRQ(ierr);
4731a0ba757dSStefano Zampini         for (j=1;j<temp_buffer_size;j++){
4732a0ba757dSStefano Zampini           temp_buffer[j]=temp_buffer[j-1]+cum_recv_counts[i+1]-cum_recv_counts[i];
4733a0ba757dSStefano Zampini         }
4734a0ba757dSStefano Zampini         /* analyze contributions from neighbouring subdomains for i-th conn comp
4735a0ba757dSStefano Zampini            temp buffer structure:
4736a0ba757dSStefano Zampini            supposing part of the interface has dimension 5 (global nodes 0,1,2,3,4)
4737a0ba757dSStefano Zampini            3 neighs procs with structured connected components:
4738a0ba757dSStefano Zampini              neigh 0: [0 1 4], [2 3];  (2 connected components)
4739a0ba757dSStefano Zampini              neigh 1: [0 1], [2 3 4];  (2 connected components)
4740a0ba757dSStefano Zampini              neigh 2: [0 4], [1], [2 3]; (3 connected components)
4741a0ba757dSStefano Zampini            tempbuffer (row-oriented) should be filled as:
4742a0ba757dSStefano Zampini              [ 0, 0, 0;
4743a0ba757dSStefano Zampini                0, 0, 1;
4744a0ba757dSStefano Zampini                1, 1, 2;
4745a0ba757dSStefano Zampini                1, 1, 2;
4746a0ba757dSStefano Zampini                0, 1, 0; ];
4747a0ba757dSStefano Zampini            This way we can simply recover the resulting structure account for possible intersections of ccs among neighs.
4748a0ba757dSStefano Zampini            The mat_graph->where array will be modified to reproduce the following 4 connected components [0], [1], [2 3], [4];
4749a0ba757dSStefano Zampini                                                                                                                                    */
4750a0ba757dSStefano Zampini         for (j=0;j<cum_recv_counts[i+1]-cum_recv_counts[i];j++) {
4751a0ba757dSStefano Zampini           ins_val=0;
4752a0ba757dSStefano Zampini           size_of_recv=recv_buffer_where[sum_requests];  /* total size of recv from neighs */
4753a0ba757dSStefano Zampini           for (buffer_size=0;buffer_size<size_of_recv;) {  /* loop until all data from neighs has been taken into account */
4754a0ba757dSStefano Zampini             for (k=1;k<petsc_buffer[buffer_size+start_of_recv]+1;k++) { /* filling properly temp_buffer using data from a single recv */
4755a0ba757dSStefano Zampini               temp_buffer[ nodes_to_temp_buffer_indices[ petsc_buffer[ start_of_recv+buffer_size+k ] ] ][j]=ins_val;
4756a0ba757dSStefano Zampini             }
4757a0ba757dSStefano Zampini             buffer_size+=k;
4758a0ba757dSStefano Zampini             ins_val++;
4759a0ba757dSStefano Zampini           }
4760a0ba757dSStefano Zampini           start_of_recv+=size_of_recv;
4761a0ba757dSStefano Zampini           sum_requests++;
4762a0ba757dSStefano Zampini         }
4763a0ba757dSStefano Zampini         ierr = PetscMalloc(temp_buffer_size*sizeof(PetscInt),&add_to_where);CHKERRQ(ierr);
4764a0ba757dSStefano Zampini         ierr = PetscMemzero(add_to_where,temp_buffer_size*sizeof(PetscInt));CHKERRQ(ierr);
4765a0ba757dSStefano Zampini         for (j=0;j<temp_buffer_size;j++){
4766a0ba757dSStefano Zampini           if (!add_to_where[j]){ /* found a new cc  */
4767a0ba757dSStefano Zampini             global_where_counter++;
4768a0ba757dSStefano Zampini             add_to_where[j]=global_where_counter;
4769a0ba757dSStefano Zampini             for (k=j+1;k<temp_buffer_size;k++){ /* check for other nodes in new cc */
4770a0ba757dSStefano Zampini               same_set=PETSC_TRUE;
4771a0ba757dSStefano Zampini               for (s=0;s<cum_recv_counts[i+1]-cum_recv_counts[i];s++){
4772a0ba757dSStefano Zampini                 if (temp_buffer[j][s]!=temp_buffer[k][s]) {
4773a0ba757dSStefano Zampini                   same_set=PETSC_FALSE;
4774a0ba757dSStefano Zampini                   break;
4775a0ba757dSStefano Zampini                 }
4776a0ba757dSStefano Zampini               }
4777a0ba757dSStefano Zampini               if (same_set) add_to_where[k]=global_where_counter;
4778a0ba757dSStefano Zampini             }
4779a0ba757dSStefano Zampini           }
4780a0ba757dSStefano Zampini         }
4781a0ba757dSStefano Zampini         /* insert new data in where array */
4782a0ba757dSStefano Zampini         temp_buffer_size=0;
4783a0ba757dSStefano Zampini         for (j=0;j<mat_graph->nvtxs;j++){
4784a0ba757dSStefano Zampini           if (mat_graph->where[j]==i+1) {
4785a0ba757dSStefano Zampini             mat_graph->where[j]=where_values+add_to_where[temp_buffer_size];
4786a0ba757dSStefano Zampini             temp_buffer_size++;
4787a0ba757dSStefano Zampini           }
4788a0ba757dSStefano Zampini         }
4789a0ba757dSStefano Zampini         ierr = PetscFree(temp_buffer[0]);CHKERRQ(ierr);
4790a0ba757dSStefano Zampini         ierr = PetscFree(temp_buffer);CHKERRQ(ierr);
4791a0ba757dSStefano Zampini         ierr = PetscFree(add_to_where);CHKERRQ(ierr);
4792a0ba757dSStefano Zampini       }
4793a0ba757dSStefano Zampini     }
4794a0ba757dSStefano Zampini     ierr = PetscFree(nodes_to_temp_buffer_indices);CHKERRQ(ierr);
4795a0ba757dSStefano Zampini     ierr = PetscFree(sizes_of_sends);CHKERRQ(ierr);
4796a0ba757dSStefano Zampini     ierr = PetscFree(send_requests);CHKERRQ(ierr);
4797a0ba757dSStefano Zampini     ierr = PetscFree(recv_requests);CHKERRQ(ierr);
4798a0ba757dSStefano Zampini     ierr = PetscFree(petsc_buffer);CHKERRQ(ierr);
4799a0ba757dSStefano Zampini     ierr = PetscFree(recv_buffer);CHKERRQ(ierr);
4800a0ba757dSStefano Zampini     ierr = PetscFree(recv_buffer_where);CHKERRQ(ierr);
4801a0ba757dSStefano Zampini     ierr = PetscFree(send_buffer);CHKERRQ(ierr);
4802a0ba757dSStefano Zampini     ierr = PetscFree(cum_recv_counts);CHKERRQ(ierr);
4803a0ba757dSStefano Zampini     ierr = PetscFree(where_to_nodes_indices);CHKERRQ(ierr);
480423d4d1a5SStefano Zampini     ierr = PetscFree(where_cc_adapt);CHKERRQ(ierr);
4805a0ba757dSStefano Zampini     /* We are ready to evaluate consistent connected components on each part of the shared interface */
4806a0ba757dSStefano Zampini     if (global_where_counter) {
4807a0ba757dSStefano Zampini       for (i=0;i<mat_graph->nvtxs;i++){ mat_graph->touched[i]=PETSC_FALSE; }
4808a0ba757dSStefano Zampini       global_where_counter=0;
4809a0ba757dSStefano Zampini       for (i=0;i<mat_graph->nvtxs;i++){
4810a0ba757dSStefano Zampini         if (mat_graph->where[i] && !mat_graph->touched[i]) {
4811a0ba757dSStefano Zampini           global_where_counter++;
4812a0ba757dSStefano Zampini           for (j=i+1;j<mat_graph->nvtxs;j++){
4813a0ba757dSStefano Zampini             if (!mat_graph->touched[j] && mat_graph->where[j]==mat_graph->where[i]) {
4814a0ba757dSStefano Zampini               mat_graph->where[j]=global_where_counter;
4815a0ba757dSStefano Zampini               mat_graph->touched[j]=PETSC_TRUE;
4816a0ba757dSStefano Zampini             }
4817a0ba757dSStefano Zampini           }
4818a0ba757dSStefano Zampini           mat_graph->where[i]=global_where_counter;
4819a0ba757dSStefano Zampini           mat_graph->touched[i]=PETSC_TRUE;
4820a0ba757dSStefano Zampini         }
4821a0ba757dSStefano Zampini       }
4822a0ba757dSStefano Zampini       where_values=global_where_counter;
4823a0ba757dSStefano Zampini     }
4824a0ba757dSStefano Zampini     if (global_where_counter) {
4825a0ba757dSStefano Zampini       ierr = PetscMemzero(mat_graph->cptr,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr);
4826a0ba757dSStefano Zampini       ierr = PetscMemzero(mat_graph->queue,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
4827a0ba757dSStefano Zampini       ierr = PetscFree(mat_graph->where_ncmps);CHKERRQ(ierr);
4828a0ba757dSStefano Zampini       ierr = PetscMalloc(where_values*sizeof(PetscMPIInt),&mat_graph->where_ncmps);CHKERRQ(ierr);
4829a0ba757dSStefano Zampini       ierr = PCBDDCFindConnectedComponents(mat_graph, where_values);
4830a0ba757dSStefano Zampini       for (i=0;i<mat_graph->ncmps;i++) {
4831a0ba757dSStefano Zampini         ierr = ISLocalToGlobalMappingApply(matis->mapping,mat_graph->cptr[i+1]-mat_graph->cptr[i],&mat_graph->queue[mat_graph->cptr[i]],&queue_in_global_numbering[mat_graph->cptr[i]]);CHKERRQ(ierr);
4832a0ba757dSStefano Zampini         ierr = PetscSortIntWithArray(mat_graph->cptr[i+1]-mat_graph->cptr[i],&queue_in_global_numbering[mat_graph->cptr[i]],&mat_graph->queue[mat_graph->cptr[i]]);CHKERRQ(ierr);
4833a0ba757dSStefano Zampini       }
4834a0ba757dSStefano Zampini     }
48353b03a366Sstefano_zampini   } /* Finished adapting interface */
48360c7d97c5SJed Brown   PetscInt nfc=0;
48370c7d97c5SJed Brown   PetscInt nec=0;
48380c7d97c5SJed Brown   PetscInt nvc=0;
48393b03a366Sstefano_zampini   PetscBool twodim_flag=PETSC_FALSE;
48400c7d97c5SJed Brown   for (i=0; i<mat_graph->ncmps; i++) {
48413b03a366Sstefano_zampini     if ( mat_graph->cptr[i+1]-mat_graph->cptr[i] > vertex_size ){
4842534831adSStefano Zampini       if (mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]==1){ /* 1 neigh Neumann fake included */
48430c7d97c5SJed Brown         nfc++;
48443b03a366Sstefano_zampini       } else { /* note that nec will be zero in 2d */
48453b03a366Sstefano_zampini         nec++;
48463b03a366Sstefano_zampini       }
48470c7d97c5SJed Brown     } else {
48483b03a366Sstefano_zampini       nvc+=mat_graph->cptr[i+1]-mat_graph->cptr[i];
48493b03a366Sstefano_zampini     }
48503b03a366Sstefano_zampini   }
48513b03a366Sstefano_zampini 
48523b03a366Sstefano_zampini   if (!nec) { /* we are in a 2d case -> no faces, only edges */
48533b03a366Sstefano_zampini     nec = nfc;
48543b03a366Sstefano_zampini     nfc = 0;
48553b03a366Sstefano_zampini     twodim_flag = PETSC_TRUE;
48563b03a366Sstefano_zampini   }
48573972b0daSStefano Zampini   /* allocate IS arrays for faces, edges. Vertices need a single index set. */
48583972b0daSStefano Zampini   k=0;
48593972b0daSStefano Zampini   for (i=0; i<mat_graph->ncmps; i++) {
48603972b0daSStefano Zampini     j=mat_graph->cptr[i+1]-mat_graph->cptr[i];
48613972b0daSStefano Zampini     if ( j > k) {
48623972b0daSStefano Zampini       k=j;
48633972b0daSStefano Zampini     }
4864ba1573a8SStefano Zampini     if (j<=vertex_size) {
4865ba1573a8SStefano Zampini       k+=vertex_size;
4866ba1573a8SStefano Zampini     }
48673972b0daSStefano Zampini   }
48683972b0daSStefano Zampini   ierr = PetscMalloc(k*sizeof(PetscInt),&auxis);CHKERRQ(ierr);
48693972b0daSStefano Zampini 
48703b03a366Sstefano_zampini   if (!pcbddc->vertices_flag && !pcbddc->edges_flag) {
48713b03a366Sstefano_zampini     ierr = PetscMalloc(nfc*sizeof(IS),&pcbddc->ISForFaces);CHKERRQ(ierr);
48723b03a366Sstefano_zampini     use_faces=PETSC_TRUE;
48733b03a366Sstefano_zampini   }
48743b03a366Sstefano_zampini   if (!pcbddc->vertices_flag && !pcbddc->faces_flag) {
48753b03a366Sstefano_zampini     ierr = PetscMalloc(nec*sizeof(IS),&pcbddc->ISForEdges);CHKERRQ(ierr);
48763b03a366Sstefano_zampini     use_edges=PETSC_TRUE;
48773b03a366Sstefano_zampini   }
48783b03a366Sstefano_zampini   nfc=0;
48793b03a366Sstefano_zampini   nec=0;
48803b03a366Sstefano_zampini   for (i=0; i<mat_graph->ncmps; i++) {
48813b03a366Sstefano_zampini     if ( mat_graph->cptr[i+1]-mat_graph->cptr[i] > vertex_size ){
48823b03a366Sstefano_zampini       for (j=0;j<mat_graph->cptr[i+1]-mat_graph->cptr[i];j++) {
48833972b0daSStefano Zampini         auxis[j]=mat_graph->queue[mat_graph->cptr[i]+j];
48843b03a366Sstefano_zampini       }
48853b03a366Sstefano_zampini       if (mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]==1){
48863b03a366Sstefano_zampini         if (twodim_flag) {
48873b03a366Sstefano_zampini           if (use_edges) {
48883972b0daSStefano Zampini             ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForEdges[nec]);CHKERRQ(ierr);
48893b03a366Sstefano_zampini             nec++;
48903b03a366Sstefano_zampini           }
48913b03a366Sstefano_zampini         } else {
48923b03a366Sstefano_zampini           if (use_faces) {
48933972b0daSStefano Zampini             ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForFaces[nfc]);CHKERRQ(ierr);
48943b03a366Sstefano_zampini             nfc++;
48953b03a366Sstefano_zampini           }
48963b03a366Sstefano_zampini         }
48973b03a366Sstefano_zampini       } else {
48983b03a366Sstefano_zampini         if (use_edges) {
48993972b0daSStefano Zampini           ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForEdges[nec]);CHKERRQ(ierr);
49000c7d97c5SJed Brown           nec++;
49010c7d97c5SJed Brown         }
49020c7d97c5SJed Brown       }
49030c7d97c5SJed Brown     }
49043b03a366Sstefano_zampini   }
49053b03a366Sstefano_zampini   pcbddc->n_ISForFaces=nfc;
49063b03a366Sstefano_zampini   pcbddc->n_ISForEdges=nec;
49073b03a366Sstefano_zampini   nvc=0;
49080c7d97c5SJed Brown   if ( !pcbddc->constraints_flag ) {
49093b03a366Sstefano_zampini     for (i=0; i<mat_graph->ncmps; i++) {
49103b03a366Sstefano_zampini       if ( mat_graph->cptr[i+1]-mat_graph->cptr[i] <= vertex_size ){
49113b03a366Sstefano_zampini         for ( j=mat_graph->cptr[i];j<mat_graph->cptr[i+1];j++) {
49123972b0daSStefano Zampini           auxis[nvc]=mat_graph->queue[j];
49130c7d97c5SJed Brown           nvc++;
49140c7d97c5SJed Brown         }
49150c7d97c5SJed Brown       }
49160c7d97c5SJed Brown     }
49170c7d97c5SJed Brown   }
4918a0ba757dSStefano Zampini   /* sort vertex set (by local ordering) */
49193972b0daSStefano Zampini   ierr = PetscSortInt(nvc,auxis);CHKERRQ(ierr);
49203972b0daSStefano Zampini   ierr = ISCreateGeneral(PETSC_COMM_SELF,nvc,auxis,PETSC_COPY_VALUES,&pcbddc->ISForVertices);CHKERRQ(ierr);
49210c7d97c5SJed Brown 
4922e269702eSStefano Zampini   if (pcbddc->dbg_flag) {
4923e269702eSStefano Zampini 
4924d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr);
4925d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Details from PCBDDCManageLocalBoundaries for subdomain %04d\n",PetscGlobalRank);CHKERRQ(ierr);
4926d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr);
4927a0ba757dSStefano Zampini /*    ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Graph (adjacency structure) of local Neumann mat\n");CHKERRQ(ierr);
4928a0ba757dSStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr);
4929e269702eSStefano Zampini     for (i=0;i<mat_graph->nvtxs;i++) {
4930a0ba757dSStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Nodes connected to node number %d are %d\n",i,mat_graph->xadj[i+1]-mat_graph->xadj[i]);CHKERRQ(ierr);
4931e269702eSStefano Zampini       for (j=mat_graph->xadj[i];j<mat_graph->xadj[i+1];j++){
4932a0ba757dSStefano Zampini         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d ",mat_graph->adjncy[j]);CHKERRQ(ierr);
4933e269702eSStefano Zampini       }
4934a0ba757dSStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n--------------------------------------------------------------\n");CHKERRQ(ierr);
4935da1bb401SStefano Zampini     }*/
4936d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Matrix graph has %d connected components", mat_graph->ncmps);CHKERRQ(ierr);
49370c7d97c5SJed Brown     for (i=0;i<mat_graph->ncmps;i++) {
49383b03a366Sstefano_zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\nDetails for connected component number %02d: size %04d, count %01d. Nodes follow.\n",
49393b03a366Sstefano_zampini              i,mat_graph->cptr[i+1]-mat_graph->cptr[i],mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]);CHKERRQ(ierr);
4940da1bb401SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"subdomains: ");
4941da1bb401SStefano Zampini       for (j=0;j<mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]; j++) {
4942da1bb401SStefano Zampini         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d ",mat_graph->neighbours_set[mat_graph->queue[mat_graph->cptr[i]]][j]);
4943da1bb401SStefano Zampini       }
4944da1bb401SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n");
49450c7d97c5SJed Brown       for (j=mat_graph->cptr[i]; j<mat_graph->cptr[i+1]; j++){
4946da1bb401SStefano Zampini         /* ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d (%d), ",queue_in_global_numbering[j],mat_graph->queue[j]);CHKERRQ(ierr); */
4947da1bb401SStefano Zampini         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d, ",mat_graph->queue[j]);CHKERRQ(ierr);
49480c7d97c5SJed Brown       }
49490c7d97c5SJed Brown     }
4950da1bb401SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n--------------------------------------------------------------\n");CHKERRQ(ierr);
49513b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local vertices\n",PetscGlobalRank,nvc);CHKERRQ(ierr);
49523b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local faces\n",PetscGlobalRank,nfc);CHKERRQ(ierr);
49533b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local edges\n",PetscGlobalRank,nec);CHKERRQ(ierr);
4954d49ef151SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
49550c7d97c5SJed Brown   }
49560c7d97c5SJed Brown 
49573972b0daSStefano Zampini   ierr = PetscFree(queue_in_global_numbering);CHKERRQ(ierr);
49583972b0daSStefano Zampini   ierr = PetscFree(auxis);CHKERRQ(ierr);
49590c7d97c5SJed Brown   PetscFunctionReturn(0);
49600c7d97c5SJed Brown 
49610c7d97c5SJed Brown }
49620c7d97c5SJed Brown 
49630c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
49640c7d97c5SJed Brown 
/* The following code has been adapted from the function IsConnectedSubdomain contained
   in the source file contig.c of the METIS library (version 5.0.1).
   It finds the connected components of each partition, labeled from 1 to n_dist. */
49680c7d97c5SJed Brown 
49690c7d97c5SJed Brown #undef __FUNCT__
49700c7d97c5SJed Brown #define __FUNCT__ "PCBDDCFindConnectedComponents"
49719c0446d6SStefano Zampini static PetscErrorCode PCBDDCFindConnectedComponents(PCBDDCGraph graph, PetscInt n_dist )
49720c7d97c5SJed Brown {
49730c7d97c5SJed Brown   PetscInt i, j, k, nvtxs, first, last, nleft, ncmps,pid,cum_queue,n,ncmps_pid;
49740c7d97c5SJed Brown   PetscInt *xadj, *adjncy, *where, *queue;
49750c7d97c5SJed Brown   PetscInt *cptr;
49760c7d97c5SJed Brown   PetscBool *touched;
49770c7d97c5SJed Brown 
49780c7d97c5SJed Brown   PetscFunctionBegin;
49790c7d97c5SJed Brown 
49800c7d97c5SJed Brown   nvtxs   = graph->nvtxs;
49810c7d97c5SJed Brown   xadj    = graph->xadj;
49820c7d97c5SJed Brown   adjncy  = graph->adjncy;
49830c7d97c5SJed Brown   where   = graph->where;
49840c7d97c5SJed Brown   touched = graph->touched;
49850c7d97c5SJed Brown   queue   = graph->queue;
49860c7d97c5SJed Brown   cptr    = graph->cptr;
49870c7d97c5SJed Brown 
49880c7d97c5SJed Brown   for (i=0; i<nvtxs; i++)
49890c7d97c5SJed Brown     touched[i] = PETSC_FALSE;
49900c7d97c5SJed Brown 
49910c7d97c5SJed Brown   cum_queue=0;
49920c7d97c5SJed Brown   ncmps=0;
49930c7d97c5SJed Brown 
49940c7d97c5SJed Brown   for (n=0; n<n_dist; n++) {
4995da1bb401SStefano Zampini     pid = n+1;  /* partition labeled by 0 is discarded */
49960c7d97c5SJed Brown     nleft = 0;
49970c7d97c5SJed Brown     for (i=0; i<nvtxs; i++) {
49980c7d97c5SJed Brown       if (where[i] == pid)
49990c7d97c5SJed Brown         nleft++;
50000c7d97c5SJed Brown     }
50010c7d97c5SJed Brown     for (i=0; i<nvtxs; i++) {
50020c7d97c5SJed Brown       if (where[i] == pid)
50030c7d97c5SJed Brown         break;
50040c7d97c5SJed Brown     }
50050c7d97c5SJed Brown     touched[i] = PETSC_TRUE;
50060c7d97c5SJed Brown     queue[cum_queue] = i;
50070c7d97c5SJed Brown     first = 0; last = 1;
50080c7d97c5SJed Brown     cptr[ncmps] = cum_queue;  /* This actually points to queue */
50090c7d97c5SJed Brown     ncmps_pid = 0;
50100c7d97c5SJed Brown     while (first != nleft) {
50110c7d97c5SJed Brown       if (first == last) { /* Find another starting vertex */
50120c7d97c5SJed Brown         cptr[++ncmps] = first+cum_queue;
50130c7d97c5SJed Brown         ncmps_pid++;
50140c7d97c5SJed Brown         for (i=0; i<nvtxs; i++) {
50150c7d97c5SJed Brown           if (where[i] == pid && !touched[i])
50160c7d97c5SJed Brown             break;
50170c7d97c5SJed Brown         }
50180c7d97c5SJed Brown         queue[cum_queue+last] = i;
50190c7d97c5SJed Brown         last++;
50200c7d97c5SJed Brown         touched[i] = PETSC_TRUE;
50210c7d97c5SJed Brown       }
50220c7d97c5SJed Brown       i = queue[cum_queue+first];
50230c7d97c5SJed Brown       first++;
50240c7d97c5SJed Brown       for (j=xadj[i]; j<xadj[i+1]; j++) {
50250c7d97c5SJed Brown         k = adjncy[j];
50260c7d97c5SJed Brown         if (where[k] == pid && !touched[k]) {
50270c7d97c5SJed Brown           queue[cum_queue+last] = k;
50280c7d97c5SJed Brown           last++;
50290c7d97c5SJed Brown           touched[k] = PETSC_TRUE;
50300c7d97c5SJed Brown         }
50310c7d97c5SJed Brown       }
50320c7d97c5SJed Brown     }
50330c7d97c5SJed Brown     cptr[++ncmps] = first+cum_queue;
50340c7d97c5SJed Brown     ncmps_pid++;
50350c7d97c5SJed Brown     cum_queue=cptr[ncmps];
5036a0ba757dSStefano Zampini     graph->where_ncmps[n] = ncmps_pid;
50370c7d97c5SJed Brown   }
50380c7d97c5SJed Brown   graph->ncmps = ncmps;
50390c7d97c5SJed Brown 
50400c7d97c5SJed Brown   PetscFunctionReturn(0);
50410c7d97c5SJed Brown }
5042