xref: /petsc/src/ksp/pc/impls/bddc/bddc.c (revision 4fad6a165e29709c3e1e0764af817b7d288c45e2)
/* TODOLIST
   DofSplitting and DM attached to pc?
   Change SetNeumannBoundaries to SetNeumannBoundariesLocal and provide new SetNeumannBoundaries (same for Dirichlet)
     - change prec_type to switch_inexact_prec_type
   Inexact solvers: global preconditioner application is ready; ask the developers (Jed?) how best to implement Dohrmann's approach (PCSHELL?)
   change how to deal with the coarse problem (PCBDDCSetCoarseEnvironment):
     - simplify coarse problem structure -> PCBDDC or PCREDUNDANT, nothing else -> same comm for all levels?
     - remove coarse enums and allow use of PCBDDCGetCoarseKSP
     - remove metis dependency -> use MatPartitioning for multilevel -> Assemble serial adjacency in ManageLocalBoundaries?
   code refactoring:
     - pick up better names for static functions
   change options structure:
     - insert BDDC into MG framework?
   provide other ops? Ask the developers
   remove all unused printf
   man pages
*/
180c7d97c5SJed Brown 
/* ----------------------------------------------------------------------------------------------------------------------------------------------
   Implementation of BDDC preconditioner based on:
   C. Dohrmann "An approximate BDDC preconditioner", Numerical Linear Algebra with Applications Volume 14, Issue 2, pages 149-168, March 2007
   ---------------------------------------------------------------------------------------------------------------------------------------------- */
2353cdbc3dSStefano Zampini 
2453cdbc3dSStefano Zampini #include "bddc.h" /*I "petscpc.h" I*/  /* includes for fortran wrappers */
253b03a366Sstefano_zampini #include <petscblaslapack.h>
260c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
270c7d97c5SJed Brown #undef __FUNCT__
280c7d97c5SJed Brown #define __FUNCT__ "PCSetFromOptions_BDDC"
290c7d97c5SJed Brown PetscErrorCode PCSetFromOptions_BDDC(PC pc)
300c7d97c5SJed Brown {
310c7d97c5SJed Brown   PC_BDDC         *pcbddc = (PC_BDDC*)pc->data;
320c7d97c5SJed Brown   PetscErrorCode ierr;
330c7d97c5SJed Brown 
340c7d97c5SJed Brown   PetscFunctionBegin;
350c7d97c5SJed Brown   ierr = PetscOptionsHead("BDDC options");CHKERRQ(ierr);
360c7d97c5SJed Brown   /* Verbose debugging of main data structures */
37e269702eSStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_check_all"       ,"Verbose (debugging) output for PCBDDC"                       ,"none",pcbddc->dbg_flag      ,&pcbddc->dbg_flag      ,PETSC_NULL);CHKERRQ(ierr);
380c7d97c5SJed Brown   /* Some customization for default primal space */
39da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_vertices_only"   ,"Use only vertices in coarse space (i.e. discard constraints)","none",pcbddc->vertices_flag   ,&pcbddc->vertices_flag   ,PETSC_NULL);CHKERRQ(ierr);
40da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_constraints_only","Use only constraints in coarse space (i.e. discard vertices)","none",pcbddc->constraints_flag,&pcbddc->constraints_flag,PETSC_NULL);CHKERRQ(ierr);
41da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_faces_only"      ,"Use only faces among constraints of coarse space (i.e. discard edges)"         ,"none",pcbddc->faces_flag      ,&pcbddc->faces_flag      ,PETSC_NULL);CHKERRQ(ierr);
42da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_edges_only"      ,"Use only edges among constraints of coarse space (i.e. discard faces)"         ,"none",pcbddc->edges_flag      ,&pcbddc->edges_flag      ,PETSC_NULL);CHKERRQ(ierr);
430c7d97c5SJed Brown   /* Coarse solver context */
446c667b0aSStefano Zampini   static const char * const avail_coarse_problems[] = {"sequential","replicated","parallel","multilevel","CoarseProblemType","PC_BDDC_",0}; /*order of choiches depends on ENUM defined in bddc.h */
450c7d97c5SJed Brown   ierr = PetscOptionsEnum("-pc_bddc_coarse_problem_type","Set coarse problem type","none",avail_coarse_problems,(PetscEnum)pcbddc->coarse_problem_type,(PetscEnum*)&pcbddc->coarse_problem_type,PETSC_NULL);CHKERRQ(ierr);
460c7d97c5SJed Brown   /* Two different application of BDDC to the whole set of dofs, internal and interface */
470c7d97c5SJed Brown   ierr = PetscOptionsBool("-pc_bddc_switch_preconditioning_type","Switch between M_2 (default) and M_3 preconditioners (as defined by Dohrmann)","none",pcbddc->prec_type,&pcbddc->prec_type,PETSC_NULL);CHKERRQ(ierr);
48534831adSStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_use_change_of_basis","Use change of basis approach for primal space","none",pcbddc->usechangeofbasis,&pcbddc->usechangeofbasis,PETSC_NULL);CHKERRQ(ierr);
49534831adSStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_use_change_on_faces","Use change of basis approach for face constraints","none",pcbddc->usechangeonfaces,&pcbddc->usechangeonfaces,PETSC_NULL);CHKERRQ(ierr);
50534831adSStefano Zampini   pcbddc->usechangeonfaces = pcbddc->usechangeonfaces && pcbddc->usechangeofbasis;
510c7d97c5SJed Brown   ierr = PetscOptionsInt("-pc_bddc_coarsening_ratio","Set coarsening ratio used in multilevel coarsening","none",pcbddc->coarsening_ratio,&pcbddc->coarsening_ratio,PETSC_NULL);CHKERRQ(ierr);
52*4fad6a16SStefano Zampini   ierr = PetscOptionsInt("-pc_bddc_max_levels","Set maximum number of levels for multilevel","none",pcbddc->max_levels,&pcbddc->max_levels,PETSC_NULL);CHKERRQ(ierr);
530c7d97c5SJed Brown   ierr = PetscOptionsTail();CHKERRQ(ierr);
540c7d97c5SJed Brown   PetscFunctionReturn(0);
550c7d97c5SJed Brown }
560c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
570c7d97c5SJed Brown EXTERN_C_BEGIN
580c7d97c5SJed Brown #undef __FUNCT__
590c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetCoarseProblemType_BDDC"
6053cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetCoarseProblemType_BDDC(PC pc, CoarseProblemType CPT)
610c7d97c5SJed Brown {
620c7d97c5SJed Brown   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
630c7d97c5SJed Brown 
640c7d97c5SJed Brown   PetscFunctionBegin;
650c7d97c5SJed Brown   pcbddc->coarse_problem_type = CPT;
660c7d97c5SJed Brown   PetscFunctionReturn(0);
670c7d97c5SJed Brown }
680c7d97c5SJed Brown EXTERN_C_END
690c7d97c5SJed Brown #undef __FUNCT__
700c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetCoarseProblemType"
7153cdbc3dSStefano Zampini /*@
729c0446d6SStefano Zampini  PCBDDCSetCoarseProblemType - Set coarse problem type in PCBDDC.
7353cdbc3dSStefano Zampini 
749c0446d6SStefano Zampini    Not collective
7553cdbc3dSStefano Zampini 
7653cdbc3dSStefano Zampini    Input Parameters:
7753cdbc3dSStefano Zampini +  pc - the preconditioning context
7853cdbc3dSStefano Zampini -  CoarseProblemType - pick a better name and explain what this is
7953cdbc3dSStefano Zampini 
8053cdbc3dSStefano Zampini    Level: intermediate
8153cdbc3dSStefano Zampini 
8253cdbc3dSStefano Zampini    Notes:
83da1bb401SStefano Zampini    Not collective but all procs must call with same arguments.
8453cdbc3dSStefano Zampini 
8553cdbc3dSStefano Zampini .seealso: PCBDDC
8653cdbc3dSStefano Zampini @*/
870c7d97c5SJed Brown PetscErrorCode PCBDDCSetCoarseProblemType(PC pc, CoarseProblemType CPT)
880c7d97c5SJed Brown {
890c7d97c5SJed Brown   PetscErrorCode ierr;
900c7d97c5SJed Brown 
910c7d97c5SJed Brown   PetscFunctionBegin;
920c7d97c5SJed Brown   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
930c7d97c5SJed Brown   ierr = PetscTryMethod(pc,"PCBDDCSetCoarseProblemType_C",(PC,CoarseProblemType),(pc,CPT));CHKERRQ(ierr);
940c7d97c5SJed Brown   PetscFunctionReturn(0);
950c7d97c5SJed Brown }
960c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
970c7d97c5SJed Brown EXTERN_C_BEGIN
980c7d97c5SJed Brown #undef __FUNCT__
99*4fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetCoarseningRatio_BDDC"
100*4fad6a16SStefano Zampini static PetscErrorCode PCBDDCSetCoarseningRatio_BDDC(PC pc,PetscInt k)
101*4fad6a16SStefano Zampini {
102*4fad6a16SStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
103*4fad6a16SStefano Zampini 
104*4fad6a16SStefano Zampini   PetscFunctionBegin;
105*4fad6a16SStefano Zampini   pcbddc->coarsening_ratio=k;
106*4fad6a16SStefano Zampini   PetscFunctionReturn(0);
107*4fad6a16SStefano Zampini }
108*4fad6a16SStefano Zampini EXTERN_C_END
109*4fad6a16SStefano Zampini #undef __FUNCT__
110*4fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetCoarseningRatio"
111*4fad6a16SStefano Zampini /*@
112*4fad6a16SStefano Zampini  PCBDDCSetCoarseningRatio - Set coarsening ratio used in multilevel coarsening
113*4fad6a16SStefano Zampini 
114*4fad6a16SStefano Zampini    Logically collective on PC
115*4fad6a16SStefano Zampini 
116*4fad6a16SStefano Zampini    Input Parameters:
117*4fad6a16SStefano Zampini +  pc - the preconditioning context
118*4fad6a16SStefano Zampini -  k - coarsening ratio
119*4fad6a16SStefano Zampini 
120*4fad6a16SStefano Zampini    Approximatively k subdomains at the finer level will be aggregated into a single subdomain at the coarser level.
121*4fad6a16SStefano Zampini 
122*4fad6a16SStefano Zampini    Level: intermediate
123*4fad6a16SStefano Zampini 
124*4fad6a16SStefano Zampini    Notes:
125*4fad6a16SStefano Zampini 
126*4fad6a16SStefano Zampini .seealso: PCBDDC
127*4fad6a16SStefano Zampini @*/
128*4fad6a16SStefano Zampini PetscErrorCode PCBDDCSetCoarseningRatio(PC pc,PetscInt k)
129*4fad6a16SStefano Zampini {
130*4fad6a16SStefano Zampini   PetscErrorCode ierr;
131*4fad6a16SStefano Zampini 
132*4fad6a16SStefano Zampini   PetscFunctionBegin;
133*4fad6a16SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
134*4fad6a16SStefano Zampini   ierr = PetscTryMethod(pc,"PCBDDCSetCoarseningRatio_C",(PC,PetscInt),(pc,k));CHKERRQ(ierr);
135*4fad6a16SStefano Zampini   PetscFunctionReturn(0);
136*4fad6a16SStefano Zampini }
137*4fad6a16SStefano Zampini /* -------------------------------------------------------------------------- */
138*4fad6a16SStefano Zampini EXTERN_C_BEGIN
139*4fad6a16SStefano Zampini #undef __FUNCT__
140*4fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetMaxLevels_BDDC"
141*4fad6a16SStefano Zampini static PetscErrorCode PCBDDCSetMaxLevels_BDDC(PC pc,PetscInt max_levels)
142*4fad6a16SStefano Zampini {
143*4fad6a16SStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
144*4fad6a16SStefano Zampini 
145*4fad6a16SStefano Zampini   PetscFunctionBegin;
146*4fad6a16SStefano Zampini   pcbddc->max_levels=max_levels;
147*4fad6a16SStefano Zampini   PetscFunctionReturn(0);
148*4fad6a16SStefano Zampini }
149*4fad6a16SStefano Zampini EXTERN_C_END
150*4fad6a16SStefano Zampini #undef __FUNCT__
151*4fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetMaxLevels"
152*4fad6a16SStefano Zampini /*@
153*4fad6a16SStefano Zampini  PCBDDCSetMaxLevels - Sets the maximum number of levels within the multilevel approach.
154*4fad6a16SStefano Zampini 
155*4fad6a16SStefano Zampini    Logically collective on PC
156*4fad6a16SStefano Zampini 
157*4fad6a16SStefano Zampini    Input Parameters:
158*4fad6a16SStefano Zampini +  pc - the preconditioning context
159*4fad6a16SStefano Zampini -  max_levels - the maximum number of levels
160*4fad6a16SStefano Zampini 
161*4fad6a16SStefano Zampini    Default value is 1, i.e. coarse problem will be solved inexactly with one application
162*4fad6a16SStefano Zampini    of PCBDDC preconditioner if the multilevel approach is requested.
163*4fad6a16SStefano Zampini 
164*4fad6a16SStefano Zampini    Level: intermediate
165*4fad6a16SStefano Zampini 
166*4fad6a16SStefano Zampini    Notes:
167*4fad6a16SStefano Zampini 
168*4fad6a16SStefano Zampini .seealso: PCBDDC
169*4fad6a16SStefano Zampini @*/
170*4fad6a16SStefano Zampini PetscErrorCode PCBDDCSetMaxLevels(PC pc,PetscInt max_levels)
171*4fad6a16SStefano Zampini {
172*4fad6a16SStefano Zampini   PetscErrorCode ierr;
173*4fad6a16SStefano Zampini 
174*4fad6a16SStefano Zampini   PetscFunctionBegin;
175*4fad6a16SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
176*4fad6a16SStefano Zampini   ierr = PetscTryMethod(pc,"PCBDDCSetMaxLevels_C",(PC,PetscInt),(pc,max_levels));CHKERRQ(ierr);
177*4fad6a16SStefano Zampini   PetscFunctionReturn(0);
178*4fad6a16SStefano Zampini }
179*4fad6a16SStefano Zampini /* -------------------------------------------------------------------------- */
180*4fad6a16SStefano Zampini EXTERN_C_BEGIN
181*4fad6a16SStefano Zampini #undef __FUNCT__
1820bdf917eSStefano Zampini #define __FUNCT__ "PCBDDCSetNullSpace_BDDC"
1830bdf917eSStefano Zampini static PetscErrorCode PCBDDCSetNullSpace_BDDC(PC pc,MatNullSpace NullSpace)
1840bdf917eSStefano Zampini {
1850bdf917eSStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
1860bdf917eSStefano Zampini   PetscErrorCode ierr;
1870bdf917eSStefano Zampini 
1880bdf917eSStefano Zampini   PetscFunctionBegin;
1890bdf917eSStefano Zampini   ierr = PetscObjectReference((PetscObject)NullSpace);CHKERRQ(ierr);
1900bdf917eSStefano Zampini   ierr = MatNullSpaceDestroy(&pcbddc->NullSpace);CHKERRQ(ierr);
1910bdf917eSStefano Zampini   pcbddc->NullSpace=NullSpace;
1920bdf917eSStefano Zampini   PetscFunctionReturn(0);
1930bdf917eSStefano Zampini }
1940bdf917eSStefano Zampini EXTERN_C_END
1950bdf917eSStefano Zampini #undef __FUNCT__
1960bdf917eSStefano Zampini #define __FUNCT__ "PCBDDCSetNullSpace"
1970bdf917eSStefano Zampini /*@
1980bdf917eSStefano Zampini  PCBDDCSetNullSpace - Set NullSpace of global operator of BDDC preconditioned mat.
1990bdf917eSStefano Zampini 
2000bdf917eSStefano Zampini    Logically collective on PC and MatNullSpace
2010bdf917eSStefano Zampini 
2020bdf917eSStefano Zampini    Input Parameters:
2030bdf917eSStefano Zampini +  pc - the preconditioning context
2040bdf917eSStefano Zampini -  NullSpace - Null space of the linear operator to be preconditioned.
2050bdf917eSStefano Zampini 
2060bdf917eSStefano Zampini    Level: intermediate
2070bdf917eSStefano Zampini 
2080bdf917eSStefano Zampini    Notes:
2090bdf917eSStefano Zampini 
2100bdf917eSStefano Zampini .seealso: PCBDDC
2110bdf917eSStefano Zampini @*/
2120bdf917eSStefano Zampini PetscErrorCode PCBDDCSetNullSpace(PC pc,MatNullSpace NullSpace)
2130bdf917eSStefano Zampini {
2140bdf917eSStefano Zampini   PetscErrorCode ierr;
2150bdf917eSStefano Zampini 
2160bdf917eSStefano Zampini   PetscFunctionBegin;
2170bdf917eSStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
2180bdf917eSStefano Zampini   ierr = PetscTryMethod(pc,"PCBDDCSetNullSpace_C",(PC,MatNullSpace),(pc,NullSpace));CHKERRQ(ierr);
2190bdf917eSStefano Zampini   PetscFunctionReturn(0);
2200bdf917eSStefano Zampini }
2210bdf917eSStefano Zampini /* -------------------------------------------------------------------------- */
2220bdf917eSStefano Zampini EXTERN_C_BEGIN
2230bdf917eSStefano Zampini #undef __FUNCT__
2243b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCSetDirichletBoundaries_BDDC"
2253b03a366Sstefano_zampini static PetscErrorCode PCBDDCSetDirichletBoundaries_BDDC(PC pc,IS DirichletBoundaries)
2263b03a366Sstefano_zampini {
2273b03a366Sstefano_zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
2283b03a366Sstefano_zampini   PetscErrorCode ierr;
2293b03a366Sstefano_zampini 
2303b03a366Sstefano_zampini   PetscFunctionBegin;
2313b03a366Sstefano_zampini   ierr = ISDestroy(&pcbddc->DirichletBoundaries);CHKERRQ(ierr);
23236e030ebSStefano Zampini   ierr = PetscObjectReference((PetscObject)DirichletBoundaries);CHKERRQ(ierr);
23336e030ebSStefano Zampini   pcbddc->DirichletBoundaries=DirichletBoundaries;
2343b03a366Sstefano_zampini   PetscFunctionReturn(0);
2353b03a366Sstefano_zampini }
2363b03a366Sstefano_zampini EXTERN_C_END
2373b03a366Sstefano_zampini #undef __FUNCT__
2383b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCSetDirichletBoundaries"
2393b03a366Sstefano_zampini /*@
240da1bb401SStefano Zampini  PCBDDCSetDirichletBoundaries - Set index set defining subdomain part (in local ordering)
241da1bb401SStefano Zampini                               of Dirichlet boundaries for the global problem.
2423b03a366Sstefano_zampini 
2433b03a366Sstefano_zampini    Not collective
2443b03a366Sstefano_zampini 
2453b03a366Sstefano_zampini    Input Parameters:
2463b03a366Sstefano_zampini +  pc - the preconditioning context
2473b03a366Sstefano_zampini -  DirichletBoundaries - sequential index set defining the subdomain part of Dirichlet boundaries (can be PETSC_NULL)
2483b03a366Sstefano_zampini 
2493b03a366Sstefano_zampini    Level: intermediate
2503b03a366Sstefano_zampini 
2513b03a366Sstefano_zampini    Notes:
2523b03a366Sstefano_zampini 
2533b03a366Sstefano_zampini .seealso: PCBDDC
2543b03a366Sstefano_zampini @*/
2553b03a366Sstefano_zampini PetscErrorCode PCBDDCSetDirichletBoundaries(PC pc,IS DirichletBoundaries)
2563b03a366Sstefano_zampini {
2573b03a366Sstefano_zampini   PetscErrorCode ierr;
2583b03a366Sstefano_zampini 
2593b03a366Sstefano_zampini   PetscFunctionBegin;
2603b03a366Sstefano_zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
2613b03a366Sstefano_zampini   ierr = PetscTryMethod(pc,"PCBDDCSetDirichletBoundaries_C",(PC,IS),(pc,DirichletBoundaries));CHKERRQ(ierr);
2623b03a366Sstefano_zampini   PetscFunctionReturn(0);
2633b03a366Sstefano_zampini }
2643b03a366Sstefano_zampini /* -------------------------------------------------------------------------- */
2653b03a366Sstefano_zampini EXTERN_C_BEGIN
2663b03a366Sstefano_zampini #undef __FUNCT__
2670c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetNeumannBoundaries_BDDC"
26853cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetNeumannBoundaries_BDDC(PC pc,IS NeumannBoundaries)
2690c7d97c5SJed Brown {
2700c7d97c5SJed Brown   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
27153cdbc3dSStefano Zampini   PetscErrorCode ierr;
2720c7d97c5SJed Brown 
2730c7d97c5SJed Brown   PetscFunctionBegin;
27453cdbc3dSStefano Zampini   ierr = ISDestroy(&pcbddc->NeumannBoundaries);CHKERRQ(ierr);
27536e030ebSStefano Zampini   ierr = PetscObjectReference((PetscObject)NeumannBoundaries);CHKERRQ(ierr);
27636e030ebSStefano Zampini   pcbddc->NeumannBoundaries=NeumannBoundaries;
2770c7d97c5SJed Brown   PetscFunctionReturn(0);
2780c7d97c5SJed Brown }
2790c7d97c5SJed Brown EXTERN_C_END
2800c7d97c5SJed Brown #undef __FUNCT__
2810c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetNeumannBoundaries"
28257527edcSJed Brown /*@
283da1bb401SStefano Zampini  PCBDDCSetNeumannBoundaries - Set index set defining subdomain part (in local ordering)
284da1bb401SStefano Zampini                               of Neumann boundaries for the global problem.
28557527edcSJed Brown 
2869c0446d6SStefano Zampini    Not collective
28757527edcSJed Brown 
28857527edcSJed Brown    Input Parameters:
28957527edcSJed Brown +  pc - the preconditioning context
2909c0446d6SStefano Zampini -  NeumannBoundaries - sequential index set defining the subdomain part of Neumann boundaries (can be PETSC_NULL)
29157527edcSJed Brown 
29257527edcSJed Brown    Level: intermediate
29357527edcSJed Brown 
29457527edcSJed Brown    Notes:
29557527edcSJed Brown 
29657527edcSJed Brown .seealso: PCBDDC
29757527edcSJed Brown @*/
29853cdbc3dSStefano Zampini PetscErrorCode PCBDDCSetNeumannBoundaries(PC pc,IS NeumannBoundaries)
2990c7d97c5SJed Brown {
3000c7d97c5SJed Brown   PetscErrorCode ierr;
3010c7d97c5SJed Brown 
3020c7d97c5SJed Brown   PetscFunctionBegin;
3030c7d97c5SJed Brown   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
30453cdbc3dSStefano Zampini   ierr = PetscTryMethod(pc,"PCBDDCSetNeumannBoundaries_C",(PC,IS),(pc,NeumannBoundaries));CHKERRQ(ierr);
30553cdbc3dSStefano Zampini   PetscFunctionReturn(0);
30653cdbc3dSStefano Zampini }
30753cdbc3dSStefano Zampini /* -------------------------------------------------------------------------- */
30853cdbc3dSStefano Zampini EXTERN_C_BEGIN
30953cdbc3dSStefano Zampini #undef __FUNCT__
310da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCGetDirichletBoundaries_BDDC"
311da1bb401SStefano Zampini static PetscErrorCode PCBDDCGetDirichletBoundaries_BDDC(PC pc,IS *DirichletBoundaries)
312da1bb401SStefano Zampini {
313da1bb401SStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
314da1bb401SStefano Zampini 
315da1bb401SStefano Zampini   PetscFunctionBegin;
316da1bb401SStefano Zampini   *DirichletBoundaries = pcbddc->DirichletBoundaries;
317da1bb401SStefano Zampini   PetscFunctionReturn(0);
318da1bb401SStefano Zampini }
319da1bb401SStefano Zampini EXTERN_C_END
320da1bb401SStefano Zampini #undef __FUNCT__
321da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCGetDirichletBoundaries"
322da1bb401SStefano Zampini /*@
323da1bb401SStefano Zampini  PCBDDCGetDirichletBoundaries - Get index set defining subdomain part (in local ordering)
324da1bb401SStefano Zampini                                 of Dirichlet boundaries for the global problem.
325da1bb401SStefano Zampini 
326da1bb401SStefano Zampini    Not collective
327da1bb401SStefano Zampini 
328da1bb401SStefano Zampini    Input Parameters:
329da1bb401SStefano Zampini +  pc - the preconditioning context
330da1bb401SStefano Zampini 
331da1bb401SStefano Zampini    Output Parameters:
332da1bb401SStefano Zampini +  DirichletBoundaries - index set defining the subdomain part of Dirichlet boundaries
333da1bb401SStefano Zampini 
334da1bb401SStefano Zampini    Level: intermediate
335da1bb401SStefano Zampini 
336da1bb401SStefano Zampini    Notes:
337da1bb401SStefano Zampini 
338da1bb401SStefano Zampini .seealso: PCBDDC
339da1bb401SStefano Zampini @*/
340da1bb401SStefano Zampini PetscErrorCode PCBDDCGetDirichletBoundaries(PC pc,IS *DirichletBoundaries)
341da1bb401SStefano Zampini {
342da1bb401SStefano Zampini   PetscErrorCode ierr;
343da1bb401SStefano Zampini 
344da1bb401SStefano Zampini   PetscFunctionBegin;
345da1bb401SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
346da1bb401SStefano Zampini   ierr = PetscUseMethod(pc,"PCBDDCGetDirichletBoundaries_C",(PC,IS*),(pc,DirichletBoundaries));CHKERRQ(ierr);
347da1bb401SStefano Zampini   PetscFunctionReturn(0);
348da1bb401SStefano Zampini }
349da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
350da1bb401SStefano Zampini EXTERN_C_BEGIN
351da1bb401SStefano Zampini #undef __FUNCT__
35253cdbc3dSStefano Zampini #define __FUNCT__ "PCBDDCGetNeumannBoundaries_BDDC"
35353cdbc3dSStefano Zampini static PetscErrorCode PCBDDCGetNeumannBoundaries_BDDC(PC pc,IS *NeumannBoundaries)
35453cdbc3dSStefano Zampini {
35553cdbc3dSStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
35653cdbc3dSStefano Zampini 
35753cdbc3dSStefano Zampini   PetscFunctionBegin;
35853cdbc3dSStefano Zampini   *NeumannBoundaries = pcbddc->NeumannBoundaries;
35953cdbc3dSStefano Zampini   PetscFunctionReturn(0);
36053cdbc3dSStefano Zampini }
36153cdbc3dSStefano Zampini EXTERN_C_END
36253cdbc3dSStefano Zampini #undef __FUNCT__
36353cdbc3dSStefano Zampini #define __FUNCT__ "PCBDDCGetNeumannBoundaries"
36453cdbc3dSStefano Zampini /*@
365da1bb401SStefano Zampini  PCBDDCGetNeumannBoundaries - Get index set defining subdomain part (in local ordering)
366da1bb401SStefano Zampini                               of Neumann boundaries for the global problem.
36753cdbc3dSStefano Zampini 
3689c0446d6SStefano Zampini    Not collective
36953cdbc3dSStefano Zampini 
37053cdbc3dSStefano Zampini    Input Parameters:
37153cdbc3dSStefano Zampini +  pc - the preconditioning context
37253cdbc3dSStefano Zampini 
37353cdbc3dSStefano Zampini    Output Parameters:
37453cdbc3dSStefano Zampini +  NeumannBoundaries - index set defining the subdomain part of Neumann boundaries
37553cdbc3dSStefano Zampini 
37653cdbc3dSStefano Zampini    Level: intermediate
37753cdbc3dSStefano Zampini 
37853cdbc3dSStefano Zampini    Notes:
37953cdbc3dSStefano Zampini 
38053cdbc3dSStefano Zampini .seealso: PCBDDC
38153cdbc3dSStefano Zampini @*/
38253cdbc3dSStefano Zampini PetscErrorCode PCBDDCGetNeumannBoundaries(PC pc,IS *NeumannBoundaries)
38353cdbc3dSStefano Zampini {
38453cdbc3dSStefano Zampini   PetscErrorCode ierr;
38553cdbc3dSStefano Zampini 
38653cdbc3dSStefano Zampini   PetscFunctionBegin;
38753cdbc3dSStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
38853cdbc3dSStefano Zampini   ierr = PetscUseMethod(pc,"PCBDDCGetNeumannBoundaries_C",(PC,IS*),(pc,NeumannBoundaries));CHKERRQ(ierr);
3890c7d97c5SJed Brown   PetscFunctionReturn(0);
3900c7d97c5SJed Brown }
39136e030ebSStefano Zampini /* -------------------------------------------------------------------------- */
39236e030ebSStefano Zampini EXTERN_C_BEGIN
39336e030ebSStefano Zampini #undef __FUNCT__
394da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetLocalAdjacencyGraph_BDDC"
395da1bb401SStefano Zampini static PetscErrorCode PCBDDCSetLocalAdjacencyGraph_BDDC(PC pc, PetscInt nvtxs, PetscInt xadj[], PetscInt adjncy[], PetscCopyMode copymode)
39636e030ebSStefano Zampini {
39736e030ebSStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
398da1bb401SStefano Zampini   PCBDDCGraph    mat_graph=pcbddc->mat_graph;
399da1bb401SStefano Zampini   PetscErrorCode ierr;
40036e030ebSStefano Zampini 
40136e030ebSStefano Zampini   PetscFunctionBegin;
402da1bb401SStefano Zampini   mat_graph->nvtxs=nvtxs;
403da1bb401SStefano Zampini   ierr = PetscFree(mat_graph->xadj);CHKERRQ(ierr);
404da1bb401SStefano Zampini   ierr = PetscFree(mat_graph->adjncy);CHKERRQ(ierr);
405da1bb401SStefano Zampini   if (copymode == PETSC_COPY_VALUES) {
406da1bb401SStefano Zampini     ierr = PetscMalloc((mat_graph->nvtxs+1)*sizeof(PetscInt),&mat_graph->xadj);CHKERRQ(ierr);
407da1bb401SStefano Zampini     ierr = PetscMalloc(xadj[mat_graph->nvtxs]*sizeof(PetscInt),&mat_graph->adjncy);CHKERRQ(ierr);
408da1bb401SStefano Zampini     ierr = PetscMemcpy(mat_graph->xadj,xadj,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr);
409da1bb401SStefano Zampini     ierr = PetscMemcpy(mat_graph->adjncy,adjncy,xadj[mat_graph->nvtxs]*sizeof(PetscInt));CHKERRQ(ierr);
410da1bb401SStefano Zampini   } else if (copymode == PETSC_OWN_POINTER) {
411da1bb401SStefano Zampini     mat_graph->xadj=xadj;
412da1bb401SStefano Zampini     mat_graph->adjncy=adjncy;
413da1bb401SStefano Zampini   } else {
414da1bb401SStefano Zampini     SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_SUP,"Unsupported copy mode %d in %s\n",copymode,__FUNCT__);
415da1bb401SStefano Zampini   }
41636e030ebSStefano Zampini   PetscFunctionReturn(0);
41736e030ebSStefano Zampini }
41836e030ebSStefano Zampini EXTERN_C_END
41936e030ebSStefano Zampini #undef __FUNCT__
420da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetLocalAdjacencyGraph"
42136e030ebSStefano Zampini /*@
422da1bb401SStefano Zampini  PCBDDCSetLocalAdjacencyGraph - Set CSR graph of local matrix for use of PCBDDC.
42336e030ebSStefano Zampini 
42436e030ebSStefano Zampini    Not collective
42536e030ebSStefano Zampini 
42636e030ebSStefano Zampini    Input Parameters:
42736e030ebSStefano Zampini +  pc - the preconditioning context
428da1bb401SStefano Zampini -  nvtxs - number of local vertices of the graph
429da1bb401SStefano Zampini -  xadj, adjncy - the CSR graph
430da1bb401SStefano Zampini -  copymode - either PETSC_COPY_VALUES or PETSC_OWN_POINTER. In the former case the user must free the array passed in;
431da1bb401SStefano Zampini                                                              in the latter case, memory must be obtained with PetscMalloc.
43236e030ebSStefano Zampini 
43336e030ebSStefano Zampini    Level: intermediate
43436e030ebSStefano Zampini 
43536e030ebSStefano Zampini    Notes:
43636e030ebSStefano Zampini 
43736e030ebSStefano Zampini .seealso: PCBDDC
43836e030ebSStefano Zampini @*/
439da1bb401SStefano Zampini PetscErrorCode PCBDDCSetLocalAdjacencyGraph(PC pc,PetscInt nvtxs,PetscInt xadj[],PetscInt adjncy[], PetscCopyMode copymode)
44036e030ebSStefano Zampini {
441da1bb401SStefano Zampini   PetscInt       nrows,ncols;
442da1bb401SStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
44336e030ebSStefano Zampini   PetscErrorCode ierr;
44436e030ebSStefano Zampini 
44536e030ebSStefano Zampini   PetscFunctionBegin;
44636e030ebSStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
447da1bb401SStefano Zampini   ierr = MatGetSize(matis->A,&nrows,&ncols);CHKERRQ(ierr);
448da1bb401SStefano Zampini   if (nvtxs != nrows) {
449da1bb401SStefano Zampini     SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Local adjacency size %d passed in %s differs from local problem size %d!\n",nvtxs,__FUNCT__,nrows);
450da1bb401SStefano Zampini   } else {
451da1bb401SStefano Zampini     ierr = PetscTryMethod(pc,"PCBDDCSetLocalAdjacencyGraph_C",(PC,PetscInt,PetscInt[],PetscInt[],PetscCopyMode),(pc,nvtxs,xadj,adjncy,copymode));CHKERRQ(ierr);
452da1bb401SStefano Zampini   }
45336e030ebSStefano Zampini   PetscFunctionReturn(0);
45436e030ebSStefano Zampini }
4559c0446d6SStefano Zampini /* -------------------------------------------------------------------------- */
4569c0446d6SStefano Zampini EXTERN_C_BEGIN
4579c0446d6SStefano Zampini #undef __FUNCT__
4589c0446d6SStefano Zampini #define __FUNCT__ "PCBDDCSetDofsSplitting_BDDC"
4599c0446d6SStefano Zampini static PetscErrorCode PCBDDCSetDofsSplitting_BDDC(PC pc,PetscInt n_is, IS ISForDofs[])
4609c0446d6SStefano Zampini {
4619c0446d6SStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
4629c0446d6SStefano Zampini   PetscInt i;
4639c0446d6SStefano Zampini   PetscErrorCode ierr;
4649c0446d6SStefano Zampini 
4659c0446d6SStefano Zampini   PetscFunctionBegin;
466da1bb401SStefano Zampini   /* Destroy ISes if they were already set */
4679c0446d6SStefano Zampini   for (i=0;i<pcbddc->n_ISForDofs;i++) {
4689c0446d6SStefano Zampini     ierr = ISDestroy(&pcbddc->ISForDofs[i]);CHKERRQ(ierr);
4699c0446d6SStefano Zampini   }
470d11ae9bbSstefano_zampini   ierr = PetscFree(pcbddc->ISForDofs);CHKERRQ(ierr);
471da1bb401SStefano Zampini   /* allocate space then set */
4729c0446d6SStefano Zampini   ierr = PetscMalloc(n_is*sizeof(IS),&pcbddc->ISForDofs);CHKERRQ(ierr);
4739c0446d6SStefano Zampini   for (i=0;i<n_is;i++) {
474da1bb401SStefano Zampini     ierr = PetscObjectReference((PetscObject)ISForDofs[i]);CHKERRQ(ierr);
475da1bb401SStefano Zampini     pcbddc->ISForDofs[i]=ISForDofs[i];
4769c0446d6SStefano Zampini   }
4779c0446d6SStefano Zampini   pcbddc->n_ISForDofs=n_is;
4789c0446d6SStefano Zampini   PetscFunctionReturn(0);
4799c0446d6SStefano Zampini }
4809c0446d6SStefano Zampini EXTERN_C_END
4819c0446d6SStefano Zampini #undef __FUNCT__
4829c0446d6SStefano Zampini #define __FUNCT__ "PCBDDCSetDofsSplitting"
4839c0446d6SStefano Zampini /*@
484da1bb401SStefano Zampini  PCBDDCSetDofsSplitting - Set index sets defining fields of local mat.
4859c0446d6SStefano Zampini 
4869c0446d6SStefano Zampini    Not collective
4879c0446d6SStefano Zampini 
4889c0446d6SStefano Zampini    Input Parameters:
4899c0446d6SStefano Zampini +  pc - the preconditioning context
490da1bb401SStefano Zampini -  n - number of index sets defining the fields
491da1bb401SStefano Zampini -  IS[] - array of IS describing the fields
4929c0446d6SStefano Zampini 
4939c0446d6SStefano Zampini    Level: intermediate
4949c0446d6SStefano Zampini 
4959c0446d6SStefano Zampini    Notes:
4969c0446d6SStefano Zampini 
4979c0446d6SStefano Zampini .seealso: PCBDDC
4989c0446d6SStefano Zampini @*/
4999c0446d6SStefano Zampini PetscErrorCode PCBDDCSetDofsSplitting(PC pc,PetscInt n_is, IS ISForDofs[])
5009c0446d6SStefano Zampini {
5019c0446d6SStefano Zampini   PetscErrorCode ierr;
5029c0446d6SStefano Zampini 
5039c0446d6SStefano Zampini   PetscFunctionBegin;
5049c0446d6SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
5059c0446d6SStefano Zampini   ierr = PetscTryMethod(pc,"PCBDDCSetDofsSplitting_C",(PC,PetscInt,IS[]),(pc,n_is,ISForDofs));CHKERRQ(ierr);
5069c0446d6SStefano Zampini   PetscFunctionReturn(0);
5079c0446d6SStefano Zampini }
508da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
509534831adSStefano Zampini #undef __FUNCT__
510534831adSStefano Zampini #define __FUNCT__ "PCPreSolve_BDDC"
511534831adSStefano Zampini /* -------------------------------------------------------------------------- */
512534831adSStefano Zampini /*
513534831adSStefano Zampini    PCPreSolve_BDDC - Changes the right hand side and (if necessary) the initial
514534831adSStefano Zampini                      guess if a transformation of basis approach has been selected.
5159c0446d6SStefano Zampini 
516534831adSStefano Zampini    Input Parameter:
517534831adSStefano Zampini +  pc - the preconditioner contex
518534831adSStefano Zampini 
519534831adSStefano Zampini    Application Interface Routine: PCPreSolve()
520534831adSStefano Zampini 
521534831adSStefano Zampini    Notes:
522534831adSStefano Zampini    The interface routine PCPreSolve() is not usually called directly by
523534831adSStefano Zampini    the user, but instead is called by KSPSolve().
524534831adSStefano Zampini */
525534831adSStefano Zampini static PetscErrorCode PCPreSolve_BDDC(PC pc, KSP ksp, Vec rhs, Vec x)
526534831adSStefano Zampini {
527534831adSStefano Zampini   PetscErrorCode ierr;
528534831adSStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
529534831adSStefano Zampini   PC_IS          *pcis = (PC_IS*)(pc->data);
530534831adSStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
531534831adSStefano Zampini   Mat            temp_mat;
5323972b0daSStefano Zampini   IS             dirIS;
5333972b0daSStefano Zampini   PetscInt       dirsize,i,*is_indices;
5343972b0daSStefano Zampini   PetscScalar    *array_x,*array_diagonal;
5353972b0daSStefano Zampini   Vec            used_vec;
5363972b0daSStefano Zampini   PetscBool      guess_nonzero;
537534831adSStefano Zampini 
538534831adSStefano Zampini   PetscFunctionBegin;
5393972b0daSStefano Zampini   if (x) {
5403972b0daSStefano Zampini     ierr = PetscObjectReference((PetscObject)x);CHKERRQ(ierr);
5413972b0daSStefano Zampini     used_vec = x;
5423972b0daSStefano Zampini   } else {
5433972b0daSStefano Zampini     ierr = PetscObjectReference((PetscObject)pcbddc->temp_solution);CHKERRQ(ierr);
5443972b0daSStefano Zampini     used_vec = pcbddc->temp_solution;
5453972b0daSStefano Zampini     ierr = VecSet(used_vec,0.0);CHKERRQ(ierr);
5463972b0daSStefano Zampini   }
5473972b0daSStefano Zampini   /* hack into ksp data structure PCPreSolve comes earlier in src/ksp/ksp/interface/itfunc.c */
5483972b0daSStefano Zampini   if (ksp) {
5493972b0daSStefano Zampini     ierr = KSPGetInitialGuessNonzero(ksp,&guess_nonzero);CHKERRQ(ierr);
5503972b0daSStefano Zampini     if ( !guess_nonzero ) {
5513972b0daSStefano Zampini       ierr = VecSet(used_vec,0.0);CHKERRQ(ierr);
5523972b0daSStefano Zampini     }
5533972b0daSStefano Zampini   }
5543972b0daSStefano Zampini   /* store the original rhs */
5553972b0daSStefano Zampini   ierr = VecCopy(rhs,pcbddc->original_rhs);CHKERRQ(ierr);
5563972b0daSStefano Zampini 
5573972b0daSStefano Zampini   /* Take into account zeroed rows -> change rhs and store solution removed */
5583972b0daSStefano Zampini   ierr = MatGetDiagonal(pc->pmat,pcis->vec1_global);CHKERRQ(ierr);
5593972b0daSStefano Zampini   ierr = VecPointwiseDivide(pcis->vec1_global,rhs,pcis->vec1_global);CHKERRQ(ierr);
5603972b0daSStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5613972b0daSStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5623972b0daSStefano Zampini   ierr = VecScatterBegin(matis->ctx,used_vec,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5633972b0daSStefano Zampini   ierr = VecScatterEnd  (matis->ctx,used_vec,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5643972b0daSStefano Zampini   ierr = PCBDDCGetDirichletBoundaries(pc,&dirIS);CHKERRQ(ierr);
5653972b0daSStefano Zampini   if (dirIS) {
5663972b0daSStefano Zampini     ierr = ISGetSize(dirIS,&dirsize);CHKERRQ(ierr);
5673972b0daSStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array_x);CHKERRQ(ierr);
5683972b0daSStefano Zampini     ierr = VecGetArray(pcis->vec2_N,&array_diagonal);CHKERRQ(ierr);
5693972b0daSStefano Zampini     ierr = ISGetIndices(dirIS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
5703972b0daSStefano Zampini     for (i=0;i<dirsize;i++) {
5713972b0daSStefano Zampini       array_x[is_indices[i]]=array_diagonal[is_indices[i]];
5723972b0daSStefano Zampini     }
5733972b0daSStefano Zampini     ierr = ISRestoreIndices(dirIS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
5743972b0daSStefano Zampini     ierr = VecRestoreArray(pcis->vec2_N,&array_diagonal);CHKERRQ(ierr);
5753972b0daSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array_x);CHKERRQ(ierr);
5763972b0daSStefano Zampini   }
5773972b0daSStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
5783972b0daSStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
579b76ba322SStefano Zampini 
5803972b0daSStefano Zampini   /* remove the computed solution from the rhs */
5813972b0daSStefano Zampini   ierr = VecScale(used_vec,-1.0);CHKERRQ(ierr);
5823972b0daSStefano Zampini   ierr = MatMultAdd(pc->pmat,used_vec,rhs,rhs);CHKERRQ(ierr);
5833972b0daSStefano Zampini   ierr = VecScale(used_vec,-1.0);CHKERRQ(ierr);
584b76ba322SStefano Zampini 
585b76ba322SStefano Zampini   /* store partially computed solution and set initial guess */
5863972b0daSStefano Zampini   if (x) {
5873972b0daSStefano Zampini     ierr = VecCopy(used_vec,pcbddc->temp_solution);CHKERRQ(ierr);
5883972b0daSStefano Zampini     ierr = VecSet(used_vec,0.0);CHKERRQ(ierr);
589b76ba322SStefano Zampini     if (pcbddc->use_exact_dirichlet) {
590b76ba322SStefano Zampini       ierr = VecScatterBegin(pcis->global_to_D,rhs,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
591b76ba322SStefano Zampini       ierr = VecScatterEnd  (pcis->global_to_D,rhs,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
592b76ba322SStefano Zampini       ierr = KSPSolve(pcbddc->ksp_D,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
593b76ba322SStefano Zampini       ierr = VecScatterBegin(pcis->global_to_D,pcis->vec2_D,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
594b76ba322SStefano Zampini       ierr = VecScatterEnd  (pcis->global_to_D,pcis->vec2_D,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
595b76ba322SStefano Zampini       if (ksp) {
596b76ba322SStefano Zampini         ierr = KSPSetInitialGuessNonzero(ksp,PETSC_TRUE);CHKERRQ(ierr);
597b76ba322SStefano Zampini       }
598b76ba322SStefano Zampini     }
5993972b0daSStefano Zampini   }
600b76ba322SStefano Zampini 
601b76ba322SStefano Zampini   /* rhs change of basis */
602b76ba322SStefano Zampini   if (pcbddc->usechangeofbasis) {
603b76ba322SStefano Zampini     /* swap pointers for local matrices */
604b76ba322SStefano Zampini     temp_mat = matis->A;
605b76ba322SStefano Zampini     matis->A = pcbddc->local_mat;
606b76ba322SStefano Zampini     pcbddc->local_mat = temp_mat;
607b76ba322SStefano Zampini     /* Get local rhs and apply transformation of basis */
608b76ba322SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,rhs,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
609b76ba322SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,rhs,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
610b76ba322SStefano Zampini     /* from original basis to modified basis */
611b76ba322SStefano Zampini     ierr = MatMultTranspose(pcbddc->ChangeOfBasisMatrix,pcis->vec1_B,pcis->vec2_B);CHKERRQ(ierr);
612b76ba322SStefano Zampini     /* put back modified values into the global vec using INSERT_VALUES copy mode */
613b76ba322SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec2_B,rhs,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
614b76ba322SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec2_B,rhs,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
6150bdf917eSStefano Zampini     if (ksp && pcbddc->NullSpace) {
6160bdf917eSStefano Zampini       ierr = MatNullSpaceRemove(pcbddc->NullSpace,used_vec,PETSC_NULL);CHKERRQ(ierr);
6170bdf917eSStefano Zampini       ierr = MatNullSpaceRemove(pcbddc->NullSpace,rhs,PETSC_NULL);CHKERRQ(ierr);
618b76ba322SStefano Zampini     }
6190bdf917eSStefano Zampini   }
6200bdf917eSStefano Zampini   ierr = VecDestroy(&used_vec);CHKERRQ(ierr);
621534831adSStefano Zampini   PetscFunctionReturn(0);
622534831adSStefano Zampini }
623534831adSStefano Zampini /* -------------------------------------------------------------------------- */
624534831adSStefano Zampini #undef __FUNCT__
625534831adSStefano Zampini #define __FUNCT__ "PCPostSolve_BDDC"
626534831adSStefano Zampini /* -------------------------------------------------------------------------- */
627534831adSStefano Zampini /*
628534831adSStefano Zampini    PCPostSolve_BDDC - Changes the computed solution if a transformation of basis
629534831adSStefano Zampini                      approach has been selected. Also, restores rhs to its original state.
630534831adSStefano Zampini 
631534831adSStefano Zampini    Input Parameter:
632534831adSStefano Zampini +  pc - the preconditioner contex
633534831adSStefano Zampini 
634534831adSStefano Zampini    Application Interface Routine: PCPostSolve()
635534831adSStefano Zampini 
636534831adSStefano Zampini    Notes:
637534831adSStefano Zampini    The interface routine PCPostSolve() is not usually called directly by
638534831adSStefano Zampini    the user, but instead is called by KSPSolve().
639534831adSStefano Zampini */
640534831adSStefano Zampini static PetscErrorCode PCPostSolve_BDDC(PC pc, KSP ksp, Vec rhs, Vec x)
641534831adSStefano Zampini {
642534831adSStefano Zampini   PetscErrorCode ierr;
643534831adSStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
644534831adSStefano Zampini   PC_IS          *pcis = (PC_IS*)(pc->data);
645534831adSStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
646534831adSStefano Zampini   Mat            temp_mat;
647534831adSStefano Zampini 
648534831adSStefano Zampini   PetscFunctionBegin;
649534831adSStefano Zampini   if (pcbddc->usechangeofbasis) {
650534831adSStefano Zampini     /* swap pointers for local matrices */
651534831adSStefano Zampini     temp_mat = matis->A;
652534831adSStefano Zampini     matis->A = pcbddc->local_mat;
653534831adSStefano Zampini     pcbddc->local_mat = temp_mat;
654534831adSStefano Zampini     /* restore rhs to its original state */
6553425bc38SStefano Zampini     if (rhs) {
6563425bc38SStefano Zampini       ierr = VecCopy(pcbddc->original_rhs,rhs);CHKERRQ(ierr);
6573425bc38SStefano Zampini     }
658534831adSStefano Zampini     /* Get Local boundary and apply transformation of basis to solution vector */
659534831adSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,x,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
660534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,x,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
661534831adSStefano Zampini     /* from modified basis to original basis */
662534831adSStefano Zampini     ierr = MatMult(pcbddc->ChangeOfBasisMatrix,pcis->vec1_B,pcis->vec2_B);CHKERRQ(ierr);
663534831adSStefano Zampini     /* put back modified values into the global vec using INSERT_VALUES copy mode */
664534831adSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec2_B,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
665534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec2_B,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
666534831adSStefano Zampini   }
6673972b0daSStefano Zampini   /* add solution removed in presolve */
6683425bc38SStefano Zampini   if (x) {
6693425bc38SStefano Zampini     ierr = VecAXPY(x,1.0,pcbddc->temp_solution);CHKERRQ(ierr);
6703425bc38SStefano Zampini   }
671534831adSStefano Zampini   PetscFunctionReturn(0);
672534831adSStefano Zampini }
673534831adSStefano Zampini /* -------------------------------------------------------------------------- */
67453cdbc3dSStefano Zampini #undef __FUNCT__
67553cdbc3dSStefano Zampini #define __FUNCT__ "PCSetUp_BDDC"
6760c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
6770c7d97c5SJed Brown /*
6780c7d97c5SJed Brown    PCSetUp_BDDC - Prepares for the use of the BDDC preconditioner
6790c7d97c5SJed Brown                   by setting data structures and options.
6800c7d97c5SJed Brown 
6810c7d97c5SJed Brown    Input Parameter:
68253cdbc3dSStefano Zampini +  pc - the preconditioner context
6830c7d97c5SJed Brown 
6840c7d97c5SJed Brown    Application Interface Routine: PCSetUp()
6850c7d97c5SJed Brown 
6860c7d97c5SJed Brown    Notes:
6870c7d97c5SJed Brown    The interface routine PCSetUp() is not usually called directly by
6880c7d97c5SJed Brown    the user, but instead is called by PCApply() if necessary.
6890c7d97c5SJed Brown */
69053cdbc3dSStefano Zampini PetscErrorCode PCSetUp_BDDC(PC pc)
6910c7d97c5SJed Brown {
6920c7d97c5SJed Brown   PetscErrorCode ierr;
6930c7d97c5SJed Brown   PC_BDDC*       pcbddc   = (PC_BDDC*)pc->data;
6940c7d97c5SJed Brown 
6950c7d97c5SJed Brown   PetscFunctionBegin;
6960c7d97c5SJed Brown   if (!pc->setupcalled) {
6973b03a366Sstefano_zampini     /* For BDDC we need to define a local "Neumann" problem different to that defined in PCISSetup
6989c0446d6SStefano Zampini        So, we set to pcnone the Neumann problem of pcis in order to avoid unneeded computation
6990c7d97c5SJed Brown        Also, we decide to directly build the (same) Dirichlet problem */
7000c7d97c5SJed Brown     ierr = PetscOptionsSetValue("-is_localN_pc_type","none");CHKERRQ(ierr);
7010c7d97c5SJed Brown     ierr = PetscOptionsSetValue("-is_localD_pc_type","none");CHKERRQ(ierr);
7020c7d97c5SJed Brown     /* Set up all the "iterative substructuring" common block */
7030bdf917eSStefano Zampini 
7040c7d97c5SJed Brown     ierr = PCISSetUp(pc);CHKERRQ(ierr);
7053b03a366Sstefano_zampini     /* Get stdout for dbg */
706e269702eSStefano Zampini     if (pcbddc->dbg_flag) {
707e269702eSStefano Zampini       ierr = PetscViewerASCIIGetStdout(((PetscObject)pc)->comm,&pcbddc->dbg_viewer);CHKERRQ(ierr);
708e269702eSStefano Zampini       ierr = PetscViewerASCIISynchronizedAllow(pcbddc->dbg_viewer,PETSC_TRUE);CHKERRQ(ierr);
709e269702eSStefano Zampini     }
7103b03a366Sstefano_zampini     /* Analyze local interface */
7110c7d97c5SJed Brown     ierr = PCBDDCManageLocalBoundaries(pc);CHKERRQ(ierr);
7123b03a366Sstefano_zampini     /* Set up local constraint matrix */
7133b03a366Sstefano_zampini     ierr = PCBDDCCreateConstraintMatrix(pc);CHKERRQ(ierr);
7140c7d97c5SJed Brown     /* Create coarse and local stuffs used for evaluating action of preconditioner */
7150c7d97c5SJed Brown     ierr = PCBDDCCoarseSetUp(pc);CHKERRQ(ierr);
7160c7d97c5SJed Brown   }
7170c7d97c5SJed Brown   PetscFunctionReturn(0);
7180c7d97c5SJed Brown }
7190c7d97c5SJed Brown 
7200c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
7210c7d97c5SJed Brown /*
7220c7d97c5SJed Brown    PCApply_BDDC - Applies the BDDC preconditioner to a vector.
7230c7d97c5SJed Brown 
7240c7d97c5SJed Brown    Input Parameters:
7250c7d97c5SJed Brown .  pc - the preconditioner context
7260c7d97c5SJed Brown .  r - input vector (global)
7270c7d97c5SJed Brown 
7280c7d97c5SJed Brown    Output Parameter:
7290c7d97c5SJed Brown .  z - output vector (global)
7300c7d97c5SJed Brown 
7310c7d97c5SJed Brown    Application Interface Routine: PCApply()
7320c7d97c5SJed Brown  */
7330c7d97c5SJed Brown #undef __FUNCT__
7340c7d97c5SJed Brown #define __FUNCT__ "PCApply_BDDC"
73553cdbc3dSStefano Zampini PetscErrorCode PCApply_BDDC(PC pc,Vec r,Vec z)
7360c7d97c5SJed Brown {
7370c7d97c5SJed Brown   PC_IS             *pcis = (PC_IS*)(pc->data);
7380c7d97c5SJed Brown   PC_BDDC           *pcbddc = (PC_BDDC*)(pc->data);
7390c7d97c5SJed Brown   PetscErrorCode    ierr;
7403b03a366Sstefano_zampini   const PetscScalar one = 1.0;
7413b03a366Sstefano_zampini   const PetscScalar m_one = -1.0;
7422617d88aSStefano Zampini   const PetscScalar zero = 0.0;
7430c7d97c5SJed Brown 
7440c7d97c5SJed Brown /* This code is similar to that provided in nn.c for PCNN
7450c7d97c5SJed Brown    NN interface preconditioner changed to BDDC
7460c7d97c5SJed Brown    Added support for M_3 preconditioenr in the reference article (code is active if pcbddc->prec_type = PETSC_TRUE) */
7470c7d97c5SJed Brown 
7480c7d97c5SJed Brown   PetscFunctionBegin;
749b76ba322SStefano Zampini   if (!pcbddc->use_exact_dirichlet) {
7500c7d97c5SJed Brown     /* First Dirichlet solve */
7510c7d97c5SJed Brown     ierr = VecScatterBegin(pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7520c7d97c5SJed Brown     ierr = VecScatterEnd  (pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
75353cdbc3dSStefano Zampini     ierr = KSPSolve(pcbddc->ksp_D,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
7540c7d97c5SJed Brown     /*
7550c7d97c5SJed Brown       Assembling right hand side for BDDC operator
7560c7d97c5SJed Brown       - vec1_D for the Dirichlet part (if needed, i.e. prec_flag=PETSC_TRUE)
7570c7d97c5SJed Brown       - the interface part of the global vector z
7580c7d97c5SJed Brown     */
7590c7d97c5SJed Brown     ierr = VecScale(pcis->vec2_D,m_one);CHKERRQ(ierr);
7600c7d97c5SJed Brown     ierr = MatMult(pcis->A_BI,pcis->vec2_D,pcis->vec1_B);CHKERRQ(ierr);
7610c7d97c5SJed Brown     if (pcbddc->prec_type) { ierr = MatMultAdd(pcis->A_II,pcis->vec2_D,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); }
7620c7d97c5SJed Brown     ierr = VecScale(pcis->vec2_D,m_one);CHKERRQ(ierr);
7630c7d97c5SJed Brown     ierr = VecCopy(r,z);CHKERRQ(ierr);
7640c7d97c5SJed Brown     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
7650c7d97c5SJed Brown     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
7662617d88aSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7672617d88aSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
768b76ba322SStefano Zampini   } else {
769b76ba322SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,r,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
770b76ba322SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,r,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7710bdf917eSStefano Zampini     ierr = VecSet(pcis->vec1_D,zero);CHKERRQ(ierr);
772b76ba322SStefano Zampini     ierr = VecSet(pcis->vec2_D,zero);CHKERRQ(ierr);
773b76ba322SStefano Zampini   }
774b76ba322SStefano Zampini 
775b76ba322SStefano Zampini   /* Apply partition of unity */
7762617d88aSStefano Zampini   ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr);
7772617d88aSStefano Zampini 
7782617d88aSStefano Zampini   /* Apply interface preconditioner
7792617d88aSStefano Zampini      input/output vecs: pcis->vec1_B and pcis->vec1_D */
7802617d88aSStefano Zampini   ierr = PCBDDCApplyInterfacePreconditioner(pc);CHKERRQ(ierr);
7812617d88aSStefano Zampini 
7822617d88aSStefano Zampini   /* Apply partition of unity and sum boundary values */
7832617d88aSStefano Zampini   ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr);
7842617d88aSStefano Zampini   ierr = VecSet(z,zero);CHKERRQ(ierr);
7852617d88aSStefano Zampini   ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
7862617d88aSStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
7870c7d97c5SJed Brown 
7883b03a366Sstefano_zampini   /* Second Dirichlet solve and assembling of output */
7890c7d97c5SJed Brown   ierr = VecScatterBegin(pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7900c7d97c5SJed Brown   ierr = VecScatterEnd  (pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7910c7d97c5SJed Brown   ierr = MatMult(pcis->A_IB,pcis->vec1_B,pcis->vec3_D);CHKERRQ(ierr);
7920c7d97c5SJed Brown   if (pcbddc->prec_type) { ierr = MatMultAdd(pcis->A_II,pcis->vec1_D,pcis->vec3_D,pcis->vec3_D);CHKERRQ(ierr); }
79353cdbc3dSStefano Zampini   ierr = KSPSolve(pcbddc->ksp_D,pcis->vec3_D,pcbddc->vec4_D);CHKERRQ(ierr);
7940c7d97c5SJed Brown   ierr = VecScale(pcbddc->vec4_D,m_one);CHKERRQ(ierr);
7950c7d97c5SJed Brown   if (pcbddc->prec_type) { ierr = VecAXPY (pcbddc->vec4_D,one,pcis->vec1_D);CHKERRQ(ierr); }
7960c7d97c5SJed Brown   ierr = VecAXPY (pcis->vec2_D,one,pcbddc->vec4_D);CHKERRQ(ierr);
7970c7d97c5SJed Brown   ierr = VecScatterBegin(pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
7980c7d97c5SJed Brown   ierr = VecScatterEnd  (pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
7990c7d97c5SJed Brown   PetscFunctionReturn(0);
8000c7d97c5SJed Brown 
8010c7d97c5SJed Brown }
802da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
803da1bb401SStefano Zampini #undef __FUNCT__
804da1bb401SStefano Zampini #define __FUNCT__ "PCDestroy_BDDC"
805da1bb401SStefano Zampini PetscErrorCode PCDestroy_BDDC(PC pc)
806da1bb401SStefano Zampini {
807da1bb401SStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
8080bdf917eSStefano Zampini   PetscInt       i;
809da1bb401SStefano Zampini   PetscErrorCode ierr;
810da1bb401SStefano Zampini 
811da1bb401SStefano Zampini   PetscFunctionBegin;
812da1bb401SStefano Zampini   /* free data created by PCIS */
813da1bb401SStefano Zampini   ierr = PCISDestroy(pc);CHKERRQ(ierr);
814da1bb401SStefano Zampini   /* free BDDC data  */
8150bdf917eSStefano Zampini   ierr = MatNullSpaceDestroy(&pcbddc->CoarseNullSpace);CHKERRQ(ierr);
8160bdf917eSStefano Zampini   ierr = MatNullSpaceDestroy(&pcbddc->NullSpace);CHKERRQ(ierr);
8173972b0daSStefano Zampini   ierr = VecDestroy(&pcbddc->temp_solution);CHKERRQ(ierr);
818534831adSStefano Zampini   ierr = VecDestroy(&pcbddc->original_rhs);CHKERRQ(ierr);
819534831adSStefano Zampini   ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr);
820534831adSStefano Zampini   ierr = MatDestroy(&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr);
821da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->coarse_vec);CHKERRQ(ierr);
822da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->coarse_rhs);CHKERRQ(ierr);
823da1bb401SStefano Zampini   ierr = KSPDestroy(&pcbddc->coarse_ksp);CHKERRQ(ierr);
824da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->coarse_mat);CHKERRQ(ierr);
825da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->coarse_phi_B);CHKERRQ(ierr);
826da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->coarse_phi_D);CHKERRQ(ierr);
827da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec1_P);CHKERRQ(ierr);
828da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec1_C);CHKERRQ(ierr);
829da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->local_auxmat1);CHKERRQ(ierr);
830da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->local_auxmat2);CHKERRQ(ierr);
831da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec1_R);CHKERRQ(ierr);
832da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec2_R);CHKERRQ(ierr);
833da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec4_D);CHKERRQ(ierr);
834da1bb401SStefano Zampini   ierr = VecScatterDestroy(&pcbddc->R_to_B);CHKERRQ(ierr);
835da1bb401SStefano Zampini   ierr = VecScatterDestroy(&pcbddc->R_to_D);CHKERRQ(ierr);
836da1bb401SStefano Zampini   ierr = VecScatterDestroy(&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr);
837da1bb401SStefano Zampini   ierr = KSPDestroy(&pcbddc->ksp_D);CHKERRQ(ierr);
838da1bb401SStefano Zampini   ierr = KSPDestroy(&pcbddc->ksp_R);CHKERRQ(ierr);
839da1bb401SStefano Zampini   ierr = ISDestroy(&pcbddc->NeumannBoundaries);CHKERRQ(ierr);
840da1bb401SStefano Zampini   ierr = ISDestroy(&pcbddc->DirichletBoundaries);CHKERRQ(ierr);
841da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->ConstraintMatrix);CHKERRQ(ierr);
842da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->local_primal_indices);CHKERRQ(ierr);
843da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->replicated_local_primal_indices);CHKERRQ(ierr);
8440bdf917eSStefano Zampini   ierr = PetscFree(pcbddc->replicated_local_primal_values);CHKERRQ(ierr);
845da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->local_primal_displacements);CHKERRQ(ierr);
846da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->local_primal_sizes);CHKERRQ(ierr);
847da1bb401SStefano Zampini   for (i=0;i<pcbddc->n_ISForDofs;i++) { ierr = ISDestroy(&pcbddc->ISForDofs[i]);CHKERRQ(ierr); }
848da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->ISForDofs);CHKERRQ(ierr);
849da1bb401SStefano Zampini   for (i=0;i<pcbddc->n_ISForFaces;i++) { ierr = ISDestroy(&pcbddc->ISForFaces[i]);CHKERRQ(ierr); }
850da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->ISForFaces);CHKERRQ(ierr);
851da1bb401SStefano Zampini   for (i=0;i<pcbddc->n_ISForEdges;i++) { ierr = ISDestroy(&pcbddc->ISForEdges[i]);CHKERRQ(ierr); }
852da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->ISForEdges);CHKERRQ(ierr);
853da1bb401SStefano Zampini   ierr = ISDestroy(&pcbddc->ISForVertices);CHKERRQ(ierr);
8543972b0daSStefano Zampini   /* Free graph structure */
855da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->xadj);CHKERRQ(ierr);
856da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->adjncy);CHKERRQ(ierr);
857142dfd88SStefano Zampini   if (pcbddc->mat_graph->nvtxs) {
858da1bb401SStefano Zampini     ierr = PetscFree(pcbddc->mat_graph->neighbours_set[0]);CHKERRQ(ierr);
859142dfd88SStefano Zampini   }
860da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->neighbours_set);CHKERRQ(ierr);
8613972b0daSStefano Zampini   ierr = PetscFree4(pcbddc->mat_graph->where,pcbddc->mat_graph->count,pcbddc->mat_graph->cptr,pcbddc->mat_graph->queue);CHKERRQ(ierr);
8623972b0daSStefano Zampini   ierr = PetscFree2(pcbddc->mat_graph->which_dof,pcbddc->mat_graph->touched);CHKERRQ(ierr);
8633972b0daSStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->where_ncmps);CHKERRQ(ierr);
864da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph);CHKERRQ(ierr);
8653425bc38SStefano Zampini   /* remove functions */
866*4fad6a16SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseningRatio_C","",PETSC_NULL);CHKERRQ(ierr);
867*4fad6a16SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetMaxLevels_C","",PETSC_NULL);CHKERRQ(ierr);
8680bdf917eSStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNullSpace_C","",PETSC_NULL);CHKERRQ(ierr);
8693425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDirichletBoundaries_C","",PETSC_NULL);CHKERRQ(ierr);
8703425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNeumannBoundaries_C","",PETSC_NULL);CHKERRQ(ierr);
8713425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetDirichletBoundaries_C","",PETSC_NULL);CHKERRQ(ierr);
8723425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetNeumannBoundaries_C","",PETSC_NULL);CHKERRQ(ierr);
8733425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseProblemType_C","",PETSC_NULL);CHKERRQ(ierr);
8743425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDofsSplitting_C","",PETSC_NULL);CHKERRQ(ierr);
8753425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetLocalAdjacencyGraph_C","",PETSC_NULL);CHKERRQ(ierr);
8763425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPreSolve_C","",PETSC_NULL);CHKERRQ(ierr);
8773425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPostSolve_C","",PETSC_NULL);CHKERRQ(ierr);
8783425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCCreateFETIDPOperators_C","",PETSC_NULL);CHKERRQ(ierr);
8793425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetRHS_C","",PETSC_NULL);CHKERRQ(ierr);
8803425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetSolution_C","",PETSC_NULL);CHKERRQ(ierr);
881da1bb401SStefano Zampini   /* Free the private data structure that was hanging off the PC */
882da1bb401SStefano Zampini   ierr = PetscFree(pcbddc);CHKERRQ(ierr);
883da1bb401SStefano Zampini   PetscFunctionReturn(0);
884da1bb401SStefano Zampini }
8853425bc38SStefano Zampini /* -------------------------------------------------------------------------- */
8863425bc38SStefano Zampini EXTERN_C_BEGIN
8873425bc38SStefano Zampini #undef __FUNCT__
8883425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetRHS_BDDC"
8893425bc38SStefano Zampini static PetscErrorCode PCBDDCMatFETIDPGetRHS_BDDC(Mat fetidp_mat, Vec standard_rhs, Vec fetidp_flux_rhs)
8903425bc38SStefano Zampini {
8913425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
8923425bc38SStefano Zampini   PC_IS*         pcis;
8933425bc38SStefano Zampini   PC_BDDC*       pcbddc;
8943425bc38SStefano Zampini   Mat_IS*        matis;
8953425bc38SStefano Zampini   PetscErrorCode ierr;
8960c7d97c5SJed Brown 
8973425bc38SStefano Zampini   PetscFunctionBegin;
8983425bc38SStefano Zampini   ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr);
8993425bc38SStefano Zampini   pcis = (PC_IS*)mat_ctx->pc->data;
9003425bc38SStefano Zampini   pcbddc = (PC_BDDC*)mat_ctx->pc->data;
9013425bc38SStefano Zampini   matis = (Mat_IS*)mat_ctx->pc->pmat->data;
9023425bc38SStefano Zampini 
9033425bc38SStefano Zampini   /* change of basis for physical rhs if needed
9043425bc38SStefano Zampini      It also changes the rhs in case of dirichlet boundaries */
9053425bc38SStefano Zampini   (*mat_ctx->pc->ops->presolve)(mat_ctx->pc,PETSC_NULL,standard_rhs,PETSC_NULL);
9063425bc38SStefano Zampini   /* store vectors for computation of fetidp final solution */
9073425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->global_to_D,standard_rhs,mat_ctx->temp_solution_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9083425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_D,standard_rhs,mat_ctx->temp_solution_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9093425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9103425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9113425bc38SStefano Zampini   /* scale rhs since it should be unassembled */
9123425bc38SStefano Zampini   ierr = VecPointwiseMult(mat_ctx->temp_solution_B,pcis->D,mat_ctx->temp_solution_B);CHKERRQ(ierr);
9133425bc38SStefano Zampini   if (!pcbddc->prec_type) {
9143425bc38SStefano Zampini     /* compute partially subassembled Schur complement right-hand side */
9153425bc38SStefano Zampini     ierr = KSPSolve(pcbddc->ksp_D,mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr);
9163425bc38SStefano Zampini     ierr = MatMult(pcis->A_BI,pcis->vec1_D,pcis->vec1_B);CHKERRQ(ierr);
9173425bc38SStefano Zampini     ierr = VecAXPY(mat_ctx->temp_solution_B,-1.0,pcis->vec1_B);CHKERRQ(ierr);
9183425bc38SStefano Zampini     ierr = VecSet(standard_rhs,0.0);CHKERRQ(ierr);
9193425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,mat_ctx->temp_solution_B,standard_rhs,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
9203425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,mat_ctx->temp_solution_B,standard_rhs,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
9213425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9223425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9233425bc38SStefano Zampini     ierr = VecPointwiseMult(mat_ctx->temp_solution_B,pcis->D,mat_ctx->temp_solution_B);CHKERRQ(ierr);
9243425bc38SStefano Zampini   }
9253425bc38SStefano Zampini   /* BDDC rhs */
9263425bc38SStefano Zampini   ierr = VecCopy(mat_ctx->temp_solution_B,pcis->vec1_B);CHKERRQ(ierr);
9273425bc38SStefano Zampini   if (pcbddc->prec_type) {
9283425bc38SStefano Zampini     ierr = VecCopy(mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr);
9293425bc38SStefano Zampini   }
9303425bc38SStefano Zampini   /* apply BDDC */
9313425bc38SStefano Zampini   ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr);
9323425bc38SStefano Zampini   /* Application of B_delta and assembling of rhs for fetidp fluxes */
9333425bc38SStefano Zampini   ierr = VecSet(fetidp_flux_rhs,0.0);CHKERRQ(ierr);
9343425bc38SStefano Zampini   ierr = MatMult(mat_ctx->B_delta,pcis->vec1_B,mat_ctx->lambda_local);CHKERRQ(ierr);
9353425bc38SStefano Zampini   ierr = VecScatterBegin(mat_ctx->l2g_lambda,mat_ctx->lambda_local,fetidp_flux_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9363425bc38SStefano Zampini   ierr = VecScatterEnd  (mat_ctx->l2g_lambda,mat_ctx->lambda_local,fetidp_flux_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9373425bc38SStefano Zampini   /* restore original rhs */
9383425bc38SStefano Zampini   ierr = VecCopy(pcbddc->original_rhs,standard_rhs);CHKERRQ(ierr);
9393425bc38SStefano Zampini   PetscFunctionReturn(0);
9403425bc38SStefano Zampini }
9413425bc38SStefano Zampini EXTERN_C_END
9423425bc38SStefano Zampini #undef __FUNCT__
9433425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetRHS"
9443425bc38SStefano Zampini /*@
9453425bc38SStefano Zampini  PCBDDCMatFETIDPGetRHS - Get rhs for FETIDP linear system.
9463425bc38SStefano Zampini 
9473425bc38SStefano Zampini    Collective
9483425bc38SStefano Zampini 
9493425bc38SStefano Zampini    Input Parameters:
9503425bc38SStefano Zampini +  fetidp_mat   - the FETIDP mat obtained by a call to PCBDDCCreateFETIDPOperators
9513425bc38SStefano Zampini +  standard_rhs - the rhs of your linear system
9523425bc38SStefano Zampini 
9533425bc38SStefano Zampini    Output Parameters:
9543425bc38SStefano Zampini +  fetidp_flux_rhs   - the rhs of the FETIDP linear system
9553425bc38SStefano Zampini 
9563425bc38SStefano Zampini    Level: developer
9573425bc38SStefano Zampini 
9583425bc38SStefano Zampini    Notes:
9593425bc38SStefano Zampini 
9603425bc38SStefano Zampini .seealso: PCBDDC
9613425bc38SStefano Zampini @*/
9623425bc38SStefano Zampini PetscErrorCode PCBDDCMatFETIDPGetRHS(Mat fetidp_mat, Vec standard_rhs, Vec fetidp_flux_rhs)
9633425bc38SStefano Zampini {
9643425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
9653425bc38SStefano Zampini   PetscErrorCode ierr;
9663425bc38SStefano Zampini 
9673425bc38SStefano Zampini   PetscFunctionBegin;
9683425bc38SStefano Zampini   ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr);
9693425bc38SStefano Zampini   ierr = PetscTryMethod(mat_ctx->pc,"PCBDDCMatFETIDPGetRHS_C",(Mat,Vec,Vec),(fetidp_mat,standard_rhs,fetidp_flux_rhs));CHKERRQ(ierr);
9703425bc38SStefano Zampini   PetscFunctionReturn(0);
9713425bc38SStefano Zampini }
9723425bc38SStefano Zampini /* -------------------------------------------------------------------------- */
9733425bc38SStefano Zampini EXTERN_C_BEGIN
9743425bc38SStefano Zampini #undef __FUNCT__
9753425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetSolution_BDDC"
9763425bc38SStefano Zampini static PetscErrorCode PCBDDCMatFETIDPGetSolution_BDDC(Mat fetidp_mat, Vec fetidp_flux_sol, Vec standard_sol)
9773425bc38SStefano Zampini {
9783425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
9793425bc38SStefano Zampini   PC_IS*         pcis;
9803425bc38SStefano Zampini   PC_BDDC*       pcbddc;
9813425bc38SStefano Zampini   Mat_IS*        matis;
9823425bc38SStefano Zampini   PetscErrorCode ierr;
9833425bc38SStefano Zampini 
9843425bc38SStefano Zampini   PetscFunctionBegin;
9853425bc38SStefano Zampini   ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr);
9863425bc38SStefano Zampini   pcis = (PC_IS*)mat_ctx->pc->data;
9873425bc38SStefano Zampini   pcbddc = (PC_BDDC*)mat_ctx->pc->data;
9883425bc38SStefano Zampini   matis = (Mat_IS*)mat_ctx->pc->pmat->data;
9893425bc38SStefano Zampini 
9903425bc38SStefano Zampini   /* apply B_delta^T */
9913425bc38SStefano Zampini   ierr = VecScatterBegin(mat_ctx->l2g_lambda,fetidp_flux_sol,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
9923425bc38SStefano Zampini   ierr = VecScatterEnd  (mat_ctx->l2g_lambda,fetidp_flux_sol,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
9933425bc38SStefano Zampini   ierr = MatMultTranspose(mat_ctx->B_delta,mat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
9943425bc38SStefano Zampini   /* compute rhs for BDDC application */
9953425bc38SStefano Zampini   ierr = VecAYPX(pcis->vec1_B,-1.0,mat_ctx->temp_solution_B);CHKERRQ(ierr);
9963425bc38SStefano Zampini   if (pcbddc->prec_type) {
9973425bc38SStefano Zampini     ierr = VecCopy(mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr);
9983425bc38SStefano Zampini   }
9993425bc38SStefano Zampini   /* apply BDDC */
10003425bc38SStefano Zampini   ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr);
10013425bc38SStefano Zampini   /* put values into standard global vector */
10023425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
10033425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
10043425bc38SStefano Zampini   if (!pcbddc->prec_type) {
10053425bc38SStefano Zampini     /* compute values into the interior if solved for the partially subassembled Schur complement */
10063425bc38SStefano Zampini     ierr = MatMult(pcis->A_IB,pcis->vec1_B,pcis->vec1_D);CHKERRQ(ierr);
10073425bc38SStefano Zampini     ierr = VecAXPY(mat_ctx->temp_solution_D,-1.0,pcis->vec1_D);CHKERRQ(ierr);
10083425bc38SStefano Zampini     ierr = KSPSolve(pcbddc->ksp_D,mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr);
10093425bc38SStefano Zampini   }
10103425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->global_to_D,pcis->vec1_D,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
10113425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_D,pcis->vec1_D,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
10123425bc38SStefano Zampini   /* final change of basis if needed
10133425bc38SStefano Zampini      Is also sums the dirichlet part removed during RHS assembling */
10143425bc38SStefano Zampini   (*mat_ctx->pc->ops->postsolve)(mat_ctx->pc,PETSC_NULL,PETSC_NULL,standard_sol);
10153425bc38SStefano Zampini   PetscFunctionReturn(0);
10163425bc38SStefano Zampini 
10173425bc38SStefano Zampini }
10183425bc38SStefano Zampini EXTERN_C_END
10193425bc38SStefano Zampini #undef __FUNCT__
10203425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetSolution"
10213425bc38SStefano Zampini /*@
10223425bc38SStefano Zampini  PCBDDCMatFETIDPGetSolution - Get Solution for FETIDP linear system.
10233425bc38SStefano Zampini 
10243425bc38SStefano Zampini    Collective
10253425bc38SStefano Zampini 
10263425bc38SStefano Zampini    Input Parameters:
10273425bc38SStefano Zampini +  fetidp_mat        - the FETIDP mat obtained by a call to PCBDDCCreateFETIDPOperators
10283425bc38SStefano Zampini +  fetidp_flux_sol - the solution of the FETIDP linear system
10293425bc38SStefano Zampini 
10303425bc38SStefano Zampini    Output Parameters:
10313425bc38SStefano Zampini +  standard_sol      - the solution on the global domain
10323425bc38SStefano Zampini 
10333425bc38SStefano Zampini    Level: developer
10343425bc38SStefano Zampini 
10353425bc38SStefano Zampini    Notes:
10363425bc38SStefano Zampini 
10373425bc38SStefano Zampini .seealso: PCBDDC
10383425bc38SStefano Zampini @*/
10393425bc38SStefano Zampini PetscErrorCode PCBDDCMatFETIDPGetSolution(Mat fetidp_mat, Vec fetidp_flux_sol, Vec standard_sol)
10403425bc38SStefano Zampini {
10413425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
10423425bc38SStefano Zampini   PetscErrorCode ierr;
10433425bc38SStefano Zampini 
10443425bc38SStefano Zampini   PetscFunctionBegin;
10453425bc38SStefano Zampini   ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr);
10463425bc38SStefano Zampini   ierr = PetscTryMethod(mat_ctx->pc,"PCBDDCMatFETIDPGetSolution_C",(Mat,Vec,Vec),(fetidp_mat,fetidp_flux_sol,standard_sol));CHKERRQ(ierr);
10473425bc38SStefano Zampini   PetscFunctionReturn(0);
10483425bc38SStefano Zampini }
10493425bc38SStefano Zampini /* -------------------------------------------------------------------------- */
10503425bc38SStefano Zampini EXTERN_C_BEGIN
10513425bc38SStefano Zampini #undef __FUNCT__
10523425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPOperators_BDDC"
10533425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPOperators_BDDC(PC pc, Mat *fetidp_mat, PC *fetidp_pc)
10543425bc38SStefano Zampini {
10553425bc38SStefano Zampini   PETSC_EXTERN PetscErrorCode FETIDPMatMult(Mat,Vec,Vec);
10563425bc38SStefano Zampini   PETSC_EXTERN PetscErrorCode PCBDDCDestroyFETIDPMat(Mat);
10573425bc38SStefano Zampini   PETSC_EXTERN PetscErrorCode FETIDPPCApply(PC,Vec,Vec);
10583425bc38SStefano Zampini   PETSC_EXTERN PetscErrorCode PCBDDCDestroyFETIDPPC(PC);
10593425bc38SStefano Zampini 
10603425bc38SStefano Zampini   FETIDPMat_ctx  *fetidpmat_ctx;
10613425bc38SStefano Zampini   Mat            newmat;
10623425bc38SStefano Zampini   FETIDPPC_ctx  *fetidppc_ctx;
10633425bc38SStefano Zampini   PC             newpc;
10643425bc38SStefano Zampini   MPI_Comm       comm = ((PetscObject)pc)->comm;
10653425bc38SStefano Zampini   PetscErrorCode ierr;
10663425bc38SStefano Zampini 
10673425bc38SStefano Zampini   PetscFunctionBegin;
10683425bc38SStefano Zampini   /* FETIDP linear matrix */
10693425bc38SStefano Zampini   ierr = PCBDDCCreateFETIDPMatContext(pc, &fetidpmat_ctx);CHKERRQ(ierr);
10703425bc38SStefano Zampini   ierr = PCBDDCSetupFETIDPMatContext(fetidpmat_ctx);CHKERRQ(ierr);
10713425bc38SStefano Zampini   ierr = MatCreateShell(comm,PETSC_DECIDE,PETSC_DECIDE,fetidpmat_ctx->n_lambda,fetidpmat_ctx->n_lambda,fetidpmat_ctx,&newmat);CHKERRQ(ierr);
10723425bc38SStefano Zampini   ierr = MatShellSetOperation(newmat,MATOP_MULT,(void (*)(void))FETIDPMatMult);CHKERRQ(ierr);
10733425bc38SStefano Zampini   ierr = MatShellSetOperation(newmat,MATOP_DESTROY,(void (*)(void))PCBDDCDestroyFETIDPMat);CHKERRQ(ierr);
10743425bc38SStefano Zampini   ierr = MatSetUp(newmat);CHKERRQ(ierr);
10753425bc38SStefano Zampini   /* FETIDP preconditioner */
10763425bc38SStefano Zampini   ierr = PCBDDCCreateFETIDPPCContext(pc, &fetidppc_ctx);CHKERRQ(ierr);
10773425bc38SStefano Zampini   ierr = PCBDDCSetupFETIDPPCContext(newmat,fetidppc_ctx);CHKERRQ(ierr);
10783425bc38SStefano Zampini   ierr = PCCreate(comm,&newpc);CHKERRQ(ierr);
10793425bc38SStefano Zampini   ierr = PCSetType(newpc,PCSHELL);CHKERRQ(ierr);
10803425bc38SStefano Zampini   ierr = PCShellSetContext(newpc,fetidppc_ctx);CHKERRQ(ierr);
10813425bc38SStefano Zampini   ierr = PCShellSetApply(newpc,FETIDPPCApply);CHKERRQ(ierr);
10823425bc38SStefano Zampini   ierr = PCShellSetDestroy(newpc,PCBDDCDestroyFETIDPPC);CHKERRQ(ierr);
10833425bc38SStefano Zampini   ierr = PCSetOperators(newpc,newmat,newmat,SAME_PRECONDITIONER);CHKERRQ(ierr);
10843425bc38SStefano Zampini   ierr = PCSetUp(newpc);CHKERRQ(ierr);
10853425bc38SStefano Zampini   /* return pointers for objects created */
10863425bc38SStefano Zampini   *fetidp_mat=newmat;
10873425bc38SStefano Zampini   *fetidp_pc=newpc;
10883425bc38SStefano Zampini 
10893425bc38SStefano Zampini   PetscFunctionReturn(0);
10903425bc38SStefano Zampini }
10913425bc38SStefano Zampini EXTERN_C_END
10923425bc38SStefano Zampini #undef __FUNCT__
10933425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPOperators"
10943425bc38SStefano Zampini /*@
10953425bc38SStefano Zampini  PCBDDCCreateFETIDPOperators - Create operators for FETIDP.
10963425bc38SStefano Zampini 
10973425bc38SStefano Zampini    Collective
10983425bc38SStefano Zampini 
10993425bc38SStefano Zampini    Input Parameters:
11003425bc38SStefano Zampini +  pc - the BDDC preconditioning context (setup must be already called)
11013425bc38SStefano Zampini 
11023425bc38SStefano Zampini    Level: developer
11033425bc38SStefano Zampini 
11043425bc38SStefano Zampini    Notes:
11053425bc38SStefano Zampini 
11063425bc38SStefano Zampini .seealso: PCBDDC
11073425bc38SStefano Zampini @*/
11083425bc38SStefano Zampini PetscErrorCode PCBDDCCreateFETIDPOperators(PC pc, Mat *fetidp_mat, PC *fetidp_pc)
11093425bc38SStefano Zampini {
11103425bc38SStefano Zampini   PetscErrorCode ierr;
11113425bc38SStefano Zampini 
11123425bc38SStefano Zampini   PetscFunctionBegin;
11133425bc38SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
11143425bc38SStefano Zampini   if (pc->setupcalled) {
11153425bc38SStefano Zampini     ierr = PetscTryMethod(pc,"PCBDDCCreateFETIDPOperators_C",(PC,Mat*,PC*),(pc,fetidp_mat,fetidp_pc));CHKERRQ(ierr);
11163425bc38SStefano Zampini   } else {
11173425bc38SStefano Zampini     SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"You must call PCSetup_BDDC before calling %s\n",__FUNCT__);
11183425bc38SStefano Zampini   }
11193425bc38SStefano Zampini   PetscFunctionReturn(0);
11203425bc38SStefano Zampini }
11210c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
1122da1bb401SStefano Zampini /*MC
1123da1bb401SStefano Zampini    PCBDDC - Balancing Domain Decomposition by Constraints.
11240c7d97c5SJed Brown 
1125da1bb401SStefano Zampini    Options Database Keys:
1126da1bb401SStefano Zampini .    -pcbddc ??? -
1127da1bb401SStefano Zampini 
1128da1bb401SStefano Zampini    Level: intermediate
1129da1bb401SStefano Zampini 
1130da1bb401SStefano Zampini    Notes: The matrix used with this preconditioner must be of type MATIS
1131da1bb401SStefano Zampini 
1132da1bb401SStefano Zampini           Unlike more 'conventional' interface preconditioners, this iterates over ALL the
1133da1bb401SStefano Zampini           degrees of freedom, NOT just those on the interface (this allows the use of approximate solvers
1134da1bb401SStefano Zampini           on the subdomains).
1135da1bb401SStefano Zampini 
1136da1bb401SStefano Zampini           Options for the coarse grid preconditioner can be set with -
1137da1bb401SStefano Zampini           Options for the Dirichlet subproblem can be set with -
1138da1bb401SStefano Zampini           Options for the Neumann subproblem can be set with -
1139da1bb401SStefano Zampini 
1140da1bb401SStefano Zampini    Contributed by Stefano Zampini
1141da1bb401SStefano Zampini 
1142da1bb401SStefano Zampini .seealso:  PCCreate(), PCSetType(), PCType (for list of available types), PC,  MATIS
1143da1bb401SStefano Zampini M*/
1144da1bb401SStefano Zampini EXTERN_C_BEGIN
1145da1bb401SStefano Zampini #undef __FUNCT__
1146da1bb401SStefano Zampini #define __FUNCT__ "PCCreate_BDDC"
1147da1bb401SStefano Zampini PetscErrorCode PCCreate_BDDC(PC pc)
1148da1bb401SStefano Zampini {
1149da1bb401SStefano Zampini   PetscErrorCode ierr;
1150da1bb401SStefano Zampini   PC_BDDC        *pcbddc;
1151da1bb401SStefano Zampini   PCBDDCGraph    mat_graph;
1152da1bb401SStefano Zampini 
1153da1bb401SStefano Zampini   PetscFunctionBegin;
1154da1bb401SStefano Zampini   /* Creates the private data structure for this preconditioner and attach it to the PC object. */
1155da1bb401SStefano Zampini   ierr      = PetscNewLog(pc,PC_BDDC,&pcbddc);CHKERRQ(ierr);
1156da1bb401SStefano Zampini   pc->data  = (void*)pcbddc;
1157da1bb401SStefano Zampini 
1158da1bb401SStefano Zampini   /* create PCIS data structure */
1159da1bb401SStefano Zampini   ierr = PCISCreate(pc);CHKERRQ(ierr);
1160da1bb401SStefano Zampini 
1161da1bb401SStefano Zampini   /* BDDC specific */
11620bdf917eSStefano Zampini   pcbddc->CoarseNullSpace            = 0;
11630bdf917eSStefano Zampini   pcbddc->NullSpace                  = 0;
11643972b0daSStefano Zampini   pcbddc->temp_solution              = 0;
1165534831adSStefano Zampini   pcbddc->original_rhs               = 0;
1166534831adSStefano Zampini   pcbddc->local_mat                  = 0;
1167534831adSStefano Zampini   pcbddc->ChangeOfBasisMatrix        = 0;
1168534831adSStefano Zampini   pcbddc->usechangeofbasis           = PETSC_TRUE;
1169534831adSStefano Zampini   pcbddc->usechangeonfaces           = PETSC_FALSE;
1170da1bb401SStefano Zampini   pcbddc->coarse_vec                 = 0;
1171da1bb401SStefano Zampini   pcbddc->coarse_rhs                 = 0;
1172da1bb401SStefano Zampini   pcbddc->coarse_ksp                 = 0;
1173da1bb401SStefano Zampini   pcbddc->coarse_phi_B               = 0;
1174da1bb401SStefano Zampini   pcbddc->coarse_phi_D               = 0;
1175da1bb401SStefano Zampini   pcbddc->vec1_P                     = 0;
1176da1bb401SStefano Zampini   pcbddc->vec1_R                     = 0;
1177da1bb401SStefano Zampini   pcbddc->vec2_R                     = 0;
1178da1bb401SStefano Zampini   pcbddc->local_auxmat1              = 0;
1179da1bb401SStefano Zampini   pcbddc->local_auxmat2              = 0;
1180da1bb401SStefano Zampini   pcbddc->R_to_B                     = 0;
1181da1bb401SStefano Zampini   pcbddc->R_to_D                     = 0;
1182da1bb401SStefano Zampini   pcbddc->ksp_D                      = 0;
1183da1bb401SStefano Zampini   pcbddc->ksp_R                      = 0;
1184da1bb401SStefano Zampini   pcbddc->local_primal_indices       = 0;
1185da1bb401SStefano Zampini   pcbddc->prec_type                  = PETSC_FALSE;
1186da1bb401SStefano Zampini   pcbddc->NeumannBoundaries          = 0;
1187da1bb401SStefano Zampini   pcbddc->ISForDofs                  = 0;
1188da1bb401SStefano Zampini   pcbddc->ISForVertices              = 0;
1189da1bb401SStefano Zampini   pcbddc->n_ISForFaces               = 0;
1190da1bb401SStefano Zampini   pcbddc->n_ISForEdges               = 0;
1191da1bb401SStefano Zampini   pcbddc->ConstraintMatrix           = 0;
1192da1bb401SStefano Zampini   pcbddc->use_nnsp_true              = PETSC_FALSE;
1193da1bb401SStefano Zampini   pcbddc->local_primal_sizes         = 0;
1194da1bb401SStefano Zampini   pcbddc->local_primal_displacements = 0;
1195da1bb401SStefano Zampini   pcbddc->replicated_local_primal_indices = 0;
1196da1bb401SStefano Zampini   pcbddc->replicated_local_primal_values  = 0;
1197da1bb401SStefano Zampini   pcbddc->coarse_loc_to_glob         = 0;
1198da1bb401SStefano Zampini   pcbddc->dbg_flag                   = PETSC_FALSE;
1199da1bb401SStefano Zampini   pcbddc->coarsening_ratio           = 8;
1200b76ba322SStefano Zampini   pcbddc->use_exact_dirichlet        = PETSC_TRUE;
1201*4fad6a16SStefano Zampini   pcbddc->current_level              = 0;
1202*4fad6a16SStefano Zampini   pcbddc->max_levels                 = 1;
1203da1bb401SStefano Zampini 
1204da1bb401SStefano Zampini   /* allocate and initialize needed graph structure */
1205da1bb401SStefano Zampini   ierr = PetscMalloc(sizeof(*mat_graph),&pcbddc->mat_graph);CHKERRQ(ierr);
1206da1bb401SStefano Zampini   pcbddc->mat_graph->xadj            = 0;
1207da1bb401SStefano Zampini   pcbddc->mat_graph->adjncy          = 0;
1208da1bb401SStefano Zampini 
1209da1bb401SStefano Zampini   /* function pointers */
1210da1bb401SStefano Zampini   pc->ops->apply               = PCApply_BDDC;
1211da1bb401SStefano Zampini   pc->ops->applytranspose      = 0;
1212da1bb401SStefano Zampini   pc->ops->setup               = PCSetUp_BDDC;
1213da1bb401SStefano Zampini   pc->ops->destroy             = PCDestroy_BDDC;
1214da1bb401SStefano Zampini   pc->ops->setfromoptions      = PCSetFromOptions_BDDC;
1215da1bb401SStefano Zampini   pc->ops->view                = 0;
1216da1bb401SStefano Zampini   pc->ops->applyrichardson     = 0;
1217da1bb401SStefano Zampini   pc->ops->applysymmetricleft  = 0;
1218da1bb401SStefano Zampini   pc->ops->applysymmetricright = 0;
1219534831adSStefano Zampini   pc->ops->presolve            = PCPreSolve_BDDC;
1220534831adSStefano Zampini   pc->ops->postsolve           = PCPostSolve_BDDC;
1221da1bb401SStefano Zampini 
1222da1bb401SStefano Zampini   /* composing function */
1223*4fad6a16SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseningRatio_C","PCBDDCSetCoarseningRatio_BDDC",
1224*4fad6a16SStefano Zampini                     PCBDDCSetCoarseningRatio_BDDC);CHKERRQ(ierr);
1225*4fad6a16SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetMaxLevels_C","PCBDDCSetMaxLevels_BDDC",
1226*4fad6a16SStefano Zampini                     PCBDDCSetMaxLevels_BDDC);CHKERRQ(ierr);
12270bdf917eSStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNullSpace_C","PCBDDCSetNullSpace_BDDC",
12280bdf917eSStefano Zampini                     PCBDDCSetNullSpace_BDDC);CHKERRQ(ierr);
1229da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDirichletBoundaries_C","PCBDDCSetDirichletBoundaries_BDDC",
1230da1bb401SStefano Zampini                     PCBDDCSetDirichletBoundaries_BDDC);CHKERRQ(ierr);
1231da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNeumannBoundaries_C","PCBDDCSetNeumannBoundaries_BDDC",
1232da1bb401SStefano Zampini                     PCBDDCSetNeumannBoundaries_BDDC);CHKERRQ(ierr);
1233da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetDirichletBoundaries_C","PCBDDCGetDirichletBoundaries_BDDC",
1234da1bb401SStefano Zampini                     PCBDDCGetDirichletBoundaries_BDDC);CHKERRQ(ierr);
1235da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetNeumannBoundaries_C","PCBDDCGetNeumannBoundaries_BDDC",
1236da1bb401SStefano Zampini                     PCBDDCGetNeumannBoundaries_BDDC);CHKERRQ(ierr);
1237da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseProblemType_C","PCBDDCSetCoarseProblemType_BDDC",
1238da1bb401SStefano Zampini                     PCBDDCSetCoarseProblemType_BDDC);CHKERRQ(ierr);
1239da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDofsSplitting_C","PCBDDCSetDofsSplitting_BDDC",
1240da1bb401SStefano Zampini                     PCBDDCSetDofsSplitting_BDDC);CHKERRQ(ierr);
1241da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetLocalAdjacencyGraph_C","PCBDDCSetLocalAdjacencyGraph_BDDC",
1242da1bb401SStefano Zampini                     PCBDDCSetLocalAdjacencyGraph_BDDC);CHKERRQ(ierr);
1243534831adSStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPreSolve_C","PCPreSolve_BDDC",
1244534831adSStefano Zampini                     PCPreSolve_BDDC);CHKERRQ(ierr);
1245534831adSStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPostSolve_C","PCPostSolve_BDDC",
1246534831adSStefano Zampini                     PCPostSolve_BDDC);CHKERRQ(ierr);
12473425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCCreateFETIDPOperators_C","PCBDDCCreateFETIDPOperators_BDDC",
12483425bc38SStefano Zampini                     PCBDDCCreateFETIDPOperators_BDDC);CHKERRQ(ierr);
12493425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetRHS_C","PCBDDCMatFETIDPGetRHS_BDDC",
12503425bc38SStefano Zampini                     PCBDDCMatFETIDPGetRHS_BDDC);CHKERRQ(ierr);
12513425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetSolution_C","PCBDDCMatFETIDPGetSolution_BDDC",
12523425bc38SStefano Zampini                     PCBDDCMatFETIDPGetSolution_BDDC);CHKERRQ(ierr);
1253da1bb401SStefano Zampini   PetscFunctionReturn(0);
1254da1bb401SStefano Zampini }
1255da1bb401SStefano Zampini EXTERN_C_END
12563425bc38SStefano Zampini 
1257da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
1258da1bb401SStefano Zampini /* All static functions from now on                                           */
1259da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
1260*4fad6a16SStefano Zampini #undef __FUNCT__
1261*4fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetLevel"
1262*4fad6a16SStefano Zampini static PetscErrorCode PCBDDCSetLevel(PC pc,PetscInt level)
1263*4fad6a16SStefano Zampini {
1264*4fad6a16SStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
1265*4fad6a16SStefano Zampini 
1266*4fad6a16SStefano Zampini   PetscFunctionBegin;
1267*4fad6a16SStefano Zampini   pcbddc->current_level=level;
1268*4fad6a16SStefano Zampini   PetscFunctionReturn(0);
1269*4fad6a16SStefano Zampini }
12703425bc38SStefano Zampini 
12713425bc38SStefano Zampini #undef __FUNCT__
12720bdf917eSStefano Zampini #define __FUNCT__ "PCBDDCAdaptNullSpace"
12730bdf917eSStefano Zampini static PetscErrorCode PCBDDCAdaptNullSpace(PC pc)
12740bdf917eSStefano Zampini {
12750bdf917eSStefano Zampini   PC_IS*         pcis = (PC_IS*)  (pc->data);
12760bdf917eSStefano Zampini   PC_BDDC*       pcbddc = (PC_BDDC*)(pc->data);
12770bdf917eSStefano Zampini   KSP            inv_change;
12780bdf917eSStefano Zampini   PC             pc_change;
12790bdf917eSStefano Zampini   const Vec      *nsp_vecs;
12800bdf917eSStefano Zampini   Vec            *new_nsp_vecs;
12810bdf917eSStefano Zampini   PetscInt       i,nsp_size,new_nsp_size,start_new;
12820bdf917eSStefano Zampini   PetscBool      nsp_has_cnst;
12830bdf917eSStefano Zampini   MatNullSpace   new_nsp;
12840bdf917eSStefano Zampini   PetscErrorCode ierr;
12850bdf917eSStefano Zampini 
12860bdf917eSStefano Zampini   PetscFunctionBegin;
12870bdf917eSStefano Zampini   ierr = MatNullSpaceGetVecs(pcbddc->NullSpace,&nsp_has_cnst,&nsp_size,&nsp_vecs);CHKERRQ(ierr);
12880bdf917eSStefano Zampini   ierr = KSPCreate(PETSC_COMM_SELF,&inv_change);CHKERRQ(ierr);
12890bdf917eSStefano Zampini   ierr = KSPSetOperators(inv_change,pcbddc->ChangeOfBasisMatrix,pcbddc->ChangeOfBasisMatrix,SAME_PRECONDITIONER);CHKERRQ(ierr);
12900bdf917eSStefano Zampini   ierr = KSPSetType(inv_change,KSPPREONLY);CHKERRQ(ierr);
12910bdf917eSStefano Zampini   ierr = KSPGetPC(inv_change,&pc_change);CHKERRQ(ierr);
12920bdf917eSStefano Zampini   ierr = PCSetType(pc_change,PCLU);CHKERRQ(ierr);
12930bdf917eSStefano Zampini   ierr = KSPSetUp(inv_change);CHKERRQ(ierr);
12940bdf917eSStefano Zampini   new_nsp_size = nsp_size;
12950bdf917eSStefano Zampini   if (nsp_has_cnst) { new_nsp_size++; }
12960bdf917eSStefano Zampini   ierr = PetscMalloc(new_nsp_size*sizeof(Vec),&new_nsp_vecs);CHKERRQ(ierr);
12970bdf917eSStefano Zampini   for (i=0;i<new_nsp_size;i++) { ierr = VecDuplicate(pcis->vec1_global,&new_nsp_vecs[i]);CHKERRQ(ierr); }
12980bdf917eSStefano Zampini   start_new = 0;
12990bdf917eSStefano Zampini   if (nsp_has_cnst) {
13000bdf917eSStefano Zampini     start_new = 1;
13010bdf917eSStefano Zampini     ierr = VecSet(new_nsp_vecs[0],1.0);CHKERRQ(ierr);
13020bdf917eSStefano Zampini     ierr = VecSet(pcis->vec1_B,1.0);CHKERRQ(ierr);
13030bdf917eSStefano Zampini     ierr = KSPSolve(inv_change,pcis->vec1_B,pcis->vec1_B);
13040bdf917eSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,new_nsp_vecs[0],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
13050bdf917eSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,new_nsp_vecs[0],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
13060bdf917eSStefano Zampini   }
13070bdf917eSStefano Zampini   for (i=0;i<nsp_size;i++) {
13080bdf917eSStefano Zampini     ierr = VecCopy(nsp_vecs[i],new_nsp_vecs[i+start_new]);CHKERRQ(ierr);
13090bdf917eSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,nsp_vecs[i],pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
13100bdf917eSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,nsp_vecs[i],pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
13110bdf917eSStefano Zampini     ierr = KSPSolve(inv_change,pcis->vec1_B,pcis->vec1_B);
13120bdf917eSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,new_nsp_vecs[i+start_new],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
13130bdf917eSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,new_nsp_vecs[i+start_new],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
13140bdf917eSStefano Zampini   }
13150bdf917eSStefano Zampini   ierr = VecNormalize(new_nsp_vecs[0],PETSC_NULL);CHKERRQ(ierr);
13160bdf917eSStefano Zampini   /* TODO : Orthonormalize vecs when new_nsp_size > 0! */
13170bdf917eSStefano Zampini 
13180bdf917eSStefano Zampini   /*PetscBool nsp_t=PETSC_FALSE;
13190bdf917eSStefano Zampini   ierr = MatNullSpaceTest(pcbddc->NullSpace,pc->pmat,&nsp_t);CHKERRQ(ierr);
13200bdf917eSStefano Zampini   printf("Original Null Space test: %d\n",nsp_t);
13210bdf917eSStefano Zampini   Mat temp_mat;
13220bdf917eSStefano Zampini   Mat_IS* matis = (Mat_IS*)pc->pmat->data;
13230bdf917eSStefano Zampini     temp_mat = matis->A;
13240bdf917eSStefano Zampini     matis->A = pcbddc->local_mat;
13250bdf917eSStefano Zampini     pcbddc->local_mat = temp_mat;
13260bdf917eSStefano Zampini   ierr = MatNullSpaceTest(pcbddc->NullSpace,pc->pmat,&nsp_t);CHKERRQ(ierr);
13270bdf917eSStefano Zampini   printf("Original Null Space, mat changed test: %d\n",nsp_t);
13280bdf917eSStefano Zampini   {
13290bdf917eSStefano Zampini     PetscReal test_norm;
13300bdf917eSStefano Zampini     for (i=0;i<new_nsp_size;i++) {
13310bdf917eSStefano Zampini       ierr = MatMult(pc->pmat,new_nsp_vecs[i],pcis->vec1_global);CHKERRQ(ierr);
13320bdf917eSStefano Zampini       ierr = VecNorm(pcis->vec1_global,NORM_2,&test_norm);CHKERRQ(ierr);
13330bdf917eSStefano Zampini       if (test_norm > 1.e-12) {
13340bdf917eSStefano Zampini         printf("------------ERROR VEC %d------------------\n",i);
13350bdf917eSStefano Zampini         ierr = VecView(pcis->vec1_global,PETSC_VIEWER_STDOUT_WORLD);
13360bdf917eSStefano Zampini         printf("------------------------------------------\n");
13370bdf917eSStefano Zampini       }
13380bdf917eSStefano Zampini     }
13390bdf917eSStefano Zampini   }*/
13400bdf917eSStefano Zampini 
13410bdf917eSStefano Zampini   ierr = KSPDestroy(&inv_change);CHKERRQ(ierr);
13420bdf917eSStefano Zampini   ierr = MatNullSpaceCreate(((PetscObject)pc)->comm,PETSC_FALSE,new_nsp_size,new_nsp_vecs,&new_nsp);CHKERRQ(ierr);
13430bdf917eSStefano Zampini   ierr = PCBDDCSetNullSpace(pc,new_nsp);CHKERRQ(ierr);
13440bdf917eSStefano Zampini   ierr = MatNullSpaceDestroy(&new_nsp);CHKERRQ(ierr);
13450bdf917eSStefano Zampini   /*
13460bdf917eSStefano Zampini   ierr = MatNullSpaceTest(pcbddc->NullSpace,pc->pmat,&nsp_t);CHKERRQ(ierr);
13470bdf917eSStefano Zampini   printf("New Null Space, mat changed: %d\n",nsp_t);
13480bdf917eSStefano Zampini     temp_mat = matis->A;
13490bdf917eSStefano Zampini     matis->A = pcbddc->local_mat;
13500bdf917eSStefano Zampini     pcbddc->local_mat = temp_mat;
13510bdf917eSStefano Zampini   ierr = MatNullSpaceTest(pcbddc->NullSpace,pc->pmat,&nsp_t);CHKERRQ(ierr);
13520bdf917eSStefano Zampini   printf("New Null Space, mat original: %d\n",nsp_t);*/
13530bdf917eSStefano Zampini 
13540bdf917eSStefano Zampini   for (i=0;i<new_nsp_size;i++) { ierr = VecDestroy(&new_nsp_vecs[i]);CHKERRQ(ierr); }
13550bdf917eSStefano Zampini   ierr = PetscFree(new_nsp_vecs);CHKERRQ(ierr);
13560bdf917eSStefano Zampini   PetscFunctionReturn(0);
13570bdf917eSStefano Zampini }
13580bdf917eSStefano Zampini 
13590bdf917eSStefano Zampini #undef __FUNCT__
13603425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPMatContext"
13613425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPMatContext(PC pc, FETIDPMat_ctx **fetidpmat_ctx)
13623425bc38SStefano Zampini {
13633425bc38SStefano Zampini   FETIDPMat_ctx  *newctx;
13643425bc38SStefano Zampini   PetscErrorCode ierr;
13653425bc38SStefano Zampini 
13663425bc38SStefano Zampini   PetscFunctionBegin;
13673425bc38SStefano Zampini   ierr = PetscMalloc(sizeof(*newctx),&newctx);CHKERRQ(ierr);
13683425bc38SStefano Zampini   newctx->lambda_local    = 0;
13693425bc38SStefano Zampini   newctx->temp_solution_B = 0;
13703425bc38SStefano Zampini   newctx->temp_solution_D = 0;
13713425bc38SStefano Zampini   newctx->B_delta         = 0;
13723425bc38SStefano Zampini   newctx->B_Ddelta        = 0; /* theoretically belongs to the FETIDP preconditioner */
13733425bc38SStefano Zampini   newctx->l2g_lambda      = 0;
13743425bc38SStefano Zampini   /* increase the reference count for BDDC preconditioner */
13753425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)pc);CHKERRQ(ierr);
13763425bc38SStefano Zampini   newctx->pc              = pc;
13773425bc38SStefano Zampini   *fetidpmat_ctx          = newctx;
13783425bc38SStefano Zampini   PetscFunctionReturn(0);
13793425bc38SStefano Zampini }
13803425bc38SStefano Zampini 
13813425bc38SStefano Zampini #undef __FUNCT__
13823425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPPCContext"
13833425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPPCContext(PC pc, FETIDPPC_ctx **fetidppc_ctx)
13843425bc38SStefano Zampini {
13853425bc38SStefano Zampini   FETIDPPC_ctx  *newctx;
13863425bc38SStefano Zampini   PetscErrorCode ierr;
13873425bc38SStefano Zampini 
13883425bc38SStefano Zampini   PetscFunctionBegin;
13893425bc38SStefano Zampini   ierr = PetscMalloc(sizeof(*newctx),&newctx);CHKERRQ(ierr);
13903425bc38SStefano Zampini   newctx->lambda_local    = 0;
13913425bc38SStefano Zampini   newctx->B_Ddelta        = 0;
13923425bc38SStefano Zampini   newctx->l2g_lambda      = 0;
13933425bc38SStefano Zampini   /* increase the reference count for BDDC preconditioner */
13943425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)pc);CHKERRQ(ierr);
13953425bc38SStefano Zampini   newctx->pc              = pc;
13963425bc38SStefano Zampini   *fetidppc_ctx           = newctx;
13973425bc38SStefano Zampini   PetscFunctionReturn(0);
13983425bc38SStefano Zampini }
13993425bc38SStefano Zampini 
14003425bc38SStefano Zampini #undef __FUNCT__
14013425bc38SStefano Zampini #define __FUNCT__ "PCBDDCDestroyFETIDPMat"
14023425bc38SStefano Zampini static PetscErrorCode PCBDDCDestroyFETIDPMat(Mat A)
14033425bc38SStefano Zampini {
14043425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
14053425bc38SStefano Zampini   PetscErrorCode ierr;
14063425bc38SStefano Zampini 
14073425bc38SStefano Zampini   PetscFunctionBegin;
14083425bc38SStefano Zampini   ierr = MatShellGetContext(A,(void**)&mat_ctx);CHKERRQ(ierr);
14093425bc38SStefano Zampini   ierr = VecDestroy(&mat_ctx->lambda_local);CHKERRQ(ierr);
14103425bc38SStefano Zampini   ierr = VecDestroy(&mat_ctx->temp_solution_D);CHKERRQ(ierr);
14113425bc38SStefano Zampini   ierr = VecDestroy(&mat_ctx->temp_solution_B);CHKERRQ(ierr);
14123425bc38SStefano Zampini   ierr = MatDestroy(&mat_ctx->B_delta);CHKERRQ(ierr);
14133425bc38SStefano Zampini   ierr = MatDestroy(&mat_ctx->B_Ddelta);CHKERRQ(ierr);
14143425bc38SStefano Zampini   ierr = VecScatterDestroy(&mat_ctx->l2g_lambda);CHKERRQ(ierr);
14153425bc38SStefano Zampini   ierr = PCDestroy(&mat_ctx->pc);CHKERRQ(ierr); /* actually it does not destroy BDDC, only decrease its reference count */
14163425bc38SStefano Zampini   ierr = PetscFree(mat_ctx);CHKERRQ(ierr);
14173425bc38SStefano Zampini   PetscFunctionReturn(0);
14183425bc38SStefano Zampini }
14193425bc38SStefano Zampini 
14203425bc38SStefano Zampini #undef __FUNCT__
14213425bc38SStefano Zampini #define __FUNCT__ "PCBDDCDestroyFETIDPPC"
14223425bc38SStefano Zampini static PetscErrorCode PCBDDCDestroyFETIDPPC(PC pc)
14233425bc38SStefano Zampini {
14243425bc38SStefano Zampini   FETIDPPC_ctx  *pc_ctx;
14253425bc38SStefano Zampini   PetscErrorCode ierr;
14263425bc38SStefano Zampini 
14273425bc38SStefano Zampini   PetscFunctionBegin;
14283425bc38SStefano Zampini   ierr = PCShellGetContext(pc,(void**)&pc_ctx);CHKERRQ(ierr);
14293425bc38SStefano Zampini   ierr = VecDestroy(&pc_ctx->lambda_local);CHKERRQ(ierr);
14303425bc38SStefano Zampini   ierr = MatDestroy(&pc_ctx->B_Ddelta);CHKERRQ(ierr);
14313425bc38SStefano Zampini   ierr = VecScatterDestroy(&pc_ctx->l2g_lambda);CHKERRQ(ierr);
14323425bc38SStefano Zampini   ierr = PCDestroy(&pc_ctx->pc);CHKERRQ(ierr); /* actually it does not destroy BDDC, only decrease its reference count */
14333425bc38SStefano Zampini   ierr = PetscFree(pc_ctx);CHKERRQ(ierr);
14343425bc38SStefano Zampini   PetscFunctionReturn(0);
14353425bc38SStefano Zampini }
14363425bc38SStefano Zampini 
14373425bc38SStefano Zampini #undef __FUNCT__
14383425bc38SStefano Zampini #define __FUNCT__ "PCBDDCSetupFETIDPMatContext"
14393425bc38SStefano Zampini static PetscErrorCode PCBDDCSetupFETIDPMatContext(FETIDPMat_ctx *fetidpmat_ctx )
14403425bc38SStefano Zampini {
14413425bc38SStefano Zampini   PetscErrorCode ierr;
14423425bc38SStefano Zampini   PC_IS          *pcis=(PC_IS*)fetidpmat_ctx->pc->data;
14433425bc38SStefano Zampini   PC_BDDC        *pcbddc=(PC_BDDC*)fetidpmat_ctx->pc->data;
14443425bc38SStefano Zampini   PCBDDCGraph    mat_graph=pcbddc->mat_graph;
14453425bc38SStefano Zampini   Mat_IS         *matis  = (Mat_IS*)fetidpmat_ctx->pc->pmat->data;
14463425bc38SStefano Zampini   MPI_Comm       comm = ((PetscObject)(fetidpmat_ctx->pc))->comm;
14473425bc38SStefano Zampini 
14483425bc38SStefano Zampini   Mat            ScalingMat;
14493425bc38SStefano Zampini   Vec            lambda_global;
14503425bc38SStefano Zampini   IS             IS_l2g_lambda;
14513425bc38SStefano Zampini 
14523425bc38SStefano Zampini   PetscBool      skip_node,fully_redundant;
14533425bc38SStefano Zampini   PetscInt       i,j,k,s,n_boundary_dofs,sum_dof_sizes,n_global_lambda,n_vertices;
14543425bc38SStefano Zampini   PetscInt       n_local_lambda,n_lambda_for_dof,dual_size,n_neg_values,n_pos_values;
14553425bc38SStefano Zampini   PetscMPIInt    rank,nprocs,partial_sum;
14563425bc38SStefano Zampini   PetscScalar    scalar_value;
14573425bc38SStefano Zampini 
14583425bc38SStefano Zampini   PetscInt       *vertex_indices,*temp_indices;
14593425bc38SStefano Zampini   PetscInt       *dual_dofs_boundary_indices,*aux_local_numbering_1,*aux_global_numbering;
14603425bc38SStefano Zampini   PetscInt       *aux_sums,*cols_B_delta,*l2g_indices;
14613425bc38SStefano Zampini   PetscMPIInt    *aux_local_numbering_2,*aux_global_numbering_mpi,*dof_sizes,*dof_displs;
14623425bc38SStefano Zampini   PetscMPIInt    *all_aux_global_numbering_mpi_1,*all_aux_global_numbering_mpi_2,*global_dofs_numbering;
14633425bc38SStefano Zampini   PetscScalar    *array,*scaling_factors,*vals_B_delta;
14643425bc38SStefano Zampini 
14653425bc38SStefano Zampini   /* For communication of scaling factors */
14663425bc38SStefano Zampini   PetscInt       *ptrs_buffer,neigh_position;
14673425bc38SStefano Zampini   PetscScalar    **all_factors,*send_buffer,*recv_buffer;
14683425bc38SStefano Zampini   MPI_Request    *send_reqs,*recv_reqs;
14693425bc38SStefano Zampini 
14703425bc38SStefano Zampini   /* tests */
14713425bc38SStefano Zampini   Vec            test_vec;
14723425bc38SStefano Zampini   PetscBool      test_fetidp;
14733425bc38SStefano Zampini   PetscViewer    viewer;
14743425bc38SStefano Zampini 
14753425bc38SStefano Zampini   PetscFunctionBegin;
14763425bc38SStefano Zampini   ierr = MPI_Comm_rank(comm,&rank);CHKERRQ(ierr);
14773425bc38SStefano Zampini   ierr = MPI_Comm_size(comm,&nprocs);CHKERRQ(ierr);
14783425bc38SStefano Zampini 
14793425bc38SStefano Zampini   /* Default type of lagrange multipliers is non-redundant */
14803425bc38SStefano Zampini   fully_redundant = PETSC_FALSE;
14813425bc38SStefano Zampini   ierr = PetscOptionsGetBool(PETSC_NULL,"-fetidp_fullyredundant",&fully_redundant,PETSC_NULL);CHKERRQ(ierr);
14823425bc38SStefano Zampini 
14833425bc38SStefano Zampini   /* Evaluate local and global number of lagrange multipliers */
14843425bc38SStefano Zampini   ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
14853425bc38SStefano Zampini   n_local_lambda = 0;
14863425bc38SStefano Zampini   partial_sum = 0;
14873425bc38SStefano Zampini   n_boundary_dofs = 0;
14883425bc38SStefano Zampini   s = 0;
14893425bc38SStefano Zampini   n_vertices = 0;
14903425bc38SStefano Zampini   /* Get Vertices used to define the BDDC */
14913425bc38SStefano Zampini   ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(*vertex_indices),&vertex_indices);CHKERRQ(ierr);
14923425bc38SStefano Zampini   for (i=0;i<pcbddc->local_primal_size;i++) {
14933425bc38SStefano Zampini     ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&j,(const PetscInt**)&temp_indices,PETSC_NULL);CHKERRQ(ierr);
14943425bc38SStefano Zampini     if (j == 1) {
14953425bc38SStefano Zampini       vertex_indices[n_vertices]=temp_indices[0];
14963425bc38SStefano Zampini       n_vertices++;
14973425bc38SStefano Zampini     }
14983425bc38SStefano Zampini     ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&j,(const PetscInt**)&temp_indices,PETSC_NULL);CHKERRQ(ierr);
14993425bc38SStefano Zampini   }
15003425bc38SStefano Zampini   dual_size = pcis->n_B-n_vertices;
15013425bc38SStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*dual_dofs_boundary_indices),&dual_dofs_boundary_indices);CHKERRQ(ierr);
15023425bc38SStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*aux_local_numbering_1),&aux_local_numbering_1);CHKERRQ(ierr);
15033425bc38SStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*aux_local_numbering_2),&aux_local_numbering_2);CHKERRQ(ierr);
15043425bc38SStefano Zampini 
15053425bc38SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
15063425bc38SStefano Zampini   for (i=0;i<pcis->n;i++){
15073425bc38SStefano Zampini     j = mat_graph->count[i]; /* RECALL: mat_graph->count[i] does not count myself */
1508c6582918SStefano Zampini     k = 0;
1509c6582918SStefano Zampini     if (j > 0) {
15103425bc38SStefano Zampini       k = (mat_graph->neighbours_set[i][0] == -1 ?  1 : 0);
1511c6582918SStefano Zampini     }
15123425bc38SStefano Zampini     j = j - k ;
15133425bc38SStefano Zampini     if ( j > 0 ) { n_boundary_dofs++; }
15143425bc38SStefano Zampini 
15153425bc38SStefano Zampini     skip_node = PETSC_FALSE;
1516c6582918SStefano Zampini     if ( s < n_vertices && vertex_indices[s]==i) { /* it works for a sorted set of vertices */
15173425bc38SStefano Zampini       skip_node = PETSC_TRUE;
15183425bc38SStefano Zampini       s++;
15193425bc38SStefano Zampini     }
15203425bc38SStefano Zampini     if (j < 1) {skip_node = PETSC_TRUE;}
15213425bc38SStefano Zampini     if ( !skip_node ) {
15223425bc38SStefano Zampini       if (fully_redundant) {
15233425bc38SStefano Zampini         /* fully redundant set of lagrange multipliers */
15243425bc38SStefano Zampini         n_lambda_for_dof = (j*(j+1))/2;
15253425bc38SStefano Zampini       } else {
15263425bc38SStefano Zampini         n_lambda_for_dof = j;
15273425bc38SStefano Zampini       }
15283425bc38SStefano Zampini       n_local_lambda += j;
15293425bc38SStefano Zampini       /* needed to evaluate global number of lagrange multipliers */
15303425bc38SStefano Zampini       array[i]=(1.0*n_lambda_for_dof)/(j+1.0); /* already scaled for the next global sum */
15313425bc38SStefano Zampini       /* store some data needed */
15323425bc38SStefano Zampini       dual_dofs_boundary_indices[partial_sum] = n_boundary_dofs-1;
15333425bc38SStefano Zampini       aux_local_numbering_1[partial_sum] = i;
15343425bc38SStefano Zampini       aux_local_numbering_2[partial_sum] = (PetscMPIInt)n_lambda_for_dof;
15353425bc38SStefano Zampini       partial_sum++;
15363425bc38SStefano Zampini     }
15373425bc38SStefano Zampini   }
15383425bc38SStefano Zampini   /*printf("I found %d local lambda dofs\n",n_local_lambda);
15393425bc38SStefano Zampini   printf("I found %d boundary dofs (should be %d)\n",n_boundary_dofs,pcis->n_B);
15403425bc38SStefano Zampini   printf("Partial sum %d should be %d\n",partial_sum,dual_size);*/
15413425bc38SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
15423425bc38SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
15433425bc38SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
15443425bc38SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
15453425bc38SStefano Zampini   ierr = VecSum(pcis->vec1_global,&scalar_value);CHKERRQ(ierr);
15463425bc38SStefano Zampini   fetidpmat_ctx->n_lambda = (PetscInt) scalar_value;
15473425bc38SStefano Zampini   /* printf("I found %d global multipliers (%f)\n",fetidpmat_ctx->n_lambda,scalar_value); */
15483425bc38SStefano Zampini   ierr = VecCreate(PETSC_COMM_SELF,&fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
15493425bc38SStefano Zampini   ierr = VecSetSizes(fetidpmat_ctx->lambda_local,n_local_lambda,n_local_lambda);CHKERRQ(ierr);
15503425bc38SStefano Zampini   ierr = VecSetType(fetidpmat_ctx->lambda_local,VECSEQ);CHKERRQ(ierr);
15513425bc38SStefano Zampini   ierr = VecCreate(comm,&lambda_global);CHKERRQ(ierr);
15523425bc38SStefano Zampini   ierr = VecSetSizes(lambda_global,PETSC_DECIDE,fetidpmat_ctx->n_lambda);CHKERRQ(ierr);
15533425bc38SStefano Zampini   ierr = VecSetType(lambda_global,VECMPI);CHKERRQ(ierr);
15543425bc38SStefano Zampini 
15553425bc38SStefano Zampini   /* compute global ordering of lagrange multipliers and associate l2g map */
15563425bc38SStefano Zampini 
15573425bc38SStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*aux_global_numbering),&aux_global_numbering);CHKERRQ(ierr);
15583425bc38SStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*aux_global_numbering_mpi),&aux_global_numbering_mpi);CHKERRQ(ierr);
15593425bc38SStefano Zampini   j = (rank == 0 ? nprocs : 0);
15603425bc38SStefano Zampini   ierr = PetscMalloc(j*sizeof(*dof_sizes),&dof_sizes);CHKERRQ(ierr);
15613425bc38SStefano Zampini   ierr = PetscMalloc(j*sizeof(*dof_displs),&dof_displs);CHKERRQ(ierr);
15623425bc38SStefano Zampini   ierr = ISLocalToGlobalMappingApply(matis->mapping,dual_size,aux_local_numbering_1,aux_global_numbering);CHKERRQ(ierr);
15633425bc38SStefano Zampini   ierr = MPI_Gather(&dual_size,1,MPIU_INT,dof_sizes,1,MPIU_INT,0,comm);CHKERRQ(ierr);
15643425bc38SStefano Zampini   sum_dof_sizes=0;
15653425bc38SStefano Zampini   if ( rank == 0 ) {
15663425bc38SStefano Zampini     dof_displs[0]=0;
15673425bc38SStefano Zampini     sum_dof_sizes=dual_size;
15683425bc38SStefano Zampini     for (i=1;i<nprocs;i++) {
15693425bc38SStefano Zampini       dof_displs[i] = dof_displs[i-1]+dof_sizes[i-1];
15703425bc38SStefano Zampini       sum_dof_sizes += dof_sizes[i];
15713425bc38SStefano Zampini     }
15723425bc38SStefano Zampini   }
15733425bc38SStefano Zampini   for (i=0;i<dual_size;i++) {
15743425bc38SStefano Zampini     aux_global_numbering_mpi[i]=(PetscMPIInt)aux_global_numbering[i];
15753425bc38SStefano Zampini   }
15763425bc38SStefano Zampini   ierr = PetscMalloc(sum_dof_sizes*sizeof(*all_aux_global_numbering_mpi_1),&all_aux_global_numbering_mpi_1);CHKERRQ(ierr);
15773425bc38SStefano Zampini   ierr = PetscMalloc(sum_dof_sizes*sizeof(*all_aux_global_numbering_mpi_2),&all_aux_global_numbering_mpi_2);CHKERRQ(ierr);
15783425bc38SStefano Zampini   ierr = MPI_Gatherv(aux_global_numbering_mpi,dual_size,MPIU_INT,all_aux_global_numbering_mpi_1,dof_sizes,dof_displs,MPIU_INT,0,comm);CHKERRQ(ierr);
15793425bc38SStefano Zampini   ierr = MPI_Gatherv(aux_local_numbering_2,dual_size,MPIU_INT,all_aux_global_numbering_mpi_2,dof_sizes,dof_displs,MPIU_INT,0,comm);CHKERRQ(ierr);
15803425bc38SStefano Zampini 
15813425bc38SStefano Zampini   ierr = PetscMalloc(fetidpmat_ctx->n_lambda*sizeof(*global_dofs_numbering),&global_dofs_numbering);CHKERRQ(ierr);
15823425bc38SStefano Zampini   if ( rank == 0 ) {
15833425bc38SStefano Zampini     ierr = PetscSortMPIIntWithArray(sum_dof_sizes,all_aux_global_numbering_mpi_1,all_aux_global_numbering_mpi_2);CHKERRQ(ierr);
15843425bc38SStefano Zampini     j=-1;
15853425bc38SStefano Zampini     partial_sum = 0;
15863425bc38SStefano Zampini     for (i=0;i<sum_dof_sizes;i++) {
15873425bc38SStefano Zampini       if (j != all_aux_global_numbering_mpi_1[i] ) {
15883425bc38SStefano Zampini         j=all_aux_global_numbering_mpi_1[i];
15893425bc38SStefano Zampini         for (k=0;k<all_aux_global_numbering_mpi_2[i];k++) {
15903425bc38SStefano Zampini           global_dofs_numbering[partial_sum+k]=all_aux_global_numbering_mpi_1[i];
15913425bc38SStefano Zampini         }
15923425bc38SStefano Zampini         partial_sum += all_aux_global_numbering_mpi_2[i];
15933425bc38SStefano Zampini       }
15943425bc38SStefano Zampini     }
15953425bc38SStefano Zampini     /* printf("Partial sum for global dofs %d should be %d\n",partial_sum,fetidpmat_ctx->n_lambda); */
15963425bc38SStefano Zampini   }
15973425bc38SStefano Zampini   ierr = MPI_Bcast(global_dofs_numbering,fetidpmat_ctx->n_lambda,MPIU_INT,0,comm);CHKERRQ(ierr);
15983425bc38SStefano Zampini 
15993425bc38SStefano Zampini   /* init data for scaling factors exchange */
16003425bc38SStefano Zampini   partial_sum = 0;
16013425bc38SStefano Zampini   j = 0;
16023425bc38SStefano Zampini   ierr = PetscMalloc( pcis->n_neigh*sizeof(PetscInt),&ptrs_buffer);CHKERRQ(ierr);
16033425bc38SStefano Zampini   ierr = PetscMalloc( (pcis->n_neigh-1)*sizeof(MPI_Request),&send_reqs);CHKERRQ(ierr);
16043425bc38SStefano Zampini   ierr = PetscMalloc( (pcis->n_neigh-1)*sizeof(MPI_Request),&recv_reqs);CHKERRQ(ierr);
16053425bc38SStefano Zampini   ierr = PetscMalloc( pcis->n*sizeof(PetscScalar*),&all_factors);CHKERRQ(ierr);
16063425bc38SStefano Zampini   ptrs_buffer[0]=0;
16073425bc38SStefano Zampini   for (i=1;i<pcis->n_neigh;i++) {
16083425bc38SStefano Zampini     partial_sum += pcis->n_shared[i];
16093425bc38SStefano Zampini     ptrs_buffer[i] = ptrs_buffer[i-1]+pcis->n_shared[i];
16103425bc38SStefano Zampini   }
16113425bc38SStefano Zampini   ierr = PetscMalloc( partial_sum*sizeof(PetscScalar),&send_buffer);CHKERRQ(ierr);
16123425bc38SStefano Zampini   ierr = PetscMalloc( partial_sum*sizeof(PetscScalar),&recv_buffer);CHKERRQ(ierr);
16133425bc38SStefano Zampini   ierr = PetscMalloc( partial_sum*sizeof(PetscScalar),&all_factors[0]);CHKERRQ(ierr);
16143425bc38SStefano Zampini   for (i=0;i<pcis->n-1;i++) {
16153425bc38SStefano Zampini     j = mat_graph->count[i];
16163425bc38SStefano Zampini     if (j>0) {
16173425bc38SStefano Zampini       k = (mat_graph->neighbours_set[i][0] == -1 ?  1 : 0);
16183425bc38SStefano Zampini       j = j - k;
16193425bc38SStefano Zampini     }
16203425bc38SStefano Zampini     all_factors[i+1]=all_factors[i]+j;
16213425bc38SStefano Zampini   }
16223425bc38SStefano Zampini   /* scatter B scaling to N vec */
16233425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->N_to_B,pcis->D,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
16243425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->N_to_B,pcis->D,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
16253425bc38SStefano Zampini   /* communications */
16263425bc38SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
16273425bc38SStefano Zampini   for (i=1;i<pcis->n_neigh;i++) {
16283425bc38SStefano Zampini     for (j=0;j<pcis->n_shared[i];j++) {
16293425bc38SStefano Zampini       send_buffer[ptrs_buffer[i-1]+j]=array[pcis->shared[i][j]];
16303425bc38SStefano Zampini     }
16313425bc38SStefano Zampini     j = ptrs_buffer[i]-ptrs_buffer[i-1];
1632ea7e1babSStefano Zampini     ierr = MPI_Isend(&send_buffer[ptrs_buffer[i-1]],j,MPIU_SCALAR,pcis->neigh[i],0,comm,&send_reqs[i-1]);CHKERRQ(ierr);
1633ea7e1babSStefano Zampini     ierr = MPI_Irecv(&recv_buffer[ptrs_buffer[i-1]],j,MPIU_SCALAR,pcis->neigh[i],0,comm,&recv_reqs[i-1]);CHKERRQ(ierr);
16343425bc38SStefano Zampini   }
16353425bc38SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1636ea7e1babSStefano Zampini   ierr = MPI_Waitall((pcis->n_neigh-1),recv_reqs,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
16373425bc38SStefano Zampini   /* put values in correct places */
16383425bc38SStefano Zampini   for (i=1;i<pcis->n_neigh;i++) {
16393425bc38SStefano Zampini     for (j=0;j<pcis->n_shared[i];j++) {
16403425bc38SStefano Zampini       k = pcis->shared[i][j];
16413425bc38SStefano Zampini       neigh_position = 0;
16423425bc38SStefano Zampini       while(mat_graph->neighbours_set[k][neigh_position] != pcis->neigh[i]) {neigh_position++;}
16433425bc38SStefano Zampini       s = (mat_graph->neighbours_set[k][0] == -1 ?  1 : 0);
16443425bc38SStefano Zampini       neigh_position = neigh_position - s;
16453425bc38SStefano Zampini       all_factors[k][neigh_position]=recv_buffer[ptrs_buffer[i-1]+j];
16463425bc38SStefano Zampini     }
16473425bc38SStefano Zampini   }
1648ea7e1babSStefano Zampini   ierr = MPI_Waitall((pcis->n_neigh-1),send_reqs,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
16493425bc38SStefano Zampini   ierr = PetscFree(send_reqs);CHKERRQ(ierr);
16503425bc38SStefano Zampini   ierr = PetscFree(recv_reqs);CHKERRQ(ierr);
16513425bc38SStefano Zampini   ierr = PetscFree(send_buffer);CHKERRQ(ierr);
16523425bc38SStefano Zampini   ierr = PetscFree(recv_buffer);CHKERRQ(ierr);
16533425bc38SStefano Zampini   ierr = PetscFree(ptrs_buffer);CHKERRQ(ierr);
16543425bc38SStefano Zampini 
16553425bc38SStefano Zampini   /* Compute B and B_delta (local actions) */
16563425bc38SStefano Zampini   ierr = PetscMalloc(pcis->n_neigh*sizeof(*aux_sums),&aux_sums);CHKERRQ(ierr);
16573425bc38SStefano Zampini   ierr = PetscMalloc(n_local_lambda*sizeof(*l2g_indices),&l2g_indices);CHKERRQ(ierr);
16583425bc38SStefano Zampini   ierr = PetscMalloc(n_local_lambda*sizeof(*vals_B_delta),&vals_B_delta);CHKERRQ(ierr);
16593425bc38SStefano Zampini   ierr = PetscMalloc(n_local_lambda*sizeof(*cols_B_delta),&cols_B_delta);CHKERRQ(ierr);
16603425bc38SStefano Zampini   ierr = PetscMalloc(n_local_lambda*sizeof(*scaling_factors),&scaling_factors);CHKERRQ(ierr);
16613425bc38SStefano Zampini   n_global_lambda=0;
16623425bc38SStefano Zampini   partial_sum=0;
16633425bc38SStefano Zampini   for (i=0;i<dual_size;i++) {
16643425bc38SStefano Zampini     while( global_dofs_numbering[n_global_lambda] != aux_global_numbering_mpi[i] ) { n_global_lambda++; }
16653425bc38SStefano Zampini     j = mat_graph->count[aux_local_numbering_1[i]];
16663425bc38SStefano Zampini     k = (mat_graph->neighbours_set[aux_local_numbering_1[i]][0] == -1 ?  1 : 0);
16673425bc38SStefano Zampini     j = j - k;
16683425bc38SStefano Zampini     aux_sums[0]=0;
16693425bc38SStefano Zampini     for (s=1;s<j;s++) {
16703425bc38SStefano Zampini       aux_sums[s]=aux_sums[s-1]+j-s+1;
16713425bc38SStefano Zampini     }
16723425bc38SStefano Zampini     array = all_factors[aux_local_numbering_1[i]];
16733425bc38SStefano Zampini     n_neg_values = 0;
16743425bc38SStefano Zampini     while(n_neg_values < j && mat_graph->neighbours_set[aux_local_numbering_1[i]][n_neg_values+k] < rank) {n_neg_values++;}
16753425bc38SStefano Zampini     n_pos_values = j - n_neg_values;
16763425bc38SStefano Zampini     if (fully_redundant) {
16773425bc38SStefano Zampini       for (s=0;s<n_neg_values;s++) {
16783425bc38SStefano Zampini         l2g_indices    [partial_sum+s]=aux_sums[s]+n_neg_values-s-1+n_global_lambda;
16793425bc38SStefano Zampini         cols_B_delta   [partial_sum+s]=dual_dofs_boundary_indices[i];
16803425bc38SStefano Zampini         vals_B_delta   [partial_sum+s]=-1.0;
16813425bc38SStefano Zampini         scaling_factors[partial_sum+s]=array[s];
16823425bc38SStefano Zampini       }
16833425bc38SStefano Zampini       for (s=0;s<n_pos_values;s++) {
16843425bc38SStefano Zampini         l2g_indices    [partial_sum+s+n_neg_values]=aux_sums[n_neg_values]+s+n_global_lambda;
16853425bc38SStefano Zampini         cols_B_delta   [partial_sum+s+n_neg_values]=dual_dofs_boundary_indices[i];
16863425bc38SStefano Zampini         vals_B_delta   [partial_sum+s+n_neg_values]=1.0;
16873425bc38SStefano Zampini         scaling_factors[partial_sum+s+n_neg_values]=array[s+n_neg_values];
16883425bc38SStefano Zampini       }
16893425bc38SStefano Zampini       partial_sum += j;
16903425bc38SStefano Zampini     } else {
16913425bc38SStefano Zampini       /* l2g_indices and default cols and vals of B_delta */
16923425bc38SStefano Zampini       for (s=0;s<j;s++) {
16933425bc38SStefano Zampini         l2g_indices    [partial_sum+s]=n_global_lambda+s;
16943425bc38SStefano Zampini         cols_B_delta   [partial_sum+s]=dual_dofs_boundary_indices[i];
16953425bc38SStefano Zampini         vals_B_delta   [partial_sum+s]=0.0;
16963425bc38SStefano Zampini       }
16973425bc38SStefano Zampini       /* B_delta */
16983425bc38SStefano Zampini       if ( n_neg_values > 0 ) { /* there's a rank next to me to the left */
16993425bc38SStefano Zampini         vals_B_delta   [partial_sum+n_neg_values-1]=-1.0;
17003425bc38SStefano Zampini       }
17013425bc38SStefano Zampini       if ( n_neg_values < j ) { /* there's a rank next to me to the right */
17023425bc38SStefano Zampini         vals_B_delta   [partial_sum+n_neg_values]=1.0;
17033425bc38SStefano Zampini       }
17043425bc38SStefano Zampini       /* scaling as in Klawonn-Widlund 1999*/
17053425bc38SStefano Zampini       for (s=0;s<n_neg_values;s++) {
17063425bc38SStefano Zampini         scalar_value = 0.0;
17073425bc38SStefano Zampini         for (k=0;k<s+1;k++) {
17083425bc38SStefano Zampini           scalar_value += array[k];
17093425bc38SStefano Zampini         }
17103425bc38SStefano Zampini         scalar_value = -scalar_value;
17113425bc38SStefano Zampini         scaling_factors[partial_sum+s] = scalar_value;
17123425bc38SStefano Zampini       }
17133425bc38SStefano Zampini       for (s=0;s<n_pos_values;s++) {
17143425bc38SStefano Zampini         scalar_value = 0.0;
17153425bc38SStefano Zampini         for (k=s+n_neg_values;k<j;k++) {
17163425bc38SStefano Zampini           scalar_value += array[k];
17173425bc38SStefano Zampini         }
17183425bc38SStefano Zampini         scaling_factors[partial_sum+s+n_neg_values] = scalar_value;
17193425bc38SStefano Zampini       }
17203425bc38SStefano Zampini       partial_sum += j;
17213425bc38SStefano Zampini     }
17223425bc38SStefano Zampini   }
17233425bc38SStefano Zampini   ierr = PetscFree(all_factors[0]);CHKERRQ(ierr);
17243425bc38SStefano Zampini   ierr = PetscFree(all_factors);CHKERRQ(ierr);
17253425bc38SStefano Zampini   /* printf("I found %d local lambda dofs when numbering them (should be %d)\n",partial_sum,n_local_lambda); */
17263425bc38SStefano Zampini   ierr = ISCreateGeneral(comm,n_local_lambda,l2g_indices,PETSC_OWN_POINTER,&IS_l2g_lambda);CHKERRQ(ierr);
17273425bc38SStefano Zampini   ierr = VecScatterCreate(fetidpmat_ctx->lambda_local,(IS)0,lambda_global,IS_l2g_lambda,&fetidpmat_ctx->l2g_lambda);CHKERRQ(ierr);
17283425bc38SStefano Zampini 
17293425bc38SStefano Zampini   /* Create local part of B_delta */
17303425bc38SStefano Zampini   ierr = MatCreate(PETSC_COMM_SELF,&fetidpmat_ctx->B_delta);
17313425bc38SStefano Zampini   ierr = MatSetSizes(fetidpmat_ctx->B_delta,n_local_lambda,pcis->n_B,n_local_lambda,pcis->n_B);CHKERRQ(ierr);
17323425bc38SStefano Zampini   ierr = MatSetType(fetidpmat_ctx->B_delta,MATSEQAIJ);CHKERRQ(ierr);
17333425bc38SStefano Zampini   ierr = MatSeqAIJSetPreallocation(fetidpmat_ctx->B_delta,1,PETSC_NULL);CHKERRQ(ierr);
17343425bc38SStefano Zampini   ierr = MatSetOption(fetidpmat_ctx->B_delta,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr);
17353425bc38SStefano Zampini   for (i=0;i<n_local_lambda;i++) {
17363425bc38SStefano Zampini     ierr = MatSetValue(fetidpmat_ctx->B_delta,i,cols_B_delta[i],vals_B_delta[i],INSERT_VALUES);CHKERRQ(ierr);
17373425bc38SStefano Zampini   }
17383425bc38SStefano Zampini   ierr = MatAssemblyBegin(fetidpmat_ctx->B_delta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
17393425bc38SStefano Zampini   ierr = MatAssemblyEnd  (fetidpmat_ctx->B_delta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
17403425bc38SStefano Zampini 
17413425bc38SStefano Zampini   if (fully_redundant) {
17423425bc38SStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&ScalingMat);
17433425bc38SStefano Zampini     ierr = MatSetSizes(ScalingMat,n_local_lambda,n_local_lambda,n_local_lambda,n_local_lambda);CHKERRQ(ierr);
17443425bc38SStefano Zampini     ierr = MatSetType(ScalingMat,MATSEQAIJ);CHKERRQ(ierr);
17453425bc38SStefano Zampini     ierr = MatSeqAIJSetPreallocation(ScalingMat,1,PETSC_NULL);CHKERRQ(ierr);
17463425bc38SStefano Zampini     for (i=0;i<n_local_lambda;i++) {
17473425bc38SStefano Zampini       ierr = MatSetValue(ScalingMat,i,i,scaling_factors[i],INSERT_VALUES);CHKERRQ(ierr);
17483425bc38SStefano Zampini     }
17493425bc38SStefano Zampini     ierr = MatAssemblyBegin(ScalingMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
17503425bc38SStefano Zampini     ierr = MatAssemblyEnd  (ScalingMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
17513425bc38SStefano Zampini     ierr = MatMatMult(ScalingMat,fetidpmat_ctx->B_delta,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&fetidpmat_ctx->B_Ddelta);CHKERRQ(ierr);
17523425bc38SStefano Zampini     ierr = MatDestroy(&ScalingMat);CHKERRQ(ierr);
17533425bc38SStefano Zampini   } else {
17543425bc38SStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&fetidpmat_ctx->B_Ddelta);
17553425bc38SStefano Zampini     ierr = MatSetSizes(fetidpmat_ctx->B_Ddelta,n_local_lambda,pcis->n_B,n_local_lambda,pcis->n_B);CHKERRQ(ierr);
17563425bc38SStefano Zampini     ierr = MatSetType(fetidpmat_ctx->B_Ddelta,MATSEQAIJ);CHKERRQ(ierr);
17573425bc38SStefano Zampini     ierr = MatSeqAIJSetPreallocation(fetidpmat_ctx->B_Ddelta,1,PETSC_NULL);CHKERRQ(ierr);
17583425bc38SStefano Zampini     for (i=0;i<n_local_lambda;i++) {
17593425bc38SStefano Zampini       ierr = MatSetValue(fetidpmat_ctx->B_Ddelta,i,cols_B_delta[i],scaling_factors[i],INSERT_VALUES);CHKERRQ(ierr);
17603425bc38SStefano Zampini     }
17613425bc38SStefano Zampini     ierr = MatAssemblyBegin(fetidpmat_ctx->B_Ddelta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
17623425bc38SStefano Zampini     ierr = MatAssemblyEnd  (fetidpmat_ctx->B_Ddelta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
17633425bc38SStefano Zampini   }
17643425bc38SStefano Zampini 
17653425bc38SStefano Zampini   /* Create some vectors needed by fetidp */
17663425bc38SStefano Zampini   ierr = VecDuplicate(pcis->vec1_B,&fetidpmat_ctx->temp_solution_B);CHKERRQ(ierr);
17673425bc38SStefano Zampini   ierr = VecDuplicate(pcis->vec1_D,&fetidpmat_ctx->temp_solution_D);CHKERRQ(ierr);
17683425bc38SStefano Zampini 
17693425bc38SStefano Zampini   test_fetidp = PETSC_FALSE;
17703425bc38SStefano Zampini   ierr = PetscOptionsGetBool(PETSC_NULL,"-fetidp_check",&test_fetidp,PETSC_NULL);CHKERRQ(ierr);
17713425bc38SStefano Zampini 
17723425bc38SStefano Zampini   if (test_fetidp) {
17733425bc38SStefano Zampini 
17743425bc38SStefano Zampini     ierr = PetscViewerASCIIGetStdout(((PetscObject)(fetidpmat_ctx->pc))->comm,&viewer);CHKERRQ(ierr);
17753425bc38SStefano Zampini     ierr = PetscViewerASCIISynchronizedAllow(viewer,PETSC_TRUE);CHKERRQ(ierr);
17763425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"----------FETI_DP TESTS--------------\n");CHKERRQ(ierr);
17773425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"All tests should return zero!\n");CHKERRQ(ierr);
17783425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"FETIDP MAT context in the ");CHKERRQ(ierr);
17793425bc38SStefano Zampini     if (fully_redundant) {
17803425bc38SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"fully redundant case for lagrange multipliers.\n");CHKERRQ(ierr);
17813425bc38SStefano Zampini     } else {
17823425bc38SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Non-fully redundant case for lagrange multiplier.\n");CHKERRQ(ierr);
17833425bc38SStefano Zampini     }
17843425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
17853425bc38SStefano Zampini 
17863425bc38SStefano Zampini     /******************************************************************/
17873425bc38SStefano Zampini     /* TEST A/B: Test numbering of global lambda dofs             */
17883425bc38SStefano Zampini     /******************************************************************/
17893425bc38SStefano Zampini 
17903425bc38SStefano Zampini     ierr = VecDuplicate(fetidpmat_ctx->lambda_local,&test_vec);CHKERRQ(ierr);
17913425bc38SStefano Zampini     ierr = VecSet(lambda_global,1.0);CHKERRQ(ierr);
17923425bc38SStefano Zampini     ierr = VecSet(test_vec,1.0);CHKERRQ(ierr);
17933425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
17943425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
17953425bc38SStefano Zampini     scalar_value = -1.0;
17963425bc38SStefano Zampini     ierr = VecAXPY(test_vec,scalar_value,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
17973425bc38SStefano Zampini     ierr = VecNorm(test_vec,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
17983425bc38SStefano Zampini     ierr = VecDestroy(&test_vec);CHKERRQ(ierr);
17993425bc38SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"A[%04d]: CHECK glob to loc: % 1.14e\n",rank,scalar_value);CHKERRQ(ierr);
18003425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
18013425bc38SStefano Zampini     if (fully_redundant) {
18023425bc38SStefano Zampini       ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr);
18033425bc38SStefano Zampini       ierr = VecSet(fetidpmat_ctx->lambda_local,0.5);CHKERRQ(ierr);
18043425bc38SStefano Zampini       ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18053425bc38SStefano Zampini       ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18063425bc38SStefano Zampini       ierr = VecSum(lambda_global,&scalar_value);CHKERRQ(ierr);
18073425bc38SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"B[%04d]: CHECK loc to glob: % 1.14e\n",rank,scalar_value-fetidpmat_ctx->n_lambda);CHKERRQ(ierr);
18083425bc38SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
18093425bc38SStefano Zampini     }
18103425bc38SStefano Zampini 
18113425bc38SStefano Zampini     /******************************************************************/
18123425bc38SStefano Zampini     /* TEST C: It should holds B_delta*w=0, w\in\widehat{W}           */
18133425bc38SStefano Zampini     /* This is the meaning of the B matrix                            */
18143425bc38SStefano Zampini     /******************************************************************/
18153425bc38SStefano Zampini 
18163425bc38SStefano Zampini     ierr = VecSetRandom(pcis->vec1_N,PETSC_NULL);CHKERRQ(ierr);
18173425bc38SStefano Zampini     ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
18183425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18193425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18203425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18213425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18223425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18233425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18243425bc38SStefano Zampini     /* Action of B_delta */
18253425bc38SStefano Zampini     ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
18263425bc38SStefano Zampini     ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr);
18273425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18283425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18293425bc38SStefano Zampini     ierr = VecNorm(lambda_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
18303425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"C[coll]: CHECK infty norm of B_delta*w (w continuous): % 1.14e\n",scalar_value);CHKERRQ(ierr);
18313425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
18323425bc38SStefano Zampini 
18333425bc38SStefano Zampini     /******************************************************************/
18343425bc38SStefano Zampini     /* TEST D: It should holds E_Dw = w - P_Dw w\in\widetilde{W}     */
18353425bc38SStefano Zampini     /* E_D = R_D^TR                                                   */
18363425bc38SStefano Zampini     /* P_D = B_{D,delta}^T B_{delta}                                  */
18373425bc38SStefano Zampini     /* eq.44 Mandel Tezaur and Dohrmann 2005                          */
18383425bc38SStefano Zampini     /******************************************************************/
18393425bc38SStefano Zampini 
18403425bc38SStefano Zampini     /* compute a random vector in \widetilde{W} */
18413425bc38SStefano Zampini     ierr = VecSetRandom(pcis->vec1_N,PETSC_NULL);CHKERRQ(ierr);
18423425bc38SStefano Zampini     scalar_value = 0.0;  /* set zero at vertices */
18433425bc38SStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
18443425bc38SStefano Zampini     for (i=0;i<n_vertices;i++) { array[vertex_indices[i]]=scalar_value; }
18453425bc38SStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
18463425bc38SStefano Zampini     /* store w for final comparison */
18473425bc38SStefano Zampini     ierr = VecDuplicate(pcis->vec1_B,&test_vec);CHKERRQ(ierr);
18483425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,test_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18493425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,test_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18503425bc38SStefano Zampini 
18513425bc38SStefano Zampini     /* Jump operator P_D : results stored in pcis->vec1_B */
18523425bc38SStefano Zampini 
18533425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18543425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18553425bc38SStefano Zampini     /* Action of B_delta */
18563425bc38SStefano Zampini     ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
18573425bc38SStefano Zampini     ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr);
18583425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18593425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18603425bc38SStefano Zampini     /* Action of B_Ddelta^T */
18613425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18623425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18633425bc38SStefano Zampini     ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
18643425bc38SStefano Zampini 
18653425bc38SStefano Zampini     /* Average operator E_D : results stored in pcis->vec2_B */
18663425bc38SStefano Zampini 
18673425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18683425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18693425bc38SStefano Zampini     ierr = VecPointwiseMult(pcis->vec2_B,pcis->D,pcis->vec2_B);CHKERRQ(ierr);
18703425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec2_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18713425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec2_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18723425bc38SStefano Zampini     ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
18733425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18743425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18753425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18763425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18773425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18783425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18793425bc38SStefano Zampini 
18803425bc38SStefano Zampini     /* test E_D=I-P_D */
18813425bc38SStefano Zampini     scalar_value = 1.0;
18823425bc38SStefano Zampini     ierr = VecAXPY(pcis->vec1_B,scalar_value,pcis->vec2_B);CHKERRQ(ierr);
18833425bc38SStefano Zampini     scalar_value = -1.0;
18843425bc38SStefano Zampini     ierr = VecAXPY(pcis->vec1_B,scalar_value,test_vec);CHKERRQ(ierr);
18853425bc38SStefano Zampini     ierr = VecNorm(pcis->vec1_B,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
18863425bc38SStefano Zampini     ierr = VecDestroy(&test_vec);CHKERRQ(ierr);
18873425bc38SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"D[%04d] CHECK infty norm of E_D + P_D - I: % 1.14e\n",rank,scalar_value);CHKERRQ(ierr);
18883425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
18893425bc38SStefano Zampini 
18903425bc38SStefano Zampini     /******************************************************************/
18913425bc38SStefano Zampini     /* TEST E: It should holds R_D^TP_Dw=0 w\in\widetilde{W}          */
18923425bc38SStefano Zampini     /* eq.48 Mandel Tezaur and Dohrmann 2005                          */
18933425bc38SStefano Zampini     /******************************************************************/
18943425bc38SStefano Zampini 
18953425bc38SStefano Zampini     ierr = VecSetRandom(pcis->vec1_N,PETSC_NULL);CHKERRQ(ierr);
18963425bc38SStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
18973425bc38SStefano Zampini     scalar_value = 0.0;  /* set zero at vertices */
18983425bc38SStefano Zampini     for (i=0;i<n_vertices;i++) { array[vertex_indices[i]]=scalar_value; }
18993425bc38SStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
19003425bc38SStefano Zampini 
19013425bc38SStefano Zampini     /* Jump operator P_D : results stored in pcis->vec1_B */
19023425bc38SStefano Zampini 
19033425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
19043425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
19053425bc38SStefano Zampini     /* Action of B_delta */
19063425bc38SStefano Zampini     ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
19073425bc38SStefano Zampini     ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr);
19083425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
19093425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
19103425bc38SStefano Zampini     /* Action of B_Ddelta^T */
19113425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
19123425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
19133425bc38SStefano Zampini     ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
19143425bc38SStefano Zampini     /* diagonal scaling */
19153425bc38SStefano Zampini     ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr);
19163425bc38SStefano Zampini     /* sum on the interface */
19173425bc38SStefano Zampini     ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
19183425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
19193425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
19203425bc38SStefano Zampini     ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
19213425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
19223425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
19233425bc38SStefano Zampini     ierr = VecNorm(pcis->vec1_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
19243425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"E[coll]: CHECK infty norm of R^T_D P_D: % 1.14e\n",scalar_value);CHKERRQ(ierr);
19253425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
19263425bc38SStefano Zampini 
19273425bc38SStefano Zampini     if (!fully_redundant) {
19283425bc38SStefano Zampini       /******************************************************************/
19293425bc38SStefano Zampini       /* TEST F: It should holds B_{delta}B^T_{D,delta}=I               */
19303425bc38SStefano Zampini       /* Corollary thm 14 Mandel Tezaur and Dohrmann 2005               */
19313425bc38SStefano Zampini       /******************************************************************/
19323425bc38SStefano Zampini       ierr = VecDuplicate(lambda_global,&test_vec);CHKERRQ(ierr);
19333425bc38SStefano Zampini       ierr = VecSetRandom(lambda_global,PETSC_NULL);CHKERRQ(ierr);
19343425bc38SStefano Zampini       /* Action of B_Ddelta^T */
19353425bc38SStefano Zampini       ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
19363425bc38SStefano Zampini       ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
19373425bc38SStefano Zampini       ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
19383425bc38SStefano Zampini       /* Action of B_delta */
19393425bc38SStefano Zampini       ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
19403425bc38SStefano Zampini       ierr = VecSet(test_vec,0.0);CHKERRQ(ierr);
19413425bc38SStefano Zampini       ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,test_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
19423425bc38SStefano Zampini       ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,test_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
19433425bc38SStefano Zampini       scalar_value = -1.0;
19443425bc38SStefano Zampini       ierr = VecAXPY(lambda_global,scalar_value,test_vec);CHKERRQ(ierr);
19453425bc38SStefano Zampini       ierr = VecNorm(lambda_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
19463425bc38SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"E[coll]: CHECK infty norm of P^T_D - I: % 1.14e\n",scalar_value);CHKERRQ(ierr);
19473425bc38SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
19483425bc38SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
19493425bc38SStefano Zampini       ierr = VecDestroy(&test_vec);CHKERRQ(ierr);
19503425bc38SStefano Zampini     }
19513425bc38SStefano Zampini   }
19523425bc38SStefano Zampini   /* final cleanup */
19533425bc38SStefano Zampini   ierr = PetscFree(dual_dofs_boundary_indices);CHKERRQ(ierr);
19543425bc38SStefano Zampini   ierr = PetscFree(vertex_indices);CHKERRQ(ierr);
19553425bc38SStefano Zampini   ierr = PetscFree(aux_local_numbering_1);CHKERRQ(ierr);
19563425bc38SStefano Zampini   ierr = PetscFree(aux_local_numbering_2);CHKERRQ(ierr);
19573425bc38SStefano Zampini   ierr = PetscFree(aux_global_numbering);CHKERRQ(ierr);
19583425bc38SStefano Zampini   ierr = PetscFree(aux_global_numbering_mpi);CHKERRQ(ierr);
19593425bc38SStefano Zampini   ierr = PetscFree(dof_sizes);CHKERRQ(ierr);
19603425bc38SStefano Zampini   ierr = PetscFree(dof_displs);CHKERRQ(ierr);
19613425bc38SStefano Zampini   ierr = PetscFree(all_aux_global_numbering_mpi_1);CHKERRQ(ierr);
19623425bc38SStefano Zampini   ierr = PetscFree(all_aux_global_numbering_mpi_2);CHKERRQ(ierr);
19633425bc38SStefano Zampini   ierr = PetscFree(global_dofs_numbering);CHKERRQ(ierr);
19643425bc38SStefano Zampini   ierr = PetscFree(aux_sums);CHKERRQ(ierr);
19653425bc38SStefano Zampini   ierr = PetscFree(cols_B_delta);CHKERRQ(ierr);
19663425bc38SStefano Zampini   ierr = PetscFree(vals_B_delta);CHKERRQ(ierr);
19673425bc38SStefano Zampini   ierr = PetscFree(scaling_factors);CHKERRQ(ierr);
19683425bc38SStefano Zampini   ierr = VecDestroy(&lambda_global);CHKERRQ(ierr);
19693425bc38SStefano Zampini   ierr = ISDestroy(&IS_l2g_lambda);CHKERRQ(ierr);
19703425bc38SStefano Zampini 
19713425bc38SStefano Zampini   PetscFunctionReturn(0);
19723425bc38SStefano Zampini }
19733425bc38SStefano Zampini 
19743425bc38SStefano Zampini #undef __FUNCT__
19753425bc38SStefano Zampini #define __FUNCT__ "PCBDDCSetupFETIDPPCContext"
19763425bc38SStefano Zampini static PetscErrorCode PCBDDCSetupFETIDPPCContext(Mat fetimat, FETIDPPC_ctx *fetidppc_ctx)
19773425bc38SStefano Zampini {
19783425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
19793425bc38SStefano Zampini   PetscErrorCode ierr;
19803425bc38SStefano Zampini 
19813425bc38SStefano Zampini   PetscFunctionBegin;
19823425bc38SStefano Zampini   ierr = MatShellGetContext(fetimat,&mat_ctx);CHKERRQ(ierr);
19833425bc38SStefano Zampini   /* get references from objects created when setting up feti mat context */
19843425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)mat_ctx->lambda_local);CHKERRQ(ierr);
19853425bc38SStefano Zampini   fetidppc_ctx->lambda_local = mat_ctx->lambda_local;
19863425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)mat_ctx->B_Ddelta);CHKERRQ(ierr);
19873425bc38SStefano Zampini   fetidppc_ctx->B_Ddelta = mat_ctx->B_Ddelta;
19883425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)mat_ctx->l2g_lambda);CHKERRQ(ierr);
19893425bc38SStefano Zampini   fetidppc_ctx->l2g_lambda = mat_ctx->l2g_lambda;
19903425bc38SStefano Zampini   PetscFunctionReturn(0);
19913425bc38SStefano Zampini }
19923425bc38SStefano Zampini 
19933425bc38SStefano Zampini #undef __FUNCT__
19943425bc38SStefano Zampini #define __FUNCT__ "FETIDPMatMult"
19953425bc38SStefano Zampini static PetscErrorCode FETIDPMatMult(Mat fetimat, Vec x, Vec y)
19963425bc38SStefano Zampini {
19973425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
19983425bc38SStefano Zampini   PC_IS          *pcis;
19993425bc38SStefano Zampini   PetscErrorCode ierr;
20003425bc38SStefano Zampini 
20013425bc38SStefano Zampini   PetscFunctionBegin;
20023425bc38SStefano Zampini   ierr = MatShellGetContext(fetimat,&mat_ctx);CHKERRQ(ierr);
20033425bc38SStefano Zampini   pcis = (PC_IS*)mat_ctx->pc->data;
20043425bc38SStefano Zampini   /* Application of B_delta^T */
20053425bc38SStefano Zampini   ierr = VecScatterBegin(mat_ctx->l2g_lambda,x,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
20063425bc38SStefano Zampini   ierr = VecScatterEnd(mat_ctx->l2g_lambda,x,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
20073425bc38SStefano Zampini   ierr = MatMultTranspose(mat_ctx->B_delta,mat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
20083425bc38SStefano Zampini   /* Application of \widetilde{S}^-1 */
20093425bc38SStefano Zampini   ierr = VecSet(pcis->vec1_D,0.0);CHKERRQ(ierr);
20103425bc38SStefano Zampini   ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr);
20113425bc38SStefano Zampini   /* Application of B_delta */
20123425bc38SStefano Zampini   ierr = MatMult(mat_ctx->B_delta,pcis->vec1_B,mat_ctx->lambda_local);CHKERRQ(ierr);
20133425bc38SStefano Zampini   ierr = VecSet(y,0.0);CHKERRQ(ierr);
20143425bc38SStefano Zampini   ierr = VecScatterBegin(mat_ctx->l2g_lambda,mat_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20153425bc38SStefano Zampini   ierr = VecScatterEnd(mat_ctx->l2g_lambda,mat_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20163425bc38SStefano Zampini   PetscFunctionReturn(0);
20173425bc38SStefano Zampini }
20183425bc38SStefano Zampini 
20193425bc38SStefano Zampini #undef __FUNCT__
20203425bc38SStefano Zampini #define __FUNCT__ "FETIDPPCApply"
20213425bc38SStefano Zampini static PetscErrorCode FETIDPPCApply(PC fetipc, Vec x, Vec y)
20223425bc38SStefano Zampini {
20233425bc38SStefano Zampini   FETIDPPC_ctx   *pc_ctx;
20243425bc38SStefano Zampini   PC_IS          *pcis;
20253425bc38SStefano Zampini   PetscErrorCode ierr;
20263425bc38SStefano Zampini 
20273425bc38SStefano Zampini   PetscFunctionBegin;
20283425bc38SStefano Zampini   ierr = PCShellGetContext(fetipc,(void**)&pc_ctx);
20293425bc38SStefano Zampini   pcis = (PC_IS*)pc_ctx->pc->data;
20303425bc38SStefano Zampini   /* Application of B_Ddelta^T */
20313425bc38SStefano Zampini   ierr = VecScatterBegin(pc_ctx->l2g_lambda,x,pc_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
20323425bc38SStefano Zampini   ierr = VecScatterEnd(pc_ctx->l2g_lambda,x,pc_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
20333425bc38SStefano Zampini   ierr = VecSet(pcis->vec2_B,0.0);CHKERRQ(ierr);
20343425bc38SStefano Zampini   ierr = MatMultTranspose(pc_ctx->B_Ddelta,pc_ctx->lambda_local,pcis->vec2_B);CHKERRQ(ierr);
20353425bc38SStefano Zampini   /* Application of S */
20363425bc38SStefano Zampini   ierr = PCISApplySchur(pc_ctx->pc,pcis->vec2_B,pcis->vec1_B,(Vec)0,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
20373425bc38SStefano Zampini   /* Application of B_Ddelta */
20383425bc38SStefano Zampini   ierr = MatMult(pc_ctx->B_Ddelta,pcis->vec1_B,pc_ctx->lambda_local);CHKERRQ(ierr);
20393425bc38SStefano Zampini   ierr = VecSet(y,0.0);CHKERRQ(ierr);
20403425bc38SStefano Zampini   ierr = VecScatterBegin(pc_ctx->l2g_lambda,pc_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20413425bc38SStefano Zampini   ierr = VecScatterEnd(pc_ctx->l2g_lambda,pc_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20423425bc38SStefano Zampini   PetscFunctionReturn(0);
20433425bc38SStefano Zampini }
20443425bc38SStefano Zampini 
2045da1bb401SStefano Zampini #undef __FUNCT__
2046da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetupLocalAdjacencyGraph"
2047da1bb401SStefano Zampini static PetscErrorCode PCBDDCSetupLocalAdjacencyGraph(PC pc)
2048da1bb401SStefano Zampini {
2049da1bb401SStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
2050da1bb401SStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
2051da1bb401SStefano Zampini   PetscInt       nvtxs,*xadj,*adjncy;
2052da1bb401SStefano Zampini   Mat            mat_adj;
2053da1bb401SStefano Zampini   PetscBool      symmetrize_rowij=PETSC_TRUE,compressed_rowij=PETSC_FALSE,flg_row=PETSC_TRUE;
2054da1bb401SStefano Zampini   PCBDDCGraph    mat_graph=pcbddc->mat_graph;
2055da1bb401SStefano Zampini   PetscErrorCode ierr;
2056da1bb401SStefano Zampini 
2057da1bb401SStefano Zampini   PetscFunctionBegin;
2058da1bb401SStefano Zampini   /* get CSR adjacency from local matrix if user has not yet provided local graph using PCBDDCSetLocalAdjacencyGraph function */
2059da1bb401SStefano Zampini   if (!mat_graph->xadj) {
2060da1bb401SStefano Zampini     ierr = MatConvert(matis->A,MATMPIADJ,MAT_INITIAL_MATRIX,&mat_adj);CHKERRQ(ierr);
2061da1bb401SStefano Zampini     ierr = MatGetRowIJ(mat_adj,0,symmetrize_rowij,compressed_rowij,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr);
2062da1bb401SStefano Zampini     if (!flg_row) {
2063da1bb401SStefano Zampini       SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in MatGetRowIJ called in %s\n",__FUNCT__);
2064da1bb401SStefano Zampini     }
2065da1bb401SStefano Zampini     /* Get adjacency into BDDC workspace */
2066da1bb401SStefano Zampini     ierr = PCBDDCSetLocalAdjacencyGraph(pc,nvtxs,xadj,adjncy,PETSC_COPY_VALUES);CHKERRQ(ierr);
2067da1bb401SStefano Zampini     ierr = MatRestoreRowIJ(mat_adj,0,symmetrize_rowij,compressed_rowij,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr);
2068da1bb401SStefano Zampini     if (!flg_row) {
2069da1bb401SStefano Zampini       SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in MatRestoreRowIJ called in %s\n",__FUNCT__);
2070da1bb401SStefano Zampini     }
2071da1bb401SStefano Zampini     ierr = MatDestroy(&mat_adj);CHKERRQ(ierr);
2072da1bb401SStefano Zampini   }
2073da1bb401SStefano Zampini   PetscFunctionReturn(0);
2074da1bb401SStefano Zampini }
2075da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
20760c7d97c5SJed Brown #undef __FUNCT__
20770c7d97c5SJed Brown #define __FUNCT__ "PCBDDCApplyInterfacePreconditioner"
20782617d88aSStefano Zampini static PetscErrorCode  PCBDDCApplyInterfacePreconditioner(PC pc)
20790c7d97c5SJed Brown {
20800c7d97c5SJed Brown   PetscErrorCode ierr;
20810c7d97c5SJed Brown   PC_BDDC*        pcbddc = (PC_BDDC*)(pc->data);
20820c7d97c5SJed Brown   PC_IS*            pcis = (PC_IS*)  (pc->data);
20833b03a366Sstefano_zampini   const PetscScalar zero = 0.0;
20840c7d97c5SJed Brown 
20850c7d97c5SJed Brown   PetscFunctionBegin;
20860c7d97c5SJed Brown   /* Application of PHI^T  */
20870c7d97c5SJed Brown   ierr = MatMultTranspose(pcbddc->coarse_phi_B,pcis->vec1_B,pcbddc->vec1_P);CHKERRQ(ierr);
20880c7d97c5SJed Brown   if (pcbddc->prec_type) { ierr = MatMultTransposeAdd(pcbddc->coarse_phi_D,pcis->vec1_D,pcbddc->vec1_P,pcbddc->vec1_P);CHKERRQ(ierr); }
20890c7d97c5SJed Brown 
20900c7d97c5SJed Brown   /* Scatter data of coarse_rhs */
2091142dfd88SStefano Zampini   if (pcbddc->coarse_rhs) { ierr = VecSet(pcbddc->coarse_rhs,zero);CHKERRQ(ierr); }
20920c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->vec1_P,pcbddc->coarse_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20930c7d97c5SJed Brown 
20940c7d97c5SJed Brown   /* Local solution on R nodes */
20950c7d97c5SJed Brown   ierr = VecSet(pcbddc->vec1_R,zero);CHKERRQ(ierr);
20960c7d97c5SJed Brown   ierr = VecScatterBegin(pcbddc->R_to_B,pcis->vec1_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
20970c7d97c5SJed Brown   ierr = VecScatterEnd  (pcbddc->R_to_B,pcis->vec1_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
20980c7d97c5SJed Brown   if (pcbddc->prec_type) {
20990c7d97c5SJed Brown     ierr = VecScatterBegin(pcbddc->R_to_D,pcis->vec1_D,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21000c7d97c5SJed Brown     ierr = VecScatterEnd  (pcbddc->R_to_D,pcis->vec1_D,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21010c7d97c5SJed Brown   }
21020c7d97c5SJed Brown   ierr = PCBDDCSolveSaddlePoint(pc);CHKERRQ(ierr);
21030c7d97c5SJed Brown   ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr);
21040c7d97c5SJed Brown   ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec2_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21050c7d97c5SJed Brown   ierr = VecScatterEnd  (pcbddc->R_to_B,pcbddc->vec2_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21060c7d97c5SJed Brown   if (pcbddc->prec_type) {
21070c7d97c5SJed Brown     ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec2_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21080c7d97c5SJed Brown     ierr = VecScatterEnd  (pcbddc->R_to_D,pcbddc->vec2_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21090c7d97c5SJed Brown   }
21100c7d97c5SJed Brown 
21110c7d97c5SJed Brown   /* Coarse solution */
21120c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataEnd(pc,pcbddc->vec1_P,pcbddc->coarse_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21130bdf917eSStefano Zampini   if (pcbddc->coarse_rhs) {
21140bdf917eSStefano Zampini     if (pcbddc->CoarseNullSpace) {
21150bdf917eSStefano Zampini       ierr = MatNullSpaceRemove(pcbddc->CoarseNullSpace,pcbddc->coarse_rhs,PETSC_NULL);CHKERRQ(ierr);
21160bdf917eSStefano Zampini     }
21170bdf917eSStefano Zampini     ierr = KSPSolve(pcbddc->coarse_ksp,pcbddc->coarse_rhs,pcbddc->coarse_vec);CHKERRQ(ierr);
21180bdf917eSStefano Zampini     if (pcbddc->CoarseNullSpace) {
21190bdf917eSStefano Zampini       ierr = MatNullSpaceRemove(pcbddc->CoarseNullSpace,pcbddc->coarse_vec,PETSC_NULL);CHKERRQ(ierr);
21200bdf917eSStefano Zampini     }
21210bdf917eSStefano Zampini   }
21220c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21230c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataEnd  (pc,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21240c7d97c5SJed Brown 
21250c7d97c5SJed Brown   /* Sum contributions from two levels */
21260c7d97c5SJed Brown   ierr = MatMultAdd(pcbddc->coarse_phi_B,pcbddc->vec1_P,pcis->vec1_B,pcis->vec1_B);CHKERRQ(ierr);
21270c7d97c5SJed Brown   if (pcbddc->prec_type) { ierr = MatMultAdd(pcbddc->coarse_phi_D,pcbddc->vec1_P,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); }
21280c7d97c5SJed Brown   PetscFunctionReturn(0);
21290c7d97c5SJed Brown }
21300c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
21310c7d97c5SJed Brown #undef __FUNCT__
21320c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSolveSaddlePoint"
213353cdbc3dSStefano Zampini static PetscErrorCode  PCBDDCSolveSaddlePoint(PC pc)
21340c7d97c5SJed Brown {
21350c7d97c5SJed Brown   PetscErrorCode ierr;
21360c7d97c5SJed Brown   PC_BDDC*       pcbddc = (PC_BDDC*)(pc->data);
21370c7d97c5SJed Brown 
21380c7d97c5SJed Brown   PetscFunctionBegin;
213953cdbc3dSStefano Zampini   ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
2140534831adSStefano Zampini   if (pcbddc->local_auxmat1) {
21410c7d97c5SJed Brown     ierr = MatMult(pcbddc->local_auxmat1,pcbddc->vec2_R,pcbddc->vec1_C);CHKERRQ(ierr);
21420c7d97c5SJed Brown     ierr = MatMultAdd(pcbddc->local_auxmat2,pcbddc->vec1_C,pcbddc->vec2_R,pcbddc->vec2_R);CHKERRQ(ierr);
21430c7d97c5SJed Brown   }
21440c7d97c5SJed Brown   PetscFunctionReturn(0);
21450c7d97c5SJed Brown }
21460c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
21470c7d97c5SJed Brown #undef __FUNCT__
21480c7d97c5SJed Brown #define __FUNCT__ "PCBDDCScatterCoarseDataBegin"
214953cdbc3dSStefano Zampini static PetscErrorCode  PCBDDCScatterCoarseDataBegin(PC pc,Vec vec_from, Vec vec_to, InsertMode imode, ScatterMode smode)
21500c7d97c5SJed Brown {
21510c7d97c5SJed Brown   PetscErrorCode ierr;
21520c7d97c5SJed Brown   PC_BDDC*       pcbddc = (PC_BDDC*)(pc->data);
21530c7d97c5SJed Brown 
21540c7d97c5SJed Brown   PetscFunctionBegin;
21550c7d97c5SJed Brown   switch(pcbddc->coarse_communications_type){
21560c7d97c5SJed Brown     case SCATTERS_BDDC:
21570c7d97c5SJed Brown       ierr = VecScatterBegin(pcbddc->coarse_loc_to_glob,vec_from,vec_to,imode,smode);CHKERRQ(ierr);
21580c7d97c5SJed Brown       break;
21590c7d97c5SJed Brown     case GATHERS_BDDC:
21600c7d97c5SJed Brown       break;
21610c7d97c5SJed Brown   }
21620c7d97c5SJed Brown   PetscFunctionReturn(0);
21630c7d97c5SJed Brown }
21640c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
21650c7d97c5SJed Brown #undef __FUNCT__
21660c7d97c5SJed Brown #define __FUNCT__ "PCBDDCScatterCoarseDataEnd"
216753cdbc3dSStefano Zampini static PetscErrorCode  PCBDDCScatterCoarseDataEnd(PC pc,Vec vec_from, Vec vec_to, InsertMode imode, ScatterMode smode)
21680c7d97c5SJed Brown {
21690c7d97c5SJed Brown   PetscErrorCode ierr;
21700c7d97c5SJed Brown   PC_BDDC*       pcbddc = (PC_BDDC*)(pc->data);
21710c7d97c5SJed Brown   PetscScalar*   array_to;
21720c7d97c5SJed Brown   PetscScalar*   array_from;
21730c7d97c5SJed Brown   MPI_Comm       comm=((PetscObject)pc)->comm;
21740c7d97c5SJed Brown   PetscInt i;
21750c7d97c5SJed Brown 
21760c7d97c5SJed Brown   PetscFunctionBegin;
21770c7d97c5SJed Brown 
21780c7d97c5SJed Brown   switch(pcbddc->coarse_communications_type){
21790c7d97c5SJed Brown     case SCATTERS_BDDC:
21800c7d97c5SJed Brown       ierr = VecScatterEnd(pcbddc->coarse_loc_to_glob,vec_from,vec_to,imode,smode);CHKERRQ(ierr);
21810c7d97c5SJed Brown       break;
21820c7d97c5SJed Brown     case GATHERS_BDDC:
21830c7d97c5SJed Brown       if (vec_from) VecGetArray(vec_from,&array_from);
21840c7d97c5SJed Brown       if (vec_to)   VecGetArray(vec_to,&array_to);
21850c7d97c5SJed Brown       switch(pcbddc->coarse_problem_type){
21860c7d97c5SJed Brown         case SEQUENTIAL_BDDC:
21870c7d97c5SJed Brown           if (smode == SCATTER_FORWARD) {
218853cdbc3dSStefano Zampini             ierr = MPI_Gatherv(&array_from[0],pcbddc->local_primal_size,MPIU_SCALAR,&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,0,comm);CHKERRQ(ierr);
21890c7d97c5SJed Brown             if (vec_to) {
21900bdf917eSStefano Zampini               if (imode == ADD_VALUES) {
21910bdf917eSStefano Zampini                 for (i=0;i<pcbddc->replicated_primal_size;i++) {
21920c7d97c5SJed Brown                   array_to[pcbddc->replicated_local_primal_indices[i]]+=pcbddc->replicated_local_primal_values[i];
21930c7d97c5SJed Brown                 }
21940c7d97c5SJed Brown               } else {
21950bdf917eSStefano Zampini                 for (i=0;i<pcbddc->replicated_primal_size;i++) {
21960bdf917eSStefano Zampini                   array_to[pcbddc->replicated_local_primal_indices[i]]=pcbddc->replicated_local_primal_values[i];
21970bdf917eSStefano Zampini                 }
21980bdf917eSStefano Zampini               }
21990bdf917eSStefano Zampini             }
22000bdf917eSStefano Zampini           } else {
22010bdf917eSStefano Zampini             if (vec_from) {
22020bdf917eSStefano Zampini               if (imode == ADD_VALUES) {
22030bdf917eSStefano Zampini                 printf("Scatter mode %d, insert mode %d for case %d not implemented!\n",smode,imode,pcbddc->coarse_problem_type);
22040bdf917eSStefano Zampini               }
22050bdf917eSStefano Zampini               for (i=0;i<pcbddc->replicated_primal_size;i++) {
22060c7d97c5SJed Brown                 pcbddc->replicated_local_primal_values[i]=array_from[pcbddc->replicated_local_primal_indices[i]];
22070bdf917eSStefano Zampini               }
22080bdf917eSStefano Zampini             }
220953cdbc3dSStefano Zampini             ierr = MPI_Scatterv(&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,&array_to[0],pcbddc->local_primal_size,MPIU_SCALAR,0,comm);CHKERRQ(ierr);
22100c7d97c5SJed Brown           }
22110c7d97c5SJed Brown           break;
22120c7d97c5SJed Brown         case REPLICATED_BDDC:
22130c7d97c5SJed Brown           if (smode == SCATTER_FORWARD) {
221453cdbc3dSStefano Zampini             ierr = MPI_Allgatherv(&array_from[0],pcbddc->local_primal_size,MPIU_SCALAR,&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,comm);CHKERRQ(ierr);
22150bdf917eSStefano Zampini             if (imode == ADD_VALUES) {
22160bdf917eSStefano Zampini               for (i=0;i<pcbddc->replicated_primal_size;i++) {
22170c7d97c5SJed Brown                 array_to[pcbddc->replicated_local_primal_indices[i]]+=pcbddc->replicated_local_primal_values[i];
22180bdf917eSStefano Zampini               }
22190bdf917eSStefano Zampini             } else {
22200bdf917eSStefano Zampini               for (i=0;i<pcbddc->replicated_primal_size;i++) {
22210bdf917eSStefano Zampini                 array_to[pcbddc->replicated_local_primal_indices[i]]=pcbddc->replicated_local_primal_values[i];
22220bdf917eSStefano Zampini               }
22230bdf917eSStefano Zampini             }
22240c7d97c5SJed Brown           } else { /* no communications needed for SCATTER_REVERSE since needed data is already present */
22250bdf917eSStefano Zampini             if (imode == ADD_VALUES) {
22260bdf917eSStefano Zampini               for (i=0;i<pcbddc->local_primal_size;i++) {
22270bdf917eSStefano Zampini                 array_to[i]+=array_from[pcbddc->local_primal_indices[i]];
22280bdf917eSStefano Zampini               }
22290bdf917eSStefano Zampini             } else {
22300bdf917eSStefano Zampini               for (i=0;i<pcbddc->local_primal_size;i++) {
22310c7d97c5SJed Brown                 array_to[i]=array_from[pcbddc->local_primal_indices[i]];
22320c7d97c5SJed Brown               }
22330bdf917eSStefano Zampini             }
22340bdf917eSStefano Zampini           }
22350c7d97c5SJed Brown           break;
223653cdbc3dSStefano Zampini         case MULTILEVEL_BDDC:
223753cdbc3dSStefano Zampini           break;
223853cdbc3dSStefano Zampini         case PARALLEL_BDDC:
223953cdbc3dSStefano Zampini           break;
22400c7d97c5SJed Brown       }
22410c7d97c5SJed Brown       if (vec_from) VecRestoreArray(vec_from,&array_from);
22420c7d97c5SJed Brown       if (vec_to)   VecRestoreArray(vec_to,&array_to);
22430c7d97c5SJed Brown       break;
22440c7d97c5SJed Brown   }
22450c7d97c5SJed Brown   PetscFunctionReturn(0);
22460c7d97c5SJed Brown }
22470c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
22483b03a366Sstefano_zampini #undef __FUNCT__
22493b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCCreateConstraintMatrix"
22503b03a366Sstefano_zampini static PetscErrorCode PCBDDCCreateConstraintMatrix(PC pc)
22513b03a366Sstefano_zampini {
22523b03a366Sstefano_zampini   PetscErrorCode ierr;
22533b03a366Sstefano_zampini   PC_IS*         pcis = (PC_IS*)(pc->data);
22543b03a366Sstefano_zampini   PC_BDDC*       pcbddc = (PC_BDDC*)pc->data;
22553b03a366Sstefano_zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
225623d4d1a5SStefano Zampini   PetscInt       *nnz,*is_indices;
22573b03a366Sstefano_zampini   PetscScalar    *temp_quadrature_constraint;
2258534831adSStefano Zampini   PetscInt       *temp_indices,*temp_indices_to_constraint,*temp_indices_to_constraint_B,*local_to_B;
22593b03a366Sstefano_zampini   PetscInt       local_primal_size,i,j,k,total_counts,max_size_of_constraint;
22603b03a366Sstefano_zampini   PetscInt       n_constraints,n_vertices,size_of_constraint;
2261534831adSStefano Zampini   PetscScalar    quad_value;
22623b03a366Sstefano_zampini   PetscBool      nnsp_has_cnst=PETSC_FALSE,use_nnsp_true=pcbddc->use_nnsp_true;
22633b03a366Sstefano_zampini   PetscInt       nnsp_size=0,nnsp_addone=0,temp_constraints,temp_start_ptr;
22643b03a366Sstefano_zampini   IS             *used_IS;
22653b03a366Sstefano_zampini   const MatType  impMatType=MATSEQAIJ;
22663b03a366Sstefano_zampini   PetscBLASInt   Bs,Bt,lwork,lierr;
22673b03a366Sstefano_zampini   PetscReal      tol=1.0e-8;
2268fcda91b4SJed Brown   MatNullSpace   nearnullsp;
2269fcda91b4SJed Brown   const Vec      *nearnullvecs;
22703b03a366Sstefano_zampini   Vec            *localnearnullsp;
22713b03a366Sstefano_zampini   PetscScalar    *work,*temp_basis,*array_vector,*correlation_mat;
22723b03a366Sstefano_zampini   PetscReal      *rwork,*singular_vals;
2273534831adSStefano Zampini   PetscBLASInt   Bone=1,*ipiv;
2274534831adSStefano Zampini   Vec            temp_vec;
2275534831adSStefano Zampini   Mat            temp_mat;
2276534831adSStefano Zampini   KSP            temp_ksp;
2277ffe5efe1SStefano Zampini   PC             temp_pc;
2278534831adSStefano Zampini   PetscInt       s,start_constraint,dual_dofs;
2279534831adSStefano Zampini   PetscBool      compute_submatrix,useksp=PETSC_FALSE;
2280534831adSStefano Zampini   PetscInt       *aux_primal_permutation,*aux_primal_numbering;
2281534831adSStefano Zampini   PetscBool      boolforface,*change_basis;
2282de534f79Sstefano_zampini /* some ugly conditional declarations */
22833b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
22843b03a366Sstefano_zampini   PetscScalar    dot_result;
22853b03a366Sstefano_zampini   PetscScalar    one=1.0,zero=0.0;
22863b03a366Sstefano_zampini   PetscInt       ii;
22873425bc38SStefano Zampini   PetscScalar    *singular_vectors;
22883425bc38SStefano Zampini   PetscBLASInt   *iwork,*ifail;
22893425bc38SStefano Zampini   PetscReal      dummy_real,abs_tol;
22903425bc38SStefano Zampini   PetscBLASInt   eigs_found;
22913b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
22923b03a366Sstefano_zampini   PetscScalar    val1,val2;
22933b03a366Sstefano_zampini #endif
22943425bc38SStefano Zampini #endif
22953b03a366Sstefano_zampini   PetscBLASInt   dummy_int;
22963b03a366Sstefano_zampini   PetscScalar    dummy_scalar;
22973b03a366Sstefano_zampini 
22983b03a366Sstefano_zampini   PetscFunctionBegin;
22993b03a366Sstefano_zampini   /* check if near null space is attached to global mat */
2300fcda91b4SJed Brown   ierr = MatGetNearNullSpace(pc->pmat,&nearnullsp);CHKERRQ(ierr);
2301fcda91b4SJed Brown   if (nearnullsp) {
2302fcda91b4SJed Brown     ierr = MatNullSpaceGetVecs(nearnullsp,&nnsp_has_cnst,&nnsp_size,&nearnullvecs);CHKERRQ(ierr);
23033b03a366Sstefano_zampini   } else { /* if near null space is not provided it uses constants */
23043b03a366Sstefano_zampini     nnsp_has_cnst = PETSC_TRUE;
23053b03a366Sstefano_zampini     use_nnsp_true = PETSC_TRUE;
23063b03a366Sstefano_zampini   }
23073b03a366Sstefano_zampini   if (nnsp_has_cnst) {
23083b03a366Sstefano_zampini     nnsp_addone = 1;
23093b03a366Sstefano_zampini   }
23103b03a366Sstefano_zampini   /*
23113b03a366Sstefano_zampini        Evaluate maximum storage size needed by the procedure
23123b03a366Sstefano_zampini        - temp_indices will contain start index of each constraint stored as follows
23133b03a366Sstefano_zampini        - temp_indices_to_constraint  [temp_indices[i],...,temp_indices[i+1]-1] will contain the indices (in local numbering) on which the constraint acts
2314534831adSStefano Zampini        - temp_indices_to_constraint_B[temp_indices[i],...,temp_indices[i+1]-1] will contain the indices (in boundary numbering) on which the constraint acts
23153b03a366Sstefano_zampini        - temp_quadrature_constraint  [temp_indices[i],...,temp_indices[i+1]-1] will contain the scalars representing the constraint itself
23163b03a366Sstefano_zampini                                                                                                                                                          */
2317da1bb401SStefano Zampini 
23183b03a366Sstefano_zampini   total_counts = pcbddc->n_ISForFaces+pcbddc->n_ISForEdges;
23193b03a366Sstefano_zampini   total_counts *= (nnsp_addone+nnsp_size);
2320da1bb401SStefano Zampini   ierr = ISGetSize(pcbddc->ISForVertices,&n_vertices);CHKERRQ(ierr);
2321da1bb401SStefano Zampini   total_counts += n_vertices;
23223b03a366Sstefano_zampini   ierr = PetscMalloc((total_counts+1)*sizeof(PetscInt),&temp_indices);CHKERRQ(ierr);
2323534831adSStefano Zampini   ierr = PetscMalloc((total_counts+1)*sizeof(PetscBool),&change_basis);CHKERRQ(ierr);
23243b03a366Sstefano_zampini   total_counts = 0;
23253b03a366Sstefano_zampini   max_size_of_constraint = 0;
23263b03a366Sstefano_zampini   for (i=0;i<pcbddc->n_ISForEdges+pcbddc->n_ISForFaces;i++){
23273b03a366Sstefano_zampini     if (i<pcbddc->n_ISForEdges){
23283b03a366Sstefano_zampini       used_IS = &pcbddc->ISForEdges[i];
23293b03a366Sstefano_zampini     } else {
23303b03a366Sstefano_zampini       used_IS = &pcbddc->ISForFaces[i-pcbddc->n_ISForEdges];
23313b03a366Sstefano_zampini     }
23323b03a366Sstefano_zampini     ierr = ISGetSize(*used_IS,&j);CHKERRQ(ierr);
23333b03a366Sstefano_zampini     total_counts += j;
23343b03a366Sstefano_zampini     if (j>max_size_of_constraint) max_size_of_constraint=j;
23353b03a366Sstefano_zampini   }
23363b03a366Sstefano_zampini   total_counts *= (nnsp_addone+nnsp_size);
2337da1bb401SStefano Zampini   total_counts += n_vertices;
23383b03a366Sstefano_zampini   ierr = PetscMalloc(total_counts*sizeof(PetscScalar),&temp_quadrature_constraint);CHKERRQ(ierr);
23393b03a366Sstefano_zampini   ierr = PetscMalloc(total_counts*sizeof(PetscInt),&temp_indices_to_constraint);CHKERRQ(ierr);
2340534831adSStefano Zampini   ierr = PetscMalloc(total_counts*sizeof(PetscInt),&temp_indices_to_constraint_B);CHKERRQ(ierr);
2341534831adSStefano Zampini   ierr = PetscMalloc(pcis->n*sizeof(PetscInt),&local_to_B);CHKERRQ(ierr);
2342534831adSStefano Zampini   ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2343534831adSStefano Zampini   for (i=0;i<pcis->n;i++) {
2344534831adSStefano Zampini     local_to_B[i]=-1;
2345534831adSStefano Zampini   }
2346534831adSStefano Zampini   for (i=0;i<pcis->n_B;i++) {
2347534831adSStefano Zampini     local_to_B[is_indices[i]]=i;
2348534831adSStefano Zampini   }
2349534831adSStefano Zampini   ierr = ISRestoreIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2350534831adSStefano Zampini 
23513b03a366Sstefano_zampini   /* First we issue queries to allocate optimal workspace for LAPACKgesvd or LAPACKsyev/LAPACKheev */
23523b03a366Sstefano_zampini   rwork = 0;
23533b03a366Sstefano_zampini   work = 0;
23543b03a366Sstefano_zampini   singular_vals = 0;
23553b03a366Sstefano_zampini   temp_basis = 0;
23563b03a366Sstefano_zampini   correlation_mat = 0;
23573b03a366Sstefano_zampini   if (!pcbddc->use_nnsp_true) {
23583b03a366Sstefano_zampini     PetscScalar temp_work;
23593b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
23603b03a366Sstefano_zampini     /* POD */
23613b03a366Sstefano_zampini     PetscInt max_n;
23623b03a366Sstefano_zampini     max_n = nnsp_addone+nnsp_size;
23633b03a366Sstefano_zampini     /* using some techniques borrowed from Proper Orthogonal Decomposition */
23643b03a366Sstefano_zampini     ierr = PetscMalloc(max_n*max_n*sizeof(PetscScalar),&correlation_mat);CHKERRQ(ierr);
23653425bc38SStefano Zampini     ierr = PetscMalloc(max_n*max_n*sizeof(PetscScalar),&singular_vectors);CHKERRQ(ierr);
23663b03a366Sstefano_zampini     ierr = PetscMalloc(max_n*sizeof(PetscReal),&singular_vals);CHKERRQ(ierr);
23673b03a366Sstefano_zampini     ierr = PetscMalloc(max_size_of_constraint*(nnsp_addone+nnsp_size)*sizeof(PetscScalar),&temp_basis);CHKERRQ(ierr);
23683b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
23693b03a366Sstefano_zampini     ierr = PetscMalloc(3*max_n*sizeof(PetscReal),&rwork);CHKERRQ(ierr);
23703b03a366Sstefano_zampini #endif
23713425bc38SStefano Zampini     ierr = PetscMalloc(5*max_n*sizeof(PetscBLASInt),&iwork);CHKERRQ(ierr);
23723425bc38SStefano Zampini     ierr = PetscMalloc(max_n*sizeof(PetscBLASInt),&ifail);CHKERRQ(ierr);
23733b03a366Sstefano_zampini     /* now we evaluate the optimal workspace using query with lwork=-1 */
23743b03a366Sstefano_zampini     Bt = PetscBLASIntCast(max_n);
23753b03a366Sstefano_zampini     lwork=-1;
23763425bc38SStefano Zampini     ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
23773b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
23783425bc38SStefano Zampini     abs_tol=1.e-8;
23793425bc38SStefano Zampini /*    LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,&temp_work,&lwork,&lierr); */
23803425bc38SStefano Zampini     LAPACKsyevx_("V","A","U",&Bt,correlation_mat,&Bt,&dummy_real,&dummy_real,&dummy_int,&dummy_int,
23813425bc38SStefano Zampini                  &abs_tol,&eigs_found,singular_vals,singular_vectors,&Bt,&temp_work,&lwork,iwork,ifail,&lierr);
23823b03a366Sstefano_zampini #else
23833425bc38SStefano Zampini /*    LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,&temp_work,&lwork,rwork,&lierr); */
23843425bc38SStefano Zampini /*  LAPACK call is missing here! TODO */
23853425bc38SStefano Zampini     SETERRQ(((PetscObject) pc)->comm, PETSC_ERR_SUP, "Not yet implemented for complexes when PETSC_MISSING_GESVD = 1");
23863b03a366Sstefano_zampini #endif
23873425bc38SStefano Zampini     if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SYEVX Lapack routine %d",(int)lierr);
23883425bc38SStefano Zampini     ierr = PetscFPTrapPop();CHKERRQ(ierr);
23893b03a366Sstefano_zampini #else /* on missing GESVD */
23903b03a366Sstefano_zampini     /* SVD */
23913b03a366Sstefano_zampini     PetscInt max_n,min_n;
23923b03a366Sstefano_zampini     max_n = max_size_of_constraint;
23933b03a366Sstefano_zampini     min_n = nnsp_addone+nnsp_size;
23943b03a366Sstefano_zampini     if (max_size_of_constraint < ( nnsp_addone+nnsp_size ) ) {
23953b03a366Sstefano_zampini       min_n = max_size_of_constraint;
23963b03a366Sstefano_zampini       max_n = nnsp_addone+nnsp_size;
23973b03a366Sstefano_zampini     }
23983b03a366Sstefano_zampini     ierr = PetscMalloc(min_n*sizeof(PetscReal),&singular_vals);CHKERRQ(ierr);
23993b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
24003b03a366Sstefano_zampini     ierr = PetscMalloc(5*min_n*sizeof(PetscReal),&rwork);CHKERRQ(ierr);
24013b03a366Sstefano_zampini #endif
24023b03a366Sstefano_zampini     /* now we evaluate the optimal workspace using query with lwork=-1 */
24033b03a366Sstefano_zampini     lwork=-1;
24043b03a366Sstefano_zampini     Bs = PetscBLASIntCast(max_n);
24053b03a366Sstefano_zampini     Bt = PetscBLASIntCast(min_n);
24063b03a366Sstefano_zampini     dummy_int = Bs;
2407670f3ff9SJed Brown     ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
24083b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
24093b03a366Sstefano_zampini     LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[0],&Bs,singular_vals,
24103b03a366Sstefano_zampini                  &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,&temp_work,&lwork,&lierr);
24113b03a366Sstefano_zampini #else
24123b03a366Sstefano_zampini     LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[0],&Bs,singular_vals,
24133b03a366Sstefano_zampini                  &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,&temp_work,&lwork,rwork,&lierr);
24143b03a366Sstefano_zampini #endif
24153b03a366Sstefano_zampini     if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SVD Lapack routine %d",(int)lierr);
2416670f3ff9SJed Brown     ierr = PetscFPTrapPop();CHKERRQ(ierr);
24173b03a366Sstefano_zampini #endif
24183b03a366Sstefano_zampini     /* Allocate optimal workspace */
24193b03a366Sstefano_zampini     lwork = PetscBLASIntCast((PetscInt)PetscRealPart(temp_work));
24203b03a366Sstefano_zampini     total_counts = (PetscInt)lwork;
24213b03a366Sstefano_zampini     ierr = PetscMalloc(total_counts*sizeof(PetscScalar),&work);CHKERRQ(ierr);
24223b03a366Sstefano_zampini   }
24233b03a366Sstefano_zampini   /* get local part of global near null space vectors */
24243b03a366Sstefano_zampini   ierr = PetscMalloc(nnsp_size*sizeof(Vec),&localnearnullsp);CHKERRQ(ierr);
24253b03a366Sstefano_zampini   for (k=0;k<nnsp_size;k++) {
24263b03a366Sstefano_zampini     ierr = VecDuplicate(pcis->vec1_N,&localnearnullsp[k]);CHKERRQ(ierr);
2427fcda91b4SJed Brown     ierr = VecScatterBegin(matis->ctx,nearnullvecs[k],localnearnullsp[k],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
2428fcda91b4SJed Brown     ierr = VecScatterEnd  (matis->ctx,nearnullvecs[k],localnearnullsp[k],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
24293b03a366Sstefano_zampini   }
24303b03a366Sstefano_zampini   /* Now we can loop on constraining sets */
24313b03a366Sstefano_zampini   total_counts=0;
24323b03a366Sstefano_zampini   temp_indices[0]=0;
2433da1bb401SStefano Zampini   /* vertices */
2434da1bb401SStefano Zampini   PetscBool used_vertex;
2435da1bb401SStefano Zampini   ierr = ISGetIndices(pcbddc->ISForVertices,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2436da1bb401SStefano Zampini   if (nnsp_has_cnst) { /* consider all vertices */
2437da1bb401SStefano Zampini     for (i=0;i<n_vertices;i++) {
2438da1bb401SStefano Zampini       temp_indices_to_constraint[temp_indices[total_counts]]=is_indices[i];
2439534831adSStefano Zampini       temp_indices_to_constraint_B[temp_indices[total_counts]]=local_to_B[is_indices[i]];
2440da1bb401SStefano Zampini       temp_quadrature_constraint[temp_indices[total_counts]]=1.0;
2441da1bb401SStefano Zampini       temp_indices[total_counts+1]=temp_indices[total_counts]+1;
2442534831adSStefano Zampini       change_basis[total_counts]=PETSC_FALSE;
2443da1bb401SStefano Zampini       total_counts++;
2444da1bb401SStefano Zampini     }
2445da1bb401SStefano Zampini   } else { /* consider vertices for which exist at least a localnearnullsp which is not null there */
2446da1bb401SStefano Zampini     for (i=0;i<n_vertices;i++) {
2447da1bb401SStefano Zampini       used_vertex=PETSC_FALSE;
2448da1bb401SStefano Zampini       k=0;
2449da1bb401SStefano Zampini       while(!used_vertex && k<nnsp_size) {
2450da1bb401SStefano Zampini         ierr = VecGetArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
2451da1bb401SStefano Zampini         if (PetscAbsScalar(array_vector[is_indices[i]])>0.0) {
2452da1bb401SStefano Zampini           temp_indices_to_constraint[temp_indices[total_counts]]=is_indices[i];
2453534831adSStefano Zampini           temp_indices_to_constraint_B[temp_indices[total_counts]]=local_to_B[is_indices[i]];
2454da1bb401SStefano Zampini           temp_quadrature_constraint[temp_indices[total_counts]]=1.0;
2455da1bb401SStefano Zampini           temp_indices[total_counts+1]=temp_indices[total_counts]+1;
2456534831adSStefano Zampini           change_basis[total_counts]=PETSC_FALSE;
2457da1bb401SStefano Zampini           total_counts++;
2458da1bb401SStefano Zampini           used_vertex=PETSC_TRUE;
2459da1bb401SStefano Zampini         }
2460da1bb401SStefano Zampini         ierr = VecRestoreArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
2461da1bb401SStefano Zampini         k++;
2462da1bb401SStefano Zampini       }
2463da1bb401SStefano Zampini     }
2464da1bb401SStefano Zampini   }
2465da1bb401SStefano Zampini   ierr = ISRestoreIndices(pcbddc->ISForVertices,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2466da1bb401SStefano Zampini   n_vertices=total_counts;
2467da1bb401SStefano Zampini   /* edges and faces */
24683b03a366Sstefano_zampini   for (i=0;i<pcbddc->n_ISForEdges+pcbddc->n_ISForFaces;i++){
24693b03a366Sstefano_zampini     if (i<pcbddc->n_ISForEdges){
24703b03a366Sstefano_zampini       used_IS = &pcbddc->ISForEdges[i];
2471534831adSStefano Zampini       boolforface = pcbddc->usechangeofbasis;
24723b03a366Sstefano_zampini     } else {
24733b03a366Sstefano_zampini       used_IS = &pcbddc->ISForFaces[i-pcbddc->n_ISForEdges];
2474534831adSStefano Zampini       boolforface = pcbddc->usechangeonfaces;
24753b03a366Sstefano_zampini     }
24763b03a366Sstefano_zampini     temp_constraints = 0;          /* zero the number of constraints I have on this conn comp */
24773b03a366Sstefano_zampini     temp_start_ptr = total_counts; /* need to know the starting index of constraints stored */
24783b03a366Sstefano_zampini     ierr = ISGetSize(*used_IS,&size_of_constraint);CHKERRQ(ierr);
24793b03a366Sstefano_zampini     ierr = ISGetIndices(*used_IS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
24803b03a366Sstefano_zampini     if (nnsp_has_cnst) {
24813b03a366Sstefano_zampini       temp_constraints++;
2482534831adSStefano Zampini       quad_value = (PetscScalar) (1.0/PetscSqrtReal((PetscReal)size_of_constraint));
24833b03a366Sstefano_zampini       for (j=0;j<size_of_constraint;j++) {
24843b03a366Sstefano_zampini         temp_indices_to_constraint[temp_indices[total_counts]+j]=is_indices[j];
2485534831adSStefano Zampini         temp_indices_to_constraint_B[temp_indices[total_counts]+j]=local_to_B[is_indices[j]];
24863b03a366Sstefano_zampini         temp_quadrature_constraint[temp_indices[total_counts]+j]=quad_value;
24873b03a366Sstefano_zampini       }
24883b03a366Sstefano_zampini       temp_indices[total_counts+1]=temp_indices[total_counts]+size_of_constraint;  /* store new starting point */
2489534831adSStefano Zampini       change_basis[total_counts]=boolforface;
24903b03a366Sstefano_zampini       total_counts++;
24913b03a366Sstefano_zampini     }
24923b03a366Sstefano_zampini     for (k=0;k<nnsp_size;k++) {
24933b03a366Sstefano_zampini       ierr = VecGetArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
24943b03a366Sstefano_zampini       for (j=0;j<size_of_constraint;j++) {
24953b03a366Sstefano_zampini         temp_indices_to_constraint[temp_indices[total_counts]+j]=is_indices[j];
2496534831adSStefano Zampini         temp_indices_to_constraint_B[temp_indices[total_counts]+j]=local_to_B[is_indices[j]];
24973b03a366Sstefano_zampini         temp_quadrature_constraint[temp_indices[total_counts]+j]=array_vector[is_indices[j]];
24983b03a366Sstefano_zampini       }
24993b03a366Sstefano_zampini       ierr = VecRestoreArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
2500de534f79Sstefano_zampini       quad_value = 1.0;
2501de534f79Sstefano_zampini       if ( use_nnsp_true ) { /* check if array is null on the connected component in case use_nnsp_true has been requested */
2502de534f79Sstefano_zampini         Bs = PetscBLASIntCast(size_of_constraint);
2503de534f79Sstefano_zampini         quad_value = BLASasum_(&Bs,&temp_quadrature_constraint[temp_indices[total_counts]],&Bone);
2504de534f79Sstefano_zampini       }
2505de534f79Sstefano_zampini       if ( quad_value > 0.0 ) { /* keep indices and values */
2506de534f79Sstefano_zampini         temp_constraints++;
25073b03a366Sstefano_zampini         temp_indices[total_counts+1]=temp_indices[total_counts]+size_of_constraint;  /* store new starting point */
2508534831adSStefano Zampini         change_basis[total_counts]=boolforface;
25093b03a366Sstefano_zampini         total_counts++;
25103b03a366Sstefano_zampini       }
2511de534f79Sstefano_zampini     }
25123b03a366Sstefano_zampini     ierr = ISRestoreIndices(*used_IS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2513de534f79Sstefano_zampini     /* perform SVD on the constraint if use_nnsp_true has not been requested by the user */
25143b03a366Sstefano_zampini     if (!use_nnsp_true) {
2515de534f79Sstefano_zampini 
25163b03a366Sstefano_zampini       Bs = PetscBLASIntCast(size_of_constraint);
25173b03a366Sstefano_zampini       Bt = PetscBLASIntCast(temp_constraints);
2518de534f79Sstefano_zampini 
25193b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
25203b03a366Sstefano_zampini       ierr = PetscMemzero(correlation_mat,Bt*Bt*sizeof(PetscScalar));CHKERRQ(ierr);
25213b03a366Sstefano_zampini       /* Store upper triangular part of correlation matrix */
25223b03a366Sstefano_zampini       for (j=0;j<temp_constraints;j++) {
25233b03a366Sstefano_zampini         for (k=0;k<j+1;k++) {
25243b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
25253425bc38SStefano Zampini           /* hand made complex dot product -> replace */
25263b03a366Sstefano_zampini           dot_result = 0.0;
25273b03a366Sstefano_zampini           for (ii=0; ii<size_of_constraint; ii++) {
25283b03a366Sstefano_zampini             val1 = temp_quadrature_constraint[temp_indices[temp_start_ptr+j]+ii];
25293b03a366Sstefano_zampini             val2 = temp_quadrature_constraint[temp_indices[temp_start_ptr+k]+ii];
25303b03a366Sstefano_zampini             dot_result += val1*PetscConj(val2);
25313b03a366Sstefano_zampini           }
25323b03a366Sstefano_zampini #else
25333b03a366Sstefano_zampini           dot_result = BLASdot_(&Bs,&temp_quadrature_constraint[temp_indices[temp_start_ptr+j]],&Bone,
25343b03a366Sstefano_zampini                                     &temp_quadrature_constraint[temp_indices[temp_start_ptr+k]],&Bone);
25353b03a366Sstefano_zampini #endif
25363b03a366Sstefano_zampini           correlation_mat[j*temp_constraints+k]=dot_result;
25373b03a366Sstefano_zampini         }
25383b03a366Sstefano_zampini       }
25393425bc38SStefano Zampini       ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
25403b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
25413425bc38SStefano Zampini /*      LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,work,&lwork,&lierr); */
25423425bc38SStefano Zampini       LAPACKsyevx_("V","A","U",&Bt,correlation_mat,&Bt,&dummy_real,&dummy_real,&dummy_int,&dummy_int,
25433425bc38SStefano Zampini                  &abs_tol,&eigs_found,singular_vals,singular_vectors,&Bt,work,&lwork,iwork,ifail,&lierr);
25443b03a366Sstefano_zampini #else
25453425bc38SStefano Zampini /*  LAPACK call is missing here! TODO */
25463425bc38SStefano Zampini       SETERRQ(((PetscObject) pc)->comm, PETSC_ERR_SUP, "Not yet implemented for complexes when PETSC_MISSING_GESVD = 1");
25473b03a366Sstefano_zampini #endif
25483425bc38SStefano Zampini       if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYEVX Lapack routine %d",(int)lierr);
25493425bc38SStefano Zampini       ierr = PetscFPTrapPop();CHKERRQ(ierr);
25503b03a366Sstefano_zampini       /* retain eigenvalues greater than tol: note that lapack SYEV gives eigs in ascending order */
25513b03a366Sstefano_zampini       j=0;
25523b03a366Sstefano_zampini       while( j < Bt && singular_vals[j] < tol) j++;
25533b03a366Sstefano_zampini       total_counts=total_counts-j;
25543b03a366Sstefano_zampini       if (j<temp_constraints) {
25553b03a366Sstefano_zampini         for (k=j;k<Bt;k++) { singular_vals[k]=1.0/PetscSqrtReal(singular_vals[k]); }
25563425bc38SStefano Zampini         ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
25573b03a366Sstefano_zampini         BLASgemm_("N","N",&Bs,&Bt,&Bt,&one,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,correlation_mat,&Bt,&zero,temp_basis,&Bs);
25583425bc38SStefano Zampini         ierr = PetscFPTrapPop();CHKERRQ(ierr);
25593b03a366Sstefano_zampini         /* copy POD basis into used quadrature memory */
25603b03a366Sstefano_zampini         for (k=0;k<Bt-j;k++) {
25613b03a366Sstefano_zampini           for (ii=0;ii<size_of_constraint;ii++) {
25623b03a366Sstefano_zampini             temp_quadrature_constraint[temp_indices[temp_start_ptr+k]+ii]=singular_vals[Bt-1-k]*temp_basis[(Bt-1-k)*size_of_constraint+ii];
25633b03a366Sstefano_zampini           }
25643b03a366Sstefano_zampini         }
25653b03a366Sstefano_zampini       }
2566de534f79Sstefano_zampini 
25673b03a366Sstefano_zampini #else  /* on missing GESVD */
25683b03a366Sstefano_zampini       PetscInt min_n = temp_constraints;
25693b03a366Sstefano_zampini       if (min_n > size_of_constraint) min_n = size_of_constraint;
25703b03a366Sstefano_zampini       dummy_int = Bs;
2571670f3ff9SJed Brown       ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
25723b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
25733b03a366Sstefano_zampini       LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,singular_vals,
25743b03a366Sstefano_zampini                    &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,work,&lwork,&lierr);
25753b03a366Sstefano_zampini #else
25763b03a366Sstefano_zampini       LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,singular_vals,
25773b03a366Sstefano_zampini                    &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,work,&lwork,rwork,&lierr);
25783b03a366Sstefano_zampini #endif
25793b03a366Sstefano_zampini       if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SVD Lapack routine %d",(int)lierr);
2580670f3ff9SJed Brown       ierr = PetscFPTrapPop();CHKERRQ(ierr);
25813b03a366Sstefano_zampini       /* retain singular values greater than tol: note that LAPACK GESVD returns singular values in descending order */
25823b03a366Sstefano_zampini       j=0;
25833b03a366Sstefano_zampini       while( j < min_n && singular_vals[min_n-j-1] < tol) j++;
25843b03a366Sstefano_zampini       total_counts = total_counts-(PetscInt)Bt+(min_n-j);
25853b03a366Sstefano_zampini #endif
25863b03a366Sstefano_zampini     }
25873b03a366Sstefano_zampini   }
2588534831adSStefano Zampini 
2589da1bb401SStefano Zampini   n_constraints=total_counts-n_vertices;
2590da1bb401SStefano Zampini   local_primal_size = total_counts;
25913b03a366Sstefano_zampini   /* set quantities in pcbddc data structure */
25923b03a366Sstefano_zampini   pcbddc->n_vertices = n_vertices;
25933b03a366Sstefano_zampini   pcbddc->n_constraints = n_constraints;
2594da1bb401SStefano Zampini   pcbddc->local_primal_size = local_primal_size;
2595534831adSStefano Zampini 
2596534831adSStefano Zampini   /* Create constraint matrix */
2597534831adSStefano Zampini   /* The constraint matrix is used to compute the l2g map of primal dofs */
2598534831adSStefano Zampini   /* so we need to set it up properly either with or without change of basis */
2599534831adSStefano Zampini   ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->ConstraintMatrix);CHKERRQ(ierr);
2600534831adSStefano Zampini   ierr = MatSetType(pcbddc->ConstraintMatrix,impMatType);CHKERRQ(ierr);
2601534831adSStefano Zampini   ierr = MatSetSizes(pcbddc->ConstraintMatrix,local_primal_size,pcis->n,local_primal_size,pcis->n);CHKERRQ(ierr);
2602534831adSStefano Zampini   /* compute a local numbering of constraints : vertices first then constraints */
2603534831adSStefano Zampini   ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
2604534831adSStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array_vector);CHKERRQ(ierr);
2605534831adSStefano Zampini   ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&aux_primal_numbering);CHKERRQ(ierr);
2606534831adSStefano Zampini   ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&aux_primal_permutation);CHKERRQ(ierr);
2607534831adSStefano Zampini   total_counts=0;
2608534831adSStefano Zampini   /* find vertices: subdomain corners plus dofs with basis changed */
2609534831adSStefano Zampini   for (i=0;i<local_primal_size;i++) {
2610534831adSStefano Zampini     size_of_constraint=temp_indices[i+1]-temp_indices[i];
2611534831adSStefano Zampini     if (change_basis[i] || size_of_constraint == 1) {
2612534831adSStefano Zampini       k=0;
2613534831adSStefano Zampini       while(k < size_of_constraint && array_vector[temp_indices_to_constraint[temp_indices[i]+size_of_constraint-k-1]] != 0.0) {
2614534831adSStefano Zampini         k=k+1;
2615534831adSStefano Zampini       }
2616534831adSStefano Zampini       j=temp_indices_to_constraint[temp_indices[i]+size_of_constraint-k-1];
2617534831adSStefano Zampini       array_vector[j] = 1.0;
2618534831adSStefano Zampini       aux_primal_numbering[total_counts]=j;
2619534831adSStefano Zampini       aux_primal_permutation[total_counts]=total_counts;
2620534831adSStefano Zampini       total_counts++;
2621534831adSStefano Zampini     }
2622534831adSStefano Zampini   }
2623534831adSStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array_vector);CHKERRQ(ierr);
2624534831adSStefano Zampini   /* permute indices in order to have a sorted set of vertices */
2625534831adSStefano Zampini   ierr = PetscSortIntWithPermutation(total_counts,aux_primal_numbering,aux_primal_permutation);
2626534831adSStefano Zampini   /* nonzero structure */
2627534831adSStefano Zampini   ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
2628534831adSStefano Zampini   for (i=0;i<total_counts;i++) {
2629534831adSStefano Zampini     nnz[i]=1;
2630534831adSStefano Zampini   }
2631534831adSStefano Zampini   j=total_counts;
2632534831adSStefano Zampini   for (i=n_vertices;i<local_primal_size;i++) {
2633534831adSStefano Zampini     if (!change_basis[i]) {
2634534831adSStefano Zampini       nnz[j]=temp_indices[i+1]-temp_indices[i];
2635534831adSStefano Zampini       j++;
2636534831adSStefano Zampini     }
2637534831adSStefano Zampini   }
2638534831adSStefano Zampini   ierr = MatSeqAIJSetPreallocation(pcbddc->ConstraintMatrix,0,nnz);CHKERRQ(ierr);
2639534831adSStefano Zampini   ierr = PetscFree(nnz);CHKERRQ(ierr);
2640534831adSStefano Zampini   /* set values in constraint matrix */
2641534831adSStefano Zampini   for (i=0;i<total_counts;i++) {
2642534831adSStefano Zampini     j = aux_primal_permutation[i];
2643534831adSStefano Zampini     k = aux_primal_numbering[j];
2644534831adSStefano Zampini     ierr = MatSetValue(pcbddc->ConstraintMatrix,i,k,1.0,INSERT_VALUES);CHKERRQ(ierr);
2645534831adSStefano Zampini   }
2646534831adSStefano Zampini   for (i=n_vertices;i<local_primal_size;i++) {
2647534831adSStefano Zampini     if (!change_basis[i]) {
2648534831adSStefano Zampini       size_of_constraint=temp_indices[i+1]-temp_indices[i];
2649534831adSStefano Zampini       ierr = MatSetValues(pcbddc->ConstraintMatrix,1,&total_counts,size_of_constraint,&temp_indices_to_constraint[temp_indices[i]],&temp_quadrature_constraint[temp_indices[i]],INSERT_VALUES);CHKERRQ(ierr);
2650534831adSStefano Zampini       total_counts++;
2651534831adSStefano Zampini     }
2652534831adSStefano Zampini   }
2653534831adSStefano Zampini   ierr = PetscFree(aux_primal_numbering);CHKERRQ(ierr);
2654534831adSStefano Zampini   ierr = PetscFree(aux_primal_permutation);CHKERRQ(ierr);
2655534831adSStefano Zampini   /* assembling */
2656534831adSStefano Zampini   ierr = MatAssemblyBegin(pcbddc->ConstraintMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2657534831adSStefano Zampini   ierr = MatAssemblyEnd(pcbddc->ConstraintMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2658534831adSStefano Zampini 
2659534831adSStefano Zampini   /* Create matrix for change of basis. We don't need it in case pcbddc->usechangeofbasis is FALSE */
2660534831adSStefano Zampini   if (pcbddc->usechangeofbasis) {
2661534831adSStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr);
2662534831adSStefano Zampini     ierr = MatSetType(pcbddc->ChangeOfBasisMatrix,impMatType);CHKERRQ(ierr);
2663534831adSStefano Zampini     ierr = MatSetSizes(pcbddc->ChangeOfBasisMatrix,pcis->n_B,pcis->n_B,pcis->n_B,pcis->n_B);CHKERRQ(ierr);
2664534831adSStefano Zampini     /* work arrays */
2665534831adSStefano Zampini     /* we need to reuse these arrays, so we free them */
2666534831adSStefano Zampini     ierr = PetscFree(temp_basis);CHKERRQ(ierr);
2667534831adSStefano Zampini     ierr = PetscFree(work);CHKERRQ(ierr);
2668534831adSStefano Zampini     ierr = PetscMalloc(pcis->n_B*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
2669534831adSStefano Zampini     ierr = PetscMalloc((nnsp_addone+nnsp_size)*(nnsp_addone+nnsp_size)*sizeof(PetscScalar),&temp_basis);CHKERRQ(ierr);
2670534831adSStefano Zampini     ierr = PetscMalloc((nnsp_addone+nnsp_size)*sizeof(PetscScalar),&work);CHKERRQ(ierr);
2671534831adSStefano Zampini     ierr = PetscMalloc((nnsp_addone+nnsp_size)*sizeof(PetscBLASInt),&ipiv);CHKERRQ(ierr);
2672534831adSStefano Zampini     for (i=0;i<pcis->n_B;i++) {
2673534831adSStefano Zampini       nnz[i]=1;
2674534831adSStefano Zampini     }
2675534831adSStefano Zampini     /* Overestimated nonzeros per row */
2676534831adSStefano Zampini     k=1;
2677534831adSStefano Zampini     for (i=pcbddc->n_vertices;i<local_primal_size;i++) {
2678534831adSStefano Zampini       if (change_basis[i]) {
2679534831adSStefano Zampini         size_of_constraint = temp_indices[i+1]-temp_indices[i];
2680534831adSStefano Zampini         if (k < size_of_constraint) {
2681534831adSStefano Zampini           k = size_of_constraint;
2682534831adSStefano Zampini         }
2683534831adSStefano Zampini         for (j=0;j<size_of_constraint;j++) {
2684534831adSStefano Zampini           nnz[temp_indices_to_constraint_B[temp_indices[i]+j]] = size_of_constraint;
2685534831adSStefano Zampini         }
2686534831adSStefano Zampini       }
2687534831adSStefano Zampini     }
2688534831adSStefano Zampini     ierr = MatSeqAIJSetPreallocation(pcbddc->ChangeOfBasisMatrix,0,nnz);CHKERRQ(ierr);
2689534831adSStefano Zampini     ierr = PetscFree(nnz);CHKERRQ(ierr);
2690534831adSStefano Zampini     /* Temporary array to store indices */
2691534831adSStefano Zampini     ierr = PetscMalloc(k*sizeof(PetscInt),&is_indices);CHKERRQ(ierr);
2692534831adSStefano Zampini     /* Set initial identity in the matrix */
2693534831adSStefano Zampini     for (i=0;i<pcis->n_B;i++) {
2694534831adSStefano Zampini       ierr = MatSetValue(pcbddc->ChangeOfBasisMatrix,i,i,1.0,INSERT_VALUES);CHKERRQ(ierr);
2695534831adSStefano Zampini     }
2696534831adSStefano Zampini     /* Now we loop on the constraints which need a change of basis */
2697534831adSStefano Zampini     /* Change of basis matrix is evaluated as the FIRST APPROACH in */
2698534831adSStefano Zampini     /* Klawonn and Widlund, Dual-primal FETI-DP methods for linear elasticity, (6.2.1) */
2699534831adSStefano Zampini     temp_constraints = 0;
270093dc3b60SStefano Zampini     if (pcbddc->n_vertices < local_primal_size) {
2701534831adSStefano Zampini       temp_start_ptr = temp_indices_to_constraint_B[temp_indices[pcbddc->n_vertices]];
270293dc3b60SStefano Zampini     }
2703534831adSStefano Zampini     for (i=pcbddc->n_vertices;i<local_primal_size;i++) {
2704534831adSStefano Zampini       if (change_basis[i]) {
2705534831adSStefano Zampini         compute_submatrix = PETSC_FALSE;
2706534831adSStefano Zampini         useksp = PETSC_FALSE;
2707534831adSStefano Zampini         if (temp_start_ptr == temp_indices_to_constraint_B[temp_indices[i]]) {
2708534831adSStefano Zampini           temp_constraints++;
270904eaf177SStefano Zampini           if (i == local_primal_size -1 ||  temp_start_ptr != temp_indices_to_constraint_B[temp_indices[i+1]]) {
2710534831adSStefano Zampini             compute_submatrix = PETSC_TRUE;
2711534831adSStefano Zampini           }
2712534831adSStefano Zampini         }
2713534831adSStefano Zampini         if (compute_submatrix) {
2714534831adSStefano Zampini           if (temp_constraints > 1 || pcbddc->use_nnsp_true) {
2715534831adSStefano Zampini             useksp = PETSC_TRUE;
2716534831adSStefano Zampini           }
2717534831adSStefano Zampini           size_of_constraint = temp_indices[i+1]-temp_indices[i];
2718534831adSStefano Zampini           if (useksp) { /* experimental */
2719534831adSStefano Zampini             ierr = MatCreate(PETSC_COMM_SELF,&temp_mat);CHKERRQ(ierr);
2720534831adSStefano Zampini             ierr = MatSetType(temp_mat,impMatType);CHKERRQ(ierr);
2721534831adSStefano Zampini             ierr = MatSetSizes(temp_mat,size_of_constraint,size_of_constraint,size_of_constraint,size_of_constraint);CHKERRQ(ierr);
2722534831adSStefano Zampini             ierr = MatSeqAIJSetPreallocation(temp_mat,size_of_constraint,PETSC_NULL);CHKERRQ(ierr);
2723534831adSStefano Zampini           }
2724534831adSStefano Zampini           /* First _size_of_constraint-temp_constraints_ columns */
2725534831adSStefano Zampini           dual_dofs = size_of_constraint-temp_constraints;
2726534831adSStefano Zampini           start_constraint = i+1-temp_constraints;
2727534831adSStefano Zampini           for (s=0;s<dual_dofs;s++) {
2728534831adSStefano Zampini             is_indices[0] = s;
2729534831adSStefano Zampini             for (j=0;j<temp_constraints;j++) {
2730534831adSStefano Zampini               for (k=0;k<temp_constraints;k++) {
2731534831adSStefano Zampini                 temp_basis[j*temp_constraints+k]=temp_quadrature_constraint[temp_indices[start_constraint+k]+s+j+1];
2732534831adSStefano Zampini               }
2733534831adSStefano Zampini               work[j]=-temp_quadrature_constraint[temp_indices[start_constraint+j]+s];
2734534831adSStefano Zampini               is_indices[j+1]=s+j+1;
2735534831adSStefano Zampini             }
2736534831adSStefano Zampini             Bt = temp_constraints;
2737534831adSStefano Zampini             ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
2738534831adSStefano Zampini             LAPACKgesv_(&Bt,&Bone,temp_basis,&Bt,ipiv,work,&Bt,&lierr);
2739534831adSStefano Zampini             if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GESV Lapack routine %d",(int)lierr);
2740534831adSStefano Zampini             ierr = PetscFPTrapPop();CHKERRQ(ierr);
2741534831adSStefano Zampini             j = temp_indices_to_constraint_B[temp_indices[start_constraint]+s];
2742534831adSStefano Zampini             ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,temp_constraints,&temp_indices_to_constraint_B[temp_indices[start_constraint]+s+1],1,&j,work,INSERT_VALUES);CHKERRQ(ierr);
2743534831adSStefano Zampini             if (useksp) {
2744534831adSStefano Zampini               /* temp mat with transposed rows and columns */
2745534831adSStefano Zampini               ierr = MatSetValues(temp_mat,1,&s,temp_constraints,&is_indices[1],work,INSERT_VALUES);CHKERRQ(ierr);
2746534831adSStefano Zampini               ierr = MatSetValue(temp_mat,is_indices[0],is_indices[0],1.0,INSERT_VALUES);CHKERRQ(ierr);
2747534831adSStefano Zampini             }
2748534831adSStefano Zampini           }
2749534831adSStefano Zampini           if (useksp) {
2750534831adSStefano Zampini             /* last rows of temp_mat */
2751534831adSStefano Zampini             for (j=0;j<size_of_constraint;j++) {
2752534831adSStefano Zampini               is_indices[j] = j;
2753534831adSStefano Zampini             }
2754534831adSStefano Zampini             for (s=0;s<temp_constraints;s++) {
2755534831adSStefano Zampini               k = s + dual_dofs;
2756534831adSStefano Zampini               ierr = MatSetValues(temp_mat,1,&k,size_of_constraint,is_indices,&temp_quadrature_constraint[temp_indices[start_constraint+s]],INSERT_VALUES);CHKERRQ(ierr);
2757534831adSStefano Zampini             }
2758534831adSStefano Zampini             ierr = MatAssemblyBegin(temp_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2759534831adSStefano Zampini             ierr = MatAssemblyEnd(temp_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2760534831adSStefano Zampini             ierr = MatGetVecs(temp_mat,&temp_vec,PETSC_NULL);CHKERRQ(ierr);
2761534831adSStefano Zampini             ierr = KSPCreate(PETSC_COMM_SELF,&temp_ksp);CHKERRQ(ierr);
2762534831adSStefano Zampini             ierr = KSPSetOperators(temp_ksp,temp_mat,temp_mat,SAME_PRECONDITIONER);CHKERRQ(ierr);
2763534831adSStefano Zampini             ierr = KSPSetType(temp_ksp,KSPPREONLY);CHKERRQ(ierr);
2764ffe5efe1SStefano Zampini             ierr = KSPGetPC(temp_ksp,&temp_pc);CHKERRQ(ierr);
2765ffe5efe1SStefano Zampini             ierr = PCSetType(temp_pc,PCLU);CHKERRQ(ierr);
2766534831adSStefano Zampini             ierr = KSPSetUp(temp_ksp);CHKERRQ(ierr);
2767534831adSStefano Zampini             for (s=0;s<temp_constraints;s++) {
2768534831adSStefano Zampini               ierr = VecSet(temp_vec,0.0);CHKERRQ(ierr);
2769534831adSStefano Zampini               ierr = VecSetValue(temp_vec,s+dual_dofs,1.0,INSERT_VALUES);CHKERRQ(ierr);
2770534831adSStefano Zampini               ierr = VecAssemblyBegin(temp_vec);CHKERRQ(ierr);
2771534831adSStefano Zampini               ierr = VecAssemblyEnd(temp_vec);CHKERRQ(ierr);
2772534831adSStefano Zampini               ierr = KSPSolve(temp_ksp,temp_vec,temp_vec);CHKERRQ(ierr);
2773534831adSStefano Zampini               ierr = VecGetArray(temp_vec,&array_vector);CHKERRQ(ierr);
2774534831adSStefano Zampini               j = temp_indices_to_constraint_B[temp_indices[start_constraint+s]+size_of_constraint-s-1];
2775534831adSStefano Zampini               /* last columns of change of basis matrix associated to new primal dofs */
2776534831adSStefano Zampini               ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,size_of_constraint,&temp_indices_to_constraint_B[temp_indices[start_constraint+s]],1,&j,array_vector,INSERT_VALUES);CHKERRQ(ierr);
2777534831adSStefano Zampini               ierr = VecRestoreArray(temp_vec,&array_vector);CHKERRQ(ierr);
2778534831adSStefano Zampini             }
2779534831adSStefano Zampini             ierr = MatDestroy(&temp_mat);CHKERRQ(ierr);
2780534831adSStefano Zampini             ierr = KSPDestroy(&temp_ksp);CHKERRQ(ierr);
2781534831adSStefano Zampini             ierr = VecDestroy(&temp_vec);CHKERRQ(ierr);
2782534831adSStefano Zampini           } else {
2783534831adSStefano Zampini             /* last columns of change of basis matrix associated to new primal dofs */
2784534831adSStefano Zampini             for (s=0;s<temp_constraints;s++) {
2785534831adSStefano Zampini               j = temp_indices_to_constraint_B[temp_indices[start_constraint+s]+size_of_constraint-s-1];
2786534831adSStefano Zampini               ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,size_of_constraint,&temp_indices_to_constraint_B[temp_indices[start_constraint+s]],1,&j,&temp_quadrature_constraint[temp_indices[start_constraint+s]],INSERT_VALUES);CHKERRQ(ierr);
2787534831adSStefano Zampini             }
2788534831adSStefano Zampini           }
2789534831adSStefano Zampini           /* prepare for the next cycle */
2790534831adSStefano Zampini           temp_constraints = 0;
279104eaf177SStefano Zampini           if (i != local_primal_size -1 ) {
2792534831adSStefano Zampini             temp_start_ptr = temp_indices_to_constraint_B[temp_indices[i+1]];
2793534831adSStefano Zampini           }
2794534831adSStefano Zampini         }
2795534831adSStefano Zampini       }
279604eaf177SStefano Zampini     }
2797534831adSStefano Zampini     /* assembling */
2798534831adSStefano Zampini     ierr = MatAssemblyBegin(pcbddc->ChangeOfBasisMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2799534831adSStefano Zampini     ierr = MatAssemblyEnd(pcbddc->ChangeOfBasisMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2800534831adSStefano Zampini     ierr = PetscFree(ipiv);CHKERRQ(ierr);
2801534831adSStefano Zampini     ierr = PetscFree(is_indices);CHKERRQ(ierr);
2802534831adSStefano Zampini   }
28033b03a366Sstefano_zampini   /* free workspace no longer needed */
28043b03a366Sstefano_zampini   ierr = PetscFree(rwork);CHKERRQ(ierr);
28053b03a366Sstefano_zampini   ierr = PetscFree(work);CHKERRQ(ierr);
28063b03a366Sstefano_zampini   ierr = PetscFree(temp_basis);CHKERRQ(ierr);
28073b03a366Sstefano_zampini   ierr = PetscFree(singular_vals);CHKERRQ(ierr);
28083b03a366Sstefano_zampini   ierr = PetscFree(correlation_mat);CHKERRQ(ierr);
28093b03a366Sstefano_zampini   ierr = PetscFree(temp_indices);CHKERRQ(ierr);
2810534831adSStefano Zampini   ierr = PetscFree(change_basis);CHKERRQ(ierr);
28113b03a366Sstefano_zampini   ierr = PetscFree(temp_indices_to_constraint);CHKERRQ(ierr);
2812534831adSStefano Zampini   ierr = PetscFree(temp_indices_to_constraint_B);CHKERRQ(ierr);
2813534831adSStefano Zampini   ierr = PetscFree(local_to_B);CHKERRQ(ierr);
28143b03a366Sstefano_zampini   ierr = PetscFree(temp_quadrature_constraint);CHKERRQ(ierr);
28153425bc38SStefano Zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
28163425bc38SStefano Zampini   ierr = PetscFree(iwork);CHKERRQ(ierr);
28173425bc38SStefano Zampini   ierr = PetscFree(ifail);CHKERRQ(ierr);
28183425bc38SStefano Zampini   ierr = PetscFree(singular_vectors);CHKERRQ(ierr);
28193425bc38SStefano Zampini #endif
2820da1bb401SStefano Zampini   for (k=0;k<nnsp_size;k++) {
2821da1bb401SStefano Zampini     ierr = VecDestroy(&localnearnullsp[k]);CHKERRQ(ierr);
2822da1bb401SStefano Zampini   }
28233b03a366Sstefano_zampini   ierr = PetscFree(localnearnullsp);CHKERRQ(ierr);
28243b03a366Sstefano_zampini   PetscFunctionReturn(0);
28253b03a366Sstefano_zampini }
28263b03a366Sstefano_zampini /* -------------------------------------------------------------------------- */
28270c7d97c5SJed Brown #undef __FUNCT__
28280c7d97c5SJed Brown #define __FUNCT__ "PCBDDCCoarseSetUp"
282953cdbc3dSStefano Zampini static PetscErrorCode PCBDDCCoarseSetUp(PC pc)
28300c7d97c5SJed Brown {
28310c7d97c5SJed Brown   PetscErrorCode  ierr;
28320c7d97c5SJed Brown 
28330c7d97c5SJed Brown   PC_IS*            pcis = (PC_IS*)(pc->data);
28340c7d97c5SJed Brown   PC_BDDC*          pcbddc = (PC_BDDC*)pc->data;
28350c7d97c5SJed Brown   Mat_IS            *matis = (Mat_IS*)pc->pmat->data;
2836534831adSStefano Zampini   Mat               change_mat_all;
28370c7d97c5SJed Brown   IS                is_R_local;
28380c7d97c5SJed Brown   IS                is_V_local;
28390c7d97c5SJed Brown   IS                is_C_local;
28400c7d97c5SJed Brown   IS                is_aux1;
28410c7d97c5SJed Brown   IS                is_aux2;
28420c7d97c5SJed Brown   const VecType     impVecType;
28430c7d97c5SJed Brown   const MatType     impMatType;
28440c7d97c5SJed Brown   PetscInt          n_R=0;
28450c7d97c5SJed Brown   PetscInt          n_D=0;
28460c7d97c5SJed Brown   PetscInt          n_B=0;
28470c7d97c5SJed Brown   PetscScalar       zero=0.0;
28480c7d97c5SJed Brown   PetscScalar       one=1.0;
28490c7d97c5SJed Brown   PetscScalar       m_one=-1.0;
28500c7d97c5SJed Brown   PetscScalar*      array;
28510c7d97c5SJed Brown   PetscScalar       *coarse_submat_vals;
28520c7d97c5SJed Brown   PetscInt          *idx_R_local;
28530c7d97c5SJed Brown   PetscInt          *idx_V_B;
28540c7d97c5SJed Brown   PetscScalar       *coarsefunctions_errors;
28550c7d97c5SJed Brown   PetscScalar       *constraints_errors;
28560c7d97c5SJed Brown   /* auxiliary indices */
2857534831adSStefano Zampini   PetscInt i,j,k;
2858e269702eSStefano Zampini   /* for verbose output of bddc */
2859e269702eSStefano Zampini   PetscViewer       viewer=pcbddc->dbg_viewer;
2860e269702eSStefano Zampini   PetscBool         dbg_flag=pcbddc->dbg_flag;
2861a0ba757dSStefano Zampini   /* for counting coarse dofs */
2862534831adSStefano Zampini   PetscInt          n_vertices,n_constraints;
28633b03a366Sstefano_zampini   PetscInt          size_of_constraint;
28643b03a366Sstefano_zampini   PetscInt          *row_cmat_indices;
28653b03a366Sstefano_zampini   PetscScalar       *row_cmat_values;
2866534831adSStefano Zampini   PetscInt          *vertices,*nnz,*is_indices,*temp_indices;
28670c7d97c5SJed Brown 
28680c7d97c5SJed Brown   PetscFunctionBegin;
28690c7d97c5SJed Brown   /* Set Non-overlapping dimensions */
28700c7d97c5SJed Brown   n_B = pcis->n_B; n_D = pcis->n - n_B;
2871534831adSStefano Zampini   /* Set types for local objects needed by BDDC preconditioner */
2872534831adSStefano Zampini   impMatType = MATSEQDENSE;
2873534831adSStefano Zampini   impVecType = VECSEQ;
2874da1bb401SStefano Zampini   /* get vertex indices from constraint matrix */
2875534831adSStefano Zampini   ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscInt),&vertices);CHKERRQ(ierr);
2876534831adSStefano Zampini   n_vertices=0;
2877da1bb401SStefano Zampini   for (i=0;i<pcbddc->local_primal_size;i++) {
2878da1bb401SStefano Zampini     ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
2879da1bb401SStefano Zampini     if (size_of_constraint == 1) {
2880534831adSStefano Zampini       vertices[n_vertices]=row_cmat_indices[0];
2881534831adSStefano Zampini       n_vertices++;
2882a0ba757dSStefano Zampini     }
2883da1bb401SStefano Zampini     ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
2884a0ba757dSStefano Zampini   }
2885534831adSStefano Zampini   /* Set number of constraints */
2886534831adSStefano Zampini   n_constraints = pcbddc->local_primal_size-n_vertices;
2887534831adSStefano Zampini 
2888534831adSStefano Zampini   /* vertices in boundary numbering */
2889534831adSStefano Zampini   if (n_vertices) {
2890534831adSStefano Zampini     ierr = VecSet(pcis->vec1_N,m_one);CHKERRQ(ierr);
2891534831adSStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2892534831adSStefano Zampini     for (i=0; i<n_vertices; i++) { array[ vertices[i] ] = i; }
2893534831adSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2894534831adSStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
2895534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
2896534831adSStefano Zampini     ierr = PetscMalloc(n_vertices*sizeof(PetscInt),&idx_V_B);CHKERRQ(ierr);
2897534831adSStefano Zampini     ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
2898534831adSStefano Zampini     for (i=0; i<n_vertices; i++) {
2899534831adSStefano Zampini       j=0;
2900534831adSStefano Zampini       while (array[j] != i ) {j++;}
2901534831adSStefano Zampini       idx_V_B[i]=j;
2902534831adSStefano Zampini     }
2903534831adSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
2904534831adSStefano Zampini   }
2905534831adSStefano Zampini 
2906534831adSStefano Zampini   /* transform local matrices if needed */
2907534831adSStefano Zampini   if (pcbddc->usechangeofbasis) {
2908534831adSStefano Zampini     ierr = PetscMalloc(pcis->n*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
2909534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2910534831adSStefano Zampini     for (i=0;i<n_D;i++) {
2911534831adSStefano Zampini       nnz[is_indices[i]]=1;
2912534831adSStefano Zampini     }
2913534831adSStefano Zampini     ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2914534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2915534831adSStefano Zampini     k=1;
2916534831adSStefano Zampini     for (i=0;i<n_B;i++) {
2917534831adSStefano Zampini       ierr = MatGetRow(pcbddc->ChangeOfBasisMatrix,i,&j,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr);
2918534831adSStefano Zampini       nnz[is_indices[i]]=j;
2919534831adSStefano Zampini       if ( k < j) {
2920534831adSStefano Zampini         k = j;
2921534831adSStefano Zampini       }
2922534831adSStefano Zampini       ierr = MatRestoreRow(pcbddc->ChangeOfBasisMatrix,i,&j,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr);
2923534831adSStefano Zampini     }
2924534831adSStefano Zampini     ierr = ISRestoreIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2925534831adSStefano Zampini     /* assemble change of basis matrix on the whole set of local dofs */
2926534831adSStefano Zampini     ierr = PetscMalloc(k*sizeof(PetscInt),&temp_indices);CHKERRQ(ierr);
2927534831adSStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&change_mat_all);CHKERRQ(ierr);
2928534831adSStefano Zampini     ierr = MatSetSizes(change_mat_all,pcis->n,pcis->n,pcis->n,pcis->n);CHKERRQ(ierr);
2929534831adSStefano Zampini     ierr = MatSetType(change_mat_all,MATSEQAIJ);CHKERRQ(ierr);
2930534831adSStefano Zampini     ierr = MatSeqAIJSetPreallocation(change_mat_all,0,nnz);CHKERRQ(ierr);
2931534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2932534831adSStefano Zampini     for (i=0;i<n_D;i++) {
2933534831adSStefano Zampini       ierr = MatSetValue(change_mat_all,is_indices[i],is_indices[i],1.0,INSERT_VALUES);CHKERRQ(ierr);
2934534831adSStefano Zampini     }
2935534831adSStefano Zampini     ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2936534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2937534831adSStefano Zampini     for (i=0;i<n_B;i++) {
2938534831adSStefano Zampini       ierr = MatGetRow(pcbddc->ChangeOfBasisMatrix,i,&j,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
2939534831adSStefano Zampini       for (k=0;k<j;k++) {
2940534831adSStefano Zampini         temp_indices[k]=is_indices[row_cmat_indices[k]];
2941534831adSStefano Zampini       }
2942534831adSStefano Zampini       ierr = MatSetValues(change_mat_all,1,&is_indices[i],j,temp_indices,row_cmat_values,INSERT_VALUES);CHKERRQ(ierr);
2943534831adSStefano Zampini       ierr = MatRestoreRow(pcbddc->ChangeOfBasisMatrix,i,&j,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
2944534831adSStefano Zampini     }
2945534831adSStefano Zampini     ierr = MatAssemblyBegin(change_mat_all,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2946534831adSStefano Zampini     ierr = MatAssemblyEnd(change_mat_all,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2947534831adSStefano Zampini     ierr = MatPtAP(matis->A,change_mat_all,MAT_INITIAL_MATRIX,1.0,&pcbddc->local_mat);CHKERRQ(ierr);
2948534831adSStefano Zampini     ierr = MatDestroy(&pcis->A_IB);CHKERRQ(ierr);
2949534831adSStefano Zampini     ierr = MatDestroy(&pcis->A_BI);CHKERRQ(ierr);
2950534831adSStefano Zampini     ierr = MatDestroy(&pcis->A_BB);CHKERRQ(ierr);
2951534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_I_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&pcis->A_IB);CHKERRQ(ierr);
2952534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_B_local,pcis->is_I_local,MAT_INITIAL_MATRIX,&pcis->A_BI);CHKERRQ(ierr);
2953534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_B_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&pcis->A_BB);CHKERRQ(ierr);
2954534831adSStefano Zampini     ierr = MatDestroy(&change_mat_all);CHKERRQ(ierr);
2955534831adSStefano Zampini     ierr = PetscFree(nnz);CHKERRQ(ierr);
2956534831adSStefano Zampini     ierr = PetscFree(temp_indices);CHKERRQ(ierr);
2957534831adSStefano Zampini   } else {
2958534831adSStefano Zampini     /* without change of basis, the local matrix is unchanged */
2959534831adSStefano Zampini     ierr = PetscObjectReference((PetscObject)matis->A);CHKERRQ(ierr);
2960534831adSStefano Zampini     pcbddc->local_mat = matis->A;
2961534831adSStefano Zampini   }
29620bdf917eSStefano Zampini   /* Change global null space passed in by the user if change of basis has been performed */
29630bdf917eSStefano Zampini   if (pcbddc->NullSpace && pcbddc->usechangeofbasis) {
29640bdf917eSStefano Zampini     ierr = PCBDDCAdaptNullSpace(pc);CHKERRQ(ierr);
29650bdf917eSStefano Zampini   }
2966a0ba757dSStefano Zampini 
29670c7d97c5SJed Brown   /* Dohrmann's notation: dofs split into R (Remaining: all dofs but the vertices) and V (Vertices) */
29680c7d97c5SJed Brown   ierr = VecSet(pcis->vec1_N,one);CHKERRQ(ierr);
29690c7d97c5SJed Brown   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
29703b03a366Sstefano_zampini   for (i=0;i<n_vertices;i++) { array[ vertices[i] ] = zero; }
29713b03a366Sstefano_zampini   ierr = PetscMalloc(( pcis->n - n_vertices )*sizeof(PetscInt),&idx_R_local);CHKERRQ(ierr);
29720c7d97c5SJed Brown   for (i=0, n_R=0; i<pcis->n; i++) { if (array[i] == one) { idx_R_local[n_R] = i; n_R++; } }
29730c7d97c5SJed Brown   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2974e269702eSStefano Zampini   if (dbg_flag) {
29750c7d97c5SJed Brown     ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
29760c7d97c5SJed Brown     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
29770c7d97c5SJed Brown     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d local dimensions\n",PetscGlobalRank);CHKERRQ(ierr);
29780c7d97c5SJed Brown     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local_size = %d, dirichlet_size = %d, boundary_size = %d\n",pcis->n,n_D,n_B);CHKERRQ(ierr);
29793b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"r_size = %d, v_size = %d, constraints = %d, local_primal_size = %d\n",n_R,n_vertices,n_constraints,pcbddc->local_primal_size);CHKERRQ(ierr);
2980534831adSStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"pcbddc->n_vertices = %d, pcbddc->n_constraints = %d\n",pcbddc->n_vertices,pcbddc->n_constraints);CHKERRQ(ierr);
29810c7d97c5SJed Brown     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
29820c7d97c5SJed Brown   }
2983534831adSStefano Zampini 
29840c7d97c5SJed Brown   /* Allocate needed vectors */
2985534831adSStefano Zampini   ierr = VecDuplicate(pcis->vec1_global,&pcbddc->original_rhs);CHKERRQ(ierr);
29863972b0daSStefano Zampini   ierr = VecDuplicate(pcis->vec1_global,&pcbddc->temp_solution);CHKERRQ(ierr);
29870c7d97c5SJed Brown   ierr = VecDuplicate(pcis->vec1_D,&pcbddc->vec4_D);CHKERRQ(ierr);
29880c7d97c5SJed Brown   ierr = VecCreate(PETSC_COMM_SELF,&pcbddc->vec1_R);CHKERRQ(ierr);
29890c7d97c5SJed Brown   ierr = VecSetSizes(pcbddc->vec1_R,n_R,n_R);CHKERRQ(ierr);
29900c7d97c5SJed Brown   ierr = VecSetType(pcbddc->vec1_R,impVecType);CHKERRQ(ierr);
2991d49ef151SStefano Zampini   ierr = VecDuplicate(pcbddc->vec1_R,&pcbddc->vec2_R);CHKERRQ(ierr);
29920c7d97c5SJed Brown   ierr = VecCreate(PETSC_COMM_SELF,&pcbddc->vec1_P);CHKERRQ(ierr);
29930c7d97c5SJed Brown   ierr = VecSetSizes(pcbddc->vec1_P,pcbddc->local_primal_size,pcbddc->local_primal_size);CHKERRQ(ierr);
29940c7d97c5SJed Brown   ierr = VecSetType(pcbddc->vec1_P,impVecType);CHKERRQ(ierr);
29950c7d97c5SJed Brown 
29960c7d97c5SJed Brown   /* Creating some index sets needed  */
29970c7d97c5SJed Brown   /* For submatrices */
2998da1bb401SStefano Zampini   ierr = ISCreateGeneral(PETSC_COMM_SELF,n_R,idx_R_local,PETSC_OWN_POINTER,&is_R_local);CHKERRQ(ierr);
29993b03a366Sstefano_zampini   if (n_vertices)    {
3000da1bb401SStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,n_vertices,vertices,PETSC_OWN_POINTER,&is_V_local);CHKERRQ(ierr);
30013b03a366Sstefano_zampini   }
3002da1bb401SStefano Zampini   if (n_constraints) {
3003da1bb401SStefano Zampini     ierr = ISCreateStride(PETSC_COMM_SELF,n_constraints,n_vertices,1,&is_C_local);CHKERRQ(ierr);
3004da1bb401SStefano Zampini   }
3005da1bb401SStefano Zampini 
30060c7d97c5SJed Brown   /* For VecScatters pcbddc->R_to_B and (optionally) pcbddc->R_to_D */
30070c7d97c5SJed Brown   {
30080c7d97c5SJed Brown     PetscInt   *aux_array1;
30090c7d97c5SJed Brown     PetscInt   *aux_array2;
30100c7d97c5SJed Brown 
30113b03a366Sstefano_zampini     ierr = PetscMalloc( (pcis->n_B-n_vertices)*sizeof(PetscInt),&aux_array1);CHKERRQ(ierr);
30123b03a366Sstefano_zampini     ierr = PetscMalloc( (pcis->n_B-n_vertices)*sizeof(PetscInt),&aux_array2);CHKERRQ(ierr);
30130c7d97c5SJed Brown 
3014d49ef151SStefano Zampini     ierr = VecSet(pcis->vec1_global,zero);CHKERRQ(ierr);
30150c7d97c5SJed Brown     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
30160c7d97c5SJed Brown     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
30170c7d97c5SJed Brown     ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
30180c7d97c5SJed Brown     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
30190c7d97c5SJed Brown     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
30200c7d97c5SJed Brown     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
30210c7d97c5SJed Brown     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3022da1bb401SStefano Zampini     for (i=0, j=0; i<n_R; i++) { if ( array[idx_R_local[i]] > one ) { aux_array1[j] = i; j++; } }
30230c7d97c5SJed Brown     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3024da1bb401SStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_COPY_VALUES,&is_aux1);CHKERRQ(ierr);
30250c7d97c5SJed Brown     ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
3026da1bb401SStefano Zampini     for (i=0, j=0; i<n_B; i++) { if ( array[i] > one ) { aux_array2[j] = i; j++; } }
30273828260eSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
3028da1bb401SStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array2,PETSC_COPY_VALUES,&is_aux2);CHKERRQ(ierr);
30290c7d97c5SJed Brown     ierr = VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_B,is_aux2,&pcbddc->R_to_B);CHKERRQ(ierr);
30300c7d97c5SJed Brown     ierr = PetscFree(aux_array1);CHKERRQ(ierr);
30310c7d97c5SJed Brown     ierr = PetscFree(aux_array2);CHKERRQ(ierr);
30320c7d97c5SJed Brown     ierr = ISDestroy(&is_aux1);CHKERRQ(ierr);
30330c7d97c5SJed Brown     ierr = ISDestroy(&is_aux2);CHKERRQ(ierr);
30340c7d97c5SJed Brown 
3035e269702eSStefano Zampini     if (pcbddc->prec_type || dbg_flag ) {
30360c7d97c5SJed Brown       ierr = PetscMalloc(n_D*sizeof(PetscInt),&aux_array1);CHKERRQ(ierr);
30370c7d97c5SJed Brown       ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3038da1bb401SStefano Zampini       for (i=0, j=0; i<n_R; i++) { if (array[idx_R_local[i]] == one) { aux_array1[j] = i; j++; } }
30390c7d97c5SJed Brown       ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3040da1bb401SStefano Zampini       ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_COPY_VALUES,&is_aux1);CHKERRQ(ierr);
30410c7d97c5SJed Brown       ierr = VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_D,(IS)0,&pcbddc->R_to_D);CHKERRQ(ierr);
30420c7d97c5SJed Brown       ierr = PetscFree(aux_array1);CHKERRQ(ierr);
30430c7d97c5SJed Brown       ierr = ISDestroy(&is_aux1);CHKERRQ(ierr);
30440c7d97c5SJed Brown     }
30450c7d97c5SJed Brown   }
30460c7d97c5SJed Brown 
30470c7d97c5SJed Brown   /* Creating PC contexts for local Dirichlet and Neumann problems */
30480c7d97c5SJed Brown   {
30490c7d97c5SJed Brown     Mat  A_RR;
305053cdbc3dSStefano Zampini     PC   pc_temp;
30510c7d97c5SJed Brown     /* Matrix for Dirichlet problem is A_II -> we already have it from pcis.c code */
305253cdbc3dSStefano Zampini     ierr = KSPCreate(PETSC_COMM_SELF,&pcbddc->ksp_D);CHKERRQ(ierr);
305353cdbc3dSStefano Zampini     ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->ksp_D,(PetscObject)pc,1);CHKERRQ(ierr);
305453cdbc3dSStefano Zampini     ierr = KSPSetOperators(pcbddc->ksp_D,pcis->A_II,pcis->A_II,SAME_PRECONDITIONER);CHKERRQ(ierr);
305553cdbc3dSStefano Zampini     ierr = KSPSetType(pcbddc->ksp_D,KSPPREONLY);CHKERRQ(ierr);
3056da1bb401SStefano Zampini     ierr = KSPSetOptionsPrefix(pcbddc->ksp_D,"dirichlet_");CHKERRQ(ierr);
30570c7d97c5SJed Brown     /* default */
305853cdbc3dSStefano Zampini     ierr = KSPGetPC(pcbddc->ksp_D,&pc_temp);CHKERRQ(ierr);
305953cdbc3dSStefano Zampini     ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr);
30600c7d97c5SJed Brown     /* Allow user's customization */
306153cdbc3dSStefano Zampini     ierr = KSPSetFromOptions(pcbddc->ksp_D);CHKERRQ(ierr);
306253cdbc3dSStefano Zampini     /* Set Up KSP for Dirichlet problem of BDDC */
306353cdbc3dSStefano Zampini     ierr = KSPSetUp(pcbddc->ksp_D);CHKERRQ(ierr);
30643972b0daSStefano Zampini     /* set ksp_D into pcis data */
30653972b0daSStefano Zampini     ierr = KSPDestroy(&pcis->ksp_D);CHKERRQ(ierr);
30663972b0daSStefano Zampini     ierr = PetscObjectReference((PetscObject)pcbddc->ksp_D);CHKERRQ(ierr);
30673972b0daSStefano Zampini     pcis->ksp_D = pcbddc->ksp_D;
30680c7d97c5SJed Brown     /* Matrix for Neumann problem is A_RR -> we need to create it */
3069534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,is_R_local,is_R_local,MAT_INITIAL_MATRIX,&A_RR);CHKERRQ(ierr);
307053cdbc3dSStefano Zampini     ierr = KSPCreate(PETSC_COMM_SELF,&pcbddc->ksp_R);CHKERRQ(ierr);
307153cdbc3dSStefano Zampini     ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->ksp_R,(PetscObject)pc,1);CHKERRQ(ierr);
307253cdbc3dSStefano Zampini     ierr = KSPSetOperators(pcbddc->ksp_R,A_RR,A_RR,SAME_PRECONDITIONER);CHKERRQ(ierr);
307353cdbc3dSStefano Zampini     ierr = KSPSetType(pcbddc->ksp_R,KSPPREONLY);CHKERRQ(ierr);
3074da1bb401SStefano Zampini     ierr = KSPSetOptionsPrefix(pcbddc->ksp_R,"neumann_");CHKERRQ(ierr);
30750c7d97c5SJed Brown     /* default */
307653cdbc3dSStefano Zampini     ierr = KSPGetPC(pcbddc->ksp_R,&pc_temp);CHKERRQ(ierr);
307753cdbc3dSStefano Zampini     ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr);
30780c7d97c5SJed Brown     /* Allow user's customization */
307953cdbc3dSStefano Zampini     ierr = KSPSetFromOptions(pcbddc->ksp_R);CHKERRQ(ierr);
308053cdbc3dSStefano Zampini     /* Set Up KSP for Neumann problem of BDDC */
308153cdbc3dSStefano Zampini     ierr = KSPSetUp(pcbddc->ksp_R);CHKERRQ(ierr);
3082a0ba757dSStefano Zampini     /* check Dirichlet and Neumann solvers */
3083b76ba322SStefano Zampini     {
30840c7d97c5SJed Brown       Vec         temp_vec;
3085b76ba322SStefano Zampini       PetscReal   value;
3086b76ba322SStefano Zampini       PetscMPIInt use_exact,use_exact_reduced;
30870c7d97c5SJed Brown 
3088a0ba757dSStefano Zampini       ierr = VecDuplicate(pcis->vec1_D,&temp_vec);CHKERRQ(ierr);
3089a0ba757dSStefano Zampini       ierr = VecSetRandom(pcis->vec1_D,PETSC_NULL);CHKERRQ(ierr);
3090a0ba757dSStefano Zampini       ierr = MatMult(pcis->A_II,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
3091a0ba757dSStefano Zampini       ierr = KSPSolve(pcbddc->ksp_D,pcis->vec2_D,temp_vec);CHKERRQ(ierr);
3092a0ba757dSStefano Zampini       ierr = VecAXPY(temp_vec,m_one,pcis->vec1_D);CHKERRQ(ierr);
3093a0ba757dSStefano Zampini       ierr = VecNorm(temp_vec,NORM_INFINITY,&value);CHKERRQ(ierr);
3094b76ba322SStefano Zampini       use_exact = 1;
3095b76ba322SStefano Zampini       if (PetscAbsReal(value) > 1.e-4) {
3096b76ba322SStefano Zampini         use_exact = 0;
3097b76ba322SStefano Zampini       }
3098b76ba322SStefano Zampini       ierr = MPI_Allreduce(&use_exact,&use_exact_reduced,1,MPIU_INT,MPI_LAND,((PetscObject)pc)->comm);CHKERRQ(ierr);
3099b76ba322SStefano Zampini       pcbddc->use_exact_dirichlet = (PetscBool) use_exact_reduced;
3100a0ba757dSStefano Zampini       ierr = VecDestroy(&temp_vec);CHKERRQ(ierr);
3101b76ba322SStefano Zampini       if (dbg_flag) {
3102a0ba757dSStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
3103a0ba757dSStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
3104a0ba757dSStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"Checking solution of Dirichlet and Neumann problems\n");CHKERRQ(ierr);
3105a0ba757dSStefano Zampini         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d infinity error for Dirichlet solve = % 1.14e \n",PetscGlobalRank,value);CHKERRQ(ierr);
3106d49ef151SStefano Zampini         ierr = VecDuplicate(pcbddc->vec1_R,&temp_vec);CHKERRQ(ierr);
3107d49ef151SStefano Zampini         ierr = VecSetRandom(pcbddc->vec1_R,PETSC_NULL);CHKERRQ(ierr);
3108d49ef151SStefano Zampini         ierr = MatMult(A_RR,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
3109d49ef151SStefano Zampini         ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec2_R,temp_vec);CHKERRQ(ierr);
3110d49ef151SStefano Zampini         ierr = VecAXPY(temp_vec,m_one,pcbddc->vec1_R);CHKERRQ(ierr);
3111d49ef151SStefano Zampini         ierr = VecNorm(temp_vec,NORM_INFINITY,&value);CHKERRQ(ierr);
3112e269702eSStefano Zampini         ierr = VecDestroy(&temp_vec);CHKERRQ(ierr);
31130c7d97c5SJed Brown         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d infinity error for  Neumann  solve = % 1.14e \n",PetscGlobalRank,value);CHKERRQ(ierr);
3114d49ef151SStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
31150c7d97c5SJed Brown       }
3116b76ba322SStefano Zampini     }
31170c7d97c5SJed Brown     /* free Neumann problem's matrix */
31180c7d97c5SJed Brown     ierr = MatDestroy(&A_RR);CHKERRQ(ierr);
31190c7d97c5SJed Brown   }
31200c7d97c5SJed Brown 
31210c7d97c5SJed Brown   /* Assemble all remaining stuff needed to apply BDDC  */
31220c7d97c5SJed Brown   {
31230c7d97c5SJed Brown     Mat          A_RV,A_VR,A_VV;
31240bdf917eSStefano Zampini     Mat          M1;
31250c7d97c5SJed Brown     Mat          C_CR;
31263b03a366Sstefano_zampini     Mat          AUXMAT;
31270c7d97c5SJed Brown     Vec          vec1_C;
31280c7d97c5SJed Brown     Vec          vec2_C;
31290c7d97c5SJed Brown     Vec          vec1_V;
31300c7d97c5SJed Brown     Vec          vec2_V;
31310c7d97c5SJed Brown     PetscInt     *nnz;
31320c7d97c5SJed Brown     PetscInt     *auxindices;
313353cdbc3dSStefano Zampini     PetscInt     index;
31340c7d97c5SJed Brown     PetscScalar* array2;
31350c7d97c5SJed Brown     MatFactorInfo matinfo;
31360c7d97c5SJed Brown 
31370c7d97c5SJed Brown     /* Allocating some extra storage just to be safe */
31380c7d97c5SJed Brown     ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
31390c7d97c5SJed Brown     ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&auxindices);CHKERRQ(ierr);
31400c7d97c5SJed Brown     for (i=0;i<pcis->n;i++) {auxindices[i]=i;}
31410c7d97c5SJed Brown 
31420c7d97c5SJed Brown     /* some work vectors on vertices and/or constraints */
31433b03a366Sstefano_zampini     if (n_vertices) {
31440c7d97c5SJed Brown       ierr = VecCreate(PETSC_COMM_SELF,&vec1_V);CHKERRQ(ierr);
31453b03a366Sstefano_zampini       ierr = VecSetSizes(vec1_V,n_vertices,n_vertices);CHKERRQ(ierr);
31460c7d97c5SJed Brown       ierr = VecSetType(vec1_V,impVecType);CHKERRQ(ierr);
31470c7d97c5SJed Brown       ierr = VecDuplicate(vec1_V,&vec2_V);CHKERRQ(ierr);
31480c7d97c5SJed Brown     }
3149534831adSStefano Zampini     if (n_constraints) {
31500c7d97c5SJed Brown       ierr = VecCreate(PETSC_COMM_SELF,&vec1_C);CHKERRQ(ierr);
3151534831adSStefano Zampini       ierr = VecSetSizes(vec1_C,n_constraints,n_constraints);CHKERRQ(ierr);
31520c7d97c5SJed Brown       ierr = VecSetType(vec1_C,impVecType);CHKERRQ(ierr);
31530c7d97c5SJed Brown       ierr = VecDuplicate(vec1_C,&vec2_C);CHKERRQ(ierr);
31540c7d97c5SJed Brown       ierr = VecDuplicate(vec1_C,&pcbddc->vec1_C);CHKERRQ(ierr);
31550c7d97c5SJed Brown     }
31560c7d97c5SJed Brown     /* Precompute the matrices needed for preprocessing and application of BDDC */
31573b03a366Sstefano_zampini     if (n_constraints) {
31580c7d97c5SJed Brown       ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->local_auxmat2);CHKERRQ(ierr);
31593b03a366Sstefano_zampini       ierr = MatSetSizes(pcbddc->local_auxmat2,n_R,n_constraints,n_R,n_constraints);CHKERRQ(ierr);
31600c7d97c5SJed Brown       ierr = MatSetType(pcbddc->local_auxmat2,impMatType);CHKERRQ(ierr);
31613b03a366Sstefano_zampini       ierr = MatSeqDenseSetPreallocation(pcbddc->local_auxmat2,PETSC_NULL);CHKERRQ(ierr);
31620c7d97c5SJed Brown 
316357a90decSStefano Zampini       /* Create Constraint matrix on R nodes: C_{CR}  */
316457a90decSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->ConstraintMatrix,is_C_local,is_R_local,MAT_INITIAL_MATRIX,&C_CR);CHKERRQ(ierr);
316557a90decSStefano Zampini       ierr = ISDestroy(&is_C_local);CHKERRQ(ierr);
316657a90decSStefano Zampini 
31670c7d97c5SJed Brown       /* Assemble local_auxmat2 = - A_{RR}^{-1} C^T_{CR} needed by BDDC application */
31683b03a366Sstefano_zampini       for (i=0;i<n_constraints;i++) {
31693b03a366Sstefano_zampini         ierr = VecSet(pcbddc->vec1_R,zero);CHKERRQ(ierr);
31703b03a366Sstefano_zampini         /* Get row of constraint matrix in R numbering */
317157a90decSStefano Zampini         ierr = VecGetArray(pcbddc->vec1_R,&array);CHKERRQ(ierr);
317257a90decSStefano Zampini         ierr = MatGetRow(C_CR,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
31733b03a366Sstefano_zampini         for (j=0;j<size_of_constraint;j++) { array[ row_cmat_indices[j] ] = - row_cmat_values[j]; }
317457a90decSStefano Zampini         ierr = MatRestoreRow(C_CR,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
317557a90decSStefano Zampini         ierr = VecRestoreArray(pcbddc->vec1_R,&array);CHKERRQ(ierr);
31763b03a366Sstefano_zampini         /* Solve for row of constraint matrix in R numbering */
317753cdbc3dSStefano Zampini         ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
31783b03a366Sstefano_zampini         /* Set values */
31790c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec2_R,&array);CHKERRQ(ierr);
31803b03a366Sstefano_zampini         ierr = MatSetValues(pcbddc->local_auxmat2,n_R,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
31810c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec2_R,&array);CHKERRQ(ierr);
31820c7d97c5SJed Brown       }
31830c7d97c5SJed Brown       ierr = MatAssemblyBegin(pcbddc->local_auxmat2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
31840c7d97c5SJed Brown       ierr = MatAssemblyEnd(pcbddc->local_auxmat2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
31850c7d97c5SJed Brown 
31860c7d97c5SJed Brown       /* Assemble AUXMAT = ( LUFactor )( -C_{CR} A_{RR}^{-1} C^T_{CR} )^{-1} */
31870c7d97c5SJed Brown       ierr = MatMatMult(C_CR,pcbddc->local_auxmat2,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&AUXMAT);CHKERRQ(ierr);
3188d49ef151SStefano Zampini       ierr = MatFactorInfoInitialize(&matinfo);CHKERRQ(ierr);
31893b03a366Sstefano_zampini       ierr = ISCreateStride(PETSC_COMM_SELF,n_constraints,0,1,&is_aux1);CHKERRQ(ierr);
31900c7d97c5SJed Brown       ierr = MatLUFactor(AUXMAT,is_aux1,is_aux1,&matinfo);CHKERRQ(ierr);
31910c7d97c5SJed Brown       ierr = ISDestroy(&is_aux1);CHKERRQ(ierr);
31920c7d97c5SJed Brown 
31933b03a366Sstefano_zampini       /* Assemble explicitly M1 = ( C_{CR} A_{RR}^{-1} C^T_{CR} )^{-1} needed in preproc  */
3194d49ef151SStefano Zampini       ierr = MatCreate(PETSC_COMM_SELF,&M1);CHKERRQ(ierr);
31953b03a366Sstefano_zampini       ierr = MatSetSizes(M1,n_constraints,n_constraints,n_constraints,n_constraints);CHKERRQ(ierr);
31960c7d97c5SJed Brown       ierr = MatSetType(M1,impMatType);CHKERRQ(ierr);
31973b03a366Sstefano_zampini       ierr = MatSeqDenseSetPreallocation(M1,PETSC_NULL);CHKERRQ(ierr);
31983b03a366Sstefano_zampini       for (i=0;i<n_constraints;i++) {
31990c7d97c5SJed Brown         ierr = VecSet(vec1_C,zero);CHKERRQ(ierr);
32000c7d97c5SJed Brown         ierr = VecSetValue(vec1_C,i,one,INSERT_VALUES);CHKERRQ(ierr);
32010c7d97c5SJed Brown         ierr = VecAssemblyBegin(vec1_C);CHKERRQ(ierr);
32020c7d97c5SJed Brown         ierr = VecAssemblyEnd(vec1_C);CHKERRQ(ierr);
32030c7d97c5SJed Brown         ierr = MatSolve(AUXMAT,vec1_C,vec2_C);CHKERRQ(ierr);
32040c7d97c5SJed Brown         ierr = VecScale(vec2_C,m_one);CHKERRQ(ierr);
32050c7d97c5SJed Brown         ierr = VecGetArray(vec2_C,&array);CHKERRQ(ierr);
32063b03a366Sstefano_zampini         ierr = MatSetValues(M1,n_constraints,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
32070c7d97c5SJed Brown         ierr = VecRestoreArray(vec2_C,&array);CHKERRQ(ierr);
32080c7d97c5SJed Brown       }
32090c7d97c5SJed Brown       ierr = MatAssemblyBegin(M1,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
32100c7d97c5SJed Brown       ierr = MatAssemblyEnd(M1,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
32110c7d97c5SJed Brown       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
32120c7d97c5SJed Brown       /* Assemble local_auxmat1 = M1*C_{CR} needed by BDDC application in KSP and in preproc */
32130c7d97c5SJed Brown       ierr = MatMatMult(M1,C_CR,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&pcbddc->local_auxmat1);CHKERRQ(ierr);
32140c7d97c5SJed Brown 
32150c7d97c5SJed Brown     }
32160c7d97c5SJed Brown 
32170c7d97c5SJed Brown     /* Get submatrices from subdomain matrix */
32183b03a366Sstefano_zampini     if (n_vertices){
3219534831adSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->local_mat,is_R_local,is_V_local,MAT_INITIAL_MATRIX,&A_RV);CHKERRQ(ierr);
3220534831adSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->local_mat,is_V_local,is_R_local,MAT_INITIAL_MATRIX,&A_VR);CHKERRQ(ierr);
3221534831adSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->local_mat,is_V_local,is_V_local,MAT_INITIAL_MATRIX,&A_VV);CHKERRQ(ierr);
32220c7d97c5SJed Brown     }
32230c7d97c5SJed Brown 
32240c7d97c5SJed Brown     /* Matrix of coarse basis functions (local) */
3225d49ef151SStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->coarse_phi_B);CHKERRQ(ierr);
32260c7d97c5SJed Brown     ierr = MatSetSizes(pcbddc->coarse_phi_B,n_B,pcbddc->local_primal_size,n_B,pcbddc->local_primal_size);CHKERRQ(ierr);
32270c7d97c5SJed Brown     ierr = MatSetType(pcbddc->coarse_phi_B,impMatType);CHKERRQ(ierr);
32283b03a366Sstefano_zampini     ierr = MatSeqDenseSetPreallocation(pcbddc->coarse_phi_B,PETSC_NULL);CHKERRQ(ierr);
3229e269702eSStefano Zampini     if (pcbddc->prec_type || dbg_flag ) {
3230d49ef151SStefano Zampini       ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->coarse_phi_D);CHKERRQ(ierr);
32310c7d97c5SJed Brown       ierr = MatSetSizes(pcbddc->coarse_phi_D,n_D,pcbddc->local_primal_size,n_D,pcbddc->local_primal_size);CHKERRQ(ierr);
32320c7d97c5SJed Brown       ierr = MatSetType(pcbddc->coarse_phi_D,impMatType);CHKERRQ(ierr);
32333b03a366Sstefano_zampini       ierr = MatSeqDenseSetPreallocation(pcbddc->coarse_phi_D,PETSC_NULL);CHKERRQ(ierr);
32340c7d97c5SJed Brown     }
32350c7d97c5SJed Brown 
3236e269702eSStefano Zampini     if (dbg_flag) {
32370c7d97c5SJed Brown       ierr = PetscMalloc( pcbddc->local_primal_size*sizeof(PetscScalar),&coarsefunctions_errors);CHKERRQ(ierr);
32380c7d97c5SJed Brown       ierr = PetscMalloc( pcbddc->local_primal_size*sizeof(PetscScalar),&constraints_errors);CHKERRQ(ierr);
32390c7d97c5SJed Brown     }
32403b03a366Sstefano_zampini     /* Subdomain contribution (Non-overlapping) to coarse matrix  */
32410c7d97c5SJed Brown     ierr = PetscMalloc ((pcbddc->local_primal_size)*(pcbddc->local_primal_size)*sizeof(PetscScalar),&coarse_submat_vals);CHKERRQ(ierr);
32420c7d97c5SJed Brown 
32430c7d97c5SJed Brown     /* We are now ready to evaluate coarse basis functions and subdomain contribution to coarse problem */
32443b03a366Sstefano_zampini     for (i=0;i<n_vertices;i++){
32450c7d97c5SJed Brown       ierr = VecSet(vec1_V,zero);CHKERRQ(ierr);
32460c7d97c5SJed Brown       ierr = VecSetValue(vec1_V,i,one,INSERT_VALUES);CHKERRQ(ierr);
32470c7d97c5SJed Brown       ierr = VecAssemblyBegin(vec1_V);CHKERRQ(ierr);
32480c7d97c5SJed Brown       ierr = VecAssemblyEnd(vec1_V);CHKERRQ(ierr);
32490c7d97c5SJed Brown       /* solution of saddle point problem */
32500bdf917eSStefano Zampini       ierr = MatMult(A_RV,vec1_V,pcbddc->vec1_R);CHKERRQ(ierr);
32510bdf917eSStefano Zampini       ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec1_R);CHKERRQ(ierr);
32520c7d97c5SJed Brown       ierr = VecScale(pcbddc->vec1_R,m_one);CHKERRQ(ierr);
32533b03a366Sstefano_zampini       if (n_constraints) {
32540c7d97c5SJed Brown         ierr = MatMult(pcbddc->local_auxmat1,pcbddc->vec1_R,vec1_C);CHKERRQ(ierr);
32550c7d97c5SJed Brown         ierr = MatMultAdd(pcbddc->local_auxmat2,vec1_C,pcbddc->vec1_R,pcbddc->vec1_R);CHKERRQ(ierr);
32560c7d97c5SJed Brown         ierr = VecScale(vec1_C,m_one);CHKERRQ(ierr);
32570c7d97c5SJed Brown       }
32580c7d97c5SJed Brown       ierr = MatMult(A_VR,pcbddc->vec1_R,vec2_V);CHKERRQ(ierr);
32590c7d97c5SJed Brown       ierr = MatMultAdd(A_VV,vec1_V,vec2_V,vec2_V);CHKERRQ(ierr);
32600c7d97c5SJed Brown 
32610c7d97c5SJed Brown       /* Set values in coarse basis function and subdomain part of coarse_mat */
32620c7d97c5SJed Brown       /* coarse basis functions */
32630c7d97c5SJed Brown       ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr);
32640c7d97c5SJed Brown       ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
32650c7d97c5SJed Brown       ierr = VecScatterEnd  (pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
32660c7d97c5SJed Brown       ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
32673b03a366Sstefano_zampini       ierr = MatSetValues(pcbddc->coarse_phi_B,n_B,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
32680c7d97c5SJed Brown       ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
32690c7d97c5SJed Brown       ierr = MatSetValue(pcbddc->coarse_phi_B,idx_V_B[i],i,one,INSERT_VALUES);CHKERRQ(ierr);
3270e269702eSStefano Zampini       if ( pcbddc->prec_type || dbg_flag  ) {
32710c7d97c5SJed Brown         ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
32720c7d97c5SJed Brown         ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
32730c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_D,&array);CHKERRQ(ierr);
32743b03a366Sstefano_zampini         ierr = MatSetValues(pcbddc->coarse_phi_D,n_D,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
32750c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_D,&array);CHKERRQ(ierr);
32760c7d97c5SJed Brown       }
32770c7d97c5SJed Brown       /* subdomain contribution to coarse matrix */
32780c7d97c5SJed Brown       ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
3279da1bb401SStefano Zampini       for (j=0;j<n_vertices;j++) { coarse_submat_vals[i*pcbddc->local_primal_size+j] = array[j]; } /* WARNING -> column major ordering */
32800c7d97c5SJed Brown       ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
32813b03a366Sstefano_zampini       if (n_constraints) {
32820c7d97c5SJed Brown         ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
3283da1bb401SStefano Zampini         for (j=0;j<n_constraints;j++) { coarse_submat_vals[i*pcbddc->local_primal_size+j+n_vertices] = array[j]; } /* WARNING -> column major ordering */
32840c7d97c5SJed Brown         ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
32850c7d97c5SJed Brown       }
32860c7d97c5SJed Brown 
3287e269702eSStefano Zampini       if ( dbg_flag ) {
32880c7d97c5SJed Brown         /* assemble subdomain vector on nodes */
3289d49ef151SStefano Zampini         ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr);
32900c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
32910c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
32920c7d97c5SJed Brown         for (j=0;j<n_R;j++) { array[idx_R_local[j]] = array2[j]; }
32933b03a366Sstefano_zampini         array[ vertices[i] ] = one;
32940c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
32950c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
32960c7d97c5SJed Brown         /* assemble subdomain vector of lagrange multipliers (i.e. primal nodes) */
3297d49ef151SStefano Zampini         ierr = VecSet(pcbddc->vec1_P,zero);CHKERRQ(ierr);
32980c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
32990c7d97c5SJed Brown         ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
33003b03a366Sstefano_zampini         for (j=0;j<n_vertices;j++) { array2[j]=array[j]; }
33010c7d97c5SJed Brown         ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
33023b03a366Sstefano_zampini         if (n_constraints) {
33030c7d97c5SJed Brown           ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
33043b03a366Sstefano_zampini           for (j=0;j<n_constraints;j++) { array2[j+n_vertices]=array[j]; }
33050c7d97c5SJed Brown           ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
33060c7d97c5SJed Brown         }
33070c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
33080c7d97c5SJed Brown         ierr = VecScale(pcbddc->vec1_P,m_one);CHKERRQ(ierr);
33090c7d97c5SJed Brown         /* check saddle point solution */
3310534831adSStefano Zampini         ierr = MatMult(pcbddc->local_mat,pcis->vec1_N,pcis->vec2_N);CHKERRQ(ierr);
33113b03a366Sstefano_zampini         ierr = MatMultTransposeAdd(pcbddc->ConstraintMatrix,pcbddc->vec1_P,pcis->vec2_N,pcis->vec2_N);CHKERRQ(ierr);
33123b03a366Sstefano_zampini         ierr = VecNorm(pcis->vec2_N,NORM_INFINITY,&coarsefunctions_errors[i]);CHKERRQ(ierr);
33133b03a366Sstefano_zampini         ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr);
33140c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
33153b03a366Sstefano_zampini         array[i]=array[i]+m_one;  /* shift by the identity matrix */
33160c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
33173b03a366Sstefano_zampini         ierr = VecNorm(pcbddc->vec1_P,NORM_INFINITY,&constraints_errors[i]);CHKERRQ(ierr);
33180c7d97c5SJed Brown       }
33190c7d97c5SJed Brown     }
33200c7d97c5SJed Brown 
33213b03a366Sstefano_zampini     for (i=0;i<n_constraints;i++){
3322d49ef151SStefano Zampini       ierr = VecSet(vec2_C,zero);CHKERRQ(ierr);
33230c7d97c5SJed Brown       ierr = VecSetValue(vec2_C,i,m_one,INSERT_VALUES);CHKERRQ(ierr);
33240c7d97c5SJed Brown       ierr = VecAssemblyBegin(vec2_C);CHKERRQ(ierr);
33250c7d97c5SJed Brown       ierr = VecAssemblyEnd(vec2_C);CHKERRQ(ierr);
33260c7d97c5SJed Brown       /* solution of saddle point problem */
33270c7d97c5SJed Brown       ierr = MatMult(M1,vec2_C,vec1_C);CHKERRQ(ierr);
33280c7d97c5SJed Brown       ierr = MatMult(pcbddc->local_auxmat2,vec1_C,pcbddc->vec1_R);CHKERRQ(ierr);
33290c7d97c5SJed Brown       ierr = VecScale(vec1_C,m_one);CHKERRQ(ierr);
33303b03a366Sstefano_zampini       if (n_vertices) { ierr = MatMult(A_VR,pcbddc->vec1_R,vec2_V);CHKERRQ(ierr); }
33310c7d97c5SJed Brown       /* Set values in coarse basis function and subdomain part of coarse_mat */
33320c7d97c5SJed Brown       /* coarse basis functions */
33333b03a366Sstefano_zampini       index=i+n_vertices;
33340c7d97c5SJed Brown       ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr);
33350c7d97c5SJed Brown       ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
33360c7d97c5SJed Brown       ierr = VecScatterEnd  (pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
33370c7d97c5SJed Brown       ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
333853cdbc3dSStefano Zampini       ierr = MatSetValues(pcbddc->coarse_phi_B,n_B,auxindices,1,&index,array,INSERT_VALUES);CHKERRQ(ierr);
33390c7d97c5SJed Brown       ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
3340e269702eSStefano Zampini       if ( pcbddc->prec_type || dbg_flag ) {
33410c7d97c5SJed Brown         ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
33420c7d97c5SJed Brown         ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
33430c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_D,&array);CHKERRQ(ierr);
334453cdbc3dSStefano Zampini         ierr = MatSetValues(pcbddc->coarse_phi_D,n_D,auxindices,1,&index,array,INSERT_VALUES);CHKERRQ(ierr);
33450c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_D,&array);CHKERRQ(ierr);
33460c7d97c5SJed Brown       }
33470c7d97c5SJed Brown       /* subdomain contribution to coarse matrix */
33483b03a366Sstefano_zampini       if (n_vertices) {
33490c7d97c5SJed Brown         ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
3350da1bb401SStefano Zampini         for (j=0;j<n_vertices;j++) {coarse_submat_vals[index*pcbddc->local_primal_size+j]=array[j];} /* WARNING -> column major ordering */
33510c7d97c5SJed Brown         ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
33520c7d97c5SJed Brown       }
33530c7d97c5SJed Brown       ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
3354da1bb401SStefano Zampini       for (j=0;j<n_constraints;j++) {coarse_submat_vals[index*pcbddc->local_primal_size+j+n_vertices]=array[j];} /* WARNING -> column major ordering */
33550c7d97c5SJed Brown       ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
33560c7d97c5SJed Brown 
3357e269702eSStefano Zampini       if ( dbg_flag ) {
33580c7d97c5SJed Brown         /* assemble subdomain vector on nodes */
335953cdbc3dSStefano Zampini         ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr);
33600c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
33610c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
33620c7d97c5SJed Brown         for (j=0;j<n_R;j++){ array[ idx_R_local[j] ] = array2[j]; }
33630c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
33640c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
33650c7d97c5SJed Brown         /* assemble subdomain vector of lagrange multipliers */
336653cdbc3dSStefano Zampini         ierr = VecSet(pcbddc->vec1_P,zero);CHKERRQ(ierr);
33670c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
33683b03a366Sstefano_zampini         if ( n_vertices) {
33690c7d97c5SJed Brown           ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
33703b03a366Sstefano_zampini           for (j=0;j<n_vertices;j++) {array2[j]=-array[j];}
33710c7d97c5SJed Brown           ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
33720c7d97c5SJed Brown         }
33730c7d97c5SJed Brown         ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
33743b03a366Sstefano_zampini         for (j=0;j<n_constraints;j++) {array2[j+n_vertices]=-array[j];}
33750c7d97c5SJed Brown         ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
33760c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
33773972b0daSStefano Zampini         /* check saddle point solution */
3378534831adSStefano Zampini         ierr = MatMult(pcbddc->local_mat,pcis->vec1_N,pcis->vec2_N);CHKERRQ(ierr);
33793b03a366Sstefano_zampini         ierr = MatMultTransposeAdd(pcbddc->ConstraintMatrix,pcbddc->vec1_P,pcis->vec2_N,pcis->vec2_N);CHKERRQ(ierr);
338053cdbc3dSStefano Zampini         ierr = VecNorm(pcis->vec2_N,NORM_INFINITY,&coarsefunctions_errors[index]);CHKERRQ(ierr);
33813b03a366Sstefano_zampini         ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr);
33820c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
338353cdbc3dSStefano Zampini         array[index]=array[index]+m_one; /* shift by the identity matrix */
33840c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
338553cdbc3dSStefano Zampini         ierr = VecNorm(pcbddc->vec1_P,NORM_INFINITY,&constraints_errors[index]);CHKERRQ(ierr);
33860c7d97c5SJed Brown       }
33870c7d97c5SJed Brown     }
33880c7d97c5SJed Brown     ierr = MatAssemblyBegin(pcbddc->coarse_phi_B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
33890c7d97c5SJed Brown     ierr = MatAssemblyEnd  (pcbddc->coarse_phi_B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
3390e269702eSStefano Zampini     if ( pcbddc->prec_type || dbg_flag ) {
33910c7d97c5SJed Brown       ierr = MatAssemblyBegin(pcbddc->coarse_phi_D,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
33920c7d97c5SJed Brown       ierr = MatAssemblyEnd  (pcbddc->coarse_phi_D,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
33930c7d97c5SJed Brown     }
33940c7d97c5SJed Brown     /* Checking coarse_sub_mat and coarse basis functions */
33950c7d97c5SJed Brown     /* It should be \Phi^{(j)^T} A^{(j)} \Phi^{(j)}=coarse_sub_mat */
33969d2fce94SStefano Zampini     if (dbg_flag) {
33970c7d97c5SJed Brown 
33980c7d97c5SJed Brown       Mat coarse_sub_mat;
33990c7d97c5SJed Brown       Mat TM1,TM2,TM3,TM4;
34000c7d97c5SJed Brown       Mat coarse_phi_D,coarse_phi_B,A_II,A_BB,A_IB,A_BI;
3401a0ba757dSStefano Zampini       const MatType checkmattype=MATSEQAIJ;
34020c7d97c5SJed Brown       PetscScalar      value;
34030c7d97c5SJed Brown 
3404c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_II,checkmattype,MAT_INITIAL_MATRIX,&A_II);CHKERRQ(ierr);
3405c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_IB,checkmattype,MAT_INITIAL_MATRIX,&A_IB);CHKERRQ(ierr);
3406c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_BI,checkmattype,MAT_INITIAL_MATRIX,&A_BI);CHKERRQ(ierr);
3407c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_BB,checkmattype,MAT_INITIAL_MATRIX,&A_BB);CHKERRQ(ierr);
3408c042a7c3SStefano Zampini       ierr = MatConvert(pcbddc->coarse_phi_D,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_D);CHKERRQ(ierr);
3409c042a7c3SStefano Zampini       ierr = MatConvert(pcbddc->coarse_phi_B,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_B);CHKERRQ(ierr);
3410c042a7c3SStefano Zampini       ierr = MatCreateSeqDense(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_size,coarse_submat_vals,&coarse_sub_mat);CHKERRQ(ierr);
3411c042a7c3SStefano Zampini       ierr = MatConvert(coarse_sub_mat,checkmattype,MAT_REUSE_MATRIX,&coarse_sub_mat);CHKERRQ(ierr);
34120c7d97c5SJed Brown 
3413da1bb401SStefano Zampini       /*PetscViewer view_out;
3414da1bb401SStefano Zampini       PetscMPIInt myrank;
3415da1bb401SStefano Zampini       char filename[256];
3416da1bb401SStefano Zampini       MPI_Comm_rank(((PetscObject)pc)->comm,&myrank);
3417da1bb401SStefano Zampini       sprintf(filename,"coarsesubmat_%04d.m",myrank);
3418da1bb401SStefano Zampini       ierr = PetscViewerASCIIOpen(PETSC_COMM_SELF,filename,&view_out);CHKERRQ(ierr);
3419da1bb401SStefano Zampini       ierr = PetscViewerSetFormat(view_out,PETSC_VIEWER_ASCII_MATLAB);CHKERRQ(ierr);
3420da1bb401SStefano Zampini       ierr = MatView(coarse_sub_mat,view_out);CHKERRQ(ierr);
3421da1bb401SStefano Zampini       ierr = PetscViewerDestroy(&view_out);CHKERRQ(ierr);*/
3422da1bb401SStefano Zampini 
34230c7d97c5SJed Brown       ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
34240c7d97c5SJed Brown       ierr = PetscViewerASCIIPrintf(viewer,"Check coarse sub mat and local basis functions\n");CHKERRQ(ierr);
34250c7d97c5SJed Brown       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
342653cdbc3dSStefano Zampini       ierr = MatPtAP(A_II,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&TM1);CHKERRQ(ierr);
342753cdbc3dSStefano Zampini       ierr = MatPtAP(A_BB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&TM2);CHKERRQ(ierr);
342853cdbc3dSStefano Zampini       ierr = MatMatMult(A_IB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr);
3429c042a7c3SStefano Zampini       ierr = MatTransposeMatMult(coarse_phi_D,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM3);CHKERRQ(ierr);
343053cdbc3dSStefano Zampini       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
343153cdbc3dSStefano Zampini       ierr = MatMatMult(A_BI,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr);
3432c042a7c3SStefano Zampini       ierr = MatTransposeMatMult(coarse_phi_B,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM4);CHKERRQ(ierr);
343353cdbc3dSStefano Zampini       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
343453cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,one,TM2,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
343553cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,one,TM3,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
343653cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,one,TM4,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
343753cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,m_one,coarse_sub_mat,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
343853cdbc3dSStefano Zampini       ierr = MatNorm(TM1,NORM_INFINITY,&value);CHKERRQ(ierr);
34390c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"----------------------------------\n");CHKERRQ(ierr);
34400c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d \n",PetscGlobalRank);CHKERRQ(ierr);
34410c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"matrix error = % 1.14e\n",value);CHKERRQ(ierr);
34420c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"coarse functions errors\n");CHKERRQ(ierr);
344353cdbc3dSStefano Zampini       for (i=0;i<pcbddc->local_primal_size;i++) { ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local %02d-th function error = % 1.14e\n",i,coarsefunctions_errors[i]);CHKERRQ(ierr); }
34440c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"constraints errors\n");CHKERRQ(ierr);
344553cdbc3dSStefano Zampini       for (i=0;i<pcbddc->local_primal_size;i++) { ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local %02d-th function error = % 1.14e\n",i,constraints_errors[i]);CHKERRQ(ierr); }
34460c7d97c5SJed Brown       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
344753cdbc3dSStefano Zampini       ierr = MatDestroy(&A_II);CHKERRQ(ierr);
344853cdbc3dSStefano Zampini       ierr = MatDestroy(&A_BB);CHKERRQ(ierr);
344953cdbc3dSStefano Zampini       ierr = MatDestroy(&A_IB);CHKERRQ(ierr);
345053cdbc3dSStefano Zampini       ierr = MatDestroy(&A_BI);CHKERRQ(ierr);
345153cdbc3dSStefano Zampini       ierr = MatDestroy(&TM1);CHKERRQ(ierr);
345253cdbc3dSStefano Zampini       ierr = MatDestroy(&TM2);CHKERRQ(ierr);
345353cdbc3dSStefano Zampini       ierr = MatDestroy(&TM3);CHKERRQ(ierr);
345453cdbc3dSStefano Zampini       ierr = MatDestroy(&TM4);CHKERRQ(ierr);
345553cdbc3dSStefano Zampini       ierr = MatDestroy(&coarse_phi_D);CHKERRQ(ierr);
345653cdbc3dSStefano Zampini       ierr = MatDestroy(&coarse_sub_mat);CHKERRQ(ierr);
345753cdbc3dSStefano Zampini       ierr = MatDestroy(&coarse_phi_B);CHKERRQ(ierr);
34580c7d97c5SJed Brown       ierr = PetscFree(coarsefunctions_errors);CHKERRQ(ierr);
34590c7d97c5SJed Brown       ierr = PetscFree(constraints_errors);CHKERRQ(ierr);
34600c7d97c5SJed Brown     }
34610c7d97c5SJed Brown 
34620c7d97c5SJed Brown     /* create coarse matrix and data structures for message passing associated with the actual choice of coarse problem type */
34630c7d97c5SJed Brown     ierr = PCBDDCSetupCoarseEnvironment(pc,coarse_submat_vals);CHKERRQ(ierr);
34640c7d97c5SJed Brown     /* free memory */
34650c7d97c5SJed Brown     ierr = PetscFree(coarse_submat_vals);CHKERRQ(ierr);
34660c7d97c5SJed Brown     ierr = PetscFree(auxindices);CHKERRQ(ierr);
34670c7d97c5SJed Brown     ierr = PetscFree(nnz);CHKERRQ(ierr);
34683b03a366Sstefano_zampini     if (n_vertices) {
34690c7d97c5SJed Brown       ierr = VecDestroy(&vec1_V);CHKERRQ(ierr);
34700c7d97c5SJed Brown       ierr = VecDestroy(&vec2_V);CHKERRQ(ierr);
34710c7d97c5SJed Brown       ierr = MatDestroy(&A_RV);CHKERRQ(ierr);
34720c7d97c5SJed Brown       ierr = MatDestroy(&A_VR);CHKERRQ(ierr);
34730c7d97c5SJed Brown       ierr = MatDestroy(&A_VV);CHKERRQ(ierr);
34740c7d97c5SJed Brown     }
3475534831adSStefano Zampini     if (n_constraints) {
34760c7d97c5SJed Brown       ierr = VecDestroy(&vec1_C);CHKERRQ(ierr);
34770c7d97c5SJed Brown       ierr = VecDestroy(&vec2_C);CHKERRQ(ierr);
34780c7d97c5SJed Brown       ierr = MatDestroy(&M1);CHKERRQ(ierr);
34790c7d97c5SJed Brown       ierr = MatDestroy(&C_CR);CHKERRQ(ierr);
34800c7d97c5SJed Brown     }
34810c7d97c5SJed Brown   }
34820c7d97c5SJed Brown   /* free memory */
34833b03a366Sstefano_zampini   if (n_vertices) {
34840c7d97c5SJed Brown     ierr = PetscFree(idx_V_B);CHKERRQ(ierr);
34850c7d97c5SJed Brown     ierr = ISDestroy(&is_V_local);CHKERRQ(ierr);
34860c7d97c5SJed Brown   }
34870c7d97c5SJed Brown   ierr = ISDestroy(&is_R_local);CHKERRQ(ierr);
34880c7d97c5SJed Brown 
34890c7d97c5SJed Brown   PetscFunctionReturn(0);
34900c7d97c5SJed Brown }
34910c7d97c5SJed Brown 
34920c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
34930c7d97c5SJed Brown 
34940c7d97c5SJed Brown #undef __FUNCT__
34950c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetupCoarseEnvironment"
349653cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetupCoarseEnvironment(PC pc,PetscScalar* coarse_submat_vals)
34970c7d97c5SJed Brown {
34980c7d97c5SJed Brown 
34990c7d97c5SJed Brown 
35000c7d97c5SJed Brown   Mat_IS    *matis    = (Mat_IS*)pc->pmat->data;
35010c7d97c5SJed Brown   PC_BDDC   *pcbddc   = (PC_BDDC*)pc->data;
35020c7d97c5SJed Brown   PC_IS     *pcis     = (PC_IS*)pc->data;
35030c7d97c5SJed Brown   MPI_Comm  prec_comm = ((PetscObject)pc)->comm;
35040c7d97c5SJed Brown   MPI_Comm  coarse_comm;
35050c7d97c5SJed Brown 
35060c7d97c5SJed Brown   /* common to all choices */
35070c7d97c5SJed Brown   PetscScalar *temp_coarse_mat_vals;
35080c7d97c5SJed Brown   PetscScalar *ins_coarse_mat_vals;
35090c7d97c5SJed Brown   PetscInt    *ins_local_primal_indices;
35100c7d97c5SJed Brown   PetscMPIInt *localsizes2,*localdispl2;
35110c7d97c5SJed Brown   PetscMPIInt size_prec_comm;
35120c7d97c5SJed Brown   PetscMPIInt rank_prec_comm;
35130c7d97c5SJed Brown   PetscMPIInt active_rank=MPI_PROC_NULL;
35140c7d97c5SJed Brown   PetscMPIInt master_proc=0;
35150c7d97c5SJed Brown   PetscInt    ins_local_primal_size;
35160c7d97c5SJed Brown   /* specific to MULTILEVEL_BDDC */
35170c7d97c5SJed Brown   PetscMPIInt *ranks_recv;
35180c7d97c5SJed Brown   PetscMPIInt count_recv=0;
35190c7d97c5SJed Brown   PetscMPIInt rank_coarse_proc_send_to;
35200c7d97c5SJed Brown   PetscMPIInt coarse_color = MPI_UNDEFINED;
35210c7d97c5SJed Brown   ISLocalToGlobalMapping coarse_ISLG;
35220c7d97c5SJed Brown   /* some other variables */
35230c7d97c5SJed Brown   PetscErrorCode ierr;
35240c7d97c5SJed Brown   const MatType coarse_mat_type;
35250c7d97c5SJed Brown   const PCType  coarse_pc_type;
352653cdbc3dSStefano Zampini   const KSPType coarse_ksp_type;
352753cdbc3dSStefano Zampini   PC pc_temp;
3528*4fad6a16SStefano Zampini   PetscInt i,j,k;
35293b03a366Sstefano_zampini   PetscInt max_it_coarse_ksp=1;  /* don't increase this value */
3530e269702eSStefano Zampini   /* verbose output viewer */
3531e269702eSStefano Zampini   PetscViewer viewer=pcbddc->dbg_viewer;
3532e269702eSStefano Zampini   PetscBool   dbg_flag=pcbddc->dbg_flag;
3533142dfd88SStefano Zampini 
3534ea7e1babSStefano Zampini   PetscInt      offset,offset2;
3535142dfd88SStefano Zampini   PetscMPIInt   im_active=0;
3536142dfd88SStefano Zampini   PetscMPIInt   *auxglobal_primal;
3537142dfd88SStefano Zampini 
3538142dfd88SStefano Zampini   PetscBool     setsym,issym=PETSC_FALSE;
35390c7d97c5SJed Brown 
35400c7d97c5SJed Brown   PetscFunctionBegin;
35410c7d97c5SJed Brown   ins_local_primal_indices = 0;
35420c7d97c5SJed Brown   ins_coarse_mat_vals      = 0;
35430c7d97c5SJed Brown   localsizes2              = 0;
35440c7d97c5SJed Brown   localdispl2              = 0;
35450c7d97c5SJed Brown   temp_coarse_mat_vals     = 0;
35460c7d97c5SJed Brown   coarse_ISLG              = 0;
35470c7d97c5SJed Brown 
354853cdbc3dSStefano Zampini   ierr = MPI_Comm_size(prec_comm,&size_prec_comm);CHKERRQ(ierr);
354953cdbc3dSStefano Zampini   ierr = MPI_Comm_rank(prec_comm,&rank_prec_comm);CHKERRQ(ierr);
3550142dfd88SStefano Zampini   ierr = MatIsSymmetricKnown(pc->pmat,&setsym,&issym);CHKERRQ(ierr);
3551142dfd88SStefano Zampini 
3552beed3852SStefano Zampini   /* Assign global numbering to coarse dofs */
3553beed3852SStefano Zampini   {
3554a0ba757dSStefano Zampini     PetscScalar    one=1.,zero=0.;
3555beed3852SStefano Zampini     PetscScalar    *array;
3556beed3852SStefano Zampini     PetscMPIInt    *auxlocal_primal;
3557beed3852SStefano Zampini     PetscMPIInt    *all_auxglobal_primal;
3558beed3852SStefano Zampini     PetscMPIInt    mpi_local_primal_size = (PetscMPIInt)pcbddc->local_primal_size;
3559da1bb401SStefano Zampini     PetscInt       *row_cmat_indices;
35603b03a366Sstefano_zampini     PetscInt       size_of_constraint;
3561da1bb401SStefano Zampini     PetscScalar    coarsesum;
3562beed3852SStefano Zampini 
3563beed3852SStefano Zampini     /* Construct needed data structures for message passing */
3564beed3852SStefano Zampini     ierr = PetscMalloc(mpi_local_primal_size*sizeof(PetscMPIInt),&pcbddc->local_primal_indices);CHKERRQ(ierr);
3565ffe5efe1SStefano Zampini     j = 0;
3566142dfd88SStefano Zampini     if (rank_prec_comm == 0 || pcbddc->coarse_problem_type == REPLICATED_BDDC || pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
3567ffe5efe1SStefano Zampini       j = size_prec_comm;
3568ffe5efe1SStefano Zampini     }
3569ffe5efe1SStefano Zampini     ierr = PetscMalloc(j*sizeof(PetscMPIInt),&pcbddc->local_primal_sizes);CHKERRQ(ierr);
3570ffe5efe1SStefano Zampini     ierr = PetscMalloc(j*sizeof(PetscMPIInt),&pcbddc->local_primal_displacements);CHKERRQ(ierr);
3571beed3852SStefano Zampini     /* Gather local_primal_size information for all processes  */
3572142dfd88SStefano Zampini     if (pcbddc->coarse_problem_type == REPLICATED_BDDC || pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
35735619798eSStefano Zampini       ierr = MPI_Allgather(&mpi_local_primal_size,1,MPIU_INT,&pcbddc->local_primal_sizes[0],1,MPIU_INT,prec_comm);CHKERRQ(ierr);
3574ffe5efe1SStefano Zampini     } else {
3575ffe5efe1SStefano Zampini       ierr = MPI_Gather(&mpi_local_primal_size,1,MPIU_INT,&pcbddc->local_primal_sizes[0],1,MPIU_INT,0,prec_comm);CHKERRQ(ierr);
3576ffe5efe1SStefano Zampini     }
3577beed3852SStefano Zampini     pcbddc->replicated_primal_size = 0;
3578ffe5efe1SStefano Zampini     for (i=0; i<j; i++) {
3579beed3852SStefano Zampini       pcbddc->local_primal_displacements[i] = pcbddc->replicated_primal_size ;
3580beed3852SStefano Zampini       pcbddc->replicated_primal_size += pcbddc->local_primal_sizes[i];
3581beed3852SStefano Zampini     }
35825619798eSStefano Zampini     if (rank_prec_comm == 0) {
3583beed3852SStefano Zampini       /* allocate some auxiliary space */
3584beed3852SStefano Zampini       ierr = PetscMalloc(pcbddc->replicated_primal_size*sizeof(*all_auxglobal_primal),&all_auxglobal_primal);CHKERRQ(ierr);
3585beed3852SStefano Zampini     }
3586beed3852SStefano Zampini     ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscMPIInt),&auxlocal_primal);CHKERRQ(ierr);
3587beed3852SStefano Zampini     ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscMPIInt),&auxglobal_primal);CHKERRQ(ierr);
3588beed3852SStefano Zampini 
3589da1bb401SStefano Zampini     /* First let's count coarse dofs.
3590beed3852SStefano Zampini        This code fragment assumes that the number of local constraints per connected component
3591beed3852SStefano Zampini        is not greater than the number of nodes defined for the connected component
3592beed3852SStefano Zampini        (otherwise we will surely have linear dependence between constraints and thus a singular coarse problem) */
35933b03a366Sstefano_zampini     /* auxlocal_primal      : primal indices in local nodes numbering (internal and interface) with complete queue sorted by global ordering */
3594beed3852SStefano Zampini     ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr);
3595beed3852SStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3596da1bb401SStefano Zampini     for (i=0;i<pcbddc->local_primal_size;i++) {
3597da1bb401SStefano Zampini       ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
35983b03a366Sstefano_zampini       for (j=0; j<size_of_constraint; j++) {
35993b03a366Sstefano_zampini         k = row_cmat_indices[j];
3600beed3852SStefano Zampini         if ( array[k] == zero ) {
3601beed3852SStefano Zampini           array[k] = one;
3602da1bb401SStefano Zampini           auxlocal_primal[i] = k;
3603beed3852SStefano Zampini           break;
3604beed3852SStefano Zampini         }
3605beed3852SStefano Zampini       }
3606da1bb401SStefano Zampini       ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
3607beed3852SStefano Zampini     }
3608beed3852SStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3609da1bb401SStefano Zampini     ierr = VecSet(pcis->vec1_global,zero);CHKERRQ(ierr);
3610da1bb401SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3611da1bb401SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3612da1bb401SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3613da1bb401SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3614da1bb401SStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3615142dfd88SStefano Zampini     for (i=0;i<pcis->n;i++) { if ( PetscAbsScalar(array[i]) > zero) array[i] = one/array[i]; }
3616da1bb401SStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3617da1bb401SStefano Zampini     ierr = VecSet(pcis->vec1_global,zero);CHKERRQ(ierr);
3618da1bb401SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3619da1bb401SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3620da1bb401SStefano Zampini     ierr = VecSum(pcis->vec1_global,&coarsesum);CHKERRQ(ierr);
3621da1bb401SStefano Zampini     pcbddc->coarse_size = (PetscInt) coarsesum;
3622a0ba757dSStefano Zampini 
3623beed3852SStefano Zampini     /* Now assign them a global numbering */
3624beed3852SStefano Zampini     /* auxglobal_primal contains indices in global nodes numbering (internal and interface) */
3625beed3852SStefano Zampini     ierr = ISLocalToGlobalMappingApply(matis->mapping,pcbddc->local_primal_size,auxlocal_primal,auxglobal_primal);CHKERRQ(ierr);
3626142dfd88SStefano Zampini     ierr = PetscFree(auxlocal_primal);CHKERRQ(ierr);
3627beed3852SStefano Zampini     /* all_auxglobal_primal contains all primal nodes indices in global nodes numbering (internal and interface) */
3628beed3852SStefano Zampini     ierr = MPI_Gatherv(&auxglobal_primal[0],pcbddc->local_primal_size,MPIU_INT,&all_auxglobal_primal[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,0,prec_comm);CHKERRQ(ierr);
3629beed3852SStefano Zampini 
3630beed3852SStefano Zampini     /* After this block all_auxglobal_primal should contain one copy of each primal node's indices in global nodes numbering */
3631beed3852SStefano Zampini     if (rank_prec_comm==0) {
363217d7d925SStefano Zampini       j=pcbddc->replicated_primal_size;
363317d7d925SStefano Zampini       ierr = PetscSortRemoveDupsMPIInt(&j,all_auxglobal_primal);CHKERRQ(ierr);
36340bdf917eSStefano Zampini     } else {
36350bdf917eSStefano Zampini       ierr = PetscMalloc(pcbddc->coarse_size*sizeof(PetscMPIInt),&all_auxglobal_primal);CHKERRQ(ierr);
36360bdf917eSStefano Zampini     }
36370bdf917eSStefano Zampini     /* We only need to broadcast the indices from 0 to pcbddc->coarse_size. Remaining elements of array all_auxglobal_primal are garbage. */
36380bdf917eSStefano Zampini     ierr = MPI_Bcast(all_auxglobal_primal,pcbddc->coarse_size,MPIU_INT,0,prec_comm);CHKERRQ(ierr);
36390bdf917eSStefano Zampini 
36400bdf917eSStefano Zampini     /* Now get global coarse numbering of local primal nodes */
36410bdf917eSStefano Zampini     for (i=0;i<pcbddc->local_primal_size;i++) {
3642beed3852SStefano Zampini       k=0;
36430bdf917eSStefano Zampini       while( all_auxglobal_primal[k] != auxglobal_primal[i] ) { k++;}
36440bdf917eSStefano Zampini       pcbddc->local_primal_indices[i]=k;
3645beed3852SStefano Zampini     }
36460bdf917eSStefano Zampini     ierr = PetscFree(auxglobal_primal);CHKERRQ(ierr);
3647beed3852SStefano Zampini     ierr = PetscFree(all_auxglobal_primal);CHKERRQ(ierr);
36480bdf917eSStefano Zampini     if (rank_prec_comm==0) {
36490bdf917eSStefano Zampini       j=pcbddc->replicated_primal_size;
36500bdf917eSStefano Zampini       ierr = PetscMalloc(j*sizeof(PetscMPIInt),&auxglobal_primal);CHKERRQ(ierr);
3651e269702eSStefano Zampini     }
36520bdf917eSStefano Zampini     ierr = MPI_Gatherv(pcbddc->local_primal_indices,pcbddc->local_primal_size,MPIU_INT,auxglobal_primal,pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,0,prec_comm);CHKERRQ(ierr);
36530bdf917eSStefano Zampini   }
36540bdf917eSStefano Zampini 
36550bdf917eSStefano Zampini   if (pcis->n) { im_active = 1; }
36560bdf917eSStefano Zampini   ierr = MPI_Allreduce(&im_active,&pcbddc->active_procs,1,MPIU_INT,MPI_SUM,prec_comm);CHKERRQ(ierr);
36570bdf917eSStefano Zampini 
36580bdf917eSStefano Zampini   /* adapt coarse problem type */
3659*4fad6a16SStefano Zampini   if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
3660*4fad6a16SStefano Zampini     if (pcbddc->current_level < pcbddc->max_levels) {
3661*4fad6a16SStefano Zampini       if ( (pcbddc->active_procs/pcbddc->coarsening_ratio) < 2 ) {
36620bdf917eSStefano Zampini         if (dbg_flag) {
3663*4fad6a16SStefano Zampini           ierr = PetscViewerASCIIPrintf(viewer,"Not enough active processes on level %d (active %d,ratio %d). Parallel direct solve for coarse problem\n",pcbddc->current_level,pcbddc->active_procs,pcbddc->coarsening_ratio);CHKERRQ(ierr);
36640bdf917eSStefano Zampini          ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
36650bdf917eSStefano Zampini         }
36660bdf917eSStefano Zampini         pcbddc->coarse_problem_type = PARALLEL_BDDC;
3667142dfd88SStefano Zampini       }
3668*4fad6a16SStefano Zampini     } else {
3669*4fad6a16SStefano Zampini       if (dbg_flag) {
3670*4fad6a16SStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"Max number of levels reached. Using parallel direct solve for coarse problem\n",pcbddc->max_levels,pcbddc->active_procs,pcbddc->coarsening_ratio);CHKERRQ(ierr);
3671*4fad6a16SStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
3672*4fad6a16SStefano Zampini       }
3673*4fad6a16SStefano Zampini       pcbddc->coarse_problem_type = PARALLEL_BDDC;
3674*4fad6a16SStefano Zampini     }
3675*4fad6a16SStefano Zampini   }
3676beed3852SStefano Zampini 
36770c7d97c5SJed Brown   switch(pcbddc->coarse_problem_type){
36780c7d97c5SJed Brown 
3679da1bb401SStefano Zampini     case(MULTILEVEL_BDDC):   /* we define a coarse mesh where subdomains are elements */
36800c7d97c5SJed Brown     {
36810c7d97c5SJed Brown       /* we need additional variables */
36820c7d97c5SJed Brown       MetisInt    n_subdomains,n_parts,objval,ncon,faces_nvtxs;
36830c7d97c5SJed Brown       MetisInt    *metis_coarse_subdivision;
36840c7d97c5SJed Brown       MetisInt    options[METIS_NOPTIONS];
36850c7d97c5SJed Brown       PetscMPIInt size_coarse_comm,rank_coarse_comm;
36860c7d97c5SJed Brown       PetscMPIInt procs_jumps_coarse_comm;
36870c7d97c5SJed Brown       PetscMPIInt *coarse_subdivision;
36880c7d97c5SJed Brown       PetscMPIInt *total_count_recv;
36890c7d97c5SJed Brown       PetscMPIInt *total_ranks_recv;
36900c7d97c5SJed Brown       PetscMPIInt *displacements_recv;
36910c7d97c5SJed Brown       PetscMPIInt *my_faces_connectivity;
36920c7d97c5SJed Brown       PetscMPIInt *petsc_faces_adjncy;
36930c7d97c5SJed Brown       MetisInt    *faces_adjncy;
36940c7d97c5SJed Brown       MetisInt    *faces_xadj;
36950c7d97c5SJed Brown       PetscMPIInt *number_of_faces;
36960c7d97c5SJed Brown       PetscMPIInt *faces_displacements;
36970c7d97c5SJed Brown       PetscInt    *array_int;
36980c7d97c5SJed Brown       PetscMPIInt my_faces=0;
36990c7d97c5SJed Brown       PetscMPIInt total_faces=0;
37003828260eSStefano Zampini       PetscInt    ranks_stretching_ratio;
37010c7d97c5SJed Brown 
37020c7d97c5SJed Brown       /* define some quantities */
37030c7d97c5SJed Brown       pcbddc->coarse_communications_type = SCATTERS_BDDC;
37040c7d97c5SJed Brown       coarse_mat_type = MATIS;
37050c7d97c5SJed Brown       coarse_pc_type  = PCBDDC;
3706142dfd88SStefano Zampini       coarse_ksp_type = KSPRICHARDSON;
37070c7d97c5SJed Brown 
37080c7d97c5SJed Brown       /* details of coarse decomposition */
37090c7d97c5SJed Brown       n_subdomains = pcbddc->active_procs;
37100c7d97c5SJed Brown       n_parts      = n_subdomains/pcbddc->coarsening_ratio;
37113828260eSStefano Zampini       ranks_stretching_ratio = size_prec_comm/pcbddc->active_procs;
37123828260eSStefano Zampini       procs_jumps_coarse_comm = pcbddc->coarsening_ratio*ranks_stretching_ratio;
37133828260eSStefano Zampini 
3714*4fad6a16SStefano Zampini       /* build CSR graph of subdomains' connectivity */
37150c7d97c5SJed Brown       ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&array_int);CHKERRQ(ierr);
37163828260eSStefano Zampini       ierr = PetscMemzero(array_int,pcis->n*sizeof(PetscInt));CHKERRQ(ierr);
37170c7d97c5SJed Brown       for (i=1;i<pcis->n_neigh;i++){/* i=1 so I don't count myself -> faces nodes counts to 1 */
37180c7d97c5SJed Brown         for (j=0;j<pcis->n_shared[i];j++){
37190c7d97c5SJed Brown           array_int[ pcis->shared[i][j] ]+=1;
37200c7d97c5SJed Brown         }
37210c7d97c5SJed Brown       }
37220c7d97c5SJed Brown       for (i=1;i<pcis->n_neigh;i++){
37230c7d97c5SJed Brown         for (j=0;j<pcis->n_shared[i];j++){
3724*4fad6a16SStefano Zampini           if (array_int[ pcis->shared[i][j] ] > 0 ){
37250c7d97c5SJed Brown             my_faces++;
37260c7d97c5SJed Brown             break;
37270c7d97c5SJed Brown           }
37280c7d97c5SJed Brown         }
37290c7d97c5SJed Brown       }
37300c7d97c5SJed Brown 
373153cdbc3dSStefano Zampini       ierr = MPI_Reduce(&my_faces,&total_faces,1,MPIU_INT,MPI_SUM,master_proc,prec_comm);CHKERRQ(ierr);
37320c7d97c5SJed Brown       ierr = PetscMalloc (my_faces*sizeof(PetscInt),&my_faces_connectivity);CHKERRQ(ierr);
37330c7d97c5SJed Brown       my_faces=0;
37340c7d97c5SJed Brown       for (i=1;i<pcis->n_neigh;i++){
37350c7d97c5SJed Brown         for (j=0;j<pcis->n_shared[i];j++){
3736*4fad6a16SStefano Zampini           if (array_int[ pcis->shared[i][j] ] > 0 ){
37370c7d97c5SJed Brown             my_faces_connectivity[my_faces]=pcis->neigh[i];
37380c7d97c5SJed Brown             my_faces++;
37390c7d97c5SJed Brown             break;
37400c7d97c5SJed Brown           }
37410c7d97c5SJed Brown         }
37420c7d97c5SJed Brown       }
37430c7d97c5SJed Brown       if (rank_prec_comm == master_proc) {
37440c7d97c5SJed Brown         ierr = PetscMalloc (total_faces*sizeof(PetscMPIInt),&petsc_faces_adjncy);CHKERRQ(ierr);
37450c7d97c5SJed Brown         ierr = PetscMalloc (size_prec_comm*sizeof(PetscMPIInt),&number_of_faces);CHKERRQ(ierr);
37460c7d97c5SJed Brown         ierr = PetscMalloc (total_faces*sizeof(MetisInt),&faces_adjncy);CHKERRQ(ierr);
37470c7d97c5SJed Brown         ierr = PetscMalloc ((n_subdomains+1)*sizeof(MetisInt),&faces_xadj);CHKERRQ(ierr);
37480c7d97c5SJed Brown         ierr = PetscMalloc ((size_prec_comm+1)*sizeof(PetscMPIInt),&faces_displacements);CHKERRQ(ierr);
37490c7d97c5SJed Brown       }
375053cdbc3dSStefano Zampini       ierr = MPI_Gather(&my_faces,1,MPIU_INT,&number_of_faces[0],1,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
37510c7d97c5SJed Brown       if (rank_prec_comm == master_proc) {
37520c7d97c5SJed Brown         faces_xadj[0]=0;
37530c7d97c5SJed Brown         faces_displacements[0]=0;
37540c7d97c5SJed Brown         j=0;
37550c7d97c5SJed Brown         for (i=1;i<size_prec_comm+1;i++) {
37560c7d97c5SJed Brown           faces_displacements[i]=faces_displacements[i-1]+number_of_faces[i-1];
37570c7d97c5SJed Brown           if (number_of_faces[i-1]) {
37580c7d97c5SJed Brown             j++;
37590c7d97c5SJed Brown             faces_xadj[j]=faces_xadj[j-1]+number_of_faces[i-1];
37600c7d97c5SJed Brown           }
37610c7d97c5SJed Brown         }
37620c7d97c5SJed Brown       }
376353cdbc3dSStefano Zampini       ierr = MPI_Gatherv(&my_faces_connectivity[0],my_faces,MPIU_INT,&petsc_faces_adjncy[0],number_of_faces,faces_displacements,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
37640c7d97c5SJed Brown       ierr = PetscFree(my_faces_connectivity);CHKERRQ(ierr);
37650c7d97c5SJed Brown       ierr = PetscFree(array_int);CHKERRQ(ierr);
37660c7d97c5SJed Brown       if (rank_prec_comm == master_proc) {
37673828260eSStefano Zampini         for (i=0;i<total_faces;i++) faces_adjncy[i]=(MetisInt)(petsc_faces_adjncy[i]/ranks_stretching_ratio); /* cast to MetisInt */
3768da1bb401SStefano Zampini         /*printf("This is the face connectivity (actual ranks)\n");
37690c7d97c5SJed Brown         for (i=0;i<n_subdomains;i++){
37700c7d97c5SJed Brown           printf("proc %d is connected with \n",i);
37710c7d97c5SJed Brown           for (j=faces_xadj[i];j<faces_xadj[i+1];j++)
37720c7d97c5SJed Brown             printf("%d ",faces_adjncy[j]);
37730c7d97c5SJed Brown           printf("\n");
3774da1bb401SStefano Zampini         }*/
37750c7d97c5SJed Brown         ierr = PetscFree(faces_displacements);CHKERRQ(ierr);
37760c7d97c5SJed Brown         ierr = PetscFree(number_of_faces);CHKERRQ(ierr);
37770c7d97c5SJed Brown         ierr = PetscFree(petsc_faces_adjncy);CHKERRQ(ierr);
37780c7d97c5SJed Brown       }
37790c7d97c5SJed Brown 
37800c7d97c5SJed Brown       if ( rank_prec_comm == master_proc ) {
37810c7d97c5SJed Brown 
37823828260eSStefano Zampini         PetscInt heuristic_for_metis=3;
37833828260eSStefano Zampini 
37840c7d97c5SJed Brown         ncon=1;
37850c7d97c5SJed Brown         faces_nvtxs=n_subdomains;
37860c7d97c5SJed Brown         /* partition graph induced by face connectivity */
37870c7d97c5SJed Brown         ierr = PetscMalloc (n_subdomains*sizeof(MetisInt),&metis_coarse_subdivision);CHKERRQ(ierr);
37880c7d97c5SJed Brown         ierr = METIS_SetDefaultOptions(options);
37890c7d97c5SJed Brown         /* we need a contiguous partition of the coarse mesh */
37900c7d97c5SJed Brown         options[METIS_OPTION_CONTIG]=1;
37910c7d97c5SJed Brown         options[METIS_OPTION_NITER]=30;
3792*4fad6a16SStefano Zampini         if (pcbddc->coarsening_ratio > 1) {
37933828260eSStefano Zampini           if (n_subdomains>n_parts*heuristic_for_metis) {
37943828260eSStefano Zampini             options[METIS_OPTION_IPTYPE]=METIS_IPTYPE_EDGE;
37953828260eSStefano Zampini             options[METIS_OPTION_OBJTYPE]=METIS_OBJTYPE_CUT;
37960c7d97c5SJed Brown             ierr = METIS_PartGraphKway(&faces_nvtxs,&ncon,faces_xadj,faces_adjncy,NULL,NULL,NULL,&n_parts,NULL,NULL,options,&objval,metis_coarse_subdivision);
3797142dfd88SStefano Zampini             if (ierr != METIS_OK) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in METIS_PartGraphKway (metis error code %D) called from PCBDDCSetupCoarseEnvironment\n",ierr);
37983828260eSStefano Zampini           } else {
37993828260eSStefano Zampini             ierr = METIS_PartGraphRecursive(&faces_nvtxs,&ncon,faces_xadj,faces_adjncy,NULL,NULL,NULL,&n_parts,NULL,NULL,options,&objval,metis_coarse_subdivision);
3800142dfd88SStefano Zampini             if (ierr != METIS_OK) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in METIS_PartGraphRecursive (metis error code %D) called from PCBDDCSetupCoarseEnvironment\n",ierr);
38013828260eSStefano Zampini           }
3802*4fad6a16SStefano Zampini         } else {
3803*4fad6a16SStefano Zampini           for (i=0;i<n_subdomains;i++) {
3804*4fad6a16SStefano Zampini             metis_coarse_subdivision[i]=i;
3805*4fad6a16SStefano Zampini           }
3806*4fad6a16SStefano Zampini         }
38070c7d97c5SJed Brown         ierr = PetscFree(faces_xadj);CHKERRQ(ierr);
38080c7d97c5SJed Brown         ierr = PetscFree(faces_adjncy);CHKERRQ(ierr);
38090bdf917eSStefano Zampini         ierr = PetscMalloc(size_prec_comm*sizeof(PetscMPIInt),&coarse_subdivision);CHKERRQ(ierr);
38100c7d97c5SJed Brown         /* copy/cast values avoiding possible type conflicts between PETSc, MPI and METIS */
38110bdf917eSStefano Zampini         for (i=0;i<size_prec_comm;i++) { coarse_subdivision[i]=MPI_PROC_NULL; }
38120bdf917eSStefano Zampini         for (i=0;i<n_subdomains;i++)   { coarse_subdivision[ranks_stretching_ratio*i]=(PetscInt)(metis_coarse_subdivision[i]); }
38130c7d97c5SJed Brown         ierr = PetscFree(metis_coarse_subdivision);CHKERRQ(ierr);
38140c7d97c5SJed Brown       }
38150c7d97c5SJed Brown 
38160c7d97c5SJed Brown       /* Create new communicator for coarse problem splitting the old one */
38170c7d97c5SJed Brown       if ( !(rank_prec_comm%procs_jumps_coarse_comm) && rank_prec_comm < procs_jumps_coarse_comm*n_parts ){
3818da1bb401SStefano Zampini         coarse_color=0;              /* for communicator splitting */
3819da1bb401SStefano Zampini         active_rank=rank_prec_comm;  /* for insertion of matrix values */
38200c7d97c5SJed Brown       }
3821da1bb401SStefano Zampini       /* procs with coarse_color = MPI_UNDEFINED will have coarse_comm = MPI_COMM_NULL (from mpi standards)
3822da1bb401SStefano Zampini          key = rank_prec_comm -> keep same ordering of ranks from the old to the new communicator */
382353cdbc3dSStefano Zampini       ierr = MPI_Comm_split(prec_comm,coarse_color,rank_prec_comm,&coarse_comm);CHKERRQ(ierr);
38240c7d97c5SJed Brown 
38250c7d97c5SJed Brown       if ( coarse_color == 0 ) {
382653cdbc3dSStefano Zampini         ierr = MPI_Comm_size(coarse_comm,&size_coarse_comm);CHKERRQ(ierr);
382753cdbc3dSStefano Zampini         ierr = MPI_Comm_rank(coarse_comm,&rank_coarse_comm);CHKERRQ(ierr);
38280c7d97c5SJed Brown       } else {
38290c7d97c5SJed Brown         rank_coarse_comm = MPI_PROC_NULL;
38300c7d97c5SJed Brown       }
38310c7d97c5SJed Brown 
38320c7d97c5SJed Brown       /* master proc takes care of arranging and distributing coarse information */
38330c7d97c5SJed Brown       if (rank_coarse_comm == master_proc) {
38340c7d97c5SJed Brown         ierr = PetscMalloc (size_coarse_comm*sizeof(PetscMPIInt),&displacements_recv);CHKERRQ(ierr);
38350bdf917eSStefano Zampini         ierr = PetscMalloc (size_coarse_comm*sizeof(PetscMPIInt),&total_count_recv);CHKERRQ(ierr);
38360bdf917eSStefano Zampini         ierr = PetscMalloc (n_subdomains*sizeof(PetscMPIInt),&total_ranks_recv);CHKERRQ(ierr);
38370c7d97c5SJed Brown         /* some initializations */
38380c7d97c5SJed Brown         displacements_recv[0]=0;
38390bdf917eSStefano Zampini         ierr = PetscMemzero(total_count_recv,size_coarse_comm*sizeof(PetscMPIInt));CHKERRQ(ierr);
38400c7d97c5SJed Brown         /* count from how many processes the j-th process of the coarse decomposition will receive data */
38410bdf917eSStefano Zampini         for (j=0;j<size_coarse_comm;j++) {
38420bdf917eSStefano Zampini           for (i=0;i<size_prec_comm;i++) {
38430bdf917eSStefano Zampini             if (coarse_subdivision[i]==j) {
38440c7d97c5SJed Brown               total_count_recv[j]++;
38450bdf917eSStefano Zampini             }
38460bdf917eSStefano Zampini           }
38470bdf917eSStefano Zampini         }
38480c7d97c5SJed Brown         /* displacements needed for scatterv of total_ranks_recv */
38490bdf917eSStefano Zampini         for (i=1;i<size_coarse_comm;i++) { displacements_recv[i]=displacements_recv[i-1]+total_count_recv[i-1]; }
38500c7d97c5SJed Brown         /* Now fill properly total_ranks_recv -> each coarse process will receive the ranks (in prec_comm communicator) of its friend (sending) processes */
38510c7d97c5SJed Brown         ierr = PetscMemzero(total_count_recv,size_coarse_comm*sizeof(PetscMPIInt));CHKERRQ(ierr);
38520c7d97c5SJed Brown         for (j=0;j<size_coarse_comm;j++) {
38533828260eSStefano Zampini           for (i=0;i<size_prec_comm;i++) {
38540c7d97c5SJed Brown             if (coarse_subdivision[i]==j) {
38550c7d97c5SJed Brown               total_ranks_recv[displacements_recv[j]+total_count_recv[j]]=i;
38563828260eSStefano Zampini               total_count_recv[j]+=1;
38570c7d97c5SJed Brown             }
38580c7d97c5SJed Brown           }
38590c7d97c5SJed Brown         }
3860da1bb401SStefano Zampini         /*for (j=0;j<size_coarse_comm;j++) {
38613828260eSStefano Zampini           printf("process %d in new rank will receive from %d processes (original ranks follows)\n",j,total_count_recv[j]);
38623828260eSStefano Zampini           for (i=0;i<total_count_recv[j];i++) {
38633828260eSStefano Zampini             printf("%d ",total_ranks_recv[displacements_recv[j]+i]);
38643828260eSStefano Zampini           }
38653828260eSStefano Zampini           printf("\n");
3866da1bb401SStefano Zampini         }*/
38670c7d97c5SJed Brown 
38680c7d97c5SJed Brown         /* identify new decomposition in terms of ranks in the old communicator */
38690bdf917eSStefano Zampini         for (i=0;i<n_subdomains;i++) {
38700bdf917eSStefano Zampini           coarse_subdivision[ranks_stretching_ratio*i]=coarse_subdivision[ranks_stretching_ratio*i]*procs_jumps_coarse_comm;
38710bdf917eSStefano Zampini         }
3872da1bb401SStefano Zampini         /*printf("coarse_subdivision in old end new ranks\n");
38730c7d97c5SJed Brown         for (i=0;i<size_prec_comm;i++)
38743828260eSStefano Zampini           if (coarse_subdivision[i]!=MPI_PROC_NULL) {
38753828260eSStefano Zampini             printf("%d=(%d %d), ",i,coarse_subdivision[i],coarse_subdivision[i]/procs_jumps_coarse_comm);
38763828260eSStefano Zampini           } else {
38773828260eSStefano Zampini             printf("%d=(%d %d), ",i,coarse_subdivision[i],coarse_subdivision[i]);
38783828260eSStefano Zampini           }
3879da1bb401SStefano Zampini         printf("\n");*/
38800c7d97c5SJed Brown       }
38810c7d97c5SJed Brown 
38820c7d97c5SJed Brown       /* Scatter new decomposition for send details */
388353cdbc3dSStefano Zampini       ierr = MPI_Scatter(&coarse_subdivision[0],1,MPIU_INT,&rank_coarse_proc_send_to,1,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
38840c7d97c5SJed Brown       /* Scatter receiving details to members of coarse decomposition */
38850c7d97c5SJed Brown       if ( coarse_color == 0) {
388653cdbc3dSStefano Zampini         ierr = MPI_Scatter(&total_count_recv[0],1,MPIU_INT,&count_recv,1,MPIU_INT,master_proc,coarse_comm);CHKERRQ(ierr);
38870c7d97c5SJed Brown         ierr = PetscMalloc (count_recv*sizeof(PetscMPIInt),&ranks_recv);CHKERRQ(ierr);
388853cdbc3dSStefano Zampini         ierr = MPI_Scatterv(&total_ranks_recv[0],total_count_recv,displacements_recv,MPIU_INT,&ranks_recv[0],count_recv,MPIU_INT,master_proc,coarse_comm);CHKERRQ(ierr);
38890c7d97c5SJed Brown       }
38900c7d97c5SJed Brown 
3891da1bb401SStefano Zampini       /*printf("I will send my matrix data to proc  %d\n",rank_coarse_proc_send_to);
3892da1bb401SStefano Zampini       if (coarse_color == 0) {
3893da1bb401SStefano Zampini         printf("I will receive some matrix data from %d processes (ranks follows)\n",count_recv);
3894da1bb401SStefano Zampini         for (i=0;i<count_recv;i++)
3895da1bb401SStefano Zampini           printf("%d ",ranks_recv[i]);
3896da1bb401SStefano Zampini         printf("\n");
3897da1bb401SStefano Zampini       }*/
38980c7d97c5SJed Brown 
38990c7d97c5SJed Brown       if (rank_prec_comm == master_proc) {
39000bdf917eSStefano Zampini         ierr = PetscFree(coarse_subdivision);CHKERRQ(ierr);
3901da1bb401SStefano Zampini         ierr = PetscFree(total_count_recv);CHKERRQ(ierr);
39020bdf917eSStefano Zampini         ierr = PetscFree(total_ranks_recv);CHKERRQ(ierr);
39030c7d97c5SJed Brown         ierr = PetscFree(displacements_recv);CHKERRQ(ierr);
39040c7d97c5SJed Brown       }
39050c7d97c5SJed Brown       break;
39060c7d97c5SJed Brown     }
39070c7d97c5SJed Brown 
39080c7d97c5SJed Brown     case(REPLICATED_BDDC):
39090c7d97c5SJed Brown 
39100c7d97c5SJed Brown       pcbddc->coarse_communications_type = GATHERS_BDDC;
39110c7d97c5SJed Brown       coarse_mat_type = MATSEQAIJ;
39120c7d97c5SJed Brown       coarse_pc_type  = PCLU;
391353cdbc3dSStefano Zampini       coarse_ksp_type  = KSPPREONLY;
39140c7d97c5SJed Brown       coarse_comm = PETSC_COMM_SELF;
39150c7d97c5SJed Brown       active_rank = rank_prec_comm;
39160c7d97c5SJed Brown       break;
39170c7d97c5SJed Brown 
39180c7d97c5SJed Brown     case(PARALLEL_BDDC):
39190c7d97c5SJed Brown 
39200c7d97c5SJed Brown       pcbddc->coarse_communications_type = SCATTERS_BDDC;
39210c7d97c5SJed Brown       coarse_mat_type = MATMPIAIJ;
39220c7d97c5SJed Brown       coarse_pc_type  = PCREDUNDANT;
392353cdbc3dSStefano Zampini       coarse_ksp_type  = KSPPREONLY;
39240c7d97c5SJed Brown       coarse_comm = prec_comm;
39250c7d97c5SJed Brown       active_rank = rank_prec_comm;
39260c7d97c5SJed Brown       break;
39270c7d97c5SJed Brown 
39280c7d97c5SJed Brown     case(SEQUENTIAL_BDDC):
39290c7d97c5SJed Brown       pcbddc->coarse_communications_type = GATHERS_BDDC;
39300c7d97c5SJed Brown       coarse_mat_type = MATSEQAIJ;
39310c7d97c5SJed Brown       coarse_pc_type = PCLU;
393253cdbc3dSStefano Zampini       coarse_ksp_type  = KSPPREONLY;
39330c7d97c5SJed Brown       coarse_comm = PETSC_COMM_SELF;
39340c7d97c5SJed Brown       active_rank = master_proc;
39350c7d97c5SJed Brown       break;
39360c7d97c5SJed Brown   }
39370c7d97c5SJed Brown 
39380c7d97c5SJed Brown   switch(pcbddc->coarse_communications_type){
39390c7d97c5SJed Brown 
39400c7d97c5SJed Brown     case(SCATTERS_BDDC):
39410c7d97c5SJed Brown       {
39420c7d97c5SJed Brown         if (pcbddc->coarse_problem_type==MULTILEVEL_BDDC) {
39430c7d97c5SJed Brown 
39440c7d97c5SJed Brown           PetscMPIInt send_size;
39450c7d97c5SJed Brown           PetscInt    *aux_ins_indices;
39460c7d97c5SJed Brown           PetscInt    ii,jj;
39470c7d97c5SJed Brown           MPI_Request *requests;
39480c7d97c5SJed Brown 
3949*4fad6a16SStefano Zampini           if(pcbddc->coarsening_ratio == 1) {
3950*4fad6a16SStefano Zampini             ins_local_primal_size = pcbddc->local_primal_size;
3951*4fad6a16SStefano Zampini             ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr);
3952*4fad6a16SStefano Zampini             ierr = PetscMemcpy(ins_local_primal_indices,pcbddc->local_primal_indices,ins_local_primal_size*sizeof(PetscInt));CHKERRQ(ierr);
3953*4fad6a16SStefano Zampini             ierr = PetscMalloc(ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar),&ins_coarse_mat_vals);CHKERRQ(ierr);
3954*4fad6a16SStefano Zampini             ierr = PetscMemcpy(ins_coarse_mat_vals,coarse_submat_vals,ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar));CHKERRQ(ierr);
3955*4fad6a16SStefano Zampini           } else {
39560c7d97c5SJed Brown             /* allocate auxiliary space */
39575619798eSStefano Zampini             ierr = PetscMalloc (pcbddc->replicated_primal_size*sizeof(PetscMPIInt),&pcbddc->replicated_local_primal_indices);CHKERRQ(ierr);
39585619798eSStefano Zampini             ierr = MPI_Allgatherv(&pcbddc->local_primal_indices[0],pcbddc->local_primal_size,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,prec_comm);CHKERRQ(ierr);
39590c7d97c5SJed Brown             ierr = PetscMalloc ( pcbddc->coarse_size*sizeof(PetscInt),&aux_ins_indices);CHKERRQ(ierr);
39600c7d97c5SJed Brown             ierr = PetscMemzero(aux_ins_indices,pcbddc->coarse_size*sizeof(PetscInt));CHKERRQ(ierr);
39610c7d97c5SJed Brown             /* allocate storage for message passing */
39620c7d97c5SJed Brown             ierr = PetscMalloc ( (count_recv+1)*sizeof(MPI_Request),&requests);CHKERRQ(ierr);
39630c7d97c5SJed Brown             for (i=0;i<count_recv+1;i++) requests[i]=MPI_REQUEST_NULL;
39640c7d97c5SJed Brown             ierr = PetscMalloc ( count_recv*sizeof(PetscMPIInt),&localsizes2);CHKERRQ(ierr);
39650c7d97c5SJed Brown             ierr = PetscMalloc ( count_recv*sizeof(PetscMPIInt),&localdispl2);CHKERRQ(ierr);
39660c7d97c5SJed Brown             /* fill up quantities */
39670c7d97c5SJed Brown             j=0;
39680c7d97c5SJed Brown             for (i=0;i<count_recv;i++){
39690c7d97c5SJed Brown               ii = ranks_recv[i];
39700c7d97c5SJed Brown               localsizes2[i]=pcbddc->local_primal_sizes[ii]*pcbddc->local_primal_sizes[ii];
39710c7d97c5SJed Brown               localdispl2[i]=j;
39720c7d97c5SJed Brown               j+=localsizes2[i];
39730c7d97c5SJed Brown               jj = pcbddc->local_primal_displacements[ii];
3974*4fad6a16SStefano Zampini               /* it counts the coarse subdomains sharing the coarse node */
3975*4fad6a16SStefano Zampini               for (k=0;k<pcbddc->local_primal_sizes[ii];k++) {
3976*4fad6a16SStefano Zampini                 aux_ins_indices[pcbddc->replicated_local_primal_indices[jj+k]]+=1;
39770c7d97c5SJed Brown               }
3978*4fad6a16SStefano Zampini             }
39790c7d97c5SJed Brown             /* temp_coarse_mat_vals used to store temporarily received matrix values */
39800c7d97c5SJed Brown             ierr = PetscMalloc ( j*sizeof(PetscScalar),&temp_coarse_mat_vals);CHKERRQ(ierr);
39810c7d97c5SJed Brown             /* evaluate how many values I will insert in coarse mat */
39820c7d97c5SJed Brown             ins_local_primal_size=0;
3983ea7e1babSStefano Zampini             for (i=0;i<pcbddc->coarse_size;i++){
3984ea7e1babSStefano Zampini               if (aux_ins_indices[i]){
39850c7d97c5SJed Brown                 ins_local_primal_size++;
3986ea7e1babSStefano Zampini               }
3987ea7e1babSStefano Zampini             }
39880c7d97c5SJed Brown             /* evaluate indices I will insert in coarse mat */
39890c7d97c5SJed Brown             ierr = PetscMalloc ( ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr);
39900c7d97c5SJed Brown             j=0;
3991ea7e1babSStefano Zampini             for (i=0;i<pcbddc->coarse_size;i++){
3992ea7e1babSStefano Zampini               if (aux_ins_indices[i]){
39930c7d97c5SJed Brown                 ins_local_primal_indices[j++]=i;
3994ea7e1babSStefano Zampini               }
3995ea7e1babSStefano Zampini             }
39960c7d97c5SJed Brown             /* use aux_ins_indices to realize a global to local mapping */
39970c7d97c5SJed Brown             j=0;
39980c7d97c5SJed Brown             for (i=0;i<pcbddc->coarse_size;i++){
39990c7d97c5SJed Brown               if (aux_ins_indices[i]==0){
40000c7d97c5SJed Brown                 aux_ins_indices[i]=-1;
40010c7d97c5SJed Brown               } else {
40020c7d97c5SJed Brown                 aux_ins_indices[i]=j;
40030c7d97c5SJed Brown                 j++;
40040c7d97c5SJed Brown               }
40050c7d97c5SJed Brown             }
40060c7d97c5SJed Brown 
40070c7d97c5SJed Brown             /* processes participating in coarse problem receive matrix data from their friends */
4008*4fad6a16SStefano Zampini             for (i=0;i<count_recv;i++) {
4009*4fad6a16SStefano Zampini               ierr = MPI_Irecv(&temp_coarse_mat_vals[localdispl2[i]],localsizes2[i],MPIU_SCALAR,ranks_recv[i],666,prec_comm,&requests[i]);CHKERRQ(ierr); }
40100c7d97c5SJed Brown             if (rank_coarse_proc_send_to != MPI_PROC_NULL ) {
40110c7d97c5SJed Brown               send_size=pcbddc->local_primal_size*pcbddc->local_primal_size;
401253cdbc3dSStefano Zampini               ierr = MPI_Isend(&coarse_submat_vals[0],send_size,MPIU_SCALAR,rank_coarse_proc_send_to,666,prec_comm,&requests[count_recv]);CHKERRQ(ierr);
40130c7d97c5SJed Brown             }
401453cdbc3dSStefano Zampini             ierr = MPI_Waitall(count_recv+1,requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
40150c7d97c5SJed Brown 
40160c7d97c5SJed Brown             /* calculate data to insert in coarse mat */
40170c7d97c5SJed Brown             ierr = PetscMalloc ( ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar),&ins_coarse_mat_vals);CHKERRQ(ierr);
40180c7d97c5SJed Brown             PetscMemzero(ins_coarse_mat_vals,ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar));
40190c7d97c5SJed Brown 
40200c7d97c5SJed Brown             PetscMPIInt rr,kk,lps,lpd;
40210c7d97c5SJed Brown             PetscInt row_ind,col_ind;
40220c7d97c5SJed Brown             for (k=0;k<count_recv;k++){
40230c7d97c5SJed Brown               rr = ranks_recv[k];
40240c7d97c5SJed Brown               kk = localdispl2[k];
40250c7d97c5SJed Brown               lps = pcbddc->local_primal_sizes[rr];
40260c7d97c5SJed Brown               lpd = pcbddc->local_primal_displacements[rr];
40270c7d97c5SJed Brown               for (j=0;j<lps;j++){
40280c7d97c5SJed Brown                 col_ind=aux_ins_indices[pcbddc->replicated_local_primal_indices[lpd+j]];
40290c7d97c5SJed Brown                 for (i=0;i<lps;i++){
40300c7d97c5SJed Brown                   row_ind=aux_ins_indices[pcbddc->replicated_local_primal_indices[lpd+i]];
40310c7d97c5SJed Brown                   ins_coarse_mat_vals[col_ind*ins_local_primal_size+row_ind]+=temp_coarse_mat_vals[kk+j*lps+i];
40320c7d97c5SJed Brown                 }
40330c7d97c5SJed Brown               }
40340c7d97c5SJed Brown             }
40350c7d97c5SJed Brown             ierr = PetscFree(requests);CHKERRQ(ierr);
40360c7d97c5SJed Brown             ierr = PetscFree(aux_ins_indices);CHKERRQ(ierr);
40370c7d97c5SJed Brown             ierr = PetscFree(temp_coarse_mat_vals);CHKERRQ(ierr);
40380c7d97c5SJed Brown             if (coarse_color == 0) { ierr = PetscFree(ranks_recv);CHKERRQ(ierr); }
4039*4fad6a16SStefano Zampini           }
40400c7d97c5SJed Brown 
40410c7d97c5SJed Brown           /* create local to global mapping needed by coarse MATIS */
40420c7d97c5SJed Brown           {
40430c7d97c5SJed Brown             IS coarse_IS;
4044142dfd88SStefano Zampini             if (coarse_comm != MPI_COMM_NULL ) {ierr = MPI_Comm_free(&coarse_comm);CHKERRQ(ierr);}
40450c7d97c5SJed Brown             coarse_comm = prec_comm;
40460c7d97c5SJed Brown             active_rank=rank_prec_comm;
40470c7d97c5SJed Brown             ierr = ISCreateGeneral(coarse_comm,ins_local_primal_size,ins_local_primal_indices,PETSC_COPY_VALUES,&coarse_IS);CHKERRQ(ierr);
40480c7d97c5SJed Brown             ierr = ISLocalToGlobalMappingCreateIS(coarse_IS,&coarse_ISLG);CHKERRQ(ierr);
40490c7d97c5SJed Brown             ierr = ISDestroy(&coarse_IS);CHKERRQ(ierr);
40500c7d97c5SJed Brown           }
40510c7d97c5SJed Brown         }
40520c7d97c5SJed Brown         if (pcbddc->coarse_problem_type==PARALLEL_BDDC) {
40530c7d97c5SJed Brown           /* arrays for values insertion */
40540c7d97c5SJed Brown           ins_local_primal_size = pcbddc->local_primal_size;
40550c7d97c5SJed Brown           ierr = PetscMalloc ( ins_local_primal_size*sizeof(PetscMPIInt),&ins_local_primal_indices);CHKERRQ(ierr);
40560c7d97c5SJed Brown           ierr = PetscMalloc ( ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar),&ins_coarse_mat_vals);CHKERRQ(ierr);
40570c7d97c5SJed Brown           for (j=0;j<ins_local_primal_size;j++){
40580c7d97c5SJed Brown             ins_local_primal_indices[j]=pcbddc->local_primal_indices[j];
4059*4fad6a16SStefano Zampini             for (i=0;i<ins_local_primal_size;i++) {
4060*4fad6a16SStefano Zampini               ins_coarse_mat_vals[j*ins_local_primal_size+i]=coarse_submat_vals[j*ins_local_primal_size+i];
4061*4fad6a16SStefano Zampini             }
40620c7d97c5SJed Brown           }
40630c7d97c5SJed Brown         }
40640c7d97c5SJed Brown         break;
40650c7d97c5SJed Brown 
40660c7d97c5SJed Brown     }
40670c7d97c5SJed Brown 
40680c7d97c5SJed Brown     case(GATHERS_BDDC):
40690c7d97c5SJed Brown       {
40700c7d97c5SJed Brown 
40710c7d97c5SJed Brown         PetscMPIInt mysize,mysize2;
40720c7d97c5SJed Brown 
40730c7d97c5SJed Brown         if (rank_prec_comm==active_rank) {
40740c7d97c5SJed Brown           ierr = PetscMalloc ( pcbddc->replicated_primal_size*sizeof(PetscMPIInt),&pcbddc->replicated_local_primal_indices);CHKERRQ(ierr);
40750bdf917eSStefano Zampini           ierr = PetscMalloc ( pcbddc->replicated_primal_size*sizeof(PetscScalar),&pcbddc->replicated_local_primal_values);CHKERRQ(ierr);
40760c7d97c5SJed Brown           ierr = PetscMalloc ( size_prec_comm*sizeof(PetscMPIInt),&localsizes2);CHKERRQ(ierr);
40770c7d97c5SJed Brown           ierr = PetscMalloc ( size_prec_comm*sizeof(PetscMPIInt),&localdispl2);CHKERRQ(ierr);
40780c7d97c5SJed Brown           /* arrays for values insertion */
4079*4fad6a16SStefano Zampini           for (i=0;i<size_prec_comm;i++) { localsizes2[i]=pcbddc->local_primal_sizes[i]*pcbddc->local_primal_sizes[i]; }
40800c7d97c5SJed Brown           localdispl2[0]=0;
4081*4fad6a16SStefano Zampini           for (i=1;i<size_prec_comm;i++) { localdispl2[i]=localsizes2[i-1]+localdispl2[i-1]; }
40820c7d97c5SJed Brown           j=0;
4083*4fad6a16SStefano Zampini           for (i=0;i<size_prec_comm;i++) { j+=localsizes2[i]; }
40840c7d97c5SJed Brown           ierr = PetscMalloc ( j*sizeof(PetscScalar),&temp_coarse_mat_vals);CHKERRQ(ierr);
40850c7d97c5SJed Brown         }
40860c7d97c5SJed Brown 
40870c7d97c5SJed Brown         mysize=pcbddc->local_primal_size;
40880c7d97c5SJed Brown         mysize2=pcbddc->local_primal_size*pcbddc->local_primal_size;
40890c7d97c5SJed Brown         if (pcbddc->coarse_problem_type == SEQUENTIAL_BDDC){
409053cdbc3dSStefano Zampini           ierr = MPI_Gatherv(&pcbddc->local_primal_indices[0],mysize,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
409153cdbc3dSStefano Zampini           ierr = MPI_Gatherv(&coarse_submat_vals[0],mysize2,MPIU_SCALAR,&temp_coarse_mat_vals[0],localsizes2,localdispl2,MPIU_SCALAR,master_proc,prec_comm);CHKERRQ(ierr);
40920c7d97c5SJed Brown         } else {
409353cdbc3dSStefano Zampini           ierr = MPI_Allgatherv(&pcbddc->local_primal_indices[0],mysize,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,prec_comm);CHKERRQ(ierr);
409453cdbc3dSStefano Zampini           ierr = MPI_Allgatherv(&coarse_submat_vals[0],mysize2,MPIU_SCALAR,&temp_coarse_mat_vals[0],localsizes2,localdispl2,MPIU_SCALAR,prec_comm);CHKERRQ(ierr);
40950c7d97c5SJed Brown         }
40960c7d97c5SJed Brown         break;
4097da1bb401SStefano Zampini       }/* switch on coarse problem and communications associated with finished */
40980c7d97c5SJed Brown   }
40990c7d97c5SJed Brown 
41000c7d97c5SJed Brown   /* Now create and fill up coarse matrix */
41010c7d97c5SJed Brown   if ( rank_prec_comm == active_rank ) {
4102142dfd88SStefano Zampini 
4103142dfd88SStefano Zampini     Mat matis_coarse_local_mat;
4104142dfd88SStefano Zampini 
41050c7d97c5SJed Brown     if (pcbddc->coarse_problem_type != MULTILEVEL_BDDC) {
41060c7d97c5SJed Brown       ierr = MatCreate(coarse_comm,&pcbddc->coarse_mat);CHKERRQ(ierr);
41070c7d97c5SJed Brown       ierr = MatSetSizes(pcbddc->coarse_mat,PETSC_DECIDE,PETSC_DECIDE,pcbddc->coarse_size,pcbddc->coarse_size);CHKERRQ(ierr);
41080c7d97c5SJed Brown       ierr = MatSetType(pcbddc->coarse_mat,coarse_mat_type);CHKERRQ(ierr);
41093b03a366Sstefano_zampini       ierr = MatSetUp(pcbddc->coarse_mat);CHKERRQ(ierr);
4110da1bb401SStefano Zampini       ierr = MatSetOption(pcbddc->coarse_mat,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr); /* local values stored in column major */
41113b03a366Sstefano_zampini       ierr = MatSetOption(pcbddc->coarse_mat,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr);
41120c7d97c5SJed Brown     } else {
4113*4fad6a16SStefano Zampini       ierr = MatCreateIS(coarse_comm,1,PETSC_DECIDE,PETSC_DECIDE,pcbddc->coarse_size,pcbddc->coarse_size,coarse_ISLG,&pcbddc->coarse_mat);CHKERRQ(ierr);
41143b03a366Sstefano_zampini       ierr = MatSetUp(pcbddc->coarse_mat);CHKERRQ(ierr);
41150c7d97c5SJed Brown       ierr = MatISGetLocalMat(pcbddc->coarse_mat,&matis_coarse_local_mat);CHKERRQ(ierr);
41163b03a366Sstefano_zampini       ierr = MatSetUp(matis_coarse_local_mat);CHKERRQ(ierr);
4117da1bb401SStefano Zampini       ierr = MatSetOption(matis_coarse_local_mat,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr); /* local values stored in column major */
4118a0ba757dSStefano Zampini       ierr = MatSetOption(matis_coarse_local_mat,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr);
41190c7d97c5SJed Brown     }
4120142dfd88SStefano Zampini     /* preallocation */
4121142dfd88SStefano Zampini     if (pcbddc->coarse_problem_type != MULTILEVEL_BDDC) {
4122142dfd88SStefano Zampini       PetscInt *dnz,*onz;
4123142dfd88SStefano Zampini       PetscInt lrows,lcols;
4124142dfd88SStefano Zampini       ierr = MatGetLocalSize(pcbddc->coarse_mat,&lrows,&lcols);CHKERRQ(ierr);
4125142dfd88SStefano Zampini       ierr = MatPreallocateInitialize(coarse_comm,lrows,lcols,dnz,onz);CHKERRQ(ierr);
4126142dfd88SStefano Zampini       if (pcbddc->coarse_problem_type == PARALLEL_BDDC) {
4127142dfd88SStefano Zampini         PetscInt coarse_index_row,coarse_index_col,start_row,owner;
4128142dfd88SStefano Zampini         PetscMPIInt *auxpreall_displs;
4129142dfd88SStefano Zampini         PetscMPIInt *auxpreall_sizes;
4130142dfd88SStefano Zampini         PetscMPIInt *auxpreall_dnz;
4131142dfd88SStefano Zampini         PetscMPIInt *auxpreall_onz;
4132142dfd88SStefano Zampini         PetscInt    *auxpreall_ownership;
4133142dfd88SStefano Zampini         if (rank_prec_comm == 0) {
4134142dfd88SStefano Zampini           ierr = PetscMalloc((size_prec_comm+1)*sizeof(PetscMPIInt),&auxpreall_displs);CHKERRQ(ierr);
4135142dfd88SStefano Zampini           auxpreall_displs[size_prec_comm]=pcbddc->coarse_size;
4136142dfd88SStefano Zampini           ierr = PetscMalloc(size_prec_comm*sizeof(PetscMPIInt),&auxpreall_sizes);CHKERRQ(ierr);
4137142dfd88SStefano Zampini           ierr = PetscMalloc(pcbddc->coarse_size*sizeof(PetscMPIInt),&auxpreall_dnz);CHKERRQ(ierr);
4138142dfd88SStefano Zampini           ierr = PetscMemzero(auxpreall_dnz,pcbddc->coarse_size*sizeof(PetscMPIInt));CHKERRQ(ierr);
4139142dfd88SStefano Zampini           ierr = PetscMalloc(pcbddc->coarse_size*sizeof(PetscMPIInt),&auxpreall_onz);CHKERRQ(ierr);
4140142dfd88SStefano Zampini           ierr = PetscMemzero(auxpreall_onz,pcbddc->coarse_size*sizeof(PetscMPIInt));CHKERRQ(ierr);
4141142dfd88SStefano Zampini           ierr = PetscMalloc(pcbddc->coarse_size*sizeof(PetscInt),&auxpreall_ownership);CHKERRQ(ierr);
4142142dfd88SStefano Zampini         }
4143142dfd88SStefano Zampini         ierr = MatGetOwnershipRange(pcbddc->coarse_mat,&start_row,PETSC_NULL);CHKERRQ(ierr);
4144142dfd88SStefano Zampini         ierr = MPI_Gather(&start_row,1,MPIU_INT,auxpreall_displs,1,MPIU_INT,0,prec_comm);CHKERRQ(ierr);
4145142dfd88SStefano Zampini         if (rank_prec_comm == 0) {
4146142dfd88SStefano Zampini           k=0;
4147142dfd88SStefano Zampini           for (i=0;i<size_prec_comm;i++) {
4148142dfd88SStefano Zampini             auxpreall_sizes[i]=auxpreall_displs[i+1]-auxpreall_displs[i];
4149142dfd88SStefano Zampini             for (j=0;j<auxpreall_sizes[i];j++) {
4150142dfd88SStefano Zampini               auxpreall_ownership[auxpreall_displs[i]+j]=i;
4151142dfd88SStefano Zampini             }
4152142dfd88SStefano Zampini           }
4153142dfd88SStefano Zampini           for (i=0;i<size_prec_comm;i++) {
4154142dfd88SStefano Zampini             for (j=0;j<pcbddc->local_primal_sizes[i];j++) {
4155142dfd88SStefano Zampini               coarse_index_row=auxglobal_primal[j+pcbddc->local_primal_displacements[i]];
4156142dfd88SStefano Zampini               for (k=j;k<pcbddc->local_primal_sizes[i];k++) {
4157142dfd88SStefano Zampini                 coarse_index_col=auxglobal_primal[k+pcbddc->local_primal_displacements[i]];
4158142dfd88SStefano Zampini                 owner = auxpreall_ownership[coarse_index_row];
4159142dfd88SStefano Zampini                 if (coarse_index_col>auxpreall_displs[owner]-1 && coarse_index_col < auxpreall_displs[owner]+auxpreall_sizes[owner]) {
4160142dfd88SStefano Zampini                   auxpreall_dnz[coarse_index_row]++;
4161142dfd88SStefano Zampini                 } else {
4162142dfd88SStefano Zampini                   auxpreall_onz[coarse_index_row]++;
4163142dfd88SStefano Zampini                 }
4164142dfd88SStefano Zampini                 if (k != j) {
4165142dfd88SStefano Zampini                   owner = auxpreall_ownership[coarse_index_col];
4166142dfd88SStefano Zampini                   if (coarse_index_row>auxpreall_displs[owner]-1 && coarse_index_row < auxpreall_displs[owner]+auxpreall_sizes[owner]) {
4167142dfd88SStefano Zampini                     auxpreall_dnz[coarse_index_col]++;
4168142dfd88SStefano Zampini                   } else {
4169142dfd88SStefano Zampini                     auxpreall_onz[coarse_index_col]++;
4170142dfd88SStefano Zampini                   }
4171142dfd88SStefano Zampini                 }
4172142dfd88SStefano Zampini               }
4173142dfd88SStefano Zampini             }
4174142dfd88SStefano Zampini           }
4175142dfd88SStefano Zampini         }
4176142dfd88SStefano Zampini         ierr = MPI_Scatterv(auxpreall_dnz,auxpreall_sizes,auxpreall_displs,MPIU_INT,
4177142dfd88SStefano Zampini                             dnz,lrows,MPIU_INT,0,prec_comm);
4178142dfd88SStefano Zampini         ierr = MPI_Scatterv(auxpreall_onz,auxpreall_sizes,auxpreall_displs,MPIU_INT,
4179142dfd88SStefano Zampini                             onz,lrows,MPIU_INT,0,prec_comm);
4180142dfd88SStefano Zampini         if (rank_prec_comm == 0) {
4181142dfd88SStefano Zampini           ierr = PetscFree(auxpreall_displs);CHKERRQ(ierr);
4182142dfd88SStefano Zampini           ierr = PetscFree(auxpreall_sizes);CHKERRQ(ierr);
4183142dfd88SStefano Zampini           ierr = PetscFree(auxpreall_dnz);CHKERRQ(ierr);
4184142dfd88SStefano Zampini           ierr = PetscFree(auxpreall_onz);CHKERRQ(ierr);
4185142dfd88SStefano Zampini           ierr = PetscFree(auxpreall_ownership);CHKERRQ(ierr);
4186142dfd88SStefano Zampini         }
4187142dfd88SStefano Zampini       } else {
4188142dfd88SStefano Zampini         for (k=0;k<size_prec_comm;k++){
4189142dfd88SStefano Zampini           offset=pcbddc->local_primal_displacements[k];
4190142dfd88SStefano Zampini           offset2=localdispl2[k];
4191142dfd88SStefano Zampini           ins_local_primal_size = pcbddc->local_primal_sizes[k];
4192142dfd88SStefano Zampini           ins_local_primal_indices = &pcbddc->replicated_local_primal_indices[offset];
4193142dfd88SStefano Zampini           for (j=0;j<ins_local_primal_size;j++) {
4194142dfd88SStefano Zampini             ierr = MatPreallocateSet(ins_local_primal_indices[j],ins_local_primal_size,ins_local_primal_indices,dnz,onz);CHKERRQ(ierr);
4195142dfd88SStefano Zampini           }
4196142dfd88SStefano Zampini         }
4197142dfd88SStefano Zampini       }
4198142dfd88SStefano Zampini       /* check */
4199142dfd88SStefano Zampini       for (i=0;i<lrows;i++) {
4200142dfd88SStefano Zampini         if (dnz[i]>lcols) {
4201142dfd88SStefano Zampini           dnz[i]=lcols;
4202142dfd88SStefano Zampini         }
4203142dfd88SStefano Zampini         if (onz[i]>pcbddc->coarse_size-lcols) {
4204142dfd88SStefano Zampini           onz[i]=pcbddc->coarse_size-lcols;
4205142dfd88SStefano Zampini         }
4206142dfd88SStefano Zampini       }
4207142dfd88SStefano Zampini       ierr = MatSeqAIJSetPreallocation(pcbddc->coarse_mat,PETSC_NULL,dnz);CHKERRQ(ierr);
4208142dfd88SStefano Zampini       ierr = MatMPIAIJSetPreallocation(pcbddc->coarse_mat,PETSC_NULL,dnz,PETSC_NULL,onz);CHKERRQ(ierr);
4209142dfd88SStefano Zampini       ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr);
4210142dfd88SStefano Zampini     } else {
4211142dfd88SStefano Zampini       ierr = MatSeqAIJSetPreallocation(matis_coarse_local_mat,ins_local_primal_size,PETSC_NULL);CHKERRQ(ierr);
4212142dfd88SStefano Zampini     }
4213142dfd88SStefano Zampini     if (rank_prec_comm == 0) { ierr = PetscFree(auxglobal_primal);CHKERRQ(ierr); }
4214142dfd88SStefano Zampini     /* insert values */
4215ea7e1babSStefano Zampini     if (pcbddc->coarse_communications_type != GATHERS_BDDC) {
42160c7d97c5SJed Brown       ierr = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,ADD_VALUES);CHKERRQ(ierr);
4217ea7e1babSStefano Zampini     } else {
4218ea7e1babSStefano Zampini       for (k=0;k<size_prec_comm;k++){
4219ea7e1babSStefano Zampini         offset=pcbddc->local_primal_displacements[k];
4220ea7e1babSStefano Zampini         offset2=localdispl2[k];
4221ea7e1babSStefano Zampini         ins_local_primal_size = pcbddc->local_primal_sizes[k];
4222ea7e1babSStefano Zampini         ins_local_primal_indices = &pcbddc->replicated_local_primal_indices[offset];
4223ea7e1babSStefano Zampini         ins_coarse_mat_vals = &temp_coarse_mat_vals[offset2];
4224ea7e1babSStefano Zampini         ierr = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,ADD_VALUES);CHKERRQ(ierr);
4225ea7e1babSStefano Zampini       }
4226ea7e1babSStefano Zampini       ins_local_primal_indices = 0;
4227ea7e1babSStefano Zampini       ins_coarse_mat_vals = 0;
4228ea7e1babSStefano Zampini     }
42290c7d97c5SJed Brown     ierr = MatAssemblyBegin(pcbddc->coarse_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
42300c7d97c5SJed Brown     ierr = MatAssemblyEnd(pcbddc->coarse_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
4231142dfd88SStefano Zampini     /* symmetry of coarse matrix */
4232142dfd88SStefano Zampini     if (issym) {
4233142dfd88SStefano Zampini       ierr = MatSetOption(pcbddc->coarse_mat,MAT_SYMMETRIC,PETSC_TRUE);CHKERRQ(ierr);
4234142dfd88SStefano Zampini     }
42350c7d97c5SJed Brown     ierr = MatGetVecs(pcbddc->coarse_mat,&pcbddc->coarse_vec,&pcbddc->coarse_rhs);CHKERRQ(ierr);
42360bdf917eSStefano Zampini   }
42370bdf917eSStefano Zampini 
42380bdf917eSStefano Zampini   /* create loc to glob scatters if needed */
42390bdf917eSStefano Zampini   if (pcbddc->coarse_communications_type == SCATTERS_BDDC) {
42400bdf917eSStefano Zampini      IS local_IS,global_IS;
42410bdf917eSStefano Zampini      ierr = ISCreateStride(PETSC_COMM_SELF,pcbddc->local_primal_size,0,1,&local_IS);CHKERRQ(ierr);
42420bdf917eSStefano Zampini      ierr = ISCreateGeneral(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_indices,PETSC_COPY_VALUES,&global_IS);CHKERRQ(ierr);
42430bdf917eSStefano Zampini      ierr = VecScatterCreate(pcbddc->vec1_P,local_IS,pcbddc->coarse_vec,global_IS,&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr);
42440bdf917eSStefano Zampini      ierr = ISDestroy(&local_IS);CHKERRQ(ierr);
42450bdf917eSStefano Zampini      ierr = ISDestroy(&global_IS);CHKERRQ(ierr);
42460bdf917eSStefano Zampini   }
42470bdf917eSStefano Zampini 
42480bdf917eSStefano Zampini   /* Eval coarse null space */
42490bdf917eSStefano Zampini   if (pcbddc->NullSpace) {
42500bdf917eSStefano Zampini     const Vec      *nsp_vecs;
42510bdf917eSStefano Zampini     PetscInt       nsp_size,coarse_nsp_size;
42520bdf917eSStefano Zampini     PetscBool      nsp_has_cnst;
42530bdf917eSStefano Zampini     PetscReal      test_null;
42540bdf917eSStefano Zampini     Vec            *coarse_nsp_vecs;
42550bdf917eSStefano Zampini 
42560bdf917eSStefano Zampini     coarse_nsp_size = 0;
42570bdf917eSStefano Zampini     coarse_nsp_vecs = 0;
42580bdf917eSStefano Zampini     ierr = MatNullSpaceGetVecs(pcbddc->NullSpace,&nsp_has_cnst,&nsp_size,&nsp_vecs);CHKERRQ(ierr);
42590bdf917eSStefano Zampini     if (rank_prec_comm == active_rank) {
42600bdf917eSStefano Zampini       ierr = PetscMalloc((nsp_size+1)*sizeof(Vec),&coarse_nsp_vecs);CHKERRQ(ierr);
42610bdf917eSStefano Zampini       for (i=0;i<nsp_size+1;i++) {
42620bdf917eSStefano Zampini         ierr = VecDuplicate(pcbddc->coarse_vec,&coarse_nsp_vecs[i]);CHKERRQ(ierr);
42630bdf917eSStefano Zampini       }
42640bdf917eSStefano Zampini     }
42650bdf917eSStefano Zampini     if (nsp_has_cnst) {
42660bdf917eSStefano Zampini       ierr = VecSet(pcis->vec1_N,1.0);CHKERRQ(ierr);
42670bdf917eSStefano Zampini       ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr);
42680bdf917eSStefano Zampini       ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->vec1_P,pcbddc->coarse_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
42690bdf917eSStefano Zampini       ierr = PCBDDCScatterCoarseDataEnd(pc,pcbddc->vec1_P,pcbddc->coarse_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
42700bdf917eSStefano Zampini       if (rank_prec_comm == active_rank) {
42710bdf917eSStefano Zampini         ierr = MatMult(pcbddc->coarse_mat,pcbddc->coarse_vec,pcbddc->coarse_rhs);CHKERRQ(ierr);
42720bdf917eSStefano Zampini         ierr = VecNorm(pcbddc->coarse_rhs,NORM_INFINITY,&test_null);CHKERRQ(ierr);
42730bdf917eSStefano Zampini         if (test_null > 1.0e-12 && pcbddc->dbg_flag ) {
42740bdf917eSStefano Zampini           ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Constant coarse null space error % 1.14e\n",test_null);CHKERRQ(ierr);
42750bdf917eSStefano Zampini         }
42760bdf917eSStefano Zampini         ierr = VecCopy(pcbddc->coarse_vec,coarse_nsp_vecs[coarse_nsp_size]);CHKERRQ(ierr);
42770bdf917eSStefano Zampini         coarse_nsp_size++;
42780bdf917eSStefano Zampini       }
42790bdf917eSStefano Zampini     }
42800bdf917eSStefano Zampini     for (i=0;i<nsp_size;i++)  {
42810bdf917eSStefano Zampini       ierr = VecScatterBegin(matis->ctx,nsp_vecs[i],pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
42820bdf917eSStefano Zampini       ierr = VecScatterEnd  (matis->ctx,nsp_vecs[i],pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
42830bdf917eSStefano Zampini       ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr);
42840bdf917eSStefano Zampini       ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->vec1_P,pcbddc->coarse_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
42850bdf917eSStefano Zampini       ierr = PCBDDCScatterCoarseDataEnd(pc,pcbddc->vec1_P,pcbddc->coarse_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
42860bdf917eSStefano Zampini       if (rank_prec_comm == active_rank) {
42870bdf917eSStefano Zampini         ierr = MatMult(pcbddc->coarse_mat,pcbddc->coarse_vec,pcbddc->coarse_rhs);CHKERRQ(ierr);
42880bdf917eSStefano Zampini         ierr = VecNorm(pcbddc->coarse_rhs,NORM_2,&test_null);CHKERRQ(ierr);
42890bdf917eSStefano Zampini         if (test_null > 1.0e-12 && pcbddc->dbg_flag ) {
42900bdf917eSStefano Zampini           ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Vec %d coarse null space error % 1.14e\n",i,test_null);CHKERRQ(ierr);
42910bdf917eSStefano Zampini         }
42920bdf917eSStefano Zampini         ierr = VecCopy(pcbddc->coarse_vec,coarse_nsp_vecs[coarse_nsp_size]);CHKERRQ(ierr);
42930bdf917eSStefano Zampini         coarse_nsp_size++;
42940bdf917eSStefano Zampini       }
42950bdf917eSStefano Zampini     }
42960bdf917eSStefano Zampini     if (coarse_nsp_size > 0) {
42970bdf917eSStefano Zampini       /* TODO orthonormalize vecs */
42980bdf917eSStefano Zampini       ierr = VecNormalize(coarse_nsp_vecs[0],PETSC_NULL);CHKERRQ(ierr);
42990bdf917eSStefano Zampini       ierr = MatNullSpaceCreate(coarse_comm,PETSC_FALSE,coarse_nsp_size,coarse_nsp_vecs,&pcbddc->CoarseNullSpace);CHKERRQ(ierr);
43000bdf917eSStefano Zampini       for (i=0;i<nsp_size+1;i++) {
43010bdf917eSStefano Zampini         ierr = VecDestroy(&coarse_nsp_vecs[i]);CHKERRQ(ierr);
43020bdf917eSStefano Zampini       }
43030bdf917eSStefano Zampini     }
43040bdf917eSStefano Zampini     ierr = PetscFree(coarse_nsp_vecs);CHKERRQ(ierr);
43050bdf917eSStefano Zampini   }
43060bdf917eSStefano Zampini 
43070bdf917eSStefano Zampini   /* KSP for coarse problem */
43080bdf917eSStefano Zampini   if (rank_prec_comm == active_rank) {
43090bdf917eSStefano Zampini 
431053cdbc3dSStefano Zampini     ierr = KSPCreate(coarse_comm,&pcbddc->coarse_ksp);CHKERRQ(ierr);
431153cdbc3dSStefano Zampini     ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->coarse_ksp,(PetscObject)pc,1);CHKERRQ(ierr);
431253cdbc3dSStefano Zampini     ierr = KSPSetOperators(pcbddc->coarse_ksp,pcbddc->coarse_mat,pcbddc->coarse_mat,SAME_PRECONDITIONER);CHKERRQ(ierr);
43133b03a366Sstefano_zampini     ierr = KSPSetTolerances(pcbddc->coarse_ksp,PETSC_DEFAULT,PETSC_DEFAULT,PETSC_DEFAULT,max_it_coarse_ksp);CHKERRQ(ierr);
431453cdbc3dSStefano Zampini     ierr = KSPSetType(pcbddc->coarse_ksp,coarse_ksp_type);CHKERRQ(ierr);
431553cdbc3dSStefano Zampini     ierr = KSPGetPC(pcbddc->coarse_ksp,&pc_temp);CHKERRQ(ierr);
431653cdbc3dSStefano Zampini     ierr = PCSetType(pc_temp,coarse_pc_type);CHKERRQ(ierr);
43170c7d97c5SJed Brown     /* Allow user's customization */
4318da1bb401SStefano Zampini     ierr = KSPSetOptionsPrefix(pcbddc->coarse_ksp,"coarse_");CHKERRQ(ierr);
43190c7d97c5SJed Brown     /* Set Up PC for coarse problem BDDC */
432053cdbc3dSStefano Zampini     if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
4321*4fad6a16SStefano Zampini       i = pcbddc->current_level+1;
4322*4fad6a16SStefano Zampini       ierr = PCBDDCSetLevel(pc_temp,i);CHKERRQ(ierr);
4323*4fad6a16SStefano Zampini       ierr = PCBDDCSetCoarseningRatio(pc_temp,pcbddc->coarsening_ratio);CHKERRQ(ierr);
4324*4fad6a16SStefano Zampini       ierr = PCBDDCSetMaxLevels(pc_temp,pcbddc->max_levels);CHKERRQ(ierr);
432553cdbc3dSStefano Zampini       ierr = PCBDDCSetCoarseProblemType(pc_temp,MULTILEVEL_BDDC);CHKERRQ(ierr);
43260bdf917eSStefano Zampini       if (pcbddc->CoarseNullSpace) { ierr = PCBDDCSetNullSpace(pc_temp,pcbddc->CoarseNullSpace);CHKERRQ(ierr); }
4327e4886b5aSStefano Zampini       ierr = KSPSetNormType(pcbddc->coarse_ksp,KSP_NORM_NONE);CHKERRQ(ierr);
4328*4fad6a16SStefano Zampini       if (dbg_flag) {
4329*4fad6a16SStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"----------------Level %d: Setting up level %d---------------\n",pcbddc->current_level,i);CHKERRQ(ierr);
4330*4fad6a16SStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
433153cdbc3dSStefano Zampini       }
4332*4fad6a16SStefano Zampini     }
4333*4fad6a16SStefano Zampini     ierr = KSPSetFromOptions(pcbddc->coarse_ksp);CHKERRQ(ierr);
433453cdbc3dSStefano Zampini     ierr = KSPSetUp(pcbddc->coarse_ksp);CHKERRQ(ierr);
4335142dfd88SStefano Zampini 
43360bdf917eSStefano Zampini     if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
43370bdf917eSStefano Zampini       /* TODO: this is a hack! It needs to be solved! */
4338142dfd88SStefano Zampini       PC_BDDC*     coarse_pcbddc = (PC_BDDC*)pc_temp->data;
4339142dfd88SStefano Zampini       coarse_pcbddc->use_exact_dirichlet = PETSC_FALSE;
43405619798eSStefano Zampini       if (dbg_flag) {
4341*4fad6a16SStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"----------------Level %d set----------------------\n",i);CHKERRQ(ierr);
43425619798eSStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
43435619798eSStefano Zampini       }
43445619798eSStefano Zampini     }
43450c7d97c5SJed Brown   }
43463b03a366Sstefano_zampini   /* Evaluate condition number of coarse problem for cheby (and verbose output if requested) */
4347142dfd88SStefano Zampini   if ( dbg_flag && rank_prec_comm == active_rank ) {
4348142dfd88SStefano Zampini     KSP check_ksp;
4349142dfd88SStefano Zampini     PC  check_pc;
4350142dfd88SStefano Zampini     Vec check_vec;
4351142dfd88SStefano Zampini     PetscReal   abs_infty_error,infty_error,lambda_min,lambda_max;
4352142dfd88SStefano Zampini     const KSPType check_ksp_type;
43530c7d97c5SJed Brown 
4354142dfd88SStefano Zampini     /* Create ksp object suitable for extreme eigenvalues' estimation */
4355142dfd88SStefano Zampini     ierr = KSPCreate(coarse_comm,&check_ksp);CHKERRQ(ierr);
4356142dfd88SStefano Zampini     ierr = KSPSetOperators(check_ksp,pcbddc->coarse_mat,pcbddc->coarse_mat,SAME_PRECONDITIONER);CHKERRQ(ierr);
43570bdf917eSStefano Zampini     ierr = KSPSetTolerances(check_ksp,1.e-12,1.e-12,PETSC_DEFAULT,pcbddc->coarse_size);CHKERRQ(ierr);
4358142dfd88SStefano Zampini     if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
4359142dfd88SStefano Zampini       if (issym) {
4360142dfd88SStefano Zampini         check_ksp_type = KSPCG;
4361142dfd88SStefano Zampini       } else {
4362142dfd88SStefano Zampini         check_ksp_type = KSPGMRES;
4363142dfd88SStefano Zampini       }
4364142dfd88SStefano Zampini       ierr = KSPSetComputeSingularValues(check_ksp,PETSC_TRUE);CHKERRQ(ierr);
4365142dfd88SStefano Zampini     } else {
4366142dfd88SStefano Zampini       check_ksp_type = KSPPREONLY;
4367142dfd88SStefano Zampini     }
4368142dfd88SStefano Zampini     ierr = KSPSetType(check_ksp,check_ksp_type);CHKERRQ(ierr);
4369142dfd88SStefano Zampini     ierr = KSPGetPC(pcbddc->coarse_ksp,&check_pc);CHKERRQ(ierr);
4370142dfd88SStefano Zampini     ierr = KSPSetPC(check_ksp,check_pc);CHKERRQ(ierr);
4371142dfd88SStefano Zampini     ierr = KSPSetUp(check_ksp);CHKERRQ(ierr);
4372142dfd88SStefano Zampini     /* create random vec */
4373142dfd88SStefano Zampini     ierr = VecDuplicate(pcbddc->coarse_vec,&check_vec);CHKERRQ(ierr);
4374142dfd88SStefano Zampini     ierr = VecSetRandom(check_vec,PETSC_NULL);CHKERRQ(ierr);
43750bdf917eSStefano Zampini     if (pcbddc->CoarseNullSpace) { ierr = MatNullSpaceRemove(pcbddc->CoarseNullSpace,check_vec,PETSC_NULL);CHKERRQ(ierr); }
4376142dfd88SStefano Zampini     ierr = MatMult(pcbddc->coarse_mat,check_vec,pcbddc->coarse_rhs);CHKERRQ(ierr);
4377142dfd88SStefano Zampini     /* solve coarse problem */
4378142dfd88SStefano Zampini     ierr = KSPSolve(check_ksp,pcbddc->coarse_rhs,pcbddc->coarse_vec);CHKERRQ(ierr);
43790bdf917eSStefano Zampini     if (pcbddc->CoarseNullSpace) { ierr = MatNullSpaceRemove(pcbddc->CoarseNullSpace,pcbddc->coarse_vec,PETSC_NULL);CHKERRQ(ierr); }
4380142dfd88SStefano Zampini     /* check coarse problem residual error */
4381142dfd88SStefano Zampini     ierr = VecAXPY(check_vec,-1.0,pcbddc->coarse_vec);CHKERRQ(ierr);
4382142dfd88SStefano Zampini     ierr = VecNorm(check_vec,NORM_INFINITY,&infty_error);CHKERRQ(ierr);
4383142dfd88SStefano Zampini     ierr = MatMult(pcbddc->coarse_mat,check_vec,pcbddc->coarse_rhs);CHKERRQ(ierr);
4384142dfd88SStefano Zampini     ierr = VecNorm(pcbddc->coarse_rhs,NORM_INFINITY,&abs_infty_error);CHKERRQ(ierr);
4385142dfd88SStefano Zampini     ierr = VecDestroy(&check_vec);CHKERRQ(ierr);
4386142dfd88SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"Size of coarse problem %d\n",pcbddc->coarse_size);CHKERRQ(ierr);
4387142dfd88SStefano Zampini     /* get eigenvalue estimation if inexact */
4388142dfd88SStefano Zampini     if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
4389142dfd88SStefano Zampini       ierr = KSPComputeExtremeSingularValues(check_ksp,&lambda_max,&lambda_min);CHKERRQ(ierr);
4390142dfd88SStefano Zampini       ierr = KSPGetIterationNumber(check_ksp,&k);CHKERRQ(ierr);
4391142dfd88SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem eigenvalues estimated with %d iterations of %s.\n",k,check_ksp_type);CHKERRQ(ierr);
4392e269702eSStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem eigenvalues: % 1.14e %1.14e\n",lambda_min,lambda_max);CHKERRQ(ierr);
43933b03a366Sstefano_zampini     }
4394142dfd88SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem exact infty_error   : %1.14e\n",infty_error);CHKERRQ(ierr);
4395142dfd88SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem residual infty_error: %1.14e\n",abs_infty_error);CHKERRQ(ierr);
4396142dfd88SStefano Zampini     ierr = KSPDestroy(&check_ksp);CHKERRQ(ierr);
439753cdbc3dSStefano Zampini   }
4398142dfd88SStefano Zampini   if (dbg_flag) { ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); }
43990c7d97c5SJed Brown   /* free data structures no longer needed */
44000c7d97c5SJed Brown   if (coarse_ISLG)                { ierr = ISLocalToGlobalMappingDestroy(&coarse_ISLG);CHKERRQ(ierr); }
44010c7d97c5SJed Brown   if (ins_local_primal_indices)   { ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr);  }
44020c7d97c5SJed Brown   if (ins_coarse_mat_vals)        { ierr = PetscFree(ins_coarse_mat_vals);CHKERRQ(ierr);}
44030c7d97c5SJed Brown   if (localsizes2)                { ierr = PetscFree(localsizes2);CHKERRQ(ierr);}
44040c7d97c5SJed Brown   if (localdispl2)                { ierr = PetscFree(localdispl2);CHKERRQ(ierr);}
44050c7d97c5SJed Brown   if (temp_coarse_mat_vals)       { ierr = PetscFree(temp_coarse_mat_vals);CHKERRQ(ierr);}
44060c7d97c5SJed Brown 
44070c7d97c5SJed Brown   PetscFunctionReturn(0);
44080c7d97c5SJed Brown }
44090c7d97c5SJed Brown 
44100c7d97c5SJed Brown #undef __FUNCT__
44110c7d97c5SJed Brown #define __FUNCT__ "PCBDDCManageLocalBoundaries"
441253cdbc3dSStefano Zampini static PetscErrorCode PCBDDCManageLocalBoundaries(PC pc)
44130c7d97c5SJed Brown {
44140c7d97c5SJed Brown 
44150c7d97c5SJed Brown   PC_BDDC     *pcbddc = (PC_BDDC*)pc->data;
44160c7d97c5SJed Brown   PC_IS         *pcis = (PC_IS*)pc->data;
44170c7d97c5SJed Brown   Mat_IS      *matis  = (Mat_IS*)pc->pmat->data;
4418da1bb401SStefano Zampini   PCBDDCGraph mat_graph=pcbddc->mat_graph;
44193972b0daSStefano Zampini   PetscInt    *queue_in_global_numbering,*is_indices,*auxis;
44203b03a366Sstefano_zampini   PetscInt    bs,ierr,i,j,s,k,iindex,neumann_bsize,dirichlet_bsize;
4421da1bb401SStefano Zampini   PetscInt    total_counts,nodes_touched,where_values=1,vertex_size;
4422534831adSStefano Zampini   PetscMPIInt adapt_interface=0,adapt_interface_reduced=0,NEUMANNCNT=0;
4423da1bb401SStefano Zampini   PetscBool   same_set;
4424a0ba757dSStefano Zampini   MPI_Comm    interface_comm=((PetscObject)pc)->comm;
44253b03a366Sstefano_zampini   PetscBool   use_faces=PETSC_FALSE,use_edges=PETSC_FALSE;
44263b03a366Sstefano_zampini   const PetscInt *neumann_nodes;
44273b03a366Sstefano_zampini   const PetscInt *dirichlet_nodes;
4428a81d60d8SStefano Zampini   IS          used_IS,*custom_ISForDofs;
4429da1bb401SStefano Zampini   PetscScalar *array;
4430da1bb401SStefano Zampini   PetscScalar *array2;
4431da1bb401SStefano Zampini   PetscViewer viewer=pcbddc->dbg_viewer;
44320c7d97c5SJed Brown 
44330c7d97c5SJed Brown   PetscFunctionBegin;
4434da1bb401SStefano Zampini   /* Setup local adjacency graph */
4435da1bb401SStefano Zampini   mat_graph->nvtxs=pcis->n;
4436534831adSStefano Zampini   if (!mat_graph->xadj) { NEUMANNCNT = 1; }
4437da1bb401SStefano Zampini   ierr = PCBDDCSetupLocalAdjacencyGraph(pc);CHKERRQ(ierr);
4438a0ba757dSStefano Zampini   i = mat_graph->nvtxs;
4439a0ba757dSStefano Zampini   ierr = PetscMalloc4(i,PetscInt,&mat_graph->where,i,PetscInt,&mat_graph->count,i+1,PetscInt,&mat_graph->cptr,i,PetscInt,&mat_graph->queue);CHKERRQ(ierr);
44403972b0daSStefano Zampini   ierr = PetscMalloc2(i,PetscInt,&mat_graph->which_dof,i,PetscBool,&mat_graph->touched);CHKERRQ(ierr);
44413972b0daSStefano Zampini   ierr = PetscMalloc(i*sizeof(PetscInt),&queue_in_global_numbering);CHKERRQ(ierr);
4442a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->where,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
4443a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->count,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
4444a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->which_dof,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
4445a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->queue,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
44463828260eSStefano Zampini   ierr = PetscMemzero(mat_graph->cptr,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr);
4447a0ba757dSStefano Zampini 
4448a81d60d8SStefano Zampini   /* Setting dofs splitting in mat_graph->which_dof
4449a81d60d8SStefano Zampini      Get information about dofs' splitting if provided by the user
4450a81d60d8SStefano Zampini      Otherwise it assumes a constant block size */
4451a81d60d8SStefano Zampini   vertex_size=0;
4452a81d60d8SStefano Zampini   if (!pcbddc->n_ISForDofs) {
4453a81d60d8SStefano Zampini     ierr = MatGetBlockSize(matis->A,&bs);CHKERRQ(ierr);
4454a81d60d8SStefano Zampini     ierr = PetscMalloc(bs*sizeof(IS),&custom_ISForDofs);CHKERRQ(ierr);
4455a81d60d8SStefano Zampini     for (i=0;i<bs;i++) {
4456a81d60d8SStefano Zampini       ierr = ISCreateStride(PETSC_COMM_SELF,pcis->n/bs,i,bs,&custom_ISForDofs[i]);CHKERRQ(ierr);
4457a81d60d8SStefano Zampini     }
4458a81d60d8SStefano Zampini     ierr = PCBDDCSetDofsSplitting(pc,bs,custom_ISForDofs);CHKERRQ(ierr);
4459a81d60d8SStefano Zampini     vertex_size=1;
4460a81d60d8SStefano Zampini     /* remove my references to IS objects */
4461a81d60d8SStefano Zampini     for (i=0;i<bs;i++) {
4462a81d60d8SStefano Zampini       ierr = ISDestroy(&custom_ISForDofs[i]);CHKERRQ(ierr);
4463a81d60d8SStefano Zampini     }
4464a81d60d8SStefano Zampini     ierr = PetscFree(custom_ISForDofs);CHKERRQ(ierr);
4465a81d60d8SStefano Zampini   }
44669c0446d6SStefano Zampini   for (i=0;i<pcbddc->n_ISForDofs;i++) {
4467a81d60d8SStefano Zampini     ierr = ISGetSize(pcbddc->ISForDofs[i],&k);CHKERRQ(ierr);
44689c0446d6SStefano Zampini     ierr = ISGetIndices(pcbddc->ISForDofs[i],(const PetscInt**)&is_indices);CHKERRQ(ierr);
4469a81d60d8SStefano Zampini     for (j=0;j<k;j++) {
44709c0446d6SStefano Zampini       mat_graph->which_dof[is_indices[j]]=i;
44719c0446d6SStefano Zampini     }
44729c0446d6SStefano Zampini     ierr = ISRestoreIndices(pcbddc->ISForDofs[i],(const PetscInt**)&is_indices);CHKERRQ(ierr);
44739c0446d6SStefano Zampini   }
4474a81d60d8SStefano Zampini   /* use mat block size as vertex size if it has not been set yet */
4475a81d60d8SStefano Zampini   if (!vertex_size) {
44763b03a366Sstefano_zampini     ierr = MatGetBlockSize(matis->A,&vertex_size);CHKERRQ(ierr);
44770c7d97c5SJed Brown   }
4478a81d60d8SStefano Zampini 
44793b03a366Sstefano_zampini   /* count number of neigh per node */
44800c7d97c5SJed Brown   total_counts=0;
44813b03a366Sstefano_zampini   for (i=1;i<pcis->n_neigh;i++){
44820c7d97c5SJed Brown     s=pcis->n_shared[i];
44830c7d97c5SJed Brown     total_counts+=s;
448453cdbc3dSStefano Zampini     for (j=0;j<s;j++){
44850c7d97c5SJed Brown       mat_graph->count[pcis->shared[i][j]] += 1;
44860c7d97c5SJed Brown     }
44870c7d97c5SJed Brown   }
4488534831adSStefano Zampini   /* Take into account Neumann data -> it increments number of sharing subdomains for nodes lying on the interface */
448936e030ebSStefano Zampini   ierr = PCBDDCGetNeumannBoundaries(pc,&used_IS);CHKERRQ(ierr);
4490da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
4491da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
449236e030ebSStefano Zampini   if (used_IS) {
449336e030ebSStefano Zampini     ierr = ISGetSize(used_IS,&neumann_bsize);CHKERRQ(ierr);
449436e030ebSStefano Zampini     ierr = ISGetIndices(used_IS,&neumann_nodes);CHKERRQ(ierr);
449553cdbc3dSStefano Zampini     for (i=0;i<neumann_bsize;i++){
449653cdbc3dSStefano Zampini       iindex = neumann_nodes[i];
4497534831adSStefano Zampini       if (mat_graph->count[iindex] > NEUMANNCNT && array[iindex]==0.0){
449853cdbc3dSStefano Zampini         mat_graph->count[iindex]+=1;
44990c7d97c5SJed Brown         total_counts++;
4500da1bb401SStefano Zampini         array[iindex]=array[iindex]+1.0;
4501da1bb401SStefano Zampini       } else if (array[iindex]>0.0) {
4502da1bb401SStefano Zampini         SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"Error for neumann nodes provided to BDDC! They must be uniquely listed! Found duplicate node %d\n",iindex);
45030c7d97c5SJed Brown       }
45040c7d97c5SJed Brown     }
45050c7d97c5SJed Brown   }
4506da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4507da1bb401SStefano Zampini   /* allocate space for storing the set of neighbours for each node */
4508da1bb401SStefano Zampini   ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt*),&mat_graph->neighbours_set);CHKERRQ(ierr);
4509da1bb401SStefano Zampini   if (mat_graph->nvtxs) { ierr = PetscMalloc(total_counts*sizeof(PetscInt),&mat_graph->neighbours_set[0]);CHKERRQ(ierr); }
4510da1bb401SStefano Zampini   for (i=1;i<mat_graph->nvtxs;i++) mat_graph->neighbours_set[i]=mat_graph->neighbours_set[i-1]+mat_graph->count[i-1];
4511a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->count,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
45123b03a366Sstefano_zampini   for (i=1;i<pcis->n_neigh;i++){
45130c7d97c5SJed Brown     s=pcis->n_shared[i];
45140c7d97c5SJed Brown     for (j=0;j<s;j++) {
45150c7d97c5SJed Brown       k=pcis->shared[i][j];
4516da1bb401SStefano Zampini       mat_graph->neighbours_set[k][mat_graph->count[k]] = pcis->neigh[i];
45170c7d97c5SJed Brown       mat_graph->count[k]+=1;
45180c7d97c5SJed Brown     }
45190c7d97c5SJed Brown   }
4520da1bb401SStefano Zampini   /* Check consistency of Neumann nodes */
4521da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
4522da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4523da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4524da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4525da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4526da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
45273b03a366Sstefano_zampini   /* set -1 fake neighbour to mimic Neumann boundary */
452836e030ebSStefano Zampini   if (used_IS) {
452953cdbc3dSStefano Zampini     for (i=0;i<neumann_bsize;i++){
453053cdbc3dSStefano Zampini       iindex = neumann_nodes[i];
4531534831adSStefano Zampini       if (mat_graph->count[iindex] > NEUMANNCNT){
4532da1bb401SStefano Zampini         if (mat_graph->count[iindex]+1 != (PetscInt)array[iindex]) {
4533da1bb401SStefano Zampini           SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_USER,"Neumann nodes provided to BDDC must be consistent among neighbours!\nNode %d: number of sharing subdomains %d != number of subdomains for which it is a neumann node %d\n",iindex,mat_graph->count[iindex]+1,(PetscInt)array[iindex]);
4534da1bb401SStefano Zampini         }
4535da1bb401SStefano Zampini         mat_graph->neighbours_set[iindex][mat_graph->count[iindex]] = -1;
453653cdbc3dSStefano Zampini         mat_graph->count[iindex]+=1;
45370c7d97c5SJed Brown       }
45380c7d97c5SJed Brown     }
453936e030ebSStefano Zampini     ierr = ISRestoreIndices(used_IS,&neumann_nodes);CHKERRQ(ierr);
45400c7d97c5SJed Brown   }
4541da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4542da1bb401SStefano Zampini   /* sort set of sharing subdomains */
4543da1bb401SStefano Zampini   for (i=0;i<mat_graph->nvtxs;i++) { ierr = PetscSortInt(mat_graph->count[i],mat_graph->neighbours_set[i]);CHKERRQ(ierr); }
45443b03a366Sstefano_zampini   /* remove interior nodes and dirichlet boundary nodes from the next search into the graph */
4545da1bb401SStefano Zampini   for (i=0;i<mat_graph->nvtxs;i++){mat_graph->touched[i]=PETSC_FALSE;}
4546da1bb401SStefano Zampini   nodes_touched=0;
454736e030ebSStefano Zampini   ierr = PCBDDCGetDirichletBoundaries(pc,&used_IS);CHKERRQ(ierr);
4548da1bb401SStefano Zampini   ierr = VecSet(pcis->vec2_N,0.0);CHKERRQ(ierr);
4549da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4550da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
4551da1bb401SStefano Zampini   if (used_IS) {
4552da1bb401SStefano Zampini     ierr = ISGetSize(used_IS,&dirichlet_bsize);CHKERRQ(ierr);
4553da1bb401SStefano Zampini     if (dirichlet_bsize && matis->pure_neumann) {
4554da1bb401SStefano Zampini       SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"Dirichlet boundaries are intended to be used with matrices with zeroed rows!\n");
4555da1bb401SStefano Zampini     }
4556da1bb401SStefano Zampini     ierr = ISGetIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
4557da1bb401SStefano Zampini     for (i=0;i<dirichlet_bsize;i++){
4558da1bb401SStefano Zampini       iindex=dirichlet_nodes[i];
4559da1bb401SStefano Zampini       if (mat_graph->count[iindex] && !mat_graph->touched[iindex]) {
4560da1bb401SStefano Zampini         if (array[iindex]>0.0) {
4561da1bb401SStefano Zampini           SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"BDDC cannot have nodes which are marked as Neumann and Dirichlet at the same time! Wrong node %d\n",iindex);
4562da1bb401SStefano Zampini         }
4563da1bb401SStefano Zampini         mat_graph->touched[iindex]=PETSC_TRUE;
4564da1bb401SStefano Zampini         mat_graph->where[iindex]=0;
4565da1bb401SStefano Zampini         nodes_touched++;
4566da1bb401SStefano Zampini         array2[iindex]=array2[iindex]+1.0;
4567da1bb401SStefano Zampini       }
4568da1bb401SStefano Zampini     }
4569da1bb401SStefano Zampini     ierr = ISRestoreIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
4570da1bb401SStefano Zampini   }
4571da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4572da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
4573da1bb401SStefano Zampini   /* Check consistency of Dirichlet nodes */
4574da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_N,1.0);CHKERRQ(ierr);
4575da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
4576da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4577da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4578da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4579da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4580da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
4581da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec2_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4582da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec2_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4583da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4584da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4585da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4586da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
458736e030ebSStefano Zampini   if (used_IS) {
458836e030ebSStefano Zampini     ierr = ISGetSize(used_IS,&dirichlet_bsize);CHKERRQ(ierr);
458936e030ebSStefano Zampini     ierr = ISGetIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
45903b03a366Sstefano_zampini     for (i=0;i<dirichlet_bsize;i++){
4591da1bb401SStefano Zampini       iindex=dirichlet_nodes[i];
4592da1bb401SStefano Zampini       if (array[iindex]>1.0 && array[iindex]!=array2[iindex] ) {
4593da1bb401SStefano Zampini          SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_USER,"Dirichlet nodes provided to BDDC must be consistent among neighbours!\nNode %d: number of sharing subdomains %d != number of subdomains for which it is a neumann node %d\n",iindex,(PetscInt)array[iindex],(PetscInt)array2[iindex]);
4594da1bb401SStefano Zampini       }
45953b03a366Sstefano_zampini     }
459636e030ebSStefano Zampini     ierr = ISRestoreIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
45973b03a366Sstefano_zampini   }
4598da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4599da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
4600da1bb401SStefano Zampini 
46010c7d97c5SJed Brown   for (i=0;i<mat_graph->nvtxs;i++){
46023b03a366Sstefano_zampini     if (!mat_graph->count[i]){  /* interior nodes */
46030c7d97c5SJed Brown       mat_graph->touched[i]=PETSC_TRUE;
46040c7d97c5SJed Brown       mat_graph->where[i]=0;
46050c7d97c5SJed Brown       nodes_touched++;
46060c7d97c5SJed Brown     }
46070c7d97c5SJed Brown   }
46080c7d97c5SJed Brown   mat_graph->ncmps = 0;
4609da1bb401SStefano Zampini   i=0;
46100c7d97c5SJed Brown   while(nodes_touched<mat_graph->nvtxs) {
4611a0ba757dSStefano Zampini     /*  find first untouched node in local ordering */
46120c7d97c5SJed Brown     while(mat_graph->touched[i]) i++;
46130c7d97c5SJed Brown     mat_graph->touched[i]=PETSC_TRUE;
4614a0ba757dSStefano Zampini     mat_graph->where[i]=where_values;
46150c7d97c5SJed Brown     nodes_touched++;
4616a0ba757dSStefano Zampini     /* now find all other nodes having the same set of sharing subdomains */
46170c7d97c5SJed Brown     for (j=i+1;j<mat_graph->nvtxs;j++){
4618a0ba757dSStefano Zampini       /* check for same number of sharing subdomains and dof number */
4619da1bb401SStefano Zampini       if (!mat_graph->touched[j] && mat_graph->count[i]==mat_graph->count[j] && mat_graph->which_dof[i] == mat_graph->which_dof[j] ){
4620a0ba757dSStefano Zampini         /* check for same set of sharing subdomains */
46210c7d97c5SJed Brown         same_set=PETSC_TRUE;
46220c7d97c5SJed Brown         for (k=0;k<mat_graph->count[j];k++){
4623da1bb401SStefano Zampini           if (mat_graph->neighbours_set[i][k]!=mat_graph->neighbours_set[j][k]) {
46240c7d97c5SJed Brown             same_set=PETSC_FALSE;
46250c7d97c5SJed Brown           }
46260c7d97c5SJed Brown         }
4627a0ba757dSStefano Zampini         /* I found a friend of mine */
46280c7d97c5SJed Brown         if (same_set) {
4629a0ba757dSStefano Zampini           mat_graph->where[j]=where_values;
46300c7d97c5SJed Brown           mat_graph->touched[j]=PETSC_TRUE;
46310c7d97c5SJed Brown           nodes_touched++;
46320c7d97c5SJed Brown         }
46330c7d97c5SJed Brown       }
46340c7d97c5SJed Brown     }
4635a0ba757dSStefano Zampini     where_values++;
46360c7d97c5SJed Brown   }
4637a0ba757dSStefano Zampini   where_values--; if (where_values<0) where_values=0;
4638a0ba757dSStefano Zampini   ierr = PetscMalloc(where_values*sizeof(PetscMPIInt),&mat_graph->where_ncmps);CHKERRQ(ierr);
4639a0ba757dSStefano Zampini   /* Find connected components defined on the shared interface */
4640a0ba757dSStefano Zampini   if (where_values) {
4641a0ba757dSStefano Zampini     ierr = PCBDDCFindConnectedComponents(mat_graph, where_values);
46423b03a366Sstefano_zampini     /* For consistency among neighbouring procs, I need to sort (by global ordering) each connected component */
4643a0ba757dSStefano Zampini     for (i=0;i<mat_graph->ncmps;i++) {
4644a0ba757dSStefano Zampini       ierr = ISLocalToGlobalMappingApply(matis->mapping,mat_graph->cptr[i+1]-mat_graph->cptr[i],&mat_graph->queue[mat_graph->cptr[i]],&queue_in_global_numbering[mat_graph->cptr[i]]);CHKERRQ(ierr);
4645a0ba757dSStefano Zampini       ierr = PetscSortIntWithArray(mat_graph->cptr[i+1]-mat_graph->cptr[i],&queue_in_global_numbering[mat_graph->cptr[i]],&mat_graph->queue[mat_graph->cptr[i]]);CHKERRQ(ierr);
4646a0ba757dSStefano Zampini     }
4647a0ba757dSStefano Zampini   }
4648a0ba757dSStefano Zampini   /* check consistency of connected components among neighbouring subdomains -> adapt them if needed */
4649a0ba757dSStefano Zampini   for (i=0;i<where_values;i++) {
46503b03a366Sstefano_zampini     /* We are not sure that two connected components will be the same among subdomains sharing a subset of local interface */
46513b03a366Sstefano_zampini     if (mat_graph->where_ncmps[i]>1) {
4652a0ba757dSStefano Zampini       adapt_interface=1;
4653a0ba757dSStefano Zampini       break;
4654a0ba757dSStefano Zampini     }
4655a0ba757dSStefano Zampini   }
4656a0ba757dSStefano Zampini   ierr = MPI_Allreduce(&adapt_interface,&adapt_interface_reduced,1,MPIU_INT,MPI_LOR,interface_comm);CHKERRQ(ierr);
4657da1bb401SStefano Zampini   if (pcbddc->dbg_flag && adapt_interface_reduced) {
4658d8923723SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"Adapting interface\n");CHKERRQ(ierr);
4659da1bb401SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
4660da1bb401SStefano Zampini   }
4661a0ba757dSStefano Zampini   if (where_values && adapt_interface_reduced) {
46620c7d97c5SJed Brown 
4663a0ba757dSStefano Zampini     PetscInt sum_requests=0,my_rank;
4664a0ba757dSStefano Zampini     PetscInt buffer_size,start_of_recv,size_of_recv,start_of_send;
4665a0ba757dSStefano Zampini     PetscInt temp_buffer_size,ins_val,global_where_counter;
4666a0ba757dSStefano Zampini     PetscInt *cum_recv_counts;
4667a0ba757dSStefano Zampini     PetscInt *where_to_nodes_indices;
4668a0ba757dSStefano Zampini     PetscInt *petsc_buffer;
4669a0ba757dSStefano Zampini     PetscMPIInt *recv_buffer;
4670a0ba757dSStefano Zampini     PetscMPIInt *recv_buffer_where;
4671a0ba757dSStefano Zampini     PetscMPIInt *send_buffer;
4672a0ba757dSStefano Zampini     PetscMPIInt size_of_send;
4673a0ba757dSStefano Zampini     PetscInt *sizes_of_sends;
4674a0ba757dSStefano Zampini     MPI_Request *send_requests;
4675a0ba757dSStefano Zampini     MPI_Request *recv_requests;
4676a0ba757dSStefano Zampini     PetscInt *where_cc_adapt;
4677a0ba757dSStefano Zampini     PetscInt **temp_buffer;
4678a0ba757dSStefano Zampini     PetscInt *nodes_to_temp_buffer_indices;
4679a0ba757dSStefano Zampini     PetscInt *add_to_where;
4680a0ba757dSStefano Zampini 
4681a0ba757dSStefano Zampini     ierr = MPI_Comm_rank(interface_comm,&my_rank);CHKERRQ(ierr);
4682a0ba757dSStefano Zampini     ierr = PetscMalloc((where_values+1)*sizeof(PetscInt),&cum_recv_counts);CHKERRQ(ierr);
4683a0ba757dSStefano Zampini     ierr = PetscMemzero(cum_recv_counts,(where_values+1)*sizeof(PetscInt));CHKERRQ(ierr);
4684a0ba757dSStefano Zampini     ierr = PetscMalloc(where_values*sizeof(PetscInt),&where_to_nodes_indices);CHKERRQ(ierr);
4685a0ba757dSStefano Zampini     /* first count how many neighbours per connected component I will receive from */
4686a0ba757dSStefano Zampini     cum_recv_counts[0]=0;
4687a0ba757dSStefano Zampini     for (i=1;i<where_values+1;i++){
4688a0ba757dSStefano Zampini       j=0;
4689d8923723SStefano Zampini       while(mat_graph->where[j] != i) { j++; }
4690a0ba757dSStefano Zampini       where_to_nodes_indices[i-1]=j;
4691da1bb401SStefano Zampini       if (mat_graph->neighbours_set[j][0]!=-1) { cum_recv_counts[i]=cum_recv_counts[i-1]+mat_graph->count[j]; } /* We don't want sends/recvs_to/from_self -> here I don't count myself  */
46923b03a366Sstefano_zampini       else { cum_recv_counts[i]=cum_recv_counts[i-1]+mat_graph->count[j]-1; }
4693a0ba757dSStefano Zampini     }
4694a0ba757dSStefano Zampini     ierr = PetscMalloc(2*cum_recv_counts[where_values]*sizeof(PetscMPIInt),&recv_buffer_where);CHKERRQ(ierr);
4695a0ba757dSStefano Zampini     ierr = PetscMalloc(cum_recv_counts[where_values]*sizeof(MPI_Request),&send_requests);CHKERRQ(ierr);
4696a0ba757dSStefano Zampini     ierr = PetscMalloc(cum_recv_counts[where_values]*sizeof(MPI_Request),&recv_requests);CHKERRQ(ierr);
4697a0ba757dSStefano Zampini     for (i=0;i<cum_recv_counts[where_values];i++) {
4698a0ba757dSStefano Zampini       send_requests[i]=MPI_REQUEST_NULL;
4699a0ba757dSStefano Zampini       recv_requests[i]=MPI_REQUEST_NULL;
4700a0ba757dSStefano Zampini     }
4701a0ba757dSStefano Zampini     /* exchange with my neighbours the number of my connected components on the shared interface */
4702a0ba757dSStefano Zampini     for (i=0;i<where_values;i++){
4703a0ba757dSStefano Zampini       j=where_to_nodes_indices[i];
4704da1bb401SStefano Zampini       k = (mat_graph->neighbours_set[j][0] == -1 ?  1 : 0);
4705a0ba757dSStefano Zampini       for (;k<mat_graph->count[j];k++){
4706da1bb401SStefano Zampini         ierr = MPI_Isend(&mat_graph->where_ncmps[i],1,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr);
4707da1bb401SStefano Zampini         ierr = MPI_Irecv(&recv_buffer_where[sum_requests],1,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr);
4708a0ba757dSStefano Zampini         sum_requests++;
4709a0ba757dSStefano Zampini       }
4710a0ba757dSStefano Zampini     }
4711a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4712a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4713a0ba757dSStefano Zampini     /* determine the connected component I need to adapt */
4714a0ba757dSStefano Zampini     ierr = PetscMalloc(where_values*sizeof(PetscInt),&where_cc_adapt);CHKERRQ(ierr);
4715a0ba757dSStefano Zampini     ierr = PetscMemzero(where_cc_adapt,where_values*sizeof(PetscInt));CHKERRQ(ierr);
4716a0ba757dSStefano Zampini     for (i=0;i<where_values;i++){
4717a0ba757dSStefano Zampini       for (j=cum_recv_counts[i];j<cum_recv_counts[i+1];j++){
47183b03a366Sstefano_zampini         /* The first condition is natural (i.e someone has a different number of cc than me), the second one is just to be safe */
47193b03a366Sstefano_zampini         if ( mat_graph->where_ncmps[i]!=recv_buffer_where[j] || mat_graph->where_ncmps[i] > 1 ) {
4720a0ba757dSStefano Zampini           where_cc_adapt[i]=PETSC_TRUE;
4721a0ba757dSStefano Zampini           break;
4722a0ba757dSStefano Zampini         }
4723a0ba757dSStefano Zampini       }
4724a0ba757dSStefano Zampini     }
4725d8923723SStefano Zampini     buffer_size = 0;
4726d8923723SStefano Zampini     for (i=0;i<where_values;i++) {
4727d8923723SStefano Zampini       if (where_cc_adapt[i]) {
4728d8923723SStefano Zampini         for (j=i;j<mat_graph->ncmps;j++) {
4729d8923723SStefano Zampini           if (mat_graph->where[mat_graph->queue[mat_graph->cptr[j]]] == i+1) { /* WARNING -> where values goes from 1 to where_values included */
4730d8923723SStefano Zampini             buffer_size += 1 + mat_graph->cptr[j+1]-mat_graph->cptr[j];
4731d8923723SStefano Zampini           }
4732d8923723SStefano Zampini         }
4733d8923723SStefano Zampini       }
4734d8923723SStefano Zampini     }
4735d8923723SStefano Zampini     ierr = PetscMalloc(buffer_size*sizeof(PetscMPIInt),&send_buffer);CHKERRQ(ierr);
4736a0ba757dSStefano Zampini     /* now get from neighbours their ccs (in global numbering) and adapt them (in case it is needed) */
4737a0ba757dSStefano Zampini     /* first determine how much data to send (size of each queue plus the global indices) and communicate it to neighbours */
4738a0ba757dSStefano Zampini     ierr = PetscMalloc(where_values*sizeof(PetscInt),&sizes_of_sends);CHKERRQ(ierr);
4739a0ba757dSStefano Zampini     ierr = PetscMemzero(sizes_of_sends,where_values*sizeof(PetscInt));CHKERRQ(ierr);
4740a0ba757dSStefano Zampini     sum_requests=0;
4741a0ba757dSStefano Zampini     start_of_send=0;
4742a0ba757dSStefano Zampini     start_of_recv=cum_recv_counts[where_values];
4743a0ba757dSStefano Zampini     for (i=0;i<where_values;i++) {
4744a0ba757dSStefano Zampini       if (where_cc_adapt[i]) {
4745a0ba757dSStefano Zampini         size_of_send=0;
4746a0ba757dSStefano Zampini         for (j=i;j<mat_graph->ncmps;j++) {
4747a0ba757dSStefano Zampini           if (mat_graph->where[mat_graph->queue[mat_graph->cptr[j]]] == i+1) { /* WARNING -> where values goes from 1 to where_values included */
4748a0ba757dSStefano Zampini             send_buffer[start_of_send+size_of_send]=mat_graph->cptr[j+1]-mat_graph->cptr[j];
4749a0ba757dSStefano Zampini             size_of_send+=1;
4750a0ba757dSStefano Zampini             for (k=0;k<mat_graph->cptr[j+1]-mat_graph->cptr[j];k++) {
4751a0ba757dSStefano Zampini               send_buffer[start_of_send+size_of_send+k]=queue_in_global_numbering[mat_graph->cptr[j]+k];
4752a0ba757dSStefano Zampini             }
4753a0ba757dSStefano Zampini             size_of_send=size_of_send+mat_graph->cptr[j+1]-mat_graph->cptr[j];
4754a0ba757dSStefano Zampini           }
4755a0ba757dSStefano Zampini         }
4756a0ba757dSStefano Zampini         j = where_to_nodes_indices[i];
4757da1bb401SStefano Zampini         k = (mat_graph->neighbours_set[j][0] == -1 ?  1 : 0);
475811d8f4c2SStefano Zampini         sizes_of_sends[i]=size_of_send;
4759a0ba757dSStefano Zampini         for (;k<mat_graph->count[j];k++){
476011d8f4c2SStefano Zampini           ierr = MPI_Isend(&sizes_of_sends[i],1,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr);
4761da1bb401SStefano Zampini           ierr = MPI_Irecv(&recv_buffer_where[sum_requests+start_of_recv],1,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr);
4762a0ba757dSStefano Zampini           sum_requests++;
4763a0ba757dSStefano Zampini         }
4764a0ba757dSStefano Zampini         start_of_send+=size_of_send;
4765a0ba757dSStefano Zampini       }
4766a0ba757dSStefano Zampini     }
4767a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4768a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4769a0ba757dSStefano Zampini     buffer_size=0;
4770a0ba757dSStefano Zampini     for (k=0;k<sum_requests;k++) { buffer_size+=recv_buffer_where[start_of_recv+k]; }
4771a0ba757dSStefano Zampini     ierr = PetscMalloc(buffer_size*sizeof(PetscMPIInt),&recv_buffer);CHKERRQ(ierr);
4772a0ba757dSStefano Zampini     /* now exchange the data */
4773a0ba757dSStefano Zampini     start_of_recv=0;
4774a0ba757dSStefano Zampini     start_of_send=0;
4775a0ba757dSStefano Zampini     sum_requests=0;
4776a0ba757dSStefano Zampini     for (i=0;i<where_values;i++) {
4777a0ba757dSStefano Zampini       if (where_cc_adapt[i]) {
4778a0ba757dSStefano Zampini         size_of_send = sizes_of_sends[i];
4779a0ba757dSStefano Zampini         j = where_to_nodes_indices[i];
4780da1bb401SStefano Zampini         k = (mat_graph->neighbours_set[j][0] == -1 ?  1 : 0);
4781a0ba757dSStefano Zampini         for (;k<mat_graph->count[j];k++){
4782da1bb401SStefano Zampini           ierr = MPI_Isend(&send_buffer[start_of_send],size_of_send,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr);
4783a0ba757dSStefano Zampini           size_of_recv=recv_buffer_where[cum_recv_counts[where_values]+sum_requests];
4784da1bb401SStefano Zampini           ierr = MPI_Irecv(&recv_buffer[start_of_recv],size_of_recv,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr);
4785a0ba757dSStefano Zampini           start_of_recv+=size_of_recv;
4786a0ba757dSStefano Zampini           sum_requests++;
4787a0ba757dSStefano Zampini         }
4788a0ba757dSStefano Zampini         start_of_send+=size_of_send;
4789a0ba757dSStefano Zampini       }
4790a0ba757dSStefano Zampini     }
4791a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4792a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4793a0ba757dSStefano Zampini     ierr = PetscMalloc(buffer_size*sizeof(PetscInt),&petsc_buffer);CHKERRQ(ierr);
4794a0ba757dSStefano Zampini     for (k=0;k<start_of_recv;k++) { petsc_buffer[k]=(PetscInt)recv_buffer[k]; }
4795a0ba757dSStefano Zampini     for (j=0;j<buffer_size;) {
4796a0ba757dSStefano Zampini        ierr = ISGlobalToLocalMappingApply(matis->mapping,IS_GTOLM_MASK,petsc_buffer[j],&petsc_buffer[j+1],&petsc_buffer[j],&petsc_buffer[j+1]);CHKERRQ(ierr);
4797a0ba757dSStefano Zampini        k=petsc_buffer[j]+1;
4798a0ba757dSStefano Zampini        j+=k;
4799a0ba757dSStefano Zampini     }
4800a0ba757dSStefano Zampini     sum_requests=cum_recv_counts[where_values];
4801a0ba757dSStefano Zampini     start_of_recv=0;
4802a0ba757dSStefano Zampini     ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt),&nodes_to_temp_buffer_indices);CHKERRQ(ierr);
4803a0ba757dSStefano Zampini     global_where_counter=0;
4804a0ba757dSStefano Zampini     for (i=0;i<where_values;i++){
4805a0ba757dSStefano Zampini       if (where_cc_adapt[i]){
4806a0ba757dSStefano Zampini         temp_buffer_size=0;
4807a0ba757dSStefano Zampini         /* find nodes on the shared interface we need to adapt */
4808a0ba757dSStefano Zampini         for (j=0;j<mat_graph->nvtxs;j++){
4809a0ba757dSStefano Zampini           if (mat_graph->where[j]==i+1) {
4810a0ba757dSStefano Zampini             nodes_to_temp_buffer_indices[j]=temp_buffer_size;
4811a0ba757dSStefano Zampini             temp_buffer_size++;
4812a0ba757dSStefano Zampini           } else {
4813a0ba757dSStefano Zampini             nodes_to_temp_buffer_indices[j]=-1;
4814a0ba757dSStefano Zampini           }
4815a0ba757dSStefano Zampini         }
4816a0ba757dSStefano Zampini         /* allocate some temporary space */
4817a0ba757dSStefano Zampini         ierr = PetscMalloc(temp_buffer_size*sizeof(PetscInt*),&temp_buffer);CHKERRQ(ierr);
4818a0ba757dSStefano Zampini         ierr = PetscMalloc(temp_buffer_size*(cum_recv_counts[i+1]-cum_recv_counts[i])*sizeof(PetscInt),&temp_buffer[0]);CHKERRQ(ierr);
4819a0ba757dSStefano Zampini         ierr = PetscMemzero(temp_buffer[0],temp_buffer_size*(cum_recv_counts[i+1]-cum_recv_counts[i])*sizeof(PetscInt));CHKERRQ(ierr);
4820a0ba757dSStefano Zampini         for (j=1;j<temp_buffer_size;j++){
4821a0ba757dSStefano Zampini           temp_buffer[j]=temp_buffer[j-1]+cum_recv_counts[i+1]-cum_recv_counts[i];
4822a0ba757dSStefano Zampini         }
4823a0ba757dSStefano Zampini         /* analyze contributions from neighbouring subdomains for i-th conn comp
4824a0ba757dSStefano Zampini            temp buffer structure:
4825a0ba757dSStefano Zampini            supposing part of the interface has dimension 5 (global nodes 0,1,2,3,4)
4826a0ba757dSStefano Zampini            3 neighs procs with structured connected components:
4827a0ba757dSStefano Zampini              neigh 0: [0 1 4], [2 3];  (2 connected components)
4828a0ba757dSStefano Zampini              neigh 1: [0 1], [2 3 4];  (2 connected components)
4829a0ba757dSStefano Zampini              neigh 2: [0 4], [1], [2 3]; (3 connected components)
4830a0ba757dSStefano Zampini            tempbuffer (row-oriented) should be filled as:
4831a0ba757dSStefano Zampini              [ 0, 0, 0;
4832a0ba757dSStefano Zampini                0, 0, 1;
4833a0ba757dSStefano Zampini                1, 1, 2;
4834a0ba757dSStefano Zampini                1, 1, 2;
4835a0ba757dSStefano Zampini                0, 1, 0; ];
4836a0ba757dSStefano Zampini            This way we can simply recover the resulting structure, accounting for possible intersections of ccs among neighs.
4837a0ba757dSStefano Zampini            The mat_graph->where array will be modified to reproduce the following 4 connected components [0], [1], [2 3], [4];
4838a0ba757dSStefano Zampini                                                                                                                                    */
4839a0ba757dSStefano Zampini         for (j=0;j<cum_recv_counts[i+1]-cum_recv_counts[i];j++) {
4840a0ba757dSStefano Zampini           ins_val=0;
4841a0ba757dSStefano Zampini           size_of_recv=recv_buffer_where[sum_requests];  /* total size of recv from neighs */
4842a0ba757dSStefano Zampini           for (buffer_size=0;buffer_size<size_of_recv;) {  /* loop until all data from neighs has been taken into account */
4843a0ba757dSStefano Zampini             for (k=1;k<petsc_buffer[buffer_size+start_of_recv]+1;k++) { /* filling properly temp_buffer using data from a single recv */
4844a0ba757dSStefano Zampini               temp_buffer[ nodes_to_temp_buffer_indices[ petsc_buffer[ start_of_recv+buffer_size+k ] ] ][j]=ins_val;
4845a0ba757dSStefano Zampini             }
4846a0ba757dSStefano Zampini             buffer_size+=k;
4847a0ba757dSStefano Zampini             ins_val++;
4848a0ba757dSStefano Zampini           }
4849a0ba757dSStefano Zampini           start_of_recv+=size_of_recv;
4850a0ba757dSStefano Zampini           sum_requests++;
4851a0ba757dSStefano Zampini         }
4852a0ba757dSStefano Zampini         ierr = PetscMalloc(temp_buffer_size*sizeof(PetscInt),&add_to_where);CHKERRQ(ierr);
4853a0ba757dSStefano Zampini         ierr = PetscMemzero(add_to_where,temp_buffer_size*sizeof(PetscInt));CHKERRQ(ierr);
4854a0ba757dSStefano Zampini         for (j=0;j<temp_buffer_size;j++){
4855a0ba757dSStefano Zampini           if (!add_to_where[j]){ /* found a new cc  */
4856a0ba757dSStefano Zampini             global_where_counter++;
4857a0ba757dSStefano Zampini             add_to_where[j]=global_where_counter;
4858a0ba757dSStefano Zampini             for (k=j+1;k<temp_buffer_size;k++){ /* check for other nodes in new cc */
4859a0ba757dSStefano Zampini               same_set=PETSC_TRUE;
4860a0ba757dSStefano Zampini               for (s=0;s<cum_recv_counts[i+1]-cum_recv_counts[i];s++){
4861a0ba757dSStefano Zampini                 if (temp_buffer[j][s]!=temp_buffer[k][s]) {
4862a0ba757dSStefano Zampini                   same_set=PETSC_FALSE;
4863a0ba757dSStefano Zampini                   break;
4864a0ba757dSStefano Zampini                 }
4865a0ba757dSStefano Zampini               }
4866a0ba757dSStefano Zampini               if (same_set) add_to_where[k]=global_where_counter;
4867a0ba757dSStefano Zampini             }
4868a0ba757dSStefano Zampini           }
4869a0ba757dSStefano Zampini         }
4870a0ba757dSStefano Zampini         /* insert new data in where array */
4871a0ba757dSStefano Zampini         temp_buffer_size=0;
4872a0ba757dSStefano Zampini         for (j=0;j<mat_graph->nvtxs;j++){
4873a0ba757dSStefano Zampini           if (mat_graph->where[j]==i+1) {
4874a0ba757dSStefano Zampini             mat_graph->where[j]=where_values+add_to_where[temp_buffer_size];
4875a0ba757dSStefano Zampini             temp_buffer_size++;
4876a0ba757dSStefano Zampini           }
4877a0ba757dSStefano Zampini         }
4878a0ba757dSStefano Zampini         ierr = PetscFree(temp_buffer[0]);CHKERRQ(ierr);
4879a0ba757dSStefano Zampini         ierr = PetscFree(temp_buffer);CHKERRQ(ierr);
4880a0ba757dSStefano Zampini         ierr = PetscFree(add_to_where);CHKERRQ(ierr);
4881a0ba757dSStefano Zampini       }
4882a0ba757dSStefano Zampini     }
4883a0ba757dSStefano Zampini     ierr = PetscFree(nodes_to_temp_buffer_indices);CHKERRQ(ierr);
4884a0ba757dSStefano Zampini     ierr = PetscFree(sizes_of_sends);CHKERRQ(ierr);
4885a0ba757dSStefano Zampini     ierr = PetscFree(send_requests);CHKERRQ(ierr);
4886a0ba757dSStefano Zampini     ierr = PetscFree(recv_requests);CHKERRQ(ierr);
4887a0ba757dSStefano Zampini     ierr = PetscFree(petsc_buffer);CHKERRQ(ierr);
4888a0ba757dSStefano Zampini     ierr = PetscFree(recv_buffer);CHKERRQ(ierr);
4889a0ba757dSStefano Zampini     ierr = PetscFree(recv_buffer_where);CHKERRQ(ierr);
4890a0ba757dSStefano Zampini     ierr = PetscFree(send_buffer);CHKERRQ(ierr);
4891a0ba757dSStefano Zampini     ierr = PetscFree(cum_recv_counts);CHKERRQ(ierr);
4892a0ba757dSStefano Zampini     ierr = PetscFree(where_to_nodes_indices);CHKERRQ(ierr);
489323d4d1a5SStefano Zampini     ierr = PetscFree(where_cc_adapt);CHKERRQ(ierr);
4894a0ba757dSStefano Zampini     /* We are ready to evaluate consistent connected components on each part of the shared interface */
4895a0ba757dSStefano Zampini     if (global_where_counter) {
4896a0ba757dSStefano Zampini       for (i=0;i<mat_graph->nvtxs;i++){ mat_graph->touched[i]=PETSC_FALSE; }
4897a0ba757dSStefano Zampini       global_where_counter=0;
4898a0ba757dSStefano Zampini       for (i=0;i<mat_graph->nvtxs;i++){
4899a0ba757dSStefano Zampini         if (mat_graph->where[i] && !mat_graph->touched[i]) {
4900a0ba757dSStefano Zampini           global_where_counter++;
4901a0ba757dSStefano Zampini           for (j=i+1;j<mat_graph->nvtxs;j++){
4902a0ba757dSStefano Zampini             if (!mat_graph->touched[j] && mat_graph->where[j]==mat_graph->where[i]) {
4903a0ba757dSStefano Zampini               mat_graph->where[j]=global_where_counter;
4904a0ba757dSStefano Zampini               mat_graph->touched[j]=PETSC_TRUE;
4905a0ba757dSStefano Zampini             }
4906a0ba757dSStefano Zampini           }
4907a0ba757dSStefano Zampini           mat_graph->where[i]=global_where_counter;
4908a0ba757dSStefano Zampini           mat_graph->touched[i]=PETSC_TRUE;
4909a0ba757dSStefano Zampini         }
4910a0ba757dSStefano Zampini       }
4911a0ba757dSStefano Zampini       where_values=global_where_counter;
4912a0ba757dSStefano Zampini     }
4913a0ba757dSStefano Zampini     if (global_where_counter) {
4914a0ba757dSStefano Zampini       ierr = PetscMemzero(mat_graph->cptr,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr);
4915a0ba757dSStefano Zampini       ierr = PetscMemzero(mat_graph->queue,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
4916a0ba757dSStefano Zampini       ierr = PetscFree(mat_graph->where_ncmps);CHKERRQ(ierr);
4917a0ba757dSStefano Zampini       ierr = PetscMalloc(where_values*sizeof(PetscMPIInt),&mat_graph->where_ncmps);CHKERRQ(ierr);
4918a0ba757dSStefano Zampini       ierr = PCBDDCFindConnectedComponents(mat_graph, where_values);
4919a0ba757dSStefano Zampini       for (i=0;i<mat_graph->ncmps;i++) {
4920a0ba757dSStefano Zampini         ierr = ISLocalToGlobalMappingApply(matis->mapping,mat_graph->cptr[i+1]-mat_graph->cptr[i],&mat_graph->queue[mat_graph->cptr[i]],&queue_in_global_numbering[mat_graph->cptr[i]]);CHKERRQ(ierr);
4921a0ba757dSStefano Zampini         ierr = PetscSortIntWithArray(mat_graph->cptr[i+1]-mat_graph->cptr[i],&queue_in_global_numbering[mat_graph->cptr[i]],&mat_graph->queue[mat_graph->cptr[i]]);CHKERRQ(ierr);
4922a0ba757dSStefano Zampini       }
4923a0ba757dSStefano Zampini     }
49243b03a366Sstefano_zampini   } /* Finished adapting interface */
49250c7d97c5SJed Brown   PetscInt nfc=0;
49260c7d97c5SJed Brown   PetscInt nec=0;
49270c7d97c5SJed Brown   PetscInt nvc=0;
49283b03a366Sstefano_zampini   PetscBool twodim_flag=PETSC_FALSE;
49290c7d97c5SJed Brown   for (i=0; i<mat_graph->ncmps; i++) {
49303b03a366Sstefano_zampini     if ( mat_graph->cptr[i+1]-mat_graph->cptr[i] > vertex_size ){
4931534831adSStefano Zampini       if (mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]==1){ /* 1 neigh Neumann fake included */
49320c7d97c5SJed Brown         nfc++;
49333b03a366Sstefano_zampini       } else { /* note that nec will be zero in 2d */
49343b03a366Sstefano_zampini         nec++;
49353b03a366Sstefano_zampini       }
49360c7d97c5SJed Brown     } else {
49373b03a366Sstefano_zampini       nvc+=mat_graph->cptr[i+1]-mat_graph->cptr[i];
49383b03a366Sstefano_zampini     }
49393b03a366Sstefano_zampini   }
49403b03a366Sstefano_zampini 
49413b03a366Sstefano_zampini   if (!nec) { /* we are in a 2d case -> no faces, only edges */
49423b03a366Sstefano_zampini     nec = nfc;
49433b03a366Sstefano_zampini     nfc = 0;
49443b03a366Sstefano_zampini     twodim_flag = PETSC_TRUE;
49453b03a366Sstefano_zampini   }
49463972b0daSStefano Zampini   /* allocate IS arrays for faces, edges. Vertices need a single index set. */
49473972b0daSStefano Zampini   k=0;
49483972b0daSStefano Zampini   for (i=0; i<mat_graph->ncmps; i++) {
49493972b0daSStefano Zampini     j=mat_graph->cptr[i+1]-mat_graph->cptr[i];
49503972b0daSStefano Zampini     if ( j > k) {
49513972b0daSStefano Zampini       k=j;
49523972b0daSStefano Zampini     }
4953ba1573a8SStefano Zampini     if (j<=vertex_size) {
4954ba1573a8SStefano Zampini       k+=vertex_size;
4955ba1573a8SStefano Zampini     }
49563972b0daSStefano Zampini   }
49573972b0daSStefano Zampini   ierr = PetscMalloc(k*sizeof(PetscInt),&auxis);CHKERRQ(ierr);
49583972b0daSStefano Zampini 
49593b03a366Sstefano_zampini   if (!pcbddc->vertices_flag && !pcbddc->edges_flag) {
49603b03a366Sstefano_zampini     ierr = PetscMalloc(nfc*sizeof(IS),&pcbddc->ISForFaces);CHKERRQ(ierr);
49613b03a366Sstefano_zampini     use_faces=PETSC_TRUE;
49623b03a366Sstefano_zampini   }
49633b03a366Sstefano_zampini   if (!pcbddc->vertices_flag && !pcbddc->faces_flag) {
49643b03a366Sstefano_zampini     ierr = PetscMalloc(nec*sizeof(IS),&pcbddc->ISForEdges);CHKERRQ(ierr);
49653b03a366Sstefano_zampini     use_edges=PETSC_TRUE;
49663b03a366Sstefano_zampini   }
49673b03a366Sstefano_zampini   nfc=0;
49683b03a366Sstefano_zampini   nec=0;
49693b03a366Sstefano_zampini   for (i=0; i<mat_graph->ncmps; i++) {
49703b03a366Sstefano_zampini     if ( mat_graph->cptr[i+1]-mat_graph->cptr[i] > vertex_size ){
49713b03a366Sstefano_zampini       for (j=0;j<mat_graph->cptr[i+1]-mat_graph->cptr[i];j++) {
49723972b0daSStefano Zampini         auxis[j]=mat_graph->queue[mat_graph->cptr[i]+j];
49733b03a366Sstefano_zampini       }
49743b03a366Sstefano_zampini       if (mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]==1){
49753b03a366Sstefano_zampini         if (twodim_flag) {
49763b03a366Sstefano_zampini           if (use_edges) {
49773972b0daSStefano Zampini             ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForEdges[nec]);CHKERRQ(ierr);
49783b03a366Sstefano_zampini             nec++;
49793b03a366Sstefano_zampini           }
49803b03a366Sstefano_zampini         } else {
49813b03a366Sstefano_zampini           if (use_faces) {
49823972b0daSStefano Zampini             ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForFaces[nfc]);CHKERRQ(ierr);
49833b03a366Sstefano_zampini             nfc++;
49843b03a366Sstefano_zampini           }
49853b03a366Sstefano_zampini         }
49863b03a366Sstefano_zampini       } else {
49873b03a366Sstefano_zampini         if (use_edges) {
49883972b0daSStefano Zampini           ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForEdges[nec]);CHKERRQ(ierr);
49890c7d97c5SJed Brown           nec++;
49900c7d97c5SJed Brown         }
49910c7d97c5SJed Brown       }
49920c7d97c5SJed Brown     }
49933b03a366Sstefano_zampini   }
49943b03a366Sstefano_zampini   pcbddc->n_ISForFaces=nfc;
49953b03a366Sstefano_zampini   pcbddc->n_ISForEdges=nec;
49963b03a366Sstefano_zampini   nvc=0;
49970c7d97c5SJed Brown   if ( !pcbddc->constraints_flag ) {
49983b03a366Sstefano_zampini     for (i=0; i<mat_graph->ncmps; i++) {
49993b03a366Sstefano_zampini       if ( mat_graph->cptr[i+1]-mat_graph->cptr[i] <= vertex_size ){
50003b03a366Sstefano_zampini         for ( j=mat_graph->cptr[i];j<mat_graph->cptr[i+1];j++) {
50013972b0daSStefano Zampini           auxis[nvc]=mat_graph->queue[j];
50020c7d97c5SJed Brown           nvc++;
50030c7d97c5SJed Brown         }
50040c7d97c5SJed Brown       }
50050c7d97c5SJed Brown     }
50060c7d97c5SJed Brown   }
5007a0ba757dSStefano Zampini   /* sort vertex set (by local ordering) */
50083972b0daSStefano Zampini   ierr = PetscSortInt(nvc,auxis);CHKERRQ(ierr);
50093972b0daSStefano Zampini   ierr = ISCreateGeneral(PETSC_COMM_SELF,nvc,auxis,PETSC_COPY_VALUES,&pcbddc->ISForVertices);CHKERRQ(ierr);
50100c7d97c5SJed Brown 
5011e269702eSStefano Zampini   if (pcbddc->dbg_flag) {
5012e269702eSStefano Zampini 
5013d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr);
5014d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Details from PCBDDCManageLocalBoundaries for subdomain %04d\n",PetscGlobalRank);CHKERRQ(ierr);
5015d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr);
5016a0ba757dSStefano Zampini /*    ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Graph (adjacency structure) of local Neumann mat\n");CHKERRQ(ierr);
5017a0ba757dSStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr);
5018e269702eSStefano Zampini     for (i=0;i<mat_graph->nvtxs;i++) {
5019a0ba757dSStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Nodes connected to node number %d are %d\n",i,mat_graph->xadj[i+1]-mat_graph->xadj[i]);CHKERRQ(ierr);
5020e269702eSStefano Zampini       for (j=mat_graph->xadj[i];j<mat_graph->xadj[i+1];j++){
5021a0ba757dSStefano Zampini         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d ",mat_graph->adjncy[j]);CHKERRQ(ierr);
5022e269702eSStefano Zampini       }
5023a0ba757dSStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n--------------------------------------------------------------\n");CHKERRQ(ierr);
5024da1bb401SStefano Zampini     }*/
5025d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Matrix graph has %d connected components", mat_graph->ncmps);CHKERRQ(ierr);
50260c7d97c5SJed Brown     for (i=0;i<mat_graph->ncmps;i++) {
50273b03a366Sstefano_zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\nDetails for connected component number %02d: size %04d, count %01d. Nodes follow.\n",
50283b03a366Sstefano_zampini              i,mat_graph->cptr[i+1]-mat_graph->cptr[i],mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]);CHKERRQ(ierr);
5029da1bb401SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"subdomains: ");
5030da1bb401SStefano Zampini       for (j=0;j<mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]; j++) {
5031da1bb401SStefano Zampini         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d ",mat_graph->neighbours_set[mat_graph->queue[mat_graph->cptr[i]]][j]);
5032da1bb401SStefano Zampini       }
5033da1bb401SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n");
50340c7d97c5SJed Brown       for (j=mat_graph->cptr[i]; j<mat_graph->cptr[i+1]; j++){
5035da1bb401SStefano Zampini         /* ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d (%d), ",queue_in_global_numbering[j],mat_graph->queue[j]);CHKERRQ(ierr); */
5036da1bb401SStefano Zampini         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d, ",mat_graph->queue[j]);CHKERRQ(ierr);
50370c7d97c5SJed Brown       }
50380c7d97c5SJed Brown     }
5039da1bb401SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n--------------------------------------------------------------\n");CHKERRQ(ierr);
50403b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local vertices\n",PetscGlobalRank,nvc);CHKERRQ(ierr);
50413b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local faces\n",PetscGlobalRank,nfc);CHKERRQ(ierr);
50423b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local edges\n",PetscGlobalRank,nec);CHKERRQ(ierr);
5043d49ef151SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
50440c7d97c5SJed Brown   }
50450c7d97c5SJed Brown 
50463972b0daSStefano Zampini   ierr = PetscFree(queue_in_global_numbering);CHKERRQ(ierr);
50473972b0daSStefano Zampini   ierr = PetscFree(auxis);CHKERRQ(ierr);
50480c7d97c5SJed Brown   PetscFunctionReturn(0);
50490c7d97c5SJed Brown 
50500c7d97c5SJed Brown }
50510c7d97c5SJed Brown 
50520c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
50530c7d97c5SJed Brown 
50540c7d97c5SJed Brown /* The following code has been adapted from function IsConnectedSubdomain contained
5055da1bb401SStefano Zampini    in source file contig.c of METIS library (version 5.0.1)
5056da1bb401SStefano Zampini    It finds connected components of each partition labeled from 1 to n_dist  */
50570c7d97c5SJed Brown 
50580c7d97c5SJed Brown #undef __FUNCT__
50590c7d97c5SJed Brown #define __FUNCT__ "PCBDDCFindConnectedComponents"
50609c0446d6SStefano Zampini static PetscErrorCode PCBDDCFindConnectedComponents(PCBDDCGraph graph, PetscInt n_dist )
50610c7d97c5SJed Brown {
50620c7d97c5SJed Brown   PetscInt i, j, k, nvtxs, first, last, nleft, ncmps,pid,cum_queue,n,ncmps_pid;
50630c7d97c5SJed Brown   PetscInt *xadj, *adjncy, *where, *queue;
50640c7d97c5SJed Brown   PetscInt *cptr;
50650c7d97c5SJed Brown   PetscBool *touched;
50660c7d97c5SJed Brown 
50670c7d97c5SJed Brown   PetscFunctionBegin;
50680c7d97c5SJed Brown 
50690c7d97c5SJed Brown   nvtxs   = graph->nvtxs;
50700c7d97c5SJed Brown   xadj    = graph->xadj;
50710c7d97c5SJed Brown   adjncy  = graph->adjncy;
50720c7d97c5SJed Brown   where   = graph->where;
50730c7d97c5SJed Brown   touched = graph->touched;
50740c7d97c5SJed Brown   queue   = graph->queue;
50750c7d97c5SJed Brown   cptr    = graph->cptr;
50760c7d97c5SJed Brown 
50770c7d97c5SJed Brown   for (i=0; i<nvtxs; i++)
50780c7d97c5SJed Brown     touched[i] = PETSC_FALSE;
50790c7d97c5SJed Brown 
50800c7d97c5SJed Brown   cum_queue=0;
50810c7d97c5SJed Brown   ncmps=0;
50820c7d97c5SJed Brown 
50830c7d97c5SJed Brown   for (n=0; n<n_dist; n++) {
5084da1bb401SStefano Zampini     pid = n+1;  /* partition labeled by 0 is discarded */
50850c7d97c5SJed Brown     nleft = 0;
50860c7d97c5SJed Brown     for (i=0; i<nvtxs; i++) {
50870c7d97c5SJed Brown       if (where[i] == pid)
50880c7d97c5SJed Brown         nleft++;
50890c7d97c5SJed Brown     }
50900c7d97c5SJed Brown     for (i=0; i<nvtxs; i++) {
50910c7d97c5SJed Brown       if (where[i] == pid)
50920c7d97c5SJed Brown         break;
50930c7d97c5SJed Brown     }
50940c7d97c5SJed Brown     touched[i] = PETSC_TRUE;
50950c7d97c5SJed Brown     queue[cum_queue] = i;
50960c7d97c5SJed Brown     first = 0; last = 1;
50970c7d97c5SJed Brown     cptr[ncmps] = cum_queue;  /* This actually points to queue */
50980c7d97c5SJed Brown     ncmps_pid = 0;
50990c7d97c5SJed Brown     while (first != nleft) {
51000c7d97c5SJed Brown       if (first == last) { /* Find another starting vertex */
51010c7d97c5SJed Brown         cptr[++ncmps] = first+cum_queue;
51020c7d97c5SJed Brown         ncmps_pid++;
51030c7d97c5SJed Brown         for (i=0; i<nvtxs; i++) {
51040c7d97c5SJed Brown           if (where[i] == pid && !touched[i])
51050c7d97c5SJed Brown             break;
51060c7d97c5SJed Brown         }
51070c7d97c5SJed Brown         queue[cum_queue+last] = i;
51080c7d97c5SJed Brown         last++;
51090c7d97c5SJed Brown         touched[i] = PETSC_TRUE;
51100c7d97c5SJed Brown       }
51110c7d97c5SJed Brown       i = queue[cum_queue+first];
51120c7d97c5SJed Brown       first++;
51130c7d97c5SJed Brown       for (j=xadj[i]; j<xadj[i+1]; j++) {
51140c7d97c5SJed Brown         k = adjncy[j];
51150c7d97c5SJed Brown         if (where[k] == pid && !touched[k]) {
51160c7d97c5SJed Brown           queue[cum_queue+last] = k;
51170c7d97c5SJed Brown           last++;
51180c7d97c5SJed Brown           touched[k] = PETSC_TRUE;
51190c7d97c5SJed Brown         }
51200c7d97c5SJed Brown       }
51210c7d97c5SJed Brown     }
51220c7d97c5SJed Brown     cptr[++ncmps] = first+cum_queue;
51230c7d97c5SJed Brown     ncmps_pid++;
51240c7d97c5SJed Brown     cum_queue=cptr[ncmps];
5125a0ba757dSStefano Zampini     graph->where_ncmps[n] = ncmps_pid;
51260c7d97c5SJed Brown   }
51270c7d97c5SJed Brown   graph->ncmps = ncmps;
51280c7d97c5SJed Brown 
51290c7d97c5SJed Brown   PetscFunctionReturn(0);
51300c7d97c5SJed Brown }
5131