xref: /petsc/src/ksp/pc/impls/bddc/bddc.c (revision 1a83f524638a4da8317a6bd80eb6d9a2936d8384)
/* TODOLIST
   DofSplitting and DM attached to pc?
   Change SetNeumannBoundaries to SetNeumannBoundariesLocal and provide new SetNeumannBoundaries (same for Dirichlet)
     - change prec_type to switch_inexact_prec_type
   Inexact solvers: global preconditioner application is ready, ask the developers (Jed?) how to best implement Dohrmann's approach (PCSHELL?)
   change how to deal with the coarse problem (PCBDDCSetCoarseEnvironment):
     - simplify coarse problem structure -> PCBDDC or PCREDUNDANT, nothing else -> same comm for all levels?
     - remove coarse enums and allow use of PCBDDCGetCoarseKSP
     - remove metis dependency -> use MatPartitioning for multilevel -> Assemble serial adjacency in ManageLocalBoundaries?
   code refactoring:
     - pick up better names for static functions
   change options structure:
     - insert BDDC into MG framework?
   provide other ops? Ask the developers
   remove all unused printf
   man pages
*/
180c7d97c5SJed Brown 
1953cdbc3dSStefano Zampini /* ----------------------------------------------------------------------------------------------------------------------------------------------
200c7d97c5SJed Brown    Implementation of BDDC preconditioner based on:
210c7d97c5SJed Brown    C. Dohrmann "An approximate BDDC preconditioner", Numerical Linear Algebra with Applications Volume 14, Issue 2, pages 149-168, March 2007
2253cdbc3dSStefano Zampini    ---------------------------------------------------------------------------------------------------------------------------------------------- */
2353cdbc3dSStefano Zampini 
2453cdbc3dSStefano Zampini #include "bddc.h" /*I "petscpc.h" I*/  /* includes for fortran wrappers */
253b03a366Sstefano_zampini #include <petscblaslapack.h>
260c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
270c7d97c5SJed Brown #undef __FUNCT__
280c7d97c5SJed Brown #define __FUNCT__ "PCSetFromOptions_BDDC"
290c7d97c5SJed Brown PetscErrorCode PCSetFromOptions_BDDC(PC pc)
300c7d97c5SJed Brown {
310c7d97c5SJed Brown   PC_BDDC         *pcbddc = (PC_BDDC*)pc->data;
320c7d97c5SJed Brown   PetscErrorCode ierr;
330c7d97c5SJed Brown 
340c7d97c5SJed Brown   PetscFunctionBegin;
350c7d97c5SJed Brown   ierr = PetscOptionsHead("BDDC options");CHKERRQ(ierr);
360c7d97c5SJed Brown   /* Verbose debugging of main data structures */
37e269702eSStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_check_all"       ,"Verbose (debugging) output for PCBDDC"                       ,"none",pcbddc->dbg_flag      ,&pcbddc->dbg_flag      ,PETSC_NULL);CHKERRQ(ierr);
380c7d97c5SJed Brown   /* Some customization for default primal space */
39da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_vertices_only"   ,"Use only vertices in coarse space (i.e. discard constraints)","none",pcbddc->vertices_flag   ,&pcbddc->vertices_flag   ,PETSC_NULL);CHKERRQ(ierr);
40da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_constraints_only","Use only constraints in coarse space (i.e. discard vertices)","none",pcbddc->constraints_flag,&pcbddc->constraints_flag,PETSC_NULL);CHKERRQ(ierr);
41da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_faces_only"      ,"Use only faces among constraints of coarse space (i.e. discard edges)"         ,"none",pcbddc->faces_flag      ,&pcbddc->faces_flag      ,PETSC_NULL);CHKERRQ(ierr);
42da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_edges_only"      ,"Use only edges among constraints of coarse space (i.e. discard faces)"         ,"none",pcbddc->edges_flag      ,&pcbddc->edges_flag      ,PETSC_NULL);CHKERRQ(ierr);
430c7d97c5SJed Brown   /* Coarse solver context */
446c667b0aSStefano Zampini   static const char * const avail_coarse_problems[] = {"sequential","replicated","parallel","multilevel","CoarseProblemType","PC_BDDC_",0}; /*order of choiches depends on ENUM defined in bddc.h */
450c7d97c5SJed Brown   ierr = PetscOptionsEnum("-pc_bddc_coarse_problem_type","Set coarse problem type","none",avail_coarse_problems,(PetscEnum)pcbddc->coarse_problem_type,(PetscEnum*)&pcbddc->coarse_problem_type,PETSC_NULL);CHKERRQ(ierr);
460c7d97c5SJed Brown   /* Two different application of BDDC to the whole set of dofs, internal and interface */
470c7d97c5SJed Brown   ierr = PetscOptionsBool("-pc_bddc_switch_preconditioning_type","Switch between M_2 (default) and M_3 preconditioners (as defined by Dohrmann)","none",pcbddc->prec_type,&pcbddc->prec_type,PETSC_NULL);CHKERRQ(ierr);
48534831adSStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_use_change_of_basis","Use change of basis approach for primal space","none",pcbddc->usechangeofbasis,&pcbddc->usechangeofbasis,PETSC_NULL);CHKERRQ(ierr);
49534831adSStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_use_change_on_faces","Use change of basis approach for face constraints","none",pcbddc->usechangeonfaces,&pcbddc->usechangeonfaces,PETSC_NULL);CHKERRQ(ierr);
50534831adSStefano Zampini   pcbddc->usechangeonfaces = pcbddc->usechangeonfaces && pcbddc->usechangeofbasis;
510c7d97c5SJed Brown   ierr = PetscOptionsInt("-pc_bddc_coarsening_ratio","Set coarsening ratio used in multilevel coarsening","none",pcbddc->coarsening_ratio,&pcbddc->coarsening_ratio,PETSC_NULL);CHKERRQ(ierr);
524fad6a16SStefano Zampini   ierr = PetscOptionsInt("-pc_bddc_max_levels","Set maximum number of levels for multilevel","none",pcbddc->max_levels,&pcbddc->max_levels,PETSC_NULL);CHKERRQ(ierr);
530c7d97c5SJed Brown   ierr = PetscOptionsTail();CHKERRQ(ierr);
540c7d97c5SJed Brown   PetscFunctionReturn(0);
550c7d97c5SJed Brown }
560c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
570c7d97c5SJed Brown EXTERN_C_BEGIN
580c7d97c5SJed Brown #undef __FUNCT__
590c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetCoarseProblemType_BDDC"
6053cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetCoarseProblemType_BDDC(PC pc, CoarseProblemType CPT)
610c7d97c5SJed Brown {
620c7d97c5SJed Brown   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
630c7d97c5SJed Brown 
640c7d97c5SJed Brown   PetscFunctionBegin;
650c7d97c5SJed Brown   pcbddc->coarse_problem_type = CPT;
660c7d97c5SJed Brown   PetscFunctionReturn(0);
670c7d97c5SJed Brown }
680c7d97c5SJed Brown EXTERN_C_END
690c7d97c5SJed Brown #undef __FUNCT__
700c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetCoarseProblemType"
7153cdbc3dSStefano Zampini /*@
729c0446d6SStefano Zampini  PCBDDCSetCoarseProblemType - Set coarse problem type in PCBDDC.
7353cdbc3dSStefano Zampini 
749c0446d6SStefano Zampini    Not collective
7553cdbc3dSStefano Zampini 
7653cdbc3dSStefano Zampini    Input Parameters:
7753cdbc3dSStefano Zampini +  pc - the preconditioning context
7853cdbc3dSStefano Zampini -  CoarseProblemType - pick a better name and explain what this is
7953cdbc3dSStefano Zampini 
8053cdbc3dSStefano Zampini    Level: intermediate
8153cdbc3dSStefano Zampini 
8253cdbc3dSStefano Zampini    Notes:
83da1bb401SStefano Zampini    Not collective but all procs must call with same arguments.
8453cdbc3dSStefano Zampini 
8553cdbc3dSStefano Zampini .seealso: PCBDDC
8653cdbc3dSStefano Zampini @*/
870c7d97c5SJed Brown PetscErrorCode PCBDDCSetCoarseProblemType(PC pc, CoarseProblemType CPT)
880c7d97c5SJed Brown {
890c7d97c5SJed Brown   PetscErrorCode ierr;
900c7d97c5SJed Brown 
910c7d97c5SJed Brown   PetscFunctionBegin;
920c7d97c5SJed Brown   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
930c7d97c5SJed Brown   ierr = PetscTryMethod(pc,"PCBDDCSetCoarseProblemType_C",(PC,CoarseProblemType),(pc,CPT));CHKERRQ(ierr);
940c7d97c5SJed Brown   PetscFunctionReturn(0);
950c7d97c5SJed Brown }
960c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
970c7d97c5SJed Brown EXTERN_C_BEGIN
980c7d97c5SJed Brown #undef __FUNCT__
994fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetCoarseningRatio_BDDC"
1004fad6a16SStefano Zampini static PetscErrorCode PCBDDCSetCoarseningRatio_BDDC(PC pc,PetscInt k)
1014fad6a16SStefano Zampini {
1024fad6a16SStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
1034fad6a16SStefano Zampini 
1044fad6a16SStefano Zampini   PetscFunctionBegin;
1054fad6a16SStefano Zampini   pcbddc->coarsening_ratio=k;
1064fad6a16SStefano Zampini   PetscFunctionReturn(0);
1074fad6a16SStefano Zampini }
1084fad6a16SStefano Zampini EXTERN_C_END
1094fad6a16SStefano Zampini #undef __FUNCT__
1104fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetCoarseningRatio"
1114fad6a16SStefano Zampini /*@
1124fad6a16SStefano Zampini  PCBDDCSetCoarseningRatio - Set coarsening ratio used in multilevel coarsening
1134fad6a16SStefano Zampini 
1144fad6a16SStefano Zampini    Logically collective on PC
1154fad6a16SStefano Zampini 
1164fad6a16SStefano Zampini    Input Parameters:
1174fad6a16SStefano Zampini +  pc - the preconditioning context
1184fad6a16SStefano Zampini -  k - coarsening ratio
1194fad6a16SStefano Zampini 
1204fad6a16SStefano Zampini    Approximatively k subdomains at the finer level will be aggregated into a single subdomain at the coarser level.
1214fad6a16SStefano Zampini 
1224fad6a16SStefano Zampini    Level: intermediate
1234fad6a16SStefano Zampini 
1244fad6a16SStefano Zampini    Notes:
1254fad6a16SStefano Zampini 
1264fad6a16SStefano Zampini .seealso: PCBDDC
1274fad6a16SStefano Zampini @*/
1284fad6a16SStefano Zampini PetscErrorCode PCBDDCSetCoarseningRatio(PC pc,PetscInt k)
1294fad6a16SStefano Zampini {
1304fad6a16SStefano Zampini   PetscErrorCode ierr;
1314fad6a16SStefano Zampini 
1324fad6a16SStefano Zampini   PetscFunctionBegin;
1334fad6a16SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
1344fad6a16SStefano Zampini   ierr = PetscTryMethod(pc,"PCBDDCSetCoarseningRatio_C",(PC,PetscInt),(pc,k));CHKERRQ(ierr);
1354fad6a16SStefano Zampini   PetscFunctionReturn(0);
1364fad6a16SStefano Zampini }
1374fad6a16SStefano Zampini /* -------------------------------------------------------------------------- */
1384fad6a16SStefano Zampini EXTERN_C_BEGIN
1394fad6a16SStefano Zampini #undef __FUNCT__
1404fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetMaxLevels_BDDC"
1414fad6a16SStefano Zampini static PetscErrorCode PCBDDCSetMaxLevels_BDDC(PC pc,PetscInt max_levels)
1424fad6a16SStefano Zampini {
1434fad6a16SStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
1444fad6a16SStefano Zampini 
1454fad6a16SStefano Zampini   PetscFunctionBegin;
1464fad6a16SStefano Zampini   pcbddc->max_levels=max_levels;
1474fad6a16SStefano Zampini   PetscFunctionReturn(0);
1484fad6a16SStefano Zampini }
1494fad6a16SStefano Zampini EXTERN_C_END
1504fad6a16SStefano Zampini #undef __FUNCT__
1514fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetMaxLevels"
1524fad6a16SStefano Zampini /*@
1534fad6a16SStefano Zampini  PCBDDCSetMaxLevels - Sets the maximum number of levels within the multilevel approach.
1544fad6a16SStefano Zampini 
1554fad6a16SStefano Zampini    Logically collective on PC
1564fad6a16SStefano Zampini 
1574fad6a16SStefano Zampini    Input Parameters:
1584fad6a16SStefano Zampini +  pc - the preconditioning context
1594fad6a16SStefano Zampini -  max_levels - the maximum number of levels
1604fad6a16SStefano Zampini 
1614fad6a16SStefano Zampini    Default value is 1, i.e. coarse problem will be solved inexactly with one application
1624fad6a16SStefano Zampini    of PCBDDC preconditioner if the multilevel approach is requested.
1634fad6a16SStefano Zampini 
1644fad6a16SStefano Zampini    Level: intermediate
1654fad6a16SStefano Zampini 
1664fad6a16SStefano Zampini    Notes:
1674fad6a16SStefano Zampini 
1684fad6a16SStefano Zampini .seealso: PCBDDC
1694fad6a16SStefano Zampini @*/
1704fad6a16SStefano Zampini PetscErrorCode PCBDDCSetMaxLevels(PC pc,PetscInt max_levels)
1714fad6a16SStefano Zampini {
1724fad6a16SStefano Zampini   PetscErrorCode ierr;
1734fad6a16SStefano Zampini 
1744fad6a16SStefano Zampini   PetscFunctionBegin;
1754fad6a16SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
1764fad6a16SStefano Zampini   ierr = PetscTryMethod(pc,"PCBDDCSetMaxLevels_C",(PC,PetscInt),(pc,max_levels));CHKERRQ(ierr);
1774fad6a16SStefano Zampini   PetscFunctionReturn(0);
1784fad6a16SStefano Zampini }
1794fad6a16SStefano Zampini /* -------------------------------------------------------------------------- */
1804fad6a16SStefano Zampini EXTERN_C_BEGIN
1814fad6a16SStefano Zampini #undef __FUNCT__
1820bdf917eSStefano Zampini #define __FUNCT__ "PCBDDCSetNullSpace_BDDC"
1830bdf917eSStefano Zampini static PetscErrorCode PCBDDCSetNullSpace_BDDC(PC pc,MatNullSpace NullSpace)
1840bdf917eSStefano Zampini {
1850bdf917eSStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
1860bdf917eSStefano Zampini   PetscErrorCode ierr;
1870bdf917eSStefano Zampini 
1880bdf917eSStefano Zampini   PetscFunctionBegin;
1890bdf917eSStefano Zampini   ierr = PetscObjectReference((PetscObject)NullSpace);CHKERRQ(ierr);
1900bdf917eSStefano Zampini   ierr = MatNullSpaceDestroy(&pcbddc->NullSpace);CHKERRQ(ierr);
1910bdf917eSStefano Zampini   pcbddc->NullSpace=NullSpace;
1920bdf917eSStefano Zampini   PetscFunctionReturn(0);
1930bdf917eSStefano Zampini }
1940bdf917eSStefano Zampini EXTERN_C_END
1950bdf917eSStefano Zampini #undef __FUNCT__
1960bdf917eSStefano Zampini #define __FUNCT__ "PCBDDCSetNullSpace"
1970bdf917eSStefano Zampini /*@
1980bdf917eSStefano Zampini  PCBDDCSetNullSpace - Set NullSpace of global operator of BDDC preconditioned mat.
1990bdf917eSStefano Zampini 
2000bdf917eSStefano Zampini    Logically collective on PC and MatNullSpace
2010bdf917eSStefano Zampini 
2020bdf917eSStefano Zampini    Input Parameters:
2030bdf917eSStefano Zampini +  pc - the preconditioning context
2040bdf917eSStefano Zampini -  NullSpace - Null space of the linear operator to be preconditioned.
2050bdf917eSStefano Zampini 
2060bdf917eSStefano Zampini    Level: intermediate
2070bdf917eSStefano Zampini 
2080bdf917eSStefano Zampini    Notes:
2090bdf917eSStefano Zampini 
2100bdf917eSStefano Zampini .seealso: PCBDDC
2110bdf917eSStefano Zampini @*/
2120bdf917eSStefano Zampini PetscErrorCode PCBDDCSetNullSpace(PC pc,MatNullSpace NullSpace)
2130bdf917eSStefano Zampini {
2140bdf917eSStefano Zampini   PetscErrorCode ierr;
2150bdf917eSStefano Zampini 
2160bdf917eSStefano Zampini   PetscFunctionBegin;
2170bdf917eSStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
2180bdf917eSStefano Zampini   ierr = PetscTryMethod(pc,"PCBDDCSetNullSpace_C",(PC,MatNullSpace),(pc,NullSpace));CHKERRQ(ierr);
2190bdf917eSStefano Zampini   PetscFunctionReturn(0);
2200bdf917eSStefano Zampini }
2210bdf917eSStefano Zampini /* -------------------------------------------------------------------------- */
2220bdf917eSStefano Zampini EXTERN_C_BEGIN
2230bdf917eSStefano Zampini #undef __FUNCT__
2243b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCSetDirichletBoundaries_BDDC"
2253b03a366Sstefano_zampini static PetscErrorCode PCBDDCSetDirichletBoundaries_BDDC(PC pc,IS DirichletBoundaries)
2263b03a366Sstefano_zampini {
2273b03a366Sstefano_zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
2283b03a366Sstefano_zampini   PetscErrorCode ierr;
2293b03a366Sstefano_zampini 
2303b03a366Sstefano_zampini   PetscFunctionBegin;
2313b03a366Sstefano_zampini   ierr = ISDestroy(&pcbddc->DirichletBoundaries);CHKERRQ(ierr);
23236e030ebSStefano Zampini   ierr = PetscObjectReference((PetscObject)DirichletBoundaries);CHKERRQ(ierr);
23336e030ebSStefano Zampini   pcbddc->DirichletBoundaries=DirichletBoundaries;
2343b03a366Sstefano_zampini   PetscFunctionReturn(0);
2353b03a366Sstefano_zampini }
2363b03a366Sstefano_zampini EXTERN_C_END
2373b03a366Sstefano_zampini #undef __FUNCT__
2383b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCSetDirichletBoundaries"
2393b03a366Sstefano_zampini /*@
240da1bb401SStefano Zampini  PCBDDCSetDirichletBoundaries - Set index set defining subdomain part (in local ordering)
241da1bb401SStefano Zampini                               of Dirichlet boundaries for the global problem.
2423b03a366Sstefano_zampini 
2433b03a366Sstefano_zampini    Not collective
2443b03a366Sstefano_zampini 
2453b03a366Sstefano_zampini    Input Parameters:
2463b03a366Sstefano_zampini +  pc - the preconditioning context
2473b03a366Sstefano_zampini -  DirichletBoundaries - sequential index set defining the subdomain part of Dirichlet boundaries (can be PETSC_NULL)
2483b03a366Sstefano_zampini 
2493b03a366Sstefano_zampini    Level: intermediate
2503b03a366Sstefano_zampini 
2513b03a366Sstefano_zampini    Notes:
2523b03a366Sstefano_zampini 
2533b03a366Sstefano_zampini .seealso: PCBDDC
2543b03a366Sstefano_zampini @*/
2553b03a366Sstefano_zampini PetscErrorCode PCBDDCSetDirichletBoundaries(PC pc,IS DirichletBoundaries)
2563b03a366Sstefano_zampini {
2573b03a366Sstefano_zampini   PetscErrorCode ierr;
2583b03a366Sstefano_zampini 
2593b03a366Sstefano_zampini   PetscFunctionBegin;
2603b03a366Sstefano_zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
2613b03a366Sstefano_zampini   ierr = PetscTryMethod(pc,"PCBDDCSetDirichletBoundaries_C",(PC,IS),(pc,DirichletBoundaries));CHKERRQ(ierr);
2623b03a366Sstefano_zampini   PetscFunctionReturn(0);
2633b03a366Sstefano_zampini }
2643b03a366Sstefano_zampini /* -------------------------------------------------------------------------- */
2653b03a366Sstefano_zampini EXTERN_C_BEGIN
2663b03a366Sstefano_zampini #undef __FUNCT__
2670c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetNeumannBoundaries_BDDC"
26853cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetNeumannBoundaries_BDDC(PC pc,IS NeumannBoundaries)
2690c7d97c5SJed Brown {
2700c7d97c5SJed Brown   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
27153cdbc3dSStefano Zampini   PetscErrorCode ierr;
2720c7d97c5SJed Brown 
2730c7d97c5SJed Brown   PetscFunctionBegin;
27453cdbc3dSStefano Zampini   ierr = ISDestroy(&pcbddc->NeumannBoundaries);CHKERRQ(ierr);
27536e030ebSStefano Zampini   ierr = PetscObjectReference((PetscObject)NeumannBoundaries);CHKERRQ(ierr);
27636e030ebSStefano Zampini   pcbddc->NeumannBoundaries=NeumannBoundaries;
2770c7d97c5SJed Brown   PetscFunctionReturn(0);
2780c7d97c5SJed Brown }
2790c7d97c5SJed Brown EXTERN_C_END
2800c7d97c5SJed Brown #undef __FUNCT__
2810c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetNeumannBoundaries"
28257527edcSJed Brown /*@
283da1bb401SStefano Zampini  PCBDDCSetNeumannBoundaries - Set index set defining subdomain part (in local ordering)
284da1bb401SStefano Zampini                               of Neumann boundaries for the global problem.
28557527edcSJed Brown 
2869c0446d6SStefano Zampini    Not collective
28757527edcSJed Brown 
28857527edcSJed Brown    Input Parameters:
28957527edcSJed Brown +  pc - the preconditioning context
2909c0446d6SStefano Zampini -  NeumannBoundaries - sequential index set defining the subdomain part of Neumann boundaries (can be PETSC_NULL)
29157527edcSJed Brown 
29257527edcSJed Brown    Level: intermediate
29357527edcSJed Brown 
29457527edcSJed Brown    Notes:
29557527edcSJed Brown 
29657527edcSJed Brown .seealso: PCBDDC
29757527edcSJed Brown @*/
29853cdbc3dSStefano Zampini PetscErrorCode PCBDDCSetNeumannBoundaries(PC pc,IS NeumannBoundaries)
2990c7d97c5SJed Brown {
3000c7d97c5SJed Brown   PetscErrorCode ierr;
3010c7d97c5SJed Brown 
3020c7d97c5SJed Brown   PetscFunctionBegin;
3030c7d97c5SJed Brown   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
30453cdbc3dSStefano Zampini   ierr = PetscTryMethod(pc,"PCBDDCSetNeumannBoundaries_C",(PC,IS),(pc,NeumannBoundaries));CHKERRQ(ierr);
30553cdbc3dSStefano Zampini   PetscFunctionReturn(0);
30653cdbc3dSStefano Zampini }
30753cdbc3dSStefano Zampini /* -------------------------------------------------------------------------- */
30853cdbc3dSStefano Zampini EXTERN_C_BEGIN
30953cdbc3dSStefano Zampini #undef __FUNCT__
310da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCGetDirichletBoundaries_BDDC"
311da1bb401SStefano Zampini static PetscErrorCode PCBDDCGetDirichletBoundaries_BDDC(PC pc,IS *DirichletBoundaries)
312da1bb401SStefano Zampini {
313da1bb401SStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
314da1bb401SStefano Zampini 
315da1bb401SStefano Zampini   PetscFunctionBegin;
316da1bb401SStefano Zampini   *DirichletBoundaries = pcbddc->DirichletBoundaries;
317da1bb401SStefano Zampini   PetscFunctionReturn(0);
318da1bb401SStefano Zampini }
319da1bb401SStefano Zampini EXTERN_C_END
320da1bb401SStefano Zampini #undef __FUNCT__
321da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCGetDirichletBoundaries"
322da1bb401SStefano Zampini /*@
323da1bb401SStefano Zampini  PCBDDCGetDirichletBoundaries - Get index set defining subdomain part (in local ordering)
324da1bb401SStefano Zampini                                 of Dirichlet boundaries for the global problem.
325da1bb401SStefano Zampini 
326da1bb401SStefano Zampini    Not collective
327da1bb401SStefano Zampini 
328da1bb401SStefano Zampini    Input Parameters:
329da1bb401SStefano Zampini +  pc - the preconditioning context
330da1bb401SStefano Zampini 
331da1bb401SStefano Zampini    Output Parameters:
332da1bb401SStefano Zampini +  DirichletBoundaries - index set defining the subdomain part of Dirichlet boundaries
333da1bb401SStefano Zampini 
334da1bb401SStefano Zampini    Level: intermediate
335da1bb401SStefano Zampini 
336da1bb401SStefano Zampini    Notes:
337da1bb401SStefano Zampini 
338da1bb401SStefano Zampini .seealso: PCBDDC
339da1bb401SStefano Zampini @*/
340da1bb401SStefano Zampini PetscErrorCode PCBDDCGetDirichletBoundaries(PC pc,IS *DirichletBoundaries)
341da1bb401SStefano Zampini {
342da1bb401SStefano Zampini   PetscErrorCode ierr;
343da1bb401SStefano Zampini 
344da1bb401SStefano Zampini   PetscFunctionBegin;
345da1bb401SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
346da1bb401SStefano Zampini   ierr = PetscUseMethod(pc,"PCBDDCGetDirichletBoundaries_C",(PC,IS*),(pc,DirichletBoundaries));CHKERRQ(ierr);
347da1bb401SStefano Zampini   PetscFunctionReturn(0);
348da1bb401SStefano Zampini }
349da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
350da1bb401SStefano Zampini EXTERN_C_BEGIN
351da1bb401SStefano Zampini #undef __FUNCT__
35253cdbc3dSStefano Zampini #define __FUNCT__ "PCBDDCGetNeumannBoundaries_BDDC"
35353cdbc3dSStefano Zampini static PetscErrorCode PCBDDCGetNeumannBoundaries_BDDC(PC pc,IS *NeumannBoundaries)
35453cdbc3dSStefano Zampini {
35553cdbc3dSStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
35653cdbc3dSStefano Zampini 
35753cdbc3dSStefano Zampini   PetscFunctionBegin;
35853cdbc3dSStefano Zampini   *NeumannBoundaries = pcbddc->NeumannBoundaries;
35953cdbc3dSStefano Zampini   PetscFunctionReturn(0);
36053cdbc3dSStefano Zampini }
36153cdbc3dSStefano Zampini EXTERN_C_END
36253cdbc3dSStefano Zampini #undef __FUNCT__
36353cdbc3dSStefano Zampini #define __FUNCT__ "PCBDDCGetNeumannBoundaries"
36453cdbc3dSStefano Zampini /*@
365da1bb401SStefano Zampini  PCBDDCGetNeumannBoundaries - Get index set defining subdomain part (in local ordering)
366da1bb401SStefano Zampini                               of Neumann boundaries for the global problem.
36753cdbc3dSStefano Zampini 
3689c0446d6SStefano Zampini    Not collective
36953cdbc3dSStefano Zampini 
37053cdbc3dSStefano Zampini    Input Parameters:
37153cdbc3dSStefano Zampini +  pc - the preconditioning context
37253cdbc3dSStefano Zampini 
37353cdbc3dSStefano Zampini    Output Parameters:
37453cdbc3dSStefano Zampini +  NeumannBoundaries - index set defining the subdomain part of Neumann boundaries
37553cdbc3dSStefano Zampini 
37653cdbc3dSStefano Zampini    Level: intermediate
37753cdbc3dSStefano Zampini 
37853cdbc3dSStefano Zampini    Notes:
37953cdbc3dSStefano Zampini 
38053cdbc3dSStefano Zampini .seealso: PCBDDC
38153cdbc3dSStefano Zampini @*/
38253cdbc3dSStefano Zampini PetscErrorCode PCBDDCGetNeumannBoundaries(PC pc,IS *NeumannBoundaries)
38353cdbc3dSStefano Zampini {
38453cdbc3dSStefano Zampini   PetscErrorCode ierr;
38553cdbc3dSStefano Zampini 
38653cdbc3dSStefano Zampini   PetscFunctionBegin;
38753cdbc3dSStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
38853cdbc3dSStefano Zampini   ierr = PetscUseMethod(pc,"PCBDDCGetNeumannBoundaries_C",(PC,IS*),(pc,NeumannBoundaries));CHKERRQ(ierr);
3890c7d97c5SJed Brown   PetscFunctionReturn(0);
3900c7d97c5SJed Brown }
39136e030ebSStefano Zampini /* -------------------------------------------------------------------------- */
39236e030ebSStefano Zampini EXTERN_C_BEGIN
39336e030ebSStefano Zampini #undef __FUNCT__
394da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetLocalAdjacencyGraph_BDDC"
395*1a83f524SJed Brown static PetscErrorCode PCBDDCSetLocalAdjacencyGraph_BDDC(PC pc, PetscInt nvtxs,const PetscInt xadj[],const PetscInt adjncy[], PetscCopyMode copymode)
39636e030ebSStefano Zampini {
39736e030ebSStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
398da1bb401SStefano Zampini   PCBDDCGraph    mat_graph=pcbddc->mat_graph;
399da1bb401SStefano Zampini   PetscErrorCode ierr;
40036e030ebSStefano Zampini 
40136e030ebSStefano Zampini   PetscFunctionBegin;
402da1bb401SStefano Zampini   mat_graph->nvtxs=nvtxs;
403da1bb401SStefano Zampini   ierr = PetscFree(mat_graph->xadj);CHKERRQ(ierr);
404da1bb401SStefano Zampini   ierr = PetscFree(mat_graph->adjncy);CHKERRQ(ierr);
405da1bb401SStefano Zampini   if (copymode == PETSC_COPY_VALUES) {
406da1bb401SStefano Zampini     ierr = PetscMalloc((mat_graph->nvtxs+1)*sizeof(PetscInt),&mat_graph->xadj);CHKERRQ(ierr);
407da1bb401SStefano Zampini     ierr = PetscMalloc(xadj[mat_graph->nvtxs]*sizeof(PetscInt),&mat_graph->adjncy);CHKERRQ(ierr);
408da1bb401SStefano Zampini     ierr = PetscMemcpy(mat_graph->xadj,xadj,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr);
409da1bb401SStefano Zampini     ierr = PetscMemcpy(mat_graph->adjncy,adjncy,xadj[mat_graph->nvtxs]*sizeof(PetscInt));CHKERRQ(ierr);
410da1bb401SStefano Zampini   } else if (copymode == PETSC_OWN_POINTER) {
411*1a83f524SJed Brown     mat_graph->xadj = (PetscInt*)xadj;
412*1a83f524SJed Brown     mat_graph->adjncy = (PetscInt*)adjncy;
413da1bb401SStefano Zampini   } else {
414da1bb401SStefano Zampini     SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_SUP,"Unsupported copy mode %d in %s\n",copymode,__FUNCT__);
415da1bb401SStefano Zampini   }
41636e030ebSStefano Zampini   PetscFunctionReturn(0);
41736e030ebSStefano Zampini }
41836e030ebSStefano Zampini EXTERN_C_END
41936e030ebSStefano Zampini #undef __FUNCT__
420da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetLocalAdjacencyGraph"
42136e030ebSStefano Zampini /*@
422da1bb401SStefano Zampini  PCBDDCSetLocalAdjacencyGraph - Set CSR graph of local matrix for use of PCBDDC.
42336e030ebSStefano Zampini 
42436e030ebSStefano Zampini    Not collective
42536e030ebSStefano Zampini 
42636e030ebSStefano Zampini    Input Parameters:
42736e030ebSStefano Zampini +  pc - the preconditioning context
428da1bb401SStefano Zampini -  nvtxs - number of local vertices of the graph
429da1bb401SStefano Zampini -  xadj, adjncy - the CSR graph
430da1bb401SStefano Zampini -  copymode - either PETSC_COPY_VALUES or PETSC_OWN_POINTER. In the former case the user must free the array passed in;
431da1bb401SStefano Zampini                                                              in the latter case, memory must be obtained with PetscMalloc.
43236e030ebSStefano Zampini 
43336e030ebSStefano Zampini    Level: intermediate
43436e030ebSStefano Zampini 
43536e030ebSStefano Zampini    Notes:
43636e030ebSStefano Zampini 
43736e030ebSStefano Zampini .seealso: PCBDDC
43836e030ebSStefano Zampini @*/
439*1a83f524SJed Brown PetscErrorCode PCBDDCSetLocalAdjacencyGraph(PC pc,PetscInt nvtxs,const PetscInt xadj[],const PetscInt adjncy[], PetscCopyMode copymode)
44036e030ebSStefano Zampini {
441da1bb401SStefano Zampini   PetscInt       nrows,ncols;
442da1bb401SStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
44336e030ebSStefano Zampini   PetscErrorCode ierr;
44436e030ebSStefano Zampini 
44536e030ebSStefano Zampini   PetscFunctionBegin;
44636e030ebSStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
447da1bb401SStefano Zampini   ierr = MatGetSize(matis->A,&nrows,&ncols);CHKERRQ(ierr);
448da1bb401SStefano Zampini   if (nvtxs != nrows) {
449da1bb401SStefano Zampini     SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Local adjacency size %d passed in %s differs from local problem size %d!\n",nvtxs,__FUNCT__,nrows);
450da1bb401SStefano Zampini   } else {
451*1a83f524SJed Brown     ierr = PetscTryMethod(pc,"PCBDDCSetLocalAdjacencyGraph_C",(PC,PetscInt,const PetscInt[],const PetscInt[],PetscCopyMode),(pc,nvtxs,xadj,adjncy,copymode));CHKERRQ(ierr);
452da1bb401SStefano Zampini   }
45336e030ebSStefano Zampini   PetscFunctionReturn(0);
45436e030ebSStefano Zampini }
4559c0446d6SStefano Zampini /* -------------------------------------------------------------------------- */
4569c0446d6SStefano Zampini EXTERN_C_BEGIN
4579c0446d6SStefano Zampini #undef __FUNCT__
4589c0446d6SStefano Zampini #define __FUNCT__ "PCBDDCSetDofsSplitting_BDDC"
4599c0446d6SStefano Zampini static PetscErrorCode PCBDDCSetDofsSplitting_BDDC(PC pc,PetscInt n_is, IS ISForDofs[])
4609c0446d6SStefano Zampini {
4619c0446d6SStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
4629c0446d6SStefano Zampini   PetscInt i;
4639c0446d6SStefano Zampini   PetscErrorCode ierr;
4649c0446d6SStefano Zampini 
4659c0446d6SStefano Zampini   PetscFunctionBegin;
466da1bb401SStefano Zampini   /* Destroy ISes if they were already set */
4679c0446d6SStefano Zampini   for (i=0;i<pcbddc->n_ISForDofs;i++) {
4689c0446d6SStefano Zampini     ierr = ISDestroy(&pcbddc->ISForDofs[i]);CHKERRQ(ierr);
4699c0446d6SStefano Zampini   }
470d11ae9bbSstefano_zampini   ierr = PetscFree(pcbddc->ISForDofs);CHKERRQ(ierr);
471da1bb401SStefano Zampini   /* allocate space then set */
4729c0446d6SStefano Zampini   ierr = PetscMalloc(n_is*sizeof(IS),&pcbddc->ISForDofs);CHKERRQ(ierr);
4739c0446d6SStefano Zampini   for (i=0;i<n_is;i++) {
474da1bb401SStefano Zampini     ierr = PetscObjectReference((PetscObject)ISForDofs[i]);CHKERRQ(ierr);
475da1bb401SStefano Zampini     pcbddc->ISForDofs[i]=ISForDofs[i];
4769c0446d6SStefano Zampini   }
4779c0446d6SStefano Zampini   pcbddc->n_ISForDofs=n_is;
4789c0446d6SStefano Zampini   PetscFunctionReturn(0);
4799c0446d6SStefano Zampini }
4809c0446d6SStefano Zampini EXTERN_C_END
4819c0446d6SStefano Zampini #undef __FUNCT__
4829c0446d6SStefano Zampini #define __FUNCT__ "PCBDDCSetDofsSplitting"
4839c0446d6SStefano Zampini /*@
484da1bb401SStefano Zampini  PCBDDCSetDofsSplitting - Set index sets defining fields of local mat.
4859c0446d6SStefano Zampini 
4869c0446d6SStefano Zampini    Not collective
4879c0446d6SStefano Zampini 
4889c0446d6SStefano Zampini    Input Parameters:
4899c0446d6SStefano Zampini +  pc - the preconditioning context
490da1bb401SStefano Zampini -  n - number of index sets defining the fields
491da1bb401SStefano Zampini -  IS[] - array of IS describing the fields
4929c0446d6SStefano Zampini 
4939c0446d6SStefano Zampini    Level: intermediate
4949c0446d6SStefano Zampini 
4959c0446d6SStefano Zampini    Notes:
4969c0446d6SStefano Zampini 
4979c0446d6SStefano Zampini .seealso: PCBDDC
4989c0446d6SStefano Zampini @*/
4999c0446d6SStefano Zampini PetscErrorCode PCBDDCSetDofsSplitting(PC pc,PetscInt n_is, IS ISForDofs[])
5009c0446d6SStefano Zampini {
5019c0446d6SStefano Zampini   PetscErrorCode ierr;
5029c0446d6SStefano Zampini 
5039c0446d6SStefano Zampini   PetscFunctionBegin;
5049c0446d6SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
5059c0446d6SStefano Zampini   ierr = PetscTryMethod(pc,"PCBDDCSetDofsSplitting_C",(PC,PetscInt,IS[]),(pc,n_is,ISForDofs));CHKERRQ(ierr);
5069c0446d6SStefano Zampini   PetscFunctionReturn(0);
5079c0446d6SStefano Zampini }
508da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
509534831adSStefano Zampini #undef __FUNCT__
510534831adSStefano Zampini #define __FUNCT__ "PCPreSolve_BDDC"
511534831adSStefano Zampini /* -------------------------------------------------------------------------- */
512534831adSStefano Zampini /*
513534831adSStefano Zampini    PCPreSolve_BDDC - Changes the right hand side and (if necessary) the initial
514534831adSStefano Zampini                      guess if a transformation of basis approach has been selected.
5159c0446d6SStefano Zampini 
516534831adSStefano Zampini    Input Parameter:
517534831adSStefano Zampini +  pc - the preconditioner contex
518534831adSStefano Zampini 
519534831adSStefano Zampini    Application Interface Routine: PCPreSolve()
520534831adSStefano Zampini 
521534831adSStefano Zampini    Notes:
522534831adSStefano Zampini    The interface routine PCPreSolve() is not usually called directly by
523534831adSStefano Zampini    the user, but instead is called by KSPSolve().
524534831adSStefano Zampini */
525534831adSStefano Zampini static PetscErrorCode PCPreSolve_BDDC(PC pc, KSP ksp, Vec rhs, Vec x)
526534831adSStefano Zampini {
527534831adSStefano Zampini   PetscErrorCode ierr;
528534831adSStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
529534831adSStefano Zampini   PC_IS          *pcis = (PC_IS*)(pc->data);
530534831adSStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
531534831adSStefano Zampini   Mat            temp_mat;
5323972b0daSStefano Zampini   IS             dirIS;
5333972b0daSStefano Zampini   PetscInt       dirsize,i,*is_indices;
5343972b0daSStefano Zampini   PetscScalar    *array_x,*array_diagonal;
5353972b0daSStefano Zampini   Vec            used_vec;
5363972b0daSStefano Zampini   PetscBool      guess_nonzero;
537534831adSStefano Zampini 
538534831adSStefano Zampini   PetscFunctionBegin;
5393972b0daSStefano Zampini   if (x) {
5403972b0daSStefano Zampini     ierr = PetscObjectReference((PetscObject)x);CHKERRQ(ierr);
5413972b0daSStefano Zampini     used_vec = x;
5423972b0daSStefano Zampini   } else {
5433972b0daSStefano Zampini     ierr = PetscObjectReference((PetscObject)pcbddc->temp_solution);CHKERRQ(ierr);
5443972b0daSStefano Zampini     used_vec = pcbddc->temp_solution;
5453972b0daSStefano Zampini     ierr = VecSet(used_vec,0.0);CHKERRQ(ierr);
5463972b0daSStefano Zampini   }
5473972b0daSStefano Zampini   /* hack into ksp data structure PCPreSolve comes earlier in src/ksp/ksp/interface/itfunc.c */
5483972b0daSStefano Zampini   if (ksp) {
5493972b0daSStefano Zampini     ierr = KSPGetInitialGuessNonzero(ksp,&guess_nonzero);CHKERRQ(ierr);
5503972b0daSStefano Zampini     if ( !guess_nonzero ) {
5513972b0daSStefano Zampini       ierr = VecSet(used_vec,0.0);CHKERRQ(ierr);
5523972b0daSStefano Zampini     }
5533972b0daSStefano Zampini   }
5543972b0daSStefano Zampini   /* store the original rhs */
5553972b0daSStefano Zampini   ierr = VecCopy(rhs,pcbddc->original_rhs);CHKERRQ(ierr);
5563972b0daSStefano Zampini 
5573972b0daSStefano Zampini   /* Take into account zeroed rows -> change rhs and store solution removed */
5583972b0daSStefano Zampini   ierr = MatGetDiagonal(pc->pmat,pcis->vec1_global);CHKERRQ(ierr);
5593972b0daSStefano Zampini   ierr = VecPointwiseDivide(pcis->vec1_global,rhs,pcis->vec1_global);CHKERRQ(ierr);
5603972b0daSStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5613972b0daSStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5623972b0daSStefano Zampini   ierr = VecScatterBegin(matis->ctx,used_vec,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5633972b0daSStefano Zampini   ierr = VecScatterEnd  (matis->ctx,used_vec,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5643972b0daSStefano Zampini   ierr = PCBDDCGetDirichletBoundaries(pc,&dirIS);CHKERRQ(ierr);
5653972b0daSStefano Zampini   if (dirIS) {
5663972b0daSStefano Zampini     ierr = ISGetSize(dirIS,&dirsize);CHKERRQ(ierr);
5673972b0daSStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array_x);CHKERRQ(ierr);
5683972b0daSStefano Zampini     ierr = VecGetArray(pcis->vec2_N,&array_diagonal);CHKERRQ(ierr);
5693972b0daSStefano Zampini     ierr = ISGetIndices(dirIS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
5703972b0daSStefano Zampini     for (i=0;i<dirsize;i++) {
5713972b0daSStefano Zampini       array_x[is_indices[i]]=array_diagonal[is_indices[i]];
5723972b0daSStefano Zampini     }
5733972b0daSStefano Zampini     ierr = ISRestoreIndices(dirIS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
5743972b0daSStefano Zampini     ierr = VecRestoreArray(pcis->vec2_N,&array_diagonal);CHKERRQ(ierr);
5753972b0daSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array_x);CHKERRQ(ierr);
5763972b0daSStefano Zampini   }
5773972b0daSStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
5783972b0daSStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
579b76ba322SStefano Zampini 
5803972b0daSStefano Zampini   /* remove the computed solution from the rhs */
5813972b0daSStefano Zampini   ierr = VecScale(used_vec,-1.0);CHKERRQ(ierr);
5823972b0daSStefano Zampini   ierr = MatMultAdd(pc->pmat,used_vec,rhs,rhs);CHKERRQ(ierr);
5833972b0daSStefano Zampini   ierr = VecScale(used_vec,-1.0);CHKERRQ(ierr);
584b76ba322SStefano Zampini 
585b76ba322SStefano Zampini   /* store partially computed solution and set initial guess */
5863972b0daSStefano Zampini   if (x) {
5873972b0daSStefano Zampini     ierr = VecCopy(used_vec,pcbddc->temp_solution);CHKERRQ(ierr);
5883972b0daSStefano Zampini     ierr = VecSet(used_vec,0.0);CHKERRQ(ierr);
589b76ba322SStefano Zampini     if (pcbddc->use_exact_dirichlet) {
590b76ba322SStefano Zampini       ierr = VecScatterBegin(pcis->global_to_D,rhs,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
591b76ba322SStefano Zampini       ierr = VecScatterEnd  (pcis->global_to_D,rhs,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
592b76ba322SStefano Zampini       ierr = KSPSolve(pcbddc->ksp_D,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
593b76ba322SStefano Zampini       ierr = VecScatterBegin(pcis->global_to_D,pcis->vec2_D,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
594b76ba322SStefano Zampini       ierr = VecScatterEnd  (pcis->global_to_D,pcis->vec2_D,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
595b76ba322SStefano Zampini       if (ksp) {
596b76ba322SStefano Zampini         ierr = KSPSetInitialGuessNonzero(ksp,PETSC_TRUE);CHKERRQ(ierr);
597b76ba322SStefano Zampini       }
598b76ba322SStefano Zampini     }
5993972b0daSStefano Zampini   }
600b76ba322SStefano Zampini 
601b76ba322SStefano Zampini   /* rhs change of basis */
602b76ba322SStefano Zampini   if (pcbddc->usechangeofbasis) {
603b76ba322SStefano Zampini     /* swap pointers for local matrices */
604b76ba322SStefano Zampini     temp_mat = matis->A;
605b76ba322SStefano Zampini     matis->A = pcbddc->local_mat;
606b76ba322SStefano Zampini     pcbddc->local_mat = temp_mat;
607b76ba322SStefano Zampini     /* Get local rhs and apply transformation of basis */
608b76ba322SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,rhs,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
609b76ba322SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,rhs,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
610b76ba322SStefano Zampini     /* from original basis to modified basis */
611b76ba322SStefano Zampini     ierr = MatMultTranspose(pcbddc->ChangeOfBasisMatrix,pcis->vec1_B,pcis->vec2_B);CHKERRQ(ierr);
612b76ba322SStefano Zampini     /* put back modified values into the global vec using INSERT_VALUES copy mode */
613b76ba322SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec2_B,rhs,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
614b76ba322SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec2_B,rhs,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
6150bdf917eSStefano Zampini     if (ksp && pcbddc->NullSpace) {
6160bdf917eSStefano Zampini       ierr = MatNullSpaceRemove(pcbddc->NullSpace,used_vec,PETSC_NULL);CHKERRQ(ierr);
6170bdf917eSStefano Zampini       ierr = MatNullSpaceRemove(pcbddc->NullSpace,rhs,PETSC_NULL);CHKERRQ(ierr);
618b76ba322SStefano Zampini     }
6190bdf917eSStefano Zampini   }
6200bdf917eSStefano Zampini   ierr = VecDestroy(&used_vec);CHKERRQ(ierr);
621534831adSStefano Zampini   PetscFunctionReturn(0);
622534831adSStefano Zampini }
623534831adSStefano Zampini /* -------------------------------------------------------------------------- */
624534831adSStefano Zampini #undef __FUNCT__
625534831adSStefano Zampini #define __FUNCT__ "PCPostSolve_BDDC"
626534831adSStefano Zampini /* -------------------------------------------------------------------------- */
627534831adSStefano Zampini /*
628534831adSStefano Zampini    PCPostSolve_BDDC - Changes the computed solution if a transformation of basis
629534831adSStefano Zampini                      approach has been selected. Also, restores rhs to its original state.
630534831adSStefano Zampini 
631534831adSStefano Zampini    Input Parameter:
632534831adSStefano Zampini +  pc - the preconditioner contex
633534831adSStefano Zampini 
634534831adSStefano Zampini    Application Interface Routine: PCPostSolve()
635534831adSStefano Zampini 
636534831adSStefano Zampini    Notes:
637534831adSStefano Zampini    The interface routine PCPostSolve() is not usually called directly by
638534831adSStefano Zampini    the user, but instead is called by KSPSolve().
639534831adSStefano Zampini */
640534831adSStefano Zampini static PetscErrorCode PCPostSolve_BDDC(PC pc, KSP ksp, Vec rhs, Vec x)
641534831adSStefano Zampini {
642534831adSStefano Zampini   PetscErrorCode ierr;
643534831adSStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
644534831adSStefano Zampini   PC_IS          *pcis = (PC_IS*)(pc->data);
645534831adSStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
646534831adSStefano Zampini   Mat            temp_mat;
647534831adSStefano Zampini 
648534831adSStefano Zampini   PetscFunctionBegin;
649534831adSStefano Zampini   if (pcbddc->usechangeofbasis) {
650534831adSStefano Zampini     /* swap pointers for local matrices */
651534831adSStefano Zampini     temp_mat = matis->A;
652534831adSStefano Zampini     matis->A = pcbddc->local_mat;
653534831adSStefano Zampini     pcbddc->local_mat = temp_mat;
654534831adSStefano Zampini     /* restore rhs to its original state */
6553425bc38SStefano Zampini     if (rhs) {
6563425bc38SStefano Zampini       ierr = VecCopy(pcbddc->original_rhs,rhs);CHKERRQ(ierr);
6573425bc38SStefano Zampini     }
658534831adSStefano Zampini     /* Get Local boundary and apply transformation of basis to solution vector */
659534831adSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,x,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
660534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,x,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
661534831adSStefano Zampini     /* from modified basis to original basis */
662534831adSStefano Zampini     ierr = MatMult(pcbddc->ChangeOfBasisMatrix,pcis->vec1_B,pcis->vec2_B);CHKERRQ(ierr);
663534831adSStefano Zampini     /* put back modified values into the global vec using INSERT_VALUES copy mode */
664534831adSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec2_B,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
665534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec2_B,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
666534831adSStefano Zampini   }
6673972b0daSStefano Zampini   /* add solution removed in presolve */
6683425bc38SStefano Zampini   if (x) {
6693425bc38SStefano Zampini     ierr = VecAXPY(x,1.0,pcbddc->temp_solution);CHKERRQ(ierr);
6703425bc38SStefano Zampini   }
671534831adSStefano Zampini   PetscFunctionReturn(0);
672534831adSStefano Zampini }
673534831adSStefano Zampini /* -------------------------------------------------------------------------- */
67453cdbc3dSStefano Zampini #undef __FUNCT__
67553cdbc3dSStefano Zampini #define __FUNCT__ "PCSetUp_BDDC"
6760c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
6770c7d97c5SJed Brown /*
6780c7d97c5SJed Brown    PCSetUp_BDDC - Prepares for the use of the BDDC preconditioner
6790c7d97c5SJed Brown                   by setting data structures and options.
6800c7d97c5SJed Brown 
6810c7d97c5SJed Brown    Input Parameter:
68253cdbc3dSStefano Zampini +  pc - the preconditioner context
6830c7d97c5SJed Brown 
6840c7d97c5SJed Brown    Application Interface Routine: PCSetUp()
6850c7d97c5SJed Brown 
6860c7d97c5SJed Brown    Notes:
6870c7d97c5SJed Brown    The interface routine PCSetUp() is not usually called directly by
6880c7d97c5SJed Brown    the user, but instead is called by PCApply() if necessary.
6890c7d97c5SJed Brown */
69053cdbc3dSStefano Zampini PetscErrorCode PCSetUp_BDDC(PC pc)
6910c7d97c5SJed Brown {
6920c7d97c5SJed Brown   PetscErrorCode ierr;
6930c7d97c5SJed Brown   PC_BDDC*       pcbddc   = (PC_BDDC*)pc->data;
6940c7d97c5SJed Brown 
6950c7d97c5SJed Brown   PetscFunctionBegin;
6960c7d97c5SJed Brown   if (!pc->setupcalled) {
6973b03a366Sstefano_zampini     /* For BDDC we need to define a local "Neumann" problem different to that defined in PCISSetup
6989c0446d6SStefano Zampini        So, we set to pcnone the Neumann problem of pcis in order to avoid unneeded computation
6990c7d97c5SJed Brown        Also, we decide to directly build the (same) Dirichlet problem */
7000c7d97c5SJed Brown     ierr = PetscOptionsSetValue("-is_localN_pc_type","none");CHKERRQ(ierr);
7010c7d97c5SJed Brown     ierr = PetscOptionsSetValue("-is_localD_pc_type","none");CHKERRQ(ierr);
7020c7d97c5SJed Brown     /* Set up all the "iterative substructuring" common block */
7030bdf917eSStefano Zampini 
7040c7d97c5SJed Brown     ierr = PCISSetUp(pc);CHKERRQ(ierr);
7053b03a366Sstefano_zampini     /* Get stdout for dbg */
706e269702eSStefano Zampini     if (pcbddc->dbg_flag) {
707e269702eSStefano Zampini       ierr = PetscViewerASCIIGetStdout(((PetscObject)pc)->comm,&pcbddc->dbg_viewer);CHKERRQ(ierr);
708e269702eSStefano Zampini       ierr = PetscViewerASCIISynchronizedAllow(pcbddc->dbg_viewer,PETSC_TRUE);CHKERRQ(ierr);
709e269702eSStefano Zampini     }
7103b03a366Sstefano_zampini     /* Analyze local interface */
7110c7d97c5SJed Brown     ierr = PCBDDCManageLocalBoundaries(pc);CHKERRQ(ierr);
7123b03a366Sstefano_zampini     /* Set up local constraint matrix */
7133b03a366Sstefano_zampini     ierr = PCBDDCCreateConstraintMatrix(pc);CHKERRQ(ierr);
7140c7d97c5SJed Brown     /* Create coarse and local stuffs used for evaluating action of preconditioner */
7150c7d97c5SJed Brown     ierr = PCBDDCCoarseSetUp(pc);CHKERRQ(ierr);
7160c7d97c5SJed Brown   }
7170c7d97c5SJed Brown   PetscFunctionReturn(0);
7180c7d97c5SJed Brown }
7190c7d97c5SJed Brown 
7200c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
7210c7d97c5SJed Brown /*
7220c7d97c5SJed Brown    PCApply_BDDC - Applies the BDDC preconditioner to a vector.
7230c7d97c5SJed Brown 
7240c7d97c5SJed Brown    Input Parameters:
7250c7d97c5SJed Brown .  pc - the preconditioner context
7260c7d97c5SJed Brown .  r - input vector (global)
7270c7d97c5SJed Brown 
7280c7d97c5SJed Brown    Output Parameter:
7290c7d97c5SJed Brown .  z - output vector (global)
7300c7d97c5SJed Brown 
7310c7d97c5SJed Brown    Application Interface Routine: PCApply()
7320c7d97c5SJed Brown  */
7330c7d97c5SJed Brown #undef __FUNCT__
7340c7d97c5SJed Brown #define __FUNCT__ "PCApply_BDDC"
73553cdbc3dSStefano Zampini PetscErrorCode PCApply_BDDC(PC pc,Vec r,Vec z)
7360c7d97c5SJed Brown {
7370c7d97c5SJed Brown   PC_IS             *pcis = (PC_IS*)(pc->data);
7380c7d97c5SJed Brown   PC_BDDC           *pcbddc = (PC_BDDC*)(pc->data);
7390c7d97c5SJed Brown   PetscErrorCode    ierr;
7403b03a366Sstefano_zampini   const PetscScalar one = 1.0;
7413b03a366Sstefano_zampini   const PetscScalar m_one = -1.0;
7422617d88aSStefano Zampini   const PetscScalar zero = 0.0;
7430c7d97c5SJed Brown 
7440c7d97c5SJed Brown /* This code is similar to that provided in nn.c for PCNN
7450c7d97c5SJed Brown    NN interface preconditioner changed to BDDC
7460c7d97c5SJed Brown    Added support for M_3 preconditioenr in the reference article (code is active if pcbddc->prec_type = PETSC_TRUE) */
7470c7d97c5SJed Brown 
7480c7d97c5SJed Brown   PetscFunctionBegin;
749b76ba322SStefano Zampini   if (!pcbddc->use_exact_dirichlet) {
7500c7d97c5SJed Brown     /* First Dirichlet solve */
7510c7d97c5SJed Brown     ierr = VecScatterBegin(pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7520c7d97c5SJed Brown     ierr = VecScatterEnd  (pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
75353cdbc3dSStefano Zampini     ierr = KSPSolve(pcbddc->ksp_D,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
7540c7d97c5SJed Brown     /*
7550c7d97c5SJed Brown       Assembling right hand side for BDDC operator
7560c7d97c5SJed Brown       - vec1_D for the Dirichlet part (if needed, i.e. prec_flag=PETSC_TRUE)
7570c7d97c5SJed Brown       - the interface part of the global vector z
7580c7d97c5SJed Brown     */
7590c7d97c5SJed Brown     ierr = VecScale(pcis->vec2_D,m_one);CHKERRQ(ierr);
7600c7d97c5SJed Brown     ierr = MatMult(pcis->A_BI,pcis->vec2_D,pcis->vec1_B);CHKERRQ(ierr);
7610c7d97c5SJed Brown     if (pcbddc->prec_type) { ierr = MatMultAdd(pcis->A_II,pcis->vec2_D,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); }
7620c7d97c5SJed Brown     ierr = VecScale(pcis->vec2_D,m_one);CHKERRQ(ierr);
7630c7d97c5SJed Brown     ierr = VecCopy(r,z);CHKERRQ(ierr);
7640c7d97c5SJed Brown     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
7650c7d97c5SJed Brown     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
7662617d88aSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7672617d88aSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
768b76ba322SStefano Zampini   } else {
769b76ba322SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,r,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
770b76ba322SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,r,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7710bdf917eSStefano Zampini     ierr = VecSet(pcis->vec1_D,zero);CHKERRQ(ierr);
772b76ba322SStefano Zampini     ierr = VecSet(pcis->vec2_D,zero);CHKERRQ(ierr);
773b76ba322SStefano Zampini   }
774b76ba322SStefano Zampini 
775b76ba322SStefano Zampini   /* Apply partition of unity */
7762617d88aSStefano Zampini   ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr);
7772617d88aSStefano Zampini 
7782617d88aSStefano Zampini   /* Apply interface preconditioner
7792617d88aSStefano Zampini      input/output vecs: pcis->vec1_B and pcis->vec1_D */
7802617d88aSStefano Zampini   ierr = PCBDDCApplyInterfacePreconditioner(pc);CHKERRQ(ierr);
7812617d88aSStefano Zampini 
7822617d88aSStefano Zampini   /* Apply partition of unity and sum boundary values */
7832617d88aSStefano Zampini   ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr);
7842617d88aSStefano Zampini   ierr = VecSet(z,zero);CHKERRQ(ierr);
7852617d88aSStefano Zampini   ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
7862617d88aSStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
7870c7d97c5SJed Brown 
7883b03a366Sstefano_zampini   /* Second Dirichlet solve and assembling of output */
7890c7d97c5SJed Brown   ierr = VecScatterBegin(pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7900c7d97c5SJed Brown   ierr = VecScatterEnd  (pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7910c7d97c5SJed Brown   ierr = MatMult(pcis->A_IB,pcis->vec1_B,pcis->vec3_D);CHKERRQ(ierr);
7920c7d97c5SJed Brown   if (pcbddc->prec_type) { ierr = MatMultAdd(pcis->A_II,pcis->vec1_D,pcis->vec3_D,pcis->vec3_D);CHKERRQ(ierr); }
79353cdbc3dSStefano Zampini   ierr = KSPSolve(pcbddc->ksp_D,pcis->vec3_D,pcbddc->vec4_D);CHKERRQ(ierr);
7940c7d97c5SJed Brown   ierr = VecScale(pcbddc->vec4_D,m_one);CHKERRQ(ierr);
7950c7d97c5SJed Brown   if (pcbddc->prec_type) { ierr = VecAXPY (pcbddc->vec4_D,one,pcis->vec1_D);CHKERRQ(ierr); }
7960c7d97c5SJed Brown   ierr = VecAXPY (pcis->vec2_D,one,pcbddc->vec4_D);CHKERRQ(ierr);
7970c7d97c5SJed Brown   ierr = VecScatterBegin(pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
7980c7d97c5SJed Brown   ierr = VecScatterEnd  (pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
7990c7d97c5SJed Brown   PetscFunctionReturn(0);
8000c7d97c5SJed Brown 
8010c7d97c5SJed Brown }
802da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
803da1bb401SStefano Zampini #undef __FUNCT__
804da1bb401SStefano Zampini #define __FUNCT__ "PCDestroy_BDDC"
805da1bb401SStefano Zampini PetscErrorCode PCDestroy_BDDC(PC pc)
806da1bb401SStefano Zampini {
807da1bb401SStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
8080bdf917eSStefano Zampini   PetscInt       i;
809da1bb401SStefano Zampini   PetscErrorCode ierr;
810da1bb401SStefano Zampini 
811da1bb401SStefano Zampini   PetscFunctionBegin;
812da1bb401SStefano Zampini   /* free data created by PCIS */
813da1bb401SStefano Zampini   ierr = PCISDestroy(pc);CHKERRQ(ierr);
814da1bb401SStefano Zampini   /* free BDDC data  */
8150bdf917eSStefano Zampini   ierr = MatNullSpaceDestroy(&pcbddc->CoarseNullSpace);CHKERRQ(ierr);
8160bdf917eSStefano Zampini   ierr = MatNullSpaceDestroy(&pcbddc->NullSpace);CHKERRQ(ierr);
8173972b0daSStefano Zampini   ierr = VecDestroy(&pcbddc->temp_solution);CHKERRQ(ierr);
818534831adSStefano Zampini   ierr = VecDestroy(&pcbddc->original_rhs);CHKERRQ(ierr);
819534831adSStefano Zampini   ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr);
820534831adSStefano Zampini   ierr = MatDestroy(&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr);
821da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->coarse_vec);CHKERRQ(ierr);
822da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->coarse_rhs);CHKERRQ(ierr);
823da1bb401SStefano Zampini   ierr = KSPDestroy(&pcbddc->coarse_ksp);CHKERRQ(ierr);
824da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->coarse_mat);CHKERRQ(ierr);
825da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->coarse_phi_B);CHKERRQ(ierr);
826da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->coarse_phi_D);CHKERRQ(ierr);
827da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec1_P);CHKERRQ(ierr);
828da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec1_C);CHKERRQ(ierr);
829da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->local_auxmat1);CHKERRQ(ierr);
830da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->local_auxmat2);CHKERRQ(ierr);
831da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec1_R);CHKERRQ(ierr);
832da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec2_R);CHKERRQ(ierr);
833da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec4_D);CHKERRQ(ierr);
834da1bb401SStefano Zampini   ierr = VecScatterDestroy(&pcbddc->R_to_B);CHKERRQ(ierr);
835da1bb401SStefano Zampini   ierr = VecScatterDestroy(&pcbddc->R_to_D);CHKERRQ(ierr);
836da1bb401SStefano Zampini   ierr = VecScatterDestroy(&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr);
837da1bb401SStefano Zampini   ierr = KSPDestroy(&pcbddc->ksp_D);CHKERRQ(ierr);
838da1bb401SStefano Zampini   ierr = KSPDestroy(&pcbddc->ksp_R);CHKERRQ(ierr);
839da1bb401SStefano Zampini   ierr = ISDestroy(&pcbddc->NeumannBoundaries);CHKERRQ(ierr);
840da1bb401SStefano Zampini   ierr = ISDestroy(&pcbddc->DirichletBoundaries);CHKERRQ(ierr);
841da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->ConstraintMatrix);CHKERRQ(ierr);
842da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->local_primal_indices);CHKERRQ(ierr);
843da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->replicated_local_primal_indices);CHKERRQ(ierr);
8440bdf917eSStefano Zampini   ierr = PetscFree(pcbddc->replicated_local_primal_values);CHKERRQ(ierr);
845da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->local_primal_displacements);CHKERRQ(ierr);
846da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->local_primal_sizes);CHKERRQ(ierr);
847da1bb401SStefano Zampini   for (i=0;i<pcbddc->n_ISForDofs;i++) { ierr = ISDestroy(&pcbddc->ISForDofs[i]);CHKERRQ(ierr); }
848da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->ISForDofs);CHKERRQ(ierr);
849da1bb401SStefano Zampini   for (i=0;i<pcbddc->n_ISForFaces;i++) { ierr = ISDestroy(&pcbddc->ISForFaces[i]);CHKERRQ(ierr); }
850da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->ISForFaces);CHKERRQ(ierr);
851da1bb401SStefano Zampini   for (i=0;i<pcbddc->n_ISForEdges;i++) { ierr = ISDestroy(&pcbddc->ISForEdges[i]);CHKERRQ(ierr); }
852da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->ISForEdges);CHKERRQ(ierr);
853da1bb401SStefano Zampini   ierr = ISDestroy(&pcbddc->ISForVertices);CHKERRQ(ierr);
8543972b0daSStefano Zampini   /* Free graph structure */
855da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->xadj);CHKERRQ(ierr);
856da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->adjncy);CHKERRQ(ierr);
857142dfd88SStefano Zampini   if (pcbddc->mat_graph->nvtxs) {
858da1bb401SStefano Zampini     ierr = PetscFree(pcbddc->mat_graph->neighbours_set[0]);CHKERRQ(ierr);
859142dfd88SStefano Zampini   }
860da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->neighbours_set);CHKERRQ(ierr);
8613972b0daSStefano Zampini   ierr = PetscFree4(pcbddc->mat_graph->where,pcbddc->mat_graph->count,pcbddc->mat_graph->cptr,pcbddc->mat_graph->queue);CHKERRQ(ierr);
8623972b0daSStefano Zampini   ierr = PetscFree2(pcbddc->mat_graph->which_dof,pcbddc->mat_graph->touched);CHKERRQ(ierr);
8633972b0daSStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->where_ncmps);CHKERRQ(ierr);
864da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph);CHKERRQ(ierr);
8653425bc38SStefano Zampini   /* remove functions */
8664fad6a16SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseningRatio_C","",PETSC_NULL);CHKERRQ(ierr);
8674fad6a16SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetMaxLevels_C","",PETSC_NULL);CHKERRQ(ierr);
8680bdf917eSStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNullSpace_C","",PETSC_NULL);CHKERRQ(ierr);
8693425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDirichletBoundaries_C","",PETSC_NULL);CHKERRQ(ierr);
8703425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNeumannBoundaries_C","",PETSC_NULL);CHKERRQ(ierr);
8713425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetDirichletBoundaries_C","",PETSC_NULL);CHKERRQ(ierr);
8723425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetNeumannBoundaries_C","",PETSC_NULL);CHKERRQ(ierr);
8733425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseProblemType_C","",PETSC_NULL);CHKERRQ(ierr);
8743425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDofsSplitting_C","",PETSC_NULL);CHKERRQ(ierr);
8753425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetLocalAdjacencyGraph_C","",PETSC_NULL);CHKERRQ(ierr);
8763425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPreSolve_C","",PETSC_NULL);CHKERRQ(ierr);
8773425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPostSolve_C","",PETSC_NULL);CHKERRQ(ierr);
8783425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCCreateFETIDPOperators_C","",PETSC_NULL);CHKERRQ(ierr);
8793425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetRHS_C","",PETSC_NULL);CHKERRQ(ierr);
8803425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetSolution_C","",PETSC_NULL);CHKERRQ(ierr);
881da1bb401SStefano Zampini   /* Free the private data structure that was hanging off the PC */
882da1bb401SStefano Zampini   ierr = PetscFree(pcbddc);CHKERRQ(ierr);
883da1bb401SStefano Zampini   PetscFunctionReturn(0);
884da1bb401SStefano Zampini }
8853425bc38SStefano Zampini /* -------------------------------------------------------------------------- */
8863425bc38SStefano Zampini EXTERN_C_BEGIN
8873425bc38SStefano Zampini #undef __FUNCT__
8883425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetRHS_BDDC"
8893425bc38SStefano Zampini static PetscErrorCode PCBDDCMatFETIDPGetRHS_BDDC(Mat fetidp_mat, Vec standard_rhs, Vec fetidp_flux_rhs)
8903425bc38SStefano Zampini {
8913425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
8923425bc38SStefano Zampini   PC_IS*         pcis;
8933425bc38SStefano Zampini   PC_BDDC*       pcbddc;
8943425bc38SStefano Zampini   PetscErrorCode ierr;
8950c7d97c5SJed Brown 
8963425bc38SStefano Zampini   PetscFunctionBegin;
8973425bc38SStefano Zampini   ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr);
8983425bc38SStefano Zampini   pcis = (PC_IS*)mat_ctx->pc->data;
8993425bc38SStefano Zampini   pcbddc = (PC_BDDC*)mat_ctx->pc->data;
9003425bc38SStefano Zampini 
9013425bc38SStefano Zampini   /* change of basis for physical rhs if needed
9023425bc38SStefano Zampini      It also changes the rhs in case of dirichlet boundaries */
9033425bc38SStefano Zampini   (*mat_ctx->pc->ops->presolve)(mat_ctx->pc,PETSC_NULL,standard_rhs,PETSC_NULL);
9043425bc38SStefano Zampini   /* store vectors for computation of fetidp final solution */
9053425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->global_to_D,standard_rhs,mat_ctx->temp_solution_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9063425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_D,standard_rhs,mat_ctx->temp_solution_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9073425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9083425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9093425bc38SStefano Zampini   /* scale rhs since it should be unassembled */
9103425bc38SStefano Zampini   ierr = VecPointwiseMult(mat_ctx->temp_solution_B,pcis->D,mat_ctx->temp_solution_B);CHKERRQ(ierr);
9113425bc38SStefano Zampini   if (!pcbddc->prec_type) {
9123425bc38SStefano Zampini     /* compute partially subassembled Schur complement right-hand side */
9133425bc38SStefano Zampini     ierr = KSPSolve(pcbddc->ksp_D,mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr);
9143425bc38SStefano Zampini     ierr = MatMult(pcis->A_BI,pcis->vec1_D,pcis->vec1_B);CHKERRQ(ierr);
9153425bc38SStefano Zampini     ierr = VecAXPY(mat_ctx->temp_solution_B,-1.0,pcis->vec1_B);CHKERRQ(ierr);
9163425bc38SStefano Zampini     ierr = VecSet(standard_rhs,0.0);CHKERRQ(ierr);
9173425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,mat_ctx->temp_solution_B,standard_rhs,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
9183425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,mat_ctx->temp_solution_B,standard_rhs,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
9193425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9203425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9213425bc38SStefano Zampini     ierr = VecPointwiseMult(mat_ctx->temp_solution_B,pcis->D,mat_ctx->temp_solution_B);CHKERRQ(ierr);
9223425bc38SStefano Zampini   }
9233425bc38SStefano Zampini   /* BDDC rhs */
9243425bc38SStefano Zampini   ierr = VecCopy(mat_ctx->temp_solution_B,pcis->vec1_B);CHKERRQ(ierr);
9253425bc38SStefano Zampini   if (pcbddc->prec_type) {
9263425bc38SStefano Zampini     ierr = VecCopy(mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr);
9273425bc38SStefano Zampini   }
9283425bc38SStefano Zampini   /* apply BDDC */
9293425bc38SStefano Zampini   ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr);
9303425bc38SStefano Zampini   /* Application of B_delta and assembling of rhs for fetidp fluxes */
9313425bc38SStefano Zampini   ierr = VecSet(fetidp_flux_rhs,0.0);CHKERRQ(ierr);
9323425bc38SStefano Zampini   ierr = MatMult(mat_ctx->B_delta,pcis->vec1_B,mat_ctx->lambda_local);CHKERRQ(ierr);
9333425bc38SStefano Zampini   ierr = VecScatterBegin(mat_ctx->l2g_lambda,mat_ctx->lambda_local,fetidp_flux_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9343425bc38SStefano Zampini   ierr = VecScatterEnd  (mat_ctx->l2g_lambda,mat_ctx->lambda_local,fetidp_flux_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9353425bc38SStefano Zampini   /* restore original rhs */
9363425bc38SStefano Zampini   ierr = VecCopy(pcbddc->original_rhs,standard_rhs);CHKERRQ(ierr);
9373425bc38SStefano Zampini   PetscFunctionReturn(0);
9383425bc38SStefano Zampini }
9393425bc38SStefano Zampini EXTERN_C_END
9403425bc38SStefano Zampini #undef __FUNCT__
9413425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetRHS"
9423425bc38SStefano Zampini /*@
9433425bc38SStefano Zampini  PCBDDCMatFETIDPGetRHS - Get rhs for FETIDP linear system.
9443425bc38SStefano Zampini 
9453425bc38SStefano Zampini    Collective
9463425bc38SStefano Zampini 
9473425bc38SStefano Zampini    Input Parameters:
9483425bc38SStefano Zampini +  fetidp_mat   - the FETIDP mat obtained by a call to PCBDDCCreateFETIDPOperators
9493425bc38SStefano Zampini +  standard_rhs - the rhs of your linear system
9503425bc38SStefano Zampini 
9513425bc38SStefano Zampini    Output Parameters:
9523425bc38SStefano Zampini +  fetidp_flux_rhs   - the rhs of the FETIDP linear system
9533425bc38SStefano Zampini 
9543425bc38SStefano Zampini    Level: developer
9553425bc38SStefano Zampini 
9563425bc38SStefano Zampini    Notes:
9573425bc38SStefano Zampini 
9583425bc38SStefano Zampini .seealso: PCBDDC
9593425bc38SStefano Zampini @*/
9603425bc38SStefano Zampini PetscErrorCode PCBDDCMatFETIDPGetRHS(Mat fetidp_mat, Vec standard_rhs, Vec fetidp_flux_rhs)
9613425bc38SStefano Zampini {
9623425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
9633425bc38SStefano Zampini   PetscErrorCode ierr;
9643425bc38SStefano Zampini 
9653425bc38SStefano Zampini   PetscFunctionBegin;
9663425bc38SStefano Zampini   ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr);
9673425bc38SStefano Zampini   ierr = PetscTryMethod(mat_ctx->pc,"PCBDDCMatFETIDPGetRHS_C",(Mat,Vec,Vec),(fetidp_mat,standard_rhs,fetidp_flux_rhs));CHKERRQ(ierr);
9683425bc38SStefano Zampini   PetscFunctionReturn(0);
9693425bc38SStefano Zampini }
9703425bc38SStefano Zampini /* -------------------------------------------------------------------------- */
9713425bc38SStefano Zampini EXTERN_C_BEGIN
9723425bc38SStefano Zampini #undef __FUNCT__
9733425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetSolution_BDDC"
9743425bc38SStefano Zampini static PetscErrorCode PCBDDCMatFETIDPGetSolution_BDDC(Mat fetidp_mat, Vec fetidp_flux_sol, Vec standard_sol)
9753425bc38SStefano Zampini {
9763425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
9773425bc38SStefano Zampini   PC_IS*         pcis;
9783425bc38SStefano Zampini   PC_BDDC*       pcbddc;
9793425bc38SStefano Zampini   PetscErrorCode ierr;
9803425bc38SStefano Zampini 
9813425bc38SStefano Zampini   PetscFunctionBegin;
9823425bc38SStefano Zampini   ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr);
9833425bc38SStefano Zampini   pcis = (PC_IS*)mat_ctx->pc->data;
9843425bc38SStefano Zampini   pcbddc = (PC_BDDC*)mat_ctx->pc->data;
9853425bc38SStefano Zampini 
9863425bc38SStefano Zampini   /* apply B_delta^T */
9873425bc38SStefano Zampini   ierr = VecScatterBegin(mat_ctx->l2g_lambda,fetidp_flux_sol,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
9883425bc38SStefano Zampini   ierr = VecScatterEnd  (mat_ctx->l2g_lambda,fetidp_flux_sol,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
9893425bc38SStefano Zampini   ierr = MatMultTranspose(mat_ctx->B_delta,mat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
9903425bc38SStefano Zampini   /* compute rhs for BDDC application */
9913425bc38SStefano Zampini   ierr = VecAYPX(pcis->vec1_B,-1.0,mat_ctx->temp_solution_B);CHKERRQ(ierr);
9923425bc38SStefano Zampini   if (pcbddc->prec_type) {
9933425bc38SStefano Zampini     ierr = VecCopy(mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr);
9943425bc38SStefano Zampini   }
9953425bc38SStefano Zampini   /* apply BDDC */
9963425bc38SStefano Zampini   ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr);
9973425bc38SStefano Zampini   /* put values into standard global vector */
9983425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
9993425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
10003425bc38SStefano Zampini   if (!pcbddc->prec_type) {
10013425bc38SStefano Zampini     /* compute values into the interior if solved for the partially subassembled Schur complement */
10023425bc38SStefano Zampini     ierr = MatMult(pcis->A_IB,pcis->vec1_B,pcis->vec1_D);CHKERRQ(ierr);
10033425bc38SStefano Zampini     ierr = VecAXPY(mat_ctx->temp_solution_D,-1.0,pcis->vec1_D);CHKERRQ(ierr);
10043425bc38SStefano Zampini     ierr = KSPSolve(pcbddc->ksp_D,mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr);
10053425bc38SStefano Zampini   }
10063425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->global_to_D,pcis->vec1_D,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
10073425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_D,pcis->vec1_D,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
10083425bc38SStefano Zampini   /* final change of basis if needed
10093425bc38SStefano Zampini      Is also sums the dirichlet part removed during RHS assembling */
10103425bc38SStefano Zampini   (*mat_ctx->pc->ops->postsolve)(mat_ctx->pc,PETSC_NULL,PETSC_NULL,standard_sol);
10113425bc38SStefano Zampini   PetscFunctionReturn(0);
10123425bc38SStefano Zampini 
10133425bc38SStefano Zampini }
10143425bc38SStefano Zampini EXTERN_C_END
10153425bc38SStefano Zampini #undef __FUNCT__
10163425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetSolution"
10173425bc38SStefano Zampini /*@
10183425bc38SStefano Zampini  PCBDDCMatFETIDPGetSolution - Get Solution for FETIDP linear system.
10193425bc38SStefano Zampini 
10203425bc38SStefano Zampini    Collective
10213425bc38SStefano Zampini 
10223425bc38SStefano Zampini    Input Parameters:
10233425bc38SStefano Zampini +  fetidp_mat        - the FETIDP mat obtained by a call to PCBDDCCreateFETIDPOperators
10243425bc38SStefano Zampini +  fetidp_flux_sol - the solution of the FETIDP linear system
10253425bc38SStefano Zampini 
10263425bc38SStefano Zampini    Output Parameters:
10273425bc38SStefano Zampini +  standard_sol      - the solution on the global domain
10283425bc38SStefano Zampini 
10293425bc38SStefano Zampini    Level: developer
10303425bc38SStefano Zampini 
10313425bc38SStefano Zampini    Notes:
10323425bc38SStefano Zampini 
10333425bc38SStefano Zampini .seealso: PCBDDC
10343425bc38SStefano Zampini @*/
10353425bc38SStefano Zampini PetscErrorCode PCBDDCMatFETIDPGetSolution(Mat fetidp_mat, Vec fetidp_flux_sol, Vec standard_sol)
10363425bc38SStefano Zampini {
10373425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
10383425bc38SStefano Zampini   PetscErrorCode ierr;
10393425bc38SStefano Zampini 
10403425bc38SStefano Zampini   PetscFunctionBegin;
10413425bc38SStefano Zampini   ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr);
10423425bc38SStefano Zampini   ierr = PetscTryMethod(mat_ctx->pc,"PCBDDCMatFETIDPGetSolution_C",(Mat,Vec,Vec),(fetidp_mat,fetidp_flux_sol,standard_sol));CHKERRQ(ierr);
10433425bc38SStefano Zampini   PetscFunctionReturn(0);
10443425bc38SStefano Zampini }
10453425bc38SStefano Zampini /* -------------------------------------------------------------------------- */
10463425bc38SStefano Zampini EXTERN_C_BEGIN
10473425bc38SStefano Zampini #undef __FUNCT__
10483425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPOperators_BDDC"
10493425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPOperators_BDDC(PC pc, Mat *fetidp_mat, PC *fetidp_pc)
10503425bc38SStefano Zampini {
10513425bc38SStefano Zampini   PETSC_EXTERN PetscErrorCode FETIDPMatMult(Mat,Vec,Vec);
10523425bc38SStefano Zampini   PETSC_EXTERN PetscErrorCode PCBDDCDestroyFETIDPMat(Mat);
10533425bc38SStefano Zampini   PETSC_EXTERN PetscErrorCode FETIDPPCApply(PC,Vec,Vec);
10543425bc38SStefano Zampini   PETSC_EXTERN PetscErrorCode PCBDDCDestroyFETIDPPC(PC);
10553425bc38SStefano Zampini 
10563425bc38SStefano Zampini   FETIDPMat_ctx  *fetidpmat_ctx;
10573425bc38SStefano Zampini   Mat            newmat;
10583425bc38SStefano Zampini   FETIDPPC_ctx  *fetidppc_ctx;
10593425bc38SStefano Zampini   PC             newpc;
10603425bc38SStefano Zampini   MPI_Comm       comm = ((PetscObject)pc)->comm;
10613425bc38SStefano Zampini   PetscErrorCode ierr;
10623425bc38SStefano Zampini 
10633425bc38SStefano Zampini   PetscFunctionBegin;
10643425bc38SStefano Zampini   /* FETIDP linear matrix */
10653425bc38SStefano Zampini   ierr = PCBDDCCreateFETIDPMatContext(pc, &fetidpmat_ctx);CHKERRQ(ierr);
10663425bc38SStefano Zampini   ierr = PCBDDCSetupFETIDPMatContext(fetidpmat_ctx);CHKERRQ(ierr);
10673425bc38SStefano Zampini   ierr = MatCreateShell(comm,PETSC_DECIDE,PETSC_DECIDE,fetidpmat_ctx->n_lambda,fetidpmat_ctx->n_lambda,fetidpmat_ctx,&newmat);CHKERRQ(ierr);
10683425bc38SStefano Zampini   ierr = MatShellSetOperation(newmat,MATOP_MULT,(void (*)(void))FETIDPMatMult);CHKERRQ(ierr);
10693425bc38SStefano Zampini   ierr = MatShellSetOperation(newmat,MATOP_DESTROY,(void (*)(void))PCBDDCDestroyFETIDPMat);CHKERRQ(ierr);
10703425bc38SStefano Zampini   ierr = MatSetUp(newmat);CHKERRQ(ierr);
10713425bc38SStefano Zampini   /* FETIDP preconditioner */
10723425bc38SStefano Zampini   ierr = PCBDDCCreateFETIDPPCContext(pc, &fetidppc_ctx);CHKERRQ(ierr);
10733425bc38SStefano Zampini   ierr = PCBDDCSetupFETIDPPCContext(newmat,fetidppc_ctx);CHKERRQ(ierr);
10743425bc38SStefano Zampini   ierr = PCCreate(comm,&newpc);CHKERRQ(ierr);
10753425bc38SStefano Zampini   ierr = PCSetType(newpc,PCSHELL);CHKERRQ(ierr);
10763425bc38SStefano Zampini   ierr = PCShellSetContext(newpc,fetidppc_ctx);CHKERRQ(ierr);
10773425bc38SStefano Zampini   ierr = PCShellSetApply(newpc,FETIDPPCApply);CHKERRQ(ierr);
10783425bc38SStefano Zampini   ierr = PCShellSetDestroy(newpc,PCBDDCDestroyFETIDPPC);CHKERRQ(ierr);
10793425bc38SStefano Zampini   ierr = PCSetOperators(newpc,newmat,newmat,SAME_PRECONDITIONER);CHKERRQ(ierr);
10803425bc38SStefano Zampini   ierr = PCSetUp(newpc);CHKERRQ(ierr);
10813425bc38SStefano Zampini   /* return pointers for objects created */
10823425bc38SStefano Zampini   *fetidp_mat=newmat;
10833425bc38SStefano Zampini   *fetidp_pc=newpc;
10843425bc38SStefano Zampini 
10853425bc38SStefano Zampini   PetscFunctionReturn(0);
10863425bc38SStefano Zampini }
10873425bc38SStefano Zampini EXTERN_C_END
10883425bc38SStefano Zampini #undef __FUNCT__
10893425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPOperators"
10903425bc38SStefano Zampini /*@
10913425bc38SStefano Zampini  PCBDDCCreateFETIDPOperators - Create operators for FETIDP.
10923425bc38SStefano Zampini 
10933425bc38SStefano Zampini    Collective
10943425bc38SStefano Zampini 
10953425bc38SStefano Zampini    Input Parameters:
10963425bc38SStefano Zampini +  pc - the BDDC preconditioning context (setup must be already called)
10973425bc38SStefano Zampini 
10983425bc38SStefano Zampini    Level: developer
10993425bc38SStefano Zampini 
11003425bc38SStefano Zampini    Notes:
11013425bc38SStefano Zampini 
11023425bc38SStefano Zampini .seealso: PCBDDC
11033425bc38SStefano Zampini @*/
11043425bc38SStefano Zampini PetscErrorCode PCBDDCCreateFETIDPOperators(PC pc, Mat *fetidp_mat, PC *fetidp_pc)
11053425bc38SStefano Zampini {
11063425bc38SStefano Zampini   PetscErrorCode ierr;
11073425bc38SStefano Zampini 
11083425bc38SStefano Zampini   PetscFunctionBegin;
11093425bc38SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
11103425bc38SStefano Zampini   if (pc->setupcalled) {
11113425bc38SStefano Zampini     ierr = PetscTryMethod(pc,"PCBDDCCreateFETIDPOperators_C",(PC,Mat*,PC*),(pc,fetidp_mat,fetidp_pc));CHKERRQ(ierr);
11123425bc38SStefano Zampini   } else {
11133425bc38SStefano Zampini     SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"You must call PCSetup_BDDC before calling %s\n",__FUNCT__);
11143425bc38SStefano Zampini   }
11153425bc38SStefano Zampini   PetscFunctionReturn(0);
11163425bc38SStefano Zampini }
11170c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
1118da1bb401SStefano Zampini /*MC
1119da1bb401SStefano Zampini    PCBDDC - Balancing Domain Decomposition by Constraints.
11200c7d97c5SJed Brown 
1121da1bb401SStefano Zampini    Options Database Keys:
1122da1bb401SStefano Zampini .    -pcbddc ??? -
1123da1bb401SStefano Zampini 
1124da1bb401SStefano Zampini    Level: intermediate
1125da1bb401SStefano Zampini 
1126da1bb401SStefano Zampini    Notes: The matrix used with this preconditioner must be of type MATIS
1127da1bb401SStefano Zampini 
1128da1bb401SStefano Zampini           Unlike more 'conventional' interface preconditioners, this iterates over ALL the
1129da1bb401SStefano Zampini           degrees of freedom, NOT just those on the interface (this allows the use of approximate solvers
1130da1bb401SStefano Zampini           on the subdomains).
1131da1bb401SStefano Zampini 
1132da1bb401SStefano Zampini           Options for the coarse grid preconditioner can be set with -
1133da1bb401SStefano Zampini           Options for the Dirichlet subproblem can be set with -
1134da1bb401SStefano Zampini           Options for the Neumann subproblem can be set with -
1135da1bb401SStefano Zampini 
1136da1bb401SStefano Zampini    Contributed by Stefano Zampini
1137da1bb401SStefano Zampini 
1138da1bb401SStefano Zampini .seealso:  PCCreate(), PCSetType(), PCType (for list of available types), PC,  MATIS
1139da1bb401SStefano Zampini M*/
1140da1bb401SStefano Zampini EXTERN_C_BEGIN
1141da1bb401SStefano Zampini #undef __FUNCT__
1142da1bb401SStefano Zampini #define __FUNCT__ "PCCreate_BDDC"
1143da1bb401SStefano Zampini PetscErrorCode PCCreate_BDDC(PC pc)
1144da1bb401SStefano Zampini {
1145da1bb401SStefano Zampini   PetscErrorCode ierr;
1146da1bb401SStefano Zampini   PC_BDDC        *pcbddc;
1147da1bb401SStefano Zampini   PCBDDCGraph    mat_graph;
1148da1bb401SStefano Zampini 
1149da1bb401SStefano Zampini   PetscFunctionBegin;
1150da1bb401SStefano Zampini   /* Creates the private data structure for this preconditioner and attach it to the PC object. */
1151da1bb401SStefano Zampini   ierr      = PetscNewLog(pc,PC_BDDC,&pcbddc);CHKERRQ(ierr);
1152da1bb401SStefano Zampini   pc->data  = (void*)pcbddc;
1153da1bb401SStefano Zampini 
1154da1bb401SStefano Zampini   /* create PCIS data structure */
1155da1bb401SStefano Zampini   ierr = PCISCreate(pc);CHKERRQ(ierr);
1156da1bb401SStefano Zampini 
1157da1bb401SStefano Zampini   /* BDDC specific */
11580bdf917eSStefano Zampini   pcbddc->CoarseNullSpace            = 0;
11590bdf917eSStefano Zampini   pcbddc->NullSpace                  = 0;
11603972b0daSStefano Zampini   pcbddc->temp_solution              = 0;
1161534831adSStefano Zampini   pcbddc->original_rhs               = 0;
1162534831adSStefano Zampini   pcbddc->local_mat                  = 0;
1163534831adSStefano Zampini   pcbddc->ChangeOfBasisMatrix        = 0;
1164534831adSStefano Zampini   pcbddc->usechangeofbasis           = PETSC_TRUE;
1165534831adSStefano Zampini   pcbddc->usechangeonfaces           = PETSC_FALSE;
1166da1bb401SStefano Zampini   pcbddc->coarse_vec                 = 0;
1167da1bb401SStefano Zampini   pcbddc->coarse_rhs                 = 0;
1168da1bb401SStefano Zampini   pcbddc->coarse_ksp                 = 0;
1169da1bb401SStefano Zampini   pcbddc->coarse_phi_B               = 0;
1170da1bb401SStefano Zampini   pcbddc->coarse_phi_D               = 0;
1171da1bb401SStefano Zampini   pcbddc->vec1_P                     = 0;
1172da1bb401SStefano Zampini   pcbddc->vec1_R                     = 0;
1173da1bb401SStefano Zampini   pcbddc->vec2_R                     = 0;
1174da1bb401SStefano Zampini   pcbddc->local_auxmat1              = 0;
1175da1bb401SStefano Zampini   pcbddc->local_auxmat2              = 0;
1176da1bb401SStefano Zampini   pcbddc->R_to_B                     = 0;
1177da1bb401SStefano Zampini   pcbddc->R_to_D                     = 0;
1178da1bb401SStefano Zampini   pcbddc->ksp_D                      = 0;
1179da1bb401SStefano Zampini   pcbddc->ksp_R                      = 0;
1180da1bb401SStefano Zampini   pcbddc->local_primal_indices       = 0;
1181da1bb401SStefano Zampini   pcbddc->prec_type                  = PETSC_FALSE;
1182da1bb401SStefano Zampini   pcbddc->NeumannBoundaries          = 0;
1183da1bb401SStefano Zampini   pcbddc->ISForDofs                  = 0;
1184da1bb401SStefano Zampini   pcbddc->ISForVertices              = 0;
1185da1bb401SStefano Zampini   pcbddc->n_ISForFaces               = 0;
1186da1bb401SStefano Zampini   pcbddc->n_ISForEdges               = 0;
1187da1bb401SStefano Zampini   pcbddc->ConstraintMatrix           = 0;
1188da1bb401SStefano Zampini   pcbddc->use_nnsp_true              = PETSC_FALSE;
1189da1bb401SStefano Zampini   pcbddc->local_primal_sizes         = 0;
1190da1bb401SStefano Zampini   pcbddc->local_primal_displacements = 0;
1191da1bb401SStefano Zampini   pcbddc->replicated_local_primal_indices = 0;
1192da1bb401SStefano Zampini   pcbddc->replicated_local_primal_values  = 0;
1193da1bb401SStefano Zampini   pcbddc->coarse_loc_to_glob         = 0;
1194da1bb401SStefano Zampini   pcbddc->dbg_flag                   = PETSC_FALSE;
1195da1bb401SStefano Zampini   pcbddc->coarsening_ratio           = 8;
1196b76ba322SStefano Zampini   pcbddc->use_exact_dirichlet        = PETSC_TRUE;
11974fad6a16SStefano Zampini   pcbddc->current_level              = 0;
11984fad6a16SStefano Zampini   pcbddc->max_levels                 = 1;
1199da1bb401SStefano Zampini 
1200da1bb401SStefano Zampini   /* allocate and initialize needed graph structure */
1201da1bb401SStefano Zampini   ierr = PetscMalloc(sizeof(*mat_graph),&pcbddc->mat_graph);CHKERRQ(ierr);
1202da1bb401SStefano Zampini   pcbddc->mat_graph->xadj            = 0;
1203da1bb401SStefano Zampini   pcbddc->mat_graph->adjncy          = 0;
1204da1bb401SStefano Zampini 
1205da1bb401SStefano Zampini   /* function pointers */
1206da1bb401SStefano Zampini   pc->ops->apply               = PCApply_BDDC;
1207da1bb401SStefano Zampini   pc->ops->applytranspose      = 0;
1208da1bb401SStefano Zampini   pc->ops->setup               = PCSetUp_BDDC;
1209da1bb401SStefano Zampini   pc->ops->destroy             = PCDestroy_BDDC;
1210da1bb401SStefano Zampini   pc->ops->setfromoptions      = PCSetFromOptions_BDDC;
1211da1bb401SStefano Zampini   pc->ops->view                = 0;
1212da1bb401SStefano Zampini   pc->ops->applyrichardson     = 0;
1213da1bb401SStefano Zampini   pc->ops->applysymmetricleft  = 0;
1214da1bb401SStefano Zampini   pc->ops->applysymmetricright = 0;
1215534831adSStefano Zampini   pc->ops->presolve            = PCPreSolve_BDDC;
1216534831adSStefano Zampini   pc->ops->postsolve           = PCPostSolve_BDDC;
1217da1bb401SStefano Zampini 
1218da1bb401SStefano Zampini   /* composing function */
12194fad6a16SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseningRatio_C","PCBDDCSetCoarseningRatio_BDDC",
12204fad6a16SStefano Zampini                     PCBDDCSetCoarseningRatio_BDDC);CHKERRQ(ierr);
12214fad6a16SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetMaxLevels_C","PCBDDCSetMaxLevels_BDDC",
12224fad6a16SStefano Zampini                     PCBDDCSetMaxLevels_BDDC);CHKERRQ(ierr);
12230bdf917eSStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNullSpace_C","PCBDDCSetNullSpace_BDDC",
12240bdf917eSStefano Zampini                     PCBDDCSetNullSpace_BDDC);CHKERRQ(ierr);
1225da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDirichletBoundaries_C","PCBDDCSetDirichletBoundaries_BDDC",
1226da1bb401SStefano Zampini                     PCBDDCSetDirichletBoundaries_BDDC);CHKERRQ(ierr);
1227da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNeumannBoundaries_C","PCBDDCSetNeumannBoundaries_BDDC",
1228da1bb401SStefano Zampini                     PCBDDCSetNeumannBoundaries_BDDC);CHKERRQ(ierr);
1229da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetDirichletBoundaries_C","PCBDDCGetDirichletBoundaries_BDDC",
1230da1bb401SStefano Zampini                     PCBDDCGetDirichletBoundaries_BDDC);CHKERRQ(ierr);
1231da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetNeumannBoundaries_C","PCBDDCGetNeumannBoundaries_BDDC",
1232da1bb401SStefano Zampini                     PCBDDCGetNeumannBoundaries_BDDC);CHKERRQ(ierr);
1233da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseProblemType_C","PCBDDCSetCoarseProblemType_BDDC",
1234da1bb401SStefano Zampini                     PCBDDCSetCoarseProblemType_BDDC);CHKERRQ(ierr);
1235da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDofsSplitting_C","PCBDDCSetDofsSplitting_BDDC",
1236da1bb401SStefano Zampini                     PCBDDCSetDofsSplitting_BDDC);CHKERRQ(ierr);
1237da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetLocalAdjacencyGraph_C","PCBDDCSetLocalAdjacencyGraph_BDDC",
1238da1bb401SStefano Zampini                     PCBDDCSetLocalAdjacencyGraph_BDDC);CHKERRQ(ierr);
1239534831adSStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPreSolve_C","PCPreSolve_BDDC",
1240534831adSStefano Zampini                     PCPreSolve_BDDC);CHKERRQ(ierr);
1241534831adSStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPostSolve_C","PCPostSolve_BDDC",
1242534831adSStefano Zampini                     PCPostSolve_BDDC);CHKERRQ(ierr);
12433425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCCreateFETIDPOperators_C","PCBDDCCreateFETIDPOperators_BDDC",
12443425bc38SStefano Zampini                     PCBDDCCreateFETIDPOperators_BDDC);CHKERRQ(ierr);
12453425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetRHS_C","PCBDDCMatFETIDPGetRHS_BDDC",
12463425bc38SStefano Zampini                     PCBDDCMatFETIDPGetRHS_BDDC);CHKERRQ(ierr);
12473425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetSolution_C","PCBDDCMatFETIDPGetSolution_BDDC",
12483425bc38SStefano Zampini                     PCBDDCMatFETIDPGetSolution_BDDC);CHKERRQ(ierr);
1249da1bb401SStefano Zampini   PetscFunctionReturn(0);
1250da1bb401SStefano Zampini }
1251da1bb401SStefano Zampini EXTERN_C_END
12523425bc38SStefano Zampini 
1253da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
1254da1bb401SStefano Zampini /* All static functions from now on                                           */
1255da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
12564fad6a16SStefano Zampini #undef __FUNCT__
12572e8d2280SStefano Zampini #define __FUNCT__ "PCBDDCSetUseExactDirichlet"
12582e8d2280SStefano Zampini static PetscErrorCode PCBDDCSetUseExactDirichlet(PC pc,PetscBool use)
12592e8d2280SStefano Zampini {
12602e8d2280SStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
12612e8d2280SStefano Zampini 
12622e8d2280SStefano Zampini   PetscFunctionBegin;
12632e8d2280SStefano Zampini   pcbddc->use_exact_dirichlet=use;
12642e8d2280SStefano Zampini   PetscFunctionReturn(0);
12652e8d2280SStefano Zampini }
12662e8d2280SStefano Zampini 
12672e8d2280SStefano Zampini #undef __FUNCT__
12684fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetLevel"
12694fad6a16SStefano Zampini static PetscErrorCode PCBDDCSetLevel(PC pc,PetscInt level)
12704fad6a16SStefano Zampini {
12714fad6a16SStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
12724fad6a16SStefano Zampini 
12734fad6a16SStefano Zampini   PetscFunctionBegin;
12744fad6a16SStefano Zampini   pcbddc->current_level=level;
12754fad6a16SStefano Zampini   PetscFunctionReturn(0);
12764fad6a16SStefano Zampini }
12773425bc38SStefano Zampini 
12783425bc38SStefano Zampini #undef __FUNCT__
12790bdf917eSStefano Zampini #define __FUNCT__ "PCBDDCAdaptNullSpace"
12800bdf917eSStefano Zampini static PetscErrorCode PCBDDCAdaptNullSpace(PC pc)
12810bdf917eSStefano Zampini {
12820bdf917eSStefano Zampini   PC_IS*         pcis = (PC_IS*)  (pc->data);
12830bdf917eSStefano Zampini   PC_BDDC*       pcbddc = (PC_BDDC*)(pc->data);
12840bdf917eSStefano Zampini   KSP            inv_change;
12850bdf917eSStefano Zampini   PC             pc_change;
12860bdf917eSStefano Zampini   const Vec      *nsp_vecs;
12870bdf917eSStefano Zampini   Vec            *new_nsp_vecs;
12880bdf917eSStefano Zampini   PetscInt       i,nsp_size,new_nsp_size,start_new;
12890bdf917eSStefano Zampini   PetscBool      nsp_has_cnst;
12900bdf917eSStefano Zampini   MatNullSpace   new_nsp;
12910bdf917eSStefano Zampini   PetscErrorCode ierr;
12920bdf917eSStefano Zampini 
12930bdf917eSStefano Zampini   PetscFunctionBegin;
12940bdf917eSStefano Zampini   ierr = MatNullSpaceGetVecs(pcbddc->NullSpace,&nsp_has_cnst,&nsp_size,&nsp_vecs);CHKERRQ(ierr);
12950bdf917eSStefano Zampini   ierr = KSPCreate(PETSC_COMM_SELF,&inv_change);CHKERRQ(ierr);
12960bdf917eSStefano Zampini   ierr = KSPSetOperators(inv_change,pcbddc->ChangeOfBasisMatrix,pcbddc->ChangeOfBasisMatrix,SAME_PRECONDITIONER);CHKERRQ(ierr);
12970bdf917eSStefano Zampini   ierr = KSPSetType(inv_change,KSPPREONLY);CHKERRQ(ierr);
12980bdf917eSStefano Zampini   ierr = KSPGetPC(inv_change,&pc_change);CHKERRQ(ierr);
12990bdf917eSStefano Zampini   ierr = PCSetType(pc_change,PCLU);CHKERRQ(ierr);
13000bdf917eSStefano Zampini   ierr = KSPSetUp(inv_change);CHKERRQ(ierr);
13010bdf917eSStefano Zampini   new_nsp_size = nsp_size;
13020bdf917eSStefano Zampini   if (nsp_has_cnst) { new_nsp_size++; }
13030bdf917eSStefano Zampini   ierr = PetscMalloc(new_nsp_size*sizeof(Vec),&new_nsp_vecs);CHKERRQ(ierr);
13040bdf917eSStefano Zampini   for (i=0;i<new_nsp_size;i++) { ierr = VecDuplicate(pcis->vec1_global,&new_nsp_vecs[i]);CHKERRQ(ierr); }
13050bdf917eSStefano Zampini   start_new = 0;
13060bdf917eSStefano Zampini   if (nsp_has_cnst) {
13070bdf917eSStefano Zampini     start_new = 1;
13080bdf917eSStefano Zampini     ierr = VecSet(new_nsp_vecs[0],1.0);CHKERRQ(ierr);
13090bdf917eSStefano Zampini     ierr = VecSet(pcis->vec1_B,1.0);CHKERRQ(ierr);
13100bdf917eSStefano Zampini     ierr = KSPSolve(inv_change,pcis->vec1_B,pcis->vec1_B);
13110bdf917eSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,new_nsp_vecs[0],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
13120bdf917eSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,new_nsp_vecs[0],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
13130bdf917eSStefano Zampini   }
13140bdf917eSStefano Zampini   for (i=0;i<nsp_size;i++) {
13150bdf917eSStefano Zampini     ierr = VecCopy(nsp_vecs[i],new_nsp_vecs[i+start_new]);CHKERRQ(ierr);
13160bdf917eSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,nsp_vecs[i],pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
13170bdf917eSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,nsp_vecs[i],pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
13180bdf917eSStefano Zampini     ierr = KSPSolve(inv_change,pcis->vec1_B,pcis->vec1_B);
13190bdf917eSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,new_nsp_vecs[i+start_new],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
13200bdf917eSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,new_nsp_vecs[i+start_new],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
13210bdf917eSStefano Zampini   }
13220bdf917eSStefano Zampini   ierr = VecNormalize(new_nsp_vecs[0],PETSC_NULL);CHKERRQ(ierr);
13230bdf917eSStefano Zampini   /* TODO : Orthonormalize vecs when new_nsp_size > 0! */
13240bdf917eSStefano Zampini 
13250bdf917eSStefano Zampini   /*PetscBool nsp_t=PETSC_FALSE;
13260bdf917eSStefano Zampini   ierr = MatNullSpaceTest(pcbddc->NullSpace,pc->pmat,&nsp_t);CHKERRQ(ierr);
13270bdf917eSStefano Zampini   printf("Original Null Space test: %d\n",nsp_t);
13280bdf917eSStefano Zampini   Mat temp_mat;
13290bdf917eSStefano Zampini   Mat_IS* matis = (Mat_IS*)pc->pmat->data;
13300bdf917eSStefano Zampini     temp_mat = matis->A;
13310bdf917eSStefano Zampini     matis->A = pcbddc->local_mat;
13320bdf917eSStefano Zampini     pcbddc->local_mat = temp_mat;
13330bdf917eSStefano Zampini   ierr = MatNullSpaceTest(pcbddc->NullSpace,pc->pmat,&nsp_t);CHKERRQ(ierr);
13340bdf917eSStefano Zampini   printf("Original Null Space, mat changed test: %d\n",nsp_t);
13350bdf917eSStefano Zampini   {
13360bdf917eSStefano Zampini     PetscReal test_norm;
13370bdf917eSStefano Zampini     for (i=0;i<new_nsp_size;i++) {
13380bdf917eSStefano Zampini       ierr = MatMult(pc->pmat,new_nsp_vecs[i],pcis->vec1_global);CHKERRQ(ierr);
13390bdf917eSStefano Zampini       ierr = VecNorm(pcis->vec1_global,NORM_2,&test_norm);CHKERRQ(ierr);
13400bdf917eSStefano Zampini       if (test_norm > 1.e-12) {
13410bdf917eSStefano Zampini         printf("------------ERROR VEC %d------------------\n",i);
13420bdf917eSStefano Zampini         ierr = VecView(pcis->vec1_global,PETSC_VIEWER_STDOUT_WORLD);
13430bdf917eSStefano Zampini         printf("------------------------------------------\n");
13440bdf917eSStefano Zampini       }
13450bdf917eSStefano Zampini     }
13460bdf917eSStefano Zampini   }*/
13470bdf917eSStefano Zampini 
13480bdf917eSStefano Zampini   ierr = KSPDestroy(&inv_change);CHKERRQ(ierr);
13490bdf917eSStefano Zampini   ierr = MatNullSpaceCreate(((PetscObject)pc)->comm,PETSC_FALSE,new_nsp_size,new_nsp_vecs,&new_nsp);CHKERRQ(ierr);
13500bdf917eSStefano Zampini   ierr = PCBDDCSetNullSpace(pc,new_nsp);CHKERRQ(ierr);
13510bdf917eSStefano Zampini   ierr = MatNullSpaceDestroy(&new_nsp);CHKERRQ(ierr);
13520bdf917eSStefano Zampini   /*
13530bdf917eSStefano Zampini   ierr = MatNullSpaceTest(pcbddc->NullSpace,pc->pmat,&nsp_t);CHKERRQ(ierr);
13540bdf917eSStefano Zampini   printf("New Null Space, mat changed: %d\n",nsp_t);
13550bdf917eSStefano Zampini     temp_mat = matis->A;
13560bdf917eSStefano Zampini     matis->A = pcbddc->local_mat;
13570bdf917eSStefano Zampini     pcbddc->local_mat = temp_mat;
13580bdf917eSStefano Zampini   ierr = MatNullSpaceTest(pcbddc->NullSpace,pc->pmat,&nsp_t);CHKERRQ(ierr);
13590bdf917eSStefano Zampini   printf("New Null Space, mat original: %d\n",nsp_t);*/
13600bdf917eSStefano Zampini 
13610bdf917eSStefano Zampini   for (i=0;i<new_nsp_size;i++) { ierr = VecDestroy(&new_nsp_vecs[i]);CHKERRQ(ierr); }
13620bdf917eSStefano Zampini   ierr = PetscFree(new_nsp_vecs);CHKERRQ(ierr);
13630bdf917eSStefano Zampini   PetscFunctionReturn(0);
13640bdf917eSStefano Zampini }
13650bdf917eSStefano Zampini 
13660bdf917eSStefano Zampini #undef __FUNCT__
13673425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPMatContext"
13683425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPMatContext(PC pc, FETIDPMat_ctx **fetidpmat_ctx)
13693425bc38SStefano Zampini {
13703425bc38SStefano Zampini   FETIDPMat_ctx  *newctx;
13713425bc38SStefano Zampini   PetscErrorCode ierr;
13723425bc38SStefano Zampini 
13733425bc38SStefano Zampini   PetscFunctionBegin;
13743425bc38SStefano Zampini   ierr = PetscMalloc(sizeof(*newctx),&newctx);CHKERRQ(ierr);
13753425bc38SStefano Zampini   newctx->lambda_local    = 0;
13763425bc38SStefano Zampini   newctx->temp_solution_B = 0;
13773425bc38SStefano Zampini   newctx->temp_solution_D = 0;
13783425bc38SStefano Zampini   newctx->B_delta         = 0;
13793425bc38SStefano Zampini   newctx->B_Ddelta        = 0; /* theoretically belongs to the FETIDP preconditioner */
13803425bc38SStefano Zampini   newctx->l2g_lambda      = 0;
13813425bc38SStefano Zampini   /* increase the reference count for BDDC preconditioner */
13823425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)pc);CHKERRQ(ierr);
13833425bc38SStefano Zampini   newctx->pc              = pc;
13843425bc38SStefano Zampini   *fetidpmat_ctx          = newctx;
13853425bc38SStefano Zampini   PetscFunctionReturn(0);
13863425bc38SStefano Zampini }
13873425bc38SStefano Zampini 
13883425bc38SStefano Zampini #undef __FUNCT__
13893425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPPCContext"
13903425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPPCContext(PC pc, FETIDPPC_ctx **fetidppc_ctx)
13913425bc38SStefano Zampini {
13923425bc38SStefano Zampini   FETIDPPC_ctx  *newctx;
13933425bc38SStefano Zampini   PetscErrorCode ierr;
13943425bc38SStefano Zampini 
13953425bc38SStefano Zampini   PetscFunctionBegin;
13963425bc38SStefano Zampini   ierr = PetscMalloc(sizeof(*newctx),&newctx);CHKERRQ(ierr);
13973425bc38SStefano Zampini   newctx->lambda_local    = 0;
13983425bc38SStefano Zampini   newctx->B_Ddelta        = 0;
13993425bc38SStefano Zampini   newctx->l2g_lambda      = 0;
14003425bc38SStefano Zampini   /* increase the reference count for BDDC preconditioner */
14013425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)pc);CHKERRQ(ierr);
14023425bc38SStefano Zampini   newctx->pc              = pc;
14033425bc38SStefano Zampini   *fetidppc_ctx           = newctx;
14043425bc38SStefano Zampini   PetscFunctionReturn(0);
14053425bc38SStefano Zampini }
14063425bc38SStefano Zampini 
14073425bc38SStefano Zampini #undef __FUNCT__
14083425bc38SStefano Zampini #define __FUNCT__ "PCBDDCDestroyFETIDPMat"
14093425bc38SStefano Zampini static PetscErrorCode PCBDDCDestroyFETIDPMat(Mat A)
14103425bc38SStefano Zampini {
14113425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
14123425bc38SStefano Zampini   PetscErrorCode ierr;
14133425bc38SStefano Zampini 
14143425bc38SStefano Zampini   PetscFunctionBegin;
14153425bc38SStefano Zampini   ierr = MatShellGetContext(A,(void**)&mat_ctx);CHKERRQ(ierr);
14163425bc38SStefano Zampini   ierr = VecDestroy(&mat_ctx->lambda_local);CHKERRQ(ierr);
14173425bc38SStefano Zampini   ierr = VecDestroy(&mat_ctx->temp_solution_D);CHKERRQ(ierr);
14183425bc38SStefano Zampini   ierr = VecDestroy(&mat_ctx->temp_solution_B);CHKERRQ(ierr);
14193425bc38SStefano Zampini   ierr = MatDestroy(&mat_ctx->B_delta);CHKERRQ(ierr);
14203425bc38SStefano Zampini   ierr = MatDestroy(&mat_ctx->B_Ddelta);CHKERRQ(ierr);
14213425bc38SStefano Zampini   ierr = VecScatterDestroy(&mat_ctx->l2g_lambda);CHKERRQ(ierr);
14223425bc38SStefano Zampini   ierr = PCDestroy(&mat_ctx->pc);CHKERRQ(ierr); /* actually it does not destroy BDDC, only decrease its reference count */
14233425bc38SStefano Zampini   ierr = PetscFree(mat_ctx);CHKERRQ(ierr);
14243425bc38SStefano Zampini   PetscFunctionReturn(0);
14253425bc38SStefano Zampini }
14263425bc38SStefano Zampini 
14273425bc38SStefano Zampini #undef __FUNCT__
14283425bc38SStefano Zampini #define __FUNCT__ "PCBDDCDestroyFETIDPPC"
14293425bc38SStefano Zampini static PetscErrorCode PCBDDCDestroyFETIDPPC(PC pc)
14303425bc38SStefano Zampini {
14313425bc38SStefano Zampini   FETIDPPC_ctx  *pc_ctx;
14323425bc38SStefano Zampini   PetscErrorCode ierr;
14333425bc38SStefano Zampini 
14343425bc38SStefano Zampini   PetscFunctionBegin;
14353425bc38SStefano Zampini   ierr = PCShellGetContext(pc,(void**)&pc_ctx);CHKERRQ(ierr);
14363425bc38SStefano Zampini   ierr = VecDestroy(&pc_ctx->lambda_local);CHKERRQ(ierr);
14373425bc38SStefano Zampini   ierr = MatDestroy(&pc_ctx->B_Ddelta);CHKERRQ(ierr);
14383425bc38SStefano Zampini   ierr = VecScatterDestroy(&pc_ctx->l2g_lambda);CHKERRQ(ierr);
14393425bc38SStefano Zampini   ierr = PCDestroy(&pc_ctx->pc);CHKERRQ(ierr); /* actually it does not destroy BDDC, only decrease its reference count */
14403425bc38SStefano Zampini   ierr = PetscFree(pc_ctx);CHKERRQ(ierr);
14413425bc38SStefano Zampini   PetscFunctionReturn(0);
14423425bc38SStefano Zampini }
14433425bc38SStefano Zampini 
14443425bc38SStefano Zampini #undef __FUNCT__
14453425bc38SStefano Zampini #define __FUNCT__ "PCBDDCSetupFETIDPMatContext"
14463425bc38SStefano Zampini static PetscErrorCode PCBDDCSetupFETIDPMatContext(FETIDPMat_ctx *fetidpmat_ctx )
14473425bc38SStefano Zampini {
14483425bc38SStefano Zampini   PetscErrorCode ierr;
14493425bc38SStefano Zampini   PC_IS          *pcis=(PC_IS*)fetidpmat_ctx->pc->data;
14503425bc38SStefano Zampini   PC_BDDC        *pcbddc=(PC_BDDC*)fetidpmat_ctx->pc->data;
14513425bc38SStefano Zampini   PCBDDCGraph    mat_graph=pcbddc->mat_graph;
14523425bc38SStefano Zampini   Mat_IS         *matis  = (Mat_IS*)fetidpmat_ctx->pc->pmat->data;
14533425bc38SStefano Zampini   MPI_Comm       comm = ((PetscObject)(fetidpmat_ctx->pc))->comm;
14543425bc38SStefano Zampini 
14553425bc38SStefano Zampini   Mat            ScalingMat;
14563425bc38SStefano Zampini   Vec            lambda_global;
14573425bc38SStefano Zampini   IS             IS_l2g_lambda;
14583425bc38SStefano Zampini 
14593425bc38SStefano Zampini   PetscBool      skip_node,fully_redundant;
1460ef028eecSStefano Zampini   PetscInt       i,j,k,s,n_boundary_dofs,n_global_lambda,n_vertices,partial_sum;
14613425bc38SStefano Zampini   PetscInt       n_local_lambda,n_lambda_for_dof,dual_size,n_neg_values,n_pos_values;
1462ef028eecSStefano Zampini   PetscMPIInt    rank,nprocs;
14633425bc38SStefano Zampini   PetscScalar    scalar_value;
14643425bc38SStefano Zampini 
14653425bc38SStefano Zampini   PetscInt       *vertex_indices,*temp_indices;
14663425bc38SStefano Zampini   PetscInt       *dual_dofs_boundary_indices,*aux_local_numbering_1,*aux_global_numbering;
14673425bc38SStefano Zampini   PetscInt       *aux_sums,*cols_B_delta,*l2g_indices;
14683425bc38SStefano Zampini   PetscScalar    *array,*scaling_factors,*vals_B_delta;
1469ef028eecSStefano Zampini   PetscInt       *aux_local_numbering_2,*dof_sizes,*dof_displs;
1470ef028eecSStefano Zampini   PetscInt       first_index,old_index;
1471ef028eecSStefano Zampini   PetscBool      first_found = PETSC_FALSE;
14723425bc38SStefano Zampini 
14733425bc38SStefano Zampini   /* For communication of scaling factors */
14743425bc38SStefano Zampini   PetscInt       *ptrs_buffer,neigh_position;
14753425bc38SStefano Zampini   PetscScalar    **all_factors,*send_buffer,*recv_buffer;
14763425bc38SStefano Zampini   MPI_Request    *send_reqs,*recv_reqs;
14773425bc38SStefano Zampini 
14783425bc38SStefano Zampini   /* tests */
14793425bc38SStefano Zampini   Vec            test_vec;
14803425bc38SStefano Zampini   PetscBool      test_fetidp;
14813425bc38SStefano Zampini   PetscViewer    viewer;
14823425bc38SStefano Zampini 
14833425bc38SStefano Zampini   PetscFunctionBegin;
14843425bc38SStefano Zampini   ierr = MPI_Comm_rank(comm,&rank);CHKERRQ(ierr);
14853425bc38SStefano Zampini   ierr = MPI_Comm_size(comm,&nprocs);CHKERRQ(ierr);
14863425bc38SStefano Zampini 
14873425bc38SStefano Zampini   /* Default type of lagrange multipliers is non-redundant */
14883425bc38SStefano Zampini   fully_redundant = PETSC_FALSE;
14893425bc38SStefano Zampini   ierr = PetscOptionsGetBool(PETSC_NULL,"-fetidp_fullyredundant",&fully_redundant,PETSC_NULL);CHKERRQ(ierr);
14903425bc38SStefano Zampini 
14913425bc38SStefano Zampini   /* Evaluate local and global number of lagrange multipliers */
14923425bc38SStefano Zampini   ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
14933425bc38SStefano Zampini   n_local_lambda = 0;
14943425bc38SStefano Zampini   partial_sum = 0;
14953425bc38SStefano Zampini   n_boundary_dofs = 0;
14963425bc38SStefano Zampini   s = 0;
14973425bc38SStefano Zampini   n_vertices = 0;
14983425bc38SStefano Zampini   /* Get Vertices used to define the BDDC */
14993425bc38SStefano Zampini   ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(*vertex_indices),&vertex_indices);CHKERRQ(ierr);
15003425bc38SStefano Zampini   for (i=0;i<pcbddc->local_primal_size;i++) {
15013425bc38SStefano Zampini     ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&j,(const PetscInt**)&temp_indices,PETSC_NULL);CHKERRQ(ierr);
15023425bc38SStefano Zampini     if (j == 1) {
15033425bc38SStefano Zampini       vertex_indices[n_vertices]=temp_indices[0];
15043425bc38SStefano Zampini       n_vertices++;
15053425bc38SStefano Zampini     }
15063425bc38SStefano Zampini     ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&j,(const PetscInt**)&temp_indices,PETSC_NULL);CHKERRQ(ierr);
15073425bc38SStefano Zampini   }
15083425bc38SStefano Zampini   dual_size = pcis->n_B-n_vertices;
1509f0474715SStefano Zampini   ierr = PetscSortInt(n_vertices,vertex_indices);CHKERRQ(ierr);
15103425bc38SStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*dual_dofs_boundary_indices),&dual_dofs_boundary_indices);CHKERRQ(ierr);
15113425bc38SStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*aux_local_numbering_1),&aux_local_numbering_1);CHKERRQ(ierr);
15123425bc38SStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*aux_local_numbering_2),&aux_local_numbering_2);CHKERRQ(ierr);
15133425bc38SStefano Zampini 
15143425bc38SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
15153425bc38SStefano Zampini   for (i=0;i<pcis->n;i++){
15163425bc38SStefano Zampini     j = mat_graph->count[i]; /* RECALL: mat_graph->count[i] does not count myself */
1517c6582918SStefano Zampini     k = 0;
1518c6582918SStefano Zampini     if (j > 0) {
15193425bc38SStefano Zampini       k = (mat_graph->neighbours_set[i][0] == -1 ?  1 : 0);
1520c6582918SStefano Zampini     }
15213425bc38SStefano Zampini     j = j - k ;
15223425bc38SStefano Zampini     if ( j > 0 ) { n_boundary_dofs++; }
15233425bc38SStefano Zampini 
15243425bc38SStefano Zampini     skip_node = PETSC_FALSE;
1525c6582918SStefano Zampini     if ( s < n_vertices && vertex_indices[s]==i) { /* it works for a sorted set of vertices */
15263425bc38SStefano Zampini       skip_node = PETSC_TRUE;
15273425bc38SStefano Zampini       s++;
15283425bc38SStefano Zampini     }
15293425bc38SStefano Zampini     if (j < 1) {skip_node = PETSC_TRUE;}
15303425bc38SStefano Zampini     if ( !skip_node ) {
15313425bc38SStefano Zampini       if (fully_redundant) {
15323425bc38SStefano Zampini         /* fully redundant set of lagrange multipliers */
15333425bc38SStefano Zampini         n_lambda_for_dof = (j*(j+1))/2;
15343425bc38SStefano Zampini       } else {
15353425bc38SStefano Zampini         n_lambda_for_dof = j;
15363425bc38SStefano Zampini       }
15373425bc38SStefano Zampini       n_local_lambda += j;
15383425bc38SStefano Zampini       /* needed to evaluate global number of lagrange multipliers */
15393425bc38SStefano Zampini       array[i]=(1.0*n_lambda_for_dof)/(j+1.0); /* already scaled for the next global sum */
15403425bc38SStefano Zampini       /* store some data needed */
15413425bc38SStefano Zampini       dual_dofs_boundary_indices[partial_sum] = n_boundary_dofs-1;
15423425bc38SStefano Zampini       aux_local_numbering_1[partial_sum] = i;
1543ef028eecSStefano Zampini       aux_local_numbering_2[partial_sum] = n_lambda_for_dof;
15443425bc38SStefano Zampini       partial_sum++;
15453425bc38SStefano Zampini     }
15463425bc38SStefano Zampini   }
15473425bc38SStefano Zampini   /*printf("I found %d local lambda dofs\n",n_local_lambda);
15483425bc38SStefano Zampini   printf("I found %d boundary dofs (should be %d)\n",n_boundary_dofs,pcis->n_B);
15493425bc38SStefano Zampini   printf("Partial sum %d should be %d\n",partial_sum,dual_size);*/
15503425bc38SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1551ef028eecSStefano Zampini 
15523425bc38SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
15533425bc38SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
15543425bc38SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
15553425bc38SStefano Zampini   ierr = VecSum(pcis->vec1_global,&scalar_value);CHKERRQ(ierr);
15563425bc38SStefano Zampini   fetidpmat_ctx->n_lambda = (PetscInt) scalar_value;
15573425bc38SStefano Zampini   /* printf("I found %d global multipliers (%f)\n",fetidpmat_ctx->n_lambda,scalar_value); */
15583425bc38SStefano Zampini 
15593425bc38SStefano Zampini   /* compute global ordering of lagrange multipliers and associate l2g map */
1560ef028eecSStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
1561ef028eecSStefano Zampini   ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
1562ef028eecSStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1563ef028eecSStefano Zampini   for (i=0;i<dual_size;i++) {
1564ef028eecSStefano Zampini     array[aux_local_numbering_1[i]] = aux_local_numbering_2[i];
1565ef028eecSStefano Zampini   }
1566ef028eecSStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1567ef028eecSStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
1568ef028eecSStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
1569ef028eecSStefano Zampini   ierr = VecSum(pcis->vec1_global,&scalar_value);CHKERRQ(ierr);
1570ef028eecSStefano Zampini   if (pcbddc->dbg_flag && (PetscInt)scalar_value != fetidpmat_ctx->n_lambda) {
1571ef028eecSStefano Zampini     SETERRQ3(PETSC_COMM_WORLD,PETSC_ERR_PLIB,"Error in %s: global number of multipliers mismatch! (%d!=%d)\n",__FUNCT__,(PetscInt)scalar_value,fetidpmat_ctx->n_lambda);
1572ef028eecSStefano Zampini   }
15733425bc38SStefano Zampini 
1574ef028eecSStefano Zampini   /* Fill pcis->vec1_global with cumulative function for global numbering */
1575ef028eecSStefano Zampini   ierr = VecGetArray(pcis->vec1_global,&array);CHKERRQ(ierr);
1576ef028eecSStefano Zampini   ierr = VecGetLocalSize(pcis->vec1_global,&s);CHKERRQ(ierr);
1577ef028eecSStefano Zampini   k = 0;
1578ef028eecSStefano Zampini   first_index = -1;
1579ef028eecSStefano Zampini   for (i=0;i<s;i++) {
1580ef028eecSStefano Zampini     if (!first_found && array[i] > 0.0) {
1581ef028eecSStefano Zampini       first_found = PETSC_TRUE;
1582ef028eecSStefano Zampini       first_index = i;
1583ef028eecSStefano Zampini     }
1584ef028eecSStefano Zampini     k += (PetscInt)array[i];
1585ef028eecSStefano Zampini   }
1586ef028eecSStefano Zampini   j = ( !rank ? nprocs : 0);
15873425bc38SStefano Zampini   ierr = PetscMalloc(j*sizeof(*dof_sizes),&dof_sizes);CHKERRQ(ierr);
15883425bc38SStefano Zampini   ierr = PetscMalloc(j*sizeof(*dof_displs),&dof_displs);CHKERRQ(ierr);
1589ef028eecSStefano Zampini   ierr = MPI_Gather(&k,1,MPIU_INT,dof_sizes,1,MPIU_INT,0,comm);CHKERRQ(ierr);
1590ef028eecSStefano Zampini   if (!rank) {
15913425bc38SStefano Zampini     dof_displs[0]=0;
15923425bc38SStefano Zampini     for (i=1;i<nprocs;i++) {
15933425bc38SStefano Zampini       dof_displs[i] = dof_displs[i-1]+dof_sizes[i-1];
15943425bc38SStefano Zampini     }
15953425bc38SStefano Zampini   }
1596ef028eecSStefano Zampini   ierr = MPI_Scatter(dof_displs,1,MPIU_INT,&k,1,MPIU_INT,0,comm);CHKERRQ(ierr);
1597ef028eecSStefano Zampini   if (first_found) {
1598ef028eecSStefano Zampini     array[first_index] += k;
1599ef028eecSStefano Zampini     old_index = first_index;
1600ef028eecSStefano Zampini     for (i=first_index+1;i<s;i++) {
1601ef028eecSStefano Zampini       if (array[i] > 0.0) {
1602ef028eecSStefano Zampini         array[i] += array[old_index];
1603ef028eecSStefano Zampini         old_index = i;
1604ef028eecSStefano Zampini       }
1605ef028eecSStefano Zampini     }
1606ef028eecSStefano Zampini   }
1607ef028eecSStefano Zampini   ierr = VecRestoreArray(pcis->vec1_global,&array);CHKERRQ(ierr);
1608ef028eecSStefano Zampini   ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
1609ef028eecSStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1610ef028eecSStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1611ef028eecSStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*aux_global_numbering),&aux_global_numbering);CHKERRQ(ierr);
1612ef028eecSStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
16133425bc38SStefano Zampini   for (i=0;i<dual_size;i++) {
1614ef028eecSStefano Zampini     aux_global_numbering[i] = (PetscInt)array[aux_local_numbering_1[i]]-aux_local_numbering_2[i];
16153425bc38SStefano Zampini   }
1616ef028eecSStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1617f0474715SStefano Zampini   ierr = PetscFree(aux_local_numbering_2);CHKERRQ(ierr);
1618f0474715SStefano Zampini   ierr = PetscFree(dof_displs);CHKERRQ(ierr);
1619f0474715SStefano Zampini   ierr = PetscFree(dof_sizes);CHKERRQ(ierr);
16203425bc38SStefano Zampini 
16213425bc38SStefano Zampini   /* init data for scaling factors exchange */
16223425bc38SStefano Zampini   partial_sum = 0;
16233425bc38SStefano Zampini   j = 0;
16243425bc38SStefano Zampini   ierr = PetscMalloc(pcis->n_neigh*sizeof(PetscInt),&ptrs_buffer);CHKERRQ(ierr);
16253425bc38SStefano Zampini   ierr = PetscMalloc((pcis->n_neigh-1)*sizeof(MPI_Request),&send_reqs);CHKERRQ(ierr);
16263425bc38SStefano Zampini   ierr = PetscMalloc((pcis->n_neigh-1)*sizeof(MPI_Request),&recv_reqs);CHKERRQ(ierr);
16273425bc38SStefano Zampini   ierr = PetscMalloc(pcis->n*sizeof(PetscScalar*),&all_factors);CHKERRQ(ierr);
16283425bc38SStefano Zampini   ptrs_buffer[0]=0;
16293425bc38SStefano Zampini   for (i=1;i<pcis->n_neigh;i++) {
16303425bc38SStefano Zampini     partial_sum += pcis->n_shared[i];
16313425bc38SStefano Zampini     ptrs_buffer[i] = ptrs_buffer[i-1]+pcis->n_shared[i];
16323425bc38SStefano Zampini   }
16333425bc38SStefano Zampini   ierr = PetscMalloc( partial_sum*sizeof(PetscScalar),&send_buffer);CHKERRQ(ierr);
16343425bc38SStefano Zampini   ierr = PetscMalloc( partial_sum*sizeof(PetscScalar),&recv_buffer);CHKERRQ(ierr);
16353425bc38SStefano Zampini   ierr = PetscMalloc( partial_sum*sizeof(PetscScalar),&all_factors[0]);CHKERRQ(ierr);
16363425bc38SStefano Zampini   for (i=0;i<pcis->n-1;i++) {
16373425bc38SStefano Zampini     j = mat_graph->count[i];
16383425bc38SStefano Zampini     if (j>0) {
16393425bc38SStefano Zampini       k = (mat_graph->neighbours_set[i][0] == -1 ?  1 : 0);
16403425bc38SStefano Zampini       j = j - k;
16413425bc38SStefano Zampini     }
16423425bc38SStefano Zampini     all_factors[i+1]=all_factors[i]+j;
16433425bc38SStefano Zampini   }
16443425bc38SStefano Zampini   /* scatter B scaling to N vec */
16453425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->N_to_B,pcis->D,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
16463425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->N_to_B,pcis->D,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
16473425bc38SStefano Zampini   /* communications */
16483425bc38SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
16493425bc38SStefano Zampini   for (i=1;i<pcis->n_neigh;i++) {
16503425bc38SStefano Zampini     for (j=0;j<pcis->n_shared[i];j++) {
16513425bc38SStefano Zampini       send_buffer[ptrs_buffer[i-1]+j]=array[pcis->shared[i][j]];
16523425bc38SStefano Zampini     }
16533425bc38SStefano Zampini     j = ptrs_buffer[i]-ptrs_buffer[i-1];
1654ea7e1babSStefano Zampini     ierr = MPI_Isend(&send_buffer[ptrs_buffer[i-1]],j,MPIU_SCALAR,pcis->neigh[i],0,comm,&send_reqs[i-1]);CHKERRQ(ierr);
1655ea7e1babSStefano Zampini     ierr = MPI_Irecv(&recv_buffer[ptrs_buffer[i-1]],j,MPIU_SCALAR,pcis->neigh[i],0,comm,&recv_reqs[i-1]);CHKERRQ(ierr);
16563425bc38SStefano Zampini   }
16573425bc38SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1658ea7e1babSStefano Zampini   ierr = MPI_Waitall((pcis->n_neigh-1),recv_reqs,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
16593425bc38SStefano Zampini   /* put values in correct places */
16603425bc38SStefano Zampini   for (i=1;i<pcis->n_neigh;i++) {
16613425bc38SStefano Zampini     for (j=0;j<pcis->n_shared[i];j++) {
16623425bc38SStefano Zampini       k = pcis->shared[i][j];
16633425bc38SStefano Zampini       neigh_position = 0;
16643425bc38SStefano Zampini       while(mat_graph->neighbours_set[k][neigh_position] != pcis->neigh[i]) {neigh_position++;}
16653425bc38SStefano Zampini       s = (mat_graph->neighbours_set[k][0] == -1 ?  1 : 0);
16663425bc38SStefano Zampini       neigh_position = neigh_position - s;
16673425bc38SStefano Zampini       all_factors[k][neigh_position]=recv_buffer[ptrs_buffer[i-1]+j];
16683425bc38SStefano Zampini     }
16693425bc38SStefano Zampini   }
1670ea7e1babSStefano Zampini   ierr = MPI_Waitall((pcis->n_neigh-1),send_reqs,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
16713425bc38SStefano Zampini   ierr = PetscFree(send_reqs);CHKERRQ(ierr);
16723425bc38SStefano Zampini   ierr = PetscFree(recv_reqs);CHKERRQ(ierr);
16733425bc38SStefano Zampini   ierr = PetscFree(send_buffer);CHKERRQ(ierr);
16743425bc38SStefano Zampini   ierr = PetscFree(recv_buffer);CHKERRQ(ierr);
16753425bc38SStefano Zampini   ierr = PetscFree(ptrs_buffer);CHKERRQ(ierr);
16763425bc38SStefano Zampini 
16773425bc38SStefano Zampini   /* Compute B and B_delta (local actions) */
16783425bc38SStefano Zampini   ierr = PetscMalloc(pcis->n_neigh*sizeof(*aux_sums),&aux_sums);CHKERRQ(ierr);
16793425bc38SStefano Zampini   ierr = PetscMalloc(n_local_lambda*sizeof(*l2g_indices),&l2g_indices);CHKERRQ(ierr);
16803425bc38SStefano Zampini   ierr = PetscMalloc(n_local_lambda*sizeof(*vals_B_delta),&vals_B_delta);CHKERRQ(ierr);
16813425bc38SStefano Zampini   ierr = PetscMalloc(n_local_lambda*sizeof(*cols_B_delta),&cols_B_delta);CHKERRQ(ierr);
16823425bc38SStefano Zampini   ierr = PetscMalloc(n_local_lambda*sizeof(*scaling_factors),&scaling_factors);CHKERRQ(ierr);
16833425bc38SStefano Zampini   n_global_lambda=0;
16843425bc38SStefano Zampini   partial_sum=0;
16853425bc38SStefano Zampini   for (i=0;i<dual_size;i++) {
1686ef028eecSStefano Zampini     n_global_lambda = aux_global_numbering[i];
16873425bc38SStefano Zampini     j = mat_graph->count[aux_local_numbering_1[i]];
16883425bc38SStefano Zampini     k = (mat_graph->neighbours_set[aux_local_numbering_1[i]][0] == -1 ?  1 : 0);
16893425bc38SStefano Zampini     j = j - k;
16903425bc38SStefano Zampini     aux_sums[0]=0;
16913425bc38SStefano Zampini     for (s=1;s<j;s++) {
16923425bc38SStefano Zampini       aux_sums[s]=aux_sums[s-1]+j-s+1;
16933425bc38SStefano Zampini     }
16943425bc38SStefano Zampini     array = all_factors[aux_local_numbering_1[i]];
16953425bc38SStefano Zampini     n_neg_values = 0;
16963425bc38SStefano Zampini     while(n_neg_values < j && mat_graph->neighbours_set[aux_local_numbering_1[i]][n_neg_values+k] < rank) {n_neg_values++;}
16973425bc38SStefano Zampini     n_pos_values = j - n_neg_values;
16983425bc38SStefano Zampini     if (fully_redundant) {
16993425bc38SStefano Zampini       for (s=0;s<n_neg_values;s++) {
17003425bc38SStefano Zampini         l2g_indices    [partial_sum+s]=aux_sums[s]+n_neg_values-s-1+n_global_lambda;
17013425bc38SStefano Zampini         cols_B_delta   [partial_sum+s]=dual_dofs_boundary_indices[i];
17023425bc38SStefano Zampini         vals_B_delta   [partial_sum+s]=-1.0;
17033425bc38SStefano Zampini         scaling_factors[partial_sum+s]=array[s];
17043425bc38SStefano Zampini       }
17053425bc38SStefano Zampini       for (s=0;s<n_pos_values;s++) {
17063425bc38SStefano Zampini         l2g_indices    [partial_sum+s+n_neg_values]=aux_sums[n_neg_values]+s+n_global_lambda;
17073425bc38SStefano Zampini         cols_B_delta   [partial_sum+s+n_neg_values]=dual_dofs_boundary_indices[i];
17083425bc38SStefano Zampini         vals_B_delta   [partial_sum+s+n_neg_values]=1.0;
17093425bc38SStefano Zampini         scaling_factors[partial_sum+s+n_neg_values]=array[s+n_neg_values];
17103425bc38SStefano Zampini       }
17113425bc38SStefano Zampini       partial_sum += j;
17123425bc38SStefano Zampini     } else {
17133425bc38SStefano Zampini       /* l2g_indices and default cols and vals of B_delta */
17143425bc38SStefano Zampini       for (s=0;s<j;s++) {
17153425bc38SStefano Zampini         l2g_indices    [partial_sum+s]=n_global_lambda+s;
17163425bc38SStefano Zampini         cols_B_delta   [partial_sum+s]=dual_dofs_boundary_indices[i];
17173425bc38SStefano Zampini         vals_B_delta   [partial_sum+s]=0.0;
17183425bc38SStefano Zampini       }
17193425bc38SStefano Zampini       /* B_delta */
17203425bc38SStefano Zampini       if ( n_neg_values > 0 ) { /* there's a rank next to me to the left */
17213425bc38SStefano Zampini         vals_B_delta   [partial_sum+n_neg_values-1]=-1.0;
17223425bc38SStefano Zampini       }
17233425bc38SStefano Zampini       if ( n_neg_values < j ) { /* there's a rank next to me to the right */
17243425bc38SStefano Zampini         vals_B_delta   [partial_sum+n_neg_values]=1.0;
17253425bc38SStefano Zampini       }
17263425bc38SStefano Zampini       /* scaling as in Klawonn-Widlund 1999*/
17273425bc38SStefano Zampini       for (s=0;s<n_neg_values;s++) {
17283425bc38SStefano Zampini         scalar_value = 0.0;
17293425bc38SStefano Zampini         for (k=0;k<s+1;k++) {
17303425bc38SStefano Zampini           scalar_value += array[k];
17313425bc38SStefano Zampini         }
1732ef028eecSStefano Zampini         scaling_factors[partial_sum+s] = -scalar_value;
17333425bc38SStefano Zampini       }
17343425bc38SStefano Zampini       for (s=0;s<n_pos_values;s++) {
17353425bc38SStefano Zampini         scalar_value = 0.0;
17363425bc38SStefano Zampini         for (k=s+n_neg_values;k<j;k++) {
17373425bc38SStefano Zampini           scalar_value += array[k];
17383425bc38SStefano Zampini         }
17393425bc38SStefano Zampini         scaling_factors[partial_sum+s+n_neg_values] = scalar_value;
17403425bc38SStefano Zampini       }
17413425bc38SStefano Zampini       partial_sum += j;
17423425bc38SStefano Zampini     }
17433425bc38SStefano Zampini   }
1744ef028eecSStefano Zampini   ierr = PetscFree(aux_global_numbering);CHKERRQ(ierr);
1745f0474715SStefano Zampini   ierr = PetscFree(aux_sums);CHKERRQ(ierr);
1746f0474715SStefano Zampini   ierr = PetscFree(aux_local_numbering_1);CHKERRQ(ierr);
1747f0474715SStefano Zampini   ierr = PetscFree(dual_dofs_boundary_indices);CHKERRQ(ierr);
17483425bc38SStefano Zampini   ierr = PetscFree(all_factors[0]);CHKERRQ(ierr);
17493425bc38SStefano Zampini   ierr = PetscFree(all_factors);CHKERRQ(ierr);
17503425bc38SStefano Zampini   /* printf("I found %d local lambda dofs when numbering them (should be %d)\n",partial_sum,n_local_lambda); */
1751f0474715SStefano Zampini 
1752f0474715SStefano Zampini   /* Local to global mapping of fetidpmat */
1753f0474715SStefano Zampini   ierr = VecCreate(PETSC_COMM_SELF,&fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
1754f0474715SStefano Zampini   ierr = VecSetSizes(fetidpmat_ctx->lambda_local,n_local_lambda,n_local_lambda);CHKERRQ(ierr);
1755f0474715SStefano Zampini   ierr = VecSetType(fetidpmat_ctx->lambda_local,VECSEQ);CHKERRQ(ierr);
1756f0474715SStefano Zampini   ierr = VecCreate(comm,&lambda_global);CHKERRQ(ierr);
1757f0474715SStefano Zampini   ierr = VecSetSizes(lambda_global,PETSC_DECIDE,fetidpmat_ctx->n_lambda);CHKERRQ(ierr);
1758f0474715SStefano Zampini   ierr = VecSetType(lambda_global,VECMPI);CHKERRQ(ierr);
17593425bc38SStefano Zampini   ierr = ISCreateGeneral(comm,n_local_lambda,l2g_indices,PETSC_OWN_POINTER,&IS_l2g_lambda);CHKERRQ(ierr);
17603425bc38SStefano Zampini   ierr = VecScatterCreate(fetidpmat_ctx->lambda_local,(IS)0,lambda_global,IS_l2g_lambda,&fetidpmat_ctx->l2g_lambda);CHKERRQ(ierr);
1761f0474715SStefano Zampini   ierr = ISDestroy(&IS_l2g_lambda);CHKERRQ(ierr);
17623425bc38SStefano Zampini 
17633425bc38SStefano Zampini   /* Create local part of B_delta */
17643425bc38SStefano Zampini   ierr = MatCreate(PETSC_COMM_SELF,&fetidpmat_ctx->B_delta);
17653425bc38SStefano Zampini   ierr = MatSetSizes(fetidpmat_ctx->B_delta,n_local_lambda,pcis->n_B,n_local_lambda,pcis->n_B);CHKERRQ(ierr);
17663425bc38SStefano Zampini   ierr = MatSetType(fetidpmat_ctx->B_delta,MATSEQAIJ);CHKERRQ(ierr);
17673425bc38SStefano Zampini   ierr = MatSeqAIJSetPreallocation(fetidpmat_ctx->B_delta,1,PETSC_NULL);CHKERRQ(ierr);
17683425bc38SStefano Zampini   ierr = MatSetOption(fetidpmat_ctx->B_delta,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr);
17693425bc38SStefano Zampini   for (i=0;i<n_local_lambda;i++) {
17703425bc38SStefano Zampini     ierr = MatSetValue(fetidpmat_ctx->B_delta,i,cols_B_delta[i],vals_B_delta[i],INSERT_VALUES);CHKERRQ(ierr);
17713425bc38SStefano Zampini   }
1772f0474715SStefano Zampini   ierr = PetscFree(vals_B_delta);CHKERRQ(ierr);
17733425bc38SStefano Zampini   ierr = MatAssemblyBegin(fetidpmat_ctx->B_delta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
17743425bc38SStefano Zampini   ierr = MatAssemblyEnd  (fetidpmat_ctx->B_delta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
17753425bc38SStefano Zampini 
17763425bc38SStefano Zampini   if (fully_redundant) {
17773425bc38SStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&ScalingMat);
17783425bc38SStefano Zampini     ierr = MatSetSizes(ScalingMat,n_local_lambda,n_local_lambda,n_local_lambda,n_local_lambda);CHKERRQ(ierr);
17793425bc38SStefano Zampini     ierr = MatSetType(ScalingMat,MATSEQAIJ);CHKERRQ(ierr);
17803425bc38SStefano Zampini     ierr = MatSeqAIJSetPreallocation(ScalingMat,1,PETSC_NULL);CHKERRQ(ierr);
17813425bc38SStefano Zampini     for (i=0;i<n_local_lambda;i++) {
17823425bc38SStefano Zampini       ierr = MatSetValue(ScalingMat,i,i,scaling_factors[i],INSERT_VALUES);CHKERRQ(ierr);
17833425bc38SStefano Zampini     }
17843425bc38SStefano Zampini     ierr = MatAssemblyBegin(ScalingMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
17853425bc38SStefano Zampini     ierr = MatAssemblyEnd  (ScalingMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
17863425bc38SStefano Zampini     ierr = MatMatMult(ScalingMat,fetidpmat_ctx->B_delta,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&fetidpmat_ctx->B_Ddelta);CHKERRQ(ierr);
17873425bc38SStefano Zampini     ierr = MatDestroy(&ScalingMat);CHKERRQ(ierr);
17883425bc38SStefano Zampini   } else {
17893425bc38SStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&fetidpmat_ctx->B_Ddelta);
17903425bc38SStefano Zampini     ierr = MatSetSizes(fetidpmat_ctx->B_Ddelta,n_local_lambda,pcis->n_B,n_local_lambda,pcis->n_B);CHKERRQ(ierr);
17913425bc38SStefano Zampini     ierr = MatSetType(fetidpmat_ctx->B_Ddelta,MATSEQAIJ);CHKERRQ(ierr);
17923425bc38SStefano Zampini     ierr = MatSeqAIJSetPreallocation(fetidpmat_ctx->B_Ddelta,1,PETSC_NULL);CHKERRQ(ierr);
17933425bc38SStefano Zampini     for (i=0;i<n_local_lambda;i++) {
17943425bc38SStefano Zampini       ierr = MatSetValue(fetidpmat_ctx->B_Ddelta,i,cols_B_delta[i],scaling_factors[i],INSERT_VALUES);CHKERRQ(ierr);
17953425bc38SStefano Zampini     }
17963425bc38SStefano Zampini     ierr = MatAssemblyBegin(fetidpmat_ctx->B_Ddelta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
17973425bc38SStefano Zampini     ierr = MatAssemblyEnd  (fetidpmat_ctx->B_Ddelta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
17983425bc38SStefano Zampini   }
1799f0474715SStefano Zampini   ierr = PetscFree(scaling_factors);CHKERRQ(ierr);
1800f0474715SStefano Zampini   ierr = PetscFree(cols_B_delta);CHKERRQ(ierr);
18013425bc38SStefano Zampini 
18023425bc38SStefano Zampini   /* Create some vectors needed by fetidp */
18033425bc38SStefano Zampini   ierr = VecDuplicate(pcis->vec1_B,&fetidpmat_ctx->temp_solution_B);CHKERRQ(ierr);
18043425bc38SStefano Zampini   ierr = VecDuplicate(pcis->vec1_D,&fetidpmat_ctx->temp_solution_D);CHKERRQ(ierr);
18053425bc38SStefano Zampini 
18063425bc38SStefano Zampini   test_fetidp = PETSC_FALSE;
18073425bc38SStefano Zampini   ierr = PetscOptionsGetBool(PETSC_NULL,"-fetidp_check",&test_fetidp,PETSC_NULL);CHKERRQ(ierr);
18083425bc38SStefano Zampini 
18093425bc38SStefano Zampini   if (test_fetidp) {
18103425bc38SStefano Zampini 
18113425bc38SStefano Zampini     ierr = PetscViewerASCIIGetStdout(((PetscObject)(fetidpmat_ctx->pc))->comm,&viewer);CHKERRQ(ierr);
18123425bc38SStefano Zampini     ierr = PetscViewerASCIISynchronizedAllow(viewer,PETSC_TRUE);CHKERRQ(ierr);
18133425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"----------FETI_DP TESTS--------------\n");CHKERRQ(ierr);
18143425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"All tests should return zero!\n");CHKERRQ(ierr);
18153425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"FETIDP MAT context in the ");CHKERRQ(ierr);
18163425bc38SStefano Zampini     if (fully_redundant) {
18173425bc38SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"fully redundant case for lagrange multipliers.\n");CHKERRQ(ierr);
18183425bc38SStefano Zampini     } else {
18193425bc38SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Non-fully redundant case for lagrange multiplier.\n");CHKERRQ(ierr);
18203425bc38SStefano Zampini     }
18213425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
18223425bc38SStefano Zampini 
18233425bc38SStefano Zampini     /******************************************************************/
18243425bc38SStefano Zampini     /* TEST A/B: Test numbering of global lambda dofs             */
18253425bc38SStefano Zampini     /******************************************************************/
18263425bc38SStefano Zampini 
18273425bc38SStefano Zampini     ierr = VecDuplicate(fetidpmat_ctx->lambda_local,&test_vec);CHKERRQ(ierr);
18283425bc38SStefano Zampini     ierr = VecSet(lambda_global,1.0);CHKERRQ(ierr);
18293425bc38SStefano Zampini     ierr = VecSet(test_vec,1.0);CHKERRQ(ierr);
18303425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18313425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18323425bc38SStefano Zampini     scalar_value = -1.0;
18333425bc38SStefano Zampini     ierr = VecAXPY(test_vec,scalar_value,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
18343425bc38SStefano Zampini     ierr = VecNorm(test_vec,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
18353425bc38SStefano Zampini     ierr = VecDestroy(&test_vec);CHKERRQ(ierr);
18363425bc38SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"A[%04d]: CHECK glob to loc: % 1.14e\n",rank,scalar_value);CHKERRQ(ierr);
18373425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
18383425bc38SStefano Zampini     if (fully_redundant) {
18393425bc38SStefano Zampini       ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr);
18403425bc38SStefano Zampini       ierr = VecSet(fetidpmat_ctx->lambda_local,0.5);CHKERRQ(ierr);
18413425bc38SStefano Zampini       ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18423425bc38SStefano Zampini       ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18433425bc38SStefano Zampini       ierr = VecSum(lambda_global,&scalar_value);CHKERRQ(ierr);
18443425bc38SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"B[%04d]: CHECK loc to glob: % 1.14e\n",rank,scalar_value-fetidpmat_ctx->n_lambda);CHKERRQ(ierr);
18453425bc38SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
18463425bc38SStefano Zampini     }
18473425bc38SStefano Zampini 
18483425bc38SStefano Zampini     /******************************************************************/
18493425bc38SStefano Zampini     /* TEST C: It should holds B_delta*w=0, w\in\widehat{W}           */
18503425bc38SStefano Zampini     /* This is the meaning of the B matrix                            */
18513425bc38SStefano Zampini     /******************************************************************/
18523425bc38SStefano Zampini 
18533425bc38SStefano Zampini     ierr = VecSetRandom(pcis->vec1_N,PETSC_NULL);CHKERRQ(ierr);
18543425bc38SStefano Zampini     ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
18553425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18563425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18573425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18583425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18593425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18603425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18613425bc38SStefano Zampini     /* Action of B_delta */
18623425bc38SStefano Zampini     ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
18633425bc38SStefano Zampini     ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr);
18643425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18653425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18663425bc38SStefano Zampini     ierr = VecNorm(lambda_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
18673425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"C[coll]: CHECK infty norm of B_delta*w (w continuous): % 1.14e\n",scalar_value);CHKERRQ(ierr);
18683425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
18693425bc38SStefano Zampini 
18703425bc38SStefano Zampini     /******************************************************************/
18713425bc38SStefano Zampini     /* TEST D: It should holds E_Dw = w - P_Dw w\in\widetilde{W}     */
18723425bc38SStefano Zampini     /* E_D = R_D^TR                                                   */
18733425bc38SStefano Zampini     /* P_D = B_{D,delta}^T B_{delta}                                  */
18743425bc38SStefano Zampini     /* eq.44 Mandel Tezaur and Dohrmann 2005                          */
18753425bc38SStefano Zampini     /******************************************************************/
18763425bc38SStefano Zampini 
18773425bc38SStefano Zampini     /* compute a random vector in \widetilde{W} */
18783425bc38SStefano Zampini     ierr = VecSetRandom(pcis->vec1_N,PETSC_NULL);CHKERRQ(ierr);
18793425bc38SStefano Zampini     scalar_value = 0.0;  /* set zero at vertices */
18803425bc38SStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
18813425bc38SStefano Zampini     for (i=0;i<n_vertices;i++) { array[vertex_indices[i]]=scalar_value; }
18823425bc38SStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
18833425bc38SStefano Zampini     /* store w for final comparison */
18843425bc38SStefano Zampini     ierr = VecDuplicate(pcis->vec1_B,&test_vec);CHKERRQ(ierr);
18853425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,test_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18863425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,test_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18873425bc38SStefano Zampini 
18883425bc38SStefano Zampini     /* Jump operator P_D : results stored in pcis->vec1_B */
18893425bc38SStefano Zampini 
18903425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18913425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18923425bc38SStefano Zampini     /* Action of B_delta */
18933425bc38SStefano Zampini     ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
18943425bc38SStefano Zampini     ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr);
18953425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18963425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18973425bc38SStefano Zampini     /* Action of B_Ddelta^T */
18983425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18993425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
19003425bc38SStefano Zampini     ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
19013425bc38SStefano Zampini 
19023425bc38SStefano Zampini     /* Average operator E_D : results stored in pcis->vec2_B */
19033425bc38SStefano Zampini 
19043425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
19053425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
19063425bc38SStefano Zampini     ierr = VecPointwiseMult(pcis->vec2_B,pcis->D,pcis->vec2_B);CHKERRQ(ierr);
19073425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec2_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
19083425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec2_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
19093425bc38SStefano Zampini     ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
19103425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
19113425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
19123425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
19133425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
19143425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
19153425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
19163425bc38SStefano Zampini 
19173425bc38SStefano Zampini     /* test E_D=I-P_D */
19183425bc38SStefano Zampini     scalar_value = 1.0;
19193425bc38SStefano Zampini     ierr = VecAXPY(pcis->vec1_B,scalar_value,pcis->vec2_B);CHKERRQ(ierr);
19203425bc38SStefano Zampini     scalar_value = -1.0;
19213425bc38SStefano Zampini     ierr = VecAXPY(pcis->vec1_B,scalar_value,test_vec);CHKERRQ(ierr);
19223425bc38SStefano Zampini     ierr = VecNorm(pcis->vec1_B,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
19233425bc38SStefano Zampini     ierr = VecDestroy(&test_vec);CHKERRQ(ierr);
19243425bc38SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"D[%04d] CHECK infty norm of E_D + P_D - I: % 1.14e\n",rank,scalar_value);CHKERRQ(ierr);
19253425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
19263425bc38SStefano Zampini 
19273425bc38SStefano Zampini     /******************************************************************/
19283425bc38SStefano Zampini     /* TEST E: It should holds R_D^TP_Dw=0 w\in\widetilde{W}          */
19293425bc38SStefano Zampini     /* eq.48 Mandel Tezaur and Dohrmann 2005                          */
19303425bc38SStefano Zampini     /******************************************************************/
19313425bc38SStefano Zampini 
19323425bc38SStefano Zampini     ierr = VecSetRandom(pcis->vec1_N,PETSC_NULL);CHKERRQ(ierr);
19333425bc38SStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
19343425bc38SStefano Zampini     scalar_value = 0.0;  /* set zero at vertices */
19353425bc38SStefano Zampini     for (i=0;i<n_vertices;i++) { array[vertex_indices[i]]=scalar_value; }
19363425bc38SStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
19373425bc38SStefano Zampini 
19383425bc38SStefano Zampini     /* Jump operator P_D : results stored in pcis->vec1_B */
19393425bc38SStefano Zampini 
19403425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
19413425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
19423425bc38SStefano Zampini     /* Action of B_delta */
19433425bc38SStefano Zampini     ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
19443425bc38SStefano Zampini     ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr);
19453425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
19463425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
19473425bc38SStefano Zampini     /* Action of B_Ddelta^T */
19483425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
19493425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
19503425bc38SStefano Zampini     ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
19513425bc38SStefano Zampini     /* diagonal scaling */
19523425bc38SStefano Zampini     ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr);
19533425bc38SStefano Zampini     /* sum on the interface */
19543425bc38SStefano Zampini     ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
19553425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
19563425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
19573425bc38SStefano Zampini     ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
19583425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
19593425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
19603425bc38SStefano Zampini     ierr = VecNorm(pcis->vec1_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
19613425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"E[coll]: CHECK infty norm of R^T_D P_D: % 1.14e\n",scalar_value);CHKERRQ(ierr);
19623425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
19633425bc38SStefano Zampini 
19643425bc38SStefano Zampini     if (!fully_redundant) {
19653425bc38SStefano Zampini       /******************************************************************/
19663425bc38SStefano Zampini       /* TEST F: It should holds B_{delta}B^T_{D,delta}=I               */
19673425bc38SStefano Zampini       /* Corollary thm 14 Mandel Tezaur and Dohrmann 2005               */
19683425bc38SStefano Zampini       /******************************************************************/
19693425bc38SStefano Zampini       ierr = VecDuplicate(lambda_global,&test_vec);CHKERRQ(ierr);
19703425bc38SStefano Zampini       ierr = VecSetRandom(lambda_global,PETSC_NULL);CHKERRQ(ierr);
19713425bc38SStefano Zampini       /* Action of B_Ddelta^T */
19723425bc38SStefano Zampini       ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
19733425bc38SStefano Zampini       ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
19743425bc38SStefano Zampini       ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
19753425bc38SStefano Zampini       /* Action of B_delta */
19763425bc38SStefano Zampini       ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
19773425bc38SStefano Zampini       ierr = VecSet(test_vec,0.0);CHKERRQ(ierr);
19783425bc38SStefano Zampini       ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,test_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
19793425bc38SStefano Zampini       ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,test_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
19803425bc38SStefano Zampini       scalar_value = -1.0;
19813425bc38SStefano Zampini       ierr = VecAXPY(lambda_global,scalar_value,test_vec);CHKERRQ(ierr);
19823425bc38SStefano Zampini       ierr = VecNorm(lambda_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
19833425bc38SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"E[coll]: CHECK infty norm of P^T_D - I: % 1.14e\n",scalar_value);CHKERRQ(ierr);
19843425bc38SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
19853425bc38SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
19863425bc38SStefano Zampini       ierr = VecDestroy(&test_vec);CHKERRQ(ierr);
19873425bc38SStefano Zampini     }
19883425bc38SStefano Zampini   }
19893425bc38SStefano Zampini   /* final cleanup */
19903425bc38SStefano Zampini   ierr = PetscFree(vertex_indices);CHKERRQ(ierr);
19913425bc38SStefano Zampini   ierr = VecDestroy(&lambda_global);CHKERRQ(ierr);
19923425bc38SStefano Zampini 
19933425bc38SStefano Zampini   PetscFunctionReturn(0);
19943425bc38SStefano Zampini }
19953425bc38SStefano Zampini 
19963425bc38SStefano Zampini #undef __FUNCT__
19973425bc38SStefano Zampini #define __FUNCT__ "PCBDDCSetupFETIDPPCContext"
19983425bc38SStefano Zampini static PetscErrorCode PCBDDCSetupFETIDPPCContext(Mat fetimat, FETIDPPC_ctx *fetidppc_ctx)
19993425bc38SStefano Zampini {
20003425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
20013425bc38SStefano Zampini   PetscErrorCode ierr;
20023425bc38SStefano Zampini 
20033425bc38SStefano Zampini   PetscFunctionBegin;
20043425bc38SStefano Zampini   ierr = MatShellGetContext(fetimat,&mat_ctx);CHKERRQ(ierr);
20053425bc38SStefano Zampini   /* get references from objects created when setting up feti mat context */
20063425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)mat_ctx->lambda_local);CHKERRQ(ierr);
20073425bc38SStefano Zampini   fetidppc_ctx->lambda_local = mat_ctx->lambda_local;
20083425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)mat_ctx->B_Ddelta);CHKERRQ(ierr);
20093425bc38SStefano Zampini   fetidppc_ctx->B_Ddelta = mat_ctx->B_Ddelta;
20103425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)mat_ctx->l2g_lambda);CHKERRQ(ierr);
20113425bc38SStefano Zampini   fetidppc_ctx->l2g_lambda = mat_ctx->l2g_lambda;
20123425bc38SStefano Zampini   PetscFunctionReturn(0);
20133425bc38SStefano Zampini }
20143425bc38SStefano Zampini 
20153425bc38SStefano Zampini #undef __FUNCT__
20163425bc38SStefano Zampini #define __FUNCT__ "FETIDPMatMult"
20173425bc38SStefano Zampini static PetscErrorCode FETIDPMatMult(Mat fetimat, Vec x, Vec y)
20183425bc38SStefano Zampini {
20193425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
20203425bc38SStefano Zampini   PC_IS          *pcis;
20213425bc38SStefano Zampini   PetscErrorCode ierr;
20223425bc38SStefano Zampini 
20233425bc38SStefano Zampini   PetscFunctionBegin;
20243425bc38SStefano Zampini   ierr = MatShellGetContext(fetimat,&mat_ctx);CHKERRQ(ierr);
20253425bc38SStefano Zampini   pcis = (PC_IS*)mat_ctx->pc->data;
20263425bc38SStefano Zampini   /* Application of B_delta^T */
20273425bc38SStefano Zampini   ierr = VecScatterBegin(mat_ctx->l2g_lambda,x,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
20283425bc38SStefano Zampini   ierr = VecScatterEnd(mat_ctx->l2g_lambda,x,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
20293425bc38SStefano Zampini   ierr = MatMultTranspose(mat_ctx->B_delta,mat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
20303425bc38SStefano Zampini   /* Application of \widetilde{S}^-1 */
20313425bc38SStefano Zampini   ierr = VecSet(pcis->vec1_D,0.0);CHKERRQ(ierr);
20323425bc38SStefano Zampini   ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr);
20333425bc38SStefano Zampini   /* Application of B_delta */
20343425bc38SStefano Zampini   ierr = MatMult(mat_ctx->B_delta,pcis->vec1_B,mat_ctx->lambda_local);CHKERRQ(ierr);
20353425bc38SStefano Zampini   ierr = VecSet(y,0.0);CHKERRQ(ierr);
20363425bc38SStefano Zampini   ierr = VecScatterBegin(mat_ctx->l2g_lambda,mat_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20373425bc38SStefano Zampini   ierr = VecScatterEnd(mat_ctx->l2g_lambda,mat_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20383425bc38SStefano Zampini   PetscFunctionReturn(0);
20393425bc38SStefano Zampini }
20403425bc38SStefano Zampini 
20413425bc38SStefano Zampini #undef __FUNCT__
20423425bc38SStefano Zampini #define __FUNCT__ "FETIDPPCApply"
20433425bc38SStefano Zampini static PetscErrorCode FETIDPPCApply(PC fetipc, Vec x, Vec y)
20443425bc38SStefano Zampini {
20453425bc38SStefano Zampini   FETIDPPC_ctx   *pc_ctx;
20463425bc38SStefano Zampini   PC_IS          *pcis;
20473425bc38SStefano Zampini   PetscErrorCode ierr;
20483425bc38SStefano Zampini 
20493425bc38SStefano Zampini   PetscFunctionBegin;
20503425bc38SStefano Zampini   ierr = PCShellGetContext(fetipc,(void**)&pc_ctx);
20513425bc38SStefano Zampini   pcis = (PC_IS*)pc_ctx->pc->data;
20523425bc38SStefano Zampini   /* Application of B_Ddelta^T */
20533425bc38SStefano Zampini   ierr = VecScatterBegin(pc_ctx->l2g_lambda,x,pc_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
20543425bc38SStefano Zampini   ierr = VecScatterEnd(pc_ctx->l2g_lambda,x,pc_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
20553425bc38SStefano Zampini   ierr = VecSet(pcis->vec2_B,0.0);CHKERRQ(ierr);
20563425bc38SStefano Zampini   ierr = MatMultTranspose(pc_ctx->B_Ddelta,pc_ctx->lambda_local,pcis->vec2_B);CHKERRQ(ierr);
20573425bc38SStefano Zampini   /* Application of S */
20583425bc38SStefano Zampini   ierr = PCISApplySchur(pc_ctx->pc,pcis->vec2_B,pcis->vec1_B,(Vec)0,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
20593425bc38SStefano Zampini   /* Application of B_Ddelta */
20603425bc38SStefano Zampini   ierr = MatMult(pc_ctx->B_Ddelta,pcis->vec1_B,pc_ctx->lambda_local);CHKERRQ(ierr);
20613425bc38SStefano Zampini   ierr = VecSet(y,0.0);CHKERRQ(ierr);
20623425bc38SStefano Zampini   ierr = VecScatterBegin(pc_ctx->l2g_lambda,pc_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20633425bc38SStefano Zampini   ierr = VecScatterEnd(pc_ctx->l2g_lambda,pc_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20643425bc38SStefano Zampini   PetscFunctionReturn(0);
20653425bc38SStefano Zampini }
20663425bc38SStefano Zampini 
2067da1bb401SStefano Zampini #undef __FUNCT__
2068da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetupLocalAdjacencyGraph"
2069da1bb401SStefano Zampini static PetscErrorCode PCBDDCSetupLocalAdjacencyGraph(PC pc)
2070da1bb401SStefano Zampini {
2071da1bb401SStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
2072da1bb401SStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
2073*1a83f524SJed Brown   PetscInt       nvtxs;
2074*1a83f524SJed Brown   const PetscInt *xadj,*adjncy;
2075da1bb401SStefano Zampini   Mat            mat_adj;
2076da1bb401SStefano Zampini   PetscBool      symmetrize_rowij=PETSC_TRUE,compressed_rowij=PETSC_FALSE,flg_row=PETSC_TRUE;
2077da1bb401SStefano Zampini   PCBDDCGraph    mat_graph=pcbddc->mat_graph;
2078da1bb401SStefano Zampini   PetscErrorCode ierr;
2079da1bb401SStefano Zampini 
2080da1bb401SStefano Zampini   PetscFunctionBegin;
2081da1bb401SStefano Zampini   /* get CSR adjacency from local matrix if user has not yet provided local graph using PCBDDCSetLocalAdjacencyGraph function */
2082da1bb401SStefano Zampini   if (!mat_graph->xadj) {
2083da1bb401SStefano Zampini     ierr = MatConvert(matis->A,MATMPIADJ,MAT_INITIAL_MATRIX,&mat_adj);CHKERRQ(ierr);
2084da1bb401SStefano Zampini     ierr = MatGetRowIJ(mat_adj,0,symmetrize_rowij,compressed_rowij,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr);
2085da1bb401SStefano Zampini     if (!flg_row) {
2086da1bb401SStefano Zampini       SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in MatGetRowIJ called in %s\n",__FUNCT__);
2087da1bb401SStefano Zampini     }
2088da1bb401SStefano Zampini     /* Get adjacency into BDDC workspace */
2089da1bb401SStefano Zampini     ierr = PCBDDCSetLocalAdjacencyGraph(pc,nvtxs,xadj,adjncy,PETSC_COPY_VALUES);CHKERRQ(ierr);
2090da1bb401SStefano Zampini     ierr = MatRestoreRowIJ(mat_adj,0,symmetrize_rowij,compressed_rowij,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr);
2091da1bb401SStefano Zampini     if (!flg_row) {
2092da1bb401SStefano Zampini       SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in MatRestoreRowIJ called in %s\n",__FUNCT__);
2093da1bb401SStefano Zampini     }
2094da1bb401SStefano Zampini     ierr = MatDestroy(&mat_adj);CHKERRQ(ierr);
2095da1bb401SStefano Zampini   }
2096da1bb401SStefano Zampini   PetscFunctionReturn(0);
2097da1bb401SStefano Zampini }
2098da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
20990c7d97c5SJed Brown #undef __FUNCT__
21000c7d97c5SJed Brown #define __FUNCT__ "PCBDDCApplyInterfacePreconditioner"
21012617d88aSStefano Zampini static PetscErrorCode  PCBDDCApplyInterfacePreconditioner(PC pc)
21020c7d97c5SJed Brown {
21030c7d97c5SJed Brown   PetscErrorCode ierr;
21040c7d97c5SJed Brown   PC_BDDC*        pcbddc = (PC_BDDC*)(pc->data);
21050c7d97c5SJed Brown   PC_IS*            pcis = (PC_IS*)  (pc->data);
21063b03a366Sstefano_zampini   const PetscScalar zero = 0.0;
21070c7d97c5SJed Brown 
21080c7d97c5SJed Brown   PetscFunctionBegin;
21090c7d97c5SJed Brown   /* Application of PHI^T  */
21100c7d97c5SJed Brown   ierr = MatMultTranspose(pcbddc->coarse_phi_B,pcis->vec1_B,pcbddc->vec1_P);CHKERRQ(ierr);
21110c7d97c5SJed Brown   if (pcbddc->prec_type) { ierr = MatMultTransposeAdd(pcbddc->coarse_phi_D,pcis->vec1_D,pcbddc->vec1_P,pcbddc->vec1_P);CHKERRQ(ierr); }
21120c7d97c5SJed Brown 
21130c7d97c5SJed Brown   /* Scatter data of coarse_rhs */
2114142dfd88SStefano Zampini   if (pcbddc->coarse_rhs) { ierr = VecSet(pcbddc->coarse_rhs,zero);CHKERRQ(ierr); }
21150c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->vec1_P,pcbddc->coarse_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21160c7d97c5SJed Brown 
21170c7d97c5SJed Brown   /* Local solution on R nodes */
21180c7d97c5SJed Brown   ierr = VecSet(pcbddc->vec1_R,zero);CHKERRQ(ierr);
21190c7d97c5SJed Brown   ierr = VecScatterBegin(pcbddc->R_to_B,pcis->vec1_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21200c7d97c5SJed Brown   ierr = VecScatterEnd  (pcbddc->R_to_B,pcis->vec1_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21210c7d97c5SJed Brown   if (pcbddc->prec_type) {
21220c7d97c5SJed Brown     ierr = VecScatterBegin(pcbddc->R_to_D,pcis->vec1_D,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21230c7d97c5SJed Brown     ierr = VecScatterEnd  (pcbddc->R_to_D,pcis->vec1_D,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21240c7d97c5SJed Brown   }
21250c7d97c5SJed Brown   ierr = PCBDDCSolveSaddlePoint(pc);CHKERRQ(ierr);
21260c7d97c5SJed Brown   ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr);
21270c7d97c5SJed Brown   ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec2_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21280c7d97c5SJed Brown   ierr = VecScatterEnd  (pcbddc->R_to_B,pcbddc->vec2_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21290c7d97c5SJed Brown   if (pcbddc->prec_type) {
21300c7d97c5SJed Brown     ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec2_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21310c7d97c5SJed Brown     ierr = VecScatterEnd  (pcbddc->R_to_D,pcbddc->vec2_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21320c7d97c5SJed Brown   }
21330c7d97c5SJed Brown 
21340c7d97c5SJed Brown   /* Coarse solution */
21350c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataEnd(pc,pcbddc->vec1_P,pcbddc->coarse_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21360bdf917eSStefano Zampini   if (pcbddc->coarse_rhs) {
21370bdf917eSStefano Zampini     if (pcbddc->CoarseNullSpace) {
21380bdf917eSStefano Zampini       ierr = MatNullSpaceRemove(pcbddc->CoarseNullSpace,pcbddc->coarse_rhs,PETSC_NULL);CHKERRQ(ierr);
21390bdf917eSStefano Zampini     }
21400bdf917eSStefano Zampini     ierr = KSPSolve(pcbddc->coarse_ksp,pcbddc->coarse_rhs,pcbddc->coarse_vec);CHKERRQ(ierr);
21410bdf917eSStefano Zampini     if (pcbddc->CoarseNullSpace) {
21420bdf917eSStefano Zampini       ierr = MatNullSpaceRemove(pcbddc->CoarseNullSpace,pcbddc->coarse_vec,PETSC_NULL);CHKERRQ(ierr);
21430bdf917eSStefano Zampini     }
21440bdf917eSStefano Zampini   }
21450c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21460c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataEnd  (pc,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21470c7d97c5SJed Brown 
21480c7d97c5SJed Brown   /* Sum contributions from two levels */
21490c7d97c5SJed Brown   ierr = MatMultAdd(pcbddc->coarse_phi_B,pcbddc->vec1_P,pcis->vec1_B,pcis->vec1_B);CHKERRQ(ierr);
21500c7d97c5SJed Brown   if (pcbddc->prec_type) { ierr = MatMultAdd(pcbddc->coarse_phi_D,pcbddc->vec1_P,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); }
21510c7d97c5SJed Brown   PetscFunctionReturn(0);
21520c7d97c5SJed Brown }
21530c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
21540c7d97c5SJed Brown #undef __FUNCT__
21550c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSolveSaddlePoint"
215653cdbc3dSStefano Zampini static PetscErrorCode  PCBDDCSolveSaddlePoint(PC pc)
21570c7d97c5SJed Brown {
21580c7d97c5SJed Brown   PetscErrorCode ierr;
21590c7d97c5SJed Brown   PC_BDDC*       pcbddc = (PC_BDDC*)(pc->data);
21600c7d97c5SJed Brown 
21610c7d97c5SJed Brown   PetscFunctionBegin;
216253cdbc3dSStefano Zampini   ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
2163534831adSStefano Zampini   if (pcbddc->local_auxmat1) {
21640c7d97c5SJed Brown     ierr = MatMult(pcbddc->local_auxmat1,pcbddc->vec2_R,pcbddc->vec1_C);CHKERRQ(ierr);
21650c7d97c5SJed Brown     ierr = MatMultAdd(pcbddc->local_auxmat2,pcbddc->vec1_C,pcbddc->vec2_R,pcbddc->vec2_R);CHKERRQ(ierr);
21660c7d97c5SJed Brown   }
21670c7d97c5SJed Brown   PetscFunctionReturn(0);
21680c7d97c5SJed Brown }
21690c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
21700c7d97c5SJed Brown #undef __FUNCT__
21710c7d97c5SJed Brown #define __FUNCT__ "PCBDDCScatterCoarseDataBegin"
217253cdbc3dSStefano Zampini static PetscErrorCode  PCBDDCScatterCoarseDataBegin(PC pc,Vec vec_from, Vec vec_to, InsertMode imode, ScatterMode smode)
21730c7d97c5SJed Brown {
21740c7d97c5SJed Brown   PetscErrorCode ierr;
21750c7d97c5SJed Brown   PC_BDDC*       pcbddc = (PC_BDDC*)(pc->data);
21760c7d97c5SJed Brown 
21770c7d97c5SJed Brown   PetscFunctionBegin;
21780c7d97c5SJed Brown   switch(pcbddc->coarse_communications_type){
21790c7d97c5SJed Brown     case SCATTERS_BDDC:
21800c7d97c5SJed Brown       ierr = VecScatterBegin(pcbddc->coarse_loc_to_glob,vec_from,vec_to,imode,smode);CHKERRQ(ierr);
21810c7d97c5SJed Brown       break;
21820c7d97c5SJed Brown     case GATHERS_BDDC:
21830c7d97c5SJed Brown       break;
21840c7d97c5SJed Brown   }
21850c7d97c5SJed Brown   PetscFunctionReturn(0);
21860c7d97c5SJed Brown }
21870c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
21880c7d97c5SJed Brown #undef __FUNCT__
21890c7d97c5SJed Brown #define __FUNCT__ "PCBDDCScatterCoarseDataEnd"
219053cdbc3dSStefano Zampini static PetscErrorCode  PCBDDCScatterCoarseDataEnd(PC pc,Vec vec_from, Vec vec_to, InsertMode imode, ScatterMode smode)
21910c7d97c5SJed Brown {
21920c7d97c5SJed Brown   PetscErrorCode ierr;
21930c7d97c5SJed Brown   PC_BDDC*       pcbddc = (PC_BDDC*)(pc->data);
21940c7d97c5SJed Brown   PetscScalar*   array_to;
21950c7d97c5SJed Brown   PetscScalar*   array_from;
21960c7d97c5SJed Brown   MPI_Comm       comm=((PetscObject)pc)->comm;
21970c7d97c5SJed Brown   PetscInt i;
21980c7d97c5SJed Brown 
21990c7d97c5SJed Brown   PetscFunctionBegin;
22000c7d97c5SJed Brown 
22010c7d97c5SJed Brown   switch(pcbddc->coarse_communications_type){
22020c7d97c5SJed Brown     case SCATTERS_BDDC:
22030c7d97c5SJed Brown       ierr = VecScatterEnd(pcbddc->coarse_loc_to_glob,vec_from,vec_to,imode,smode);CHKERRQ(ierr);
22040c7d97c5SJed Brown       break;
22050c7d97c5SJed Brown     case GATHERS_BDDC:
22060c7d97c5SJed Brown       if (vec_from) VecGetArray(vec_from,&array_from);
22070c7d97c5SJed Brown       if (vec_to)   VecGetArray(vec_to,&array_to);
22080c7d97c5SJed Brown       switch(pcbddc->coarse_problem_type){
22090c7d97c5SJed Brown         case SEQUENTIAL_BDDC:
22100c7d97c5SJed Brown           if (smode == SCATTER_FORWARD) {
221153cdbc3dSStefano Zampini             ierr = MPI_Gatherv(&array_from[0],pcbddc->local_primal_size,MPIU_SCALAR,&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,0,comm);CHKERRQ(ierr);
22120c7d97c5SJed Brown             if (vec_to) {
22130bdf917eSStefano Zampini               if (imode == ADD_VALUES) {
22140bdf917eSStefano Zampini                 for (i=0;i<pcbddc->replicated_primal_size;i++) {
22150c7d97c5SJed Brown                   array_to[pcbddc->replicated_local_primal_indices[i]]+=pcbddc->replicated_local_primal_values[i];
22160c7d97c5SJed Brown                 }
22170c7d97c5SJed Brown               } else {
22180bdf917eSStefano Zampini                 for (i=0;i<pcbddc->replicated_primal_size;i++) {
22190bdf917eSStefano Zampini                   array_to[pcbddc->replicated_local_primal_indices[i]]=pcbddc->replicated_local_primal_values[i];
22200bdf917eSStefano Zampini                 }
22210bdf917eSStefano Zampini               }
22220bdf917eSStefano Zampini             }
22230bdf917eSStefano Zampini           } else {
22240bdf917eSStefano Zampini             if (vec_from) {
22250bdf917eSStefano Zampini               if (imode == ADD_VALUES) {
22260bdf917eSStefano Zampini                 printf("Scatter mode %d, insert mode %d for case %d not implemented!\n",smode,imode,pcbddc->coarse_problem_type);
22270bdf917eSStefano Zampini               }
22280bdf917eSStefano Zampini               for (i=0;i<pcbddc->replicated_primal_size;i++) {
22290c7d97c5SJed Brown                 pcbddc->replicated_local_primal_values[i]=array_from[pcbddc->replicated_local_primal_indices[i]];
22300bdf917eSStefano Zampini               }
22310bdf917eSStefano Zampini             }
223253cdbc3dSStefano Zampini             ierr = MPI_Scatterv(&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,&array_to[0],pcbddc->local_primal_size,MPIU_SCALAR,0,comm);CHKERRQ(ierr);
22330c7d97c5SJed Brown           }
22340c7d97c5SJed Brown           break;
22350c7d97c5SJed Brown         case REPLICATED_BDDC:
22360c7d97c5SJed Brown           if (smode == SCATTER_FORWARD) {
223753cdbc3dSStefano Zampini             ierr = MPI_Allgatherv(&array_from[0],pcbddc->local_primal_size,MPIU_SCALAR,&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,comm);CHKERRQ(ierr);
22380bdf917eSStefano Zampini             if (imode == ADD_VALUES) {
22390bdf917eSStefano Zampini               for (i=0;i<pcbddc->replicated_primal_size;i++) {
22400c7d97c5SJed Brown                 array_to[pcbddc->replicated_local_primal_indices[i]]+=pcbddc->replicated_local_primal_values[i];
22410bdf917eSStefano Zampini               }
22420bdf917eSStefano Zampini             } else {
22430bdf917eSStefano Zampini               for (i=0;i<pcbddc->replicated_primal_size;i++) {
22440bdf917eSStefano Zampini                 array_to[pcbddc->replicated_local_primal_indices[i]]=pcbddc->replicated_local_primal_values[i];
22450bdf917eSStefano Zampini               }
22460bdf917eSStefano Zampini             }
22470c7d97c5SJed Brown           } else { /* no communications needed for SCATTER_REVERSE since needed data is already present */
22480bdf917eSStefano Zampini             if (imode == ADD_VALUES) {
22490bdf917eSStefano Zampini               for (i=0;i<pcbddc->local_primal_size;i++) {
22500bdf917eSStefano Zampini                 array_to[i]+=array_from[pcbddc->local_primal_indices[i]];
22510bdf917eSStefano Zampini               }
22520bdf917eSStefano Zampini             } else {
22530bdf917eSStefano Zampini               for (i=0;i<pcbddc->local_primal_size;i++) {
22540c7d97c5SJed Brown                 array_to[i]=array_from[pcbddc->local_primal_indices[i]];
22550c7d97c5SJed Brown               }
22560bdf917eSStefano Zampini             }
22570bdf917eSStefano Zampini           }
22580c7d97c5SJed Brown           break;
225953cdbc3dSStefano Zampini         case MULTILEVEL_BDDC:
226053cdbc3dSStefano Zampini           break;
226153cdbc3dSStefano Zampini         case PARALLEL_BDDC:
226253cdbc3dSStefano Zampini           break;
22630c7d97c5SJed Brown       }
22640c7d97c5SJed Brown       if (vec_from) VecRestoreArray(vec_from,&array_from);
22650c7d97c5SJed Brown       if (vec_to)   VecRestoreArray(vec_to,&array_to);
22660c7d97c5SJed Brown       break;
22670c7d97c5SJed Brown   }
22680c7d97c5SJed Brown   PetscFunctionReturn(0);
22690c7d97c5SJed Brown }
22700c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
22713b03a366Sstefano_zampini #undef __FUNCT__
22723b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCCreateConstraintMatrix"
22733b03a366Sstefano_zampini static PetscErrorCode PCBDDCCreateConstraintMatrix(PC pc)
22743b03a366Sstefano_zampini {
22753b03a366Sstefano_zampini   PetscErrorCode ierr;
22763b03a366Sstefano_zampini   PC_IS*         pcis = (PC_IS*)(pc->data);
22773b03a366Sstefano_zampini   PC_BDDC*       pcbddc = (PC_BDDC*)pc->data;
22783b03a366Sstefano_zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
227923d4d1a5SStefano Zampini   PetscInt       *nnz,*is_indices;
22803b03a366Sstefano_zampini   PetscScalar    *temp_quadrature_constraint;
2281534831adSStefano Zampini   PetscInt       *temp_indices,*temp_indices_to_constraint,*temp_indices_to_constraint_B,*local_to_B;
22823b03a366Sstefano_zampini   PetscInt       local_primal_size,i,j,k,total_counts,max_size_of_constraint;
22833b03a366Sstefano_zampini   PetscInt       n_constraints,n_vertices,size_of_constraint;
2284534831adSStefano Zampini   PetscScalar    quad_value;
22853b03a366Sstefano_zampini   PetscBool      nnsp_has_cnst=PETSC_FALSE,use_nnsp_true=pcbddc->use_nnsp_true;
22863b03a366Sstefano_zampini   PetscInt       nnsp_size=0,nnsp_addone=0,temp_constraints,temp_start_ptr;
22873b03a366Sstefano_zampini   IS             *used_IS;
228819fd82e9SBarry Smith   MatType        impMatType=MATSEQAIJ;
22893b03a366Sstefano_zampini   PetscBLASInt   Bs,Bt,lwork,lierr;
22903b03a366Sstefano_zampini   PetscReal      tol=1.0e-8;
2291fcda91b4SJed Brown   MatNullSpace   nearnullsp;
2292fcda91b4SJed Brown   const Vec      *nearnullvecs;
22933b03a366Sstefano_zampini   Vec            *localnearnullsp;
22943b03a366Sstefano_zampini   PetscScalar    *work,*temp_basis,*array_vector,*correlation_mat;
22953b03a366Sstefano_zampini   PetscReal      *rwork,*singular_vals;
2296534831adSStefano Zampini   PetscBLASInt   Bone=1,*ipiv;
2297534831adSStefano Zampini   Vec            temp_vec;
2298534831adSStefano Zampini   Mat            temp_mat;
2299534831adSStefano Zampini   KSP            temp_ksp;
2300ffe5efe1SStefano Zampini   PC             temp_pc;
2301534831adSStefano Zampini   PetscInt       s,start_constraint,dual_dofs;
2302534831adSStefano Zampini   PetscBool      compute_submatrix,useksp=PETSC_FALSE;
2303534831adSStefano Zampini   PetscInt       *aux_primal_permutation,*aux_primal_numbering;
2304534831adSStefano Zampini   PetscBool      boolforface,*change_basis;
2305de534f79Sstefano_zampini /* some ugly conditional declarations */
23063b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
23073b03a366Sstefano_zampini   PetscScalar    dot_result;
23083b03a366Sstefano_zampini   PetscScalar    one=1.0,zero=0.0;
23093b03a366Sstefano_zampini   PetscInt       ii;
23103425bc38SStefano Zampini   PetscScalar    *singular_vectors;
23113425bc38SStefano Zampini   PetscBLASInt   *iwork,*ifail;
23123425bc38SStefano Zampini   PetscReal      dummy_real,abs_tol;
23133425bc38SStefano Zampini   PetscBLASInt   eigs_found;
23143b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
23153b03a366Sstefano_zampini   PetscScalar    val1,val2;
23163b03a366Sstefano_zampini #endif
23173425bc38SStefano Zampini #endif
23183b03a366Sstefano_zampini   PetscBLASInt   dummy_int;
23193b03a366Sstefano_zampini   PetscScalar    dummy_scalar;
23203b03a366Sstefano_zampini 
23213b03a366Sstefano_zampini   PetscFunctionBegin;
23223b03a366Sstefano_zampini   /* check if near null space is attached to global mat */
2323fcda91b4SJed Brown   ierr = MatGetNearNullSpace(pc->pmat,&nearnullsp);CHKERRQ(ierr);
2324fcda91b4SJed Brown   if (nearnullsp) {
2325fcda91b4SJed Brown     ierr = MatNullSpaceGetVecs(nearnullsp,&nnsp_has_cnst,&nnsp_size,&nearnullvecs);CHKERRQ(ierr);
23263b03a366Sstefano_zampini   } else { /* if near null space is not provided it uses constants */
23273b03a366Sstefano_zampini     nnsp_has_cnst = PETSC_TRUE;
23283b03a366Sstefano_zampini     use_nnsp_true = PETSC_TRUE;
23293b03a366Sstefano_zampini   }
23303b03a366Sstefano_zampini   if (nnsp_has_cnst) {
23313b03a366Sstefano_zampini     nnsp_addone = 1;
23323b03a366Sstefano_zampini   }
23333b03a366Sstefano_zampini   /*
23343b03a366Sstefano_zampini        Evaluate maximum storage size needed by the procedure
23353b03a366Sstefano_zampini        - temp_indices will contain start index of each constraint stored as follows
23363b03a366Sstefano_zampini        - temp_indices_to_constraint  [temp_indices[i],...,temp[indices[i+1]-1] will contain the indices (in local numbering) on which the constraint acts
2337534831adSStefano Zampini        - temp_indices_to_constraint_B[temp_indices[i],...,temp[indices[i+1]-1] will contain the indices (in boundary numbering) on which the constraint acts
23383b03a366Sstefano_zampini        - temp_quadrature_constraint  [temp_indices[i],...,temp[indices[i+1]-1] will contain the scalars representing the constraint itself
23393b03a366Sstefano_zampini                                                                                                                                                          */
2340da1bb401SStefano Zampini 
23413b03a366Sstefano_zampini   total_counts = pcbddc->n_ISForFaces+pcbddc->n_ISForEdges;
23423b03a366Sstefano_zampini   total_counts *= (nnsp_addone+nnsp_size);
2343da1bb401SStefano Zampini   ierr = ISGetSize(pcbddc->ISForVertices,&n_vertices);CHKERRQ(ierr);
2344da1bb401SStefano Zampini   total_counts += n_vertices;
23453b03a366Sstefano_zampini   ierr = PetscMalloc((total_counts+1)*sizeof(PetscInt),&temp_indices);CHKERRQ(ierr);
2346534831adSStefano Zampini   ierr = PetscMalloc((total_counts+1)*sizeof(PetscBool),&change_basis);CHKERRQ(ierr);
23473b03a366Sstefano_zampini   total_counts = 0;
23483b03a366Sstefano_zampini   max_size_of_constraint = 0;
23493b03a366Sstefano_zampini   for (i=0;i<pcbddc->n_ISForEdges+pcbddc->n_ISForFaces;i++){
23503b03a366Sstefano_zampini     if (i<pcbddc->n_ISForEdges){
23513b03a366Sstefano_zampini       used_IS = &pcbddc->ISForEdges[i];
23523b03a366Sstefano_zampini     } else {
23533b03a366Sstefano_zampini       used_IS = &pcbddc->ISForFaces[i-pcbddc->n_ISForEdges];
23543b03a366Sstefano_zampini     }
23553b03a366Sstefano_zampini     ierr = ISGetSize(*used_IS,&j);CHKERRQ(ierr);
23563b03a366Sstefano_zampini     total_counts += j;
23573b03a366Sstefano_zampini     if (j>max_size_of_constraint) max_size_of_constraint=j;
23583b03a366Sstefano_zampini   }
23593b03a366Sstefano_zampini   total_counts *= (nnsp_addone+nnsp_size);
2360da1bb401SStefano Zampini   total_counts += n_vertices;
23613b03a366Sstefano_zampini   ierr = PetscMalloc(total_counts*sizeof(PetscScalar),&temp_quadrature_constraint);CHKERRQ(ierr);
23623b03a366Sstefano_zampini   ierr = PetscMalloc(total_counts*sizeof(PetscInt),&temp_indices_to_constraint);CHKERRQ(ierr);
2363534831adSStefano Zampini   ierr = PetscMalloc(total_counts*sizeof(PetscInt),&temp_indices_to_constraint_B);CHKERRQ(ierr);
2364534831adSStefano Zampini   ierr = PetscMalloc(pcis->n*sizeof(PetscInt),&local_to_B);CHKERRQ(ierr);
2365534831adSStefano Zampini   ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2366534831adSStefano Zampini   for (i=0;i<pcis->n;i++) {
2367534831adSStefano Zampini     local_to_B[i]=-1;
2368534831adSStefano Zampini   }
2369534831adSStefano Zampini   for (i=0;i<pcis->n_B;i++) {
2370534831adSStefano Zampini     local_to_B[is_indices[i]]=i;
2371534831adSStefano Zampini   }
2372534831adSStefano Zampini   ierr = ISRestoreIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2373534831adSStefano Zampini 
23743b03a366Sstefano_zampini   /* First we issue queries to allocate optimal workspace for LAPACKgesvd or LAPACKsyev/LAPACKheev */
23753b03a366Sstefano_zampini   rwork = 0;
23763b03a366Sstefano_zampini   work = 0;
23773b03a366Sstefano_zampini   singular_vals = 0;
23783b03a366Sstefano_zampini   temp_basis = 0;
23793b03a366Sstefano_zampini   correlation_mat = 0;
23803b03a366Sstefano_zampini   if (!pcbddc->use_nnsp_true) {
23813b03a366Sstefano_zampini     PetscScalar temp_work;
23823b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
23833b03a366Sstefano_zampini     /* POD */
23843b03a366Sstefano_zampini     PetscInt max_n;
23853b03a366Sstefano_zampini     max_n = nnsp_addone+nnsp_size;
23863b03a366Sstefano_zampini     /* using some techniques borrowed from Proper Orthogonal Decomposition */
23873b03a366Sstefano_zampini     ierr = PetscMalloc(max_n*max_n*sizeof(PetscScalar),&correlation_mat);CHKERRQ(ierr);
23883425bc38SStefano Zampini     ierr = PetscMalloc(max_n*max_n*sizeof(PetscScalar),&singular_vectors);CHKERRQ(ierr);
23893b03a366Sstefano_zampini     ierr = PetscMalloc(max_n*sizeof(PetscReal),&singular_vals);CHKERRQ(ierr);
23903b03a366Sstefano_zampini     ierr = PetscMalloc(max_size_of_constraint*(nnsp_addone+nnsp_size)*sizeof(PetscScalar),&temp_basis);CHKERRQ(ierr);
23913b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
23923b03a366Sstefano_zampini     ierr = PetscMalloc(3*max_n*sizeof(PetscReal),&rwork);CHKERRQ(ierr);
23933b03a366Sstefano_zampini #endif
23943425bc38SStefano Zampini     ierr = PetscMalloc(5*max_n*sizeof(PetscBLASInt),&iwork);CHKERRQ(ierr);
23953425bc38SStefano Zampini     ierr = PetscMalloc(max_n*sizeof(PetscBLASInt),&ifail);CHKERRQ(ierr);
23963b03a366Sstefano_zampini     /* now we evaluate the optimal workspace using query with lwork=-1 */
23973b03a366Sstefano_zampini     Bt = PetscBLASIntCast(max_n);
23983b03a366Sstefano_zampini     lwork=-1;
23993425bc38SStefano Zampini     ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
24003b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
24013425bc38SStefano Zampini     abs_tol=1.e-8;
24023425bc38SStefano Zampini /*    LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,&temp_work,&lwork,&lierr); */
24033425bc38SStefano Zampini     LAPACKsyevx_("V","A","U",&Bt,correlation_mat,&Bt,&dummy_real,&dummy_real,&dummy_int,&dummy_int,
24043425bc38SStefano Zampini                  &abs_tol,&eigs_found,singular_vals,singular_vectors,&Bt,&temp_work,&lwork,iwork,ifail,&lierr);
24053b03a366Sstefano_zampini #else
24063425bc38SStefano Zampini /*    LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,&temp_work,&lwork,rwork,&lierr); */
24073425bc38SStefano Zampini /*  LAPACK call is missing here! TODO */
24083425bc38SStefano Zampini     SETERRQ(((PetscObject) pc)->comm, PETSC_ERR_SUP, "Not yet implemented for complexes when PETSC_MISSING_GESVD = 1");
24093b03a366Sstefano_zampini #endif
24103425bc38SStefano Zampini     if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SYEVX Lapack routine %d",(int)lierr);
24113425bc38SStefano Zampini     ierr = PetscFPTrapPop();CHKERRQ(ierr);
24123b03a366Sstefano_zampini #else /* on missing GESVD */
24133b03a366Sstefano_zampini     /* SVD */
24143b03a366Sstefano_zampini     PetscInt max_n,min_n;
24153b03a366Sstefano_zampini     max_n = max_size_of_constraint;
24163b03a366Sstefano_zampini     min_n = nnsp_addone+nnsp_size;
24173b03a366Sstefano_zampini     if (max_size_of_constraint < ( nnsp_addone+nnsp_size ) ) {
24183b03a366Sstefano_zampini       min_n = max_size_of_constraint;
24193b03a366Sstefano_zampini       max_n = nnsp_addone+nnsp_size;
24203b03a366Sstefano_zampini     }
24213b03a366Sstefano_zampini     ierr = PetscMalloc(min_n*sizeof(PetscReal),&singular_vals);CHKERRQ(ierr);
24223b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
24233b03a366Sstefano_zampini     ierr = PetscMalloc(5*min_n*sizeof(PetscReal),&rwork);CHKERRQ(ierr);
24243b03a366Sstefano_zampini #endif
24253b03a366Sstefano_zampini     /* now we evaluate the optimal workspace using query with lwork=-1 */
24263b03a366Sstefano_zampini     lwork=-1;
24273b03a366Sstefano_zampini     Bs = PetscBLASIntCast(max_n);
24283b03a366Sstefano_zampini     Bt = PetscBLASIntCast(min_n);
24293b03a366Sstefano_zampini     dummy_int = Bs;
2430670f3ff9SJed Brown     ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
24313b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
24323b03a366Sstefano_zampini     LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[0],&Bs,singular_vals,
24333b03a366Sstefano_zampini                  &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,&temp_work,&lwork,&lierr);
24343b03a366Sstefano_zampini #else
24353b03a366Sstefano_zampini     LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[0],&Bs,singular_vals,
24363b03a366Sstefano_zampini                  &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,&temp_work,&lwork,rwork,&lierr);
24373b03a366Sstefano_zampini #endif
24383b03a366Sstefano_zampini     if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SVD Lapack routine %d",(int)lierr);
2439670f3ff9SJed Brown     ierr = PetscFPTrapPop();CHKERRQ(ierr);
24403b03a366Sstefano_zampini #endif
24413b03a366Sstefano_zampini     /* Allocate optimal workspace */
24423b03a366Sstefano_zampini     lwork = PetscBLASIntCast((PetscInt)PetscRealPart(temp_work));
24433b03a366Sstefano_zampini     total_counts = (PetscInt)lwork;
24443b03a366Sstefano_zampini     ierr = PetscMalloc(total_counts*sizeof(PetscScalar),&work);CHKERRQ(ierr);
24453b03a366Sstefano_zampini   }
24463b03a366Sstefano_zampini   /* get local part of global near null space vectors */
24473b03a366Sstefano_zampini   ierr = PetscMalloc(nnsp_size*sizeof(Vec),&localnearnullsp);CHKERRQ(ierr);
24483b03a366Sstefano_zampini   for (k=0;k<nnsp_size;k++) {
24493b03a366Sstefano_zampini     ierr = VecDuplicate(pcis->vec1_N,&localnearnullsp[k]);CHKERRQ(ierr);
2450fcda91b4SJed Brown     ierr = VecScatterBegin(matis->ctx,nearnullvecs[k],localnearnullsp[k],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
2451fcda91b4SJed Brown     ierr = VecScatterEnd  (matis->ctx,nearnullvecs[k],localnearnullsp[k],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
24523b03a366Sstefano_zampini   }
24533b03a366Sstefano_zampini   /* Now we can loop on constraining sets */
24543b03a366Sstefano_zampini   total_counts=0;
24553b03a366Sstefano_zampini   temp_indices[0]=0;
2456da1bb401SStefano Zampini   /* vertices */
2457da1bb401SStefano Zampini   PetscBool used_vertex;
2458da1bb401SStefano Zampini   ierr = ISGetIndices(pcbddc->ISForVertices,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2459da1bb401SStefano Zampini   if (nnsp_has_cnst) { /* consider all vertices */
2460da1bb401SStefano Zampini     for (i=0;i<n_vertices;i++) {
2461da1bb401SStefano Zampini       temp_indices_to_constraint[temp_indices[total_counts]]=is_indices[i];
2462534831adSStefano Zampini       temp_indices_to_constraint_B[temp_indices[total_counts]]=local_to_B[is_indices[i]];
2463da1bb401SStefano Zampini       temp_quadrature_constraint[temp_indices[total_counts]]=1.0;
2464da1bb401SStefano Zampini       temp_indices[total_counts+1]=temp_indices[total_counts]+1;
2465534831adSStefano Zampini       change_basis[total_counts]=PETSC_FALSE;
2466da1bb401SStefano Zampini       total_counts++;
2467da1bb401SStefano Zampini     }
2468da1bb401SStefano Zampini   } else { /* consider vertices for which exist at least a localnearnullsp which is not null there */
2469da1bb401SStefano Zampini     for (i=0;i<n_vertices;i++) {
2470da1bb401SStefano Zampini       used_vertex=PETSC_FALSE;
2471da1bb401SStefano Zampini       k=0;
2472da1bb401SStefano Zampini       while(!used_vertex && k<nnsp_size) {
2473da1bb401SStefano Zampini         ierr = VecGetArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
2474da1bb401SStefano Zampini         if (PetscAbsScalar(array_vector[is_indices[i]])>0.0) {
2475da1bb401SStefano Zampini           temp_indices_to_constraint[temp_indices[total_counts]]=is_indices[i];
2476534831adSStefano Zampini           temp_indices_to_constraint_B[temp_indices[total_counts]]=local_to_B[is_indices[i]];
2477da1bb401SStefano Zampini           temp_quadrature_constraint[temp_indices[total_counts]]=1.0;
2478da1bb401SStefano Zampini           temp_indices[total_counts+1]=temp_indices[total_counts]+1;
2479534831adSStefano Zampini           change_basis[total_counts]=PETSC_FALSE;
2480da1bb401SStefano Zampini           total_counts++;
2481da1bb401SStefano Zampini           used_vertex=PETSC_TRUE;
2482da1bb401SStefano Zampini         }
2483da1bb401SStefano Zampini         ierr = VecRestoreArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
2484da1bb401SStefano Zampini         k++;
2485da1bb401SStefano Zampini       }
2486da1bb401SStefano Zampini     }
2487da1bb401SStefano Zampini   }
2488da1bb401SStefano Zampini   ierr = ISRestoreIndices(pcbddc->ISForVertices,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2489da1bb401SStefano Zampini   n_vertices=total_counts;
2490da1bb401SStefano Zampini   /* edges and faces */
24913b03a366Sstefano_zampini   for (i=0;i<pcbddc->n_ISForEdges+pcbddc->n_ISForFaces;i++){
24923b03a366Sstefano_zampini     if (i<pcbddc->n_ISForEdges){
24933b03a366Sstefano_zampini       used_IS = &pcbddc->ISForEdges[i];
2494534831adSStefano Zampini       boolforface = pcbddc->usechangeofbasis;
24953b03a366Sstefano_zampini     } else {
24963b03a366Sstefano_zampini       used_IS = &pcbddc->ISForFaces[i-pcbddc->n_ISForEdges];
2497534831adSStefano Zampini       boolforface = pcbddc->usechangeonfaces;
24983b03a366Sstefano_zampini     }
24993b03a366Sstefano_zampini     temp_constraints = 0;          /* zero the number of constraints I have on this conn comp */
25003b03a366Sstefano_zampini     temp_start_ptr = total_counts; /* need to know the starting index of constraints stored */
25013b03a366Sstefano_zampini     ierr = ISGetSize(*used_IS,&size_of_constraint);CHKERRQ(ierr);
25023b03a366Sstefano_zampini     ierr = ISGetIndices(*used_IS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
25033b03a366Sstefano_zampini     if (nnsp_has_cnst) {
25043b03a366Sstefano_zampini       temp_constraints++;
2505534831adSStefano Zampini       quad_value = (PetscScalar) (1.0/PetscSqrtReal((PetscReal)size_of_constraint));
25063b03a366Sstefano_zampini       for (j=0;j<size_of_constraint;j++) {
25073b03a366Sstefano_zampini         temp_indices_to_constraint[temp_indices[total_counts]+j]=is_indices[j];
2508534831adSStefano Zampini         temp_indices_to_constraint_B[temp_indices[total_counts]+j]=local_to_B[is_indices[j]];
25093b03a366Sstefano_zampini         temp_quadrature_constraint[temp_indices[total_counts]+j]=quad_value;
25103b03a366Sstefano_zampini       }
25113b03a366Sstefano_zampini       temp_indices[total_counts+1]=temp_indices[total_counts]+size_of_constraint;  /* store new starting point */
2512534831adSStefano Zampini       change_basis[total_counts]=boolforface;
25133b03a366Sstefano_zampini       total_counts++;
25143b03a366Sstefano_zampini     }
25153b03a366Sstefano_zampini     for (k=0;k<nnsp_size;k++) {
25163b03a366Sstefano_zampini       ierr = VecGetArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
25173b03a366Sstefano_zampini       for (j=0;j<size_of_constraint;j++) {
25183b03a366Sstefano_zampini         temp_indices_to_constraint[temp_indices[total_counts]+j]=is_indices[j];
2519534831adSStefano Zampini         temp_indices_to_constraint_B[temp_indices[total_counts]+j]=local_to_B[is_indices[j]];
25203b03a366Sstefano_zampini         temp_quadrature_constraint[temp_indices[total_counts]+j]=array_vector[is_indices[j]];
25213b03a366Sstefano_zampini       }
25223b03a366Sstefano_zampini       ierr = VecRestoreArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
2523de534f79Sstefano_zampini       quad_value = 1.0;
2524de534f79Sstefano_zampini       if ( use_nnsp_true ) { /* check if array is null on the connected component in case use_nnsp_true has been requested */
2525de534f79Sstefano_zampini         Bs = PetscBLASIntCast(size_of_constraint);
2526de534f79Sstefano_zampini         quad_value = BLASasum_(&Bs,&temp_quadrature_constraint[temp_indices[total_counts]],&Bone);
2527de534f79Sstefano_zampini       }
2528de534f79Sstefano_zampini       if ( quad_value > 0.0 ) { /* keep indices and values */
2529de534f79Sstefano_zampini         temp_constraints++;
25303b03a366Sstefano_zampini         temp_indices[total_counts+1]=temp_indices[total_counts]+size_of_constraint;  /* store new starting point */
2531534831adSStefano Zampini         change_basis[total_counts]=boolforface;
25323b03a366Sstefano_zampini         total_counts++;
25333b03a366Sstefano_zampini       }
2534de534f79Sstefano_zampini     }
25353b03a366Sstefano_zampini     ierr = ISRestoreIndices(*used_IS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2536de534f79Sstefano_zampini     /* perform SVD on the constraint if use_nnsp_true has not be requested by the user */
25373b03a366Sstefano_zampini     if (!use_nnsp_true) {
2538de534f79Sstefano_zampini 
25393b03a366Sstefano_zampini       Bs = PetscBLASIntCast(size_of_constraint);
25403b03a366Sstefano_zampini       Bt = PetscBLASIntCast(temp_constraints);
2541de534f79Sstefano_zampini 
25423b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
25433b03a366Sstefano_zampini       ierr = PetscMemzero(correlation_mat,Bt*Bt*sizeof(PetscScalar));CHKERRQ(ierr);
25443b03a366Sstefano_zampini       /* Store upper triangular part of correlation matrix */
25453b03a366Sstefano_zampini       for (j=0;j<temp_constraints;j++) {
25463b03a366Sstefano_zampini         for (k=0;k<j+1;k++) {
25473b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
25483425bc38SStefano Zampini           /* hand made complex dot product -> replace */
25493b03a366Sstefano_zampini           dot_result = 0.0;
25503b03a366Sstefano_zampini           for (ii=0; ii<size_of_constraint; ii++) {
25513b03a366Sstefano_zampini             val1 = temp_quadrature_constraint[temp_indices[temp_start_ptr+j]+ii];
25523b03a366Sstefano_zampini             val2 = temp_quadrature_constraint[temp_indices[temp_start_ptr+k]+ii];
25533b03a366Sstefano_zampini             dot_result += val1*PetscConj(val2);
25543b03a366Sstefano_zampini           }
25553b03a366Sstefano_zampini #else
25563b03a366Sstefano_zampini           dot_result = BLASdot_(&Bs,&temp_quadrature_constraint[temp_indices[temp_start_ptr+j]],&Bone,
25573b03a366Sstefano_zampini                                     &temp_quadrature_constraint[temp_indices[temp_start_ptr+k]],&Bone);
25583b03a366Sstefano_zampini #endif
25593b03a366Sstefano_zampini           correlation_mat[j*temp_constraints+k]=dot_result;
25603b03a366Sstefano_zampini         }
25613b03a366Sstefano_zampini       }
25623425bc38SStefano Zampini       ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
25633b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
25643425bc38SStefano Zampini /*      LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,work,&lwork,&lierr); */
25653425bc38SStefano Zampini       LAPACKsyevx_("V","A","U",&Bt,correlation_mat,&Bt,&dummy_real,&dummy_real,&dummy_int,&dummy_int,
25663425bc38SStefano Zampini                  &abs_tol,&eigs_found,singular_vals,singular_vectors,&Bt,work,&lwork,iwork,ifail,&lierr);
25673b03a366Sstefano_zampini #else
25683425bc38SStefano Zampini /*  LAPACK call is missing here! TODO */
25693425bc38SStefano Zampini       SETERRQ(((PetscObject) pc)->comm, PETSC_ERR_SUP, "Not yet implemented for complexes when PETSC_MISSING_GESVD = 1");
25703b03a366Sstefano_zampini #endif
25713425bc38SStefano Zampini       if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYEVX Lapack routine %d",(int)lierr);
25723425bc38SStefano Zampini       ierr = PetscFPTrapPop();CHKERRQ(ierr);
25733b03a366Sstefano_zampini       /* retain eigenvalues greater than tol: note that lapack SYEV gives eigs in ascending order */
25743b03a366Sstefano_zampini       j=0;
25753b03a366Sstefano_zampini       while( j < Bt && singular_vals[j] < tol) j++;
25763b03a366Sstefano_zampini       total_counts=total_counts-j;
25773b03a366Sstefano_zampini       if (j<temp_constraints) {
25783b03a366Sstefano_zampini         for (k=j;k<Bt;k++) { singular_vals[k]=1.0/PetscSqrtReal(singular_vals[k]); }
25793425bc38SStefano Zampini         ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
25803b03a366Sstefano_zampini         BLASgemm_("N","N",&Bs,&Bt,&Bt,&one,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,correlation_mat,&Bt,&zero,temp_basis,&Bs);
25813425bc38SStefano Zampini         ierr = PetscFPTrapPop();CHKERRQ(ierr);
25823b03a366Sstefano_zampini         /* copy POD basis into used quadrature memory */
25833b03a366Sstefano_zampini         for (k=0;k<Bt-j;k++) {
25843b03a366Sstefano_zampini           for (ii=0;ii<size_of_constraint;ii++) {
25853b03a366Sstefano_zampini             temp_quadrature_constraint[temp_indices[temp_start_ptr+k]+ii]=singular_vals[Bt-1-k]*temp_basis[(Bt-1-k)*size_of_constraint+ii];
25863b03a366Sstefano_zampini           }
25873b03a366Sstefano_zampini         }
25883b03a366Sstefano_zampini       }
2589de534f79Sstefano_zampini 
25903b03a366Sstefano_zampini #else  /* on missing GESVD */
25913b03a366Sstefano_zampini       PetscInt min_n = temp_constraints;
25923b03a366Sstefano_zampini       if (min_n > size_of_constraint) min_n = size_of_constraint;
25933b03a366Sstefano_zampini       dummy_int = Bs;
2594670f3ff9SJed Brown       ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
25953b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
25963b03a366Sstefano_zampini       LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,singular_vals,
25973b03a366Sstefano_zampini                    &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,work,&lwork,&lierr);
25983b03a366Sstefano_zampini #else
25993b03a366Sstefano_zampini       LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,singular_vals,
26003b03a366Sstefano_zampini                    &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,work,&lwork,rwork,&lierr);
26013b03a366Sstefano_zampini #endif
26023b03a366Sstefano_zampini       if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SVD Lapack routine %d",(int)lierr);
2603670f3ff9SJed Brown       ierr = PetscFPTrapPop();CHKERRQ(ierr);
26043b03a366Sstefano_zampini       /* retain eigenvalues greater than tol: note that lapack SVD gives eigs in descending order */
26053b03a366Sstefano_zampini       j=0;
26063b03a366Sstefano_zampini       while( j < min_n && singular_vals[min_n-j-1] < tol) j++;
26073b03a366Sstefano_zampini       total_counts = total_counts-(PetscInt)Bt+(min_n-j);
26083b03a366Sstefano_zampini #endif
26093b03a366Sstefano_zampini     }
26103b03a366Sstefano_zampini   }
2611534831adSStefano Zampini 
2612da1bb401SStefano Zampini   n_constraints=total_counts-n_vertices;
2613da1bb401SStefano Zampini   local_primal_size = total_counts;
26143b03a366Sstefano_zampini   /* set quantities in pcbddc data structure */
26153b03a366Sstefano_zampini   pcbddc->n_vertices = n_vertices;
26163b03a366Sstefano_zampini   pcbddc->n_constraints = n_constraints;
2617da1bb401SStefano Zampini   pcbddc->local_primal_size = local_primal_size;
2618534831adSStefano Zampini 
2619534831adSStefano Zampini   /* Create constraint matrix */
2620534831adSStefano Zampini   /* The constraint matrix is used to compute the l2g map of primal dofs */
2621534831adSStefano Zampini   /* so we need to set it up properly either with or without change of basis */
2622534831adSStefano Zampini   ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->ConstraintMatrix);CHKERRQ(ierr);
2623534831adSStefano Zampini   ierr = MatSetType(pcbddc->ConstraintMatrix,impMatType);CHKERRQ(ierr);
2624534831adSStefano Zampini   ierr = MatSetSizes(pcbddc->ConstraintMatrix,local_primal_size,pcis->n,local_primal_size,pcis->n);CHKERRQ(ierr);
2625534831adSStefano Zampini   /* compute a local numbering of constraints : vertices first then constraints */
2626534831adSStefano Zampini   ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
2627534831adSStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array_vector);CHKERRQ(ierr);
2628534831adSStefano Zampini   ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&aux_primal_numbering);CHKERRQ(ierr);
2629534831adSStefano Zampini   ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&aux_primal_permutation);CHKERRQ(ierr);
2630534831adSStefano Zampini   total_counts=0;
2631534831adSStefano Zampini   /* find vertices: subdomain corners plus dofs with basis changed */
2632534831adSStefano Zampini   for (i=0;i<local_primal_size;i++) {
2633534831adSStefano Zampini     size_of_constraint=temp_indices[i+1]-temp_indices[i];
2634534831adSStefano Zampini     if (change_basis[i] || size_of_constraint == 1) {
2635534831adSStefano Zampini       k=0;
2636534831adSStefano Zampini       while(k < size_of_constraint && array_vector[temp_indices_to_constraint[temp_indices[i]+size_of_constraint-k-1]] != 0.0) {
2637534831adSStefano Zampini         k=k+1;
2638534831adSStefano Zampini       }
2639534831adSStefano Zampini       j=temp_indices_to_constraint[temp_indices[i]+size_of_constraint-k-1];
2640534831adSStefano Zampini       array_vector[j] = 1.0;
2641534831adSStefano Zampini       aux_primal_numbering[total_counts]=j;
2642534831adSStefano Zampini       aux_primal_permutation[total_counts]=total_counts;
2643534831adSStefano Zampini       total_counts++;
2644534831adSStefano Zampini     }
2645534831adSStefano Zampini   }
2646534831adSStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array_vector);CHKERRQ(ierr);
2647534831adSStefano Zampini   /* permute indices in order to have a sorted set of vertices */
2648534831adSStefano Zampini   ierr = PetscSortIntWithPermutation(total_counts,aux_primal_numbering,aux_primal_permutation);
2649534831adSStefano Zampini   /* nonzero structure */
2650534831adSStefano Zampini   ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
2651534831adSStefano Zampini   for (i=0;i<total_counts;i++) {
2652534831adSStefano Zampini     nnz[i]=1;
2653534831adSStefano Zampini   }
2654534831adSStefano Zampini   j=total_counts;
2655534831adSStefano Zampini   for (i=n_vertices;i<local_primal_size;i++) {
2656534831adSStefano Zampini     if (!change_basis[i]) {
2657534831adSStefano Zampini       nnz[j]=temp_indices[i+1]-temp_indices[i];
2658534831adSStefano Zampini       j++;
2659534831adSStefano Zampini     }
2660534831adSStefano Zampini   }
2661534831adSStefano Zampini   ierr = MatSeqAIJSetPreallocation(pcbddc->ConstraintMatrix,0,nnz);CHKERRQ(ierr);
2662534831adSStefano Zampini   ierr = PetscFree(nnz);CHKERRQ(ierr);
2663534831adSStefano Zampini   /* set values in constraint matrix */
2664534831adSStefano Zampini   for (i=0;i<total_counts;i++) {
2665534831adSStefano Zampini     j = aux_primal_permutation[i];
2666534831adSStefano Zampini     k = aux_primal_numbering[j];
2667534831adSStefano Zampini     ierr = MatSetValue(pcbddc->ConstraintMatrix,i,k,1.0,INSERT_VALUES);CHKERRQ(ierr);
2668534831adSStefano Zampini   }
2669534831adSStefano Zampini   for (i=n_vertices;i<local_primal_size;i++) {
2670534831adSStefano Zampini     if (!change_basis[i]) {
2671534831adSStefano Zampini       size_of_constraint=temp_indices[i+1]-temp_indices[i];
2672534831adSStefano Zampini       ierr = MatSetValues(pcbddc->ConstraintMatrix,1,&total_counts,size_of_constraint,&temp_indices_to_constraint[temp_indices[i]],&temp_quadrature_constraint[temp_indices[i]],INSERT_VALUES);CHKERRQ(ierr);
2673534831adSStefano Zampini       total_counts++;
2674534831adSStefano Zampini     }
2675534831adSStefano Zampini   }
2676534831adSStefano Zampini   ierr = PetscFree(aux_primal_numbering);CHKERRQ(ierr);
2677534831adSStefano Zampini   ierr = PetscFree(aux_primal_permutation);CHKERRQ(ierr);
2678534831adSStefano Zampini   /* assembling */
2679534831adSStefano Zampini   ierr = MatAssemblyBegin(pcbddc->ConstraintMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2680534831adSStefano Zampini   ierr = MatAssemblyEnd(pcbddc->ConstraintMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2681534831adSStefano Zampini 
2682534831adSStefano Zampini   /* Create matrix for change of basis. We don't need it in case pcbddc->usechangeofbasis is FALSE */
2683534831adSStefano Zampini   if (pcbddc->usechangeofbasis) {
2684534831adSStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr);
2685534831adSStefano Zampini     ierr = MatSetType(pcbddc->ChangeOfBasisMatrix,impMatType);CHKERRQ(ierr);
2686534831adSStefano Zampini     ierr = MatSetSizes(pcbddc->ChangeOfBasisMatrix,pcis->n_B,pcis->n_B,pcis->n_B,pcis->n_B);CHKERRQ(ierr);
2687534831adSStefano Zampini     /* work arrays */
2688534831adSStefano Zampini     /* we need to reuse these arrays, so we free them */
2689534831adSStefano Zampini     ierr = PetscFree(temp_basis);CHKERRQ(ierr);
2690534831adSStefano Zampini     ierr = PetscFree(work);CHKERRQ(ierr);
2691534831adSStefano Zampini     ierr = PetscMalloc(pcis->n_B*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
2692534831adSStefano Zampini     ierr = PetscMalloc((nnsp_addone+nnsp_size)*(nnsp_addone+nnsp_size)*sizeof(PetscScalar),&temp_basis);CHKERRQ(ierr);
2693534831adSStefano Zampini     ierr = PetscMalloc((nnsp_addone+nnsp_size)*sizeof(PetscScalar),&work);CHKERRQ(ierr);
2694534831adSStefano Zampini     ierr = PetscMalloc((nnsp_addone+nnsp_size)*sizeof(PetscBLASInt),&ipiv);CHKERRQ(ierr);
2695534831adSStefano Zampini     for (i=0;i<pcis->n_B;i++) {
2696534831adSStefano Zampini       nnz[i]=1;
2697534831adSStefano Zampini     }
2698534831adSStefano Zampini     /* Overestimated nonzeros per row */
2699534831adSStefano Zampini     k=1;
2700534831adSStefano Zampini     for (i=pcbddc->n_vertices;i<local_primal_size;i++) {
2701534831adSStefano Zampini       if (change_basis[i]) {
2702534831adSStefano Zampini         size_of_constraint = temp_indices[i+1]-temp_indices[i];
2703534831adSStefano Zampini         if (k < size_of_constraint) {
2704534831adSStefano Zampini           k = size_of_constraint;
2705534831adSStefano Zampini         }
2706534831adSStefano Zampini         for (j=0;j<size_of_constraint;j++) {
2707534831adSStefano Zampini           nnz[temp_indices_to_constraint_B[temp_indices[i]+j]] = size_of_constraint;
2708534831adSStefano Zampini         }
2709534831adSStefano Zampini       }
2710534831adSStefano Zampini     }
2711534831adSStefano Zampini     ierr = MatSeqAIJSetPreallocation(pcbddc->ChangeOfBasisMatrix,0,nnz);CHKERRQ(ierr);
2712534831adSStefano Zampini     ierr = PetscFree(nnz);CHKERRQ(ierr);
2713534831adSStefano Zampini     /* Temporary array to store indices */
2714534831adSStefano Zampini     ierr = PetscMalloc(k*sizeof(PetscInt),&is_indices);CHKERRQ(ierr);
2715534831adSStefano Zampini     /* Set initial identity in the matrix */
2716534831adSStefano Zampini     for (i=0;i<pcis->n_B;i++) {
2717534831adSStefano Zampini       ierr = MatSetValue(pcbddc->ChangeOfBasisMatrix,i,i,1.0,INSERT_VALUES);CHKERRQ(ierr);
2718534831adSStefano Zampini     }
2719534831adSStefano Zampini     /* Now we loop on the constraints which need a change of basis */
2720534831adSStefano Zampini     /* Change of basis matrix is evaluated as the FIRST APPROACH in */
2721534831adSStefano Zampini     /* Klawonn and Widlund, Dual-primal FETI-DP methods for linear elasticity, (6.2.1) */
2722534831adSStefano Zampini     temp_constraints = 0;
272393dc3b60SStefano Zampini     if (pcbddc->n_vertices < local_primal_size) {
2724534831adSStefano Zampini       temp_start_ptr = temp_indices_to_constraint_B[temp_indices[pcbddc->n_vertices]];
272593dc3b60SStefano Zampini     }
2726534831adSStefano Zampini     for (i=pcbddc->n_vertices;i<local_primal_size;i++) {
2727534831adSStefano Zampini       if (change_basis[i]) {
2728534831adSStefano Zampini         compute_submatrix = PETSC_FALSE;
2729534831adSStefano Zampini         useksp = PETSC_FALSE;
2730534831adSStefano Zampini         if (temp_start_ptr == temp_indices_to_constraint_B[temp_indices[i]]) {
2731534831adSStefano Zampini           temp_constraints++;
273204eaf177SStefano Zampini           if (i == local_primal_size -1 ||  temp_start_ptr != temp_indices_to_constraint_B[temp_indices[i+1]]) {
2733534831adSStefano Zampini             compute_submatrix = PETSC_TRUE;
2734534831adSStefano Zampini           }
2735534831adSStefano Zampini         }
2736534831adSStefano Zampini         if (compute_submatrix) {
2737534831adSStefano Zampini           if (temp_constraints > 1 || pcbddc->use_nnsp_true) {
2738534831adSStefano Zampini             useksp = PETSC_TRUE;
2739534831adSStefano Zampini           }
2740534831adSStefano Zampini           size_of_constraint = temp_indices[i+1]-temp_indices[i];
2741534831adSStefano Zampini           if (useksp) { /* experimental */
2742534831adSStefano Zampini             ierr = MatCreate(PETSC_COMM_SELF,&temp_mat);CHKERRQ(ierr);
2743534831adSStefano Zampini             ierr = MatSetType(temp_mat,impMatType);CHKERRQ(ierr);
2744534831adSStefano Zampini             ierr = MatSetSizes(temp_mat,size_of_constraint,size_of_constraint,size_of_constraint,size_of_constraint);CHKERRQ(ierr);
2745534831adSStefano Zampini             ierr = MatSeqAIJSetPreallocation(temp_mat,size_of_constraint,PETSC_NULL);CHKERRQ(ierr);
2746534831adSStefano Zampini           }
2747534831adSStefano Zampini           /* First _size_of_constraint-temp_constraints_ columns */
2748534831adSStefano Zampini           dual_dofs = size_of_constraint-temp_constraints;
2749534831adSStefano Zampini           start_constraint = i+1-temp_constraints;
2750534831adSStefano Zampini           for (s=0;s<dual_dofs;s++) {
2751534831adSStefano Zampini             is_indices[0] = s;
2752534831adSStefano Zampini             for (j=0;j<temp_constraints;j++) {
2753534831adSStefano Zampini               for (k=0;k<temp_constraints;k++) {
2754534831adSStefano Zampini                 temp_basis[j*temp_constraints+k]=temp_quadrature_constraint[temp_indices[start_constraint+k]+s+j+1];
2755534831adSStefano Zampini               }
2756534831adSStefano Zampini               work[j]=-temp_quadrature_constraint[temp_indices[start_constraint+j]+s];
2757534831adSStefano Zampini               is_indices[j+1]=s+j+1;
2758534831adSStefano Zampini             }
2759534831adSStefano Zampini             Bt = temp_constraints;
2760534831adSStefano Zampini             ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
2761534831adSStefano Zampini             LAPACKgesv_(&Bt,&Bone,temp_basis,&Bt,ipiv,work,&Bt,&lierr);
2762534831adSStefano Zampini             if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GESV Lapack routine %d",(int)lierr);
2763534831adSStefano Zampini             ierr = PetscFPTrapPop();CHKERRQ(ierr);
2764534831adSStefano Zampini             j = temp_indices_to_constraint_B[temp_indices[start_constraint]+s];
2765534831adSStefano Zampini             ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,temp_constraints,&temp_indices_to_constraint_B[temp_indices[start_constraint]+s+1],1,&j,work,INSERT_VALUES);CHKERRQ(ierr);
2766534831adSStefano Zampini             if (useksp) {
2767534831adSStefano Zampini               /* temp mat with transposed rows and columns */
2768534831adSStefano Zampini               ierr = MatSetValues(temp_mat,1,&s,temp_constraints,&is_indices[1],work,INSERT_VALUES);CHKERRQ(ierr);
2769534831adSStefano Zampini               ierr = MatSetValue(temp_mat,is_indices[0],is_indices[0],1.0,INSERT_VALUES);CHKERRQ(ierr);
2770534831adSStefano Zampini             }
2771534831adSStefano Zampini           }
2772534831adSStefano Zampini           if (useksp) {
2773534831adSStefano Zampini             /* last rows of temp_mat */
2774534831adSStefano Zampini             for (j=0;j<size_of_constraint;j++) {
2775534831adSStefano Zampini               is_indices[j] = j;
2776534831adSStefano Zampini             }
2777534831adSStefano Zampini             for (s=0;s<temp_constraints;s++) {
2778534831adSStefano Zampini               k = s + dual_dofs;
2779534831adSStefano Zampini               ierr = MatSetValues(temp_mat,1,&k,size_of_constraint,is_indices,&temp_quadrature_constraint[temp_indices[start_constraint+s]],INSERT_VALUES);CHKERRQ(ierr);
2780534831adSStefano Zampini             }
2781534831adSStefano Zampini             ierr = MatAssemblyBegin(temp_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2782534831adSStefano Zampini             ierr = MatAssemblyEnd(temp_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2783534831adSStefano Zampini             ierr = MatGetVecs(temp_mat,&temp_vec,PETSC_NULL);CHKERRQ(ierr);
2784534831adSStefano Zampini             ierr = KSPCreate(PETSC_COMM_SELF,&temp_ksp);CHKERRQ(ierr);
2785534831adSStefano Zampini             ierr = KSPSetOperators(temp_ksp,temp_mat,temp_mat,SAME_PRECONDITIONER);CHKERRQ(ierr);
2786534831adSStefano Zampini             ierr = KSPSetType(temp_ksp,KSPPREONLY);CHKERRQ(ierr);
2787ffe5efe1SStefano Zampini             ierr = KSPGetPC(temp_ksp,&temp_pc);CHKERRQ(ierr);
2788ffe5efe1SStefano Zampini             ierr = PCSetType(temp_pc,PCLU);CHKERRQ(ierr);
2789534831adSStefano Zampini             ierr = KSPSetUp(temp_ksp);CHKERRQ(ierr);
2790534831adSStefano Zampini             for (s=0;s<temp_constraints;s++) {
2791534831adSStefano Zampini               ierr = VecSet(temp_vec,0.0);CHKERRQ(ierr);
2792534831adSStefano Zampini               ierr = VecSetValue(temp_vec,s+dual_dofs,1.0,INSERT_VALUES);CHKERRQ(ierr);
2793534831adSStefano Zampini               ierr = VecAssemblyBegin(temp_vec);CHKERRQ(ierr);
2794534831adSStefano Zampini               ierr = VecAssemblyEnd(temp_vec);CHKERRQ(ierr);
2795534831adSStefano Zampini               ierr = KSPSolve(temp_ksp,temp_vec,temp_vec);CHKERRQ(ierr);
2796534831adSStefano Zampini               ierr = VecGetArray(temp_vec,&array_vector);CHKERRQ(ierr);
2797534831adSStefano Zampini               j = temp_indices_to_constraint_B[temp_indices[start_constraint+s]+size_of_constraint-s-1];
2798534831adSStefano Zampini               /* last columns of change of basis matrix associated to new primal dofs */
2799534831adSStefano Zampini               ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,size_of_constraint,&temp_indices_to_constraint_B[temp_indices[start_constraint+s]],1,&j,array_vector,INSERT_VALUES);CHKERRQ(ierr);
2800534831adSStefano Zampini               ierr = VecRestoreArray(temp_vec,&array_vector);CHKERRQ(ierr);
2801534831adSStefano Zampini             }
2802534831adSStefano Zampini             ierr = MatDestroy(&temp_mat);CHKERRQ(ierr);
2803534831adSStefano Zampini             ierr = KSPDestroy(&temp_ksp);CHKERRQ(ierr);
2804534831adSStefano Zampini             ierr = VecDestroy(&temp_vec);CHKERRQ(ierr);
2805534831adSStefano Zampini           } else {
2806534831adSStefano Zampini             /* last columns of change of basis matrix associated to new primal dofs */
2807534831adSStefano Zampini             for (s=0;s<temp_constraints;s++) {
2808534831adSStefano Zampini               j = temp_indices_to_constraint_B[temp_indices[start_constraint+s]+size_of_constraint-s-1];
2809534831adSStefano Zampini               ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,size_of_constraint,&temp_indices_to_constraint_B[temp_indices[start_constraint+s]],1,&j,&temp_quadrature_constraint[temp_indices[start_constraint+s]],INSERT_VALUES);CHKERRQ(ierr);
2810534831adSStefano Zampini             }
2811534831adSStefano Zampini           }
2812534831adSStefano Zampini           /* prepare for the next cycle */
2813534831adSStefano Zampini           temp_constraints = 0;
281404eaf177SStefano Zampini           if (i != local_primal_size -1 ) {
2815534831adSStefano Zampini             temp_start_ptr = temp_indices_to_constraint_B[temp_indices[i+1]];
2816534831adSStefano Zampini           }
2817534831adSStefano Zampini         }
2818534831adSStefano Zampini       }
281904eaf177SStefano Zampini     }
2820534831adSStefano Zampini     /* assembling */
2821534831adSStefano Zampini     ierr = MatAssemblyBegin(pcbddc->ChangeOfBasisMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2822534831adSStefano Zampini     ierr = MatAssemblyEnd(pcbddc->ChangeOfBasisMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2823534831adSStefano Zampini     ierr = PetscFree(ipiv);CHKERRQ(ierr);
2824534831adSStefano Zampini     ierr = PetscFree(is_indices);CHKERRQ(ierr);
2825534831adSStefano Zampini   }
28263b03a366Sstefano_zampini   /* free workspace no longer needed */
28273b03a366Sstefano_zampini   ierr = PetscFree(rwork);CHKERRQ(ierr);
28283b03a366Sstefano_zampini   ierr = PetscFree(work);CHKERRQ(ierr);
28293b03a366Sstefano_zampini   ierr = PetscFree(temp_basis);CHKERRQ(ierr);
28303b03a366Sstefano_zampini   ierr = PetscFree(singular_vals);CHKERRQ(ierr);
28313b03a366Sstefano_zampini   ierr = PetscFree(correlation_mat);CHKERRQ(ierr);
28323b03a366Sstefano_zampini   ierr = PetscFree(temp_indices);CHKERRQ(ierr);
2833534831adSStefano Zampini   ierr = PetscFree(change_basis);CHKERRQ(ierr);
28343b03a366Sstefano_zampini   ierr = PetscFree(temp_indices_to_constraint);CHKERRQ(ierr);
2835534831adSStefano Zampini   ierr = PetscFree(temp_indices_to_constraint_B);CHKERRQ(ierr);
2836534831adSStefano Zampini   ierr = PetscFree(local_to_B);CHKERRQ(ierr);
28373b03a366Sstefano_zampini   ierr = PetscFree(temp_quadrature_constraint);CHKERRQ(ierr);
28383425bc38SStefano Zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
28393425bc38SStefano Zampini   ierr = PetscFree(iwork);CHKERRQ(ierr);
28403425bc38SStefano Zampini   ierr = PetscFree(ifail);CHKERRQ(ierr);
28413425bc38SStefano Zampini   ierr = PetscFree(singular_vectors);CHKERRQ(ierr);
28423425bc38SStefano Zampini #endif
2843da1bb401SStefano Zampini   for (k=0;k<nnsp_size;k++) {
2844da1bb401SStefano Zampini     ierr = VecDestroy(&localnearnullsp[k]);CHKERRQ(ierr);
2845da1bb401SStefano Zampini   }
28463b03a366Sstefano_zampini   ierr = PetscFree(localnearnullsp);CHKERRQ(ierr);
28473b03a366Sstefano_zampini   PetscFunctionReturn(0);
28483b03a366Sstefano_zampini }
28493b03a366Sstefano_zampini /* -------------------------------------------------------------------------- */
28500c7d97c5SJed Brown #undef __FUNCT__
28510c7d97c5SJed Brown #define __FUNCT__ "PCBDDCCoarseSetUp"
285253cdbc3dSStefano Zampini static PetscErrorCode PCBDDCCoarseSetUp(PC pc)
28530c7d97c5SJed Brown {
28540c7d97c5SJed Brown   PetscErrorCode  ierr;
28550c7d97c5SJed Brown 
28560c7d97c5SJed Brown   PC_IS*            pcis = (PC_IS*)(pc->data);
28570c7d97c5SJed Brown   PC_BDDC*          pcbddc = (PC_BDDC*)pc->data;
28580c7d97c5SJed Brown   Mat_IS            *matis = (Mat_IS*)pc->pmat->data;
2859534831adSStefano Zampini   Mat               change_mat_all;
28600c7d97c5SJed Brown   IS                is_R_local;
28610c7d97c5SJed Brown   IS                is_V_local;
28620c7d97c5SJed Brown   IS                is_C_local;
28630c7d97c5SJed Brown   IS                is_aux1;
28640c7d97c5SJed Brown   IS                is_aux2;
286519fd82e9SBarry Smith   VecType           impVecType;
286619fd82e9SBarry Smith   MatType           impMatType;
28670c7d97c5SJed Brown   PetscInt          n_R=0;
28680c7d97c5SJed Brown   PetscInt          n_D=0;
28690c7d97c5SJed Brown   PetscInt          n_B=0;
28700c7d97c5SJed Brown   PetscScalar       zero=0.0;
28710c7d97c5SJed Brown   PetscScalar       one=1.0;
28720c7d97c5SJed Brown   PetscScalar       m_one=-1.0;
28730c7d97c5SJed Brown   PetscScalar*      array;
28740c7d97c5SJed Brown   PetscScalar       *coarse_submat_vals;
28750c7d97c5SJed Brown   PetscInt          *idx_R_local;
28760c7d97c5SJed Brown   PetscInt          *idx_V_B;
28770c7d97c5SJed Brown   PetscScalar       *coarsefunctions_errors;
28780c7d97c5SJed Brown   PetscScalar       *constraints_errors;
28790c7d97c5SJed Brown   /* auxiliary indices */
2880534831adSStefano Zampini   PetscInt          i,j,k;
2881e269702eSStefano Zampini   /* for verbose output of bddc */
2882e269702eSStefano Zampini   PetscViewer       viewer=pcbddc->dbg_viewer;
2883e269702eSStefano Zampini   PetscBool         dbg_flag=pcbddc->dbg_flag;
2884a0ba757dSStefano Zampini   /* for counting coarse dofs */
2885534831adSStefano Zampini   PetscInt          n_vertices,n_constraints;
28863b03a366Sstefano_zampini   PetscInt          size_of_constraint;
28873b03a366Sstefano_zampini   PetscInt          *row_cmat_indices;
28883b03a366Sstefano_zampini   PetscScalar       *row_cmat_values;
2889534831adSStefano Zampini   PetscInt          *vertices,*nnz,*is_indices,*temp_indices;
28900c7d97c5SJed Brown 
28910c7d97c5SJed Brown   PetscFunctionBegin;
28920c7d97c5SJed Brown   /* Set Non-overlapping dimensions */
28930c7d97c5SJed Brown   n_B = pcis->n_B; n_D = pcis->n - n_B;
2894534831adSStefano Zampini   /* Set types for local objects needed by BDDC preconditioner */
2895534831adSStefano Zampini   impMatType = MATSEQDENSE;
2896534831adSStefano Zampini   impVecType = VECSEQ;
2897da1bb401SStefano Zampini   /* get vertex indices from constraint matrix */
2898534831adSStefano Zampini   ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscInt),&vertices);CHKERRQ(ierr);
2899534831adSStefano Zampini   n_vertices=0;
2900da1bb401SStefano Zampini   for (i=0;i<pcbddc->local_primal_size;i++) {
2901da1bb401SStefano Zampini     ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
2902da1bb401SStefano Zampini     if (size_of_constraint == 1) {
2903534831adSStefano Zampini       vertices[n_vertices]=row_cmat_indices[0];
2904534831adSStefano Zampini       n_vertices++;
2905a0ba757dSStefano Zampini     }
2906da1bb401SStefano Zampini     ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
2907a0ba757dSStefano Zampini   }
2908534831adSStefano Zampini   /* Set number of constraints */
2909534831adSStefano Zampini   n_constraints = pcbddc->local_primal_size-n_vertices;
2910534831adSStefano Zampini 
2911534831adSStefano Zampini   /* vertices in boundary numbering */
2912534831adSStefano Zampini   if (n_vertices) {
2913534831adSStefano Zampini     ierr = VecSet(pcis->vec1_N,m_one);CHKERRQ(ierr);
2914534831adSStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2915534831adSStefano Zampini     for (i=0; i<n_vertices; i++) { array[ vertices[i] ] = i; }
2916534831adSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2917534831adSStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
2918534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
2919534831adSStefano Zampini     ierr = PetscMalloc(n_vertices*sizeof(PetscInt),&idx_V_B);CHKERRQ(ierr);
2920534831adSStefano Zampini     ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
2921534831adSStefano Zampini     for (i=0; i<n_vertices; i++) {
2922534831adSStefano Zampini       j=0;
2923534831adSStefano Zampini       while (array[j] != i ) {j++;}
2924534831adSStefano Zampini       idx_V_B[i]=j;
2925534831adSStefano Zampini     }
2926534831adSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
2927534831adSStefano Zampini   }
2928534831adSStefano Zampini 
2929534831adSStefano Zampini   /* transform local matrices if needed */
2930534831adSStefano Zampini   if (pcbddc->usechangeofbasis) {
2931534831adSStefano Zampini     ierr = PetscMalloc(pcis->n*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
2932534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2933534831adSStefano Zampini     for (i=0;i<n_D;i++) {
2934534831adSStefano Zampini       nnz[is_indices[i]]=1;
2935534831adSStefano Zampini     }
2936534831adSStefano Zampini     ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2937534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2938534831adSStefano Zampini     k=1;
2939534831adSStefano Zampini     for (i=0;i<n_B;i++) {
2940534831adSStefano Zampini       ierr = MatGetRow(pcbddc->ChangeOfBasisMatrix,i,&j,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr);
2941534831adSStefano Zampini       nnz[is_indices[i]]=j;
2942534831adSStefano Zampini       if ( k < j) {
2943534831adSStefano Zampini         k = j;
2944534831adSStefano Zampini       }
2945534831adSStefano Zampini       ierr = MatRestoreRow(pcbddc->ChangeOfBasisMatrix,i,&j,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr);
2946534831adSStefano Zampini     }
2947534831adSStefano Zampini     ierr = ISRestoreIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2948534831adSStefano Zampini     /* assemble change of basis matrix on the whole set of local dofs */
2949534831adSStefano Zampini     ierr = PetscMalloc(k*sizeof(PetscInt),&temp_indices);CHKERRQ(ierr);
2950534831adSStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&change_mat_all);CHKERRQ(ierr);
2951534831adSStefano Zampini     ierr = MatSetSizes(change_mat_all,pcis->n,pcis->n,pcis->n,pcis->n);CHKERRQ(ierr);
2952534831adSStefano Zampini     ierr = MatSetType(change_mat_all,MATSEQAIJ);CHKERRQ(ierr);
2953534831adSStefano Zampini     ierr = MatSeqAIJSetPreallocation(change_mat_all,0,nnz);CHKERRQ(ierr);
2954534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2955534831adSStefano Zampini     for (i=0;i<n_D;i++) {
2956534831adSStefano Zampini       ierr = MatSetValue(change_mat_all,is_indices[i],is_indices[i],1.0,INSERT_VALUES);CHKERRQ(ierr);
2957534831adSStefano Zampini     }
2958534831adSStefano Zampini     ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2959534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2960534831adSStefano Zampini     for (i=0;i<n_B;i++) {
2961534831adSStefano Zampini       ierr = MatGetRow(pcbddc->ChangeOfBasisMatrix,i,&j,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
2962534831adSStefano Zampini       for (k=0;k<j;k++) {
2963534831adSStefano Zampini         temp_indices[k]=is_indices[row_cmat_indices[k]];
2964534831adSStefano Zampini       }
2965534831adSStefano Zampini       ierr = MatSetValues(change_mat_all,1,&is_indices[i],j,temp_indices,row_cmat_values,INSERT_VALUES);CHKERRQ(ierr);
2966534831adSStefano Zampini       ierr = MatRestoreRow(pcbddc->ChangeOfBasisMatrix,i,&j,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
2967534831adSStefano Zampini     }
2968534831adSStefano Zampini     ierr = MatAssemblyBegin(change_mat_all,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2969534831adSStefano Zampini     ierr = MatAssemblyEnd(change_mat_all,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2970534831adSStefano Zampini     ierr = MatPtAP(matis->A,change_mat_all,MAT_INITIAL_MATRIX,1.0,&pcbddc->local_mat);CHKERRQ(ierr);
2971534831adSStefano Zampini     ierr = MatDestroy(&pcis->A_IB);CHKERRQ(ierr);
2972534831adSStefano Zampini     ierr = MatDestroy(&pcis->A_BI);CHKERRQ(ierr);
2973534831adSStefano Zampini     ierr = MatDestroy(&pcis->A_BB);CHKERRQ(ierr);
2974534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_I_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&pcis->A_IB);CHKERRQ(ierr);
2975534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_B_local,pcis->is_I_local,MAT_INITIAL_MATRIX,&pcis->A_BI);CHKERRQ(ierr);
2976534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_B_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&pcis->A_BB);CHKERRQ(ierr);
2977534831adSStefano Zampini     ierr = MatDestroy(&change_mat_all);CHKERRQ(ierr);
2978534831adSStefano Zampini     ierr = PetscFree(nnz);CHKERRQ(ierr);
2979534831adSStefano Zampini     ierr = PetscFree(temp_indices);CHKERRQ(ierr);
2980534831adSStefano Zampini   } else {
2981534831adSStefano Zampini     /* without change of basis, the local matrix is unchanged */
2982534831adSStefano Zampini     ierr = PetscObjectReference((PetscObject)matis->A);CHKERRQ(ierr);
2983534831adSStefano Zampini     pcbddc->local_mat = matis->A;
2984534831adSStefano Zampini   }
29850bdf917eSStefano Zampini   /* Change global null space passed in by the user if change of basis has been performed */
29860bdf917eSStefano Zampini   if (pcbddc->NullSpace && pcbddc->usechangeofbasis) {
29870bdf917eSStefano Zampini     ierr = PCBDDCAdaptNullSpace(pc);CHKERRQ(ierr);
29880bdf917eSStefano Zampini   }
2989a0ba757dSStefano Zampini 
29900c7d97c5SJed Brown   /* Dohrmann's notation: dofs split into R (Remaining: all dofs but the vertices) and V (Vertices) */
29910c7d97c5SJed Brown   ierr = VecSet(pcis->vec1_N,one);CHKERRQ(ierr);
29920c7d97c5SJed Brown   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
29933b03a366Sstefano_zampini   for (i=0;i<n_vertices;i++) { array[ vertices[i] ] = zero; }
29943b03a366Sstefano_zampini   ierr = PetscMalloc(( pcis->n - n_vertices )*sizeof(PetscInt),&idx_R_local);CHKERRQ(ierr);
29950c7d97c5SJed Brown   for (i=0, n_R=0; i<pcis->n; i++) { if (array[i] == one) { idx_R_local[n_R] = i; n_R++; } }
29960c7d97c5SJed Brown   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2997e269702eSStefano Zampini   if (dbg_flag) {
29980c7d97c5SJed Brown     ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
29990c7d97c5SJed Brown     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
30000c7d97c5SJed Brown     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d local dimensions\n",PetscGlobalRank);CHKERRQ(ierr);
30010c7d97c5SJed Brown     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local_size = %d, dirichlet_size = %d, boundary_size = %d\n",pcis->n,n_D,n_B);CHKERRQ(ierr);
30023b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"r_size = %d, v_size = %d, constraints = %d, local_primal_size = %d\n",n_R,n_vertices,n_constraints,pcbddc->local_primal_size);CHKERRQ(ierr);
3003534831adSStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"pcbddc->n_vertices = %d, pcbddc->n_constraints = %d\n",pcbddc->n_vertices,pcbddc->n_constraints);CHKERRQ(ierr);
30040c7d97c5SJed Brown     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
30050c7d97c5SJed Brown   }
3006534831adSStefano Zampini 
30070c7d97c5SJed Brown   /* Allocate needed vectors */
3008534831adSStefano Zampini   ierr = VecDuplicate(pcis->vec1_global,&pcbddc->original_rhs);CHKERRQ(ierr);
30093972b0daSStefano Zampini   ierr = VecDuplicate(pcis->vec1_global,&pcbddc->temp_solution);CHKERRQ(ierr);
30100c7d97c5SJed Brown   ierr = VecDuplicate(pcis->vec1_D,&pcbddc->vec4_D);CHKERRQ(ierr);
30110c7d97c5SJed Brown   ierr = VecCreate(PETSC_COMM_SELF,&pcbddc->vec1_R);CHKERRQ(ierr);
30120c7d97c5SJed Brown   ierr = VecSetSizes(pcbddc->vec1_R,n_R,n_R);CHKERRQ(ierr);
30130c7d97c5SJed Brown   ierr = VecSetType(pcbddc->vec1_R,impVecType);CHKERRQ(ierr);
3014d49ef151SStefano Zampini   ierr = VecDuplicate(pcbddc->vec1_R,&pcbddc->vec2_R);CHKERRQ(ierr);
30150c7d97c5SJed Brown   ierr = VecCreate(PETSC_COMM_SELF,&pcbddc->vec1_P);CHKERRQ(ierr);
30160c7d97c5SJed Brown   ierr = VecSetSizes(pcbddc->vec1_P,pcbddc->local_primal_size,pcbddc->local_primal_size);CHKERRQ(ierr);
30170c7d97c5SJed Brown   ierr = VecSetType(pcbddc->vec1_P,impVecType);CHKERRQ(ierr);
30180c7d97c5SJed Brown 
30190c7d97c5SJed Brown   /* Creating some index sets needed  */
30200c7d97c5SJed Brown   /* For submatrices */
3021da1bb401SStefano Zampini   ierr = ISCreateGeneral(PETSC_COMM_SELF,n_R,idx_R_local,PETSC_OWN_POINTER,&is_R_local);CHKERRQ(ierr);
30223b03a366Sstefano_zampini   if (n_vertices)    {
3023da1bb401SStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,n_vertices,vertices,PETSC_OWN_POINTER,&is_V_local);CHKERRQ(ierr);
30243b03a366Sstefano_zampini   }
3025da1bb401SStefano Zampini   if (n_constraints) {
3026da1bb401SStefano Zampini     ierr = ISCreateStride(PETSC_COMM_SELF,n_constraints,n_vertices,1,&is_C_local);CHKERRQ(ierr);
3027da1bb401SStefano Zampini   }
3028da1bb401SStefano Zampini 
30290c7d97c5SJed Brown   /* For VecScatters pcbddc->R_to_B and (optionally) pcbddc->R_to_D */
30300c7d97c5SJed Brown   {
30310c7d97c5SJed Brown     PetscInt   *aux_array1;
30320c7d97c5SJed Brown     PetscInt   *aux_array2;
30332e8d2280SStefano Zampini     PetscInt   *idx_I_local;
30340c7d97c5SJed Brown 
30353b03a366Sstefano_zampini     ierr = PetscMalloc( (pcis->n_B-n_vertices)*sizeof(PetscInt),&aux_array1);CHKERRQ(ierr);
30363b03a366Sstefano_zampini     ierr = PetscMalloc( (pcis->n_B-n_vertices)*sizeof(PetscInt),&aux_array2);CHKERRQ(ierr);
30370c7d97c5SJed Brown 
30382e8d2280SStefano Zampini     ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&idx_I_local);CHKERRQ(ierr);
30390c7d97c5SJed Brown     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
30402e8d2280SStefano Zampini     for (i=0; i<n_D; i++) { array[idx_I_local[i]] = 0; }
30412e8d2280SStefano Zampini     ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&idx_I_local);CHKERRQ(ierr);
30422e8d2280SStefano Zampini     for (i=0, j=0; i<n_R; i++) { if ( array[idx_R_local[i]] == one ) { aux_array1[j] = i; j++; } }
30430c7d97c5SJed Brown     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3044da1bb401SStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_COPY_VALUES,&is_aux1);CHKERRQ(ierr);
30452e8d2280SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
30462e8d2280SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
30470c7d97c5SJed Brown     ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
30482e8d2280SStefano Zampini     for (i=0, j=0; i<n_B; i++) { if ( array[i] == one ) { aux_array2[j] = i; j++; } }
30493828260eSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
3050da1bb401SStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array2,PETSC_COPY_VALUES,&is_aux2);CHKERRQ(ierr);
30510c7d97c5SJed Brown     ierr = VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_B,is_aux2,&pcbddc->R_to_B);CHKERRQ(ierr);
30520c7d97c5SJed Brown     ierr = PetscFree(aux_array1);CHKERRQ(ierr);
30530c7d97c5SJed Brown     ierr = PetscFree(aux_array2);CHKERRQ(ierr);
30540c7d97c5SJed Brown     ierr = ISDestroy(&is_aux1);CHKERRQ(ierr);
30550c7d97c5SJed Brown     ierr = ISDestroy(&is_aux2);CHKERRQ(ierr);
30560c7d97c5SJed Brown 
3057e269702eSStefano Zampini     if (pcbddc->prec_type || dbg_flag ) {
30580c7d97c5SJed Brown       ierr = PetscMalloc(n_D*sizeof(PetscInt),&aux_array1);CHKERRQ(ierr);
30590c7d97c5SJed Brown       ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
30602e8d2280SStefano Zampini       for (i=0, j=0; i<n_R; i++) { if (array[idx_R_local[i]] == zero) { aux_array1[j] = i; j++; } }
30610c7d97c5SJed Brown       ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3062da1bb401SStefano Zampini       ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_COPY_VALUES,&is_aux1);CHKERRQ(ierr);
30630c7d97c5SJed Brown       ierr = VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_D,(IS)0,&pcbddc->R_to_D);CHKERRQ(ierr);
30640c7d97c5SJed Brown       ierr = PetscFree(aux_array1);CHKERRQ(ierr);
30650c7d97c5SJed Brown       ierr = ISDestroy(&is_aux1);CHKERRQ(ierr);
30660c7d97c5SJed Brown     }
30670c7d97c5SJed Brown   }
30680c7d97c5SJed Brown 
30690c7d97c5SJed Brown   /* Creating PC contexts for local Dirichlet and Neumann problems */
30700c7d97c5SJed Brown   {
30710c7d97c5SJed Brown     Mat  A_RR;
307253cdbc3dSStefano Zampini     PC   pc_temp;
30730c7d97c5SJed Brown     /* Matrix for Dirichlet problem is A_II -> we already have it from pcis.c code */
307453cdbc3dSStefano Zampini     ierr = KSPCreate(PETSC_COMM_SELF,&pcbddc->ksp_D);CHKERRQ(ierr);
307553cdbc3dSStefano Zampini     ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->ksp_D,(PetscObject)pc,1);CHKERRQ(ierr);
307653cdbc3dSStefano Zampini     ierr = KSPSetOperators(pcbddc->ksp_D,pcis->A_II,pcis->A_II,SAME_PRECONDITIONER);CHKERRQ(ierr);
307753cdbc3dSStefano Zampini     ierr = KSPSetType(pcbddc->ksp_D,KSPPREONLY);CHKERRQ(ierr);
3078da1bb401SStefano Zampini     ierr = KSPSetOptionsPrefix(pcbddc->ksp_D,"dirichlet_");CHKERRQ(ierr);
30790c7d97c5SJed Brown     /* default */
308053cdbc3dSStefano Zampini     ierr = KSPGetPC(pcbddc->ksp_D,&pc_temp);CHKERRQ(ierr);
308153cdbc3dSStefano Zampini     ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr);
30820c7d97c5SJed Brown     /* Allow user's customization */
308353cdbc3dSStefano Zampini     ierr = KSPSetFromOptions(pcbddc->ksp_D);CHKERRQ(ierr);
3084950d796eSStefano Zampini     /* umfpack interface has a bug when matrix dimension is zero */
3085950d796eSStefano Zampini     if (!n_D) {
30862e8d2280SStefano Zampini       ierr = PCSetType(pc_temp,PCNONE);CHKERRQ(ierr);
3087950d796eSStefano Zampini     }
308853cdbc3dSStefano Zampini     /* Set Up KSP for Dirichlet problem of BDDC */
308953cdbc3dSStefano Zampini     ierr = KSPSetUp(pcbddc->ksp_D);CHKERRQ(ierr);
30903972b0daSStefano Zampini     /* set ksp_D into pcis data */
30913972b0daSStefano Zampini     ierr = KSPDestroy(&pcis->ksp_D);CHKERRQ(ierr);
30923972b0daSStefano Zampini     ierr = PetscObjectReference((PetscObject)pcbddc->ksp_D);CHKERRQ(ierr);
30933972b0daSStefano Zampini     pcis->ksp_D = pcbddc->ksp_D;
30940c7d97c5SJed Brown     /* Matrix for Neumann problem is A_RR -> we need to create it */
3095534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,is_R_local,is_R_local,MAT_INITIAL_MATRIX,&A_RR);CHKERRQ(ierr);
309653cdbc3dSStefano Zampini     ierr = KSPCreate(PETSC_COMM_SELF,&pcbddc->ksp_R);CHKERRQ(ierr);
309753cdbc3dSStefano Zampini     ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->ksp_R,(PetscObject)pc,1);CHKERRQ(ierr);
309853cdbc3dSStefano Zampini     ierr = KSPSetOperators(pcbddc->ksp_R,A_RR,A_RR,SAME_PRECONDITIONER);CHKERRQ(ierr);
309953cdbc3dSStefano Zampini     ierr = KSPSetType(pcbddc->ksp_R,KSPPREONLY);CHKERRQ(ierr);
3100da1bb401SStefano Zampini     ierr = KSPSetOptionsPrefix(pcbddc->ksp_R,"neumann_");CHKERRQ(ierr);
31010c7d97c5SJed Brown     /* default */
310253cdbc3dSStefano Zampini     ierr = KSPGetPC(pcbddc->ksp_R,&pc_temp);CHKERRQ(ierr);
310353cdbc3dSStefano Zampini     ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr);
31040c7d97c5SJed Brown     /* Allow user's customization */
310553cdbc3dSStefano Zampini     ierr = KSPSetFromOptions(pcbddc->ksp_R);CHKERRQ(ierr);
3106950d796eSStefano Zampini     /* umfpack interface has a bug when matrix dimension is zero */
3107950d796eSStefano Zampini     if (!pcis->n) {
31082e8d2280SStefano Zampini       ierr = PCSetType(pc_temp,PCNONE);CHKERRQ(ierr);
3109950d796eSStefano Zampini     }
311053cdbc3dSStefano Zampini     /* Set Up KSP for Neumann problem of BDDC */
311153cdbc3dSStefano Zampini     ierr = KSPSetUp(pcbddc->ksp_R);CHKERRQ(ierr);
3112a0ba757dSStefano Zampini     /* check Dirichlet and Neumann solvers */
3113b76ba322SStefano Zampini     {
31140c7d97c5SJed Brown       Vec         temp_vec;
3115b76ba322SStefano Zampini       PetscReal   value;
3116b76ba322SStefano Zampini       PetscMPIInt use_exact,use_exact_reduced;
31170c7d97c5SJed Brown 
3118a0ba757dSStefano Zampini       ierr = VecDuplicate(pcis->vec1_D,&temp_vec);CHKERRQ(ierr);
3119a0ba757dSStefano Zampini       ierr = VecSetRandom(pcis->vec1_D,PETSC_NULL);CHKERRQ(ierr);
3120a0ba757dSStefano Zampini       ierr = MatMult(pcis->A_II,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
3121a0ba757dSStefano Zampini       ierr = KSPSolve(pcbddc->ksp_D,pcis->vec2_D,temp_vec);CHKERRQ(ierr);
3122a0ba757dSStefano Zampini       ierr = VecAXPY(temp_vec,m_one,pcis->vec1_D);CHKERRQ(ierr);
3123a0ba757dSStefano Zampini       ierr = VecNorm(temp_vec,NORM_INFINITY,&value);CHKERRQ(ierr);
3124b76ba322SStefano Zampini       use_exact = 1;
3125b76ba322SStefano Zampini       if (PetscAbsReal(value) > 1.e-4) {
3126b76ba322SStefano Zampini         use_exact = 0;
3127b76ba322SStefano Zampini       }
3128b76ba322SStefano Zampini       ierr = MPI_Allreduce(&use_exact,&use_exact_reduced,1,MPIU_INT,MPI_LAND,((PetscObject)pc)->comm);CHKERRQ(ierr);
3129b76ba322SStefano Zampini       pcbddc->use_exact_dirichlet = (PetscBool) use_exact_reduced;
3130a0ba757dSStefano Zampini       ierr = VecDestroy(&temp_vec);CHKERRQ(ierr);
3131b76ba322SStefano Zampini       if (dbg_flag) {
3132a0ba757dSStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
3133a0ba757dSStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
3134a0ba757dSStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"Checking solution of Dirichlet and Neumann problems\n");CHKERRQ(ierr);
3135a0ba757dSStefano Zampini         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d infinity error for Dirichlet solve = % 1.14e \n",PetscGlobalRank,value);CHKERRQ(ierr);
3136d49ef151SStefano Zampini         ierr = VecDuplicate(pcbddc->vec1_R,&temp_vec);CHKERRQ(ierr);
3137d49ef151SStefano Zampini         ierr = VecSetRandom(pcbddc->vec1_R,PETSC_NULL);CHKERRQ(ierr);
3138d49ef151SStefano Zampini         ierr = MatMult(A_RR,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
3139d49ef151SStefano Zampini         ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec2_R,temp_vec);CHKERRQ(ierr);
3140d49ef151SStefano Zampini         ierr = VecAXPY(temp_vec,m_one,pcbddc->vec1_R);CHKERRQ(ierr);
3141d49ef151SStefano Zampini         ierr = VecNorm(temp_vec,NORM_INFINITY,&value);CHKERRQ(ierr);
3142e269702eSStefano Zampini         ierr = VecDestroy(&temp_vec);CHKERRQ(ierr);
31430c7d97c5SJed Brown         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d infinity error for  Neumann  solve = % 1.14e \n",PetscGlobalRank,value);CHKERRQ(ierr);
3144d49ef151SStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
31450c7d97c5SJed Brown       }
3146b76ba322SStefano Zampini     }
31470c7d97c5SJed Brown     /* free Neumann problem's matrix */
31480c7d97c5SJed Brown     ierr = MatDestroy(&A_RR);CHKERRQ(ierr);
31490c7d97c5SJed Brown   }
31500c7d97c5SJed Brown 
31510c7d97c5SJed Brown   /* Assemble all remaining stuff needed to apply BDDC  */
31520c7d97c5SJed Brown   {
31530c7d97c5SJed Brown     Mat          A_RV,A_VR,A_VV;
31540bdf917eSStefano Zampini     Mat          M1;
31550c7d97c5SJed Brown     Mat          C_CR;
31563b03a366Sstefano_zampini     Mat          AUXMAT;
31570c7d97c5SJed Brown     Vec          vec1_C;
31580c7d97c5SJed Brown     Vec          vec2_C;
31590c7d97c5SJed Brown     Vec          vec1_V;
31600c7d97c5SJed Brown     Vec          vec2_V;
31610c7d97c5SJed Brown     PetscInt     *nnz;
31620c7d97c5SJed Brown     PetscInt     *auxindices;
316353cdbc3dSStefano Zampini     PetscInt     index;
31640c7d97c5SJed Brown     PetscScalar* array2;
31650c7d97c5SJed Brown     MatFactorInfo matinfo;
31660c7d97c5SJed Brown 
31670c7d97c5SJed Brown     /* Allocating some extra storage just to be safe */
31680c7d97c5SJed Brown     ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
31690c7d97c5SJed Brown     ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&auxindices);CHKERRQ(ierr);
31700c7d97c5SJed Brown     for (i=0;i<pcis->n;i++) {auxindices[i]=i;}
31710c7d97c5SJed Brown 
31720c7d97c5SJed Brown     /* some work vectors on vertices and/or constraints */
31733b03a366Sstefano_zampini     if (n_vertices) {
31740c7d97c5SJed Brown       ierr = VecCreate(PETSC_COMM_SELF,&vec1_V);CHKERRQ(ierr);
31753b03a366Sstefano_zampini       ierr = VecSetSizes(vec1_V,n_vertices,n_vertices);CHKERRQ(ierr);
31760c7d97c5SJed Brown       ierr = VecSetType(vec1_V,impVecType);CHKERRQ(ierr);
31770c7d97c5SJed Brown       ierr = VecDuplicate(vec1_V,&vec2_V);CHKERRQ(ierr);
31780c7d97c5SJed Brown     }
3179534831adSStefano Zampini     if (n_constraints) {
31800c7d97c5SJed Brown       ierr = VecCreate(PETSC_COMM_SELF,&vec1_C);CHKERRQ(ierr);
3181534831adSStefano Zampini       ierr = VecSetSizes(vec1_C,n_constraints,n_constraints);CHKERRQ(ierr);
31820c7d97c5SJed Brown       ierr = VecSetType(vec1_C,impVecType);CHKERRQ(ierr);
31830c7d97c5SJed Brown       ierr = VecDuplicate(vec1_C,&vec2_C);CHKERRQ(ierr);
31840c7d97c5SJed Brown       ierr = VecDuplicate(vec1_C,&pcbddc->vec1_C);CHKERRQ(ierr);
31850c7d97c5SJed Brown     }
31860c7d97c5SJed Brown     /* Precompute quantities needed for preprocessing and application of BDDC */
31873b03a366Sstefano_zampini     if (n_constraints) {
31880c7d97c5SJed Brown       ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->local_auxmat2);CHKERRQ(ierr);
31893b03a366Sstefano_zampini       ierr = MatSetSizes(pcbddc->local_auxmat2,n_R,n_constraints,n_R,n_constraints);CHKERRQ(ierr);
31900c7d97c5SJed Brown       ierr = MatSetType(pcbddc->local_auxmat2,impMatType);CHKERRQ(ierr);
31913b03a366Sstefano_zampini       ierr = MatSeqDenseSetPreallocation(pcbddc->local_auxmat2,PETSC_NULL);CHKERRQ(ierr);
31920c7d97c5SJed Brown 
319357a90decSStefano Zampini       /* Create Constraint matrix on R nodes: C_{CR}  */
319457a90decSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->ConstraintMatrix,is_C_local,is_R_local,MAT_INITIAL_MATRIX,&C_CR);CHKERRQ(ierr);
319557a90decSStefano Zampini       ierr = ISDestroy(&is_C_local);CHKERRQ(ierr);
319657a90decSStefano Zampini 
31970c7d97c5SJed Brown       /* Assemble local_auxmat2 = - A_{RR}^{-1} C^T_{CR} needed by BDDC application */
31983b03a366Sstefano_zampini       for (i=0;i<n_constraints;i++) {
31993b03a366Sstefano_zampini         ierr = VecSet(pcbddc->vec1_R,zero);CHKERRQ(ierr);
32003b03a366Sstefano_zampini         /* Get row of constraint matrix in R numbering */
320157a90decSStefano Zampini         ierr = VecGetArray(pcbddc->vec1_R,&array);CHKERRQ(ierr);
320257a90decSStefano Zampini         ierr = MatGetRow(C_CR,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
32033b03a366Sstefano_zampini         for (j=0;j<size_of_constraint;j++) { array[ row_cmat_indices[j] ] = - row_cmat_values[j]; }
320457a90decSStefano Zampini         ierr = MatRestoreRow(C_CR,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
320557a90decSStefano Zampini         ierr = VecRestoreArray(pcbddc->vec1_R,&array);CHKERRQ(ierr);
32063b03a366Sstefano_zampini         /* Solve for row of constraint matrix in R numbering */
320753cdbc3dSStefano Zampini         ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
32083b03a366Sstefano_zampini         /* Set values */
32090c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec2_R,&array);CHKERRQ(ierr);
32103b03a366Sstefano_zampini         ierr = MatSetValues(pcbddc->local_auxmat2,n_R,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
32110c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec2_R,&array);CHKERRQ(ierr);
32120c7d97c5SJed Brown       }
32130c7d97c5SJed Brown       ierr = MatAssemblyBegin(pcbddc->local_auxmat2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
32140c7d97c5SJed Brown       ierr = MatAssemblyEnd(pcbddc->local_auxmat2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
32150c7d97c5SJed Brown 
32160c7d97c5SJed Brown       /* Assemble AUXMAT = ( LUFactor )( -C_{CR} A_{RR}^{-1} C^T_{CR} )^{-1} */
32170c7d97c5SJed Brown       ierr = MatMatMult(C_CR,pcbddc->local_auxmat2,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&AUXMAT);CHKERRQ(ierr);
3218d49ef151SStefano Zampini       ierr = MatFactorInfoInitialize(&matinfo);CHKERRQ(ierr);
32193b03a366Sstefano_zampini       ierr = ISCreateStride(PETSC_COMM_SELF,n_constraints,0,1,&is_aux1);CHKERRQ(ierr);
32200c7d97c5SJed Brown       ierr = MatLUFactor(AUXMAT,is_aux1,is_aux1,&matinfo);CHKERRQ(ierr);
32210c7d97c5SJed Brown       ierr = ISDestroy(&is_aux1);CHKERRQ(ierr);
32220c7d97c5SJed Brown 
32233b03a366Sstefano_zampini       /* Assemble explicitly M1 = ( C_{CR} A_{RR}^{-1} C^T_{CR} )^{-1} needed in preproc  */
3224d49ef151SStefano Zampini       ierr = MatCreate(PETSC_COMM_SELF,&M1);CHKERRQ(ierr);
32253b03a366Sstefano_zampini       ierr = MatSetSizes(M1,n_constraints,n_constraints,n_constraints,n_constraints);CHKERRQ(ierr);
32260c7d97c5SJed Brown       ierr = MatSetType(M1,impMatType);CHKERRQ(ierr);
32273b03a366Sstefano_zampini       ierr = MatSeqDenseSetPreallocation(M1,PETSC_NULL);CHKERRQ(ierr);
32283b03a366Sstefano_zampini       for (i=0;i<n_constraints;i++) {
32290c7d97c5SJed Brown         ierr = VecSet(vec1_C,zero);CHKERRQ(ierr);
32300c7d97c5SJed Brown         ierr = VecSetValue(vec1_C,i,one,INSERT_VALUES);CHKERRQ(ierr);
32310c7d97c5SJed Brown         ierr = VecAssemblyBegin(vec1_C);CHKERRQ(ierr);
32320c7d97c5SJed Brown         ierr = VecAssemblyEnd(vec1_C);CHKERRQ(ierr);
32330c7d97c5SJed Brown         ierr = MatSolve(AUXMAT,vec1_C,vec2_C);CHKERRQ(ierr);
32340c7d97c5SJed Brown         ierr = VecScale(vec2_C,m_one);CHKERRQ(ierr);
32350c7d97c5SJed Brown         ierr = VecGetArray(vec2_C,&array);CHKERRQ(ierr);
32363b03a366Sstefano_zampini         ierr = MatSetValues(M1,n_constraints,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
32370c7d97c5SJed Brown         ierr = VecRestoreArray(vec2_C,&array);CHKERRQ(ierr);
32380c7d97c5SJed Brown       }
32390c7d97c5SJed Brown       ierr = MatAssemblyBegin(M1,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
32400c7d97c5SJed Brown       ierr = MatAssemblyEnd(M1,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
32410c7d97c5SJed Brown       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
32420c7d97c5SJed Brown       /* Assemble local_auxmat1 = M1*C_{CR} needed by BDDC application in KSP and in preproc */
32430c7d97c5SJed Brown       ierr = MatMatMult(M1,C_CR,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&pcbddc->local_auxmat1);CHKERRQ(ierr);
32440c7d97c5SJed Brown 
32450c7d97c5SJed Brown     }
32460c7d97c5SJed Brown 
32470c7d97c5SJed Brown     /* Get submatrices from subdomain matrix */
32483b03a366Sstefano_zampini     if (n_vertices){
3249534831adSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->local_mat,is_R_local,is_V_local,MAT_INITIAL_MATRIX,&A_RV);CHKERRQ(ierr);
3250534831adSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->local_mat,is_V_local,is_R_local,MAT_INITIAL_MATRIX,&A_VR);CHKERRQ(ierr);
3251534831adSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->local_mat,is_V_local,is_V_local,MAT_INITIAL_MATRIX,&A_VV);CHKERRQ(ierr);
32520c7d97c5SJed Brown     }
32530c7d97c5SJed Brown 
32540c7d97c5SJed Brown     /* Matrix of coarse basis functions (local) */
3255d49ef151SStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->coarse_phi_B);CHKERRQ(ierr);
32560c7d97c5SJed Brown     ierr = MatSetSizes(pcbddc->coarse_phi_B,n_B,pcbddc->local_primal_size,n_B,pcbddc->local_primal_size);CHKERRQ(ierr);
32570c7d97c5SJed Brown     ierr = MatSetType(pcbddc->coarse_phi_B,impMatType);CHKERRQ(ierr);
32583b03a366Sstefano_zampini     ierr = MatSeqDenseSetPreallocation(pcbddc->coarse_phi_B,PETSC_NULL);CHKERRQ(ierr);
3259e269702eSStefano Zampini     if (pcbddc->prec_type || dbg_flag ) {
3260d49ef151SStefano Zampini       ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->coarse_phi_D);CHKERRQ(ierr);
32610c7d97c5SJed Brown       ierr = MatSetSizes(pcbddc->coarse_phi_D,n_D,pcbddc->local_primal_size,n_D,pcbddc->local_primal_size);CHKERRQ(ierr);
32620c7d97c5SJed Brown       ierr = MatSetType(pcbddc->coarse_phi_D,impMatType);CHKERRQ(ierr);
32633b03a366Sstefano_zampini       ierr = MatSeqDenseSetPreallocation(pcbddc->coarse_phi_D,PETSC_NULL);CHKERRQ(ierr);
32640c7d97c5SJed Brown     }
32650c7d97c5SJed Brown 
3266e269702eSStefano Zampini     if (dbg_flag) {
32670c7d97c5SJed Brown       ierr = PetscMalloc( pcbddc->local_primal_size*sizeof(PetscScalar),&coarsefunctions_errors);CHKERRQ(ierr);
32680c7d97c5SJed Brown       ierr = PetscMalloc( pcbddc->local_primal_size*sizeof(PetscScalar),&constraints_errors);CHKERRQ(ierr);
32690c7d97c5SJed Brown     }
32703b03a366Sstefano_zampini     /* Subdomain contribution (Non-overlapping) to coarse matrix  */
32710c7d97c5SJed Brown     ierr = PetscMalloc ((pcbddc->local_primal_size)*(pcbddc->local_primal_size)*sizeof(PetscScalar),&coarse_submat_vals);CHKERRQ(ierr);
32720c7d97c5SJed Brown 
32730c7d97c5SJed Brown     /* We are now ready to evaluate coarse basis functions and subdomain contribution to coarse problem */
32743b03a366Sstefano_zampini     for (i=0;i<n_vertices;i++){
32750c7d97c5SJed Brown       ierr = VecSet(vec1_V,zero);CHKERRQ(ierr);
32760c7d97c5SJed Brown       ierr = VecSetValue(vec1_V,i,one,INSERT_VALUES);CHKERRQ(ierr);
32770c7d97c5SJed Brown       ierr = VecAssemblyBegin(vec1_V);CHKERRQ(ierr);
32780c7d97c5SJed Brown       ierr = VecAssemblyEnd(vec1_V);CHKERRQ(ierr);
32790c7d97c5SJed Brown       /* solution of saddle point problem */
32800bdf917eSStefano Zampini       ierr = MatMult(A_RV,vec1_V,pcbddc->vec1_R);CHKERRQ(ierr);
32810bdf917eSStefano Zampini       ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec1_R);CHKERRQ(ierr);
32820c7d97c5SJed Brown       ierr = VecScale(pcbddc->vec1_R,m_one);CHKERRQ(ierr);
32833b03a366Sstefano_zampini       if (n_constraints) {
32840c7d97c5SJed Brown         ierr = MatMult(pcbddc->local_auxmat1,pcbddc->vec1_R,vec1_C);CHKERRQ(ierr);
32850c7d97c5SJed Brown         ierr = MatMultAdd(pcbddc->local_auxmat2,vec1_C,pcbddc->vec1_R,pcbddc->vec1_R);CHKERRQ(ierr);
32860c7d97c5SJed Brown         ierr = VecScale(vec1_C,m_one);CHKERRQ(ierr);
32870c7d97c5SJed Brown       }
32880c7d97c5SJed Brown       ierr = MatMult(A_VR,pcbddc->vec1_R,vec2_V);CHKERRQ(ierr);
32890c7d97c5SJed Brown       ierr = MatMultAdd(A_VV,vec1_V,vec2_V,vec2_V);CHKERRQ(ierr);
32900c7d97c5SJed Brown 
32910c7d97c5SJed Brown       /* Set values in coarse basis function and subdomain part of coarse_mat */
32920c7d97c5SJed Brown       /* coarse basis functions */
32930c7d97c5SJed Brown       ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr);
32940c7d97c5SJed Brown       ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
32950c7d97c5SJed Brown       ierr = VecScatterEnd  (pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
32960c7d97c5SJed Brown       ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
32973b03a366Sstefano_zampini       ierr = MatSetValues(pcbddc->coarse_phi_B,n_B,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
32980c7d97c5SJed Brown       ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
32990c7d97c5SJed Brown       ierr = MatSetValue(pcbddc->coarse_phi_B,idx_V_B[i],i,one,INSERT_VALUES);CHKERRQ(ierr);
3300e269702eSStefano Zampini       if ( pcbddc->prec_type || dbg_flag  ) {
33010c7d97c5SJed Brown         ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
33020c7d97c5SJed Brown         ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
33030c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_D,&array);CHKERRQ(ierr);
33043b03a366Sstefano_zampini         ierr = MatSetValues(pcbddc->coarse_phi_D,n_D,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
33050c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_D,&array);CHKERRQ(ierr);
33060c7d97c5SJed Brown       }
33070c7d97c5SJed Brown       /* subdomain contribution to coarse matrix */
33080c7d97c5SJed Brown       ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
3309da1bb401SStefano Zampini       for (j=0;j<n_vertices;j++) { coarse_submat_vals[i*pcbddc->local_primal_size+j] = array[j]; } /* WARNING -> column major ordering */
33100c7d97c5SJed Brown       ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
33113b03a366Sstefano_zampini       if (n_constraints) {
33120c7d97c5SJed Brown         ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
3313da1bb401SStefano Zampini         for (j=0;j<n_constraints;j++) { coarse_submat_vals[i*pcbddc->local_primal_size+j+n_vertices] = array[j]; } /* WARNING -> column major ordering */
33140c7d97c5SJed Brown         ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
33150c7d97c5SJed Brown       }
33160c7d97c5SJed Brown 
3317e269702eSStefano Zampini       if ( dbg_flag ) {
33180c7d97c5SJed Brown         /* assemble subdomain vector on nodes */
3319d49ef151SStefano Zampini         ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr);
33200c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
33210c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
33220c7d97c5SJed Brown         for (j=0;j<n_R;j++) { array[idx_R_local[j]] = array2[j]; }
33233b03a366Sstefano_zampini         array[ vertices[i] ] = one;
33240c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
33250c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
33260c7d97c5SJed Brown         /* assemble subdomain vector of lagrange multipliers (i.e. primal nodes) */
3327d49ef151SStefano Zampini         ierr = VecSet(pcbddc->vec1_P,zero);CHKERRQ(ierr);
33280c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
33290c7d97c5SJed Brown         ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
33303b03a366Sstefano_zampini         for (j=0;j<n_vertices;j++) { array2[j]=array[j]; }
33310c7d97c5SJed Brown         ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
33323b03a366Sstefano_zampini         if (n_constraints) {
33330c7d97c5SJed Brown           ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
33343b03a366Sstefano_zampini           for (j=0;j<n_constraints;j++) { array2[j+n_vertices]=array[j]; }
33350c7d97c5SJed Brown           ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
33360c7d97c5SJed Brown         }
33370c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
33380c7d97c5SJed Brown         ierr = VecScale(pcbddc->vec1_P,m_one);CHKERRQ(ierr);
33390c7d97c5SJed Brown         /* check saddle point solution */
3340534831adSStefano Zampini         ierr = MatMult(pcbddc->local_mat,pcis->vec1_N,pcis->vec2_N);CHKERRQ(ierr);
33413b03a366Sstefano_zampini         ierr = MatMultTransposeAdd(pcbddc->ConstraintMatrix,pcbddc->vec1_P,pcis->vec2_N,pcis->vec2_N);CHKERRQ(ierr);
33423b03a366Sstefano_zampini         ierr = VecNorm(pcis->vec2_N,NORM_INFINITY,&coarsefunctions_errors[i]);CHKERRQ(ierr);
33433b03a366Sstefano_zampini         ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr);
33440c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
33453b03a366Sstefano_zampini         array[i]=array[i]+m_one;  /* shift by the identity matrix */
33460c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
33473b03a366Sstefano_zampini         ierr = VecNorm(pcbddc->vec1_P,NORM_INFINITY,&constraints_errors[i]);CHKERRQ(ierr);
33480c7d97c5SJed Brown       }
33490c7d97c5SJed Brown     }
33500c7d97c5SJed Brown 
33513b03a366Sstefano_zampini     for (i=0;i<n_constraints;i++){
3352d49ef151SStefano Zampini       ierr = VecSet(vec2_C,zero);CHKERRQ(ierr);
33530c7d97c5SJed Brown       ierr = VecSetValue(vec2_C,i,m_one,INSERT_VALUES);CHKERRQ(ierr);
33540c7d97c5SJed Brown       ierr = VecAssemblyBegin(vec2_C);CHKERRQ(ierr);
33550c7d97c5SJed Brown       ierr = VecAssemblyEnd(vec2_C);CHKERRQ(ierr);
33560c7d97c5SJed Brown       /* solution of saddle point problem */
33570c7d97c5SJed Brown       ierr = MatMult(M1,vec2_C,vec1_C);CHKERRQ(ierr);
33580c7d97c5SJed Brown       ierr = MatMult(pcbddc->local_auxmat2,vec1_C,pcbddc->vec1_R);CHKERRQ(ierr);
33590c7d97c5SJed Brown       ierr = VecScale(vec1_C,m_one);CHKERRQ(ierr);
33603b03a366Sstefano_zampini       if (n_vertices) { ierr = MatMult(A_VR,pcbddc->vec1_R,vec2_V);CHKERRQ(ierr); }
33610c7d97c5SJed Brown       /* Set values in coarse basis function and subdomain part of coarse_mat */
33620c7d97c5SJed Brown       /* coarse basis functions */
33633b03a366Sstefano_zampini       index=i+n_vertices;
33640c7d97c5SJed Brown       ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr);
33650c7d97c5SJed Brown       ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
33660c7d97c5SJed Brown       ierr = VecScatterEnd  (pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
33670c7d97c5SJed Brown       ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
336853cdbc3dSStefano Zampini       ierr = MatSetValues(pcbddc->coarse_phi_B,n_B,auxindices,1,&index,array,INSERT_VALUES);CHKERRQ(ierr);
33690c7d97c5SJed Brown       ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
3370e269702eSStefano Zampini       if ( pcbddc->prec_type || dbg_flag ) {
33710c7d97c5SJed Brown         ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
33720c7d97c5SJed Brown         ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
33730c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_D,&array);CHKERRQ(ierr);
337453cdbc3dSStefano Zampini         ierr = MatSetValues(pcbddc->coarse_phi_D,n_D,auxindices,1,&index,array,INSERT_VALUES);CHKERRQ(ierr);
33750c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_D,&array);CHKERRQ(ierr);
33760c7d97c5SJed Brown       }
33770c7d97c5SJed Brown       /* subdomain contribution to coarse matrix */
33783b03a366Sstefano_zampini       if (n_vertices) {
33790c7d97c5SJed Brown         ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
3380da1bb401SStefano Zampini         for (j=0;j<n_vertices;j++) {coarse_submat_vals[index*pcbddc->local_primal_size+j]=array[j];} /* WARNING -> column major ordering */
33810c7d97c5SJed Brown         ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
33820c7d97c5SJed Brown       }
33830c7d97c5SJed Brown       ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
3384da1bb401SStefano Zampini       for (j=0;j<n_constraints;j++) {coarse_submat_vals[index*pcbddc->local_primal_size+j+n_vertices]=array[j];} /* WARNING -> column major ordering */
33850c7d97c5SJed Brown       ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
33860c7d97c5SJed Brown 
3387e269702eSStefano Zampini       if ( dbg_flag ) {
33880c7d97c5SJed Brown         /* assemble subdomain vector on nodes */
338953cdbc3dSStefano Zampini         ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr);
33900c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
33910c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
33920c7d97c5SJed Brown         for (j=0;j<n_R;j++){ array[ idx_R_local[j] ] = array2[j]; }
33930c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
33940c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
33950c7d97c5SJed Brown         /* assemble subdomain vector of lagrange multipliers */
339653cdbc3dSStefano Zampini         ierr = VecSet(pcbddc->vec1_P,zero);CHKERRQ(ierr);
33970c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
33983b03a366Sstefano_zampini         if ( n_vertices) {
33990c7d97c5SJed Brown           ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
34003b03a366Sstefano_zampini           for (j=0;j<n_vertices;j++) {array2[j]=-array[j];}
34010c7d97c5SJed Brown           ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
34020c7d97c5SJed Brown         }
34030c7d97c5SJed Brown         ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
34043b03a366Sstefano_zampini         for (j=0;j<n_constraints;j++) {array2[j+n_vertices]=-array[j];}
34050c7d97c5SJed Brown         ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
34060c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
34073972b0daSStefano Zampini         /* check saddle point solution */
3408534831adSStefano Zampini         ierr = MatMult(pcbddc->local_mat,pcis->vec1_N,pcis->vec2_N);CHKERRQ(ierr);
34093b03a366Sstefano_zampini         ierr = MatMultTransposeAdd(pcbddc->ConstraintMatrix,pcbddc->vec1_P,pcis->vec2_N,pcis->vec2_N);CHKERRQ(ierr);
341053cdbc3dSStefano Zampini         ierr = VecNorm(pcis->vec2_N,NORM_INFINITY,&coarsefunctions_errors[index]);CHKERRQ(ierr);
34113b03a366Sstefano_zampini         ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr);
34120c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
341353cdbc3dSStefano Zampini         array[index]=array[index]+m_one; /* shift by the identity matrix */
34140c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
341553cdbc3dSStefano Zampini         ierr = VecNorm(pcbddc->vec1_P,NORM_INFINITY,&constraints_errors[index]);CHKERRQ(ierr);
34160c7d97c5SJed Brown       }
34170c7d97c5SJed Brown     }
34180c7d97c5SJed Brown     ierr = MatAssemblyBegin(pcbddc->coarse_phi_B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
34190c7d97c5SJed Brown     ierr = MatAssemblyEnd  (pcbddc->coarse_phi_B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
3420e269702eSStefano Zampini     if ( pcbddc->prec_type || dbg_flag ) {
34210c7d97c5SJed Brown       ierr = MatAssemblyBegin(pcbddc->coarse_phi_D,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
34220c7d97c5SJed Brown       ierr = MatAssemblyEnd  (pcbddc->coarse_phi_D,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
34230c7d97c5SJed Brown     }
34240c7d97c5SJed Brown     /* Checking coarse_sub_mat and coarse basis functions */
34250c7d97c5SJed Brown     /* It should be \Phi^{(j)^T} A^{(j)} \Phi^{(j)}=coarse_sub_mat */
34269d2fce94SStefano Zampini     if (dbg_flag) {
34270c7d97c5SJed Brown       Mat         coarse_sub_mat;
34280c7d97c5SJed Brown       Mat         TM1,TM2,TM3,TM4;
34290c7d97c5SJed Brown       Mat         coarse_phi_D,coarse_phi_B,A_II,A_BB,A_IB,A_BI;
343019fd82e9SBarry Smith       MatType     checkmattype=MATSEQAIJ;
34310c7d97c5SJed Brown       PetscScalar value;
34320c7d97c5SJed Brown 
3433c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_II,checkmattype,MAT_INITIAL_MATRIX,&A_II);CHKERRQ(ierr);
3434c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_IB,checkmattype,MAT_INITIAL_MATRIX,&A_IB);CHKERRQ(ierr);
3435c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_BI,checkmattype,MAT_INITIAL_MATRIX,&A_BI);CHKERRQ(ierr);
3436c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_BB,checkmattype,MAT_INITIAL_MATRIX,&A_BB);CHKERRQ(ierr);
3437c042a7c3SStefano Zampini       ierr = MatConvert(pcbddc->coarse_phi_D,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_D);CHKERRQ(ierr);
3438c042a7c3SStefano Zampini       ierr = MatConvert(pcbddc->coarse_phi_B,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_B);CHKERRQ(ierr);
3439c042a7c3SStefano Zampini       ierr = MatCreateSeqDense(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_size,coarse_submat_vals,&coarse_sub_mat);CHKERRQ(ierr);
3440c042a7c3SStefano Zampini       ierr = MatConvert(coarse_sub_mat,checkmattype,MAT_REUSE_MATRIX,&coarse_sub_mat);CHKERRQ(ierr);
34410c7d97c5SJed Brown 
3442da1bb401SStefano Zampini       /*PetscViewer view_out;
3443da1bb401SStefano Zampini       PetscMPIInt myrank;
3444da1bb401SStefano Zampini       char filename[256];
3445da1bb401SStefano Zampini       MPI_Comm_rank(((PetscObject)pc)->comm,&myrank);
3446da1bb401SStefano Zampini       sprintf(filename,"coarsesubmat_%04d.m",myrank);
3447da1bb401SStefano Zampini       ierr = PetscViewerASCIIOpen(PETSC_COMM_SELF,filename,&view_out);CHKERRQ(ierr);
3448da1bb401SStefano Zampini       ierr = PetscViewerSetFormat(view_out,PETSC_VIEWER_ASCII_MATLAB);CHKERRQ(ierr);
3449da1bb401SStefano Zampini       ierr = MatView(coarse_sub_mat,view_out);CHKERRQ(ierr);
3450da1bb401SStefano Zampini       ierr = PetscViewerDestroy(&view_out);CHKERRQ(ierr);*/
3451da1bb401SStefano Zampini 
34520c7d97c5SJed Brown       ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
34530c7d97c5SJed Brown       ierr = PetscViewerASCIIPrintf(viewer,"Check coarse sub mat and local basis functions\n");CHKERRQ(ierr);
34540c7d97c5SJed Brown       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
345553cdbc3dSStefano Zampini       ierr = MatPtAP(A_II,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&TM1);CHKERRQ(ierr);
345653cdbc3dSStefano Zampini       ierr = MatPtAP(A_BB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&TM2);CHKERRQ(ierr);
345753cdbc3dSStefano Zampini       ierr = MatMatMult(A_IB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr);
3458c042a7c3SStefano Zampini       ierr = MatTransposeMatMult(coarse_phi_D,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM3);CHKERRQ(ierr);
345953cdbc3dSStefano Zampini       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
346053cdbc3dSStefano Zampini       ierr = MatMatMult(A_BI,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr);
3461c042a7c3SStefano Zampini       ierr = MatTransposeMatMult(coarse_phi_B,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM4);CHKERRQ(ierr);
346253cdbc3dSStefano Zampini       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
346353cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,one,TM2,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
346453cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,one,TM3,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
346553cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,one,TM4,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
346653cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,m_one,coarse_sub_mat,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
346753cdbc3dSStefano Zampini       ierr = MatNorm(TM1,NORM_INFINITY,&value);CHKERRQ(ierr);
34680c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"----------------------------------\n");CHKERRQ(ierr);
34690c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d \n",PetscGlobalRank);CHKERRQ(ierr);
34700c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"matrix error = % 1.14e\n",value);CHKERRQ(ierr);
34710c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"coarse functions errors\n");CHKERRQ(ierr);
347253cdbc3dSStefano Zampini       for (i=0;i<pcbddc->local_primal_size;i++) { ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local %02d-th function error = % 1.14e\n",i,coarsefunctions_errors[i]);CHKERRQ(ierr); }
34730c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"constraints errors\n");CHKERRQ(ierr);
347453cdbc3dSStefano Zampini       for (i=0;i<pcbddc->local_primal_size;i++) { ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local %02d-th function error = % 1.14e\n",i,constraints_errors[i]);CHKERRQ(ierr); }
34750c7d97c5SJed Brown       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
347653cdbc3dSStefano Zampini       ierr = MatDestroy(&A_II);CHKERRQ(ierr);
347753cdbc3dSStefano Zampini       ierr = MatDestroy(&A_BB);CHKERRQ(ierr);
347853cdbc3dSStefano Zampini       ierr = MatDestroy(&A_IB);CHKERRQ(ierr);
347953cdbc3dSStefano Zampini       ierr = MatDestroy(&A_BI);CHKERRQ(ierr);
348053cdbc3dSStefano Zampini       ierr = MatDestroy(&TM1);CHKERRQ(ierr);
348153cdbc3dSStefano Zampini       ierr = MatDestroy(&TM2);CHKERRQ(ierr);
348253cdbc3dSStefano Zampini       ierr = MatDestroy(&TM3);CHKERRQ(ierr);
348353cdbc3dSStefano Zampini       ierr = MatDestroy(&TM4);CHKERRQ(ierr);
348453cdbc3dSStefano Zampini       ierr = MatDestroy(&coarse_phi_D);CHKERRQ(ierr);
348553cdbc3dSStefano Zampini       ierr = MatDestroy(&coarse_sub_mat);CHKERRQ(ierr);
348653cdbc3dSStefano Zampini       ierr = MatDestroy(&coarse_phi_B);CHKERRQ(ierr);
34870c7d97c5SJed Brown       ierr = PetscFree(coarsefunctions_errors);CHKERRQ(ierr);
34880c7d97c5SJed Brown       ierr = PetscFree(constraints_errors);CHKERRQ(ierr);
34890c7d97c5SJed Brown     }
34900c7d97c5SJed Brown 
34910c7d97c5SJed Brown     /* create coarse matrix and data structures for message passing associated with the actual choice of coarse problem type */
34920c7d97c5SJed Brown     ierr = PCBDDCSetupCoarseEnvironment(pc,coarse_submat_vals);CHKERRQ(ierr);
34930c7d97c5SJed Brown     /* free memory */
34940c7d97c5SJed Brown     ierr = PetscFree(coarse_submat_vals);CHKERRQ(ierr);
34950c7d97c5SJed Brown     ierr = PetscFree(auxindices);CHKERRQ(ierr);
34960c7d97c5SJed Brown     ierr = PetscFree(nnz);CHKERRQ(ierr);
34973b03a366Sstefano_zampini     if (n_vertices) {
34980c7d97c5SJed Brown       ierr = VecDestroy(&vec1_V);CHKERRQ(ierr);
34990c7d97c5SJed Brown       ierr = VecDestroy(&vec2_V);CHKERRQ(ierr);
35000c7d97c5SJed Brown       ierr = MatDestroy(&A_RV);CHKERRQ(ierr);
35010c7d97c5SJed Brown       ierr = MatDestroy(&A_VR);CHKERRQ(ierr);
35020c7d97c5SJed Brown       ierr = MatDestroy(&A_VV);CHKERRQ(ierr);
35030c7d97c5SJed Brown     }
3504534831adSStefano Zampini     if (n_constraints) {
35050c7d97c5SJed Brown       ierr = VecDestroy(&vec1_C);CHKERRQ(ierr);
35060c7d97c5SJed Brown       ierr = VecDestroy(&vec2_C);CHKERRQ(ierr);
35070c7d97c5SJed Brown       ierr = MatDestroy(&M1);CHKERRQ(ierr);
35080c7d97c5SJed Brown       ierr = MatDestroy(&C_CR);CHKERRQ(ierr);
35090c7d97c5SJed Brown     }
35100c7d97c5SJed Brown   }
35110c7d97c5SJed Brown   /* free memory */
35123b03a366Sstefano_zampini   if (n_vertices) {
35130c7d97c5SJed Brown     ierr = PetscFree(idx_V_B);CHKERRQ(ierr);
35140c7d97c5SJed Brown     ierr = ISDestroy(&is_V_local);CHKERRQ(ierr);
35150c7d97c5SJed Brown   }
35160c7d97c5SJed Brown   ierr = ISDestroy(&is_R_local);CHKERRQ(ierr);
35170c7d97c5SJed Brown 
35180c7d97c5SJed Brown   PetscFunctionReturn(0);
35190c7d97c5SJed Brown }
35200c7d97c5SJed Brown 
35210c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
35220c7d97c5SJed Brown 
35230c7d97c5SJed Brown #undef __FUNCT__
35240c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetupCoarseEnvironment"
352553cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetupCoarseEnvironment(PC pc,PetscScalar* coarse_submat_vals)
35260c7d97c5SJed Brown {
35270c7d97c5SJed Brown 
35280c7d97c5SJed Brown 
35290c7d97c5SJed Brown   Mat_IS    *matis    = (Mat_IS*)pc->pmat->data;
35300c7d97c5SJed Brown   PC_BDDC   *pcbddc   = (PC_BDDC*)pc->data;
35310c7d97c5SJed Brown   PC_IS     *pcis     = (PC_IS*)pc->data;
35320c7d97c5SJed Brown   MPI_Comm  prec_comm = ((PetscObject)pc)->comm;
35330c7d97c5SJed Brown   MPI_Comm  coarse_comm;
35340c7d97c5SJed Brown 
35350c7d97c5SJed Brown   /* common to all choices */
35360c7d97c5SJed Brown   PetscScalar *temp_coarse_mat_vals;
35370c7d97c5SJed Brown   PetscScalar *ins_coarse_mat_vals;
35380c7d97c5SJed Brown   PetscInt    *ins_local_primal_indices;
35390c7d97c5SJed Brown   PetscMPIInt *localsizes2,*localdispl2;
35400c7d97c5SJed Brown   PetscMPIInt size_prec_comm;
35410c7d97c5SJed Brown   PetscMPIInt rank_prec_comm;
35420c7d97c5SJed Brown   PetscMPIInt active_rank=MPI_PROC_NULL;
35430c7d97c5SJed Brown   PetscMPIInt master_proc=0;
35440c7d97c5SJed Brown   PetscInt    ins_local_primal_size;
35450c7d97c5SJed Brown   /* specific to MULTILEVEL_BDDC */
35460c7d97c5SJed Brown   PetscMPIInt *ranks_recv;
35470c7d97c5SJed Brown   PetscMPIInt count_recv=0;
35480c7d97c5SJed Brown   PetscMPIInt rank_coarse_proc_send_to;
35490c7d97c5SJed Brown   PetscMPIInt coarse_color = MPI_UNDEFINED;
35500c7d97c5SJed Brown   ISLocalToGlobalMapping coarse_ISLG;
35510c7d97c5SJed Brown   /* some other variables */
35520c7d97c5SJed Brown   PetscErrorCode ierr;
355319fd82e9SBarry Smith   MatType coarse_mat_type;
355419fd82e9SBarry Smith   PCType  coarse_pc_type;
355519fd82e9SBarry Smith   KSPType coarse_ksp_type;
355653cdbc3dSStefano Zampini   PC pc_temp;
35574fad6a16SStefano Zampini   PetscInt i,j,k;
35583b03a366Sstefano_zampini   PetscInt max_it_coarse_ksp=1;  /* don't increase this value */
3559e269702eSStefano Zampini   /* verbose output viewer */
3560e269702eSStefano Zampini   PetscViewer viewer=pcbddc->dbg_viewer;
3561e269702eSStefano Zampini   PetscBool   dbg_flag=pcbddc->dbg_flag;
3562142dfd88SStefano Zampini 
3563ea7e1babSStefano Zampini   PetscInt      offset,offset2;
3564142dfd88SStefano Zampini   PetscMPIInt   im_active=0;
3565523858cfSStefano Zampini   PetscInt      *dnz,*onz;
3566142dfd88SStefano Zampini 
3567142dfd88SStefano Zampini   PetscBool     setsym,issym=PETSC_FALSE;
35680c7d97c5SJed Brown 
35690c7d97c5SJed Brown   PetscFunctionBegin;
35700c7d97c5SJed Brown   ins_local_primal_indices = 0;
35710c7d97c5SJed Brown   ins_coarse_mat_vals      = 0;
35720c7d97c5SJed Brown   localsizes2              = 0;
35730c7d97c5SJed Brown   localdispl2              = 0;
35740c7d97c5SJed Brown   temp_coarse_mat_vals     = 0;
35750c7d97c5SJed Brown   coarse_ISLG              = 0;
35760c7d97c5SJed Brown 
357753cdbc3dSStefano Zampini   ierr = MPI_Comm_size(prec_comm,&size_prec_comm);CHKERRQ(ierr);
357853cdbc3dSStefano Zampini   ierr = MPI_Comm_rank(prec_comm,&rank_prec_comm);CHKERRQ(ierr);
3579142dfd88SStefano Zampini   ierr = MatIsSymmetricKnown(pc->pmat,&setsym,&issym);CHKERRQ(ierr);
3580142dfd88SStefano Zampini 
3581beed3852SStefano Zampini   /* Assign global numbering to coarse dofs */
3582beed3852SStefano Zampini   {
3583ef028eecSStefano Zampini     PetscInt     *auxlocal_primal;
3584da1bb401SStefano Zampini     PetscInt     *row_cmat_indices;
35852e8d2280SStefano Zampini     PetscInt     *aux_ordering;
35862e8d2280SStefano Zampini     PetscInt     *row_cmat_global_indices;
3587ef028eecSStefano Zampini     PetscInt     *dof_sizes,*dof_displs;
35883b03a366Sstefano_zampini     PetscInt     size_of_constraint;
35892e8d2280SStefano Zampini     PetscBool    *array_bool;
3590ef028eecSStefano Zampini     PetscBool    first_found;
3591ef028eecSStefano Zampini     PetscInt     first_index,old_index,s;
3592ef028eecSStefano Zampini     PetscMPIInt  mpi_local_primal_size;
3593ef028eecSStefano Zampini     PetscScalar  coarsesum,*array;
3594ef028eecSStefano Zampini 
3595ef028eecSStefano Zampini     mpi_local_primal_size = (PetscMPIInt)pcbddc->local_primal_size;
3596beed3852SStefano Zampini 
3597beed3852SStefano Zampini     /* Construct needed data structures for message passing */
3598ef028eecSStefano Zampini     ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscInt),&pcbddc->local_primal_indices);CHKERRQ(ierr);
3599ffe5efe1SStefano Zampini     j = 0;
3600142dfd88SStefano Zampini     if (rank_prec_comm == 0 || pcbddc->coarse_problem_type == REPLICATED_BDDC || pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
3601ffe5efe1SStefano Zampini       j = size_prec_comm;
3602ffe5efe1SStefano Zampini     }
3603ffe5efe1SStefano Zampini     ierr = PetscMalloc(j*sizeof(PetscMPIInt),&pcbddc->local_primal_sizes);CHKERRQ(ierr);
3604ffe5efe1SStefano Zampini     ierr = PetscMalloc(j*sizeof(PetscMPIInt),&pcbddc->local_primal_displacements);CHKERRQ(ierr);
3605beed3852SStefano Zampini     /* Gather local_primal_size information for all processes  */
3606142dfd88SStefano Zampini     if (pcbddc->coarse_problem_type == REPLICATED_BDDC || pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
36075619798eSStefano Zampini       ierr = MPI_Allgather(&mpi_local_primal_size,1,MPIU_INT,&pcbddc->local_primal_sizes[0],1,MPIU_INT,prec_comm);CHKERRQ(ierr);
3608ffe5efe1SStefano Zampini     } else {
3609ffe5efe1SStefano Zampini       ierr = MPI_Gather(&mpi_local_primal_size,1,MPIU_INT,&pcbddc->local_primal_sizes[0],1,MPIU_INT,0,prec_comm);CHKERRQ(ierr);
3610ffe5efe1SStefano Zampini     }
3611beed3852SStefano Zampini     pcbddc->replicated_primal_size = 0;
3612ffe5efe1SStefano Zampini     for (i=0; i<j; i++) {
3613beed3852SStefano Zampini       pcbddc->local_primal_displacements[i] = pcbddc->replicated_primal_size ;
3614beed3852SStefano Zampini       pcbddc->replicated_primal_size += pcbddc->local_primal_sizes[i];
3615beed3852SStefano Zampini     }
3616beed3852SStefano Zampini 
3617da1bb401SStefano Zampini     /* First let's count coarse dofs.
3618beed3852SStefano Zampini        This code fragment assumes that the number of local constraints per connected component
3619beed3852SStefano Zampini        is not greater than the number of nodes defined for the connected component
3620beed3852SStefano Zampini        (otherwise we will surely have linear dependence between constraints and thus a singular coarse problem) */
3621ef028eecSStefano Zampini     ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscInt),&auxlocal_primal);CHKERRQ(ierr);
36222e8d2280SStefano Zampini     j = 0;
36232e8d2280SStefano Zampini     for (i=0;i<pcbddc->local_primal_size;i++) {
36242e8d2280SStefano Zampini       ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr);
36252e8d2280SStefano Zampini       if ( j < size_of_constraint ) {
36262e8d2280SStefano Zampini         j = size_of_constraint;
36272e8d2280SStefano Zampini       }
36282e8d2280SStefano Zampini       ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr);
36292e8d2280SStefano Zampini     }
36302e8d2280SStefano Zampini     ierr = PetscMalloc(j*sizeof(PetscInt),&aux_ordering);CHKERRQ(ierr);
36312e8d2280SStefano Zampini     ierr = PetscMalloc(j*sizeof(PetscInt),&row_cmat_global_indices);CHKERRQ(ierr);
36322e8d2280SStefano Zampini     ierr = PetscMalloc(pcis->n*sizeof(PetscBool),&array_bool);CHKERRQ(ierr);
36332e8d2280SStefano Zampini     for (i=0;i<pcis->n;i++) {
36342e8d2280SStefano Zampini       array_bool[i] = PETSC_FALSE;
36352e8d2280SStefano Zampini     }
3636da1bb401SStefano Zampini     for (i=0;i<pcbddc->local_primal_size;i++) {
3637da1bb401SStefano Zampini       ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
36383b03a366Sstefano_zampini       for (j=0; j<size_of_constraint; j++) {
36392e8d2280SStefano Zampini         aux_ordering[j] = j;
36402e8d2280SStefano Zampini       }
36412e8d2280SStefano Zampini       ierr = ISLocalToGlobalMappingApply(matis->mapping,size_of_constraint,row_cmat_indices,row_cmat_global_indices);CHKERRQ(ierr);
36422e8d2280SStefano Zampini       ierr = PetscSortIntWithPermutation(size_of_constraint,row_cmat_global_indices,aux_ordering);CHKERRQ(ierr);
36432e8d2280SStefano Zampini       for (j=0; j<size_of_constraint; j++) {
36442e8d2280SStefano Zampini         k = row_cmat_indices[aux_ordering[j]];
36452e8d2280SStefano Zampini         if ( !array_bool[k] ) {
36462e8d2280SStefano Zampini           array_bool[k] = PETSC_TRUE;
3647da1bb401SStefano Zampini           auxlocal_primal[i] = k;
3648beed3852SStefano Zampini           break;
3649beed3852SStefano Zampini         }
3650beed3852SStefano Zampini       }
3651da1bb401SStefano Zampini       ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
3652beed3852SStefano Zampini     }
36532e8d2280SStefano Zampini     ierr = PetscFree(aux_ordering);CHKERRQ(ierr);
3654ef028eecSStefano Zampini     ierr = PetscFree(array_bool);CHKERRQ(ierr);
3655ef028eecSStefano Zampini     ierr = PetscFree(row_cmat_global_indices);CHKERRQ(ierr);
36562e8d2280SStefano Zampini 
3657ef028eecSStefano Zampini     /* Compute number of coarse dofs */
3658ef028eecSStefano Zampini     ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
3659ef028eecSStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3660ef028eecSStefano Zampini     for (i=0;i<pcbddc->local_primal_size;i++) {
3661ef028eecSStefano Zampini       array[auxlocal_primal[i]]=1.0;
3662ef028eecSStefano Zampini     }
3663ef028eecSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3664ef028eecSStefano Zampini     ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
3665ef028eecSStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3666ef028eecSStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3667ef028eecSStefano Zampini     ierr = VecSum(pcis->vec1_global,&coarsesum);CHKERRQ(ierr);
3668ef028eecSStefano Zampini     pcbddc->coarse_size = (PetscInt)coarsesum;
3669ef028eecSStefano Zampini 
3670ef028eecSStefano Zampini     /* Fill pcis->vec1_global with cumulative function for global numbering */
3671ef028eecSStefano Zampini     ierr = VecGetArray(pcis->vec1_global,&array);CHKERRQ(ierr);
3672ef028eecSStefano Zampini     ierr = VecGetLocalSize(pcis->vec1_global,&s);CHKERRQ(ierr);
3673ef028eecSStefano Zampini     k = 0;
3674ef028eecSStefano Zampini     first_index = -1;
3675ef028eecSStefano Zampini     first_found = PETSC_FALSE;
3676ef028eecSStefano Zampini     for (i=0;i<s;i++) {
3677ef028eecSStefano Zampini       if (!first_found && array[i] > 0.0) {
3678ef028eecSStefano Zampini         first_found = PETSC_TRUE;
3679ef028eecSStefano Zampini         first_index = i;
3680ef028eecSStefano Zampini       }
3681ef028eecSStefano Zampini       k += (PetscInt)array[i];
3682ef028eecSStefano Zampini     }
3683ef028eecSStefano Zampini     j = ( !rank_prec_comm ? size_prec_comm : 0);
3684ef028eecSStefano Zampini     ierr = PetscMalloc(j*sizeof(*dof_sizes),&dof_sizes);CHKERRQ(ierr);
3685ef028eecSStefano Zampini     ierr = PetscMalloc(j*sizeof(*dof_displs),&dof_displs);CHKERRQ(ierr);
3686ef028eecSStefano Zampini     ierr = MPI_Gather(&k,1,MPIU_INT,dof_sizes,1,MPIU_INT,0,prec_comm);CHKERRQ(ierr);
3687ef028eecSStefano Zampini     if (!rank_prec_comm) {
3688ef028eecSStefano Zampini       dof_displs[0]=0;
3689ef028eecSStefano Zampini       for (i=1;i<size_prec_comm;i++) {
3690ef028eecSStefano Zampini         dof_displs[i] = dof_displs[i-1]+dof_sizes[i-1];
3691ef028eecSStefano Zampini       }
3692ef028eecSStefano Zampini     }
3693ef028eecSStefano Zampini     ierr = MPI_Scatter(dof_displs,1,MPIU_INT,&k,1,MPIU_INT,0,prec_comm);CHKERRQ(ierr);
3694ef028eecSStefano Zampini     if (first_found) {
3695ef028eecSStefano Zampini       array[first_index] += k;
3696ef028eecSStefano Zampini       old_index = first_index;
3697ef028eecSStefano Zampini       for (i=first_index+1;i<s;i++) {
3698ef028eecSStefano Zampini         if (array[i] > 0.0) {
3699ef028eecSStefano Zampini           array[i] += array[old_index];
3700ef028eecSStefano Zampini           old_index = i;
3701ef028eecSStefano Zampini         }
3702ef028eecSStefano Zampini       }
3703ef028eecSStefano Zampini     }
3704ef028eecSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_global,&array);CHKERRQ(ierr);
3705ef028eecSStefano Zampini     ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
3706ef028eecSStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3707ef028eecSStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3708ef028eecSStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3709ef028eecSStefano Zampini     for (i=0;i<pcbddc->local_primal_size;i++) {
3710ef028eecSStefano Zampini       pcbddc->local_primal_indices[i] = (PetscInt)array[auxlocal_primal[i]]-1;
3711ef028eecSStefano Zampini     }
3712ef028eecSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3713ef028eecSStefano Zampini     ierr = PetscFree(dof_displs);CHKERRQ(ierr);
3714ef028eecSStefano Zampini     ierr = PetscFree(dof_sizes);CHKERRQ(ierr);
3715ef028eecSStefano Zampini 
3716ef028eecSStefano Zampini     if (dbg_flag) {
37172e8d2280SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
37182e8d2280SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
37192e8d2280SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Check coarse indices\n");CHKERRQ(ierr);
37202e8d2280SStefano Zampini       ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
37212e8d2280SStefano Zampini       ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3722ef028eecSStefano Zampini       for (i=0;i<pcbddc->local_primal_size;i++) {
3723ef028eecSStefano Zampini         array[auxlocal_primal[i]]=1.0;
37242e8d2280SStefano Zampini       }
3725beed3852SStefano Zampini       ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
37262e8d2280SStefano Zampini       ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
3727da1bb401SStefano Zampini       ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3728da1bb401SStefano Zampini       ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3729da1bb401SStefano Zampini       ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3730da1bb401SStefano Zampini       ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3731da1bb401SStefano Zampini       ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
37322e8d2280SStefano Zampini       for (i=0;i<pcis->n;i++) {
37332e8d2280SStefano Zampini         if (array[i] == 1.0) {
37342e8d2280SStefano Zampini           ierr = ISLocalToGlobalMappingApply(matis->mapping,1,&i,&j);CHKERRQ(ierr);
37352e8d2280SStefano Zampini           ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d: WRONG COARSE INDEX %d (local %d)\n",PetscGlobalRank,j,i);CHKERRQ(ierr);
37362e8d2280SStefano Zampini         }
37372e8d2280SStefano Zampini       }
37382e8d2280SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
37392e8d2280SStefano Zampini       for (i=0;i<pcis->n;i++) {
37402e8d2280SStefano Zampini         if( array[i] > 0.0) {
37412e8d2280SStefano Zampini           array[i] = 1.0/array[i];
37422e8d2280SStefano Zampini         }
37432e8d2280SStefano Zampini       }
3744da1bb401SStefano Zampini       ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
37452e8d2280SStefano Zampini       ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
3746da1bb401SStefano Zampini       ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3747da1bb401SStefano Zampini       ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3748da1bb401SStefano Zampini       ierr = VecSum(pcis->vec1_global,&coarsesum);CHKERRQ(ierr);
37492e8d2280SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Size of coarse problem SHOULD be %lf\n",coarsesum);CHKERRQ(ierr);
37502e8d2280SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
37512e8d2280SStefano Zampini     }
3752142dfd88SStefano Zampini     ierr = PetscFree(auxlocal_primal);CHKERRQ(ierr);
37530bdf917eSStefano Zampini   }
37540bdf917eSStefano Zampini 
37552e8d2280SStefano Zampini   if (dbg_flag) {
37567cf533a6SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"Size of coarse problem is %d\n",pcbddc->coarse_size);CHKERRQ(ierr);
37572e8d2280SStefano Zampini     /*ierr = PetscViewerASCIIPrintf(viewer,"Distribution of local primal indices\n");CHKERRQ(ierr);
37582e8d2280SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
37592e8d2280SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d\n",PetscGlobalRank);CHKERRQ(ierr);
37602e8d2280SStefano Zampini     for (i=0;i<pcbddc->local_primal_size;i++) {
37612e8d2280SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local_primal_indices[%d]=%d \n",i,pcbddc->local_primal_indices[i]);
37622e8d2280SStefano Zampini     }*/
37632e8d2280SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
37642e8d2280SStefano Zampini   }
37652e8d2280SStefano Zampini 
37660bdf917eSStefano Zampini   if (pcis->n) { im_active = 1; }
37670bdf917eSStefano Zampini   ierr = MPI_Allreduce(&im_active,&pcbddc->active_procs,1,MPIU_INT,MPI_SUM,prec_comm);CHKERRQ(ierr);
37680bdf917eSStefano Zampini 
37690bdf917eSStefano Zampini   /* adapt coarse problem type */
37704fad6a16SStefano Zampini   if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
37714fad6a16SStefano Zampini     if (pcbddc->current_level < pcbddc->max_levels) {
37724fad6a16SStefano Zampini       if ( (pcbddc->active_procs/pcbddc->coarsening_ratio) < 2 ) {
37730bdf917eSStefano Zampini         if (dbg_flag) {
37744fad6a16SStefano Zampini           ierr = PetscViewerASCIIPrintf(viewer,"Not enough active processes on level %d (active %d,ratio %d). Parallel direct solve for coarse problem\n",pcbddc->current_level,pcbddc->active_procs,pcbddc->coarsening_ratio);CHKERRQ(ierr);
37750bdf917eSStefano Zampini          ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
37760bdf917eSStefano Zampini         }
37770bdf917eSStefano Zampini         pcbddc->coarse_problem_type = PARALLEL_BDDC;
3778142dfd88SStefano Zampini       }
37794fad6a16SStefano Zampini     } else {
37804fad6a16SStefano Zampini       if (dbg_flag) {
37814fad6a16SStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"Max number of levels reached. Using parallel direct solve for coarse problem\n",pcbddc->max_levels,pcbddc->active_procs,pcbddc->coarsening_ratio);CHKERRQ(ierr);
37824fad6a16SStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
37834fad6a16SStefano Zampini       }
37844fad6a16SStefano Zampini       pcbddc->coarse_problem_type = PARALLEL_BDDC;
37854fad6a16SStefano Zampini     }
37864fad6a16SStefano Zampini   }
3787beed3852SStefano Zampini 
37880c7d97c5SJed Brown   switch(pcbddc->coarse_problem_type){
37890c7d97c5SJed Brown 
3790da1bb401SStefano Zampini     case(MULTILEVEL_BDDC):   /* we define a coarse mesh where subdomains are elements */
37910c7d97c5SJed Brown     {
37920c7d97c5SJed Brown       /* we need additional variables */
37930c7d97c5SJed Brown       MetisInt    n_subdomains,n_parts,objval,ncon,faces_nvtxs;
37940c7d97c5SJed Brown       MetisInt    *metis_coarse_subdivision;
37950c7d97c5SJed Brown       MetisInt    options[METIS_NOPTIONS];
37960c7d97c5SJed Brown       PetscMPIInt size_coarse_comm,rank_coarse_comm;
37970c7d97c5SJed Brown       PetscMPIInt procs_jumps_coarse_comm;
37980c7d97c5SJed Brown       PetscMPIInt *coarse_subdivision;
37990c7d97c5SJed Brown       PetscMPIInt *total_count_recv;
38000c7d97c5SJed Brown       PetscMPIInt *total_ranks_recv;
38010c7d97c5SJed Brown       PetscMPIInt *displacements_recv;
38020c7d97c5SJed Brown       PetscMPIInt *my_faces_connectivity;
38030c7d97c5SJed Brown       PetscMPIInt *petsc_faces_adjncy;
38040c7d97c5SJed Brown       MetisInt    *faces_adjncy;
38050c7d97c5SJed Brown       MetisInt    *faces_xadj;
38060c7d97c5SJed Brown       PetscMPIInt *number_of_faces;
38070c7d97c5SJed Brown       PetscMPIInt *faces_displacements;
38080c7d97c5SJed Brown       PetscInt    *array_int;
38090c7d97c5SJed Brown       PetscMPIInt my_faces=0;
38100c7d97c5SJed Brown       PetscMPIInt total_faces=0;
38113828260eSStefano Zampini       PetscInt    ranks_stretching_ratio;
38120c7d97c5SJed Brown 
38130c7d97c5SJed Brown       /* define some quantities */
38140c7d97c5SJed Brown       pcbddc->coarse_communications_type = SCATTERS_BDDC;
38150c7d97c5SJed Brown       coarse_mat_type = MATIS;
38160c7d97c5SJed Brown       coarse_pc_type  = PCBDDC;
3817142dfd88SStefano Zampini       coarse_ksp_type = KSPRICHARDSON;
38180c7d97c5SJed Brown 
38190c7d97c5SJed Brown       /* details of coarse decomposition */
38200c7d97c5SJed Brown       n_subdomains = pcbddc->active_procs;
38210c7d97c5SJed Brown       n_parts      = n_subdomains/pcbddc->coarsening_ratio;
38223828260eSStefano Zampini       ranks_stretching_ratio = size_prec_comm/pcbddc->active_procs;
38233828260eSStefano Zampini       procs_jumps_coarse_comm = pcbddc->coarsening_ratio*ranks_stretching_ratio;
38243828260eSStefano Zampini 
38254fad6a16SStefano Zampini       /* build CSR graph of subdomains' connectivity */
38260c7d97c5SJed Brown       ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&array_int);CHKERRQ(ierr);
38273828260eSStefano Zampini       ierr = PetscMemzero(array_int,pcis->n*sizeof(PetscInt));CHKERRQ(ierr);
38280c7d97c5SJed Brown       for (i=1;i<pcis->n_neigh;i++){/* i=1 so I don't count myself -> faces nodes counts to 1 */
38290c7d97c5SJed Brown         for (j=0;j<pcis->n_shared[i];j++){
38300c7d97c5SJed Brown           array_int[ pcis->shared[i][j] ]+=1;
38310c7d97c5SJed Brown         }
38320c7d97c5SJed Brown       }
38330c7d97c5SJed Brown       for (i=1;i<pcis->n_neigh;i++){
38340c7d97c5SJed Brown         for (j=0;j<pcis->n_shared[i];j++){
38357cf533a6SStefano Zampini           if (array_int[ pcis->shared[i][j] ] > 0 ){
38360c7d97c5SJed Brown             my_faces++;
38370c7d97c5SJed Brown             break;
38380c7d97c5SJed Brown           }
38390c7d97c5SJed Brown         }
38400c7d97c5SJed Brown       }
38410c7d97c5SJed Brown 
384253cdbc3dSStefano Zampini       ierr = MPI_Reduce(&my_faces,&total_faces,1,MPIU_INT,MPI_SUM,master_proc,prec_comm);CHKERRQ(ierr);
38430c7d97c5SJed Brown       ierr = PetscMalloc (my_faces*sizeof(PetscInt),&my_faces_connectivity);CHKERRQ(ierr);
38440c7d97c5SJed Brown       my_faces=0;
38450c7d97c5SJed Brown       for (i=1;i<pcis->n_neigh;i++){
38460c7d97c5SJed Brown         for (j=0;j<pcis->n_shared[i];j++){
38477cf533a6SStefano Zampini           if (array_int[ pcis->shared[i][j] ] > 0 ){
38480c7d97c5SJed Brown             my_faces_connectivity[my_faces]=pcis->neigh[i];
38490c7d97c5SJed Brown             my_faces++;
38500c7d97c5SJed Brown             break;
38510c7d97c5SJed Brown           }
38520c7d97c5SJed Brown         }
38530c7d97c5SJed Brown       }
38540c7d97c5SJed Brown       if (rank_prec_comm == master_proc) {
38550c7d97c5SJed Brown         ierr = PetscMalloc (total_faces*sizeof(PetscMPIInt),&petsc_faces_adjncy);CHKERRQ(ierr);
38560c7d97c5SJed Brown         ierr = PetscMalloc (size_prec_comm*sizeof(PetscMPIInt),&number_of_faces);CHKERRQ(ierr);
38570c7d97c5SJed Brown         ierr = PetscMalloc (total_faces*sizeof(MetisInt),&faces_adjncy);CHKERRQ(ierr);
38580c7d97c5SJed Brown         ierr = PetscMalloc ((n_subdomains+1)*sizeof(MetisInt),&faces_xadj);CHKERRQ(ierr);
38590c7d97c5SJed Brown         ierr = PetscMalloc ((size_prec_comm+1)*sizeof(PetscMPIInt),&faces_displacements);CHKERRQ(ierr);
38600c7d97c5SJed Brown       }
386153cdbc3dSStefano Zampini       ierr = MPI_Gather(&my_faces,1,MPIU_INT,&number_of_faces[0],1,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
38620c7d97c5SJed Brown       if (rank_prec_comm == master_proc) {
38630c7d97c5SJed Brown         faces_xadj[0]=0;
38640c7d97c5SJed Brown         faces_displacements[0]=0;
38650c7d97c5SJed Brown         j=0;
38660c7d97c5SJed Brown         for (i=1;i<size_prec_comm+1;i++) {
38670c7d97c5SJed Brown           faces_displacements[i]=faces_displacements[i-1]+number_of_faces[i-1];
38680c7d97c5SJed Brown           if (number_of_faces[i-1]) {
38690c7d97c5SJed Brown             j++;
38700c7d97c5SJed Brown             faces_xadj[j]=faces_xadj[j-1]+number_of_faces[i-1];
38710c7d97c5SJed Brown           }
38720c7d97c5SJed Brown         }
38730c7d97c5SJed Brown       }
387453cdbc3dSStefano Zampini       ierr = MPI_Gatherv(&my_faces_connectivity[0],my_faces,MPIU_INT,&petsc_faces_adjncy[0],number_of_faces,faces_displacements,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
38750c7d97c5SJed Brown       ierr = PetscFree(my_faces_connectivity);CHKERRQ(ierr);
38760c7d97c5SJed Brown       ierr = PetscFree(array_int);CHKERRQ(ierr);
38770c7d97c5SJed Brown       if (rank_prec_comm == master_proc) {
38783828260eSStefano Zampini         for (i=0;i<total_faces;i++) faces_adjncy[i]=(MetisInt)(petsc_faces_adjncy[i]/ranks_stretching_ratio); /* cast to MetisInt */
3879da1bb401SStefano Zampini         /*printf("This is the face connectivity (actual ranks)\n");
38800c7d97c5SJed Brown         for (i=0;i<n_subdomains;i++){
38810c7d97c5SJed Brown           printf("proc %d is connected with \n",i);
38820c7d97c5SJed Brown           for (j=faces_xadj[i];j<faces_xadj[i+1];j++)
38830c7d97c5SJed Brown             printf("%d ",faces_adjncy[j]);
38840c7d97c5SJed Brown           printf("\n");
3885da1bb401SStefano Zampini         }*/
38860c7d97c5SJed Brown         ierr = PetscFree(faces_displacements);CHKERRQ(ierr);
38870c7d97c5SJed Brown         ierr = PetscFree(number_of_faces);CHKERRQ(ierr);
38880c7d97c5SJed Brown         ierr = PetscFree(petsc_faces_adjncy);CHKERRQ(ierr);
38890c7d97c5SJed Brown       }
38900c7d97c5SJed Brown 
38910c7d97c5SJed Brown       if ( rank_prec_comm == master_proc ) {
38920c7d97c5SJed Brown 
38933828260eSStefano Zampini         PetscInt heuristic_for_metis=3;
38943828260eSStefano Zampini 
38950c7d97c5SJed Brown         ncon=1;
38960c7d97c5SJed Brown         faces_nvtxs=n_subdomains;
38970c7d97c5SJed Brown         /* partition graph induced by face connectivity */
38980c7d97c5SJed Brown         ierr = PetscMalloc (n_subdomains*sizeof(MetisInt),&metis_coarse_subdivision);CHKERRQ(ierr);
38990c7d97c5SJed Brown         ierr = METIS_SetDefaultOptions(options);
39000c7d97c5SJed Brown         /* we need a contiguous partition of the coarse mesh */
39010c7d97c5SJed Brown         options[METIS_OPTION_CONTIG]=1;
39020c7d97c5SJed Brown         options[METIS_OPTION_NITER]=30;
39034fad6a16SStefano Zampini         if (pcbddc->coarsening_ratio > 1) {
39043828260eSStefano Zampini           if (n_subdomains>n_parts*heuristic_for_metis) {
39053828260eSStefano Zampini             options[METIS_OPTION_IPTYPE]=METIS_IPTYPE_EDGE;
39063828260eSStefano Zampini             options[METIS_OPTION_OBJTYPE]=METIS_OBJTYPE_CUT;
39070c7d97c5SJed Brown             ierr = METIS_PartGraphKway(&faces_nvtxs,&ncon,faces_xadj,faces_adjncy,NULL,NULL,NULL,&n_parts,NULL,NULL,options,&objval,metis_coarse_subdivision);
3908142dfd88SStefano Zampini             if (ierr != METIS_OK) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in METIS_PartGraphKway (metis error code %D) called from PCBDDCSetupCoarseEnvironment\n",ierr);
39093828260eSStefano Zampini           } else {
39103828260eSStefano Zampini             ierr = METIS_PartGraphRecursive(&faces_nvtxs,&ncon,faces_xadj,faces_adjncy,NULL,NULL,NULL,&n_parts,NULL,NULL,options,&objval,metis_coarse_subdivision);
3911142dfd88SStefano Zampini             if (ierr != METIS_OK) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in METIS_PartGraphRecursive (metis error code %D) called from PCBDDCSetupCoarseEnvironment\n",ierr);
39123828260eSStefano Zampini           }
39134fad6a16SStefano Zampini         } else {
39144fad6a16SStefano Zampini           for (i=0;i<n_subdomains;i++) {
39154fad6a16SStefano Zampini             metis_coarse_subdivision[i]=i;
39164fad6a16SStefano Zampini           }
39174fad6a16SStefano Zampini         }
39180c7d97c5SJed Brown         ierr = PetscFree(faces_xadj);CHKERRQ(ierr);
39190c7d97c5SJed Brown         ierr = PetscFree(faces_adjncy);CHKERRQ(ierr);
39200bdf917eSStefano Zampini         ierr = PetscMalloc(size_prec_comm*sizeof(PetscMPIInt),&coarse_subdivision);CHKERRQ(ierr);
39210c7d97c5SJed Brown         /* copy/cast values avoiding possible type conflicts between PETSc, MPI and METIS */
39220bdf917eSStefano Zampini         for (i=0;i<size_prec_comm;i++) { coarse_subdivision[i]=MPI_PROC_NULL; }
39230bdf917eSStefano Zampini         for (i=0;i<n_subdomains;i++)   { coarse_subdivision[ranks_stretching_ratio*i]=(PetscInt)(metis_coarse_subdivision[i]); }
39240c7d97c5SJed Brown         ierr = PetscFree(metis_coarse_subdivision);CHKERRQ(ierr);
39250c7d97c5SJed Brown       }
39260c7d97c5SJed Brown 
39270c7d97c5SJed Brown       /* Create new communicator for coarse problem splitting the old one */
39280c7d97c5SJed Brown       if ( !(rank_prec_comm%procs_jumps_coarse_comm) && rank_prec_comm < procs_jumps_coarse_comm*n_parts ){
3929da1bb401SStefano Zampini         coarse_color=0;              /* for communicator splitting */
3930da1bb401SStefano Zampini         active_rank=rank_prec_comm;  /* for insertion of matrix values */
39310c7d97c5SJed Brown       }
3932da1bb401SStefano Zampini       /* procs with coarse_color = MPI_UNDEFINED will have coarse_comm = MPI_COMM_NULL (from mpi standards)
3933da1bb401SStefano Zampini          key = rank_prec_comm -> keep same ordering of ranks from the old to the new communicator */
393453cdbc3dSStefano Zampini       ierr = MPI_Comm_split(prec_comm,coarse_color,rank_prec_comm,&coarse_comm);CHKERRQ(ierr);
39350c7d97c5SJed Brown 
39360c7d97c5SJed Brown       if ( coarse_color == 0 ) {
393753cdbc3dSStefano Zampini         ierr = MPI_Comm_size(coarse_comm,&size_coarse_comm);CHKERRQ(ierr);
393853cdbc3dSStefano Zampini         ierr = MPI_Comm_rank(coarse_comm,&rank_coarse_comm);CHKERRQ(ierr);
39390c7d97c5SJed Brown       } else {
39400c7d97c5SJed Brown         rank_coarse_comm = MPI_PROC_NULL;
39410c7d97c5SJed Brown       }
39420c7d97c5SJed Brown 
39437cf533a6SStefano Zampini       /* master proc takes care of arranging and distributing coarse information */
39440c7d97c5SJed Brown       if (rank_coarse_comm == master_proc) {
39450c7d97c5SJed Brown         ierr = PetscMalloc (size_coarse_comm*sizeof(PetscMPIInt),&displacements_recv);CHKERRQ(ierr);
39460bdf917eSStefano Zampini         ierr = PetscMalloc (size_coarse_comm*sizeof(PetscMPIInt),&total_count_recv);CHKERRQ(ierr);
39470bdf917eSStefano Zampini         ierr = PetscMalloc (n_subdomains*sizeof(PetscMPIInt),&total_ranks_recv);CHKERRQ(ierr);
39480c7d97c5SJed Brown         /* some initializations */
39490c7d97c5SJed Brown         displacements_recv[0]=0;
39500bdf917eSStefano Zampini         ierr = PetscMemzero(total_count_recv,size_coarse_comm*sizeof(PetscMPIInt));CHKERRQ(ierr);
39510c7d97c5SJed Brown         /* count from how many processes the j-th process of the coarse decomposition will receive data */
39520bdf917eSStefano Zampini         for (j=0;j<size_coarse_comm;j++) {
39530bdf917eSStefano Zampini           for (i=0;i<size_prec_comm;i++) {
39540bdf917eSStefano Zampini             if (coarse_subdivision[i]==j) {
39550c7d97c5SJed Brown               total_count_recv[j]++;
39560bdf917eSStefano Zampini             }
39570bdf917eSStefano Zampini           }
39580bdf917eSStefano Zampini         }
39590c7d97c5SJed Brown         /* displacements needed for scatterv of total_ranks_recv */
39600bdf917eSStefano Zampini         for (i=1;i<size_coarse_comm;i++) { displacements_recv[i]=displacements_recv[i-1]+total_count_recv[i-1]; }
39610c7d97c5SJed Brown         /* Now fill properly total_ranks_recv -> each coarse process will receive the ranks (in prec_comm communicator) of its friend (sending) processes */
39620c7d97c5SJed Brown         ierr = PetscMemzero(total_count_recv,size_coarse_comm*sizeof(PetscMPIInt));CHKERRQ(ierr);
39630c7d97c5SJed Brown         for (j=0;j<size_coarse_comm;j++) {
39643828260eSStefano Zampini           for (i=0;i<size_prec_comm;i++) {
39650c7d97c5SJed Brown             if (coarse_subdivision[i]==j) {
39660c7d97c5SJed Brown               total_ranks_recv[displacements_recv[j]+total_count_recv[j]]=i;
39673828260eSStefano Zampini               total_count_recv[j]+=1;
39680c7d97c5SJed Brown             }
39690c7d97c5SJed Brown           }
39700c7d97c5SJed Brown         }
3971da1bb401SStefano Zampini         /*for (j=0;j<size_coarse_comm;j++) {
39723828260eSStefano Zampini           printf("process %d in new rank will receive from %d processes (original ranks follows)\n",j,total_count_recv[j]);
39733828260eSStefano Zampini           for (i=0;i<total_count_recv[j];i++) {
39743828260eSStefano Zampini             printf("%d ",total_ranks_recv[displacements_recv[j]+i]);
39753828260eSStefano Zampini           }
39763828260eSStefano Zampini           printf("\n");
3977da1bb401SStefano Zampini         }*/
39780c7d97c5SJed Brown 
39790c7d97c5SJed Brown         /* identify new decomposition in terms of ranks in the old communicator */
39800bdf917eSStefano Zampini         for (i=0;i<n_subdomains;i++) {
39810bdf917eSStefano Zampini           coarse_subdivision[ranks_stretching_ratio*i]=coarse_subdivision[ranks_stretching_ratio*i]*procs_jumps_coarse_comm;
39820bdf917eSStefano Zampini         }
3983da1bb401SStefano Zampini         /*printf("coarse_subdivision in old end new ranks\n");
39840c7d97c5SJed Brown         for (i=0;i<size_prec_comm;i++)
39853828260eSStefano Zampini           if (coarse_subdivision[i]!=MPI_PROC_NULL) {
39863828260eSStefano Zampini             printf("%d=(%d %d), ",i,coarse_subdivision[i],coarse_subdivision[i]/procs_jumps_coarse_comm);
39873828260eSStefano Zampini           } else {
39883828260eSStefano Zampini             printf("%d=(%d %d), ",i,coarse_subdivision[i],coarse_subdivision[i]);
39893828260eSStefano Zampini           }
3990da1bb401SStefano Zampini         printf("\n");*/
39910c7d97c5SJed Brown       }
39920c7d97c5SJed Brown 
39930c7d97c5SJed Brown       /* Scatter new decomposition for send details */
399453cdbc3dSStefano Zampini       ierr = MPI_Scatter(&coarse_subdivision[0],1,MPIU_INT,&rank_coarse_proc_send_to,1,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
39950c7d97c5SJed Brown       /* Scatter receiving details to members of coarse decomposition */
39960c7d97c5SJed Brown       if ( coarse_color == 0) {
399753cdbc3dSStefano Zampini         ierr = MPI_Scatter(&total_count_recv[0],1,MPIU_INT,&count_recv,1,MPIU_INT,master_proc,coarse_comm);CHKERRQ(ierr);
39980c7d97c5SJed Brown         ierr = PetscMalloc (count_recv*sizeof(PetscMPIInt),&ranks_recv);CHKERRQ(ierr);
399953cdbc3dSStefano Zampini         ierr = MPI_Scatterv(&total_ranks_recv[0],total_count_recv,displacements_recv,MPIU_INT,&ranks_recv[0],count_recv,MPIU_INT,master_proc,coarse_comm);CHKERRQ(ierr);
40000c7d97c5SJed Brown       }
40010c7d97c5SJed Brown 
4002da1bb401SStefano Zampini       /*printf("I will send my matrix data to proc  %d\n",rank_coarse_proc_send_to);
4003da1bb401SStefano Zampini       if (coarse_color == 0) {
4004da1bb401SStefano Zampini         printf("I will receive some matrix data from %d processes (ranks follows)\n",count_recv);
4005da1bb401SStefano Zampini         for (i=0;i<count_recv;i++)
4006da1bb401SStefano Zampini           printf("%d ",ranks_recv[i]);
4007da1bb401SStefano Zampini         printf("\n");
4008da1bb401SStefano Zampini       }*/
40090c7d97c5SJed Brown 
40100c7d97c5SJed Brown       if (rank_prec_comm == master_proc) {
40110bdf917eSStefano Zampini         ierr = PetscFree(coarse_subdivision);CHKERRQ(ierr);
4012da1bb401SStefano Zampini         ierr = PetscFree(total_count_recv);CHKERRQ(ierr);
40130bdf917eSStefano Zampini         ierr = PetscFree(total_ranks_recv);CHKERRQ(ierr);
40140c7d97c5SJed Brown         ierr = PetscFree(displacements_recv);CHKERRQ(ierr);
40150c7d97c5SJed Brown       }
40160c7d97c5SJed Brown       break;
40170c7d97c5SJed Brown     }
40180c7d97c5SJed Brown 
40190c7d97c5SJed Brown     case(REPLICATED_BDDC):
40200c7d97c5SJed Brown 
40210c7d97c5SJed Brown       pcbddc->coarse_communications_type = GATHERS_BDDC;
40220c7d97c5SJed Brown       coarse_mat_type = MATSEQAIJ;
40230c7d97c5SJed Brown       coarse_pc_type  = PCLU;
402453cdbc3dSStefano Zampini       coarse_ksp_type  = KSPPREONLY;
40250c7d97c5SJed Brown       coarse_comm = PETSC_COMM_SELF;
40260c7d97c5SJed Brown       active_rank = rank_prec_comm;
40270c7d97c5SJed Brown       break;
40280c7d97c5SJed Brown 
40290c7d97c5SJed Brown     case(PARALLEL_BDDC):
40300c7d97c5SJed Brown 
40310c7d97c5SJed Brown       pcbddc->coarse_communications_type = SCATTERS_BDDC;
40320c7d97c5SJed Brown       coarse_mat_type = MATMPIAIJ;
40330c7d97c5SJed Brown       coarse_pc_type  = PCREDUNDANT;
403453cdbc3dSStefano Zampini       coarse_ksp_type  = KSPPREONLY;
40350c7d97c5SJed Brown       coarse_comm = prec_comm;
40360c7d97c5SJed Brown       active_rank = rank_prec_comm;
40370c7d97c5SJed Brown       break;
40380c7d97c5SJed Brown 
40390c7d97c5SJed Brown     case(SEQUENTIAL_BDDC):
40400c7d97c5SJed Brown       pcbddc->coarse_communications_type = GATHERS_BDDC;
40410c7d97c5SJed Brown       coarse_mat_type = MATSEQAIJ;
40420c7d97c5SJed Brown       coarse_pc_type = PCLU;
404353cdbc3dSStefano Zampini       coarse_ksp_type  = KSPPREONLY;
40440c7d97c5SJed Brown       coarse_comm = PETSC_COMM_SELF;
40450c7d97c5SJed Brown       active_rank = master_proc;
40460c7d97c5SJed Brown       break;
40470c7d97c5SJed Brown   }
40480c7d97c5SJed Brown 
40490c7d97c5SJed Brown   switch(pcbddc->coarse_communications_type){
40500c7d97c5SJed Brown 
40510c7d97c5SJed Brown     case(SCATTERS_BDDC):
40520c7d97c5SJed Brown       {
40530c7d97c5SJed Brown         if (pcbddc->coarse_problem_type==MULTILEVEL_BDDC) {
40540c7d97c5SJed Brown 
40552e8d2280SStefano Zampini           IS coarse_IS;
40562e8d2280SStefano Zampini 
4057523858cfSStefano Zampini           if(pcbddc->coarsening_ratio == 1) {
4058523858cfSStefano Zampini             ins_local_primal_size = pcbddc->local_primal_size;
4059523858cfSStefano Zampini             ins_local_primal_indices = pcbddc->local_primal_indices;
4060523858cfSStefano Zampini             if (coarse_color == 0) { ierr = PetscFree(ranks_recv);CHKERRQ(ierr); }
4061523858cfSStefano Zampini             /* nonzeros */
4062523858cfSStefano Zampini             ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&dnz);CHKERRQ(ierr);
4063523858cfSStefano Zampini             ierr = PetscMemzero(dnz,ins_local_primal_size*sizeof(PetscInt));CHKERRQ(ierr);
4064523858cfSStefano Zampini             for (i=0;i<ins_local_primal_size;i++) {
4065523858cfSStefano Zampini               dnz[i] = ins_local_primal_size;
4066523858cfSStefano Zampini             }
4067523858cfSStefano Zampini           } else {
40680c7d97c5SJed Brown             PetscMPIInt send_size;
4069ef028eecSStefano Zampini             PetscMPIInt *send_buffer;
40700c7d97c5SJed Brown             PetscInt    *aux_ins_indices;
40710c7d97c5SJed Brown             PetscInt    ii,jj;
40720c7d97c5SJed Brown             MPI_Request *requests;
4073ef028eecSStefano Zampini 
4074523858cfSStefano Zampini             ierr = PetscMalloc(count_recv*sizeof(PetscMPIInt),&localdispl2);CHKERRQ(ierr);
4075523858cfSStefano Zampini             /* reusing pcbddc->local_primal_displacements and pcbddc->replicated_primal_size */
4076523858cfSStefano Zampini             ierr = PetscFree(pcbddc->local_primal_displacements);CHKERRQ(ierr);
4077523858cfSStefano Zampini             ierr = PetscMalloc((count_recv+1)*sizeof(PetscMPIInt),&pcbddc->local_primal_displacements);CHKERRQ(ierr);
4078523858cfSStefano Zampini             pcbddc->replicated_primal_size = count_recv;
4079523858cfSStefano Zampini             j = 0;
4080523858cfSStefano Zampini             for (i=0;i<count_recv;i++) {
4081523858cfSStefano Zampini               pcbddc->local_primal_displacements[i] = j;
4082523858cfSStefano Zampini               j += pcbddc->local_primal_sizes[ranks_recv[i]];
4083523858cfSStefano Zampini             }
4084523858cfSStefano Zampini             pcbddc->local_primal_displacements[count_recv] = j;
4085523858cfSStefano Zampini             ierr = PetscMalloc(j*sizeof(PetscMPIInt),&pcbddc->replicated_local_primal_indices);CHKERRQ(ierr);
40860c7d97c5SJed Brown             /* allocate auxiliary space */
4087523858cfSStefano Zampini             ierr = PetscMalloc(count_recv*sizeof(PetscMPIInt),&localsizes2);CHKERRQ(ierr);
40880c7d97c5SJed Brown             ierr = PetscMalloc(pcbddc->coarse_size*sizeof(PetscInt),&aux_ins_indices);CHKERRQ(ierr);
40890c7d97c5SJed Brown             ierr = PetscMemzero(aux_ins_indices,pcbddc->coarse_size*sizeof(PetscInt));CHKERRQ(ierr);
40900c7d97c5SJed Brown             /* allocate requests for message passing */
40910c7d97c5SJed Brown             ierr = PetscMalloc((count_recv+1)*sizeof(MPI_Request),&requests);CHKERRQ(ierr);
4092523858cfSStefano Zampini             for (i=0;i<count_recv+1;i++) { requests[i]=MPI_REQUEST_NULL; }
4093523858cfSStefano Zampini             /* send indices to be inserted */
4094523858cfSStefano Zampini             for (i=0;i<count_recv;i++) {
4095523858cfSStefano Zampini               send_size = pcbddc->local_primal_sizes[ranks_recv[i]];
4096523858cfSStefano Zampini               ierr = MPI_Irecv(&pcbddc->replicated_local_primal_indices[pcbddc->local_primal_displacements[i]],send_size,MPIU_INT,ranks_recv[i],999,prec_comm,&requests[i]);CHKERRQ(ierr);
4097523858cfSStefano Zampini             }
4098523858cfSStefano Zampini             if (rank_coarse_proc_send_to != MPI_PROC_NULL ) {
4099523858cfSStefano Zampini               send_size = pcbddc->local_primal_size;
4100ef028eecSStefano Zampini               ierr = PetscMalloc(send_size*sizeof(PetscMPIInt),&send_buffer);CHKERRQ(ierr);
4101ef028eecSStefano Zampini               for (i=0;i<send_size;i++) {
4102ef028eecSStefano Zampini                 send_buffer[i]=(PetscMPIInt)pcbddc->local_primal_indices[i];
4103ef028eecSStefano Zampini               }
4104ef028eecSStefano Zampini               ierr = MPI_Isend(send_buffer,send_size,MPIU_INT,rank_coarse_proc_send_to,999,prec_comm,&requests[count_recv]);CHKERRQ(ierr);
4105523858cfSStefano Zampini             }
4106523858cfSStefano Zampini             ierr = MPI_Waitall(count_recv+1,requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4107ef028eecSStefano Zampini             if (rank_coarse_proc_send_to != MPI_PROC_NULL ) {
4108ef028eecSStefano Zampini               ierr = PetscFree(send_buffer);CHKERRQ(ierr);
4109ef028eecSStefano Zampini             }
41100c7d97c5SJed Brown             j = 0;
41110c7d97c5SJed Brown             for (i=0;i<count_recv;i++) {
41122e8d2280SStefano Zampini               ii = pcbddc->local_primal_displacements[i+1]-pcbddc->local_primal_displacements[i];
41132e8d2280SStefano Zampini               localsizes2[i] = ii*ii;
41140c7d97c5SJed Brown               localdispl2[i] = j;
41150c7d97c5SJed Brown               j += localsizes2[i];
4116523858cfSStefano Zampini               jj = pcbddc->local_primal_displacements[i];
41174fad6a16SStefano Zampini               /* it counts the coarse subdomains sharing the coarse node */
41182e8d2280SStefano Zampini               for (k=0;k<ii;k++) {
41194fad6a16SStefano Zampini                 aux_ins_indices[pcbddc->replicated_local_primal_indices[jj+k]] += 1;
41200c7d97c5SJed Brown               }
41214fad6a16SStefano Zampini             }
4122523858cfSStefano Zampini             /* temp_coarse_mat_vals used to store matrix values to be received */
41230c7d97c5SJed Brown             ierr = PetscMalloc(j*sizeof(PetscScalar),&temp_coarse_mat_vals);CHKERRQ(ierr);
41240c7d97c5SJed Brown             /* evaluate how many values I will insert in coarse mat */
41250c7d97c5SJed Brown             ins_local_primal_size = 0;
4126ea7e1babSStefano Zampini             for (i=0;i<pcbddc->coarse_size;i++) {
4127ea7e1babSStefano Zampini               if (aux_ins_indices[i]) {
41280c7d97c5SJed Brown                 ins_local_primal_size++;
4129ea7e1babSStefano Zampini               }
4130ea7e1babSStefano Zampini             }
41310c7d97c5SJed Brown             /* evaluate indices I will insert in coarse mat */
41320c7d97c5SJed Brown             ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr);
41330c7d97c5SJed Brown             j = 0;
4134ea7e1babSStefano Zampini             for(i=0;i<pcbddc->coarse_size;i++) {
4135ea7e1babSStefano Zampini               if(aux_ins_indices[i]) {
41362e8d2280SStefano Zampini                 ins_local_primal_indices[j] = i;
41372e8d2280SStefano Zampini                 j++;
4138ea7e1babSStefano Zampini               }
4139ea7e1babSStefano Zampini             }
4140523858cfSStefano Zampini             /* processes participating in coarse problem receive matrix data from their friends */
4141523858cfSStefano Zampini             for (i=0;i<count_recv;i++) {
4142523858cfSStefano Zampini               ierr = MPI_Irecv(&temp_coarse_mat_vals[localdispl2[i]],localsizes2[i],MPIU_SCALAR,ranks_recv[i],666,prec_comm,&requests[i]);CHKERRQ(ierr);
4143523858cfSStefano Zampini             }
4144523858cfSStefano Zampini             if (rank_coarse_proc_send_to != MPI_PROC_NULL ) {
4145523858cfSStefano Zampini               send_size = pcbddc->local_primal_size*pcbddc->local_primal_size;
4146523858cfSStefano Zampini               ierr = MPI_Isend(&coarse_submat_vals[0],send_size,MPIU_SCALAR,rank_coarse_proc_send_to,666,prec_comm,&requests[count_recv]);CHKERRQ(ierr);
4147523858cfSStefano Zampini             }
4148523858cfSStefano Zampini             ierr = MPI_Waitall(count_recv+1,requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4149523858cfSStefano Zampini             /* nonzeros */
4150523858cfSStefano Zampini             ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&dnz);CHKERRQ(ierr);
4151523858cfSStefano Zampini             ierr = PetscMemzero(dnz,ins_local_primal_size*sizeof(PetscInt));CHKERRQ(ierr);
41520c7d97c5SJed Brown             /* use aux_ins_indices to realize a global to local mapping */
41530c7d97c5SJed Brown             j=0;
41540c7d97c5SJed Brown             for(i=0;i<pcbddc->coarse_size;i++){
41550c7d97c5SJed Brown               if(aux_ins_indices[i]==0){
41560c7d97c5SJed Brown                 aux_ins_indices[i]=-1;
41570c7d97c5SJed Brown               } else {
41580c7d97c5SJed Brown                 aux_ins_indices[i]=j;
41590c7d97c5SJed Brown                 j++;
41600c7d97c5SJed Brown               }
41610c7d97c5SJed Brown             }
41624fad6a16SStefano Zampini             for (i=0;i<count_recv;i++) {
4163523858cfSStefano Zampini               j = pcbddc->local_primal_sizes[ranks_recv[i]];
4164523858cfSStefano Zampini               for (k=0;k<j;k++) {
4165523858cfSStefano Zampini                 dnz[aux_ins_indices[pcbddc->replicated_local_primal_indices[pcbddc->local_primal_displacements[i]+k]]] += j;
41660c7d97c5SJed Brown               }
41670c7d97c5SJed Brown             }
4168523858cfSStefano Zampini             /* check */
4169523858cfSStefano Zampini             for (i=0;i<ins_local_primal_size;i++) {
4170523858cfSStefano Zampini               if (dnz[i] > ins_local_primal_size) {
4171523858cfSStefano Zampini                 dnz[i] = ins_local_primal_size;
41720c7d97c5SJed Brown               }
41730c7d97c5SJed Brown             }
41740c7d97c5SJed Brown             ierr = PetscFree(requests);CHKERRQ(ierr);
41750c7d97c5SJed Brown             ierr = PetscFree(aux_ins_indices);CHKERRQ(ierr);
41760c7d97c5SJed Brown             if (coarse_color == 0) { ierr = PetscFree(ranks_recv);CHKERRQ(ierr); }
41774fad6a16SStefano Zampini           }
41780c7d97c5SJed Brown           /* create local to global mapping needed by coarse MATIS */
4179142dfd88SStefano Zampini           if (coarse_comm != MPI_COMM_NULL ) {ierr = MPI_Comm_free(&coarse_comm);CHKERRQ(ierr);}
41800c7d97c5SJed Brown           coarse_comm = prec_comm;
41810c7d97c5SJed Brown           active_rank = rank_prec_comm;
41820c7d97c5SJed Brown           ierr = ISCreateGeneral(coarse_comm,ins_local_primal_size,ins_local_primal_indices,PETSC_COPY_VALUES,&coarse_IS);CHKERRQ(ierr);
41830c7d97c5SJed Brown           ierr = ISLocalToGlobalMappingCreateIS(coarse_IS,&coarse_ISLG);CHKERRQ(ierr);
41840c7d97c5SJed Brown           ierr = ISDestroy(&coarse_IS);CHKERRQ(ierr);
41852e8d2280SStefano Zampini         } else if (pcbddc->coarse_problem_type==PARALLEL_BDDC) {
41860c7d97c5SJed Brown           /* arrays for values insertion */
41870c7d97c5SJed Brown           ins_local_primal_size = pcbddc->local_primal_size;
41882e8d2280SStefano Zampini           ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr);
41890c7d97c5SJed Brown           ierr = PetscMalloc(ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar),&ins_coarse_mat_vals);CHKERRQ(ierr);
41900c7d97c5SJed Brown           for (j=0;j<ins_local_primal_size;j++){
41910c7d97c5SJed Brown             ins_local_primal_indices[j]=pcbddc->local_primal_indices[j];
41924fad6a16SStefano Zampini             for (i=0;i<ins_local_primal_size;i++) {
41934fad6a16SStefano Zampini               ins_coarse_mat_vals[j*ins_local_primal_size+i]=coarse_submat_vals[j*ins_local_primal_size+i];
41944fad6a16SStefano Zampini             }
41950c7d97c5SJed Brown           }
41960c7d97c5SJed Brown         }
41970c7d97c5SJed Brown         break;
41980c7d97c5SJed Brown 
41990c7d97c5SJed Brown     }
42000c7d97c5SJed Brown 
42010c7d97c5SJed Brown     case(GATHERS_BDDC):
42020c7d97c5SJed Brown       {
42030c7d97c5SJed Brown 
42040c7d97c5SJed Brown         PetscMPIInt mysize,mysize2;
4205ef028eecSStefano Zampini         PetscMPIInt *send_buffer;
42060c7d97c5SJed Brown 
42070c7d97c5SJed Brown         if (rank_prec_comm==active_rank) {
42080c7d97c5SJed Brown           ierr = PetscMalloc ( pcbddc->replicated_primal_size*sizeof(PetscMPIInt),&pcbddc->replicated_local_primal_indices);CHKERRQ(ierr);
42090bdf917eSStefano Zampini           ierr = PetscMalloc ( pcbddc->replicated_primal_size*sizeof(PetscScalar),&pcbddc->replicated_local_primal_values);CHKERRQ(ierr);
42100c7d97c5SJed Brown           ierr = PetscMalloc ( size_prec_comm*sizeof(PetscMPIInt),&localsizes2);CHKERRQ(ierr);
42110c7d97c5SJed Brown           ierr = PetscMalloc ( size_prec_comm*sizeof(PetscMPIInt),&localdispl2);CHKERRQ(ierr);
42120c7d97c5SJed Brown           /* arrays for values insertion */
42134fad6a16SStefano Zampini           for (i=0;i<size_prec_comm;i++) { localsizes2[i]=pcbddc->local_primal_sizes[i]*pcbddc->local_primal_sizes[i]; }
42140c7d97c5SJed Brown           localdispl2[0]=0;
42154fad6a16SStefano Zampini           for (i=1;i<size_prec_comm;i++) { localdispl2[i]=localsizes2[i-1]+localdispl2[i-1]; }
42160c7d97c5SJed Brown           j=0;
42174fad6a16SStefano Zampini           for (i=0;i<size_prec_comm;i++) { j+=localsizes2[i]; }
42180c7d97c5SJed Brown           ierr = PetscMalloc ( j*sizeof(PetscScalar),&temp_coarse_mat_vals);CHKERRQ(ierr);
42190c7d97c5SJed Brown         }
42200c7d97c5SJed Brown 
42210c7d97c5SJed Brown         mysize=pcbddc->local_primal_size;
42220c7d97c5SJed Brown         mysize2=pcbddc->local_primal_size*pcbddc->local_primal_size;
4223ef028eecSStefano Zampini         ierr = PetscMalloc(mysize*sizeof(PetscMPIInt),&send_buffer);CHKERRQ(ierr);
4224ef028eecSStefano Zampini         for (i=0;i<mysize;i++) {
4225ef028eecSStefano Zampini           send_buffer[i]=(PetscMPIInt)pcbddc->local_primal_indices[i];
4226ef028eecSStefano Zampini         }
42270c7d97c5SJed Brown         if (pcbddc->coarse_problem_type == SEQUENTIAL_BDDC){
4228ef028eecSStefano Zampini           ierr = MPI_Gatherv(send_buffer,mysize,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
422953cdbc3dSStefano Zampini           ierr = MPI_Gatherv(&coarse_submat_vals[0],mysize2,MPIU_SCALAR,&temp_coarse_mat_vals[0],localsizes2,localdispl2,MPIU_SCALAR,master_proc,prec_comm);CHKERRQ(ierr);
42300c7d97c5SJed Brown         } else {
4231ef028eecSStefano Zampini           ierr = MPI_Allgatherv(send_buffer,mysize,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,prec_comm);CHKERRQ(ierr);
423253cdbc3dSStefano Zampini           ierr = MPI_Allgatherv(&coarse_submat_vals[0],mysize2,MPIU_SCALAR,&temp_coarse_mat_vals[0],localsizes2,localdispl2,MPIU_SCALAR,prec_comm);CHKERRQ(ierr);
42330c7d97c5SJed Brown         }
4234ef028eecSStefano Zampini         ierr = PetscFree(send_buffer);CHKERRQ(ierr);
42350c7d97c5SJed Brown         break;
4236da1bb401SStefano Zampini       }/* switch on coarse problem and communications associated with finished */
42370c7d97c5SJed Brown   }
42380c7d97c5SJed Brown 
42390c7d97c5SJed Brown   /* Now create and fill up coarse matrix */
42400c7d97c5SJed Brown   if ( rank_prec_comm == active_rank ) {
4241142dfd88SStefano Zampini 
4242142dfd88SStefano Zampini     Mat matis_coarse_local_mat;
4243142dfd88SStefano Zampini 
42440c7d97c5SJed Brown     if (pcbddc->coarse_problem_type != MULTILEVEL_BDDC) {
42450c7d97c5SJed Brown       ierr = MatCreate(coarse_comm,&pcbddc->coarse_mat);CHKERRQ(ierr);
42460c7d97c5SJed Brown       ierr = MatSetSizes(pcbddc->coarse_mat,PETSC_DECIDE,PETSC_DECIDE,pcbddc->coarse_size,pcbddc->coarse_size);CHKERRQ(ierr);
42470c7d97c5SJed Brown       ierr = MatSetType(pcbddc->coarse_mat,coarse_mat_type);CHKERRQ(ierr);
42483b03a366Sstefano_zampini       ierr = MatSetUp(pcbddc->coarse_mat);CHKERRQ(ierr);
4249da1bb401SStefano Zampini       ierr = MatSetOption(pcbddc->coarse_mat,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr); /* local values stored in column major */
42503b03a366Sstefano_zampini       ierr = MatSetOption(pcbddc->coarse_mat,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr);
42510c7d97c5SJed Brown     } else {
42524fad6a16SStefano Zampini       ierr = MatCreateIS(coarse_comm,1,PETSC_DECIDE,PETSC_DECIDE,pcbddc->coarse_size,pcbddc->coarse_size,coarse_ISLG,&pcbddc->coarse_mat);CHKERRQ(ierr);
42533b03a366Sstefano_zampini       ierr = MatSetUp(pcbddc->coarse_mat);CHKERRQ(ierr);
42540c7d97c5SJed Brown       ierr = MatISGetLocalMat(pcbddc->coarse_mat,&matis_coarse_local_mat);CHKERRQ(ierr);
42553b03a366Sstefano_zampini       ierr = MatSetUp(matis_coarse_local_mat);CHKERRQ(ierr);
4256da1bb401SStefano Zampini       ierr = MatSetOption(matis_coarse_local_mat,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr); /* local values stored in column major */
4257a0ba757dSStefano Zampini       ierr = MatSetOption(matis_coarse_local_mat,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr);
42580c7d97c5SJed Brown     }
4259142dfd88SStefano Zampini     /* preallocation */
4260142dfd88SStefano Zampini     if (pcbddc->coarse_problem_type != MULTILEVEL_BDDC) {
4261ef028eecSStefano Zampini 
4262142dfd88SStefano Zampini       PetscInt lrows,lcols;
4263ef028eecSStefano Zampini 
4264142dfd88SStefano Zampini       ierr = MatGetLocalSize(pcbddc->coarse_mat,&lrows,&lcols);CHKERRQ(ierr);
4265142dfd88SStefano Zampini       ierr = MatPreallocateInitialize(coarse_comm,lrows,lcols,dnz,onz);CHKERRQ(ierr);
4266ef028eecSStefano Zampini 
4267142dfd88SStefano Zampini       if (pcbddc->coarse_problem_type == PARALLEL_BDDC) {
4268ef028eecSStefano Zampini 
4269ef028eecSStefano Zampini         Vec         vec_dnz,vec_onz;
4270ef028eecSStefano Zampini         PetscScalar *my_dnz,*my_onz,*array;
4271ef028eecSStefano Zampini         PetscInt    *mat_ranges,*row_ownership;
4272ef028eecSStefano Zampini         PetscInt    coarse_index_row,coarse_index_col,owner;
4273ef028eecSStefano Zampini 
4274ef028eecSStefano Zampini         ierr = VecCreate(prec_comm,&vec_dnz);CHKERRQ(ierr);
4275ef028eecSStefano Zampini         ierr = VecSetSizes(vec_dnz,PETSC_DECIDE,pcbddc->coarse_size);CHKERRQ(ierr);
4276ef028eecSStefano Zampini         ierr = VecSetType(vec_dnz,VECMPI);CHKERRQ(ierr);
4277ef028eecSStefano Zampini         ierr = VecDuplicate(vec_dnz,&vec_onz);CHKERRQ(ierr);
4278ef028eecSStefano Zampini 
4279ef028eecSStefano Zampini         ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscScalar),&my_dnz);CHKERRQ(ierr);
4280ef028eecSStefano Zampini         ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscScalar),&my_onz);CHKERRQ(ierr);
4281ef028eecSStefano Zampini         ierr = PetscMemzero(my_dnz,pcbddc->local_primal_size*sizeof(PetscScalar));CHKERRQ(ierr);
4282ef028eecSStefano Zampini         ierr = PetscMemzero(my_onz,pcbddc->local_primal_size*sizeof(PetscScalar));CHKERRQ(ierr);
4283ef028eecSStefano Zampini 
4284ef028eecSStefano Zampini         ierr = PetscMalloc(pcbddc->coarse_size*sizeof(PetscInt),&row_ownership);CHKERRQ(ierr);
4285ef028eecSStefano Zampini         ierr = MatGetOwnershipRanges(pcbddc->coarse_mat,(const PetscInt**)&mat_ranges);CHKERRQ(ierr);
4286142dfd88SStefano Zampini         for (i=0;i<size_prec_comm;i++) {
4287ef028eecSStefano Zampini           for (j=mat_ranges[i];j<mat_ranges[i+1];j++) {
4288ef028eecSStefano Zampini             row_ownership[j]=i;
4289142dfd88SStefano Zampini           }
4290142dfd88SStefano Zampini         }
4291ef028eecSStefano Zampini 
4292ef028eecSStefano Zampini         for (i=0;i<pcbddc->local_primal_size;i++) {
4293ef028eecSStefano Zampini           coarse_index_row = pcbddc->local_primal_indices[i];
4294ef028eecSStefano Zampini           owner = row_ownership[coarse_index_row];
4295ef028eecSStefano Zampini           for (j=i;j<pcbddc->local_primal_size;j++) {
4296ef028eecSStefano Zampini             owner = row_ownership[coarse_index_row];
4297ef028eecSStefano Zampini             coarse_index_col = pcbddc->local_primal_indices[j];
4298ef028eecSStefano Zampini             if (coarse_index_col > mat_ranges[owner]-1 && coarse_index_col < mat_ranges[owner+1] ) {
4299ef028eecSStefano Zampini               my_dnz[i] += 1.0;
4300142dfd88SStefano Zampini             } else {
4301ef028eecSStefano Zampini               my_onz[i] += 1.0;
4302142dfd88SStefano Zampini             }
4303ef028eecSStefano Zampini             if (i != j) {
4304ef028eecSStefano Zampini               owner = row_ownership[coarse_index_col];
4305ef028eecSStefano Zampini               if (coarse_index_row > mat_ranges[owner]-1 && coarse_index_row < mat_ranges[owner+1] ) {
4306ef028eecSStefano Zampini                 my_dnz[j] += 1.0;
4307142dfd88SStefano Zampini               } else {
4308ef028eecSStefano Zampini                 my_onz[j] += 1.0;
4309142dfd88SStefano Zampini               }
4310142dfd88SStefano Zampini             }
4311142dfd88SStefano Zampini           }
4312142dfd88SStefano Zampini         }
4313ef028eecSStefano Zampini         ierr = VecSet(vec_dnz,0.0);CHKERRQ(ierr);
4314ef028eecSStefano Zampini         ierr = VecSet(vec_onz,0.0);CHKERRQ(ierr);
4315ef028eecSStefano Zampini         ierr = VecSetValues(vec_dnz,pcbddc->local_primal_size,pcbddc->local_primal_indices,my_dnz,ADD_VALUES);CHKERRQ(ierr);
4316ef028eecSStefano Zampini         ierr = VecSetValues(vec_onz,pcbddc->local_primal_size,pcbddc->local_primal_indices,my_onz,ADD_VALUES);CHKERRQ(ierr);
4317ef028eecSStefano Zampini         ierr = VecAssemblyBegin(vec_dnz);CHKERRQ(ierr);
4318ef028eecSStefano Zampini         ierr = VecAssemblyBegin(vec_onz);CHKERRQ(ierr);
4319ef028eecSStefano Zampini         ierr = VecAssemblyEnd(vec_dnz);CHKERRQ(ierr);
4320ef028eecSStefano Zampini         ierr = VecAssemblyEnd(vec_onz);CHKERRQ(ierr);
4321ef028eecSStefano Zampini         j = mat_ranges[rank_prec_comm+1]-mat_ranges[rank_prec_comm];
4322ef028eecSStefano Zampini         ierr = VecGetArray(vec_dnz,&array);CHKERRQ(ierr);
4323ef028eecSStefano Zampini         for (i=0;i<j;i++) {
4324ef028eecSStefano Zampini           dnz[i] = (PetscInt)array[i];
4325142dfd88SStefano Zampini         }
4326ef028eecSStefano Zampini         ierr = VecRestoreArray(vec_dnz,&array);CHKERRQ(ierr);
4327ef028eecSStefano Zampini         ierr = VecGetArray(vec_onz,&array);CHKERRQ(ierr);
4328ef028eecSStefano Zampini         for (i=0;i<j;i++) {
4329ef028eecSStefano Zampini           onz[i] = (PetscInt)array[i];
4330142dfd88SStefano Zampini         }
4331ef028eecSStefano Zampini         ierr = VecRestoreArray(vec_onz,&array);CHKERRQ(ierr);
4332ef028eecSStefano Zampini         ierr = PetscFree(my_dnz);CHKERRQ(ierr);
4333ef028eecSStefano Zampini         ierr = PetscFree(my_onz);CHKERRQ(ierr);
4334ef028eecSStefano Zampini         ierr = PetscFree(row_ownership);CHKERRQ(ierr);
4335ef028eecSStefano Zampini         ierr = VecDestroy(&vec_dnz);CHKERRQ(ierr);
4336ef028eecSStefano Zampini         ierr = VecDestroy(&vec_onz);CHKERRQ(ierr);
4337142dfd88SStefano Zampini       } else {
4338142dfd88SStefano Zampini         for (k=0;k<size_prec_comm;k++){
4339142dfd88SStefano Zampini           offset=pcbddc->local_primal_displacements[k];
4340142dfd88SStefano Zampini           offset2=localdispl2[k];
4341142dfd88SStefano Zampini           ins_local_primal_size = pcbddc->local_primal_sizes[k];
4342ef028eecSStefano Zampini           ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr);
4343ef028eecSStefano Zampini           for (j=0;j<ins_local_primal_size;j++){
4344ef028eecSStefano Zampini             ins_local_primal_indices[j]=(PetscInt)pcbddc->replicated_local_primal_indices[offset+j];
4345ef028eecSStefano Zampini           }
4346142dfd88SStefano Zampini           for (j=0;j<ins_local_primal_size;j++) {
4347142dfd88SStefano Zampini             ierr = MatPreallocateSet(ins_local_primal_indices[j],ins_local_primal_size,ins_local_primal_indices,dnz,onz);CHKERRQ(ierr);
4348142dfd88SStefano Zampini           }
4349ef028eecSStefano Zampini           ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr);
4350142dfd88SStefano Zampini         }
4351142dfd88SStefano Zampini       }
4352142dfd88SStefano Zampini       /* check */
4353142dfd88SStefano Zampini       for (i=0;i<lrows;i++) {
4354142dfd88SStefano Zampini         if (dnz[i]>lcols) {
4355142dfd88SStefano Zampini           dnz[i]=lcols;
4356142dfd88SStefano Zampini         }
4357142dfd88SStefano Zampini         if (onz[i]>pcbddc->coarse_size-lcols) {
4358142dfd88SStefano Zampini           onz[i]=pcbddc->coarse_size-lcols;
4359142dfd88SStefano Zampini         }
4360142dfd88SStefano Zampini       }
4361142dfd88SStefano Zampini       ierr = MatSeqAIJSetPreallocation(pcbddc->coarse_mat,PETSC_NULL,dnz);CHKERRQ(ierr);
4362142dfd88SStefano Zampini       ierr = MatMPIAIJSetPreallocation(pcbddc->coarse_mat,PETSC_NULL,dnz,PETSC_NULL,onz);CHKERRQ(ierr);
4363142dfd88SStefano Zampini       ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr);
4364142dfd88SStefano Zampini     } else {
4365523858cfSStefano Zampini       ierr = MatSeqAIJSetPreallocation(matis_coarse_local_mat,0,dnz);CHKERRQ(ierr);
4366523858cfSStefano Zampini       ierr = PetscFree(dnz);CHKERRQ(ierr);
4367142dfd88SStefano Zampini     }
4368142dfd88SStefano Zampini     /* insert values */
4369523858cfSStefano Zampini     if (pcbddc->coarse_problem_type == PARALLEL_BDDC) {
43700c7d97c5SJed Brown       ierr = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,ADD_VALUES);CHKERRQ(ierr);
4371523858cfSStefano Zampini     } else if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
4372523858cfSStefano Zampini       if (pcbddc->coarsening_ratio == 1) {
4373523858cfSStefano Zampini         ins_coarse_mat_vals = coarse_submat_vals;
4374523858cfSStefano Zampini         ierr = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,INSERT_VALUES);CHKERRQ(ierr);
4375523858cfSStefano Zampini       } else {
4376523858cfSStefano Zampini         ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr);
4377523858cfSStefano Zampini         for (k=0;k<pcbddc->replicated_primal_size;k++) {
4378523858cfSStefano Zampini           offset = pcbddc->local_primal_displacements[k];
4379523858cfSStefano Zampini           offset2 = localdispl2[k];
4380523858cfSStefano Zampini           ins_local_primal_size = pcbddc->local_primal_displacements[k+1]-pcbddc->local_primal_displacements[k];
4381ef028eecSStefano Zampini           ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr);
4382ef028eecSStefano Zampini           for (j=0;j<ins_local_primal_size;j++){
4383ef028eecSStefano Zampini             ins_local_primal_indices[j]=(PetscInt)pcbddc->replicated_local_primal_indices[offset+j];
4384ef028eecSStefano Zampini           }
4385523858cfSStefano Zampini           ins_coarse_mat_vals = &temp_coarse_mat_vals[offset2];
4386523858cfSStefano Zampini           ierr = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,ADD_VALUES);CHKERRQ(ierr);
4387ef028eecSStefano Zampini           ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr);
4388523858cfSStefano Zampini         }
4389523858cfSStefano Zampini       }
4390523858cfSStefano Zampini       ins_local_primal_indices = 0;
4391523858cfSStefano Zampini       ins_coarse_mat_vals = 0;
4392ea7e1babSStefano Zampini     } else {
4393ea7e1babSStefano Zampini       for (k=0;k<size_prec_comm;k++){
4394ea7e1babSStefano Zampini         offset=pcbddc->local_primal_displacements[k];
4395ea7e1babSStefano Zampini         offset2=localdispl2[k];
4396ea7e1babSStefano Zampini         ins_local_primal_size = pcbddc->local_primal_sizes[k];
4397ef028eecSStefano Zampini         ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr);
4398ef028eecSStefano Zampini         for (j=0;j<ins_local_primal_size;j++){
4399ef028eecSStefano Zampini           ins_local_primal_indices[j]=(PetscInt)pcbddc->replicated_local_primal_indices[offset+j];
4400ef028eecSStefano Zampini         }
4401ea7e1babSStefano Zampini         ins_coarse_mat_vals = &temp_coarse_mat_vals[offset2];
4402ea7e1babSStefano Zampini         ierr = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,ADD_VALUES);CHKERRQ(ierr);
4403ef028eecSStefano Zampini         ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr);
4404ea7e1babSStefano Zampini       }
4405ea7e1babSStefano Zampini       ins_local_primal_indices = 0;
4406ea7e1babSStefano Zampini       ins_coarse_mat_vals = 0;
4407ea7e1babSStefano Zampini     }
44080c7d97c5SJed Brown     ierr = MatAssemblyBegin(pcbddc->coarse_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
44090c7d97c5SJed Brown     ierr = MatAssemblyEnd(pcbddc->coarse_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
4410142dfd88SStefano Zampini     /* symmetry of coarse matrix */
4411142dfd88SStefano Zampini     if (issym) {
4412142dfd88SStefano Zampini       ierr = MatSetOption(pcbddc->coarse_mat,MAT_SYMMETRIC,PETSC_TRUE);CHKERRQ(ierr);
4413142dfd88SStefano Zampini     }
44140c7d97c5SJed Brown     ierr = MatGetVecs(pcbddc->coarse_mat,&pcbddc->coarse_vec,&pcbddc->coarse_rhs);CHKERRQ(ierr);
44150bdf917eSStefano Zampini   }
44160bdf917eSStefano Zampini 
44170bdf917eSStefano Zampini   /* create loc to glob scatters if needed */
44180bdf917eSStefano Zampini   if (pcbddc->coarse_communications_type == SCATTERS_BDDC) {
44190bdf917eSStefano Zampini      IS local_IS,global_IS;
44200bdf917eSStefano Zampini      ierr = ISCreateStride(PETSC_COMM_SELF,pcbddc->local_primal_size,0,1,&local_IS);CHKERRQ(ierr);
44210bdf917eSStefano Zampini      ierr = ISCreateGeneral(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_indices,PETSC_COPY_VALUES,&global_IS);CHKERRQ(ierr);
44220bdf917eSStefano Zampini      ierr = VecScatterCreate(pcbddc->vec1_P,local_IS,pcbddc->coarse_vec,global_IS,&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr);
44230bdf917eSStefano Zampini      ierr = ISDestroy(&local_IS);CHKERRQ(ierr);
44240bdf917eSStefano Zampini      ierr = ISDestroy(&global_IS);CHKERRQ(ierr);
44250bdf917eSStefano Zampini   }
44260bdf917eSStefano Zampini 
44270bdf917eSStefano Zampini   /* Eval coarse null space */
44280bdf917eSStefano Zampini   if (pcbddc->NullSpace) {
44290bdf917eSStefano Zampini     const Vec      *nsp_vecs;
44300bdf917eSStefano Zampini     PetscInt       nsp_size,coarse_nsp_size;
44310bdf917eSStefano Zampini     PetscBool      nsp_has_cnst;
44320bdf917eSStefano Zampini     PetscReal      test_null;
44330bdf917eSStefano Zampini     Vec            *coarse_nsp_vecs;
44340bdf917eSStefano Zampini 
44350bdf917eSStefano Zampini     coarse_nsp_size = 0;
44360bdf917eSStefano Zampini     coarse_nsp_vecs = 0;
44370bdf917eSStefano Zampini     ierr = MatNullSpaceGetVecs(pcbddc->NullSpace,&nsp_has_cnst,&nsp_size,&nsp_vecs);CHKERRQ(ierr);
44380bdf917eSStefano Zampini     if (rank_prec_comm == active_rank) {
44390bdf917eSStefano Zampini       ierr = PetscMalloc((nsp_size+1)*sizeof(Vec),&coarse_nsp_vecs);CHKERRQ(ierr);
44400bdf917eSStefano Zampini       for (i=0;i<nsp_size+1;i++) {
44410bdf917eSStefano Zampini         ierr = VecDuplicate(pcbddc->coarse_vec,&coarse_nsp_vecs[i]);CHKERRQ(ierr);
44420bdf917eSStefano Zampini       }
44430bdf917eSStefano Zampini     }
44440bdf917eSStefano Zampini     if (nsp_has_cnst) {
44450bdf917eSStefano Zampini       ierr = VecSet(pcis->vec1_N,1.0);CHKERRQ(ierr);
44460bdf917eSStefano Zampini       ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr);
44470bdf917eSStefano Zampini       ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->vec1_P,pcbddc->coarse_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
44480bdf917eSStefano Zampini       ierr = PCBDDCScatterCoarseDataEnd(pc,pcbddc->vec1_P,pcbddc->coarse_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
44490bdf917eSStefano Zampini       if (rank_prec_comm == active_rank) {
44500bdf917eSStefano Zampini         ierr = MatMult(pcbddc->coarse_mat,pcbddc->coarse_vec,pcbddc->coarse_rhs);CHKERRQ(ierr);
44510bdf917eSStefano Zampini         ierr = VecNorm(pcbddc->coarse_rhs,NORM_INFINITY,&test_null);CHKERRQ(ierr);
44520bdf917eSStefano Zampini         if (test_null > 1.0e-12 && pcbddc->dbg_flag ) {
44530bdf917eSStefano Zampini           ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Constant coarse null space error % 1.14e\n",test_null);CHKERRQ(ierr);
44540bdf917eSStefano Zampini         }
44550bdf917eSStefano Zampini         ierr = VecCopy(pcbddc->coarse_vec,coarse_nsp_vecs[coarse_nsp_size]);CHKERRQ(ierr);
44560bdf917eSStefano Zampini         coarse_nsp_size++;
44570bdf917eSStefano Zampini       }
44580bdf917eSStefano Zampini     }
44590bdf917eSStefano Zampini     for (i=0;i<nsp_size;i++)  {
44600bdf917eSStefano Zampini       ierr = VecScatterBegin(matis->ctx,nsp_vecs[i],pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
44610bdf917eSStefano Zampini       ierr = VecScatterEnd  (matis->ctx,nsp_vecs[i],pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
44620bdf917eSStefano Zampini       ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr);
44630bdf917eSStefano Zampini       ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->vec1_P,pcbddc->coarse_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
44640bdf917eSStefano Zampini       ierr = PCBDDCScatterCoarseDataEnd(pc,pcbddc->vec1_P,pcbddc->coarse_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
44650bdf917eSStefano Zampini       if (rank_prec_comm == active_rank) {
44660bdf917eSStefano Zampini         ierr = MatMult(pcbddc->coarse_mat,pcbddc->coarse_vec,pcbddc->coarse_rhs);CHKERRQ(ierr);
44670bdf917eSStefano Zampini         ierr = VecNorm(pcbddc->coarse_rhs,NORM_2,&test_null);CHKERRQ(ierr);
44680bdf917eSStefano Zampini         if (test_null > 1.0e-12 && pcbddc->dbg_flag ) {
44690bdf917eSStefano Zampini           ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Vec %d coarse null space error % 1.14e\n",i,test_null);CHKERRQ(ierr);
44700bdf917eSStefano Zampini         }
44710bdf917eSStefano Zampini         ierr = VecCopy(pcbddc->coarse_vec,coarse_nsp_vecs[coarse_nsp_size]);CHKERRQ(ierr);
44720bdf917eSStefano Zampini         coarse_nsp_size++;
44730bdf917eSStefano Zampini       }
44740bdf917eSStefano Zampini     }
44750bdf917eSStefano Zampini     if (coarse_nsp_size > 0) {
44760bdf917eSStefano Zampini       /* TODO orthonormalize vecs */
44770bdf917eSStefano Zampini       ierr = VecNormalize(coarse_nsp_vecs[0],PETSC_NULL);CHKERRQ(ierr);
44780bdf917eSStefano Zampini       ierr = MatNullSpaceCreate(coarse_comm,PETSC_FALSE,coarse_nsp_size,coarse_nsp_vecs,&pcbddc->CoarseNullSpace);CHKERRQ(ierr);
44790bdf917eSStefano Zampini       for (i=0;i<nsp_size+1;i++) {
44800bdf917eSStefano Zampini         ierr = VecDestroy(&coarse_nsp_vecs[i]);CHKERRQ(ierr);
44810bdf917eSStefano Zampini       }
44820bdf917eSStefano Zampini     }
44830bdf917eSStefano Zampini     ierr = PetscFree(coarse_nsp_vecs);CHKERRQ(ierr);
44840bdf917eSStefano Zampini   }
44850bdf917eSStefano Zampini 
44860bdf917eSStefano Zampini   /* KSP for coarse problem */
44870bdf917eSStefano Zampini   if (rank_prec_comm == active_rank) {
44882e8d2280SStefano Zampini     PetscBool isbddc=PETSC_FALSE;
44890bdf917eSStefano Zampini 
449053cdbc3dSStefano Zampini     ierr = KSPCreate(coarse_comm,&pcbddc->coarse_ksp);CHKERRQ(ierr);
449153cdbc3dSStefano Zampini     ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->coarse_ksp,(PetscObject)pc,1);CHKERRQ(ierr);
449253cdbc3dSStefano Zampini     ierr = KSPSetOperators(pcbddc->coarse_ksp,pcbddc->coarse_mat,pcbddc->coarse_mat,SAME_PRECONDITIONER);CHKERRQ(ierr);
44933b03a366Sstefano_zampini     ierr = KSPSetTolerances(pcbddc->coarse_ksp,PETSC_DEFAULT,PETSC_DEFAULT,PETSC_DEFAULT,max_it_coarse_ksp);CHKERRQ(ierr);
449453cdbc3dSStefano Zampini     ierr = KSPSetType(pcbddc->coarse_ksp,coarse_ksp_type);CHKERRQ(ierr);
449553cdbc3dSStefano Zampini     ierr = KSPGetPC(pcbddc->coarse_ksp,&pc_temp);CHKERRQ(ierr);
449653cdbc3dSStefano Zampini     ierr = PCSetType(pc_temp,coarse_pc_type);CHKERRQ(ierr);
44970c7d97c5SJed Brown     /* Allow user's customization */
4498da1bb401SStefano Zampini     ierr = KSPSetOptionsPrefix(pcbddc->coarse_ksp,"coarse_");CHKERRQ(ierr);
44990c7d97c5SJed Brown     /* Set Up PC for coarse problem BDDC */
450053cdbc3dSStefano Zampini     if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
45014fad6a16SStefano Zampini       i = pcbddc->current_level+1;
45024fad6a16SStefano Zampini       ierr = PCBDDCSetLevel(pc_temp,i);CHKERRQ(ierr);
45034fad6a16SStefano Zampini       ierr = PCBDDCSetCoarseningRatio(pc_temp,pcbddc->coarsening_ratio);CHKERRQ(ierr);
45044fad6a16SStefano Zampini       ierr = PCBDDCSetMaxLevels(pc_temp,pcbddc->max_levels);CHKERRQ(ierr);
450553cdbc3dSStefano Zampini       ierr = PCBDDCSetCoarseProblemType(pc_temp,MULTILEVEL_BDDC);CHKERRQ(ierr);
45060bdf917eSStefano Zampini       if (pcbddc->CoarseNullSpace) { ierr = PCBDDCSetNullSpace(pc_temp,pcbddc->CoarseNullSpace);CHKERRQ(ierr); }
45074fad6a16SStefano Zampini       if (dbg_flag) {
45084fad6a16SStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"----------------Level %d: Setting up level %d---------------\n",pcbddc->current_level,i);CHKERRQ(ierr);
45094fad6a16SStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
451053cdbc3dSStefano Zampini       }
45114fad6a16SStefano Zampini     }
45124fad6a16SStefano Zampini     ierr = KSPSetFromOptions(pcbddc->coarse_ksp);CHKERRQ(ierr);
451353cdbc3dSStefano Zampini     ierr = KSPSetUp(pcbddc->coarse_ksp);CHKERRQ(ierr);
4514142dfd88SStefano Zampini 
45152e8d2280SStefano Zampini     ierr = KSPGetTolerances(pcbddc->coarse_ksp,PETSC_NULL,PETSC_NULL,PETSC_NULL,&j);CHKERRQ(ierr);
45162e8d2280SStefano Zampini     ierr = KSPGetPC(pcbddc->coarse_ksp,&pc_temp);CHKERRQ(ierr);
45172e8d2280SStefano Zampini     ierr = PetscObjectTypeCompare((PetscObject)pc_temp,PCBDDC,&isbddc);CHKERRQ(ierr);
45182e8d2280SStefano Zampini     if (j == 1) {
45192e8d2280SStefano Zampini       ierr = KSPSetNormType(pcbddc->coarse_ksp,KSP_NORM_NONE);CHKERRQ(ierr);
45202e8d2280SStefano Zampini       if (isbddc) {
45212e8d2280SStefano Zampini         ierr = PCBDDCSetUseExactDirichlet(pc_temp,PETSC_FALSE);CHKERRQ(ierr);
45225619798eSStefano Zampini       }
45235619798eSStefano Zampini     }
45240c7d97c5SJed Brown   }
45253b03a366Sstefano_zampini   /* Evaluate condition number of coarse problem for cheby (and verbose output if requested) */
4526142dfd88SStefano Zampini   if ( dbg_flag && rank_prec_comm == active_rank ) {
4527142dfd88SStefano Zampini     KSP check_ksp;
4528142dfd88SStefano Zampini     PC  check_pc;
4529142dfd88SStefano Zampini     Vec check_vec;
4530142dfd88SStefano Zampini     PetscReal   abs_infty_error,infty_error,lambda_min,lambda_max;
453119fd82e9SBarry Smith     KSPType check_ksp_type;
45320c7d97c5SJed Brown 
4533142dfd88SStefano Zampini     /* Create ksp object suitable for extreme eigenvalues' estimation */
4534142dfd88SStefano Zampini     ierr = KSPCreate(coarse_comm,&check_ksp);CHKERRQ(ierr);
4535142dfd88SStefano Zampini     ierr = KSPSetOperators(check_ksp,pcbddc->coarse_mat,pcbddc->coarse_mat,SAME_PRECONDITIONER);CHKERRQ(ierr);
45360bdf917eSStefano Zampini     ierr = KSPSetTolerances(check_ksp,1.e-12,1.e-12,PETSC_DEFAULT,pcbddc->coarse_size);CHKERRQ(ierr);
4537142dfd88SStefano Zampini     if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
4538142dfd88SStefano Zampini       if (issym) {
4539142dfd88SStefano Zampini         check_ksp_type = KSPCG;
4540142dfd88SStefano Zampini       } else {
4541142dfd88SStefano Zampini         check_ksp_type = KSPGMRES;
4542142dfd88SStefano Zampini       }
4543142dfd88SStefano Zampini       ierr = KSPSetComputeSingularValues(check_ksp,PETSC_TRUE);CHKERRQ(ierr);
4544142dfd88SStefano Zampini     } else {
4545142dfd88SStefano Zampini       check_ksp_type = KSPPREONLY;
4546142dfd88SStefano Zampini     }
4547142dfd88SStefano Zampini     ierr = KSPSetType(check_ksp,check_ksp_type);CHKERRQ(ierr);
4548142dfd88SStefano Zampini     ierr = KSPGetPC(pcbddc->coarse_ksp,&check_pc);CHKERRQ(ierr);
4549142dfd88SStefano Zampini     ierr = KSPSetPC(check_ksp,check_pc);CHKERRQ(ierr);
4550142dfd88SStefano Zampini     ierr = KSPSetUp(check_ksp);CHKERRQ(ierr);
4551142dfd88SStefano Zampini     /* create random vec */
4552142dfd88SStefano Zampini     ierr = VecDuplicate(pcbddc->coarse_vec,&check_vec);CHKERRQ(ierr);
4553142dfd88SStefano Zampini     ierr = VecSetRandom(check_vec,PETSC_NULL);CHKERRQ(ierr);
45540bdf917eSStefano Zampini     if (pcbddc->CoarseNullSpace) { ierr = MatNullSpaceRemove(pcbddc->CoarseNullSpace,check_vec,PETSC_NULL);CHKERRQ(ierr); }
4555142dfd88SStefano Zampini     ierr = MatMult(pcbddc->coarse_mat,check_vec,pcbddc->coarse_rhs);CHKERRQ(ierr);
4556142dfd88SStefano Zampini     /* solve coarse problem */
4557142dfd88SStefano Zampini     ierr = KSPSolve(check_ksp,pcbddc->coarse_rhs,pcbddc->coarse_vec);CHKERRQ(ierr);
45580bdf917eSStefano Zampini     if (pcbddc->CoarseNullSpace) { ierr = MatNullSpaceRemove(pcbddc->CoarseNullSpace,pcbddc->coarse_vec,PETSC_NULL);CHKERRQ(ierr); }
4559142dfd88SStefano Zampini     /* check coarse problem residual error */
4560142dfd88SStefano Zampini     ierr = VecAXPY(check_vec,-1.0,pcbddc->coarse_vec);CHKERRQ(ierr);
4561142dfd88SStefano Zampini     ierr = VecNorm(check_vec,NORM_INFINITY,&infty_error);CHKERRQ(ierr);
4562142dfd88SStefano Zampini     ierr = MatMult(pcbddc->coarse_mat,check_vec,pcbddc->coarse_rhs);CHKERRQ(ierr);
4563142dfd88SStefano Zampini     ierr = VecNorm(pcbddc->coarse_rhs,NORM_INFINITY,&abs_infty_error);CHKERRQ(ierr);
4564142dfd88SStefano Zampini     ierr = VecDestroy(&check_vec);CHKERRQ(ierr);
4565142dfd88SStefano Zampini     /* get eigenvalue estimation if inexact */
4566142dfd88SStefano Zampini     if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
4567142dfd88SStefano Zampini       ierr = KSPComputeExtremeSingularValues(check_ksp,&lambda_max,&lambda_min);CHKERRQ(ierr);
4568142dfd88SStefano Zampini       ierr = KSPGetIterationNumber(check_ksp,&k);CHKERRQ(ierr);
4569142dfd88SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem eigenvalues estimated with %d iterations of %s.\n",k,check_ksp_type);CHKERRQ(ierr);
4570e269702eSStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem eigenvalues: % 1.14e %1.14e\n",lambda_min,lambda_max);CHKERRQ(ierr);
45713b03a366Sstefano_zampini     }
4572142dfd88SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem exact infty_error   : %1.14e\n",infty_error);CHKERRQ(ierr);
4573142dfd88SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem residual infty_error: %1.14e\n",abs_infty_error);CHKERRQ(ierr);
4574142dfd88SStefano Zampini     ierr = KSPDestroy(&check_ksp);CHKERRQ(ierr);
457553cdbc3dSStefano Zampini   }
4576142dfd88SStefano Zampini   if (dbg_flag) { ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); }
45770c7d97c5SJed Brown   /* free data structures no longer needed */
45780c7d97c5SJed Brown   if (coarse_ISLG)                { ierr = ISLocalToGlobalMappingDestroy(&coarse_ISLG);CHKERRQ(ierr); }
45790c7d97c5SJed Brown   if (ins_local_primal_indices)   { ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr);  }
45800c7d97c5SJed Brown   if (ins_coarse_mat_vals)        { ierr = PetscFree(ins_coarse_mat_vals);CHKERRQ(ierr);}
45810c7d97c5SJed Brown   if (localsizes2)                { ierr = PetscFree(localsizes2);CHKERRQ(ierr);}
45820c7d97c5SJed Brown   if (localdispl2)                { ierr = PetscFree(localdispl2);CHKERRQ(ierr);}
45830c7d97c5SJed Brown   if (temp_coarse_mat_vals)       { ierr = PetscFree(temp_coarse_mat_vals);CHKERRQ(ierr);}
45840c7d97c5SJed Brown 
45850c7d97c5SJed Brown   PetscFunctionReturn(0);
45860c7d97c5SJed Brown }
45870c7d97c5SJed Brown 
45880c7d97c5SJed Brown #undef __FUNCT__
45890c7d97c5SJed Brown #define __FUNCT__ "PCBDDCManageLocalBoundaries"
459053cdbc3dSStefano Zampini static PetscErrorCode PCBDDCManageLocalBoundaries(PC pc)
45910c7d97c5SJed Brown {
45920c7d97c5SJed Brown 
45930c7d97c5SJed Brown   PC_BDDC     *pcbddc = (PC_BDDC*)pc->data;
45940c7d97c5SJed Brown   PC_IS         *pcis = (PC_IS*)pc->data;
45950c7d97c5SJed Brown   Mat_IS      *matis  = (Mat_IS*)pc->pmat->data;
4596da1bb401SStefano Zampini   PCBDDCGraph mat_graph=pcbddc->mat_graph;
45977cf533a6SStefano Zampini   PetscInt    *is_indices,*auxis;
45983b03a366Sstefano_zampini   PetscInt    bs,ierr,i,j,s,k,iindex,neumann_bsize,dirichlet_bsize;
4599da1bb401SStefano Zampini   PetscInt    total_counts,nodes_touched,where_values=1,vertex_size;
4600534831adSStefano Zampini   PetscMPIInt adapt_interface=0,adapt_interface_reduced=0,NEUMANNCNT=0;
4601da1bb401SStefano Zampini   PetscBool   same_set;
4602a0ba757dSStefano Zampini   MPI_Comm    interface_comm=((PetscObject)pc)->comm;
46033b03a366Sstefano_zampini   PetscBool   use_faces=PETSC_FALSE,use_edges=PETSC_FALSE;
46043b03a366Sstefano_zampini   const PetscInt *neumann_nodes;
46053b03a366Sstefano_zampini   const PetscInt *dirichlet_nodes;
4606a81d60d8SStefano Zampini   IS          used_IS,*custom_ISForDofs;
4607da1bb401SStefano Zampini   PetscScalar *array;
4608da1bb401SStefano Zampini   PetscScalar *array2;
4609da1bb401SStefano Zampini   PetscViewer viewer=pcbddc->dbg_viewer;
46100c7d97c5SJed Brown 
46110c7d97c5SJed Brown   PetscFunctionBegin;
4612da1bb401SStefano Zampini   /* Setup local adjacency graph */
4613da1bb401SStefano Zampini   mat_graph->nvtxs=pcis->n;
4614534831adSStefano Zampini   if (!mat_graph->xadj) { NEUMANNCNT = 1; }
4615da1bb401SStefano Zampini   ierr = PCBDDCSetupLocalAdjacencyGraph(pc);CHKERRQ(ierr);
4616a0ba757dSStefano Zampini   i = mat_graph->nvtxs;
4617a0ba757dSStefano Zampini   ierr = PetscMalloc4(i,PetscInt,&mat_graph->where,i,PetscInt,&mat_graph->count,i+1,PetscInt,&mat_graph->cptr,i,PetscInt,&mat_graph->queue);CHKERRQ(ierr);
46183972b0daSStefano Zampini   ierr = PetscMalloc2(i,PetscInt,&mat_graph->which_dof,i,PetscBool,&mat_graph->touched);CHKERRQ(ierr);
4619a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->where,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
4620a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->count,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
4621a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->which_dof,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
4622a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->queue,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
46233828260eSStefano Zampini   ierr = PetscMemzero(mat_graph->cptr,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr);
4624a0ba757dSStefano Zampini 
4625a81d60d8SStefano Zampini   /* Setting dofs splitting in mat_graph->which_dof
4626a81d60d8SStefano Zampini      Get information about dofs' splitting if provided by the user
4627a81d60d8SStefano Zampini      Otherwise it assumes a constant block size */
4628a81d60d8SStefano Zampini   vertex_size=0;
4629a81d60d8SStefano Zampini   if (!pcbddc->n_ISForDofs) {
4630a81d60d8SStefano Zampini     ierr = MatGetBlockSize(matis->A,&bs);CHKERRQ(ierr);
4631a81d60d8SStefano Zampini     ierr = PetscMalloc(bs*sizeof(IS),&custom_ISForDofs);CHKERRQ(ierr);
4632a81d60d8SStefano Zampini     for (i=0;i<bs;i++) {
4633a81d60d8SStefano Zampini       ierr = ISCreateStride(PETSC_COMM_SELF,pcis->n/bs,i,bs,&custom_ISForDofs[i]);CHKERRQ(ierr);
4634a81d60d8SStefano Zampini     }
4635a81d60d8SStefano Zampini     ierr = PCBDDCSetDofsSplitting(pc,bs,custom_ISForDofs);CHKERRQ(ierr);
4636a81d60d8SStefano Zampini     vertex_size=1;
4637a81d60d8SStefano Zampini     /* remove my references to IS objects */
4638a81d60d8SStefano Zampini     for (i=0;i<bs;i++) {
4639a81d60d8SStefano Zampini       ierr = ISDestroy(&custom_ISForDofs[i]);CHKERRQ(ierr);
4640a81d60d8SStefano Zampini     }
4641a81d60d8SStefano Zampini     ierr = PetscFree(custom_ISForDofs);CHKERRQ(ierr);
4642a81d60d8SStefano Zampini   }
46439c0446d6SStefano Zampini   for (i=0;i<pcbddc->n_ISForDofs;i++) {
4644a81d60d8SStefano Zampini     ierr = ISGetSize(pcbddc->ISForDofs[i],&k);CHKERRQ(ierr);
46459c0446d6SStefano Zampini     ierr = ISGetIndices(pcbddc->ISForDofs[i],(const PetscInt**)&is_indices);CHKERRQ(ierr);
4646a81d60d8SStefano Zampini     for (j=0;j<k;j++) {
46479c0446d6SStefano Zampini       mat_graph->which_dof[is_indices[j]]=i;
46489c0446d6SStefano Zampini     }
46499c0446d6SStefano Zampini     ierr = ISRestoreIndices(pcbddc->ISForDofs[i],(const PetscInt**)&is_indices);CHKERRQ(ierr);
46509c0446d6SStefano Zampini   }
4651a81d60d8SStefano Zampini   /* use mat block size as vertex size if it has not been set yet */
4652a81d60d8SStefano Zampini   if (!vertex_size) {
46533b03a366Sstefano_zampini     ierr = MatGetBlockSize(matis->A,&vertex_size);CHKERRQ(ierr);
46540c7d97c5SJed Brown   }
4655a81d60d8SStefano Zampini 
46563b03a366Sstefano_zampini   /* count number of neigh per node */
46570c7d97c5SJed Brown   total_counts=0;
46583b03a366Sstefano_zampini   for (i=1;i<pcis->n_neigh;i++){
46590c7d97c5SJed Brown     s=pcis->n_shared[i];
46600c7d97c5SJed Brown     total_counts+=s;
466153cdbc3dSStefano Zampini     for (j=0;j<s;j++){
46620c7d97c5SJed Brown       mat_graph->count[pcis->shared[i][j]] += 1;
46630c7d97c5SJed Brown     }
46640c7d97c5SJed Brown   }
4665534831adSStefano Zampini   /* Take into account Neumann data -> it increments number of sharing subdomains for nodes lying on the interface */
466636e030ebSStefano Zampini   ierr = PCBDDCGetNeumannBoundaries(pc,&used_IS);CHKERRQ(ierr);
4667da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
4668da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
466936e030ebSStefano Zampini   if (used_IS) {
467036e030ebSStefano Zampini     ierr = ISGetSize(used_IS,&neumann_bsize);CHKERRQ(ierr);
467136e030ebSStefano Zampini     ierr = ISGetIndices(used_IS,&neumann_nodes);CHKERRQ(ierr);
467253cdbc3dSStefano Zampini     for (i=0;i<neumann_bsize;i++){
467353cdbc3dSStefano Zampini       iindex = neumann_nodes[i];
4674534831adSStefano Zampini       if (mat_graph->count[iindex] > NEUMANNCNT && array[iindex]==0.0){
467553cdbc3dSStefano Zampini         mat_graph->count[iindex]+=1;
46760c7d97c5SJed Brown         total_counts++;
4677da1bb401SStefano Zampini         array[iindex]=array[iindex]+1.0;
4678da1bb401SStefano Zampini       } else if (array[iindex]>0.0) {
4679da1bb401SStefano Zampini         SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"Error for neumann nodes provided to BDDC! They must be uniquely listed! Found duplicate node %d\n",iindex);
46800c7d97c5SJed Brown       }
46810c7d97c5SJed Brown     }
46820c7d97c5SJed Brown   }
4683da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4684da1bb401SStefano Zampini   /* allocate space for storing the set of neighbours for each node */
4685da1bb401SStefano Zampini   ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt*),&mat_graph->neighbours_set);CHKERRQ(ierr);
4686da1bb401SStefano Zampini   if (mat_graph->nvtxs) { ierr = PetscMalloc(total_counts*sizeof(PetscInt),&mat_graph->neighbours_set[0]);CHKERRQ(ierr); }
4687da1bb401SStefano Zampini   for (i=1;i<mat_graph->nvtxs;i++) mat_graph->neighbours_set[i]=mat_graph->neighbours_set[i-1]+mat_graph->count[i-1];
4688a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->count,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
46893b03a366Sstefano_zampini   for (i=1;i<pcis->n_neigh;i++){
46900c7d97c5SJed Brown     s=pcis->n_shared[i];
46910c7d97c5SJed Brown     for (j=0;j<s;j++) {
46920c7d97c5SJed Brown       k=pcis->shared[i][j];
4693da1bb401SStefano Zampini       mat_graph->neighbours_set[k][mat_graph->count[k]] = pcis->neigh[i];
46940c7d97c5SJed Brown       mat_graph->count[k]+=1;
46950c7d97c5SJed Brown     }
46960c7d97c5SJed Brown   }
4697da1bb401SStefano Zampini   /* Check consistency of Neumann nodes */
4698da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
4699da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4700da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4701da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4702da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4703da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
47043b03a366Sstefano_zampini   /* set -1 fake neighbour to mimic Neumann boundary */
470536e030ebSStefano Zampini   if (used_IS) {
470653cdbc3dSStefano Zampini     for (i=0;i<neumann_bsize;i++){
470753cdbc3dSStefano Zampini       iindex = neumann_nodes[i];
4708534831adSStefano Zampini       if (mat_graph->count[iindex] > NEUMANNCNT){
4709da1bb401SStefano Zampini         if (mat_graph->count[iindex]+1 != (PetscInt)array[iindex]) {
4710da1bb401SStefano Zampini           SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_USER,"Neumann nodes provided to BDDC must be consistent among neighbours!\nNode %d: number of sharing subdomains %d != number of subdomains for which it is a neumann node %d\n",iindex,mat_graph->count[iindex]+1,(PetscInt)array[iindex]);
4711da1bb401SStefano Zampini         }
4712da1bb401SStefano Zampini         mat_graph->neighbours_set[iindex][mat_graph->count[iindex]] = -1;
471353cdbc3dSStefano Zampini         mat_graph->count[iindex]+=1;
47140c7d97c5SJed Brown       }
47150c7d97c5SJed Brown     }
471636e030ebSStefano Zampini     ierr = ISRestoreIndices(used_IS,&neumann_nodes);CHKERRQ(ierr);
47170c7d97c5SJed Brown   }
4718da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4719da1bb401SStefano Zampini   /* sort set of sharing subdomains */
4720da1bb401SStefano Zampini   for (i=0;i<mat_graph->nvtxs;i++) { ierr = PetscSortInt(mat_graph->count[i],mat_graph->neighbours_set[i]);CHKERRQ(ierr); }
47213b03a366Sstefano_zampini   /* remove interior nodes and dirichlet boundary nodes from the next search into the graph */
4722da1bb401SStefano Zampini   for (i=0;i<mat_graph->nvtxs;i++){mat_graph->touched[i]=PETSC_FALSE;}
4723da1bb401SStefano Zampini   nodes_touched=0;
472436e030ebSStefano Zampini   ierr = PCBDDCGetDirichletBoundaries(pc,&used_IS);CHKERRQ(ierr);
4725da1bb401SStefano Zampini   ierr = VecSet(pcis->vec2_N,0.0);CHKERRQ(ierr);
4726da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4727da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
4728da1bb401SStefano Zampini   if (used_IS) {
4729da1bb401SStefano Zampini     ierr = ISGetSize(used_IS,&dirichlet_bsize);CHKERRQ(ierr);
4730da1bb401SStefano Zampini     if (dirichlet_bsize && matis->pure_neumann) {
4731da1bb401SStefano Zampini       SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"Dirichlet boundaries are intended to be used with matrices with zeroed rows!\n");
4732da1bb401SStefano Zampini     }
4733da1bb401SStefano Zampini     ierr = ISGetIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
4734da1bb401SStefano Zampini     for (i=0;i<dirichlet_bsize;i++){
4735da1bb401SStefano Zampini       iindex=dirichlet_nodes[i];
4736da1bb401SStefano Zampini       if (mat_graph->count[iindex] && !mat_graph->touched[iindex]) {
4737da1bb401SStefano Zampini         if (array[iindex]>0.0) {
4738da1bb401SStefano Zampini           SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"BDDC cannot have nodes which are marked as Neumann and Dirichlet at the same time! Wrong node %d\n",iindex);
4739da1bb401SStefano Zampini         }
4740da1bb401SStefano Zampini         mat_graph->touched[iindex]=PETSC_TRUE;
4741da1bb401SStefano Zampini         mat_graph->where[iindex]=0;
4742da1bb401SStefano Zampini         nodes_touched++;
4743da1bb401SStefano Zampini         array2[iindex]=array2[iindex]+1.0;
4744da1bb401SStefano Zampini       }
4745da1bb401SStefano Zampini     }
4746da1bb401SStefano Zampini     ierr = ISRestoreIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
4747da1bb401SStefano Zampini   }
4748da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4749da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
4750da1bb401SStefano Zampini   /* Check consistency of Dirichlet nodes */
4751da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_N,1.0);CHKERRQ(ierr);
4752da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
4753da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4754da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4755da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4756da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4757da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
4758da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec2_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4759da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec2_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4760da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4761da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4762da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4763da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
476436e030ebSStefano Zampini   if (used_IS) {
476536e030ebSStefano Zampini     ierr = ISGetSize(used_IS,&dirichlet_bsize);CHKERRQ(ierr);
476636e030ebSStefano Zampini     ierr = ISGetIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
47673b03a366Sstefano_zampini     for (i=0;i<dirichlet_bsize;i++){
4768da1bb401SStefano Zampini       iindex=dirichlet_nodes[i];
4769da1bb401SStefano Zampini       if (array[iindex]>1.0 && array[iindex]!=array2[iindex] ) {
4770da1bb401SStefano Zampini          SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_USER,"Dirichlet nodes provided to BDDC must be consistent among neighbours!\nNode %d: number of sharing subdomains %d != number of subdomains for which it is a neumann node %d\n",iindex,(PetscInt)array[iindex],(PetscInt)array2[iindex]);
4771da1bb401SStefano Zampini       }
47723b03a366Sstefano_zampini     }
477336e030ebSStefano Zampini     ierr = ISRestoreIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
47743b03a366Sstefano_zampini   }
4775da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4776da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
4777da1bb401SStefano Zampini 
47780c7d97c5SJed Brown   for (i=0;i<mat_graph->nvtxs;i++){
47793b03a366Sstefano_zampini     if (!mat_graph->count[i]){  /* interior nodes */
47800c7d97c5SJed Brown       mat_graph->touched[i]=PETSC_TRUE;
47810c7d97c5SJed Brown       mat_graph->where[i]=0;
47820c7d97c5SJed Brown       nodes_touched++;
47830c7d97c5SJed Brown     }
47840c7d97c5SJed Brown   }
47850c7d97c5SJed Brown   mat_graph->ncmps = 0;
4786da1bb401SStefano Zampini   i=0;
47870c7d97c5SJed Brown   while(nodes_touched<mat_graph->nvtxs) {
4788a0ba757dSStefano Zampini     /*  find first untouched node in local ordering */
47890c7d97c5SJed Brown     while(mat_graph->touched[i]) i++;
47900c7d97c5SJed Brown     mat_graph->touched[i]=PETSC_TRUE;
4791a0ba757dSStefano Zampini     mat_graph->where[i]=where_values;
47920c7d97c5SJed Brown     nodes_touched++;
4793a0ba757dSStefano Zampini     /* now find all other nodes having the same set of sharing subdomains */
47940c7d97c5SJed Brown     for (j=i+1;j<mat_graph->nvtxs;j++){
4795a0ba757dSStefano Zampini       /* check for same number of sharing subdomains and dof number */
4796da1bb401SStefano Zampini       if (!mat_graph->touched[j] && mat_graph->count[i]==mat_graph->count[j] && mat_graph->which_dof[i] == mat_graph->which_dof[j] ){
4797a0ba757dSStefano Zampini         /* check for same set of sharing subdomains */
47980c7d97c5SJed Brown         same_set=PETSC_TRUE;
47990c7d97c5SJed Brown         for (k=0;k<mat_graph->count[j];k++){
4800da1bb401SStefano Zampini           if (mat_graph->neighbours_set[i][k]!=mat_graph->neighbours_set[j][k]) {
48010c7d97c5SJed Brown             same_set=PETSC_FALSE;
48020c7d97c5SJed Brown           }
48030c7d97c5SJed Brown         }
4804a0ba757dSStefano Zampini         /* I found a friend of mine */
48050c7d97c5SJed Brown         if (same_set) {
4806a0ba757dSStefano Zampini           mat_graph->where[j]=where_values;
48070c7d97c5SJed Brown           mat_graph->touched[j]=PETSC_TRUE;
48080c7d97c5SJed Brown           nodes_touched++;
48090c7d97c5SJed Brown         }
48100c7d97c5SJed Brown       }
48110c7d97c5SJed Brown     }
4812a0ba757dSStefano Zampini     where_values++;
48130c7d97c5SJed Brown   }
4814a0ba757dSStefano Zampini   where_values--; if (where_values<0) where_values=0;
4815a0ba757dSStefano Zampini   ierr = PetscMalloc(where_values*sizeof(PetscMPIInt),&mat_graph->where_ncmps);CHKERRQ(ierr);
4816a0ba757dSStefano Zampini   /* Find connected components defined on the shared interface */
4817a0ba757dSStefano Zampini   if (where_values) {
4818a0ba757dSStefano Zampini     ierr = PCBDDCFindConnectedComponents(mat_graph, where_values);
4819a0ba757dSStefano Zampini   }
4820a0ba757dSStefano Zampini   /* check consistency of connected components among neighbouring subdomains -> adapt them if needed */
4821a0ba757dSStefano Zampini   for (i=0;i<where_values;i++) {
48227cf533a6SStefano Zampini     /* We are not sure that on a given subset of the local interface,
48237cf533a6SStefano Zampini        two connected components will be the same among sharing subdomains */
48243b03a366Sstefano_zampini     if (mat_graph->where_ncmps[i]>1) {
4825a0ba757dSStefano Zampini       adapt_interface=1;
4826a0ba757dSStefano Zampini       break;
4827a0ba757dSStefano Zampini     }
4828a0ba757dSStefano Zampini   }
4829a0ba757dSStefano Zampini   ierr = MPI_Allreduce(&adapt_interface,&adapt_interface_reduced,1,MPIU_INT,MPI_LOR,interface_comm);CHKERRQ(ierr);
4830da1bb401SStefano Zampini   if (pcbddc->dbg_flag && adapt_interface_reduced) {
4831d8923723SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"Adapting interface\n");CHKERRQ(ierr);
4832da1bb401SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
4833da1bb401SStefano Zampini   }
4834a0ba757dSStefano Zampini   if (where_values && adapt_interface_reduced) {
48350c7d97c5SJed Brown 
4836a0ba757dSStefano Zampini     PetscInt sum_requests=0,my_rank;
4837a0ba757dSStefano Zampini     PetscInt buffer_size,start_of_recv,size_of_recv,start_of_send;
4838a0ba757dSStefano Zampini     PetscInt temp_buffer_size,ins_val,global_where_counter;
4839a0ba757dSStefano Zampini     PetscInt *cum_recv_counts;
4840a0ba757dSStefano Zampini     PetscInt *where_to_nodes_indices;
4841a0ba757dSStefano Zampini     PetscInt *petsc_buffer;
4842a0ba757dSStefano Zampini     PetscMPIInt *recv_buffer;
4843a0ba757dSStefano Zampini     PetscMPIInt *recv_buffer_where;
4844a0ba757dSStefano Zampini     PetscMPIInt *send_buffer;
4845a0ba757dSStefano Zampini     PetscMPIInt size_of_send;
4846a0ba757dSStefano Zampini     PetscInt *sizes_of_sends;
4847a0ba757dSStefano Zampini     MPI_Request *send_requests;
4848a0ba757dSStefano Zampini     MPI_Request *recv_requests;
4849a0ba757dSStefano Zampini     PetscInt *where_cc_adapt;
4850a0ba757dSStefano Zampini     PetscInt **temp_buffer;
4851a0ba757dSStefano Zampini     PetscInt *nodes_to_temp_buffer_indices;
4852a0ba757dSStefano Zampini     PetscInt *add_to_where;
48537cf533a6SStefano Zampini     PetscInt *aux_new_xadj,*new_xadj,*new_adjncy;
48547cf533a6SStefano Zampini     PetscInt *queue_in_global_numbering;
4855a0ba757dSStefano Zampini 
48567cf533a6SStefano Zampini     /* Restrict adjacency graph using information from connected components */
48577cf533a6SStefano Zampini     ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt),&aux_new_xadj);CHKERRQ(ierr);
48587cf533a6SStefano Zampini     for (i=0;i<mat_graph->nvtxs;i++) {
48597cf533a6SStefano Zampini       aux_new_xadj[i]=1;
48607cf533a6SStefano Zampini     }
48617cf533a6SStefano Zampini     for (i=0;i<mat_graph->ncmps;i++) {
48627cf533a6SStefano Zampini       k = mat_graph->cptr[i+1]-mat_graph->cptr[i];
48637cf533a6SStefano Zampini       for (j=0;j<k;j++) {
48647cf533a6SStefano Zampini         aux_new_xadj[mat_graph->queue[mat_graph->cptr[i]+j]]=k;
48657cf533a6SStefano Zampini       }
48667cf533a6SStefano Zampini     }
48677cf533a6SStefano Zampini     j = 0;
48687cf533a6SStefano Zampini     for (i=0;i<mat_graph->nvtxs;i++) {
48697cf533a6SStefano Zampini       j += aux_new_xadj[i];
48707cf533a6SStefano Zampini     }
48717cf533a6SStefano Zampini     ierr = PetscMalloc((mat_graph->nvtxs+1)*sizeof(PetscInt),&new_xadj);CHKERRQ(ierr);
48727cf533a6SStefano Zampini     ierr = PetscMalloc(j*sizeof(PetscInt),&new_adjncy);CHKERRQ(ierr);
48737cf533a6SStefano Zampini     new_xadj[0]=0;
48747cf533a6SStefano Zampini     for (i=0;i<mat_graph->nvtxs;i++) {
48757cf533a6SStefano Zampini       new_xadj[i+1]=new_xadj[i]+aux_new_xadj[i];
48767cf533a6SStefano Zampini       if (aux_new_xadj[i]==1) {
48777cf533a6SStefano Zampini         new_adjncy[new_xadj[i]]=i;
48787cf533a6SStefano Zampini       }
48797cf533a6SStefano Zampini     }
4880354b9337SStefano Zampini     ierr = PetscFree(aux_new_xadj);CHKERRQ(ierr);
48817cf533a6SStefano Zampini     for (i=0;i<mat_graph->ncmps;i++) {
48827cf533a6SStefano Zampini       k = mat_graph->cptr[i+1]-mat_graph->cptr[i];
48837cf533a6SStefano Zampini       for (j=0;j<k;j++) {
48847cf533a6SStefano Zampini         ierr = PetscMemcpy(&new_adjncy[new_xadj[mat_graph->queue[mat_graph->cptr[i]+j]]],&mat_graph->queue[mat_graph->cptr[i]],k*sizeof(PetscInt));CHKERRQ(ierr);
48857cf533a6SStefano Zampini       }
48867cf533a6SStefano Zampini     }
48877cf533a6SStefano Zampini     ierr = PCBDDCSetLocalAdjacencyGraph(pc,mat_graph->nvtxs,new_xadj,new_adjncy,PETSC_OWN_POINTER);CHKERRQ(ierr);
48887cf533a6SStefano Zampini     /* For consistency among neighbouring procs, I need to sort (by global ordering) each connected component */
48897cf533a6SStefano Zampini     ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt),&queue_in_global_numbering);CHKERRQ(ierr);
48907cf533a6SStefano Zampini     for (i=0;i<mat_graph->ncmps;i++) {
48917cf533a6SStefano Zampini       k = mat_graph->cptr[i+1]-mat_graph->cptr[i];
48927cf533a6SStefano Zampini       ierr = ISLocalToGlobalMappingApply(matis->mapping,k,&mat_graph->queue[mat_graph->cptr[i]],&queue_in_global_numbering[mat_graph->cptr[i]]);CHKERRQ(ierr);
48937cf533a6SStefano Zampini       ierr = PetscSortIntWithArray(k,&queue_in_global_numbering[mat_graph->cptr[i]],&mat_graph->queue[mat_graph->cptr[i]]);CHKERRQ(ierr);
48947cf533a6SStefano Zampini     }
48957cf533a6SStefano Zampini     /* allocate some space */
4896a0ba757dSStefano Zampini     ierr = MPI_Comm_rank(interface_comm,&my_rank);CHKERRQ(ierr);
4897a0ba757dSStefano Zampini     ierr = PetscMalloc((where_values+1)*sizeof(PetscInt),&cum_recv_counts);CHKERRQ(ierr);
4898a0ba757dSStefano Zampini     ierr = PetscMemzero(cum_recv_counts,(where_values+1)*sizeof(PetscInt));CHKERRQ(ierr);
4899a0ba757dSStefano Zampini     ierr = PetscMalloc(where_values*sizeof(PetscInt),&where_to_nodes_indices);CHKERRQ(ierr);
4900a0ba757dSStefano Zampini     /* first count how many neighbours per connected component I will receive from */
4901a0ba757dSStefano Zampini     cum_recv_counts[0]=0;
4902a0ba757dSStefano Zampini     for (i=1;i<where_values+1;i++){
4903a0ba757dSStefano Zampini       j=0;
4904d8923723SStefano Zampini       while(mat_graph->where[j] != i) { j++; }
4905a0ba757dSStefano Zampini       where_to_nodes_indices[i-1]=j;
4906da1bb401SStefano Zampini       if (mat_graph->neighbours_set[j][0]!=-1) { cum_recv_counts[i]=cum_recv_counts[i-1]+mat_graph->count[j]; } /* We don't want sends/recvs_to/from_self -> here I don't count myself  */
49073b03a366Sstefano_zampini       else { cum_recv_counts[i]=cum_recv_counts[i-1]+mat_graph->count[j]-1; }
4908a0ba757dSStefano Zampini     }
4909a0ba757dSStefano Zampini     ierr = PetscMalloc(2*cum_recv_counts[where_values]*sizeof(PetscMPIInt),&recv_buffer_where);CHKERRQ(ierr);
4910a0ba757dSStefano Zampini     ierr = PetscMalloc(cum_recv_counts[where_values]*sizeof(MPI_Request),&send_requests);CHKERRQ(ierr);
4911a0ba757dSStefano Zampini     ierr = PetscMalloc(cum_recv_counts[where_values]*sizeof(MPI_Request),&recv_requests);CHKERRQ(ierr);
4912a0ba757dSStefano Zampini     for (i=0;i<cum_recv_counts[where_values];i++) {
4913a0ba757dSStefano Zampini       send_requests[i]=MPI_REQUEST_NULL;
4914a0ba757dSStefano Zampini       recv_requests[i]=MPI_REQUEST_NULL;
4915a0ba757dSStefano Zampini     }
4916a0ba757dSStefano Zampini     /* exchange with my neighbours the number of my connected components on the shared interface */
4917a0ba757dSStefano Zampini     for (i=0;i<where_values;i++){
4918a0ba757dSStefano Zampini       j=where_to_nodes_indices[i];
4919da1bb401SStefano Zampini       k = (mat_graph->neighbours_set[j][0] == -1 ?  1 : 0);
4920a0ba757dSStefano Zampini       for (;k<mat_graph->count[j];k++){
4921da1bb401SStefano Zampini         ierr = MPI_Isend(&mat_graph->where_ncmps[i],1,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr);
4922da1bb401SStefano Zampini         ierr = MPI_Irecv(&recv_buffer_where[sum_requests],1,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr);
4923a0ba757dSStefano Zampini         sum_requests++;
4924a0ba757dSStefano Zampini       }
4925a0ba757dSStefano Zampini     }
4926a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4927a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4928a0ba757dSStefano Zampini     /* determine the connected component I need to adapt */
4929a0ba757dSStefano Zampini     ierr = PetscMalloc(where_values*sizeof(PetscInt),&where_cc_adapt);CHKERRQ(ierr);
4930a0ba757dSStefano Zampini     ierr = PetscMemzero(where_cc_adapt,where_values*sizeof(PetscInt));CHKERRQ(ierr);
4931a0ba757dSStefano Zampini     for (i=0;i<where_values;i++){
4932a0ba757dSStefano Zampini       for (j=cum_recv_counts[i];j<cum_recv_counts[i+1];j++){
49333b03a366Sstefano_zampini         /* The first condition is natural (i.e someone has a different number of cc than me), the second one is just to be safe */
49343b03a366Sstefano_zampini         if ( mat_graph->where_ncmps[i]!=recv_buffer_where[j] || mat_graph->where_ncmps[i] > 1 ) {
4935a0ba757dSStefano Zampini           where_cc_adapt[i]=PETSC_TRUE;
4936a0ba757dSStefano Zampini           break;
4937a0ba757dSStefano Zampini         }
4938a0ba757dSStefano Zampini       }
4939a0ba757dSStefano Zampini     }
4940d8923723SStefano Zampini     buffer_size = 0;
4941d8923723SStefano Zampini     for (i=0;i<where_values;i++) {
4942d8923723SStefano Zampini       if (where_cc_adapt[i]) {
4943d8923723SStefano Zampini         for (j=i;j<mat_graph->ncmps;j++) {
4944d8923723SStefano Zampini           if (mat_graph->where[mat_graph->queue[mat_graph->cptr[j]]] == i+1) { /* WARNING -> where values goes from 1 to where_values included */
4945d8923723SStefano Zampini             buffer_size += 1 + mat_graph->cptr[j+1]-mat_graph->cptr[j];
4946d8923723SStefano Zampini           }
4947d8923723SStefano Zampini         }
4948d8923723SStefano Zampini       }
4949d8923723SStefano Zampini     }
4950d8923723SStefano Zampini     ierr = PetscMalloc(buffer_size*sizeof(PetscMPIInt),&send_buffer);CHKERRQ(ierr);
4951a0ba757dSStefano Zampini     /* now get from neighbours their ccs (in global numbering) and adapt them (in case it is needed) */
4952a0ba757dSStefano Zampini     /* first determine how much data to send (size of each queue plus the global indices) and communicate it to neighbours */
4953a0ba757dSStefano Zampini     ierr = PetscMalloc(where_values*sizeof(PetscInt),&sizes_of_sends);CHKERRQ(ierr);
4954a0ba757dSStefano Zampini     ierr = PetscMemzero(sizes_of_sends,where_values*sizeof(PetscInt));CHKERRQ(ierr);
4955a0ba757dSStefano Zampini     sum_requests=0;
4956a0ba757dSStefano Zampini     start_of_send=0;
4957a0ba757dSStefano Zampini     start_of_recv=cum_recv_counts[where_values];
4958a0ba757dSStefano Zampini     for (i=0;i<where_values;i++) {
4959a0ba757dSStefano Zampini       if (where_cc_adapt[i]) {
4960a0ba757dSStefano Zampini         size_of_send=0;
4961a0ba757dSStefano Zampini         for (j=i;j<mat_graph->ncmps;j++) {
4962a0ba757dSStefano Zampini           if (mat_graph->where[mat_graph->queue[mat_graph->cptr[j]]] == i+1) { /* WARNING -> where values goes from 1 to where_values included */
4963a0ba757dSStefano Zampini             send_buffer[start_of_send+size_of_send]=mat_graph->cptr[j+1]-mat_graph->cptr[j];
4964a0ba757dSStefano Zampini             size_of_send+=1;
4965a0ba757dSStefano Zampini             for (k=0;k<mat_graph->cptr[j+1]-mat_graph->cptr[j];k++) {
4966a0ba757dSStefano Zampini               send_buffer[start_of_send+size_of_send+k]=queue_in_global_numbering[mat_graph->cptr[j]+k];
4967a0ba757dSStefano Zampini             }
4968a0ba757dSStefano Zampini             size_of_send=size_of_send+mat_graph->cptr[j+1]-mat_graph->cptr[j];
4969a0ba757dSStefano Zampini           }
4970a0ba757dSStefano Zampini         }
4971a0ba757dSStefano Zampini         j = where_to_nodes_indices[i];
4972da1bb401SStefano Zampini         k = (mat_graph->neighbours_set[j][0] == -1 ?  1 : 0);
497311d8f4c2SStefano Zampini         sizes_of_sends[i]=size_of_send;
4974a0ba757dSStefano Zampini         for (;k<mat_graph->count[j];k++){
497511d8f4c2SStefano Zampini           ierr = MPI_Isend(&sizes_of_sends[i],1,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr);
4976da1bb401SStefano Zampini           ierr = MPI_Irecv(&recv_buffer_where[sum_requests+start_of_recv],1,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr);
4977a0ba757dSStefano Zampini           sum_requests++;
4978a0ba757dSStefano Zampini         }
4979a0ba757dSStefano Zampini         start_of_send+=size_of_send;
4980a0ba757dSStefano Zampini       }
4981a0ba757dSStefano Zampini     }
4982a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4983a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4984a0ba757dSStefano Zampini     buffer_size=0;
4985a0ba757dSStefano Zampini     for (k=0;k<sum_requests;k++) { buffer_size+=recv_buffer_where[start_of_recv+k]; }
4986a0ba757dSStefano Zampini     ierr = PetscMalloc(buffer_size*sizeof(PetscMPIInt),&recv_buffer);CHKERRQ(ierr);
4987a0ba757dSStefano Zampini     /* now exchange the data */
4988a0ba757dSStefano Zampini     start_of_recv=0;
4989a0ba757dSStefano Zampini     start_of_send=0;
4990a0ba757dSStefano Zampini     sum_requests=0;
4991a0ba757dSStefano Zampini     for (i=0;i<where_values;i++) {
4992a0ba757dSStefano Zampini       if (where_cc_adapt[i]) {
4993a0ba757dSStefano Zampini         size_of_send = sizes_of_sends[i];
4994a0ba757dSStefano Zampini         j = where_to_nodes_indices[i];
4995da1bb401SStefano Zampini         k = (mat_graph->neighbours_set[j][0] == -1 ?  1 : 0);
4996a0ba757dSStefano Zampini         for (;k<mat_graph->count[j];k++){
4997da1bb401SStefano Zampini           ierr = MPI_Isend(&send_buffer[start_of_send],size_of_send,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr);
4998a0ba757dSStefano Zampini           size_of_recv=recv_buffer_where[cum_recv_counts[where_values]+sum_requests];
4999da1bb401SStefano Zampini           ierr = MPI_Irecv(&recv_buffer[start_of_recv],size_of_recv,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr);
5000a0ba757dSStefano Zampini           start_of_recv+=size_of_recv;
5001a0ba757dSStefano Zampini           sum_requests++;
5002a0ba757dSStefano Zampini         }
5003a0ba757dSStefano Zampini         start_of_send+=size_of_send;
5004a0ba757dSStefano Zampini       }
5005a0ba757dSStefano Zampini     }
5006a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
5007a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
5008a0ba757dSStefano Zampini     ierr = PetscMalloc(buffer_size*sizeof(PetscInt),&petsc_buffer);CHKERRQ(ierr);
5009a0ba757dSStefano Zampini     for (k=0;k<start_of_recv;k++) { petsc_buffer[k]=(PetscInt)recv_buffer[k]; }
5010a0ba757dSStefano Zampini     for (j=0;j<buffer_size;) {
5011a0ba757dSStefano Zampini        ierr = ISGlobalToLocalMappingApply(matis->mapping,IS_GTOLM_MASK,petsc_buffer[j],&petsc_buffer[j+1],&petsc_buffer[j],&petsc_buffer[j+1]);CHKERRQ(ierr);
5012a0ba757dSStefano Zampini        k=petsc_buffer[j]+1;
5013a0ba757dSStefano Zampini        j+=k;
5014a0ba757dSStefano Zampini     }
5015a0ba757dSStefano Zampini     sum_requests=cum_recv_counts[where_values];
5016a0ba757dSStefano Zampini     start_of_recv=0;
5017a0ba757dSStefano Zampini     ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt),&nodes_to_temp_buffer_indices);CHKERRQ(ierr);
5018a0ba757dSStefano Zampini     global_where_counter=0;
5019a0ba757dSStefano Zampini     for (i=0;i<where_values;i++){
5020a0ba757dSStefano Zampini       if (where_cc_adapt[i]){
5021a0ba757dSStefano Zampini         temp_buffer_size=0;
5022a0ba757dSStefano Zampini         /* find nodes on the shared interface we need to adapt */
5023a0ba757dSStefano Zampini         for (j=0;j<mat_graph->nvtxs;j++){
5024a0ba757dSStefano Zampini           if (mat_graph->where[j]==i+1) {
5025a0ba757dSStefano Zampini             nodes_to_temp_buffer_indices[j]=temp_buffer_size;
5026a0ba757dSStefano Zampini             temp_buffer_size++;
5027a0ba757dSStefano Zampini           } else {
5028a0ba757dSStefano Zampini             nodes_to_temp_buffer_indices[j]=-1;
5029a0ba757dSStefano Zampini           }
5030a0ba757dSStefano Zampini         }
5031a0ba757dSStefano Zampini         /* allocate some temporary space */
5032a0ba757dSStefano Zampini         ierr = PetscMalloc(temp_buffer_size*sizeof(PetscInt*),&temp_buffer);CHKERRQ(ierr);
5033a0ba757dSStefano Zampini         ierr = PetscMalloc(temp_buffer_size*(cum_recv_counts[i+1]-cum_recv_counts[i])*sizeof(PetscInt),&temp_buffer[0]);CHKERRQ(ierr);
5034a0ba757dSStefano Zampini         ierr = PetscMemzero(temp_buffer[0],temp_buffer_size*(cum_recv_counts[i+1]-cum_recv_counts[i])*sizeof(PetscInt));CHKERRQ(ierr);
5035a0ba757dSStefano Zampini         for (j=1;j<temp_buffer_size;j++){
5036a0ba757dSStefano Zampini           temp_buffer[j]=temp_buffer[j-1]+cum_recv_counts[i+1]-cum_recv_counts[i];
5037a0ba757dSStefano Zampini         }
5038a0ba757dSStefano Zampini         /* analyze contributions from neighbouring subdomains for i-th conn comp
5039a0ba757dSStefano Zampini            temp buffer structure:
5040a0ba757dSStefano Zampini            supposing part of the interface has dimension 5 (global nodes 0,1,2,3,4)
5041a0ba757dSStefano Zampini            3 neighs procs with structured connected components:
5042a0ba757dSStefano Zampini              neigh 0: [0 1 4], [2 3];  (2 connected components)
5043a0ba757dSStefano Zampini              neigh 1: [0 1], [2 3 4];  (2 connected components)
5044a0ba757dSStefano Zampini              neigh 2: [0 4], [1], [2 3]; (3 connected components)
5045a0ba757dSStefano Zampini            tempbuffer (row-oriented) should be filled as:
5046a0ba757dSStefano Zampini              [ 0, 0, 0;
5047a0ba757dSStefano Zampini                0, 0, 1;
5048a0ba757dSStefano Zampini                1, 1, 2;
5049a0ba757dSStefano Zampini                1, 1, 2;
5050a0ba757dSStefano Zampini                0, 1, 0; ];
5051a0ba757dSStefano Zampini            This way we can simply recover the resulting structure account for possible intersections of ccs among neighs.
5052a0ba757dSStefano Zampini            The mat_graph->where array will be modified to reproduce the following 4 connected components [0], [1], [2 3], [4];
5053a0ba757dSStefano Zampini                                                                                                                                    */
5054a0ba757dSStefano Zampini         for (j=0;j<cum_recv_counts[i+1]-cum_recv_counts[i];j++) {
5055a0ba757dSStefano Zampini           ins_val=0;
5056a0ba757dSStefano Zampini           size_of_recv=recv_buffer_where[sum_requests];  /* total size of recv from neighs */
5057a0ba757dSStefano Zampini           for (buffer_size=0;buffer_size<size_of_recv;) {  /* loop until all data from neighs has been taken into account */
5058a0ba757dSStefano Zampini             for (k=1;k<petsc_buffer[buffer_size+start_of_recv]+1;k++) { /* filling properly temp_buffer using data from a single recv */
5059a0ba757dSStefano Zampini               temp_buffer[ nodes_to_temp_buffer_indices[ petsc_buffer[ start_of_recv+buffer_size+k ] ] ][j]=ins_val;
5060a0ba757dSStefano Zampini             }
5061a0ba757dSStefano Zampini             buffer_size+=k;
5062a0ba757dSStefano Zampini             ins_val++;
5063a0ba757dSStefano Zampini           }
5064a0ba757dSStefano Zampini           start_of_recv+=size_of_recv;
5065a0ba757dSStefano Zampini           sum_requests++;
5066a0ba757dSStefano Zampini         }
5067a0ba757dSStefano Zampini         ierr = PetscMalloc(temp_buffer_size*sizeof(PetscInt),&add_to_where);CHKERRQ(ierr);
5068a0ba757dSStefano Zampini         ierr = PetscMemzero(add_to_where,temp_buffer_size*sizeof(PetscInt));CHKERRQ(ierr);
5069a0ba757dSStefano Zampini         for (j=0;j<temp_buffer_size;j++){
5070a0ba757dSStefano Zampini           if (!add_to_where[j]){ /* found a new cc  */
5071a0ba757dSStefano Zampini             global_where_counter++;
5072a0ba757dSStefano Zampini             add_to_where[j]=global_where_counter;
5073a0ba757dSStefano Zampini             for (k=j+1;k<temp_buffer_size;k++){ /* check for other nodes in new cc */
5074a0ba757dSStefano Zampini               same_set=PETSC_TRUE;
5075a0ba757dSStefano Zampini               for (s=0;s<cum_recv_counts[i+1]-cum_recv_counts[i];s++){
5076a0ba757dSStefano Zampini                 if (temp_buffer[j][s]!=temp_buffer[k][s]) {
5077a0ba757dSStefano Zampini                   same_set=PETSC_FALSE;
5078a0ba757dSStefano Zampini                   break;
5079a0ba757dSStefano Zampini                 }
5080a0ba757dSStefano Zampini               }
50812e8d2280SStefano Zampini               if (same_set) { add_to_where[k]=global_where_counter; }
5082a0ba757dSStefano Zampini             }
5083a0ba757dSStefano Zampini           }
5084a0ba757dSStefano Zampini         }
5085a0ba757dSStefano Zampini         /* insert new data in where array */
5086a0ba757dSStefano Zampini         temp_buffer_size=0;
5087a0ba757dSStefano Zampini         for (j=0;j<mat_graph->nvtxs;j++){
5088a0ba757dSStefano Zampini           if (mat_graph->where[j]==i+1) {
5089a0ba757dSStefano Zampini             mat_graph->where[j]=where_values+add_to_where[temp_buffer_size];
5090a0ba757dSStefano Zampini             temp_buffer_size++;
5091a0ba757dSStefano Zampini           }
5092a0ba757dSStefano Zampini         }
5093a0ba757dSStefano Zampini         ierr = PetscFree(temp_buffer[0]);CHKERRQ(ierr);
5094a0ba757dSStefano Zampini         ierr = PetscFree(temp_buffer);CHKERRQ(ierr);
5095a0ba757dSStefano Zampini         ierr = PetscFree(add_to_where);CHKERRQ(ierr);
5096a0ba757dSStefano Zampini       }
5097a0ba757dSStefano Zampini     }
5098a0ba757dSStefano Zampini     ierr = PetscFree(nodes_to_temp_buffer_indices);CHKERRQ(ierr);
5099a0ba757dSStefano Zampini     ierr = PetscFree(sizes_of_sends);CHKERRQ(ierr);
5100a0ba757dSStefano Zampini     ierr = PetscFree(send_requests);CHKERRQ(ierr);
5101a0ba757dSStefano Zampini     ierr = PetscFree(recv_requests);CHKERRQ(ierr);
5102a0ba757dSStefano Zampini     ierr = PetscFree(petsc_buffer);CHKERRQ(ierr);
5103a0ba757dSStefano Zampini     ierr = PetscFree(recv_buffer);CHKERRQ(ierr);
5104a0ba757dSStefano Zampini     ierr = PetscFree(recv_buffer_where);CHKERRQ(ierr);
5105a0ba757dSStefano Zampini     ierr = PetscFree(send_buffer);CHKERRQ(ierr);
5106a0ba757dSStefano Zampini     ierr = PetscFree(cum_recv_counts);CHKERRQ(ierr);
5107a0ba757dSStefano Zampini     ierr = PetscFree(where_to_nodes_indices);CHKERRQ(ierr);
510823d4d1a5SStefano Zampini     ierr = PetscFree(where_cc_adapt);CHKERRQ(ierr);
5109a0ba757dSStefano Zampini     /* We are ready to evaluate consistent connected components on each part of the shared interface */
5110a0ba757dSStefano Zampini     if (global_where_counter) {
5111a0ba757dSStefano Zampini       for (i=0;i<mat_graph->nvtxs;i++){ mat_graph->touched[i]=PETSC_FALSE; }
5112a0ba757dSStefano Zampini       global_where_counter=0;
5113a0ba757dSStefano Zampini       for (i=0;i<mat_graph->nvtxs;i++){
5114a0ba757dSStefano Zampini         if (mat_graph->where[i] && !mat_graph->touched[i]) {
5115a0ba757dSStefano Zampini           global_where_counter++;
5116a0ba757dSStefano Zampini           for (j=i+1;j<mat_graph->nvtxs;j++){
5117a0ba757dSStefano Zampini             if (!mat_graph->touched[j] && mat_graph->where[j]==mat_graph->where[i]) {
5118a0ba757dSStefano Zampini               mat_graph->where[j]=global_where_counter;
5119a0ba757dSStefano Zampini               mat_graph->touched[j]=PETSC_TRUE;
5120a0ba757dSStefano Zampini             }
5121a0ba757dSStefano Zampini           }
5122a0ba757dSStefano Zampini           mat_graph->where[i]=global_where_counter;
5123a0ba757dSStefano Zampini           mat_graph->touched[i]=PETSC_TRUE;
5124a0ba757dSStefano Zampini         }
5125a0ba757dSStefano Zampini       }
5126a0ba757dSStefano Zampini       where_values=global_where_counter;
5127a0ba757dSStefano Zampini     }
5128a0ba757dSStefano Zampini     if (global_where_counter) {
5129a0ba757dSStefano Zampini       ierr = PetscMemzero(mat_graph->cptr,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr);
5130a0ba757dSStefano Zampini       ierr = PetscMemzero(mat_graph->queue,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
5131a0ba757dSStefano Zampini       ierr = PetscFree(mat_graph->where_ncmps);CHKERRQ(ierr);
5132a0ba757dSStefano Zampini       ierr = PetscMalloc(where_values*sizeof(PetscMPIInt),&mat_graph->where_ncmps);CHKERRQ(ierr);
5133a0ba757dSStefano Zampini       ierr = PCBDDCFindConnectedComponents(mat_graph, where_values);
5134a0ba757dSStefano Zampini     }
51357cf533a6SStefano Zampini     ierr = PetscFree(queue_in_global_numbering);CHKERRQ(ierr);
51363b03a366Sstefano_zampini   } /* Finished adapting interface */
51370c7d97c5SJed Brown   PetscInt nfc=0;
51380c7d97c5SJed Brown   PetscInt nec=0;
51390c7d97c5SJed Brown   PetscInt nvc=0;
51403b03a366Sstefano_zampini   PetscBool twodim_flag=PETSC_FALSE;
51410c7d97c5SJed Brown   for (i=0; i<mat_graph->ncmps; i++) {
51423b03a366Sstefano_zampini     if ( mat_graph->cptr[i+1]-mat_graph->cptr[i] > vertex_size ){
5143534831adSStefano Zampini       if (mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]==1){ /* 1 neigh Neumann fake included */
51440c7d97c5SJed Brown         nfc++;
51453b03a366Sstefano_zampini       } else { /* note that nec will be zero in 2d */
51463b03a366Sstefano_zampini         nec++;
51473b03a366Sstefano_zampini       }
51480c7d97c5SJed Brown     } else {
51493b03a366Sstefano_zampini       nvc+=mat_graph->cptr[i+1]-mat_graph->cptr[i];
51503b03a366Sstefano_zampini     }
51513b03a366Sstefano_zampini   }
51523b03a366Sstefano_zampini   if (!nec) { /* we are in a 2d case -> no faces, only edges */
51533b03a366Sstefano_zampini     nec = nfc;
51543b03a366Sstefano_zampini     nfc = 0;
51553b03a366Sstefano_zampini     twodim_flag = PETSC_TRUE;
51563b03a366Sstefano_zampini   }
51573972b0daSStefano Zampini   /* allocate IS arrays for faces, edges. Vertices need a single index set. */
51583972b0daSStefano Zampini   k=0;
51593972b0daSStefano Zampini   for (i=0; i<mat_graph->ncmps; i++) {
51603972b0daSStefano Zampini     j=mat_graph->cptr[i+1]-mat_graph->cptr[i];
51613972b0daSStefano Zampini     if ( j > k) {
51623972b0daSStefano Zampini       k=j;
51633972b0daSStefano Zampini     }
5164ba1573a8SStefano Zampini     if (j<=vertex_size) {
5165ba1573a8SStefano Zampini       k+=vertex_size;
5166ba1573a8SStefano Zampini     }
51673972b0daSStefano Zampini   }
51683972b0daSStefano Zampini   ierr = PetscMalloc(k*sizeof(PetscInt),&auxis);CHKERRQ(ierr);
51693b03a366Sstefano_zampini   if (!pcbddc->vertices_flag && !pcbddc->edges_flag) {
51703b03a366Sstefano_zampini     ierr = PetscMalloc(nfc*sizeof(IS),&pcbddc->ISForFaces);CHKERRQ(ierr);
51713b03a366Sstefano_zampini     use_faces=PETSC_TRUE;
51723b03a366Sstefano_zampini   }
51733b03a366Sstefano_zampini   if (!pcbddc->vertices_flag && !pcbddc->faces_flag) {
51743b03a366Sstefano_zampini     ierr = PetscMalloc(nec*sizeof(IS),&pcbddc->ISForEdges);CHKERRQ(ierr);
51753b03a366Sstefano_zampini     use_edges=PETSC_TRUE;
51763b03a366Sstefano_zampini   }
51773b03a366Sstefano_zampini   nfc=0;
51783b03a366Sstefano_zampini   nec=0;
51793b03a366Sstefano_zampini   for (i=0; i<mat_graph->ncmps; i++) {
51803b03a366Sstefano_zampini     if ( mat_graph->cptr[i+1]-mat_graph->cptr[i] > vertex_size ){
51813b03a366Sstefano_zampini       for (j=0;j<mat_graph->cptr[i+1]-mat_graph->cptr[i];j++) {
51823972b0daSStefano Zampini         auxis[j]=mat_graph->queue[mat_graph->cptr[i]+j];
51833b03a366Sstefano_zampini       }
51843b03a366Sstefano_zampini       if (mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]==1){
51853b03a366Sstefano_zampini         if (twodim_flag) {
51863b03a366Sstefano_zampini           if (use_edges) {
51873972b0daSStefano Zampini             ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForEdges[nec]);CHKERRQ(ierr);
51883b03a366Sstefano_zampini             nec++;
51893b03a366Sstefano_zampini           }
51903b03a366Sstefano_zampini         } else {
51913b03a366Sstefano_zampini           if (use_faces) {
51923972b0daSStefano Zampini             ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForFaces[nfc]);CHKERRQ(ierr);
51933b03a366Sstefano_zampini             nfc++;
51943b03a366Sstefano_zampini           }
51953b03a366Sstefano_zampini         }
51963b03a366Sstefano_zampini       } else {
51973b03a366Sstefano_zampini         if (use_edges) {
51983972b0daSStefano Zampini           ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForEdges[nec]);CHKERRQ(ierr);
51990c7d97c5SJed Brown           nec++;
52000c7d97c5SJed Brown         }
52010c7d97c5SJed Brown       }
52020c7d97c5SJed Brown     }
52033b03a366Sstefano_zampini   }
52043b03a366Sstefano_zampini   pcbddc->n_ISForFaces=nfc;
52053b03a366Sstefano_zampini   pcbddc->n_ISForEdges=nec;
52063b03a366Sstefano_zampini   nvc=0;
52070c7d97c5SJed Brown   if ( !pcbddc->constraints_flag ) {
52083b03a366Sstefano_zampini     for (i=0; i<mat_graph->ncmps; i++) {
52093b03a366Sstefano_zampini       if ( mat_graph->cptr[i+1]-mat_graph->cptr[i] <= vertex_size ){
52103b03a366Sstefano_zampini         for ( j=mat_graph->cptr[i];j<mat_graph->cptr[i+1];j++) {
52113972b0daSStefano Zampini           auxis[nvc]=mat_graph->queue[j];
52120c7d97c5SJed Brown           nvc++;
52130c7d97c5SJed Brown         }
52140c7d97c5SJed Brown       }
52150c7d97c5SJed Brown     }
52160c7d97c5SJed Brown   }
5217a0ba757dSStefano Zampini   /* sort vertex set (by local ordering) */
52183972b0daSStefano Zampini   ierr = PetscSortInt(nvc,auxis);CHKERRQ(ierr);
52193972b0daSStefano Zampini   ierr = ISCreateGeneral(PETSC_COMM_SELF,nvc,auxis,PETSC_COPY_VALUES,&pcbddc->ISForVertices);CHKERRQ(ierr);
5220e269702eSStefano Zampini   if (pcbddc->dbg_flag) {
5221d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr);
5222d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Details from PCBDDCManageLocalBoundaries for subdomain %04d\n",PetscGlobalRank);CHKERRQ(ierr);
5223d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Matrix graph has %d connected components", mat_graph->ncmps);CHKERRQ(ierr);
52240c7d97c5SJed Brown     for (i=0;i<mat_graph->ncmps;i++) {
52253b03a366Sstefano_zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\nDetails for connected component number %02d: size %04d, count %01d. Nodes follow.\n",
52263b03a366Sstefano_zampini              i,mat_graph->cptr[i+1]-mat_graph->cptr[i],mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]);CHKERRQ(ierr);
5227da1bb401SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"subdomains: ");
5228da1bb401SStefano Zampini       for (j=0;j<mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]; j++) {
5229da1bb401SStefano Zampini         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d ",mat_graph->neighbours_set[mat_graph->queue[mat_graph->cptr[i]]][j]);
5230da1bb401SStefano Zampini       }
5231da1bb401SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n");
52320c7d97c5SJed Brown       for (j=mat_graph->cptr[i]; j<mat_graph->cptr[i+1]; j++){
52337cf533a6SStefano Zampini         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d, ",mat_graph->queue[j]);CHKERRQ(ierr);
52340c7d97c5SJed Brown       }
52350c7d97c5SJed Brown     }
5236da1bb401SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n--------------------------------------------------------------\n");CHKERRQ(ierr);
52373b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local vertices\n",PetscGlobalRank,nvc);CHKERRQ(ierr);
52383b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local faces\n",PetscGlobalRank,nfc);CHKERRQ(ierr);
52393b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local edges\n",PetscGlobalRank,nec);CHKERRQ(ierr);
5240d49ef151SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
52410c7d97c5SJed Brown   }
52423972b0daSStefano Zampini   ierr = PetscFree(auxis);CHKERRQ(ierr);
52430c7d97c5SJed Brown   PetscFunctionReturn(0);
52440c7d97c5SJed Brown }
52450c7d97c5SJed Brown 
52460c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
52470c7d97c5SJed Brown 
/* The following code has been adapted from the function IsConnectedSubdomain contained
   in the source file contig.c of the METIS library (version 5.0.1).
   It finds the connected components of each partition; partitions are labeled from 1 to n_dist. */
52510c7d97c5SJed Brown 
52520c7d97c5SJed Brown #undef __FUNCT__
52530c7d97c5SJed Brown #define __FUNCT__ "PCBDDCFindConnectedComponents"
52549c0446d6SStefano Zampini static PetscErrorCode PCBDDCFindConnectedComponents(PCBDDCGraph graph, PetscInt n_dist )
52550c7d97c5SJed Brown {
52560c7d97c5SJed Brown   PetscInt i, j, k, nvtxs, first, last, nleft, ncmps,pid,cum_queue,n,ncmps_pid;
52570c7d97c5SJed Brown   PetscInt *xadj, *adjncy, *where, *queue;
52580c7d97c5SJed Brown   PetscInt *cptr;
52590c7d97c5SJed Brown   PetscBool *touched;
52600c7d97c5SJed Brown 
52610c7d97c5SJed Brown   PetscFunctionBegin;
52620c7d97c5SJed Brown 
52630c7d97c5SJed Brown   nvtxs   = graph->nvtxs;
52640c7d97c5SJed Brown   xadj    = graph->xadj;
52650c7d97c5SJed Brown   adjncy  = graph->adjncy;
52660c7d97c5SJed Brown   where   = graph->where;
52670c7d97c5SJed Brown   touched = graph->touched;
52680c7d97c5SJed Brown   queue   = graph->queue;
52690c7d97c5SJed Brown   cptr    = graph->cptr;
52700c7d97c5SJed Brown 
52712e8d2280SStefano Zampini   for (i=0; i<nvtxs; i++) {
52720c7d97c5SJed Brown     touched[i] = PETSC_FALSE;
52732e8d2280SStefano Zampini   }
52740c7d97c5SJed Brown 
52750c7d97c5SJed Brown   cum_queue=0;
52760c7d97c5SJed Brown   ncmps=0;
52770c7d97c5SJed Brown 
52780c7d97c5SJed Brown   for (n=0; n<n_dist; n++) {
5279da1bb401SStefano Zampini     pid = n+1;  /* partition labeled by 0 is discarded */
52800c7d97c5SJed Brown     nleft = 0;
52810c7d97c5SJed Brown     for (i=0; i<nvtxs; i++) {
52820c7d97c5SJed Brown       if (where[i] == pid)
52830c7d97c5SJed Brown         nleft++;
52840c7d97c5SJed Brown     }
52850c7d97c5SJed Brown     for (i=0; i<nvtxs; i++) {
52860c7d97c5SJed Brown       if (where[i] == pid)
52870c7d97c5SJed Brown         break;
52880c7d97c5SJed Brown     }
52890c7d97c5SJed Brown     touched[i] = PETSC_TRUE;
52900c7d97c5SJed Brown     queue[cum_queue] = i;
52910c7d97c5SJed Brown     first = 0; last = 1;
52920c7d97c5SJed Brown     cptr[ncmps] = cum_queue;  /* This actually points to queue */
52930c7d97c5SJed Brown     ncmps_pid = 0;
52940c7d97c5SJed Brown     while (first != nleft) {
52950c7d97c5SJed Brown       if (first == last) { /* Find another starting vertex */
52960c7d97c5SJed Brown         cptr[++ncmps] = first+cum_queue;
52970c7d97c5SJed Brown         ncmps_pid++;
52980c7d97c5SJed Brown         for (i=0; i<nvtxs; i++) {
52990c7d97c5SJed Brown           if (where[i] == pid && !touched[i])
53000c7d97c5SJed Brown             break;
53010c7d97c5SJed Brown         }
53020c7d97c5SJed Brown         queue[cum_queue+last] = i;
53030c7d97c5SJed Brown         last++;
53040c7d97c5SJed Brown         touched[i] = PETSC_TRUE;
53050c7d97c5SJed Brown       }
53060c7d97c5SJed Brown       i = queue[cum_queue+first];
53070c7d97c5SJed Brown       first++;
53080c7d97c5SJed Brown       for (j=xadj[i]; j<xadj[i+1]; j++) {
53090c7d97c5SJed Brown         k = adjncy[j];
53100c7d97c5SJed Brown         if (where[k] == pid && !touched[k]) {
53110c7d97c5SJed Brown           queue[cum_queue+last] = k;
53120c7d97c5SJed Brown           last++;
53130c7d97c5SJed Brown           touched[k] = PETSC_TRUE;
53140c7d97c5SJed Brown         }
53150c7d97c5SJed Brown       }
53160c7d97c5SJed Brown     }
53170c7d97c5SJed Brown     cptr[++ncmps] = first+cum_queue;
53180c7d97c5SJed Brown     ncmps_pid++;
53190c7d97c5SJed Brown     cum_queue=cptr[ncmps];
5320a0ba757dSStefano Zampini     graph->where_ncmps[n] = ncmps_pid;
53210c7d97c5SJed Brown   }
53220c7d97c5SJed Brown   graph->ncmps = ncmps;
53230c7d97c5SJed Brown 
53240c7d97c5SJed Brown   PetscFunctionReturn(0);
53250c7d97c5SJed Brown }
5326