xref: /petsc/src/ksp/pc/impls/bddc/bddc.c (revision 07475bc16356fc37e8c66fcce1957fb7d8feef24)
153cdbc3dSStefano Zampini /* TODOLIST
2da1bb401SStefano Zampini    DofSplitting and DM attached to pc?
3da1bb401SStefano Zampini    Change SetNeumannBoundaries to SetNeumannBoundariesLocal and provide new SetNeumannBoundaries (same Dirichlet)
4a0ba757dSStefano Zampini    change how to deal with the coarse problem (PCBDDCSetCoarseEnvironment):
5a0ba757dSStefano Zampini      - simplify coarse problem structure -> PCBDDC or PCREDUNDANT, nothing else -> same comm for all levels?
6a0ba757dSStefano Zampini      - remove coarse enums and allow use of PCBDDCGetCoarseKSP
7a0ba757dSStefano Zampini      - remove metis dependency -> use MatPartitioning for multilevel -> Assemble serial adjacency in ManageLocalBoundaries?
8a0ba757dSStefano Zampini    code refactoring:
9a0ba757dSStefano Zampini      - pick up better names for static functions
10a0ba757dSStefano Zampini    change options structure:
11a0ba757dSStefano Zampini      - insert BDDC into MG framework?
12a0ba757dSStefano Zampini    provide other ops? Ask to developers
13a0ba757dSStefano Zampini    remove all unused printf
14a0ba757dSStefano Zampini    man pages
1553cdbc3dSStefano Zampini */
160c7d97c5SJed Brown 
1753cdbc3dSStefano Zampini /* ----------------------------------------------------------------------------------------------------------------------------------------------
180c7d97c5SJed Brown    Implementation of BDDC preconditioner based on:
190c7d97c5SJed Brown    C. Dohrmann "An approximate BDDC preconditioner", Numerical Linear Algebra with Applications Volume 14, Issue 2, pages 149-168, March 2007
2053cdbc3dSStefano Zampini    ---------------------------------------------------------------------------------------------------------------------------------------------- */
2153cdbc3dSStefano Zampini 
22*07475bc1SBarry Smith #include "bddc.h" /*I "petscpc.h" I*/
233b03a366Sstefano_zampini #include <petscblaslapack.h>
240c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
250c7d97c5SJed Brown #undef __FUNCT__
260c7d97c5SJed Brown #define __FUNCT__ "PCSetFromOptions_BDDC"
270c7d97c5SJed Brown PetscErrorCode PCSetFromOptions_BDDC(PC pc)
280c7d97c5SJed Brown {
290c7d97c5SJed Brown   PC_BDDC         *pcbddc = (PC_BDDC*)pc->data;
300c7d97c5SJed Brown   PetscErrorCode ierr;
310c7d97c5SJed Brown 
320c7d97c5SJed Brown   PetscFunctionBegin;
330c7d97c5SJed Brown   ierr = PetscOptionsHead("BDDC options");CHKERRQ(ierr);
340c7d97c5SJed Brown   /* Verbose debugging of main data structures */
35e269702eSStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_check_all"       ,"Verbose (debugging) output for PCBDDC"                       ,"none",pcbddc->dbg_flag      ,&pcbddc->dbg_flag      ,PETSC_NULL);CHKERRQ(ierr);
360c7d97c5SJed Brown   /* Some customization for default primal space */
37da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_vertices_only"   ,"Use only vertices in coarse space (i.e. discard constraints)","none",pcbddc->vertices_flag   ,&pcbddc->vertices_flag   ,PETSC_NULL);CHKERRQ(ierr);
38da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_constraints_only","Use only constraints in coarse space (i.e. discard vertices)","none",pcbddc->constraints_flag,&pcbddc->constraints_flag,PETSC_NULL);CHKERRQ(ierr);
39da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_faces_only"      ,"Use only faces among constraints of coarse space (i.e. discard edges)"         ,"none",pcbddc->faces_flag      ,&pcbddc->faces_flag      ,PETSC_NULL);CHKERRQ(ierr);
40da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_edges_only"      ,"Use only edges among constraints of coarse space (i.e. discard faces)"         ,"none",pcbddc->edges_flag      ,&pcbddc->edges_flag      ,PETSC_NULL);CHKERRQ(ierr);
410c7d97c5SJed Brown   /* Coarse solver context */
426c667b0aSStefano Zampini   static const char * const avail_coarse_problems[] = {"sequential","replicated","parallel","multilevel","CoarseProblemType","PC_BDDC_",0}; /*order of choiches depends on ENUM defined in bddc.h */
430c7d97c5SJed Brown   ierr = PetscOptionsEnum("-pc_bddc_coarse_problem_type","Set coarse problem type","none",avail_coarse_problems,(PetscEnum)pcbddc->coarse_problem_type,(PetscEnum*)&pcbddc->coarse_problem_type,PETSC_NULL);CHKERRQ(ierr);
440c7d97c5SJed Brown   /* Two different application of BDDC to the whole set of dofs, internal and interface */
4529622bf0SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_switch_preconditioning_type","Switch between M_2 (default) and M_3 preconditioners (as defined by Dohrmann)","none",pcbddc->inexact_prec_type,&pcbddc->inexact_prec_type,PETSC_NULL);CHKERRQ(ierr);
46534831adSStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_use_change_of_basis","Use change of basis approach for primal space","none",pcbddc->usechangeofbasis,&pcbddc->usechangeofbasis,PETSC_NULL);CHKERRQ(ierr);
47534831adSStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_use_change_on_faces","Use change of basis approach for face constraints","none",pcbddc->usechangeonfaces,&pcbddc->usechangeonfaces,PETSC_NULL);CHKERRQ(ierr);
48534831adSStefano Zampini   pcbddc->usechangeonfaces = pcbddc->usechangeonfaces && pcbddc->usechangeofbasis;
490c7d97c5SJed Brown   ierr = PetscOptionsInt("-pc_bddc_coarsening_ratio","Set coarsening ratio used in multilevel coarsening","none",pcbddc->coarsening_ratio,&pcbddc->coarsening_ratio,PETSC_NULL);CHKERRQ(ierr);
504fad6a16SStefano Zampini   ierr = PetscOptionsInt("-pc_bddc_max_levels","Set maximum number of levels for multilevel","none",pcbddc->max_levels,&pcbddc->max_levels,PETSC_NULL);CHKERRQ(ierr);
510c7d97c5SJed Brown   ierr = PetscOptionsTail();CHKERRQ(ierr);
520c7d97c5SJed Brown   PetscFunctionReturn(0);
530c7d97c5SJed Brown }
540c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
550c7d97c5SJed Brown EXTERN_C_BEGIN
560c7d97c5SJed Brown #undef __FUNCT__
570c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetCoarseProblemType_BDDC"
5853cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetCoarseProblemType_BDDC(PC pc, CoarseProblemType CPT)
590c7d97c5SJed Brown {
600c7d97c5SJed Brown   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
610c7d97c5SJed Brown 
620c7d97c5SJed Brown   PetscFunctionBegin;
630c7d97c5SJed Brown   pcbddc->coarse_problem_type = CPT;
640c7d97c5SJed Brown   PetscFunctionReturn(0);
650c7d97c5SJed Brown }
660c7d97c5SJed Brown EXTERN_C_END
670c7d97c5SJed Brown #undef __FUNCT__
680c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetCoarseProblemType"
6953cdbc3dSStefano Zampini /*@
709c0446d6SStefano Zampini  PCBDDCSetCoarseProblemType - Set coarse problem type in PCBDDC.
7153cdbc3dSStefano Zampini 
729c0446d6SStefano Zampini    Not collective
7353cdbc3dSStefano Zampini 
7453cdbc3dSStefano Zampini    Input Parameters:
7553cdbc3dSStefano Zampini +  pc - the preconditioning context
7653cdbc3dSStefano Zampini -  CoarseProblemType - pick a better name and explain what this is
7753cdbc3dSStefano Zampini 
7853cdbc3dSStefano Zampini    Level: intermediate
7953cdbc3dSStefano Zampini 
8053cdbc3dSStefano Zampini    Notes:
81da1bb401SStefano Zampini    Not collective but all procs must call with same arguments.
8253cdbc3dSStefano Zampini 
8353cdbc3dSStefano Zampini .seealso: PCBDDC
8453cdbc3dSStefano Zampini @*/
850c7d97c5SJed Brown PetscErrorCode PCBDDCSetCoarseProblemType(PC pc, CoarseProblemType CPT)
860c7d97c5SJed Brown {
870c7d97c5SJed Brown   PetscErrorCode ierr;
880c7d97c5SJed Brown 
890c7d97c5SJed Brown   PetscFunctionBegin;
900c7d97c5SJed Brown   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
910c7d97c5SJed Brown   ierr = PetscTryMethod(pc,"PCBDDCSetCoarseProblemType_C",(PC,CoarseProblemType),(pc,CPT));CHKERRQ(ierr);
920c7d97c5SJed Brown   PetscFunctionReturn(0);
930c7d97c5SJed Brown }
940c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
950c7d97c5SJed Brown EXTERN_C_BEGIN
960c7d97c5SJed Brown #undef __FUNCT__
974fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetCoarseningRatio_BDDC"
984fad6a16SStefano Zampini static PetscErrorCode PCBDDCSetCoarseningRatio_BDDC(PC pc,PetscInt k)
994fad6a16SStefano Zampini {
1004fad6a16SStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
1014fad6a16SStefano Zampini 
1024fad6a16SStefano Zampini   PetscFunctionBegin;
1034fad6a16SStefano Zampini   pcbddc->coarsening_ratio=k;
1044fad6a16SStefano Zampini   PetscFunctionReturn(0);
1054fad6a16SStefano Zampini }
1064fad6a16SStefano Zampini EXTERN_C_END
1074fad6a16SStefano Zampini #undef __FUNCT__
1084fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetCoarseningRatio"
1094fad6a16SStefano Zampini /*@
1104fad6a16SStefano Zampini  PCBDDCSetCoarseningRatio - Set coarsening ratio used in multilevel coarsening
1114fad6a16SStefano Zampini 
1124fad6a16SStefano Zampini    Logically collective on PC
1134fad6a16SStefano Zampini 
1144fad6a16SStefano Zampini    Input Parameters:
1154fad6a16SStefano Zampini +  pc - the preconditioning context
1164fad6a16SStefano Zampini -  k - coarsening ratio
1174fad6a16SStefano Zampini 
1184fad6a16SStefano Zampini    Approximatively k subdomains at the finer level will be aggregated into a single subdomain at the coarser level.
1194fad6a16SStefano Zampini 
1204fad6a16SStefano Zampini    Level: intermediate
1214fad6a16SStefano Zampini 
1224fad6a16SStefano Zampini    Notes:
1234fad6a16SStefano Zampini 
1244fad6a16SStefano Zampini .seealso: PCBDDC
1254fad6a16SStefano Zampini @*/
1264fad6a16SStefano Zampini PetscErrorCode PCBDDCSetCoarseningRatio(PC pc,PetscInt k)
1274fad6a16SStefano Zampini {
1284fad6a16SStefano Zampini   PetscErrorCode ierr;
1294fad6a16SStefano Zampini 
1304fad6a16SStefano Zampini   PetscFunctionBegin;
1314fad6a16SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
1324fad6a16SStefano Zampini   ierr = PetscTryMethod(pc,"PCBDDCSetCoarseningRatio_C",(PC,PetscInt),(pc,k));CHKERRQ(ierr);
1334fad6a16SStefano Zampini   PetscFunctionReturn(0);
1344fad6a16SStefano Zampini }
1354fad6a16SStefano Zampini /* -------------------------------------------------------------------------- */
1364fad6a16SStefano Zampini EXTERN_C_BEGIN
1374fad6a16SStefano Zampini #undef __FUNCT__
1384fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetMaxLevels_BDDC"
1394fad6a16SStefano Zampini static PetscErrorCode PCBDDCSetMaxLevels_BDDC(PC pc,PetscInt max_levels)
1404fad6a16SStefano Zampini {
1414fad6a16SStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
1424fad6a16SStefano Zampini 
1434fad6a16SStefano Zampini   PetscFunctionBegin;
1444fad6a16SStefano Zampini   pcbddc->max_levels=max_levels;
1454fad6a16SStefano Zampini   PetscFunctionReturn(0);
1464fad6a16SStefano Zampini }
1474fad6a16SStefano Zampini EXTERN_C_END
1484fad6a16SStefano Zampini #undef __FUNCT__
1494fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetMaxLevels"
1504fad6a16SStefano Zampini /*@
1514fad6a16SStefano Zampini  PCBDDCSetMaxLevels - Sets the maximum number of levels within the multilevel approach.
1524fad6a16SStefano Zampini 
1534fad6a16SStefano Zampini    Logically collective on PC
1544fad6a16SStefano Zampini 
1554fad6a16SStefano Zampini    Input Parameters:
1564fad6a16SStefano Zampini +  pc - the preconditioning context
1574fad6a16SStefano Zampini -  max_levels - the maximum number of levels
1584fad6a16SStefano Zampini 
1594fad6a16SStefano Zampini    Default value is 1, i.e. coarse problem will be solved inexactly with one application
1604fad6a16SStefano Zampini    of PCBDDC preconditioner if the multilevel approach is requested.
1614fad6a16SStefano Zampini 
1624fad6a16SStefano Zampini    Level: intermediate
1634fad6a16SStefano Zampini 
1644fad6a16SStefano Zampini    Notes:
1654fad6a16SStefano Zampini 
1664fad6a16SStefano Zampini .seealso: PCBDDC
1674fad6a16SStefano Zampini @*/
1684fad6a16SStefano Zampini PetscErrorCode PCBDDCSetMaxLevels(PC pc,PetscInt max_levels)
1694fad6a16SStefano Zampini {
1704fad6a16SStefano Zampini   PetscErrorCode ierr;
1714fad6a16SStefano Zampini 
1724fad6a16SStefano Zampini   PetscFunctionBegin;
1734fad6a16SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
1744fad6a16SStefano Zampini   ierr = PetscTryMethod(pc,"PCBDDCSetMaxLevels_C",(PC,PetscInt),(pc,max_levels));CHKERRQ(ierr);
1754fad6a16SStefano Zampini   PetscFunctionReturn(0);
1764fad6a16SStefano Zampini }
1774fad6a16SStefano Zampini /* -------------------------------------------------------------------------- */
1784fad6a16SStefano Zampini EXTERN_C_BEGIN
1794fad6a16SStefano Zampini #undef __FUNCT__
1800bdf917eSStefano Zampini #define __FUNCT__ "PCBDDCSetNullSpace_BDDC"
1810bdf917eSStefano Zampini static PetscErrorCode PCBDDCSetNullSpace_BDDC(PC pc,MatNullSpace NullSpace)
1820bdf917eSStefano Zampini {
1830bdf917eSStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
1840bdf917eSStefano Zampini   PetscErrorCode ierr;
1850bdf917eSStefano Zampini 
1860bdf917eSStefano Zampini   PetscFunctionBegin;
1870bdf917eSStefano Zampini   ierr = PetscObjectReference((PetscObject)NullSpace);CHKERRQ(ierr);
1880bdf917eSStefano Zampini   ierr = MatNullSpaceDestroy(&pcbddc->NullSpace);CHKERRQ(ierr);
1890bdf917eSStefano Zampini   pcbddc->NullSpace=NullSpace;
1900bdf917eSStefano Zampini   PetscFunctionReturn(0);
1910bdf917eSStefano Zampini }
1920bdf917eSStefano Zampini EXTERN_C_END
1930bdf917eSStefano Zampini #undef __FUNCT__
1940bdf917eSStefano Zampini #define __FUNCT__ "PCBDDCSetNullSpace"
1950bdf917eSStefano Zampini /*@
1960bdf917eSStefano Zampini  PCBDDCSetNullSpace - Set NullSpace of global operator of BDDC preconditioned mat.
1970bdf917eSStefano Zampini 
1980bdf917eSStefano Zampini    Logically collective on PC and MatNullSpace
1990bdf917eSStefano Zampini 
2000bdf917eSStefano Zampini    Input Parameters:
2010bdf917eSStefano Zampini +  pc - the preconditioning context
2020bdf917eSStefano Zampini -  NullSpace - Null space of the linear operator to be preconditioned.
2030bdf917eSStefano Zampini 
2040bdf917eSStefano Zampini    Level: intermediate
2050bdf917eSStefano Zampini 
2060bdf917eSStefano Zampini    Notes:
2070bdf917eSStefano Zampini 
2080bdf917eSStefano Zampini .seealso: PCBDDC
2090bdf917eSStefano Zampini @*/
2100bdf917eSStefano Zampini PetscErrorCode PCBDDCSetNullSpace(PC pc,MatNullSpace NullSpace)
2110bdf917eSStefano Zampini {
2120bdf917eSStefano Zampini   PetscErrorCode ierr;
2130bdf917eSStefano Zampini 
2140bdf917eSStefano Zampini   PetscFunctionBegin;
2150bdf917eSStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
2160bdf917eSStefano Zampini   ierr = PetscTryMethod(pc,"PCBDDCSetNullSpace_C",(PC,MatNullSpace),(pc,NullSpace));CHKERRQ(ierr);
2170bdf917eSStefano Zampini   PetscFunctionReturn(0);
2180bdf917eSStefano Zampini }
2190bdf917eSStefano Zampini /* -------------------------------------------------------------------------- */
2200bdf917eSStefano Zampini EXTERN_C_BEGIN
2210bdf917eSStefano Zampini #undef __FUNCT__
2223b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCSetDirichletBoundaries_BDDC"
2233b03a366Sstefano_zampini static PetscErrorCode PCBDDCSetDirichletBoundaries_BDDC(PC pc,IS DirichletBoundaries)
2243b03a366Sstefano_zampini {
2253b03a366Sstefano_zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
2263b03a366Sstefano_zampini   PetscErrorCode ierr;
2273b03a366Sstefano_zampini 
2283b03a366Sstefano_zampini   PetscFunctionBegin;
2293b03a366Sstefano_zampini   ierr = ISDestroy(&pcbddc->DirichletBoundaries);CHKERRQ(ierr);
23036e030ebSStefano Zampini   ierr = PetscObjectReference((PetscObject)DirichletBoundaries);CHKERRQ(ierr);
23136e030ebSStefano Zampini   pcbddc->DirichletBoundaries=DirichletBoundaries;
2323b03a366Sstefano_zampini   PetscFunctionReturn(0);
2333b03a366Sstefano_zampini }
2343b03a366Sstefano_zampini EXTERN_C_END
2353b03a366Sstefano_zampini #undef __FUNCT__
2363b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCSetDirichletBoundaries"
2373b03a366Sstefano_zampini /*@
238da1bb401SStefano Zampini  PCBDDCSetDirichletBoundaries - Set index set defining subdomain part (in local ordering)
239da1bb401SStefano Zampini                               of Dirichlet boundaries for the global problem.
2403b03a366Sstefano_zampini 
2413b03a366Sstefano_zampini    Not collective
2423b03a366Sstefano_zampini 
2433b03a366Sstefano_zampini    Input Parameters:
2443b03a366Sstefano_zampini +  pc - the preconditioning context
2453b03a366Sstefano_zampini -  DirichletBoundaries - sequential index set defining the subdomain part of Dirichlet boundaries (can be PETSC_NULL)
2463b03a366Sstefano_zampini 
2473b03a366Sstefano_zampini    Level: intermediate
2483b03a366Sstefano_zampini 
2493b03a366Sstefano_zampini    Notes:
2503b03a366Sstefano_zampini 
2513b03a366Sstefano_zampini .seealso: PCBDDC
2523b03a366Sstefano_zampini @*/
2533b03a366Sstefano_zampini PetscErrorCode PCBDDCSetDirichletBoundaries(PC pc,IS DirichletBoundaries)
2543b03a366Sstefano_zampini {
2553b03a366Sstefano_zampini   PetscErrorCode ierr;
2563b03a366Sstefano_zampini 
2573b03a366Sstefano_zampini   PetscFunctionBegin;
2583b03a366Sstefano_zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
2593b03a366Sstefano_zampini   ierr = PetscTryMethod(pc,"PCBDDCSetDirichletBoundaries_C",(PC,IS),(pc,DirichletBoundaries));CHKERRQ(ierr);
2603b03a366Sstefano_zampini   PetscFunctionReturn(0);
2613b03a366Sstefano_zampini }
2623b03a366Sstefano_zampini /* -------------------------------------------------------------------------- */
2633b03a366Sstefano_zampini EXTERN_C_BEGIN
2643b03a366Sstefano_zampini #undef __FUNCT__
2650c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetNeumannBoundaries_BDDC"
26653cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetNeumannBoundaries_BDDC(PC pc,IS NeumannBoundaries)
2670c7d97c5SJed Brown {
2680c7d97c5SJed Brown   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
26953cdbc3dSStefano Zampini   PetscErrorCode ierr;
2700c7d97c5SJed Brown 
2710c7d97c5SJed Brown   PetscFunctionBegin;
27253cdbc3dSStefano Zampini   ierr = ISDestroy(&pcbddc->NeumannBoundaries);CHKERRQ(ierr);
27336e030ebSStefano Zampini   ierr = PetscObjectReference((PetscObject)NeumannBoundaries);CHKERRQ(ierr);
27436e030ebSStefano Zampini   pcbddc->NeumannBoundaries=NeumannBoundaries;
2750c7d97c5SJed Brown   PetscFunctionReturn(0);
2760c7d97c5SJed Brown }
2770c7d97c5SJed Brown EXTERN_C_END
2780c7d97c5SJed Brown #undef __FUNCT__
2790c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetNeumannBoundaries"
28057527edcSJed Brown /*@
281da1bb401SStefano Zampini  PCBDDCSetNeumannBoundaries - Set index set defining subdomain part (in local ordering)
282da1bb401SStefano Zampini                               of Neumann boundaries for the global problem.
28357527edcSJed Brown 
2849c0446d6SStefano Zampini    Not collective
28557527edcSJed Brown 
28657527edcSJed Brown    Input Parameters:
28757527edcSJed Brown +  pc - the preconditioning context
2889c0446d6SStefano Zampini -  NeumannBoundaries - sequential index set defining the subdomain part of Neumann boundaries (can be PETSC_NULL)
28957527edcSJed Brown 
29057527edcSJed Brown    Level: intermediate
29157527edcSJed Brown 
29257527edcSJed Brown    Notes:
29357527edcSJed Brown 
29457527edcSJed Brown .seealso: PCBDDC
29557527edcSJed Brown @*/
29653cdbc3dSStefano Zampini PetscErrorCode PCBDDCSetNeumannBoundaries(PC pc,IS NeumannBoundaries)
2970c7d97c5SJed Brown {
2980c7d97c5SJed Brown   PetscErrorCode ierr;
2990c7d97c5SJed Brown 
3000c7d97c5SJed Brown   PetscFunctionBegin;
3010c7d97c5SJed Brown   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
30253cdbc3dSStefano Zampini   ierr = PetscTryMethod(pc,"PCBDDCSetNeumannBoundaries_C",(PC,IS),(pc,NeumannBoundaries));CHKERRQ(ierr);
30353cdbc3dSStefano Zampini   PetscFunctionReturn(0);
30453cdbc3dSStefano Zampini }
30553cdbc3dSStefano Zampini /* -------------------------------------------------------------------------- */
30653cdbc3dSStefano Zampini EXTERN_C_BEGIN
30753cdbc3dSStefano Zampini #undef __FUNCT__
308da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCGetDirichletBoundaries_BDDC"
309da1bb401SStefano Zampini static PetscErrorCode PCBDDCGetDirichletBoundaries_BDDC(PC pc,IS *DirichletBoundaries)
310da1bb401SStefano Zampini {
311da1bb401SStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
312da1bb401SStefano Zampini 
313da1bb401SStefano Zampini   PetscFunctionBegin;
314da1bb401SStefano Zampini   *DirichletBoundaries = pcbddc->DirichletBoundaries;
315da1bb401SStefano Zampini   PetscFunctionReturn(0);
316da1bb401SStefano Zampini }
317da1bb401SStefano Zampini EXTERN_C_END
318da1bb401SStefano Zampini #undef __FUNCT__
319da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCGetDirichletBoundaries"
320da1bb401SStefano Zampini /*@
321da1bb401SStefano Zampini  PCBDDCGetDirichletBoundaries - Get index set defining subdomain part (in local ordering)
322da1bb401SStefano Zampini                                 of Dirichlet boundaries for the global problem.
323da1bb401SStefano Zampini 
324da1bb401SStefano Zampini    Not collective
325da1bb401SStefano Zampini 
326da1bb401SStefano Zampini    Input Parameters:
327da1bb401SStefano Zampini +  pc - the preconditioning context
328da1bb401SStefano Zampini 
329da1bb401SStefano Zampini    Output Parameters:
330da1bb401SStefano Zampini +  DirichletBoundaries - index set defining the subdomain part of Dirichlet boundaries
331da1bb401SStefano Zampini 
332da1bb401SStefano Zampini    Level: intermediate
333da1bb401SStefano Zampini 
334da1bb401SStefano Zampini    Notes:
335da1bb401SStefano Zampini 
336da1bb401SStefano Zampini .seealso: PCBDDC
337da1bb401SStefano Zampini @*/
338da1bb401SStefano Zampini PetscErrorCode PCBDDCGetDirichletBoundaries(PC pc,IS *DirichletBoundaries)
339da1bb401SStefano Zampini {
340da1bb401SStefano Zampini   PetscErrorCode ierr;
341da1bb401SStefano Zampini 
342da1bb401SStefano Zampini   PetscFunctionBegin;
343da1bb401SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
344da1bb401SStefano Zampini   ierr = PetscUseMethod(pc,"PCBDDCGetDirichletBoundaries_C",(PC,IS*),(pc,DirichletBoundaries));CHKERRQ(ierr);
345da1bb401SStefano Zampini   PetscFunctionReturn(0);
346da1bb401SStefano Zampini }
347da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
348da1bb401SStefano Zampini EXTERN_C_BEGIN
349da1bb401SStefano Zampini #undef __FUNCT__
35053cdbc3dSStefano Zampini #define __FUNCT__ "PCBDDCGetNeumannBoundaries_BDDC"
35153cdbc3dSStefano Zampini static PetscErrorCode PCBDDCGetNeumannBoundaries_BDDC(PC pc,IS *NeumannBoundaries)
35253cdbc3dSStefano Zampini {
35353cdbc3dSStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
35453cdbc3dSStefano Zampini 
35553cdbc3dSStefano Zampini   PetscFunctionBegin;
35653cdbc3dSStefano Zampini   *NeumannBoundaries = pcbddc->NeumannBoundaries;
35753cdbc3dSStefano Zampini   PetscFunctionReturn(0);
35853cdbc3dSStefano Zampini }
35953cdbc3dSStefano Zampini EXTERN_C_END
36053cdbc3dSStefano Zampini #undef __FUNCT__
36153cdbc3dSStefano Zampini #define __FUNCT__ "PCBDDCGetNeumannBoundaries"
36253cdbc3dSStefano Zampini /*@
363da1bb401SStefano Zampini  PCBDDCGetNeumannBoundaries - Get index set defining subdomain part (in local ordering)
364da1bb401SStefano Zampini                               of Neumann boundaries for the global problem.
36553cdbc3dSStefano Zampini 
3669c0446d6SStefano Zampini    Not collective
36753cdbc3dSStefano Zampini 
36853cdbc3dSStefano Zampini    Input Parameters:
36953cdbc3dSStefano Zampini +  pc - the preconditioning context
37053cdbc3dSStefano Zampini 
37153cdbc3dSStefano Zampini    Output Parameters:
37253cdbc3dSStefano Zampini +  NeumannBoundaries - index set defining the subdomain part of Neumann boundaries
37353cdbc3dSStefano Zampini 
37453cdbc3dSStefano Zampini    Level: intermediate
37553cdbc3dSStefano Zampini 
37653cdbc3dSStefano Zampini    Notes:
37753cdbc3dSStefano Zampini 
37853cdbc3dSStefano Zampini .seealso: PCBDDC
37953cdbc3dSStefano Zampini @*/
38053cdbc3dSStefano Zampini PetscErrorCode PCBDDCGetNeumannBoundaries(PC pc,IS *NeumannBoundaries)
38153cdbc3dSStefano Zampini {
38253cdbc3dSStefano Zampini   PetscErrorCode ierr;
38353cdbc3dSStefano Zampini 
38453cdbc3dSStefano Zampini   PetscFunctionBegin;
38553cdbc3dSStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
38653cdbc3dSStefano Zampini   ierr = PetscUseMethod(pc,"PCBDDCGetNeumannBoundaries_C",(PC,IS*),(pc,NeumannBoundaries));CHKERRQ(ierr);
3870c7d97c5SJed Brown   PetscFunctionReturn(0);
3880c7d97c5SJed Brown }
38936e030ebSStefano Zampini /* -------------------------------------------------------------------------- */
39036e030ebSStefano Zampini EXTERN_C_BEGIN
39136e030ebSStefano Zampini #undef __FUNCT__
392da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetLocalAdjacencyGraph_BDDC"
3931a83f524SJed Brown static PetscErrorCode PCBDDCSetLocalAdjacencyGraph_BDDC(PC pc, PetscInt nvtxs,const PetscInt xadj[],const PetscInt adjncy[], PetscCopyMode copymode)
39436e030ebSStefano Zampini {
39536e030ebSStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
396da1bb401SStefano Zampini   PCBDDCGraph    mat_graph=pcbddc->mat_graph;
397da1bb401SStefano Zampini   PetscErrorCode ierr;
39836e030ebSStefano Zampini 
39936e030ebSStefano Zampini   PetscFunctionBegin;
400da1bb401SStefano Zampini   mat_graph->nvtxs=nvtxs;
401da1bb401SStefano Zampini   ierr = PetscFree(mat_graph->xadj);CHKERRQ(ierr);
402da1bb401SStefano Zampini   ierr = PetscFree(mat_graph->adjncy);CHKERRQ(ierr);
403da1bb401SStefano Zampini   if (copymode == PETSC_COPY_VALUES) {
404da1bb401SStefano Zampini     ierr = PetscMalloc((mat_graph->nvtxs+1)*sizeof(PetscInt),&mat_graph->xadj);CHKERRQ(ierr);
405da1bb401SStefano Zampini     ierr = PetscMalloc(xadj[mat_graph->nvtxs]*sizeof(PetscInt),&mat_graph->adjncy);CHKERRQ(ierr);
406da1bb401SStefano Zampini     ierr = PetscMemcpy(mat_graph->xadj,xadj,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr);
407da1bb401SStefano Zampini     ierr = PetscMemcpy(mat_graph->adjncy,adjncy,xadj[mat_graph->nvtxs]*sizeof(PetscInt));CHKERRQ(ierr);
408da1bb401SStefano Zampini   } else if (copymode == PETSC_OWN_POINTER) {
4091a83f524SJed Brown     mat_graph->xadj = (PetscInt*)xadj;
4101a83f524SJed Brown     mat_graph->adjncy = (PetscInt*)adjncy;
411da1bb401SStefano Zampini   } else {
412da1bb401SStefano Zampini     SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_SUP,"Unsupported copy mode %d in %s\n",copymode,__FUNCT__);
413da1bb401SStefano Zampini   }
41436e030ebSStefano Zampini   PetscFunctionReturn(0);
41536e030ebSStefano Zampini }
41636e030ebSStefano Zampini EXTERN_C_END
41736e030ebSStefano Zampini #undef __FUNCT__
418da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetLocalAdjacencyGraph"
41936e030ebSStefano Zampini /*@
420da1bb401SStefano Zampini  PCBDDCSetLocalAdjacencyGraph - Set CSR graph of local matrix for use of PCBDDC.
42136e030ebSStefano Zampini 
42236e030ebSStefano Zampini    Not collective
42336e030ebSStefano Zampini 
42436e030ebSStefano Zampini    Input Parameters:
42536e030ebSStefano Zampini +  pc - the preconditioning context
426da1bb401SStefano Zampini -  nvtxs - number of local vertices of the graph
427da1bb401SStefano Zampini -  xadj, adjncy - the CSR graph
428da1bb401SStefano Zampini -  copymode - either PETSC_COPY_VALUES or PETSC_OWN_POINTER. In the former case the user must free the array passed in;
429da1bb401SStefano Zampini                                                              in the latter case, memory must be obtained with PetscMalloc.
43036e030ebSStefano Zampini 
43136e030ebSStefano Zampini    Level: intermediate
43236e030ebSStefano Zampini 
43336e030ebSStefano Zampini    Notes:
43436e030ebSStefano Zampini 
43536e030ebSStefano Zampini .seealso: PCBDDC
43636e030ebSStefano Zampini @*/
4371a83f524SJed Brown PetscErrorCode PCBDDCSetLocalAdjacencyGraph(PC pc,PetscInt nvtxs,const PetscInt xadj[],const PetscInt adjncy[], PetscCopyMode copymode)
43836e030ebSStefano Zampini {
439da1bb401SStefano Zampini   PetscInt       nrows,ncols;
440da1bb401SStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
44136e030ebSStefano Zampini   PetscErrorCode ierr;
44236e030ebSStefano Zampini 
44336e030ebSStefano Zampini   PetscFunctionBegin;
44436e030ebSStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
445da1bb401SStefano Zampini   ierr = MatGetSize(matis->A,&nrows,&ncols);CHKERRQ(ierr);
446da1bb401SStefano Zampini   if (nvtxs != nrows) {
447da1bb401SStefano Zampini     SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Local adjacency size %d passed in %s differs from local problem size %d!\n",nvtxs,__FUNCT__,nrows);
448da1bb401SStefano Zampini   } else {
4491a83f524SJed Brown     ierr = PetscTryMethod(pc,"PCBDDCSetLocalAdjacencyGraph_C",(PC,PetscInt,const PetscInt[],const PetscInt[],PetscCopyMode),(pc,nvtxs,xadj,adjncy,copymode));CHKERRQ(ierr);
450da1bb401SStefano Zampini   }
45136e030ebSStefano Zampini   PetscFunctionReturn(0);
45236e030ebSStefano Zampini }
4539c0446d6SStefano Zampini /* -------------------------------------------------------------------------- */
4549c0446d6SStefano Zampini EXTERN_C_BEGIN
4559c0446d6SStefano Zampini #undef __FUNCT__
4569c0446d6SStefano Zampini #define __FUNCT__ "PCBDDCSetDofsSplitting_BDDC"
4579c0446d6SStefano Zampini static PetscErrorCode PCBDDCSetDofsSplitting_BDDC(PC pc,PetscInt n_is, IS ISForDofs[])
4589c0446d6SStefano Zampini {
4599c0446d6SStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
4609c0446d6SStefano Zampini   PetscInt i;
4619c0446d6SStefano Zampini   PetscErrorCode ierr;
4629c0446d6SStefano Zampini 
4639c0446d6SStefano Zampini   PetscFunctionBegin;
464da1bb401SStefano Zampini   /* Destroy ISes if they were already set */
4659c0446d6SStefano Zampini   for (i=0;i<pcbddc->n_ISForDofs;i++) {
4669c0446d6SStefano Zampini     ierr = ISDestroy(&pcbddc->ISForDofs[i]);CHKERRQ(ierr);
4679c0446d6SStefano Zampini   }
468d11ae9bbSstefano_zampini   ierr = PetscFree(pcbddc->ISForDofs);CHKERRQ(ierr);
469da1bb401SStefano Zampini   /* allocate space then set */
4709c0446d6SStefano Zampini   ierr = PetscMalloc(n_is*sizeof(IS),&pcbddc->ISForDofs);CHKERRQ(ierr);
4719c0446d6SStefano Zampini   for (i=0;i<n_is;i++) {
472da1bb401SStefano Zampini     ierr = PetscObjectReference((PetscObject)ISForDofs[i]);CHKERRQ(ierr);
473da1bb401SStefano Zampini     pcbddc->ISForDofs[i]=ISForDofs[i];
4749c0446d6SStefano Zampini   }
4759c0446d6SStefano Zampini   pcbddc->n_ISForDofs=n_is;
4769c0446d6SStefano Zampini   PetscFunctionReturn(0);
4779c0446d6SStefano Zampini }
4789c0446d6SStefano Zampini EXTERN_C_END
4799c0446d6SStefano Zampini #undef __FUNCT__
4809c0446d6SStefano Zampini #define __FUNCT__ "PCBDDCSetDofsSplitting"
4819c0446d6SStefano Zampini /*@
482da1bb401SStefano Zampini  PCBDDCSetDofsSplitting - Set index sets defining fields of local mat.
4839c0446d6SStefano Zampini 
4849c0446d6SStefano Zampini    Not collective
4859c0446d6SStefano Zampini 
4869c0446d6SStefano Zampini    Input Parameters:
4879c0446d6SStefano Zampini +  pc - the preconditioning context
488da1bb401SStefano Zampini -  n - number of index sets defining the fields
489da1bb401SStefano Zampini -  IS[] - array of IS describing the fields
4909c0446d6SStefano Zampini 
4919c0446d6SStefano Zampini    Level: intermediate
4929c0446d6SStefano Zampini 
4939c0446d6SStefano Zampini    Notes:
4949c0446d6SStefano Zampini 
4959c0446d6SStefano Zampini .seealso: PCBDDC
4969c0446d6SStefano Zampini @*/
4979c0446d6SStefano Zampini PetscErrorCode PCBDDCSetDofsSplitting(PC pc,PetscInt n_is, IS ISForDofs[])
4989c0446d6SStefano Zampini {
4999c0446d6SStefano Zampini   PetscErrorCode ierr;
5009c0446d6SStefano Zampini 
5019c0446d6SStefano Zampini   PetscFunctionBegin;
5029c0446d6SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
5039c0446d6SStefano Zampini   ierr = PetscTryMethod(pc,"PCBDDCSetDofsSplitting_C",(PC,PetscInt,IS[]),(pc,n_is,ISForDofs));CHKERRQ(ierr);
5049c0446d6SStefano Zampini   PetscFunctionReturn(0);
5059c0446d6SStefano Zampini }
506da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
507534831adSStefano Zampini #undef __FUNCT__
508534831adSStefano Zampini #define __FUNCT__ "PCPreSolve_BDDC"
509534831adSStefano Zampini /* -------------------------------------------------------------------------- */
510534831adSStefano Zampini /*
511534831adSStefano Zampini    PCPreSolve_BDDC - Changes the right hand side and (if necessary) the initial
512534831adSStefano Zampini                      guess if a transformation of basis approach has been selected.
5139c0446d6SStefano Zampini 
514534831adSStefano Zampini    Input Parameter:
515534831adSStefano Zampini +  pc - the preconditioner contex
516534831adSStefano Zampini 
517534831adSStefano Zampini    Application Interface Routine: PCPreSolve()
518534831adSStefano Zampini 
519534831adSStefano Zampini    Notes:
520534831adSStefano Zampini    The interface routine PCPreSolve() is not usually called directly by
521534831adSStefano Zampini    the user, but instead is called by KSPSolve().
522534831adSStefano Zampini */
523534831adSStefano Zampini static PetscErrorCode PCPreSolve_BDDC(PC pc, KSP ksp, Vec rhs, Vec x)
524534831adSStefano Zampini {
525534831adSStefano Zampini   PetscErrorCode ierr;
526534831adSStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
527534831adSStefano Zampini   PC_IS          *pcis = (PC_IS*)(pc->data);
528534831adSStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
529534831adSStefano Zampini   Mat            temp_mat;
5303972b0daSStefano Zampini   IS             dirIS;
5313972b0daSStefano Zampini   PetscInt       dirsize,i,*is_indices;
5323972b0daSStefano Zampini   PetscScalar    *array_x,*array_diagonal;
5333972b0daSStefano Zampini   Vec            used_vec;
5343972b0daSStefano Zampini   PetscBool      guess_nonzero;
535534831adSStefano Zampini 
536534831adSStefano Zampini   PetscFunctionBegin;
5373972b0daSStefano Zampini   if (x) {
5383972b0daSStefano Zampini     ierr = PetscObjectReference((PetscObject)x);CHKERRQ(ierr);
5393972b0daSStefano Zampini     used_vec = x;
5403972b0daSStefano Zampini   } else {
5413972b0daSStefano Zampini     ierr = PetscObjectReference((PetscObject)pcbddc->temp_solution);CHKERRQ(ierr);
5423972b0daSStefano Zampini     used_vec = pcbddc->temp_solution;
5433972b0daSStefano Zampini     ierr = VecSet(used_vec,0.0);CHKERRQ(ierr);
5443972b0daSStefano Zampini   }
5453972b0daSStefano Zampini   /* hack into ksp data structure PCPreSolve comes earlier in src/ksp/ksp/interface/itfunc.c */
5463972b0daSStefano Zampini   if (ksp) {
5473972b0daSStefano Zampini     ierr = KSPGetInitialGuessNonzero(ksp,&guess_nonzero);CHKERRQ(ierr);
5483972b0daSStefano Zampini     if ( !guess_nonzero ) {
5493972b0daSStefano Zampini       ierr = VecSet(used_vec,0.0);CHKERRQ(ierr);
5503972b0daSStefano Zampini     }
5513972b0daSStefano Zampini   }
5523972b0daSStefano Zampini   /* store the original rhs */
5533972b0daSStefano Zampini   ierr = VecCopy(rhs,pcbddc->original_rhs);CHKERRQ(ierr);
5543972b0daSStefano Zampini 
5553972b0daSStefano Zampini   /* Take into account zeroed rows -> change rhs and store solution removed */
5563972b0daSStefano Zampini   ierr = MatGetDiagonal(pc->pmat,pcis->vec1_global);CHKERRQ(ierr);
5573972b0daSStefano Zampini   ierr = VecPointwiseDivide(pcis->vec1_global,rhs,pcis->vec1_global);CHKERRQ(ierr);
5583972b0daSStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5593972b0daSStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5603972b0daSStefano Zampini   ierr = VecScatterBegin(matis->ctx,used_vec,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5613972b0daSStefano Zampini   ierr = VecScatterEnd  (matis->ctx,used_vec,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5623972b0daSStefano Zampini   ierr = PCBDDCGetDirichletBoundaries(pc,&dirIS);CHKERRQ(ierr);
5633972b0daSStefano Zampini   if (dirIS) {
5643972b0daSStefano Zampini     ierr = ISGetSize(dirIS,&dirsize);CHKERRQ(ierr);
5653972b0daSStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array_x);CHKERRQ(ierr);
5663972b0daSStefano Zampini     ierr = VecGetArray(pcis->vec2_N,&array_diagonal);CHKERRQ(ierr);
5673972b0daSStefano Zampini     ierr = ISGetIndices(dirIS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
5683972b0daSStefano Zampini     for (i=0;i<dirsize;i++) {
5693972b0daSStefano Zampini       array_x[is_indices[i]]=array_diagonal[is_indices[i]];
5703972b0daSStefano Zampini     }
5713972b0daSStefano Zampini     ierr = ISRestoreIndices(dirIS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
5723972b0daSStefano Zampini     ierr = VecRestoreArray(pcis->vec2_N,&array_diagonal);CHKERRQ(ierr);
5733972b0daSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array_x);CHKERRQ(ierr);
5743972b0daSStefano Zampini   }
5753972b0daSStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
5763972b0daSStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
577b76ba322SStefano Zampini 
5783972b0daSStefano Zampini   /* remove the computed solution from the rhs */
5793972b0daSStefano Zampini   ierr = VecScale(used_vec,-1.0);CHKERRQ(ierr);
5803972b0daSStefano Zampini   ierr = MatMultAdd(pc->pmat,used_vec,rhs,rhs);CHKERRQ(ierr);
5813972b0daSStefano Zampini   ierr = VecScale(used_vec,-1.0);CHKERRQ(ierr);
582b76ba322SStefano Zampini 
583b76ba322SStefano Zampini   /* store partially computed solution and set initial guess */
5843972b0daSStefano Zampini   if (x) {
5853972b0daSStefano Zampini     ierr = VecCopy(used_vec,pcbddc->temp_solution);CHKERRQ(ierr);
5863972b0daSStefano Zampini     ierr = VecSet(used_vec,0.0);CHKERRQ(ierr);
587b76ba322SStefano Zampini     if (pcbddc->use_exact_dirichlet) {
588b76ba322SStefano Zampini       ierr = VecScatterBegin(pcis->global_to_D,rhs,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
589b76ba322SStefano Zampini       ierr = VecScatterEnd  (pcis->global_to_D,rhs,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
590b76ba322SStefano Zampini       ierr = KSPSolve(pcbddc->ksp_D,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
591b76ba322SStefano Zampini       ierr = VecScatterBegin(pcis->global_to_D,pcis->vec2_D,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
592b76ba322SStefano Zampini       ierr = VecScatterEnd  (pcis->global_to_D,pcis->vec2_D,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
593b76ba322SStefano Zampini       if (ksp) {
594b76ba322SStefano Zampini         ierr = KSPSetInitialGuessNonzero(ksp,PETSC_TRUE);CHKERRQ(ierr);
595b76ba322SStefano Zampini       }
596b76ba322SStefano Zampini     }
5973972b0daSStefano Zampini   }
598b76ba322SStefano Zampini 
599b76ba322SStefano Zampini   /* rhs change of basis */
600b76ba322SStefano Zampini   if (pcbddc->usechangeofbasis) {
601b76ba322SStefano Zampini     /* swap pointers for local matrices */
602b76ba322SStefano Zampini     temp_mat = matis->A;
603b76ba322SStefano Zampini     matis->A = pcbddc->local_mat;
604b76ba322SStefano Zampini     pcbddc->local_mat = temp_mat;
605b76ba322SStefano Zampini     /* Get local rhs and apply transformation of basis */
606b76ba322SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,rhs,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
607b76ba322SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,rhs,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
608b76ba322SStefano Zampini     /* from original basis to modified basis */
609b76ba322SStefano Zampini     ierr = MatMultTranspose(pcbddc->ChangeOfBasisMatrix,pcis->vec1_B,pcis->vec2_B);CHKERRQ(ierr);
610b76ba322SStefano Zampini     /* put back modified values into the global vec using INSERT_VALUES copy mode */
611b76ba322SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec2_B,rhs,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
612b76ba322SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec2_B,rhs,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
6130bdf917eSStefano Zampini     if (ksp && pcbddc->NullSpace) {
6140bdf917eSStefano Zampini       ierr = MatNullSpaceRemove(pcbddc->NullSpace,used_vec,PETSC_NULL);CHKERRQ(ierr);
6150bdf917eSStefano Zampini       ierr = MatNullSpaceRemove(pcbddc->NullSpace,rhs,PETSC_NULL);CHKERRQ(ierr);
616b76ba322SStefano Zampini     }
6170bdf917eSStefano Zampini   }
6180bdf917eSStefano Zampini   ierr = VecDestroy(&used_vec);CHKERRQ(ierr);
619534831adSStefano Zampini   PetscFunctionReturn(0);
620534831adSStefano Zampini }
621534831adSStefano Zampini /* -------------------------------------------------------------------------- */
622534831adSStefano Zampini #undef __FUNCT__
623534831adSStefano Zampini #define __FUNCT__ "PCPostSolve_BDDC"
624534831adSStefano Zampini /* -------------------------------------------------------------------------- */
625534831adSStefano Zampini /*
626534831adSStefano Zampini    PCPostSolve_BDDC - Changes the computed solution if a transformation of basis
627534831adSStefano Zampini                      approach has been selected. Also, restores rhs to its original state.
628534831adSStefano Zampini 
629534831adSStefano Zampini    Input Parameter:
630534831adSStefano Zampini +  pc - the preconditioner contex
631534831adSStefano Zampini 
632534831adSStefano Zampini    Application Interface Routine: PCPostSolve()
633534831adSStefano Zampini 
634534831adSStefano Zampini    Notes:
635534831adSStefano Zampini    The interface routine PCPostSolve() is not usually called directly by
636534831adSStefano Zampini    the user, but instead is called by KSPSolve().
637534831adSStefano Zampini */
638534831adSStefano Zampini static PetscErrorCode PCPostSolve_BDDC(PC pc, KSP ksp, Vec rhs, Vec x)
639534831adSStefano Zampini {
640534831adSStefano Zampini   PetscErrorCode ierr;
641534831adSStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
642534831adSStefano Zampini   PC_IS          *pcis = (PC_IS*)(pc->data);
643534831adSStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
644534831adSStefano Zampini   Mat            temp_mat;
645534831adSStefano Zampini 
646534831adSStefano Zampini   PetscFunctionBegin;
647534831adSStefano Zampini   if (pcbddc->usechangeofbasis) {
648534831adSStefano Zampini     /* swap pointers for local matrices */
649534831adSStefano Zampini     temp_mat = matis->A;
650534831adSStefano Zampini     matis->A = pcbddc->local_mat;
651534831adSStefano Zampini     pcbddc->local_mat = temp_mat;
652534831adSStefano Zampini     /* restore rhs to its original state */
6533425bc38SStefano Zampini     if (rhs) {
6543425bc38SStefano Zampini       ierr = VecCopy(pcbddc->original_rhs,rhs);CHKERRQ(ierr);
6553425bc38SStefano Zampini     }
656534831adSStefano Zampini     /* Get Local boundary and apply transformation of basis to solution vector */
657534831adSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,x,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
658534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,x,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
659534831adSStefano Zampini     /* from modified basis to original basis */
660534831adSStefano Zampini     ierr = MatMult(pcbddc->ChangeOfBasisMatrix,pcis->vec1_B,pcis->vec2_B);CHKERRQ(ierr);
661534831adSStefano Zampini     /* put back modified values into the global vec using INSERT_VALUES copy mode */
662534831adSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec2_B,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
663534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec2_B,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
664534831adSStefano Zampini   }
6653972b0daSStefano Zampini   /* add solution removed in presolve */
6663425bc38SStefano Zampini   if (x) {
6673425bc38SStefano Zampini     ierr = VecAXPY(x,1.0,pcbddc->temp_solution);CHKERRQ(ierr);
6683425bc38SStefano Zampini   }
669534831adSStefano Zampini   PetscFunctionReturn(0);
670534831adSStefano Zampini }
671534831adSStefano Zampini /* -------------------------------------------------------------------------- */
67253cdbc3dSStefano Zampini #undef __FUNCT__
67353cdbc3dSStefano Zampini #define __FUNCT__ "PCSetUp_BDDC"
6740c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
6750c7d97c5SJed Brown /*
6760c7d97c5SJed Brown    PCSetUp_BDDC - Prepares for the use of the BDDC preconditioner
6770c7d97c5SJed Brown                   by setting data structures and options.
6780c7d97c5SJed Brown 
6790c7d97c5SJed Brown    Input Parameter:
68053cdbc3dSStefano Zampini +  pc - the preconditioner context
6810c7d97c5SJed Brown 
6820c7d97c5SJed Brown    Application Interface Routine: PCSetUp()
6830c7d97c5SJed Brown 
6840c7d97c5SJed Brown    Notes:
6850c7d97c5SJed Brown    The interface routine PCSetUp() is not usually called directly by
6860c7d97c5SJed Brown    the user, but instead is called by PCApply() if necessary.
6870c7d97c5SJed Brown */
68853cdbc3dSStefano Zampini PetscErrorCode PCSetUp_BDDC(PC pc)
6890c7d97c5SJed Brown {
6900c7d97c5SJed Brown   PetscErrorCode ierr;
6910c7d97c5SJed Brown   PC_BDDC*       pcbddc   = (PC_BDDC*)pc->data;
6920c7d97c5SJed Brown 
6930c7d97c5SJed Brown   PetscFunctionBegin;
6940c7d97c5SJed Brown   if (!pc->setupcalled) {
6953b03a366Sstefano_zampini     /* For BDDC we need to define a local "Neumann" problem different to that defined in PCISSetup
6969c0446d6SStefano Zampini        So, we set to pcnone the Neumann problem of pcis in order to avoid unneeded computation
6970c7d97c5SJed Brown        Also, we decide to directly build the (same) Dirichlet problem */
6980c7d97c5SJed Brown     ierr = PetscOptionsSetValue("-is_localN_pc_type","none");CHKERRQ(ierr);
6990c7d97c5SJed Brown     ierr = PetscOptionsSetValue("-is_localD_pc_type","none");CHKERRQ(ierr);
7000c7d97c5SJed Brown     /* Set up all the "iterative substructuring" common block */
7010bdf917eSStefano Zampini 
7020c7d97c5SJed Brown     ierr = PCISSetUp(pc);CHKERRQ(ierr);
7033b03a366Sstefano_zampini     /* Get stdout for dbg */
704e269702eSStefano Zampini     if (pcbddc->dbg_flag) {
705e269702eSStefano Zampini       ierr = PetscViewerASCIIGetStdout(((PetscObject)pc)->comm,&pcbddc->dbg_viewer);CHKERRQ(ierr);
706e269702eSStefano Zampini       ierr = PetscViewerASCIISynchronizedAllow(pcbddc->dbg_viewer,PETSC_TRUE);CHKERRQ(ierr);
707e269702eSStefano Zampini     }
7083b03a366Sstefano_zampini     /* Analyze local interface */
7090c7d97c5SJed Brown     ierr = PCBDDCManageLocalBoundaries(pc);CHKERRQ(ierr);
7103b03a366Sstefano_zampini     /* Set up local constraint matrix */
7113b03a366Sstefano_zampini     ierr = PCBDDCCreateConstraintMatrix(pc);CHKERRQ(ierr);
7120c7d97c5SJed Brown     /* Create coarse and local stuffs used for evaluating action of preconditioner */
7130c7d97c5SJed Brown     ierr = PCBDDCCoarseSetUp(pc);CHKERRQ(ierr);
7140c7d97c5SJed Brown   }
7150c7d97c5SJed Brown   PetscFunctionReturn(0);
7160c7d97c5SJed Brown }
7170c7d97c5SJed Brown 
7180c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
7190c7d97c5SJed Brown /*
7200c7d97c5SJed Brown    PCApply_BDDC - Applies the BDDC preconditioner to a vector.
7210c7d97c5SJed Brown 
7220c7d97c5SJed Brown    Input Parameters:
7230c7d97c5SJed Brown .  pc - the preconditioner context
7240c7d97c5SJed Brown .  r - input vector (global)
7250c7d97c5SJed Brown 
7260c7d97c5SJed Brown    Output Parameter:
7270c7d97c5SJed Brown .  z - output vector (global)
7280c7d97c5SJed Brown 
7290c7d97c5SJed Brown    Application Interface Routine: PCApply()
7300c7d97c5SJed Brown  */
7310c7d97c5SJed Brown #undef __FUNCT__
7320c7d97c5SJed Brown #define __FUNCT__ "PCApply_BDDC"
73353cdbc3dSStefano Zampini PetscErrorCode PCApply_BDDC(PC pc,Vec r,Vec z)
7340c7d97c5SJed Brown {
7350c7d97c5SJed Brown   PC_IS             *pcis = (PC_IS*)(pc->data);
7360c7d97c5SJed Brown   PC_BDDC           *pcbddc = (PC_BDDC*)(pc->data);
7370c7d97c5SJed Brown   PetscErrorCode    ierr;
7383b03a366Sstefano_zampini   const PetscScalar one = 1.0;
7393b03a366Sstefano_zampini   const PetscScalar m_one = -1.0;
7402617d88aSStefano Zampini   const PetscScalar zero = 0.0;
7410c7d97c5SJed Brown 
7420c7d97c5SJed Brown /* This code is similar to that provided in nn.c for PCNN
7430c7d97c5SJed Brown    NN interface preconditioner changed to BDDC
74429622bf0SStefano Zampini    Added support for M_3 preconditioner in the reference article (code is active if pcbddc->inexact_prec_type = PETSC_TRUE) */
7450c7d97c5SJed Brown 
7460c7d97c5SJed Brown   PetscFunctionBegin;
747b76ba322SStefano Zampini   if (!pcbddc->use_exact_dirichlet) {
7480c7d97c5SJed Brown     /* First Dirichlet solve */
7490c7d97c5SJed Brown     ierr = VecScatterBegin(pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7500c7d97c5SJed Brown     ierr = VecScatterEnd  (pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
75153cdbc3dSStefano Zampini     ierr = KSPSolve(pcbddc->ksp_D,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
7520c7d97c5SJed Brown     /*
7530c7d97c5SJed Brown       Assembling right hand side for BDDC operator
7540c7d97c5SJed Brown       - vec1_D for the Dirichlet part (if needed, i.e. prec_flag=PETSC_TRUE)
7550c7d97c5SJed Brown       - the interface part of the global vector z
7560c7d97c5SJed Brown     */
7570c7d97c5SJed Brown     ierr = VecScale(pcis->vec2_D,m_one);CHKERRQ(ierr);
7580c7d97c5SJed Brown     ierr = MatMult(pcis->A_BI,pcis->vec2_D,pcis->vec1_B);CHKERRQ(ierr);
75929622bf0SStefano Zampini     if (pcbddc->inexact_prec_type) { ierr = MatMultAdd(pcis->A_II,pcis->vec2_D,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); }
7600c7d97c5SJed Brown     ierr = VecScale(pcis->vec2_D,m_one);CHKERRQ(ierr);
7610c7d97c5SJed Brown     ierr = VecCopy(r,z);CHKERRQ(ierr);
7620c7d97c5SJed Brown     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
7630c7d97c5SJed Brown     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
7642617d88aSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7652617d88aSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
766b76ba322SStefano Zampini   } else {
767b76ba322SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,r,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
768b76ba322SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,r,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7690bdf917eSStefano Zampini     ierr = VecSet(pcis->vec1_D,zero);CHKERRQ(ierr);
770b76ba322SStefano Zampini     ierr = VecSet(pcis->vec2_D,zero);CHKERRQ(ierr);
771b76ba322SStefano Zampini   }
772b76ba322SStefano Zampini 
773b76ba322SStefano Zampini   /* Apply partition of unity */
7742617d88aSStefano Zampini   ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr);
7752617d88aSStefano Zampini 
7762617d88aSStefano Zampini   /* Apply interface preconditioner
7772617d88aSStefano Zampini      input/output vecs: pcis->vec1_B and pcis->vec1_D */
7782617d88aSStefano Zampini   ierr = PCBDDCApplyInterfacePreconditioner(pc);CHKERRQ(ierr);
7792617d88aSStefano Zampini 
7802617d88aSStefano Zampini   /* Apply partition of unity and sum boundary values */
7812617d88aSStefano Zampini   ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr);
7822617d88aSStefano Zampini   ierr = VecSet(z,zero);CHKERRQ(ierr);
7832617d88aSStefano Zampini   ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
7842617d88aSStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
7850c7d97c5SJed Brown 
7863b03a366Sstefano_zampini   /* Second Dirichlet solve and assembling of output */
7870c7d97c5SJed Brown   ierr = VecScatterBegin(pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7880c7d97c5SJed Brown   ierr = VecScatterEnd  (pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7890c7d97c5SJed Brown   ierr = MatMult(pcis->A_IB,pcis->vec1_B,pcis->vec3_D);CHKERRQ(ierr);
79029622bf0SStefano Zampini   if (pcbddc->inexact_prec_type) { ierr = MatMultAdd(pcis->A_II,pcis->vec1_D,pcis->vec3_D,pcis->vec3_D);CHKERRQ(ierr); }
79153cdbc3dSStefano Zampini   ierr = KSPSolve(pcbddc->ksp_D,pcis->vec3_D,pcbddc->vec4_D);CHKERRQ(ierr);
7920c7d97c5SJed Brown   ierr = VecScale(pcbddc->vec4_D,m_one);CHKERRQ(ierr);
79329622bf0SStefano Zampini   if (pcbddc->inexact_prec_type) { ierr = VecAXPY (pcbddc->vec4_D,one,pcis->vec1_D);CHKERRQ(ierr); }
7940c7d97c5SJed Brown   ierr = VecAXPY (pcis->vec2_D,one,pcbddc->vec4_D);CHKERRQ(ierr);
7950c7d97c5SJed Brown   ierr = VecScatterBegin(pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
7960c7d97c5SJed Brown   ierr = VecScatterEnd  (pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
7970c7d97c5SJed Brown   PetscFunctionReturn(0);
7980c7d97c5SJed Brown 
7990c7d97c5SJed Brown }
800da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
801da1bb401SStefano Zampini #undef __FUNCT__
802da1bb401SStefano Zampini #define __FUNCT__ "PCDestroy_BDDC"
803da1bb401SStefano Zampini PetscErrorCode PCDestroy_BDDC(PC pc)
804da1bb401SStefano Zampini {
805da1bb401SStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
8060bdf917eSStefano Zampini   PetscInt       i;
807da1bb401SStefano Zampini   PetscErrorCode ierr;
808da1bb401SStefano Zampini 
809da1bb401SStefano Zampini   PetscFunctionBegin;
810da1bb401SStefano Zampini   /* free data created by PCIS */
811da1bb401SStefano Zampini   ierr = PCISDestroy(pc);CHKERRQ(ierr);
812da1bb401SStefano Zampini   /* free BDDC data  */
8130bdf917eSStefano Zampini   ierr = MatNullSpaceDestroy(&pcbddc->CoarseNullSpace);CHKERRQ(ierr);
8140bdf917eSStefano Zampini   ierr = MatNullSpaceDestroy(&pcbddc->NullSpace);CHKERRQ(ierr);
8153972b0daSStefano Zampini   ierr = VecDestroy(&pcbddc->temp_solution);CHKERRQ(ierr);
816534831adSStefano Zampini   ierr = VecDestroy(&pcbddc->original_rhs);CHKERRQ(ierr);
817534831adSStefano Zampini   ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr);
818534831adSStefano Zampini   ierr = MatDestroy(&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr);
819da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->coarse_vec);CHKERRQ(ierr);
820da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->coarse_rhs);CHKERRQ(ierr);
821da1bb401SStefano Zampini   ierr = KSPDestroy(&pcbddc->coarse_ksp);CHKERRQ(ierr);
822da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->coarse_mat);CHKERRQ(ierr);
823da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->coarse_phi_B);CHKERRQ(ierr);
824da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->coarse_phi_D);CHKERRQ(ierr);
825da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec1_P);CHKERRQ(ierr);
826da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec1_C);CHKERRQ(ierr);
827da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->local_auxmat1);CHKERRQ(ierr);
828da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->local_auxmat2);CHKERRQ(ierr);
829da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec1_R);CHKERRQ(ierr);
830da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec2_R);CHKERRQ(ierr);
831da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec4_D);CHKERRQ(ierr);
832da1bb401SStefano Zampini   ierr = VecScatterDestroy(&pcbddc->R_to_B);CHKERRQ(ierr);
833da1bb401SStefano Zampini   ierr = VecScatterDestroy(&pcbddc->R_to_D);CHKERRQ(ierr);
834da1bb401SStefano Zampini   ierr = VecScatterDestroy(&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr);
835da1bb401SStefano Zampini   ierr = KSPDestroy(&pcbddc->ksp_D);CHKERRQ(ierr);
836da1bb401SStefano Zampini   ierr = KSPDestroy(&pcbddc->ksp_R);CHKERRQ(ierr);
837da1bb401SStefano Zampini   ierr = ISDestroy(&pcbddc->NeumannBoundaries);CHKERRQ(ierr);
838da1bb401SStefano Zampini   ierr = ISDestroy(&pcbddc->DirichletBoundaries);CHKERRQ(ierr);
839da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->ConstraintMatrix);CHKERRQ(ierr);
840da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->local_primal_indices);CHKERRQ(ierr);
841da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->replicated_local_primal_indices);CHKERRQ(ierr);
8420bdf917eSStefano Zampini   ierr = PetscFree(pcbddc->replicated_local_primal_values);CHKERRQ(ierr);
843da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->local_primal_displacements);CHKERRQ(ierr);
844da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->local_primal_sizes);CHKERRQ(ierr);
845da1bb401SStefano Zampini   for (i=0;i<pcbddc->n_ISForDofs;i++) { ierr = ISDestroy(&pcbddc->ISForDofs[i]);CHKERRQ(ierr); }
846da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->ISForDofs);CHKERRQ(ierr);
847da1bb401SStefano Zampini   for (i=0;i<pcbddc->n_ISForFaces;i++) { ierr = ISDestroy(&pcbddc->ISForFaces[i]);CHKERRQ(ierr); }
848da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->ISForFaces);CHKERRQ(ierr);
849da1bb401SStefano Zampini   for (i=0;i<pcbddc->n_ISForEdges;i++) { ierr = ISDestroy(&pcbddc->ISForEdges[i]);CHKERRQ(ierr); }
850da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->ISForEdges);CHKERRQ(ierr);
851da1bb401SStefano Zampini   ierr = ISDestroy(&pcbddc->ISForVertices);CHKERRQ(ierr);
8523972b0daSStefano Zampini   /* Free graph structure */
853da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->xadj);CHKERRQ(ierr);
854da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->adjncy);CHKERRQ(ierr);
855142dfd88SStefano Zampini   if (pcbddc->mat_graph->nvtxs) {
856da1bb401SStefano Zampini     ierr = PetscFree(pcbddc->mat_graph->neighbours_set[0]);CHKERRQ(ierr);
857142dfd88SStefano Zampini   }
858da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->neighbours_set);CHKERRQ(ierr);
8593972b0daSStefano Zampini   ierr = PetscFree4(pcbddc->mat_graph->where,pcbddc->mat_graph->count,pcbddc->mat_graph->cptr,pcbddc->mat_graph->queue);CHKERRQ(ierr);
8603972b0daSStefano Zampini   ierr = PetscFree2(pcbddc->mat_graph->which_dof,pcbddc->mat_graph->touched);CHKERRQ(ierr);
8613972b0daSStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->where_ncmps);CHKERRQ(ierr);
862da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph);CHKERRQ(ierr);
8633425bc38SStefano Zampini   /* remove functions */
8644fad6a16SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseningRatio_C","",PETSC_NULL);CHKERRQ(ierr);
8654fad6a16SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetMaxLevels_C","",PETSC_NULL);CHKERRQ(ierr);
8660bdf917eSStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNullSpace_C","",PETSC_NULL);CHKERRQ(ierr);
8673425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDirichletBoundaries_C","",PETSC_NULL);CHKERRQ(ierr);
8683425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNeumannBoundaries_C","",PETSC_NULL);CHKERRQ(ierr);
8693425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetDirichletBoundaries_C","",PETSC_NULL);CHKERRQ(ierr);
8703425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetNeumannBoundaries_C","",PETSC_NULL);CHKERRQ(ierr);
8713425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseProblemType_C","",PETSC_NULL);CHKERRQ(ierr);
8723425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDofsSplitting_C","",PETSC_NULL);CHKERRQ(ierr);
8733425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetLocalAdjacencyGraph_C","",PETSC_NULL);CHKERRQ(ierr);
8743425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPreSolve_C","",PETSC_NULL);CHKERRQ(ierr);
8753425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPostSolve_C","",PETSC_NULL);CHKERRQ(ierr);
8763425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCCreateFETIDPOperators_C","",PETSC_NULL);CHKERRQ(ierr);
8773425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetRHS_C","",PETSC_NULL);CHKERRQ(ierr);
8783425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetSolution_C","",PETSC_NULL);CHKERRQ(ierr);
879da1bb401SStefano Zampini   /* Free the private data structure that was hanging off the PC */
880da1bb401SStefano Zampini   ierr = PetscFree(pcbddc);CHKERRQ(ierr);
881da1bb401SStefano Zampini   PetscFunctionReturn(0);
882da1bb401SStefano Zampini }
8833425bc38SStefano Zampini /* -------------------------------------------------------------------------- */
8843425bc38SStefano Zampini EXTERN_C_BEGIN
8853425bc38SStefano Zampini #undef __FUNCT__
8863425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetRHS_BDDC"
8873425bc38SStefano Zampini static PetscErrorCode PCBDDCMatFETIDPGetRHS_BDDC(Mat fetidp_mat, Vec standard_rhs, Vec fetidp_flux_rhs)
8883425bc38SStefano Zampini {
8893425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
8903425bc38SStefano Zampini   PC_IS*         pcis;
8913425bc38SStefano Zampini   PC_BDDC*       pcbddc;
8923425bc38SStefano Zampini   PetscErrorCode ierr;
8930c7d97c5SJed Brown 
8943425bc38SStefano Zampini   PetscFunctionBegin;
8953425bc38SStefano Zampini   ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr);
8963425bc38SStefano Zampini   pcis = (PC_IS*)mat_ctx->pc->data;
8973425bc38SStefano Zampini   pcbddc = (PC_BDDC*)mat_ctx->pc->data;
8983425bc38SStefano Zampini 
8993425bc38SStefano Zampini   /* change of basis for physical rhs if needed
9003425bc38SStefano Zampini      It also changes the rhs in case of dirichlet boundaries */
9013425bc38SStefano Zampini   (*mat_ctx->pc->ops->presolve)(mat_ctx->pc,PETSC_NULL,standard_rhs,PETSC_NULL);
9023425bc38SStefano Zampini   /* store vectors for computation of fetidp final solution */
9033425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->global_to_D,standard_rhs,mat_ctx->temp_solution_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9043425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_D,standard_rhs,mat_ctx->temp_solution_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9053425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9063425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9073425bc38SStefano Zampini   /* scale rhs since it should be unassembled */
9083425bc38SStefano Zampini   ierr = VecPointwiseMult(mat_ctx->temp_solution_B,pcis->D,mat_ctx->temp_solution_B);CHKERRQ(ierr);
90929622bf0SStefano Zampini   if (!pcbddc->inexact_prec_type) {
9103425bc38SStefano Zampini     /* compute partially subassembled Schur complement right-hand side */
9113425bc38SStefano Zampini     ierr = KSPSolve(pcbddc->ksp_D,mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr);
9123425bc38SStefano Zampini     ierr = MatMult(pcis->A_BI,pcis->vec1_D,pcis->vec1_B);CHKERRQ(ierr);
9133425bc38SStefano Zampini     ierr = VecAXPY(mat_ctx->temp_solution_B,-1.0,pcis->vec1_B);CHKERRQ(ierr);
9143425bc38SStefano Zampini     ierr = VecSet(standard_rhs,0.0);CHKERRQ(ierr);
9153425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,mat_ctx->temp_solution_B,standard_rhs,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
9163425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,mat_ctx->temp_solution_B,standard_rhs,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
9173425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9183425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9193425bc38SStefano Zampini     ierr = VecPointwiseMult(mat_ctx->temp_solution_B,pcis->D,mat_ctx->temp_solution_B);CHKERRQ(ierr);
9203425bc38SStefano Zampini   }
9213425bc38SStefano Zampini   /* BDDC rhs */
9223425bc38SStefano Zampini   ierr = VecCopy(mat_ctx->temp_solution_B,pcis->vec1_B);CHKERRQ(ierr);
92329622bf0SStefano Zampini   if (pcbddc->inexact_prec_type) {
9243425bc38SStefano Zampini     ierr = VecCopy(mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr);
9253425bc38SStefano Zampini   }
9263425bc38SStefano Zampini   /* apply BDDC */
9273425bc38SStefano Zampini   ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr);
9283425bc38SStefano Zampini   /* Application of B_delta and assembling of rhs for fetidp fluxes */
9293425bc38SStefano Zampini   ierr = VecSet(fetidp_flux_rhs,0.0);CHKERRQ(ierr);
9303425bc38SStefano Zampini   ierr = MatMult(mat_ctx->B_delta,pcis->vec1_B,mat_ctx->lambda_local);CHKERRQ(ierr);
9313425bc38SStefano Zampini   ierr = VecScatterBegin(mat_ctx->l2g_lambda,mat_ctx->lambda_local,fetidp_flux_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9323425bc38SStefano Zampini   ierr = VecScatterEnd  (mat_ctx->l2g_lambda,mat_ctx->lambda_local,fetidp_flux_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9333425bc38SStefano Zampini   /* restore original rhs */
9343425bc38SStefano Zampini   ierr = VecCopy(pcbddc->original_rhs,standard_rhs);CHKERRQ(ierr);
9353425bc38SStefano Zampini   PetscFunctionReturn(0);
9363425bc38SStefano Zampini }
9373425bc38SStefano Zampini EXTERN_C_END
9383425bc38SStefano Zampini #undef __FUNCT__
9393425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetRHS"
9403425bc38SStefano Zampini /*@
9413425bc38SStefano Zampini  PCBDDCMatFETIDPGetRHS - Get rhs for FETIDP linear system.
9423425bc38SStefano Zampini 
9433425bc38SStefano Zampini    Collective
9443425bc38SStefano Zampini 
9453425bc38SStefano Zampini    Input Parameters:
9463425bc38SStefano Zampini +  fetidp_mat   - the FETIDP mat obtained by a call to PCBDDCCreateFETIDPOperators
9473425bc38SStefano Zampini +  standard_rhs - the rhs of your linear system
9483425bc38SStefano Zampini 
9493425bc38SStefano Zampini    Output Parameters:
9503425bc38SStefano Zampini +  fetidp_flux_rhs   - the rhs of the FETIDP linear system
9513425bc38SStefano Zampini 
9523425bc38SStefano Zampini    Level: developer
9533425bc38SStefano Zampini 
9543425bc38SStefano Zampini    Notes:
9553425bc38SStefano Zampini 
9563425bc38SStefano Zampini .seealso: PCBDDC
9573425bc38SStefano Zampini @*/
9583425bc38SStefano Zampini PetscErrorCode PCBDDCMatFETIDPGetRHS(Mat fetidp_mat, Vec standard_rhs, Vec fetidp_flux_rhs)
9593425bc38SStefano Zampini {
9603425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
9613425bc38SStefano Zampini   PetscErrorCode ierr;
9623425bc38SStefano Zampini 
9633425bc38SStefano Zampini   PetscFunctionBegin;
9643425bc38SStefano Zampini   ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr);
9653425bc38SStefano Zampini   ierr = PetscTryMethod(mat_ctx->pc,"PCBDDCMatFETIDPGetRHS_C",(Mat,Vec,Vec),(fetidp_mat,standard_rhs,fetidp_flux_rhs));CHKERRQ(ierr);
9663425bc38SStefano Zampini   PetscFunctionReturn(0);
9673425bc38SStefano Zampini }
9683425bc38SStefano Zampini /* -------------------------------------------------------------------------- */
9693425bc38SStefano Zampini EXTERN_C_BEGIN
9703425bc38SStefano Zampini #undef __FUNCT__
9713425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetSolution_BDDC"
9723425bc38SStefano Zampini static PetscErrorCode PCBDDCMatFETIDPGetSolution_BDDC(Mat fetidp_mat, Vec fetidp_flux_sol, Vec standard_sol)
9733425bc38SStefano Zampini {
9743425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
9753425bc38SStefano Zampini   PC_IS*         pcis;
9763425bc38SStefano Zampini   PC_BDDC*       pcbddc;
9773425bc38SStefano Zampini   PetscErrorCode ierr;
9783425bc38SStefano Zampini 
9793425bc38SStefano Zampini   PetscFunctionBegin;
9803425bc38SStefano Zampini   ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr);
9813425bc38SStefano Zampini   pcis = (PC_IS*)mat_ctx->pc->data;
9823425bc38SStefano Zampini   pcbddc = (PC_BDDC*)mat_ctx->pc->data;
9833425bc38SStefano Zampini 
9843425bc38SStefano Zampini   /* apply B_delta^T */
9853425bc38SStefano Zampini   ierr = VecScatterBegin(mat_ctx->l2g_lambda,fetidp_flux_sol,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
9863425bc38SStefano Zampini   ierr = VecScatterEnd  (mat_ctx->l2g_lambda,fetidp_flux_sol,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
9873425bc38SStefano Zampini   ierr = MatMultTranspose(mat_ctx->B_delta,mat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
9883425bc38SStefano Zampini   /* compute rhs for BDDC application */
9893425bc38SStefano Zampini   ierr = VecAYPX(pcis->vec1_B,-1.0,mat_ctx->temp_solution_B);CHKERRQ(ierr);
99029622bf0SStefano Zampini   if (pcbddc->inexact_prec_type) {
9913425bc38SStefano Zampini     ierr = VecCopy(mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr);
9923425bc38SStefano Zampini   }
9933425bc38SStefano Zampini   /* apply BDDC */
9943425bc38SStefano Zampini   ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr);
9953425bc38SStefano Zampini   /* put values into standard global vector */
9963425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
9973425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
99829622bf0SStefano Zampini   if (!pcbddc->inexact_prec_type) {
9993425bc38SStefano Zampini     /* compute values into the interior if solved for the partially subassembled Schur complement */
10003425bc38SStefano Zampini     ierr = MatMult(pcis->A_IB,pcis->vec1_B,pcis->vec1_D);CHKERRQ(ierr);
10013425bc38SStefano Zampini     ierr = VecAXPY(mat_ctx->temp_solution_D,-1.0,pcis->vec1_D);CHKERRQ(ierr);
10023425bc38SStefano Zampini     ierr = KSPSolve(pcbddc->ksp_D,mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr);
10033425bc38SStefano Zampini   }
10043425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->global_to_D,pcis->vec1_D,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
10053425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_D,pcis->vec1_D,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
10063425bc38SStefano Zampini   /* final change of basis if needed
10073425bc38SStefano Zampini      Is also sums the dirichlet part removed during RHS assembling */
10083425bc38SStefano Zampini   (*mat_ctx->pc->ops->postsolve)(mat_ctx->pc,PETSC_NULL,PETSC_NULL,standard_sol);
10093425bc38SStefano Zampini   PetscFunctionReturn(0);
10103425bc38SStefano Zampini 
10113425bc38SStefano Zampini }
10123425bc38SStefano Zampini EXTERN_C_END
10133425bc38SStefano Zampini #undef __FUNCT__
10143425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetSolution"
10153425bc38SStefano Zampini /*@
10163425bc38SStefano Zampini  PCBDDCMatFETIDPGetSolution - Get Solution for FETIDP linear system.
10173425bc38SStefano Zampini 
10183425bc38SStefano Zampini    Collective
10193425bc38SStefano Zampini 
10203425bc38SStefano Zampini    Input Parameters:
10213425bc38SStefano Zampini +  fetidp_mat        - the FETIDP mat obtained by a call to PCBDDCCreateFETIDPOperators
10223425bc38SStefano Zampini +  fetidp_flux_sol - the solution of the FETIDP linear system
10233425bc38SStefano Zampini 
10243425bc38SStefano Zampini    Output Parameters:
10253425bc38SStefano Zampini +  standard_sol      - the solution on the global domain
10263425bc38SStefano Zampini 
10273425bc38SStefano Zampini    Level: developer
10283425bc38SStefano Zampini 
10293425bc38SStefano Zampini    Notes:
10303425bc38SStefano Zampini 
10313425bc38SStefano Zampini .seealso: PCBDDC
10323425bc38SStefano Zampini @*/
10333425bc38SStefano Zampini PetscErrorCode PCBDDCMatFETIDPGetSolution(Mat fetidp_mat, Vec fetidp_flux_sol, Vec standard_sol)
10343425bc38SStefano Zampini {
10353425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
10363425bc38SStefano Zampini   PetscErrorCode ierr;
10373425bc38SStefano Zampini 
10383425bc38SStefano Zampini   PetscFunctionBegin;
10393425bc38SStefano Zampini   ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr);
10403425bc38SStefano Zampini   ierr = PetscTryMethod(mat_ctx->pc,"PCBDDCMatFETIDPGetSolution_C",(Mat,Vec,Vec),(fetidp_mat,fetidp_flux_sol,standard_sol));CHKERRQ(ierr);
10413425bc38SStefano Zampini   PetscFunctionReturn(0);
10423425bc38SStefano Zampini }
10433425bc38SStefano Zampini /* -------------------------------------------------------------------------- */
10443425bc38SStefano Zampini EXTERN_C_BEGIN
10453425bc38SStefano Zampini #undef __FUNCT__
10463425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPOperators_BDDC"
10473425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPOperators_BDDC(PC pc, Mat *fetidp_mat, PC *fetidp_pc)
10483425bc38SStefano Zampini {
10493425bc38SStefano Zampini   PETSC_EXTERN PetscErrorCode FETIDPMatMult(Mat,Vec,Vec);
10503425bc38SStefano Zampini   PETSC_EXTERN PetscErrorCode PCBDDCDestroyFETIDPMat(Mat);
10513425bc38SStefano Zampini   PETSC_EXTERN PetscErrorCode FETIDPPCApply(PC,Vec,Vec);
10523425bc38SStefano Zampini   PETSC_EXTERN PetscErrorCode PCBDDCDestroyFETIDPPC(PC);
10533425bc38SStefano Zampini 
10543425bc38SStefano Zampini   FETIDPMat_ctx  *fetidpmat_ctx;
10553425bc38SStefano Zampini   Mat            newmat;
10563425bc38SStefano Zampini   FETIDPPC_ctx  *fetidppc_ctx;
10573425bc38SStefano Zampini   PC             newpc;
10583425bc38SStefano Zampini   MPI_Comm       comm = ((PetscObject)pc)->comm;
10593425bc38SStefano Zampini   PetscErrorCode ierr;
10603425bc38SStefano Zampini 
10613425bc38SStefano Zampini   PetscFunctionBegin;
10623425bc38SStefano Zampini   /* FETIDP linear matrix */
10633425bc38SStefano Zampini   ierr = PCBDDCCreateFETIDPMatContext(pc, &fetidpmat_ctx);CHKERRQ(ierr);
10643425bc38SStefano Zampini   ierr = PCBDDCSetupFETIDPMatContext(fetidpmat_ctx);CHKERRQ(ierr);
10653425bc38SStefano Zampini   ierr = MatCreateShell(comm,PETSC_DECIDE,PETSC_DECIDE,fetidpmat_ctx->n_lambda,fetidpmat_ctx->n_lambda,fetidpmat_ctx,&newmat);CHKERRQ(ierr);
10663425bc38SStefano Zampini   ierr = MatShellSetOperation(newmat,MATOP_MULT,(void (*)(void))FETIDPMatMult);CHKERRQ(ierr);
10673425bc38SStefano Zampini   ierr = MatShellSetOperation(newmat,MATOP_DESTROY,(void (*)(void))PCBDDCDestroyFETIDPMat);CHKERRQ(ierr);
10683425bc38SStefano Zampini   ierr = MatSetUp(newmat);CHKERRQ(ierr);
10693425bc38SStefano Zampini   /* FETIDP preconditioner */
10703425bc38SStefano Zampini   ierr = PCBDDCCreateFETIDPPCContext(pc, &fetidppc_ctx);CHKERRQ(ierr);
10713425bc38SStefano Zampini   ierr = PCBDDCSetupFETIDPPCContext(newmat,fetidppc_ctx);CHKERRQ(ierr);
10723425bc38SStefano Zampini   ierr = PCCreate(comm,&newpc);CHKERRQ(ierr);
10733425bc38SStefano Zampini   ierr = PCSetType(newpc,PCSHELL);CHKERRQ(ierr);
10743425bc38SStefano Zampini   ierr = PCShellSetContext(newpc,fetidppc_ctx);CHKERRQ(ierr);
10753425bc38SStefano Zampini   ierr = PCShellSetApply(newpc,FETIDPPCApply);CHKERRQ(ierr);
10763425bc38SStefano Zampini   ierr = PCShellSetDestroy(newpc,PCBDDCDestroyFETIDPPC);CHKERRQ(ierr);
10773425bc38SStefano Zampini   ierr = PCSetOperators(newpc,newmat,newmat,SAME_PRECONDITIONER);CHKERRQ(ierr);
10783425bc38SStefano Zampini   ierr = PCSetUp(newpc);CHKERRQ(ierr);
10793425bc38SStefano Zampini   /* return pointers for objects created */
10803425bc38SStefano Zampini   *fetidp_mat=newmat;
10813425bc38SStefano Zampini   *fetidp_pc=newpc;
10823425bc38SStefano Zampini 
10833425bc38SStefano Zampini   PetscFunctionReturn(0);
10843425bc38SStefano Zampini }
10853425bc38SStefano Zampini EXTERN_C_END
10863425bc38SStefano Zampini #undef __FUNCT__
10873425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPOperators"
10883425bc38SStefano Zampini /*@
10893425bc38SStefano Zampini  PCBDDCCreateFETIDPOperators - Create operators for FETIDP.
10903425bc38SStefano Zampini 
10913425bc38SStefano Zampini    Collective
10923425bc38SStefano Zampini 
10933425bc38SStefano Zampini    Input Parameters:
10943425bc38SStefano Zampini +  pc - the BDDC preconditioning context (setup must be already called)
10953425bc38SStefano Zampini 
10963425bc38SStefano Zampini    Level: developer
10973425bc38SStefano Zampini 
10983425bc38SStefano Zampini    Notes:
10993425bc38SStefano Zampini 
11003425bc38SStefano Zampini .seealso: PCBDDC
11013425bc38SStefano Zampini @*/
11023425bc38SStefano Zampini PetscErrorCode PCBDDCCreateFETIDPOperators(PC pc, Mat *fetidp_mat, PC *fetidp_pc)
11033425bc38SStefano Zampini {
11043425bc38SStefano Zampini   PetscErrorCode ierr;
11053425bc38SStefano Zampini 
11063425bc38SStefano Zampini   PetscFunctionBegin;
11073425bc38SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
11083425bc38SStefano Zampini   if (pc->setupcalled) {
11093425bc38SStefano Zampini     ierr = PetscTryMethod(pc,"PCBDDCCreateFETIDPOperators_C",(PC,Mat*,PC*),(pc,fetidp_mat,fetidp_pc));CHKERRQ(ierr);
11103425bc38SStefano Zampini   } else {
11113425bc38SStefano Zampini     SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"You must call PCSetup_BDDC before calling %s\n",__FUNCT__);
11123425bc38SStefano Zampini   }
11133425bc38SStefano Zampini   PetscFunctionReturn(0);
11143425bc38SStefano Zampini }
11150c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
1116da1bb401SStefano Zampini /*MC
1117da1bb401SStefano Zampini    PCBDDC - Balancing Domain Decomposition by Constraints.
11180c7d97c5SJed Brown 
1119da1bb401SStefano Zampini    Options Database Keys:
1120da1bb401SStefano Zampini .    -pcbddc ??? -
1121da1bb401SStefano Zampini 
1122da1bb401SStefano Zampini    Level: intermediate
1123da1bb401SStefano Zampini 
1124da1bb401SStefano Zampini    Notes: The matrix used with this preconditioner must be of type MATIS
1125da1bb401SStefano Zampini 
1126da1bb401SStefano Zampini           Unlike more 'conventional' interface preconditioners, this iterates over ALL the
1127da1bb401SStefano Zampini           degrees of freedom, NOT just those on the interface (this allows the use of approximate solvers
1128da1bb401SStefano Zampini           on the subdomains).
1129da1bb401SStefano Zampini 
1130da1bb401SStefano Zampini           Options for the coarse grid preconditioner can be set with -
1131da1bb401SStefano Zampini           Options for the Dirichlet subproblem can be set with -
1132da1bb401SStefano Zampini           Options for the Neumann subproblem can be set with -
1133da1bb401SStefano Zampini 
1134da1bb401SStefano Zampini    Contributed by Stefano Zampini
1135da1bb401SStefano Zampini 
1136da1bb401SStefano Zampini .seealso:  PCCreate(), PCSetType(), PCType (for list of available types), PC,  MATIS
1137da1bb401SStefano Zampini M*/
1138da1bb401SStefano Zampini EXTERN_C_BEGIN
1139da1bb401SStefano Zampini #undef __FUNCT__
1140da1bb401SStefano Zampini #define __FUNCT__ "PCCreate_BDDC"
1141da1bb401SStefano Zampini PetscErrorCode PCCreate_BDDC(PC pc)
1142da1bb401SStefano Zampini {
1143da1bb401SStefano Zampini   PetscErrorCode ierr;
1144da1bb401SStefano Zampini   PC_BDDC        *pcbddc;
1145da1bb401SStefano Zampini   PCBDDCGraph    mat_graph;
1146da1bb401SStefano Zampini 
1147da1bb401SStefano Zampini   PetscFunctionBegin;
1148da1bb401SStefano Zampini   /* Creates the private data structure for this preconditioner and attach it to the PC object. */
1149da1bb401SStefano Zampini   ierr      = PetscNewLog(pc,PC_BDDC,&pcbddc);CHKERRQ(ierr);
1150da1bb401SStefano Zampini   pc->data  = (void*)pcbddc;
1151da1bb401SStefano Zampini 
1152da1bb401SStefano Zampini   /* create PCIS data structure */
1153da1bb401SStefano Zampini   ierr = PCISCreate(pc);CHKERRQ(ierr);
1154da1bb401SStefano Zampini 
1155da1bb401SStefano Zampini   /* BDDC specific */
11560bdf917eSStefano Zampini   pcbddc->CoarseNullSpace            = 0;
11570bdf917eSStefano Zampini   pcbddc->NullSpace                  = 0;
11583972b0daSStefano Zampini   pcbddc->temp_solution              = 0;
1159534831adSStefano Zampini   pcbddc->original_rhs               = 0;
1160534831adSStefano Zampini   pcbddc->local_mat                  = 0;
1161534831adSStefano Zampini   pcbddc->ChangeOfBasisMatrix        = 0;
1162534831adSStefano Zampini   pcbddc->usechangeofbasis           = PETSC_TRUE;
1163534831adSStefano Zampini   pcbddc->usechangeonfaces           = PETSC_FALSE;
1164da1bb401SStefano Zampini   pcbddc->coarse_vec                 = 0;
1165da1bb401SStefano Zampini   pcbddc->coarse_rhs                 = 0;
1166da1bb401SStefano Zampini   pcbddc->coarse_ksp                 = 0;
1167da1bb401SStefano Zampini   pcbddc->coarse_phi_B               = 0;
1168da1bb401SStefano Zampini   pcbddc->coarse_phi_D               = 0;
1169da1bb401SStefano Zampini   pcbddc->vec1_P                     = 0;
1170da1bb401SStefano Zampini   pcbddc->vec1_R                     = 0;
1171da1bb401SStefano Zampini   pcbddc->vec2_R                     = 0;
1172da1bb401SStefano Zampini   pcbddc->local_auxmat1              = 0;
1173da1bb401SStefano Zampini   pcbddc->local_auxmat2              = 0;
1174da1bb401SStefano Zampini   pcbddc->R_to_B                     = 0;
1175da1bb401SStefano Zampini   pcbddc->R_to_D                     = 0;
1176da1bb401SStefano Zampini   pcbddc->ksp_D                      = 0;
1177da1bb401SStefano Zampini   pcbddc->ksp_R                      = 0;
1178da1bb401SStefano Zampini   pcbddc->local_primal_indices       = 0;
117929622bf0SStefano Zampini   pcbddc->inexact_prec_type          = PETSC_FALSE;
1180da1bb401SStefano Zampini   pcbddc->NeumannBoundaries          = 0;
1181da1bb401SStefano Zampini   pcbddc->ISForDofs                  = 0;
1182da1bb401SStefano Zampini   pcbddc->ISForVertices              = 0;
1183da1bb401SStefano Zampini   pcbddc->n_ISForFaces               = 0;
1184da1bb401SStefano Zampini   pcbddc->n_ISForEdges               = 0;
1185da1bb401SStefano Zampini   pcbddc->ConstraintMatrix           = 0;
1186da1bb401SStefano Zampini   pcbddc->use_nnsp_true              = PETSC_FALSE;
1187da1bb401SStefano Zampini   pcbddc->local_primal_sizes         = 0;
1188da1bb401SStefano Zampini   pcbddc->local_primal_displacements = 0;
1189da1bb401SStefano Zampini   pcbddc->replicated_local_primal_indices = 0;
1190da1bb401SStefano Zampini   pcbddc->replicated_local_primal_values  = 0;
1191da1bb401SStefano Zampini   pcbddc->coarse_loc_to_glob         = 0;
1192da1bb401SStefano Zampini   pcbddc->dbg_flag                   = PETSC_FALSE;
1193da1bb401SStefano Zampini   pcbddc->coarsening_ratio           = 8;
1194b76ba322SStefano Zampini   pcbddc->use_exact_dirichlet        = PETSC_TRUE;
11954fad6a16SStefano Zampini   pcbddc->current_level              = 0;
11964fad6a16SStefano Zampini   pcbddc->max_levels                 = 1;
1197da1bb401SStefano Zampini 
1198da1bb401SStefano Zampini   /* allocate and initialize needed graph structure */
1199da1bb401SStefano Zampini   ierr = PetscMalloc(sizeof(*mat_graph),&pcbddc->mat_graph);CHKERRQ(ierr);
1200da1bb401SStefano Zampini   pcbddc->mat_graph->xadj            = 0;
1201da1bb401SStefano Zampini   pcbddc->mat_graph->adjncy          = 0;
1202da1bb401SStefano Zampini 
1203da1bb401SStefano Zampini   /* function pointers */
1204da1bb401SStefano Zampini   pc->ops->apply               = PCApply_BDDC;
1205da1bb401SStefano Zampini   pc->ops->applytranspose      = 0;
1206da1bb401SStefano Zampini   pc->ops->setup               = PCSetUp_BDDC;
1207da1bb401SStefano Zampini   pc->ops->destroy             = PCDestroy_BDDC;
1208da1bb401SStefano Zampini   pc->ops->setfromoptions      = PCSetFromOptions_BDDC;
1209da1bb401SStefano Zampini   pc->ops->view                = 0;
1210da1bb401SStefano Zampini   pc->ops->applyrichardson     = 0;
1211da1bb401SStefano Zampini   pc->ops->applysymmetricleft  = 0;
1212da1bb401SStefano Zampini   pc->ops->applysymmetricright = 0;
1213534831adSStefano Zampini   pc->ops->presolve            = PCPreSolve_BDDC;
1214534831adSStefano Zampini   pc->ops->postsolve           = PCPostSolve_BDDC;
1215da1bb401SStefano Zampini 
1216da1bb401SStefano Zampini   /* composing function */
12174fad6a16SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseningRatio_C","PCBDDCSetCoarseningRatio_BDDC",
12184fad6a16SStefano Zampini                     PCBDDCSetCoarseningRatio_BDDC);CHKERRQ(ierr);
12194fad6a16SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetMaxLevels_C","PCBDDCSetMaxLevels_BDDC",
12204fad6a16SStefano Zampini                     PCBDDCSetMaxLevels_BDDC);CHKERRQ(ierr);
12210bdf917eSStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNullSpace_C","PCBDDCSetNullSpace_BDDC",
12220bdf917eSStefano Zampini                     PCBDDCSetNullSpace_BDDC);CHKERRQ(ierr);
1223da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDirichletBoundaries_C","PCBDDCSetDirichletBoundaries_BDDC",
1224da1bb401SStefano Zampini                     PCBDDCSetDirichletBoundaries_BDDC);CHKERRQ(ierr);
1225da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNeumannBoundaries_C","PCBDDCSetNeumannBoundaries_BDDC",
1226da1bb401SStefano Zampini                     PCBDDCSetNeumannBoundaries_BDDC);CHKERRQ(ierr);
1227da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetDirichletBoundaries_C","PCBDDCGetDirichletBoundaries_BDDC",
1228da1bb401SStefano Zampini                     PCBDDCGetDirichletBoundaries_BDDC);CHKERRQ(ierr);
1229da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetNeumannBoundaries_C","PCBDDCGetNeumannBoundaries_BDDC",
1230da1bb401SStefano Zampini                     PCBDDCGetNeumannBoundaries_BDDC);CHKERRQ(ierr);
1231da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseProblemType_C","PCBDDCSetCoarseProblemType_BDDC",
1232da1bb401SStefano Zampini                     PCBDDCSetCoarseProblemType_BDDC);CHKERRQ(ierr);
1233da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDofsSplitting_C","PCBDDCSetDofsSplitting_BDDC",
1234da1bb401SStefano Zampini                     PCBDDCSetDofsSplitting_BDDC);CHKERRQ(ierr);
1235da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetLocalAdjacencyGraph_C","PCBDDCSetLocalAdjacencyGraph_BDDC",
1236da1bb401SStefano Zampini                     PCBDDCSetLocalAdjacencyGraph_BDDC);CHKERRQ(ierr);
1237534831adSStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPreSolve_C","PCPreSolve_BDDC",
1238534831adSStefano Zampini                     PCPreSolve_BDDC);CHKERRQ(ierr);
1239534831adSStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPostSolve_C","PCPostSolve_BDDC",
1240534831adSStefano Zampini                     PCPostSolve_BDDC);CHKERRQ(ierr);
12413425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCCreateFETIDPOperators_C","PCBDDCCreateFETIDPOperators_BDDC",
12423425bc38SStefano Zampini                     PCBDDCCreateFETIDPOperators_BDDC);CHKERRQ(ierr);
12433425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetRHS_C","PCBDDCMatFETIDPGetRHS_BDDC",
12443425bc38SStefano Zampini                     PCBDDCMatFETIDPGetRHS_BDDC);CHKERRQ(ierr);
12453425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetSolution_C","PCBDDCMatFETIDPGetSolution_BDDC",
12463425bc38SStefano Zampini                     PCBDDCMatFETIDPGetSolution_BDDC);CHKERRQ(ierr);
1247da1bb401SStefano Zampini   PetscFunctionReturn(0);
1248da1bb401SStefano Zampini }
1249da1bb401SStefano Zampini EXTERN_C_END
12503425bc38SStefano Zampini 
1251da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
1252da1bb401SStefano Zampini /* All static functions from now on                                           */
1253da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
12544fad6a16SStefano Zampini #undef __FUNCT__
125529622bf0SStefano Zampini #define __FUNCT__ "PCBDDCApplyNullSpaceCorrectionPC"
125629622bf0SStefano Zampini static PetscErrorCode PCBDDCApplyNullSpaceCorrectionPC(PC pc,Vec x,Vec y)
125729622bf0SStefano Zampini {
125829622bf0SStefano Zampini   NullSpaceCorrection_ctx *pc_ctx;
125929622bf0SStefano Zampini   PetscErrorCode ierr;
126029622bf0SStefano Zampini 
126129622bf0SStefano Zampini   PetscFunctionBegin;
126229622bf0SStefano Zampini   ierr = PCShellGetContext(pc,(void**)&pc_ctx);CHKERRQ(ierr);
126329622bf0SStefano Zampini   /* E */
126429622bf0SStefano Zampini   ierr = MatMultTranspose(pc_ctx->Lbasis_mat,x,pc_ctx->work_small_2);CHKERRQ(ierr);
126529622bf0SStefano Zampini   ierr = MatMultAdd(pc_ctx->Kbasis_mat,pc_ctx->work_small_2,x,pc_ctx->work_full_1);CHKERRQ(ierr);
126629622bf0SStefano Zampini   /* P^-1 */
126729622bf0SStefano Zampini   ierr = PCApply(pc_ctx->local_pc,pc_ctx->work_full_1,pc_ctx->work_full_2);CHKERRQ(ierr);
126829622bf0SStefano Zampini   /* E^T */
126929622bf0SStefano Zampini   ierr = MatMultTranspose(pc_ctx->Kbasis_mat,pc_ctx->work_full_2,pc_ctx->work_small_1);CHKERRQ(ierr);
127029622bf0SStefano Zampini   ierr = VecScale(pc_ctx->work_small_1,-1.0);CHKERRQ(ierr);
127129622bf0SStefano Zampini   ierr = MatMultAdd(pc_ctx->Lbasis_mat,pc_ctx->work_small_1,pc_ctx->work_full_2,pc_ctx->work_full_1);CHKERRQ(ierr);
127229622bf0SStefano Zampini   /* Sum contributions */
127329622bf0SStefano Zampini   ierr = MatMultAdd(pc_ctx->basis_mat,pc_ctx->work_small_2,pc_ctx->work_full_1,y);CHKERRQ(ierr);
127429622bf0SStefano Zampini   PetscFunctionReturn(0);
127529622bf0SStefano Zampini }
127629622bf0SStefano Zampini 
127729622bf0SStefano Zampini #undef __FUNCT__
127829622bf0SStefano Zampini #define __FUNCT__ "PCBDDCDestroyNullSpaceCorrectionPC"
127929622bf0SStefano Zampini static PetscErrorCode PCBDDCDestroyNullSpaceCorrectionPC(PC pc)
128029622bf0SStefano Zampini {
128129622bf0SStefano Zampini 
128229622bf0SStefano Zampini   NullSpaceCorrection_ctx *pc_ctx;
128329622bf0SStefano Zampini   PetscErrorCode          ierr;
128429622bf0SStefano Zampini 
128529622bf0SStefano Zampini   PetscFunctionBegin;
128629622bf0SStefano Zampini   ierr = PCShellGetContext(pc,(void**)&pc_ctx);CHKERRQ(ierr);
128729622bf0SStefano Zampini   ierr = VecDestroy(&pc_ctx->work_small_1);CHKERRQ(ierr);
128829622bf0SStefano Zampini   ierr = VecDestroy(&pc_ctx->work_small_2);CHKERRQ(ierr);
128929622bf0SStefano Zampini   ierr = VecDestroy(&pc_ctx->work_full_1);CHKERRQ(ierr);
129029622bf0SStefano Zampini   ierr = VecDestroy(&pc_ctx->work_full_2);CHKERRQ(ierr);
129129622bf0SStefano Zampini   ierr = MatDestroy(&pc_ctx->basis_mat);CHKERRQ(ierr);
129229622bf0SStefano Zampini   ierr = MatDestroy(&pc_ctx->Lbasis_mat);CHKERRQ(ierr);
129329622bf0SStefano Zampini   ierr = MatDestroy(&pc_ctx->Kbasis_mat);CHKERRQ(ierr);
129429622bf0SStefano Zampini   ierr = PCDestroy(&pc_ctx->local_pc);CHKERRQ(ierr);
129529622bf0SStefano Zampini   ierr = PetscFree(pc_ctx);CHKERRQ(ierr);
129629622bf0SStefano Zampini   PetscFunctionReturn(0);
129729622bf0SStefano Zampini }
129829622bf0SStefano Zampini 
129929622bf0SStefano Zampini #undef __FUNCT__
130029622bf0SStefano Zampini #define __FUNCT__ "PCBDDCAdaptLocalProblem"
130129622bf0SStefano Zampini static PetscErrorCode PCBDDCAdaptLocalProblem(PC pc,IS local_dofs)
130229622bf0SStefano Zampini {
130329622bf0SStefano Zampini   PETSC_EXTERN PetscErrorCode PCBDDCApplyNullSpaceCorrectionPC(PC,Vec,Vec);
130429622bf0SStefano Zampini   PETSC_EXTERN PetscErrorCode PCBDDCDestroyNullSpaceCorrectionPC(PC);
130529622bf0SStefano Zampini 
130629622bf0SStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
130729622bf0SStefano Zampini   PC_IS          *pcis = (PC_IS*)pc->data;
130829622bf0SStefano Zampini   Mat_IS*        matis = (Mat_IS*)pc->pmat->data;
130929622bf0SStefano Zampini   KSP            *local_ksp;
131029622bf0SStefano Zampini   PC             newpc;
131129622bf0SStefano Zampini   NullSpaceCorrection_ctx  *shell_ctx;
131229622bf0SStefano Zampini   Mat            local_mat,local_pmat,small_mat,inv_small_mat;
131329622bf0SStefano Zampini   MatStructure   local_mat_struct;
131429622bf0SStefano Zampini   Vec            work1,work2,work3;
131529622bf0SStefano Zampini   const Vec      *nullvecs;
131629622bf0SStefano Zampini   VecScatter     scatter_ctx;
131729622bf0SStefano Zampini   IS             is_aux;
131829622bf0SStefano Zampini   MatFactorInfo  matinfo;
131929622bf0SStefano Zampini   PetscScalar    *basis_mat,*Kbasis_mat,*array,*array_mat;
132029622bf0SStefano Zampini   PetscScalar    one = 1.0,zero = 0.0, m_one = -1.0;
132129622bf0SStefano Zampini   PetscInt       basis_dofs,basis_size,nnsp_size,i,k,n_I,n_R;
132229622bf0SStefano Zampini   PetscBool      nnsp_has_cnst;
132329622bf0SStefano Zampini   PetscErrorCode ierr;
132429622bf0SStefano Zampini 
132529622bf0SStefano Zampini   PetscFunctionBegin;
132629622bf0SStefano Zampini   /* Infer the local solver */
132729622bf0SStefano Zampini   ierr = ISGetSize(local_dofs,&basis_dofs);CHKERRQ(ierr);
132829622bf0SStefano Zampini   ierr = VecGetSize(pcis->vec1_D,&n_I);CHKERRQ(ierr);
132929622bf0SStefano Zampini   ierr = VecGetSize(pcbddc->vec1_R,&n_R);CHKERRQ(ierr);
133029622bf0SStefano Zampini   if (basis_dofs == n_I) {
133129622bf0SStefano Zampini     /* Dirichlet solver */
133229622bf0SStefano Zampini     local_ksp = &pcbddc->ksp_D;
133329622bf0SStefano Zampini   } else if (basis_dofs == n_R) {
133429622bf0SStefano Zampini     /* Neumann solver */
133529622bf0SStefano Zampini     local_ksp = &pcbddc->ksp_R;
133629622bf0SStefano Zampini   } else {
133729622bf0SStefano Zampini     SETERRQ4(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in %s: unknown local IS size %d. n_I=%d, n_R=%d)\n",__FUNCT__,basis_dofs,n_I,n_R);
133829622bf0SStefano Zampini   }
133929622bf0SStefano Zampini   ierr = KSPGetOperators(*local_ksp,&local_mat,&local_pmat,&local_mat_struct);CHKERRQ(ierr);
134029622bf0SStefano Zampini 
134129622bf0SStefano Zampini   /* Get null space vecs */
134229622bf0SStefano Zampini   ierr = MatNullSpaceGetVecs(pcbddc->NullSpace,&nnsp_has_cnst,&nnsp_size,&nullvecs);CHKERRQ(ierr);
134329622bf0SStefano Zampini   basis_size = nnsp_size;
134429622bf0SStefano Zampini   if (nnsp_has_cnst) {
134529622bf0SStefano Zampini     basis_size++;
134629622bf0SStefano Zampini   }
134729622bf0SStefano Zampini 
134829622bf0SStefano Zampini   /* Create shell ctx */
134929622bf0SStefano Zampini   ierr = PetscMalloc(sizeof(*shell_ctx),&shell_ctx);CHKERRQ(ierr);
135029622bf0SStefano Zampini 
135129622bf0SStefano Zampini   /* Create work vectors in shell context */
135229622bf0SStefano Zampini   ierr = VecCreate(PETSC_COMM_SELF,&shell_ctx->work_small_1);CHKERRQ(ierr);
135329622bf0SStefano Zampini   ierr = VecSetSizes(shell_ctx->work_small_1,basis_size,basis_size);CHKERRQ(ierr);
135429622bf0SStefano Zampini   ierr = VecSetType(shell_ctx->work_small_1,VECSEQ);CHKERRQ(ierr);
135529622bf0SStefano Zampini   ierr = VecDuplicate(shell_ctx->work_small_1,&shell_ctx->work_small_2);CHKERRQ(ierr);
135629622bf0SStefano Zampini   ierr = VecCreate(PETSC_COMM_SELF,&shell_ctx->work_full_1);CHKERRQ(ierr);
135729622bf0SStefano Zampini   ierr = VecSetSizes(shell_ctx->work_full_1,basis_dofs,basis_dofs);CHKERRQ(ierr);
135829622bf0SStefano Zampini   ierr = VecSetType(shell_ctx->work_full_1,VECSEQ);CHKERRQ(ierr);
135929622bf0SStefano Zampini   ierr = VecDuplicate(shell_ctx->work_full_1,&shell_ctx->work_full_2);CHKERRQ(ierr);
136029622bf0SStefano Zampini 
136129622bf0SStefano Zampini   /* Allocate workspace */
136229622bf0SStefano Zampini   ierr = MatCreateSeqDense(PETSC_COMM_SELF,basis_dofs,basis_size,PETSC_NULL,&shell_ctx->basis_mat );CHKERRQ(ierr);
136329622bf0SStefano Zampini   ierr = MatCreateSeqDense(PETSC_COMM_SELF,basis_dofs,basis_size,PETSC_NULL,&shell_ctx->Kbasis_mat);CHKERRQ(ierr);
136429622bf0SStefano Zampini   ierr = MatDenseGetArray(shell_ctx->basis_mat,&basis_mat);CHKERRQ(ierr);
136529622bf0SStefano Zampini   ierr = MatDenseGetArray(shell_ctx->Kbasis_mat,&Kbasis_mat);CHKERRQ(ierr);
136629622bf0SStefano Zampini 
136729622bf0SStefano Zampini   /* Restrict local null space on selected dofs (Dirichlet or Neumann)
136829622bf0SStefano Zampini      and compute matrices N and K*N */
136929622bf0SStefano Zampini   ierr = VecDuplicate(shell_ctx->work_full_1,&work1);CHKERRQ(ierr);
137029622bf0SStefano Zampini   ierr = VecDuplicate(shell_ctx->work_full_1,&work2);CHKERRQ(ierr);
137129622bf0SStefano Zampini   ierr = VecScatterCreate(pcis->vec1_N,local_dofs,work1,(IS)0,&scatter_ctx);CHKERRQ(ierr);
137229622bf0SStefano Zampini   k=0;
137329622bf0SStefano Zampini   for (;k<nnsp_size;k++) {
137429622bf0SStefano Zampini     ierr = VecScatterBegin(matis->ctx,nullvecs[k],pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
137529622bf0SStefano Zampini     ierr = VecScatterEnd(matis->ctx,nullvecs[k],pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
137629622bf0SStefano Zampini     ierr = VecPlaceArray(work1,(const PetscScalar*)&basis_mat[k*basis_dofs]);CHKERRQ(ierr);
137729622bf0SStefano Zampini     ierr = VecScatterBegin(scatter_ctx,pcis->vec1_N,work1,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
137829622bf0SStefano Zampini     ierr = VecScatterEnd(scatter_ctx,pcis->vec1_N,work1,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
137929622bf0SStefano Zampini     ierr = VecPlaceArray(work2,(const PetscScalar*)&Kbasis_mat[k*basis_dofs]);CHKERRQ(ierr);
138029622bf0SStefano Zampini     ierr = MatMult(local_mat,work1,work2);CHKERRQ(ierr);
138129622bf0SStefano Zampini     ierr = VecResetArray(work1);CHKERRQ(ierr);
138229622bf0SStefano Zampini     ierr = VecResetArray(work2);CHKERRQ(ierr);
138329622bf0SStefano Zampini   }
138429622bf0SStefano Zampini   if (nnsp_has_cnst) {
138529622bf0SStefano Zampini     ierr = VecPlaceArray(work1,(const PetscScalar*)&basis_mat[k*basis_dofs]);CHKERRQ(ierr);
138629622bf0SStefano Zampini     ierr = VecSet(work1,one);CHKERRQ(ierr);
138729622bf0SStefano Zampini     ierr = VecPlaceArray(work2,(const PetscScalar*)&Kbasis_mat[k*basis_dofs]);CHKERRQ(ierr);
138829622bf0SStefano Zampini     ierr = MatMult(local_mat,work1,work2);CHKERRQ(ierr);
138929622bf0SStefano Zampini     ierr = VecResetArray(work1);CHKERRQ(ierr);
139029622bf0SStefano Zampini     ierr = VecResetArray(work2);CHKERRQ(ierr);
139129622bf0SStefano Zampini   }
139229622bf0SStefano Zampini   ierr = VecDestroy(&work1);CHKERRQ(ierr);
139329622bf0SStefano Zampini   ierr = VecDestroy(&work2);CHKERRQ(ierr);
139429622bf0SStefano Zampini   ierr = VecScatterDestroy(&scatter_ctx);CHKERRQ(ierr);
139529622bf0SStefano Zampini   ierr = MatDenseRestoreArray(shell_ctx->basis_mat,&basis_mat);CHKERRQ(ierr);
139629622bf0SStefano Zampini   ierr = MatDenseRestoreArray(shell_ctx->Kbasis_mat,&Kbasis_mat);CHKERRQ(ierr);
139729622bf0SStefano Zampini 
139829622bf0SStefano Zampini   /* Assemble another Mat object in shell context */
139929622bf0SStefano Zampini   ierr = MatTransposeMatMult(shell_ctx->basis_mat,shell_ctx->Kbasis_mat,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&small_mat);CHKERRQ(ierr);
140029622bf0SStefano Zampini   ierr = MatFactorInfoInitialize(&matinfo);CHKERRQ(ierr);
140129622bf0SStefano Zampini   ierr = ISCreateStride(PETSC_COMM_SELF,basis_size,0,1,&is_aux);CHKERRQ(ierr);
140229622bf0SStefano Zampini   ierr = MatLUFactor(small_mat,is_aux,is_aux,&matinfo);CHKERRQ(ierr);
140329622bf0SStefano Zampini   ierr = ISDestroy(&is_aux);CHKERRQ(ierr);
140429622bf0SStefano Zampini   ierr = PetscMalloc(basis_size*basis_size*sizeof(PetscScalar),&array_mat);CHKERRQ(ierr);
140529622bf0SStefano Zampini   for (k=0;k<basis_size;k++) {
140629622bf0SStefano Zampini     ierr = VecSet(shell_ctx->work_small_1,zero);CHKERRQ(ierr);
140729622bf0SStefano Zampini     ierr = VecSetValue(shell_ctx->work_small_1,k,one,INSERT_VALUES);CHKERRQ(ierr);
140829622bf0SStefano Zampini     ierr = VecAssemblyBegin(shell_ctx->work_small_1);CHKERRQ(ierr);
140929622bf0SStefano Zampini     ierr = VecAssemblyEnd(shell_ctx->work_small_1);CHKERRQ(ierr);
141029622bf0SStefano Zampini     ierr = MatSolve(small_mat,shell_ctx->work_small_1,shell_ctx->work_small_2);CHKERRQ(ierr);
141129622bf0SStefano Zampini     ierr = VecGetArray(shell_ctx->work_small_2,&array);CHKERRQ(ierr);
141229622bf0SStefano Zampini     for (i=0;i<basis_size;i++) {
141329622bf0SStefano Zampini       array_mat[i*basis_size+k]=array[i];
141429622bf0SStefano Zampini     }
141529622bf0SStefano Zampini     ierr = VecRestoreArray(shell_ctx->work_small_2,&array);CHKERRQ(ierr);
141629622bf0SStefano Zampini   }
141729622bf0SStefano Zampini   ierr = MatCreateSeqDense(PETSC_COMM_SELF,basis_size,basis_size,array_mat,&inv_small_mat);CHKERRQ(ierr);
141829622bf0SStefano Zampini   ierr = MatMatMult(shell_ctx->basis_mat,inv_small_mat,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&shell_ctx->Lbasis_mat);CHKERRQ(ierr);
141929622bf0SStefano Zampini   ierr = PetscFree(array_mat);CHKERRQ(ierr);
142029622bf0SStefano Zampini   ierr = MatDestroy(&inv_small_mat);CHKERRQ(ierr);
142129622bf0SStefano Zampini   ierr = MatDestroy(&small_mat);CHKERRQ(ierr);
142229622bf0SStefano Zampini   ierr = MatScale(shell_ctx->Kbasis_mat,m_one);CHKERRQ(ierr);
142329622bf0SStefano Zampini 
142429622bf0SStefano Zampini   /* Rebuild local PC */
142529622bf0SStefano Zampini   ierr = KSPGetPC(*local_ksp,&shell_ctx->local_pc);CHKERRQ(ierr);
142629622bf0SStefano Zampini   ierr = PetscObjectReference((PetscObject)shell_ctx->local_pc);CHKERRQ(ierr);
142729622bf0SStefano Zampini   ierr = PCCreate(PETSC_COMM_SELF,&newpc);CHKERRQ(ierr);
142829622bf0SStefano Zampini   ierr = PCSetOperators(newpc,local_mat,local_mat,SAME_PRECONDITIONER);CHKERRQ(ierr);
142929622bf0SStefano Zampini   ierr = PCSetType(newpc,PCSHELL);CHKERRQ(ierr);
143029622bf0SStefano Zampini   ierr = PCShellSetContext(newpc,shell_ctx);CHKERRQ(ierr);
143129622bf0SStefano Zampini   ierr = PCShellSetApply(newpc,PCBDDCApplyNullSpaceCorrectionPC);CHKERRQ(ierr);
143229622bf0SStefano Zampini   ierr = PCShellSetDestroy(newpc,PCBDDCDestroyNullSpaceCorrectionPC);CHKERRQ(ierr);
143329622bf0SStefano Zampini   ierr = PCSetUp(newpc);CHKERRQ(ierr);
143429622bf0SStefano Zampini   ierr = KSPSetPC(*local_ksp,newpc);CHKERRQ(ierr);
143529622bf0SStefano Zampini   ierr = PCDestroy(&newpc);CHKERRQ(ierr);
143629622bf0SStefano Zampini   ierr = KSPSetUp(*local_ksp);CHKERRQ(ierr);
143729622bf0SStefano Zampini 
143829622bf0SStefano Zampini   /* test */
143929622bf0SStefano Zampini   if (pcbddc->dbg_flag) {
144029622bf0SStefano Zampini     PetscReal   test_err;
144129622bf0SStefano Zampini     KSP         check_ksp;
144229622bf0SStefano Zampini     PC          check_pc;
144329622bf0SStefano Zampini     PetscReal   lambda_min,lambda_max;
144429622bf0SStefano Zampini     Mat         test_mat;
144529622bf0SStefano Zampini     PetscViewer viewer=pcbddc->dbg_viewer;
144629622bf0SStefano Zampini     PetscBool   setsym,issym=PETSC_FALSE;
144729622bf0SStefano Zampini 
144829622bf0SStefano Zampini     ierr = KSPGetPC(*local_ksp,&check_pc);CHKERRQ(ierr);
144929622bf0SStefano Zampini     ierr = VecDuplicate(shell_ctx->work_full_1,&work1);CHKERRQ(ierr);
145029622bf0SStefano Zampini     ierr = VecDuplicate(shell_ctx->work_full_1,&work2);CHKERRQ(ierr);
145129622bf0SStefano Zampini     ierr = VecDuplicate(shell_ctx->work_full_1,&work3);CHKERRQ(ierr);
145229622bf0SStefano Zampini     ierr = VecSetRandom(shell_ctx->work_small_1,PETSC_NULL);CHKERRQ(ierr);
145329622bf0SStefano Zampini     ierr = MatMult(shell_ctx->basis_mat,shell_ctx->work_small_1,work1);CHKERRQ(ierr);
145429622bf0SStefano Zampini     ierr = VecCopy(work1,work2);CHKERRQ(ierr);
145529622bf0SStefano Zampini     ierr = MatMult(local_mat,work1,work3);CHKERRQ(ierr);
145629622bf0SStefano Zampini     ierr = PCApply(check_pc,work3,work1);CHKERRQ(ierr);
145729622bf0SStefano Zampini     ierr = VecAXPY(work1,m_one,work2);CHKERRQ(ierr);
145829622bf0SStefano Zampini     ierr = VecNorm(work1,NORM_INFINITY,&test_err);CHKERRQ(ierr);
145929622bf0SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d error for nullspace correction for ",PetscGlobalRank);
146029622bf0SStefano Zampini     if (basis_dofs == n_I) {
146129622bf0SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Dirichlet ");
146229622bf0SStefano Zampini     } else {
146329622bf0SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Neumann ");
146429622bf0SStefano Zampini     }
146529622bf0SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"solver is :%1.14e\n",test_err);
146629622bf0SStefano Zampini 
146729622bf0SStefano Zampini     ierr = MatTransposeMatMult(shell_ctx->Lbasis_mat,shell_ctx->Kbasis_mat,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&test_mat);CHKERRQ(ierr);
146829622bf0SStefano Zampini     ierr = MatShift(test_mat,one);CHKERRQ(ierr);
146929622bf0SStefano Zampini     ierr = MatNorm(test_mat,NORM_INFINITY,&test_err);CHKERRQ(ierr);
147029622bf0SStefano Zampini     ierr = MatDestroy(&test_mat);CHKERRQ(ierr);
147129622bf0SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d error for nullspace matrices is :%1.14e\n",PetscGlobalRank,test_err);
147229622bf0SStefano Zampini 
147329622bf0SStefano Zampini     /* Create ksp object suitable for extreme eigenvalues' estimation */
147429622bf0SStefano Zampini     ierr = KSPCreate(PETSC_COMM_SELF,&check_ksp);CHKERRQ(ierr);
147529622bf0SStefano Zampini     ierr = KSPSetOperators(check_ksp,local_mat,local_mat,SAME_PRECONDITIONER);CHKERRQ(ierr);
147629622bf0SStefano Zampini     ierr = KSPSetTolerances(check_ksp,1.e-8,1.e-8,PETSC_DEFAULT,basis_dofs);CHKERRQ(ierr);
147729622bf0SStefano Zampini     ierr = KSPSetComputeSingularValues(check_ksp,PETSC_TRUE);CHKERRQ(ierr);
147829622bf0SStefano Zampini     ierr = MatIsSymmetricKnown(pc->pmat,&setsym,&issym);CHKERRQ(ierr);
147929622bf0SStefano Zampini     if (issym) {
148029622bf0SStefano Zampini       ierr = KSPSetType(check_ksp,KSPCG);CHKERRQ(ierr);
148129622bf0SStefano Zampini     }
148229622bf0SStefano Zampini     ierr = KSPSetPC(check_ksp,check_pc);CHKERRQ(ierr);
148329622bf0SStefano Zampini     ierr = KSPSetUp(check_ksp);CHKERRQ(ierr);
148429622bf0SStefano Zampini     ierr = VecSetRandom(work1,PETSC_NULL);CHKERRQ(ierr);
148529622bf0SStefano Zampini     ierr = MatMult(local_mat,work1,work2);CHKERRQ(ierr);
148629622bf0SStefano Zampini     ierr = KSPSolve(check_ksp,work2,work2);CHKERRQ(ierr);
148729622bf0SStefano Zampini     ierr = VecAXPY(work2,m_one,work1);CHKERRQ(ierr);
148829622bf0SStefano Zampini     ierr = VecNorm(work2,NORM_INFINITY,&test_err);CHKERRQ(ierr);
148929622bf0SStefano Zampini     ierr = KSPComputeExtremeSingularValues(check_ksp,&lambda_max,&lambda_min);CHKERRQ(ierr);
149029622bf0SStefano Zampini     ierr = KSPGetIterationNumber(check_ksp,&k);CHKERRQ(ierr);
149129622bf0SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d error for adapted KSP %1.14e (it %d, eigs %1.6e %1.6e)\n",PetscGlobalRank,test_err,k,lambda_min,lambda_max);
149229622bf0SStefano Zampini     ierr = KSPDestroy(&check_ksp);CHKERRQ(ierr);
149329622bf0SStefano Zampini     ierr = VecDestroy(&work1);CHKERRQ(ierr);
149429622bf0SStefano Zampini     ierr = VecDestroy(&work2);CHKERRQ(ierr);
149529622bf0SStefano Zampini     ierr = VecDestroy(&work3);CHKERRQ(ierr);
149629622bf0SStefano Zampini   }
149729622bf0SStefano Zampini   PetscFunctionReturn(0);
149829622bf0SStefano Zampini }
149929622bf0SStefano Zampini 
150029622bf0SStefano Zampini #undef __FUNCT__
15012e8d2280SStefano Zampini #define __FUNCT__ "PCBDDCSetUseExactDirichlet"
15022e8d2280SStefano Zampini static PetscErrorCode PCBDDCSetUseExactDirichlet(PC pc,PetscBool use)
15032e8d2280SStefano Zampini {
15042e8d2280SStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
15052e8d2280SStefano Zampini 
15062e8d2280SStefano Zampini   PetscFunctionBegin;
15072e8d2280SStefano Zampini   pcbddc->use_exact_dirichlet=use;
15082e8d2280SStefano Zampini   PetscFunctionReturn(0);
15092e8d2280SStefano Zampini }
15102e8d2280SStefano Zampini 
15112e8d2280SStefano Zampini #undef __FUNCT__
15124fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetLevel"
15134fad6a16SStefano Zampini static PetscErrorCode PCBDDCSetLevel(PC pc,PetscInt level)
15144fad6a16SStefano Zampini {
15154fad6a16SStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
15164fad6a16SStefano Zampini 
15174fad6a16SStefano Zampini   PetscFunctionBegin;
15184fad6a16SStefano Zampini   pcbddc->current_level=level;
15194fad6a16SStefano Zampini   PetscFunctionReturn(0);
15204fad6a16SStefano Zampini }
15213425bc38SStefano Zampini 
15223425bc38SStefano Zampini #undef __FUNCT__
15230bdf917eSStefano Zampini #define __FUNCT__ "PCBDDCAdaptNullSpace"
15240bdf917eSStefano Zampini static PetscErrorCode PCBDDCAdaptNullSpace(PC pc)
15250bdf917eSStefano Zampini {
15260bdf917eSStefano Zampini   PC_IS*         pcis = (PC_IS*)  (pc->data);
15270bdf917eSStefano Zampini   PC_BDDC*       pcbddc = (PC_BDDC*)(pc->data);
15280bdf917eSStefano Zampini   KSP            inv_change;
15290bdf917eSStefano Zampini   PC             pc_change;
15300bdf917eSStefano Zampini   const Vec      *nsp_vecs;
15310bdf917eSStefano Zampini   Vec            *new_nsp_vecs;
15320bdf917eSStefano Zampini   PetscInt       i,nsp_size,new_nsp_size,start_new;
15330bdf917eSStefano Zampini   PetscBool      nsp_has_cnst;
15340bdf917eSStefano Zampini   MatNullSpace   new_nsp;
15350bdf917eSStefano Zampini   PetscErrorCode ierr;
15360bdf917eSStefano Zampini 
15370bdf917eSStefano Zampini   PetscFunctionBegin;
15380bdf917eSStefano Zampini   ierr = MatNullSpaceGetVecs(pcbddc->NullSpace,&nsp_has_cnst,&nsp_size,&nsp_vecs);CHKERRQ(ierr);
15390bdf917eSStefano Zampini   ierr = KSPCreate(PETSC_COMM_SELF,&inv_change);CHKERRQ(ierr);
15400bdf917eSStefano Zampini   ierr = KSPSetOperators(inv_change,pcbddc->ChangeOfBasisMatrix,pcbddc->ChangeOfBasisMatrix,SAME_PRECONDITIONER);CHKERRQ(ierr);
15410bdf917eSStefano Zampini   ierr = KSPSetType(inv_change,KSPPREONLY);CHKERRQ(ierr);
15420bdf917eSStefano Zampini   ierr = KSPGetPC(inv_change,&pc_change);CHKERRQ(ierr);
15430bdf917eSStefano Zampini   ierr = PCSetType(pc_change,PCLU);CHKERRQ(ierr);
15440bdf917eSStefano Zampini   ierr = KSPSetUp(inv_change);CHKERRQ(ierr);
15450bdf917eSStefano Zampini   new_nsp_size = nsp_size;
15460bdf917eSStefano Zampini   if (nsp_has_cnst) { new_nsp_size++; }
15470bdf917eSStefano Zampini   ierr = PetscMalloc(new_nsp_size*sizeof(Vec),&new_nsp_vecs);CHKERRQ(ierr);
15480bdf917eSStefano Zampini   for (i=0;i<new_nsp_size;i++) { ierr = VecDuplicate(pcis->vec1_global,&new_nsp_vecs[i]);CHKERRQ(ierr); }
15490bdf917eSStefano Zampini   start_new = 0;
15500bdf917eSStefano Zampini   if (nsp_has_cnst) {
15510bdf917eSStefano Zampini     start_new = 1;
15520bdf917eSStefano Zampini     ierr = VecSet(new_nsp_vecs[0],1.0);CHKERRQ(ierr);
15530bdf917eSStefano Zampini     ierr = VecSet(pcis->vec1_B,1.0);CHKERRQ(ierr);
15540bdf917eSStefano Zampini     ierr = KSPSolve(inv_change,pcis->vec1_B,pcis->vec1_B);
15550bdf917eSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,new_nsp_vecs[0],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
15560bdf917eSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,new_nsp_vecs[0],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
15570bdf917eSStefano Zampini   }
15580bdf917eSStefano Zampini   for (i=0;i<nsp_size;i++) {
15590bdf917eSStefano Zampini     ierr = VecCopy(nsp_vecs[i],new_nsp_vecs[i+start_new]);CHKERRQ(ierr);
15600bdf917eSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,nsp_vecs[i],pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
15610bdf917eSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,nsp_vecs[i],pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
15620bdf917eSStefano Zampini     ierr = KSPSolve(inv_change,pcis->vec1_B,pcis->vec1_B);
15630bdf917eSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,new_nsp_vecs[i+start_new],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
15640bdf917eSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,new_nsp_vecs[i+start_new],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
15650bdf917eSStefano Zampini   }
15660bdf917eSStefano Zampini   ierr = VecNormalize(new_nsp_vecs[0],PETSC_NULL);CHKERRQ(ierr);
15670bdf917eSStefano Zampini   /* TODO : Orthonormalize vecs when new_nsp_size > 0! */
15680bdf917eSStefano Zampini 
15690bdf917eSStefano Zampini   /*PetscBool nsp_t=PETSC_FALSE;
15700bdf917eSStefano Zampini   ierr = MatNullSpaceTest(pcbddc->NullSpace,pc->pmat,&nsp_t);CHKERRQ(ierr);
15710bdf917eSStefano Zampini   printf("Original Null Space test: %d\n",nsp_t);
15720bdf917eSStefano Zampini   Mat temp_mat;
15730bdf917eSStefano Zampini   Mat_IS* matis = (Mat_IS*)pc->pmat->data;
15740bdf917eSStefano Zampini     temp_mat = matis->A;
15750bdf917eSStefano Zampini     matis->A = pcbddc->local_mat;
15760bdf917eSStefano Zampini     pcbddc->local_mat = temp_mat;
15770bdf917eSStefano Zampini   ierr = MatNullSpaceTest(pcbddc->NullSpace,pc->pmat,&nsp_t);CHKERRQ(ierr);
15780bdf917eSStefano Zampini   printf("Original Null Space, mat changed test: %d\n",nsp_t);
15790bdf917eSStefano Zampini   {
15800bdf917eSStefano Zampini     PetscReal test_norm;
15810bdf917eSStefano Zampini     for (i=0;i<new_nsp_size;i++) {
15820bdf917eSStefano Zampini       ierr = MatMult(pc->pmat,new_nsp_vecs[i],pcis->vec1_global);CHKERRQ(ierr);
15830bdf917eSStefano Zampini       ierr = VecNorm(pcis->vec1_global,NORM_2,&test_norm);CHKERRQ(ierr);
15840bdf917eSStefano Zampini       if (test_norm > 1.e-12) {
15850bdf917eSStefano Zampini         printf("------------ERROR VEC %d------------------\n",i);
15860bdf917eSStefano Zampini         ierr = VecView(pcis->vec1_global,PETSC_VIEWER_STDOUT_WORLD);
15870bdf917eSStefano Zampini         printf("------------------------------------------\n");
15880bdf917eSStefano Zampini       }
15890bdf917eSStefano Zampini     }
15900bdf917eSStefano Zampini   }*/
15910bdf917eSStefano Zampini 
15920bdf917eSStefano Zampini   ierr = KSPDestroy(&inv_change);CHKERRQ(ierr);
15930bdf917eSStefano Zampini   ierr = MatNullSpaceCreate(((PetscObject)pc)->comm,PETSC_FALSE,new_nsp_size,new_nsp_vecs,&new_nsp);CHKERRQ(ierr);
15940bdf917eSStefano Zampini   ierr = PCBDDCSetNullSpace(pc,new_nsp);CHKERRQ(ierr);
15950bdf917eSStefano Zampini   ierr = MatNullSpaceDestroy(&new_nsp);CHKERRQ(ierr);
15960bdf917eSStefano Zampini   /*
15970bdf917eSStefano Zampini   ierr = MatNullSpaceTest(pcbddc->NullSpace,pc->pmat,&nsp_t);CHKERRQ(ierr);
15980bdf917eSStefano Zampini   printf("New Null Space, mat changed: %d\n",nsp_t);
15990bdf917eSStefano Zampini     temp_mat = matis->A;
16000bdf917eSStefano Zampini     matis->A = pcbddc->local_mat;
16010bdf917eSStefano Zampini     pcbddc->local_mat = temp_mat;
16020bdf917eSStefano Zampini   ierr = MatNullSpaceTest(pcbddc->NullSpace,pc->pmat,&nsp_t);CHKERRQ(ierr);
16030bdf917eSStefano Zampini   printf("New Null Space, mat original: %d\n",nsp_t);*/
16040bdf917eSStefano Zampini 
16050bdf917eSStefano Zampini   for (i=0;i<new_nsp_size;i++) { ierr = VecDestroy(&new_nsp_vecs[i]);CHKERRQ(ierr); }
16060bdf917eSStefano Zampini   ierr = PetscFree(new_nsp_vecs);CHKERRQ(ierr);
16070bdf917eSStefano Zampini   PetscFunctionReturn(0);
16080bdf917eSStefano Zampini }
16090bdf917eSStefano Zampini 
16100bdf917eSStefano Zampini #undef __FUNCT__
16113425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPMatContext"
16123425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPMatContext(PC pc, FETIDPMat_ctx **fetidpmat_ctx)
16133425bc38SStefano Zampini {
16143425bc38SStefano Zampini   FETIDPMat_ctx  *newctx;
16153425bc38SStefano Zampini   PetscErrorCode ierr;
16163425bc38SStefano Zampini 
16173425bc38SStefano Zampini   PetscFunctionBegin;
16183425bc38SStefano Zampini   ierr = PetscMalloc(sizeof(*newctx),&newctx);CHKERRQ(ierr);
16193425bc38SStefano Zampini   newctx->lambda_local    = 0;
16203425bc38SStefano Zampini   newctx->temp_solution_B = 0;
16213425bc38SStefano Zampini   newctx->temp_solution_D = 0;
16223425bc38SStefano Zampini   newctx->B_delta         = 0;
16233425bc38SStefano Zampini   newctx->B_Ddelta        = 0; /* theoretically belongs to the FETIDP preconditioner */
16243425bc38SStefano Zampini   newctx->l2g_lambda      = 0;
16253425bc38SStefano Zampini   /* increase the reference count for BDDC preconditioner */
16263425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)pc);CHKERRQ(ierr);
16273425bc38SStefano Zampini   newctx->pc              = pc;
16283425bc38SStefano Zampini   *fetidpmat_ctx          = newctx;
16293425bc38SStefano Zampini   PetscFunctionReturn(0);
16303425bc38SStefano Zampini }
16313425bc38SStefano Zampini 
16323425bc38SStefano Zampini #undef __FUNCT__
16333425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPPCContext"
16343425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPPCContext(PC pc, FETIDPPC_ctx **fetidppc_ctx)
16353425bc38SStefano Zampini {
16363425bc38SStefano Zampini   FETIDPPC_ctx  *newctx;
16373425bc38SStefano Zampini   PetscErrorCode ierr;
16383425bc38SStefano Zampini 
16393425bc38SStefano Zampini   PetscFunctionBegin;
16403425bc38SStefano Zampini   ierr = PetscMalloc(sizeof(*newctx),&newctx);CHKERRQ(ierr);
16413425bc38SStefano Zampini   newctx->lambda_local    = 0;
16423425bc38SStefano Zampini   newctx->B_Ddelta        = 0;
16433425bc38SStefano Zampini   newctx->l2g_lambda      = 0;
16443425bc38SStefano Zampini   /* increase the reference count for BDDC preconditioner */
16453425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)pc);CHKERRQ(ierr);
16463425bc38SStefano Zampini   newctx->pc              = pc;
16473425bc38SStefano Zampini   *fetidppc_ctx           = newctx;
16483425bc38SStefano Zampini   PetscFunctionReturn(0);
16493425bc38SStefano Zampini }
16503425bc38SStefano Zampini 
16513425bc38SStefano Zampini #undef __FUNCT__
16523425bc38SStefano Zampini #define __FUNCT__ "PCBDDCDestroyFETIDPMat"
16533425bc38SStefano Zampini static PetscErrorCode PCBDDCDestroyFETIDPMat(Mat A)
16543425bc38SStefano Zampini {
16553425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
16563425bc38SStefano Zampini   PetscErrorCode ierr;
16573425bc38SStefano Zampini 
16583425bc38SStefano Zampini   PetscFunctionBegin;
16593425bc38SStefano Zampini   ierr = MatShellGetContext(A,(void**)&mat_ctx);CHKERRQ(ierr);
16603425bc38SStefano Zampini   ierr = VecDestroy(&mat_ctx->lambda_local);CHKERRQ(ierr);
16613425bc38SStefano Zampini   ierr = VecDestroy(&mat_ctx->temp_solution_D);CHKERRQ(ierr);
16623425bc38SStefano Zampini   ierr = VecDestroy(&mat_ctx->temp_solution_B);CHKERRQ(ierr);
16633425bc38SStefano Zampini   ierr = MatDestroy(&mat_ctx->B_delta);CHKERRQ(ierr);
16643425bc38SStefano Zampini   ierr = MatDestroy(&mat_ctx->B_Ddelta);CHKERRQ(ierr);
16653425bc38SStefano Zampini   ierr = VecScatterDestroy(&mat_ctx->l2g_lambda);CHKERRQ(ierr);
16663425bc38SStefano Zampini   ierr = PCDestroy(&mat_ctx->pc);CHKERRQ(ierr); /* actually it does not destroy BDDC, only decrease its reference count */
16673425bc38SStefano Zampini   ierr = PetscFree(mat_ctx);CHKERRQ(ierr);
16683425bc38SStefano Zampini   PetscFunctionReturn(0);
16693425bc38SStefano Zampini }
16703425bc38SStefano Zampini 
16713425bc38SStefano Zampini #undef __FUNCT__
16723425bc38SStefano Zampini #define __FUNCT__ "PCBDDCDestroyFETIDPPC"
16733425bc38SStefano Zampini static PetscErrorCode PCBDDCDestroyFETIDPPC(PC pc)
16743425bc38SStefano Zampini {
16753425bc38SStefano Zampini   FETIDPPC_ctx  *pc_ctx;
16763425bc38SStefano Zampini   PetscErrorCode ierr;
16773425bc38SStefano Zampini 
16783425bc38SStefano Zampini   PetscFunctionBegin;
16793425bc38SStefano Zampini   ierr = PCShellGetContext(pc,(void**)&pc_ctx);CHKERRQ(ierr);
16803425bc38SStefano Zampini   ierr = VecDestroy(&pc_ctx->lambda_local);CHKERRQ(ierr);
16813425bc38SStefano Zampini   ierr = MatDestroy(&pc_ctx->B_Ddelta);CHKERRQ(ierr);
16823425bc38SStefano Zampini   ierr = VecScatterDestroy(&pc_ctx->l2g_lambda);CHKERRQ(ierr);
16833425bc38SStefano Zampini   ierr = PCDestroy(&pc_ctx->pc);CHKERRQ(ierr); /* actually it does not destroy BDDC, only decrease its reference count */
16843425bc38SStefano Zampini   ierr = PetscFree(pc_ctx);CHKERRQ(ierr);
16853425bc38SStefano Zampini   PetscFunctionReturn(0);
16863425bc38SStefano Zampini }
16873425bc38SStefano Zampini 
16883425bc38SStefano Zampini #undef __FUNCT__
16893425bc38SStefano Zampini #define __FUNCT__ "PCBDDCSetupFETIDPMatContext"
16903425bc38SStefano Zampini static PetscErrorCode PCBDDCSetupFETIDPMatContext(FETIDPMat_ctx *fetidpmat_ctx )
16913425bc38SStefano Zampini {
16923425bc38SStefano Zampini   PetscErrorCode ierr;
16933425bc38SStefano Zampini   PC_IS          *pcis=(PC_IS*)fetidpmat_ctx->pc->data;
16943425bc38SStefano Zampini   PC_BDDC        *pcbddc=(PC_BDDC*)fetidpmat_ctx->pc->data;
16953425bc38SStefano Zampini   PCBDDCGraph    mat_graph=pcbddc->mat_graph;
16963425bc38SStefano Zampini   Mat_IS         *matis  = (Mat_IS*)fetidpmat_ctx->pc->pmat->data;
16973425bc38SStefano Zampini   MPI_Comm       comm = ((PetscObject)(fetidpmat_ctx->pc))->comm;
16983425bc38SStefano Zampini 
16993425bc38SStefano Zampini   Mat            ScalingMat;
17003425bc38SStefano Zampini   Vec            lambda_global;
17013425bc38SStefano Zampini   IS             IS_l2g_lambda;
17023425bc38SStefano Zampini 
17033425bc38SStefano Zampini   PetscBool      skip_node,fully_redundant;
1704ef028eecSStefano Zampini   PetscInt       i,j,k,s,n_boundary_dofs,n_global_lambda,n_vertices,partial_sum;
17053425bc38SStefano Zampini   PetscInt       n_local_lambda,n_lambda_for_dof,dual_size,n_neg_values,n_pos_values;
1706ef028eecSStefano Zampini   PetscMPIInt    rank,nprocs;
17073425bc38SStefano Zampini   PetscScalar    scalar_value;
17083425bc38SStefano Zampini 
17093425bc38SStefano Zampini   PetscInt       *vertex_indices,*temp_indices;
17103425bc38SStefano Zampini   PetscInt       *dual_dofs_boundary_indices,*aux_local_numbering_1,*aux_global_numbering;
17113425bc38SStefano Zampini   PetscInt       *aux_sums,*cols_B_delta,*l2g_indices;
17123425bc38SStefano Zampini   PetscScalar    *array,*scaling_factors,*vals_B_delta;
1713ef028eecSStefano Zampini   PetscInt       *aux_local_numbering_2,*dof_sizes,*dof_displs;
1714ef028eecSStefano Zampini   PetscInt       first_index,old_index;
1715ef028eecSStefano Zampini   PetscBool      first_found = PETSC_FALSE;
17163425bc38SStefano Zampini 
17173425bc38SStefano Zampini   /* For communication of scaling factors */
17183425bc38SStefano Zampini   PetscInt       *ptrs_buffer,neigh_position;
17193425bc38SStefano Zampini   PetscScalar    **all_factors,*send_buffer,*recv_buffer;
17203425bc38SStefano Zampini   MPI_Request    *send_reqs,*recv_reqs;
17213425bc38SStefano Zampini 
17223425bc38SStefano Zampini   /* tests */
17233425bc38SStefano Zampini   Vec            test_vec;
17243425bc38SStefano Zampini   PetscBool      test_fetidp;
17253425bc38SStefano Zampini   PetscViewer    viewer;
17263425bc38SStefano Zampini 
17273425bc38SStefano Zampini   PetscFunctionBegin;
17283425bc38SStefano Zampini   ierr = MPI_Comm_rank(comm,&rank);CHKERRQ(ierr);
17293425bc38SStefano Zampini   ierr = MPI_Comm_size(comm,&nprocs);CHKERRQ(ierr);
17303425bc38SStefano Zampini 
17313425bc38SStefano Zampini   /* Default type of lagrange multipliers is non-redundant */
17323425bc38SStefano Zampini   fully_redundant = PETSC_FALSE;
17333425bc38SStefano Zampini   ierr = PetscOptionsGetBool(PETSC_NULL,"-fetidp_fullyredundant",&fully_redundant,PETSC_NULL);CHKERRQ(ierr);
17343425bc38SStefano Zampini 
17353425bc38SStefano Zampini   /* Evaluate local and global number of lagrange multipliers */
17363425bc38SStefano Zampini   ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
17373425bc38SStefano Zampini   n_local_lambda = 0;
17383425bc38SStefano Zampini   partial_sum = 0;
17393425bc38SStefano Zampini   n_boundary_dofs = 0;
17403425bc38SStefano Zampini   s = 0;
17413425bc38SStefano Zampini   n_vertices = 0;
17423425bc38SStefano Zampini   /* Get Vertices used to define the BDDC */
17433425bc38SStefano Zampini   ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(*vertex_indices),&vertex_indices);CHKERRQ(ierr);
17443425bc38SStefano Zampini   for (i=0;i<pcbddc->local_primal_size;i++) {
17453425bc38SStefano Zampini     ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&j,(const PetscInt**)&temp_indices,PETSC_NULL);CHKERRQ(ierr);
17463425bc38SStefano Zampini     if (j == 1) {
17473425bc38SStefano Zampini       vertex_indices[n_vertices]=temp_indices[0];
17483425bc38SStefano Zampini       n_vertices++;
17493425bc38SStefano Zampini     }
17503425bc38SStefano Zampini     ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&j,(const PetscInt**)&temp_indices,PETSC_NULL);CHKERRQ(ierr);
17513425bc38SStefano Zampini   }
17523425bc38SStefano Zampini   dual_size = pcis->n_B-n_vertices;
1753f0474715SStefano Zampini   ierr = PetscSortInt(n_vertices,vertex_indices);CHKERRQ(ierr);
17543425bc38SStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*dual_dofs_boundary_indices),&dual_dofs_boundary_indices);CHKERRQ(ierr);
17553425bc38SStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*aux_local_numbering_1),&aux_local_numbering_1);CHKERRQ(ierr);
17563425bc38SStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*aux_local_numbering_2),&aux_local_numbering_2);CHKERRQ(ierr);
17573425bc38SStefano Zampini 
17583425bc38SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
17593425bc38SStefano Zampini   for (i=0;i<pcis->n;i++){
17603425bc38SStefano Zampini     j = mat_graph->count[i]; /* RECALL: mat_graph->count[i] does not count myself */
1761c6582918SStefano Zampini     k = 0;
1762c6582918SStefano Zampini     if (j > 0) {
17633425bc38SStefano Zampini       k = (mat_graph->neighbours_set[i][0] == -1 ?  1 : 0);
1764c6582918SStefano Zampini     }
17653425bc38SStefano Zampini     j = j - k ;
17663425bc38SStefano Zampini     if ( j > 0 ) { n_boundary_dofs++; }
17673425bc38SStefano Zampini 
17683425bc38SStefano Zampini     skip_node = PETSC_FALSE;
1769c6582918SStefano Zampini     if ( s < n_vertices && vertex_indices[s]==i) { /* it works for a sorted set of vertices */
17703425bc38SStefano Zampini       skip_node = PETSC_TRUE;
17713425bc38SStefano Zampini       s++;
17723425bc38SStefano Zampini     }
17733425bc38SStefano Zampini     if (j < 1) {skip_node = PETSC_TRUE;}
17743425bc38SStefano Zampini     if ( !skip_node ) {
17753425bc38SStefano Zampini       if (fully_redundant) {
17763425bc38SStefano Zampini         /* fully redundant set of lagrange multipliers */
17773425bc38SStefano Zampini         n_lambda_for_dof = (j*(j+1))/2;
17783425bc38SStefano Zampini       } else {
17793425bc38SStefano Zampini         n_lambda_for_dof = j;
17803425bc38SStefano Zampini       }
17813425bc38SStefano Zampini       n_local_lambda += j;
17823425bc38SStefano Zampini       /* needed to evaluate global number of lagrange multipliers */
17833425bc38SStefano Zampini       array[i]=(1.0*n_lambda_for_dof)/(j+1.0); /* already scaled for the next global sum */
17843425bc38SStefano Zampini       /* store some data needed */
17853425bc38SStefano Zampini       dual_dofs_boundary_indices[partial_sum] = n_boundary_dofs-1;
17863425bc38SStefano Zampini       aux_local_numbering_1[partial_sum] = i;
1787ef028eecSStefano Zampini       aux_local_numbering_2[partial_sum] = n_lambda_for_dof;
17883425bc38SStefano Zampini       partial_sum++;
17893425bc38SStefano Zampini     }
17903425bc38SStefano Zampini   }
17913425bc38SStefano Zampini   /*printf("I found %d local lambda dofs\n",n_local_lambda);
17923425bc38SStefano Zampini   printf("I found %d boundary dofs (should be %d)\n",n_boundary_dofs,pcis->n_B);
17933425bc38SStefano Zampini   printf("Partial sum %d should be %d\n",partial_sum,dual_size);*/
17943425bc38SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1795ef028eecSStefano Zampini 
17963425bc38SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
17973425bc38SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
17983425bc38SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
17993425bc38SStefano Zampini   ierr = VecSum(pcis->vec1_global,&scalar_value);CHKERRQ(ierr);
18003425bc38SStefano Zampini   fetidpmat_ctx->n_lambda = (PetscInt) scalar_value;
18013425bc38SStefano Zampini   /* printf("I found %d global multipliers (%f)\n",fetidpmat_ctx->n_lambda,scalar_value); */
18023425bc38SStefano Zampini 
18033425bc38SStefano Zampini   /* compute global ordering of lagrange multipliers and associate l2g map */
1804ef028eecSStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
1805ef028eecSStefano Zampini   ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
1806ef028eecSStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1807ef028eecSStefano Zampini   for (i=0;i<dual_size;i++) {
1808ef028eecSStefano Zampini     array[aux_local_numbering_1[i]] = aux_local_numbering_2[i];
1809ef028eecSStefano Zampini   }
1810ef028eecSStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1811ef028eecSStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
1812ef028eecSStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
1813ef028eecSStefano Zampini   ierr = VecSum(pcis->vec1_global,&scalar_value);CHKERRQ(ierr);
1814ef028eecSStefano Zampini   if (pcbddc->dbg_flag && (PetscInt)scalar_value != fetidpmat_ctx->n_lambda) {
1815ef028eecSStefano Zampini     SETERRQ3(PETSC_COMM_WORLD,PETSC_ERR_PLIB,"Error in %s: global number of multipliers mismatch! (%d!=%d)\n",__FUNCT__,(PetscInt)scalar_value,fetidpmat_ctx->n_lambda);
1816ef028eecSStefano Zampini   }
18173425bc38SStefano Zampini 
1818ef028eecSStefano Zampini   /* Fill pcis->vec1_global with cumulative function for global numbering */
1819ef028eecSStefano Zampini   ierr = VecGetArray(pcis->vec1_global,&array);CHKERRQ(ierr);
1820ef028eecSStefano Zampini   ierr = VecGetLocalSize(pcis->vec1_global,&s);CHKERRQ(ierr);
1821ef028eecSStefano Zampini   k = 0;
1822ef028eecSStefano Zampini   first_index = -1;
1823ef028eecSStefano Zampini   for (i=0;i<s;i++) {
1824ef028eecSStefano Zampini     if (!first_found && array[i] > 0.0) {
1825ef028eecSStefano Zampini       first_found = PETSC_TRUE;
1826ef028eecSStefano Zampini       first_index = i;
1827ef028eecSStefano Zampini     }
1828ef028eecSStefano Zampini     k += (PetscInt)array[i];
1829ef028eecSStefano Zampini   }
1830ef028eecSStefano Zampini   j = ( !rank ? nprocs : 0);
18313425bc38SStefano Zampini   ierr = PetscMalloc(j*sizeof(*dof_sizes),&dof_sizes);CHKERRQ(ierr);
18323425bc38SStefano Zampini   ierr = PetscMalloc(j*sizeof(*dof_displs),&dof_displs);CHKERRQ(ierr);
1833ef028eecSStefano Zampini   ierr = MPI_Gather(&k,1,MPIU_INT,dof_sizes,1,MPIU_INT,0,comm);CHKERRQ(ierr);
1834ef028eecSStefano Zampini   if (!rank) {
18353425bc38SStefano Zampini     dof_displs[0]=0;
18363425bc38SStefano Zampini     for (i=1;i<nprocs;i++) {
18373425bc38SStefano Zampini       dof_displs[i] = dof_displs[i-1]+dof_sizes[i-1];
18383425bc38SStefano Zampini     }
18393425bc38SStefano Zampini   }
1840ef028eecSStefano Zampini   ierr = MPI_Scatter(dof_displs,1,MPIU_INT,&k,1,MPIU_INT,0,comm);CHKERRQ(ierr);
1841ef028eecSStefano Zampini   if (first_found) {
1842ef028eecSStefano Zampini     array[first_index] += k;
1843ef028eecSStefano Zampini     old_index = first_index;
1844ef028eecSStefano Zampini     for (i=first_index+1;i<s;i++) {
1845ef028eecSStefano Zampini       if (array[i] > 0.0) {
1846ef028eecSStefano Zampini         array[i] += array[old_index];
1847ef028eecSStefano Zampini         old_index = i;
1848ef028eecSStefano Zampini       }
1849ef028eecSStefano Zampini     }
1850ef028eecSStefano Zampini   }
1851ef028eecSStefano Zampini   ierr = VecRestoreArray(pcis->vec1_global,&array);CHKERRQ(ierr);
1852ef028eecSStefano Zampini   ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
1853ef028eecSStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1854ef028eecSStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1855ef028eecSStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*aux_global_numbering),&aux_global_numbering);CHKERRQ(ierr);
1856ef028eecSStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
18573425bc38SStefano Zampini   for (i=0;i<dual_size;i++) {
1858ef028eecSStefano Zampini     aux_global_numbering[i] = (PetscInt)array[aux_local_numbering_1[i]]-aux_local_numbering_2[i];
18593425bc38SStefano Zampini   }
1860ef028eecSStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1861f0474715SStefano Zampini   ierr = PetscFree(aux_local_numbering_2);CHKERRQ(ierr);
1862f0474715SStefano Zampini   ierr = PetscFree(dof_displs);CHKERRQ(ierr);
1863f0474715SStefano Zampini   ierr = PetscFree(dof_sizes);CHKERRQ(ierr);
18643425bc38SStefano Zampini 
18653425bc38SStefano Zampini   /* init data for scaling factors exchange */
18663425bc38SStefano Zampini   partial_sum = 0;
18673425bc38SStefano Zampini   j = 0;
18683425bc38SStefano Zampini   ierr = PetscMalloc(pcis->n_neigh*sizeof(PetscInt),&ptrs_buffer);CHKERRQ(ierr);
18693425bc38SStefano Zampini   ierr = PetscMalloc((pcis->n_neigh-1)*sizeof(MPI_Request),&send_reqs);CHKERRQ(ierr);
18703425bc38SStefano Zampini   ierr = PetscMalloc((pcis->n_neigh-1)*sizeof(MPI_Request),&recv_reqs);CHKERRQ(ierr);
18713425bc38SStefano Zampini   ierr = PetscMalloc(pcis->n*sizeof(PetscScalar*),&all_factors);CHKERRQ(ierr);
18723425bc38SStefano Zampini   ptrs_buffer[0]=0;
18733425bc38SStefano Zampini   for (i=1;i<pcis->n_neigh;i++) {
18743425bc38SStefano Zampini     partial_sum += pcis->n_shared[i];
18753425bc38SStefano Zampini     ptrs_buffer[i] = ptrs_buffer[i-1]+pcis->n_shared[i];
18763425bc38SStefano Zampini   }
18773425bc38SStefano Zampini   ierr = PetscMalloc( partial_sum*sizeof(PetscScalar),&send_buffer);CHKERRQ(ierr);
18783425bc38SStefano Zampini   ierr = PetscMalloc( partial_sum*sizeof(PetscScalar),&recv_buffer);CHKERRQ(ierr);
18793425bc38SStefano Zampini   ierr = PetscMalloc( partial_sum*sizeof(PetscScalar),&all_factors[0]);CHKERRQ(ierr);
18803425bc38SStefano Zampini   for (i=0;i<pcis->n-1;i++) {
18813425bc38SStefano Zampini     j = mat_graph->count[i];
18823425bc38SStefano Zampini     if (j>0) {
18833425bc38SStefano Zampini       k = (mat_graph->neighbours_set[i][0] == -1 ?  1 : 0);
18843425bc38SStefano Zampini       j = j - k;
18853425bc38SStefano Zampini     }
18863425bc38SStefano Zampini     all_factors[i+1]=all_factors[i]+j;
18873425bc38SStefano Zampini   }
18883425bc38SStefano Zampini   /* scatter B scaling to N vec */
18893425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->N_to_B,pcis->D,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18903425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->N_to_B,pcis->D,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18913425bc38SStefano Zampini   /* communications */
18923425bc38SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
18933425bc38SStefano Zampini   for (i=1;i<pcis->n_neigh;i++) {
18943425bc38SStefano Zampini     for (j=0;j<pcis->n_shared[i];j++) {
18953425bc38SStefano Zampini       send_buffer[ptrs_buffer[i-1]+j]=array[pcis->shared[i][j]];
18963425bc38SStefano Zampini     }
18973425bc38SStefano Zampini     j = ptrs_buffer[i]-ptrs_buffer[i-1];
1898ea7e1babSStefano Zampini     ierr = MPI_Isend(&send_buffer[ptrs_buffer[i-1]],j,MPIU_SCALAR,pcis->neigh[i],0,comm,&send_reqs[i-1]);CHKERRQ(ierr);
1899ea7e1babSStefano Zampini     ierr = MPI_Irecv(&recv_buffer[ptrs_buffer[i-1]],j,MPIU_SCALAR,pcis->neigh[i],0,comm,&recv_reqs[i-1]);CHKERRQ(ierr);
19003425bc38SStefano Zampini   }
19013425bc38SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1902ea7e1babSStefano Zampini   ierr = MPI_Waitall((pcis->n_neigh-1),recv_reqs,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
19033425bc38SStefano Zampini   /* put values in correct places */
19043425bc38SStefano Zampini   for (i=1;i<pcis->n_neigh;i++) {
19053425bc38SStefano Zampini     for (j=0;j<pcis->n_shared[i];j++) {
19063425bc38SStefano Zampini       k = pcis->shared[i][j];
19073425bc38SStefano Zampini       neigh_position = 0;
19083425bc38SStefano Zampini       while(mat_graph->neighbours_set[k][neigh_position] != pcis->neigh[i]) {neigh_position++;}
19093425bc38SStefano Zampini       s = (mat_graph->neighbours_set[k][0] == -1 ?  1 : 0);
19103425bc38SStefano Zampini       neigh_position = neigh_position - s;
19113425bc38SStefano Zampini       all_factors[k][neigh_position]=recv_buffer[ptrs_buffer[i-1]+j];
19123425bc38SStefano Zampini     }
19133425bc38SStefano Zampini   }
1914ea7e1babSStefano Zampini   ierr = MPI_Waitall((pcis->n_neigh-1),send_reqs,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
19153425bc38SStefano Zampini   ierr = PetscFree(send_reqs);CHKERRQ(ierr);
19163425bc38SStefano Zampini   ierr = PetscFree(recv_reqs);CHKERRQ(ierr);
19173425bc38SStefano Zampini   ierr = PetscFree(send_buffer);CHKERRQ(ierr);
19183425bc38SStefano Zampini   ierr = PetscFree(recv_buffer);CHKERRQ(ierr);
19193425bc38SStefano Zampini   ierr = PetscFree(ptrs_buffer);CHKERRQ(ierr);
19203425bc38SStefano Zampini 
19213425bc38SStefano Zampini   /* Compute B and B_delta (local actions) */
19223425bc38SStefano Zampini   ierr = PetscMalloc(pcis->n_neigh*sizeof(*aux_sums),&aux_sums);CHKERRQ(ierr);
19233425bc38SStefano Zampini   ierr = PetscMalloc(n_local_lambda*sizeof(*l2g_indices),&l2g_indices);CHKERRQ(ierr);
19243425bc38SStefano Zampini   ierr = PetscMalloc(n_local_lambda*sizeof(*vals_B_delta),&vals_B_delta);CHKERRQ(ierr);
19253425bc38SStefano Zampini   ierr = PetscMalloc(n_local_lambda*sizeof(*cols_B_delta),&cols_B_delta);CHKERRQ(ierr);
19263425bc38SStefano Zampini   ierr = PetscMalloc(n_local_lambda*sizeof(*scaling_factors),&scaling_factors);CHKERRQ(ierr);
19273425bc38SStefano Zampini   n_global_lambda=0;
19283425bc38SStefano Zampini   partial_sum=0;
19293425bc38SStefano Zampini   for (i=0;i<dual_size;i++) {
1930ef028eecSStefano Zampini     n_global_lambda = aux_global_numbering[i];
19313425bc38SStefano Zampini     j = mat_graph->count[aux_local_numbering_1[i]];
19323425bc38SStefano Zampini     k = (mat_graph->neighbours_set[aux_local_numbering_1[i]][0] == -1 ?  1 : 0);
19333425bc38SStefano Zampini     j = j - k;
19343425bc38SStefano Zampini     aux_sums[0]=0;
19353425bc38SStefano Zampini     for (s=1;s<j;s++) {
19363425bc38SStefano Zampini       aux_sums[s]=aux_sums[s-1]+j-s+1;
19373425bc38SStefano Zampini     }
19383425bc38SStefano Zampini     array = all_factors[aux_local_numbering_1[i]];
19393425bc38SStefano Zampini     n_neg_values = 0;
19403425bc38SStefano Zampini     while(n_neg_values < j && mat_graph->neighbours_set[aux_local_numbering_1[i]][n_neg_values+k] < rank) {n_neg_values++;}
19413425bc38SStefano Zampini     n_pos_values = j - n_neg_values;
19423425bc38SStefano Zampini     if (fully_redundant) {
19433425bc38SStefano Zampini       for (s=0;s<n_neg_values;s++) {
19443425bc38SStefano Zampini         l2g_indices    [partial_sum+s]=aux_sums[s]+n_neg_values-s-1+n_global_lambda;
19453425bc38SStefano Zampini         cols_B_delta   [partial_sum+s]=dual_dofs_boundary_indices[i];
19463425bc38SStefano Zampini         vals_B_delta   [partial_sum+s]=-1.0;
19473425bc38SStefano Zampini         scaling_factors[partial_sum+s]=array[s];
19483425bc38SStefano Zampini       }
19493425bc38SStefano Zampini       for (s=0;s<n_pos_values;s++) {
19503425bc38SStefano Zampini         l2g_indices    [partial_sum+s+n_neg_values]=aux_sums[n_neg_values]+s+n_global_lambda;
19513425bc38SStefano Zampini         cols_B_delta   [partial_sum+s+n_neg_values]=dual_dofs_boundary_indices[i];
19523425bc38SStefano Zampini         vals_B_delta   [partial_sum+s+n_neg_values]=1.0;
19533425bc38SStefano Zampini         scaling_factors[partial_sum+s+n_neg_values]=array[s+n_neg_values];
19543425bc38SStefano Zampini       }
19553425bc38SStefano Zampini       partial_sum += j;
19563425bc38SStefano Zampini     } else {
19573425bc38SStefano Zampini       /* l2g_indices and default cols and vals of B_delta */
19583425bc38SStefano Zampini       for (s=0;s<j;s++) {
19593425bc38SStefano Zampini         l2g_indices    [partial_sum+s]=n_global_lambda+s;
19603425bc38SStefano Zampini         cols_B_delta   [partial_sum+s]=dual_dofs_boundary_indices[i];
19613425bc38SStefano Zampini         vals_B_delta   [partial_sum+s]=0.0;
19623425bc38SStefano Zampini       }
19633425bc38SStefano Zampini       /* B_delta */
19643425bc38SStefano Zampini       if ( n_neg_values > 0 ) { /* there's a rank next to me to the left */
19653425bc38SStefano Zampini         vals_B_delta   [partial_sum+n_neg_values-1]=-1.0;
19663425bc38SStefano Zampini       }
19673425bc38SStefano Zampini       if ( n_neg_values < j ) { /* there's a rank next to me to the right */
19683425bc38SStefano Zampini         vals_B_delta   [partial_sum+n_neg_values]=1.0;
19693425bc38SStefano Zampini       }
19703425bc38SStefano Zampini       /* scaling as in Klawonn-Widlund 1999*/
19713425bc38SStefano Zampini       for (s=0;s<n_neg_values;s++) {
19723425bc38SStefano Zampini         scalar_value = 0.0;
19733425bc38SStefano Zampini         for (k=0;k<s+1;k++) {
19743425bc38SStefano Zampini           scalar_value += array[k];
19753425bc38SStefano Zampini         }
1976ef028eecSStefano Zampini         scaling_factors[partial_sum+s] = -scalar_value;
19773425bc38SStefano Zampini       }
19783425bc38SStefano Zampini       for (s=0;s<n_pos_values;s++) {
19793425bc38SStefano Zampini         scalar_value = 0.0;
19803425bc38SStefano Zampini         for (k=s+n_neg_values;k<j;k++) {
19813425bc38SStefano Zampini           scalar_value += array[k];
19823425bc38SStefano Zampini         }
19833425bc38SStefano Zampini         scaling_factors[partial_sum+s+n_neg_values] = scalar_value;
19843425bc38SStefano Zampini       }
19853425bc38SStefano Zampini       partial_sum += j;
19863425bc38SStefano Zampini     }
19873425bc38SStefano Zampini   }
1988ef028eecSStefano Zampini   ierr = PetscFree(aux_global_numbering);CHKERRQ(ierr);
1989f0474715SStefano Zampini   ierr = PetscFree(aux_sums);CHKERRQ(ierr);
1990f0474715SStefano Zampini   ierr = PetscFree(aux_local_numbering_1);CHKERRQ(ierr);
1991f0474715SStefano Zampini   ierr = PetscFree(dual_dofs_boundary_indices);CHKERRQ(ierr);
19923425bc38SStefano Zampini   ierr = PetscFree(all_factors[0]);CHKERRQ(ierr);
19933425bc38SStefano Zampini   ierr = PetscFree(all_factors);CHKERRQ(ierr);
19943425bc38SStefano Zampini   /* printf("I found %d local lambda dofs when numbering them (should be %d)\n",partial_sum,n_local_lambda); */
1995f0474715SStefano Zampini 
1996f0474715SStefano Zampini   /* Local to global mapping of fetidpmat */
1997f0474715SStefano Zampini   ierr = VecCreate(PETSC_COMM_SELF,&fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
1998f0474715SStefano Zampini   ierr = VecSetSizes(fetidpmat_ctx->lambda_local,n_local_lambda,n_local_lambda);CHKERRQ(ierr);
1999f0474715SStefano Zampini   ierr = VecSetType(fetidpmat_ctx->lambda_local,VECSEQ);CHKERRQ(ierr);
2000f0474715SStefano Zampini   ierr = VecCreate(comm,&lambda_global);CHKERRQ(ierr);
2001f0474715SStefano Zampini   ierr = VecSetSizes(lambda_global,PETSC_DECIDE,fetidpmat_ctx->n_lambda);CHKERRQ(ierr);
2002f0474715SStefano Zampini   ierr = VecSetType(lambda_global,VECMPI);CHKERRQ(ierr);
20033425bc38SStefano Zampini   ierr = ISCreateGeneral(comm,n_local_lambda,l2g_indices,PETSC_OWN_POINTER,&IS_l2g_lambda);CHKERRQ(ierr);
20043425bc38SStefano Zampini   ierr = VecScatterCreate(fetidpmat_ctx->lambda_local,(IS)0,lambda_global,IS_l2g_lambda,&fetidpmat_ctx->l2g_lambda);CHKERRQ(ierr);
2005f0474715SStefano Zampini   ierr = ISDestroy(&IS_l2g_lambda);CHKERRQ(ierr);
20063425bc38SStefano Zampini 
20073425bc38SStefano Zampini   /* Create local part of B_delta */
20083425bc38SStefano Zampini   ierr = MatCreate(PETSC_COMM_SELF,&fetidpmat_ctx->B_delta);
20093425bc38SStefano Zampini   ierr = MatSetSizes(fetidpmat_ctx->B_delta,n_local_lambda,pcis->n_B,n_local_lambda,pcis->n_B);CHKERRQ(ierr);
20103425bc38SStefano Zampini   ierr = MatSetType(fetidpmat_ctx->B_delta,MATSEQAIJ);CHKERRQ(ierr);
20113425bc38SStefano Zampini   ierr = MatSeqAIJSetPreallocation(fetidpmat_ctx->B_delta,1,PETSC_NULL);CHKERRQ(ierr);
20123425bc38SStefano Zampini   ierr = MatSetOption(fetidpmat_ctx->B_delta,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr);
20133425bc38SStefano Zampini   for (i=0;i<n_local_lambda;i++) {
20143425bc38SStefano Zampini     ierr = MatSetValue(fetidpmat_ctx->B_delta,i,cols_B_delta[i],vals_B_delta[i],INSERT_VALUES);CHKERRQ(ierr);
20153425bc38SStefano Zampini   }
2016f0474715SStefano Zampini   ierr = PetscFree(vals_B_delta);CHKERRQ(ierr);
20173425bc38SStefano Zampini   ierr = MatAssemblyBegin(fetidpmat_ctx->B_delta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
20183425bc38SStefano Zampini   ierr = MatAssemblyEnd  (fetidpmat_ctx->B_delta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
20193425bc38SStefano Zampini 
20203425bc38SStefano Zampini   if (fully_redundant) {
20213425bc38SStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&ScalingMat);
20223425bc38SStefano Zampini     ierr = MatSetSizes(ScalingMat,n_local_lambda,n_local_lambda,n_local_lambda,n_local_lambda);CHKERRQ(ierr);
20233425bc38SStefano Zampini     ierr = MatSetType(ScalingMat,MATSEQAIJ);CHKERRQ(ierr);
20243425bc38SStefano Zampini     ierr = MatSeqAIJSetPreallocation(ScalingMat,1,PETSC_NULL);CHKERRQ(ierr);
20253425bc38SStefano Zampini     for (i=0;i<n_local_lambda;i++) {
20263425bc38SStefano Zampini       ierr = MatSetValue(ScalingMat,i,i,scaling_factors[i],INSERT_VALUES);CHKERRQ(ierr);
20273425bc38SStefano Zampini     }
20283425bc38SStefano Zampini     ierr = MatAssemblyBegin(ScalingMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
20293425bc38SStefano Zampini     ierr = MatAssemblyEnd  (ScalingMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
20303425bc38SStefano Zampini     ierr = MatMatMult(ScalingMat,fetidpmat_ctx->B_delta,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&fetidpmat_ctx->B_Ddelta);CHKERRQ(ierr);
20313425bc38SStefano Zampini     ierr = MatDestroy(&ScalingMat);CHKERRQ(ierr);
20323425bc38SStefano Zampini   } else {
20333425bc38SStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&fetidpmat_ctx->B_Ddelta);
20343425bc38SStefano Zampini     ierr = MatSetSizes(fetidpmat_ctx->B_Ddelta,n_local_lambda,pcis->n_B,n_local_lambda,pcis->n_B);CHKERRQ(ierr);
20353425bc38SStefano Zampini     ierr = MatSetType(fetidpmat_ctx->B_Ddelta,MATSEQAIJ);CHKERRQ(ierr);
20363425bc38SStefano Zampini     ierr = MatSeqAIJSetPreallocation(fetidpmat_ctx->B_Ddelta,1,PETSC_NULL);CHKERRQ(ierr);
20373425bc38SStefano Zampini     for (i=0;i<n_local_lambda;i++) {
20383425bc38SStefano Zampini       ierr = MatSetValue(fetidpmat_ctx->B_Ddelta,i,cols_B_delta[i],scaling_factors[i],INSERT_VALUES);CHKERRQ(ierr);
20393425bc38SStefano Zampini     }
20403425bc38SStefano Zampini     ierr = MatAssemblyBegin(fetidpmat_ctx->B_Ddelta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
20413425bc38SStefano Zampini     ierr = MatAssemblyEnd  (fetidpmat_ctx->B_Ddelta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
20423425bc38SStefano Zampini   }
2043f0474715SStefano Zampini   ierr = PetscFree(scaling_factors);CHKERRQ(ierr);
2044f0474715SStefano Zampini   ierr = PetscFree(cols_B_delta);CHKERRQ(ierr);
20453425bc38SStefano Zampini 
20463425bc38SStefano Zampini   /* Create some vectors needed by fetidp */
20473425bc38SStefano Zampini   ierr = VecDuplicate(pcis->vec1_B,&fetidpmat_ctx->temp_solution_B);CHKERRQ(ierr);
20483425bc38SStefano Zampini   ierr = VecDuplicate(pcis->vec1_D,&fetidpmat_ctx->temp_solution_D);CHKERRQ(ierr);
20493425bc38SStefano Zampini 
20503425bc38SStefano Zampini   test_fetidp = PETSC_FALSE;
20513425bc38SStefano Zampini   ierr = PetscOptionsGetBool(PETSC_NULL,"-fetidp_check",&test_fetidp,PETSC_NULL);CHKERRQ(ierr);
20523425bc38SStefano Zampini 
20533425bc38SStefano Zampini   if (test_fetidp) {
20543425bc38SStefano Zampini 
20553425bc38SStefano Zampini     ierr = PetscViewerASCIIGetStdout(((PetscObject)(fetidpmat_ctx->pc))->comm,&viewer);CHKERRQ(ierr);
20563425bc38SStefano Zampini     ierr = PetscViewerASCIISynchronizedAllow(viewer,PETSC_TRUE);CHKERRQ(ierr);
20573425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"----------FETI_DP TESTS--------------\n");CHKERRQ(ierr);
20583425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"All tests should return zero!\n");CHKERRQ(ierr);
20593425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"FETIDP MAT context in the ");CHKERRQ(ierr);
20603425bc38SStefano Zampini     if (fully_redundant) {
20613425bc38SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"fully redundant case for lagrange multipliers.\n");CHKERRQ(ierr);
20623425bc38SStefano Zampini     } else {
20633425bc38SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Non-fully redundant case for lagrange multiplier.\n");CHKERRQ(ierr);
20643425bc38SStefano Zampini     }
20653425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
20663425bc38SStefano Zampini 
20673425bc38SStefano Zampini     /******************************************************************/
20683425bc38SStefano Zampini     /* TEST A/B: Test numbering of global lambda dofs             */
20693425bc38SStefano Zampini     /******************************************************************/
20703425bc38SStefano Zampini 
20713425bc38SStefano Zampini     ierr = VecDuplicate(fetidpmat_ctx->lambda_local,&test_vec);CHKERRQ(ierr);
20723425bc38SStefano Zampini     ierr = VecSet(lambda_global,1.0);CHKERRQ(ierr);
20733425bc38SStefano Zampini     ierr = VecSet(test_vec,1.0);CHKERRQ(ierr);
20743425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
20753425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
20763425bc38SStefano Zampini     scalar_value = -1.0;
20773425bc38SStefano Zampini     ierr = VecAXPY(test_vec,scalar_value,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
20783425bc38SStefano Zampini     ierr = VecNorm(test_vec,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
20793425bc38SStefano Zampini     ierr = VecDestroy(&test_vec);CHKERRQ(ierr);
20803425bc38SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"A[%04d]: CHECK glob to loc: % 1.14e\n",rank,scalar_value);CHKERRQ(ierr);
20813425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
20823425bc38SStefano Zampini     if (fully_redundant) {
20833425bc38SStefano Zampini       ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr);
20843425bc38SStefano Zampini       ierr = VecSet(fetidpmat_ctx->lambda_local,0.5);CHKERRQ(ierr);
20853425bc38SStefano Zampini       ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20863425bc38SStefano Zampini       ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20873425bc38SStefano Zampini       ierr = VecSum(lambda_global,&scalar_value);CHKERRQ(ierr);
20883425bc38SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"B[%04d]: CHECK loc to glob: % 1.14e\n",rank,scalar_value-fetidpmat_ctx->n_lambda);CHKERRQ(ierr);
20893425bc38SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
20903425bc38SStefano Zampini     }
20913425bc38SStefano Zampini 
20923425bc38SStefano Zampini     /******************************************************************/
20933425bc38SStefano Zampini     /* TEST C: It should hold B_delta*w=0, w\in\widehat{W}            */
20943425bc38SStefano Zampini     /* This is the meaning of the B matrix                            */
20953425bc38SStefano Zampini     /******************************************************************/
20963425bc38SStefano Zampini 
20973425bc38SStefano Zampini     ierr = VecSetRandom(pcis->vec1_N,PETSC_NULL);CHKERRQ(ierr);
20983425bc38SStefano Zampini     ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
20993425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21003425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21013425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21023425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21033425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21043425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21053425bc38SStefano Zampini     /* Action of B_delta */
21063425bc38SStefano Zampini     ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
21073425bc38SStefano Zampini     ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr);
21083425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21093425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21103425bc38SStefano Zampini     ierr = VecNorm(lambda_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
21113425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"C[coll]: CHECK infty norm of B_delta*w (w continuous): % 1.14e\n",scalar_value);CHKERRQ(ierr);
21123425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
21133425bc38SStefano Zampini 
21143425bc38SStefano Zampini     /******************************************************************/
21153425bc38SStefano Zampini     /* TEST D: It should hold E_Dw = w - P_Dw, w\in\widetilde{W}     */
21163425bc38SStefano Zampini     /* E_D = R_D^TR                                                   */
21173425bc38SStefano Zampini     /* P_D = B_{D,delta}^T B_{delta}                                  */
21183425bc38SStefano Zampini     /* eq.44 Mandel Tezaur and Dohrmann 2005                          */
21193425bc38SStefano Zampini     /******************************************************************/
21203425bc38SStefano Zampini 
21213425bc38SStefano Zampini     /* compute a random vector in \widetilde{W} */
21223425bc38SStefano Zampini     ierr = VecSetRandom(pcis->vec1_N,PETSC_NULL);CHKERRQ(ierr);
21233425bc38SStefano Zampini     scalar_value = 0.0;  /* set zero at vertices */
21243425bc38SStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
21253425bc38SStefano Zampini     for (i=0;i<n_vertices;i++) { array[vertex_indices[i]]=scalar_value; }
21263425bc38SStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
21273425bc38SStefano Zampini     /* store w for final comparison */
21283425bc38SStefano Zampini     ierr = VecDuplicate(pcis->vec1_B,&test_vec);CHKERRQ(ierr);
21293425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,test_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21303425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,test_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21313425bc38SStefano Zampini 
21323425bc38SStefano Zampini     /* Jump operator P_D : results stored in pcis->vec1_B */
21333425bc38SStefano Zampini 
21343425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21353425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21363425bc38SStefano Zampini     /* Action of B_delta */
21373425bc38SStefano Zampini     ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
21383425bc38SStefano Zampini     ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr);
21393425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21403425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21413425bc38SStefano Zampini     /* Action of B_Ddelta^T */
21423425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21433425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21443425bc38SStefano Zampini     ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
21453425bc38SStefano Zampini 
21463425bc38SStefano Zampini     /* Average operator E_D : results stored in pcis->vec2_B */
21473425bc38SStefano Zampini 
21483425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21493425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21503425bc38SStefano Zampini     ierr = VecPointwiseMult(pcis->vec2_B,pcis->D,pcis->vec2_B);CHKERRQ(ierr);
21513425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec2_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21523425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec2_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21533425bc38SStefano Zampini     ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
21543425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21553425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21563425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21573425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21583425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21593425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21603425bc38SStefano Zampini 
21613425bc38SStefano Zampini     /* test E_D=I-P_D */
21623425bc38SStefano Zampini     scalar_value = 1.0;
21633425bc38SStefano Zampini     ierr = VecAXPY(pcis->vec1_B,scalar_value,pcis->vec2_B);CHKERRQ(ierr);
21643425bc38SStefano Zampini     scalar_value = -1.0;
21653425bc38SStefano Zampini     ierr = VecAXPY(pcis->vec1_B,scalar_value,test_vec);CHKERRQ(ierr);
21663425bc38SStefano Zampini     ierr = VecNorm(pcis->vec1_B,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
21673425bc38SStefano Zampini     ierr = VecDestroy(&test_vec);CHKERRQ(ierr);
21683425bc38SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"D[%04d] CHECK infty norm of E_D + P_D - I: % 1.14e\n",rank,scalar_value);CHKERRQ(ierr);
21693425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
21703425bc38SStefano Zampini 
21713425bc38SStefano Zampini     /******************************************************************/
21723425bc38SStefano Zampini     /* TEST E: It should holds R_D^TP_Dw=0 w\in\widetilde{W}          */
21733425bc38SStefano Zampini     /* eq.48 Mandel Tezaur and Dohrmann 2005                          */
21743425bc38SStefano Zampini     /******************************************************************/
21753425bc38SStefano Zampini 
21763425bc38SStefano Zampini     ierr = VecSetRandom(pcis->vec1_N,PETSC_NULL);CHKERRQ(ierr);
21773425bc38SStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
21783425bc38SStefano Zampini     scalar_value = 0.0;  /* set zero at vertices */
21793425bc38SStefano Zampini     for (i=0;i<n_vertices;i++) { array[vertex_indices[i]]=scalar_value; }
21803425bc38SStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
21813425bc38SStefano Zampini 
21823425bc38SStefano Zampini     /* Jump operator P_D : results stored in pcis->vec1_B */
21833425bc38SStefano Zampini 
21843425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21853425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21863425bc38SStefano Zampini     /* Action of B_delta */
21873425bc38SStefano Zampini     ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
21883425bc38SStefano Zampini     ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr);
21893425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21903425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21913425bc38SStefano Zampini     /* Action of B_Ddelta^T */
21923425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21933425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21943425bc38SStefano Zampini     ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
21953425bc38SStefano Zampini     /* diagonal scaling */
21963425bc38SStefano Zampini     ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr);
21973425bc38SStefano Zampini     /* sum on the interface */
21983425bc38SStefano Zampini     ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
21993425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
22003425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
22013425bc38SStefano Zampini     ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
22023425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
22033425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
22043425bc38SStefano Zampini     ierr = VecNorm(pcis->vec1_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
22053425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"E[coll]: CHECK infty norm of R^T_D P_D: % 1.14e\n",scalar_value);CHKERRQ(ierr);
22063425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
22073425bc38SStefano Zampini 
22083425bc38SStefano Zampini     if (!fully_redundant) {
22093425bc38SStefano Zampini       /******************************************************************/
22103425bc38SStefano Zampini       /* TEST F: It should holds B_{delta}B^T_{D,delta}=I               */
22113425bc38SStefano Zampini       /* Corollary thm 14 Mandel Tezaur and Dohrmann 2005               */
22123425bc38SStefano Zampini       /******************************************************************/
22133425bc38SStefano Zampini       ierr = VecDuplicate(lambda_global,&test_vec);CHKERRQ(ierr);
22143425bc38SStefano Zampini       ierr = VecSetRandom(lambda_global,PETSC_NULL);CHKERRQ(ierr);
22153425bc38SStefano Zampini       /* Action of B_Ddelta^T */
22163425bc38SStefano Zampini       ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
22173425bc38SStefano Zampini       ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
22183425bc38SStefano Zampini       ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
22193425bc38SStefano Zampini       /* Action of B_delta */
22203425bc38SStefano Zampini       ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
22213425bc38SStefano Zampini       ierr = VecSet(test_vec,0.0);CHKERRQ(ierr);
22223425bc38SStefano Zampini       ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,test_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
22233425bc38SStefano Zampini       ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,test_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
22243425bc38SStefano Zampini       scalar_value = -1.0;
22253425bc38SStefano Zampini       ierr = VecAXPY(lambda_global,scalar_value,test_vec);CHKERRQ(ierr);
22263425bc38SStefano Zampini       ierr = VecNorm(lambda_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
22273425bc38SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"E[coll]: CHECK infty norm of P^T_D - I: % 1.14e\n",scalar_value);CHKERRQ(ierr);
22283425bc38SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
22293425bc38SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
22303425bc38SStefano Zampini       ierr = VecDestroy(&test_vec);CHKERRQ(ierr);
22313425bc38SStefano Zampini     }
22323425bc38SStefano Zampini   }
22333425bc38SStefano Zampini   /* final cleanup */
22343425bc38SStefano Zampini   ierr = PetscFree(vertex_indices);CHKERRQ(ierr);
22353425bc38SStefano Zampini   ierr = VecDestroy(&lambda_global);CHKERRQ(ierr);
22363425bc38SStefano Zampini 
22373425bc38SStefano Zampini   PetscFunctionReturn(0);
22383425bc38SStefano Zampini }
22393425bc38SStefano Zampini 
22403425bc38SStefano Zampini #undef __FUNCT__
22413425bc38SStefano Zampini #define __FUNCT__ "PCBDDCSetupFETIDPPCContext"
22423425bc38SStefano Zampini static PetscErrorCode PCBDDCSetupFETIDPPCContext(Mat fetimat, FETIDPPC_ctx *fetidppc_ctx)
22433425bc38SStefano Zampini {
22443425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
22453425bc38SStefano Zampini   PetscErrorCode ierr;
22463425bc38SStefano Zampini 
22473425bc38SStefano Zampini   PetscFunctionBegin;
22483425bc38SStefano Zampini   ierr = MatShellGetContext(fetimat,&mat_ctx);CHKERRQ(ierr);
22493425bc38SStefano Zampini   /* get references from objects created when setting up feti mat context */
22503425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)mat_ctx->lambda_local);CHKERRQ(ierr);
22513425bc38SStefano Zampini   fetidppc_ctx->lambda_local = mat_ctx->lambda_local;
22523425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)mat_ctx->B_Ddelta);CHKERRQ(ierr);
22533425bc38SStefano Zampini   fetidppc_ctx->B_Ddelta = mat_ctx->B_Ddelta;
22543425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)mat_ctx->l2g_lambda);CHKERRQ(ierr);
22553425bc38SStefano Zampini   fetidppc_ctx->l2g_lambda = mat_ctx->l2g_lambda;
22563425bc38SStefano Zampini   PetscFunctionReturn(0);
22573425bc38SStefano Zampini }
22583425bc38SStefano Zampini 
22593425bc38SStefano Zampini #undef __FUNCT__
22603425bc38SStefano Zampini #define __FUNCT__ "FETIDPMatMult"
22613425bc38SStefano Zampini static PetscErrorCode FETIDPMatMult(Mat fetimat, Vec x, Vec y)
22623425bc38SStefano Zampini {
22633425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
22643425bc38SStefano Zampini   PC_IS          *pcis;
22653425bc38SStefano Zampini   PetscErrorCode ierr;
22663425bc38SStefano Zampini 
22673425bc38SStefano Zampini   PetscFunctionBegin;
22683425bc38SStefano Zampini   ierr = MatShellGetContext(fetimat,&mat_ctx);CHKERRQ(ierr);
22693425bc38SStefano Zampini   pcis = (PC_IS*)mat_ctx->pc->data;
22703425bc38SStefano Zampini   /* Application of B_delta^T */
22713425bc38SStefano Zampini   ierr = VecScatterBegin(mat_ctx->l2g_lambda,x,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
22723425bc38SStefano Zampini   ierr = VecScatterEnd(mat_ctx->l2g_lambda,x,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
22733425bc38SStefano Zampini   ierr = MatMultTranspose(mat_ctx->B_delta,mat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
22743425bc38SStefano Zampini   /* Application of \widetilde{S}^-1 */
22753425bc38SStefano Zampini   ierr = VecSet(pcis->vec1_D,0.0);CHKERRQ(ierr);
22763425bc38SStefano Zampini   ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr);
22773425bc38SStefano Zampini   /* Application of B_delta */
22783425bc38SStefano Zampini   ierr = MatMult(mat_ctx->B_delta,pcis->vec1_B,mat_ctx->lambda_local);CHKERRQ(ierr);
22793425bc38SStefano Zampini   ierr = VecSet(y,0.0);CHKERRQ(ierr);
22803425bc38SStefano Zampini   ierr = VecScatterBegin(mat_ctx->l2g_lambda,mat_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
22813425bc38SStefano Zampini   ierr = VecScatterEnd(mat_ctx->l2g_lambda,mat_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
22823425bc38SStefano Zampini   PetscFunctionReturn(0);
22833425bc38SStefano Zampini }
22843425bc38SStefano Zampini 
22853425bc38SStefano Zampini #undef __FUNCT__
22863425bc38SStefano Zampini #define __FUNCT__ "FETIDPPCApply"
22873425bc38SStefano Zampini static PetscErrorCode FETIDPPCApply(PC fetipc, Vec x, Vec y)
22883425bc38SStefano Zampini {
22893425bc38SStefano Zampini   FETIDPPC_ctx   *pc_ctx;
22903425bc38SStefano Zampini   PC_IS          *pcis;
22913425bc38SStefano Zampini   PetscErrorCode ierr;
22923425bc38SStefano Zampini 
22933425bc38SStefano Zampini   PetscFunctionBegin;
22943425bc38SStefano Zampini   ierr = PCShellGetContext(fetipc,(void**)&pc_ctx);
22953425bc38SStefano Zampini   pcis = (PC_IS*)pc_ctx->pc->data;
22963425bc38SStefano Zampini   /* Application of B_Ddelta^T */
22973425bc38SStefano Zampini   ierr = VecScatterBegin(pc_ctx->l2g_lambda,x,pc_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
22983425bc38SStefano Zampini   ierr = VecScatterEnd(pc_ctx->l2g_lambda,x,pc_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
22993425bc38SStefano Zampini   ierr = VecSet(pcis->vec2_B,0.0);CHKERRQ(ierr);
23003425bc38SStefano Zampini   ierr = MatMultTranspose(pc_ctx->B_Ddelta,pc_ctx->lambda_local,pcis->vec2_B);CHKERRQ(ierr);
23013425bc38SStefano Zampini   /* Application of S */
23023425bc38SStefano Zampini   ierr = PCISApplySchur(pc_ctx->pc,pcis->vec2_B,pcis->vec1_B,(Vec)0,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
23033425bc38SStefano Zampini   /* Application of B_Ddelta */
23043425bc38SStefano Zampini   ierr = MatMult(pc_ctx->B_Ddelta,pcis->vec1_B,pc_ctx->lambda_local);CHKERRQ(ierr);
23053425bc38SStefano Zampini   ierr = VecSet(y,0.0);CHKERRQ(ierr);
23063425bc38SStefano Zampini   ierr = VecScatterBegin(pc_ctx->l2g_lambda,pc_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
23073425bc38SStefano Zampini   ierr = VecScatterEnd(pc_ctx->l2g_lambda,pc_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
23083425bc38SStefano Zampini   PetscFunctionReturn(0);
23093425bc38SStefano Zampini }
23103425bc38SStefano Zampini 
2311da1bb401SStefano Zampini #undef __FUNCT__
2312da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetupLocalAdjacencyGraph"
2313da1bb401SStefano Zampini static PetscErrorCode PCBDDCSetupLocalAdjacencyGraph(PC pc)
2314da1bb401SStefano Zampini {
2315da1bb401SStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
2316da1bb401SStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
23171a83f524SJed Brown   PetscInt       nvtxs;
23181a83f524SJed Brown   const PetscInt *xadj,*adjncy;
2319da1bb401SStefano Zampini   Mat            mat_adj;
2320da1bb401SStefano Zampini   PetscBool      symmetrize_rowij=PETSC_TRUE,compressed_rowij=PETSC_FALSE,flg_row=PETSC_TRUE;
2321da1bb401SStefano Zampini   PCBDDCGraph    mat_graph=pcbddc->mat_graph;
2322da1bb401SStefano Zampini   PetscErrorCode ierr;
2323da1bb401SStefano Zampini 
2324da1bb401SStefano Zampini   PetscFunctionBegin;
2325da1bb401SStefano Zampini   /* get CSR adjacency from local matrix if user has not yet provided local graph using PCBDDCSetLocalAdjacencyGraph function */
2326da1bb401SStefano Zampini   if (!mat_graph->xadj) {
2327da1bb401SStefano Zampini     ierr = MatConvert(matis->A,MATMPIADJ,MAT_INITIAL_MATRIX,&mat_adj);CHKERRQ(ierr);
2328da1bb401SStefano Zampini     ierr = MatGetRowIJ(mat_adj,0,symmetrize_rowij,compressed_rowij,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr);
2329da1bb401SStefano Zampini     if (!flg_row) {
2330da1bb401SStefano Zampini       SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in MatGetRowIJ called in %s\n",__FUNCT__);
2331da1bb401SStefano Zampini     }
2332da1bb401SStefano Zampini     /* Get adjacency into BDDC workspace */
2333da1bb401SStefano Zampini     ierr = PCBDDCSetLocalAdjacencyGraph(pc,nvtxs,xadj,adjncy,PETSC_COPY_VALUES);CHKERRQ(ierr);
2334da1bb401SStefano Zampini     ierr = MatRestoreRowIJ(mat_adj,0,symmetrize_rowij,compressed_rowij,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr);
2335da1bb401SStefano Zampini     if (!flg_row) {
2336da1bb401SStefano Zampini       SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in MatRestoreRowIJ called in %s\n",__FUNCT__);
2337da1bb401SStefano Zampini     }
2338da1bb401SStefano Zampini     ierr = MatDestroy(&mat_adj);CHKERRQ(ierr);
2339da1bb401SStefano Zampini   }
2340da1bb401SStefano Zampini   PetscFunctionReturn(0);
2341da1bb401SStefano Zampini }
2342da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
23430c7d97c5SJed Brown #undef __FUNCT__
23440c7d97c5SJed Brown #define __FUNCT__ "PCBDDCApplyInterfacePreconditioner"
23452617d88aSStefano Zampini static PetscErrorCode  PCBDDCApplyInterfacePreconditioner(PC pc)
23460c7d97c5SJed Brown {
23470c7d97c5SJed Brown   PetscErrorCode ierr;
23480c7d97c5SJed Brown   PC_BDDC*        pcbddc = (PC_BDDC*)(pc->data);
23490c7d97c5SJed Brown   PC_IS*            pcis = (PC_IS*)  (pc->data);
23503b03a366Sstefano_zampini   const PetscScalar zero = 0.0;
23510c7d97c5SJed Brown 
23520c7d97c5SJed Brown   PetscFunctionBegin;
23530c7d97c5SJed Brown   /* Application of PHI^T  */
23540c7d97c5SJed Brown   ierr = MatMultTranspose(pcbddc->coarse_phi_B,pcis->vec1_B,pcbddc->vec1_P);CHKERRQ(ierr);
235529622bf0SStefano Zampini   if (pcbddc->inexact_prec_type) { ierr = MatMultTransposeAdd(pcbddc->coarse_phi_D,pcis->vec1_D,pcbddc->vec1_P,pcbddc->vec1_P);CHKERRQ(ierr); }
23560c7d97c5SJed Brown 
23570c7d97c5SJed Brown   /* Scatter data of coarse_rhs */
2358142dfd88SStefano Zampini   if (pcbddc->coarse_rhs) { ierr = VecSet(pcbddc->coarse_rhs,zero);CHKERRQ(ierr); }
23590c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->vec1_P,pcbddc->coarse_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
23600c7d97c5SJed Brown 
23610c7d97c5SJed Brown   /* Local solution on R nodes */
23620c7d97c5SJed Brown   ierr = VecSet(pcbddc->vec1_R,zero);CHKERRQ(ierr);
23630c7d97c5SJed Brown   ierr = VecScatterBegin(pcbddc->R_to_B,pcis->vec1_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
23640c7d97c5SJed Brown   ierr = VecScatterEnd  (pcbddc->R_to_B,pcis->vec1_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
236529622bf0SStefano Zampini   if (pcbddc->inexact_prec_type) {
23660c7d97c5SJed Brown     ierr = VecScatterBegin(pcbddc->R_to_D,pcis->vec1_D,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
23670c7d97c5SJed Brown     ierr = VecScatterEnd  (pcbddc->R_to_D,pcis->vec1_D,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
23680c7d97c5SJed Brown   }
23690c7d97c5SJed Brown   ierr = PCBDDCSolveSaddlePoint(pc);CHKERRQ(ierr);
23700c7d97c5SJed Brown   ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr);
23710c7d97c5SJed Brown   ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec2_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
23720c7d97c5SJed Brown   ierr = VecScatterEnd  (pcbddc->R_to_B,pcbddc->vec2_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
237329622bf0SStefano Zampini   if (pcbddc->inexact_prec_type) {
23740c7d97c5SJed Brown     ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec2_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
23750c7d97c5SJed Brown     ierr = VecScatterEnd  (pcbddc->R_to_D,pcbddc->vec2_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
23760c7d97c5SJed Brown   }
23770c7d97c5SJed Brown 
23780c7d97c5SJed Brown   /* Coarse solution */
23790c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataEnd(pc,pcbddc->vec1_P,pcbddc->coarse_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
23800bdf917eSStefano Zampini   if (pcbddc->coarse_rhs) {
23810bdf917eSStefano Zampini     if (pcbddc->CoarseNullSpace) {
23820bdf917eSStefano Zampini       ierr = MatNullSpaceRemove(pcbddc->CoarseNullSpace,pcbddc->coarse_rhs,PETSC_NULL);CHKERRQ(ierr);
23830bdf917eSStefano Zampini     }
23840bdf917eSStefano Zampini     ierr = KSPSolve(pcbddc->coarse_ksp,pcbddc->coarse_rhs,pcbddc->coarse_vec);CHKERRQ(ierr);
23850bdf917eSStefano Zampini     if (pcbddc->CoarseNullSpace) {
23860bdf917eSStefano Zampini       ierr = MatNullSpaceRemove(pcbddc->CoarseNullSpace,pcbddc->coarse_vec,PETSC_NULL);CHKERRQ(ierr);
23870bdf917eSStefano Zampini     }
23880bdf917eSStefano Zampini   }
23890c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
23900c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataEnd  (pc,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
23910c7d97c5SJed Brown 
23920c7d97c5SJed Brown   /* Sum contributions from two levels */
23930c7d97c5SJed Brown   ierr = MatMultAdd(pcbddc->coarse_phi_B,pcbddc->vec1_P,pcis->vec1_B,pcis->vec1_B);CHKERRQ(ierr);
239429622bf0SStefano Zampini   if (pcbddc->inexact_prec_type) { ierr = MatMultAdd(pcbddc->coarse_phi_D,pcbddc->vec1_P,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); }
23950c7d97c5SJed Brown   PetscFunctionReturn(0);
23960c7d97c5SJed Brown }
23970c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
23980c7d97c5SJed Brown #undef __FUNCT__
23990c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSolveSaddlePoint"
240053cdbc3dSStefano Zampini static PetscErrorCode  PCBDDCSolveSaddlePoint(PC pc)
24010c7d97c5SJed Brown {
24020c7d97c5SJed Brown   PetscErrorCode ierr;
24030c7d97c5SJed Brown   PC_BDDC*       pcbddc = (PC_BDDC*)(pc->data);
24040c7d97c5SJed Brown 
24050c7d97c5SJed Brown   PetscFunctionBegin;
240653cdbc3dSStefano Zampini   ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
2407534831adSStefano Zampini   if (pcbddc->local_auxmat1) {
24080c7d97c5SJed Brown     ierr = MatMult(pcbddc->local_auxmat1,pcbddc->vec2_R,pcbddc->vec1_C);CHKERRQ(ierr);
24090c7d97c5SJed Brown     ierr = MatMultAdd(pcbddc->local_auxmat2,pcbddc->vec1_C,pcbddc->vec2_R,pcbddc->vec2_R);CHKERRQ(ierr);
24100c7d97c5SJed Brown   }
24110c7d97c5SJed Brown   PetscFunctionReturn(0);
24120c7d97c5SJed Brown }
24130c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
24140c7d97c5SJed Brown #undef __FUNCT__
24150c7d97c5SJed Brown #define __FUNCT__ "PCBDDCScatterCoarseDataBegin"
241653cdbc3dSStefano Zampini static PetscErrorCode  PCBDDCScatterCoarseDataBegin(PC pc,Vec vec_from, Vec vec_to, InsertMode imode, ScatterMode smode)
24170c7d97c5SJed Brown {
24180c7d97c5SJed Brown   PetscErrorCode ierr;
24190c7d97c5SJed Brown   PC_BDDC*       pcbddc = (PC_BDDC*)(pc->data);
24200c7d97c5SJed Brown 
24210c7d97c5SJed Brown   PetscFunctionBegin;
24220c7d97c5SJed Brown   switch(pcbddc->coarse_communications_type){
24230c7d97c5SJed Brown     case SCATTERS_BDDC:
24240c7d97c5SJed Brown       ierr = VecScatterBegin(pcbddc->coarse_loc_to_glob,vec_from,vec_to,imode,smode);CHKERRQ(ierr);
24250c7d97c5SJed Brown       break;
24260c7d97c5SJed Brown     case GATHERS_BDDC:
24270c7d97c5SJed Brown       break;
24280c7d97c5SJed Brown   }
24290c7d97c5SJed Brown   PetscFunctionReturn(0);
24300c7d97c5SJed Brown }
24310c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
24320c7d97c5SJed Brown #undef __FUNCT__
24330c7d97c5SJed Brown #define __FUNCT__ "PCBDDCScatterCoarseDataEnd"
243453cdbc3dSStefano Zampini static PetscErrorCode  PCBDDCScatterCoarseDataEnd(PC pc,Vec vec_from, Vec vec_to, InsertMode imode, ScatterMode smode)
24350c7d97c5SJed Brown {
24360c7d97c5SJed Brown   PetscErrorCode ierr;
24370c7d97c5SJed Brown   PC_BDDC*       pcbddc = (PC_BDDC*)(pc->data);
24380c7d97c5SJed Brown   PetscScalar*   array_to;
24390c7d97c5SJed Brown   PetscScalar*   array_from;
24400c7d97c5SJed Brown   MPI_Comm       comm=((PetscObject)pc)->comm;
24410c7d97c5SJed Brown   PetscInt i;
24420c7d97c5SJed Brown 
24430c7d97c5SJed Brown   PetscFunctionBegin;
24440c7d97c5SJed Brown 
24450c7d97c5SJed Brown   switch(pcbddc->coarse_communications_type){
24460c7d97c5SJed Brown     case SCATTERS_BDDC:
24470c7d97c5SJed Brown       ierr = VecScatterEnd(pcbddc->coarse_loc_to_glob,vec_from,vec_to,imode,smode);CHKERRQ(ierr);
24480c7d97c5SJed Brown       break;
24490c7d97c5SJed Brown     case GATHERS_BDDC:
24500c7d97c5SJed Brown       if (vec_from) VecGetArray(vec_from,&array_from);
24510c7d97c5SJed Brown       if (vec_to)   VecGetArray(vec_to,&array_to);
24520c7d97c5SJed Brown       switch(pcbddc->coarse_problem_type){
24530c7d97c5SJed Brown         case SEQUENTIAL_BDDC:
24540c7d97c5SJed Brown           if (smode == SCATTER_FORWARD) {
245553cdbc3dSStefano Zampini             ierr = MPI_Gatherv(&array_from[0],pcbddc->local_primal_size,MPIU_SCALAR,&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,0,comm);CHKERRQ(ierr);
24560c7d97c5SJed Brown             if (vec_to) {
24570bdf917eSStefano Zampini               if (imode == ADD_VALUES) {
24580bdf917eSStefano Zampini                 for (i=0;i<pcbddc->replicated_primal_size;i++) {
24590c7d97c5SJed Brown                   array_to[pcbddc->replicated_local_primal_indices[i]]+=pcbddc->replicated_local_primal_values[i];
24600c7d97c5SJed Brown                 }
24610c7d97c5SJed Brown               } else {
24620bdf917eSStefano Zampini                 for (i=0;i<pcbddc->replicated_primal_size;i++) {
24630bdf917eSStefano Zampini                   array_to[pcbddc->replicated_local_primal_indices[i]]=pcbddc->replicated_local_primal_values[i];
24640bdf917eSStefano Zampini                 }
24650bdf917eSStefano Zampini               }
24660bdf917eSStefano Zampini             }
24670bdf917eSStefano Zampini           } else {
24680bdf917eSStefano Zampini             if (vec_from) {
24690bdf917eSStefano Zampini               if (imode == ADD_VALUES) {
24700bdf917eSStefano Zampini                 printf("Scatter mode %d, insert mode %d for case %d not implemented!\n",smode,imode,pcbddc->coarse_problem_type);
24710bdf917eSStefano Zampini               }
24720bdf917eSStefano Zampini               for (i=0;i<pcbddc->replicated_primal_size;i++) {
24730c7d97c5SJed Brown                 pcbddc->replicated_local_primal_values[i]=array_from[pcbddc->replicated_local_primal_indices[i]];
24740bdf917eSStefano Zampini               }
24750bdf917eSStefano Zampini             }
247653cdbc3dSStefano Zampini             ierr = MPI_Scatterv(&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,&array_to[0],pcbddc->local_primal_size,MPIU_SCALAR,0,comm);CHKERRQ(ierr);
24770c7d97c5SJed Brown           }
24780c7d97c5SJed Brown           break;
24790c7d97c5SJed Brown         case REPLICATED_BDDC:
24800c7d97c5SJed Brown           if (smode == SCATTER_FORWARD) {
248153cdbc3dSStefano Zampini             ierr = MPI_Allgatherv(&array_from[0],pcbddc->local_primal_size,MPIU_SCALAR,&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,comm);CHKERRQ(ierr);
24820bdf917eSStefano Zampini             if (imode == ADD_VALUES) {
24830bdf917eSStefano Zampini               for (i=0;i<pcbddc->replicated_primal_size;i++) {
24840c7d97c5SJed Brown                 array_to[pcbddc->replicated_local_primal_indices[i]]+=pcbddc->replicated_local_primal_values[i];
24850bdf917eSStefano Zampini               }
24860bdf917eSStefano Zampini             } else {
24870bdf917eSStefano Zampini               for (i=0;i<pcbddc->replicated_primal_size;i++) {
24880bdf917eSStefano Zampini                 array_to[pcbddc->replicated_local_primal_indices[i]]=pcbddc->replicated_local_primal_values[i];
24890bdf917eSStefano Zampini               }
24900bdf917eSStefano Zampini             }
24910c7d97c5SJed Brown           } else { /* no communications needed for SCATTER_REVERSE since needed data is already present */
24920bdf917eSStefano Zampini             if (imode == ADD_VALUES) {
24930bdf917eSStefano Zampini               for (i=0;i<pcbddc->local_primal_size;i++) {
24940bdf917eSStefano Zampini                 array_to[i]+=array_from[pcbddc->local_primal_indices[i]];
24950bdf917eSStefano Zampini               }
24960bdf917eSStefano Zampini             } else {
24970bdf917eSStefano Zampini               for (i=0;i<pcbddc->local_primal_size;i++) {
24980c7d97c5SJed Brown                 array_to[i]=array_from[pcbddc->local_primal_indices[i]];
24990c7d97c5SJed Brown               }
25000bdf917eSStefano Zampini             }
25010bdf917eSStefano Zampini           }
25020c7d97c5SJed Brown           break;
250353cdbc3dSStefano Zampini         case MULTILEVEL_BDDC:
250453cdbc3dSStefano Zampini           break;
250553cdbc3dSStefano Zampini         case PARALLEL_BDDC:
250653cdbc3dSStefano Zampini           break;
25070c7d97c5SJed Brown       }
25080c7d97c5SJed Brown       if (vec_from) VecRestoreArray(vec_from,&array_from);
25090c7d97c5SJed Brown       if (vec_to)   VecRestoreArray(vec_to,&array_to);
25100c7d97c5SJed Brown       break;
25110c7d97c5SJed Brown   }
25120c7d97c5SJed Brown   PetscFunctionReturn(0);
25130c7d97c5SJed Brown }
25140c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
25153b03a366Sstefano_zampini #undef __FUNCT__
25163b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCCreateConstraintMatrix"
25173b03a366Sstefano_zampini static PetscErrorCode PCBDDCCreateConstraintMatrix(PC pc)
25183b03a366Sstefano_zampini {
25193b03a366Sstefano_zampini   PetscErrorCode ierr;
25203b03a366Sstefano_zampini   PC_IS*         pcis = (PC_IS*)(pc->data);
25213b03a366Sstefano_zampini   PC_BDDC*       pcbddc = (PC_BDDC*)pc->data;
25223b03a366Sstefano_zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
252323d4d1a5SStefano Zampini   PetscInt       *nnz,*is_indices;
25243b03a366Sstefano_zampini   PetscScalar    *temp_quadrature_constraint;
2525534831adSStefano Zampini   PetscInt       *temp_indices,*temp_indices_to_constraint,*temp_indices_to_constraint_B,*local_to_B;
25263b03a366Sstefano_zampini   PetscInt       local_primal_size,i,j,k,total_counts,max_size_of_constraint;
25273b03a366Sstefano_zampini   PetscInt       n_constraints,n_vertices,size_of_constraint;
2528534831adSStefano Zampini   PetscScalar    quad_value;
25293b03a366Sstefano_zampini   PetscBool      nnsp_has_cnst=PETSC_FALSE,use_nnsp_true=pcbddc->use_nnsp_true;
25303b03a366Sstefano_zampini   PetscInt       nnsp_size=0,nnsp_addone=0,temp_constraints,temp_start_ptr;
25313b03a366Sstefano_zampini   IS             *used_IS;
253219fd82e9SBarry Smith   MatType        impMatType=MATSEQAIJ;
25333b03a366Sstefano_zampini   PetscBLASInt   Bs,Bt,lwork,lierr;
25343b03a366Sstefano_zampini   PetscReal      tol=1.0e-8;
2535fcda91b4SJed Brown   MatNullSpace   nearnullsp;
2536fcda91b4SJed Brown   const Vec      *nearnullvecs;
25373b03a366Sstefano_zampini   Vec            *localnearnullsp;
25383b03a366Sstefano_zampini   PetscScalar    *work,*temp_basis,*array_vector,*correlation_mat;
25393b03a366Sstefano_zampini   PetscReal      *rwork,*singular_vals;
2540534831adSStefano Zampini   PetscBLASInt   Bone=1,*ipiv;
2541534831adSStefano Zampini   Vec            temp_vec;
2542534831adSStefano Zampini   Mat            temp_mat;
2543534831adSStefano Zampini   KSP            temp_ksp;
2544ffe5efe1SStefano Zampini   PC             temp_pc;
2545534831adSStefano Zampini   PetscInt       s,start_constraint,dual_dofs;
2546534831adSStefano Zampini   PetscBool      compute_submatrix,useksp=PETSC_FALSE;
2547534831adSStefano Zampini   PetscInt       *aux_primal_permutation,*aux_primal_numbering;
2548534831adSStefano Zampini   PetscBool      boolforface,*change_basis;
2549de534f79Sstefano_zampini /* some ugly conditional declarations */
25503b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
25513b03a366Sstefano_zampini   PetscScalar    dot_result;
25523b03a366Sstefano_zampini   PetscScalar    one=1.0,zero=0.0;
25533b03a366Sstefano_zampini   PetscInt       ii;
25543425bc38SStefano Zampini   PetscScalar    *singular_vectors;
25553425bc38SStefano Zampini   PetscBLASInt   *iwork,*ifail;
25563425bc38SStefano Zampini   PetscReal      dummy_real,abs_tol;
25573425bc38SStefano Zampini   PetscBLASInt   eigs_found;
25583b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
25593b03a366Sstefano_zampini   PetscScalar    val1,val2;
25603b03a366Sstefano_zampini #endif
25613425bc38SStefano Zampini #endif
25623b03a366Sstefano_zampini   PetscBLASInt   dummy_int;
25633b03a366Sstefano_zampini   PetscScalar    dummy_scalar;
25643b03a366Sstefano_zampini 
25653b03a366Sstefano_zampini   PetscFunctionBegin;
25663b03a366Sstefano_zampini   /* check if near null space is attached to global mat */
2567fcda91b4SJed Brown   ierr = MatGetNearNullSpace(pc->pmat,&nearnullsp);CHKERRQ(ierr);
2568fcda91b4SJed Brown   if (nearnullsp) {
2569fcda91b4SJed Brown     ierr = MatNullSpaceGetVecs(nearnullsp,&nnsp_has_cnst,&nnsp_size,&nearnullvecs);CHKERRQ(ierr);
25703b03a366Sstefano_zampini   } else { /* if near null space is not provided it uses constants */
25713b03a366Sstefano_zampini     nnsp_has_cnst = PETSC_TRUE;
25723b03a366Sstefano_zampini     use_nnsp_true = PETSC_TRUE;
25733b03a366Sstefano_zampini   }
25743b03a366Sstefano_zampini   if (nnsp_has_cnst) {
25753b03a366Sstefano_zampini     nnsp_addone = 1;
25763b03a366Sstefano_zampini   }
25773b03a366Sstefano_zampini   /*
25783b03a366Sstefano_zampini        Evaluate maximum storage size needed by the procedure
25793b03a366Sstefano_zampini        - temp_indices will contain start index of each constraint stored as follows
25803b03a366Sstefano_zampini        - temp_indices_to_constraint  [temp_indices[i],...,temp_indices[i+1]-1] will contain the indices (in local numbering) on which the constraint acts
2581534831adSStefano Zampini        - temp_indices_to_constraint_B[temp_indices[i],...,temp_indices[i+1]-1] will contain the indices (in boundary numbering) on which the constraint acts
25823b03a366Sstefano_zampini        - temp_quadrature_constraint  [temp_indices[i],...,temp_indices[i+1]-1] will contain the scalars representing the constraint itself
25833b03a366Sstefano_zampini                                                                                                                                                          */
2584da1bb401SStefano Zampini 
25853b03a366Sstefano_zampini   total_counts = pcbddc->n_ISForFaces+pcbddc->n_ISForEdges;
25863b03a366Sstefano_zampini   total_counts *= (nnsp_addone+nnsp_size);
2587da1bb401SStefano Zampini   ierr = ISGetSize(pcbddc->ISForVertices,&n_vertices);CHKERRQ(ierr);
2588da1bb401SStefano Zampini   total_counts += n_vertices;
25893b03a366Sstefano_zampini   ierr = PetscMalloc((total_counts+1)*sizeof(PetscInt),&temp_indices);CHKERRQ(ierr);
2590534831adSStefano Zampini   ierr = PetscMalloc((total_counts+1)*sizeof(PetscBool),&change_basis);CHKERRQ(ierr);
25913b03a366Sstefano_zampini   total_counts = 0;
25923b03a366Sstefano_zampini   max_size_of_constraint = 0;
25933b03a366Sstefano_zampini   for (i=0;i<pcbddc->n_ISForEdges+pcbddc->n_ISForFaces;i++){
25943b03a366Sstefano_zampini     if (i<pcbddc->n_ISForEdges){
25953b03a366Sstefano_zampini       used_IS = &pcbddc->ISForEdges[i];
25963b03a366Sstefano_zampini     } else {
25973b03a366Sstefano_zampini       used_IS = &pcbddc->ISForFaces[i-pcbddc->n_ISForEdges];
25983b03a366Sstefano_zampini     }
25993b03a366Sstefano_zampini     ierr = ISGetSize(*used_IS,&j);CHKERRQ(ierr);
26003b03a366Sstefano_zampini     total_counts += j;
26013b03a366Sstefano_zampini     if (j>max_size_of_constraint) max_size_of_constraint=j;
26023b03a366Sstefano_zampini   }
26033b03a366Sstefano_zampini   total_counts *= (nnsp_addone+nnsp_size);
2604da1bb401SStefano Zampini   total_counts += n_vertices;
26053b03a366Sstefano_zampini   ierr = PetscMalloc(total_counts*sizeof(PetscScalar),&temp_quadrature_constraint);CHKERRQ(ierr);
26063b03a366Sstefano_zampini   ierr = PetscMalloc(total_counts*sizeof(PetscInt),&temp_indices_to_constraint);CHKERRQ(ierr);
2607534831adSStefano Zampini   ierr = PetscMalloc(total_counts*sizeof(PetscInt),&temp_indices_to_constraint_B);CHKERRQ(ierr);
2608534831adSStefano Zampini   ierr = PetscMalloc(pcis->n*sizeof(PetscInt),&local_to_B);CHKERRQ(ierr);
2609534831adSStefano Zampini   ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2610534831adSStefano Zampini   for (i=0;i<pcis->n;i++) {
2611534831adSStefano Zampini     local_to_B[i]=-1;
2612534831adSStefano Zampini   }
2613534831adSStefano Zampini   for (i=0;i<pcis->n_B;i++) {
2614534831adSStefano Zampini     local_to_B[is_indices[i]]=i;
2615534831adSStefano Zampini   }
2616534831adSStefano Zampini   ierr = ISRestoreIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2617534831adSStefano Zampini 
26183b03a366Sstefano_zampini   /* First we issue queries to allocate optimal workspace for LAPACKgesvd or LAPACKsyev/LAPACKheev */
26193b03a366Sstefano_zampini   rwork = 0;
26203b03a366Sstefano_zampini   work = 0;
26213b03a366Sstefano_zampini   singular_vals = 0;
26223b03a366Sstefano_zampini   temp_basis = 0;
26233b03a366Sstefano_zampini   correlation_mat = 0;
26243b03a366Sstefano_zampini   if (!pcbddc->use_nnsp_true) {
26253b03a366Sstefano_zampini     PetscScalar temp_work;
26263b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
26273b03a366Sstefano_zampini     /* POD */
26283b03a366Sstefano_zampini     PetscInt max_n;
26293b03a366Sstefano_zampini     max_n = nnsp_addone+nnsp_size;
26303b03a366Sstefano_zampini     /* using some techniques borrowed from Proper Orthogonal Decomposition */
26313b03a366Sstefano_zampini     ierr = PetscMalloc(max_n*max_n*sizeof(PetscScalar),&correlation_mat);CHKERRQ(ierr);
26323425bc38SStefano Zampini     ierr = PetscMalloc(max_n*max_n*sizeof(PetscScalar),&singular_vectors);CHKERRQ(ierr);
26333b03a366Sstefano_zampini     ierr = PetscMalloc(max_n*sizeof(PetscReal),&singular_vals);CHKERRQ(ierr);
26343b03a366Sstefano_zampini     ierr = PetscMalloc(max_size_of_constraint*(nnsp_addone+nnsp_size)*sizeof(PetscScalar),&temp_basis);CHKERRQ(ierr);
26353b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
26363b03a366Sstefano_zampini     ierr = PetscMalloc(3*max_n*sizeof(PetscReal),&rwork);CHKERRQ(ierr);
26373b03a366Sstefano_zampini #endif
26383425bc38SStefano Zampini     ierr = PetscMalloc(5*max_n*sizeof(PetscBLASInt),&iwork);CHKERRQ(ierr);
26393425bc38SStefano Zampini     ierr = PetscMalloc(max_n*sizeof(PetscBLASInt),&ifail);CHKERRQ(ierr);
26403b03a366Sstefano_zampini     /* now we evaluate the optimal workspace using query with lwork=-1 */
26413b03a366Sstefano_zampini     Bt = PetscBLASIntCast(max_n);
26423b03a366Sstefano_zampini     lwork=-1;
26433425bc38SStefano Zampini     ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
26443b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
26453425bc38SStefano Zampini     abs_tol=1.e-8;
26463425bc38SStefano Zampini /*    LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,&temp_work,&lwork,&lierr); */
26473425bc38SStefano Zampini     LAPACKsyevx_("V","A","U",&Bt,correlation_mat,&Bt,&dummy_real,&dummy_real,&dummy_int,&dummy_int,
26483425bc38SStefano Zampini                  &abs_tol,&eigs_found,singular_vals,singular_vectors,&Bt,&temp_work,&lwork,iwork,ifail,&lierr);
26493b03a366Sstefano_zampini #else
26503425bc38SStefano Zampini /*    LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,&temp_work,&lwork,rwork,&lierr); */
26513425bc38SStefano Zampini /*  LAPACK call is missing here! TODO */
26523425bc38SStefano Zampini     SETERRQ(((PetscObject) pc)->comm, PETSC_ERR_SUP, "Not yet implemented for complexes when PETSC_MISSING_GESVD = 1");
26533b03a366Sstefano_zampini #endif
26543425bc38SStefano Zampini     if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SYEVX Lapack routine %d",(int)lierr);
26553425bc38SStefano Zampini     ierr = PetscFPTrapPop();CHKERRQ(ierr);
26563b03a366Sstefano_zampini #else /* on missing GESVD */
26573b03a366Sstefano_zampini     /* SVD */
26583b03a366Sstefano_zampini     PetscInt max_n,min_n;
26593b03a366Sstefano_zampini     max_n = max_size_of_constraint;
26603b03a366Sstefano_zampini     min_n = nnsp_addone+nnsp_size;
26613b03a366Sstefano_zampini     if (max_size_of_constraint < ( nnsp_addone+nnsp_size ) ) {
26623b03a366Sstefano_zampini       min_n = max_size_of_constraint;
26633b03a366Sstefano_zampini       max_n = nnsp_addone+nnsp_size;
26643b03a366Sstefano_zampini     }
26653b03a366Sstefano_zampini     ierr = PetscMalloc(min_n*sizeof(PetscReal),&singular_vals);CHKERRQ(ierr);
26663b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
26673b03a366Sstefano_zampini     ierr = PetscMalloc(5*min_n*sizeof(PetscReal),&rwork);CHKERRQ(ierr);
26683b03a366Sstefano_zampini #endif
26693b03a366Sstefano_zampini     /* now we evaluate the optimal workspace using query with lwork=-1 */
26703b03a366Sstefano_zampini     lwork=-1;
26713b03a366Sstefano_zampini     Bs = PetscBLASIntCast(max_n);
26723b03a366Sstefano_zampini     Bt = PetscBLASIntCast(min_n);
26733b03a366Sstefano_zampini     dummy_int = Bs;
2674670f3ff9SJed Brown     ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
26753b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
26763b03a366Sstefano_zampini     LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[0],&Bs,singular_vals,
26773b03a366Sstefano_zampini                  &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,&temp_work,&lwork,&lierr);
26783b03a366Sstefano_zampini #else
26793b03a366Sstefano_zampini     LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[0],&Bs,singular_vals,
26803b03a366Sstefano_zampini                  &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,&temp_work,&lwork,rwork,&lierr);
26813b03a366Sstefano_zampini #endif
26823b03a366Sstefano_zampini     if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SVD Lapack routine %d",(int)lierr);
2683670f3ff9SJed Brown     ierr = PetscFPTrapPop();CHKERRQ(ierr);
26843b03a366Sstefano_zampini #endif
26853b03a366Sstefano_zampini     /* Allocate optimal workspace */
26863b03a366Sstefano_zampini     lwork = PetscBLASIntCast((PetscInt)PetscRealPart(temp_work));
26873b03a366Sstefano_zampini     total_counts = (PetscInt)lwork;
26883b03a366Sstefano_zampini     ierr = PetscMalloc(total_counts*sizeof(PetscScalar),&work);CHKERRQ(ierr);
26893b03a366Sstefano_zampini   }
26903b03a366Sstefano_zampini   /* get local part of global near null space vectors */
26913b03a366Sstefano_zampini   ierr = PetscMalloc(nnsp_size*sizeof(Vec),&localnearnullsp);CHKERRQ(ierr);
26923b03a366Sstefano_zampini   for (k=0;k<nnsp_size;k++) {
26933b03a366Sstefano_zampini     ierr = VecDuplicate(pcis->vec1_N,&localnearnullsp[k]);CHKERRQ(ierr);
2694fcda91b4SJed Brown     ierr = VecScatterBegin(matis->ctx,nearnullvecs[k],localnearnullsp[k],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
2695fcda91b4SJed Brown     ierr = VecScatterEnd  (matis->ctx,nearnullvecs[k],localnearnullsp[k],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
26963b03a366Sstefano_zampini   }
26973b03a366Sstefano_zampini   /* Now we can loop on constraining sets */
26983b03a366Sstefano_zampini   total_counts=0;
26993b03a366Sstefano_zampini   temp_indices[0]=0;
2700da1bb401SStefano Zampini   /* vertices */
2701da1bb401SStefano Zampini   PetscBool used_vertex;
2702da1bb401SStefano Zampini   ierr = ISGetIndices(pcbddc->ISForVertices,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2703da1bb401SStefano Zampini   if (nnsp_has_cnst) { /* consider all vertices */
2704da1bb401SStefano Zampini     for (i=0;i<n_vertices;i++) {
2705da1bb401SStefano Zampini       temp_indices_to_constraint[temp_indices[total_counts]]=is_indices[i];
2706534831adSStefano Zampini       temp_indices_to_constraint_B[temp_indices[total_counts]]=local_to_B[is_indices[i]];
2707da1bb401SStefano Zampini       temp_quadrature_constraint[temp_indices[total_counts]]=1.0;
2708da1bb401SStefano Zampini       temp_indices[total_counts+1]=temp_indices[total_counts]+1;
2709534831adSStefano Zampini       change_basis[total_counts]=PETSC_FALSE;
2710da1bb401SStefano Zampini       total_counts++;
2711da1bb401SStefano Zampini     }
2712da1bb401SStefano Zampini   } else { /* consider vertices for which exist at least a localnearnullsp which is not null there */
2713da1bb401SStefano Zampini     for (i=0;i<n_vertices;i++) {
2714da1bb401SStefano Zampini       used_vertex=PETSC_FALSE;
2715da1bb401SStefano Zampini       k=0;
2716da1bb401SStefano Zampini       while(!used_vertex && k<nnsp_size) {
2717da1bb401SStefano Zampini         ierr = VecGetArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
2718da1bb401SStefano Zampini         if (PetscAbsScalar(array_vector[is_indices[i]])>0.0) {
2719da1bb401SStefano Zampini           temp_indices_to_constraint[temp_indices[total_counts]]=is_indices[i];
2720534831adSStefano Zampini           temp_indices_to_constraint_B[temp_indices[total_counts]]=local_to_B[is_indices[i]];
2721da1bb401SStefano Zampini           temp_quadrature_constraint[temp_indices[total_counts]]=1.0;
2722da1bb401SStefano Zampini           temp_indices[total_counts+1]=temp_indices[total_counts]+1;
2723534831adSStefano Zampini           change_basis[total_counts]=PETSC_FALSE;
2724da1bb401SStefano Zampini           total_counts++;
2725da1bb401SStefano Zampini           used_vertex=PETSC_TRUE;
2726da1bb401SStefano Zampini         }
2727da1bb401SStefano Zampini         ierr = VecRestoreArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
2728da1bb401SStefano Zampini         k++;
2729da1bb401SStefano Zampini       }
2730da1bb401SStefano Zampini     }
2731da1bb401SStefano Zampini   }
2732da1bb401SStefano Zampini   ierr = ISRestoreIndices(pcbddc->ISForVertices,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2733da1bb401SStefano Zampini   n_vertices=total_counts;
2734da1bb401SStefano Zampini   /* edges and faces */
27353b03a366Sstefano_zampini   for (i=0;i<pcbddc->n_ISForEdges+pcbddc->n_ISForFaces;i++){
27363b03a366Sstefano_zampini     if (i<pcbddc->n_ISForEdges){
27373b03a366Sstefano_zampini       used_IS = &pcbddc->ISForEdges[i];
2738534831adSStefano Zampini       boolforface = pcbddc->usechangeofbasis;
27393b03a366Sstefano_zampini     } else {
27403b03a366Sstefano_zampini       used_IS = &pcbddc->ISForFaces[i-pcbddc->n_ISForEdges];
2741534831adSStefano Zampini       boolforface = pcbddc->usechangeonfaces;
27423b03a366Sstefano_zampini     }
27433b03a366Sstefano_zampini     temp_constraints = 0;          /* zero the number of constraints I have on this conn comp */
27443b03a366Sstefano_zampini     temp_start_ptr = total_counts; /* need to know the starting index of constraints stored */
27453b03a366Sstefano_zampini     ierr = ISGetSize(*used_IS,&size_of_constraint);CHKERRQ(ierr);
27463b03a366Sstefano_zampini     ierr = ISGetIndices(*used_IS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
27473b03a366Sstefano_zampini     if (nnsp_has_cnst) {
27483b03a366Sstefano_zampini       temp_constraints++;
2749534831adSStefano Zampini       quad_value = (PetscScalar) (1.0/PetscSqrtReal((PetscReal)size_of_constraint));
27503b03a366Sstefano_zampini       for (j=0;j<size_of_constraint;j++) {
27513b03a366Sstefano_zampini         temp_indices_to_constraint[temp_indices[total_counts]+j]=is_indices[j];
2752534831adSStefano Zampini         temp_indices_to_constraint_B[temp_indices[total_counts]+j]=local_to_B[is_indices[j]];
27533b03a366Sstefano_zampini         temp_quadrature_constraint[temp_indices[total_counts]+j]=quad_value;
27543b03a366Sstefano_zampini       }
27553b03a366Sstefano_zampini       temp_indices[total_counts+1]=temp_indices[total_counts]+size_of_constraint;  /* store new starting point */
2756534831adSStefano Zampini       change_basis[total_counts]=boolforface;
27573b03a366Sstefano_zampini       total_counts++;
27583b03a366Sstefano_zampini     }
27593b03a366Sstefano_zampini     for (k=0;k<nnsp_size;k++) {
27603b03a366Sstefano_zampini       ierr = VecGetArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
27613b03a366Sstefano_zampini       for (j=0;j<size_of_constraint;j++) {
27623b03a366Sstefano_zampini         temp_indices_to_constraint[temp_indices[total_counts]+j]=is_indices[j];
2763534831adSStefano Zampini         temp_indices_to_constraint_B[temp_indices[total_counts]+j]=local_to_B[is_indices[j]];
27643b03a366Sstefano_zampini         temp_quadrature_constraint[temp_indices[total_counts]+j]=array_vector[is_indices[j]];
27653b03a366Sstefano_zampini       }
27663b03a366Sstefano_zampini       ierr = VecRestoreArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
2767de534f79Sstefano_zampini       quad_value = 1.0;
2768de534f79Sstefano_zampini       if ( use_nnsp_true ) { /* check if array is null on the connected component in case use_nnsp_true has been requested */
2769de534f79Sstefano_zampini         Bs = PetscBLASIntCast(size_of_constraint);
2770de534f79Sstefano_zampini         quad_value = BLASasum_(&Bs,&temp_quadrature_constraint[temp_indices[total_counts]],&Bone);
2771de534f79Sstefano_zampini       }
2772de534f79Sstefano_zampini       if ( quad_value > 0.0 ) { /* keep indices and values */
2773de534f79Sstefano_zampini         temp_constraints++;
27743b03a366Sstefano_zampini         temp_indices[total_counts+1]=temp_indices[total_counts]+size_of_constraint;  /* store new starting point */
2775534831adSStefano Zampini         change_basis[total_counts]=boolforface;
27763b03a366Sstefano_zampini         total_counts++;
27773b03a366Sstefano_zampini       }
2778de534f79Sstefano_zampini     }
27793b03a366Sstefano_zampini     ierr = ISRestoreIndices(*used_IS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2780de534f79Sstefano_zampini     /* perform SVD on the constraint if use_nnsp_true has not been requested by the user */
27813b03a366Sstefano_zampini     if (!use_nnsp_true) {
2782de534f79Sstefano_zampini 
27833b03a366Sstefano_zampini       Bs = PetscBLASIntCast(size_of_constraint);
27843b03a366Sstefano_zampini       Bt = PetscBLASIntCast(temp_constraints);
2785de534f79Sstefano_zampini 
27863b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
27873b03a366Sstefano_zampini       ierr = PetscMemzero(correlation_mat,Bt*Bt*sizeof(PetscScalar));CHKERRQ(ierr);
27883b03a366Sstefano_zampini       /* Store upper triangular part of correlation matrix */
27893b03a366Sstefano_zampini       for (j=0;j<temp_constraints;j++) {
27903b03a366Sstefano_zampini         for (k=0;k<j+1;k++) {
27913b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
27923425bc38SStefano Zampini           /* hand made complex dot product -> replace */
27933b03a366Sstefano_zampini           dot_result = 0.0;
27943b03a366Sstefano_zampini           for (ii=0; ii<size_of_constraint; ii++) {
27953b03a366Sstefano_zampini             val1 = temp_quadrature_constraint[temp_indices[temp_start_ptr+j]+ii];
27963b03a366Sstefano_zampini             val2 = temp_quadrature_constraint[temp_indices[temp_start_ptr+k]+ii];
27973b03a366Sstefano_zampini             dot_result += val1*PetscConj(val2);
27983b03a366Sstefano_zampini           }
27993b03a366Sstefano_zampini #else
28003b03a366Sstefano_zampini           dot_result = BLASdot_(&Bs,&temp_quadrature_constraint[temp_indices[temp_start_ptr+j]],&Bone,
28013b03a366Sstefano_zampini                                     &temp_quadrature_constraint[temp_indices[temp_start_ptr+k]],&Bone);
28023b03a366Sstefano_zampini #endif
28033b03a366Sstefano_zampini           correlation_mat[j*temp_constraints+k]=dot_result;
28043b03a366Sstefano_zampini         }
28053b03a366Sstefano_zampini       }
28063425bc38SStefano Zampini       ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
28073b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
28083425bc38SStefano Zampini /*      LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,work,&lwork,&lierr); */
28093425bc38SStefano Zampini       LAPACKsyevx_("V","A","U",&Bt,correlation_mat,&Bt,&dummy_real,&dummy_real,&dummy_int,&dummy_int,
28103425bc38SStefano Zampini                  &abs_tol,&eigs_found,singular_vals,singular_vectors,&Bt,work,&lwork,iwork,ifail,&lierr);
28113b03a366Sstefano_zampini #else
28123425bc38SStefano Zampini /*  LAPACK call is missing here! TODO */
28133425bc38SStefano Zampini       SETERRQ(((PetscObject) pc)->comm, PETSC_ERR_SUP, "Not yet implemented for complexes when PETSC_MISSING_GESVD = 1");
28143b03a366Sstefano_zampini #endif
28153425bc38SStefano Zampini       if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYEVX Lapack routine %d",(int)lierr);
28163425bc38SStefano Zampini       ierr = PetscFPTrapPop();CHKERRQ(ierr);
28173b03a366Sstefano_zampini       /* retain eigenvalues greater than tol: note that lapack SYEV gives eigs in ascending order */
28183b03a366Sstefano_zampini       j=0;
28193b03a366Sstefano_zampini       while( j < Bt && singular_vals[j] < tol) j++;
28203b03a366Sstefano_zampini       total_counts=total_counts-j;
28213b03a366Sstefano_zampini       if (j<temp_constraints) {
28223b03a366Sstefano_zampini         for (k=j;k<Bt;k++) { singular_vals[k]=1.0/PetscSqrtReal(singular_vals[k]); }
28233425bc38SStefano Zampini         ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
28243b03a366Sstefano_zampini         BLASgemm_("N","N",&Bs,&Bt,&Bt,&one,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,correlation_mat,&Bt,&zero,temp_basis,&Bs);
28253425bc38SStefano Zampini         ierr = PetscFPTrapPop();CHKERRQ(ierr);
28263b03a366Sstefano_zampini         /* copy POD basis into used quadrature memory */
28273b03a366Sstefano_zampini         for (k=0;k<Bt-j;k++) {
28283b03a366Sstefano_zampini           for (ii=0;ii<size_of_constraint;ii++) {
28293b03a366Sstefano_zampini             temp_quadrature_constraint[temp_indices[temp_start_ptr+k]+ii]=singular_vals[Bt-1-k]*temp_basis[(Bt-1-k)*size_of_constraint+ii];
28303b03a366Sstefano_zampini           }
28313b03a366Sstefano_zampini         }
28323b03a366Sstefano_zampini       }
2833de534f79Sstefano_zampini 
28343b03a366Sstefano_zampini #else  /* on missing GESVD */
28353b03a366Sstefano_zampini       PetscInt min_n = temp_constraints;
28363b03a366Sstefano_zampini       if (min_n > size_of_constraint) min_n = size_of_constraint;
28373b03a366Sstefano_zampini       dummy_int = Bs;
2838670f3ff9SJed Brown       ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
28393b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
28403b03a366Sstefano_zampini       LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,singular_vals,
28413b03a366Sstefano_zampini                    &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,work,&lwork,&lierr);
28423b03a366Sstefano_zampini #else
28433b03a366Sstefano_zampini       LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,singular_vals,
28443b03a366Sstefano_zampini                    &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,work,&lwork,rwork,&lierr);
28453b03a366Sstefano_zampini #endif
28463b03a366Sstefano_zampini       if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SVD Lapack routine %d",(int)lierr);
2847670f3ff9SJed Brown       ierr = PetscFPTrapPop();CHKERRQ(ierr);
28483b03a366Sstefano_zampini       /* retain singular values greater than tol: note that LAPACK GESVD returns singular values in descending order */
28493b03a366Sstefano_zampini       j=0;
28503b03a366Sstefano_zampini       while( j < min_n && singular_vals[min_n-j-1] < tol) j++;
28513b03a366Sstefano_zampini       total_counts = total_counts-(PetscInt)Bt+(min_n-j);
28523b03a366Sstefano_zampini #endif
28533b03a366Sstefano_zampini     }
28543b03a366Sstefano_zampini   }
2855534831adSStefano Zampini 
2856da1bb401SStefano Zampini   n_constraints=total_counts-n_vertices;
2857da1bb401SStefano Zampini   local_primal_size = total_counts;
28583b03a366Sstefano_zampini   /* set quantities in pcbddc data structure */
28593b03a366Sstefano_zampini   pcbddc->n_vertices = n_vertices;
28603b03a366Sstefano_zampini   pcbddc->n_constraints = n_constraints;
2861da1bb401SStefano Zampini   pcbddc->local_primal_size = local_primal_size;
2862534831adSStefano Zampini 
2863534831adSStefano Zampini   /* Create constraint matrix */
2864534831adSStefano Zampini   /* The constraint matrix is used to compute the l2g map of primal dofs */
2865534831adSStefano Zampini   /* so we need to set it up properly either with or without change of basis */
2866534831adSStefano Zampini   ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->ConstraintMatrix);CHKERRQ(ierr);
2867534831adSStefano Zampini   ierr = MatSetType(pcbddc->ConstraintMatrix,impMatType);CHKERRQ(ierr);
2868534831adSStefano Zampini   ierr = MatSetSizes(pcbddc->ConstraintMatrix,local_primal_size,pcis->n,local_primal_size,pcis->n);CHKERRQ(ierr);
2869534831adSStefano Zampini   /* compute a local numbering of constraints : vertices first then constraints */
2870534831adSStefano Zampini   ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
2871534831adSStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array_vector);CHKERRQ(ierr);
2872534831adSStefano Zampini   ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&aux_primal_numbering);CHKERRQ(ierr);
2873534831adSStefano Zampini   ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&aux_primal_permutation);CHKERRQ(ierr);
2874534831adSStefano Zampini   total_counts=0;
2875534831adSStefano Zampini   /* find vertices: subdomain corners plus dofs with basis changed */
2876534831adSStefano Zampini   for (i=0;i<local_primal_size;i++) {
2877534831adSStefano Zampini     size_of_constraint=temp_indices[i+1]-temp_indices[i];
2878534831adSStefano Zampini     if (change_basis[i] || size_of_constraint == 1) {
2879534831adSStefano Zampini       k=0;
2880534831adSStefano Zampini       while(k < size_of_constraint && array_vector[temp_indices_to_constraint[temp_indices[i]+size_of_constraint-k-1]] != 0.0) {
2881534831adSStefano Zampini         k=k+1;
2882534831adSStefano Zampini       }
2883534831adSStefano Zampini       j=temp_indices_to_constraint[temp_indices[i]+size_of_constraint-k-1];
2884534831adSStefano Zampini       array_vector[j] = 1.0;
2885534831adSStefano Zampini       aux_primal_numbering[total_counts]=j;
2886534831adSStefano Zampini       aux_primal_permutation[total_counts]=total_counts;
2887534831adSStefano Zampini       total_counts++;
2888534831adSStefano Zampini     }
2889534831adSStefano Zampini   }
2890534831adSStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array_vector);CHKERRQ(ierr);
2891534831adSStefano Zampini   /* permute indices in order to have a sorted set of vertices */
2892534831adSStefano Zampini   ierr = PetscSortIntWithPermutation(total_counts,aux_primal_numbering,aux_primal_permutation);
2893534831adSStefano Zampini   /* nonzero structure */
2894534831adSStefano Zampini   ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
2895534831adSStefano Zampini   for (i=0;i<total_counts;i++) {
2896534831adSStefano Zampini     nnz[i]=1;
2897534831adSStefano Zampini   }
2898534831adSStefano Zampini   j=total_counts;
2899534831adSStefano Zampini   for (i=n_vertices;i<local_primal_size;i++) {
2900534831adSStefano Zampini     if (!change_basis[i]) {
2901534831adSStefano Zampini       nnz[j]=temp_indices[i+1]-temp_indices[i];
2902534831adSStefano Zampini       j++;
2903534831adSStefano Zampini     }
2904534831adSStefano Zampini   }
2905534831adSStefano Zampini   ierr = MatSeqAIJSetPreallocation(pcbddc->ConstraintMatrix,0,nnz);CHKERRQ(ierr);
2906534831adSStefano Zampini   ierr = PetscFree(nnz);CHKERRQ(ierr);
2907534831adSStefano Zampini   /* set values in constraint matrix */
2908534831adSStefano Zampini   for (i=0;i<total_counts;i++) {
2909534831adSStefano Zampini     j = aux_primal_permutation[i];
2910534831adSStefano Zampini     k = aux_primal_numbering[j];
2911534831adSStefano Zampini     ierr = MatSetValue(pcbddc->ConstraintMatrix,i,k,1.0,INSERT_VALUES);CHKERRQ(ierr);
2912534831adSStefano Zampini   }
2913534831adSStefano Zampini   for (i=n_vertices;i<local_primal_size;i++) {
2914534831adSStefano Zampini     if (!change_basis[i]) {
2915534831adSStefano Zampini       size_of_constraint=temp_indices[i+1]-temp_indices[i];
2916534831adSStefano Zampini       ierr = MatSetValues(pcbddc->ConstraintMatrix,1,&total_counts,size_of_constraint,&temp_indices_to_constraint[temp_indices[i]],&temp_quadrature_constraint[temp_indices[i]],INSERT_VALUES);CHKERRQ(ierr);
2917534831adSStefano Zampini       total_counts++;
2918534831adSStefano Zampini     }
2919534831adSStefano Zampini   }
2920534831adSStefano Zampini   ierr = PetscFree(aux_primal_numbering);CHKERRQ(ierr);
2921534831adSStefano Zampini   ierr = PetscFree(aux_primal_permutation);CHKERRQ(ierr);
2922534831adSStefano Zampini   /* assembling */
2923534831adSStefano Zampini   ierr = MatAssemblyBegin(pcbddc->ConstraintMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2924534831adSStefano Zampini   ierr = MatAssemblyEnd(pcbddc->ConstraintMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2925534831adSStefano Zampini 
2926534831adSStefano Zampini   /* Create matrix for change of basis. We don't need it in case pcbddc->usechangeofbasis is FALSE */
2927534831adSStefano Zampini   if (pcbddc->usechangeofbasis) {
2928534831adSStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr);
2929534831adSStefano Zampini     ierr = MatSetType(pcbddc->ChangeOfBasisMatrix,impMatType);CHKERRQ(ierr);
2930534831adSStefano Zampini     ierr = MatSetSizes(pcbddc->ChangeOfBasisMatrix,pcis->n_B,pcis->n_B,pcis->n_B,pcis->n_B);CHKERRQ(ierr);
2931534831adSStefano Zampini     /* work arrays */
2932534831adSStefano Zampini     /* we need to reuse these arrays, so we free them */
2933534831adSStefano Zampini     ierr = PetscFree(temp_basis);CHKERRQ(ierr);
2934534831adSStefano Zampini     ierr = PetscFree(work);CHKERRQ(ierr);
2935534831adSStefano Zampini     ierr = PetscMalloc(pcis->n_B*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
2936534831adSStefano Zampini     ierr = PetscMalloc((nnsp_addone+nnsp_size)*(nnsp_addone+nnsp_size)*sizeof(PetscScalar),&temp_basis);CHKERRQ(ierr);
2937534831adSStefano Zampini     ierr = PetscMalloc((nnsp_addone+nnsp_size)*sizeof(PetscScalar),&work);CHKERRQ(ierr);
2938534831adSStefano Zampini     ierr = PetscMalloc((nnsp_addone+nnsp_size)*sizeof(PetscBLASInt),&ipiv);CHKERRQ(ierr);
2939534831adSStefano Zampini     for (i=0;i<pcis->n_B;i++) {
2940534831adSStefano Zampini       nnz[i]=1;
2941534831adSStefano Zampini     }
2942534831adSStefano Zampini     /* Overestimated nonzeros per row */
2943534831adSStefano Zampini     k=1;
2944534831adSStefano Zampini     for (i=pcbddc->n_vertices;i<local_primal_size;i++) {
2945534831adSStefano Zampini       if (change_basis[i]) {
2946534831adSStefano Zampini         size_of_constraint = temp_indices[i+1]-temp_indices[i];
2947534831adSStefano Zampini         if (k < size_of_constraint) {
2948534831adSStefano Zampini           k = size_of_constraint;
2949534831adSStefano Zampini         }
2950534831adSStefano Zampini         for (j=0;j<size_of_constraint;j++) {
2951534831adSStefano Zampini           nnz[temp_indices_to_constraint_B[temp_indices[i]+j]] = size_of_constraint;
2952534831adSStefano Zampini         }
2953534831adSStefano Zampini       }
2954534831adSStefano Zampini     }
2955534831adSStefano Zampini     ierr = MatSeqAIJSetPreallocation(pcbddc->ChangeOfBasisMatrix,0,nnz);CHKERRQ(ierr);
2956534831adSStefano Zampini     ierr = PetscFree(nnz);CHKERRQ(ierr);
2957534831adSStefano Zampini     /* Temporary array to store indices */
2958534831adSStefano Zampini     ierr = PetscMalloc(k*sizeof(PetscInt),&is_indices);CHKERRQ(ierr);
2959534831adSStefano Zampini     /* Set initial identity in the matrix */
2960534831adSStefano Zampini     for (i=0;i<pcis->n_B;i++) {
2961534831adSStefano Zampini       ierr = MatSetValue(pcbddc->ChangeOfBasisMatrix,i,i,1.0,INSERT_VALUES);CHKERRQ(ierr);
2962534831adSStefano Zampini     }
2963534831adSStefano Zampini     /* Now we loop on the constraints which need a change of basis */
2964534831adSStefano Zampini     /* Change of basis matrix is evaluated as the FIRST APPROACH in */
2965534831adSStefano Zampini     /* Klawonn and Widlund, Dual-primal FETI-DP methods for linear elasticity, (6.2.1) */
2966534831adSStefano Zampini     temp_constraints = 0;
296793dc3b60SStefano Zampini     if (pcbddc->n_vertices < local_primal_size) {
2968534831adSStefano Zampini       temp_start_ptr = temp_indices_to_constraint_B[temp_indices[pcbddc->n_vertices]];
296993dc3b60SStefano Zampini     }
2970534831adSStefano Zampini     for (i=pcbddc->n_vertices;i<local_primal_size;i++) {
2971534831adSStefano Zampini       if (change_basis[i]) {
2972534831adSStefano Zampini         compute_submatrix = PETSC_FALSE;
2973534831adSStefano Zampini         useksp = PETSC_FALSE;
2974534831adSStefano Zampini         if (temp_start_ptr == temp_indices_to_constraint_B[temp_indices[i]]) {
2975534831adSStefano Zampini           temp_constraints++;
297604eaf177SStefano Zampini           if (i == local_primal_size -1 ||  temp_start_ptr != temp_indices_to_constraint_B[temp_indices[i+1]]) {
2977534831adSStefano Zampini             compute_submatrix = PETSC_TRUE;
2978534831adSStefano Zampini           }
2979534831adSStefano Zampini         }
2980534831adSStefano Zampini         if (compute_submatrix) {
2981534831adSStefano Zampini           if (temp_constraints > 1 || pcbddc->use_nnsp_true) {
2982534831adSStefano Zampini             useksp = PETSC_TRUE;
2983534831adSStefano Zampini           }
2984534831adSStefano Zampini           size_of_constraint = temp_indices[i+1]-temp_indices[i];
2985534831adSStefano Zampini           if (useksp) { /* experimental */
2986534831adSStefano Zampini             ierr = MatCreate(PETSC_COMM_SELF,&temp_mat);CHKERRQ(ierr);
2987534831adSStefano Zampini             ierr = MatSetType(temp_mat,impMatType);CHKERRQ(ierr);
2988534831adSStefano Zampini             ierr = MatSetSizes(temp_mat,size_of_constraint,size_of_constraint,size_of_constraint,size_of_constraint);CHKERRQ(ierr);
2989534831adSStefano Zampini             ierr = MatSeqAIJSetPreallocation(temp_mat,size_of_constraint,PETSC_NULL);CHKERRQ(ierr);
2990534831adSStefano Zampini           }
2991534831adSStefano Zampini           /* First _size_of_constraint-temp_constraints_ columns */
2992534831adSStefano Zampini           dual_dofs = size_of_constraint-temp_constraints;
2993534831adSStefano Zampini           start_constraint = i+1-temp_constraints;
2994534831adSStefano Zampini           for (s=0;s<dual_dofs;s++) {
2995534831adSStefano Zampini             is_indices[0] = s;
2996534831adSStefano Zampini             for (j=0;j<temp_constraints;j++) {
2997534831adSStefano Zampini               for (k=0;k<temp_constraints;k++) {
2998534831adSStefano Zampini                 temp_basis[j*temp_constraints+k]=temp_quadrature_constraint[temp_indices[start_constraint+k]+s+j+1];
2999534831adSStefano Zampini               }
3000534831adSStefano Zampini               work[j]=-temp_quadrature_constraint[temp_indices[start_constraint+j]+s];
3001534831adSStefano Zampini               is_indices[j+1]=s+j+1;
3002534831adSStefano Zampini             }
3003534831adSStefano Zampini             Bt = temp_constraints;
3004534831adSStefano Zampini             ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
3005534831adSStefano Zampini             LAPACKgesv_(&Bt,&Bone,temp_basis,&Bt,ipiv,work,&Bt,&lierr);
3006534831adSStefano Zampini             if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GESV Lapack routine %d",(int)lierr);
3007534831adSStefano Zampini             ierr = PetscFPTrapPop();CHKERRQ(ierr);
3008534831adSStefano Zampini             j = temp_indices_to_constraint_B[temp_indices[start_constraint]+s];
3009534831adSStefano Zampini             ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,temp_constraints,&temp_indices_to_constraint_B[temp_indices[start_constraint]+s+1],1,&j,work,INSERT_VALUES);CHKERRQ(ierr);
3010534831adSStefano Zampini             if (useksp) {
3011534831adSStefano Zampini               /* temp mat with transposed rows and columns */
3012534831adSStefano Zampini               ierr = MatSetValues(temp_mat,1,&s,temp_constraints,&is_indices[1],work,INSERT_VALUES);CHKERRQ(ierr);
3013534831adSStefano Zampini               ierr = MatSetValue(temp_mat,is_indices[0],is_indices[0],1.0,INSERT_VALUES);CHKERRQ(ierr);
3014534831adSStefano Zampini             }
3015534831adSStefano Zampini           }
3016534831adSStefano Zampini           if (useksp) {
3017534831adSStefano Zampini             /* last rows of temp_mat */
3018534831adSStefano Zampini             for (j=0;j<size_of_constraint;j++) {
3019534831adSStefano Zampini               is_indices[j] = j;
3020534831adSStefano Zampini             }
3021534831adSStefano Zampini             for (s=0;s<temp_constraints;s++) {
3022534831adSStefano Zampini               k = s + dual_dofs;
3023534831adSStefano Zampini               ierr = MatSetValues(temp_mat,1,&k,size_of_constraint,is_indices,&temp_quadrature_constraint[temp_indices[start_constraint+s]],INSERT_VALUES);CHKERRQ(ierr);
3024534831adSStefano Zampini             }
3025534831adSStefano Zampini             ierr = MatAssemblyBegin(temp_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
3026534831adSStefano Zampini             ierr = MatAssemblyEnd(temp_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
3027534831adSStefano Zampini             ierr = MatGetVecs(temp_mat,&temp_vec,PETSC_NULL);CHKERRQ(ierr);
3028534831adSStefano Zampini             ierr = KSPCreate(PETSC_COMM_SELF,&temp_ksp);CHKERRQ(ierr);
3029534831adSStefano Zampini             ierr = KSPSetOperators(temp_ksp,temp_mat,temp_mat,SAME_PRECONDITIONER);CHKERRQ(ierr);
3030534831adSStefano Zampini             ierr = KSPSetType(temp_ksp,KSPPREONLY);CHKERRQ(ierr);
3031ffe5efe1SStefano Zampini             ierr = KSPGetPC(temp_ksp,&temp_pc);CHKERRQ(ierr);
3032ffe5efe1SStefano Zampini             ierr = PCSetType(temp_pc,PCLU);CHKERRQ(ierr);
3033534831adSStefano Zampini             ierr = KSPSetUp(temp_ksp);CHKERRQ(ierr);
3034534831adSStefano Zampini             for (s=0;s<temp_constraints;s++) {
3035534831adSStefano Zampini               ierr = VecSet(temp_vec,0.0);CHKERRQ(ierr);
3036534831adSStefano Zampini               ierr = VecSetValue(temp_vec,s+dual_dofs,1.0,INSERT_VALUES);CHKERRQ(ierr);
3037534831adSStefano Zampini               ierr = VecAssemblyBegin(temp_vec);CHKERRQ(ierr);
3038534831adSStefano Zampini               ierr = VecAssemblyEnd(temp_vec);CHKERRQ(ierr);
3039534831adSStefano Zampini               ierr = KSPSolve(temp_ksp,temp_vec,temp_vec);CHKERRQ(ierr);
3040534831adSStefano Zampini               ierr = VecGetArray(temp_vec,&array_vector);CHKERRQ(ierr);
3041534831adSStefano Zampini               j = temp_indices_to_constraint_B[temp_indices[start_constraint+s]+size_of_constraint-s-1];
3042534831adSStefano Zampini               /* last columns of change of basis matrix associated to new primal dofs */
3043534831adSStefano Zampini               ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,size_of_constraint,&temp_indices_to_constraint_B[temp_indices[start_constraint+s]],1,&j,array_vector,INSERT_VALUES);CHKERRQ(ierr);
3044534831adSStefano Zampini               ierr = VecRestoreArray(temp_vec,&array_vector);CHKERRQ(ierr);
3045534831adSStefano Zampini             }
3046534831adSStefano Zampini             ierr = MatDestroy(&temp_mat);CHKERRQ(ierr);
3047534831adSStefano Zampini             ierr = KSPDestroy(&temp_ksp);CHKERRQ(ierr);
3048534831adSStefano Zampini             ierr = VecDestroy(&temp_vec);CHKERRQ(ierr);
3049534831adSStefano Zampini           } else {
3050534831adSStefano Zampini             /* last columns of change of basis matrix associated to new primal dofs */
3051534831adSStefano Zampini             for (s=0;s<temp_constraints;s++) {
3052534831adSStefano Zampini               j = temp_indices_to_constraint_B[temp_indices[start_constraint+s]+size_of_constraint-s-1];
3053534831adSStefano Zampini               ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,size_of_constraint,&temp_indices_to_constraint_B[temp_indices[start_constraint+s]],1,&j,&temp_quadrature_constraint[temp_indices[start_constraint+s]],INSERT_VALUES);CHKERRQ(ierr);
3054534831adSStefano Zampini             }
3055534831adSStefano Zampini           }
3056534831adSStefano Zampini           /* prepare for the next cycle */
3057534831adSStefano Zampini           temp_constraints = 0;
305804eaf177SStefano Zampini           if (i != local_primal_size -1 ) {
3059534831adSStefano Zampini             temp_start_ptr = temp_indices_to_constraint_B[temp_indices[i+1]];
3060534831adSStefano Zampini           }
3061534831adSStefano Zampini         }
3062534831adSStefano Zampini       }
306304eaf177SStefano Zampini     }
3064534831adSStefano Zampini     /* assembling */
3065534831adSStefano Zampini     ierr = MatAssemblyBegin(pcbddc->ChangeOfBasisMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
3066534831adSStefano Zampini     ierr = MatAssemblyEnd(pcbddc->ChangeOfBasisMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
3067534831adSStefano Zampini     ierr = PetscFree(ipiv);CHKERRQ(ierr);
3068534831adSStefano Zampini     ierr = PetscFree(is_indices);CHKERRQ(ierr);
3069534831adSStefano Zampini   }
30703b03a366Sstefano_zampini   /* free workspace no longer needed */
30713b03a366Sstefano_zampini   ierr = PetscFree(rwork);CHKERRQ(ierr);
30723b03a366Sstefano_zampini   ierr = PetscFree(work);CHKERRQ(ierr);
30733b03a366Sstefano_zampini   ierr = PetscFree(temp_basis);CHKERRQ(ierr);
30743b03a366Sstefano_zampini   ierr = PetscFree(singular_vals);CHKERRQ(ierr);
30753b03a366Sstefano_zampini   ierr = PetscFree(correlation_mat);CHKERRQ(ierr);
30763b03a366Sstefano_zampini   ierr = PetscFree(temp_indices);CHKERRQ(ierr);
3077534831adSStefano Zampini   ierr = PetscFree(change_basis);CHKERRQ(ierr);
30783b03a366Sstefano_zampini   ierr = PetscFree(temp_indices_to_constraint);CHKERRQ(ierr);
3079534831adSStefano Zampini   ierr = PetscFree(temp_indices_to_constraint_B);CHKERRQ(ierr);
3080534831adSStefano Zampini   ierr = PetscFree(local_to_B);CHKERRQ(ierr);
30813b03a366Sstefano_zampini   ierr = PetscFree(temp_quadrature_constraint);CHKERRQ(ierr);
30823425bc38SStefano Zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
30833425bc38SStefano Zampini   ierr = PetscFree(iwork);CHKERRQ(ierr);
30843425bc38SStefano Zampini   ierr = PetscFree(ifail);CHKERRQ(ierr);
30853425bc38SStefano Zampini   ierr = PetscFree(singular_vectors);CHKERRQ(ierr);
30863425bc38SStefano Zampini #endif
3087da1bb401SStefano Zampini   for (k=0;k<nnsp_size;k++) {
3088da1bb401SStefano Zampini     ierr = VecDestroy(&localnearnullsp[k]);CHKERRQ(ierr);
3089da1bb401SStefano Zampini   }
30903b03a366Sstefano_zampini   ierr = PetscFree(localnearnullsp);CHKERRQ(ierr);
30913b03a366Sstefano_zampini   PetscFunctionReturn(0);
30923b03a366Sstefano_zampini }
30933b03a366Sstefano_zampini /* -------------------------------------------------------------------------- */
30940c7d97c5SJed Brown #undef __FUNCT__
30950c7d97c5SJed Brown #define __FUNCT__ "PCBDDCCoarseSetUp"
309653cdbc3dSStefano Zampini static PetscErrorCode PCBDDCCoarseSetUp(PC pc)
30970c7d97c5SJed Brown {
30980c7d97c5SJed Brown   PetscErrorCode  ierr;
30990c7d97c5SJed Brown 
31000c7d97c5SJed Brown   PC_IS*            pcis = (PC_IS*)(pc->data);
31010c7d97c5SJed Brown   PC_BDDC*          pcbddc = (PC_BDDC*)pc->data;
31020c7d97c5SJed Brown   Mat_IS            *matis = (Mat_IS*)pc->pmat->data;
3103534831adSStefano Zampini   Mat               change_mat_all;
31040c7d97c5SJed Brown   IS                is_R_local;
31050c7d97c5SJed Brown   IS                is_V_local;
31060c7d97c5SJed Brown   IS                is_C_local;
31070c7d97c5SJed Brown   IS                is_aux1;
31080c7d97c5SJed Brown   IS                is_aux2;
310919fd82e9SBarry Smith   VecType           impVecType;
311019fd82e9SBarry Smith   MatType           impMatType;
31110c7d97c5SJed Brown   PetscInt          n_R=0;
31120c7d97c5SJed Brown   PetscInt          n_D=0;
31130c7d97c5SJed Brown   PetscInt          n_B=0;
31140c7d97c5SJed Brown   PetscScalar       zero=0.0;
31150c7d97c5SJed Brown   PetscScalar       one=1.0;
31160c7d97c5SJed Brown   PetscScalar       m_one=-1.0;
31170c7d97c5SJed Brown   PetscScalar*      array;
31180c7d97c5SJed Brown   PetscScalar       *coarse_submat_vals;
31190c7d97c5SJed Brown   PetscInt          *idx_R_local;
31200c7d97c5SJed Brown   PetscInt          *idx_V_B;
31210c7d97c5SJed Brown   PetscScalar       *coarsefunctions_errors;
31220c7d97c5SJed Brown   PetscScalar       *constraints_errors;
31230c7d97c5SJed Brown   /* auxiliary indices */
3124534831adSStefano Zampini   PetscInt          i,j,k;
3125e269702eSStefano Zampini   /* for verbose output of bddc */
3126e269702eSStefano Zampini   PetscViewer       viewer=pcbddc->dbg_viewer;
3127e269702eSStefano Zampini   PetscBool         dbg_flag=pcbddc->dbg_flag;
3128a0ba757dSStefano Zampini   /* for counting coarse dofs */
3129534831adSStefano Zampini   PetscInt          n_vertices,n_constraints;
31303b03a366Sstefano_zampini   PetscInt          size_of_constraint;
31313b03a366Sstefano_zampini   PetscInt          *row_cmat_indices;
31323b03a366Sstefano_zampini   PetscScalar       *row_cmat_values;
3133534831adSStefano Zampini   PetscInt          *vertices,*nnz,*is_indices,*temp_indices;
31340c7d97c5SJed Brown 
31350c7d97c5SJed Brown   PetscFunctionBegin;
31360c7d97c5SJed Brown   /* Set Non-overlapping dimensions */
31370c7d97c5SJed Brown   n_B = pcis->n_B; n_D = pcis->n - n_B;
3138534831adSStefano Zampini   /* Set types for local objects needed by BDDC precondtioner */
3139534831adSStefano Zampini   impMatType = MATSEQDENSE;
3140534831adSStefano Zampini   impVecType = VECSEQ;
3141da1bb401SStefano Zampini   /* get vertex indices from constraint matrix */
3142534831adSStefano Zampini   ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscInt),&vertices);CHKERRQ(ierr);
3143534831adSStefano Zampini   n_vertices=0;
3144da1bb401SStefano Zampini   for (i=0;i<pcbddc->local_primal_size;i++) {
3145da1bb401SStefano Zampini     ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
3146da1bb401SStefano Zampini     if (size_of_constraint == 1) {
3147534831adSStefano Zampini       vertices[n_vertices]=row_cmat_indices[0];
3148534831adSStefano Zampini       n_vertices++;
3149a0ba757dSStefano Zampini     }
3150da1bb401SStefano Zampini     ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
3151a0ba757dSStefano Zampini   }
3152534831adSStefano Zampini   /* Set number of constraints */
3153534831adSStefano Zampini   n_constraints = pcbddc->local_primal_size-n_vertices;
3154534831adSStefano Zampini 
3155534831adSStefano Zampini   /* vertices in boundary numbering */
3156534831adSStefano Zampini   if (n_vertices) {
3157534831adSStefano Zampini     ierr = VecSet(pcis->vec1_N,m_one);CHKERRQ(ierr);
3158534831adSStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3159534831adSStefano Zampini     for (i=0; i<n_vertices; i++) { array[ vertices[i] ] = i; }
3160534831adSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3161534831adSStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3162534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3163534831adSStefano Zampini     ierr = PetscMalloc(n_vertices*sizeof(PetscInt),&idx_V_B);CHKERRQ(ierr);
3164534831adSStefano Zampini     ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
3165534831adSStefano Zampini     for (i=0; i<n_vertices; i++) {
3166534831adSStefano Zampini       j=0;
3167534831adSStefano Zampini       while (array[j] != i ) {j++;}
3168534831adSStefano Zampini       idx_V_B[i]=j;
3169534831adSStefano Zampini     }
3170534831adSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
3171534831adSStefano Zampini   }
3172534831adSStefano Zampini 
3173534831adSStefano Zampini   /* transform local matrices if needed */
3174534831adSStefano Zampini   if (pcbddc->usechangeofbasis) {
3175534831adSStefano Zampini     ierr = PetscMalloc(pcis->n*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
3176534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
3177534831adSStefano Zampini     for (i=0;i<n_D;i++) {
3178534831adSStefano Zampini       nnz[is_indices[i]]=1;
3179534831adSStefano Zampini     }
3180534831adSStefano Zampini     ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
3181534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
3182534831adSStefano Zampini     k=1;
3183534831adSStefano Zampini     for (i=0;i<n_B;i++) {
3184534831adSStefano Zampini       ierr = MatGetRow(pcbddc->ChangeOfBasisMatrix,i,&j,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr);
3185534831adSStefano Zampini       nnz[is_indices[i]]=j;
3186534831adSStefano Zampini       if ( k < j) {
3187534831adSStefano Zampini         k = j;
3188534831adSStefano Zampini       }
3189534831adSStefano Zampini       ierr = MatRestoreRow(pcbddc->ChangeOfBasisMatrix,i,&j,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr);
3190534831adSStefano Zampini     }
3191534831adSStefano Zampini     ierr = ISRestoreIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
3192534831adSStefano Zampini     /* assemble change of basis matrix on the whole set of local dofs */
3193534831adSStefano Zampini     ierr = PetscMalloc(k*sizeof(PetscInt),&temp_indices);CHKERRQ(ierr);
3194534831adSStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&change_mat_all);CHKERRQ(ierr);
3195534831adSStefano Zampini     ierr = MatSetSizes(change_mat_all,pcis->n,pcis->n,pcis->n,pcis->n);CHKERRQ(ierr);
3196534831adSStefano Zampini     ierr = MatSetType(change_mat_all,MATSEQAIJ);CHKERRQ(ierr);
3197534831adSStefano Zampini     ierr = MatSeqAIJSetPreallocation(change_mat_all,0,nnz);CHKERRQ(ierr);
3198534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
3199534831adSStefano Zampini     for (i=0;i<n_D;i++) {
3200534831adSStefano Zampini       ierr = MatSetValue(change_mat_all,is_indices[i],is_indices[i],1.0,INSERT_VALUES);CHKERRQ(ierr);
3201534831adSStefano Zampini     }
3202534831adSStefano Zampini     ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
3203534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
3204534831adSStefano Zampini     for (i=0;i<n_B;i++) {
3205534831adSStefano Zampini       ierr = MatGetRow(pcbddc->ChangeOfBasisMatrix,i,&j,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
3206534831adSStefano Zampini       for (k=0;k<j;k++) {
3207534831adSStefano Zampini         temp_indices[k]=is_indices[row_cmat_indices[k]];
3208534831adSStefano Zampini       }
3209534831adSStefano Zampini       ierr = MatSetValues(change_mat_all,1,&is_indices[i],j,temp_indices,row_cmat_values,INSERT_VALUES);CHKERRQ(ierr);
3210534831adSStefano Zampini       ierr = MatRestoreRow(pcbddc->ChangeOfBasisMatrix,i,&j,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
3211534831adSStefano Zampini     }
3212534831adSStefano Zampini     ierr = MatAssemblyBegin(change_mat_all,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
3213534831adSStefano Zampini     ierr = MatAssemblyEnd(change_mat_all,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
3214534831adSStefano Zampini     ierr = MatPtAP(matis->A,change_mat_all,MAT_INITIAL_MATRIX,1.0,&pcbddc->local_mat);CHKERRQ(ierr);
3215534831adSStefano Zampini     ierr = MatDestroy(&pcis->A_IB);CHKERRQ(ierr);
3216534831adSStefano Zampini     ierr = MatDestroy(&pcis->A_BI);CHKERRQ(ierr);
3217534831adSStefano Zampini     ierr = MatDestroy(&pcis->A_BB);CHKERRQ(ierr);
3218534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_I_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&pcis->A_IB);CHKERRQ(ierr);
3219534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_B_local,pcis->is_I_local,MAT_INITIAL_MATRIX,&pcis->A_BI);CHKERRQ(ierr);
3220534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_B_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&pcis->A_BB);CHKERRQ(ierr);
3221534831adSStefano Zampini     ierr = MatDestroy(&change_mat_all);CHKERRQ(ierr);
3222534831adSStefano Zampini     ierr = PetscFree(nnz);CHKERRQ(ierr);
3223534831adSStefano Zampini     ierr = PetscFree(temp_indices);CHKERRQ(ierr);
3224534831adSStefano Zampini   } else {
3225534831adSStefano Zampini     /* without change of basis, the local matrix is unchanged */
3226534831adSStefano Zampini     ierr = PetscObjectReference((PetscObject)matis->A);CHKERRQ(ierr);
3227534831adSStefano Zampini     pcbddc->local_mat = matis->A;
3228534831adSStefano Zampini   }
32290bdf917eSStefano Zampini   /* Change global null space passed in by the user if change of basis has been performed */
32300bdf917eSStefano Zampini   if (pcbddc->NullSpace && pcbddc->usechangeofbasis) {
32310bdf917eSStefano Zampini     ierr = PCBDDCAdaptNullSpace(pc);CHKERRQ(ierr);
32320bdf917eSStefano Zampini   }
3233a0ba757dSStefano Zampini 
32340c7d97c5SJed Brown   /* Dohrmann's notation: dofs splitted in R (Remaining: all dofs but the vertices) and V (Vertices) */
32350c7d97c5SJed Brown   ierr = VecSet(pcis->vec1_N,one);CHKERRQ(ierr);
32360c7d97c5SJed Brown   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
32373b03a366Sstefano_zampini   for (i=0;i<n_vertices;i++) { array[ vertices[i] ] = zero; }
32383b03a366Sstefano_zampini   ierr = PetscMalloc(( pcis->n - n_vertices )*sizeof(PetscInt),&idx_R_local);CHKERRQ(ierr);
32390c7d97c5SJed Brown   for (i=0, n_R=0; i<pcis->n; i++) { if (array[i] == one) { idx_R_local[n_R] = i; n_R++; } }
32400c7d97c5SJed Brown   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3241e269702eSStefano Zampini   if (dbg_flag) {
32420c7d97c5SJed Brown     ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
32430c7d97c5SJed Brown     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
32440c7d97c5SJed Brown     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d local dimensions\n",PetscGlobalRank);CHKERRQ(ierr);
32450c7d97c5SJed Brown     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local_size = %d, dirichlet_size = %d, boundary_size = %d\n",pcis->n,n_D,n_B);CHKERRQ(ierr);
32463b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"r_size = %d, v_size = %d, constraints = %d, local_primal_size = %d\n",n_R,n_vertices,n_constraints,pcbddc->local_primal_size);CHKERRQ(ierr);
3247534831adSStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"pcbddc->n_vertices = %d, pcbddc->n_constraints = %d\n",pcbddc->n_vertices,pcbddc->n_constraints);CHKERRQ(ierr);
32480c7d97c5SJed Brown     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
32490c7d97c5SJed Brown   }
3250534831adSStefano Zampini 
32510c7d97c5SJed Brown   /* Allocate needed vectors */
3252534831adSStefano Zampini   ierr = VecDuplicate(pcis->vec1_global,&pcbddc->original_rhs);CHKERRQ(ierr);
32533972b0daSStefano Zampini   ierr = VecDuplicate(pcis->vec1_global,&pcbddc->temp_solution);CHKERRQ(ierr);
32540c7d97c5SJed Brown   ierr = VecDuplicate(pcis->vec1_D,&pcbddc->vec4_D);CHKERRQ(ierr);
32550c7d97c5SJed Brown   ierr = VecCreate(PETSC_COMM_SELF,&pcbddc->vec1_R);CHKERRQ(ierr);
32560c7d97c5SJed Brown   ierr = VecSetSizes(pcbddc->vec1_R,n_R,n_R);CHKERRQ(ierr);
32570c7d97c5SJed Brown   ierr = VecSetType(pcbddc->vec1_R,impVecType);CHKERRQ(ierr);
3258d49ef151SStefano Zampini   ierr = VecDuplicate(pcbddc->vec1_R,&pcbddc->vec2_R);CHKERRQ(ierr);
32590c7d97c5SJed Brown   ierr = VecCreate(PETSC_COMM_SELF,&pcbddc->vec1_P);CHKERRQ(ierr);
32600c7d97c5SJed Brown   ierr = VecSetSizes(pcbddc->vec1_P,pcbddc->local_primal_size,pcbddc->local_primal_size);CHKERRQ(ierr);
32610c7d97c5SJed Brown   ierr = VecSetType(pcbddc->vec1_P,impVecType);CHKERRQ(ierr);
32620c7d97c5SJed Brown 
32630c7d97c5SJed Brown   /* Creating some index sets needed  */
32640c7d97c5SJed Brown   /* For submatrices */
3265da1bb401SStefano Zampini   ierr = ISCreateGeneral(PETSC_COMM_SELF,n_R,idx_R_local,PETSC_OWN_POINTER,&is_R_local);CHKERRQ(ierr);
32663b03a366Sstefano_zampini   if (n_vertices)    {
3267da1bb401SStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,n_vertices,vertices,PETSC_OWN_POINTER,&is_V_local);CHKERRQ(ierr);
32683b03a366Sstefano_zampini   }
3269da1bb401SStefano Zampini   if (n_constraints) {
3270da1bb401SStefano Zampini     ierr = ISCreateStride(PETSC_COMM_SELF,n_constraints,n_vertices,1,&is_C_local);CHKERRQ(ierr);
3271da1bb401SStefano Zampini   }
3272da1bb401SStefano Zampini 
32730c7d97c5SJed Brown   /* For VecScatters pcbddc->R_to_B and (optionally) pcbddc->R_to_D */
32740c7d97c5SJed Brown   {
32750c7d97c5SJed Brown     PetscInt   *aux_array1;
32760c7d97c5SJed Brown     PetscInt   *aux_array2;
32772e8d2280SStefano Zampini     PetscInt   *idx_I_local;
32780c7d97c5SJed Brown 
32793b03a366Sstefano_zampini     ierr = PetscMalloc( (pcis->n_B-n_vertices)*sizeof(PetscInt),&aux_array1);CHKERRQ(ierr);
32803b03a366Sstefano_zampini     ierr = PetscMalloc( (pcis->n_B-n_vertices)*sizeof(PetscInt),&aux_array2);CHKERRQ(ierr);
32810c7d97c5SJed Brown 
32822e8d2280SStefano Zampini     ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&idx_I_local);CHKERRQ(ierr);
32830c7d97c5SJed Brown     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
32842e8d2280SStefano Zampini     for (i=0; i<n_D; i++) { array[idx_I_local[i]] = 0; }
32852e8d2280SStefano Zampini     ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&idx_I_local);CHKERRQ(ierr);
32862e8d2280SStefano Zampini     for (i=0, j=0; i<n_R; i++) { if ( array[idx_R_local[i]] == one ) { aux_array1[j] = i; j++; } }
32870c7d97c5SJed Brown     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3288da1bb401SStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_COPY_VALUES,&is_aux1);CHKERRQ(ierr);
32892e8d2280SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
32902e8d2280SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
32910c7d97c5SJed Brown     ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
32922e8d2280SStefano Zampini     for (i=0, j=0; i<n_B; i++) { if ( array[i] == one ) { aux_array2[j] = i; j++; } }
32933828260eSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
3294da1bb401SStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array2,PETSC_COPY_VALUES,&is_aux2);CHKERRQ(ierr);
32950c7d97c5SJed Brown     ierr = VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_B,is_aux2,&pcbddc->R_to_B);CHKERRQ(ierr);
32960c7d97c5SJed Brown     ierr = PetscFree(aux_array1);CHKERRQ(ierr);
32970c7d97c5SJed Brown     ierr = PetscFree(aux_array2);CHKERRQ(ierr);
32980c7d97c5SJed Brown     ierr = ISDestroy(&is_aux1);CHKERRQ(ierr);
32990c7d97c5SJed Brown     ierr = ISDestroy(&is_aux2);CHKERRQ(ierr);
33000c7d97c5SJed Brown 
330129622bf0SStefano Zampini     if (pcbddc->inexact_prec_type || dbg_flag ) {
33020c7d97c5SJed Brown       ierr = PetscMalloc(n_D*sizeof(PetscInt),&aux_array1);CHKERRQ(ierr);
33030c7d97c5SJed Brown       ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
33042e8d2280SStefano Zampini       for (i=0, j=0; i<n_R; i++) { if (array[idx_R_local[i]] == zero) { aux_array1[j] = i; j++; } }
33050c7d97c5SJed Brown       ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3306da1bb401SStefano Zampini       ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_COPY_VALUES,&is_aux1);CHKERRQ(ierr);
33070c7d97c5SJed Brown       ierr = VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_D,(IS)0,&pcbddc->R_to_D);CHKERRQ(ierr);
33080c7d97c5SJed Brown       ierr = PetscFree(aux_array1);CHKERRQ(ierr);
33090c7d97c5SJed Brown       ierr = ISDestroy(&is_aux1);CHKERRQ(ierr);
33100c7d97c5SJed Brown     }
33110c7d97c5SJed Brown   }
33120c7d97c5SJed Brown 
33130c7d97c5SJed Brown   /* Creating PC contexts for local Dirichlet and Neumann problems */
33140c7d97c5SJed Brown   {
33150c7d97c5SJed Brown     Mat  A_RR;
331653cdbc3dSStefano Zampini     PC   pc_temp;
33170c7d97c5SJed Brown     /* Matrix for Dirichlet problem is A_II -> we already have it from pcis.c code */
331853cdbc3dSStefano Zampini     ierr = KSPCreate(PETSC_COMM_SELF,&pcbddc->ksp_D);CHKERRQ(ierr);
331953cdbc3dSStefano Zampini     ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->ksp_D,(PetscObject)pc,1);CHKERRQ(ierr);
332053cdbc3dSStefano Zampini     ierr = KSPSetOperators(pcbddc->ksp_D,pcis->A_II,pcis->A_II,SAME_PRECONDITIONER);CHKERRQ(ierr);
332153cdbc3dSStefano Zampini     ierr = KSPSetType(pcbddc->ksp_D,KSPPREONLY);CHKERRQ(ierr);
3322da1bb401SStefano Zampini     ierr = KSPSetOptionsPrefix(pcbddc->ksp_D,"dirichlet_");CHKERRQ(ierr);
33230c7d97c5SJed Brown     /* default */
332453cdbc3dSStefano Zampini     ierr = KSPGetPC(pcbddc->ksp_D,&pc_temp);CHKERRQ(ierr);
332553cdbc3dSStefano Zampini     ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr);
33260c7d97c5SJed Brown     /* Allow user's customization */
332753cdbc3dSStefano Zampini     ierr = KSPSetFromOptions(pcbddc->ksp_D);CHKERRQ(ierr);
3328950d796eSStefano Zampini     /* umfpack interface has a bug when matrix dimension is zero */
3329950d796eSStefano Zampini     if (!n_D) {
33302e8d2280SStefano Zampini       ierr = PCSetType(pc_temp,PCNONE);CHKERRQ(ierr);
3331950d796eSStefano Zampini     }
333253cdbc3dSStefano Zampini     /* Set Up KSP for Dirichlet problem of BDDC */
333353cdbc3dSStefano Zampini     ierr = KSPSetUp(pcbddc->ksp_D);CHKERRQ(ierr);
33343972b0daSStefano Zampini     /* set ksp_D into pcis data */
33353972b0daSStefano Zampini     ierr = KSPDestroy(&pcis->ksp_D);CHKERRQ(ierr);
33363972b0daSStefano Zampini     ierr = PetscObjectReference((PetscObject)pcbddc->ksp_D);CHKERRQ(ierr);
33373972b0daSStefano Zampini     pcis->ksp_D = pcbddc->ksp_D;
33380c7d97c5SJed Brown     /* Matrix for Neumann problem is A_RR -> we need to create it */
3339534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,is_R_local,is_R_local,MAT_INITIAL_MATRIX,&A_RR);CHKERRQ(ierr);
334053cdbc3dSStefano Zampini     ierr = KSPCreate(PETSC_COMM_SELF,&pcbddc->ksp_R);CHKERRQ(ierr);
334153cdbc3dSStefano Zampini     ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->ksp_R,(PetscObject)pc,1);CHKERRQ(ierr);
334253cdbc3dSStefano Zampini     ierr = KSPSetOperators(pcbddc->ksp_R,A_RR,A_RR,SAME_PRECONDITIONER);CHKERRQ(ierr);
334353cdbc3dSStefano Zampini     ierr = KSPSetType(pcbddc->ksp_R,KSPPREONLY);CHKERRQ(ierr);
3344da1bb401SStefano Zampini     ierr = KSPSetOptionsPrefix(pcbddc->ksp_R,"neumann_");CHKERRQ(ierr);
33450c7d97c5SJed Brown     /* default */
334653cdbc3dSStefano Zampini     ierr = KSPGetPC(pcbddc->ksp_R,&pc_temp);CHKERRQ(ierr);
334753cdbc3dSStefano Zampini     ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr);
33480c7d97c5SJed Brown     /* Allow user's customization */
334953cdbc3dSStefano Zampini     ierr = KSPSetFromOptions(pcbddc->ksp_R);CHKERRQ(ierr);
3350950d796eSStefano Zampini     /* umfpack interface has a bug when matrix dimension is zero */
3351950d796eSStefano Zampini     if (!pcis->n) {
33522e8d2280SStefano Zampini       ierr = PCSetType(pc_temp,PCNONE);CHKERRQ(ierr);
3353950d796eSStefano Zampini     }
335453cdbc3dSStefano Zampini     /* Set Up KSP for Neumann problem of BDDC */
335553cdbc3dSStefano Zampini     ierr = KSPSetUp(pcbddc->ksp_R);CHKERRQ(ierr);
335629622bf0SStefano Zampini     /* check Dirichlet and Neumann solvers and adapt them is a nullspace correction is needed */
3357b76ba322SStefano Zampini     {
33580c7d97c5SJed Brown       Vec         temp_vec;
3359b76ba322SStefano Zampini       PetscReal   value;
3360b76ba322SStefano Zampini       PetscMPIInt use_exact,use_exact_reduced;
33610c7d97c5SJed Brown 
3362a0ba757dSStefano Zampini       ierr = VecDuplicate(pcis->vec1_D,&temp_vec);CHKERRQ(ierr);
3363a0ba757dSStefano Zampini       ierr = VecSetRandom(pcis->vec1_D,PETSC_NULL);CHKERRQ(ierr);
3364a0ba757dSStefano Zampini       ierr = MatMult(pcis->A_II,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
3365a0ba757dSStefano Zampini       ierr = KSPSolve(pcbddc->ksp_D,pcis->vec2_D,temp_vec);CHKERRQ(ierr);
3366a0ba757dSStefano Zampini       ierr = VecAXPY(temp_vec,m_one,pcis->vec1_D);CHKERRQ(ierr);
3367a0ba757dSStefano Zampini       ierr = VecNorm(temp_vec,NORM_INFINITY,&value);CHKERRQ(ierr);
336829622bf0SStefano Zampini       ierr = VecDestroy(&temp_vec);CHKERRQ(ierr);
3369b76ba322SStefano Zampini       use_exact = 1;
3370b76ba322SStefano Zampini       if (PetscAbsReal(value) > 1.e-4) {
3371b76ba322SStefano Zampini         use_exact = 0;
3372b76ba322SStefano Zampini       }
3373b76ba322SStefano Zampini       ierr = MPI_Allreduce(&use_exact,&use_exact_reduced,1,MPIU_INT,MPI_LAND,((PetscObject)pc)->comm);CHKERRQ(ierr);
3374b76ba322SStefano Zampini       pcbddc->use_exact_dirichlet = (PetscBool) use_exact_reduced;
3375b76ba322SStefano Zampini       if (dbg_flag) {
3376a0ba757dSStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
3377a0ba757dSStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
3378a0ba757dSStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"Checking solution of Dirichlet and Neumann problems\n");CHKERRQ(ierr);
3379a0ba757dSStefano Zampini         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d infinity error for Dirichlet solve = % 1.14e \n",PetscGlobalRank,value);CHKERRQ(ierr);
338029622bf0SStefano Zampini       }
338129622bf0SStefano Zampini       if (pcbddc->NullSpace && !use_exact_reduced && !pcbddc->inexact_prec_type) {
338229622bf0SStefano Zampini         ierr = PCBDDCAdaptLocalProblem(pc,pcis->is_I_local);
338329622bf0SStefano Zampini       }
3384d49ef151SStefano Zampini       ierr = VecDuplicate(pcbddc->vec1_R,&temp_vec);CHKERRQ(ierr);
3385d49ef151SStefano Zampini       ierr = VecSetRandom(pcbddc->vec1_R,PETSC_NULL);CHKERRQ(ierr);
3386d49ef151SStefano Zampini       ierr = MatMult(A_RR,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
3387d49ef151SStefano Zampini       ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec2_R,temp_vec);CHKERRQ(ierr);
3388d49ef151SStefano Zampini       ierr = VecAXPY(temp_vec,m_one,pcbddc->vec1_R);CHKERRQ(ierr);
3389d49ef151SStefano Zampini       ierr = VecNorm(temp_vec,NORM_INFINITY,&value);CHKERRQ(ierr);
3390e269702eSStefano Zampini       ierr = VecDestroy(&temp_vec);CHKERRQ(ierr);
339129622bf0SStefano Zampini       use_exact = 1;
339229622bf0SStefano Zampini       if (PetscAbsReal(value) > 1.e-4) {
339329622bf0SStefano Zampini         use_exact = 0;
339429622bf0SStefano Zampini       }
339529622bf0SStefano Zampini       ierr = MPI_Allreduce(&use_exact,&use_exact_reduced,1,MPIU_INT,MPI_LAND,((PetscObject)pc)->comm);CHKERRQ(ierr);
339629622bf0SStefano Zampini       if (dbg_flag) {
33970c7d97c5SJed Brown         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d infinity error for  Neumann  solve = % 1.14e \n",PetscGlobalRank,value);CHKERRQ(ierr);
3398d49ef151SStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
33990c7d97c5SJed Brown       }
340029622bf0SStefano Zampini       if (pcbddc->NullSpace && !use_exact_reduced) {
340129622bf0SStefano Zampini         ierr = PCBDDCAdaptLocalProblem(pc,is_R_local);
340229622bf0SStefano Zampini       }
3403b76ba322SStefano Zampini     }
34040c7d97c5SJed Brown     /* free Neumann problem's matrix */
34050c7d97c5SJed Brown     ierr = MatDestroy(&A_RR);CHKERRQ(ierr);
34060c7d97c5SJed Brown   }
34070c7d97c5SJed Brown 
34080c7d97c5SJed Brown   /* Assemble all remaining stuff needed to apply BDDC  */
34090c7d97c5SJed Brown   {
34100c7d97c5SJed Brown     Mat          A_RV,A_VR,A_VV;
34110bdf917eSStefano Zampini     Mat          M1;
34120c7d97c5SJed Brown     Mat          C_CR;
34133b03a366Sstefano_zampini     Mat          AUXMAT;
34140c7d97c5SJed Brown     Vec          vec1_C;
34150c7d97c5SJed Brown     Vec          vec2_C;
34160c7d97c5SJed Brown     Vec          vec1_V;
34170c7d97c5SJed Brown     Vec          vec2_V;
34180c7d97c5SJed Brown     PetscInt     *nnz;
34190c7d97c5SJed Brown     PetscInt     *auxindices;
342053cdbc3dSStefano Zampini     PetscInt     index;
34210c7d97c5SJed Brown     PetscScalar* array2;
34220c7d97c5SJed Brown     MatFactorInfo matinfo;
34230c7d97c5SJed Brown 
34240c7d97c5SJed Brown     /* Allocating some extra storage just to be safe */
34250c7d97c5SJed Brown     ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
34260c7d97c5SJed Brown     ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&auxindices);CHKERRQ(ierr);
34270c7d97c5SJed Brown     for (i=0;i<pcis->n;i++) {auxindices[i]=i;}
34280c7d97c5SJed Brown 
34290c7d97c5SJed Brown     /* some work vectors on vertices and/or constraints */
34303b03a366Sstefano_zampini     if (n_vertices) {
34310c7d97c5SJed Brown       ierr = VecCreate(PETSC_COMM_SELF,&vec1_V);CHKERRQ(ierr);
34323b03a366Sstefano_zampini       ierr = VecSetSizes(vec1_V,n_vertices,n_vertices);CHKERRQ(ierr);
34330c7d97c5SJed Brown       ierr = VecSetType(vec1_V,impVecType);CHKERRQ(ierr);
34340c7d97c5SJed Brown       ierr = VecDuplicate(vec1_V,&vec2_V);CHKERRQ(ierr);
34350c7d97c5SJed Brown     }
3436534831adSStefano Zampini     if (n_constraints) {
34370c7d97c5SJed Brown       ierr = VecCreate(PETSC_COMM_SELF,&vec1_C);CHKERRQ(ierr);
3438534831adSStefano Zampini       ierr = VecSetSizes(vec1_C,n_constraints,n_constraints);CHKERRQ(ierr);
34390c7d97c5SJed Brown       ierr = VecSetType(vec1_C,impVecType);CHKERRQ(ierr);
34400c7d97c5SJed Brown       ierr = VecDuplicate(vec1_C,&vec2_C);CHKERRQ(ierr);
34410c7d97c5SJed Brown       ierr = VecDuplicate(vec1_C,&pcbddc->vec1_C);CHKERRQ(ierr);
34420c7d97c5SJed Brown     }
34430c7d97c5SJed Brown     /* Precompute stuffs needed for preprocessing and application of BDDC*/
34443b03a366Sstefano_zampini     if (n_constraints) {
34450c7d97c5SJed Brown       ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->local_auxmat2);CHKERRQ(ierr);
34463b03a366Sstefano_zampini       ierr = MatSetSizes(pcbddc->local_auxmat2,n_R,n_constraints,n_R,n_constraints);CHKERRQ(ierr);
34470c7d97c5SJed Brown       ierr = MatSetType(pcbddc->local_auxmat2,impMatType);CHKERRQ(ierr);
34483b03a366Sstefano_zampini       ierr = MatSeqDenseSetPreallocation(pcbddc->local_auxmat2,PETSC_NULL);CHKERRQ(ierr);
34490c7d97c5SJed Brown 
345057a90decSStefano Zampini       /* Create Constraint matrix on R nodes: C_{CR}  */
345157a90decSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->ConstraintMatrix,is_C_local,is_R_local,MAT_INITIAL_MATRIX,&C_CR);CHKERRQ(ierr);
345257a90decSStefano Zampini       ierr = ISDestroy(&is_C_local);CHKERRQ(ierr);
345357a90decSStefano Zampini 
34540c7d97c5SJed Brown       /* Assemble local_auxmat2 = - A_{RR}^{-1} C^T_{CR} needed by BDDC application */
34553b03a366Sstefano_zampini       for (i=0;i<n_constraints;i++) {
34563b03a366Sstefano_zampini         ierr = VecSet(pcbddc->vec1_R,zero);CHKERRQ(ierr);
34573b03a366Sstefano_zampini         /* Get row of constraint matrix in R numbering */
345857a90decSStefano Zampini         ierr = VecGetArray(pcbddc->vec1_R,&array);CHKERRQ(ierr);
345957a90decSStefano Zampini         ierr = MatGetRow(C_CR,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
34603b03a366Sstefano_zampini         for (j=0;j<size_of_constraint;j++) { array[ row_cmat_indices[j] ] = - row_cmat_values[j]; }
346157a90decSStefano Zampini         ierr = MatRestoreRow(C_CR,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
346257a90decSStefano Zampini         ierr = VecRestoreArray(pcbddc->vec1_R,&array);CHKERRQ(ierr);
34633b03a366Sstefano_zampini         /* Solve for row of constraint matrix in R numbering */
346453cdbc3dSStefano Zampini         ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
34653b03a366Sstefano_zampini         /* Set values */
34660c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec2_R,&array);CHKERRQ(ierr);
34673b03a366Sstefano_zampini         ierr = MatSetValues(pcbddc->local_auxmat2,n_R,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
34680c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec2_R,&array);CHKERRQ(ierr);
34690c7d97c5SJed Brown       }
34700c7d97c5SJed Brown       ierr = MatAssemblyBegin(pcbddc->local_auxmat2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
34710c7d97c5SJed Brown       ierr = MatAssemblyEnd(pcbddc->local_auxmat2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
34720c7d97c5SJed Brown 
34730c7d97c5SJed Brown       /* Assemble AUXMAT = ( LUFactor )( -C_{CR} A_{RR}^{-1} C^T_{CR} )^{-1} */
34740c7d97c5SJed Brown       ierr = MatMatMult(C_CR,pcbddc->local_auxmat2,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&AUXMAT);CHKERRQ(ierr);
3475d49ef151SStefano Zampini       ierr = MatFactorInfoInitialize(&matinfo);CHKERRQ(ierr);
34763b03a366Sstefano_zampini       ierr = ISCreateStride(PETSC_COMM_SELF,n_constraints,0,1,&is_aux1);CHKERRQ(ierr);
34770c7d97c5SJed Brown       ierr = MatLUFactor(AUXMAT,is_aux1,is_aux1,&matinfo);CHKERRQ(ierr);
34780c7d97c5SJed Brown       ierr = ISDestroy(&is_aux1);CHKERRQ(ierr);
34790c7d97c5SJed Brown 
34803b03a366Sstefano_zampini       /* Assemble explicitly M1 = ( C_{CR} A_{RR}^{-1} C^T_{CR} )^{-1} needed in preproc  */
3481d49ef151SStefano Zampini       ierr = MatCreate(PETSC_COMM_SELF,&M1);CHKERRQ(ierr);
34823b03a366Sstefano_zampini       ierr = MatSetSizes(M1,n_constraints,n_constraints,n_constraints,n_constraints);CHKERRQ(ierr);
34830c7d97c5SJed Brown       ierr = MatSetType(M1,impMatType);CHKERRQ(ierr);
34843b03a366Sstefano_zampini       ierr = MatSeqDenseSetPreallocation(M1,PETSC_NULL);CHKERRQ(ierr);
34853b03a366Sstefano_zampini       for (i=0;i<n_constraints;i++) {
34860c7d97c5SJed Brown         ierr = VecSet(vec1_C,zero);CHKERRQ(ierr);
34870c7d97c5SJed Brown         ierr = VecSetValue(vec1_C,i,one,INSERT_VALUES);CHKERRQ(ierr);
34880c7d97c5SJed Brown         ierr = VecAssemblyBegin(vec1_C);CHKERRQ(ierr);
34890c7d97c5SJed Brown         ierr = VecAssemblyEnd(vec1_C);CHKERRQ(ierr);
34900c7d97c5SJed Brown         ierr = MatSolve(AUXMAT,vec1_C,vec2_C);CHKERRQ(ierr);
34910c7d97c5SJed Brown         ierr = VecScale(vec2_C,m_one);CHKERRQ(ierr);
34920c7d97c5SJed Brown         ierr = VecGetArray(vec2_C,&array);CHKERRQ(ierr);
34933b03a366Sstefano_zampini         ierr = MatSetValues(M1,n_constraints,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
34940c7d97c5SJed Brown         ierr = VecRestoreArray(vec2_C,&array);CHKERRQ(ierr);
34950c7d97c5SJed Brown       }
34960c7d97c5SJed Brown       ierr = MatAssemblyBegin(M1,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
34970c7d97c5SJed Brown       ierr = MatAssemblyEnd(M1,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
34980c7d97c5SJed Brown       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
34990c7d97c5SJed Brown       /* Assemble local_auxmat1 = M1*C_{CR} needed by BDDC application in KSP and in preproc */
35000c7d97c5SJed Brown       ierr = MatMatMult(M1,C_CR,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&pcbddc->local_auxmat1);CHKERRQ(ierr);
35010c7d97c5SJed Brown 
35020c7d97c5SJed Brown     }
35030c7d97c5SJed Brown 
35040c7d97c5SJed Brown     /* Get submatrices from subdomain matrix */
35053b03a366Sstefano_zampini     if (n_vertices){
3506534831adSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->local_mat,is_R_local,is_V_local,MAT_INITIAL_MATRIX,&A_RV);CHKERRQ(ierr);
3507534831adSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->local_mat,is_V_local,is_R_local,MAT_INITIAL_MATRIX,&A_VR);CHKERRQ(ierr);
3508534831adSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->local_mat,is_V_local,is_V_local,MAT_INITIAL_MATRIX,&A_VV);CHKERRQ(ierr);
35090c7d97c5SJed Brown     }
35100c7d97c5SJed Brown 
35110c7d97c5SJed Brown     /* Matrix of coarse basis functions (local) */
3512d49ef151SStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->coarse_phi_B);CHKERRQ(ierr);
35130c7d97c5SJed Brown     ierr = MatSetSizes(pcbddc->coarse_phi_B,n_B,pcbddc->local_primal_size,n_B,pcbddc->local_primal_size);CHKERRQ(ierr);
35140c7d97c5SJed Brown     ierr = MatSetType(pcbddc->coarse_phi_B,impMatType);CHKERRQ(ierr);
35153b03a366Sstefano_zampini     ierr = MatSeqDenseSetPreallocation(pcbddc->coarse_phi_B,PETSC_NULL);CHKERRQ(ierr);
351629622bf0SStefano Zampini     if (pcbddc->inexact_prec_type || dbg_flag ) {
3517d49ef151SStefano Zampini       ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->coarse_phi_D);CHKERRQ(ierr);
35180c7d97c5SJed Brown       ierr = MatSetSizes(pcbddc->coarse_phi_D,n_D,pcbddc->local_primal_size,n_D,pcbddc->local_primal_size);CHKERRQ(ierr);
35190c7d97c5SJed Brown       ierr = MatSetType(pcbddc->coarse_phi_D,impMatType);CHKERRQ(ierr);
35203b03a366Sstefano_zampini       ierr = MatSeqDenseSetPreallocation(pcbddc->coarse_phi_D,PETSC_NULL);CHKERRQ(ierr);
35210c7d97c5SJed Brown     }
35220c7d97c5SJed Brown 
3523e269702eSStefano Zampini     if (dbg_flag) {
35240c7d97c5SJed Brown       ierr = PetscMalloc( pcbddc->local_primal_size*sizeof(PetscScalar),&coarsefunctions_errors);CHKERRQ(ierr);
35250c7d97c5SJed Brown       ierr = PetscMalloc( pcbddc->local_primal_size*sizeof(PetscScalar),&constraints_errors);CHKERRQ(ierr);
35260c7d97c5SJed Brown     }
35273b03a366Sstefano_zampini     /* Subdomain contribution (Non-overlapping) to coarse matrix  */
35280c7d97c5SJed Brown     ierr = PetscMalloc ((pcbddc->local_primal_size)*(pcbddc->local_primal_size)*sizeof(PetscScalar),&coarse_submat_vals);CHKERRQ(ierr);
35290c7d97c5SJed Brown 
35300c7d97c5SJed Brown     /* We are now ready to evaluate coarse basis functions and subdomain contribution to coarse problem */
35313b03a366Sstefano_zampini     for (i=0;i<n_vertices;i++){
35320c7d97c5SJed Brown       ierr = VecSet(vec1_V,zero);CHKERRQ(ierr);
35330c7d97c5SJed Brown       ierr = VecSetValue(vec1_V,i,one,INSERT_VALUES);CHKERRQ(ierr);
35340c7d97c5SJed Brown       ierr = VecAssemblyBegin(vec1_V);CHKERRQ(ierr);
35350c7d97c5SJed Brown       ierr = VecAssemblyEnd(vec1_V);CHKERRQ(ierr);
35360c7d97c5SJed Brown       /* solution of saddle point problem */
35370bdf917eSStefano Zampini       ierr = MatMult(A_RV,vec1_V,pcbddc->vec1_R);CHKERRQ(ierr);
35380bdf917eSStefano Zampini       ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec1_R);CHKERRQ(ierr);
35390c7d97c5SJed Brown       ierr = VecScale(pcbddc->vec1_R,m_one);CHKERRQ(ierr);
35403b03a366Sstefano_zampini       if (n_constraints) {
35410c7d97c5SJed Brown         ierr = MatMult(pcbddc->local_auxmat1,pcbddc->vec1_R,vec1_C);CHKERRQ(ierr);
35420c7d97c5SJed Brown         ierr = MatMultAdd(pcbddc->local_auxmat2,vec1_C,pcbddc->vec1_R,pcbddc->vec1_R);CHKERRQ(ierr);
35430c7d97c5SJed Brown         ierr = VecScale(vec1_C,m_one);CHKERRQ(ierr);
35440c7d97c5SJed Brown       }
35450c7d97c5SJed Brown       ierr = MatMult(A_VR,pcbddc->vec1_R,vec2_V);CHKERRQ(ierr);
35460c7d97c5SJed Brown       ierr = MatMultAdd(A_VV,vec1_V,vec2_V,vec2_V);CHKERRQ(ierr);
35470c7d97c5SJed Brown 
35480c7d97c5SJed Brown       /* Set values in coarse basis function and subdomain part of coarse_mat */
35490c7d97c5SJed Brown       /* coarse basis functions */
35500c7d97c5SJed Brown       ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr);
35510c7d97c5SJed Brown       ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
35520c7d97c5SJed Brown       ierr = VecScatterEnd  (pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
35530c7d97c5SJed Brown       ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
35543b03a366Sstefano_zampini       ierr = MatSetValues(pcbddc->coarse_phi_B,n_B,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
35550c7d97c5SJed Brown       ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
35560c7d97c5SJed Brown       ierr = MatSetValue(pcbddc->coarse_phi_B,idx_V_B[i],i,one,INSERT_VALUES);CHKERRQ(ierr);
355729622bf0SStefano Zampini       if ( pcbddc->inexact_prec_type || dbg_flag  ) {
35580c7d97c5SJed Brown         ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
35590c7d97c5SJed Brown         ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
35600c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_D,&array);CHKERRQ(ierr);
35613b03a366Sstefano_zampini         ierr = MatSetValues(pcbddc->coarse_phi_D,n_D,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
35620c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_D,&array);CHKERRQ(ierr);
35630c7d97c5SJed Brown       }
35640c7d97c5SJed Brown       /* subdomain contribution to coarse matrix */
35650c7d97c5SJed Brown       ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
3566da1bb401SStefano Zampini       for (j=0;j<n_vertices;j++) { coarse_submat_vals[i*pcbddc->local_primal_size+j] = array[j]; } /* WARNING -> column major ordering */
35670c7d97c5SJed Brown       ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
35683b03a366Sstefano_zampini       if (n_constraints) {
35690c7d97c5SJed Brown         ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
3570da1bb401SStefano Zampini         for (j=0;j<n_constraints;j++) { coarse_submat_vals[i*pcbddc->local_primal_size+j+n_vertices] = array[j]; } /* WARNING -> column major ordering */
35710c7d97c5SJed Brown         ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
35720c7d97c5SJed Brown       }
35730c7d97c5SJed Brown 
3574e269702eSStefano Zampini       if ( dbg_flag ) {
35750c7d97c5SJed Brown         /* assemble subdomain vector on nodes */
3576d49ef151SStefano Zampini         ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr);
35770c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
35780c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
35790c7d97c5SJed Brown         for (j=0;j<n_R;j++) { array[idx_R_local[j]] = array2[j]; }
35803b03a366Sstefano_zampini         array[ vertices[i] ] = one;
35810c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
35820c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
35830c7d97c5SJed Brown         /* assemble subdomain vector of lagrange multipliers (i.e. primal nodes) */
3584d49ef151SStefano Zampini         ierr = VecSet(pcbddc->vec1_P,zero);CHKERRQ(ierr);
35850c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
35860c7d97c5SJed Brown         ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
35873b03a366Sstefano_zampini         for (j=0;j<n_vertices;j++) { array2[j]=array[j]; }
35880c7d97c5SJed Brown         ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
35893b03a366Sstefano_zampini         if (n_constraints) {
35900c7d97c5SJed Brown           ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
35913b03a366Sstefano_zampini           for (j=0;j<n_constraints;j++) { array2[j+n_vertices]=array[j]; }
35920c7d97c5SJed Brown           ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
35930c7d97c5SJed Brown         }
35940c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
35950c7d97c5SJed Brown         ierr = VecScale(pcbddc->vec1_P,m_one);CHKERRQ(ierr);
35960c7d97c5SJed Brown         /* check saddle point solution */
3597534831adSStefano Zampini         ierr = MatMult(pcbddc->local_mat,pcis->vec1_N,pcis->vec2_N);CHKERRQ(ierr);
35983b03a366Sstefano_zampini         ierr = MatMultTransposeAdd(pcbddc->ConstraintMatrix,pcbddc->vec1_P,pcis->vec2_N,pcis->vec2_N);CHKERRQ(ierr);
35993b03a366Sstefano_zampini         ierr = VecNorm(pcis->vec2_N,NORM_INFINITY,&coarsefunctions_errors[i]);CHKERRQ(ierr);
36003b03a366Sstefano_zampini         ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr);
36010c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
36023b03a366Sstefano_zampini         array[i]=array[i]+m_one;  /* shift by the identity matrix */
36030c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
36043b03a366Sstefano_zampini         ierr = VecNorm(pcbddc->vec1_P,NORM_INFINITY,&constraints_errors[i]);CHKERRQ(ierr);
36050c7d97c5SJed Brown       }
36060c7d97c5SJed Brown     }
36070c7d97c5SJed Brown 
36083b03a366Sstefano_zampini     for (i=0;i<n_constraints;i++){
3609d49ef151SStefano Zampini       ierr = VecSet(vec2_C,zero);CHKERRQ(ierr);
36100c7d97c5SJed Brown       ierr = VecSetValue(vec2_C,i,m_one,INSERT_VALUES);CHKERRQ(ierr);
36110c7d97c5SJed Brown       ierr = VecAssemblyBegin(vec2_C);CHKERRQ(ierr);
36120c7d97c5SJed Brown       ierr = VecAssemblyEnd(vec2_C);CHKERRQ(ierr);
36130c7d97c5SJed Brown       /* solution of saddle point problem */
36140c7d97c5SJed Brown       ierr = MatMult(M1,vec2_C,vec1_C);CHKERRQ(ierr);
36150c7d97c5SJed Brown       ierr = MatMult(pcbddc->local_auxmat2,vec1_C,pcbddc->vec1_R);CHKERRQ(ierr);
36160c7d97c5SJed Brown       ierr = VecScale(vec1_C,m_one);CHKERRQ(ierr);
36173b03a366Sstefano_zampini       if (n_vertices) { ierr = MatMult(A_VR,pcbddc->vec1_R,vec2_V);CHKERRQ(ierr); }
36180c7d97c5SJed Brown       /* Set values in coarse basis function and subdomain part of coarse_mat */
36190c7d97c5SJed Brown       /* coarse basis functions */
36203b03a366Sstefano_zampini       index=i+n_vertices;
36210c7d97c5SJed Brown       ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr);
36220c7d97c5SJed Brown       ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
36230c7d97c5SJed Brown       ierr = VecScatterEnd  (pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
36240c7d97c5SJed Brown       ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
362553cdbc3dSStefano Zampini       ierr = MatSetValues(pcbddc->coarse_phi_B,n_B,auxindices,1,&index,array,INSERT_VALUES);CHKERRQ(ierr);
36260c7d97c5SJed Brown       ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
362729622bf0SStefano Zampini       if ( pcbddc->inexact_prec_type || dbg_flag ) {
36280c7d97c5SJed Brown         ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
36290c7d97c5SJed Brown         ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
36300c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_D,&array);CHKERRQ(ierr);
363153cdbc3dSStefano Zampini         ierr = MatSetValues(pcbddc->coarse_phi_D,n_D,auxindices,1,&index,array,INSERT_VALUES);CHKERRQ(ierr);
36320c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_D,&array);CHKERRQ(ierr);
36330c7d97c5SJed Brown       }
36340c7d97c5SJed Brown       /* subdomain contribution to coarse matrix */
36353b03a366Sstefano_zampini       if (n_vertices) {
36360c7d97c5SJed Brown         ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
3637da1bb401SStefano Zampini         for (j=0;j<n_vertices;j++) {coarse_submat_vals[index*pcbddc->local_primal_size+j]=array[j];} /* WARNING -> column major ordering */
36380c7d97c5SJed Brown         ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
36390c7d97c5SJed Brown       }
36400c7d97c5SJed Brown       ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
3641da1bb401SStefano Zampini       for (j=0;j<n_constraints;j++) {coarse_submat_vals[index*pcbddc->local_primal_size+j+n_vertices]=array[j];} /* WARNING -> column major ordering */
36420c7d97c5SJed Brown       ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
36430c7d97c5SJed Brown 
3644e269702eSStefano Zampini       if ( dbg_flag ) {
36450c7d97c5SJed Brown         /* assemble subdomain vector on nodes */
364653cdbc3dSStefano Zampini         ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr);
36470c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
36480c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
36490c7d97c5SJed Brown         for (j=0;j<n_R;j++){ array[ idx_R_local[j] ] = array2[j]; }
36500c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
36510c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
36520c7d97c5SJed Brown         /* assemble subdomain vector of lagrange multipliers */
365353cdbc3dSStefano Zampini         ierr = VecSet(pcbddc->vec1_P,zero);CHKERRQ(ierr);
36540c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
36553b03a366Sstefano_zampini         if ( n_vertices) {
36560c7d97c5SJed Brown           ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
36573b03a366Sstefano_zampini           for (j=0;j<n_vertices;j++) {array2[j]=-array[j];}
36580c7d97c5SJed Brown           ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
36590c7d97c5SJed Brown         }
36600c7d97c5SJed Brown         ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
36613b03a366Sstefano_zampini         for (j=0;j<n_constraints;j++) {array2[j+n_vertices]=-array[j];}
36620c7d97c5SJed Brown         ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
36630c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
36643972b0daSStefano Zampini         /* check saddle point solution */
3665534831adSStefano Zampini         ierr = MatMult(pcbddc->local_mat,pcis->vec1_N,pcis->vec2_N);CHKERRQ(ierr);
36663b03a366Sstefano_zampini         ierr = MatMultTransposeAdd(pcbddc->ConstraintMatrix,pcbddc->vec1_P,pcis->vec2_N,pcis->vec2_N);CHKERRQ(ierr);
366753cdbc3dSStefano Zampini         ierr = VecNorm(pcis->vec2_N,NORM_INFINITY,&coarsefunctions_errors[index]);CHKERRQ(ierr);
36683b03a366Sstefano_zampini         ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr);
36690c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
367053cdbc3dSStefano Zampini         array[index]=array[index]+m_one; /* shift by the identity matrix */
36710c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
367253cdbc3dSStefano Zampini         ierr = VecNorm(pcbddc->vec1_P,NORM_INFINITY,&constraints_errors[index]);CHKERRQ(ierr);
36730c7d97c5SJed Brown       }
36740c7d97c5SJed Brown     }
36750c7d97c5SJed Brown     ierr = MatAssemblyBegin(pcbddc->coarse_phi_B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
36760c7d97c5SJed Brown     ierr = MatAssemblyEnd  (pcbddc->coarse_phi_B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
367729622bf0SStefano Zampini     if ( pcbddc->inexact_prec_type || dbg_flag ) {
36780c7d97c5SJed Brown       ierr = MatAssemblyBegin(pcbddc->coarse_phi_D,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
36790c7d97c5SJed Brown       ierr = MatAssemblyEnd  (pcbddc->coarse_phi_D,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
36800c7d97c5SJed Brown     }
36810c7d97c5SJed Brown     /* Checking coarse_sub_mat and coarse basis functions */
36820c7d97c5SJed Brown     /* It should be \Phi^{(j)^T} A^{(j)} \Phi^{(j)}=coarse_sub_mat */
36839d2fce94SStefano Zampini     if (dbg_flag) {
36840c7d97c5SJed Brown       Mat         coarse_sub_mat;
36850c7d97c5SJed Brown       Mat         TM1,TM2,TM3,TM4;
36860c7d97c5SJed Brown       Mat         coarse_phi_D,coarse_phi_B,A_II,A_BB,A_IB,A_BI;
368719fd82e9SBarry Smith       MatType     checkmattype=MATSEQAIJ;
36880c7d97c5SJed Brown       PetscScalar value;
36890c7d97c5SJed Brown 
3690c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_II,checkmattype,MAT_INITIAL_MATRIX,&A_II);CHKERRQ(ierr);
3691c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_IB,checkmattype,MAT_INITIAL_MATRIX,&A_IB);CHKERRQ(ierr);
3692c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_BI,checkmattype,MAT_INITIAL_MATRIX,&A_BI);CHKERRQ(ierr);
3693c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_BB,checkmattype,MAT_INITIAL_MATRIX,&A_BB);CHKERRQ(ierr);
3694c042a7c3SStefano Zampini       ierr = MatConvert(pcbddc->coarse_phi_D,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_D);CHKERRQ(ierr);
3695c042a7c3SStefano Zampini       ierr = MatConvert(pcbddc->coarse_phi_B,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_B);CHKERRQ(ierr);
3696c042a7c3SStefano Zampini       ierr = MatCreateSeqDense(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_size,coarse_submat_vals,&coarse_sub_mat);CHKERRQ(ierr);
3697c042a7c3SStefano Zampini       ierr = MatConvert(coarse_sub_mat,checkmattype,MAT_REUSE_MATRIX,&coarse_sub_mat);CHKERRQ(ierr);
36980c7d97c5SJed Brown 
3699da1bb401SStefano Zampini       /*PetscViewer view_out;
3700da1bb401SStefano Zampini       PetscMPIInt myrank;
3701da1bb401SStefano Zampini       char filename[256];
3702da1bb401SStefano Zampini       MPI_Comm_rank(((PetscObject)pc)->comm,&myrank);
3703da1bb401SStefano Zampini       sprintf(filename,"coarsesubmat_%04d.m",myrank);
3704da1bb401SStefano Zampini       ierr = PetscViewerASCIIOpen(PETSC_COMM_SELF,filename,&view_out);CHKERRQ(ierr);
3705da1bb401SStefano Zampini       ierr = PetscViewerSetFormat(view_out,PETSC_VIEWER_ASCII_MATLAB);CHKERRQ(ierr);
3706da1bb401SStefano Zampini       ierr = MatView(coarse_sub_mat,view_out);CHKERRQ(ierr);
3707da1bb401SStefano Zampini       ierr = PetscViewerDestroy(&view_out);CHKERRQ(ierr);*/
3708da1bb401SStefano Zampini 
37090c7d97c5SJed Brown       ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
37100c7d97c5SJed Brown       ierr = PetscViewerASCIIPrintf(viewer,"Check coarse sub mat and local basis functions\n");CHKERRQ(ierr);
37110c7d97c5SJed Brown       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
371253cdbc3dSStefano Zampini       ierr = MatPtAP(A_II,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&TM1);CHKERRQ(ierr);
371353cdbc3dSStefano Zampini       ierr = MatPtAP(A_BB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&TM2);CHKERRQ(ierr);
371453cdbc3dSStefano Zampini       ierr = MatMatMult(A_IB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr);
3715c042a7c3SStefano Zampini       ierr = MatTransposeMatMult(coarse_phi_D,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM3);CHKERRQ(ierr);
371653cdbc3dSStefano Zampini       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
371753cdbc3dSStefano Zampini       ierr = MatMatMult(A_BI,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr);
3718c042a7c3SStefano Zampini       ierr = MatTransposeMatMult(coarse_phi_B,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM4);CHKERRQ(ierr);
371953cdbc3dSStefano Zampini       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
372053cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,one,TM2,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
372153cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,one,TM3,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
372253cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,one,TM4,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
372353cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,m_one,coarse_sub_mat,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
372453cdbc3dSStefano Zampini       ierr = MatNorm(TM1,NORM_INFINITY,&value);CHKERRQ(ierr);
37250c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"----------------------------------\n");CHKERRQ(ierr);
37260c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d \n",PetscGlobalRank);CHKERRQ(ierr);
37270c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"matrix error = % 1.14e\n",value);CHKERRQ(ierr);
37280c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"coarse functions errors\n");CHKERRQ(ierr);
372953cdbc3dSStefano Zampini       for (i=0;i<pcbddc->local_primal_size;i++) { ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local %02d-th function error = % 1.14e\n",i,coarsefunctions_errors[i]);CHKERRQ(ierr); }
37300c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"constraints errors\n");CHKERRQ(ierr);
373153cdbc3dSStefano Zampini       for (i=0;i<pcbddc->local_primal_size;i++) { ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local %02d-th function error = % 1.14e\n",i,constraints_errors[i]);CHKERRQ(ierr); }
37320c7d97c5SJed Brown       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
373353cdbc3dSStefano Zampini       ierr = MatDestroy(&A_II);CHKERRQ(ierr);
373453cdbc3dSStefano Zampini       ierr = MatDestroy(&A_BB);CHKERRQ(ierr);
373553cdbc3dSStefano Zampini       ierr = MatDestroy(&A_IB);CHKERRQ(ierr);
373653cdbc3dSStefano Zampini       ierr = MatDestroy(&A_BI);CHKERRQ(ierr);
373753cdbc3dSStefano Zampini       ierr = MatDestroy(&TM1);CHKERRQ(ierr);
373853cdbc3dSStefano Zampini       ierr = MatDestroy(&TM2);CHKERRQ(ierr);
373953cdbc3dSStefano Zampini       ierr = MatDestroy(&TM3);CHKERRQ(ierr);
374053cdbc3dSStefano Zampini       ierr = MatDestroy(&TM4);CHKERRQ(ierr);
374153cdbc3dSStefano Zampini       ierr = MatDestroy(&coarse_phi_D);CHKERRQ(ierr);
374253cdbc3dSStefano Zampini       ierr = MatDestroy(&coarse_sub_mat);CHKERRQ(ierr);
374353cdbc3dSStefano Zampini       ierr = MatDestroy(&coarse_phi_B);CHKERRQ(ierr);
37440c7d97c5SJed Brown       ierr = PetscFree(coarsefunctions_errors);CHKERRQ(ierr);
37450c7d97c5SJed Brown       ierr = PetscFree(constraints_errors);CHKERRQ(ierr);
37460c7d97c5SJed Brown     }
37470c7d97c5SJed Brown     /* free memory */
37483b03a366Sstefano_zampini     if (n_vertices) {
37490c7d97c5SJed Brown       ierr = VecDestroy(&vec1_V);CHKERRQ(ierr);
37500c7d97c5SJed Brown       ierr = VecDestroy(&vec2_V);CHKERRQ(ierr);
37510c7d97c5SJed Brown       ierr = MatDestroy(&A_RV);CHKERRQ(ierr);
37520c7d97c5SJed Brown       ierr = MatDestroy(&A_VR);CHKERRQ(ierr);
37530c7d97c5SJed Brown       ierr = MatDestroy(&A_VV);CHKERRQ(ierr);
37540c7d97c5SJed Brown     }
3755534831adSStefano Zampini     if (n_constraints) {
37560c7d97c5SJed Brown       ierr = VecDestroy(&vec1_C);CHKERRQ(ierr);
37570c7d97c5SJed Brown       ierr = VecDestroy(&vec2_C);CHKERRQ(ierr);
37580c7d97c5SJed Brown       ierr = MatDestroy(&M1);CHKERRQ(ierr);
37590c7d97c5SJed Brown       ierr = MatDestroy(&C_CR);CHKERRQ(ierr);
37600c7d97c5SJed Brown     }
3761a929c220SStefano Zampini     ierr = PetscFree(auxindices);CHKERRQ(ierr);
3762a929c220SStefano Zampini     ierr = PetscFree(nnz);CHKERRQ(ierr);
3763a929c220SStefano Zampini     /* create coarse matrix and data structures for message passing associated actual choice of coarse problem type */
3764a929c220SStefano Zampini     ierr = PCBDDCSetupCoarseEnvironment(pc,coarse_submat_vals);CHKERRQ(ierr);
3765a929c220SStefano Zampini     ierr = PetscFree(coarse_submat_vals);CHKERRQ(ierr);
37660c7d97c5SJed Brown   }
37670c7d97c5SJed Brown   /* free memory */
37683b03a366Sstefano_zampini   if (n_vertices) {
37690c7d97c5SJed Brown     ierr = PetscFree(idx_V_B);CHKERRQ(ierr);
37700c7d97c5SJed Brown     ierr = ISDestroy(&is_V_local);CHKERRQ(ierr);
37710c7d97c5SJed Brown   }
37720c7d97c5SJed Brown   ierr = ISDestroy(&is_R_local);CHKERRQ(ierr);
37730c7d97c5SJed Brown 
37740c7d97c5SJed Brown   PetscFunctionReturn(0);
37750c7d97c5SJed Brown }
37760c7d97c5SJed Brown 
37770c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
37780c7d97c5SJed Brown 
37790c7d97c5SJed Brown #undef __FUNCT__
37800c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetupCoarseEnvironment"
378153cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetupCoarseEnvironment(PC pc,PetscScalar* coarse_submat_vals)
37820c7d97c5SJed Brown {
37830c7d97c5SJed Brown 
37840c7d97c5SJed Brown 
37850c7d97c5SJed Brown   Mat_IS    *matis    = (Mat_IS*)pc->pmat->data;
37860c7d97c5SJed Brown   PC_BDDC   *pcbddc   = (PC_BDDC*)pc->data;
37870c7d97c5SJed Brown   PC_IS     *pcis     = (PC_IS*)pc->data;
37880c7d97c5SJed Brown   MPI_Comm  prec_comm = ((PetscObject)pc)->comm;
37890c7d97c5SJed Brown   MPI_Comm  coarse_comm;
37900c7d97c5SJed Brown 
37910c7d97c5SJed Brown   /* common to all choices */
37920c7d97c5SJed Brown   PetscScalar *temp_coarse_mat_vals;
37930c7d97c5SJed Brown   PetscScalar *ins_coarse_mat_vals;
37940c7d97c5SJed Brown   PetscInt    *ins_local_primal_indices;
37950c7d97c5SJed Brown   PetscMPIInt *localsizes2,*localdispl2;
37960c7d97c5SJed Brown   PetscMPIInt size_prec_comm;
37970c7d97c5SJed Brown   PetscMPIInt rank_prec_comm;
37980c7d97c5SJed Brown   PetscMPIInt active_rank=MPI_PROC_NULL;
37990c7d97c5SJed Brown   PetscMPIInt master_proc=0;
38000c7d97c5SJed Brown   PetscInt    ins_local_primal_size;
38010c7d97c5SJed Brown   /* specific to MULTILEVEL_BDDC */
38020c7d97c5SJed Brown   PetscMPIInt *ranks_recv;
38030c7d97c5SJed Brown   PetscMPIInt count_recv=0;
38040c7d97c5SJed Brown   PetscMPIInt rank_coarse_proc_send_to;
38050c7d97c5SJed Brown   PetscMPIInt coarse_color = MPI_UNDEFINED;
38060c7d97c5SJed Brown   ISLocalToGlobalMapping coarse_ISLG;
38070c7d97c5SJed Brown   /* some other variables */
38080c7d97c5SJed Brown   PetscErrorCode ierr;
380919fd82e9SBarry Smith   MatType coarse_mat_type;
381019fd82e9SBarry Smith   PCType  coarse_pc_type;
381119fd82e9SBarry Smith   KSPType coarse_ksp_type;
381253cdbc3dSStefano Zampini   PC pc_temp;
38134fad6a16SStefano Zampini   PetscInt i,j,k;
38143b03a366Sstefano_zampini   PetscInt max_it_coarse_ksp=1;  /* don't increase this value */
3815e269702eSStefano Zampini   /* verbose output viewer */
3816e269702eSStefano Zampini   PetscViewer viewer=pcbddc->dbg_viewer;
3817e269702eSStefano Zampini   PetscBool   dbg_flag=pcbddc->dbg_flag;
3818142dfd88SStefano Zampini 
3819ea7e1babSStefano Zampini   PetscInt      offset,offset2;
3820a929c220SStefano Zampini   PetscMPIInt   im_active,active_procs;
3821523858cfSStefano Zampini   PetscInt      *dnz,*onz;
3822142dfd88SStefano Zampini 
3823142dfd88SStefano Zampini   PetscBool     setsym,issym=PETSC_FALSE;
38240c7d97c5SJed Brown 
38250c7d97c5SJed Brown   PetscFunctionBegin;
38260c7d97c5SJed Brown   ins_local_primal_indices = 0;
38270c7d97c5SJed Brown   ins_coarse_mat_vals      = 0;
38280c7d97c5SJed Brown   localsizes2              = 0;
38290c7d97c5SJed Brown   localdispl2              = 0;
38300c7d97c5SJed Brown   temp_coarse_mat_vals     = 0;
38310c7d97c5SJed Brown   coarse_ISLG              = 0;
38320c7d97c5SJed Brown 
383353cdbc3dSStefano Zampini   ierr = MPI_Comm_size(prec_comm,&size_prec_comm);CHKERRQ(ierr);
383453cdbc3dSStefano Zampini   ierr = MPI_Comm_rank(prec_comm,&rank_prec_comm);CHKERRQ(ierr);
3835142dfd88SStefano Zampini   ierr = MatIsSymmetricKnown(pc->pmat,&setsym,&issym);CHKERRQ(ierr);
3836142dfd88SStefano Zampini 
3837beed3852SStefano Zampini   /* Assign global numbering to coarse dofs */
3838beed3852SStefano Zampini   {
3839ef028eecSStefano Zampini     PetscInt     *auxlocal_primal;
3840da1bb401SStefano Zampini     PetscInt     *row_cmat_indices;
38412e8d2280SStefano Zampini     PetscInt     *aux_ordering;
38422e8d2280SStefano Zampini     PetscInt     *row_cmat_global_indices;
3843ef028eecSStefano Zampini     PetscInt     *dof_sizes,*dof_displs;
38443b03a366Sstefano_zampini     PetscInt     size_of_constraint;
38452e8d2280SStefano Zampini     PetscBool    *array_bool;
3846ef028eecSStefano Zampini     PetscBool    first_found;
3847ef028eecSStefano Zampini     PetscInt     first_index,old_index,s;
3848ef028eecSStefano Zampini     PetscMPIInt  mpi_local_primal_size;
3849ef028eecSStefano Zampini     PetscScalar  coarsesum,*array;
3850ef028eecSStefano Zampini 
3851ef028eecSStefano Zampini     mpi_local_primal_size = (PetscMPIInt)pcbddc->local_primal_size;
3852beed3852SStefano Zampini 
3853beed3852SStefano Zampini     /* Construct needed data structures for message passing */
3854ef028eecSStefano Zampini     ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscInt),&pcbddc->local_primal_indices);CHKERRQ(ierr);
3855ffe5efe1SStefano Zampini     j = 0;
3856142dfd88SStefano Zampini     if (rank_prec_comm == 0 || pcbddc->coarse_problem_type == REPLICATED_BDDC || pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
3857ffe5efe1SStefano Zampini       j = size_prec_comm;
3858ffe5efe1SStefano Zampini     }
3859ffe5efe1SStefano Zampini     ierr = PetscMalloc(j*sizeof(PetscMPIInt),&pcbddc->local_primal_sizes);CHKERRQ(ierr);
3860ffe5efe1SStefano Zampini     ierr = PetscMalloc(j*sizeof(PetscMPIInt),&pcbddc->local_primal_displacements);CHKERRQ(ierr);
3861beed3852SStefano Zampini     /* Gather local_primal_size information for all processes  */
3862142dfd88SStefano Zampini     if (pcbddc->coarse_problem_type == REPLICATED_BDDC || pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
38635619798eSStefano Zampini       ierr = MPI_Allgather(&mpi_local_primal_size,1,MPIU_INT,&pcbddc->local_primal_sizes[0],1,MPIU_INT,prec_comm);CHKERRQ(ierr);
3864ffe5efe1SStefano Zampini     } else {
3865ffe5efe1SStefano Zampini       ierr = MPI_Gather(&mpi_local_primal_size,1,MPIU_INT,&pcbddc->local_primal_sizes[0],1,MPIU_INT,0,prec_comm);CHKERRQ(ierr);
3866ffe5efe1SStefano Zampini     }
3867beed3852SStefano Zampini     pcbddc->replicated_primal_size = 0;
3868ffe5efe1SStefano Zampini     for (i=0; i<j; i++) {
3869beed3852SStefano Zampini       pcbddc->local_primal_displacements[i] = pcbddc->replicated_primal_size ;
3870beed3852SStefano Zampini       pcbddc->replicated_primal_size += pcbddc->local_primal_sizes[i];
3871beed3852SStefano Zampini     }
3872beed3852SStefano Zampini 
3873da1bb401SStefano Zampini     /* First let's count coarse dofs.
3874beed3852SStefano Zampini        This code fragment assumes that the number of local constraints per connected component
3875beed3852SStefano Zampini        is not greater than the number of nodes defined for the connected component
3876beed3852SStefano Zampini        (otherwise we will surely have linear dependence between constraints and thus a singular coarse problem) */
3877ef028eecSStefano Zampini     ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscInt),&auxlocal_primal);CHKERRQ(ierr);
38782e8d2280SStefano Zampini     j = 0;
38792e8d2280SStefano Zampini     for (i=0;i<pcbddc->local_primal_size;i++) {
38802e8d2280SStefano Zampini       ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr);
38812e8d2280SStefano Zampini       if ( j < size_of_constraint ) {
38822e8d2280SStefano Zampini         j = size_of_constraint;
38832e8d2280SStefano Zampini       }
38842e8d2280SStefano Zampini       ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr);
38852e8d2280SStefano Zampini     }
38862e8d2280SStefano Zampini     ierr = PetscMalloc(j*sizeof(PetscInt),&aux_ordering);CHKERRQ(ierr);
38872e8d2280SStefano Zampini     ierr = PetscMalloc(j*sizeof(PetscInt),&row_cmat_global_indices);CHKERRQ(ierr);
38882e8d2280SStefano Zampini     ierr = PetscMalloc(pcis->n*sizeof(PetscBool),&array_bool);CHKERRQ(ierr);
38892e8d2280SStefano Zampini     for (i=0;i<pcis->n;i++) {
38902e8d2280SStefano Zampini       array_bool[i] = PETSC_FALSE;
38912e8d2280SStefano Zampini     }
3892da1bb401SStefano Zampini     for (i=0;i<pcbddc->local_primal_size;i++) {
3893da1bb401SStefano Zampini       ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
38943b03a366Sstefano_zampini       for (j=0; j<size_of_constraint; j++) {
38952e8d2280SStefano Zampini         aux_ordering[j] = j;
38962e8d2280SStefano Zampini       }
38972e8d2280SStefano Zampini       ierr = ISLocalToGlobalMappingApply(matis->mapping,size_of_constraint,row_cmat_indices,row_cmat_global_indices);CHKERRQ(ierr);
38982e8d2280SStefano Zampini       ierr = PetscSortIntWithPermutation(size_of_constraint,row_cmat_global_indices,aux_ordering);CHKERRQ(ierr);
38992e8d2280SStefano Zampini       for (j=0; j<size_of_constraint; j++) {
39002e8d2280SStefano Zampini         k = row_cmat_indices[aux_ordering[j]];
39012e8d2280SStefano Zampini         if ( !array_bool[k] ) {
39022e8d2280SStefano Zampini           array_bool[k] = PETSC_TRUE;
3903da1bb401SStefano Zampini           auxlocal_primal[i] = k;
3904beed3852SStefano Zampini           break;
3905beed3852SStefano Zampini         }
3906beed3852SStefano Zampini       }
3907da1bb401SStefano Zampini       ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
3908beed3852SStefano Zampini     }
39092e8d2280SStefano Zampini     ierr = PetscFree(aux_ordering);CHKERRQ(ierr);
3910ef028eecSStefano Zampini     ierr = PetscFree(array_bool);CHKERRQ(ierr);
3911ef028eecSStefano Zampini     ierr = PetscFree(row_cmat_global_indices);CHKERRQ(ierr);
39122e8d2280SStefano Zampini 
3913ef028eecSStefano Zampini     /* Compute number of coarse dofs */
3914ef028eecSStefano Zampini     ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
3915ef028eecSStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3916ef028eecSStefano Zampini     for (i=0;i<pcbddc->local_primal_size;i++) {
3917ef028eecSStefano Zampini       array[auxlocal_primal[i]]=1.0;
3918ef028eecSStefano Zampini     }
3919ef028eecSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3920ef028eecSStefano Zampini     ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
3921ef028eecSStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3922ef028eecSStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3923ef028eecSStefano Zampini     ierr = VecSum(pcis->vec1_global,&coarsesum);CHKERRQ(ierr);
3924ef028eecSStefano Zampini     pcbddc->coarse_size = (PetscInt)coarsesum;
3925ef028eecSStefano Zampini 
3926ef028eecSStefano Zampini     /* Fill pcis->vec1_global with cumulative function for global numbering */
3927ef028eecSStefano Zampini     ierr = VecGetArray(pcis->vec1_global,&array);CHKERRQ(ierr);
3928ef028eecSStefano Zampini     ierr = VecGetLocalSize(pcis->vec1_global,&s);CHKERRQ(ierr);
3929ef028eecSStefano Zampini     k = 0;
3930ef028eecSStefano Zampini     first_index = -1;
3931ef028eecSStefano Zampini     first_found = PETSC_FALSE;
3932ef028eecSStefano Zampini     for (i=0;i<s;i++) {
3933ef028eecSStefano Zampini       if (!first_found && array[i] > 0.0) {
3934ef028eecSStefano Zampini         first_found = PETSC_TRUE;
3935ef028eecSStefano Zampini         first_index = i;
3936ef028eecSStefano Zampini       }
3937ef028eecSStefano Zampini       k += (PetscInt)array[i];
3938ef028eecSStefano Zampini     }
3939ef028eecSStefano Zampini     j = ( !rank_prec_comm ? size_prec_comm : 0);
3940ef028eecSStefano Zampini     ierr = PetscMalloc(j*sizeof(*dof_sizes),&dof_sizes);CHKERRQ(ierr);
3941ef028eecSStefano Zampini     ierr = PetscMalloc(j*sizeof(*dof_displs),&dof_displs);CHKERRQ(ierr);
3942ef028eecSStefano Zampini     ierr = MPI_Gather(&k,1,MPIU_INT,dof_sizes,1,MPIU_INT,0,prec_comm);CHKERRQ(ierr);
3943ef028eecSStefano Zampini     if (!rank_prec_comm) {
3944ef028eecSStefano Zampini       dof_displs[0]=0;
3945ef028eecSStefano Zampini       for (i=1;i<size_prec_comm;i++) {
3946ef028eecSStefano Zampini         dof_displs[i] = dof_displs[i-1]+dof_sizes[i-1];
3947ef028eecSStefano Zampini       }
3948ef028eecSStefano Zampini     }
3949ef028eecSStefano Zampini     ierr = MPI_Scatter(dof_displs,1,MPIU_INT,&k,1,MPIU_INT,0,prec_comm);CHKERRQ(ierr);
3950ef028eecSStefano Zampini     if (first_found) {
3951ef028eecSStefano Zampini       array[first_index] += k;
3952ef028eecSStefano Zampini       old_index = first_index;
3953ef028eecSStefano Zampini       for (i=first_index+1;i<s;i++) {
3954ef028eecSStefano Zampini         if (array[i] > 0.0) {
3955ef028eecSStefano Zampini           array[i] += array[old_index];
3956ef028eecSStefano Zampini           old_index = i;
3957ef028eecSStefano Zampini         }
3958ef028eecSStefano Zampini       }
3959ef028eecSStefano Zampini     }
3960ef028eecSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_global,&array);CHKERRQ(ierr);
3961ef028eecSStefano Zampini     ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
3962ef028eecSStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3963ef028eecSStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3964ef028eecSStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3965ef028eecSStefano Zampini     for (i=0;i<pcbddc->local_primal_size;i++) {
3966ef028eecSStefano Zampini       pcbddc->local_primal_indices[i] = (PetscInt)array[auxlocal_primal[i]]-1;
3967ef028eecSStefano Zampini     }
3968ef028eecSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3969ef028eecSStefano Zampini     ierr = PetscFree(dof_displs);CHKERRQ(ierr);
3970ef028eecSStefano Zampini     ierr = PetscFree(dof_sizes);CHKERRQ(ierr);
3971ef028eecSStefano Zampini 
3972ef028eecSStefano Zampini     if (dbg_flag) {
39732e8d2280SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
39742e8d2280SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
39752e8d2280SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Check coarse indices\n");CHKERRQ(ierr);
39762e8d2280SStefano Zampini       ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
39772e8d2280SStefano Zampini       ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3978ef028eecSStefano Zampini       for (i=0;i<pcbddc->local_primal_size;i++) {
3979ef028eecSStefano Zampini         array[auxlocal_primal[i]]=1.0;
39802e8d2280SStefano Zampini       }
3981beed3852SStefano Zampini       ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
39822e8d2280SStefano Zampini       ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
3983da1bb401SStefano Zampini       ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3984da1bb401SStefano Zampini       ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3985da1bb401SStefano Zampini       ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3986da1bb401SStefano Zampini       ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3987da1bb401SStefano Zampini       ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
39882e8d2280SStefano Zampini       for (i=0;i<pcis->n;i++) {
39892e8d2280SStefano Zampini         if (array[i] == 1.0) {
39902e8d2280SStefano Zampini           ierr = ISLocalToGlobalMappingApply(matis->mapping,1,&i,&j);CHKERRQ(ierr);
39912e8d2280SStefano Zampini           ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d: WRONG COARSE INDEX %d (local %d)\n",PetscGlobalRank,j,i);CHKERRQ(ierr);
39922e8d2280SStefano Zampini         }
39932e8d2280SStefano Zampini       }
39942e8d2280SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
39952e8d2280SStefano Zampini       for (i=0;i<pcis->n;i++) {
39962e8d2280SStefano Zampini         if( array[i] > 0.0) {
39972e8d2280SStefano Zampini           array[i] = 1.0/array[i];
39982e8d2280SStefano Zampini         }
39992e8d2280SStefano Zampini       }
4000da1bb401SStefano Zampini       ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
40012e8d2280SStefano Zampini       ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
4002da1bb401SStefano Zampini       ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4003da1bb401SStefano Zampini       ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4004da1bb401SStefano Zampini       ierr = VecSum(pcis->vec1_global,&coarsesum);CHKERRQ(ierr);
40052e8d2280SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Size of coarse problem SHOULD be %lf\n",coarsesum);CHKERRQ(ierr);
40062e8d2280SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
40072e8d2280SStefano Zampini     }
4008142dfd88SStefano Zampini     ierr = PetscFree(auxlocal_primal);CHKERRQ(ierr);
40090bdf917eSStefano Zampini   }
40100bdf917eSStefano Zampini 
40112e8d2280SStefano Zampini   if (dbg_flag) {
40127cf533a6SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"Size of coarse problem is %d\n",pcbddc->coarse_size);CHKERRQ(ierr);
40132e8d2280SStefano Zampini     /*ierr = PetscViewerASCIIPrintf(viewer,"Distribution of local primal indices\n");CHKERRQ(ierr);
40142e8d2280SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
40152e8d2280SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d\n",PetscGlobalRank);CHKERRQ(ierr);
40162e8d2280SStefano Zampini     for (i=0;i<pcbddc->local_primal_size;i++) {
40172e8d2280SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local_primal_indices[%d]=%d \n",i,pcbddc->local_primal_indices[i]);
40182e8d2280SStefano Zampini     }*/
40192e8d2280SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
40202e8d2280SStefano Zampini   }
40212e8d2280SStefano Zampini 
4022a929c220SStefano Zampini   im_active = 0;
40230bdf917eSStefano Zampini   if (pcis->n) { im_active = 1; }
4024a929c220SStefano Zampini   ierr = MPI_Allreduce(&im_active,&active_procs,1,MPIU_INT,MPI_SUM,prec_comm);CHKERRQ(ierr);
40250bdf917eSStefano Zampini 
40260bdf917eSStefano Zampini   /* adapt coarse problem type */
40274fad6a16SStefano Zampini   if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
40284fad6a16SStefano Zampini     if (pcbddc->current_level < pcbddc->max_levels) {
4029a929c220SStefano Zampini       if ( (active_procs/pcbddc->coarsening_ratio) < 2 ) {
40300bdf917eSStefano Zampini         if (dbg_flag) {
4031a929c220SStefano Zampini           ierr = PetscViewerASCIIPrintf(viewer,"Not enough active processes on level %d (active %d,ratio %d). Parallel direct solve for coarse problem\n",pcbddc->current_level,active_procs,pcbddc->coarsening_ratio);CHKERRQ(ierr);
40320bdf917eSStefano Zampini          ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
40330bdf917eSStefano Zampini         }
40340bdf917eSStefano Zampini         pcbddc->coarse_problem_type = PARALLEL_BDDC;
4035142dfd88SStefano Zampini       }
40364fad6a16SStefano Zampini     } else {
40374fad6a16SStefano Zampini       if (dbg_flag) {
4038a929c220SStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"Max number of levels reached. Using parallel direct solve for coarse problem\n",pcbddc->max_levels,active_procs,pcbddc->coarsening_ratio);CHKERRQ(ierr);
40394fad6a16SStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
40404fad6a16SStefano Zampini       }
40414fad6a16SStefano Zampini       pcbddc->coarse_problem_type = PARALLEL_BDDC;
40424fad6a16SStefano Zampini     }
40434fad6a16SStefano Zampini   }
4044beed3852SStefano Zampini 
40450c7d97c5SJed Brown   switch(pcbddc->coarse_problem_type){
40460c7d97c5SJed Brown 
4047da1bb401SStefano Zampini     case(MULTILEVEL_BDDC):   /* we define a coarse mesh where subdomains are elements */
40480c7d97c5SJed Brown     {
40490c7d97c5SJed Brown       /* we need additional variables */
40500c7d97c5SJed Brown       MetisInt    n_subdomains,n_parts,objval,ncon,faces_nvtxs;
40510c7d97c5SJed Brown       MetisInt    *metis_coarse_subdivision;
40520c7d97c5SJed Brown       MetisInt    options[METIS_NOPTIONS];
40530c7d97c5SJed Brown       PetscMPIInt size_coarse_comm,rank_coarse_comm;
40540c7d97c5SJed Brown       PetscMPIInt procs_jumps_coarse_comm;
40550c7d97c5SJed Brown       PetscMPIInt *coarse_subdivision;
40560c7d97c5SJed Brown       PetscMPIInt *total_count_recv;
40570c7d97c5SJed Brown       PetscMPIInt *total_ranks_recv;
40580c7d97c5SJed Brown       PetscMPIInt *displacements_recv;
40590c7d97c5SJed Brown       PetscMPIInt *my_faces_connectivity;
40600c7d97c5SJed Brown       PetscMPIInt *petsc_faces_adjncy;
40610c7d97c5SJed Brown       MetisInt    *faces_adjncy;
40620c7d97c5SJed Brown       MetisInt    *faces_xadj;
40630c7d97c5SJed Brown       PetscMPIInt *number_of_faces;
40640c7d97c5SJed Brown       PetscMPIInt *faces_displacements;
40650c7d97c5SJed Brown       PetscInt    *array_int;
40660c7d97c5SJed Brown       PetscMPIInt my_faces=0;
40670c7d97c5SJed Brown       PetscMPIInt total_faces=0;
40683828260eSStefano Zampini       PetscInt    ranks_stretching_ratio;
40690c7d97c5SJed Brown 
40700c7d97c5SJed Brown       /* define some quantities */
40710c7d97c5SJed Brown       pcbddc->coarse_communications_type = SCATTERS_BDDC;
40720c7d97c5SJed Brown       coarse_mat_type = MATIS;
40730c7d97c5SJed Brown       coarse_pc_type  = PCBDDC;
4074142dfd88SStefano Zampini       coarse_ksp_type = KSPRICHARDSON;
40750c7d97c5SJed Brown 
40760c7d97c5SJed Brown       /* details of coarse decomposition */
4077a929c220SStefano Zampini       n_subdomains = active_procs;
40780c7d97c5SJed Brown       n_parts      = n_subdomains/pcbddc->coarsening_ratio;
4079a929c220SStefano Zampini       ranks_stretching_ratio = size_prec_comm/active_procs;
40803828260eSStefano Zampini       procs_jumps_coarse_comm = pcbddc->coarsening_ratio*ranks_stretching_ratio;
40813828260eSStefano Zampini 
4082a929c220SStefano Zampini #if 0
4083a929c220SStefano Zampini       PetscMPIInt *old_ranks;
4084a929c220SStefano Zampini       PetscInt    *new_ranks,*jj,*ii;
4085a929c220SStefano Zampini       MatPartitioning mat_part;
4086a929c220SStefano Zampini       IS coarse_new_decomposition,is_numbering;
4087a929c220SStefano Zampini       PetscViewer viewer_test;
4088a929c220SStefano Zampini       MPI_Comm    test_coarse_comm;
4089a929c220SStefano Zampini       PetscMPIInt test_coarse_color;
4090a929c220SStefano Zampini       Mat         mat_adj;
4091a929c220SStefano Zampini       /* Create new communicator for coarse problem splitting the old one */
4092a929c220SStefano Zampini       /* procs with coarse_color = MPI_UNDEFINED will have coarse_comm = MPI_COMM_NULL (from mpi standards)
4093a929c220SStefano Zampini          key = rank_prec_comm -> keep same ordering of ranks from the old to the new communicator */
4094a929c220SStefano Zampini       test_coarse_color = ( im_active ? 0 : MPI_UNDEFINED );
4095a929c220SStefano Zampini       test_coarse_comm = MPI_COMM_NULL;
4096a929c220SStefano Zampini       ierr = MPI_Comm_split(prec_comm,test_coarse_color,rank_prec_comm,&test_coarse_comm);CHKERRQ(ierr);
4097a929c220SStefano Zampini       if (im_active) {
4098a929c220SStefano Zampini         ierr = PetscMalloc(n_subdomains*sizeof(PetscMPIInt),&old_ranks);
4099a929c220SStefano Zampini         ierr = PetscMalloc(size_prec_comm*sizeof(PetscInt),&new_ranks);
4100a929c220SStefano Zampini         ierr = MPI_Comm_rank(test_coarse_comm,&rank_coarse_comm);CHKERRQ(ierr);
4101a929c220SStefano Zampini         ierr = MPI_Comm_size(test_coarse_comm,&j);CHKERRQ(ierr);
4102a929c220SStefano Zampini         ierr = MPI_Allgather(&rank_prec_comm,1,MPIU_INT,old_ranks,1,MPIU_INT,test_coarse_comm);CHKERRQ(ierr);
4103a929c220SStefano Zampini         for (i=0;i<size_prec_comm;i++) {
4104a929c220SStefano Zampini           new_ranks[i] = -1;
4105a929c220SStefano Zampini         }
4106a929c220SStefano Zampini         for (i=0;i<n_subdomains;i++) {
4107a929c220SStefano Zampini           new_ranks[old_ranks[i]] = i;
4108a929c220SStefano Zampini         }
4109a929c220SStefano Zampini         ierr = PetscViewerASCIIOpen(test_coarse_comm,"test_mat_part.out",&viewer_test);CHKERRQ(ierr);
4110a929c220SStefano Zampini         k = pcis->n_neigh-1;
4111a929c220SStefano Zampini         ierr = PetscMalloc(2*sizeof(PetscInt),&ii);
4112a929c220SStefano Zampini         ii[0]=0;
4113a929c220SStefano Zampini         ii[1]=k;
4114a929c220SStefano Zampini         ierr = PetscMalloc(k*sizeof(PetscInt),&jj);
4115a929c220SStefano Zampini         for (i=0;i<k;i++) {
4116a929c220SStefano Zampini           jj[i]=new_ranks[pcis->neigh[i+1]];
4117a929c220SStefano Zampini         }
4118a929c220SStefano Zampini         ierr = PetscSortInt(k,jj);CHKERRQ(ierr);
4119a929c220SStefano Zampini         ierr = MatCreateMPIAdj(test_coarse_comm,1,n_subdomains,ii,jj,PETSC_NULL,&mat_adj);CHKERRQ(ierr);
4120a929c220SStefano Zampini         ierr = MatView(mat_adj,viewer_test);CHKERRQ(ierr);
4121a929c220SStefano Zampini         ierr = MatPartitioningCreate(test_coarse_comm,&mat_part);CHKERRQ(ierr);
4122a929c220SStefano Zampini         ierr = MatPartitioningSetAdjacency(mat_part,mat_adj);CHKERRQ(ierr);
4123a929c220SStefano Zampini         ierr = MatPartitioningSetFromOptions(mat_part);CHKERRQ(ierr);
4124a929c220SStefano Zampini         printf("Setting Nparts %d\n",n_parts);
4125a929c220SStefano Zampini         ierr = MatPartitioningSetNParts(mat_part,n_parts);CHKERRQ(ierr);
4126a929c220SStefano Zampini         ierr = MatPartitioningView(mat_part,viewer_test);CHKERRQ(ierr);
4127a929c220SStefano Zampini         ierr = MatPartitioningApply(mat_part,&coarse_new_decomposition);CHKERRQ(ierr);
4128a929c220SStefano Zampini         ierr = ISView(coarse_new_decomposition,viewer_test);CHKERRQ(ierr);
4129a929c220SStefano Zampini         ierr = ISPartitioningToNumbering(coarse_new_decomposition,&is_numbering);CHKERRQ(ierr);
4130a929c220SStefano Zampini         ierr = ISView(is_numbering,viewer_test);CHKERRQ(ierr);
4131a929c220SStefano Zampini         ierr = PetscViewerDestroy(&viewer_test);CHKERRQ(ierr);
4132a929c220SStefano Zampini         ierr = ISDestroy(&coarse_new_decomposition);CHKERRQ(ierr);
4133a929c220SStefano Zampini         ierr = ISDestroy(&is_numbering);CHKERRQ(ierr);
4134a929c220SStefano Zampini         ierr = MatPartitioningDestroy(&mat_part);CHKERRQ(ierr);
4135a929c220SStefano Zampini         ierr = PetscFree(old_ranks);CHKERRQ(ierr);
4136a929c220SStefano Zampini         ierr = PetscFree(new_ranks);CHKERRQ(ierr);
4137a929c220SStefano Zampini         ierr = MPI_Comm_free(&test_coarse_comm);CHKERRQ(ierr);
4138a929c220SStefano Zampini       }
4139a929c220SStefano Zampini #endif
4140a929c220SStefano Zampini 
41414fad6a16SStefano Zampini       /* build CSR graph of subdomains' connectivity */
41420c7d97c5SJed Brown       ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&array_int);CHKERRQ(ierr);
41433828260eSStefano Zampini       ierr = PetscMemzero(array_int,pcis->n*sizeof(PetscInt));CHKERRQ(ierr);
41440c7d97c5SJed Brown       for (i=1;i<pcis->n_neigh;i++){/* i=1 so I don't count myself -> faces nodes counts to 1 */
41450c7d97c5SJed Brown         for (j=0;j<pcis->n_shared[i];j++){
41460c7d97c5SJed Brown           array_int[ pcis->shared[i][j] ]+=1;
41470c7d97c5SJed Brown         }
41480c7d97c5SJed Brown       }
41490c7d97c5SJed Brown       for (i=1;i<pcis->n_neigh;i++){
41500c7d97c5SJed Brown         for (j=0;j<pcis->n_shared[i];j++){
41517cf533a6SStefano Zampini           if (array_int[ pcis->shared[i][j] ] > 0 ){
41520c7d97c5SJed Brown             my_faces++;
41530c7d97c5SJed Brown             break;
41540c7d97c5SJed Brown           }
41550c7d97c5SJed Brown         }
41560c7d97c5SJed Brown       }
41570c7d97c5SJed Brown 
415853cdbc3dSStefano Zampini       ierr = MPI_Reduce(&my_faces,&total_faces,1,MPIU_INT,MPI_SUM,master_proc,prec_comm);CHKERRQ(ierr);
41590c7d97c5SJed Brown       ierr = PetscMalloc (my_faces*sizeof(PetscInt),&my_faces_connectivity);CHKERRQ(ierr);
41600c7d97c5SJed Brown       my_faces=0;
41610c7d97c5SJed Brown       for (i=1;i<pcis->n_neigh;i++){
41620c7d97c5SJed Brown         for (j=0;j<pcis->n_shared[i];j++){
41637cf533a6SStefano Zampini           if (array_int[ pcis->shared[i][j] ] > 0 ){
41640c7d97c5SJed Brown             my_faces_connectivity[my_faces]=pcis->neigh[i];
41650c7d97c5SJed Brown             my_faces++;
41660c7d97c5SJed Brown             break;
41670c7d97c5SJed Brown           }
41680c7d97c5SJed Brown         }
41690c7d97c5SJed Brown       }
41700c7d97c5SJed Brown       if (rank_prec_comm == master_proc) {
41710c7d97c5SJed Brown         ierr = PetscMalloc (total_faces*sizeof(PetscMPIInt),&petsc_faces_adjncy);CHKERRQ(ierr);
41720c7d97c5SJed Brown         ierr = PetscMalloc (size_prec_comm*sizeof(PetscMPIInt),&number_of_faces);CHKERRQ(ierr);
41730c7d97c5SJed Brown         ierr = PetscMalloc (total_faces*sizeof(MetisInt),&faces_adjncy);CHKERRQ(ierr);
41740c7d97c5SJed Brown         ierr = PetscMalloc ((n_subdomains+1)*sizeof(MetisInt),&faces_xadj);CHKERRQ(ierr);
41750c7d97c5SJed Brown         ierr = PetscMalloc ((size_prec_comm+1)*sizeof(PetscMPIInt),&faces_displacements);CHKERRQ(ierr);
41760c7d97c5SJed Brown       }
417753cdbc3dSStefano Zampini       ierr = MPI_Gather(&my_faces,1,MPIU_INT,&number_of_faces[0],1,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
41780c7d97c5SJed Brown       if (rank_prec_comm == master_proc) {
41790c7d97c5SJed Brown         faces_xadj[0]=0;
41800c7d97c5SJed Brown         faces_displacements[0]=0;
41810c7d97c5SJed Brown         j=0;
41820c7d97c5SJed Brown         for (i=1;i<size_prec_comm+1;i++) {
41830c7d97c5SJed Brown           faces_displacements[i]=faces_displacements[i-1]+number_of_faces[i-1];
41840c7d97c5SJed Brown           if (number_of_faces[i-1]) {
41850c7d97c5SJed Brown             j++;
41860c7d97c5SJed Brown             faces_xadj[j]=faces_xadj[j-1]+number_of_faces[i-1];
41870c7d97c5SJed Brown           }
41880c7d97c5SJed Brown         }
41890c7d97c5SJed Brown       }
419053cdbc3dSStefano Zampini       ierr = MPI_Gatherv(&my_faces_connectivity[0],my_faces,MPIU_INT,&petsc_faces_adjncy[0],number_of_faces,faces_displacements,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
41910c7d97c5SJed Brown       ierr = PetscFree(my_faces_connectivity);CHKERRQ(ierr);
41920c7d97c5SJed Brown       ierr = PetscFree(array_int);CHKERRQ(ierr);
41930c7d97c5SJed Brown       if (rank_prec_comm == master_proc) {
41943828260eSStefano Zampini         for (i=0;i<total_faces;i++) faces_adjncy[i]=(MetisInt)(petsc_faces_adjncy[i]/ranks_stretching_ratio); /* cast to MetisInt */
4195da1bb401SStefano Zampini         /*printf("This is the face connectivity (actual ranks)\n");
41960c7d97c5SJed Brown         for (i=0;i<n_subdomains;i++){
41970c7d97c5SJed Brown           printf("proc %d is connected with \n",i);
41980c7d97c5SJed Brown           for (j=faces_xadj[i];j<faces_xadj[i+1];j++)
41990c7d97c5SJed Brown             printf("%d ",faces_adjncy[j]);
42000c7d97c5SJed Brown           printf("\n");
4201da1bb401SStefano Zampini         }*/
42020c7d97c5SJed Brown         ierr = PetscFree(faces_displacements);CHKERRQ(ierr);
42030c7d97c5SJed Brown         ierr = PetscFree(number_of_faces);CHKERRQ(ierr);
42040c7d97c5SJed Brown         ierr = PetscFree(petsc_faces_adjncy);CHKERRQ(ierr);
42050c7d97c5SJed Brown       }
42060c7d97c5SJed Brown 
42070c7d97c5SJed Brown       if ( rank_prec_comm == master_proc ) {
42080c7d97c5SJed Brown 
42093828260eSStefano Zampini         PetscInt heuristic_for_metis=3;
42103828260eSStefano Zampini 
42110c7d97c5SJed Brown         ncon=1;
42120c7d97c5SJed Brown         faces_nvtxs=n_subdomains;
42130c7d97c5SJed Brown         /* partition graph induced by face connectivity */
42140c7d97c5SJed Brown         ierr = PetscMalloc (n_subdomains*sizeof(MetisInt),&metis_coarse_subdivision);CHKERRQ(ierr);
42150c7d97c5SJed Brown         ierr = METIS_SetDefaultOptions(options);
42160c7d97c5SJed Brown         /* we need a contiguous partition of the coarse mesh */
42170c7d97c5SJed Brown         options[METIS_OPTION_CONTIG]=1;
42180c7d97c5SJed Brown         options[METIS_OPTION_NITER]=30;
42194fad6a16SStefano Zampini         if (pcbddc->coarsening_ratio > 1) {
42203828260eSStefano Zampini           if (n_subdomains>n_parts*heuristic_for_metis) {
42213828260eSStefano Zampini             options[METIS_OPTION_IPTYPE]=METIS_IPTYPE_EDGE;
42223828260eSStefano Zampini             options[METIS_OPTION_OBJTYPE]=METIS_OBJTYPE_CUT;
42230c7d97c5SJed Brown             ierr = METIS_PartGraphKway(&faces_nvtxs,&ncon,faces_xadj,faces_adjncy,NULL,NULL,NULL,&n_parts,NULL,NULL,options,&objval,metis_coarse_subdivision);
4224142dfd88SStefano Zampini             if (ierr != METIS_OK) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in METIS_PartGraphKway (metis error code %D) called from PCBDDCSetupCoarseEnvironment\n",ierr);
42253828260eSStefano Zampini           } else {
42263828260eSStefano Zampini             ierr = METIS_PartGraphRecursive(&faces_nvtxs,&ncon,faces_xadj,faces_adjncy,NULL,NULL,NULL,&n_parts,NULL,NULL,options,&objval,metis_coarse_subdivision);
4227142dfd88SStefano Zampini             if (ierr != METIS_OK) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in METIS_PartGraphRecursive (metis error code %D) called from PCBDDCSetupCoarseEnvironment\n",ierr);
42283828260eSStefano Zampini           }
42294fad6a16SStefano Zampini         } else {
42304fad6a16SStefano Zampini           for (i=0;i<n_subdomains;i++) {
42314fad6a16SStefano Zampini             metis_coarse_subdivision[i]=i;
42324fad6a16SStefano Zampini           }
42334fad6a16SStefano Zampini         }
42340c7d97c5SJed Brown         ierr = PetscFree(faces_xadj);CHKERRQ(ierr);
42350c7d97c5SJed Brown         ierr = PetscFree(faces_adjncy);CHKERRQ(ierr);
42360bdf917eSStefano Zampini         ierr = PetscMalloc(size_prec_comm*sizeof(PetscMPIInt),&coarse_subdivision);CHKERRQ(ierr);
42370c7d97c5SJed Brown         /* copy/cast values avoiding possible type conflicts between PETSc, MPI and METIS */
42380bdf917eSStefano Zampini         for (i=0;i<size_prec_comm;i++) { coarse_subdivision[i]=MPI_PROC_NULL; }
42390bdf917eSStefano Zampini         for (i=0;i<n_subdomains;i++)   { coarse_subdivision[ranks_stretching_ratio*i]=(PetscInt)(metis_coarse_subdivision[i]); }
42400c7d97c5SJed Brown         ierr = PetscFree(metis_coarse_subdivision);CHKERRQ(ierr);
42410c7d97c5SJed Brown       }
42420c7d97c5SJed Brown 
42430c7d97c5SJed Brown       /* Create new communicator for coarse problem splitting the old one */
42440c7d97c5SJed Brown       if ( !(rank_prec_comm%procs_jumps_coarse_comm) && rank_prec_comm < procs_jumps_coarse_comm*n_parts ){
4245da1bb401SStefano Zampini         coarse_color=0;              /* for communicator splitting */
4246da1bb401SStefano Zampini         active_rank=rank_prec_comm;  /* for insertion of matrix values */
42470c7d97c5SJed Brown       }
4248da1bb401SStefano Zampini       /* procs with coarse_color = MPI_UNDEFINED will have coarse_comm = MPI_COMM_NULL (from mpi standards)
4249da1bb401SStefano Zampini          key = rank_prec_comm -> keep same ordering of ranks from the old to the new communicator */
425053cdbc3dSStefano Zampini       ierr = MPI_Comm_split(prec_comm,coarse_color,rank_prec_comm,&coarse_comm);CHKERRQ(ierr);
42510c7d97c5SJed Brown 
42520c7d97c5SJed Brown       if ( coarse_color == 0 ) {
425353cdbc3dSStefano Zampini         ierr = MPI_Comm_size(coarse_comm,&size_coarse_comm);CHKERRQ(ierr);
425453cdbc3dSStefano Zampini         ierr = MPI_Comm_rank(coarse_comm,&rank_coarse_comm);CHKERRQ(ierr);
42550c7d97c5SJed Brown       } else {
42560c7d97c5SJed Brown         rank_coarse_comm = MPI_PROC_NULL;
42570c7d97c5SJed Brown       }
42580c7d97c5SJed Brown 
42597cf533a6SStefano Zampini       /* master proc takes care of arranging and distributing coarse information */
42600c7d97c5SJed Brown       if (rank_coarse_comm == master_proc) {
42610c7d97c5SJed Brown         ierr = PetscMalloc (size_coarse_comm*sizeof(PetscMPIInt),&displacements_recv);CHKERRQ(ierr);
42620bdf917eSStefano Zampini         ierr = PetscMalloc (size_coarse_comm*sizeof(PetscMPIInt),&total_count_recv);CHKERRQ(ierr);
42630bdf917eSStefano Zampini         ierr = PetscMalloc (n_subdomains*sizeof(PetscMPIInt),&total_ranks_recv);CHKERRQ(ierr);
42640c7d97c5SJed Brown         /* some initializations */
42650c7d97c5SJed Brown         displacements_recv[0]=0;
42660bdf917eSStefano Zampini         ierr = PetscMemzero(total_count_recv,size_coarse_comm*sizeof(PetscMPIInt));CHKERRQ(ierr);
42670c7d97c5SJed Brown         /* count from how many processes the j-th process of the coarse decomposition will receive data */
42680bdf917eSStefano Zampini         for (j=0;j<size_coarse_comm;j++) {
42690bdf917eSStefano Zampini           for (i=0;i<size_prec_comm;i++) {
42700bdf917eSStefano Zampini             if (coarse_subdivision[i]==j) {
42710c7d97c5SJed Brown               total_count_recv[j]++;
42720bdf917eSStefano Zampini             }
42730bdf917eSStefano Zampini           }
42740bdf917eSStefano Zampini         }
42750c7d97c5SJed Brown         /* displacements needed for scatterv of total_ranks_recv */
42760bdf917eSStefano Zampini         for (i=1;i<size_coarse_comm;i++) { displacements_recv[i]=displacements_recv[i-1]+total_count_recv[i-1]; }
42770c7d97c5SJed Brown         /* Now fill properly total_ranks_recv -> each coarse process will receive the ranks (in prec_comm communicator) of its friend (sending) processes */
42780c7d97c5SJed Brown         ierr = PetscMemzero(total_count_recv,size_coarse_comm*sizeof(PetscMPIInt));CHKERRQ(ierr);
42790c7d97c5SJed Brown         for (j=0;j<size_coarse_comm;j++) {
42803828260eSStefano Zampini           for (i=0;i<size_prec_comm;i++) {
42810c7d97c5SJed Brown             if (coarse_subdivision[i]==j) {
42820c7d97c5SJed Brown               total_ranks_recv[displacements_recv[j]+total_count_recv[j]]=i;
42833828260eSStefano Zampini               total_count_recv[j]+=1;
42840c7d97c5SJed Brown             }
42850c7d97c5SJed Brown           }
42860c7d97c5SJed Brown         }
4287da1bb401SStefano Zampini         /*for (j=0;j<size_coarse_comm;j++) {
42883828260eSStefano Zampini           printf("process %d in new rank will receive from %d processes (original ranks follows)\n",j,total_count_recv[j]);
42893828260eSStefano Zampini           for (i=0;i<total_count_recv[j];i++) {
42903828260eSStefano Zampini             printf("%d ",total_ranks_recv[displacements_recv[j]+i]);
42913828260eSStefano Zampini           }
42923828260eSStefano Zampini           printf("\n");
4293da1bb401SStefano Zampini         }*/
42940c7d97c5SJed Brown 
42950c7d97c5SJed Brown         /* identify new decomposition in terms of ranks in the old communicator */
42960bdf917eSStefano Zampini         for (i=0;i<n_subdomains;i++) {
42970bdf917eSStefano Zampini           coarse_subdivision[ranks_stretching_ratio*i]=coarse_subdivision[ranks_stretching_ratio*i]*procs_jumps_coarse_comm;
42980bdf917eSStefano Zampini         }
4299da1bb401SStefano Zampini         /*printf("coarse_subdivision in old end new ranks\n");
43000c7d97c5SJed Brown         for (i=0;i<size_prec_comm;i++)
43013828260eSStefano Zampini           if (coarse_subdivision[i]!=MPI_PROC_NULL) {
43023828260eSStefano Zampini             printf("%d=(%d %d), ",i,coarse_subdivision[i],coarse_subdivision[i]/procs_jumps_coarse_comm);
43033828260eSStefano Zampini           } else {
43043828260eSStefano Zampini             printf("%d=(%d %d), ",i,coarse_subdivision[i],coarse_subdivision[i]);
43053828260eSStefano Zampini           }
4306da1bb401SStefano Zampini         printf("\n");*/
43070c7d97c5SJed Brown       }
43080c7d97c5SJed Brown 
43090c7d97c5SJed Brown       /* Scatter new decomposition for send details */
431053cdbc3dSStefano Zampini       ierr = MPI_Scatter(&coarse_subdivision[0],1,MPIU_INT,&rank_coarse_proc_send_to,1,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
43110c7d97c5SJed Brown       /* Scatter receiving details to members of coarse decomposition */
43120c7d97c5SJed Brown       if ( coarse_color == 0) {
431353cdbc3dSStefano Zampini         ierr = MPI_Scatter(&total_count_recv[0],1,MPIU_INT,&count_recv,1,MPIU_INT,master_proc,coarse_comm);CHKERRQ(ierr);
43140c7d97c5SJed Brown         ierr = PetscMalloc (count_recv*sizeof(PetscMPIInt),&ranks_recv);CHKERRQ(ierr);
431553cdbc3dSStefano Zampini         ierr = MPI_Scatterv(&total_ranks_recv[0],total_count_recv,displacements_recv,MPIU_INT,&ranks_recv[0],count_recv,MPIU_INT,master_proc,coarse_comm);CHKERRQ(ierr);
43160c7d97c5SJed Brown       }
43170c7d97c5SJed Brown 
4318da1bb401SStefano Zampini       /*printf("I will send my matrix data to proc  %d\n",rank_coarse_proc_send_to);
4319da1bb401SStefano Zampini       if (coarse_color == 0) {
4320da1bb401SStefano Zampini         printf("I will receive some matrix data from %d processes (ranks follows)\n",count_recv);
4321da1bb401SStefano Zampini         for (i=0;i<count_recv;i++)
4322da1bb401SStefano Zampini           printf("%d ",ranks_recv[i]);
4323da1bb401SStefano Zampini         printf("\n");
4324da1bb401SStefano Zampini       }*/
43250c7d97c5SJed Brown 
43260c7d97c5SJed Brown       if (rank_prec_comm == master_proc) {
43270bdf917eSStefano Zampini         ierr = PetscFree(coarse_subdivision);CHKERRQ(ierr);
4328da1bb401SStefano Zampini         ierr = PetscFree(total_count_recv);CHKERRQ(ierr);
43290bdf917eSStefano Zampini         ierr = PetscFree(total_ranks_recv);CHKERRQ(ierr);
43300c7d97c5SJed Brown         ierr = PetscFree(displacements_recv);CHKERRQ(ierr);
43310c7d97c5SJed Brown       }
43320c7d97c5SJed Brown       break;
43330c7d97c5SJed Brown     }
43340c7d97c5SJed Brown 
43350c7d97c5SJed Brown     case(REPLICATED_BDDC):
43360c7d97c5SJed Brown 
43370c7d97c5SJed Brown       pcbddc->coarse_communications_type = GATHERS_BDDC;
43380c7d97c5SJed Brown       coarse_mat_type = MATSEQAIJ;
43390c7d97c5SJed Brown       coarse_pc_type  = PCLU;
434053cdbc3dSStefano Zampini       coarse_ksp_type  = KSPPREONLY;
43410c7d97c5SJed Brown       coarse_comm = PETSC_COMM_SELF;
43420c7d97c5SJed Brown       active_rank = rank_prec_comm;
43430c7d97c5SJed Brown       break;
43440c7d97c5SJed Brown 
43450c7d97c5SJed Brown     case(PARALLEL_BDDC):
43460c7d97c5SJed Brown 
43470c7d97c5SJed Brown       pcbddc->coarse_communications_type = SCATTERS_BDDC;
43480c7d97c5SJed Brown       coarse_mat_type = MATMPIAIJ;
43490c7d97c5SJed Brown       coarse_pc_type  = PCREDUNDANT;
435053cdbc3dSStefano Zampini       coarse_ksp_type  = KSPPREONLY;
43510c7d97c5SJed Brown       coarse_comm = prec_comm;
43520c7d97c5SJed Brown       active_rank = rank_prec_comm;
43530c7d97c5SJed Brown       break;
43540c7d97c5SJed Brown 
43550c7d97c5SJed Brown     case(SEQUENTIAL_BDDC):
43560c7d97c5SJed Brown       pcbddc->coarse_communications_type = GATHERS_BDDC;
43570c7d97c5SJed Brown       coarse_mat_type = MATSEQAIJ;
43580c7d97c5SJed Brown       coarse_pc_type = PCLU;
435953cdbc3dSStefano Zampini       coarse_ksp_type  = KSPPREONLY;
43600c7d97c5SJed Brown       coarse_comm = PETSC_COMM_SELF;
43610c7d97c5SJed Brown       active_rank = master_proc;
43620c7d97c5SJed Brown       break;
43630c7d97c5SJed Brown   }
43640c7d97c5SJed Brown 
43650c7d97c5SJed Brown   switch(pcbddc->coarse_communications_type){
43660c7d97c5SJed Brown 
43670c7d97c5SJed Brown     case(SCATTERS_BDDC):
43680c7d97c5SJed Brown       {
43690c7d97c5SJed Brown         if (pcbddc->coarse_problem_type==MULTILEVEL_BDDC) {
43700c7d97c5SJed Brown 
43712e8d2280SStefano Zampini           IS coarse_IS;
43722e8d2280SStefano Zampini 
4373523858cfSStefano Zampini           if(pcbddc->coarsening_ratio == 1) {
4374523858cfSStefano Zampini             ins_local_primal_size = pcbddc->local_primal_size;
4375523858cfSStefano Zampini             ins_local_primal_indices = pcbddc->local_primal_indices;
4376523858cfSStefano Zampini             if (coarse_color == 0) { ierr = PetscFree(ranks_recv);CHKERRQ(ierr); }
4377523858cfSStefano Zampini             /* nonzeros */
4378523858cfSStefano Zampini             ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&dnz);CHKERRQ(ierr);
4379523858cfSStefano Zampini             ierr = PetscMemzero(dnz,ins_local_primal_size*sizeof(PetscInt));CHKERRQ(ierr);
4380523858cfSStefano Zampini             for (i=0;i<ins_local_primal_size;i++) {
4381523858cfSStefano Zampini               dnz[i] = ins_local_primal_size;
4382523858cfSStefano Zampini             }
4383523858cfSStefano Zampini           } else {
43840c7d97c5SJed Brown             PetscMPIInt send_size;
4385ef028eecSStefano Zampini             PetscMPIInt *send_buffer;
43860c7d97c5SJed Brown             PetscInt    *aux_ins_indices;
43870c7d97c5SJed Brown             PetscInt    ii,jj;
43880c7d97c5SJed Brown             MPI_Request *requests;
4389ef028eecSStefano Zampini 
4390523858cfSStefano Zampini             ierr = PetscMalloc(count_recv*sizeof(PetscMPIInt),&localdispl2);CHKERRQ(ierr);
4391523858cfSStefano Zampini             /* reusing pcbddc->local_primal_displacements and pcbddc->replicated_primal_size */
4392523858cfSStefano Zampini             ierr = PetscFree(pcbddc->local_primal_displacements);CHKERRQ(ierr);
4393523858cfSStefano Zampini             ierr = PetscMalloc((count_recv+1)*sizeof(PetscMPIInt),&pcbddc->local_primal_displacements);CHKERRQ(ierr);
4394523858cfSStefano Zampini             pcbddc->replicated_primal_size = count_recv;
4395523858cfSStefano Zampini             j = 0;
4396523858cfSStefano Zampini             for (i=0;i<count_recv;i++) {
4397523858cfSStefano Zampini               pcbddc->local_primal_displacements[i] = j;
4398523858cfSStefano Zampini               j += pcbddc->local_primal_sizes[ranks_recv[i]];
4399523858cfSStefano Zampini             }
4400523858cfSStefano Zampini             pcbddc->local_primal_displacements[count_recv] = j;
4401523858cfSStefano Zampini             ierr = PetscMalloc(j*sizeof(PetscMPIInt),&pcbddc->replicated_local_primal_indices);CHKERRQ(ierr);
44020c7d97c5SJed Brown             /* allocate auxiliary space */
4403523858cfSStefano Zampini             ierr = PetscMalloc(count_recv*sizeof(PetscMPIInt),&localsizes2);CHKERRQ(ierr);
44040c7d97c5SJed Brown             ierr = PetscMalloc(pcbddc->coarse_size*sizeof(PetscInt),&aux_ins_indices);CHKERRQ(ierr);
44050c7d97c5SJed Brown             ierr = PetscMemzero(aux_ins_indices,pcbddc->coarse_size*sizeof(PetscInt));CHKERRQ(ierr);
44060c7d97c5SJed Brown             /* allocate storage for message passing */
44070c7d97c5SJed Brown             ierr = PetscMalloc((count_recv+1)*sizeof(MPI_Request),&requests);CHKERRQ(ierr);
4408523858cfSStefano Zampini             for (i=0;i<count_recv+1;i++) { requests[i]=MPI_REQUEST_NULL; }
4409523858cfSStefano Zampini             /* send indices to be inserted */
4410523858cfSStefano Zampini             for (i=0;i<count_recv;i++) {
4411523858cfSStefano Zampini               send_size = pcbddc->local_primal_sizes[ranks_recv[i]];
4412523858cfSStefano Zampini               ierr = MPI_Irecv(&pcbddc->replicated_local_primal_indices[pcbddc->local_primal_displacements[i]],send_size,MPIU_INT,ranks_recv[i],999,prec_comm,&requests[i]);CHKERRQ(ierr);
4413523858cfSStefano Zampini             }
4414523858cfSStefano Zampini             if (rank_coarse_proc_send_to != MPI_PROC_NULL ) {
4415523858cfSStefano Zampini               send_size = pcbddc->local_primal_size;
4416ef028eecSStefano Zampini               ierr = PetscMalloc(send_size*sizeof(PetscMPIInt),&send_buffer);CHKERRQ(ierr);
4417ef028eecSStefano Zampini               for (i=0;i<send_size;i++) {
4418ef028eecSStefano Zampini                 send_buffer[i]=(PetscMPIInt)pcbddc->local_primal_indices[i];
4419ef028eecSStefano Zampini               }
4420ef028eecSStefano Zampini               ierr = MPI_Isend(send_buffer,send_size,MPIU_INT,rank_coarse_proc_send_to,999,prec_comm,&requests[count_recv]);CHKERRQ(ierr);
4421523858cfSStefano Zampini             }
4422523858cfSStefano Zampini             ierr = MPI_Waitall(count_recv+1,requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4423ef028eecSStefano Zampini             if (rank_coarse_proc_send_to != MPI_PROC_NULL ) {
4424ef028eecSStefano Zampini               ierr = PetscFree(send_buffer);CHKERRQ(ierr);
4425ef028eecSStefano Zampini             }
44260c7d97c5SJed Brown             j = 0;
44270c7d97c5SJed Brown             for (i=0;i<count_recv;i++) {
44282e8d2280SStefano Zampini               ii = pcbddc->local_primal_displacements[i+1]-pcbddc->local_primal_displacements[i];
44292e8d2280SStefano Zampini               localsizes2[i] = ii*ii;
44300c7d97c5SJed Brown               localdispl2[i] = j;
44310c7d97c5SJed Brown               j += localsizes2[i];
4432523858cfSStefano Zampini               jj = pcbddc->local_primal_displacements[i];
44334fad6a16SStefano Zampini               /* it counts the coarse subdomains sharing the coarse node */
44342e8d2280SStefano Zampini               for (k=0;k<ii;k++) {
44354fad6a16SStefano Zampini                 aux_ins_indices[pcbddc->replicated_local_primal_indices[jj+k]] += 1;
44360c7d97c5SJed Brown               }
44374fad6a16SStefano Zampini             }
4438523858cfSStefano Zampini             /* temp_coarse_mat_vals used to store matrix values to be received */
44390c7d97c5SJed Brown             ierr = PetscMalloc(j*sizeof(PetscScalar),&temp_coarse_mat_vals);CHKERRQ(ierr);
44400c7d97c5SJed Brown             /* evaluate how many values I will insert in coarse mat */
44410c7d97c5SJed Brown             ins_local_primal_size = 0;
4442ea7e1babSStefano Zampini             for (i=0;i<pcbddc->coarse_size;i++) {
4443ea7e1babSStefano Zampini               if (aux_ins_indices[i]) {
44440c7d97c5SJed Brown                 ins_local_primal_size++;
4445ea7e1babSStefano Zampini               }
4446ea7e1babSStefano Zampini             }
44470c7d97c5SJed Brown             /* evaluate indices I will insert in coarse mat */
44480c7d97c5SJed Brown             ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr);
44490c7d97c5SJed Brown             j = 0;
4450ea7e1babSStefano Zampini             for(i=0;i<pcbddc->coarse_size;i++) {
4451ea7e1babSStefano Zampini               if(aux_ins_indices[i]) {
44522e8d2280SStefano Zampini                 ins_local_primal_indices[j] = i;
44532e8d2280SStefano Zampini                 j++;
4454ea7e1babSStefano Zampini               }
4455ea7e1babSStefano Zampini             }
4456523858cfSStefano Zampini             /* processes participating in coarse problem receive matrix data from their friends */
4457523858cfSStefano Zampini             for (i=0;i<count_recv;i++) {
4458523858cfSStefano Zampini               ierr = MPI_Irecv(&temp_coarse_mat_vals[localdispl2[i]],localsizes2[i],MPIU_SCALAR,ranks_recv[i],666,prec_comm,&requests[i]);CHKERRQ(ierr);
4459523858cfSStefano Zampini             }
4460523858cfSStefano Zampini             if (rank_coarse_proc_send_to != MPI_PROC_NULL ) {
4461523858cfSStefano Zampini               send_size = pcbddc->local_primal_size*pcbddc->local_primal_size;
4462523858cfSStefano Zampini               ierr = MPI_Isend(&coarse_submat_vals[0],send_size,MPIU_SCALAR,rank_coarse_proc_send_to,666,prec_comm,&requests[count_recv]);CHKERRQ(ierr);
4463523858cfSStefano Zampini             }
4464523858cfSStefano Zampini             ierr = MPI_Waitall(count_recv+1,requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4465523858cfSStefano Zampini             /* nonzeros */
4466523858cfSStefano Zampini             ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&dnz);CHKERRQ(ierr);
4467523858cfSStefano Zampini             ierr = PetscMemzero(dnz,ins_local_primal_size*sizeof(PetscInt));CHKERRQ(ierr);
44680c7d97c5SJed Brown             /* use aux_ins_indices to realize a global to local mapping */
44690c7d97c5SJed Brown             j=0;
44700c7d97c5SJed Brown             for(i=0;i<pcbddc->coarse_size;i++){
44710c7d97c5SJed Brown               if(aux_ins_indices[i]==0){
44720c7d97c5SJed Brown                 aux_ins_indices[i]=-1;
44730c7d97c5SJed Brown               } else {
44740c7d97c5SJed Brown                 aux_ins_indices[i]=j;
44750c7d97c5SJed Brown                 j++;
44760c7d97c5SJed Brown               }
44770c7d97c5SJed Brown             }
44784fad6a16SStefano Zampini             for (i=0;i<count_recv;i++) {
4479523858cfSStefano Zampini               j = pcbddc->local_primal_sizes[ranks_recv[i]];
4480523858cfSStefano Zampini               for (k=0;k<j;k++) {
4481523858cfSStefano Zampini                 dnz[aux_ins_indices[pcbddc->replicated_local_primal_indices[pcbddc->local_primal_displacements[i]+k]]] += j;
44820c7d97c5SJed Brown               }
44830c7d97c5SJed Brown             }
4484523858cfSStefano Zampini             /* check */
4485523858cfSStefano Zampini             for (i=0;i<ins_local_primal_size;i++) {
4486523858cfSStefano Zampini               if (dnz[i] > ins_local_primal_size) {
4487523858cfSStefano Zampini                 dnz[i] = ins_local_primal_size;
44880c7d97c5SJed Brown               }
44890c7d97c5SJed Brown             }
44900c7d97c5SJed Brown             ierr = PetscFree(requests);CHKERRQ(ierr);
44910c7d97c5SJed Brown             ierr = PetscFree(aux_ins_indices);CHKERRQ(ierr);
44920c7d97c5SJed Brown             if (coarse_color == 0) { ierr = PetscFree(ranks_recv);CHKERRQ(ierr); }
44934fad6a16SStefano Zampini           }
44940c7d97c5SJed Brown           /* create local to global mapping needed by coarse MATIS */
4495142dfd88SStefano Zampini           if (coarse_comm != MPI_COMM_NULL ) {ierr = MPI_Comm_free(&coarse_comm);CHKERRQ(ierr);}
44960c7d97c5SJed Brown           coarse_comm = prec_comm;
44970c7d97c5SJed Brown           active_rank = rank_prec_comm;
44980c7d97c5SJed Brown           ierr = ISCreateGeneral(coarse_comm,ins_local_primal_size,ins_local_primal_indices,PETSC_COPY_VALUES,&coarse_IS);CHKERRQ(ierr);
44990c7d97c5SJed Brown           ierr = ISLocalToGlobalMappingCreateIS(coarse_IS,&coarse_ISLG);CHKERRQ(ierr);
45000c7d97c5SJed Brown           ierr = ISDestroy(&coarse_IS);CHKERRQ(ierr);
45012e8d2280SStefano Zampini         } else if (pcbddc->coarse_problem_type==PARALLEL_BDDC) {
45020c7d97c5SJed Brown           /* arrays for values insertion */
45030c7d97c5SJed Brown           ins_local_primal_size = pcbddc->local_primal_size;
45042e8d2280SStefano Zampini           ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr);
45050c7d97c5SJed Brown           ierr = PetscMalloc(ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar),&ins_coarse_mat_vals);CHKERRQ(ierr);
45060c7d97c5SJed Brown           for (j=0;j<ins_local_primal_size;j++){
45070c7d97c5SJed Brown             ins_local_primal_indices[j]=pcbddc->local_primal_indices[j];
45084fad6a16SStefano Zampini             for (i=0;i<ins_local_primal_size;i++) {
45094fad6a16SStefano Zampini               ins_coarse_mat_vals[j*ins_local_primal_size+i]=coarse_submat_vals[j*ins_local_primal_size+i];
45104fad6a16SStefano Zampini             }
45110c7d97c5SJed Brown           }
45120c7d97c5SJed Brown         }
45130c7d97c5SJed Brown         break;
45140c7d97c5SJed Brown 
45150c7d97c5SJed Brown     }
45160c7d97c5SJed Brown 
45170c7d97c5SJed Brown     case(GATHERS_BDDC):
45180c7d97c5SJed Brown       {
45190c7d97c5SJed Brown 
45200c7d97c5SJed Brown         PetscMPIInt mysize,mysize2;
4521ef028eecSStefano Zampini         PetscMPIInt *send_buffer;
45220c7d97c5SJed Brown 
45230c7d97c5SJed Brown         if (rank_prec_comm==active_rank) {
45240c7d97c5SJed Brown           ierr = PetscMalloc ( pcbddc->replicated_primal_size*sizeof(PetscMPIInt),&pcbddc->replicated_local_primal_indices);CHKERRQ(ierr);
45250bdf917eSStefano Zampini           ierr = PetscMalloc ( pcbddc->replicated_primal_size*sizeof(PetscScalar),&pcbddc->replicated_local_primal_values);CHKERRQ(ierr);
45260c7d97c5SJed Brown           ierr = PetscMalloc ( size_prec_comm*sizeof(PetscMPIInt),&localsizes2);CHKERRQ(ierr);
45270c7d97c5SJed Brown           ierr = PetscMalloc ( size_prec_comm*sizeof(PetscMPIInt),&localdispl2);CHKERRQ(ierr);
45280c7d97c5SJed Brown           /* arrays for values insertion */
45294fad6a16SStefano Zampini           for (i=0;i<size_prec_comm;i++) { localsizes2[i]=pcbddc->local_primal_sizes[i]*pcbddc->local_primal_sizes[i]; }
45300c7d97c5SJed Brown           localdispl2[0]=0;
45314fad6a16SStefano Zampini           for (i=1;i<size_prec_comm;i++) { localdispl2[i]=localsizes2[i-1]+localdispl2[i-1]; }
45320c7d97c5SJed Brown           j=0;
45334fad6a16SStefano Zampini           for (i=0;i<size_prec_comm;i++) { j+=localsizes2[i]; }
45340c7d97c5SJed Brown           ierr = PetscMalloc ( j*sizeof(PetscScalar),&temp_coarse_mat_vals);CHKERRQ(ierr);
45350c7d97c5SJed Brown         }
45360c7d97c5SJed Brown 
45370c7d97c5SJed Brown         mysize=pcbddc->local_primal_size;
45380c7d97c5SJed Brown         mysize2=pcbddc->local_primal_size*pcbddc->local_primal_size;
4539ef028eecSStefano Zampini         ierr = PetscMalloc(mysize*sizeof(PetscMPIInt),&send_buffer);CHKERRQ(ierr);
4540ef028eecSStefano Zampini         for (i=0;i<mysize;i++) {
4541ef028eecSStefano Zampini           send_buffer[i]=(PetscMPIInt)pcbddc->local_primal_indices[i];
4542ef028eecSStefano Zampini         }
45430c7d97c5SJed Brown         if (pcbddc->coarse_problem_type == SEQUENTIAL_BDDC){
4544ef028eecSStefano Zampini           ierr = MPI_Gatherv(send_buffer,mysize,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
454553cdbc3dSStefano Zampini           ierr = MPI_Gatherv(&coarse_submat_vals[0],mysize2,MPIU_SCALAR,&temp_coarse_mat_vals[0],localsizes2,localdispl2,MPIU_SCALAR,master_proc,prec_comm);CHKERRQ(ierr);
45460c7d97c5SJed Brown         } else {
4547ef028eecSStefano Zampini           ierr = MPI_Allgatherv(send_buffer,mysize,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,prec_comm);CHKERRQ(ierr);
454853cdbc3dSStefano Zampini           ierr = MPI_Allgatherv(&coarse_submat_vals[0],mysize2,MPIU_SCALAR,&temp_coarse_mat_vals[0],localsizes2,localdispl2,MPIU_SCALAR,prec_comm);CHKERRQ(ierr);
45490c7d97c5SJed Brown         }
4550ef028eecSStefano Zampini         ierr = PetscFree(send_buffer);CHKERRQ(ierr);
45510c7d97c5SJed Brown         break;
4552da1bb401SStefano Zampini       }/* switch on coarse problem and communications associated with finished */
45530c7d97c5SJed Brown   }
45540c7d97c5SJed Brown 
45550c7d97c5SJed Brown   /* Now create and fill up coarse matrix */
45560c7d97c5SJed Brown   if ( rank_prec_comm == active_rank ) {
4557142dfd88SStefano Zampini 
4558142dfd88SStefano Zampini     Mat matis_coarse_local_mat;
4559142dfd88SStefano Zampini 
45600c7d97c5SJed Brown     if (pcbddc->coarse_problem_type != MULTILEVEL_BDDC) {
45610c7d97c5SJed Brown       ierr = MatCreate(coarse_comm,&pcbddc->coarse_mat);CHKERRQ(ierr);
45620c7d97c5SJed Brown       ierr = MatSetSizes(pcbddc->coarse_mat,PETSC_DECIDE,PETSC_DECIDE,pcbddc->coarse_size,pcbddc->coarse_size);CHKERRQ(ierr);
45630c7d97c5SJed Brown       ierr = MatSetType(pcbddc->coarse_mat,coarse_mat_type);CHKERRQ(ierr);
45643b03a366Sstefano_zampini       ierr = MatSetUp(pcbddc->coarse_mat);CHKERRQ(ierr);
4565da1bb401SStefano Zampini       ierr = MatSetOption(pcbddc->coarse_mat,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr); /* local values stored in column major */
45663b03a366Sstefano_zampini       ierr = MatSetOption(pcbddc->coarse_mat,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr);
45670c7d97c5SJed Brown     } else {
45684fad6a16SStefano Zampini       ierr = MatCreateIS(coarse_comm,1,PETSC_DECIDE,PETSC_DECIDE,pcbddc->coarse_size,pcbddc->coarse_size,coarse_ISLG,&pcbddc->coarse_mat);CHKERRQ(ierr);
45693b03a366Sstefano_zampini       ierr = MatSetUp(pcbddc->coarse_mat);CHKERRQ(ierr);
45700c7d97c5SJed Brown       ierr = MatISGetLocalMat(pcbddc->coarse_mat,&matis_coarse_local_mat);CHKERRQ(ierr);
45713b03a366Sstefano_zampini       ierr = MatSetUp(matis_coarse_local_mat);CHKERRQ(ierr);
4572da1bb401SStefano Zampini       ierr = MatSetOption(matis_coarse_local_mat,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr); /* local values stored in column major */
4573a0ba757dSStefano Zampini       ierr = MatSetOption(matis_coarse_local_mat,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr);
45740c7d97c5SJed Brown     }
4575142dfd88SStefano Zampini     /* preallocation */
4576142dfd88SStefano Zampini     if (pcbddc->coarse_problem_type != MULTILEVEL_BDDC) {
4577ef028eecSStefano Zampini 
4578142dfd88SStefano Zampini       PetscInt lrows,lcols;
4579ef028eecSStefano Zampini 
4580142dfd88SStefano Zampini       ierr = MatGetLocalSize(pcbddc->coarse_mat,&lrows,&lcols);CHKERRQ(ierr);
4581142dfd88SStefano Zampini       ierr = MatPreallocateInitialize(coarse_comm,lrows,lcols,dnz,onz);CHKERRQ(ierr);
4582ef028eecSStefano Zampini 
4583142dfd88SStefano Zampini       if (pcbddc->coarse_problem_type == PARALLEL_BDDC) {
4584ef028eecSStefano Zampini 
4585ef028eecSStefano Zampini         Vec         vec_dnz,vec_onz;
4586ef028eecSStefano Zampini         PetscScalar *my_dnz,*my_onz,*array;
4587ef028eecSStefano Zampini         PetscInt    *mat_ranges,*row_ownership;
4588ef028eecSStefano Zampini         PetscInt    coarse_index_row,coarse_index_col,owner;
4589ef028eecSStefano Zampini 
4590ef028eecSStefano Zampini         ierr = VecCreate(prec_comm,&vec_dnz);CHKERRQ(ierr);
4591ef028eecSStefano Zampini         ierr = VecSetSizes(vec_dnz,PETSC_DECIDE,pcbddc->coarse_size);CHKERRQ(ierr);
4592ef028eecSStefano Zampini         ierr = VecSetType(vec_dnz,VECMPI);CHKERRQ(ierr);
4593ef028eecSStefano Zampini         ierr = VecDuplicate(vec_dnz,&vec_onz);CHKERRQ(ierr);
4594ef028eecSStefano Zampini 
4595ef028eecSStefano Zampini         ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscScalar),&my_dnz);CHKERRQ(ierr);
4596ef028eecSStefano Zampini         ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscScalar),&my_onz);CHKERRQ(ierr);
4597ef028eecSStefano Zampini         ierr = PetscMemzero(my_dnz,pcbddc->local_primal_size*sizeof(PetscScalar));CHKERRQ(ierr);
4598ef028eecSStefano Zampini         ierr = PetscMemzero(my_onz,pcbddc->local_primal_size*sizeof(PetscScalar));CHKERRQ(ierr);
4599ef028eecSStefano Zampini 
4600ef028eecSStefano Zampini         ierr = PetscMalloc(pcbddc->coarse_size*sizeof(PetscInt),&row_ownership);CHKERRQ(ierr);
4601ef028eecSStefano Zampini         ierr = MatGetOwnershipRanges(pcbddc->coarse_mat,(const PetscInt**)&mat_ranges);CHKERRQ(ierr);
4602142dfd88SStefano Zampini         for (i=0;i<size_prec_comm;i++) {
4603ef028eecSStefano Zampini           for (j=mat_ranges[i];j<mat_ranges[i+1];j++) {
4604ef028eecSStefano Zampini             row_ownership[j]=i;
4605142dfd88SStefano Zampini           }
4606142dfd88SStefano Zampini         }
4607ef028eecSStefano Zampini 
4608ef028eecSStefano Zampini         for (i=0;i<pcbddc->local_primal_size;i++) {
4609ef028eecSStefano Zampini           coarse_index_row = pcbddc->local_primal_indices[i];
4610ef028eecSStefano Zampini           owner = row_ownership[coarse_index_row];
4611ef028eecSStefano Zampini           for (j=i;j<pcbddc->local_primal_size;j++) {
4612ef028eecSStefano Zampini             owner = row_ownership[coarse_index_row];
4613ef028eecSStefano Zampini             coarse_index_col = pcbddc->local_primal_indices[j];
4614ef028eecSStefano Zampini             if (coarse_index_col > mat_ranges[owner]-1 && coarse_index_col < mat_ranges[owner+1] ) {
4615ef028eecSStefano Zampini               my_dnz[i] += 1.0;
4616142dfd88SStefano Zampini             } else {
4617ef028eecSStefano Zampini               my_onz[i] += 1.0;
4618142dfd88SStefano Zampini             }
4619ef028eecSStefano Zampini             if (i != j) {
4620ef028eecSStefano Zampini               owner = row_ownership[coarse_index_col];
4621ef028eecSStefano Zampini               if (coarse_index_row > mat_ranges[owner]-1 && coarse_index_row < mat_ranges[owner+1] ) {
4622ef028eecSStefano Zampini                 my_dnz[j] += 1.0;
4623142dfd88SStefano Zampini               } else {
4624ef028eecSStefano Zampini                 my_onz[j] += 1.0;
4625142dfd88SStefano Zampini               }
4626142dfd88SStefano Zampini             }
4627142dfd88SStefano Zampini           }
4628142dfd88SStefano Zampini         }
4629ef028eecSStefano Zampini         ierr = VecSet(vec_dnz,0.0);CHKERRQ(ierr);
4630ef028eecSStefano Zampini         ierr = VecSet(vec_onz,0.0);CHKERRQ(ierr);
4631a929c220SStefano Zampini         if (pcbddc->local_primal_size) {
4632ef028eecSStefano Zampini           ierr = VecSetValues(vec_dnz,pcbddc->local_primal_size,pcbddc->local_primal_indices,my_dnz,ADD_VALUES);CHKERRQ(ierr);
4633ef028eecSStefano Zampini           ierr = VecSetValues(vec_onz,pcbddc->local_primal_size,pcbddc->local_primal_indices,my_onz,ADD_VALUES);CHKERRQ(ierr);
4634a929c220SStefano Zampini         }
4635ef028eecSStefano Zampini         ierr = VecAssemblyBegin(vec_dnz);CHKERRQ(ierr);
4636ef028eecSStefano Zampini         ierr = VecAssemblyBegin(vec_onz);CHKERRQ(ierr);
4637ef028eecSStefano Zampini         ierr = VecAssemblyEnd(vec_dnz);CHKERRQ(ierr);
4638ef028eecSStefano Zampini         ierr = VecAssemblyEnd(vec_onz);CHKERRQ(ierr);
4639ef028eecSStefano Zampini         j = mat_ranges[rank_prec_comm+1]-mat_ranges[rank_prec_comm];
4640ef028eecSStefano Zampini         ierr = VecGetArray(vec_dnz,&array);CHKERRQ(ierr);
4641ef028eecSStefano Zampini         for (i=0;i<j;i++) {
4642ef028eecSStefano Zampini           dnz[i] = (PetscInt)array[i];
4643142dfd88SStefano Zampini         }
4644ef028eecSStefano Zampini         ierr = VecRestoreArray(vec_dnz,&array);CHKERRQ(ierr);
4645ef028eecSStefano Zampini         ierr = VecGetArray(vec_onz,&array);CHKERRQ(ierr);
4646ef028eecSStefano Zampini         for (i=0;i<j;i++) {
4647ef028eecSStefano Zampini           onz[i] = (PetscInt)array[i];
4648142dfd88SStefano Zampini         }
4649ef028eecSStefano Zampini         ierr = VecRestoreArray(vec_onz,&array);CHKERRQ(ierr);
4650ef028eecSStefano Zampini         ierr = PetscFree(my_dnz);CHKERRQ(ierr);
4651ef028eecSStefano Zampini         ierr = PetscFree(my_onz);CHKERRQ(ierr);
4652ef028eecSStefano Zampini         ierr = PetscFree(row_ownership);CHKERRQ(ierr);
4653ef028eecSStefano Zampini         ierr = VecDestroy(&vec_dnz);CHKERRQ(ierr);
4654ef028eecSStefano Zampini         ierr = VecDestroy(&vec_onz);CHKERRQ(ierr);
4655142dfd88SStefano Zampini       } else {
4656142dfd88SStefano Zampini         for (k=0;k<size_prec_comm;k++){
4657142dfd88SStefano Zampini           offset=pcbddc->local_primal_displacements[k];
4658142dfd88SStefano Zampini           offset2=localdispl2[k];
4659142dfd88SStefano Zampini           ins_local_primal_size = pcbddc->local_primal_sizes[k];
4660ef028eecSStefano Zampini           ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr);
4661ef028eecSStefano Zampini           for (j=0;j<ins_local_primal_size;j++){
4662ef028eecSStefano Zampini             ins_local_primal_indices[j]=(PetscInt)pcbddc->replicated_local_primal_indices[offset+j];
4663ef028eecSStefano Zampini           }
4664142dfd88SStefano Zampini           for (j=0;j<ins_local_primal_size;j++) {
4665142dfd88SStefano Zampini             ierr = MatPreallocateSet(ins_local_primal_indices[j],ins_local_primal_size,ins_local_primal_indices,dnz,onz);CHKERRQ(ierr);
4666142dfd88SStefano Zampini           }
4667ef028eecSStefano Zampini           ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr);
4668142dfd88SStefano Zampini         }
4669142dfd88SStefano Zampini       }
4670142dfd88SStefano Zampini       /* check */
4671142dfd88SStefano Zampini       for (i=0;i<lrows;i++) {
4672142dfd88SStefano Zampini         if (dnz[i]>lcols) {
4673142dfd88SStefano Zampini           dnz[i]=lcols;
4674142dfd88SStefano Zampini         }
4675142dfd88SStefano Zampini         if (onz[i]>pcbddc->coarse_size-lcols) {
4676142dfd88SStefano Zampini           onz[i]=pcbddc->coarse_size-lcols;
4677142dfd88SStefano Zampini         }
4678142dfd88SStefano Zampini       }
4679142dfd88SStefano Zampini       ierr = MatSeqAIJSetPreallocation(pcbddc->coarse_mat,PETSC_NULL,dnz);CHKERRQ(ierr);
4680142dfd88SStefano Zampini       ierr = MatMPIAIJSetPreallocation(pcbddc->coarse_mat,PETSC_NULL,dnz,PETSC_NULL,onz);CHKERRQ(ierr);
4681142dfd88SStefano Zampini       ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr);
4682142dfd88SStefano Zampini     } else {
4683523858cfSStefano Zampini       ierr = MatSeqAIJSetPreallocation(matis_coarse_local_mat,0,dnz);CHKERRQ(ierr);
4684523858cfSStefano Zampini       ierr = PetscFree(dnz);CHKERRQ(ierr);
4685142dfd88SStefano Zampini     }
4686142dfd88SStefano Zampini     /* insert values */
4687523858cfSStefano Zampini     if (pcbddc->coarse_problem_type == PARALLEL_BDDC) {
46880c7d97c5SJed Brown       ierr = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,ADD_VALUES);CHKERRQ(ierr);
4689523858cfSStefano Zampini     } else if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
4690523858cfSStefano Zampini       if (pcbddc->coarsening_ratio == 1) {
4691523858cfSStefano Zampini         ins_coarse_mat_vals = coarse_submat_vals;
4692523858cfSStefano Zampini         ierr = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,INSERT_VALUES);CHKERRQ(ierr);
4693523858cfSStefano Zampini       } else {
4694523858cfSStefano Zampini         ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr);
4695523858cfSStefano Zampini         for (k=0;k<pcbddc->replicated_primal_size;k++) {
4696523858cfSStefano Zampini           offset = pcbddc->local_primal_displacements[k];
4697523858cfSStefano Zampini           offset2 = localdispl2[k];
4698523858cfSStefano Zampini           ins_local_primal_size = pcbddc->local_primal_displacements[k+1]-pcbddc->local_primal_displacements[k];
4699ef028eecSStefano Zampini           ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr);
4700ef028eecSStefano Zampini           for (j=0;j<ins_local_primal_size;j++){
4701ef028eecSStefano Zampini             ins_local_primal_indices[j]=(PetscInt)pcbddc->replicated_local_primal_indices[offset+j];
4702ef028eecSStefano Zampini           }
4703523858cfSStefano Zampini           ins_coarse_mat_vals = &temp_coarse_mat_vals[offset2];
4704523858cfSStefano Zampini           ierr = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,ADD_VALUES);CHKERRQ(ierr);
4705ef028eecSStefano Zampini           ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr);
4706523858cfSStefano Zampini         }
4707523858cfSStefano Zampini       }
4708523858cfSStefano Zampini       ins_local_primal_indices = 0;
4709523858cfSStefano Zampini       ins_coarse_mat_vals = 0;
4710ea7e1babSStefano Zampini     } else {
4711ea7e1babSStefano Zampini       for (k=0;k<size_prec_comm;k++){
4712ea7e1babSStefano Zampini         offset=pcbddc->local_primal_displacements[k];
4713ea7e1babSStefano Zampini         offset2=localdispl2[k];
4714ea7e1babSStefano Zampini         ins_local_primal_size = pcbddc->local_primal_sizes[k];
4715ef028eecSStefano Zampini         ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr);
4716ef028eecSStefano Zampini         for (j=0;j<ins_local_primal_size;j++){
4717ef028eecSStefano Zampini           ins_local_primal_indices[j]=(PetscInt)pcbddc->replicated_local_primal_indices[offset+j];
4718ef028eecSStefano Zampini         }
4719ea7e1babSStefano Zampini         ins_coarse_mat_vals = &temp_coarse_mat_vals[offset2];
4720ea7e1babSStefano Zampini         ierr = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,ADD_VALUES);CHKERRQ(ierr);
4721ef028eecSStefano Zampini         ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr);
4722ea7e1babSStefano Zampini       }
4723ea7e1babSStefano Zampini       ins_local_primal_indices = 0;
4724ea7e1babSStefano Zampini       ins_coarse_mat_vals = 0;
4725ea7e1babSStefano Zampini     }
47260c7d97c5SJed Brown     ierr = MatAssemblyBegin(pcbddc->coarse_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
47270c7d97c5SJed Brown     ierr = MatAssemblyEnd(pcbddc->coarse_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
4728142dfd88SStefano Zampini     /* symmetry of coarse matrix */
4729142dfd88SStefano Zampini     if (issym) {
4730142dfd88SStefano Zampini       ierr = MatSetOption(pcbddc->coarse_mat,MAT_SYMMETRIC,PETSC_TRUE);CHKERRQ(ierr);
4731142dfd88SStefano Zampini     }
47320c7d97c5SJed Brown     ierr = MatGetVecs(pcbddc->coarse_mat,&pcbddc->coarse_vec,&pcbddc->coarse_rhs);CHKERRQ(ierr);
47330bdf917eSStefano Zampini   }
47340bdf917eSStefano Zampini 
47350bdf917eSStefano Zampini   /* create loc to glob scatters if needed */
47360bdf917eSStefano Zampini   if (pcbddc->coarse_communications_type == SCATTERS_BDDC) {
47370bdf917eSStefano Zampini      IS local_IS,global_IS;
47380bdf917eSStefano Zampini      ierr = ISCreateStride(PETSC_COMM_SELF,pcbddc->local_primal_size,0,1,&local_IS);CHKERRQ(ierr);
47390bdf917eSStefano Zampini      ierr = ISCreateGeneral(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_indices,PETSC_COPY_VALUES,&global_IS);CHKERRQ(ierr);
47400bdf917eSStefano Zampini      ierr = VecScatterCreate(pcbddc->vec1_P,local_IS,pcbddc->coarse_vec,global_IS,&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr);
47410bdf917eSStefano Zampini      ierr = ISDestroy(&local_IS);CHKERRQ(ierr);
47420bdf917eSStefano Zampini      ierr = ISDestroy(&global_IS);CHKERRQ(ierr);
47430bdf917eSStefano Zampini   }
47440bdf917eSStefano Zampini 
4745a929c220SStefano Zampini   /* free memory no longer needed */
4746a929c220SStefano Zampini   if (coarse_ISLG)              { ierr = ISLocalToGlobalMappingDestroy(&coarse_ISLG);CHKERRQ(ierr); }
4747a929c220SStefano Zampini   if (ins_local_primal_indices) { ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr); }
4748a929c220SStefano Zampini   if (ins_coarse_mat_vals)      { ierr = PetscFree(ins_coarse_mat_vals);CHKERRQ(ierr); }
4749a929c220SStefano Zampini   if (localsizes2)              { ierr = PetscFree(localsizes2);CHKERRQ(ierr); }
4750a929c220SStefano Zampini   if (localdispl2)              { ierr = PetscFree(localdispl2);CHKERRQ(ierr); }
4751a929c220SStefano Zampini   if (temp_coarse_mat_vals)     { ierr = PetscFree(temp_coarse_mat_vals);CHKERRQ(ierr); }
4752a929c220SStefano Zampini 
47530bdf917eSStefano Zampini   /* Eval coarse null space */
47540bdf917eSStefano Zampini   if (pcbddc->NullSpace) {
47550bdf917eSStefano Zampini     const Vec      *nsp_vecs;
47560bdf917eSStefano Zampini     PetscInt       nsp_size,coarse_nsp_size;
47570bdf917eSStefano Zampini     PetscBool      nsp_has_cnst;
47580bdf917eSStefano Zampini     PetscReal      test_null;
47590bdf917eSStefano Zampini     Vec            *coarse_nsp_vecs;
47600bdf917eSStefano Zampini 
47610bdf917eSStefano Zampini     coarse_nsp_size = 0;
47620bdf917eSStefano Zampini     coarse_nsp_vecs = 0;
47630bdf917eSStefano Zampini     ierr = MatNullSpaceGetVecs(pcbddc->NullSpace,&nsp_has_cnst,&nsp_size,&nsp_vecs);CHKERRQ(ierr);
47640bdf917eSStefano Zampini     if (rank_prec_comm == active_rank) {
47650bdf917eSStefano Zampini       ierr = PetscMalloc((nsp_size+1)*sizeof(Vec),&coarse_nsp_vecs);CHKERRQ(ierr);
47660bdf917eSStefano Zampini       for (i=0;i<nsp_size+1;i++) {
47670bdf917eSStefano Zampini         ierr = VecDuplicate(pcbddc->coarse_vec,&coarse_nsp_vecs[i]);CHKERRQ(ierr);
47680bdf917eSStefano Zampini       }
47690bdf917eSStefano Zampini     }
47700bdf917eSStefano Zampini     if (nsp_has_cnst) {
47710bdf917eSStefano Zampini       ierr = VecSet(pcis->vec1_N,1.0);CHKERRQ(ierr);
47720bdf917eSStefano Zampini       ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr);
47730bdf917eSStefano Zampini       ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->vec1_P,pcbddc->coarse_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
47740bdf917eSStefano Zampini       ierr = PCBDDCScatterCoarseDataEnd(pc,pcbddc->vec1_P,pcbddc->coarse_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
47750bdf917eSStefano Zampini       if (rank_prec_comm == active_rank) {
47760bdf917eSStefano Zampini         ierr = MatMult(pcbddc->coarse_mat,pcbddc->coarse_vec,pcbddc->coarse_rhs);CHKERRQ(ierr);
47770bdf917eSStefano Zampini         ierr = VecNorm(pcbddc->coarse_rhs,NORM_INFINITY,&test_null);CHKERRQ(ierr);
47780bdf917eSStefano Zampini         if (test_null > 1.0e-12 && pcbddc->dbg_flag ) {
47790bdf917eSStefano Zampini           ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Constant coarse null space error % 1.14e\n",test_null);CHKERRQ(ierr);
47800bdf917eSStefano Zampini         }
47810bdf917eSStefano Zampini         ierr = VecCopy(pcbddc->coarse_vec,coarse_nsp_vecs[coarse_nsp_size]);CHKERRQ(ierr);
47820bdf917eSStefano Zampini         coarse_nsp_size++;
47830bdf917eSStefano Zampini       }
47840bdf917eSStefano Zampini     }
47850bdf917eSStefano Zampini     for (i=0;i<nsp_size;i++)  {
47860bdf917eSStefano Zampini       ierr = VecScatterBegin(matis->ctx,nsp_vecs[i],pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
47870bdf917eSStefano Zampini       ierr = VecScatterEnd  (matis->ctx,nsp_vecs[i],pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
47880bdf917eSStefano Zampini       ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr);
47890bdf917eSStefano Zampini       ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->vec1_P,pcbddc->coarse_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
47900bdf917eSStefano Zampini       ierr = PCBDDCScatterCoarseDataEnd(pc,pcbddc->vec1_P,pcbddc->coarse_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
47910bdf917eSStefano Zampini       if (rank_prec_comm == active_rank) {
47920bdf917eSStefano Zampini         ierr = MatMult(pcbddc->coarse_mat,pcbddc->coarse_vec,pcbddc->coarse_rhs);CHKERRQ(ierr);
47930bdf917eSStefano Zampini         ierr = VecNorm(pcbddc->coarse_rhs,NORM_2,&test_null);CHKERRQ(ierr);
47940bdf917eSStefano Zampini         if (test_null > 1.0e-12 && pcbddc->dbg_flag ) {
47950bdf917eSStefano Zampini           ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Vec %d coarse null space error % 1.14e\n",i,test_null);CHKERRQ(ierr);
47960bdf917eSStefano Zampini         }
47970bdf917eSStefano Zampini         ierr = VecCopy(pcbddc->coarse_vec,coarse_nsp_vecs[coarse_nsp_size]);CHKERRQ(ierr);
47980bdf917eSStefano Zampini         coarse_nsp_size++;
47990bdf917eSStefano Zampini       }
48000bdf917eSStefano Zampini     }
48010bdf917eSStefano Zampini     if (coarse_nsp_size > 0) {
48020bdf917eSStefano Zampini       /* TODO orthonormalize vecs */
48030bdf917eSStefano Zampini       ierr = VecNormalize(coarse_nsp_vecs[0],PETSC_NULL);CHKERRQ(ierr);
48040bdf917eSStefano Zampini       ierr = MatNullSpaceCreate(coarse_comm,PETSC_FALSE,coarse_nsp_size,coarse_nsp_vecs,&pcbddc->CoarseNullSpace);CHKERRQ(ierr);
48050bdf917eSStefano Zampini       for (i=0;i<nsp_size+1;i++) {
48060bdf917eSStefano Zampini         ierr = VecDestroy(&coarse_nsp_vecs[i]);CHKERRQ(ierr);
48070bdf917eSStefano Zampini       }
48080bdf917eSStefano Zampini     }
48090bdf917eSStefano Zampini     ierr = PetscFree(coarse_nsp_vecs);CHKERRQ(ierr);
48100bdf917eSStefano Zampini   }
48110bdf917eSStefano Zampini 
48120bdf917eSStefano Zampini   /* KSP for coarse problem */
48130bdf917eSStefano Zampini   if (rank_prec_comm == active_rank) {
48142e8d2280SStefano Zampini     PetscBool isbddc=PETSC_FALSE;
48150bdf917eSStefano Zampini 
481653cdbc3dSStefano Zampini     ierr = KSPCreate(coarse_comm,&pcbddc->coarse_ksp);CHKERRQ(ierr);
481753cdbc3dSStefano Zampini     ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->coarse_ksp,(PetscObject)pc,1);CHKERRQ(ierr);
481853cdbc3dSStefano Zampini     ierr = KSPSetOperators(pcbddc->coarse_ksp,pcbddc->coarse_mat,pcbddc->coarse_mat,SAME_PRECONDITIONER);CHKERRQ(ierr);
48193b03a366Sstefano_zampini     ierr = KSPSetTolerances(pcbddc->coarse_ksp,PETSC_DEFAULT,PETSC_DEFAULT,PETSC_DEFAULT,max_it_coarse_ksp);CHKERRQ(ierr);
482053cdbc3dSStefano Zampini     ierr = KSPSetType(pcbddc->coarse_ksp,coarse_ksp_type);CHKERRQ(ierr);
482153cdbc3dSStefano Zampini     ierr = KSPGetPC(pcbddc->coarse_ksp,&pc_temp);CHKERRQ(ierr);
482253cdbc3dSStefano Zampini     ierr = PCSetType(pc_temp,coarse_pc_type);CHKERRQ(ierr);
48230c7d97c5SJed Brown     /* Allow user's customization */
4824da1bb401SStefano Zampini     ierr = KSPSetOptionsPrefix(pcbddc->coarse_ksp,"coarse_");CHKERRQ(ierr);
48250c7d97c5SJed Brown     /* Set Up PC for coarse problem BDDC */
482653cdbc3dSStefano Zampini     if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
48274fad6a16SStefano Zampini       i = pcbddc->current_level+1;
48284fad6a16SStefano Zampini       ierr = PCBDDCSetLevel(pc_temp,i);CHKERRQ(ierr);
48294fad6a16SStefano Zampini       ierr = PCBDDCSetCoarseningRatio(pc_temp,pcbddc->coarsening_ratio);CHKERRQ(ierr);
48304fad6a16SStefano Zampini       ierr = PCBDDCSetMaxLevels(pc_temp,pcbddc->max_levels);CHKERRQ(ierr);
483153cdbc3dSStefano Zampini       ierr = PCBDDCSetCoarseProblemType(pc_temp,MULTILEVEL_BDDC);CHKERRQ(ierr);
48320bdf917eSStefano Zampini       if (pcbddc->CoarseNullSpace) { ierr = PCBDDCSetNullSpace(pc_temp,pcbddc->CoarseNullSpace);CHKERRQ(ierr); }
48334fad6a16SStefano Zampini       if (dbg_flag) {
48344fad6a16SStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"----------------Level %d: Setting up level %d---------------\n",pcbddc->current_level,i);CHKERRQ(ierr);
48354fad6a16SStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
483653cdbc3dSStefano Zampini       }
48374fad6a16SStefano Zampini     }
48384fad6a16SStefano Zampini     ierr = KSPSetFromOptions(pcbddc->coarse_ksp);CHKERRQ(ierr);
483953cdbc3dSStefano Zampini     ierr = KSPSetUp(pcbddc->coarse_ksp);CHKERRQ(ierr);
4840142dfd88SStefano Zampini 
48412e8d2280SStefano Zampini     ierr = KSPGetTolerances(pcbddc->coarse_ksp,PETSC_NULL,PETSC_NULL,PETSC_NULL,&j);CHKERRQ(ierr);
48422e8d2280SStefano Zampini     ierr = KSPGetPC(pcbddc->coarse_ksp,&pc_temp);CHKERRQ(ierr);
48432e8d2280SStefano Zampini     ierr = PetscObjectTypeCompare((PetscObject)pc_temp,PCBDDC,&isbddc);CHKERRQ(ierr);
48442e8d2280SStefano Zampini     if (j == 1) {
48452e8d2280SStefano Zampini       ierr = KSPSetNormType(pcbddc->coarse_ksp,KSP_NORM_NONE);CHKERRQ(ierr);
48462e8d2280SStefano Zampini       if (isbddc) {
48472e8d2280SStefano Zampini         ierr = PCBDDCSetUseExactDirichlet(pc_temp,PETSC_FALSE);CHKERRQ(ierr);
48485619798eSStefano Zampini       }
48495619798eSStefano Zampini     }
48500c7d97c5SJed Brown   }
4851a929c220SStefano Zampini   /* Check coarse problem if requested */
4852142dfd88SStefano Zampini   if ( dbg_flag && rank_prec_comm == active_rank ) {
4853142dfd88SStefano Zampini     KSP check_ksp;
4854142dfd88SStefano Zampini     PC  check_pc;
4855142dfd88SStefano Zampini     Vec check_vec;
4856142dfd88SStefano Zampini     PetscReal   abs_infty_error,infty_error,lambda_min,lambda_max;
485719fd82e9SBarry Smith     KSPType check_ksp_type;
48580c7d97c5SJed Brown 
4859142dfd88SStefano Zampini     /* Create ksp object suitable for extreme eigenvalues' estimation */
4860142dfd88SStefano Zampini     ierr = KSPCreate(coarse_comm,&check_ksp);CHKERRQ(ierr);
4861142dfd88SStefano Zampini     ierr = KSPSetOperators(check_ksp,pcbddc->coarse_mat,pcbddc->coarse_mat,SAME_PRECONDITIONER);CHKERRQ(ierr);
48620bdf917eSStefano Zampini     ierr = KSPSetTolerances(check_ksp,1.e-12,1.e-12,PETSC_DEFAULT,pcbddc->coarse_size);CHKERRQ(ierr);
4863142dfd88SStefano Zampini     if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
4864142dfd88SStefano Zampini       if (issym) {
4865142dfd88SStefano Zampini         check_ksp_type = KSPCG;
4866142dfd88SStefano Zampini       } else {
4867142dfd88SStefano Zampini         check_ksp_type = KSPGMRES;
4868142dfd88SStefano Zampini       }
4869142dfd88SStefano Zampini       ierr = KSPSetComputeSingularValues(check_ksp,PETSC_TRUE);CHKERRQ(ierr);
4870142dfd88SStefano Zampini     } else {
4871142dfd88SStefano Zampini       check_ksp_type = KSPPREONLY;
4872142dfd88SStefano Zampini     }
4873142dfd88SStefano Zampini     ierr = KSPSetType(check_ksp,check_ksp_type);CHKERRQ(ierr);
4874142dfd88SStefano Zampini     ierr = KSPGetPC(pcbddc->coarse_ksp,&check_pc);CHKERRQ(ierr);
4875142dfd88SStefano Zampini     ierr = KSPSetPC(check_ksp,check_pc);CHKERRQ(ierr);
4876142dfd88SStefano Zampini     ierr = KSPSetUp(check_ksp);CHKERRQ(ierr);
4877142dfd88SStefano Zampini     /* create random vec */
4878142dfd88SStefano Zampini     ierr = VecDuplicate(pcbddc->coarse_vec,&check_vec);CHKERRQ(ierr);
4879142dfd88SStefano Zampini     ierr = VecSetRandom(check_vec,PETSC_NULL);CHKERRQ(ierr);
48800bdf917eSStefano Zampini     if (pcbddc->CoarseNullSpace) { ierr = MatNullSpaceRemove(pcbddc->CoarseNullSpace,check_vec,PETSC_NULL);CHKERRQ(ierr); }
4881142dfd88SStefano Zampini     ierr = MatMult(pcbddc->coarse_mat,check_vec,pcbddc->coarse_rhs);CHKERRQ(ierr);
4882142dfd88SStefano Zampini     /* solve coarse problem */
4883142dfd88SStefano Zampini     ierr = KSPSolve(check_ksp,pcbddc->coarse_rhs,pcbddc->coarse_vec);CHKERRQ(ierr);
48840bdf917eSStefano Zampini     if (pcbddc->CoarseNullSpace) { ierr = MatNullSpaceRemove(pcbddc->CoarseNullSpace,pcbddc->coarse_vec,PETSC_NULL);CHKERRQ(ierr); }
4885142dfd88SStefano Zampini     /* check coarse problem residual error */
4886142dfd88SStefano Zampini     ierr = VecAXPY(check_vec,-1.0,pcbddc->coarse_vec);CHKERRQ(ierr);
4887142dfd88SStefano Zampini     ierr = VecNorm(check_vec,NORM_INFINITY,&infty_error);CHKERRQ(ierr);
4888142dfd88SStefano Zampini     ierr = MatMult(pcbddc->coarse_mat,check_vec,pcbddc->coarse_rhs);CHKERRQ(ierr);
4889142dfd88SStefano Zampini     ierr = VecNorm(pcbddc->coarse_rhs,NORM_INFINITY,&abs_infty_error);CHKERRQ(ierr);
4890142dfd88SStefano Zampini     ierr = VecDestroy(&check_vec);CHKERRQ(ierr);
4891142dfd88SStefano Zampini     /* get eigenvalue estimation if inexact */
4892142dfd88SStefano Zampini     if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
4893142dfd88SStefano Zampini       ierr = KSPComputeExtremeSingularValues(check_ksp,&lambda_max,&lambda_min);CHKERRQ(ierr);
4894142dfd88SStefano Zampini       ierr = KSPGetIterationNumber(check_ksp,&k);CHKERRQ(ierr);
4895142dfd88SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem eigenvalues estimated with %d iterations of %s.\n",k,check_ksp_type);CHKERRQ(ierr);
4896e269702eSStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem eigenvalues: % 1.14e %1.14e\n",lambda_min,lambda_max);CHKERRQ(ierr);
48973b03a366Sstefano_zampini     }
4898142dfd88SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem exact infty_error   : %1.14e\n",infty_error);CHKERRQ(ierr);
4899142dfd88SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem residual infty_error: %1.14e\n",abs_infty_error);CHKERRQ(ierr);
4900142dfd88SStefano Zampini     ierr = KSPDestroy(&check_ksp);CHKERRQ(ierr);
490153cdbc3dSStefano Zampini   }
4902142dfd88SStefano Zampini   if (dbg_flag) { ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); }
49030c7d97c5SJed Brown 
49040c7d97c5SJed Brown   PetscFunctionReturn(0);
49050c7d97c5SJed Brown }
49060c7d97c5SJed Brown 
49070c7d97c5SJed Brown #undef __FUNCT__
49080c7d97c5SJed Brown #define __FUNCT__ "PCBDDCManageLocalBoundaries"
490953cdbc3dSStefano Zampini static PetscErrorCode PCBDDCManageLocalBoundaries(PC pc)
49100c7d97c5SJed Brown {
49110c7d97c5SJed Brown 
49120c7d97c5SJed Brown   PC_BDDC     *pcbddc = (PC_BDDC*)pc->data;
49130c7d97c5SJed Brown   PC_IS         *pcis = (PC_IS*)pc->data;
49140c7d97c5SJed Brown   Mat_IS      *matis  = (Mat_IS*)pc->pmat->data;
4915da1bb401SStefano Zampini   PCBDDCGraph mat_graph=pcbddc->mat_graph;
49167cf533a6SStefano Zampini   PetscInt    *is_indices,*auxis;
49173b03a366Sstefano_zampini   PetscInt    bs,ierr,i,j,s,k,iindex,neumann_bsize,dirichlet_bsize;
4918da1bb401SStefano Zampini   PetscInt    total_counts,nodes_touched,where_values=1,vertex_size;
4919534831adSStefano Zampini   PetscMPIInt adapt_interface=0,adapt_interface_reduced=0,NEUMANNCNT=0;
4920da1bb401SStefano Zampini   PetscBool   same_set;
4921a0ba757dSStefano Zampini   MPI_Comm    interface_comm=((PetscObject)pc)->comm;
49223b03a366Sstefano_zampini   PetscBool   use_faces=PETSC_FALSE,use_edges=PETSC_FALSE;
49233b03a366Sstefano_zampini   const PetscInt *neumann_nodes;
49243b03a366Sstefano_zampini   const PetscInt *dirichlet_nodes;
4925a81d60d8SStefano Zampini   IS          used_IS,*custom_ISForDofs;
4926da1bb401SStefano Zampini   PetscScalar *array;
4927da1bb401SStefano Zampini   PetscScalar *array2;
4928da1bb401SStefano Zampini   PetscViewer viewer=pcbddc->dbg_viewer;
4929a929c220SStefano Zampini   PetscInt    *queue_in_global_numbering;
49300c7d97c5SJed Brown 
49310c7d97c5SJed Brown   PetscFunctionBegin;
4932da1bb401SStefano Zampini   /* Setup local adjacency graph */
4933da1bb401SStefano Zampini   mat_graph->nvtxs=pcis->n;
4934534831adSStefano Zampini   if (!mat_graph->xadj) { NEUMANNCNT = 1; }
4935da1bb401SStefano Zampini   ierr = PCBDDCSetupLocalAdjacencyGraph(pc);CHKERRQ(ierr);
4936a0ba757dSStefano Zampini   i = mat_graph->nvtxs;
4937a0ba757dSStefano Zampini   ierr = PetscMalloc4(i,PetscInt,&mat_graph->where,i,PetscInt,&mat_graph->count,i+1,PetscInt,&mat_graph->cptr,i,PetscInt,&mat_graph->queue);CHKERRQ(ierr);
49383972b0daSStefano Zampini   ierr = PetscMalloc2(i,PetscInt,&mat_graph->which_dof,i,PetscBool,&mat_graph->touched);CHKERRQ(ierr);
4939a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->where,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
4940a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->count,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
4941a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->which_dof,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
4942a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->queue,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
49433828260eSStefano Zampini   ierr = PetscMemzero(mat_graph->cptr,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr);
4944a0ba757dSStefano Zampini 
4945a81d60d8SStefano Zampini   /* Setting dofs splitting in mat_graph->which_dof
4946a81d60d8SStefano Zampini      Get information about dofs' splitting if provided by the user
4947a81d60d8SStefano Zampini      Otherwise it assumes a constant block size */
4948a81d60d8SStefano Zampini   vertex_size=0;
4949a81d60d8SStefano Zampini   if (!pcbddc->n_ISForDofs) {
4950a81d60d8SStefano Zampini     ierr = MatGetBlockSize(matis->A,&bs);CHKERRQ(ierr);
4951a81d60d8SStefano Zampini     ierr = PetscMalloc(bs*sizeof(IS),&custom_ISForDofs);CHKERRQ(ierr);
4952a81d60d8SStefano Zampini     for (i=0;i<bs;i++) {
4953a81d60d8SStefano Zampini       ierr = ISCreateStride(PETSC_COMM_SELF,pcis->n/bs,i,bs,&custom_ISForDofs[i]);CHKERRQ(ierr);
4954a81d60d8SStefano Zampini     }
4955a81d60d8SStefano Zampini     ierr = PCBDDCSetDofsSplitting(pc,bs,custom_ISForDofs);CHKERRQ(ierr);
4956a81d60d8SStefano Zampini     vertex_size=1;
4957a81d60d8SStefano Zampini     /* remove my references to IS objects */
4958a81d60d8SStefano Zampini     for (i=0;i<bs;i++) {
4959a81d60d8SStefano Zampini       ierr = ISDestroy(&custom_ISForDofs[i]);CHKERRQ(ierr);
4960a81d60d8SStefano Zampini     }
4961a81d60d8SStefano Zampini     ierr = PetscFree(custom_ISForDofs);CHKERRQ(ierr);
4962a81d60d8SStefano Zampini   }
49639c0446d6SStefano Zampini   for (i=0;i<pcbddc->n_ISForDofs;i++) {
4964a81d60d8SStefano Zampini     ierr = ISGetSize(pcbddc->ISForDofs[i],&k);CHKERRQ(ierr);
49659c0446d6SStefano Zampini     ierr = ISGetIndices(pcbddc->ISForDofs[i],(const PetscInt**)&is_indices);CHKERRQ(ierr);
4966a81d60d8SStefano Zampini     for (j=0;j<k;j++) {
49679c0446d6SStefano Zampini       mat_graph->which_dof[is_indices[j]]=i;
49689c0446d6SStefano Zampini     }
49699c0446d6SStefano Zampini     ierr = ISRestoreIndices(pcbddc->ISForDofs[i],(const PetscInt**)&is_indices);CHKERRQ(ierr);
49709c0446d6SStefano Zampini   }
4971a81d60d8SStefano Zampini   /* use mat block size as vertex size if it has not yet been set */
4972a81d60d8SStefano Zampini   if (!vertex_size) {
49733b03a366Sstefano_zampini     ierr = MatGetBlockSize(matis->A,&vertex_size);CHKERRQ(ierr);
49740c7d97c5SJed Brown   }
4975a81d60d8SStefano Zampini 
49763b03a366Sstefano_zampini   /* count number of neighbours per node */
49770c7d97c5SJed Brown   total_counts=0;
49783b03a366Sstefano_zampini   for (i=1;i<pcis->n_neigh;i++){
49790c7d97c5SJed Brown     s=pcis->n_shared[i];
49800c7d97c5SJed Brown     total_counts+=s;
498153cdbc3dSStefano Zampini     for (j=0;j<s;j++){
49820c7d97c5SJed Brown       mat_graph->count[pcis->shared[i][j]] += 1;
49830c7d97c5SJed Brown     }
49840c7d97c5SJed Brown   }
4985534831adSStefano Zampini   /* Take into account Neumann data -> it increments number of sharing subdomains for nodes lying on the interface */
498636e030ebSStefano Zampini   ierr = PCBDDCGetNeumannBoundaries(pc,&used_IS);CHKERRQ(ierr);
4987da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
4988da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
498936e030ebSStefano Zampini   if (used_IS) {
499036e030ebSStefano Zampini     ierr = ISGetSize(used_IS,&neumann_bsize);CHKERRQ(ierr);
499136e030ebSStefano Zampini     ierr = ISGetIndices(used_IS,&neumann_nodes);CHKERRQ(ierr);
499253cdbc3dSStefano Zampini     for (i=0;i<neumann_bsize;i++){
499353cdbc3dSStefano Zampini       iindex = neumann_nodes[i];
4994534831adSStefano Zampini       if (mat_graph->count[iindex] > NEUMANNCNT && array[iindex]==0.0){
499553cdbc3dSStefano Zampini         mat_graph->count[iindex]+=1;
49960c7d97c5SJed Brown         total_counts++;
4997da1bb401SStefano Zampini         array[iindex]=array[iindex]+1.0;
4998da1bb401SStefano Zampini       } else if (array[iindex]>0.0) {
4999da1bb401SStefano Zampini         SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"Error for neumann nodes provided to BDDC! They must be uniquely listed! Found duplicate node %d\n",iindex);
50000c7d97c5SJed Brown       }
50010c7d97c5SJed Brown     }
50020c7d97c5SJed Brown   }
5003da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
5004da1bb401SStefano Zampini   /* allocate space for storing the set of neighbours for each node */
5005da1bb401SStefano Zampini   ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt*),&mat_graph->neighbours_set);CHKERRQ(ierr);
5006da1bb401SStefano Zampini   if (mat_graph->nvtxs) { ierr = PetscMalloc(total_counts*sizeof(PetscInt),&mat_graph->neighbours_set[0]);CHKERRQ(ierr); }
5007da1bb401SStefano Zampini   for (i=1;i<mat_graph->nvtxs;i++) mat_graph->neighbours_set[i]=mat_graph->neighbours_set[i-1]+mat_graph->count[i-1];
5008a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->count,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
50093b03a366Sstefano_zampini   for (i=1;i<pcis->n_neigh;i++){
50100c7d97c5SJed Brown     s=pcis->n_shared[i];
50110c7d97c5SJed Brown     for (j=0;j<s;j++) {
50120c7d97c5SJed Brown       k=pcis->shared[i][j];
5013da1bb401SStefano Zampini       mat_graph->neighbours_set[k][mat_graph->count[k]] = pcis->neigh[i];
50140c7d97c5SJed Brown       mat_graph->count[k]+=1;
50150c7d97c5SJed Brown     }
50160c7d97c5SJed Brown   }
5017da1bb401SStefano Zampini   /* Check consistency of Neumann nodes */
5018da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
5019da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
5020da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
5021da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5022da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5023da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
50243b03a366Sstefano_zampini   /* set -1 fake neighbour to mimic Neumann boundary */
502536e030ebSStefano Zampini   if (used_IS) {
502653cdbc3dSStefano Zampini     for (i=0;i<neumann_bsize;i++){
502753cdbc3dSStefano Zampini       iindex = neumann_nodes[i];
5028534831adSStefano Zampini       if (mat_graph->count[iindex] > NEUMANNCNT){
5029da1bb401SStefano Zampini         if (mat_graph->count[iindex]+1 != (PetscInt)array[iindex]) {
5030da1bb401SStefano Zampini           SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_USER,"Neumann nodes provided to BDDC must be consistent among neighbours!\nNode %d: number of sharing subdomains %d != number of subdomains for which it is a neumann node %d\n",iindex,mat_graph->count[iindex]+1,(PetscInt)array[iindex]);
5031da1bb401SStefano Zampini         }
5032da1bb401SStefano Zampini         mat_graph->neighbours_set[iindex][mat_graph->count[iindex]] = -1;
503353cdbc3dSStefano Zampini         mat_graph->count[iindex]+=1;
50340c7d97c5SJed Brown       }
50350c7d97c5SJed Brown     }
503636e030ebSStefano Zampini     ierr = ISRestoreIndices(used_IS,&neumann_nodes);CHKERRQ(ierr);
50370c7d97c5SJed Brown   }
5038da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
5039da1bb401SStefano Zampini   /* sort set of sharing subdomains */
5040da1bb401SStefano Zampini   for (i=0;i<mat_graph->nvtxs;i++) { ierr = PetscSortInt(mat_graph->count[i],mat_graph->neighbours_set[i]);CHKERRQ(ierr); }
50413b03a366Sstefano_zampini   /* remove interior nodes and dirichlet boundary nodes from the next search into the graph */
5042da1bb401SStefano Zampini   for (i=0;i<mat_graph->nvtxs;i++){mat_graph->touched[i]=PETSC_FALSE;}
5043da1bb401SStefano Zampini   nodes_touched=0;
504436e030ebSStefano Zampini   ierr = PCBDDCGetDirichletBoundaries(pc,&used_IS);CHKERRQ(ierr);
5045da1bb401SStefano Zampini   ierr = VecSet(pcis->vec2_N,0.0);CHKERRQ(ierr);
5046da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
5047da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
5048da1bb401SStefano Zampini   if (used_IS) {
5049da1bb401SStefano Zampini     ierr = ISGetSize(used_IS,&dirichlet_bsize);CHKERRQ(ierr);
5050da1bb401SStefano Zampini     if (dirichlet_bsize && matis->pure_neumann) {
5051da1bb401SStefano Zampini       SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"Dirichlet boundaries are intended to be used with matrices with zeroed rows!\n");
5052da1bb401SStefano Zampini     }
5053da1bb401SStefano Zampini     ierr = ISGetIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
5054da1bb401SStefano Zampini     for (i=0;i<dirichlet_bsize;i++){
5055da1bb401SStefano Zampini       iindex=dirichlet_nodes[i];
5056da1bb401SStefano Zampini       if (mat_graph->count[iindex] && !mat_graph->touched[iindex]) {
5057da1bb401SStefano Zampini         if (array[iindex]>0.0) {
5058da1bb401SStefano Zampini           SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"BDDC cannot have nodes which are marked as Neumann and Dirichlet at the same time! Wrong node %d\n",iindex);
5059da1bb401SStefano Zampini         }
5060da1bb401SStefano Zampini         mat_graph->touched[iindex]=PETSC_TRUE;
5061da1bb401SStefano Zampini         mat_graph->where[iindex]=0;
5062da1bb401SStefano Zampini         nodes_touched++;
5063da1bb401SStefano Zampini         array2[iindex]=array2[iindex]+1.0;
5064da1bb401SStefano Zampini       }
5065da1bb401SStefano Zampini     }
5066da1bb401SStefano Zampini     ierr = ISRestoreIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
5067da1bb401SStefano Zampini   }
5068da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
5069da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
5070da1bb401SStefano Zampini   /* Check consistency of Dirichlet nodes */
5071da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_N,1.0);CHKERRQ(ierr);
5072da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
5073da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
5074da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
5075da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5076da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5077da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
5078da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec2_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
5079da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec2_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
5080da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5081da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5082da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
5083da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
508436e030ebSStefano Zampini   if (used_IS) {
508536e030ebSStefano Zampini     ierr = ISGetSize(used_IS,&dirichlet_bsize);CHKERRQ(ierr);
508636e030ebSStefano Zampini     ierr = ISGetIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
50873b03a366Sstefano_zampini     for (i=0;i<dirichlet_bsize;i++){
5088da1bb401SStefano Zampini       iindex=dirichlet_nodes[i];
5089da1bb401SStefano Zampini       if (array[iindex]>1.0 && array[iindex]!=array2[iindex] ) {
5090da1bb401SStefano Zampini          SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_USER,"Dirichlet nodes provided to BDDC must be consistent among neighbours!\nNode %d: number of sharing subdomains %d != number of subdomains for which it is a neumann node %d\n",iindex,(PetscInt)array[iindex],(PetscInt)array2[iindex]);
5091da1bb401SStefano Zampini       }
50923b03a366Sstefano_zampini     }
509336e030ebSStefano Zampini     ierr = ISRestoreIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
50943b03a366Sstefano_zampini   }
5095da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
5096da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
5097da1bb401SStefano Zampini 
50980c7d97c5SJed Brown   for (i=0;i<mat_graph->nvtxs;i++){
50993b03a366Sstefano_zampini     if (!mat_graph->count[i]){  /* interior nodes */
51000c7d97c5SJed Brown       mat_graph->touched[i]=PETSC_TRUE;
51010c7d97c5SJed Brown       mat_graph->where[i]=0;
51020c7d97c5SJed Brown       nodes_touched++;
51030c7d97c5SJed Brown     }
51040c7d97c5SJed Brown   }
51050c7d97c5SJed Brown   mat_graph->ncmps = 0;
5106da1bb401SStefano Zampini   i=0;
51070c7d97c5SJed Brown   while(nodes_touched<mat_graph->nvtxs) {
5108a0ba757dSStefano Zampini     /*  find first untouched node in local ordering */
51090c7d97c5SJed Brown     while(mat_graph->touched[i]) i++;
51100c7d97c5SJed Brown     mat_graph->touched[i]=PETSC_TRUE;
5111a0ba757dSStefano Zampini     mat_graph->where[i]=where_values;
51120c7d97c5SJed Brown     nodes_touched++;
5113a0ba757dSStefano Zampini     /* now find all other nodes having the same set of sharing subdomains */
51140c7d97c5SJed Brown     for (j=i+1;j<mat_graph->nvtxs;j++){
5115a0ba757dSStefano Zampini       /* check for same number of sharing subdomains and dof number */
5116da1bb401SStefano Zampini       if (!mat_graph->touched[j] && mat_graph->count[i]==mat_graph->count[j] && mat_graph->which_dof[i] == mat_graph->which_dof[j] ){
5117a0ba757dSStefano Zampini         /* check for same set of sharing subdomains */
51180c7d97c5SJed Brown         same_set=PETSC_TRUE;
51190c7d97c5SJed Brown         for (k=0;k<mat_graph->count[j];k++){
5120da1bb401SStefano Zampini           if (mat_graph->neighbours_set[i][k]!=mat_graph->neighbours_set[j][k]) {
51210c7d97c5SJed Brown             same_set=PETSC_FALSE;
51220c7d97c5SJed Brown           }
51230c7d97c5SJed Brown         }
5124a0ba757dSStefano Zampini         /* I found a friend of mine */
51250c7d97c5SJed Brown         if (same_set) {
5126a0ba757dSStefano Zampini           mat_graph->where[j]=where_values;
51270c7d97c5SJed Brown           mat_graph->touched[j]=PETSC_TRUE;
51280c7d97c5SJed Brown           nodes_touched++;
51290c7d97c5SJed Brown         }
51300c7d97c5SJed Brown       }
51310c7d97c5SJed Brown     }
5132a0ba757dSStefano Zampini     where_values++;
51330c7d97c5SJed Brown   }
5134a0ba757dSStefano Zampini   where_values--; if (where_values<0) where_values=0;
5135a0ba757dSStefano Zampini   ierr = PetscMalloc(where_values*sizeof(PetscMPIInt),&mat_graph->where_ncmps);CHKERRQ(ierr);
5136a0ba757dSStefano Zampini   /* Find connected components defined on the shared interface */
5137a0ba757dSStefano Zampini   if (where_values) {
5138a0ba757dSStefano Zampini     ierr = PCBDDCFindConnectedComponents(mat_graph, where_values);
5139a0ba757dSStefano Zampini   }
5140a929c220SStefano Zampini   ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt),&queue_in_global_numbering);CHKERRQ(ierr);
5141a0ba757dSStefano Zampini   /* check consistency of connected components among neighbouring subdomains -> adapt them if needed */
5142a0ba757dSStefano Zampini   for (i=0;i<where_values;i++) {
51437cf533a6SStefano Zampini     /* We are not sure that on a given subset of the local interface,
51447cf533a6SStefano Zampini        two connected components will be the same among sharing subdomains */
51453b03a366Sstefano_zampini     if (mat_graph->where_ncmps[i]>1) {
5146a0ba757dSStefano Zampini       adapt_interface=1;
5147a0ba757dSStefano Zampini       break;
5148a0ba757dSStefano Zampini     }
5149a0ba757dSStefano Zampini   }
5150a0ba757dSStefano Zampini   ierr = MPI_Allreduce(&adapt_interface,&adapt_interface_reduced,1,MPIU_INT,MPI_LOR,interface_comm);CHKERRQ(ierr);
5151da1bb401SStefano Zampini   if (pcbddc->dbg_flag && adapt_interface_reduced) {
5152d8923723SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"Adapting interface\n");CHKERRQ(ierr);
5153da1bb401SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
5154da1bb401SStefano Zampini   }
5155a0ba757dSStefano Zampini   if (where_values && adapt_interface_reduced) {
51560c7d97c5SJed Brown 
5157a0ba757dSStefano Zampini     PetscInt sum_requests=0,my_rank;
5158a0ba757dSStefano Zampini     PetscInt buffer_size,start_of_recv,size_of_recv,start_of_send;
5159a0ba757dSStefano Zampini     PetscInt temp_buffer_size,ins_val,global_where_counter;
5160a0ba757dSStefano Zampini     PetscInt *cum_recv_counts;
5161a0ba757dSStefano Zampini     PetscInt *where_to_nodes_indices;
5162a0ba757dSStefano Zampini     PetscInt *petsc_buffer;
5163a0ba757dSStefano Zampini     PetscMPIInt *recv_buffer;
5164a0ba757dSStefano Zampini     PetscMPIInt *recv_buffer_where;
5165a0ba757dSStefano Zampini     PetscMPIInt *send_buffer;
5166a0ba757dSStefano Zampini     PetscMPIInt size_of_send;
5167a0ba757dSStefano Zampini     PetscInt *sizes_of_sends;
5168a0ba757dSStefano Zampini     MPI_Request *send_requests;
5169a0ba757dSStefano Zampini     MPI_Request *recv_requests;
5170a0ba757dSStefano Zampini     PetscInt *where_cc_adapt;
5171a0ba757dSStefano Zampini     PetscInt **temp_buffer;
5172a0ba757dSStefano Zampini     PetscInt *nodes_to_temp_buffer_indices;
5173a0ba757dSStefano Zampini     PetscInt *add_to_where;
51747cf533a6SStefano Zampini     PetscInt *aux_new_xadj,*new_xadj,*new_adjncy;
5175a0ba757dSStefano Zampini 
51767cf533a6SStefano Zampini     /* Restrict adjacency graph using information from connected components */
51777cf533a6SStefano Zampini     ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt),&aux_new_xadj);CHKERRQ(ierr);
51787cf533a6SStefano Zampini     for (i=0;i<mat_graph->nvtxs;i++) {
51797cf533a6SStefano Zampini       aux_new_xadj[i]=1;
51807cf533a6SStefano Zampini     }
51817cf533a6SStefano Zampini     for (i=0;i<mat_graph->ncmps;i++) {
51827cf533a6SStefano Zampini       k = mat_graph->cptr[i+1]-mat_graph->cptr[i];
51837cf533a6SStefano Zampini       for (j=0;j<k;j++) {
51847cf533a6SStefano Zampini         aux_new_xadj[mat_graph->queue[mat_graph->cptr[i]+j]]=k;
51857cf533a6SStefano Zampini       }
51867cf533a6SStefano Zampini     }
51877cf533a6SStefano Zampini     j = 0;
51887cf533a6SStefano Zampini     for (i=0;i<mat_graph->nvtxs;i++) {
51897cf533a6SStefano Zampini       j += aux_new_xadj[i];
51907cf533a6SStefano Zampini     }
51917cf533a6SStefano Zampini     ierr = PetscMalloc((mat_graph->nvtxs+1)*sizeof(PetscInt),&new_xadj);CHKERRQ(ierr);
51927cf533a6SStefano Zampini     ierr = PetscMalloc(j*sizeof(PetscInt),&new_adjncy);CHKERRQ(ierr);
51937cf533a6SStefano Zampini     new_xadj[0]=0;
51947cf533a6SStefano Zampini     for (i=0;i<mat_graph->nvtxs;i++) {
51957cf533a6SStefano Zampini       new_xadj[i+1]=new_xadj[i]+aux_new_xadj[i];
51967cf533a6SStefano Zampini       if (aux_new_xadj[i]==1) {
51977cf533a6SStefano Zampini         new_adjncy[new_xadj[i]]=i;
51987cf533a6SStefano Zampini       }
51997cf533a6SStefano Zampini     }
5200354b9337SStefano Zampini     ierr = PetscFree(aux_new_xadj);CHKERRQ(ierr);
52017cf533a6SStefano Zampini     for (i=0;i<mat_graph->ncmps;i++) {
52027cf533a6SStefano Zampini       k = mat_graph->cptr[i+1]-mat_graph->cptr[i];
52037cf533a6SStefano Zampini       for (j=0;j<k;j++) {
52047cf533a6SStefano Zampini         ierr = PetscMemcpy(&new_adjncy[new_xadj[mat_graph->queue[mat_graph->cptr[i]+j]]],&mat_graph->queue[mat_graph->cptr[i]],k*sizeof(PetscInt));CHKERRQ(ierr);
52057cf533a6SStefano Zampini       }
52067cf533a6SStefano Zampini     }
52077cf533a6SStefano Zampini     ierr = PCBDDCSetLocalAdjacencyGraph(pc,mat_graph->nvtxs,new_xadj,new_adjncy,PETSC_OWN_POINTER);CHKERRQ(ierr);
52087cf533a6SStefano Zampini     /* For consistency among neighbouring procs, I need to sort (by global ordering) each connected component */
52097cf533a6SStefano Zampini     for (i=0;i<mat_graph->ncmps;i++) {
52107cf533a6SStefano Zampini       k = mat_graph->cptr[i+1]-mat_graph->cptr[i];
52117cf533a6SStefano Zampini       ierr = ISLocalToGlobalMappingApply(matis->mapping,k,&mat_graph->queue[mat_graph->cptr[i]],&queue_in_global_numbering[mat_graph->cptr[i]]);CHKERRQ(ierr);
52127cf533a6SStefano Zampini       ierr = PetscSortIntWithArray(k,&queue_in_global_numbering[mat_graph->cptr[i]],&mat_graph->queue[mat_graph->cptr[i]]);CHKERRQ(ierr);
52137cf533a6SStefano Zampini     }
52147cf533a6SStefano Zampini     /* allocate some space */
5215a0ba757dSStefano Zampini     ierr = MPI_Comm_rank(interface_comm,&my_rank);CHKERRQ(ierr);
5216a0ba757dSStefano Zampini     ierr = PetscMalloc((where_values+1)*sizeof(PetscInt),&cum_recv_counts);CHKERRQ(ierr);
5217a0ba757dSStefano Zampini     ierr = PetscMemzero(cum_recv_counts,(where_values+1)*sizeof(PetscInt));CHKERRQ(ierr);
5218a0ba757dSStefano Zampini     ierr = PetscMalloc(where_values*sizeof(PetscInt),&where_to_nodes_indices);CHKERRQ(ierr);
5219a0ba757dSStefano Zampini     /* first count how many neighbours per connected component I will receive from */
5220a0ba757dSStefano Zampini     cum_recv_counts[0]=0;
5221a0ba757dSStefano Zampini     for (i=1;i<where_values+1;i++){
5222a0ba757dSStefano Zampini       j=0;
5223d8923723SStefano Zampini       while(mat_graph->where[j] != i) { j++; }
5224a0ba757dSStefano Zampini       where_to_nodes_indices[i-1]=j;
5225da1bb401SStefano Zampini       if (mat_graph->neighbours_set[j][0]!=-1) { cum_recv_counts[i]=cum_recv_counts[i-1]+mat_graph->count[j]; } /* We don't want sends/recvs_to/from_self -> here I don't count myself  */
52263b03a366Sstefano_zampini       else { cum_recv_counts[i]=cum_recv_counts[i-1]+mat_graph->count[j]-1; }
5227a0ba757dSStefano Zampini     }
5228a0ba757dSStefano Zampini     ierr = PetscMalloc(2*cum_recv_counts[where_values]*sizeof(PetscMPIInt),&recv_buffer_where);CHKERRQ(ierr);
5229a0ba757dSStefano Zampini     ierr = PetscMalloc(cum_recv_counts[where_values]*sizeof(MPI_Request),&send_requests);CHKERRQ(ierr);
5230a0ba757dSStefano Zampini     ierr = PetscMalloc(cum_recv_counts[where_values]*sizeof(MPI_Request),&recv_requests);CHKERRQ(ierr);
5231a0ba757dSStefano Zampini     for (i=0;i<cum_recv_counts[where_values];i++) {
5232a0ba757dSStefano Zampini       send_requests[i]=MPI_REQUEST_NULL;
5233a0ba757dSStefano Zampini       recv_requests[i]=MPI_REQUEST_NULL;
5234a0ba757dSStefano Zampini     }
5235a0ba757dSStefano Zampini     /* exchange with my neighbours the number of my connected components on the shared interface */
5236a0ba757dSStefano Zampini     for (i=0;i<where_values;i++){
5237a0ba757dSStefano Zampini       j=where_to_nodes_indices[i];
5238da1bb401SStefano Zampini       k = (mat_graph->neighbours_set[j][0] == -1 ?  1 : 0);
5239a0ba757dSStefano Zampini       for (;k<mat_graph->count[j];k++){
5240da1bb401SStefano Zampini         ierr = MPI_Isend(&mat_graph->where_ncmps[i],1,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr);
5241da1bb401SStefano Zampini         ierr = MPI_Irecv(&recv_buffer_where[sum_requests],1,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr);
5242a0ba757dSStefano Zampini         sum_requests++;
5243a0ba757dSStefano Zampini       }
5244a0ba757dSStefano Zampini     }
5245a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
5246a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
5247a0ba757dSStefano Zampini     /* determine the connected component I need to adapt */
5248a0ba757dSStefano Zampini     ierr = PetscMalloc(where_values*sizeof(PetscInt),&where_cc_adapt);CHKERRQ(ierr);
5249a0ba757dSStefano Zampini     ierr = PetscMemzero(where_cc_adapt,where_values*sizeof(PetscInt));CHKERRQ(ierr);
5250a0ba757dSStefano Zampini     for (i=0;i<where_values;i++){
5251a0ba757dSStefano Zampini       for (j=cum_recv_counts[i];j<cum_recv_counts[i+1];j++){
52523b03a366Sstefano_zampini         /* The first condition is natural (i.e someone has a different number of cc than me), the second one is just to be safe */
52533b03a366Sstefano_zampini         if ( mat_graph->where_ncmps[i]!=recv_buffer_where[j] || mat_graph->where_ncmps[i] > 1 ) {
5254a0ba757dSStefano Zampini           where_cc_adapt[i]=PETSC_TRUE;
5255a0ba757dSStefano Zampini           break;
5256a0ba757dSStefano Zampini         }
5257a0ba757dSStefano Zampini       }
5258a0ba757dSStefano Zampini     }
5259d8923723SStefano Zampini     buffer_size = 0;
5260d8923723SStefano Zampini     for (i=0;i<where_values;i++) {
5261d8923723SStefano Zampini       if (where_cc_adapt[i]) {
5262d8923723SStefano Zampini         for (j=i;j<mat_graph->ncmps;j++) {
5263d8923723SStefano Zampini           if (mat_graph->where[mat_graph->queue[mat_graph->cptr[j]]] == i+1) { /* WARNING -> where values goes from 1 to where_values included */
5264d8923723SStefano Zampini             buffer_size += 1 + mat_graph->cptr[j+1]-mat_graph->cptr[j];
5265d8923723SStefano Zampini           }
5266d8923723SStefano Zampini         }
5267d8923723SStefano Zampini       }
5268d8923723SStefano Zampini     }
5269d8923723SStefano Zampini     ierr = PetscMalloc(buffer_size*sizeof(PetscMPIInt),&send_buffer);CHKERRQ(ierr);
5270a0ba757dSStefano Zampini     /* now get from neighbours their ccs (in global numbering) and adapt them (in case it is needed) */
5271a0ba757dSStefano Zampini     /* first determine how much data to send (size of each queue plus the global indices) and communicate it to neighbours */
5272a0ba757dSStefano Zampini     ierr = PetscMalloc(where_values*sizeof(PetscInt),&sizes_of_sends);CHKERRQ(ierr);
5273a0ba757dSStefano Zampini     ierr = PetscMemzero(sizes_of_sends,where_values*sizeof(PetscInt));CHKERRQ(ierr);
5274a0ba757dSStefano Zampini     sum_requests=0;
5275a0ba757dSStefano Zampini     start_of_send=0;
5276a0ba757dSStefano Zampini     start_of_recv=cum_recv_counts[where_values];
5277a0ba757dSStefano Zampini     for (i=0;i<where_values;i++) {
5278a0ba757dSStefano Zampini       if (where_cc_adapt[i]) {
5279a0ba757dSStefano Zampini         size_of_send=0;
5280a0ba757dSStefano Zampini         for (j=i;j<mat_graph->ncmps;j++) {
5281a0ba757dSStefano Zampini           if (mat_graph->where[mat_graph->queue[mat_graph->cptr[j]]] == i+1) { /* WARNING -> where values goes from 1 to where_values included */
5282a0ba757dSStefano Zampini             send_buffer[start_of_send+size_of_send]=mat_graph->cptr[j+1]-mat_graph->cptr[j];
5283a0ba757dSStefano Zampini             size_of_send+=1;
5284a0ba757dSStefano Zampini             for (k=0;k<mat_graph->cptr[j+1]-mat_graph->cptr[j];k++) {
5285a0ba757dSStefano Zampini               send_buffer[start_of_send+size_of_send+k]=queue_in_global_numbering[mat_graph->cptr[j]+k];
5286a0ba757dSStefano Zampini             }
5287a0ba757dSStefano Zampini             size_of_send=size_of_send+mat_graph->cptr[j+1]-mat_graph->cptr[j];
5288a0ba757dSStefano Zampini           }
5289a0ba757dSStefano Zampini         }
5290a0ba757dSStefano Zampini         j = where_to_nodes_indices[i];
5291da1bb401SStefano Zampini         k = (mat_graph->neighbours_set[j][0] == -1 ?  1 : 0);
529211d8f4c2SStefano Zampini         sizes_of_sends[i]=size_of_send;
5293a0ba757dSStefano Zampini         for (;k<mat_graph->count[j];k++){
529411d8f4c2SStefano Zampini           ierr = MPI_Isend(&sizes_of_sends[i],1,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr);
5295da1bb401SStefano Zampini           ierr = MPI_Irecv(&recv_buffer_where[sum_requests+start_of_recv],1,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr);
5296a0ba757dSStefano Zampini           sum_requests++;
5297a0ba757dSStefano Zampini         }
5298a0ba757dSStefano Zampini         start_of_send+=size_of_send;
5299a0ba757dSStefano Zampini       }
5300a0ba757dSStefano Zampini     }
5301a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
5302a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
5303a0ba757dSStefano Zampini     buffer_size=0;
5304a0ba757dSStefano Zampini     for (k=0;k<sum_requests;k++) { buffer_size+=recv_buffer_where[start_of_recv+k]; }
5305a0ba757dSStefano Zampini     ierr = PetscMalloc(buffer_size*sizeof(PetscMPIInt),&recv_buffer);CHKERRQ(ierr);
5306a0ba757dSStefano Zampini     /* now exchange the data */
5307a0ba757dSStefano Zampini     start_of_recv=0;
5308a0ba757dSStefano Zampini     start_of_send=0;
5309a0ba757dSStefano Zampini     sum_requests=0;
5310a0ba757dSStefano Zampini     for (i=0;i<where_values;i++) {
5311a0ba757dSStefano Zampini       if (where_cc_adapt[i]) {
5312a0ba757dSStefano Zampini         size_of_send = sizes_of_sends[i];
5313a0ba757dSStefano Zampini         j = where_to_nodes_indices[i];
5314da1bb401SStefano Zampini         k = (mat_graph->neighbours_set[j][0] == -1 ?  1 : 0);
5315a0ba757dSStefano Zampini         for (;k<mat_graph->count[j];k++){
5316da1bb401SStefano Zampini           ierr = MPI_Isend(&send_buffer[start_of_send],size_of_send,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr);
5317a0ba757dSStefano Zampini           size_of_recv=recv_buffer_where[cum_recv_counts[where_values]+sum_requests];
5318da1bb401SStefano Zampini           ierr = MPI_Irecv(&recv_buffer[start_of_recv],size_of_recv,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr);
5319a0ba757dSStefano Zampini           start_of_recv+=size_of_recv;
5320a0ba757dSStefano Zampini           sum_requests++;
5321a0ba757dSStefano Zampini         }
5322a0ba757dSStefano Zampini         start_of_send+=size_of_send;
5323a0ba757dSStefano Zampini       }
5324a0ba757dSStefano Zampini     }
5325a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
5326a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
5327a0ba757dSStefano Zampini     ierr = PetscMalloc(buffer_size*sizeof(PetscInt),&petsc_buffer);CHKERRQ(ierr);
5328a0ba757dSStefano Zampini     for (k=0;k<start_of_recv;k++) { petsc_buffer[k]=(PetscInt)recv_buffer[k]; }
5329a0ba757dSStefano Zampini     for (j=0;j<buffer_size;) {
5330a0ba757dSStefano Zampini        ierr = ISGlobalToLocalMappingApply(matis->mapping,IS_GTOLM_MASK,petsc_buffer[j],&petsc_buffer[j+1],&petsc_buffer[j],&petsc_buffer[j+1]);CHKERRQ(ierr);
5331a0ba757dSStefano Zampini        k=petsc_buffer[j]+1;
5332a0ba757dSStefano Zampini        j+=k;
5333a0ba757dSStefano Zampini     }
5334a0ba757dSStefano Zampini     sum_requests=cum_recv_counts[where_values];
5335a0ba757dSStefano Zampini     start_of_recv=0;
5336a0ba757dSStefano Zampini     ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt),&nodes_to_temp_buffer_indices);CHKERRQ(ierr);
5337a0ba757dSStefano Zampini     global_where_counter=0;
5338a0ba757dSStefano Zampini     for (i=0;i<where_values;i++){
5339a0ba757dSStefano Zampini       if (where_cc_adapt[i]){
5340a0ba757dSStefano Zampini         temp_buffer_size=0;
5341a0ba757dSStefano Zampini         /* find nodes on the shared interface we need to adapt */
5342a0ba757dSStefano Zampini         for (j=0;j<mat_graph->nvtxs;j++){
5343a0ba757dSStefano Zampini           if (mat_graph->where[j]==i+1) {
5344a0ba757dSStefano Zampini             nodes_to_temp_buffer_indices[j]=temp_buffer_size;
5345a0ba757dSStefano Zampini             temp_buffer_size++;
5346a0ba757dSStefano Zampini           } else {
5347a0ba757dSStefano Zampini             nodes_to_temp_buffer_indices[j]=-1;
5348a0ba757dSStefano Zampini           }
5349a0ba757dSStefano Zampini         }
5350a0ba757dSStefano Zampini         /* allocate some temporary space */
5351a0ba757dSStefano Zampini         ierr = PetscMalloc(temp_buffer_size*sizeof(PetscInt*),&temp_buffer);CHKERRQ(ierr);
5352a0ba757dSStefano Zampini         ierr = PetscMalloc(temp_buffer_size*(cum_recv_counts[i+1]-cum_recv_counts[i])*sizeof(PetscInt),&temp_buffer[0]);CHKERRQ(ierr);
5353a0ba757dSStefano Zampini         ierr = PetscMemzero(temp_buffer[0],temp_buffer_size*(cum_recv_counts[i+1]-cum_recv_counts[i])*sizeof(PetscInt));CHKERRQ(ierr);
5354a0ba757dSStefano Zampini         for (j=1;j<temp_buffer_size;j++){
5355a0ba757dSStefano Zampini           temp_buffer[j]=temp_buffer[j-1]+cum_recv_counts[i+1]-cum_recv_counts[i];
5356a0ba757dSStefano Zampini         }
5357a0ba757dSStefano Zampini         /* analyze contributions from neighbouring subdomains for i-th conn comp
5358a0ba757dSStefano Zampini            temp buffer structure:
5359a0ba757dSStefano Zampini            supposing part of the interface has dimension 5 (global nodes 0,1,2,3,4)
5360a0ba757dSStefano Zampini            3 neighs procs with structured connected components:
5361a0ba757dSStefano Zampini              neigh 0: [0 1 4], [2 3];  (2 connected components)
5362a0ba757dSStefano Zampini              neigh 1: [0 1], [2 3 4];  (2 connected components)
5363a0ba757dSStefano Zampini              neigh 2: [0 4], [1], [2 3]; (3 connected components)
5364a0ba757dSStefano Zampini            tempbuffer (row-oriented) should be filled as:
5365a0ba757dSStefano Zampini              [ 0, 0, 0;
5366a0ba757dSStefano Zampini                0, 0, 1;
5367a0ba757dSStefano Zampini                1, 1, 2;
5368a0ba757dSStefano Zampini                1, 1, 2;
5369a0ba757dSStefano Zampini                0, 1, 0; ];
5370a0ba757dSStefano Zampini            This way we can simply recover the resulting structure, accounting for possible intersections of ccs among neighs.
5371a0ba757dSStefano Zampini            The mat_graph->where array will be modified to reproduce the following 4 connected components [0], [1], [2 3], [4];
5372a0ba757dSStefano Zampini                                                                                                                                    */
5373a0ba757dSStefano Zampini         for (j=0;j<cum_recv_counts[i+1]-cum_recv_counts[i];j++) {
5374a0ba757dSStefano Zampini           ins_val=0;
5375a0ba757dSStefano Zampini           size_of_recv=recv_buffer_where[sum_requests];  /* total size of recv from neighs */
5376a0ba757dSStefano Zampini           for (buffer_size=0;buffer_size<size_of_recv;) {  /* loop until all data from neighs has been taken into account */
5377a0ba757dSStefano Zampini             for (k=1;k<petsc_buffer[buffer_size+start_of_recv]+1;k++) { /* filling properly temp_buffer using data from a single recv */
5378a0ba757dSStefano Zampini               temp_buffer[ nodes_to_temp_buffer_indices[ petsc_buffer[ start_of_recv+buffer_size+k ] ] ][j]=ins_val;
5379a0ba757dSStefano Zampini             }
5380a0ba757dSStefano Zampini             buffer_size+=k;
5381a0ba757dSStefano Zampini             ins_val++;
5382a0ba757dSStefano Zampini           }
5383a0ba757dSStefano Zampini           start_of_recv+=size_of_recv;
5384a0ba757dSStefano Zampini           sum_requests++;
5385a0ba757dSStefano Zampini         }
5386a0ba757dSStefano Zampini         ierr = PetscMalloc(temp_buffer_size*sizeof(PetscInt),&add_to_where);CHKERRQ(ierr);
5387a0ba757dSStefano Zampini         ierr = PetscMemzero(add_to_where,temp_buffer_size*sizeof(PetscInt));CHKERRQ(ierr);
5388a0ba757dSStefano Zampini         for (j=0;j<temp_buffer_size;j++){
5389a0ba757dSStefano Zampini           if (!add_to_where[j]){ /* found a new cc  */
5390a0ba757dSStefano Zampini             global_where_counter++;
5391a0ba757dSStefano Zampini             add_to_where[j]=global_where_counter;
5392a0ba757dSStefano Zampini             for (k=j+1;k<temp_buffer_size;k++){ /* check for other nodes in new cc */
5393a0ba757dSStefano Zampini               same_set=PETSC_TRUE;
5394a0ba757dSStefano Zampini               for (s=0;s<cum_recv_counts[i+1]-cum_recv_counts[i];s++){
5395a0ba757dSStefano Zampini                 if (temp_buffer[j][s]!=temp_buffer[k][s]) {
5396a0ba757dSStefano Zampini                   same_set=PETSC_FALSE;
5397a0ba757dSStefano Zampini                   break;
5398a0ba757dSStefano Zampini                 }
5399a0ba757dSStefano Zampini               }
54002e8d2280SStefano Zampini               if (same_set) { add_to_where[k]=global_where_counter; }
5401a0ba757dSStefano Zampini             }
5402a0ba757dSStefano Zampini           }
5403a0ba757dSStefano Zampini         }
5404a0ba757dSStefano Zampini         /* insert new data in where array */
5405a0ba757dSStefano Zampini         temp_buffer_size=0;
5406a0ba757dSStefano Zampini         for (j=0;j<mat_graph->nvtxs;j++){
5407a0ba757dSStefano Zampini           if (mat_graph->where[j]==i+1) {
5408a0ba757dSStefano Zampini             mat_graph->where[j]=where_values+add_to_where[temp_buffer_size];
5409a0ba757dSStefano Zampini             temp_buffer_size++;
5410a0ba757dSStefano Zampini           }
5411a0ba757dSStefano Zampini         }
5412a0ba757dSStefano Zampini         ierr = PetscFree(temp_buffer[0]);CHKERRQ(ierr);
5413a0ba757dSStefano Zampini         ierr = PetscFree(temp_buffer);CHKERRQ(ierr);
5414a0ba757dSStefano Zampini         ierr = PetscFree(add_to_where);CHKERRQ(ierr);
5415a0ba757dSStefano Zampini       }
5416a0ba757dSStefano Zampini     }
5417a0ba757dSStefano Zampini     ierr = PetscFree(nodes_to_temp_buffer_indices);CHKERRQ(ierr);
5418a0ba757dSStefano Zampini     ierr = PetscFree(sizes_of_sends);CHKERRQ(ierr);
5419a0ba757dSStefano Zampini     ierr = PetscFree(send_requests);CHKERRQ(ierr);
5420a0ba757dSStefano Zampini     ierr = PetscFree(recv_requests);CHKERRQ(ierr);
5421a0ba757dSStefano Zampini     ierr = PetscFree(petsc_buffer);CHKERRQ(ierr);
5422a0ba757dSStefano Zampini     ierr = PetscFree(recv_buffer);CHKERRQ(ierr);
5423a0ba757dSStefano Zampini     ierr = PetscFree(recv_buffer_where);CHKERRQ(ierr);
5424a0ba757dSStefano Zampini     ierr = PetscFree(send_buffer);CHKERRQ(ierr);
5425a0ba757dSStefano Zampini     ierr = PetscFree(cum_recv_counts);CHKERRQ(ierr);
5426a0ba757dSStefano Zampini     ierr = PetscFree(where_to_nodes_indices);CHKERRQ(ierr);
542723d4d1a5SStefano Zampini     ierr = PetscFree(where_cc_adapt);CHKERRQ(ierr);
5428a0ba757dSStefano Zampini     /* We are ready to evaluate consistent connected components on each part of the shared interface */
5429a0ba757dSStefano Zampini     if (global_where_counter) {
5430a0ba757dSStefano Zampini       for (i=0;i<mat_graph->nvtxs;i++){ mat_graph->touched[i]=PETSC_FALSE; }
5431a0ba757dSStefano Zampini       global_where_counter=0;
5432a0ba757dSStefano Zampini       for (i=0;i<mat_graph->nvtxs;i++){
5433a0ba757dSStefano Zampini         if (mat_graph->where[i] && !mat_graph->touched[i]) {
5434a0ba757dSStefano Zampini           global_where_counter++;
5435a0ba757dSStefano Zampini           for (j=i+1;j<mat_graph->nvtxs;j++){
5436a0ba757dSStefano Zampini             if (!mat_graph->touched[j] && mat_graph->where[j]==mat_graph->where[i]) {
5437a0ba757dSStefano Zampini               mat_graph->where[j]=global_where_counter;
5438a0ba757dSStefano Zampini               mat_graph->touched[j]=PETSC_TRUE;
5439a0ba757dSStefano Zampini             }
5440a0ba757dSStefano Zampini           }
5441a0ba757dSStefano Zampini           mat_graph->where[i]=global_where_counter;
5442a0ba757dSStefano Zampini           mat_graph->touched[i]=PETSC_TRUE;
5443a0ba757dSStefano Zampini         }
5444a0ba757dSStefano Zampini       }
5445a0ba757dSStefano Zampini       where_values=global_where_counter;
5446a0ba757dSStefano Zampini     }
5447a0ba757dSStefano Zampini     if (global_where_counter) {
5448a0ba757dSStefano Zampini       ierr = PetscMemzero(mat_graph->cptr,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr);
5449a0ba757dSStefano Zampini       ierr = PetscMemzero(mat_graph->queue,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
5450a0ba757dSStefano Zampini       ierr = PetscFree(mat_graph->where_ncmps);CHKERRQ(ierr);
5451a0ba757dSStefano Zampini       ierr = PetscMalloc(where_values*sizeof(PetscMPIInt),&mat_graph->where_ncmps);CHKERRQ(ierr);
5452a0ba757dSStefano Zampini       ierr = PCBDDCFindConnectedComponents(mat_graph, where_values);
5453a0ba757dSStefano Zampini     }
54543b03a366Sstefano_zampini   } /* Finished adapting interface */
5455a929c220SStefano Zampini   /* For consistency among neighbouring procs, I need to sort (by global ordering) each connected component */
5456a929c220SStefano Zampini   for (i=0;i<mat_graph->ncmps;i++) {
5457a929c220SStefano Zampini     k = mat_graph->cptr[i+1]-mat_graph->cptr[i];
5458a929c220SStefano Zampini     ierr = ISLocalToGlobalMappingApply(matis->mapping,k,&mat_graph->queue[mat_graph->cptr[i]],&queue_in_global_numbering[mat_graph->cptr[i]]);CHKERRQ(ierr);
5459a929c220SStefano Zampini     ierr = PetscSortIntWithArray(k,&queue_in_global_numbering[mat_graph->cptr[i]],&mat_graph->queue[mat_graph->cptr[i]]);CHKERRQ(ierr);
5460a929c220SStefano Zampini   }
5461a929c220SStefano Zampini 
54620c7d97c5SJed Brown   PetscInt nfc=0;
54630c7d97c5SJed Brown   PetscInt nec=0;
54640c7d97c5SJed Brown   PetscInt nvc=0;
54653b03a366Sstefano_zampini   PetscBool twodim_flag=PETSC_FALSE;
54660c7d97c5SJed Brown   for (i=0; i<mat_graph->ncmps; i++) {
54673b03a366Sstefano_zampini     if ( mat_graph->cptr[i+1]-mat_graph->cptr[i] > vertex_size ){
5468534831adSStefano Zampini       if (mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]==1){ /* 1 neigh Neumann fake included */
54690c7d97c5SJed Brown         nfc++;
54703b03a366Sstefano_zampini       } else { /* note that nec will be zero in 2d */
54713b03a366Sstefano_zampini         nec++;
54723b03a366Sstefano_zampini       }
54730c7d97c5SJed Brown     } else {
54743b03a366Sstefano_zampini       nvc+=mat_graph->cptr[i+1]-mat_graph->cptr[i];
54753b03a366Sstefano_zampini     }
54763b03a366Sstefano_zampini   }
54773b03a366Sstefano_zampini   if (!nec) { /* we are in a 2d case -> no faces, only edges */
54783b03a366Sstefano_zampini     nec = nfc;
54793b03a366Sstefano_zampini     nfc = 0;
54803b03a366Sstefano_zampini     twodim_flag = PETSC_TRUE;
54813b03a366Sstefano_zampini   }
54823972b0daSStefano Zampini   /* allocate IS arrays for faces, edges. Vertices need a single index set. */
54833972b0daSStefano Zampini   k=0;
54843972b0daSStefano Zampini   for (i=0; i<mat_graph->ncmps; i++) {
54853972b0daSStefano Zampini     j=mat_graph->cptr[i+1]-mat_graph->cptr[i];
54863972b0daSStefano Zampini     if ( j > k) {
54873972b0daSStefano Zampini       k=j;
54883972b0daSStefano Zampini     }
5489ba1573a8SStefano Zampini     if (j<=vertex_size) {
5490ba1573a8SStefano Zampini       k+=vertex_size;
5491ba1573a8SStefano Zampini     }
54923972b0daSStefano Zampini   }
54933972b0daSStefano Zampini   ierr = PetscMalloc(k*sizeof(PetscInt),&auxis);CHKERRQ(ierr);
54943b03a366Sstefano_zampini   if (!pcbddc->vertices_flag && !pcbddc->edges_flag) {
54953b03a366Sstefano_zampini     ierr = PetscMalloc(nfc*sizeof(IS),&pcbddc->ISForFaces);CHKERRQ(ierr);
54963b03a366Sstefano_zampini     use_faces=PETSC_TRUE;
54973b03a366Sstefano_zampini   }
54983b03a366Sstefano_zampini   if (!pcbddc->vertices_flag && !pcbddc->faces_flag) {
54993b03a366Sstefano_zampini     ierr = PetscMalloc(nec*sizeof(IS),&pcbddc->ISForEdges);CHKERRQ(ierr);
55003b03a366Sstefano_zampini     use_edges=PETSC_TRUE;
55013b03a366Sstefano_zampini   }
55023b03a366Sstefano_zampini   nfc=0;
55033b03a366Sstefano_zampini   nec=0;
55043b03a366Sstefano_zampini   for (i=0; i<mat_graph->ncmps; i++) {
55053b03a366Sstefano_zampini     if ( mat_graph->cptr[i+1]-mat_graph->cptr[i] > vertex_size ){
55063b03a366Sstefano_zampini       for (j=0;j<mat_graph->cptr[i+1]-mat_graph->cptr[i];j++) {
55073972b0daSStefano Zampini         auxis[j]=mat_graph->queue[mat_graph->cptr[i]+j];
55083b03a366Sstefano_zampini       }
55093b03a366Sstefano_zampini       if (mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]==1){
55103b03a366Sstefano_zampini         if (twodim_flag) {
55113b03a366Sstefano_zampini           if (use_edges) {
55123972b0daSStefano Zampini             ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForEdges[nec]);CHKERRQ(ierr);
55133b03a366Sstefano_zampini             nec++;
55143b03a366Sstefano_zampini           }
55153b03a366Sstefano_zampini         } else {
55163b03a366Sstefano_zampini           if (use_faces) {
55173972b0daSStefano Zampini             ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForFaces[nfc]);CHKERRQ(ierr);
55183b03a366Sstefano_zampini             nfc++;
55193b03a366Sstefano_zampini           }
55203b03a366Sstefano_zampini         }
55213b03a366Sstefano_zampini       } else {
55223b03a366Sstefano_zampini         if (use_edges) {
55233972b0daSStefano Zampini           ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForEdges[nec]);CHKERRQ(ierr);
55240c7d97c5SJed Brown           nec++;
55250c7d97c5SJed Brown         }
55260c7d97c5SJed Brown       }
55270c7d97c5SJed Brown     }
55283b03a366Sstefano_zampini   }
55293b03a366Sstefano_zampini   pcbddc->n_ISForFaces=nfc;
55303b03a366Sstefano_zampini   pcbddc->n_ISForEdges=nec;
55313b03a366Sstefano_zampini   nvc=0;
55320c7d97c5SJed Brown   if ( !pcbddc->constraints_flag ) {
55333b03a366Sstefano_zampini     for (i=0; i<mat_graph->ncmps; i++) {
55343b03a366Sstefano_zampini       if ( mat_graph->cptr[i+1]-mat_graph->cptr[i] <= vertex_size ){
55353b03a366Sstefano_zampini         for ( j=mat_graph->cptr[i];j<mat_graph->cptr[i+1];j++) {
55363972b0daSStefano Zampini           auxis[nvc]=mat_graph->queue[j];
55370c7d97c5SJed Brown           nvc++;
55380c7d97c5SJed Brown         }
55390c7d97c5SJed Brown       }
55400c7d97c5SJed Brown     }
55410c7d97c5SJed Brown   }
5542a0ba757dSStefano Zampini   /* sort vertex set (by local ordering) */
55433972b0daSStefano Zampini   ierr = PetscSortInt(nvc,auxis);CHKERRQ(ierr);
55443972b0daSStefano Zampini   ierr = ISCreateGeneral(PETSC_COMM_SELF,nvc,auxis,PETSC_COPY_VALUES,&pcbddc->ISForVertices);CHKERRQ(ierr);
5545e269702eSStefano Zampini   if (pcbddc->dbg_flag) {
5546d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr);
5547d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Details from PCBDDCManageLocalBoundaries for subdomain %04d\n",PetscGlobalRank);CHKERRQ(ierr);
5548d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Matrix graph has %d connected components", mat_graph->ncmps);CHKERRQ(ierr);
55490c7d97c5SJed Brown     for (i=0;i<mat_graph->ncmps;i++) {
55503b03a366Sstefano_zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\nDetails for connected component number %02d: size %04d, count %01d. Nodes follow.\n",
55513b03a366Sstefano_zampini              i,mat_graph->cptr[i+1]-mat_graph->cptr[i],mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]);CHKERRQ(ierr);
5552da1bb401SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"subdomains: ");
5553da1bb401SStefano Zampini       for (j=0;j<mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]; j++) {
5554da1bb401SStefano Zampini         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d ",mat_graph->neighbours_set[mat_graph->queue[mat_graph->cptr[i]]][j]);
5555da1bb401SStefano Zampini       }
5556da1bb401SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n");
55570c7d97c5SJed Brown       for (j=mat_graph->cptr[i]; j<mat_graph->cptr[i+1]; j++){
5558a929c220SStefano Zampini         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d (%d), ",mat_graph->queue[j],queue_in_global_numbering[j]);CHKERRQ(ierr);
55590c7d97c5SJed Brown       }
55600c7d97c5SJed Brown     }
5561da1bb401SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n--------------------------------------------------------------\n");CHKERRQ(ierr);
55623b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local vertices\n",PetscGlobalRank,nvc);CHKERRQ(ierr);
55633b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local faces\n",PetscGlobalRank,nfc);CHKERRQ(ierr);
55643b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local edges\n",PetscGlobalRank,nec);CHKERRQ(ierr);
5565d49ef151SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
55660c7d97c5SJed Brown   }
55673972b0daSStefano Zampini   ierr = PetscFree(auxis);CHKERRQ(ierr);
5568a929c220SStefano Zampini   ierr = PetscFree(queue_in_global_numbering);CHKERRQ(ierr);
55690c7d97c5SJed Brown   PetscFunctionReturn(0);
55700c7d97c5SJed Brown }
55710c7d97c5SJed Brown 
55720c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
55730c7d97c5SJed Brown 
55740c7d97c5SJed Brown /* The following code has been adapted from function IsConnectedSubdomain contained
5575da1bb401SStefano Zampini    in source file contig.c of METIS library (version 5.0.1)
5576da1bb401SStefano Zampini    It finds connected components of each partition labeled from 1 to n_dist  */
55770c7d97c5SJed Brown 
55780c7d97c5SJed Brown #undef __FUNCT__
55790c7d97c5SJed Brown #define __FUNCT__ "PCBDDCFindConnectedComponents"
55809c0446d6SStefano Zampini static PetscErrorCode PCBDDCFindConnectedComponents(PCBDDCGraph graph, PetscInt n_dist )
55810c7d97c5SJed Brown {
55820c7d97c5SJed Brown   PetscInt i, j, k, nvtxs, first, last, nleft, ncmps,pid,cum_queue,n,ncmps_pid;
55830c7d97c5SJed Brown   PetscInt *xadj, *adjncy, *where, *queue;
55840c7d97c5SJed Brown   PetscInt *cptr;
55850c7d97c5SJed Brown   PetscBool *touched;
55860c7d97c5SJed Brown 
55870c7d97c5SJed Brown   PetscFunctionBegin;
55880c7d97c5SJed Brown 
55890c7d97c5SJed Brown   nvtxs   = graph->nvtxs;
55900c7d97c5SJed Brown   xadj    = graph->xadj;
55910c7d97c5SJed Brown   adjncy  = graph->adjncy;
55920c7d97c5SJed Brown   where   = graph->where;
55930c7d97c5SJed Brown   touched = graph->touched;
55940c7d97c5SJed Brown   queue   = graph->queue;
55950c7d97c5SJed Brown   cptr    = graph->cptr;
55960c7d97c5SJed Brown 
55972e8d2280SStefano Zampini   for (i=0; i<nvtxs; i++) {
55980c7d97c5SJed Brown     touched[i] = PETSC_FALSE;
55992e8d2280SStefano Zampini   }
56000c7d97c5SJed Brown 
56010c7d97c5SJed Brown   cum_queue=0;
56020c7d97c5SJed Brown   ncmps=0;
56030c7d97c5SJed Brown 
56040c7d97c5SJed Brown   for (n=0; n<n_dist; n++) {
5605da1bb401SStefano Zampini     pid = n+1;  /* partition labeled by 0 is discarded */
56060c7d97c5SJed Brown     nleft = 0;
56070c7d97c5SJed Brown     for (i=0; i<nvtxs; i++) {
56080c7d97c5SJed Brown       if (where[i] == pid)
56090c7d97c5SJed Brown         nleft++;
56100c7d97c5SJed Brown     }
56110c7d97c5SJed Brown     for (i=0; i<nvtxs; i++) {
56120c7d97c5SJed Brown       if (where[i] == pid)
56130c7d97c5SJed Brown         break;
56140c7d97c5SJed Brown     }
56150c7d97c5SJed Brown     touched[i] = PETSC_TRUE;
56160c7d97c5SJed Brown     queue[cum_queue] = i;
56170c7d97c5SJed Brown     first = 0; last = 1;
56180c7d97c5SJed Brown     cptr[ncmps] = cum_queue;  /* This actually points to queue */
56190c7d97c5SJed Brown     ncmps_pid = 0;
56200c7d97c5SJed Brown     while (first != nleft) {
56210c7d97c5SJed Brown       if (first == last) { /* Find another starting vertex */
56220c7d97c5SJed Brown         cptr[++ncmps] = first+cum_queue;
56230c7d97c5SJed Brown         ncmps_pid++;
56240c7d97c5SJed Brown         for (i=0; i<nvtxs; i++) {
56250c7d97c5SJed Brown           if (where[i] == pid && !touched[i])
56260c7d97c5SJed Brown             break;
56270c7d97c5SJed Brown         }
56280c7d97c5SJed Brown         queue[cum_queue+last] = i;
56290c7d97c5SJed Brown         last++;
56300c7d97c5SJed Brown         touched[i] = PETSC_TRUE;
56310c7d97c5SJed Brown       }
56320c7d97c5SJed Brown       i = queue[cum_queue+first];
56330c7d97c5SJed Brown       first++;
56340c7d97c5SJed Brown       for (j=xadj[i]; j<xadj[i+1]; j++) {
56350c7d97c5SJed Brown         k = adjncy[j];
56360c7d97c5SJed Brown         if (where[k] == pid && !touched[k]) {
56370c7d97c5SJed Brown           queue[cum_queue+last] = k;
56380c7d97c5SJed Brown           last++;
56390c7d97c5SJed Brown           touched[k] = PETSC_TRUE;
56400c7d97c5SJed Brown         }
56410c7d97c5SJed Brown       }
56420c7d97c5SJed Brown     }
56430c7d97c5SJed Brown     cptr[++ncmps] = first+cum_queue;
56440c7d97c5SJed Brown     ncmps_pid++;
56450c7d97c5SJed Brown     cum_queue=cptr[ncmps];
5646a0ba757dSStefano Zampini     graph->where_ncmps[n] = ncmps_pid;
56470c7d97c5SJed Brown   }
56480c7d97c5SJed Brown   graph->ncmps = ncmps;
56490c7d97c5SJed Brown 
56500c7d97c5SJed Brown   PetscFunctionReturn(0);
56510c7d97c5SJed Brown }
5652