xref: /petsc/src/ksp/pc/impls/bddc/bddc.c (revision 2fa5cd679192b9b390e47ae2d0650965e6b1d9fa)
153cdbc3dSStefano Zampini /* TODOLIST
2da1bb401SStefano Zampini    DofSplitting and DM attached to pc?
3da1bb401SStefano Zampini    Change SetNeumannBoundaries to SetNeumannBoundariesLocal and provide new SetNeumannBoundaries (same Dirichlet)
4a0ba757dSStefano Zampini    change how to deal with the coarse problem (PCBDDCSetCoarseEnvironment):
5a0ba757dSStefano Zampini      - simplify coarse problem structure -> PCBDDC or PCREDUNDANT, nothing else -> same comm for all levels?
6a0ba757dSStefano Zampini      - remove coarse enums and allow use of PCBDDCGetCoarseKSP
7a0ba757dSStefano Zampini      - remove metis dependency -> use MatPartitioning for multilevel -> Assemble serial adjacency in ManageLocalBoundaries?
8a0ba757dSStefano Zampini    code refactoring:
9a0ba757dSStefano Zampini      - pick up better names for static functions
10a0ba757dSStefano Zampini    change options structure:
11a0ba757dSStefano Zampini      - insert BDDC into MG framework?
12a0ba757dSStefano Zampini    provide other ops? Ask to developers
13a0ba757dSStefano Zampini    remove all unused printf
14a0ba757dSStefano Zampini    man pages
1553cdbc3dSStefano Zampini */
160c7d97c5SJed Brown 
1753cdbc3dSStefano Zampini /* ----------------------------------------------------------------------------------------------------------------------------------------------
180c7d97c5SJed Brown    Implementation of BDDC preconditioner based on:
190c7d97c5SJed Brown    C. Dohrmann "An approximate BDDC preconditioner", Numerical Linear Algebra with Applications Volume 14, Issue 2, pages 149-168, March 2007
2053cdbc3dSStefano Zampini    ---------------------------------------------------------------------------------------------------------------------------------------------- */
2153cdbc3dSStefano Zampini 
2207475bc1SBarry Smith #include "bddc.h" /*I "petscpc.h" I*/
233b03a366Sstefano_zampini #include <petscblaslapack.h>
240c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
250c7d97c5SJed Brown #undef __FUNCT__
260c7d97c5SJed Brown #define __FUNCT__ "PCSetFromOptions_BDDC"
270c7d97c5SJed Brown PetscErrorCode PCSetFromOptions_BDDC(PC pc)
280c7d97c5SJed Brown {
290c7d97c5SJed Brown   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
300c7d97c5SJed Brown   PetscErrorCode ierr;
310c7d97c5SJed Brown 
320c7d97c5SJed Brown   PetscFunctionBegin;
330c7d97c5SJed Brown   ierr = PetscOptionsHead("BDDC options");CHKERRQ(ierr);
340c7d97c5SJed Brown   /* Verbose debugging of main data structures */
35e269702eSStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_check_all"       ,"Verbose (debugging) output for PCBDDC"                       ,"none",pcbddc->dbg_flag      ,&pcbddc->dbg_flag      ,PETSC_NULL);CHKERRQ(ierr);
360c7d97c5SJed Brown   /* Some customization for default primal space */
37da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_vertices_only"   ,"Use only vertices in coarse space (i.e. discard constraints)","none",pcbddc->vertices_flag   ,&pcbddc->vertices_flag   ,PETSC_NULL);CHKERRQ(ierr);
38da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_constraints_only","Use only constraints in coarse space (i.e. discard vertices)","none",pcbddc->constraints_flag,&pcbddc->constraints_flag,PETSC_NULL);CHKERRQ(ierr);
39da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_faces_only"      ,"Use only faces among constraints of coarse space (i.e. discard edges)"         ,"none",pcbddc->faces_flag      ,&pcbddc->faces_flag      ,PETSC_NULL);CHKERRQ(ierr);
40da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_edges_only"      ,"Use only edges among constraints of coarse space (i.e. discard faces)"         ,"none",pcbddc->edges_flag      ,&pcbddc->edges_flag      ,PETSC_NULL);CHKERRQ(ierr);
41*2fa5cd67SKarl Rupp 
420c7d97c5SJed Brown   /* Coarse solver context */
436c667b0aSStefano Zampini   static const char * const avail_coarse_problems[] = {"sequential","replicated","parallel","multilevel","CoarseProblemType","PC_BDDC_",0}; /* order of choiches depends on ENUM defined in bddc.h */
440c7d97c5SJed Brown   ierr = PetscOptionsEnum("-pc_bddc_coarse_problem_type","Set coarse problem type","none",avail_coarse_problems,(PetscEnum)pcbddc->coarse_problem_type,(PetscEnum*)&pcbddc->coarse_problem_type,PETSC_NULL);CHKERRQ(ierr);
45*2fa5cd67SKarl Rupp 
460c7d97c5SJed Brown   /* Two different application of BDDC to the whole set of dofs, internal and interface */
4729622bf0SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_switch_preconditioning_type","Switch between M_2 (default) and M_3 preconditioners (as defined by Dohrmann)","none",pcbddc->inexact_prec_type,&pcbddc->inexact_prec_type,PETSC_NULL);CHKERRQ(ierr);
48534831adSStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_use_change_of_basis","Use change of basis approach for primal space","none",pcbddc->usechangeofbasis,&pcbddc->usechangeofbasis,PETSC_NULL);CHKERRQ(ierr);
49534831adSStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_use_change_on_faces","Use change of basis approach for face constraints","none",pcbddc->usechangeonfaces,&pcbddc->usechangeonfaces,PETSC_NULL);CHKERRQ(ierr);
50*2fa5cd67SKarl Rupp 
51534831adSStefano Zampini   pcbddc->usechangeonfaces = pcbddc->usechangeonfaces && pcbddc->usechangeofbasis;
52*2fa5cd67SKarl Rupp 
530c7d97c5SJed Brown   ierr = PetscOptionsInt("-pc_bddc_coarsening_ratio","Set coarsening ratio used in multilevel coarsening","none",pcbddc->coarsening_ratio,&pcbddc->coarsening_ratio,PETSC_NULL);CHKERRQ(ierr);
544fad6a16SStefano Zampini   ierr = PetscOptionsInt("-pc_bddc_max_levels","Set maximum number of levels for multilevel","none",pcbddc->max_levels,&pcbddc->max_levels,PETSC_NULL);CHKERRQ(ierr);
550c7d97c5SJed Brown   ierr = PetscOptionsTail();CHKERRQ(ierr);
560c7d97c5SJed Brown   PetscFunctionReturn(0);
570c7d97c5SJed Brown }
580c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
590c7d97c5SJed Brown EXTERN_C_BEGIN
600c7d97c5SJed Brown #undef __FUNCT__
610c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetCoarseProblemType_BDDC"
6253cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetCoarseProblemType_BDDC(PC pc, CoarseProblemType CPT)
630c7d97c5SJed Brown {
640c7d97c5SJed Brown   PC_BDDC *pcbddc = (PC_BDDC*)pc->data;
650c7d97c5SJed Brown 
660c7d97c5SJed Brown   PetscFunctionBegin;
670c7d97c5SJed Brown   pcbddc->coarse_problem_type = CPT;
680c7d97c5SJed Brown   PetscFunctionReturn(0);
690c7d97c5SJed Brown }
700c7d97c5SJed Brown EXTERN_C_END
710c7d97c5SJed Brown #undef __FUNCT__
720c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetCoarseProblemType"
7353cdbc3dSStefano Zampini /*@
749c0446d6SStefano Zampini  PCBDDCSetCoarseProblemType - Set coarse problem type in PCBDDC.
7553cdbc3dSStefano Zampini 
769c0446d6SStefano Zampini    Not collective
7753cdbc3dSStefano Zampini 
7853cdbc3dSStefano Zampini    Input Parameters:
7953cdbc3dSStefano Zampini +  pc - the preconditioning context
8053cdbc3dSStefano Zampini -  CoarseProblemType - pick a better name and explain what this is
8153cdbc3dSStefano Zampini 
8253cdbc3dSStefano Zampini    Level: intermediate
8353cdbc3dSStefano Zampini 
8453cdbc3dSStefano Zampini    Notes:
85da1bb401SStefano Zampini    Not collective but all procs must call with same arguments.
8653cdbc3dSStefano Zampini 
8753cdbc3dSStefano Zampini .seealso: PCBDDC
8853cdbc3dSStefano Zampini @*/
890c7d97c5SJed Brown PetscErrorCode PCBDDCSetCoarseProblemType(PC pc, CoarseProblemType CPT)
900c7d97c5SJed Brown {
910c7d97c5SJed Brown   PetscErrorCode ierr;
920c7d97c5SJed Brown 
930c7d97c5SJed Brown   PetscFunctionBegin;
940c7d97c5SJed Brown   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
950c7d97c5SJed Brown   ierr = PetscTryMethod(pc,"PCBDDCSetCoarseProblemType_C",(PC,CoarseProblemType),(pc,CPT));CHKERRQ(ierr);
960c7d97c5SJed Brown   PetscFunctionReturn(0);
970c7d97c5SJed Brown }
980c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
990c7d97c5SJed Brown EXTERN_C_BEGIN
1000c7d97c5SJed Brown #undef __FUNCT__
1014fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetCoarseningRatio_BDDC"
1024fad6a16SStefano Zampini static PetscErrorCode PCBDDCSetCoarseningRatio_BDDC(PC pc,PetscInt k)
1034fad6a16SStefano Zampini {
1044fad6a16SStefano Zampini   PC_BDDC *pcbddc = (PC_BDDC*)pc->data;
1054fad6a16SStefano Zampini 
1064fad6a16SStefano Zampini   PetscFunctionBegin;
1074fad6a16SStefano Zampini   pcbddc->coarsening_ratio=k;
1084fad6a16SStefano Zampini   PetscFunctionReturn(0);
1094fad6a16SStefano Zampini }
1104fad6a16SStefano Zampini EXTERN_C_END
1114fad6a16SStefano Zampini #undef __FUNCT__
1124fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetCoarseningRatio"
1134fad6a16SStefano Zampini /*@
1144fad6a16SStefano Zampini  PCBDDCSetCoarseningRatio - Set coarsening ratio used in multilevel coarsening
1154fad6a16SStefano Zampini 
1164fad6a16SStefano Zampini    Logically collective on PC
1174fad6a16SStefano Zampini 
1184fad6a16SStefano Zampini    Input Parameters:
1194fad6a16SStefano Zampini +  pc - the preconditioning context
1204fad6a16SStefano Zampini -  k - coarsening ratio
1214fad6a16SStefano Zampini 
1224fad6a16SStefano Zampini    Approximatively k subdomains at the finer level will be aggregated into a single subdomain at the coarser level.
1234fad6a16SStefano Zampini 
1244fad6a16SStefano Zampini    Level: intermediate
1254fad6a16SStefano Zampini 
1264fad6a16SStefano Zampini    Notes:
1274fad6a16SStefano Zampini 
1284fad6a16SStefano Zampini .seealso: PCBDDC
1294fad6a16SStefano Zampini @*/
1304fad6a16SStefano Zampini PetscErrorCode PCBDDCSetCoarseningRatio(PC pc,PetscInt k)
1314fad6a16SStefano Zampini {
1324fad6a16SStefano Zampini   PetscErrorCode ierr;
1334fad6a16SStefano Zampini 
1344fad6a16SStefano Zampini   PetscFunctionBegin;
1354fad6a16SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
1364fad6a16SStefano Zampini   ierr = PetscTryMethod(pc,"PCBDDCSetCoarseningRatio_C",(PC,PetscInt),(pc,k));CHKERRQ(ierr);
1374fad6a16SStefano Zampini   PetscFunctionReturn(0);
1384fad6a16SStefano Zampini }
1394fad6a16SStefano Zampini /* -------------------------------------------------------------------------- */
1404fad6a16SStefano Zampini EXTERN_C_BEGIN
1414fad6a16SStefano Zampini #undef __FUNCT__
1424fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetMaxLevels_BDDC"
1434fad6a16SStefano Zampini static PetscErrorCode PCBDDCSetMaxLevels_BDDC(PC pc,PetscInt max_levels)
1444fad6a16SStefano Zampini {
1454fad6a16SStefano Zampini   PC_BDDC *pcbddc = (PC_BDDC*)pc->data;
1464fad6a16SStefano Zampini 
1474fad6a16SStefano Zampini   PetscFunctionBegin;
1484fad6a16SStefano Zampini   pcbddc->max_levels=max_levels;
1494fad6a16SStefano Zampini   PetscFunctionReturn(0);
1504fad6a16SStefano Zampini }
1514fad6a16SStefano Zampini EXTERN_C_END
1524fad6a16SStefano Zampini #undef __FUNCT__
1534fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetMaxLevels"
1544fad6a16SStefano Zampini /*@
1554fad6a16SStefano Zampini  PCBDDCSetMaxLevels - Sets the maximum number of levels within the multilevel approach.
1564fad6a16SStefano Zampini 
1574fad6a16SStefano Zampini    Logically collective on PC
1584fad6a16SStefano Zampini 
1594fad6a16SStefano Zampini    Input Parameters:
1604fad6a16SStefano Zampini +  pc - the preconditioning context
1614fad6a16SStefano Zampini -  max_levels - the maximum number of levels
1624fad6a16SStefano Zampini 
1634fad6a16SStefano Zampini    Default value is 1, i.e. coarse problem will be solved inexactly with one application
1644fad6a16SStefano Zampini    of PCBDDC preconditioner if the multilevel approach is requested.
1654fad6a16SStefano Zampini 
1664fad6a16SStefano Zampini    Level: intermediate
1674fad6a16SStefano Zampini 
1684fad6a16SStefano Zampini    Notes:
1694fad6a16SStefano Zampini 
1704fad6a16SStefano Zampini .seealso: PCBDDC
1714fad6a16SStefano Zampini @*/
1724fad6a16SStefano Zampini PetscErrorCode PCBDDCSetMaxLevels(PC pc,PetscInt max_levels)
1734fad6a16SStefano Zampini {
1744fad6a16SStefano Zampini   PetscErrorCode ierr;
1754fad6a16SStefano Zampini 
1764fad6a16SStefano Zampini   PetscFunctionBegin;
1774fad6a16SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
1784fad6a16SStefano Zampini   ierr = PetscTryMethod(pc,"PCBDDCSetMaxLevels_C",(PC,PetscInt),(pc,max_levels));CHKERRQ(ierr);
1794fad6a16SStefano Zampini   PetscFunctionReturn(0);
1804fad6a16SStefano Zampini }
1814fad6a16SStefano Zampini /* -------------------------------------------------------------------------- */
1824fad6a16SStefano Zampini EXTERN_C_BEGIN
1834fad6a16SStefano Zampini #undef __FUNCT__
1840bdf917eSStefano Zampini #define __FUNCT__ "PCBDDCSetNullSpace_BDDC"
1850bdf917eSStefano Zampini static PetscErrorCode PCBDDCSetNullSpace_BDDC(PC pc,MatNullSpace NullSpace)
1860bdf917eSStefano Zampini {
1870bdf917eSStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
1880bdf917eSStefano Zampini   PetscErrorCode ierr;
1890bdf917eSStefano Zampini 
1900bdf917eSStefano Zampini   PetscFunctionBegin;
1910bdf917eSStefano Zampini   ierr = PetscObjectReference((PetscObject)NullSpace);CHKERRQ(ierr);
1920bdf917eSStefano Zampini   ierr = MatNullSpaceDestroy(&pcbddc->NullSpace);CHKERRQ(ierr);
193*2fa5cd67SKarl Rupp 
1940bdf917eSStefano Zampini   pcbddc->NullSpace = NullSpace;
1950bdf917eSStefano Zampini   PetscFunctionReturn(0);
1960bdf917eSStefano Zampini }
1970bdf917eSStefano Zampini EXTERN_C_END
1980bdf917eSStefano Zampini #undef __FUNCT__
1990bdf917eSStefano Zampini #define __FUNCT__ "PCBDDCSetNullSpace"
2000bdf917eSStefano Zampini /*@
2010bdf917eSStefano Zampini  PCBDDCSetNullSpace - Set NullSpace of global operator of BDDC preconditioned mat.
2020bdf917eSStefano Zampini 
2030bdf917eSStefano Zampini    Logically collective on PC and MatNullSpace
2040bdf917eSStefano Zampini 
2050bdf917eSStefano Zampini    Input Parameters:
2060bdf917eSStefano Zampini +  pc - the preconditioning context
2070bdf917eSStefano Zampini -  NullSpace - Null space of the linear operator to be preconditioned.
2080bdf917eSStefano Zampini 
2090bdf917eSStefano Zampini    Level: intermediate
2100bdf917eSStefano Zampini 
2110bdf917eSStefano Zampini    Notes:
2120bdf917eSStefano Zampini 
2130bdf917eSStefano Zampini .seealso: PCBDDC
2140bdf917eSStefano Zampini @*/
2150bdf917eSStefano Zampini PetscErrorCode PCBDDCSetNullSpace(PC pc,MatNullSpace NullSpace)
2160bdf917eSStefano Zampini {
2170bdf917eSStefano Zampini   PetscErrorCode ierr;
2180bdf917eSStefano Zampini 
2190bdf917eSStefano Zampini   PetscFunctionBegin;
2200bdf917eSStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
2210bdf917eSStefano Zampini   ierr = PetscTryMethod(pc,"PCBDDCSetNullSpace_C",(PC,MatNullSpace),(pc,NullSpace));CHKERRQ(ierr);
2220bdf917eSStefano Zampini   PetscFunctionReturn(0);
2230bdf917eSStefano Zampini }
2240bdf917eSStefano Zampini /* -------------------------------------------------------------------------- */
2250bdf917eSStefano Zampini EXTERN_C_BEGIN
2260bdf917eSStefano Zampini #undef __FUNCT__
2273b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCSetDirichletBoundaries_BDDC"
2283b03a366Sstefano_zampini static PetscErrorCode PCBDDCSetDirichletBoundaries_BDDC(PC pc,IS DirichletBoundaries)
2293b03a366Sstefano_zampini {
2303b03a366Sstefano_zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
2313b03a366Sstefano_zampini   PetscErrorCode ierr;
2323b03a366Sstefano_zampini 
2333b03a366Sstefano_zampini   PetscFunctionBegin;
2343b03a366Sstefano_zampini   ierr = ISDestroy(&pcbddc->DirichletBoundaries);CHKERRQ(ierr);
23536e030ebSStefano Zampini   ierr = PetscObjectReference((PetscObject)DirichletBoundaries);CHKERRQ(ierr);
236*2fa5cd67SKarl Rupp 
23736e030ebSStefano Zampini   pcbddc->DirichletBoundaries = DirichletBoundaries;
2383b03a366Sstefano_zampini   PetscFunctionReturn(0);
2393b03a366Sstefano_zampini }
2403b03a366Sstefano_zampini EXTERN_C_END
2413b03a366Sstefano_zampini #undef __FUNCT__
2423b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCSetDirichletBoundaries"
2433b03a366Sstefano_zampini /*@
244da1bb401SStefano Zampini  PCBDDCSetDirichletBoundaries - Set index set defining subdomain part (in local ordering)
245da1bb401SStefano Zampini                               of Dirichlet boundaries for the global problem.
2463b03a366Sstefano_zampini 
2473b03a366Sstefano_zampini    Not collective
2483b03a366Sstefano_zampini 
2493b03a366Sstefano_zampini    Input Parameters:
2503b03a366Sstefano_zampini +  pc - the preconditioning context
2513b03a366Sstefano_zampini -  DirichletBoundaries - sequential index set defining the subdomain part of Dirichlet boundaries (can be PETSC_NULL)
2523b03a366Sstefano_zampini 
2533b03a366Sstefano_zampini    Level: intermediate
2543b03a366Sstefano_zampini 
2553b03a366Sstefano_zampini    Notes:
2563b03a366Sstefano_zampini 
2573b03a366Sstefano_zampini .seealso: PCBDDC
2583b03a366Sstefano_zampini @*/
2593b03a366Sstefano_zampini PetscErrorCode PCBDDCSetDirichletBoundaries(PC pc,IS DirichletBoundaries)
2603b03a366Sstefano_zampini {
2613b03a366Sstefano_zampini   PetscErrorCode ierr;
2623b03a366Sstefano_zampini 
2633b03a366Sstefano_zampini   PetscFunctionBegin;
2643b03a366Sstefano_zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
2653b03a366Sstefano_zampini   ierr = PetscTryMethod(pc,"PCBDDCSetDirichletBoundaries_C",(PC,IS),(pc,DirichletBoundaries));CHKERRQ(ierr);
2663b03a366Sstefano_zampini   PetscFunctionReturn(0);
2673b03a366Sstefano_zampini }
2683b03a366Sstefano_zampini /* -------------------------------------------------------------------------- */
2693b03a366Sstefano_zampini EXTERN_C_BEGIN
2703b03a366Sstefano_zampini #undef __FUNCT__
2710c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetNeumannBoundaries_BDDC"
27253cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetNeumannBoundaries_BDDC(PC pc,IS NeumannBoundaries)
2730c7d97c5SJed Brown {
2740c7d97c5SJed Brown   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
27553cdbc3dSStefano Zampini   PetscErrorCode ierr;
2760c7d97c5SJed Brown 
2770c7d97c5SJed Brown   PetscFunctionBegin;
27853cdbc3dSStefano Zampini   ierr = ISDestroy(&pcbddc->NeumannBoundaries);CHKERRQ(ierr);
27936e030ebSStefano Zampini   ierr = PetscObjectReference((PetscObject)NeumannBoundaries);CHKERRQ(ierr);
280*2fa5cd67SKarl Rupp 
28136e030ebSStefano Zampini   pcbddc->NeumannBoundaries = NeumannBoundaries;
2820c7d97c5SJed Brown   PetscFunctionReturn(0);
2830c7d97c5SJed Brown }
2840c7d97c5SJed Brown EXTERN_C_END
2850c7d97c5SJed Brown #undef __FUNCT__
2860c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetNeumannBoundaries"
28757527edcSJed Brown /*@
288da1bb401SStefano Zampini  PCBDDCSetNeumannBoundaries - Set index set defining subdomain part (in local ordering)
289da1bb401SStefano Zampini                               of Neumann boundaries for the global problem.
29057527edcSJed Brown 
2919c0446d6SStefano Zampini    Not collective
29257527edcSJed Brown 
29357527edcSJed Brown    Input Parameters:
29457527edcSJed Brown +  pc - the preconditioning context
2959c0446d6SStefano Zampini -  NeumannBoundaries - sequential index set defining the subdomain part of Neumann boundaries (can be PETSC_NULL)
29657527edcSJed Brown 
29757527edcSJed Brown    Level: intermediate
29857527edcSJed Brown 
29957527edcSJed Brown    Notes:
30057527edcSJed Brown 
30157527edcSJed Brown .seealso: PCBDDC
30257527edcSJed Brown @*/
30353cdbc3dSStefano Zampini PetscErrorCode PCBDDCSetNeumannBoundaries(PC pc,IS NeumannBoundaries)
3040c7d97c5SJed Brown {
3050c7d97c5SJed Brown   PetscErrorCode ierr;
3060c7d97c5SJed Brown 
3070c7d97c5SJed Brown   PetscFunctionBegin;
3080c7d97c5SJed Brown   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
30953cdbc3dSStefano Zampini   ierr = PetscTryMethod(pc,"PCBDDCSetNeumannBoundaries_C",(PC,IS),(pc,NeumannBoundaries));CHKERRQ(ierr);
31053cdbc3dSStefano Zampini   PetscFunctionReturn(0);
31153cdbc3dSStefano Zampini }
31253cdbc3dSStefano Zampini /* -------------------------------------------------------------------------- */
31353cdbc3dSStefano Zampini EXTERN_C_BEGIN
31453cdbc3dSStefano Zampini #undef __FUNCT__
315da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCGetDirichletBoundaries_BDDC"
316da1bb401SStefano Zampini static PetscErrorCode PCBDDCGetDirichletBoundaries_BDDC(PC pc,IS *DirichletBoundaries)
317da1bb401SStefano Zampini {
318da1bb401SStefano Zampini   PC_BDDC *pcbddc = (PC_BDDC*)pc->data;
319da1bb401SStefano Zampini 
320da1bb401SStefano Zampini   PetscFunctionBegin;
321da1bb401SStefano Zampini   *DirichletBoundaries = pcbddc->DirichletBoundaries;
322da1bb401SStefano Zampini   PetscFunctionReturn(0);
323da1bb401SStefano Zampini }
324da1bb401SStefano Zampini EXTERN_C_END
325da1bb401SStefano Zampini #undef __FUNCT__
326da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCGetDirichletBoundaries"
327da1bb401SStefano Zampini /*@
328da1bb401SStefano Zampini  PCBDDCGetDirichletBoundaries - Get index set defining subdomain part (in local ordering)
329da1bb401SStefano Zampini                                 of Dirichlet boundaries for the global problem.
330da1bb401SStefano Zampini 
331da1bb401SStefano Zampini    Not collective
332da1bb401SStefano Zampini 
333da1bb401SStefano Zampini    Input Parameters:
334da1bb401SStefano Zampini +  pc - the preconditioning context
335da1bb401SStefano Zampini 
336da1bb401SStefano Zampini    Output Parameters:
337da1bb401SStefano Zampini +  DirichletBoundaries - index set defining the subdomain part of Dirichlet boundaries
338da1bb401SStefano Zampini 
339da1bb401SStefano Zampini    Level: intermediate
340da1bb401SStefano Zampini 
341da1bb401SStefano Zampini    Notes:
342da1bb401SStefano Zampini 
343da1bb401SStefano Zampini .seealso: PCBDDC
344da1bb401SStefano Zampini @*/
345da1bb401SStefano Zampini PetscErrorCode PCBDDCGetDirichletBoundaries(PC pc,IS *DirichletBoundaries)
346da1bb401SStefano Zampini {
347da1bb401SStefano Zampini   PetscErrorCode ierr;
348da1bb401SStefano Zampini 
349da1bb401SStefano Zampini   PetscFunctionBegin;
350da1bb401SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
351da1bb401SStefano Zampini   ierr = PetscUseMethod(pc,"PCBDDCGetDirichletBoundaries_C",(PC,IS*),(pc,DirichletBoundaries));CHKERRQ(ierr);
352da1bb401SStefano Zampini   PetscFunctionReturn(0);
353da1bb401SStefano Zampini }
354da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
355da1bb401SStefano Zampini EXTERN_C_BEGIN
356da1bb401SStefano Zampini #undef __FUNCT__
35753cdbc3dSStefano Zampini #define __FUNCT__ "PCBDDCGetNeumannBoundaries_BDDC"
35853cdbc3dSStefano Zampini static PetscErrorCode PCBDDCGetNeumannBoundaries_BDDC(PC pc,IS *NeumannBoundaries)
35953cdbc3dSStefano Zampini {
36053cdbc3dSStefano Zampini   PC_BDDC *pcbddc = (PC_BDDC*)pc->data;
36153cdbc3dSStefano Zampini 
36253cdbc3dSStefano Zampini   PetscFunctionBegin;
36353cdbc3dSStefano Zampini   *NeumannBoundaries = pcbddc->NeumannBoundaries;
36453cdbc3dSStefano Zampini   PetscFunctionReturn(0);
36553cdbc3dSStefano Zampini }
36653cdbc3dSStefano Zampini EXTERN_C_END
36753cdbc3dSStefano Zampini #undef __FUNCT__
36853cdbc3dSStefano Zampini #define __FUNCT__ "PCBDDCGetNeumannBoundaries"
36953cdbc3dSStefano Zampini /*@
370da1bb401SStefano Zampini  PCBDDCGetNeumannBoundaries - Get index set defining subdomain part (in local ordering)
371da1bb401SStefano Zampini                               of Neumann boundaries for the global problem.
37253cdbc3dSStefano Zampini 
3739c0446d6SStefano Zampini    Not collective
37453cdbc3dSStefano Zampini 
37553cdbc3dSStefano Zampini    Input Parameters:
37653cdbc3dSStefano Zampini +  pc - the preconditioning context
37753cdbc3dSStefano Zampini 
37853cdbc3dSStefano Zampini    Output Parameters:
37953cdbc3dSStefano Zampini +  NeumannBoundaries - index set defining the subdomain part of Neumann boundaries
38053cdbc3dSStefano Zampini 
38153cdbc3dSStefano Zampini    Level: intermediate
38253cdbc3dSStefano Zampini 
38353cdbc3dSStefano Zampini    Notes:
38453cdbc3dSStefano Zampini 
38553cdbc3dSStefano Zampini .seealso: PCBDDC
38653cdbc3dSStefano Zampini @*/
38753cdbc3dSStefano Zampini PetscErrorCode PCBDDCGetNeumannBoundaries(PC pc,IS *NeumannBoundaries)
38853cdbc3dSStefano Zampini {
38953cdbc3dSStefano Zampini   PetscErrorCode ierr;
39053cdbc3dSStefano Zampini 
39153cdbc3dSStefano Zampini   PetscFunctionBegin;
39253cdbc3dSStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
39353cdbc3dSStefano Zampini   ierr = PetscUseMethod(pc,"PCBDDCGetNeumannBoundaries_C",(PC,IS*),(pc,NeumannBoundaries));CHKERRQ(ierr);
3940c7d97c5SJed Brown   PetscFunctionReturn(0);
3950c7d97c5SJed Brown }
39636e030ebSStefano Zampini /* -------------------------------------------------------------------------- */
39736e030ebSStefano Zampini EXTERN_C_BEGIN
39836e030ebSStefano Zampini #undef __FUNCT__
399da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetLocalAdjacencyGraph_BDDC"
4001a83f524SJed Brown static PetscErrorCode PCBDDCSetLocalAdjacencyGraph_BDDC(PC pc, PetscInt nvtxs,const PetscInt xadj[],const PetscInt adjncy[], PetscCopyMode copymode)
40136e030ebSStefano Zampini {
40236e030ebSStefano Zampini   PC_BDDC        *pcbddc  = (PC_BDDC*)pc->data;
403da1bb401SStefano Zampini   PCBDDCGraph    mat_graph=pcbddc->mat_graph;
404da1bb401SStefano Zampini   PetscErrorCode ierr;
40536e030ebSStefano Zampini 
40636e030ebSStefano Zampini   PetscFunctionBegin;
407da1bb401SStefano Zampini   mat_graph->nvtxs=nvtxs;
408*2fa5cd67SKarl Rupp 
409da1bb401SStefano Zampini   ierr = PetscFree(mat_graph->xadj);CHKERRQ(ierr);
410da1bb401SStefano Zampini   ierr = PetscFree(mat_graph->adjncy);CHKERRQ(ierr);
411da1bb401SStefano Zampini   if (copymode == PETSC_COPY_VALUES) {
412da1bb401SStefano Zampini     ierr = PetscMalloc((mat_graph->nvtxs+1)*sizeof(PetscInt),&mat_graph->xadj);CHKERRQ(ierr);
413da1bb401SStefano Zampini     ierr = PetscMalloc(xadj[mat_graph->nvtxs]*sizeof(PetscInt),&mat_graph->adjncy);CHKERRQ(ierr);
414da1bb401SStefano Zampini     ierr = PetscMemcpy(mat_graph->xadj,xadj,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr);
415da1bb401SStefano Zampini     ierr = PetscMemcpy(mat_graph->adjncy,adjncy,xadj[mat_graph->nvtxs]*sizeof(PetscInt));CHKERRQ(ierr);
416da1bb401SStefano Zampini   } else if (copymode == PETSC_OWN_POINTER) {
4171a83f524SJed Brown     mat_graph->xadj   = (PetscInt*)xadj;
4181a83f524SJed Brown     mat_graph->adjncy = (PetscInt*)adjncy;
419acee19a7SJed Brown   } else SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"Unsupported copy mode %d\n",copymode);
42036e030ebSStefano Zampini   PetscFunctionReturn(0);
42136e030ebSStefano Zampini }
42236e030ebSStefano Zampini EXTERN_C_END
42336e030ebSStefano Zampini #undef __FUNCT__
424da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetLocalAdjacencyGraph"
42536e030ebSStefano Zampini /*@
426da1bb401SStefano Zampini  PCBDDCSetLocalAdjacencyGraph - Set CSR graph of local matrix for use of PCBDDC.
42736e030ebSStefano Zampini 
42836e030ebSStefano Zampini    Not collective
42936e030ebSStefano Zampini 
43036e030ebSStefano Zampini    Input Parameters:
43136e030ebSStefano Zampini +  pc - the preconditioning context
432da1bb401SStefano Zampini -  nvtxs - number of local vertices of the graph
433da1bb401SStefano Zampini -  xadj, adjncy - the CSR graph
434da1bb401SStefano Zampini -  copymode - either PETSC_COPY_VALUES or PETSC_OWN_POINTER. In the former case the user must free the array passed in;
435da1bb401SStefano Zampini                                                              in the latter case, memory must be obtained with PetscMalloc.
43636e030ebSStefano Zampini 
43736e030ebSStefano Zampini    Level: intermediate
43836e030ebSStefano Zampini 
43936e030ebSStefano Zampini    Notes:
44036e030ebSStefano Zampini 
44136e030ebSStefano Zampini .seealso: PCBDDC
44236e030ebSStefano Zampini @*/
4431a83f524SJed Brown PetscErrorCode PCBDDCSetLocalAdjacencyGraph(PC pc,PetscInt nvtxs,const PetscInt xadj[],const PetscInt adjncy[], PetscCopyMode copymode)
44436e030ebSStefano Zampini {
445da1bb401SStefano Zampini   PetscInt       nrows,ncols;
446da1bb401SStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
44736e030ebSStefano Zampini   PetscErrorCode ierr;
44836e030ebSStefano Zampini 
44936e030ebSStefano Zampini   PetscFunctionBegin;
45036e030ebSStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
451da1bb401SStefano Zampini   ierr = MatGetSize(matis->A,&nrows,&ncols);CHKERRQ(ierr);
452f23aa3ddSBarry Smith   if (nvtxs != nrows) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Local adjacency size %d passed in %s differs from local problem size %d!\n",nvtxs,nrows);
453f23aa3ddSBarry Smith   else {
4541a83f524SJed Brown     ierr = PetscTryMethod(pc,"PCBDDCSetLocalAdjacencyGraph_C",(PC,PetscInt,const PetscInt[],const PetscInt[],PetscCopyMode),(pc,nvtxs,xadj,adjncy,copymode));CHKERRQ(ierr);
455da1bb401SStefano Zampini   }
45636e030ebSStefano Zampini   PetscFunctionReturn(0);
45736e030ebSStefano Zampini }
4589c0446d6SStefano Zampini /* -------------------------------------------------------------------------- */
4599c0446d6SStefano Zampini EXTERN_C_BEGIN
4609c0446d6SStefano Zampini #undef __FUNCT__
4619c0446d6SStefano Zampini #define __FUNCT__ "PCBDDCSetDofsSplitting_BDDC"
4629c0446d6SStefano Zampini static PetscErrorCode PCBDDCSetDofsSplitting_BDDC(PC pc,PetscInt n_is, IS ISForDofs[])
4639c0446d6SStefano Zampini {
4649c0446d6SStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
4659c0446d6SStefano Zampini   PetscInt       i;
4669c0446d6SStefano Zampini   PetscErrorCode ierr;
4679c0446d6SStefano Zampini 
4689c0446d6SStefano Zampini   PetscFunctionBegin;
469da1bb401SStefano Zampini   /* Destroy ISes if they were already set */
4709c0446d6SStefano Zampini   for (i=0; i<pcbddc->n_ISForDofs; i++) {
4719c0446d6SStefano Zampini     ierr = ISDestroy(&pcbddc->ISForDofs[i]);CHKERRQ(ierr);
4729c0446d6SStefano Zampini   }
473d11ae9bbSstefano_zampini   ierr = PetscFree(pcbddc->ISForDofs);CHKERRQ(ierr);
474da1bb401SStefano Zampini   /* allocate space then set */
4759c0446d6SStefano Zampini   ierr = PetscMalloc(n_is*sizeof(IS),&pcbddc->ISForDofs);CHKERRQ(ierr);
4769c0446d6SStefano Zampini   for (i=0; i<n_is; i++) {
477da1bb401SStefano Zampini     ierr = PetscObjectReference((PetscObject)ISForDofs[i]);CHKERRQ(ierr);
478*2fa5cd67SKarl Rupp 
479da1bb401SStefano Zampini     pcbddc->ISForDofs[i]=ISForDofs[i];
4809c0446d6SStefano Zampini   }
4819c0446d6SStefano Zampini   pcbddc->n_ISForDofs=n_is;
4829c0446d6SStefano Zampini   PetscFunctionReturn(0);
4839c0446d6SStefano Zampini }
4849c0446d6SStefano Zampini EXTERN_C_END
4859c0446d6SStefano Zampini #undef __FUNCT__
4869c0446d6SStefano Zampini #define __FUNCT__ "PCBDDCSetDofsSplitting"
4879c0446d6SStefano Zampini /*@
488da1bb401SStefano Zampini  PCBDDCSetDofsSplitting - Set index sets defining fields of local mat.
4899c0446d6SStefano Zampini 
4909c0446d6SStefano Zampini    Not collective
4919c0446d6SStefano Zampini 
4929c0446d6SStefano Zampini    Input Parameters:
4939c0446d6SStefano Zampini +  pc - the preconditioning context
494da1bb401SStefano Zampini -  n - number of index sets defining the fields
495da1bb401SStefano Zampini -  IS[] - array of IS describing the fields
4969c0446d6SStefano Zampini 
4979c0446d6SStefano Zampini    Level: intermediate
4989c0446d6SStefano Zampini 
4999c0446d6SStefano Zampini    Notes:
5009c0446d6SStefano Zampini 
5019c0446d6SStefano Zampini .seealso: PCBDDC
5029c0446d6SStefano Zampini @*/
5039c0446d6SStefano Zampini PetscErrorCode PCBDDCSetDofsSplitting(PC pc,PetscInt n_is, IS ISForDofs[])
5049c0446d6SStefano Zampini {
5059c0446d6SStefano Zampini   PetscErrorCode ierr;
5069c0446d6SStefano Zampini 
5079c0446d6SStefano Zampini   PetscFunctionBegin;
5089c0446d6SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
5099c0446d6SStefano Zampini   ierr = PetscTryMethod(pc,"PCBDDCSetDofsSplitting_C",(PC,PetscInt,IS[]),(pc,n_is,ISForDofs));CHKERRQ(ierr);
5109c0446d6SStefano Zampini   PetscFunctionReturn(0);
5119c0446d6SStefano Zampini }
512da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
513534831adSStefano Zampini #undef __FUNCT__
514534831adSStefano Zampini #define __FUNCT__ "PCPreSolve_BDDC"
515534831adSStefano Zampini /* -------------------------------------------------------------------------- */
516534831adSStefano Zampini /*
517534831adSStefano Zampini    PCPreSolve_BDDC - Changes the right hand side and (if necessary) the initial
518534831adSStefano Zampini                      guess if a transformation of basis approach has been selected.
5199c0446d6SStefano Zampini 
520534831adSStefano Zampini    Input Parameter:
521534831adSStefano Zampini +  pc - the preconditioner contex
522534831adSStefano Zampini 
523534831adSStefano Zampini    Application Interface Routine: PCPreSolve()
524534831adSStefano Zampini 
525534831adSStefano Zampini    Notes:
526534831adSStefano Zampini    The interface routine PCPreSolve() is not usually called directly by
527534831adSStefano Zampini    the user, but instead is called by KSPSolve().
528534831adSStefano Zampini */
529534831adSStefano Zampini static PetscErrorCode PCPreSolve_BDDC(PC pc, KSP ksp, Vec rhs, Vec x)
530534831adSStefano Zampini {
531534831adSStefano Zampini   PetscErrorCode ierr;
532534831adSStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
533534831adSStefano Zampini   PC_IS          *pcis   = (PC_IS*)(pc->data);
534534831adSStefano Zampini   Mat_IS         *matis  = (Mat_IS*)pc->pmat->data;
535534831adSStefano Zampini   Mat            temp_mat;
5363972b0daSStefano Zampini   IS             dirIS;
5373972b0daSStefano Zampini   PetscInt       dirsize,i,*is_indices;
5383972b0daSStefano Zampini   PetscScalar    *array_x,*array_diagonal;
5393972b0daSStefano Zampini   Vec            used_vec;
5403972b0daSStefano Zampini   PetscBool      guess_nonzero;
541534831adSStefano Zampini 
542534831adSStefano Zampini   PetscFunctionBegin;
5433972b0daSStefano Zampini   if (x) {
5443972b0daSStefano Zampini     ierr     = PetscObjectReference((PetscObject)x);CHKERRQ(ierr);
5453972b0daSStefano Zampini     used_vec = x;
5463972b0daSStefano Zampini   } else {
5473972b0daSStefano Zampini     ierr     = PetscObjectReference((PetscObject)pcbddc->temp_solution);CHKERRQ(ierr);
5483972b0daSStefano Zampini     used_vec = pcbddc->temp_solution;
5493972b0daSStefano Zampini     ierr     = VecSet(used_vec,0.0);CHKERRQ(ierr);
5503972b0daSStefano Zampini   }
5513972b0daSStefano Zampini   /* hack into ksp data structure PCPreSolve comes earlier in src/ksp/ksp/interface/itfunc.c */
5523972b0daSStefano Zampini   if (ksp) {
5533972b0daSStefano Zampini     ierr = KSPGetInitialGuessNonzero(ksp,&guess_nonzero);CHKERRQ(ierr);
5543972b0daSStefano Zampini     if (!guess_nonzero) {
5553972b0daSStefano Zampini       ierr = VecSet(used_vec,0.0);CHKERRQ(ierr);
5563972b0daSStefano Zampini     }
5573972b0daSStefano Zampini   }
5583972b0daSStefano Zampini   /* store the original rhs */
5593972b0daSStefano Zampini   ierr = VecCopy(rhs,pcbddc->original_rhs);CHKERRQ(ierr);
5603972b0daSStefano Zampini 
5613972b0daSStefano Zampini   /* Take into account zeroed rows -> change rhs and store solution removed */
5623972b0daSStefano Zampini   ierr = MatGetDiagonal(pc->pmat,pcis->vec1_global);CHKERRQ(ierr);
5633972b0daSStefano Zampini   ierr = VecPointwiseDivide(pcis->vec1_global,rhs,pcis->vec1_global);CHKERRQ(ierr);
5643972b0daSStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5653972b0daSStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5663972b0daSStefano Zampini   ierr = VecScatterBegin(matis->ctx,used_vec,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5673972b0daSStefano Zampini   ierr = VecScatterEnd  (matis->ctx,used_vec,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5683972b0daSStefano Zampini   ierr = PCBDDCGetDirichletBoundaries(pc,&dirIS);CHKERRQ(ierr);
5693972b0daSStefano Zampini   if (dirIS) {
5703972b0daSStefano Zampini     ierr = ISGetSize(dirIS,&dirsize);CHKERRQ(ierr);
5713972b0daSStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array_x);CHKERRQ(ierr);
5723972b0daSStefano Zampini     ierr = VecGetArray(pcis->vec2_N,&array_diagonal);CHKERRQ(ierr);
5733972b0daSStefano Zampini     ierr = ISGetIndices(dirIS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
574*2fa5cd67SKarl Rupp     for (i=0; i<dirsize; i++) array_x[is_indices[i]] = array_diagonal[is_indices[i]];
575*2fa5cd67SKarl Rupp 
5763972b0daSStefano Zampini     ierr = ISRestoreIndices(dirIS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
5773972b0daSStefano Zampini     ierr = VecRestoreArray(pcis->vec2_N,&array_diagonal);CHKERRQ(ierr);
5783972b0daSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array_x);CHKERRQ(ierr);
5793972b0daSStefano Zampini   }
5803972b0daSStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
5813972b0daSStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
582b76ba322SStefano Zampini 
5833972b0daSStefano Zampini   /* remove the computed solution from the rhs */
5843972b0daSStefano Zampini   ierr = VecScale(used_vec,-1.0);CHKERRQ(ierr);
5853972b0daSStefano Zampini   ierr = MatMultAdd(pc->pmat,used_vec,rhs,rhs);CHKERRQ(ierr);
5863972b0daSStefano Zampini   ierr = VecScale(used_vec,-1.0);CHKERRQ(ierr);
587b76ba322SStefano Zampini 
588b76ba322SStefano Zampini   /* store partially computed solution and set initial guess */
5893972b0daSStefano Zampini   if (x) {
5903972b0daSStefano Zampini     ierr = VecCopy(used_vec,pcbddc->temp_solution);CHKERRQ(ierr);
5913972b0daSStefano Zampini     ierr = VecSet(used_vec,0.0);CHKERRQ(ierr);
592b76ba322SStefano Zampini     if (pcbddc->use_exact_dirichlet) {
593b76ba322SStefano Zampini       ierr = VecScatterBegin(pcis->global_to_D,rhs,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
594b76ba322SStefano Zampini       ierr = VecScatterEnd  (pcis->global_to_D,rhs,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
595b76ba322SStefano Zampini       ierr = KSPSolve(pcbddc->ksp_D,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
596b76ba322SStefano Zampini       ierr = VecScatterBegin(pcis->global_to_D,pcis->vec2_D,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
597b76ba322SStefano Zampini       ierr = VecScatterEnd  (pcis->global_to_D,pcis->vec2_D,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
598b76ba322SStefano Zampini       if (ksp) {
599b76ba322SStefano Zampini         ierr = KSPSetInitialGuessNonzero(ksp,PETSC_TRUE);CHKERRQ(ierr);
600b76ba322SStefano Zampini       }
601b76ba322SStefano Zampini     }
6023972b0daSStefano Zampini   }
603b76ba322SStefano Zampini 
604b76ba322SStefano Zampini   /* rhs change of basis */
605b76ba322SStefano Zampini   if (pcbddc->usechangeofbasis) {
606b76ba322SStefano Zampini     /* swap pointers for local matrices */
607b76ba322SStefano Zampini     temp_mat          = matis->A;
608b76ba322SStefano Zampini     matis->A          = pcbddc->local_mat;
609b76ba322SStefano Zampini     pcbddc->local_mat = temp_mat;
610b76ba322SStefano Zampini     /* Get local rhs and apply transformation of basis */
611b76ba322SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,rhs,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
612b76ba322SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,rhs,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
613b76ba322SStefano Zampini     /* from original basis to modified basis */
614b76ba322SStefano Zampini     ierr = MatMultTranspose(pcbddc->ChangeOfBasisMatrix,pcis->vec1_B,pcis->vec2_B);CHKERRQ(ierr);
615b76ba322SStefano Zampini     /* put back modified values into the global vec using INSERT_VALUES copy mode */
616b76ba322SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec2_B,rhs,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
617b76ba322SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec2_B,rhs,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
6180bdf917eSStefano Zampini     if (ksp && pcbddc->NullSpace) {
6190bdf917eSStefano Zampini       ierr = MatNullSpaceRemove(pcbddc->NullSpace,used_vec,PETSC_NULL);CHKERRQ(ierr);
6200bdf917eSStefano Zampini       ierr = MatNullSpaceRemove(pcbddc->NullSpace,rhs,PETSC_NULL);CHKERRQ(ierr);
621b76ba322SStefano Zampini     }
6220bdf917eSStefano Zampini   }
6230bdf917eSStefano Zampini   ierr = VecDestroy(&used_vec);CHKERRQ(ierr);
624534831adSStefano Zampini   PetscFunctionReturn(0);
625534831adSStefano Zampini }
626534831adSStefano Zampini /* -------------------------------------------------------------------------- */
627534831adSStefano Zampini #undef __FUNCT__
628534831adSStefano Zampini #define __FUNCT__ "PCPostSolve_BDDC"
629534831adSStefano Zampini /* -------------------------------------------------------------------------- */
630534831adSStefano Zampini /*
631534831adSStefano Zampini    PCPostSolve_BDDC - Changes the computed solution if a transformation of basis
632534831adSStefano Zampini                      approach has been selected. Also, restores rhs to its original state.
633534831adSStefano Zampini 
634534831adSStefano Zampini    Input Parameter:
635534831adSStefano Zampini +  pc - the preconditioner contex
636534831adSStefano Zampini 
637534831adSStefano Zampini    Application Interface Routine: PCPostSolve()
638534831adSStefano Zampini 
639534831adSStefano Zampini    Notes:
640534831adSStefano Zampini    The interface routine PCPostSolve() is not usually called directly by
641534831adSStefano Zampini    the user, but instead is called by KSPSolve().
642534831adSStefano Zampini */
643534831adSStefano Zampini static PetscErrorCode PCPostSolve_BDDC(PC pc, KSP ksp, Vec rhs, Vec x)
644534831adSStefano Zampini {
645534831adSStefano Zampini   PetscErrorCode ierr;
646534831adSStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
647534831adSStefano Zampini   PC_IS          *pcis   = (PC_IS*)(pc->data);
648534831adSStefano Zampini   Mat_IS         *matis  = (Mat_IS*)pc->pmat->data;
649534831adSStefano Zampini   Mat            temp_mat;
650534831adSStefano Zampini 
651534831adSStefano Zampini   PetscFunctionBegin;
652534831adSStefano Zampini   if (pcbddc->usechangeofbasis) {
653534831adSStefano Zampini     /* swap pointers for local matrices */
654534831adSStefano Zampini     temp_mat          = matis->A;
655534831adSStefano Zampini     matis->A          = pcbddc->local_mat;
656534831adSStefano Zampini     pcbddc->local_mat = temp_mat;
657534831adSStefano Zampini     /* restore rhs to its original state */
6583425bc38SStefano Zampini     if (rhs) {
6593425bc38SStefano Zampini       ierr = VecCopy(pcbddc->original_rhs,rhs);CHKERRQ(ierr);
6603425bc38SStefano Zampini     }
661534831adSStefano Zampini     /* Get Local boundary and apply transformation of basis to solution vector */
662534831adSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,x,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
663534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,x,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
664534831adSStefano Zampini     /* from modified basis to original basis */
665534831adSStefano Zampini     ierr = MatMult(pcbddc->ChangeOfBasisMatrix,pcis->vec1_B,pcis->vec2_B);CHKERRQ(ierr);
666534831adSStefano Zampini     /* put back modified values into the global vec using INSERT_VALUES copy mode */
667534831adSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec2_B,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
668534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec2_B,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
669534831adSStefano Zampini   }
6703972b0daSStefano Zampini   /* add solution removed in presolve */
6713425bc38SStefano Zampini   if (x) {
6723425bc38SStefano Zampini     ierr = VecAXPY(x,1.0,pcbddc->temp_solution);CHKERRQ(ierr);
6733425bc38SStefano Zampini   }
674534831adSStefano Zampini   PetscFunctionReturn(0);
675534831adSStefano Zampini }
676534831adSStefano Zampini /* -------------------------------------------------------------------------- */
67753cdbc3dSStefano Zampini #undef __FUNCT__
67853cdbc3dSStefano Zampini #define __FUNCT__ "PCSetUp_BDDC"
6790c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
6800c7d97c5SJed Brown /*
6810c7d97c5SJed Brown    PCSetUp_BDDC - Prepares for the use of the BDDC preconditioner
6820c7d97c5SJed Brown                   by setting data structures and options.
6830c7d97c5SJed Brown 
6840c7d97c5SJed Brown    Input Parameter:
68553cdbc3dSStefano Zampini +  pc - the preconditioner context
6860c7d97c5SJed Brown 
6870c7d97c5SJed Brown    Application Interface Routine: PCSetUp()
6880c7d97c5SJed Brown 
6890c7d97c5SJed Brown    Notes:
6900c7d97c5SJed Brown    The interface routine PCSetUp() is not usually called directly by
6910c7d97c5SJed Brown    the user, but instead is called by PCApply() if necessary.
6920c7d97c5SJed Brown */
69353cdbc3dSStefano Zampini PetscErrorCode PCSetUp_BDDC(PC pc)
6940c7d97c5SJed Brown {
6950c7d97c5SJed Brown   PetscErrorCode ierr;
6960c7d97c5SJed Brown   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
6970c7d97c5SJed Brown 
6980c7d97c5SJed Brown   PetscFunctionBegin;
6990c7d97c5SJed Brown   if (!pc->setupcalled) {
7003b03a366Sstefano_zampini     /* For BDDC we need to define a local "Neumann" problem different to that defined in PCISSetup
7019c0446d6SStefano Zampini        So, we set to pcnone the Neumann problem of pcis in order to avoid unneeded computation
7020c7d97c5SJed Brown        Also, we decide to directly build the (same) Dirichlet problem */
7030c7d97c5SJed Brown     ierr = PetscOptionsSetValue("-is_localN_pc_type","none");CHKERRQ(ierr);
7040c7d97c5SJed Brown     ierr = PetscOptionsSetValue("-is_localD_pc_type","none");CHKERRQ(ierr);
7050c7d97c5SJed Brown     /* Set up all the "iterative substructuring" common block */
7060bdf917eSStefano Zampini 
7070c7d97c5SJed Brown     ierr = PCISSetUp(pc);CHKERRQ(ierr);
7083b03a366Sstefano_zampini     /* Get stdout for dbg */
709e269702eSStefano Zampini     if (pcbddc->dbg_flag) {
710e269702eSStefano Zampini       ierr = PetscViewerASCIIGetStdout(((PetscObject)pc)->comm,&pcbddc->dbg_viewer);CHKERRQ(ierr);
711e269702eSStefano Zampini       ierr = PetscViewerASCIISynchronizedAllow(pcbddc->dbg_viewer,PETSC_TRUE);CHKERRQ(ierr);
712e269702eSStefano Zampini     }
7133b03a366Sstefano_zampini     /* Analyze local interface */
7140c7d97c5SJed Brown     ierr = PCBDDCManageLocalBoundaries(pc);CHKERRQ(ierr);
7153b03a366Sstefano_zampini     /* Set up local constraint matrix */
7163b03a366Sstefano_zampini     ierr = PCBDDCCreateConstraintMatrix(pc);CHKERRQ(ierr);
7170c7d97c5SJed Brown     /* Create coarse and local stuffs used for evaluating action of preconditioner */
7180c7d97c5SJed Brown     ierr = PCBDDCCoarseSetUp(pc);CHKERRQ(ierr);
7190c7d97c5SJed Brown   }
7200c7d97c5SJed Brown   PetscFunctionReturn(0);
7210c7d97c5SJed Brown }
7220c7d97c5SJed Brown 
7230c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
7240c7d97c5SJed Brown /*
7250c7d97c5SJed Brown    PCApply_BDDC - Applies the BDDC preconditioner to a vector.
7260c7d97c5SJed Brown 
7270c7d97c5SJed Brown    Input Parameters:
7280c7d97c5SJed Brown .  pc - the preconditioner context
7290c7d97c5SJed Brown .  r - input vector (global)
7300c7d97c5SJed Brown 
7310c7d97c5SJed Brown    Output Parameter:
7320c7d97c5SJed Brown .  z - output vector (global)
7330c7d97c5SJed Brown 
7340c7d97c5SJed Brown    Application Interface Routine: PCApply()
7350c7d97c5SJed Brown  */
7360c7d97c5SJed Brown #undef __FUNCT__
7370c7d97c5SJed Brown #define __FUNCT__ "PCApply_BDDC"
73853cdbc3dSStefano Zampini PetscErrorCode PCApply_BDDC(PC pc,Vec r,Vec z)
7390c7d97c5SJed Brown {
7400c7d97c5SJed Brown   PC_IS             *pcis   = (PC_IS*)(pc->data);
7410c7d97c5SJed Brown   PC_BDDC           *pcbddc = (PC_BDDC*)(pc->data);
7420c7d97c5SJed Brown   PetscErrorCode    ierr;
7433b03a366Sstefano_zampini   const PetscScalar one   = 1.0;
7443b03a366Sstefano_zampini   const PetscScalar m_one = -1.0;
7452617d88aSStefano Zampini   const PetscScalar zero  = 0.0;
7460c7d97c5SJed Brown 
7470c7d97c5SJed Brown /* This code is similar to that provided in nn.c for PCNN
7480c7d97c5SJed Brown    NN interface preconditioner changed to BDDC
74929622bf0SStefano Zampini    Added support for M_3 preconditioner in the reference article (code is active if pcbddc->inexact_prec_type = PETSC_TRUE) */
7500c7d97c5SJed Brown 
7510c7d97c5SJed Brown   PetscFunctionBegin;
752b76ba322SStefano Zampini   if (!pcbddc->use_exact_dirichlet) {
7530c7d97c5SJed Brown     /* First Dirichlet solve */
7540c7d97c5SJed Brown     ierr = VecScatterBegin(pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7550c7d97c5SJed Brown     ierr = VecScatterEnd  (pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
75653cdbc3dSStefano Zampini     ierr = KSPSolve(pcbddc->ksp_D,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
7570c7d97c5SJed Brown     /*
7580c7d97c5SJed Brown       Assembling right hand side for BDDC operator
7590c7d97c5SJed Brown       - vec1_D for the Dirichlet part (if needed, i.e. prec_flag=PETSC_TRUE)
7600c7d97c5SJed Brown       - the interface part of the global vector z
7610c7d97c5SJed Brown     */
7620c7d97c5SJed Brown     ierr = VecScale(pcis->vec2_D,m_one);CHKERRQ(ierr);
7630c7d97c5SJed Brown     ierr = MatMult(pcis->A_BI,pcis->vec2_D,pcis->vec1_B);CHKERRQ(ierr);
76429622bf0SStefano Zampini     if (pcbddc->inexact_prec_type) { ierr = MatMultAdd(pcis->A_II,pcis->vec2_D,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); }
7650c7d97c5SJed Brown     ierr = VecScale(pcis->vec2_D,m_one);CHKERRQ(ierr);
7660c7d97c5SJed Brown     ierr = VecCopy(r,z);CHKERRQ(ierr);
7670c7d97c5SJed Brown     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
7680c7d97c5SJed Brown     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
7692617d88aSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7702617d88aSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
771b76ba322SStefano Zampini   } else {
772b76ba322SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,r,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
773b76ba322SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,r,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7740bdf917eSStefano Zampini     ierr = VecSet(pcis->vec1_D,zero);CHKERRQ(ierr);
775b76ba322SStefano Zampini     ierr = VecSet(pcis->vec2_D,zero);CHKERRQ(ierr);
776b76ba322SStefano Zampini   }
777b76ba322SStefano Zampini 
778b76ba322SStefano Zampini   /* Apply partition of unity */
7792617d88aSStefano Zampini   ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr);
7802617d88aSStefano Zampini 
7812617d88aSStefano Zampini   /* Apply interface preconditioner
7822617d88aSStefano Zampini      input/output vecs: pcis->vec1_B and pcis->vec1_D */
7832617d88aSStefano Zampini   ierr = PCBDDCApplyInterfacePreconditioner(pc);CHKERRQ(ierr);
7842617d88aSStefano Zampini 
7852617d88aSStefano Zampini   /* Apply partition of unity and sum boundary values */
7862617d88aSStefano Zampini   ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr);
7872617d88aSStefano Zampini   ierr = VecSet(z,zero);CHKERRQ(ierr);
7882617d88aSStefano Zampini   ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
7892617d88aSStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
7900c7d97c5SJed Brown 
7913b03a366Sstefano_zampini   /* Second Dirichlet solve and assembling of output */
7920c7d97c5SJed Brown   ierr = VecScatterBegin(pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7930c7d97c5SJed Brown   ierr = VecScatterEnd  (pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7940c7d97c5SJed Brown   ierr = MatMult(pcis->A_IB,pcis->vec1_B,pcis->vec3_D);CHKERRQ(ierr);
79529622bf0SStefano Zampini   if (pcbddc->inexact_prec_type) { ierr = MatMultAdd(pcis->A_II,pcis->vec1_D,pcis->vec3_D,pcis->vec3_D);CHKERRQ(ierr); }
79653cdbc3dSStefano Zampini   ierr = KSPSolve(pcbddc->ksp_D,pcis->vec3_D,pcbddc->vec4_D);CHKERRQ(ierr);
7970c7d97c5SJed Brown   ierr = VecScale(pcbddc->vec4_D,m_one);CHKERRQ(ierr);
79829622bf0SStefano Zampini   if (pcbddc->inexact_prec_type) { ierr = VecAXPY (pcbddc->vec4_D,one,pcis->vec1_D);CHKERRQ(ierr); }
7990c7d97c5SJed Brown   ierr = VecAXPY (pcis->vec2_D,one,pcbddc->vec4_D);CHKERRQ(ierr);
8000c7d97c5SJed Brown   ierr = VecScatterBegin(pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8010c7d97c5SJed Brown   ierr = VecScatterEnd  (pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8020c7d97c5SJed Brown   PetscFunctionReturn(0);
8030c7d97c5SJed Brown 
8040c7d97c5SJed Brown }
805da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
806da1bb401SStefano Zampini #undef __FUNCT__
807da1bb401SStefano Zampini #define __FUNCT__ "PCDestroy_BDDC"
808da1bb401SStefano Zampini PetscErrorCode PCDestroy_BDDC(PC pc)
809da1bb401SStefano Zampini {
810da1bb401SStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
8110bdf917eSStefano Zampini   PetscInt       i;
812da1bb401SStefano Zampini   PetscErrorCode ierr;
813da1bb401SStefano Zampini 
814da1bb401SStefano Zampini   PetscFunctionBegin;
815da1bb401SStefano Zampini   /* free data created by PCIS */
816da1bb401SStefano Zampini   ierr = PCISDestroy(pc);CHKERRQ(ierr);
817da1bb401SStefano Zampini   /* free BDDC data  */
8180bdf917eSStefano Zampini   ierr = MatNullSpaceDestroy(&pcbddc->CoarseNullSpace);CHKERRQ(ierr);
8190bdf917eSStefano Zampini   ierr = MatNullSpaceDestroy(&pcbddc->NullSpace);CHKERRQ(ierr);
8203972b0daSStefano Zampini   ierr = VecDestroy(&pcbddc->temp_solution);CHKERRQ(ierr);
821534831adSStefano Zampini   ierr = VecDestroy(&pcbddc->original_rhs);CHKERRQ(ierr);
822534831adSStefano Zampini   ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr);
823534831adSStefano Zampini   ierr = MatDestroy(&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr);
824da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->coarse_vec);CHKERRQ(ierr);
825da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->coarse_rhs);CHKERRQ(ierr);
826da1bb401SStefano Zampini   ierr = KSPDestroy(&pcbddc->coarse_ksp);CHKERRQ(ierr);
827da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->coarse_mat);CHKERRQ(ierr);
828da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->coarse_phi_B);CHKERRQ(ierr);
829da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->coarse_phi_D);CHKERRQ(ierr);
830da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec1_P);CHKERRQ(ierr);
831da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec1_C);CHKERRQ(ierr);
832da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->local_auxmat1);CHKERRQ(ierr);
833da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->local_auxmat2);CHKERRQ(ierr);
834da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec1_R);CHKERRQ(ierr);
835da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec2_R);CHKERRQ(ierr);
836da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec4_D);CHKERRQ(ierr);
837da1bb401SStefano Zampini   ierr = VecScatterDestroy(&pcbddc->R_to_B);CHKERRQ(ierr);
838da1bb401SStefano Zampini   ierr = VecScatterDestroy(&pcbddc->R_to_D);CHKERRQ(ierr);
839da1bb401SStefano Zampini   ierr = VecScatterDestroy(&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr);
840da1bb401SStefano Zampini   ierr = KSPDestroy(&pcbddc->ksp_D);CHKERRQ(ierr);
841da1bb401SStefano Zampini   ierr = KSPDestroy(&pcbddc->ksp_R);CHKERRQ(ierr);
842da1bb401SStefano Zampini   ierr = ISDestroy(&pcbddc->NeumannBoundaries);CHKERRQ(ierr);
843da1bb401SStefano Zampini   ierr = ISDestroy(&pcbddc->DirichletBoundaries);CHKERRQ(ierr);
844da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->ConstraintMatrix);CHKERRQ(ierr);
845da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->local_primal_indices);CHKERRQ(ierr);
846da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->replicated_local_primal_indices);CHKERRQ(ierr);
8470bdf917eSStefano Zampini   ierr = PetscFree(pcbddc->replicated_local_primal_values);CHKERRQ(ierr);
848da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->local_primal_displacements);CHKERRQ(ierr);
849da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->local_primal_sizes);CHKERRQ(ierr);
850*2fa5cd67SKarl Rupp   for (i=0; i<pcbddc->n_ISForDofs; i++) {
851*2fa5cd67SKarl Rupp     ierr = ISDestroy(&pcbddc->ISForDofs[i]);CHKERRQ(ierr);
852*2fa5cd67SKarl Rupp   }
853da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->ISForDofs);CHKERRQ(ierr);
854*2fa5cd67SKarl Rupp   for (i=0; i<pcbddc->n_ISForFaces; i++) {
855*2fa5cd67SKarl Rupp     ierr = ISDestroy(&pcbddc->ISForFaces[i]);CHKERRQ(ierr);
856*2fa5cd67SKarl Rupp   }
857da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->ISForFaces);CHKERRQ(ierr);
858*2fa5cd67SKarl Rupp   for (i=0; i<pcbddc->n_ISForEdges; i++) {
859*2fa5cd67SKarl Rupp     ierr = ISDestroy(&pcbddc->ISForEdges[i]);CHKERRQ(ierr);
860*2fa5cd67SKarl Rupp   }
861da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->ISForEdges);CHKERRQ(ierr);
862da1bb401SStefano Zampini   ierr = ISDestroy(&pcbddc->ISForVertices);CHKERRQ(ierr);
8633972b0daSStefano Zampini   /* Free graph structure */
864da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->xadj);CHKERRQ(ierr);
865da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->adjncy);CHKERRQ(ierr);
866142dfd88SStefano Zampini   if (pcbddc->mat_graph->nvtxs) {
867da1bb401SStefano Zampini     ierr = PetscFree(pcbddc->mat_graph->neighbours_set[0]);CHKERRQ(ierr);
868142dfd88SStefano Zampini   }
869da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->neighbours_set);CHKERRQ(ierr);
8703972b0daSStefano Zampini   ierr = PetscFree4(pcbddc->mat_graph->where,pcbddc->mat_graph->count,pcbddc->mat_graph->cptr,pcbddc->mat_graph->queue);CHKERRQ(ierr);
8713972b0daSStefano Zampini   ierr = PetscFree2(pcbddc->mat_graph->which_dof,pcbddc->mat_graph->touched);CHKERRQ(ierr);
8723972b0daSStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->where_ncmps);CHKERRQ(ierr);
873da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph);CHKERRQ(ierr);
8743425bc38SStefano Zampini   /* remove functions */
8754fad6a16SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseningRatio_C","",PETSC_NULL);CHKERRQ(ierr);
8764fad6a16SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetMaxLevels_C","",PETSC_NULL);CHKERRQ(ierr);
8770bdf917eSStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNullSpace_C","",PETSC_NULL);CHKERRQ(ierr);
8783425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDirichletBoundaries_C","",PETSC_NULL);CHKERRQ(ierr);
8793425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNeumannBoundaries_C","",PETSC_NULL);CHKERRQ(ierr);
8803425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetDirichletBoundaries_C","",PETSC_NULL);CHKERRQ(ierr);
8813425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetNeumannBoundaries_C","",PETSC_NULL);CHKERRQ(ierr);
8823425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseProblemType_C","",PETSC_NULL);CHKERRQ(ierr);
8833425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDofsSplitting_C","",PETSC_NULL);CHKERRQ(ierr);
8843425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetLocalAdjacencyGraph_C","",PETSC_NULL);CHKERRQ(ierr);
8853425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPreSolve_C","",PETSC_NULL);CHKERRQ(ierr);
8863425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPostSolve_C","",PETSC_NULL);CHKERRQ(ierr);
8873425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCCreateFETIDPOperators_C","",PETSC_NULL);CHKERRQ(ierr);
8883425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetRHS_C","",PETSC_NULL);CHKERRQ(ierr);
8893425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetSolution_C","",PETSC_NULL);CHKERRQ(ierr);
890da1bb401SStefano Zampini   /* Free the private data structure that was hanging off the PC */
891da1bb401SStefano Zampini   ierr = PetscFree(pcbddc);CHKERRQ(ierr);
892da1bb401SStefano Zampini   PetscFunctionReturn(0);
893da1bb401SStefano Zampini }
8943425bc38SStefano Zampini /* -------------------------------------------------------------------------- */
8953425bc38SStefano Zampini EXTERN_C_BEGIN
8963425bc38SStefano Zampini #undef __FUNCT__
8973425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetRHS_BDDC"
8983425bc38SStefano Zampini static PetscErrorCode PCBDDCMatFETIDPGetRHS_BDDC(Mat fetidp_mat, Vec standard_rhs, Vec fetidp_flux_rhs)
8993425bc38SStefano Zampini {
9003425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
9013425bc38SStefano Zampini   PC_IS          * pcis;
9023425bc38SStefano Zampini   PC_BDDC        * pcbddc;
9033425bc38SStefano Zampini   PetscErrorCode ierr;
9040c7d97c5SJed Brown 
9053425bc38SStefano Zampini   PetscFunctionBegin;
9063425bc38SStefano Zampini   ierr   = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr);
9073425bc38SStefano Zampini   pcis   = (PC_IS*)mat_ctx->pc->data;
9083425bc38SStefano Zampini   pcbddc = (PC_BDDC*)mat_ctx->pc->data;
9093425bc38SStefano Zampini 
9103425bc38SStefano Zampini   /* change of basis for physical rhs if needed
9113425bc38SStefano Zampini      It also changes the rhs in case of dirichlet boundaries */
9123425bc38SStefano Zampini   (*mat_ctx->pc->ops->presolve)(mat_ctx->pc,PETSC_NULL,standard_rhs,PETSC_NULL);
9133425bc38SStefano Zampini   /* store vectors for computation of fetidp final solution */
9143425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->global_to_D,standard_rhs,mat_ctx->temp_solution_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9153425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_D,standard_rhs,mat_ctx->temp_solution_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9163425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9173425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9183425bc38SStefano Zampini   /* scale rhs since it should be unassembled */
9193425bc38SStefano Zampini   ierr = VecPointwiseMult(mat_ctx->temp_solution_B,pcis->D,mat_ctx->temp_solution_B);CHKERRQ(ierr);
92029622bf0SStefano Zampini   if (!pcbddc->inexact_prec_type) {
9213425bc38SStefano Zampini     /* compute partially subassembled Schur complement right-hand side */
9223425bc38SStefano Zampini     ierr = KSPSolve(pcbddc->ksp_D,mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr);
9233425bc38SStefano Zampini     ierr = MatMult(pcis->A_BI,pcis->vec1_D,pcis->vec1_B);CHKERRQ(ierr);
9243425bc38SStefano Zampini     ierr = VecAXPY(mat_ctx->temp_solution_B,-1.0,pcis->vec1_B);CHKERRQ(ierr);
9253425bc38SStefano Zampini     ierr = VecSet(standard_rhs,0.0);CHKERRQ(ierr);
9263425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,mat_ctx->temp_solution_B,standard_rhs,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
9273425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,mat_ctx->temp_solution_B,standard_rhs,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
9283425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9293425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9303425bc38SStefano Zampini     ierr = VecPointwiseMult(mat_ctx->temp_solution_B,pcis->D,mat_ctx->temp_solution_B);CHKERRQ(ierr);
9313425bc38SStefano Zampini   }
9323425bc38SStefano Zampini   /* BDDC rhs */
9333425bc38SStefano Zampini   ierr = VecCopy(mat_ctx->temp_solution_B,pcis->vec1_B);CHKERRQ(ierr);
93429622bf0SStefano Zampini   if (pcbddc->inexact_prec_type) {
9353425bc38SStefano Zampini     ierr = VecCopy(mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr);
9363425bc38SStefano Zampini   }
9373425bc38SStefano Zampini   /* apply BDDC */
9383425bc38SStefano Zampini   ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr);
9393425bc38SStefano Zampini   /* Application of B_delta and assembling of rhs for fetidp fluxes */
9403425bc38SStefano Zampini   ierr = VecSet(fetidp_flux_rhs,0.0);CHKERRQ(ierr);
9413425bc38SStefano Zampini   ierr = MatMult(mat_ctx->B_delta,pcis->vec1_B,mat_ctx->lambda_local);CHKERRQ(ierr);
9423425bc38SStefano Zampini   ierr = VecScatterBegin(mat_ctx->l2g_lambda,mat_ctx->lambda_local,fetidp_flux_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9433425bc38SStefano Zampini   ierr = VecScatterEnd  (mat_ctx->l2g_lambda,mat_ctx->lambda_local,fetidp_flux_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9443425bc38SStefano Zampini   /* restore original rhs */
9453425bc38SStefano Zampini   ierr = VecCopy(pcbddc->original_rhs,standard_rhs);CHKERRQ(ierr);
9463425bc38SStefano Zampini   PetscFunctionReturn(0);
9473425bc38SStefano Zampini }
9483425bc38SStefano Zampini EXTERN_C_END
9493425bc38SStefano Zampini #undef __FUNCT__
9503425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetRHS"
9513425bc38SStefano Zampini /*@
9523425bc38SStefano Zampini  PCBDDCMatFETIDPGetRHS - Get rhs for FETIDP linear system.
9533425bc38SStefano Zampini 
9543425bc38SStefano Zampini    Collective
9553425bc38SStefano Zampini 
9563425bc38SStefano Zampini    Input Parameters:
9573425bc38SStefano Zampini +  fetidp_mat   - the FETIDP mat obtained by a call to PCBDDCCreateFETIDPOperators
9583425bc38SStefano Zampini +  standard_rhs - the rhs of your linear system
9593425bc38SStefano Zampini 
9603425bc38SStefano Zampini    Output Parameters:
9613425bc38SStefano Zampini +  fetidp_flux_rhs   - the rhs of the FETIDP linear system
9623425bc38SStefano Zampini 
9633425bc38SStefano Zampini    Level: developer
9643425bc38SStefano Zampini 
9653425bc38SStefano Zampini    Notes:
9663425bc38SStefano Zampini 
9673425bc38SStefano Zampini .seealso: PCBDDC
9683425bc38SStefano Zampini @*/
9693425bc38SStefano Zampini PetscErrorCode PCBDDCMatFETIDPGetRHS(Mat fetidp_mat, Vec standard_rhs, Vec fetidp_flux_rhs)
9703425bc38SStefano Zampini {
9713425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
9723425bc38SStefano Zampini   PetscErrorCode ierr;
9733425bc38SStefano Zampini 
9743425bc38SStefano Zampini   PetscFunctionBegin;
9753425bc38SStefano Zampini   ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr);
9763425bc38SStefano Zampini   ierr = PetscTryMethod(mat_ctx->pc,"PCBDDCMatFETIDPGetRHS_C",(Mat,Vec,Vec),(fetidp_mat,standard_rhs,fetidp_flux_rhs));CHKERRQ(ierr);
9773425bc38SStefano Zampini   PetscFunctionReturn(0);
9783425bc38SStefano Zampini }
9793425bc38SStefano Zampini /* -------------------------------------------------------------------------- */
9803425bc38SStefano Zampini EXTERN_C_BEGIN
9813425bc38SStefano Zampini #undef __FUNCT__
9823425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetSolution_BDDC"
9833425bc38SStefano Zampini static PetscErrorCode PCBDDCMatFETIDPGetSolution_BDDC(Mat fetidp_mat, Vec fetidp_flux_sol, Vec standard_sol)
9843425bc38SStefano Zampini {
9853425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
9863425bc38SStefano Zampini   PC_IS          *pcis;
9873425bc38SStefano Zampini   PC_BDDC        *pcbddc;
9883425bc38SStefano Zampini   PetscErrorCode ierr;
9893425bc38SStefano Zampini 
9903425bc38SStefano Zampini   PetscFunctionBegin;
9913425bc38SStefano Zampini   ierr   = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr);
9923425bc38SStefano Zampini   pcis   = (PC_IS*)mat_ctx->pc->data;
9933425bc38SStefano Zampini   pcbddc = (PC_BDDC*)mat_ctx->pc->data;
9943425bc38SStefano Zampini 
9953425bc38SStefano Zampini   /* apply B_delta^T */
9963425bc38SStefano Zampini   ierr = VecScatterBegin(mat_ctx->l2g_lambda,fetidp_flux_sol,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
9973425bc38SStefano Zampini   ierr = VecScatterEnd  (mat_ctx->l2g_lambda,fetidp_flux_sol,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
9983425bc38SStefano Zampini   ierr = MatMultTranspose(mat_ctx->B_delta,mat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
9993425bc38SStefano Zampini   /* compute rhs for BDDC application */
10003425bc38SStefano Zampini   ierr = VecAYPX(pcis->vec1_B,-1.0,mat_ctx->temp_solution_B);CHKERRQ(ierr);
100129622bf0SStefano Zampini   if (pcbddc->inexact_prec_type) {
10023425bc38SStefano Zampini     ierr = VecCopy(mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr);
10033425bc38SStefano Zampini   }
10043425bc38SStefano Zampini   /* apply BDDC */
10053425bc38SStefano Zampini   ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr);
10063425bc38SStefano Zampini   /* put values into standard global vector */
10073425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
10083425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
100929622bf0SStefano Zampini   if (!pcbddc->inexact_prec_type) {
10103425bc38SStefano Zampini     /* compute values into the interior if solved for the partially subassembled Schur complement */
10113425bc38SStefano Zampini     ierr = MatMult(pcis->A_IB,pcis->vec1_B,pcis->vec1_D);CHKERRQ(ierr);
10123425bc38SStefano Zampini     ierr = VecAXPY(mat_ctx->temp_solution_D,-1.0,pcis->vec1_D);CHKERRQ(ierr);
10133425bc38SStefano Zampini     ierr = KSPSolve(pcbddc->ksp_D,mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr);
10143425bc38SStefano Zampini   }
10153425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->global_to_D,pcis->vec1_D,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
10163425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_D,pcis->vec1_D,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
10173425bc38SStefano Zampini   /* final change of basis if needed
10183425bc38SStefano Zampini      Is also sums the dirichlet part removed during RHS assembling */
10193425bc38SStefano Zampini   (*mat_ctx->pc->ops->postsolve)(mat_ctx->pc,PETSC_NULL,PETSC_NULL,standard_sol);
10203425bc38SStefano Zampini   PetscFunctionReturn(0);
10213425bc38SStefano Zampini 
10223425bc38SStefano Zampini }
10233425bc38SStefano Zampini EXTERN_C_END
10243425bc38SStefano Zampini #undef __FUNCT__
10253425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetSolution"
10263425bc38SStefano Zampini /*@
10273425bc38SStefano Zampini  PCBDDCMatFETIDPGetSolution - Get Solution for FETIDP linear system.
10283425bc38SStefano Zampini 
10293425bc38SStefano Zampini    Collective
10303425bc38SStefano Zampini 
10313425bc38SStefano Zampini    Input Parameters:
10323425bc38SStefano Zampini +  fetidp_mat        - the FETIDP mat obtained by a call to PCBDDCCreateFETIDPOperators
10333425bc38SStefano Zampini +  fetidp_flux_sol - the solution of the FETIDP linear system
10343425bc38SStefano Zampini 
10353425bc38SStefano Zampini    Output Parameters:
10363425bc38SStefano Zampini +  standard_sol      - the solution on the global domain
10373425bc38SStefano Zampini 
10383425bc38SStefano Zampini    Level: developer
10393425bc38SStefano Zampini 
10403425bc38SStefano Zampini    Notes:
10413425bc38SStefano Zampini 
10423425bc38SStefano Zampini .seealso: PCBDDC
10433425bc38SStefano Zampini @*/
10443425bc38SStefano Zampini PetscErrorCode PCBDDCMatFETIDPGetSolution(Mat fetidp_mat, Vec fetidp_flux_sol, Vec standard_sol)
10453425bc38SStefano Zampini {
10463425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
10473425bc38SStefano Zampini   PetscErrorCode ierr;
10483425bc38SStefano Zampini 
10493425bc38SStefano Zampini   PetscFunctionBegin;
10503425bc38SStefano Zampini   ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr);
10513425bc38SStefano Zampini   ierr = PetscTryMethod(mat_ctx->pc,"PCBDDCMatFETIDPGetSolution_C",(Mat,Vec,Vec),(fetidp_mat,fetidp_flux_sol,standard_sol));CHKERRQ(ierr);
10523425bc38SStefano Zampini   PetscFunctionReturn(0);
10533425bc38SStefano Zampini }
10543425bc38SStefano Zampini /* -------------------------------------------------------------------------- */
10553425bc38SStefano Zampini EXTERN_C_BEGIN
1056f23aa3ddSBarry Smith extern PetscErrorCode FETIDPMatMult(Mat,Vec,Vec);
1057f23aa3ddSBarry Smith extern PetscErrorCode PCBDDCDestroyFETIDPMat(Mat);
1058f23aa3ddSBarry Smith extern PetscErrorCode FETIDPPCApply(PC,Vec,Vec);
1059f23aa3ddSBarry Smith extern PetscErrorCode PCBDDCDestroyFETIDPPC(PC);
10603425bc38SStefano Zampini #undef __FUNCT__
10613425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPOperators_BDDC"
10623425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPOperators_BDDC(PC pc, Mat *fetidp_mat, PC *fetidp_pc)
10633425bc38SStefano Zampini {
10643425bc38SStefano Zampini   FETIDPMat_ctx  *fetidpmat_ctx;
10653425bc38SStefano Zampini   Mat            newmat;
10663425bc38SStefano Zampini   FETIDPPC_ctx   *fetidppc_ctx;
10673425bc38SStefano Zampini   PC             newpc;
10683425bc38SStefano Zampini   MPI_Comm       comm = ((PetscObject)pc)->comm;
10693425bc38SStefano Zampini   PetscErrorCode ierr;
10703425bc38SStefano Zampini 
10713425bc38SStefano Zampini   PetscFunctionBegin;
10723425bc38SStefano Zampini   /* FETIDP linear matrix */
10733425bc38SStefano Zampini   ierr = PCBDDCCreateFETIDPMatContext(pc, &fetidpmat_ctx);CHKERRQ(ierr);
10743425bc38SStefano Zampini   ierr = PCBDDCSetupFETIDPMatContext(fetidpmat_ctx);CHKERRQ(ierr);
10753425bc38SStefano Zampini   ierr = MatCreateShell(comm,PETSC_DECIDE,PETSC_DECIDE,fetidpmat_ctx->n_lambda,fetidpmat_ctx->n_lambda,fetidpmat_ctx,&newmat);CHKERRQ(ierr);
10763425bc38SStefano Zampini   ierr = MatShellSetOperation(newmat,MATOP_MULT,(void (*)(void))FETIDPMatMult);CHKERRQ(ierr);
10773425bc38SStefano Zampini   ierr = MatShellSetOperation(newmat,MATOP_DESTROY,(void (*)(void))PCBDDCDestroyFETIDPMat);CHKERRQ(ierr);
10783425bc38SStefano Zampini   ierr = MatSetUp(newmat);CHKERRQ(ierr);
10793425bc38SStefano Zampini   /* FETIDP preconditioner */
10803425bc38SStefano Zampini   ierr = PCBDDCCreateFETIDPPCContext(pc, &fetidppc_ctx);CHKERRQ(ierr);
10813425bc38SStefano Zampini   ierr = PCBDDCSetupFETIDPPCContext(newmat,fetidppc_ctx);CHKERRQ(ierr);
10823425bc38SStefano Zampini   ierr = PCCreate(comm,&newpc);CHKERRQ(ierr);
10833425bc38SStefano Zampini   ierr = PCSetType(newpc,PCSHELL);CHKERRQ(ierr);
10843425bc38SStefano Zampini   ierr = PCShellSetContext(newpc,fetidppc_ctx);CHKERRQ(ierr);
10853425bc38SStefano Zampini   ierr = PCShellSetApply(newpc,FETIDPPCApply);CHKERRQ(ierr);
10863425bc38SStefano Zampini   ierr = PCShellSetDestroy(newpc,PCBDDCDestroyFETIDPPC);CHKERRQ(ierr);
10873425bc38SStefano Zampini   ierr = PCSetOperators(newpc,newmat,newmat,SAME_PRECONDITIONER);CHKERRQ(ierr);
10883425bc38SStefano Zampini   ierr = PCSetUp(newpc);CHKERRQ(ierr);
1089*2fa5cd67SKarl Rupp 
10903425bc38SStefano Zampini   /* return pointers for objects created */
10913425bc38SStefano Zampini   *fetidp_mat = newmat;
10923425bc38SStefano Zampini   *fetidp_pc  = newpc;
10933425bc38SStefano Zampini   PetscFunctionReturn(0);
10943425bc38SStefano Zampini }
10953425bc38SStefano Zampini EXTERN_C_END
10963425bc38SStefano Zampini #undef __FUNCT__
10973425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPOperators"
10983425bc38SStefano Zampini /*@
10993425bc38SStefano Zampini  PCBDDCCreateFETIDPOperators - Create operators for FETIDP.
11003425bc38SStefano Zampini 
11013425bc38SStefano Zampini    Collective
11023425bc38SStefano Zampini 
11033425bc38SStefano Zampini    Input Parameters:
11043425bc38SStefano Zampini +  pc - the BDDC preconditioning context (setup must be already called)
11053425bc38SStefano Zampini 
11063425bc38SStefano Zampini    Level: developer
11073425bc38SStefano Zampini 
11083425bc38SStefano Zampini    Notes:
11093425bc38SStefano Zampini 
11103425bc38SStefano Zampini .seealso: PCBDDC
11113425bc38SStefano Zampini @*/
11123425bc38SStefano Zampini PetscErrorCode PCBDDCCreateFETIDPOperators(PC pc, Mat *fetidp_mat, PC *fetidp_pc)
11133425bc38SStefano Zampini {
11143425bc38SStefano Zampini   PetscErrorCode ierr;
11153425bc38SStefano Zampini 
11163425bc38SStefano Zampini   PetscFunctionBegin;
11173425bc38SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
11183425bc38SStefano Zampini   if (pc->setupcalled) {
11193425bc38SStefano Zampini     ierr = PetscTryMethod(pc,"PCBDDCCreateFETIDPOperators_C",(PC,Mat*,PC*),(pc,fetidp_mat,fetidp_pc));CHKERRQ(ierr);
1120f23aa3ddSBarry Smith   } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"You must call PCSetup_BDDC() first \n");
11213425bc38SStefano Zampini   PetscFunctionReturn(0);
11223425bc38SStefano Zampini }
11230c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
1124da1bb401SStefano Zampini /*MC
1125da1bb401SStefano Zampini    PCBDDC - Balancing Domain Decomposition by Constraints.
11260c7d97c5SJed Brown 
1127da1bb401SStefano Zampini    Options Database Keys:
1128da1bb401SStefano Zampini .    -pcbddc ??? -
1129da1bb401SStefano Zampini 
1130da1bb401SStefano Zampini    Level: intermediate
1131da1bb401SStefano Zampini 
1132da1bb401SStefano Zampini    Notes: The matrix used with this preconditioner must be of type MATIS
1133da1bb401SStefano Zampini 
1134da1bb401SStefano Zampini           Unlike more 'conventional' interface preconditioners, this iterates over ALL the
1135da1bb401SStefano Zampini           degrees of freedom, NOT just those on the interface (this allows the use of approximate solvers
1136da1bb401SStefano Zampini           on the subdomains).
1137da1bb401SStefano Zampini 
1138da1bb401SStefano Zampini           Options for the coarse grid preconditioner can be set with -
1139da1bb401SStefano Zampini           Options for the Dirichlet subproblem can be set with -
1140da1bb401SStefano Zampini           Options for the Neumann subproblem can be set with -
1141da1bb401SStefano Zampini 
1142da1bb401SStefano Zampini    Contributed by Stefano Zampini
1143da1bb401SStefano Zampini 
1144da1bb401SStefano Zampini .seealso:  PCCreate(), PCSetType(), PCType (for list of available types), PC,  MATIS
1145da1bb401SStefano Zampini M*/
1146da1bb401SStefano Zampini EXTERN_C_BEGIN
1147da1bb401SStefano Zampini #undef __FUNCT__
1148da1bb401SStefano Zampini #define __FUNCT__ "PCCreate_BDDC"
1149da1bb401SStefano Zampini PetscErrorCode PCCreate_BDDC(PC pc)
1150da1bb401SStefano Zampini {
1151da1bb401SStefano Zampini   PetscErrorCode ierr;
1152da1bb401SStefano Zampini   PC_BDDC        *pcbddc;
1153da1bb401SStefano Zampini   PCBDDCGraph    mat_graph;
1154da1bb401SStefano Zampini 
1155da1bb401SStefano Zampini   PetscFunctionBegin;
1156da1bb401SStefano Zampini   /* Creates the private data structure for this preconditioner and attach it to the PC object. */
1157da1bb401SStefano Zampini   ierr     = PetscNewLog(pc,PC_BDDC,&pcbddc);CHKERRQ(ierr);
1158da1bb401SStefano Zampini   pc->data = (void*)pcbddc;
1159da1bb401SStefano Zampini 
1160da1bb401SStefano Zampini   /* create PCIS data structure */
1161da1bb401SStefano Zampini   ierr = PCISCreate(pc);CHKERRQ(ierr);
1162da1bb401SStefano Zampini 
1163da1bb401SStefano Zampini   /* BDDC specific */
11640bdf917eSStefano Zampini   pcbddc->CoarseNullSpace                 = 0;
11650bdf917eSStefano Zampini   pcbddc->NullSpace                       = 0;
11663972b0daSStefano Zampini   pcbddc->temp_solution                   = 0;
1167534831adSStefano Zampini   pcbddc->original_rhs                    = 0;
1168534831adSStefano Zampini   pcbddc->local_mat                       = 0;
1169534831adSStefano Zampini   pcbddc->ChangeOfBasisMatrix             = 0;
1170534831adSStefano Zampini   pcbddc->usechangeofbasis                = PETSC_TRUE;
1171534831adSStefano Zampini   pcbddc->usechangeonfaces                = PETSC_FALSE;
1172da1bb401SStefano Zampini   pcbddc->coarse_vec                      = 0;
1173da1bb401SStefano Zampini   pcbddc->coarse_rhs                      = 0;
1174da1bb401SStefano Zampini   pcbddc->coarse_ksp                      = 0;
1175da1bb401SStefano Zampini   pcbddc->coarse_phi_B                    = 0;
1176da1bb401SStefano Zampini   pcbddc->coarse_phi_D                    = 0;
1177da1bb401SStefano Zampini   pcbddc->vec1_P                          = 0;
1178da1bb401SStefano Zampini   pcbddc->vec1_R                          = 0;
1179da1bb401SStefano Zampini   pcbddc->vec2_R                          = 0;
1180da1bb401SStefano Zampini   pcbddc->local_auxmat1                   = 0;
1181da1bb401SStefano Zampini   pcbddc->local_auxmat2                   = 0;
1182da1bb401SStefano Zampini   pcbddc->R_to_B                          = 0;
1183da1bb401SStefano Zampini   pcbddc->R_to_D                          = 0;
1184da1bb401SStefano Zampini   pcbddc->ksp_D                           = 0;
1185da1bb401SStefano Zampini   pcbddc->ksp_R                           = 0;
1186da1bb401SStefano Zampini   pcbddc->local_primal_indices            = 0;
118729622bf0SStefano Zampini   pcbddc->inexact_prec_type               = PETSC_FALSE;
1188da1bb401SStefano Zampini   pcbddc->NeumannBoundaries               = 0;
1189da1bb401SStefano Zampini   pcbddc->ISForDofs                       = 0;
1190da1bb401SStefano Zampini   pcbddc->ISForVertices                   = 0;
1191da1bb401SStefano Zampini   pcbddc->n_ISForFaces                    = 0;
1192da1bb401SStefano Zampini   pcbddc->n_ISForEdges                    = 0;
1193da1bb401SStefano Zampini   pcbddc->ConstraintMatrix                = 0;
1194da1bb401SStefano Zampini   pcbddc->use_nnsp_true                   = PETSC_FALSE;
1195da1bb401SStefano Zampini   pcbddc->local_primal_sizes              = 0;
1196da1bb401SStefano Zampini   pcbddc->local_primal_displacements      = 0;
1197da1bb401SStefano Zampini   pcbddc->replicated_local_primal_indices = 0;
1198da1bb401SStefano Zampini   pcbddc->replicated_local_primal_values  = 0;
1199da1bb401SStefano Zampini   pcbddc->coarse_loc_to_glob              = 0;
1200da1bb401SStefano Zampini   pcbddc->dbg_flag                        = PETSC_FALSE;
1201da1bb401SStefano Zampini   pcbddc->coarsening_ratio                = 8;
1202b76ba322SStefano Zampini   pcbddc->use_exact_dirichlet             = PETSC_TRUE;
12034fad6a16SStefano Zampini   pcbddc->current_level                   = 0;
12044fad6a16SStefano Zampini   pcbddc->max_levels                      = 1;
1205da1bb401SStefano Zampini 
1206da1bb401SStefano Zampini   /* allocate and initialize needed graph structure */
1207da1bb401SStefano Zampini   ierr                      = PetscMalloc(sizeof(*mat_graph),&pcbddc->mat_graph);CHKERRQ(ierr);
1208da1bb401SStefano Zampini   pcbddc->mat_graph->xadj   = 0;
1209da1bb401SStefano Zampini   pcbddc->mat_graph->adjncy = 0;
1210da1bb401SStefano Zampini 
1211da1bb401SStefano Zampini   /* function pointers */
1212da1bb401SStefano Zampini   pc->ops->apply               = PCApply_BDDC;
1213da1bb401SStefano Zampini   pc->ops->applytranspose      = 0;
1214da1bb401SStefano Zampini   pc->ops->setup               = PCSetUp_BDDC;
1215da1bb401SStefano Zampini   pc->ops->destroy             = PCDestroy_BDDC;
1216da1bb401SStefano Zampini   pc->ops->setfromoptions      = PCSetFromOptions_BDDC;
1217da1bb401SStefano Zampini   pc->ops->view                = 0;
1218da1bb401SStefano Zampini   pc->ops->applyrichardson     = 0;
1219da1bb401SStefano Zampini   pc->ops->applysymmetricleft  = 0;
1220da1bb401SStefano Zampini   pc->ops->applysymmetricright = 0;
1221534831adSStefano Zampini   pc->ops->presolve            = PCPreSolve_BDDC;
1222534831adSStefano Zampini   pc->ops->postsolve           = PCPostSolve_BDDC;
1223da1bb401SStefano Zampini 
1224da1bb401SStefano Zampini   /* composing function */
12254fad6a16SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseningRatio_C","PCBDDCSetCoarseningRatio_BDDC",
12264fad6a16SStefano Zampini                                            PCBDDCSetCoarseningRatio_BDDC);CHKERRQ(ierr);
12274fad6a16SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetMaxLevels_C","PCBDDCSetMaxLevels_BDDC",
12284fad6a16SStefano Zampini                                            PCBDDCSetMaxLevels_BDDC);CHKERRQ(ierr);
12290bdf917eSStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNullSpace_C","PCBDDCSetNullSpace_BDDC",
12300bdf917eSStefano Zampini                                            PCBDDCSetNullSpace_BDDC);CHKERRQ(ierr);
1231da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDirichletBoundaries_C","PCBDDCSetDirichletBoundaries_BDDC",
1232da1bb401SStefano Zampini                                            PCBDDCSetDirichletBoundaries_BDDC);CHKERRQ(ierr);
1233da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNeumannBoundaries_C","PCBDDCSetNeumannBoundaries_BDDC",
1234da1bb401SStefano Zampini                                            PCBDDCSetNeumannBoundaries_BDDC);CHKERRQ(ierr);
1235da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetDirichletBoundaries_C","PCBDDCGetDirichletBoundaries_BDDC",
1236da1bb401SStefano Zampini                                            PCBDDCGetDirichletBoundaries_BDDC);CHKERRQ(ierr);
1237da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetNeumannBoundaries_C","PCBDDCGetNeumannBoundaries_BDDC",
1238da1bb401SStefano Zampini                                            PCBDDCGetNeumannBoundaries_BDDC);CHKERRQ(ierr);
1239da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseProblemType_C","PCBDDCSetCoarseProblemType_BDDC",
1240da1bb401SStefano Zampini                                            PCBDDCSetCoarseProblemType_BDDC);CHKERRQ(ierr);
1241da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDofsSplitting_C","PCBDDCSetDofsSplitting_BDDC",
1242da1bb401SStefano Zampini                                            PCBDDCSetDofsSplitting_BDDC);CHKERRQ(ierr);
1243da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetLocalAdjacencyGraph_C","PCBDDCSetLocalAdjacencyGraph_BDDC",
1244da1bb401SStefano Zampini                                            PCBDDCSetLocalAdjacencyGraph_BDDC);CHKERRQ(ierr);
1245534831adSStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPreSolve_C","PCPreSolve_BDDC",
1246534831adSStefano Zampini                                            PCPreSolve_BDDC);CHKERRQ(ierr);
1247534831adSStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPostSolve_C","PCPostSolve_BDDC",
1248534831adSStefano Zampini                                            PCPostSolve_BDDC);CHKERRQ(ierr);
12493425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCCreateFETIDPOperators_C","PCBDDCCreateFETIDPOperators_BDDC",
12503425bc38SStefano Zampini                                            PCBDDCCreateFETIDPOperators_BDDC);CHKERRQ(ierr);
12513425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetRHS_C","PCBDDCMatFETIDPGetRHS_BDDC",
12523425bc38SStefano Zampini                                            PCBDDCMatFETIDPGetRHS_BDDC);CHKERRQ(ierr);
12533425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetSolution_C","PCBDDCMatFETIDPGetSolution_BDDC",
12543425bc38SStefano Zampini                                            PCBDDCMatFETIDPGetSolution_BDDC);CHKERRQ(ierr);
1255da1bb401SStefano Zampini   PetscFunctionReturn(0);
1256da1bb401SStefano Zampini }
1257da1bb401SStefano Zampini EXTERN_C_END
12583425bc38SStefano Zampini 
1259da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
1260da1bb401SStefano Zampini /* All static functions from now on                                           */
1261da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
12624fad6a16SStefano Zampini #undef __FUNCT__
126329622bf0SStefano Zampini #define __FUNCT__ "PCBDDCApplyNullSpaceCorrectionPC"
126429622bf0SStefano Zampini static PetscErrorCode PCBDDCApplyNullSpaceCorrectionPC(PC pc,Vec x,Vec y)
126529622bf0SStefano Zampini {
126629622bf0SStefano Zampini   NullSpaceCorrection_ctx *pc_ctx;
126729622bf0SStefano Zampini   PetscErrorCode          ierr;
126829622bf0SStefano Zampini 
126929622bf0SStefano Zampini   PetscFunctionBegin;
127029622bf0SStefano Zampini   ierr = PCShellGetContext(pc,(void**)&pc_ctx);CHKERRQ(ierr);
127129622bf0SStefano Zampini   /* E */
127229622bf0SStefano Zampini   ierr = MatMultTranspose(pc_ctx->Lbasis_mat,x,pc_ctx->work_small_2);CHKERRQ(ierr);
127329622bf0SStefano Zampini   ierr = MatMultAdd(pc_ctx->Kbasis_mat,pc_ctx->work_small_2,x,pc_ctx->work_full_1);CHKERRQ(ierr);
127429622bf0SStefano Zampini   /* P^-1 */
127529622bf0SStefano Zampini   ierr = PCApply(pc_ctx->local_pc,pc_ctx->work_full_1,pc_ctx->work_full_2);CHKERRQ(ierr);
127629622bf0SStefano Zampini   /* E^T */
127729622bf0SStefano Zampini   ierr = MatMultTranspose(pc_ctx->Kbasis_mat,pc_ctx->work_full_2,pc_ctx->work_small_1);CHKERRQ(ierr);
127829622bf0SStefano Zampini   ierr = VecScale(pc_ctx->work_small_1,-1.0);CHKERRQ(ierr);
127929622bf0SStefano Zampini   ierr = MatMultAdd(pc_ctx->Lbasis_mat,pc_ctx->work_small_1,pc_ctx->work_full_2,pc_ctx->work_full_1);CHKERRQ(ierr);
128029622bf0SStefano Zampini   /* Sum contributions */
128129622bf0SStefano Zampini   ierr = MatMultAdd(pc_ctx->basis_mat,pc_ctx->work_small_2,pc_ctx->work_full_1,y);CHKERRQ(ierr);
128229622bf0SStefano Zampini   PetscFunctionReturn(0);
128329622bf0SStefano Zampini }
128429622bf0SStefano Zampini 
128529622bf0SStefano Zampini #undef __FUNCT__
128629622bf0SStefano Zampini #define __FUNCT__ "PCBDDCDestroyNullSpaceCorrectionPC"
128729622bf0SStefano Zampini static PetscErrorCode PCBDDCDestroyNullSpaceCorrectionPC(PC pc)
128829622bf0SStefano Zampini {
128929622bf0SStefano Zampini   NullSpaceCorrection_ctx *pc_ctx;
129029622bf0SStefano Zampini   PetscErrorCode          ierr;
129129622bf0SStefano Zampini 
129229622bf0SStefano Zampini   PetscFunctionBegin;
129329622bf0SStefano Zampini   ierr = PCShellGetContext(pc,(void**)&pc_ctx);CHKERRQ(ierr);
129429622bf0SStefano Zampini   ierr = VecDestroy(&pc_ctx->work_small_1);CHKERRQ(ierr);
129529622bf0SStefano Zampini   ierr = VecDestroy(&pc_ctx->work_small_2);CHKERRQ(ierr);
129629622bf0SStefano Zampini   ierr = VecDestroy(&pc_ctx->work_full_1);CHKERRQ(ierr);
129729622bf0SStefano Zampini   ierr = VecDestroy(&pc_ctx->work_full_2);CHKERRQ(ierr);
129829622bf0SStefano Zampini   ierr = MatDestroy(&pc_ctx->basis_mat);CHKERRQ(ierr);
129929622bf0SStefano Zampini   ierr = MatDestroy(&pc_ctx->Lbasis_mat);CHKERRQ(ierr);
130029622bf0SStefano Zampini   ierr = MatDestroy(&pc_ctx->Kbasis_mat);CHKERRQ(ierr);
130129622bf0SStefano Zampini   ierr = PCDestroy(&pc_ctx->local_pc);CHKERRQ(ierr);
130229622bf0SStefano Zampini   ierr = PetscFree(pc_ctx);CHKERRQ(ierr);
130329622bf0SStefano Zampini   PetscFunctionReturn(0);
130429622bf0SStefano Zampini }
130529622bf0SStefano Zampini 
130629622bf0SStefano Zampini #undef __FUNCT__
130729622bf0SStefano Zampini #define __FUNCT__ "PCBDDCAdaptLocalProblem"
130829622bf0SStefano Zampini static PetscErrorCode PCBDDCAdaptLocalProblem(PC pc,IS local_dofs)
130929622bf0SStefano Zampini {
1310f23aa3ddSBarry Smith   extern PetscErrorCode PCBDDCApplyNullSpaceCorrectionPC(PC,Vec,Vec);
1311f23aa3ddSBarry Smith   extern PetscErrorCode PCBDDCDestroyNullSpaceCorrectionPC(PC);
131229622bf0SStefano Zampini 
131329622bf0SStefano Zampini   PC_BDDC                 *pcbddc = (PC_BDDC*)pc->data;
131429622bf0SStefano Zampini   PC_IS                   *pcis   = (PC_IS*)pc->data;
131529622bf0SStefano Zampini   Mat_IS                  * matis = (Mat_IS*)pc->pmat->data;
131629622bf0SStefano Zampini   KSP                     *local_ksp;
131729622bf0SStefano Zampini   PC                      newpc;
131829622bf0SStefano Zampini   NullSpaceCorrection_ctx *shell_ctx;
131929622bf0SStefano Zampini   Mat                     local_mat,local_pmat,small_mat,inv_small_mat;
132029622bf0SStefano Zampini   MatStructure            local_mat_struct;
132129622bf0SStefano Zampini   Vec                     work1,work2,work3;
132229622bf0SStefano Zampini   const Vec               *nullvecs;
132329622bf0SStefano Zampini   VecScatter              scatter_ctx;
132429622bf0SStefano Zampini   IS                      is_aux;
132529622bf0SStefano Zampini   MatFactorInfo           matinfo;
132629622bf0SStefano Zampini   PetscScalar             *basis_mat,*Kbasis_mat,*array,*array_mat;
132729622bf0SStefano Zampini   PetscScalar             one = 1.0,zero = 0.0, m_one = -1.0;
132829622bf0SStefano Zampini   PetscInt                basis_dofs,basis_size,nnsp_size,i,k,n_I,n_R;
132929622bf0SStefano Zampini   PetscBool               nnsp_has_cnst;
133029622bf0SStefano Zampini   PetscErrorCode          ierr;
133129622bf0SStefano Zampini 
133229622bf0SStefano Zampini   PetscFunctionBegin;
133329622bf0SStefano Zampini   /* Infer the local solver */
133429622bf0SStefano Zampini   ierr = ISGetSize(local_dofs,&basis_dofs);CHKERRQ(ierr);
133529622bf0SStefano Zampini   ierr = VecGetSize(pcis->vec1_D,&n_I);CHKERRQ(ierr);
133629622bf0SStefano Zampini   ierr = VecGetSize(pcbddc->vec1_R,&n_R);CHKERRQ(ierr);
133729622bf0SStefano Zampini   if (basis_dofs == n_I) {
133829622bf0SStefano Zampini     /* Dirichlet solver */
133929622bf0SStefano Zampini     local_ksp = &pcbddc->ksp_D;
134029622bf0SStefano Zampini   } else if (basis_dofs == n_R) {
134129622bf0SStefano Zampini     /* Neumann solver */
134229622bf0SStefano Zampini     local_ksp = &pcbddc->ksp_R;
1343f23aa3ddSBarry Smith   } else SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in %s: unknown local IS size %d. n_I=%d, n_R=%d)\n",basis_dofs,n_I,n_R);
134429622bf0SStefano Zampini   ierr = KSPGetOperators(*local_ksp,&local_mat,&local_pmat,&local_mat_struct);CHKERRQ(ierr);
134529622bf0SStefano Zampini 
134629622bf0SStefano Zampini   /* Get null space vecs */
134729622bf0SStefano Zampini   ierr = MatNullSpaceGetVecs(pcbddc->NullSpace,&nnsp_has_cnst,&nnsp_size,&nullvecs);CHKERRQ(ierr);
134829622bf0SStefano Zampini   basis_size = nnsp_size;
1349*2fa5cd67SKarl Rupp   if (nnsp_has_cnst) basis_size++;
135029622bf0SStefano Zampini 
135129622bf0SStefano Zampini   /* Create shell ctx */
135229622bf0SStefano Zampini   ierr = PetscMalloc(sizeof(*shell_ctx),&shell_ctx);CHKERRQ(ierr);
135329622bf0SStefano Zampini 
135429622bf0SStefano Zampini   /* Create work vectors in shell context */
135529622bf0SStefano Zampini   ierr = VecCreate(PETSC_COMM_SELF,&shell_ctx->work_small_1);CHKERRQ(ierr);
135629622bf0SStefano Zampini   ierr = VecSetSizes(shell_ctx->work_small_1,basis_size,basis_size);CHKERRQ(ierr);
135729622bf0SStefano Zampini   ierr = VecSetType(shell_ctx->work_small_1,VECSEQ);CHKERRQ(ierr);
135829622bf0SStefano Zampini   ierr = VecDuplicate(shell_ctx->work_small_1,&shell_ctx->work_small_2);CHKERRQ(ierr);
135929622bf0SStefano Zampini   ierr = VecCreate(PETSC_COMM_SELF,&shell_ctx->work_full_1);CHKERRQ(ierr);
136029622bf0SStefano Zampini   ierr = VecSetSizes(shell_ctx->work_full_1,basis_dofs,basis_dofs);CHKERRQ(ierr);
136129622bf0SStefano Zampini   ierr = VecSetType(shell_ctx->work_full_1,VECSEQ);CHKERRQ(ierr);
136229622bf0SStefano Zampini   ierr = VecDuplicate(shell_ctx->work_full_1,&shell_ctx->work_full_2);CHKERRQ(ierr);
136329622bf0SStefano Zampini 
136429622bf0SStefano Zampini   /* Allocate workspace */
136529622bf0SStefano Zampini   ierr = MatCreateSeqDense(PETSC_COMM_SELF,basis_dofs,basis_size,PETSC_NULL,&shell_ctx->basis_mat);CHKERRQ(ierr);
136629622bf0SStefano Zampini   ierr = MatCreateSeqDense(PETSC_COMM_SELF,basis_dofs,basis_size,PETSC_NULL,&shell_ctx->Kbasis_mat);CHKERRQ(ierr);
136729622bf0SStefano Zampini   ierr = MatDenseGetArray(shell_ctx->basis_mat,&basis_mat);CHKERRQ(ierr);
136829622bf0SStefano Zampini   ierr = MatDenseGetArray(shell_ctx->Kbasis_mat,&Kbasis_mat);CHKERRQ(ierr);
136929622bf0SStefano Zampini 
137029622bf0SStefano Zampini   /* Restrict local null space on selected dofs (Dirichlet or Neumann)
137129622bf0SStefano Zampini      and compute matrices N and K*N */
137229622bf0SStefano Zampini   ierr = VecDuplicate(shell_ctx->work_full_1,&work1);CHKERRQ(ierr);
137329622bf0SStefano Zampini   ierr = VecDuplicate(shell_ctx->work_full_1,&work2);CHKERRQ(ierr);
137429622bf0SStefano Zampini   ierr = VecScatterCreate(pcis->vec1_N,local_dofs,work1,(IS)0,&scatter_ctx);CHKERRQ(ierr);
137529622bf0SStefano Zampini   k    = 0;
137629622bf0SStefano Zampini   for (; k<nnsp_size; k++) {
137729622bf0SStefano Zampini     ierr = VecScatterBegin(matis->ctx,nullvecs[k],pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
137829622bf0SStefano Zampini     ierr = VecScatterEnd(matis->ctx,nullvecs[k],pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
137929622bf0SStefano Zampini     ierr = VecPlaceArray(work1,(const PetscScalar*)&basis_mat[k*basis_dofs]);CHKERRQ(ierr);
138029622bf0SStefano Zampini     ierr = VecScatterBegin(scatter_ctx,pcis->vec1_N,work1,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
138129622bf0SStefano Zampini     ierr = VecScatterEnd(scatter_ctx,pcis->vec1_N,work1,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
138229622bf0SStefano Zampini     ierr = VecPlaceArray(work2,(const PetscScalar*)&Kbasis_mat[k*basis_dofs]);CHKERRQ(ierr);
138329622bf0SStefano Zampini     ierr = MatMult(local_mat,work1,work2);CHKERRQ(ierr);
138429622bf0SStefano Zampini     ierr = VecResetArray(work1);CHKERRQ(ierr);
138529622bf0SStefano Zampini     ierr = VecResetArray(work2);CHKERRQ(ierr);
138629622bf0SStefano Zampini   }
138729622bf0SStefano Zampini   if (nnsp_has_cnst) {
138829622bf0SStefano Zampini     ierr = VecPlaceArray(work1,(const PetscScalar*)&basis_mat[k*basis_dofs]);CHKERRQ(ierr);
138929622bf0SStefano Zampini     ierr = VecSet(work1,one);CHKERRQ(ierr);
139029622bf0SStefano Zampini     ierr = VecPlaceArray(work2,(const PetscScalar*)&Kbasis_mat[k*basis_dofs]);CHKERRQ(ierr);
139129622bf0SStefano Zampini     ierr = MatMult(local_mat,work1,work2);CHKERRQ(ierr);
139229622bf0SStefano Zampini     ierr = VecResetArray(work1);CHKERRQ(ierr);
139329622bf0SStefano Zampini     ierr = VecResetArray(work2);CHKERRQ(ierr);
139429622bf0SStefano Zampini   }
139529622bf0SStefano Zampini   ierr = VecDestroy(&work1);CHKERRQ(ierr);
139629622bf0SStefano Zampini   ierr = VecDestroy(&work2);CHKERRQ(ierr);
139729622bf0SStefano Zampini   ierr = VecScatterDestroy(&scatter_ctx);CHKERRQ(ierr);
139829622bf0SStefano Zampini   ierr = MatDenseRestoreArray(shell_ctx->basis_mat,&basis_mat);CHKERRQ(ierr);
139929622bf0SStefano Zampini   ierr = MatDenseRestoreArray(shell_ctx->Kbasis_mat,&Kbasis_mat);CHKERRQ(ierr);
140029622bf0SStefano Zampini 
140129622bf0SStefano Zampini   /* Assemble another Mat object in shell context */
140229622bf0SStefano Zampini   ierr = MatTransposeMatMult(shell_ctx->basis_mat,shell_ctx->Kbasis_mat,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&small_mat);CHKERRQ(ierr);
140329622bf0SStefano Zampini   ierr = MatFactorInfoInitialize(&matinfo);CHKERRQ(ierr);
140429622bf0SStefano Zampini   ierr = ISCreateStride(PETSC_COMM_SELF,basis_size,0,1,&is_aux);CHKERRQ(ierr);
140529622bf0SStefano Zampini   ierr = MatLUFactor(small_mat,is_aux,is_aux,&matinfo);CHKERRQ(ierr);
140629622bf0SStefano Zampini   ierr = ISDestroy(&is_aux);CHKERRQ(ierr);
140729622bf0SStefano Zampini   ierr = PetscMalloc(basis_size*basis_size*sizeof(PetscScalar),&array_mat);CHKERRQ(ierr);
140829622bf0SStefano Zampini   for (k=0; k<basis_size; k++) {
140929622bf0SStefano Zampini     ierr = VecSet(shell_ctx->work_small_1,zero);CHKERRQ(ierr);
141029622bf0SStefano Zampini     ierr = VecSetValue(shell_ctx->work_small_1,k,one,INSERT_VALUES);CHKERRQ(ierr);
141129622bf0SStefano Zampini     ierr = VecAssemblyBegin(shell_ctx->work_small_1);CHKERRQ(ierr);
141229622bf0SStefano Zampini     ierr = VecAssemblyEnd(shell_ctx->work_small_1);CHKERRQ(ierr);
141329622bf0SStefano Zampini     ierr = MatSolve(small_mat,shell_ctx->work_small_1,shell_ctx->work_small_2);CHKERRQ(ierr);
141429622bf0SStefano Zampini     ierr = VecGetArray(shell_ctx->work_small_2,&array);CHKERRQ(ierr);
1415*2fa5cd67SKarl Rupp     for (i=0; i<basis_size; i++) array_mat[i*basis_size+k]=array[i];
141629622bf0SStefano Zampini     ierr = VecRestoreArray(shell_ctx->work_small_2,&array);CHKERRQ(ierr);
141729622bf0SStefano Zampini   }
141829622bf0SStefano Zampini   ierr = MatCreateSeqDense(PETSC_COMM_SELF,basis_size,basis_size,array_mat,&inv_small_mat);CHKERRQ(ierr);
141929622bf0SStefano Zampini   ierr = MatMatMult(shell_ctx->basis_mat,inv_small_mat,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&shell_ctx->Lbasis_mat);CHKERRQ(ierr);
142029622bf0SStefano Zampini   ierr = PetscFree(array_mat);CHKERRQ(ierr);
142129622bf0SStefano Zampini   ierr = MatDestroy(&inv_small_mat);CHKERRQ(ierr);
142229622bf0SStefano Zampini   ierr = MatDestroy(&small_mat);CHKERRQ(ierr);
142329622bf0SStefano Zampini   ierr = MatScale(shell_ctx->Kbasis_mat,m_one);CHKERRQ(ierr);
142429622bf0SStefano Zampini 
142529622bf0SStefano Zampini   /* Rebuild local PC */
142629622bf0SStefano Zampini   ierr = KSPGetPC(*local_ksp,&shell_ctx->local_pc);CHKERRQ(ierr);
142729622bf0SStefano Zampini   ierr = PetscObjectReference((PetscObject)shell_ctx->local_pc);CHKERRQ(ierr);
142829622bf0SStefano Zampini   ierr = PCCreate(PETSC_COMM_SELF,&newpc);CHKERRQ(ierr);
142929622bf0SStefano Zampini   ierr = PCSetOperators(newpc,local_mat,local_mat,SAME_PRECONDITIONER);CHKERRQ(ierr);
143029622bf0SStefano Zampini   ierr = PCSetType(newpc,PCSHELL);CHKERRQ(ierr);
143129622bf0SStefano Zampini   ierr = PCShellSetContext(newpc,shell_ctx);CHKERRQ(ierr);
143229622bf0SStefano Zampini   ierr = PCShellSetApply(newpc,PCBDDCApplyNullSpaceCorrectionPC);CHKERRQ(ierr);
143329622bf0SStefano Zampini   ierr = PCShellSetDestroy(newpc,PCBDDCDestroyNullSpaceCorrectionPC);CHKERRQ(ierr);
143429622bf0SStefano Zampini   ierr = PCSetUp(newpc);CHKERRQ(ierr);
143529622bf0SStefano Zampini   ierr = KSPSetPC(*local_ksp,newpc);CHKERRQ(ierr);
143629622bf0SStefano Zampini   ierr = PCDestroy(&newpc);CHKERRQ(ierr);
143729622bf0SStefano Zampini   ierr = KSPSetUp(*local_ksp);CHKERRQ(ierr);
143829622bf0SStefano Zampini 
143929622bf0SStefano Zampini   /* test */
144029622bf0SStefano Zampini   if (pcbddc->dbg_flag) {
144129622bf0SStefano Zampini     PetscReal   test_err;
144229622bf0SStefano Zampini     KSP         check_ksp;
144329622bf0SStefano Zampini     PC          check_pc;
144429622bf0SStefano Zampini     PetscReal   lambda_min,lambda_max;
144529622bf0SStefano Zampini     Mat         test_mat;
144629622bf0SStefano Zampini     PetscViewer viewer=pcbddc->dbg_viewer;
144729622bf0SStefano Zampini     PetscBool   setsym,issym=PETSC_FALSE;
144829622bf0SStefano Zampini 
144929622bf0SStefano Zampini     ierr = KSPGetPC(*local_ksp,&check_pc);CHKERRQ(ierr);
145029622bf0SStefano Zampini     ierr = VecDuplicate(shell_ctx->work_full_1,&work1);CHKERRQ(ierr);
145129622bf0SStefano Zampini     ierr = VecDuplicate(shell_ctx->work_full_1,&work2);CHKERRQ(ierr);
145229622bf0SStefano Zampini     ierr = VecDuplicate(shell_ctx->work_full_1,&work3);CHKERRQ(ierr);
145329622bf0SStefano Zampini     ierr = VecSetRandom(shell_ctx->work_small_1,PETSC_NULL);CHKERRQ(ierr);
145429622bf0SStefano Zampini     ierr = MatMult(shell_ctx->basis_mat,shell_ctx->work_small_1,work1);CHKERRQ(ierr);
145529622bf0SStefano Zampini     ierr = VecCopy(work1,work2);CHKERRQ(ierr);
145629622bf0SStefano Zampini     ierr = MatMult(local_mat,work1,work3);CHKERRQ(ierr);
145729622bf0SStefano Zampini     ierr = PCApply(check_pc,work3,work1);CHKERRQ(ierr);
145829622bf0SStefano Zampini     ierr = VecAXPY(work1,m_one,work2);CHKERRQ(ierr);
145929622bf0SStefano Zampini     ierr = VecNorm(work1,NORM_INFINITY,&test_err);CHKERRQ(ierr);
146029622bf0SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d error for nullspace correction for ",PetscGlobalRank);
146129622bf0SStefano Zampini     if (basis_dofs == n_I) {
1462*2fa5cd67SKarl Rupp       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Dirichlet ");CHKERRQ(ierr);
146329622bf0SStefano Zampini     } else {
1464*2fa5cd67SKarl Rupp       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Neumann ");CHKERRQ(ierr);
146529622bf0SStefano Zampini     }
146629622bf0SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"solver is :%1.14e\n",test_err);
146729622bf0SStefano Zampini 
146829622bf0SStefano Zampini     ierr = MatTransposeMatMult(shell_ctx->Lbasis_mat,shell_ctx->Kbasis_mat,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&test_mat);CHKERRQ(ierr);
146929622bf0SStefano Zampini     ierr = MatShift(test_mat,one);CHKERRQ(ierr);
147029622bf0SStefano Zampini     ierr = MatNorm(test_mat,NORM_INFINITY,&test_err);CHKERRQ(ierr);
147129622bf0SStefano Zampini     ierr = MatDestroy(&test_mat);CHKERRQ(ierr);
147229622bf0SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d error for nullspace matrices is :%1.14e\n",PetscGlobalRank,test_err);
147329622bf0SStefano Zampini 
147429622bf0SStefano Zampini     /* Create ksp object suitable for extreme eigenvalues' estimation */
147529622bf0SStefano Zampini     ierr = KSPCreate(PETSC_COMM_SELF,&check_ksp);CHKERRQ(ierr);
147629622bf0SStefano Zampini     ierr = KSPSetOperators(check_ksp,local_mat,local_mat,SAME_PRECONDITIONER);CHKERRQ(ierr);
147729622bf0SStefano Zampini     ierr = KSPSetTolerances(check_ksp,1.e-8,1.e-8,PETSC_DEFAULT,basis_dofs);CHKERRQ(ierr);
147829622bf0SStefano Zampini     ierr = KSPSetComputeSingularValues(check_ksp,PETSC_TRUE);CHKERRQ(ierr);
147929622bf0SStefano Zampini     ierr = MatIsSymmetricKnown(pc->pmat,&setsym,&issym);CHKERRQ(ierr);
148029622bf0SStefano Zampini     if (issym) {
148129622bf0SStefano Zampini       ierr = KSPSetType(check_ksp,KSPCG);CHKERRQ(ierr);
148229622bf0SStefano Zampini     }
148329622bf0SStefano Zampini     ierr = KSPSetPC(check_ksp,check_pc);CHKERRQ(ierr);
148429622bf0SStefano Zampini     ierr = KSPSetUp(check_ksp);CHKERRQ(ierr);
148529622bf0SStefano Zampini     ierr = VecSetRandom(work1,PETSC_NULL);CHKERRQ(ierr);
148629622bf0SStefano Zampini     ierr = MatMult(local_mat,work1,work2);CHKERRQ(ierr);
148729622bf0SStefano Zampini     ierr = KSPSolve(check_ksp,work2,work2);CHKERRQ(ierr);
148829622bf0SStefano Zampini     ierr = VecAXPY(work2,m_one,work1);CHKERRQ(ierr);
148929622bf0SStefano Zampini     ierr = VecNorm(work2,NORM_INFINITY,&test_err);CHKERRQ(ierr);
149029622bf0SStefano Zampini     ierr = KSPComputeExtremeSingularValues(check_ksp,&lambda_max,&lambda_min);CHKERRQ(ierr);
149129622bf0SStefano Zampini     ierr = KSPGetIterationNumber(check_ksp,&k);CHKERRQ(ierr);
149229622bf0SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d error for adapted KSP %1.14e (it %d, eigs %1.6e %1.6e)\n",PetscGlobalRank,test_err,k,lambda_min,lambda_max);
149329622bf0SStefano Zampini     ierr = KSPDestroy(&check_ksp);CHKERRQ(ierr);
149429622bf0SStefano Zampini     ierr = VecDestroy(&work1);CHKERRQ(ierr);
149529622bf0SStefano Zampini     ierr = VecDestroy(&work2);CHKERRQ(ierr);
149629622bf0SStefano Zampini     ierr = VecDestroy(&work3);CHKERRQ(ierr);
149729622bf0SStefano Zampini   }
149829622bf0SStefano Zampini   PetscFunctionReturn(0);
149929622bf0SStefano Zampini }
150029622bf0SStefano Zampini 
150129622bf0SStefano Zampini #undef __FUNCT__
15022e8d2280SStefano Zampini #define __FUNCT__ "PCBDDCSetUseExactDirichlet"
15032e8d2280SStefano Zampini static PetscErrorCode PCBDDCSetUseExactDirichlet(PC pc,PetscBool use)
15042e8d2280SStefano Zampini {
15052e8d2280SStefano Zampini   PC_BDDC *pcbddc = (PC_BDDC*)pc->data;
15062e8d2280SStefano Zampini 
15072e8d2280SStefano Zampini   PetscFunctionBegin;
15082e8d2280SStefano Zampini   pcbddc->use_exact_dirichlet=use;
15092e8d2280SStefano Zampini   PetscFunctionReturn(0);
15102e8d2280SStefano Zampini }
15112e8d2280SStefano Zampini 
15122e8d2280SStefano Zampini #undef __FUNCT__
15134fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetLevel"
15144fad6a16SStefano Zampini static PetscErrorCode PCBDDCSetLevel(PC pc,PetscInt level)
15154fad6a16SStefano Zampini {
15164fad6a16SStefano Zampini   PC_BDDC *pcbddc = (PC_BDDC*)pc->data;
15174fad6a16SStefano Zampini 
15184fad6a16SStefano Zampini   PetscFunctionBegin;
15194fad6a16SStefano Zampini   pcbddc->current_level=level;
15204fad6a16SStefano Zampini   PetscFunctionReturn(0);
15214fad6a16SStefano Zampini }
15223425bc38SStefano Zampini 
15233425bc38SStefano Zampini #undef __FUNCT__
15240bdf917eSStefano Zampini #define __FUNCT__ "PCBDDCAdaptNullSpace"
15250bdf917eSStefano Zampini static PetscErrorCode PCBDDCAdaptNullSpace(PC pc)
15260bdf917eSStefano Zampini {
15270bdf917eSStefano Zampini   PC_IS          *pcis   = (PC_IS*)  (pc->data);
15280bdf917eSStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)(pc->data);
15290bdf917eSStefano Zampini   KSP            inv_change;
15300bdf917eSStefano Zampini   PC             pc_change;
15310bdf917eSStefano Zampini   const Vec      *nsp_vecs;
15320bdf917eSStefano Zampini   Vec            *new_nsp_vecs;
15330bdf917eSStefano Zampini   PetscInt       i,nsp_size,new_nsp_size,start_new;
15340bdf917eSStefano Zampini   PetscBool      nsp_has_cnst;
15350bdf917eSStefano Zampini   MatNullSpace   new_nsp;
15360bdf917eSStefano Zampini   PetscErrorCode ierr;
15370bdf917eSStefano Zampini 
15380bdf917eSStefano Zampini   PetscFunctionBegin;
15390bdf917eSStefano Zampini   ierr = MatNullSpaceGetVecs(pcbddc->NullSpace,&nsp_has_cnst,&nsp_size,&nsp_vecs);CHKERRQ(ierr);
15400bdf917eSStefano Zampini   ierr = KSPCreate(PETSC_COMM_SELF,&inv_change);CHKERRQ(ierr);
15410bdf917eSStefano Zampini   ierr = KSPSetOperators(inv_change,pcbddc->ChangeOfBasisMatrix,pcbddc->ChangeOfBasisMatrix,SAME_PRECONDITIONER);CHKERRQ(ierr);
15420bdf917eSStefano Zampini   ierr = KSPSetType(inv_change,KSPPREONLY);CHKERRQ(ierr);
15430bdf917eSStefano Zampini   ierr = KSPGetPC(inv_change,&pc_change);CHKERRQ(ierr);
15440bdf917eSStefano Zampini   ierr = PCSetType(pc_change,PCLU);CHKERRQ(ierr);
15450bdf917eSStefano Zampini   ierr = KSPSetUp(inv_change);CHKERRQ(ierr);
1546*2fa5cd67SKarl Rupp 
15470bdf917eSStefano Zampini   new_nsp_size = nsp_size;
1548*2fa5cd67SKarl Rupp   if (nsp_has_cnst) new_nsp_size++;
15490bdf917eSStefano Zampini   ierr = PetscMalloc(new_nsp_size*sizeof(Vec),&new_nsp_vecs);CHKERRQ(ierr);
15500bdf917eSStefano Zampini   for (i=0;i<new_nsp_size;i++) { ierr = VecDuplicate(pcis->vec1_global,&new_nsp_vecs[i]);CHKERRQ(ierr); }
15510bdf917eSStefano Zampini   start_new = 0;
15520bdf917eSStefano Zampini   if (nsp_has_cnst) {
15530bdf917eSStefano Zampini     start_new = 1;
15540bdf917eSStefano Zampini     ierr      = VecSet(new_nsp_vecs[0],1.0);CHKERRQ(ierr);
15550bdf917eSStefano Zampini     ierr      = VecSet(pcis->vec1_B,1.0);CHKERRQ(ierr);
15560bdf917eSStefano Zampini     ierr      = KSPSolve(inv_change,pcis->vec1_B,pcis->vec1_B);
15570bdf917eSStefano Zampini     ierr      = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,new_nsp_vecs[0],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
15580bdf917eSStefano Zampini     ierr      = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,new_nsp_vecs[0],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
15590bdf917eSStefano Zampini   }
15600bdf917eSStefano Zampini   for (i=0; i<nsp_size; i++) {
15610bdf917eSStefano Zampini     ierr = VecCopy(nsp_vecs[i],new_nsp_vecs[i+start_new]);CHKERRQ(ierr);
15620bdf917eSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,nsp_vecs[i],pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
15630bdf917eSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,nsp_vecs[i],pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
15640bdf917eSStefano Zampini     ierr = KSPSolve(inv_change,pcis->vec1_B,pcis->vec1_B);
15650bdf917eSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,new_nsp_vecs[i+start_new],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
15660bdf917eSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,new_nsp_vecs[i+start_new],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
15670bdf917eSStefano Zampini   }
15680bdf917eSStefano Zampini   ierr = VecNormalize(new_nsp_vecs[0],PETSC_NULL);CHKERRQ(ierr);
15690bdf917eSStefano Zampini   /* TODO : Orthonormalize vecs when new_nsp_size > 0! */
15700bdf917eSStefano Zampini 
15710bdf917eSStefano Zampini   ierr = KSPDestroy(&inv_change);CHKERRQ(ierr);
15720bdf917eSStefano Zampini   ierr = MatNullSpaceCreate(((PetscObject)pc)->comm,PETSC_FALSE,new_nsp_size,new_nsp_vecs,&new_nsp);CHKERRQ(ierr);
15730bdf917eSStefano Zampini   ierr = PCBDDCSetNullSpace(pc,new_nsp);CHKERRQ(ierr);
15740bdf917eSStefano Zampini   ierr = MatNullSpaceDestroy(&new_nsp);CHKERRQ(ierr);
15750bdf917eSStefano Zampini   /*
15760bdf917eSStefano Zampini   ierr = MatNullSpaceTest(pcbddc->NullSpace,pc->pmat,&nsp_t);CHKERRQ(ierr);
15770bdf917eSStefano Zampini   printf("New Null Space, mat changed: %d\n",nsp_t);
15780bdf917eSStefano Zampini     temp_mat = matis->A;
15790bdf917eSStefano Zampini     matis->A = pcbddc->local_mat;
15800bdf917eSStefano Zampini     pcbddc->local_mat = temp_mat;
15810bdf917eSStefano Zampini   ierr = MatNullSpaceTest(pcbddc->NullSpace,pc->pmat,&nsp_t);CHKERRQ(ierr);
15820bdf917eSStefano Zampini   printf("New Null Space, mat original: %d\n",nsp_t);*/
15830bdf917eSStefano Zampini 
15840bdf917eSStefano Zampini   for (i=0; i<new_nsp_size; i++) { ierr = VecDestroy(&new_nsp_vecs[i]);CHKERRQ(ierr); }
15850bdf917eSStefano Zampini   ierr = PetscFree(new_nsp_vecs);CHKERRQ(ierr);
15860bdf917eSStefano Zampini   PetscFunctionReturn(0);
15870bdf917eSStefano Zampini }
15880bdf917eSStefano Zampini 
15890bdf917eSStefano Zampini #undef __FUNCT__
15903425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPMatContext"
15913425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPMatContext(PC pc, FETIDPMat_ctx **fetidpmat_ctx)
15923425bc38SStefano Zampini {
15933425bc38SStefano Zampini   FETIDPMat_ctx  *newctx;
15943425bc38SStefano Zampini   PetscErrorCode ierr;
15953425bc38SStefano Zampini 
15963425bc38SStefano Zampini   PetscFunctionBegin;
15973425bc38SStefano Zampini   ierr = PetscMalloc(sizeof(*newctx),&newctx);CHKERRQ(ierr);
1598*2fa5cd67SKarl Rupp 
15993425bc38SStefano Zampini   newctx->lambda_local    = 0;
16003425bc38SStefano Zampini   newctx->temp_solution_B = 0;
16013425bc38SStefano Zampini   newctx->temp_solution_D = 0;
16023425bc38SStefano Zampini   newctx->B_delta         = 0;
16033425bc38SStefano Zampini   newctx->B_Ddelta        = 0; /* theoretically belongs to the FETIDP preconditioner */
16043425bc38SStefano Zampini   newctx->l2g_lambda      = 0;
1605*2fa5cd67SKarl Rupp 
16063425bc38SStefano Zampini   /* increase the reference count for BDDC preconditioner */
16073425bc38SStefano Zampini   ierr           = PetscObjectReference((PetscObject)pc);CHKERRQ(ierr);
16083425bc38SStefano Zampini   newctx->pc     = pc;
16093425bc38SStefano Zampini   *fetidpmat_ctx = newctx;
16103425bc38SStefano Zampini   PetscFunctionReturn(0);
16113425bc38SStefano Zampini }
16123425bc38SStefano Zampini 
16133425bc38SStefano Zampini #undef __FUNCT__
16143425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPPCContext"
16153425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPPCContext(PC pc, FETIDPPC_ctx **fetidppc_ctx)
16163425bc38SStefano Zampini {
16173425bc38SStefano Zampini   FETIDPPC_ctx   *newctx;
16183425bc38SStefano Zampini   PetscErrorCode ierr;
16193425bc38SStefano Zampini 
16203425bc38SStefano Zampini   PetscFunctionBegin;
16213425bc38SStefano Zampini   ierr = PetscMalloc(sizeof(*newctx),&newctx);CHKERRQ(ierr);
1622*2fa5cd67SKarl Rupp 
16233425bc38SStefano Zampini   newctx->lambda_local = 0;
16243425bc38SStefano Zampini   newctx->B_Ddelta     = 0;
16253425bc38SStefano Zampini   newctx->l2g_lambda   = 0;
1626*2fa5cd67SKarl Rupp 
16273425bc38SStefano Zampini   /* increase the reference count for BDDC preconditioner */
16283425bc38SStefano Zampini   ierr          = PetscObjectReference((PetscObject)pc);CHKERRQ(ierr);
16293425bc38SStefano Zampini   newctx->pc    = pc;
16303425bc38SStefano Zampini   *fetidppc_ctx = newctx;
16313425bc38SStefano Zampini   PetscFunctionReturn(0);
16323425bc38SStefano Zampini }
16333425bc38SStefano Zampini 
16343425bc38SStefano Zampini #undef __FUNCT__
16353425bc38SStefano Zampini #define __FUNCT__ "PCBDDCDestroyFETIDPMat"
16363425bc38SStefano Zampini static PetscErrorCode PCBDDCDestroyFETIDPMat(Mat A)
16373425bc38SStefano Zampini {
16383425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
16393425bc38SStefano Zampini   PetscErrorCode ierr;
16403425bc38SStefano Zampini 
16413425bc38SStefano Zampini   PetscFunctionBegin;
16423425bc38SStefano Zampini   ierr = MatShellGetContext(A,(void**)&mat_ctx);CHKERRQ(ierr);
16433425bc38SStefano Zampini   ierr = VecDestroy(&mat_ctx->lambda_local);CHKERRQ(ierr);
16443425bc38SStefano Zampini   ierr = VecDestroy(&mat_ctx->temp_solution_D);CHKERRQ(ierr);
16453425bc38SStefano Zampini   ierr = VecDestroy(&mat_ctx->temp_solution_B);CHKERRQ(ierr);
16463425bc38SStefano Zampini   ierr = MatDestroy(&mat_ctx->B_delta);CHKERRQ(ierr);
16473425bc38SStefano Zampini   ierr = MatDestroy(&mat_ctx->B_Ddelta);CHKERRQ(ierr);
16483425bc38SStefano Zampini   ierr = VecScatterDestroy(&mat_ctx->l2g_lambda);CHKERRQ(ierr);
16493425bc38SStefano Zampini   ierr = PCDestroy(&mat_ctx->pc);CHKERRQ(ierr); /* actually it does not destroy BDDC, only decrease its reference count */
16503425bc38SStefano Zampini   ierr = PetscFree(mat_ctx);CHKERRQ(ierr);
16513425bc38SStefano Zampini   PetscFunctionReturn(0);
16523425bc38SStefano Zampini }
16533425bc38SStefano Zampini 
16543425bc38SStefano Zampini #undef __FUNCT__
16553425bc38SStefano Zampini #define __FUNCT__ "PCBDDCDestroyFETIDPPC"
16563425bc38SStefano Zampini static PetscErrorCode PCBDDCDestroyFETIDPPC(PC pc)
16573425bc38SStefano Zampini {
16583425bc38SStefano Zampini   FETIDPPC_ctx   *pc_ctx;
16593425bc38SStefano Zampini   PetscErrorCode ierr;
16603425bc38SStefano Zampini 
16613425bc38SStefano Zampini   PetscFunctionBegin;
16623425bc38SStefano Zampini   ierr = PCShellGetContext(pc,(void**)&pc_ctx);CHKERRQ(ierr);
16633425bc38SStefano Zampini   ierr = VecDestroy(&pc_ctx->lambda_local);CHKERRQ(ierr);
16643425bc38SStefano Zampini   ierr = MatDestroy(&pc_ctx->B_Ddelta);CHKERRQ(ierr);
16653425bc38SStefano Zampini   ierr = VecScatterDestroy(&pc_ctx->l2g_lambda);CHKERRQ(ierr);
16663425bc38SStefano Zampini   ierr = PCDestroy(&pc_ctx->pc);CHKERRQ(ierr); /* actually it does not destroy BDDC, only decrease its reference count */
16673425bc38SStefano Zampini   ierr = PetscFree(pc_ctx);CHKERRQ(ierr);
16683425bc38SStefano Zampini   PetscFunctionReturn(0);
16693425bc38SStefano Zampini }
16703425bc38SStefano Zampini 
16713425bc38SStefano Zampini #undef __FUNCT__
16723425bc38SStefano Zampini #define __FUNCT__ "PCBDDCSetupFETIDPMatContext"
16733425bc38SStefano Zampini static PetscErrorCode PCBDDCSetupFETIDPMatContext(FETIDPMat_ctx *fetidpmat_ctx)
16743425bc38SStefano Zampini {
16753425bc38SStefano Zampini   PetscErrorCode ierr;
16763425bc38SStefano Zampini   PC_IS          *pcis    =(PC_IS*)fetidpmat_ctx->pc->data;
16773425bc38SStefano Zampini   PC_BDDC        *pcbddc  =(PC_BDDC*)fetidpmat_ctx->pc->data;
16783425bc38SStefano Zampini   PCBDDCGraph    mat_graph=pcbddc->mat_graph;
16793425bc38SStefano Zampini   Mat_IS         *matis   = (Mat_IS*)fetidpmat_ctx->pc->pmat->data;
16803425bc38SStefano Zampini   MPI_Comm       comm     = ((PetscObject)(fetidpmat_ctx->pc))->comm;
16813425bc38SStefano Zampini 
16823425bc38SStefano Zampini   Mat ScalingMat;
16833425bc38SStefano Zampini   Vec lambda_global;
16843425bc38SStefano Zampini   IS  IS_l2g_lambda;
16853425bc38SStefano Zampini 
16863425bc38SStefano Zampini   PetscBool   skip_node,fully_redundant;
1687ef028eecSStefano Zampini   PetscInt    i,j,k,s,n_boundary_dofs,n_global_lambda,n_vertices,partial_sum;
16883425bc38SStefano Zampini   PetscInt    n_local_lambda,n_lambda_for_dof,dual_size,n_neg_values,n_pos_values;
1689ef028eecSStefano Zampini   PetscMPIInt rank,nprocs;
16903425bc38SStefano Zampini   PetscScalar scalar_value;
16913425bc38SStefano Zampini 
16923425bc38SStefano Zampini   PetscInt    *vertex_indices,*temp_indices;
16933425bc38SStefano Zampini   PetscInt    *dual_dofs_boundary_indices,*aux_local_numbering_1,*aux_global_numbering;
16943425bc38SStefano Zampini   PetscInt    *aux_sums,*cols_B_delta,*l2g_indices;
16953425bc38SStefano Zampini   PetscScalar *array,*scaling_factors,*vals_B_delta;
1696ef028eecSStefano Zampini   PetscInt    *aux_local_numbering_2,*dof_sizes,*dof_displs;
1697ef028eecSStefano Zampini   PetscInt    first_index,old_index;
1698ef028eecSStefano Zampini   PetscBool   first_found = PETSC_FALSE;
16993425bc38SStefano Zampini 
17003425bc38SStefano Zampini   /* For communication of scaling factors */
17013425bc38SStefano Zampini   PetscInt    *ptrs_buffer,neigh_position;
17023425bc38SStefano Zampini   PetscScalar **all_factors,*send_buffer,*recv_buffer;
17033425bc38SStefano Zampini   MPI_Request *send_reqs,*recv_reqs;
17043425bc38SStefano Zampini 
17053425bc38SStefano Zampini   /* tests */
17063425bc38SStefano Zampini   Vec         test_vec;
17073425bc38SStefano Zampini   PetscBool   test_fetidp;
17083425bc38SStefano Zampini   PetscViewer viewer;
17093425bc38SStefano Zampini 
17103425bc38SStefano Zampini   PetscFunctionBegin;
17113425bc38SStefano Zampini   ierr = MPI_Comm_rank(comm,&rank);CHKERRQ(ierr);
17123425bc38SStefano Zampini   ierr = MPI_Comm_size(comm,&nprocs);CHKERRQ(ierr);
17133425bc38SStefano Zampini 
17143425bc38SStefano Zampini   /* Default type of lagrange multipliers is non-redundant */
17153425bc38SStefano Zampini   fully_redundant = PETSC_FALSE;
17163425bc38SStefano Zampini   ierr            = PetscOptionsGetBool(PETSC_NULL,"-fetidp_fullyredundant",&fully_redundant,PETSC_NULL);CHKERRQ(ierr);
17173425bc38SStefano Zampini 
17183425bc38SStefano Zampini   /* Evaluate local and global number of lagrange multipliers */
17193425bc38SStefano Zampini   ierr            = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
17203425bc38SStefano Zampini   n_local_lambda  = 0;
17213425bc38SStefano Zampini   partial_sum     = 0;
17223425bc38SStefano Zampini   n_boundary_dofs = 0;
17233425bc38SStefano Zampini   s               = 0;
17243425bc38SStefano Zampini   n_vertices      = 0;
17253425bc38SStefano Zampini   /* Get Vertices used to define the BDDC */
17263425bc38SStefano Zampini   ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(*vertex_indices),&vertex_indices);CHKERRQ(ierr);
17273425bc38SStefano Zampini   for (i=0; i<pcbddc->local_primal_size; i++) {
17283425bc38SStefano Zampini     ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&j,(const PetscInt**)&temp_indices,PETSC_NULL);CHKERRQ(ierr);
17293425bc38SStefano Zampini     if (j == 1) {
17303425bc38SStefano Zampini       vertex_indices[n_vertices]=temp_indices[0];
17313425bc38SStefano Zampini       n_vertices++;
17323425bc38SStefano Zampini     }
17333425bc38SStefano Zampini     ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&j,(const PetscInt**)&temp_indices,PETSC_NULL);CHKERRQ(ierr);
17343425bc38SStefano Zampini   }
17353425bc38SStefano Zampini   dual_size = pcis->n_B-n_vertices;
1736*2fa5cd67SKarl Rupp 
1737f0474715SStefano Zampini   ierr = PetscSortInt(n_vertices,vertex_indices);CHKERRQ(ierr);
17383425bc38SStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*dual_dofs_boundary_indices),&dual_dofs_boundary_indices);CHKERRQ(ierr);
17393425bc38SStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*aux_local_numbering_1),&aux_local_numbering_1);CHKERRQ(ierr);
17403425bc38SStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*aux_local_numbering_2),&aux_local_numbering_2);CHKERRQ(ierr);
17413425bc38SStefano Zampini 
17423425bc38SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
17433425bc38SStefano Zampini   for (i=0; i<pcis->n; i++) {
17443425bc38SStefano Zampini     j = mat_graph->count[i]; /* RECALL: mat_graph->count[i] does not count myself */
1745c6582918SStefano Zampini     k = 0;
1746*2fa5cd67SKarl Rupp     if (j > 0) k = (mat_graph->neighbours_set[i][0] == -1 ?  1 : 0);
17473425bc38SStefano Zampini     j = j - k;
1748*2fa5cd67SKarl Rupp     if (j > 0) n_boundary_dofs++;
17493425bc38SStefano Zampini 
17503425bc38SStefano Zampini     skip_node = PETSC_FALSE;
1751c6582918SStefano Zampini     if (s < n_vertices && vertex_indices[s]==i) { /* it works for a sorted set of vertices */
17523425bc38SStefano Zampini       skip_node = PETSC_TRUE;
17533425bc38SStefano Zampini       s++;
17543425bc38SStefano Zampini     }
1755*2fa5cd67SKarl Rupp     if (j < 1) skip_node = PETSC_TRUE;
17563425bc38SStefano Zampini     if (!skip_node) {
17573425bc38SStefano Zampini       if (fully_redundant) {
17583425bc38SStefano Zampini         /* fully redundant set of lagrange multipliers */
17593425bc38SStefano Zampini         n_lambda_for_dof = (j*(j+1))/2;
17603425bc38SStefano Zampini       } else {
17613425bc38SStefano Zampini         n_lambda_for_dof = j;
17623425bc38SStefano Zampini       }
17633425bc38SStefano Zampini       n_local_lambda += j;
17643425bc38SStefano Zampini       /* needed to evaluate global number of lagrange multipliers */
17653425bc38SStefano Zampini       array[i]=(1.0*n_lambda_for_dof)/(j+1.0); /* already scaled for the next global sum */
17663425bc38SStefano Zampini       /* store some data needed */
17673425bc38SStefano Zampini       dual_dofs_boundary_indices[partial_sum] = n_boundary_dofs-1;
17683425bc38SStefano Zampini       aux_local_numbering_1[partial_sum]      = i;
1769ef028eecSStefano Zampini       aux_local_numbering_2[partial_sum]      = n_lambda_for_dof;
17703425bc38SStefano Zampini       partial_sum++;
17713425bc38SStefano Zampini     }
17723425bc38SStefano Zampini   }
17733425bc38SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1774ef028eecSStefano Zampini 
17753425bc38SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
17763425bc38SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
17773425bc38SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
17783425bc38SStefano Zampini   ierr = VecSum(pcis->vec1_global,&scalar_value);CHKERRQ(ierr);
1779*2fa5cd67SKarl Rupp 
17803425bc38SStefano Zampini   fetidpmat_ctx->n_lambda = (PetscInt) scalar_value;
17813425bc38SStefano Zampini   /* printf("I found %d global multipliers (%f)\n",fetidpmat_ctx->n_lambda,scalar_value); */
17823425bc38SStefano Zampini 
17833425bc38SStefano Zampini   /* compute global ordering of lagrange multipliers and associate l2g map */
1784ef028eecSStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
1785ef028eecSStefano Zampini   ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
1786ef028eecSStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1787*2fa5cd67SKarl Rupp   for (i=0;i<dual_size;i++) array[aux_local_numbering_1[i]] = aux_local_numbering_2[i];
1788ef028eecSStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1789ef028eecSStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
1790ef028eecSStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
1791ef028eecSStefano Zampini   ierr = VecSum(pcis->vec1_global,&scalar_value);CHKERRQ(ierr);
1792ef028eecSStefano Zampini   if (pcbddc->dbg_flag && (PetscInt)scalar_value != fetidpmat_ctx->n_lambda) {
1793acee19a7SJed Brown     SETERRQ2(PETSC_COMM_WORLD,PETSC_ERR_PLIB,"Global number of multipliers mismatch! (%d!=%d)\n",(PetscInt)scalar_value,fetidpmat_ctx->n_lambda);
1794ef028eecSStefano Zampini   }
17953425bc38SStefano Zampini 
1796ef028eecSStefano Zampini   /* Fill pcis->vec1_global with cumulative function for global numbering */
1797ef028eecSStefano Zampini   ierr        = VecGetArray(pcis->vec1_global,&array);CHKERRQ(ierr);
1798ef028eecSStefano Zampini   ierr        = VecGetLocalSize(pcis->vec1_global,&s);CHKERRQ(ierr);
1799ef028eecSStefano Zampini   k           = 0;
1800ef028eecSStefano Zampini   first_index = -1;
1801ef028eecSStefano Zampini   for (i=0; i<s; i++) {
1802ef028eecSStefano Zampini     if (!first_found && array[i] > 0.0) {
1803ef028eecSStefano Zampini       first_found = PETSC_TRUE;
1804ef028eecSStefano Zampini       first_index = i;
1805ef028eecSStefano Zampini     }
1806ef028eecSStefano Zampini     k += (PetscInt)array[i];
1807ef028eecSStefano Zampini   }
1808ef028eecSStefano Zampini   j    = (!rank ? nprocs : 0);
18093425bc38SStefano Zampini   ierr = PetscMalloc(j*sizeof(*dof_sizes),&dof_sizes);CHKERRQ(ierr);
18103425bc38SStefano Zampini   ierr = PetscMalloc(j*sizeof(*dof_displs),&dof_displs);CHKERRQ(ierr);
1811ef028eecSStefano Zampini   ierr = MPI_Gather(&k,1,MPIU_INT,dof_sizes,1,MPIU_INT,0,comm);CHKERRQ(ierr);
1812ef028eecSStefano Zampini   if (!rank) {
18133425bc38SStefano Zampini     dof_displs[0]=0;
1814*2fa5cd67SKarl Rupp     for (i=1; i<nprocs; i++) dof_displs[i] = dof_displs[i-1]+dof_sizes[i-1];
18153425bc38SStefano Zampini   }
1816ef028eecSStefano Zampini   ierr = MPI_Scatter(dof_displs,1,MPIU_INT,&k,1,MPIU_INT,0,comm);CHKERRQ(ierr);
1817ef028eecSStefano Zampini   if (first_found) {
1818ef028eecSStefano Zampini     array[first_index] += k;
1819*2fa5cd67SKarl Rupp 
1820ef028eecSStefano Zampini     old_index = first_index;
1821ef028eecSStefano Zampini     for (i=first_index+1; i<s; i++) {
1822ef028eecSStefano Zampini       if (array[i] > 0.0) {
1823ef028eecSStefano Zampini         array[i] += array[old_index];
1824ef028eecSStefano Zampini         old_index = i;
1825ef028eecSStefano Zampini       }
1826ef028eecSStefano Zampini     }
1827ef028eecSStefano Zampini   }
1828ef028eecSStefano Zampini   ierr = VecRestoreArray(pcis->vec1_global,&array);CHKERRQ(ierr);
1829ef028eecSStefano Zampini   ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
1830ef028eecSStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1831ef028eecSStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1832ef028eecSStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*aux_global_numbering),&aux_global_numbering);CHKERRQ(ierr);
1833ef028eecSStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
18343425bc38SStefano Zampini   for (i=0; i<dual_size; i++) {
1835ef028eecSStefano Zampini     aux_global_numbering[i] = (PetscInt)array[aux_local_numbering_1[i]]-aux_local_numbering_2[i];
18363425bc38SStefano Zampini   }
1837ef028eecSStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1838f0474715SStefano Zampini   ierr = PetscFree(aux_local_numbering_2);CHKERRQ(ierr);
1839f0474715SStefano Zampini   ierr = PetscFree(dof_displs);CHKERRQ(ierr);
1840f0474715SStefano Zampini   ierr = PetscFree(dof_sizes);CHKERRQ(ierr);
18413425bc38SStefano Zampini 
18423425bc38SStefano Zampini   /* init data for scaling factors exchange */
18433425bc38SStefano Zampini   partial_sum = 0;
18443425bc38SStefano Zampini   j           = 0;
1845*2fa5cd67SKarl Rupp 
18463425bc38SStefano Zampini   ierr = PetscMalloc(pcis->n_neigh*sizeof(PetscInt),&ptrs_buffer);CHKERRQ(ierr);
18473425bc38SStefano Zampini   ierr = PetscMalloc((pcis->n_neigh-1)*sizeof(MPI_Request),&send_reqs);CHKERRQ(ierr);
18483425bc38SStefano Zampini   ierr = PetscMalloc((pcis->n_neigh-1)*sizeof(MPI_Request),&recv_reqs);CHKERRQ(ierr);
18493425bc38SStefano Zampini   ierr = PetscMalloc(pcis->n*sizeof(PetscScalar*),&all_factors);CHKERRQ(ierr);
1850*2fa5cd67SKarl Rupp 
18513425bc38SStefano Zampini   ptrs_buffer[0] = 0;
18523425bc38SStefano Zampini   for (i=1; i<pcis->n_neigh; i++) {
18533425bc38SStefano Zampini     partial_sum += pcis->n_shared[i];
18543425bc38SStefano Zampini     ptrs_buffer[i] = ptrs_buffer[i-1]+pcis->n_shared[i];
18553425bc38SStefano Zampini   }
18563425bc38SStefano Zampini   ierr = PetscMalloc(partial_sum*sizeof(PetscScalar),&send_buffer);CHKERRQ(ierr);
18573425bc38SStefano Zampini   ierr = PetscMalloc(partial_sum*sizeof(PetscScalar),&recv_buffer);CHKERRQ(ierr);
18583425bc38SStefano Zampini   ierr = PetscMalloc(partial_sum*sizeof(PetscScalar),&all_factors[0]);CHKERRQ(ierr);
18593425bc38SStefano Zampini   for (i=0; i<pcis->n-1; i++) {
18603425bc38SStefano Zampini     j = mat_graph->count[i];
18613425bc38SStefano Zampini     if (j>0) {
18623425bc38SStefano Zampini       k = (mat_graph->neighbours_set[i][0] == -1 ?  1 : 0);
18633425bc38SStefano Zampini       j = j - k;
18643425bc38SStefano Zampini     }
18653425bc38SStefano Zampini     all_factors[i+1]=all_factors[i]+j;
18663425bc38SStefano Zampini   }
18673425bc38SStefano Zampini   /* scatter B scaling to N vec */
18683425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->N_to_B,pcis->D,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18693425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->N_to_B,pcis->D,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18703425bc38SStefano Zampini   /* communications */
18713425bc38SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
18723425bc38SStefano Zampini   for (i=1; i<pcis->n_neigh; i++) {
1873*2fa5cd67SKarl Rupp     for (j=0; j<pcis->n_shared[i]; j++)  send_buffer[ptrs_buffer[i-1]+j] = array[pcis->shared[i][j]];
1874*2fa5cd67SKarl Rupp 
18753425bc38SStefano Zampini     j    = ptrs_buffer[i]-ptrs_buffer[i-1];
1876ea7e1babSStefano Zampini     ierr = MPI_Isend(&send_buffer[ptrs_buffer[i-1]],j,MPIU_SCALAR,pcis->neigh[i],0,comm,&send_reqs[i-1]);CHKERRQ(ierr);
1877ea7e1babSStefano Zampini     ierr = MPI_Irecv(&recv_buffer[ptrs_buffer[i-1]],j,MPIU_SCALAR,pcis->neigh[i],0,comm,&recv_reqs[i-1]);CHKERRQ(ierr);
18783425bc38SStefano Zampini   }
18793425bc38SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1880ea7e1babSStefano Zampini   ierr = MPI_Waitall((pcis->n_neigh-1),recv_reqs,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
18813425bc38SStefano Zampini   /* put values in correct places */
18823425bc38SStefano Zampini   for (i=1; i<pcis->n_neigh; i++) {
18833425bc38SStefano Zampini     for (j=0; j<pcis->n_shared[i]; j++) {
18843425bc38SStefano Zampini       k = pcis->shared[i][j];
1885*2fa5cd67SKarl Rupp 
18863425bc38SStefano Zampini       neigh_position = 0;
1887*2fa5cd67SKarl Rupp       while (mat_graph->neighbours_set[k][neigh_position] != pcis->neigh[i]) neigh_position++;
18883425bc38SStefano Zampini       s = (mat_graph->neighbours_set[k][0] == -1 ? 1 : 0);
1889*2fa5cd67SKarl Rupp 
18903425bc38SStefano Zampini       neigh_position = neigh_position - s;
1891*2fa5cd67SKarl Rupp 
18923425bc38SStefano Zampini       all_factors[k][neigh_position]=recv_buffer[ptrs_buffer[i-1]+j];
18933425bc38SStefano Zampini     }
18943425bc38SStefano Zampini   }
1895ea7e1babSStefano Zampini   ierr = MPI_Waitall((pcis->n_neigh-1),send_reqs,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
18963425bc38SStefano Zampini   ierr = PetscFree(send_reqs);CHKERRQ(ierr);
18973425bc38SStefano Zampini   ierr = PetscFree(recv_reqs);CHKERRQ(ierr);
18983425bc38SStefano Zampini   ierr = PetscFree(send_buffer);CHKERRQ(ierr);
18993425bc38SStefano Zampini   ierr = PetscFree(recv_buffer);CHKERRQ(ierr);
19003425bc38SStefano Zampini   ierr = PetscFree(ptrs_buffer);CHKERRQ(ierr);
19013425bc38SStefano Zampini 
19023425bc38SStefano Zampini   /* Compute B and B_delta (local actions) */
19033425bc38SStefano Zampini   ierr = PetscMalloc(pcis->n_neigh*sizeof(*aux_sums),&aux_sums);CHKERRQ(ierr);
19043425bc38SStefano Zampini   ierr = PetscMalloc(n_local_lambda*sizeof(*l2g_indices),&l2g_indices);CHKERRQ(ierr);
19053425bc38SStefano Zampini   ierr = PetscMalloc(n_local_lambda*sizeof(*vals_B_delta),&vals_B_delta);CHKERRQ(ierr);
19063425bc38SStefano Zampini   ierr = PetscMalloc(n_local_lambda*sizeof(*cols_B_delta),&cols_B_delta);CHKERRQ(ierr);
19073425bc38SStefano Zampini   ierr = PetscMalloc(n_local_lambda*sizeof(*scaling_factors),&scaling_factors);CHKERRQ(ierr);
1908*2fa5cd67SKarl Rupp 
19093425bc38SStefano Zampini   n_global_lambda = 0;
19103425bc38SStefano Zampini   partial_sum     = 0;
1911*2fa5cd67SKarl Rupp 
19123425bc38SStefano Zampini   for (i=0;i<dual_size;i++) {
1913ef028eecSStefano Zampini     n_global_lambda = aux_global_numbering[i];
19143425bc38SStefano Zampini     j               = mat_graph->count[aux_local_numbering_1[i]];
19153425bc38SStefano Zampini     k               = (mat_graph->neighbours_set[aux_local_numbering_1[i]][0] == -1 ?  1 : 0);
19163425bc38SStefano Zampini     j               = j - k;
19173425bc38SStefano Zampini     aux_sums[0]     = 0;
1918*2fa5cd67SKarl Rupp     for (s=1; s<j; s++) aux_sums[s]=aux_sums[s-1]+j-s+1;
1919*2fa5cd67SKarl Rupp 
19203425bc38SStefano Zampini     array        = all_factors[aux_local_numbering_1[i]];
19213425bc38SStefano Zampini     n_neg_values = 0;
1922*2fa5cd67SKarl Rupp 
1923*2fa5cd67SKarl Rupp     while (n_neg_values < j && mat_graph->neighbours_set[aux_local_numbering_1[i]][n_neg_values+k] < rank) n_neg_values++;
19243425bc38SStefano Zampini     n_pos_values = j - n_neg_values;
1925*2fa5cd67SKarl Rupp 
19263425bc38SStefano Zampini     if (fully_redundant) {
19273425bc38SStefano Zampini       for (s=0; s<n_neg_values; s++) {
19283425bc38SStefano Zampini         l2g_indices    [partial_sum+s]=aux_sums[s]+n_neg_values-s-1+n_global_lambda;
19293425bc38SStefano Zampini         cols_B_delta   [partial_sum+s]=dual_dofs_boundary_indices[i];
19303425bc38SStefano Zampini         vals_B_delta   [partial_sum+s]=-1.0;
19313425bc38SStefano Zampini         scaling_factors[partial_sum+s]=array[s];
19323425bc38SStefano Zampini       }
19333425bc38SStefano Zampini       for (s=0; s<n_pos_values; s++) {
19343425bc38SStefano Zampini         l2g_indices    [partial_sum+s+n_neg_values]=aux_sums[n_neg_values]+s+n_global_lambda;
19353425bc38SStefano Zampini         cols_B_delta   [partial_sum+s+n_neg_values]=dual_dofs_boundary_indices[i];
19363425bc38SStefano Zampini         vals_B_delta   [partial_sum+s+n_neg_values]=1.0;
19373425bc38SStefano Zampini         scaling_factors[partial_sum+s+n_neg_values]=array[s+n_neg_values];
19383425bc38SStefano Zampini       }
19393425bc38SStefano Zampini       partial_sum += j;
19403425bc38SStefano Zampini     } else {
19413425bc38SStefano Zampini       /* l2g_indices and default cols and vals of B_delta */
19423425bc38SStefano Zampini       for (s=0; s<j; s++) {
19433425bc38SStefano Zampini         l2g_indices    [partial_sum+s]=n_global_lambda+s;
19443425bc38SStefano Zampini         cols_B_delta   [partial_sum+s]=dual_dofs_boundary_indices[i];
19453425bc38SStefano Zampini         vals_B_delta   [partial_sum+s]=0.0;
19463425bc38SStefano Zampini       }
19473425bc38SStefano Zampini       /* B_delta */
1948*2fa5cd67SKarl Rupp       if (n_neg_values > 0) vals_B_delta[partial_sum+n_neg_values-1] = -1.0; /* there's a rank next to me to the left */
1949*2fa5cd67SKarl Rupp       if (n_neg_values < j) vals_B_delta[partial_sum+n_neg_values] = 1.0; /* there's a rank next to me to the right */
1950*2fa5cd67SKarl Rupp 
19513425bc38SStefano Zampini       /* scaling as in Klawonn-Widlund 1999*/
19523425bc38SStefano Zampini       for (s=0;s<n_neg_values;s++) {
19533425bc38SStefano Zampini         scalar_value = 0.0;
1954*2fa5cd67SKarl Rupp         for (k=0;k<s+1;k++) scalar_value += array[k];
1955ef028eecSStefano Zampini         scaling_factors[partial_sum+s] = -scalar_value;
19563425bc38SStefano Zampini       }
19573425bc38SStefano Zampini       for (s=0;s<n_pos_values;s++) {
19583425bc38SStefano Zampini         scalar_value = 0.0;
1959*2fa5cd67SKarl Rupp         for (k=s+n_neg_values;k<j;k++) scalar_value += array[k];
19603425bc38SStefano Zampini         scaling_factors[partial_sum+s+n_neg_values] = scalar_value;
19613425bc38SStefano Zampini       }
19623425bc38SStefano Zampini       partial_sum += j;
19633425bc38SStefano Zampini     }
19643425bc38SStefano Zampini   }
1965ef028eecSStefano Zampini   ierr = PetscFree(aux_global_numbering);CHKERRQ(ierr);
1966f0474715SStefano Zampini   ierr = PetscFree(aux_sums);CHKERRQ(ierr);
1967f0474715SStefano Zampini   ierr = PetscFree(aux_local_numbering_1);CHKERRQ(ierr);
1968f0474715SStefano Zampini   ierr = PetscFree(dual_dofs_boundary_indices);CHKERRQ(ierr);
19693425bc38SStefano Zampini   ierr = PetscFree(all_factors[0]);CHKERRQ(ierr);
19703425bc38SStefano Zampini   ierr = PetscFree(all_factors);CHKERRQ(ierr);
19713425bc38SStefano Zampini   /* printf("I found %d local lambda dofs when numbering them (should be %d)\n",partial_sum,n_local_lambda); */
1972f0474715SStefano Zampini 
1973f0474715SStefano Zampini   /* Local to global mapping of fetidpmat */
1974f0474715SStefano Zampini   ierr = VecCreate(PETSC_COMM_SELF,&fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
1975f0474715SStefano Zampini   ierr = VecSetSizes(fetidpmat_ctx->lambda_local,n_local_lambda,n_local_lambda);CHKERRQ(ierr);
1976f0474715SStefano Zampini   ierr = VecSetType(fetidpmat_ctx->lambda_local,VECSEQ);CHKERRQ(ierr);
1977f0474715SStefano Zampini   ierr = VecCreate(comm,&lambda_global);CHKERRQ(ierr);
1978f0474715SStefano Zampini   ierr = VecSetSizes(lambda_global,PETSC_DECIDE,fetidpmat_ctx->n_lambda);CHKERRQ(ierr);
1979f0474715SStefano Zampini   ierr = VecSetType(lambda_global,VECMPI);CHKERRQ(ierr);
19803425bc38SStefano Zampini   ierr = ISCreateGeneral(comm,n_local_lambda,l2g_indices,PETSC_OWN_POINTER,&IS_l2g_lambda);CHKERRQ(ierr);
19813425bc38SStefano Zampini   ierr = VecScatterCreate(fetidpmat_ctx->lambda_local,(IS)0,lambda_global,IS_l2g_lambda,&fetidpmat_ctx->l2g_lambda);CHKERRQ(ierr);
1982f0474715SStefano Zampini   ierr = ISDestroy(&IS_l2g_lambda);CHKERRQ(ierr);
19833425bc38SStefano Zampini 
19843425bc38SStefano Zampini   /* Create local part of B_delta */
19853425bc38SStefano Zampini   ierr = MatCreate(PETSC_COMM_SELF,&fetidpmat_ctx->B_delta);
19863425bc38SStefano Zampini   ierr = MatSetSizes(fetidpmat_ctx->B_delta,n_local_lambda,pcis->n_B,n_local_lambda,pcis->n_B);CHKERRQ(ierr);
19873425bc38SStefano Zampini   ierr = MatSetType(fetidpmat_ctx->B_delta,MATSEQAIJ);CHKERRQ(ierr);
19883425bc38SStefano Zampini   ierr = MatSeqAIJSetPreallocation(fetidpmat_ctx->B_delta,1,PETSC_NULL);CHKERRQ(ierr);
19893425bc38SStefano Zampini   ierr = MatSetOption(fetidpmat_ctx->B_delta,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr);
19903425bc38SStefano Zampini   for (i=0; i<n_local_lambda; i++) {
19913425bc38SStefano Zampini     ierr = MatSetValue(fetidpmat_ctx->B_delta,i,cols_B_delta[i],vals_B_delta[i],INSERT_VALUES);CHKERRQ(ierr);
19923425bc38SStefano Zampini   }
1993f0474715SStefano Zampini   ierr = PetscFree(vals_B_delta);CHKERRQ(ierr);
19943425bc38SStefano Zampini   ierr = MatAssemblyBegin(fetidpmat_ctx->B_delta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
19953425bc38SStefano Zampini   ierr = MatAssemblyEnd  (fetidpmat_ctx->B_delta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
19963425bc38SStefano Zampini 
19973425bc38SStefano Zampini   if (fully_redundant) {
19983425bc38SStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&ScalingMat);
19993425bc38SStefano Zampini     ierr = MatSetSizes(ScalingMat,n_local_lambda,n_local_lambda,n_local_lambda,n_local_lambda);CHKERRQ(ierr);
20003425bc38SStefano Zampini     ierr = MatSetType(ScalingMat,MATSEQAIJ);CHKERRQ(ierr);
20013425bc38SStefano Zampini     ierr = MatSeqAIJSetPreallocation(ScalingMat,1,PETSC_NULL);CHKERRQ(ierr);
20023425bc38SStefano Zampini     for (i=0; i<n_local_lambda; i++) {
20033425bc38SStefano Zampini       ierr = MatSetValue(ScalingMat,i,i,scaling_factors[i],INSERT_VALUES);CHKERRQ(ierr);
20043425bc38SStefano Zampini     }
20053425bc38SStefano Zampini     ierr = MatAssemblyBegin(ScalingMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
20063425bc38SStefano Zampini     ierr = MatAssemblyEnd  (ScalingMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
20073425bc38SStefano Zampini     ierr = MatMatMult(ScalingMat,fetidpmat_ctx->B_delta,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&fetidpmat_ctx->B_Ddelta);CHKERRQ(ierr);
20083425bc38SStefano Zampini     ierr = MatDestroy(&ScalingMat);CHKERRQ(ierr);
20093425bc38SStefano Zampini   } else {
20103425bc38SStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&fetidpmat_ctx->B_Ddelta);
20113425bc38SStefano Zampini     ierr = MatSetSizes(fetidpmat_ctx->B_Ddelta,n_local_lambda,pcis->n_B,n_local_lambda,pcis->n_B);CHKERRQ(ierr);
20123425bc38SStefano Zampini     ierr = MatSetType(fetidpmat_ctx->B_Ddelta,MATSEQAIJ);CHKERRQ(ierr);
20133425bc38SStefano Zampini     ierr = MatSeqAIJSetPreallocation(fetidpmat_ctx->B_Ddelta,1,PETSC_NULL);CHKERRQ(ierr);
20143425bc38SStefano Zampini     for (i=0; i<n_local_lambda; i++) {
20153425bc38SStefano Zampini       ierr = MatSetValue(fetidpmat_ctx->B_Ddelta,i,cols_B_delta[i],scaling_factors[i],INSERT_VALUES);CHKERRQ(ierr);
20163425bc38SStefano Zampini     }
20173425bc38SStefano Zampini     ierr = MatAssemblyBegin(fetidpmat_ctx->B_Ddelta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
20183425bc38SStefano Zampini     ierr = MatAssemblyEnd  (fetidpmat_ctx->B_Ddelta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
20193425bc38SStefano Zampini   }
2020f0474715SStefano Zampini   ierr = PetscFree(scaling_factors);CHKERRQ(ierr);
2021f0474715SStefano Zampini   ierr = PetscFree(cols_B_delta);CHKERRQ(ierr);
20223425bc38SStefano Zampini 
20233425bc38SStefano Zampini   /* Create some vectors needed by fetidp */
20243425bc38SStefano Zampini   ierr = VecDuplicate(pcis->vec1_B,&fetidpmat_ctx->temp_solution_B);CHKERRQ(ierr);
20253425bc38SStefano Zampini   ierr = VecDuplicate(pcis->vec1_D,&fetidpmat_ctx->temp_solution_D);CHKERRQ(ierr);
20263425bc38SStefano Zampini 
20273425bc38SStefano Zampini   test_fetidp = PETSC_FALSE;
2028*2fa5cd67SKarl Rupp 
20293425bc38SStefano Zampini   ierr = PetscOptionsGetBool(PETSC_NULL,"-fetidp_check",&test_fetidp,PETSC_NULL);CHKERRQ(ierr);
20303425bc38SStefano Zampini 
20313425bc38SStefano Zampini   if (test_fetidp) {
20323425bc38SStefano Zampini 
20333425bc38SStefano Zampini     ierr = PetscViewerASCIIGetStdout(((PetscObject)(fetidpmat_ctx->pc))->comm,&viewer);CHKERRQ(ierr);
20343425bc38SStefano Zampini     ierr = PetscViewerASCIISynchronizedAllow(viewer,PETSC_TRUE);CHKERRQ(ierr);
20353425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"----------FETI_DP TESTS--------------\n");CHKERRQ(ierr);
20363425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"All tests should return zero!\n");CHKERRQ(ierr);
20373425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"FETIDP MAT context in the ");CHKERRQ(ierr);
20383425bc38SStefano Zampini     if (fully_redundant) {
20393425bc38SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"fully redundant case for lagrange multipliers.\n");CHKERRQ(ierr);
20403425bc38SStefano Zampini     } else {
20413425bc38SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Non-fully redundant case for lagrange multiplier.\n");CHKERRQ(ierr);
20423425bc38SStefano Zampini     }
20433425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
20443425bc38SStefano Zampini 
20453425bc38SStefano Zampini     /* TEST A/B: Test numbering of global lambda dofs             */
20463425bc38SStefano Zampini 
20473425bc38SStefano Zampini     ierr         = VecDuplicate(fetidpmat_ctx->lambda_local,&test_vec);CHKERRQ(ierr);
20483425bc38SStefano Zampini     ierr         = VecSet(lambda_global,1.0);CHKERRQ(ierr);
20493425bc38SStefano Zampini     ierr         = VecSet(test_vec,1.0);CHKERRQ(ierr);
20503425bc38SStefano Zampini     ierr         = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
20513425bc38SStefano Zampini     ierr         = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
20523425bc38SStefano Zampini     scalar_value = -1.0;
20533425bc38SStefano Zampini     ierr         = VecAXPY(test_vec,scalar_value,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
20543425bc38SStefano Zampini     ierr         = VecNorm(test_vec,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
20553425bc38SStefano Zampini     ierr         = VecDestroy(&test_vec);CHKERRQ(ierr);
20563425bc38SStefano Zampini     ierr         = PetscViewerASCIISynchronizedPrintf(viewer,"A[%04d]: CHECK glob to loc: % 1.14e\n",rank,scalar_value);CHKERRQ(ierr);
20573425bc38SStefano Zampini     ierr         = PetscViewerFlush(viewer);CHKERRQ(ierr);
20583425bc38SStefano Zampini     if (fully_redundant) {
20593425bc38SStefano Zampini       ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr);
20603425bc38SStefano Zampini       ierr = VecSet(fetidpmat_ctx->lambda_local,0.5);CHKERRQ(ierr);
20613425bc38SStefano Zampini       ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20623425bc38SStefano Zampini       ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20633425bc38SStefano Zampini       ierr = VecSum(lambda_global,&scalar_value);CHKERRQ(ierr);
20643425bc38SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"B[%04d]: CHECK loc to glob: % 1.14e\n",rank,scalar_value-fetidpmat_ctx->n_lambda);CHKERRQ(ierr);
20653425bc38SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
20663425bc38SStefano Zampini     }
20673425bc38SStefano Zampini 
20683425bc38SStefano Zampini     /* TEST C: It should holds B_delta*w=0, w\in\widehat{W}           */
20693425bc38SStefano Zampini     /* This is the meaning of the B matrix                            */
20703425bc38SStefano Zampini 
20713425bc38SStefano Zampini     ierr = VecSetRandom(pcis->vec1_N,PETSC_NULL);CHKERRQ(ierr);
20723425bc38SStefano Zampini     ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
20733425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
20743425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
20753425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20763425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20773425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20783425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20793425bc38SStefano Zampini     /* Action of B_delta */
20803425bc38SStefano Zampini     ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
20813425bc38SStefano Zampini     ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr);
20823425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20833425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20843425bc38SStefano Zampini     ierr = VecNorm(lambda_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
20853425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"C[coll]: CHECK infty norm of B_delta*w (w continuous): % 1.14e\n",scalar_value);CHKERRQ(ierr);
20863425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
20873425bc38SStefano Zampini 
20883425bc38SStefano Zampini     /* TEST D: It should holds E_Dw = w - P_Dw w\in\widetilde{W}     */
20893425bc38SStefano Zampini     /* E_D = R_D^TR                                                   */
20903425bc38SStefano Zampini     /* P_D = B_{D,delta}^T B_{delta}                                  */
20913425bc38SStefano Zampini     /* eq.44 Mandel Tezaur and Dohrmann 2005                          */
20923425bc38SStefano Zampini 
20933425bc38SStefano Zampini     /* compute a random vector in \widetilde{W} */
20943425bc38SStefano Zampini     ierr = VecSetRandom(pcis->vec1_N,PETSC_NULL);CHKERRQ(ierr);
2095*2fa5cd67SKarl Rupp 
20963425bc38SStefano Zampini     scalar_value = 0.0; /* set zero at vertices */
20973425bc38SStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2098*2fa5cd67SKarl Rupp     for (i=0;i<n_vertices;i++) array[vertex_indices[i]] = scalar_value;
20993425bc38SStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2100*2fa5cd67SKarl Rupp 
21013425bc38SStefano Zampini     /* store w for final comparison */
21023425bc38SStefano Zampini     ierr = VecDuplicate(pcis->vec1_B,&test_vec);CHKERRQ(ierr);
21033425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,test_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21043425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,test_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21053425bc38SStefano Zampini 
21063425bc38SStefano Zampini     /* Jump operator P_D : results stored in pcis->vec1_B */
21073425bc38SStefano Zampini 
21083425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21093425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21103425bc38SStefano Zampini     /* Action of B_delta */
21113425bc38SStefano Zampini     ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
21123425bc38SStefano Zampini     ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr);
21133425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21143425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21153425bc38SStefano Zampini     /* Action of B_Ddelta^T */
21163425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21173425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21183425bc38SStefano Zampini     ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
21193425bc38SStefano Zampini 
21203425bc38SStefano Zampini     /* Average operator E_D : results stored in pcis->vec2_B */
21213425bc38SStefano Zampini 
21223425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21233425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21243425bc38SStefano Zampini     ierr = VecPointwiseMult(pcis->vec2_B,pcis->D,pcis->vec2_B);CHKERRQ(ierr);
21253425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec2_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21263425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec2_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21273425bc38SStefano Zampini     ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
21283425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21293425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21303425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21313425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21323425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21333425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21343425bc38SStefano Zampini 
21353425bc38SStefano Zampini     /* test E_D=I-P_D */
21363425bc38SStefano Zampini     scalar_value = 1.0;
21373425bc38SStefano Zampini     ierr         = VecAXPY(pcis->vec1_B,scalar_value,pcis->vec2_B);CHKERRQ(ierr);
21383425bc38SStefano Zampini     scalar_value = -1.0;
21393425bc38SStefano Zampini     ierr         = VecAXPY(pcis->vec1_B,scalar_value,test_vec);CHKERRQ(ierr);
21403425bc38SStefano Zampini     ierr         = VecNorm(pcis->vec1_B,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
21413425bc38SStefano Zampini     ierr         = VecDestroy(&test_vec);CHKERRQ(ierr);
21423425bc38SStefano Zampini     ierr         = PetscViewerASCIISynchronizedPrintf(viewer,"D[%04d] CHECK infty norm of E_D + P_D - I: % 1.14e\n",rank,scalar_value);CHKERRQ(ierr);
21433425bc38SStefano Zampini     ierr         = PetscViewerFlush(viewer);CHKERRQ(ierr);
21443425bc38SStefano Zampini 
21453425bc38SStefano Zampini     /* TEST E: It should holds R_D^TP_Dw=0 w\in\widetilde{W}          */
21463425bc38SStefano Zampini     /* eq.48 Mandel Tezaur and Dohrmann 2005                          */
21473425bc38SStefano Zampini 
21483425bc38SStefano Zampini     ierr = VecSetRandom(pcis->vec1_N,PETSC_NULL);CHKERRQ(ierr);
21493425bc38SStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2150*2fa5cd67SKarl Rupp 
21513425bc38SStefano Zampini     scalar_value = 0.0; /* set zero at vertices */
2152*2fa5cd67SKarl Rupp     for (i=0;i<n_vertices;i++) array[vertex_indices[i]]=scalar_value;
21533425bc38SStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
21543425bc38SStefano Zampini 
21553425bc38SStefano Zampini     /* Jump operator P_D : results stored in pcis->vec1_B */
21563425bc38SStefano Zampini 
21573425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21583425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21593425bc38SStefano Zampini     /* Action of B_delta */
21603425bc38SStefano Zampini     ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
21613425bc38SStefano Zampini     ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr);
21623425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21633425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21643425bc38SStefano Zampini     /* Action of B_Ddelta^T */
21653425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21663425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21673425bc38SStefano Zampini     ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
21683425bc38SStefano Zampini     /* diagonal scaling */
21693425bc38SStefano Zampini     ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr);
21703425bc38SStefano Zampini     /* sum on the interface */
21713425bc38SStefano Zampini     ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
21723425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21733425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21743425bc38SStefano Zampini     ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
21753425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21763425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21773425bc38SStefano Zampini     ierr = VecNorm(pcis->vec1_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
21783425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"E[coll]: CHECK infty norm of R^T_D P_D: % 1.14e\n",scalar_value);CHKERRQ(ierr);
21793425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
21803425bc38SStefano Zampini 
21813425bc38SStefano Zampini     if (!fully_redundant) {
21823425bc38SStefano Zampini       /* TEST F: It should holds B_{delta}B^T_{D,delta}=I               */
21833425bc38SStefano Zampini       /* Corollary thm 14 Mandel Tezaur and Dohrmann 2005               */
21843425bc38SStefano Zampini       ierr = VecDuplicate(lambda_global,&test_vec);CHKERRQ(ierr);
21853425bc38SStefano Zampini       ierr = VecSetRandom(lambda_global,PETSC_NULL);CHKERRQ(ierr);
21863425bc38SStefano Zampini       /* Action of B_Ddelta^T */
21873425bc38SStefano Zampini       ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21883425bc38SStefano Zampini       ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21893425bc38SStefano Zampini       ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
21903425bc38SStefano Zampini       /* Action of B_delta */
21913425bc38SStefano Zampini       ierr         = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
21923425bc38SStefano Zampini       ierr         = VecSet(test_vec,0.0);CHKERRQ(ierr);
21933425bc38SStefano Zampini       ierr         = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,test_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21943425bc38SStefano Zampini       ierr         = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,test_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21953425bc38SStefano Zampini       scalar_value = -1.0;
21963425bc38SStefano Zampini       ierr         = VecAXPY(lambda_global,scalar_value,test_vec);CHKERRQ(ierr);
21973425bc38SStefano Zampini       ierr         = VecNorm(lambda_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
21983425bc38SStefano Zampini       ierr         = PetscViewerASCIIPrintf(viewer,"E[coll]: CHECK infty norm of P^T_D - I: % 1.14e\n",scalar_value);CHKERRQ(ierr);
21993425bc38SStefano Zampini       ierr         = PetscViewerFlush(viewer);CHKERRQ(ierr);
22003425bc38SStefano Zampini       ierr         = PetscViewerFlush(viewer);CHKERRQ(ierr);
22013425bc38SStefano Zampini       ierr         = VecDestroy(&test_vec);CHKERRQ(ierr);
22023425bc38SStefano Zampini     }
22033425bc38SStefano Zampini   }
22043425bc38SStefano Zampini   /* final cleanup */
22053425bc38SStefano Zampini   ierr = PetscFree(vertex_indices);CHKERRQ(ierr);
22063425bc38SStefano Zampini   ierr = VecDestroy(&lambda_global);CHKERRQ(ierr);
22073425bc38SStefano Zampini   PetscFunctionReturn(0);
22083425bc38SStefano Zampini }
22093425bc38SStefano Zampini 
22103425bc38SStefano Zampini #undef __FUNCT__
22113425bc38SStefano Zampini #define __FUNCT__ "PCBDDCSetupFETIDPPCContext"
22123425bc38SStefano Zampini static PetscErrorCode PCBDDCSetupFETIDPPCContext(Mat fetimat, FETIDPPC_ctx *fetidppc_ctx)
22133425bc38SStefano Zampini {
22143425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
22153425bc38SStefano Zampini   PetscErrorCode ierr;
22163425bc38SStefano Zampini 
22173425bc38SStefano Zampini   PetscFunctionBegin;
22183425bc38SStefano Zampini   ierr = MatShellGetContext(fetimat,&mat_ctx);CHKERRQ(ierr);
22193425bc38SStefano Zampini   /* get references from objects created when setting up feti mat context */
22203425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)mat_ctx->lambda_local);CHKERRQ(ierr);
2221*2fa5cd67SKarl Rupp 
22223425bc38SStefano Zampini   fetidppc_ctx->lambda_local = mat_ctx->lambda_local;
2223*2fa5cd67SKarl Rupp 
22243425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)mat_ctx->B_Ddelta);CHKERRQ(ierr);
2225*2fa5cd67SKarl Rupp 
22263425bc38SStefano Zampini   fetidppc_ctx->B_Ddelta = mat_ctx->B_Ddelta;
2227*2fa5cd67SKarl Rupp 
22283425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)mat_ctx->l2g_lambda);CHKERRQ(ierr);
2229*2fa5cd67SKarl Rupp 
22303425bc38SStefano Zampini   fetidppc_ctx->l2g_lambda = mat_ctx->l2g_lambda;
22313425bc38SStefano Zampini   PetscFunctionReturn(0);
22323425bc38SStefano Zampini }
22333425bc38SStefano Zampini 
22343425bc38SStefano Zampini #undef __FUNCT__
22353425bc38SStefano Zampini #define __FUNCT__ "FETIDPMatMult"
22363425bc38SStefano Zampini static PetscErrorCode FETIDPMatMult(Mat fetimat, Vec x, Vec y)
22373425bc38SStefano Zampini {
22383425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
22393425bc38SStefano Zampini   PC_IS          *pcis;
22403425bc38SStefano Zampini   PetscErrorCode ierr;
22413425bc38SStefano Zampini 
22423425bc38SStefano Zampini   PetscFunctionBegin;
22433425bc38SStefano Zampini   ierr = MatShellGetContext(fetimat,&mat_ctx);CHKERRQ(ierr);
22443425bc38SStefano Zampini   pcis = (PC_IS*)mat_ctx->pc->data;
22453425bc38SStefano Zampini   /* Application of B_delta^T */
22463425bc38SStefano Zampini   ierr = VecScatterBegin(mat_ctx->l2g_lambda,x,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
22473425bc38SStefano Zampini   ierr = VecScatterEnd(mat_ctx->l2g_lambda,x,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
22483425bc38SStefano Zampini   ierr = MatMultTranspose(mat_ctx->B_delta,mat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
22493425bc38SStefano Zampini   /* Application of \widetilde{S}^-1 */
22503425bc38SStefano Zampini   ierr = VecSet(pcis->vec1_D,0.0);CHKERRQ(ierr);
22513425bc38SStefano Zampini   ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr);
22523425bc38SStefano Zampini   /* Application of B_delta */
22533425bc38SStefano Zampini   ierr = MatMult(mat_ctx->B_delta,pcis->vec1_B,mat_ctx->lambda_local);CHKERRQ(ierr);
22543425bc38SStefano Zampini   ierr = VecSet(y,0.0);CHKERRQ(ierr);
22553425bc38SStefano Zampini   ierr = VecScatterBegin(mat_ctx->l2g_lambda,mat_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
22563425bc38SStefano Zampini   ierr = VecScatterEnd(mat_ctx->l2g_lambda,mat_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
22573425bc38SStefano Zampini   PetscFunctionReturn(0);
22583425bc38SStefano Zampini }
22593425bc38SStefano Zampini 
22603425bc38SStefano Zampini #undef __FUNCT__
22613425bc38SStefano Zampini #define __FUNCT__ "FETIDPPCApply"
22623425bc38SStefano Zampini static PetscErrorCode FETIDPPCApply(PC fetipc, Vec x, Vec y)
22633425bc38SStefano Zampini {
22643425bc38SStefano Zampini   FETIDPPC_ctx   *pc_ctx;
22653425bc38SStefano Zampini   PC_IS          *pcis;
22663425bc38SStefano Zampini   PetscErrorCode ierr;
22673425bc38SStefano Zampini 
22683425bc38SStefano Zampini   PetscFunctionBegin;
22693425bc38SStefano Zampini   ierr = PCShellGetContext(fetipc,(void**)&pc_ctx);
22703425bc38SStefano Zampini   pcis = (PC_IS*)pc_ctx->pc->data;
22713425bc38SStefano Zampini   /* Application of B_Ddelta^T */
22723425bc38SStefano Zampini   ierr = VecScatterBegin(pc_ctx->l2g_lambda,x,pc_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
22733425bc38SStefano Zampini   ierr = VecScatterEnd(pc_ctx->l2g_lambda,x,pc_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
22743425bc38SStefano Zampini   ierr = VecSet(pcis->vec2_B,0.0);CHKERRQ(ierr);
22753425bc38SStefano Zampini   ierr = MatMultTranspose(pc_ctx->B_Ddelta,pc_ctx->lambda_local,pcis->vec2_B);CHKERRQ(ierr);
22763425bc38SStefano Zampini   /* Application of S */
22773425bc38SStefano Zampini   ierr = PCISApplySchur(pc_ctx->pc,pcis->vec2_B,pcis->vec1_B,(Vec)0,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
22783425bc38SStefano Zampini   /* Application of B_Ddelta */
22793425bc38SStefano Zampini   ierr = MatMult(pc_ctx->B_Ddelta,pcis->vec1_B,pc_ctx->lambda_local);CHKERRQ(ierr);
22803425bc38SStefano Zampini   ierr = VecSet(y,0.0);CHKERRQ(ierr);
22813425bc38SStefano Zampini   ierr = VecScatterBegin(pc_ctx->l2g_lambda,pc_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
22823425bc38SStefano Zampini   ierr = VecScatterEnd(pc_ctx->l2g_lambda,pc_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
22833425bc38SStefano Zampini   PetscFunctionReturn(0);
22843425bc38SStefano Zampini }
22853425bc38SStefano Zampini 
2286da1bb401SStefano Zampini #undef __FUNCT__
2287da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetupLocalAdjacencyGraph"
2288da1bb401SStefano Zampini static PetscErrorCode PCBDDCSetupLocalAdjacencyGraph(PC pc)
2289da1bb401SStefano Zampini {
2290da1bb401SStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
2291da1bb401SStefano Zampini   Mat_IS         *matis  = (Mat_IS*)pc->pmat->data;
22921a83f524SJed Brown   PetscInt       nvtxs;
22931a83f524SJed Brown   const PetscInt *xadj,*adjncy;
2294da1bb401SStefano Zampini   Mat            mat_adj;
2295da1bb401SStefano Zampini   PetscBool      symmetrize_rowij=PETSC_TRUE,compressed_rowij=PETSC_FALSE,flg_row=PETSC_TRUE;
2296da1bb401SStefano Zampini   PCBDDCGraph    mat_graph       =pcbddc->mat_graph;
2297da1bb401SStefano Zampini   PetscErrorCode ierr;
2298da1bb401SStefano Zampini 
2299da1bb401SStefano Zampini   PetscFunctionBegin;
2300da1bb401SStefano Zampini   /* get CSR adjacency from local matrix if user has not yet provided local graph using PCBDDCSetLocalAdjacencyGraph function */
2301da1bb401SStefano Zampini   if (!mat_graph->xadj) {
2302da1bb401SStefano Zampini     ierr = MatConvert(matis->A,MATMPIADJ,MAT_INITIAL_MATRIX,&mat_adj);CHKERRQ(ierr);
2303da1bb401SStefano Zampini     ierr = MatGetRowIJ(mat_adj,0,symmetrize_rowij,compressed_rowij,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr);
2304acee19a7SJed Brown     if (!flg_row) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in MatGetRowIJ()\n");
2305da1bb401SStefano Zampini     /* Get adjacency into BDDC workspace */
2306da1bb401SStefano Zampini     ierr = PCBDDCSetLocalAdjacencyGraph(pc,nvtxs,xadj,adjncy,PETSC_COPY_VALUES);CHKERRQ(ierr);
2307da1bb401SStefano Zampini     ierr = MatRestoreRowIJ(mat_adj,0,symmetrize_rowij,compressed_rowij,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr);
2308acee19a7SJed Brown     if (!flg_row) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in MatRestoreRowIJ()\n");
2309da1bb401SStefano Zampini     ierr = MatDestroy(&mat_adj);CHKERRQ(ierr);
2310da1bb401SStefano Zampini   }
2311da1bb401SStefano Zampini   PetscFunctionReturn(0);
2312da1bb401SStefano Zampini }
2313da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
23140c7d97c5SJed Brown #undef __FUNCT__
23150c7d97c5SJed Brown #define __FUNCT__ "PCBDDCApplyInterfacePreconditioner"
23162617d88aSStefano Zampini static PetscErrorCode  PCBDDCApplyInterfacePreconditioner(PC pc)
23170c7d97c5SJed Brown {
23180c7d97c5SJed Brown   PetscErrorCode    ierr;
23190c7d97c5SJed Brown   PC_BDDC           *pcbddc = (PC_BDDC*)(pc->data);
23200c7d97c5SJed Brown   PC_IS             *pcis   = (PC_IS*)(pc->data);
23213b03a366Sstefano_zampini   const PetscScalar zero     = 0.0;
23220c7d97c5SJed Brown 
23230c7d97c5SJed Brown   PetscFunctionBegin;
23240c7d97c5SJed Brown   /* Application of PHI^T  */
23250c7d97c5SJed Brown   ierr = MatMultTranspose(pcbddc->coarse_phi_B,pcis->vec1_B,pcbddc->vec1_P);CHKERRQ(ierr);
232629622bf0SStefano Zampini   if (pcbddc->inexact_prec_type) { ierr = MatMultTransposeAdd(pcbddc->coarse_phi_D,pcis->vec1_D,pcbddc->vec1_P,pcbddc->vec1_P);CHKERRQ(ierr); }
23270c7d97c5SJed Brown 
23280c7d97c5SJed Brown   /* Scatter data of coarse_rhs */
2329142dfd88SStefano Zampini   if (pcbddc->coarse_rhs) { ierr = VecSet(pcbddc->coarse_rhs,zero);CHKERRQ(ierr); }
23300c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->vec1_P,pcbddc->coarse_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
23310c7d97c5SJed Brown 
23320c7d97c5SJed Brown   /* Local solution on R nodes */
23330c7d97c5SJed Brown   ierr = VecSet(pcbddc->vec1_R,zero);CHKERRQ(ierr);
23340c7d97c5SJed Brown   ierr = VecScatterBegin(pcbddc->R_to_B,pcis->vec1_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
23350c7d97c5SJed Brown   ierr = VecScatterEnd  (pcbddc->R_to_B,pcis->vec1_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
233629622bf0SStefano Zampini   if (pcbddc->inexact_prec_type) {
23370c7d97c5SJed Brown     ierr = VecScatterBegin(pcbddc->R_to_D,pcis->vec1_D,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
23380c7d97c5SJed Brown     ierr = VecScatterEnd  (pcbddc->R_to_D,pcis->vec1_D,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
23390c7d97c5SJed Brown   }
23400c7d97c5SJed Brown   ierr = PCBDDCSolveSaddlePoint(pc);CHKERRQ(ierr);
23410c7d97c5SJed Brown   ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr);
23420c7d97c5SJed Brown   ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec2_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
23430c7d97c5SJed Brown   ierr = VecScatterEnd  (pcbddc->R_to_B,pcbddc->vec2_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
234429622bf0SStefano Zampini   if (pcbddc->inexact_prec_type) {
23450c7d97c5SJed Brown     ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec2_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
23460c7d97c5SJed Brown     ierr = VecScatterEnd  (pcbddc->R_to_D,pcbddc->vec2_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
23470c7d97c5SJed Brown   }
23480c7d97c5SJed Brown 
23490c7d97c5SJed Brown   /* Coarse solution */
23500c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataEnd(pc,pcbddc->vec1_P,pcbddc->coarse_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
23510bdf917eSStefano Zampini   if (pcbddc->coarse_rhs) {
23520bdf917eSStefano Zampini     if (pcbddc->CoarseNullSpace) {
23530bdf917eSStefano Zampini       ierr = MatNullSpaceRemove(pcbddc->CoarseNullSpace,pcbddc->coarse_rhs,PETSC_NULL);CHKERRQ(ierr);
23540bdf917eSStefano Zampini     }
23550bdf917eSStefano Zampini     ierr = KSPSolve(pcbddc->coarse_ksp,pcbddc->coarse_rhs,pcbddc->coarse_vec);CHKERRQ(ierr);
23560bdf917eSStefano Zampini     if (pcbddc->CoarseNullSpace) {
23570bdf917eSStefano Zampini       ierr = MatNullSpaceRemove(pcbddc->CoarseNullSpace,pcbddc->coarse_vec,PETSC_NULL);CHKERRQ(ierr);
23580bdf917eSStefano Zampini     }
23590bdf917eSStefano Zampini   }
23600c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
23610c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataEnd  (pc,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
23620c7d97c5SJed Brown 
23630c7d97c5SJed Brown   /* Sum contributions from two levels */
23640c7d97c5SJed Brown   ierr = MatMultAdd(pcbddc->coarse_phi_B,pcbddc->vec1_P,pcis->vec1_B,pcis->vec1_B);CHKERRQ(ierr);
236529622bf0SStefano Zampini   if (pcbddc->inexact_prec_type) { ierr = MatMultAdd(pcbddc->coarse_phi_D,pcbddc->vec1_P,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); }
23660c7d97c5SJed Brown   PetscFunctionReturn(0);
23670c7d97c5SJed Brown }
23680c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
23690c7d97c5SJed Brown #undef __FUNCT__
23700c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSolveSaddlePoint"
237153cdbc3dSStefano Zampini static PetscErrorCode  PCBDDCSolveSaddlePoint(PC pc)
23720c7d97c5SJed Brown {
23730c7d97c5SJed Brown   PetscErrorCode ierr;
23740c7d97c5SJed Brown   PC_BDDC        *pcbddc = (PC_BDDC*)(pc->data);
23750c7d97c5SJed Brown 
23760c7d97c5SJed Brown   PetscFunctionBegin;
237753cdbc3dSStefano Zampini   ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
2378534831adSStefano Zampini   if (pcbddc->local_auxmat1) {
23790c7d97c5SJed Brown     ierr = MatMult(pcbddc->local_auxmat1,pcbddc->vec2_R,pcbddc->vec1_C);CHKERRQ(ierr);
23800c7d97c5SJed Brown     ierr = MatMultAdd(pcbddc->local_auxmat2,pcbddc->vec1_C,pcbddc->vec2_R,pcbddc->vec2_R);CHKERRQ(ierr);
23810c7d97c5SJed Brown   }
23820c7d97c5SJed Brown   PetscFunctionReturn(0);
23830c7d97c5SJed Brown }
23840c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
23850c7d97c5SJed Brown #undef __FUNCT__
23860c7d97c5SJed Brown #define __FUNCT__ "PCBDDCScatterCoarseDataBegin"
238753cdbc3dSStefano Zampini static PetscErrorCode  PCBDDCScatterCoarseDataBegin(PC pc,Vec vec_from, Vec vec_to, InsertMode imode, ScatterMode smode)
23880c7d97c5SJed Brown {
23890c7d97c5SJed Brown   PetscErrorCode ierr;
23900c7d97c5SJed Brown   PC_BDDC        *pcbddc = (PC_BDDC*)(pc->data);
23910c7d97c5SJed Brown 
23920c7d97c5SJed Brown   PetscFunctionBegin;
23930c7d97c5SJed Brown   switch (pcbddc->coarse_communications_type) {
23940c7d97c5SJed Brown   case SCATTERS_BDDC:
23950c7d97c5SJed Brown     ierr = VecScatterBegin(pcbddc->coarse_loc_to_glob,vec_from,vec_to,imode,smode);CHKERRQ(ierr);
23960c7d97c5SJed Brown     break;
23970c7d97c5SJed Brown   case GATHERS_BDDC:
23980c7d97c5SJed Brown     break;
23990c7d97c5SJed Brown   }
24000c7d97c5SJed Brown   PetscFunctionReturn(0);
24010c7d97c5SJed Brown }
24020c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
24030c7d97c5SJed Brown #undef __FUNCT__
24040c7d97c5SJed Brown #define __FUNCT__ "PCBDDCScatterCoarseDataEnd"
240553cdbc3dSStefano Zampini static PetscErrorCode  PCBDDCScatterCoarseDataEnd(PC pc,Vec vec_from, Vec vec_to, InsertMode imode, ScatterMode smode)
24060c7d97c5SJed Brown {
24070c7d97c5SJed Brown   PetscErrorCode ierr;
24080c7d97c5SJed Brown   PC_BDDC        *pcbddc = (PC_BDDC*)(pc->data);
24090c7d97c5SJed Brown   PetscScalar    *array_to;
24100c7d97c5SJed Brown   PetscScalar    *array_from;
24110c7d97c5SJed Brown   MPI_Comm       comm=((PetscObject)pc)->comm;
24120c7d97c5SJed Brown   PetscInt       i;
24130c7d97c5SJed Brown 
24140c7d97c5SJed Brown   PetscFunctionBegin;
24150c7d97c5SJed Brown   switch (pcbddc->coarse_communications_type) {
24160c7d97c5SJed Brown   case SCATTERS_BDDC:
24170c7d97c5SJed Brown     ierr = VecScatterEnd(pcbddc->coarse_loc_to_glob,vec_from,vec_to,imode,smode);CHKERRQ(ierr);
24180c7d97c5SJed Brown     break;
24190c7d97c5SJed Brown   case GATHERS_BDDC:
24200c7d97c5SJed Brown     if (vec_from) VecGetArray(vec_from,&array_from);
24210c7d97c5SJed Brown     if (vec_to) VecGetArray(vec_to,&array_to);
24220c7d97c5SJed Brown     switch (pcbddc->coarse_problem_type) {
24230c7d97c5SJed Brown     case SEQUENTIAL_BDDC:
24240c7d97c5SJed Brown       if (smode == SCATTER_FORWARD) {
242553cdbc3dSStefano Zampini         ierr = MPI_Gatherv(&array_from[0],pcbddc->local_primal_size,MPIU_SCALAR,&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,0,comm);CHKERRQ(ierr);
24260c7d97c5SJed Brown         if (vec_to) {
24270bdf917eSStefano Zampini           if (imode == ADD_VALUES) {
24280bdf917eSStefano Zampini             for (i=0;i<pcbddc->replicated_primal_size;i++) {
24290c7d97c5SJed Brown               array_to[pcbddc->replicated_local_primal_indices[i]]+=pcbddc->replicated_local_primal_values[i];
24300c7d97c5SJed Brown             }
24310c7d97c5SJed Brown           } else {
24320bdf917eSStefano Zampini             for (i=0;i<pcbddc->replicated_primal_size;i++) {
24330bdf917eSStefano Zampini               array_to[pcbddc->replicated_local_primal_indices[i]]=pcbddc->replicated_local_primal_values[i];
24340bdf917eSStefano Zampini             }
24350bdf917eSStefano Zampini           }
24360bdf917eSStefano Zampini         }
24370bdf917eSStefano Zampini       } else {
24380bdf917eSStefano Zampini         if (vec_from) {
24390bdf917eSStefano Zampini           if (imode == ADD_VALUES) {
24400bdf917eSStefano Zampini             printf("Scatter mode %d, insert mode %d for case %d not implemented!\n",smode,imode,pcbddc->coarse_problem_type);
24410bdf917eSStefano Zampini           }
24420bdf917eSStefano Zampini           for (i=0;i<pcbddc->replicated_primal_size;i++) {
24430c7d97c5SJed Brown             pcbddc->replicated_local_primal_values[i]=array_from[pcbddc->replicated_local_primal_indices[i]];
24440bdf917eSStefano Zampini           }
24450bdf917eSStefano Zampini         }
244653cdbc3dSStefano Zampini         ierr = MPI_Scatterv(&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,&array_to[0],pcbddc->local_primal_size,MPIU_SCALAR,0,comm);CHKERRQ(ierr);
24470c7d97c5SJed Brown       }
24480c7d97c5SJed Brown       break;
24490c7d97c5SJed Brown     case REPLICATED_BDDC:
24500c7d97c5SJed Brown       if (smode == SCATTER_FORWARD) {
245153cdbc3dSStefano Zampini         ierr = MPI_Allgatherv(&array_from[0],pcbddc->local_primal_size,MPIU_SCALAR,&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,comm);CHKERRQ(ierr);
24520bdf917eSStefano Zampini         if (imode == ADD_VALUES) {
24530bdf917eSStefano Zampini           for (i=0;i<pcbddc->replicated_primal_size;i++) {
24540c7d97c5SJed Brown             array_to[pcbddc->replicated_local_primal_indices[i]]+=pcbddc->replicated_local_primal_values[i];
24550bdf917eSStefano Zampini           }
24560bdf917eSStefano Zampini         } else {
24570bdf917eSStefano Zampini           for (i=0;i<pcbddc->replicated_primal_size;i++) {
24580bdf917eSStefano Zampini             array_to[pcbddc->replicated_local_primal_indices[i]]=pcbddc->replicated_local_primal_values[i];
24590bdf917eSStefano Zampini           }
24600bdf917eSStefano Zampini         }
24610c7d97c5SJed Brown       } else { /* no communications needed for SCATTER_REVERSE since needed data is already present */
24620bdf917eSStefano Zampini         if (imode == ADD_VALUES) {
24630bdf917eSStefano Zampini           for (i=0;i<pcbddc->local_primal_size;i++) {
24640bdf917eSStefano Zampini             array_to[i]+=array_from[pcbddc->local_primal_indices[i]];
24650bdf917eSStefano Zampini           }
24660bdf917eSStefano Zampini         } else {
24670bdf917eSStefano Zampini           for (i=0;i<pcbddc->local_primal_size;i++) {
24680c7d97c5SJed Brown             array_to[i]=array_from[pcbddc->local_primal_indices[i]];
24690c7d97c5SJed Brown           }
24700bdf917eSStefano Zampini         }
24710bdf917eSStefano Zampini       }
24720c7d97c5SJed Brown       break;
247353cdbc3dSStefano Zampini     case MULTILEVEL_BDDC:
247453cdbc3dSStefano Zampini       break;
247553cdbc3dSStefano Zampini     case PARALLEL_BDDC:
247653cdbc3dSStefano Zampini       break;
24770c7d97c5SJed Brown     }
24780c7d97c5SJed Brown     if (vec_from) VecRestoreArray(vec_from,&array_from);
24790c7d97c5SJed Brown     if (vec_to) VecRestoreArray(vec_to,&array_to);
24800c7d97c5SJed Brown     break;
24810c7d97c5SJed Brown   }
24820c7d97c5SJed Brown   PetscFunctionReturn(0);
24830c7d97c5SJed Brown }
24840c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
24853b03a366Sstefano_zampini #undef __FUNCT__
24863b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCCreateConstraintMatrix"
24873b03a366Sstefano_zampini static PetscErrorCode PCBDDCCreateConstraintMatrix(PC pc)
24883b03a366Sstefano_zampini {
24893b03a366Sstefano_zampini   PetscErrorCode ierr;
24903b03a366Sstefano_zampini   PC_IS          *pcis    = (PC_IS*)(pc->data);
24913b03a366Sstefano_zampini   PC_BDDC        *pcbddc  = (PC_BDDC*)pc->data;
24923b03a366Sstefano_zampini   Mat_IS         *matis   = (Mat_IS*)pc->pmat->data;
249323d4d1a5SStefano Zampini   PetscInt       *nnz,*is_indices;
24943b03a366Sstefano_zampini   PetscScalar    *temp_quadrature_constraint;
2495534831adSStefano Zampini   PetscInt       *temp_indices,*temp_indices_to_constraint,*temp_indices_to_constraint_B,*local_to_B;
24963b03a366Sstefano_zampini   PetscInt       local_primal_size,i,j,k,total_counts,max_size_of_constraint;
24973b03a366Sstefano_zampini   PetscInt       n_constraints,n_vertices,size_of_constraint;
2498534831adSStefano Zampini   PetscScalar    quad_value;
24993b03a366Sstefano_zampini   PetscBool      nnsp_has_cnst=PETSC_FALSE,use_nnsp_true=pcbddc->use_nnsp_true;
25003b03a366Sstefano_zampini   PetscInt       nnsp_size    =0,nnsp_addone=0,temp_constraints,temp_start_ptr;
25013b03a366Sstefano_zampini   IS             *used_IS;
250219fd82e9SBarry Smith   MatType        impMatType=MATSEQAIJ;
25033b03a366Sstefano_zampini   PetscBLASInt   Bs,Bt,lwork,lierr;
25043b03a366Sstefano_zampini   PetscReal      tol=1.0e-8;
2505fcda91b4SJed Brown   MatNullSpace   nearnullsp;
2506fcda91b4SJed Brown   const Vec      *nearnullvecs;
25073b03a366Sstefano_zampini   Vec            *localnearnullsp;
25083b03a366Sstefano_zampini   PetscScalar    *work,*temp_basis,*array_vector,*correlation_mat;
25093b03a366Sstefano_zampini   PetscReal      *rwork,*singular_vals;
2510534831adSStefano Zampini   PetscBLASInt   Bone=1,*ipiv;
2511534831adSStefano Zampini   Vec            temp_vec;
2512534831adSStefano Zampini   Mat            temp_mat;
2513534831adSStefano Zampini   KSP            temp_ksp;
2514ffe5efe1SStefano Zampini   PC             temp_pc;
2515534831adSStefano Zampini   PetscInt       s,start_constraint,dual_dofs;
2516534831adSStefano Zampini   PetscBool      compute_submatrix,useksp=PETSC_FALSE;
2517534831adSStefano Zampini   PetscInt       *aux_primal_permutation,*aux_primal_numbering;
2518534831adSStefano Zampini   PetscBool      boolforface,*change_basis;
2519*2fa5cd67SKarl Rupp 
2520de534f79Sstefano_zampini /* some ugly conditional declarations */
25213b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
25223b03a366Sstefano_zampini   PetscScalar  dot_result;
25233b03a366Sstefano_zampini   PetscScalar  one=1.0,zero=0.0;
25243b03a366Sstefano_zampini   PetscInt     ii;
25253425bc38SStefano Zampini   PetscScalar  *singular_vectors;
25263425bc38SStefano Zampini   PetscBLASInt *iwork,*ifail;
25273425bc38SStefano Zampini   PetscReal    dummy_real,abs_tol;
25283425bc38SStefano Zampini   PetscBLASInt eigs_found;
25293b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
25303b03a366Sstefano_zampini   PetscScalar val1,val2;
25313b03a366Sstefano_zampini #endif
25323425bc38SStefano Zampini #endif
25333b03a366Sstefano_zampini   PetscBLASInt dummy_int;
25343b03a366Sstefano_zampini   PetscScalar  dummy_scalar;
25353b03a366Sstefano_zampini 
25363b03a366Sstefano_zampini   PetscFunctionBegin;
25373b03a366Sstefano_zampini   /* check if near null space is attached to global mat */
2538fcda91b4SJed Brown   ierr = MatGetNearNullSpace(pc->pmat,&nearnullsp);CHKERRQ(ierr);
2539fcda91b4SJed Brown   if (nearnullsp) {
2540fcda91b4SJed Brown     ierr = MatNullSpaceGetVecs(nearnullsp,&nnsp_has_cnst,&nnsp_size,&nearnullvecs);CHKERRQ(ierr);
25413b03a366Sstefano_zampini   } else { /* if near null space is not provided it uses constants */
25423b03a366Sstefano_zampini     nnsp_has_cnst = PETSC_TRUE;
25433b03a366Sstefano_zampini     use_nnsp_true = PETSC_TRUE;
25443b03a366Sstefano_zampini   }
2545*2fa5cd67SKarl Rupp   if (nnsp_has_cnst) nnsp_addone = 1;
2546*2fa5cd67SKarl Rupp 
25473b03a366Sstefano_zampini   /*
25483b03a366Sstefano_zampini        Evaluate maximum storage size needed by the procedure
25493b03a366Sstefano_zampini        - temp_indices will contain start index of each constraint stored as follows
25503b03a366Sstefano_zampini        - temp_indices_to_constraint  [temp_indices[i],...,temp[indices[i+1]-1] will contain the indices (in local numbering) on which the constraint acts
2551534831adSStefano Zampini        - temp_indices_to_constraint_B[temp_indices[i],...,temp[indices[i+1]-1] will contain the indices (in boundary numbering) on which the constraint acts
25523b03a366Sstefano_zampini        - temp_quadrature_constraint  [temp_indices[i],...,temp[indices[i+1]-1] will contain the scalars representing the constraint itself
25533b03a366Sstefano_zampini                                                                                                                                                          */
2554da1bb401SStefano Zampini 
25553b03a366Sstefano_zampini   total_counts  = pcbddc->n_ISForFaces+pcbddc->n_ISForEdges;
25563b03a366Sstefano_zampini   total_counts *= (nnsp_addone+nnsp_size);
2557*2fa5cd67SKarl Rupp 
2558da1bb401SStefano Zampini   ierr = ISGetSize(pcbddc->ISForVertices,&n_vertices);CHKERRQ(ierr);
2559*2fa5cd67SKarl Rupp 
2560da1bb401SStefano Zampini   total_counts += n_vertices;
2561*2fa5cd67SKarl Rupp 
25623b03a366Sstefano_zampini   ierr = PetscMalloc((total_counts+1)*sizeof(PetscInt),&temp_indices);CHKERRQ(ierr);
2563534831adSStefano Zampini   ierr = PetscMalloc((total_counts+1)*sizeof(PetscBool),&change_basis);CHKERRQ(ierr);
2564*2fa5cd67SKarl Rupp 
25653b03a366Sstefano_zampini   total_counts           = 0;
25663b03a366Sstefano_zampini   max_size_of_constraint = 0;
25673b03a366Sstefano_zampini   for (i=0;i<pcbddc->n_ISForEdges+pcbddc->n_ISForFaces;i++) {
2568*2fa5cd67SKarl Rupp     if (i<pcbddc->n_ISForEdges) used_IS = &pcbddc->ISForEdges[i];
2569*2fa5cd67SKarl Rupp     else used_IS = &pcbddc->ISForFaces[i-pcbddc->n_ISForEdges];
25703b03a366Sstefano_zampini     ierr = ISGetSize(*used_IS,&j);CHKERRQ(ierr);
25713b03a366Sstefano_zampini     total_counts += j;
25723b03a366Sstefano_zampini     if (j>max_size_of_constraint) max_size_of_constraint=j;
25733b03a366Sstefano_zampini   }
25743b03a366Sstefano_zampini   total_counts *= (nnsp_addone+nnsp_size);
2575da1bb401SStefano Zampini   total_counts += n_vertices;
2576*2fa5cd67SKarl Rupp 
25773b03a366Sstefano_zampini   ierr = PetscMalloc(total_counts*sizeof(PetscScalar),&temp_quadrature_constraint);CHKERRQ(ierr);
25783b03a366Sstefano_zampini   ierr = PetscMalloc(total_counts*sizeof(PetscInt),&temp_indices_to_constraint);CHKERRQ(ierr);
2579534831adSStefano Zampini   ierr = PetscMalloc(total_counts*sizeof(PetscInt),&temp_indices_to_constraint_B);CHKERRQ(ierr);
2580534831adSStefano Zampini   ierr = PetscMalloc(pcis->n*sizeof(PetscInt),&local_to_B);CHKERRQ(ierr);
2581534831adSStefano Zampini   ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2582*2fa5cd67SKarl Rupp 
2583*2fa5cd67SKarl Rupp   for (i=0;i<pcis->n;i++) local_to_B[i]=-1;
2584*2fa5cd67SKarl Rupp   for (i=0;i<pcis->n_B;i++) local_to_B[is_indices[i]]=i;
2585534831adSStefano Zampini   ierr = ISRestoreIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2586534831adSStefano Zampini 
25873b03a366Sstefano_zampini   /* First we issue queries to allocate optimal workspace for LAPACKgesvd or LAPACKsyev/LAPACKheev */
25883b03a366Sstefano_zampini   rwork           = 0;
25893b03a366Sstefano_zampini   work            = 0;
25903b03a366Sstefano_zampini   singular_vals   = 0;
25913b03a366Sstefano_zampini   temp_basis      = 0;
25923b03a366Sstefano_zampini   correlation_mat = 0;
25933b03a366Sstefano_zampini   if (!pcbddc->use_nnsp_true) {
25943b03a366Sstefano_zampini     PetscScalar temp_work;
25953b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
25963b03a366Sstefano_zampini     /* POD */
25973b03a366Sstefano_zampini     PetscInt max_n;
25983b03a366Sstefano_zampini     max_n = nnsp_addone+nnsp_size;
25993b03a366Sstefano_zampini     /* using some techniques borrowed from Proper Orthogonal Decomposition */
26003b03a366Sstefano_zampini     ierr = PetscMalloc(max_n*max_n*sizeof(PetscScalar),&correlation_mat);CHKERRQ(ierr);
26013425bc38SStefano Zampini     ierr = PetscMalloc(max_n*max_n*sizeof(PetscScalar),&singular_vectors);CHKERRQ(ierr);
26023b03a366Sstefano_zampini     ierr = PetscMalloc(max_n*sizeof(PetscReal),&singular_vals);CHKERRQ(ierr);
26033b03a366Sstefano_zampini     ierr = PetscMalloc(max_size_of_constraint*(nnsp_addone+nnsp_size)*sizeof(PetscScalar),&temp_basis);CHKERRQ(ierr);
26043b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
26053b03a366Sstefano_zampini     ierr = PetscMalloc(3*max_n*sizeof(PetscReal),&rwork);CHKERRQ(ierr);
26063b03a366Sstefano_zampini #endif
26073425bc38SStefano Zampini     ierr = PetscMalloc(5*max_n*sizeof(PetscBLASInt),&iwork);CHKERRQ(ierr);
26083425bc38SStefano Zampini     ierr = PetscMalloc(max_n*sizeof(PetscBLASInt),&ifail);CHKERRQ(ierr);
26093b03a366Sstefano_zampini     /* now we evaluate the optimal workspace using query with lwork=-1 */
2610c5df96a5SBarry Smith     ierr  = PetscBLASIntCast(max_n,&Bt);CHKERRQ(ierr);
26113b03a366Sstefano_zampini     lwork =-1;
26123425bc38SStefano Zampini     ierr  = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
26133b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
26143425bc38SStefano Zampini     abs_tol=1.e-8;
26153425bc38SStefano Zampini     LAPACKsyevx_("V","A","U",&Bt,correlation_mat,&Bt,&dummy_real,&dummy_real,&dummy_int,&dummy_int,
26163425bc38SStefano Zampini                  &abs_tol,&eigs_found,singular_vals,singular_vectors,&Bt,&temp_work,&lwork,iwork,ifail,&lierr);
26173b03a366Sstefano_zampini #else
26183425bc38SStefano Zampini     SETERRQ(((PetscObject) pc)->comm, PETSC_ERR_SUP, "Not yet implemented for complexes when PETSC_MISSING_GESVD = 1");
26193b03a366Sstefano_zampini #endif
26203425bc38SStefano Zampini     if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SYEVX Lapack routine %d",(int)lierr);
26213425bc38SStefano Zampini     ierr = PetscFPTrapPop();CHKERRQ(ierr);
26223b03a366Sstefano_zampini #else /* on missing GESVD */
26233b03a366Sstefano_zampini       /* SVD */
26243b03a366Sstefano_zampini     PetscInt max_n,min_n;
26253b03a366Sstefano_zampini     max_n = max_size_of_constraint;
26263b03a366Sstefano_zampini     min_n = nnsp_addone+nnsp_size;
26273b03a366Sstefano_zampini     if (max_size_of_constraint < (nnsp_addone+nnsp_size)) {
26283b03a366Sstefano_zampini       min_n = max_size_of_constraint;
26293b03a366Sstefano_zampini       max_n = nnsp_addone+nnsp_size;
26303b03a366Sstefano_zampini     }
26313b03a366Sstefano_zampini     ierr = PetscMalloc(min_n*sizeof(PetscReal),&singular_vals);CHKERRQ(ierr);
26323b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
26333b03a366Sstefano_zampini     ierr = PetscMalloc(5*min_n*sizeof(PetscReal),&rwork);CHKERRQ(ierr);
26343b03a366Sstefano_zampini #endif
26353b03a366Sstefano_zampini     /* now we evaluate the optimal workspace using query with lwork=-1 */
26363b03a366Sstefano_zampini     lwork     =-1;
2637c5df96a5SBarry Smith     ierr      = PetscBLASIntCast(max_n,&Bs);CHKERRQ(ierr);
2638c5df96a5SBarry Smith     ierr      = PetscBLASIntCast(min_n,&Bt);CHKERRQ(ierr);
26393b03a366Sstefano_zampini     dummy_int = Bs;
2640670f3ff9SJed Brown     ierr      = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
26413b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
26423b03a366Sstefano_zampini     LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[0],&Bs,singular_vals,
26433b03a366Sstefano_zampini                  &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,&temp_work,&lwork,&lierr);
26443b03a366Sstefano_zampini #else
26453b03a366Sstefano_zampini     LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[0],&Bs,singular_vals,
26463b03a366Sstefano_zampini                  &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,&temp_work,&lwork,rwork,&lierr);
26473b03a366Sstefano_zampini #endif
26483b03a366Sstefano_zampini     if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SVD Lapack routine %d",(int)lierr);
2649670f3ff9SJed Brown     ierr = PetscFPTrapPop();CHKERRQ(ierr);
26503b03a366Sstefano_zampini #endif
26513b03a366Sstefano_zampini     /* Allocate optimal workspace */
2652c5df96a5SBarry Smith     ierr         = PetscBLASIntCast((PetscInt)PetscRealPart(temp_work),&lwork);CHKERRQ(ierr);
26533b03a366Sstefano_zampini     total_counts = (PetscInt)lwork;
26543b03a366Sstefano_zampini     ierr         = PetscMalloc(total_counts*sizeof(PetscScalar),&work);CHKERRQ(ierr);
26553b03a366Sstefano_zampini   }
26563b03a366Sstefano_zampini   /* get local part of global near null space vectors */
26573b03a366Sstefano_zampini   ierr = PetscMalloc(nnsp_size*sizeof(Vec),&localnearnullsp);CHKERRQ(ierr);
26583b03a366Sstefano_zampini   for (k=0; k<nnsp_size; k++) {
26593b03a366Sstefano_zampini     ierr = VecDuplicate(pcis->vec1_N,&localnearnullsp[k]);CHKERRQ(ierr);
2660fcda91b4SJed Brown     ierr = VecScatterBegin(matis->ctx,nearnullvecs[k],localnearnullsp[k],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
2661fcda91b4SJed Brown     ierr = VecScatterEnd  (matis->ctx,nearnullvecs[k],localnearnullsp[k],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
26623b03a366Sstefano_zampini   }
26633b03a366Sstefano_zampini   /* Now we can loop on constraining sets */
26643b03a366Sstefano_zampini   total_counts   =0;
26653b03a366Sstefano_zampini   temp_indices[0]=0;
2666da1bb401SStefano Zampini   /* vertices */
2667da1bb401SStefano Zampini   PetscBool used_vertex;
2668da1bb401SStefano Zampini   ierr = ISGetIndices(pcbddc->ISForVertices,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2669da1bb401SStefano Zampini   if (nnsp_has_cnst) { /* consider all vertices */
2670da1bb401SStefano Zampini     for (i=0; i<n_vertices; i++) {
2671da1bb401SStefano Zampini       temp_indices_to_constraint[temp_indices[total_counts]]  = is_indices[i];
2672534831adSStefano Zampini       temp_indices_to_constraint_B[temp_indices[total_counts]]= local_to_B[is_indices[i]];
2673da1bb401SStefano Zampini       temp_quadrature_constraint[temp_indices[total_counts]]  = 1.0;
2674da1bb401SStefano Zampini       temp_indices[total_counts+1]                            = temp_indices[total_counts]+1;
2675534831adSStefano Zampini       change_basis[total_counts]                              = PETSC_FALSE;
2676da1bb401SStefano Zampini       total_counts++;
2677da1bb401SStefano Zampini     }
2678da1bb401SStefano Zampini   } else { /* consider vertices for which exist at least a localnearnullsp which is not null there */
2679da1bb401SStefano Zampini     for (i=0; i<n_vertices; i++) {
2680da1bb401SStefano Zampini       used_vertex = PETSC_FALSE;
2681da1bb401SStefano Zampini       k           = 0;
2682da1bb401SStefano Zampini       while (!used_vertex && k<nnsp_size) {
2683da1bb401SStefano Zampini         ierr = VecGetArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
2684da1bb401SStefano Zampini         if (PetscAbsScalar(array_vector[is_indices[i]])>0.0) {
2685da1bb401SStefano Zampini           temp_indices_to_constraint[temp_indices[total_counts]]  =is_indices[i];
2686534831adSStefano Zampini           temp_indices_to_constraint_B[temp_indices[total_counts]]=local_to_B[is_indices[i]];
2687da1bb401SStefano Zampini           temp_quadrature_constraint[temp_indices[total_counts]]  =1.0;
2688da1bb401SStefano Zampini           temp_indices[total_counts+1]                            =temp_indices[total_counts]+1;
2689534831adSStefano Zampini           change_basis[total_counts]                              =PETSC_FALSE;
2690da1bb401SStefano Zampini           total_counts++;
2691da1bb401SStefano Zampini           used_vertex=PETSC_TRUE;
2692da1bb401SStefano Zampini         }
2693da1bb401SStefano Zampini         ierr = VecRestoreArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
2694da1bb401SStefano Zampini         k++;
2695da1bb401SStefano Zampini       }
2696da1bb401SStefano Zampini     }
2697da1bb401SStefano Zampini   }
2698da1bb401SStefano Zampini   ierr       = ISRestoreIndices(pcbddc->ISForVertices,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2699da1bb401SStefano Zampini   n_vertices = total_counts;
2700*2fa5cd67SKarl Rupp 
2701da1bb401SStefano Zampini   /* edges and faces */
27023b03a366Sstefano_zampini   for (i=0; i<pcbddc->n_ISForEdges+pcbddc->n_ISForFaces; i++) {
27033b03a366Sstefano_zampini     if (i<pcbddc->n_ISForEdges) {
27043b03a366Sstefano_zampini       used_IS     = &pcbddc->ISForEdges[i];
2705534831adSStefano Zampini       boolforface = pcbddc->usechangeofbasis;
27063b03a366Sstefano_zampini     } else {
27073b03a366Sstefano_zampini       used_IS     = &pcbddc->ISForFaces[i-pcbddc->n_ISForEdges];
2708534831adSStefano Zampini       boolforface = pcbddc->usechangeonfaces;
27093b03a366Sstefano_zampini     }
27103b03a366Sstefano_zampini     temp_constraints = 0;          /* zero the number of constraints I have on this conn comp */
27113b03a366Sstefano_zampini     temp_start_ptr   = total_counts; /* need to know the starting index of constraints stored */
27123b03a366Sstefano_zampini     ierr             = ISGetSize(*used_IS,&size_of_constraint);CHKERRQ(ierr);
27133b03a366Sstefano_zampini     ierr             = ISGetIndices(*used_IS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
27143b03a366Sstefano_zampini     if (nnsp_has_cnst) {
27153b03a366Sstefano_zampini       temp_constraints++;
2716534831adSStefano Zampini       quad_value = (PetscScalar) (1.0/PetscSqrtReal((PetscReal)size_of_constraint));
27173b03a366Sstefano_zampini       for (j=0; j<size_of_constraint; j++) {
27183b03a366Sstefano_zampini         temp_indices_to_constraint[temp_indices[total_counts]+j]  =is_indices[j];
2719534831adSStefano Zampini         temp_indices_to_constraint_B[temp_indices[total_counts]+j]=local_to_B[is_indices[j]];
27203b03a366Sstefano_zampini         temp_quadrature_constraint[temp_indices[total_counts]+j]  =quad_value;
27213b03a366Sstefano_zampini       }
27223b03a366Sstefano_zampini       temp_indices[total_counts+1]=temp_indices[total_counts]+size_of_constraint;  /* store new starting point */
2723534831adSStefano Zampini       change_basis[total_counts]  =boolforface;
27243b03a366Sstefano_zampini       total_counts++;
27253b03a366Sstefano_zampini     }
27263b03a366Sstefano_zampini     for (k=0; k<nnsp_size; k++) {
27273b03a366Sstefano_zampini       ierr = VecGetArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
27283b03a366Sstefano_zampini       for (j=0; j<size_of_constraint; j++) {
27293b03a366Sstefano_zampini         temp_indices_to_constraint[temp_indices[total_counts]+j]  =is_indices[j];
2730534831adSStefano Zampini         temp_indices_to_constraint_B[temp_indices[total_counts]+j]=local_to_B[is_indices[j]];
27313b03a366Sstefano_zampini         temp_quadrature_constraint[temp_indices[total_counts]+j]  =array_vector[is_indices[j]];
27323b03a366Sstefano_zampini       }
27333b03a366Sstefano_zampini       ierr       = VecRestoreArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
2734de534f79Sstefano_zampini       quad_value = 1.0;
2735de534f79Sstefano_zampini       if (use_nnsp_true) { /* check if array is null on the connected component in case use_nnsp_true has been requested */
2736c5df96a5SBarry Smith         ierr       = PetscBLASIntCast(size_of_constraint,&Bs);CHKERRQ(ierr);
2737de534f79Sstefano_zampini         quad_value = BLASasum_(&Bs,&temp_quadrature_constraint[temp_indices[total_counts]],&Bone);
2738de534f79Sstefano_zampini       }
2739de534f79Sstefano_zampini       if (quad_value > 0.0) { /* keep indices and values */
2740de534f79Sstefano_zampini         temp_constraints++;
27413b03a366Sstefano_zampini         temp_indices[total_counts+1]=temp_indices[total_counts]+size_of_constraint;  /* store new starting point */
2742534831adSStefano Zampini         change_basis[total_counts]  =boolforface;
27433b03a366Sstefano_zampini         total_counts++;
27443b03a366Sstefano_zampini       }
2745de534f79Sstefano_zampini     }
27463b03a366Sstefano_zampini     ierr = ISRestoreIndices(*used_IS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2747de534f79Sstefano_zampini     /* perform SVD on the constraint if use_nnsp_true has not been requested by the user */
27483b03a366Sstefano_zampini     if (!use_nnsp_true) {
2749c5df96a5SBarry Smith       ierr = PetscBLASIntCast(size_of_constraint,&Bs);CHKERRQ(ierr);
2750c5df96a5SBarry Smith       ierr = PetscBLASIntCast(temp_constraints,&Bt);CHKERRQ(ierr);
2751de534f79Sstefano_zampini 
27523b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
27533b03a366Sstefano_zampini       ierr = PetscMemzero(correlation_mat,Bt*Bt*sizeof(PetscScalar));CHKERRQ(ierr);
27543b03a366Sstefano_zampini       /* Store upper triangular part of correlation matrix */
27553b03a366Sstefano_zampini       for (j=0; j<temp_constraints; j++) {
27563b03a366Sstefano_zampini         for (k=0; k<j+1; k++) {
27573b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
27583425bc38SStefano Zampini           /* hand made complex dot product -> replace */
27593b03a366Sstefano_zampini           dot_result = 0.0;
27603b03a366Sstefano_zampini           for (ii=0; ii<size_of_constraint; ii++) {
27613b03a366Sstefano_zampini             val1        = temp_quadrature_constraint[temp_indices[temp_start_ptr+j]+ii];
27623b03a366Sstefano_zampini             val2        = temp_quadrature_constraint[temp_indices[temp_start_ptr+k]+ii];
27633b03a366Sstefano_zampini             dot_result += val1*PetscConj(val2);
27643b03a366Sstefano_zampini           }
27653b03a366Sstefano_zampini #else
27663b03a366Sstefano_zampini           dot_result = BLASdot_(&Bs,&temp_quadrature_constraint[temp_indices[temp_start_ptr+j]],&Bone,
27673b03a366Sstefano_zampini                                     &temp_quadrature_constraint[temp_indices[temp_start_ptr+k]],&Bone);
27683b03a366Sstefano_zampini #endif
27693b03a366Sstefano_zampini           correlation_mat[j*temp_constraints+k]=dot_result;
27703b03a366Sstefano_zampini         }
27713b03a366Sstefano_zampini       }
27723425bc38SStefano Zampini       ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
27733b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
27743425bc38SStefano Zampini /*      LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,work,&lwork,&lierr); */
27753425bc38SStefano Zampini       LAPACKsyevx_("V","A","U",&Bt,correlation_mat,&Bt,&dummy_real,&dummy_real,&dummy_int,&dummy_int,
27763425bc38SStefano Zampini                    &abs_tol,&eigs_found,singular_vals,singular_vectors,&Bt,work,&lwork,iwork,ifail,&lierr);
27773b03a366Sstefano_zampini #else
27783425bc38SStefano Zampini /*  LAPACK call is missing here! TODO */
27793425bc38SStefano Zampini       SETERRQ(((PetscObject) pc)->comm, PETSC_ERR_SUP, "Not yet implemented for complexes when PETSC_MISSING_GESVD = 1");
27803b03a366Sstefano_zampini #endif
27813425bc38SStefano Zampini       if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYEVX Lapack routine %d",(int)lierr);
27823425bc38SStefano Zampini       ierr = PetscFPTrapPop();CHKERRQ(ierr);
27833b03a366Sstefano_zampini       /* retain eigenvalues greater than tol: note that lapack SYEV gives eigs in ascending order */
27843b03a366Sstefano_zampini       j=0;
27853b03a366Sstefano_zampini       while (j < Bt && singular_vals[j] < tol) j++;
27863b03a366Sstefano_zampini       total_counts=total_counts-j;
27873b03a366Sstefano_zampini       if (j<temp_constraints) {
2788*2fa5cd67SKarl Rupp         for (k=j;k<Bt;k++) singular_vals[k]=1.0/PetscSqrtReal(singular_vals[k]);
27893425bc38SStefano Zampini         ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
27903b03a366Sstefano_zampini         BLASgemm_("N","N",&Bs,&Bt,&Bt,&one,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,correlation_mat,&Bt,&zero,temp_basis,&Bs);
27913425bc38SStefano Zampini         ierr = PetscFPTrapPop();CHKERRQ(ierr);
27923b03a366Sstefano_zampini         /* copy POD basis into used quadrature memory */
27933b03a366Sstefano_zampini         for (k=0;k<Bt-j;k++) {
27943b03a366Sstefano_zampini           for (ii=0;ii<size_of_constraint;ii++) {
27953b03a366Sstefano_zampini             temp_quadrature_constraint[temp_indices[temp_start_ptr+k]+ii]=singular_vals[Bt-1-k]*temp_basis[(Bt-1-k)*size_of_constraint+ii];
27963b03a366Sstefano_zampini           }
27973b03a366Sstefano_zampini         }
27983b03a366Sstefano_zampini       }
2799de534f79Sstefano_zampini 
28003b03a366Sstefano_zampini #else  /* on missing GESVD */
28013b03a366Sstefano_zampini       PetscInt min_n = temp_constraints;
28023b03a366Sstefano_zampini       if (min_n > size_of_constraint) min_n = size_of_constraint;
28033b03a366Sstefano_zampini       dummy_int = Bs;
2804670f3ff9SJed Brown       ierr      = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
28053b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
28063b03a366Sstefano_zampini       LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,singular_vals,
28073b03a366Sstefano_zampini                    &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,work,&lwork,&lierr);
28083b03a366Sstefano_zampini #else
28093b03a366Sstefano_zampini       LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,singular_vals,
28103b03a366Sstefano_zampini                    &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,work,&lwork,rwork,&lierr);
28113b03a366Sstefano_zampini #endif
28123b03a366Sstefano_zampini       if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SVD Lapack routine %d",(int)lierr);
2813670f3ff9SJed Brown       ierr = PetscFPTrapPop();CHKERRQ(ierr);
28143b03a366Sstefano_zampini       /* retain singular values greater than tol: note that LAPACK GESVD returns singular values in descending order */
28153b03a366Sstefano_zampini       j=0;
28163b03a366Sstefano_zampini       while (j < min_n && singular_vals[min_n-j-1] < tol) j++;
28173b03a366Sstefano_zampini       total_counts = total_counts-(PetscInt)Bt+(min_n-j);
28183b03a366Sstefano_zampini #endif
28193b03a366Sstefano_zampini     }
28203b03a366Sstefano_zampini   }
2821534831adSStefano Zampini 
2822da1bb401SStefano Zampini   n_constraints     =total_counts-n_vertices;
2823da1bb401SStefano Zampini   local_primal_size = total_counts;
28243b03a366Sstefano_zampini   /* set quantities in pcbddc data structure */
28253b03a366Sstefano_zampini   pcbddc->n_vertices        = n_vertices;
28263b03a366Sstefano_zampini   pcbddc->n_constraints     = n_constraints;
2827da1bb401SStefano Zampini   pcbddc->local_primal_size = local_primal_size;
2828534831adSStefano Zampini 
2829534831adSStefano Zampini   /* Create constraint matrix */
2830534831adSStefano Zampini   /* The constraint matrix is used to compute the l2g map of primal dofs */
2831534831adSStefano Zampini   /* so we need to set it up properly either with or without change of basis */
2832534831adSStefano Zampini   ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->ConstraintMatrix);CHKERRQ(ierr);
2833534831adSStefano Zampini   ierr = MatSetType(pcbddc->ConstraintMatrix,impMatType);CHKERRQ(ierr);
2834534831adSStefano Zampini   ierr = MatSetSizes(pcbddc->ConstraintMatrix,local_primal_size,pcis->n,local_primal_size,pcis->n);CHKERRQ(ierr);
2835*2fa5cd67SKarl Rupp 
2836534831adSStefano Zampini   /* compute a local numbering of constraints : vertices first then constraints */
2837534831adSStefano Zampini   ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
2838534831adSStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array_vector);CHKERRQ(ierr);
2839534831adSStefano Zampini   ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&aux_primal_numbering);CHKERRQ(ierr);
2840534831adSStefano Zampini   ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&aux_primal_permutation);CHKERRQ(ierr);
2841*2fa5cd67SKarl Rupp 
2842534831adSStefano Zampini   total_counts=0;
2843*2fa5cd67SKarl Rupp 
2844534831adSStefano Zampini   /* find vertices: subdomain corners plus dofs with basis changed */
2845534831adSStefano Zampini   for (i=0; i<local_primal_size; i++) {
2846534831adSStefano Zampini     size_of_constraint=temp_indices[i+1]-temp_indices[i];
2847534831adSStefano Zampini     if (change_basis[i] || size_of_constraint == 1) {
2848534831adSStefano Zampini       k=0;
2849534831adSStefano Zampini       while (k < size_of_constraint && array_vector[temp_indices_to_constraint[temp_indices[i]+size_of_constraint-k-1]] != 0.0) {
2850534831adSStefano Zampini         k=k+1;
2851534831adSStefano Zampini       }
2852534831adSStefano Zampini       j = temp_indices_to_constraint[temp_indices[i]+size_of_constraint-k-1];
2853*2fa5cd67SKarl Rupp 
2854534831adSStefano Zampini       array_vector[j]                      = 1.0;
2855534831adSStefano Zampini       aux_primal_numbering[total_counts]   = j;
2856534831adSStefano Zampini       aux_primal_permutation[total_counts] = total_counts;
2857534831adSStefano Zampini       total_counts++;
2858534831adSStefano Zampini     }
2859534831adSStefano Zampini   }
2860534831adSStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array_vector);CHKERRQ(ierr);
2861534831adSStefano Zampini   /* permute indices in order to have a sorted set of vertices */
2862534831adSStefano Zampini   ierr = PetscSortIntWithPermutation(total_counts,aux_primal_numbering,aux_primal_permutation);
2863534831adSStefano Zampini   /* nonzero structure */
2864534831adSStefano Zampini   ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
2865*2fa5cd67SKarl Rupp   for (i=0;i<total_counts;i++) nnz[i]=1;
2866*2fa5cd67SKarl Rupp 
2867534831adSStefano Zampini   j=total_counts;
2868534831adSStefano Zampini   for (i=n_vertices; i<local_primal_size; i++) {
2869534831adSStefano Zampini     if (!change_basis[i]) {
2870534831adSStefano Zampini       nnz[j]=temp_indices[i+1]-temp_indices[i];
2871534831adSStefano Zampini       j++;
2872534831adSStefano Zampini     }
2873534831adSStefano Zampini   }
2874534831adSStefano Zampini   ierr = MatSeqAIJSetPreallocation(pcbddc->ConstraintMatrix,0,nnz);CHKERRQ(ierr);
2875534831adSStefano Zampini   ierr = PetscFree(nnz);CHKERRQ(ierr);
2876534831adSStefano Zampini   /* set values in constraint matrix */
2877534831adSStefano Zampini   for (i=0; i<total_counts; i++) {
2878534831adSStefano Zampini     j    = aux_primal_permutation[i];
2879534831adSStefano Zampini     k    = aux_primal_numbering[j];
2880534831adSStefano Zampini     ierr = MatSetValue(pcbddc->ConstraintMatrix,i,k,1.0,INSERT_VALUES);CHKERRQ(ierr);
2881534831adSStefano Zampini   }
2882534831adSStefano Zampini   for (i=n_vertices; i<local_primal_size; i++) {
2883534831adSStefano Zampini     if (!change_basis[i]) {
2884534831adSStefano Zampini       size_of_constraint = temp_indices[i+1]-temp_indices[i];
2885534831adSStefano Zampini       ierr               = MatSetValues(pcbddc->ConstraintMatrix,1,&total_counts,size_of_constraint,&temp_indices_to_constraint[temp_indices[i]],&temp_quadrature_constraint[temp_indices[i]],INSERT_VALUES);CHKERRQ(ierr);
2886534831adSStefano Zampini       total_counts++;
2887534831adSStefano Zampini     }
2888534831adSStefano Zampini   }
2889534831adSStefano Zampini   ierr = PetscFree(aux_primal_numbering);CHKERRQ(ierr);
2890534831adSStefano Zampini   ierr = PetscFree(aux_primal_permutation);CHKERRQ(ierr);
2891534831adSStefano Zampini   /* assembling */
2892534831adSStefano Zampini   ierr = MatAssemblyBegin(pcbddc->ConstraintMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2893534831adSStefano Zampini   ierr = MatAssemblyEnd(pcbddc->ConstraintMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2894534831adSStefano Zampini 
2895534831adSStefano Zampini   /* Create matrix for change of basis. We don't need it in case pcbddc->usechangeofbasis is FALSE */
2896534831adSStefano Zampini   if (pcbddc->usechangeofbasis) {
2897534831adSStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr);
2898534831adSStefano Zampini     ierr = MatSetType(pcbddc->ChangeOfBasisMatrix,impMatType);CHKERRQ(ierr);
2899534831adSStefano Zampini     ierr = MatSetSizes(pcbddc->ChangeOfBasisMatrix,pcis->n_B,pcis->n_B,pcis->n_B,pcis->n_B);CHKERRQ(ierr);
2900534831adSStefano Zampini     /* work arrays */
2901534831adSStefano Zampini     /* we need to reuse these arrays, so we free them */
2902534831adSStefano Zampini     ierr = PetscFree(temp_basis);CHKERRQ(ierr);
2903534831adSStefano Zampini     ierr = PetscFree(work);CHKERRQ(ierr);
2904534831adSStefano Zampini     ierr = PetscMalloc(pcis->n_B*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
2905534831adSStefano Zampini     ierr = PetscMalloc((nnsp_addone+nnsp_size)*(nnsp_addone+nnsp_size)*sizeof(PetscScalar),&temp_basis);CHKERRQ(ierr);
2906534831adSStefano Zampini     ierr = PetscMalloc((nnsp_addone+nnsp_size)*sizeof(PetscScalar),&work);CHKERRQ(ierr);
2907534831adSStefano Zampini     ierr = PetscMalloc((nnsp_addone+nnsp_size)*sizeof(PetscBLASInt),&ipiv);CHKERRQ(ierr);
2908*2fa5cd67SKarl Rupp     for (i=0;i<pcis->n_B;i++) nnz[i]=1;
2909*2fa5cd67SKarl Rupp 
2910534831adSStefano Zampini     /* Overestimated nonzeros per row */
2911534831adSStefano Zampini     k=1;
2912534831adSStefano Zampini     for (i=pcbddc->n_vertices;i<local_primal_size;i++) {
2913534831adSStefano Zampini       if (change_basis[i]) {
2914534831adSStefano Zampini         size_of_constraint = temp_indices[i+1]-temp_indices[i];
2915*2fa5cd67SKarl Rupp         if (k < size_of_constraint) k = size_of_constraint;
2916*2fa5cd67SKarl Rupp 
2917534831adSStefano Zampini         for (j=0;j<size_of_constraint;j++) {
2918534831adSStefano Zampini           nnz[temp_indices_to_constraint_B[temp_indices[i]+j]] = size_of_constraint;
2919534831adSStefano Zampini         }
2920534831adSStefano Zampini       }
2921534831adSStefano Zampini     }
2922534831adSStefano Zampini     ierr = MatSeqAIJSetPreallocation(pcbddc->ChangeOfBasisMatrix,0,nnz);CHKERRQ(ierr);
2923534831adSStefano Zampini     ierr = PetscFree(nnz);CHKERRQ(ierr);
2924534831adSStefano Zampini     /* Temporary array to store indices */
2925534831adSStefano Zampini     ierr = PetscMalloc(k*sizeof(PetscInt),&is_indices);CHKERRQ(ierr);
2926534831adSStefano Zampini     /* Set initial identity in the matrix */
2927534831adSStefano Zampini     for (i=0; i<pcis->n_B; i++) {
2928534831adSStefano Zampini       ierr = MatSetValue(pcbddc->ChangeOfBasisMatrix,i,i,1.0,INSERT_VALUES);CHKERRQ(ierr);
2929534831adSStefano Zampini     }
2930534831adSStefano Zampini     /* Now we loop on the constraints which need a change of basis */
2931534831adSStefano Zampini     /* Change of basis matrix is evaluated as the FIRST APPROACH in */
2932534831adSStefano Zampini     /* Klawonn and Widlund, Dual-primal FETI-DP methods for linear elasticity, (6.2.1) */
2933534831adSStefano Zampini     temp_constraints = 0;
293493dc3b60SStefano Zampini     if (pcbddc->n_vertices < local_primal_size) {
2935534831adSStefano Zampini       temp_start_ptr = temp_indices_to_constraint_B[temp_indices[pcbddc->n_vertices]];
293693dc3b60SStefano Zampini     }
2937534831adSStefano Zampini     for (i=pcbddc->n_vertices; i<local_primal_size; i++) {
2938534831adSStefano Zampini       if (change_basis[i]) {
2939534831adSStefano Zampini         compute_submatrix = PETSC_FALSE;
2940534831adSStefano Zampini         useksp            = PETSC_FALSE;
2941534831adSStefano Zampini         if (temp_start_ptr == temp_indices_to_constraint_B[temp_indices[i]]) {
2942534831adSStefano Zampini           temp_constraints++;
294304eaf177SStefano Zampini           if (i == local_primal_size -1 ||  temp_start_ptr != temp_indices_to_constraint_B[temp_indices[i+1]]) {
2944534831adSStefano Zampini             compute_submatrix = PETSC_TRUE;
2945534831adSStefano Zampini           }
2946534831adSStefano Zampini         }
2947534831adSStefano Zampini         if (compute_submatrix) {
2948*2fa5cd67SKarl Rupp           if (temp_constraints > 1 || pcbddc->use_nnsp_true) useksp = PETSC_TRUE;
2949534831adSStefano Zampini           size_of_constraint = temp_indices[i+1]-temp_indices[i];
2950534831adSStefano Zampini           if (useksp) { /* experimental */
2951534831adSStefano Zampini             ierr = MatCreate(PETSC_COMM_SELF,&temp_mat);CHKERRQ(ierr);
2952534831adSStefano Zampini             ierr = MatSetType(temp_mat,impMatType);CHKERRQ(ierr);
2953534831adSStefano Zampini             ierr = MatSetSizes(temp_mat,size_of_constraint,size_of_constraint,size_of_constraint,size_of_constraint);CHKERRQ(ierr);
2954534831adSStefano Zampini             ierr = MatSeqAIJSetPreallocation(temp_mat,size_of_constraint,PETSC_NULL);CHKERRQ(ierr);
2955534831adSStefano Zampini           }
2956534831adSStefano Zampini           /* First _size_of_constraint-temp_constraints_ columns */
2957534831adSStefano Zampini           dual_dofs        = size_of_constraint-temp_constraints;
2958534831adSStefano Zampini           start_constraint = i+1-temp_constraints;
2959534831adSStefano Zampini           for (s=0; s<dual_dofs; s++) {
2960534831adSStefano Zampini             is_indices[0] = s;
2961534831adSStefano Zampini             for (j=0;j<temp_constraints;j++) {
2962534831adSStefano Zampini               for (k=0;k<temp_constraints;k++) {
2963534831adSStefano Zampini                 temp_basis[j*temp_constraints+k]=temp_quadrature_constraint[temp_indices[start_constraint+k]+s+j+1];
2964534831adSStefano Zampini               }
2965534831adSStefano Zampini               work[j]         = -temp_quadrature_constraint[temp_indices[start_constraint+j]+s];
2966534831adSStefano Zampini               is_indices[j+1] = s+j+1;
2967534831adSStefano Zampini             }
2968534831adSStefano Zampini             Bt   = temp_constraints;
2969534831adSStefano Zampini             ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
2970534831adSStefano Zampini             LAPACKgesv_(&Bt,&Bone,temp_basis,&Bt,ipiv,work,&Bt,&lierr);
2971534831adSStefano Zampini             if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GESV Lapack routine %d",(int)lierr);
2972534831adSStefano Zampini             ierr = PetscFPTrapPop();CHKERRQ(ierr);
2973534831adSStefano Zampini             j    = temp_indices_to_constraint_B[temp_indices[start_constraint]+s];
2974534831adSStefano Zampini             ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,temp_constraints,&temp_indices_to_constraint_B[temp_indices[start_constraint]+s+1],1,&j,work,INSERT_VALUES);CHKERRQ(ierr);
2975534831adSStefano Zampini             if (useksp) {
2976534831adSStefano Zampini               /* temp mat with transposed rows and columns */
2977534831adSStefano Zampini               ierr = MatSetValues(temp_mat,1,&s,temp_constraints,&is_indices[1],work,INSERT_VALUES);CHKERRQ(ierr);
2978534831adSStefano Zampini               ierr = MatSetValue(temp_mat,is_indices[0],is_indices[0],1.0,INSERT_VALUES);CHKERRQ(ierr);
2979534831adSStefano Zampini             }
2980534831adSStefano Zampini           }
2981534831adSStefano Zampini           if (useksp) {
2982534831adSStefano Zampini             /* last rows of temp_mat */
2983*2fa5cd67SKarl Rupp             for (j=0;j<size_of_constraint;j++) is_indices[j] = j;
2984*2fa5cd67SKarl Rupp 
2985534831adSStefano Zampini             for (s=0;s<temp_constraints;s++) {
2986534831adSStefano Zampini               k = s + dual_dofs;
2987534831adSStefano Zampini               ierr = MatSetValues(temp_mat,1,&k,size_of_constraint,is_indices,&temp_quadrature_constraint[temp_indices[start_constraint+s]],INSERT_VALUES);CHKERRQ(ierr);
2988534831adSStefano Zampini             }
2989534831adSStefano Zampini             ierr = MatAssemblyBegin(temp_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2990534831adSStefano Zampini             ierr = MatAssemblyEnd(temp_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2991534831adSStefano Zampini             ierr = MatGetVecs(temp_mat,&temp_vec,PETSC_NULL);CHKERRQ(ierr);
2992534831adSStefano Zampini             ierr = KSPCreate(PETSC_COMM_SELF,&temp_ksp);CHKERRQ(ierr);
2993534831adSStefano Zampini             ierr = KSPSetOperators(temp_ksp,temp_mat,temp_mat,SAME_PRECONDITIONER);CHKERRQ(ierr);
2994534831adSStefano Zampini             ierr = KSPSetType(temp_ksp,KSPPREONLY);CHKERRQ(ierr);
2995ffe5efe1SStefano Zampini             ierr = KSPGetPC(temp_ksp,&temp_pc);CHKERRQ(ierr);
2996ffe5efe1SStefano Zampini             ierr = PCSetType(temp_pc,PCLU);CHKERRQ(ierr);
2997534831adSStefano Zampini             ierr = KSPSetUp(temp_ksp);CHKERRQ(ierr);
2998534831adSStefano Zampini             for (s=0; s<temp_constraints; s++) {
2999534831adSStefano Zampini               ierr = VecSet(temp_vec,0.0);CHKERRQ(ierr);
3000534831adSStefano Zampini               ierr = VecSetValue(temp_vec,s+dual_dofs,1.0,INSERT_VALUES);CHKERRQ(ierr);
3001534831adSStefano Zampini               ierr = VecAssemblyBegin(temp_vec);CHKERRQ(ierr);
3002534831adSStefano Zampini               ierr = VecAssemblyEnd(temp_vec);CHKERRQ(ierr);
3003534831adSStefano Zampini               ierr = KSPSolve(temp_ksp,temp_vec,temp_vec);CHKERRQ(ierr);
3004534831adSStefano Zampini               ierr = VecGetArray(temp_vec,&array_vector);CHKERRQ(ierr);
3005534831adSStefano Zampini               j    = temp_indices_to_constraint_B[temp_indices[start_constraint+s]+size_of_constraint-s-1];
3006534831adSStefano Zampini               /* last columns of change of basis matrix associated to new primal dofs */
3007534831adSStefano Zampini               ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,size_of_constraint,&temp_indices_to_constraint_B[temp_indices[start_constraint+s]],1,&j,array_vector,INSERT_VALUES);CHKERRQ(ierr);
3008534831adSStefano Zampini               ierr = VecRestoreArray(temp_vec,&array_vector);CHKERRQ(ierr);
3009534831adSStefano Zampini             }
3010534831adSStefano Zampini             ierr = MatDestroy(&temp_mat);CHKERRQ(ierr);
3011534831adSStefano Zampini             ierr = KSPDestroy(&temp_ksp);CHKERRQ(ierr);
3012534831adSStefano Zampini             ierr = VecDestroy(&temp_vec);CHKERRQ(ierr);
3013534831adSStefano Zampini           } else {
3014534831adSStefano Zampini             /* last columns of change of basis matrix associated to new primal dofs */
3015534831adSStefano Zampini             for (s=0; s<temp_constraints; s++) {
3016534831adSStefano Zampini               j    = temp_indices_to_constraint_B[temp_indices[start_constraint+s]+size_of_constraint-s-1];
3017534831adSStefano Zampini               ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,size_of_constraint,&temp_indices_to_constraint_B[temp_indices[start_constraint+s]],1,&j,&temp_quadrature_constraint[temp_indices[start_constraint+s]],INSERT_VALUES);CHKERRQ(ierr);
3018534831adSStefano Zampini             }
3019534831adSStefano Zampini           }
3020534831adSStefano Zampini           /* prepare for the next cycle */
3021534831adSStefano Zampini           temp_constraints = 0;
3022*2fa5cd67SKarl Rupp           if (i != local_primal_size -1) temp_start_ptr = temp_indices_to_constraint_B[temp_indices[i+1]];
3023534831adSStefano Zampini         }
3024534831adSStefano Zampini       }
302504eaf177SStefano Zampini     }
3026534831adSStefano Zampini     /* assembling */
3027534831adSStefano Zampini     ierr = MatAssemblyBegin(pcbddc->ChangeOfBasisMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
3028534831adSStefano Zampini     ierr = MatAssemblyEnd(pcbddc->ChangeOfBasisMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
3029534831adSStefano Zampini     ierr = PetscFree(ipiv);CHKERRQ(ierr);
3030534831adSStefano Zampini     ierr = PetscFree(is_indices);CHKERRQ(ierr);
3031534831adSStefano Zampini   }
30323b03a366Sstefano_zampini   /* free workspace no longer needed */
30333b03a366Sstefano_zampini   ierr = PetscFree(rwork);CHKERRQ(ierr);
30343b03a366Sstefano_zampini   ierr = PetscFree(work);CHKERRQ(ierr);
30353b03a366Sstefano_zampini   ierr = PetscFree(temp_basis);CHKERRQ(ierr);
30363b03a366Sstefano_zampini   ierr = PetscFree(singular_vals);CHKERRQ(ierr);
30373b03a366Sstefano_zampini   ierr = PetscFree(correlation_mat);CHKERRQ(ierr);
30383b03a366Sstefano_zampini   ierr = PetscFree(temp_indices);CHKERRQ(ierr);
3039534831adSStefano Zampini   ierr = PetscFree(change_basis);CHKERRQ(ierr);
30403b03a366Sstefano_zampini   ierr = PetscFree(temp_indices_to_constraint);CHKERRQ(ierr);
3041534831adSStefano Zampini   ierr = PetscFree(temp_indices_to_constraint_B);CHKERRQ(ierr);
3042534831adSStefano Zampini   ierr = PetscFree(local_to_B);CHKERRQ(ierr);
30433b03a366Sstefano_zampini   ierr = PetscFree(temp_quadrature_constraint);CHKERRQ(ierr);
30443425bc38SStefano Zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
30453425bc38SStefano Zampini   ierr = PetscFree(iwork);CHKERRQ(ierr);
30463425bc38SStefano Zampini   ierr = PetscFree(ifail);CHKERRQ(ierr);
30473425bc38SStefano Zampini   ierr = PetscFree(singular_vectors);CHKERRQ(ierr);
30483425bc38SStefano Zampini #endif
3049da1bb401SStefano Zampini   for (k=0; k<nnsp_size; k++) {
3050da1bb401SStefano Zampini     ierr = VecDestroy(&localnearnullsp[k]);CHKERRQ(ierr);
3051da1bb401SStefano Zampini   }
30523b03a366Sstefano_zampini   ierr = PetscFree(localnearnullsp);CHKERRQ(ierr);
30533b03a366Sstefano_zampini   PetscFunctionReturn(0);
30543b03a366Sstefano_zampini }
30553b03a366Sstefano_zampini /* -------------------------------------------------------------------------- */
30560c7d97c5SJed Brown #undef __FUNCT__
30570c7d97c5SJed Brown #define __FUNCT__ "PCBDDCCoarseSetUp"
305853cdbc3dSStefano Zampini static PetscErrorCode PCBDDCCoarseSetUp(PC pc)
30590c7d97c5SJed Brown {
30600c7d97c5SJed Brown   PetscErrorCode ierr;
30610c7d97c5SJed Brown   PC_IS          *pcis    = (PC_IS*)(pc->data);
30620c7d97c5SJed Brown   PC_BDDC        *pcbddc  = (PC_BDDC*)pc->data;
30630c7d97c5SJed Brown   Mat_IS         *matis   = (Mat_IS*)pc->pmat->data;
3064534831adSStefano Zampini   Mat            change_mat_all;
30650c7d97c5SJed Brown   IS             is_R_local;
30660c7d97c5SJed Brown   IS             is_V_local;
30670c7d97c5SJed Brown   IS             is_C_local;
30680c7d97c5SJed Brown   IS             is_aux1;
30690c7d97c5SJed Brown   IS             is_aux2;
307019fd82e9SBarry Smith   VecType        impVecType;
307119fd82e9SBarry Smith   MatType        impMatType;
30720c7d97c5SJed Brown   PetscInt       n_R  =0;
30730c7d97c5SJed Brown   PetscInt       n_D  =0;
30740c7d97c5SJed Brown   PetscInt       n_B  =0;
30750c7d97c5SJed Brown   PetscScalar    zero =0.0;
30760c7d97c5SJed Brown   PetscScalar    one  =1.0;
30770c7d97c5SJed Brown   PetscScalar    m_one=-1.0;
30780c7d97c5SJed Brown   PetscScalar    * array;
30790c7d97c5SJed Brown   PetscScalar    *coarse_submat_vals;
30800c7d97c5SJed Brown   PetscInt       *idx_R_local;
30810c7d97c5SJed Brown   PetscInt       *idx_V_B;
30820c7d97c5SJed Brown   PetscScalar    *coarsefunctions_errors;
30830c7d97c5SJed Brown   PetscScalar    *constraints_errors;
3084*2fa5cd67SKarl Rupp 
30850c7d97c5SJed Brown   /* auxiliary indices */
3086534831adSStefano Zampini   PetscInt i,j,k;
3087*2fa5cd67SKarl Rupp 
3088e269702eSStefano Zampini   /* for verbose output of bddc */
3089e269702eSStefano Zampini   PetscViewer viewer  =pcbddc->dbg_viewer;
3090e269702eSStefano Zampini   PetscBool   dbg_flag=pcbddc->dbg_flag;
3091*2fa5cd67SKarl Rupp 
3092a0ba757dSStefano Zampini   /* for counting coarse dofs */
3093534831adSStefano Zampini   PetscInt    n_vertices,n_constraints;
30943b03a366Sstefano_zampini   PetscInt    size_of_constraint;
30953b03a366Sstefano_zampini   PetscInt    *row_cmat_indices;
30963b03a366Sstefano_zampini   PetscScalar *row_cmat_values;
3097534831adSStefano Zampini   PetscInt    *vertices,*nnz,*is_indices,*temp_indices;
30980c7d97c5SJed Brown 
30990c7d97c5SJed Brown   PetscFunctionBegin;
31000c7d97c5SJed Brown   /* Set Non-overlapping dimensions */
31010c7d97c5SJed Brown   n_B = pcis->n_B; n_D = pcis->n - n_B;
3102534831adSStefano Zampini   /* Set types for local objects needed by BDDC preconditioner */
3103534831adSStefano Zampini   impMatType = MATSEQDENSE;
3104534831adSStefano Zampini   impVecType = VECSEQ;
3105*2fa5cd67SKarl Rupp 
3106da1bb401SStefano Zampini   /* get vertex indices from constraint matrix */
3107534831adSStefano Zampini   ierr      = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscInt),&vertices);CHKERRQ(ierr);
3108534831adSStefano Zampini   n_vertices=0;
3109da1bb401SStefano Zampini   for (i=0; i<pcbddc->local_primal_size; i++) {
3110da1bb401SStefano Zampini     ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
3111da1bb401SStefano Zampini     if (size_of_constraint == 1) {
3112534831adSStefano Zampini       vertices[n_vertices]=row_cmat_indices[0];
3113534831adSStefano Zampini       n_vertices++;
3114a0ba757dSStefano Zampini     }
3115da1bb401SStefano Zampini     ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
3116a0ba757dSStefano Zampini   }
3117534831adSStefano Zampini   /* Set number of constraints */
3118534831adSStefano Zampini   n_constraints = pcbddc->local_primal_size-n_vertices;
3119534831adSStefano Zampini 
3120534831adSStefano Zampini   /* vertices in boundary numbering */
3121534831adSStefano Zampini   if (n_vertices) {
3122534831adSStefano Zampini     ierr = VecSet(pcis->vec1_N,m_one);CHKERRQ(ierr);
3123534831adSStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3124*2fa5cd67SKarl Rupp     for (i=0; i<n_vertices; i++) array[vertices[i]] = i;
3125534831adSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3126534831adSStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3127534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3128534831adSStefano Zampini     ierr = PetscMalloc(n_vertices*sizeof(PetscInt),&idx_V_B);CHKERRQ(ierr);
3129534831adSStefano Zampini     ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
3130534831adSStefano Zampini     for (i=0; i<n_vertices; i++) {
3131534831adSStefano Zampini       j=0;
3132*2fa5cd67SKarl Rupp       while (array[j] != i) j++;
3133534831adSStefano Zampini       idx_V_B[i]=j;
3134534831adSStefano Zampini     }
3135534831adSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
3136534831adSStefano Zampini   }
3137534831adSStefano Zampini 
3138534831adSStefano Zampini   /* transform local matrices if needed */
3139534831adSStefano Zampini   if (pcbddc->usechangeofbasis) {
3140534831adSStefano Zampini     ierr = PetscMalloc(pcis->n*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
3141534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
3142*2fa5cd67SKarl Rupp     for (i=0;i<n_D;i++) nnz[is_indices[i]] = 1;
3143534831adSStefano Zampini     ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
3144534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
3145534831adSStefano Zampini     k=1;
3146534831adSStefano Zampini     for (i=0;i<n_B;i++) {
3147534831adSStefano Zampini       ierr = MatGetRow(pcbddc->ChangeOfBasisMatrix,i,&j,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr);
3148534831adSStefano Zampini       nnz[is_indices[i]]=j;
3149*2fa5cd67SKarl Rupp       if (k < j) k = j;
3150534831adSStefano Zampini       ierr = MatRestoreRow(pcbddc->ChangeOfBasisMatrix,i,&j,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr);
3151534831adSStefano Zampini     }
3152534831adSStefano Zampini     ierr = ISRestoreIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
3153534831adSStefano Zampini     /* assemble change of basis matrix on the whole set of local dofs */
3154534831adSStefano Zampini     ierr = PetscMalloc(k*sizeof(PetscInt),&temp_indices);CHKERRQ(ierr);
3155534831adSStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&change_mat_all);CHKERRQ(ierr);
3156534831adSStefano Zampini     ierr = MatSetSizes(change_mat_all,pcis->n,pcis->n,pcis->n,pcis->n);CHKERRQ(ierr);
3157534831adSStefano Zampini     ierr = MatSetType(change_mat_all,MATSEQAIJ);CHKERRQ(ierr);
3158534831adSStefano Zampini     ierr = MatSeqAIJSetPreallocation(change_mat_all,0,nnz);CHKERRQ(ierr);
3159534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
3160534831adSStefano Zampini     for (i=0; i<n_D; i++) {
3161534831adSStefano Zampini       ierr = MatSetValue(change_mat_all,is_indices[i],is_indices[i],1.0,INSERT_VALUES);CHKERRQ(ierr);
3162534831adSStefano Zampini     }
3163534831adSStefano Zampini     ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
3164534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
3165534831adSStefano Zampini     for (i=0; i<n_B; i++) {
3166534831adSStefano Zampini       ierr = MatGetRow(pcbddc->ChangeOfBasisMatrix,i,&j,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
3167*2fa5cd67SKarl Rupp       for (k=0; k<j; k++) temp_indices[k]=is_indices[row_cmat_indices[k]];
3168534831adSStefano Zampini       ierr = MatSetValues(change_mat_all,1,&is_indices[i],j,temp_indices,row_cmat_values,INSERT_VALUES);CHKERRQ(ierr);
3169534831adSStefano Zampini       ierr = MatRestoreRow(pcbddc->ChangeOfBasisMatrix,i,&j,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
3170534831adSStefano Zampini     }
3171534831adSStefano Zampini     ierr = MatAssemblyBegin(change_mat_all,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
3172534831adSStefano Zampini     ierr = MatAssemblyEnd(change_mat_all,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
3173534831adSStefano Zampini     ierr = MatPtAP(matis->A,change_mat_all,MAT_INITIAL_MATRIX,1.0,&pcbddc->local_mat);CHKERRQ(ierr);
3174534831adSStefano Zampini     ierr = MatDestroy(&pcis->A_IB);CHKERRQ(ierr);
3175534831adSStefano Zampini     ierr = MatDestroy(&pcis->A_BI);CHKERRQ(ierr);
3176534831adSStefano Zampini     ierr = MatDestroy(&pcis->A_BB);CHKERRQ(ierr);
3177534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_I_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&pcis->A_IB);CHKERRQ(ierr);
3178534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_B_local,pcis->is_I_local,MAT_INITIAL_MATRIX,&pcis->A_BI);CHKERRQ(ierr);
3179534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_B_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&pcis->A_BB);CHKERRQ(ierr);
3180534831adSStefano Zampini     ierr = MatDestroy(&change_mat_all);CHKERRQ(ierr);
3181534831adSStefano Zampini     ierr = PetscFree(nnz);CHKERRQ(ierr);
3182534831adSStefano Zampini     ierr = PetscFree(temp_indices);CHKERRQ(ierr);
3183534831adSStefano Zampini   } else {
3184534831adSStefano Zampini     /* without change of basis, the local matrix is unchanged */
3185534831adSStefano Zampini     ierr = PetscObjectReference((PetscObject)matis->A);CHKERRQ(ierr);
3186*2fa5cd67SKarl Rupp 
3187534831adSStefano Zampini     pcbddc->local_mat = matis->A;
3188534831adSStefano Zampini   }
31890bdf917eSStefano Zampini   /* Change global null space passed in by the user if change of basis has been performed */
31900bdf917eSStefano Zampini   if (pcbddc->NullSpace && pcbddc->usechangeofbasis) {
31910bdf917eSStefano Zampini     ierr = PCBDDCAdaptNullSpace(pc);CHKERRQ(ierr);
31920bdf917eSStefano Zampini   }
3193a0ba757dSStefano Zampini 
31940c7d97c5SJed Brown   /* Dohrmann's notation: dofs split into R (Remaining: all dofs but the vertices) and V (Vertices) */
31950c7d97c5SJed Brown   ierr = VecSet(pcis->vec1_N,one);CHKERRQ(ierr);
31960c7d97c5SJed Brown   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3197*2fa5cd67SKarl Rupp   for (i=0;i<n_vertices;i++) array[vertices[i]] = zero;
31983b03a366Sstefano_zampini   ierr = PetscMalloc((pcis->n - n_vertices)*sizeof(PetscInt),&idx_R_local);CHKERRQ(ierr);
3199*2fa5cd67SKarl Rupp   for (i=0, n_R=0; i<pcis->n; i++) {
3200*2fa5cd67SKarl Rupp     if (array[i] == one) {
3201*2fa5cd67SKarl Rupp       idx_R_local[n_R] = i;
3202*2fa5cd67SKarl Rupp       n_R++;
3203*2fa5cd67SKarl Rupp     }
3204*2fa5cd67SKarl Rupp   }
32050c7d97c5SJed Brown   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3206e269702eSStefano Zampini   if (dbg_flag) {
32070c7d97c5SJed Brown     ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
32080c7d97c5SJed Brown     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
32090c7d97c5SJed Brown     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d local dimensions\n",PetscGlobalRank);CHKERRQ(ierr);
32100c7d97c5SJed Brown     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local_size = %d, dirichlet_size = %d, boundary_size = %d\n",pcis->n,n_D,n_B);CHKERRQ(ierr);
32113b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"r_size = %d, v_size = %d, constraints = %d, local_primal_size = %d\n",n_R,n_vertices,n_constraints,pcbddc->local_primal_size);CHKERRQ(ierr);
3212534831adSStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"pcbddc->n_vertices = %d, pcbddc->n_constraints = %d\n",pcbddc->n_vertices,pcbddc->n_constraints);CHKERRQ(ierr);
32130c7d97c5SJed Brown     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
32140c7d97c5SJed Brown   }
3215534831adSStefano Zampini 
32160c7d97c5SJed Brown   /* Allocate needed vectors */
3217534831adSStefano Zampini   ierr = VecDuplicate(pcis->vec1_global,&pcbddc->original_rhs);CHKERRQ(ierr);
32183972b0daSStefano Zampini   ierr = VecDuplicate(pcis->vec1_global,&pcbddc->temp_solution);CHKERRQ(ierr);
32190c7d97c5SJed Brown   ierr = VecDuplicate(pcis->vec1_D,&pcbddc->vec4_D);CHKERRQ(ierr);
32200c7d97c5SJed Brown   ierr = VecCreate(PETSC_COMM_SELF,&pcbddc->vec1_R);CHKERRQ(ierr);
32210c7d97c5SJed Brown   ierr = VecSetSizes(pcbddc->vec1_R,n_R,n_R);CHKERRQ(ierr);
32220c7d97c5SJed Brown   ierr = VecSetType(pcbddc->vec1_R,impVecType);CHKERRQ(ierr);
3223d49ef151SStefano Zampini   ierr = VecDuplicate(pcbddc->vec1_R,&pcbddc->vec2_R);CHKERRQ(ierr);
32240c7d97c5SJed Brown   ierr = VecCreate(PETSC_COMM_SELF,&pcbddc->vec1_P);CHKERRQ(ierr);
32250c7d97c5SJed Brown   ierr = VecSetSizes(pcbddc->vec1_P,pcbddc->local_primal_size,pcbddc->local_primal_size);CHKERRQ(ierr);
32260c7d97c5SJed Brown   ierr = VecSetType(pcbddc->vec1_P,impVecType);CHKERRQ(ierr);
32270c7d97c5SJed Brown 
32280c7d97c5SJed Brown   /* Creating some index sets needed  */
32290c7d97c5SJed Brown   /* For submatrices */
3230da1bb401SStefano Zampini   ierr = ISCreateGeneral(PETSC_COMM_SELF,n_R,idx_R_local,PETSC_OWN_POINTER,&is_R_local);CHKERRQ(ierr);
32313b03a366Sstefano_zampini   if (n_vertices) {
3232da1bb401SStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,n_vertices,vertices,PETSC_OWN_POINTER,&is_V_local);CHKERRQ(ierr);
32333b03a366Sstefano_zampini   }
3234da1bb401SStefano Zampini   if (n_constraints) {
3235da1bb401SStefano Zampini     ierr = ISCreateStride(PETSC_COMM_SELF,n_constraints,n_vertices,1,&is_C_local);CHKERRQ(ierr);
3236da1bb401SStefano Zampini   }
3237da1bb401SStefano Zampini 
32380c7d97c5SJed Brown   /* For VecScatters pcbddc->R_to_B and (optionally) pcbddc->R_to_D */
32390c7d97c5SJed Brown   {
32400c7d97c5SJed Brown     PetscInt *aux_array1;
32410c7d97c5SJed Brown     PetscInt *aux_array2;
32422e8d2280SStefano Zampini     PetscInt *idx_I_local;
32430c7d97c5SJed Brown 
32443b03a366Sstefano_zampini     ierr = PetscMalloc((pcis->n_B-n_vertices)*sizeof(PetscInt),&aux_array1);CHKERRQ(ierr);
32453b03a366Sstefano_zampini     ierr = PetscMalloc((pcis->n_B-n_vertices)*sizeof(PetscInt),&aux_array2);CHKERRQ(ierr);
32460c7d97c5SJed Brown 
32472e8d2280SStefano Zampini     ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&idx_I_local);CHKERRQ(ierr);
32480c7d97c5SJed Brown     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3249*2fa5cd67SKarl Rupp     for (i=0; i<n_D; i++) array[idx_I_local[i]] = 0;
32502e8d2280SStefano Zampini     ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&idx_I_local);CHKERRQ(ierr);
3251*2fa5cd67SKarl Rupp     for (i=0, j=0; i<n_R; i++) {
3252*2fa5cd67SKarl Rupp       if (array[idx_R_local[i]] == one) {
3253*2fa5cd67SKarl Rupp         aux_array1[j] = i;
3254*2fa5cd67SKarl Rupp         j++;
3255*2fa5cd67SKarl Rupp       }
3256*2fa5cd67SKarl Rupp     }
32570c7d97c5SJed Brown     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3258da1bb401SStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_COPY_VALUES,&is_aux1);CHKERRQ(ierr);
32592e8d2280SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
32602e8d2280SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
32610c7d97c5SJed Brown     ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
3262*2fa5cd67SKarl Rupp     for (i=0, j=0; i<n_B; i++) {
3263*2fa5cd67SKarl Rupp       if (array[i] == one) {
3264*2fa5cd67SKarl Rupp         aux_array2[j] = i; j++;
3265*2fa5cd67SKarl Rupp       }
3266*2fa5cd67SKarl Rupp     }
32673828260eSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
3268da1bb401SStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array2,PETSC_COPY_VALUES,&is_aux2);CHKERRQ(ierr);
32690c7d97c5SJed Brown     ierr = VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_B,is_aux2,&pcbddc->R_to_B);CHKERRQ(ierr);
32700c7d97c5SJed Brown     ierr = PetscFree(aux_array1);CHKERRQ(ierr);
32710c7d97c5SJed Brown     ierr = PetscFree(aux_array2);CHKERRQ(ierr);
32720c7d97c5SJed Brown     ierr = ISDestroy(&is_aux1);CHKERRQ(ierr);
32730c7d97c5SJed Brown     ierr = ISDestroy(&is_aux2);CHKERRQ(ierr);
32740c7d97c5SJed Brown 
327529622bf0SStefano Zampini     if (pcbddc->inexact_prec_type || dbg_flag) {
32760c7d97c5SJed Brown       ierr = PetscMalloc(n_D*sizeof(PetscInt),&aux_array1);CHKERRQ(ierr);
32770c7d97c5SJed Brown       ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3278*2fa5cd67SKarl Rupp       for (i=0, j=0; i<n_R; i++) {
3279*2fa5cd67SKarl Rupp         if (array[idx_R_local[i]] == zero) {
3280*2fa5cd67SKarl Rupp           aux_array1[j] = i;
3281*2fa5cd67SKarl Rupp           j++;
3282*2fa5cd67SKarl Rupp         }
3283*2fa5cd67SKarl Rupp       }
32840c7d97c5SJed Brown       ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3285da1bb401SStefano Zampini       ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_COPY_VALUES,&is_aux1);CHKERRQ(ierr);
32860c7d97c5SJed Brown       ierr = VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_D,(IS)0,&pcbddc->R_to_D);CHKERRQ(ierr);
32870c7d97c5SJed Brown       ierr = PetscFree(aux_array1);CHKERRQ(ierr);
32880c7d97c5SJed Brown       ierr = ISDestroy(&is_aux1);CHKERRQ(ierr);
32890c7d97c5SJed Brown     }
32900c7d97c5SJed Brown   }
32910c7d97c5SJed Brown 
32920c7d97c5SJed Brown   /* Creating PC contexts for local Dirichlet and Neumann problems */
32930c7d97c5SJed Brown   {
32940c7d97c5SJed Brown     Mat A_RR;
329553cdbc3dSStefano Zampini     PC  pc_temp;
3296*2fa5cd67SKarl Rupp 
32970c7d97c5SJed Brown     /* Matrix for Dirichlet problem is A_II -> we already have it from pcis.c code */
329853cdbc3dSStefano Zampini     ierr = KSPCreate(PETSC_COMM_SELF,&pcbddc->ksp_D);CHKERRQ(ierr);
329953cdbc3dSStefano Zampini     ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->ksp_D,(PetscObject)pc,1);CHKERRQ(ierr);
330053cdbc3dSStefano Zampini     ierr = KSPSetOperators(pcbddc->ksp_D,pcis->A_II,pcis->A_II,SAME_PRECONDITIONER);CHKERRQ(ierr);
330153cdbc3dSStefano Zampini     ierr = KSPSetType(pcbddc->ksp_D,KSPPREONLY);CHKERRQ(ierr);
3302da1bb401SStefano Zampini     ierr = KSPSetOptionsPrefix(pcbddc->ksp_D,"dirichlet_");CHKERRQ(ierr);
3303*2fa5cd67SKarl Rupp 
33040c7d97c5SJed Brown     /* default */
330553cdbc3dSStefano Zampini     ierr = KSPGetPC(pcbddc->ksp_D,&pc_temp);CHKERRQ(ierr);
330653cdbc3dSStefano Zampini     ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr);
3307*2fa5cd67SKarl Rupp 
33080c7d97c5SJed Brown     /* Allow user's customization */
330953cdbc3dSStefano Zampini     ierr = KSPSetFromOptions(pcbddc->ksp_D);CHKERRQ(ierr);
3310*2fa5cd67SKarl Rupp 
3311950d796eSStefano Zampini     /* umfpack interface has a bug when matrix dimension is zero */
3312950d796eSStefano Zampini     if (!n_D) {
33132e8d2280SStefano Zampini       ierr = PCSetType(pc_temp,PCNONE);CHKERRQ(ierr);
3314950d796eSStefano Zampini     }
3315*2fa5cd67SKarl Rupp 
331653cdbc3dSStefano Zampini     /* Set Up KSP for Dirichlet problem of BDDC */
331753cdbc3dSStefano Zampini     ierr = KSPSetUp(pcbddc->ksp_D);CHKERRQ(ierr);
3318*2fa5cd67SKarl Rupp 
33193972b0daSStefano Zampini     /* set ksp_D into pcis data */
33203972b0daSStefano Zampini     ierr        = KSPDestroy(&pcis->ksp_D);CHKERRQ(ierr);
33213972b0daSStefano Zampini     ierr        = PetscObjectReference((PetscObject)pcbddc->ksp_D);CHKERRQ(ierr);
33223972b0daSStefano Zampini     pcis->ksp_D = pcbddc->ksp_D;
3323*2fa5cd67SKarl Rupp 
33240c7d97c5SJed Brown     /* Matrix for Neumann problem is A_RR -> we need to create it */
3325534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,is_R_local,is_R_local,MAT_INITIAL_MATRIX,&A_RR);CHKERRQ(ierr);
332653cdbc3dSStefano Zampini     ierr = KSPCreate(PETSC_COMM_SELF,&pcbddc->ksp_R);CHKERRQ(ierr);
332753cdbc3dSStefano Zampini     ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->ksp_R,(PetscObject)pc,1);CHKERRQ(ierr);
332853cdbc3dSStefano Zampini     ierr = KSPSetOperators(pcbddc->ksp_R,A_RR,A_RR,SAME_PRECONDITIONER);CHKERRQ(ierr);
332953cdbc3dSStefano Zampini     ierr = KSPSetType(pcbddc->ksp_R,KSPPREONLY);CHKERRQ(ierr);
3330da1bb401SStefano Zampini     ierr = KSPSetOptionsPrefix(pcbddc->ksp_R,"neumann_");CHKERRQ(ierr);
3331*2fa5cd67SKarl Rupp 
33320c7d97c5SJed Brown     /* default */
333353cdbc3dSStefano Zampini     ierr = KSPGetPC(pcbddc->ksp_R,&pc_temp);CHKERRQ(ierr);
333453cdbc3dSStefano Zampini     ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr);
3335*2fa5cd67SKarl Rupp 
33360c7d97c5SJed Brown     /* Allow user's customization */
333753cdbc3dSStefano Zampini     ierr = KSPSetFromOptions(pcbddc->ksp_R);CHKERRQ(ierr);
3338*2fa5cd67SKarl Rupp 
3339950d796eSStefano Zampini     /* umfpack interface has a bug when matrix dimension is zero */
3340950d796eSStefano Zampini     if (!pcis->n) {
33412e8d2280SStefano Zampini       ierr = PCSetType(pc_temp,PCNONE);CHKERRQ(ierr);
3342950d796eSStefano Zampini     }
3343*2fa5cd67SKarl Rupp 
334453cdbc3dSStefano Zampini     /* Set Up KSP for Neumann problem of BDDC */
334553cdbc3dSStefano Zampini     ierr = KSPSetUp(pcbddc->ksp_R);CHKERRQ(ierr);
3346*2fa5cd67SKarl Rupp 
334729622bf0SStefano Zampini     /* check Dirichlet and Neumann solvers and adapt them if a nullspace correction is needed */
3348b76ba322SStefano Zampini     {
33490c7d97c5SJed Brown       Vec         temp_vec;
3350b76ba322SStefano Zampini       PetscReal   value;
3351b76ba322SStefano Zampini       PetscMPIInt use_exact,use_exact_reduced;
33520c7d97c5SJed Brown 
3353a0ba757dSStefano Zampini       ierr = VecDuplicate(pcis->vec1_D,&temp_vec);CHKERRQ(ierr);
3354a0ba757dSStefano Zampini       ierr = VecSetRandom(pcis->vec1_D,PETSC_NULL);CHKERRQ(ierr);
3355a0ba757dSStefano Zampini       ierr = MatMult(pcis->A_II,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
3356a0ba757dSStefano Zampini       ierr = KSPSolve(pcbddc->ksp_D,pcis->vec2_D,temp_vec);CHKERRQ(ierr);
3357a0ba757dSStefano Zampini       ierr = VecAXPY(temp_vec,m_one,pcis->vec1_D);CHKERRQ(ierr);
3358a0ba757dSStefano Zampini       ierr = VecNorm(temp_vec,NORM_INFINITY,&value);CHKERRQ(ierr);
335929622bf0SStefano Zampini       ierr = VecDestroy(&temp_vec);CHKERRQ(ierr);
3360b76ba322SStefano Zampini       use_exact = 1;
3361*2fa5cd67SKarl Rupp       if (PetscAbsReal(value) > 1.e-4) use_exact = 0;
3362*2fa5cd67SKarl Rupp 
3363b76ba322SStefano Zampini       ierr = MPI_Allreduce(&use_exact,&use_exact_reduced,1,MPIU_INT,MPI_LAND,((PetscObject)pc)->comm);CHKERRQ(ierr);
3364b76ba322SStefano Zampini       pcbddc->use_exact_dirichlet = (PetscBool) use_exact_reduced;
3365b76ba322SStefano Zampini       if (dbg_flag) {
3366a0ba757dSStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
3367a0ba757dSStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
3368a0ba757dSStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"Checking solution of Dirichlet and Neumann problems\n");CHKERRQ(ierr);
3369a0ba757dSStefano Zampini         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d infinity error for Dirichlet solve = % 1.14e \n",PetscGlobalRank,value);CHKERRQ(ierr);
337029622bf0SStefano Zampini       }
337129622bf0SStefano Zampini       if (pcbddc->NullSpace && !use_exact_reduced && !pcbddc->inexact_prec_type) {
337229622bf0SStefano Zampini         ierr = PCBDDCAdaptLocalProblem(pc,pcis->is_I_local);
337329622bf0SStefano Zampini       }
3374d49ef151SStefano Zampini       ierr = VecDuplicate(pcbddc->vec1_R,&temp_vec);CHKERRQ(ierr);
3375d49ef151SStefano Zampini       ierr = VecSetRandom(pcbddc->vec1_R,PETSC_NULL);CHKERRQ(ierr);
3376d49ef151SStefano Zampini       ierr = MatMult(A_RR,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
3377d49ef151SStefano Zampini       ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec2_R,temp_vec);CHKERRQ(ierr);
3378d49ef151SStefano Zampini       ierr = VecAXPY(temp_vec,m_one,pcbddc->vec1_R);CHKERRQ(ierr);
3379d49ef151SStefano Zampini       ierr = VecNorm(temp_vec,NORM_INFINITY,&value);CHKERRQ(ierr);
3380e269702eSStefano Zampini       ierr = VecDestroy(&temp_vec);CHKERRQ(ierr);
3381*2fa5cd67SKarl Rupp 
338229622bf0SStefano Zampini       use_exact = 1;
3383*2fa5cd67SKarl Rupp       if (PetscAbsReal(value) > 1.e-4) use_exact = 0;
338429622bf0SStefano Zampini       ierr = MPI_Allreduce(&use_exact,&use_exact_reduced,1,MPIU_INT,MPI_LAND,((PetscObject)pc)->comm);CHKERRQ(ierr);
338529622bf0SStefano Zampini       if (dbg_flag) {
33860c7d97c5SJed Brown         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d infinity error for  Neumann  solve = % 1.14e \n",PetscGlobalRank,value);CHKERRQ(ierr);
3387d49ef151SStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
33880c7d97c5SJed Brown       }
338929622bf0SStefano Zampini       if (pcbddc->NullSpace && !use_exact_reduced) {
339029622bf0SStefano Zampini         ierr = PCBDDCAdaptLocalProblem(pc,is_R_local);
339129622bf0SStefano Zampini       }
3392b76ba322SStefano Zampini     }
33930c7d97c5SJed Brown     /* free Neumann problem's matrix */
33940c7d97c5SJed Brown     ierr = MatDestroy(&A_RR);CHKERRQ(ierr);
33950c7d97c5SJed Brown   }
33960c7d97c5SJed Brown 
33970c7d97c5SJed Brown   /* Assemble all remaining stuff needed to apply BDDC  */
33980c7d97c5SJed Brown   {
33990c7d97c5SJed Brown     Mat           A_RV,A_VR,A_VV;
34000bdf917eSStefano Zampini     Mat           M1;
34010c7d97c5SJed Brown     Mat           C_CR;
34023b03a366Sstefano_zampini     Mat           AUXMAT;
34030c7d97c5SJed Brown     Vec           vec1_C;
34040c7d97c5SJed Brown     Vec           vec2_C;
34050c7d97c5SJed Brown     Vec           vec1_V;
34060c7d97c5SJed Brown     Vec           vec2_V;
34070c7d97c5SJed Brown     PetscInt      *nnz;
34080c7d97c5SJed Brown     PetscInt      *auxindices;
340953cdbc3dSStefano Zampini     PetscInt      index;
34100c7d97c5SJed Brown     PetscScalar   *array2;
34110c7d97c5SJed Brown     MatFactorInfo matinfo;
34120c7d97c5SJed Brown 
34130c7d97c5SJed Brown     /* Allocating some extra storage just to be safe */
34140c7d97c5SJed Brown     ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
34150c7d97c5SJed Brown     ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&auxindices);CHKERRQ(ierr);
3416*2fa5cd67SKarl Rupp     for (i=0;i<pcis->n;i++) auxindices[i]=i;
34170c7d97c5SJed Brown 
34180c7d97c5SJed Brown     /* some work vectors on vertices and/or constraints */
34193b03a366Sstefano_zampini     if (n_vertices) {
34200c7d97c5SJed Brown       ierr = VecCreate(PETSC_COMM_SELF,&vec1_V);CHKERRQ(ierr);
34213b03a366Sstefano_zampini       ierr = VecSetSizes(vec1_V,n_vertices,n_vertices);CHKERRQ(ierr);
34220c7d97c5SJed Brown       ierr = VecSetType(vec1_V,impVecType);CHKERRQ(ierr);
34230c7d97c5SJed Brown       ierr = VecDuplicate(vec1_V,&vec2_V);CHKERRQ(ierr);
34240c7d97c5SJed Brown     }
3425534831adSStefano Zampini     if (n_constraints) {
34260c7d97c5SJed Brown       ierr = VecCreate(PETSC_COMM_SELF,&vec1_C);CHKERRQ(ierr);
3427534831adSStefano Zampini       ierr = VecSetSizes(vec1_C,n_constraints,n_constraints);CHKERRQ(ierr);
34280c7d97c5SJed Brown       ierr = VecSetType(vec1_C,impVecType);CHKERRQ(ierr);
34290c7d97c5SJed Brown       ierr = VecDuplicate(vec1_C,&vec2_C);CHKERRQ(ierr);
34300c7d97c5SJed Brown       ierr = VecDuplicate(vec1_C,&pcbddc->vec1_C);CHKERRQ(ierr);
34310c7d97c5SJed Brown     }
34320c7d97c5SJed Brown     /* Precompute stuffs needed for preprocessing and application of BDDC*/
34333b03a366Sstefano_zampini     if (n_constraints) {
34340c7d97c5SJed Brown       ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->local_auxmat2);CHKERRQ(ierr);
34353b03a366Sstefano_zampini       ierr = MatSetSizes(pcbddc->local_auxmat2,n_R,n_constraints,n_R,n_constraints);CHKERRQ(ierr);
34360c7d97c5SJed Brown       ierr = MatSetType(pcbddc->local_auxmat2,impMatType);CHKERRQ(ierr);
34373b03a366Sstefano_zampini       ierr = MatSeqDenseSetPreallocation(pcbddc->local_auxmat2,PETSC_NULL);CHKERRQ(ierr);
34380c7d97c5SJed Brown 
343957a90decSStefano Zampini       /* Create Constraint matrix on R nodes: C_{CR}  */
344057a90decSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->ConstraintMatrix,is_C_local,is_R_local,MAT_INITIAL_MATRIX,&C_CR);CHKERRQ(ierr);
344157a90decSStefano Zampini       ierr = ISDestroy(&is_C_local);CHKERRQ(ierr);
344257a90decSStefano Zampini 
34430c7d97c5SJed Brown       /* Assemble local_auxmat2 = - A_{RR}^{-1} C^T_{CR} needed by BDDC application */
34443b03a366Sstefano_zampini       for (i=0; i<n_constraints; i++) {
34453b03a366Sstefano_zampini         ierr = VecSet(pcbddc->vec1_R,zero);CHKERRQ(ierr);
3446*2fa5cd67SKarl Rupp 
34473b03a366Sstefano_zampini         /* Get row of constraint matrix in R numbering */
344857a90decSStefano Zampini         ierr = VecGetArray(pcbddc->vec1_R,&array);CHKERRQ(ierr);
344957a90decSStefano Zampini         ierr = MatGetRow(C_CR,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
3450*2fa5cd67SKarl Rupp         for (j=0;j<size_of_constraint;j++) array[row_cmat_indices[j]] = -row_cmat_values[j];
345157a90decSStefano Zampini         ierr = MatRestoreRow(C_CR,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
345257a90decSStefano Zampini         ierr = VecRestoreArray(pcbddc->vec1_R,&array);CHKERRQ(ierr);
3453*2fa5cd67SKarl Rupp 
34543b03a366Sstefano_zampini         /* Solve for row of constraint matrix in R numbering */
345553cdbc3dSStefano Zampini         ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
3456*2fa5cd67SKarl Rupp 
34573b03a366Sstefano_zampini         /* Set values */
34580c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec2_R,&array);CHKERRQ(ierr);
34593b03a366Sstefano_zampini         ierr = MatSetValues(pcbddc->local_auxmat2,n_R,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
34600c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec2_R,&array);CHKERRQ(ierr);
34610c7d97c5SJed Brown       }
34620c7d97c5SJed Brown       ierr = MatAssemblyBegin(pcbddc->local_auxmat2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
34630c7d97c5SJed Brown       ierr = MatAssemblyEnd(pcbddc->local_auxmat2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
34640c7d97c5SJed Brown 
34650c7d97c5SJed Brown       /* Assemble AUXMAT = (LUFactor)(-C_{CR} A_{RR}^{-1} C^T_{CR})^{-1} */
34660c7d97c5SJed Brown       ierr = MatMatMult(C_CR,pcbddc->local_auxmat2,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&AUXMAT);CHKERRQ(ierr);
3467d49ef151SStefano Zampini       ierr = MatFactorInfoInitialize(&matinfo);CHKERRQ(ierr);
34683b03a366Sstefano_zampini       ierr = ISCreateStride(PETSC_COMM_SELF,n_constraints,0,1,&is_aux1);CHKERRQ(ierr);
34690c7d97c5SJed Brown       ierr = MatLUFactor(AUXMAT,is_aux1,is_aux1,&matinfo);CHKERRQ(ierr);
34700c7d97c5SJed Brown       ierr = ISDestroy(&is_aux1);CHKERRQ(ierr);
34710c7d97c5SJed Brown 
34723b03a366Sstefano_zampini       /* Assemble explicitly M1 = (C_{CR} A_{RR}^{-1} C^T_{CR})^{-1} needed in preproc  */
3473d49ef151SStefano Zampini       ierr = MatCreate(PETSC_COMM_SELF,&M1);CHKERRQ(ierr);
34743b03a366Sstefano_zampini       ierr = MatSetSizes(M1,n_constraints,n_constraints,n_constraints,n_constraints);CHKERRQ(ierr);
34750c7d97c5SJed Brown       ierr = MatSetType(M1,impMatType);CHKERRQ(ierr);
34763b03a366Sstefano_zampini       ierr = MatSeqDenseSetPreallocation(M1,PETSC_NULL);CHKERRQ(ierr);
34773b03a366Sstefano_zampini       for (i=0; i<n_constraints; i++) {
34780c7d97c5SJed Brown         ierr = VecSet(vec1_C,zero);CHKERRQ(ierr);
34790c7d97c5SJed Brown         ierr = VecSetValue(vec1_C,i,one,INSERT_VALUES);CHKERRQ(ierr);
34800c7d97c5SJed Brown         ierr = VecAssemblyBegin(vec1_C);CHKERRQ(ierr);
34810c7d97c5SJed Brown         ierr = VecAssemblyEnd(vec1_C);CHKERRQ(ierr);
34820c7d97c5SJed Brown         ierr = MatSolve(AUXMAT,vec1_C,vec2_C);CHKERRQ(ierr);
34830c7d97c5SJed Brown         ierr = VecScale(vec2_C,m_one);CHKERRQ(ierr);
34840c7d97c5SJed Brown         ierr = VecGetArray(vec2_C,&array);CHKERRQ(ierr);
34853b03a366Sstefano_zampini         ierr = MatSetValues(M1,n_constraints,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
34860c7d97c5SJed Brown         ierr = VecRestoreArray(vec2_C,&array);CHKERRQ(ierr);
34870c7d97c5SJed Brown       }
34880c7d97c5SJed Brown       ierr = MatAssemblyBegin(M1,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
34890c7d97c5SJed Brown       ierr = MatAssemblyEnd(M1,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
34900c7d97c5SJed Brown       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
34910c7d97c5SJed Brown       /* Assemble local_auxmat1 = M1*C_{CR} needed by BDDC application in KSP and in preproc */
34920c7d97c5SJed Brown       ierr = MatMatMult(M1,C_CR,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&pcbddc->local_auxmat1);CHKERRQ(ierr);
34930c7d97c5SJed Brown 
34940c7d97c5SJed Brown     }
34950c7d97c5SJed Brown 
34960c7d97c5SJed Brown     /* Get submatrices from subdomain matrix */
34973b03a366Sstefano_zampini     if (n_vertices) {
3498534831adSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->local_mat,is_R_local,is_V_local,MAT_INITIAL_MATRIX,&A_RV);CHKERRQ(ierr);
3499534831adSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->local_mat,is_V_local,is_R_local,MAT_INITIAL_MATRIX,&A_VR);CHKERRQ(ierr);
3500534831adSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->local_mat,is_V_local,is_V_local,MAT_INITIAL_MATRIX,&A_VV);CHKERRQ(ierr);
35010c7d97c5SJed Brown     }
35020c7d97c5SJed Brown 
35030c7d97c5SJed Brown     /* Matrix of coarse basis functions (local) */
3504d49ef151SStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->coarse_phi_B);CHKERRQ(ierr);
35050c7d97c5SJed Brown     ierr = MatSetSizes(pcbddc->coarse_phi_B,n_B,pcbddc->local_primal_size,n_B,pcbddc->local_primal_size);CHKERRQ(ierr);
35060c7d97c5SJed Brown     ierr = MatSetType(pcbddc->coarse_phi_B,impMatType);CHKERRQ(ierr);
35073b03a366Sstefano_zampini     ierr = MatSeqDenseSetPreallocation(pcbddc->coarse_phi_B,PETSC_NULL);CHKERRQ(ierr);
350829622bf0SStefano Zampini     if (pcbddc->inexact_prec_type || dbg_flag) {
3509d49ef151SStefano Zampini       ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->coarse_phi_D);CHKERRQ(ierr);
35100c7d97c5SJed Brown       ierr = MatSetSizes(pcbddc->coarse_phi_D,n_D,pcbddc->local_primal_size,n_D,pcbddc->local_primal_size);CHKERRQ(ierr);
35110c7d97c5SJed Brown       ierr = MatSetType(pcbddc->coarse_phi_D,impMatType);CHKERRQ(ierr);
35123b03a366Sstefano_zampini       ierr = MatSeqDenseSetPreallocation(pcbddc->coarse_phi_D,PETSC_NULL);CHKERRQ(ierr);
35130c7d97c5SJed Brown     }
35140c7d97c5SJed Brown 
3515e269702eSStefano Zampini     if (dbg_flag) {
35160c7d97c5SJed Brown       ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscScalar),&coarsefunctions_errors);CHKERRQ(ierr);
35170c7d97c5SJed Brown       ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscScalar),&constraints_errors);CHKERRQ(ierr);
35180c7d97c5SJed Brown     }
35193b03a366Sstefano_zampini     /* Subdomain contribution (Non-overlapping) to coarse matrix  */
35200c7d97c5SJed Brown     ierr = PetscMalloc ((pcbddc->local_primal_size)*(pcbddc->local_primal_size)*sizeof(PetscScalar),&coarse_submat_vals);CHKERRQ(ierr);
35210c7d97c5SJed Brown 
35220c7d97c5SJed Brown     /* We are now ready to evaluate coarse basis functions and subdomain contribution to coarse problem */
35233b03a366Sstefano_zampini     for (i=0; i<n_vertices; i++) {
35240c7d97c5SJed Brown       ierr = VecSet(vec1_V,zero);CHKERRQ(ierr);
35250c7d97c5SJed Brown       ierr = VecSetValue(vec1_V,i,one,INSERT_VALUES);CHKERRQ(ierr);
35260c7d97c5SJed Brown       ierr = VecAssemblyBegin(vec1_V);CHKERRQ(ierr);
35270c7d97c5SJed Brown       ierr = VecAssemblyEnd(vec1_V);CHKERRQ(ierr);
35280c7d97c5SJed Brown       /* solution of saddle point problem */
35290bdf917eSStefano Zampini       ierr = MatMult(A_RV,vec1_V,pcbddc->vec1_R);CHKERRQ(ierr);
35300bdf917eSStefano Zampini       ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec1_R);CHKERRQ(ierr);
35310c7d97c5SJed Brown       ierr = VecScale(pcbddc->vec1_R,m_one);CHKERRQ(ierr);
35323b03a366Sstefano_zampini       if (n_constraints) {
35330c7d97c5SJed Brown         ierr = MatMult(pcbddc->local_auxmat1,pcbddc->vec1_R,vec1_C);CHKERRQ(ierr);
35340c7d97c5SJed Brown         ierr = MatMultAdd(pcbddc->local_auxmat2,vec1_C,pcbddc->vec1_R,pcbddc->vec1_R);CHKERRQ(ierr);
35350c7d97c5SJed Brown         ierr = VecScale(vec1_C,m_one);CHKERRQ(ierr);
35360c7d97c5SJed Brown       }
35370c7d97c5SJed Brown       ierr = MatMult(A_VR,pcbddc->vec1_R,vec2_V);CHKERRQ(ierr);
35380c7d97c5SJed Brown       ierr = MatMultAdd(A_VV,vec1_V,vec2_V,vec2_V);CHKERRQ(ierr);
35390c7d97c5SJed Brown 
35400c7d97c5SJed Brown       /* Set values in coarse basis function and subdomain part of coarse_mat */
35410c7d97c5SJed Brown       /* coarse basis functions */
35420c7d97c5SJed Brown       ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr);
35430c7d97c5SJed Brown       ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
35440c7d97c5SJed Brown       ierr = VecScatterEnd  (pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
35450c7d97c5SJed Brown       ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
35463b03a366Sstefano_zampini       ierr = MatSetValues(pcbddc->coarse_phi_B,n_B,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
35470c7d97c5SJed Brown       ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
35480c7d97c5SJed Brown       ierr = MatSetValue(pcbddc->coarse_phi_B,idx_V_B[i],i,one,INSERT_VALUES);CHKERRQ(ierr);
354929622bf0SStefano Zampini       if (pcbddc->inexact_prec_type || dbg_flag) {
35500c7d97c5SJed Brown         ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
35510c7d97c5SJed Brown         ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
35520c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_D,&array);CHKERRQ(ierr);
35533b03a366Sstefano_zampini         ierr = MatSetValues(pcbddc->coarse_phi_D,n_D,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
35540c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_D,&array);CHKERRQ(ierr);
35550c7d97c5SJed Brown       }
35560c7d97c5SJed Brown       /* subdomain contribution to coarse matrix */
35570c7d97c5SJed Brown       ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
3558*2fa5cd67SKarl Rupp       for (j=0; j<n_vertices; j++) coarse_submat_vals[i*pcbddc->local_primal_size+j] = array[j];   /* WARNING -> column major ordering */
35590c7d97c5SJed Brown       ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
35603b03a366Sstefano_zampini       if (n_constraints) {
35610c7d97c5SJed Brown         ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
3562*2fa5cd67SKarl Rupp         for (j=0; j<n_constraints; j++) coarse_submat_vals[i*pcbddc->local_primal_size+j+n_vertices] = array[j];   /* WARNING -> column major ordering */
35630c7d97c5SJed Brown         ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
35640c7d97c5SJed Brown       }
35650c7d97c5SJed Brown 
3566e269702eSStefano Zampini       if (dbg_flag) {
35670c7d97c5SJed Brown         /* assemble subdomain vector on nodes */
3568d49ef151SStefano Zampini         ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr);
35690c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
35700c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
3571*2fa5cd67SKarl Rupp         for (j=0;j<n_R;j++) array[idx_R_local[j]] = array2[j];
35723b03a366Sstefano_zampini         array[vertices[i]] = one;
35730c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
35740c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3575*2fa5cd67SKarl Rupp 
35760c7d97c5SJed Brown         /* assemble subdomain vector of lagrange multipliers (i.e. primal nodes) */
3577d49ef151SStefano Zampini         ierr = VecSet(pcbddc->vec1_P,zero);CHKERRQ(ierr);
35780c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
35790c7d97c5SJed Brown         ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
3580*2fa5cd67SKarl Rupp         for (j=0;j<n_vertices;j++) array2[j]=array[j];
35810c7d97c5SJed Brown         ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
35823b03a366Sstefano_zampini         if (n_constraints) {
35830c7d97c5SJed Brown           ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
3584*2fa5cd67SKarl Rupp           for (j=0;j<n_constraints;j++) array2[j+n_vertices]=array[j];
35850c7d97c5SJed Brown           ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
35860c7d97c5SJed Brown         }
35870c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
35880c7d97c5SJed Brown         ierr = VecScale(pcbddc->vec1_P,m_one);CHKERRQ(ierr);
3589*2fa5cd67SKarl Rupp 
35900c7d97c5SJed Brown         /* check saddle point solution */
3591534831adSStefano Zampini         ierr    = MatMult(pcbddc->local_mat,pcis->vec1_N,pcis->vec2_N);CHKERRQ(ierr);
35923b03a366Sstefano_zampini         ierr    = MatMultTransposeAdd(pcbddc->ConstraintMatrix,pcbddc->vec1_P,pcis->vec2_N,pcis->vec2_N);CHKERRQ(ierr);
35933b03a366Sstefano_zampini         ierr    = VecNorm(pcis->vec2_N,NORM_INFINITY,&coarsefunctions_errors[i]);CHKERRQ(ierr);
35943b03a366Sstefano_zampini         ierr    = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr);
35950c7d97c5SJed Brown         ierr    = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
35963b03a366Sstefano_zampini         array[i]=array[i]+m_one;  /* shift by the identity matrix */
35970c7d97c5SJed Brown         ierr    = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
35983b03a366Sstefano_zampini         ierr    = VecNorm(pcbddc->vec1_P,NORM_INFINITY,&constraints_errors[i]);CHKERRQ(ierr);
35990c7d97c5SJed Brown       }
36000c7d97c5SJed Brown     }
36010c7d97c5SJed Brown 
36023b03a366Sstefano_zampini     for (i=0; i<n_constraints; i++) {
3603d49ef151SStefano Zampini       ierr = VecSet(vec2_C,zero);CHKERRQ(ierr);
36040c7d97c5SJed Brown       ierr = VecSetValue(vec2_C,i,m_one,INSERT_VALUES);CHKERRQ(ierr);
36050c7d97c5SJed Brown       ierr = VecAssemblyBegin(vec2_C);CHKERRQ(ierr);
36060c7d97c5SJed Brown       ierr = VecAssemblyEnd(vec2_C);CHKERRQ(ierr);
3607*2fa5cd67SKarl Rupp 
36080c7d97c5SJed Brown       /* solution of saddle point problem */
36090c7d97c5SJed Brown       ierr = MatMult(M1,vec2_C,vec1_C);CHKERRQ(ierr);
36100c7d97c5SJed Brown       ierr = MatMult(pcbddc->local_auxmat2,vec1_C,pcbddc->vec1_R);CHKERRQ(ierr);
36110c7d97c5SJed Brown       ierr = VecScale(vec1_C,m_one);CHKERRQ(ierr);
36123b03a366Sstefano_zampini       if (n_vertices) { ierr = MatMult(A_VR,pcbddc->vec1_R,vec2_V);CHKERRQ(ierr); }
3613*2fa5cd67SKarl Rupp 
36140c7d97c5SJed Brown       /* Set values in coarse basis function and subdomain part of coarse_mat */
36150c7d97c5SJed Brown       /* coarse basis functions */
36163b03a366Sstefano_zampini       index=i+n_vertices;
36170c7d97c5SJed Brown       ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr);
36180c7d97c5SJed Brown       ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
36190c7d97c5SJed Brown       ierr = VecScatterEnd  (pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
36200c7d97c5SJed Brown       ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
362153cdbc3dSStefano Zampini       ierr = MatSetValues(pcbddc->coarse_phi_B,n_B,auxindices,1,&index,array,INSERT_VALUES);CHKERRQ(ierr);
36220c7d97c5SJed Brown       ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
362329622bf0SStefano Zampini       if (pcbddc->inexact_prec_type || dbg_flag) {
36240c7d97c5SJed Brown         ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
36250c7d97c5SJed Brown         ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
36260c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_D,&array);CHKERRQ(ierr);
362753cdbc3dSStefano Zampini         ierr = MatSetValues(pcbddc->coarse_phi_D,n_D,auxindices,1,&index,array,INSERT_VALUES);CHKERRQ(ierr);
36280c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_D,&array);CHKERRQ(ierr);
36290c7d97c5SJed Brown       }
3630*2fa5cd67SKarl Rupp 
36310c7d97c5SJed Brown       /* subdomain contribution to coarse matrix */
36323b03a366Sstefano_zampini       if (n_vertices) {
36330c7d97c5SJed Brown         ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
3634*2fa5cd67SKarl Rupp         for (j=0; j<n_vertices; j++) coarse_submat_vals[index*pcbddc->local_primal_size+j]=array[j]; /* WARNING -> column major ordering */
36350c7d97c5SJed Brown         ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
36360c7d97c5SJed Brown       }
36370c7d97c5SJed Brown       ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
3638*2fa5cd67SKarl Rupp       for (j=0; j<n_constraints; j++) coarse_submat_vals[index*pcbddc->local_primal_size+j+n_vertices]=array[j]; /* WARNING -> column major ordering */
36390c7d97c5SJed Brown       ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
36400c7d97c5SJed Brown 
3641e269702eSStefano Zampini       if (dbg_flag) {
36420c7d97c5SJed Brown         /* assemble subdomain vector on nodes */
364353cdbc3dSStefano Zampini         ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr);
36440c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
36450c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
3646*2fa5cd67SKarl Rupp         for (j=0;j<n_R;j++) array[idx_R_local[j]] = array2[j];
36470c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
36480c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3649*2fa5cd67SKarl Rupp 
36500c7d97c5SJed Brown         /* assemble subdomain vector of lagrange multipliers */
365153cdbc3dSStefano Zampini         ierr = VecSet(pcbddc->vec1_P,zero);CHKERRQ(ierr);
36520c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
36533b03a366Sstefano_zampini         if (n_vertices) {
36540c7d97c5SJed Brown           ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
3655*2fa5cd67SKarl Rupp           for (j=0;j<n_vertices;j++) array2[j]=-array[j];
36560c7d97c5SJed Brown           ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
36570c7d97c5SJed Brown         }
36580c7d97c5SJed Brown         ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
36593b03a366Sstefano_zampini         for (j=0;j<n_constraints;j++) {array2[j+n_vertices]=-array[j];}
36600c7d97c5SJed Brown         ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
36610c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
3662*2fa5cd67SKarl Rupp 
36633972b0daSStefano Zampini         /* check saddle point solution */
3664534831adSStefano Zampini         ierr         = MatMult(pcbddc->local_mat,pcis->vec1_N,pcis->vec2_N);CHKERRQ(ierr);
36653b03a366Sstefano_zampini         ierr         = MatMultTransposeAdd(pcbddc->ConstraintMatrix,pcbddc->vec1_P,pcis->vec2_N,pcis->vec2_N);CHKERRQ(ierr);
366653cdbc3dSStefano Zampini         ierr         = VecNorm(pcis->vec2_N,NORM_INFINITY,&coarsefunctions_errors[index]);CHKERRQ(ierr);
36673b03a366Sstefano_zampini         ierr         = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr);
36680c7d97c5SJed Brown         ierr         = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
366953cdbc3dSStefano Zampini         array[index] = array[index]+m_one; /* shift by the identity matrix */
36700c7d97c5SJed Brown         ierr         = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
367153cdbc3dSStefano Zampini         ierr         = VecNorm(pcbddc->vec1_P,NORM_INFINITY,&constraints_errors[index]);CHKERRQ(ierr);
36720c7d97c5SJed Brown       }
36730c7d97c5SJed Brown     }
36740c7d97c5SJed Brown     ierr = MatAssemblyBegin(pcbddc->coarse_phi_B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
36750c7d97c5SJed Brown     ierr = MatAssemblyEnd  (pcbddc->coarse_phi_B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
367629622bf0SStefano Zampini     if (pcbddc->inexact_prec_type || dbg_flag) {
36770c7d97c5SJed Brown       ierr = MatAssemblyBegin(pcbddc->coarse_phi_D,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
36780c7d97c5SJed Brown       ierr = MatAssemblyEnd  (pcbddc->coarse_phi_D,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
36790c7d97c5SJed Brown     }
36800c7d97c5SJed Brown     /* Checking coarse_sub_mat and coarse basis functions */
36810c7d97c5SJed Brown     /* It should be \Phi^{(j)^T} A^{(j)} \Phi^{(j)}=coarse_sub_mat */
36829d2fce94SStefano Zampini     if (dbg_flag) {
36830c7d97c5SJed Brown       Mat         coarse_sub_mat;
36840c7d97c5SJed Brown       Mat         TM1,TM2,TM3,TM4;
36850c7d97c5SJed Brown       Mat         coarse_phi_D,coarse_phi_B,A_II,A_BB,A_IB,A_BI;
368619fd82e9SBarry Smith       MatType     checkmattype=MATSEQAIJ;
36870c7d97c5SJed Brown       PetscScalar value;
36880c7d97c5SJed Brown 
3689c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_II,checkmattype,MAT_INITIAL_MATRIX,&A_II);CHKERRQ(ierr);
3690c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_IB,checkmattype,MAT_INITIAL_MATRIX,&A_IB);CHKERRQ(ierr);
3691c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_BI,checkmattype,MAT_INITIAL_MATRIX,&A_BI);CHKERRQ(ierr);
3692c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_BB,checkmattype,MAT_INITIAL_MATRIX,&A_BB);CHKERRQ(ierr);
3693c042a7c3SStefano Zampini       ierr = MatConvert(pcbddc->coarse_phi_D,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_D);CHKERRQ(ierr);
3694c042a7c3SStefano Zampini       ierr = MatConvert(pcbddc->coarse_phi_B,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_B);CHKERRQ(ierr);
3695c042a7c3SStefano Zampini       ierr = MatCreateSeqDense(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_size,coarse_submat_vals,&coarse_sub_mat);CHKERRQ(ierr);
3696c042a7c3SStefano Zampini       ierr = MatConvert(coarse_sub_mat,checkmattype,MAT_REUSE_MATRIX,&coarse_sub_mat);CHKERRQ(ierr);
36970c7d97c5SJed Brown 
36980c7d97c5SJed Brown       ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
36990c7d97c5SJed Brown       ierr = PetscViewerASCIIPrintf(viewer,"Check coarse sub mat and local basis functions\n");CHKERRQ(ierr);
37000c7d97c5SJed Brown       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
370153cdbc3dSStefano Zampini       ierr = MatPtAP(A_II,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&TM1);CHKERRQ(ierr);
370253cdbc3dSStefano Zampini       ierr = MatPtAP(A_BB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&TM2);CHKERRQ(ierr);
370353cdbc3dSStefano Zampini       ierr = MatMatMult(A_IB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr);
3704c042a7c3SStefano Zampini       ierr = MatTransposeMatMult(coarse_phi_D,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM3);CHKERRQ(ierr);
370553cdbc3dSStefano Zampini       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
370653cdbc3dSStefano Zampini       ierr = MatMatMult(A_BI,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr);
3707c042a7c3SStefano Zampini       ierr = MatTransposeMatMult(coarse_phi_B,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM4);CHKERRQ(ierr);
370853cdbc3dSStefano Zampini       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
370953cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,one,TM2,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
371053cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,one,TM3,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
371153cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,one,TM4,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
371253cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,m_one,coarse_sub_mat,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
371353cdbc3dSStefano Zampini       ierr = MatNorm(TM1,NORM_INFINITY,&value);CHKERRQ(ierr);
37140c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"----------------------------------\n");CHKERRQ(ierr);
37150c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d \n",PetscGlobalRank);CHKERRQ(ierr);
37160c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"matrix error = % 1.14e\n",value);CHKERRQ(ierr);
37170c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"coarse functions errors\n");CHKERRQ(ierr);
371853cdbc3dSStefano Zampini       for (i=0; i<pcbddc->local_primal_size; i++) { ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local %02d-th function error = % 1.14e\n",i,coarsefunctions_errors[i]);CHKERRQ(ierr); }
37190c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"constraints errors\n");CHKERRQ(ierr);
372053cdbc3dSStefano Zampini       for (i=0; i<pcbddc->local_primal_size; i++) { ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local %02d-th function error = % 1.14e\n",i,constraints_errors[i]);CHKERRQ(ierr); }
37210c7d97c5SJed Brown       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
372253cdbc3dSStefano Zampini       ierr = MatDestroy(&A_II);CHKERRQ(ierr);
372353cdbc3dSStefano Zampini       ierr = MatDestroy(&A_BB);CHKERRQ(ierr);
372453cdbc3dSStefano Zampini       ierr = MatDestroy(&A_IB);CHKERRQ(ierr);
372553cdbc3dSStefano Zampini       ierr = MatDestroy(&A_BI);CHKERRQ(ierr);
372653cdbc3dSStefano Zampini       ierr = MatDestroy(&TM1);CHKERRQ(ierr);
372753cdbc3dSStefano Zampini       ierr = MatDestroy(&TM2);CHKERRQ(ierr);
372853cdbc3dSStefano Zampini       ierr = MatDestroy(&TM3);CHKERRQ(ierr);
372953cdbc3dSStefano Zampini       ierr = MatDestroy(&TM4);CHKERRQ(ierr);
373053cdbc3dSStefano Zampini       ierr = MatDestroy(&coarse_phi_D);CHKERRQ(ierr);
373153cdbc3dSStefano Zampini       ierr = MatDestroy(&coarse_sub_mat);CHKERRQ(ierr);
373253cdbc3dSStefano Zampini       ierr = MatDestroy(&coarse_phi_B);CHKERRQ(ierr);
37330c7d97c5SJed Brown       ierr = PetscFree(coarsefunctions_errors);CHKERRQ(ierr);
37340c7d97c5SJed Brown       ierr = PetscFree(constraints_errors);CHKERRQ(ierr);
37350c7d97c5SJed Brown     }
37360c7d97c5SJed Brown     /* free memory */
37373b03a366Sstefano_zampini     if (n_vertices) {
37380c7d97c5SJed Brown       ierr = VecDestroy(&vec1_V);CHKERRQ(ierr);
37390c7d97c5SJed Brown       ierr = VecDestroy(&vec2_V);CHKERRQ(ierr);
37400c7d97c5SJed Brown       ierr = MatDestroy(&A_RV);CHKERRQ(ierr);
37410c7d97c5SJed Brown       ierr = MatDestroy(&A_VR);CHKERRQ(ierr);
37420c7d97c5SJed Brown       ierr = MatDestroy(&A_VV);CHKERRQ(ierr);
37430c7d97c5SJed Brown     }
3744534831adSStefano Zampini     if (n_constraints) {
37450c7d97c5SJed Brown       ierr = VecDestroy(&vec1_C);CHKERRQ(ierr);
37460c7d97c5SJed Brown       ierr = VecDestroy(&vec2_C);CHKERRQ(ierr);
37470c7d97c5SJed Brown       ierr = MatDestroy(&M1);CHKERRQ(ierr);
37480c7d97c5SJed Brown       ierr = MatDestroy(&C_CR);CHKERRQ(ierr);
37490c7d97c5SJed Brown     }
3750a929c220SStefano Zampini     ierr = PetscFree(auxindices);CHKERRQ(ierr);
3751a929c220SStefano Zampini     ierr = PetscFree(nnz);CHKERRQ(ierr);
3752a929c220SStefano Zampini     /* create coarse matrix and data structures for message passing associated with the actual choice of coarse problem type */
3753a929c220SStefano Zampini     ierr = PCBDDCSetupCoarseEnvironment(pc,coarse_submat_vals);CHKERRQ(ierr);
3754a929c220SStefano Zampini     ierr = PetscFree(coarse_submat_vals);CHKERRQ(ierr);
37550c7d97c5SJed Brown   }
37560c7d97c5SJed Brown   /* free memory */
37573b03a366Sstefano_zampini   if (n_vertices) {
37580c7d97c5SJed Brown     ierr = PetscFree(idx_V_B);CHKERRQ(ierr);
37590c7d97c5SJed Brown     ierr = ISDestroy(&is_V_local);CHKERRQ(ierr);
37600c7d97c5SJed Brown   }
37610c7d97c5SJed Brown   ierr = ISDestroy(&is_R_local);CHKERRQ(ierr);
37620c7d97c5SJed Brown   PetscFunctionReturn(0);
37630c7d97c5SJed Brown }
37640c7d97c5SJed Brown 
37650c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
37660c7d97c5SJed Brown 
37670c7d97c5SJed Brown #undef __FUNCT__
37680c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetupCoarseEnvironment"
376953cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetupCoarseEnvironment(PC pc,PetscScalar* coarse_submat_vals)
37700c7d97c5SJed Brown {
37710c7d97c5SJed Brown   Mat_IS   *matis    = (Mat_IS*)pc->pmat->data;
37720c7d97c5SJed Brown   PC_BDDC  *pcbddc   = (PC_BDDC*)pc->data;
37730c7d97c5SJed Brown   PC_IS    *pcis     = (PC_IS*)pc->data;
37740c7d97c5SJed Brown   MPI_Comm prec_comm = ((PetscObject)pc)->comm;
37750c7d97c5SJed Brown   MPI_Comm coarse_comm;
37760c7d97c5SJed Brown 
37770c7d97c5SJed Brown   /* common to all choices */
37780c7d97c5SJed Brown   PetscScalar *temp_coarse_mat_vals;
37790c7d97c5SJed Brown   PetscScalar *ins_coarse_mat_vals;
37800c7d97c5SJed Brown   PetscInt    *ins_local_primal_indices;
37810c7d97c5SJed Brown   PetscMPIInt *localsizes2,*localdispl2;
37820c7d97c5SJed Brown   PetscMPIInt size_prec_comm;
37830c7d97c5SJed Brown   PetscMPIInt rank_prec_comm;
37840c7d97c5SJed Brown   PetscMPIInt active_rank=MPI_PROC_NULL;
37850c7d97c5SJed Brown   PetscMPIInt master_proc=0;
37860c7d97c5SJed Brown   PetscInt    ins_local_primal_size;
3787*2fa5cd67SKarl Rupp 
37880c7d97c5SJed Brown   /* specific to MULTILEVEL_BDDC */
37890c7d97c5SJed Brown   PetscMPIInt            *ranks_recv;
37900c7d97c5SJed Brown   PetscMPIInt            count_recv=0;
37910c7d97c5SJed Brown   PetscMPIInt            rank_coarse_proc_send_to;
37920c7d97c5SJed Brown   PetscMPIInt            coarse_color = MPI_UNDEFINED;
37930c7d97c5SJed Brown   ISLocalToGlobalMapping coarse_ISLG;
3794*2fa5cd67SKarl Rupp 
37950c7d97c5SJed Brown   /* some other variables */
37960c7d97c5SJed Brown   PetscErrorCode ierr;
379719fd82e9SBarry Smith   MatType        coarse_mat_type;
379819fd82e9SBarry Smith   PCType         coarse_pc_type;
379919fd82e9SBarry Smith   KSPType        coarse_ksp_type;
380053cdbc3dSStefano Zampini   PC             pc_temp;
38014fad6a16SStefano Zampini   PetscInt       i,j,k;
38023b03a366Sstefano_zampini   PetscInt       max_it_coarse_ksp=1;          /* don't increase this value */
3803*2fa5cd67SKarl Rupp 
3804e269702eSStefano Zampini   /* verbose output viewer */
3805e269702eSStefano Zampini   PetscViewer viewer   = pcbddc->dbg_viewer;
3806e269702eSStefano Zampini   PetscBool   dbg_flag = pcbddc->dbg_flag;
3807142dfd88SStefano Zampini 
3808ea7e1babSStefano Zampini   PetscInt    offset,offset2;
3809a929c220SStefano Zampini   PetscMPIInt im_active,active_procs;
3810523858cfSStefano Zampini   PetscInt    *dnz,*onz;
3811142dfd88SStefano Zampini 
3812142dfd88SStefano Zampini   PetscBool setsym,issym=PETSC_FALSE;
38130c7d97c5SJed Brown 
38140c7d97c5SJed Brown   PetscFunctionBegin;
38150c7d97c5SJed Brown   ins_local_primal_indices = 0;
38160c7d97c5SJed Brown   ins_coarse_mat_vals      = 0;
38170c7d97c5SJed Brown   localsizes2              = 0;
38180c7d97c5SJed Brown   localdispl2              = 0;
38190c7d97c5SJed Brown   temp_coarse_mat_vals     = 0;
38200c7d97c5SJed Brown   coarse_ISLG              = 0;
38210c7d97c5SJed Brown 
382253cdbc3dSStefano Zampini   ierr = MPI_Comm_size(prec_comm,&size_prec_comm);CHKERRQ(ierr);
382353cdbc3dSStefano Zampini   ierr = MPI_Comm_rank(prec_comm,&rank_prec_comm);CHKERRQ(ierr);
3824142dfd88SStefano Zampini   ierr = MatIsSymmetricKnown(pc->pmat,&setsym,&issym);CHKERRQ(ierr);
3825142dfd88SStefano Zampini 
3826beed3852SStefano Zampini   /* Assign global numbering to coarse dofs */
3827beed3852SStefano Zampini   {
3828ef028eecSStefano Zampini     PetscInt    *auxlocal_primal;
3829da1bb401SStefano Zampini     PetscInt    *row_cmat_indices;
38302e8d2280SStefano Zampini     PetscInt    *aux_ordering;
38312e8d2280SStefano Zampini     PetscInt    *row_cmat_global_indices;
3832ef028eecSStefano Zampini     PetscInt    *dof_sizes,*dof_displs;
38333b03a366Sstefano_zampini     PetscInt    size_of_constraint;
38342e8d2280SStefano Zampini     PetscBool   *array_bool;
3835ef028eecSStefano Zampini     PetscBool   first_found;
3836ef028eecSStefano Zampini     PetscInt    first_index,old_index,s;
3837ef028eecSStefano Zampini     PetscMPIInt mpi_local_primal_size;
3838ef028eecSStefano Zampini     PetscScalar coarsesum,*array;
3839ef028eecSStefano Zampini 
3840ef028eecSStefano Zampini     mpi_local_primal_size = (PetscMPIInt)pcbddc->local_primal_size;
3841beed3852SStefano Zampini 
3842beed3852SStefano Zampini     /* Construct needed data structures for message passing */
3843ef028eecSStefano Zampini     ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscInt),&pcbddc->local_primal_indices);CHKERRQ(ierr);
3844ffe5efe1SStefano Zampini     j = 0;
3845142dfd88SStefano Zampini     if (rank_prec_comm == 0 || pcbddc->coarse_problem_type == REPLICATED_BDDC || pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
3846ffe5efe1SStefano Zampini       j = size_prec_comm;
3847ffe5efe1SStefano Zampini     }
3848ffe5efe1SStefano Zampini     ierr = PetscMalloc(j*sizeof(PetscMPIInt),&pcbddc->local_primal_sizes);CHKERRQ(ierr);
3849ffe5efe1SStefano Zampini     ierr = PetscMalloc(j*sizeof(PetscMPIInt),&pcbddc->local_primal_displacements);CHKERRQ(ierr);
3850beed3852SStefano Zampini     /* Gather local_primal_size information for all processes  */
3851142dfd88SStefano Zampini     if (pcbddc->coarse_problem_type == REPLICATED_BDDC || pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
38525619798eSStefano Zampini       ierr = MPI_Allgather(&mpi_local_primal_size,1,MPIU_INT,&pcbddc->local_primal_sizes[0],1,MPIU_INT,prec_comm);CHKERRQ(ierr);
3853ffe5efe1SStefano Zampini     } else {
3854ffe5efe1SStefano Zampini       ierr = MPI_Gather(&mpi_local_primal_size,1,MPIU_INT,&pcbddc->local_primal_sizes[0],1,MPIU_INT,0,prec_comm);CHKERRQ(ierr);
3855ffe5efe1SStefano Zampini     }
3856beed3852SStefano Zampini     pcbddc->replicated_primal_size = 0;
3857ffe5efe1SStefano Zampini     for (i=0; i<j; i++) {
3858beed3852SStefano Zampini       pcbddc->local_primal_displacements[i] = pcbddc->replicated_primal_size;
3859beed3852SStefano Zampini       pcbddc->replicated_primal_size       += pcbddc->local_primal_sizes[i];
3860beed3852SStefano Zampini     }
3861beed3852SStefano Zampini 
3862da1bb401SStefano Zampini     /* First let's count coarse dofs.
3863beed3852SStefano Zampini        This code fragment assumes that the number of local constraints per connected component
3864beed3852SStefano Zampini        is not greater than the number of nodes defined for the connected component
3865beed3852SStefano Zampini        (otherwise we will surely have linear dependence between constraints and thus a singular coarse problem) */
3866ef028eecSStefano Zampini     ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscInt),&auxlocal_primal);CHKERRQ(ierr);
38672e8d2280SStefano Zampini     j    = 0;
38682e8d2280SStefano Zampini     for (i=0; i<pcbddc->local_primal_size; i++) {
38692e8d2280SStefano Zampini       ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr);
3870*2fa5cd67SKarl Rupp       if (j < size_of_constraint) j = size_of_constraint;
38712e8d2280SStefano Zampini       ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr);
38722e8d2280SStefano Zampini     }
38732e8d2280SStefano Zampini     ierr = PetscMalloc(j*sizeof(PetscInt),&aux_ordering);CHKERRQ(ierr);
38742e8d2280SStefano Zampini     ierr = PetscMalloc(j*sizeof(PetscInt),&row_cmat_global_indices);CHKERRQ(ierr);
38752e8d2280SStefano Zampini     ierr = PetscMalloc(pcis->n*sizeof(PetscBool),&array_bool);CHKERRQ(ierr);
3876*2fa5cd67SKarl Rupp     for (i=0;i<pcis->n;i++) array_bool[i] = PETSC_FALSE;
3877*2fa5cd67SKarl Rupp 
3878da1bb401SStefano Zampini     for (i=0;i<pcbddc->local_primal_size;i++) {
3879da1bb401SStefano Zampini       ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
3880*2fa5cd67SKarl Rupp       for (j=0; j<size_of_constraint; j++) aux_ordering[j] = j;
3881*2fa5cd67SKarl Rupp 
38822e8d2280SStefano Zampini       ierr = ISLocalToGlobalMappingApply(matis->mapping,size_of_constraint,row_cmat_indices,row_cmat_global_indices);CHKERRQ(ierr);
38832e8d2280SStefano Zampini       ierr = PetscSortIntWithPermutation(size_of_constraint,row_cmat_global_indices,aux_ordering);CHKERRQ(ierr);
38842e8d2280SStefano Zampini       for (j=0; j<size_of_constraint; j++) {
38852e8d2280SStefano Zampini         k = row_cmat_indices[aux_ordering[j]];
38862e8d2280SStefano Zampini         if (!array_bool[k]) {
38872e8d2280SStefano Zampini           array_bool[k]      = PETSC_TRUE;
3888da1bb401SStefano Zampini           auxlocal_primal[i] = k;
3889beed3852SStefano Zampini           break;
3890beed3852SStefano Zampini         }
3891beed3852SStefano Zampini       }
3892da1bb401SStefano Zampini       ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
3893beed3852SStefano Zampini     }
38942e8d2280SStefano Zampini     ierr = PetscFree(aux_ordering);CHKERRQ(ierr);
3895ef028eecSStefano Zampini     ierr = PetscFree(array_bool);CHKERRQ(ierr);
3896ef028eecSStefano Zampini     ierr = PetscFree(row_cmat_global_indices);CHKERRQ(ierr);
38972e8d2280SStefano Zampini 
3898ef028eecSStefano Zampini     /* Compute number of coarse dofs */
3899ef028eecSStefano Zampini     ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
3900ef028eecSStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3901*2fa5cd67SKarl Rupp     for (i=0;i<pcbddc->local_primal_size;i++) array[auxlocal_primal[i]] = 1.0;
3902ef028eecSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3903ef028eecSStefano Zampini     ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
3904ef028eecSStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3905ef028eecSStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3906ef028eecSStefano Zampini     ierr = VecSum(pcis->vec1_global,&coarsesum);CHKERRQ(ierr);
3907ef028eecSStefano Zampini     pcbddc->coarse_size = (PetscInt)coarsesum;
3908ef028eecSStefano Zampini 
3909ef028eecSStefano Zampini     /* Fill pcis->vec1_global with cumulative function for global numbering */
3910ef028eecSStefano Zampini     ierr        = VecGetArray(pcis->vec1_global,&array);CHKERRQ(ierr);
3911ef028eecSStefano Zampini     ierr        = VecGetLocalSize(pcis->vec1_global,&s);CHKERRQ(ierr);
3912ef028eecSStefano Zampini     k           = 0;
3913ef028eecSStefano Zampini     first_index = -1;
3914ef028eecSStefano Zampini     first_found = PETSC_FALSE;
3915ef028eecSStefano Zampini     for (i=0; i<s; i++) {
3916ef028eecSStefano Zampini       if (!first_found && array[i] > 0.0) {
3917ef028eecSStefano Zampini         first_found = PETSC_TRUE;
3918ef028eecSStefano Zampini         first_index = i;
3919ef028eecSStefano Zampini       }
3920ef028eecSStefano Zampini       k += (PetscInt)array[i];
3921ef028eecSStefano Zampini     }
3922ef028eecSStefano Zampini     j    = (!rank_prec_comm ? size_prec_comm : 0);
3923ef028eecSStefano Zampini     ierr = PetscMalloc(j*sizeof(*dof_sizes),&dof_sizes);CHKERRQ(ierr);
3924ef028eecSStefano Zampini     ierr = PetscMalloc(j*sizeof(*dof_displs),&dof_displs);CHKERRQ(ierr);
3925ef028eecSStefano Zampini     ierr = MPI_Gather(&k,1,MPIU_INT,dof_sizes,1,MPIU_INT,0,prec_comm);CHKERRQ(ierr);
3926ef028eecSStefano Zampini     if (!rank_prec_comm) {
3927ef028eecSStefano Zampini       dof_displs[0]=0;
3928*2fa5cd67SKarl Rupp       for (i=1;i<size_prec_comm;i++) dof_displs[i] = dof_displs[i-1]+dof_sizes[i-1];
3929ef028eecSStefano Zampini     }
3930ef028eecSStefano Zampini     ierr = MPI_Scatter(dof_displs,1,MPIU_INT,&k,1,MPIU_INT,0,prec_comm);CHKERRQ(ierr);
3931ef028eecSStefano Zampini     if (first_found) {
3932ef028eecSStefano Zampini       array[first_index] += k;
3933ef028eecSStefano Zampini       old_index = first_index;
3934ef028eecSStefano Zampini       for (i=first_index+1;i<s;i++) {
3935ef028eecSStefano Zampini         if (array[i] > 0.0) {
3936ef028eecSStefano Zampini           array[i] += array[old_index];
3937ef028eecSStefano Zampini           old_index = i;
3938ef028eecSStefano Zampini         }
3939ef028eecSStefano Zampini       }
3940ef028eecSStefano Zampini     }
3941ef028eecSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_global,&array);CHKERRQ(ierr);
3942ef028eecSStefano Zampini     ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
3943ef028eecSStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3944ef028eecSStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3945ef028eecSStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3946*2fa5cd67SKarl Rupp     for (i=0;i<pcbddc->local_primal_size;i++) pcbddc->local_primal_indices[i] = (PetscInt)array[auxlocal_primal[i]]-1;
3947ef028eecSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3948ef028eecSStefano Zampini     ierr = PetscFree(dof_displs);CHKERRQ(ierr);
3949ef028eecSStefano Zampini     ierr = PetscFree(dof_sizes);CHKERRQ(ierr);
3950ef028eecSStefano Zampini 
3951ef028eecSStefano Zampini     if (dbg_flag) {
39522e8d2280SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
39532e8d2280SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
39542e8d2280SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Check coarse indices\n");CHKERRQ(ierr);
39552e8d2280SStefano Zampini       ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
39562e8d2280SStefano Zampini       ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3957*2fa5cd67SKarl Rupp       for (i=0;i<pcbddc->local_primal_size;i++) array[auxlocal_primal[i]]=1.0;
3958beed3852SStefano Zampini       ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
39592e8d2280SStefano Zampini       ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
3960da1bb401SStefano Zampini       ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3961da1bb401SStefano Zampini       ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3962da1bb401SStefano Zampini       ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3963da1bb401SStefano Zampini       ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3964da1bb401SStefano Zampini       ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
39652e8d2280SStefano Zampini       for (i=0;i<pcis->n;i++) {
39662e8d2280SStefano Zampini         if (array[i] == 1.0) {
39672e8d2280SStefano Zampini           ierr = ISLocalToGlobalMappingApply(matis->mapping,1,&i,&j);CHKERRQ(ierr);
39682e8d2280SStefano Zampini           ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d: WRONG COARSE INDEX %d (local %d)\n",PetscGlobalRank,j,i);CHKERRQ(ierr);
39692e8d2280SStefano Zampini         }
39702e8d2280SStefano Zampini       }
39712e8d2280SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
39722e8d2280SStefano Zampini       for (i=0;i<pcis->n;i++) {
3973*2fa5cd67SKarl Rupp         if (array[i] > 0.0) array[i] = 1.0/array[i];
39742e8d2280SStefano Zampini       }
3975da1bb401SStefano Zampini       ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
39762e8d2280SStefano Zampini       ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
3977da1bb401SStefano Zampini       ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3978da1bb401SStefano Zampini       ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3979da1bb401SStefano Zampini       ierr = VecSum(pcis->vec1_global,&coarsesum);CHKERRQ(ierr);
39802e8d2280SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Size of coarse problem SHOULD be %lf\n",coarsesum);CHKERRQ(ierr);
39812e8d2280SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
39822e8d2280SStefano Zampini     }
3983142dfd88SStefano Zampini     ierr = PetscFree(auxlocal_primal);CHKERRQ(ierr);
39840bdf917eSStefano Zampini   }
39850bdf917eSStefano Zampini 
39862e8d2280SStefano Zampini   if (dbg_flag) {
39877cf533a6SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"Size of coarse problem is %d\n",pcbddc->coarse_size);CHKERRQ(ierr);
39882e8d2280SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
39892e8d2280SStefano Zampini   }
39902e8d2280SStefano Zampini 
3991a929c220SStefano Zampini   im_active = 0;
3992*2fa5cd67SKarl Rupp   if (pcis->n) im_active = 1;
3993a929c220SStefano Zampini   ierr = MPI_Allreduce(&im_active,&active_procs,1,MPIU_INT,MPI_SUM,prec_comm);CHKERRQ(ierr);
39940bdf917eSStefano Zampini 
39950bdf917eSStefano Zampini   /* adapt coarse problem type */
39964fad6a16SStefano Zampini   if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
39974fad6a16SStefano Zampini     if (pcbddc->current_level < pcbddc->max_levels) {
3998a929c220SStefano Zampini       if ((active_procs/pcbddc->coarsening_ratio) < 2) {
39990bdf917eSStefano Zampini         if (dbg_flag) {
4000a929c220SStefano Zampini           ierr = PetscViewerASCIIPrintf(viewer,"Not enough active processes on level %d (active %d,ratio %d). Parallel direct solve for coarse problem\n",pcbddc->current_level,active_procs,pcbddc->coarsening_ratio);CHKERRQ(ierr);
40010bdf917eSStefano Zampini           ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
40020bdf917eSStefano Zampini         }
40030bdf917eSStefano Zampini         pcbddc->coarse_problem_type = PARALLEL_BDDC;
4004142dfd88SStefano Zampini       }
40054fad6a16SStefano Zampini     } else {
40064fad6a16SStefano Zampini       if (dbg_flag) {
4007a929c220SStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"Max number of levels reached. Using parallel direct solve for coarse problem\n",pcbddc->max_levels,active_procs,pcbddc->coarsening_ratio);CHKERRQ(ierr);
40084fad6a16SStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
40094fad6a16SStefano Zampini       }
40104fad6a16SStefano Zampini       pcbddc->coarse_problem_type = PARALLEL_BDDC;
40114fad6a16SStefano Zampini     }
40124fad6a16SStefano Zampini   }
4013beed3852SStefano Zampini 
40140c7d97c5SJed Brown   switch (pcbddc->coarse_problem_type) {
40150c7d97c5SJed Brown 
4016da1bb401SStefano Zampini   case (MULTILEVEL_BDDC):    /* we define a coarse mesh where subdomains are elements */
40170c7d97c5SJed Brown   {
40180c7d97c5SJed Brown     /* we need additional variables */
40190c7d97c5SJed Brown     MetisInt    n_subdomains,n_parts,objval,ncon,faces_nvtxs;
40200c7d97c5SJed Brown     MetisInt    *metis_coarse_subdivision;
40210c7d97c5SJed Brown     MetisInt    options[METIS_NOPTIONS];
40220c7d97c5SJed Brown     PetscMPIInt size_coarse_comm,rank_coarse_comm;
40230c7d97c5SJed Brown     PetscMPIInt procs_jumps_coarse_comm;
40240c7d97c5SJed Brown     PetscMPIInt *coarse_subdivision;
40250c7d97c5SJed Brown     PetscMPIInt *total_count_recv;
40260c7d97c5SJed Brown     PetscMPIInt *total_ranks_recv;
40270c7d97c5SJed Brown     PetscMPIInt *displacements_recv;
40280c7d97c5SJed Brown     PetscMPIInt *my_faces_connectivity;
40290c7d97c5SJed Brown     PetscMPIInt *petsc_faces_adjncy;
40300c7d97c5SJed Brown     MetisInt    *faces_adjncy;
40310c7d97c5SJed Brown     MetisInt    *faces_xadj;
40320c7d97c5SJed Brown     PetscMPIInt *number_of_faces;
40330c7d97c5SJed Brown     PetscMPIInt *faces_displacements;
40340c7d97c5SJed Brown     PetscInt    *array_int;
40350c7d97c5SJed Brown     PetscMPIInt my_faces   =0;
40360c7d97c5SJed Brown     PetscMPIInt total_faces=0;
40373828260eSStefano Zampini     PetscInt    ranks_stretching_ratio;
40380c7d97c5SJed Brown 
40390c7d97c5SJed Brown     /* define some quantities */
40400c7d97c5SJed Brown     pcbddc->coarse_communications_type = SCATTERS_BDDC;
40410c7d97c5SJed Brown     coarse_mat_type                    = MATIS;
40420c7d97c5SJed Brown     coarse_pc_type                     = PCBDDC;
4043142dfd88SStefano Zampini     coarse_ksp_type                    = KSPRICHARDSON;
40440c7d97c5SJed Brown 
40450c7d97c5SJed Brown     /* details of coarse decomposition */
4046a929c220SStefano Zampini     n_subdomains            = active_procs;
40470c7d97c5SJed Brown     n_parts                 = n_subdomains/pcbddc->coarsening_ratio;
4048a929c220SStefano Zampini     ranks_stretching_ratio  = size_prec_comm/active_procs;
40493828260eSStefano Zampini     procs_jumps_coarse_comm = pcbddc->coarsening_ratio*ranks_stretching_ratio;
40503828260eSStefano Zampini 
4051a929c220SStefano Zampini #if 0
4052a929c220SStefano Zampini     PetscMPIInt     *old_ranks;
4053a929c220SStefano Zampini     PetscInt        *new_ranks,*jj,*ii;
4054a929c220SStefano Zampini     MatPartitioning mat_part;
4055a929c220SStefano Zampini     IS              coarse_new_decomposition,is_numbering;
4056a929c220SStefano Zampini     PetscViewer     viewer_test;
4057a929c220SStefano Zampini     MPI_Comm        test_coarse_comm;
4058a929c220SStefano Zampini     PetscMPIInt     test_coarse_color;
4059a929c220SStefano Zampini     Mat             mat_adj;
4060a929c220SStefano Zampini     /* Create new communicator for coarse problem splitting the old one */
4061a929c220SStefano Zampini     /* procs with coarse_color = MPI_UNDEFINED will have coarse_comm = MPI_COMM_NULL (from mpi standards)
4062a929c220SStefano Zampini        key = rank_prec_comm -> keep same ordering of ranks from the old to the new communicator */
4063a929c220SStefano Zampini     test_coarse_color = (im_active ? 0 : MPI_UNDEFINED);
4064a929c220SStefano Zampini     test_coarse_comm  = MPI_COMM_NULL;
4065a929c220SStefano Zampini     ierr              = MPI_Comm_split(prec_comm,test_coarse_color,rank_prec_comm,&test_coarse_comm);CHKERRQ(ierr);
4066a929c220SStefano Zampini     if (im_active) {
4067a929c220SStefano Zampini       ierr = PetscMalloc(n_subdomains*sizeof(PetscMPIInt),&old_ranks);
4068a929c220SStefano Zampini       ierr = PetscMalloc(size_prec_comm*sizeof(PetscInt),&new_ranks);
4069a929c220SStefano Zampini       ierr = MPI_Comm_rank(test_coarse_comm,&rank_coarse_comm);CHKERRQ(ierr);
4070a929c220SStefano Zampini       ierr = MPI_Comm_size(test_coarse_comm,&j);CHKERRQ(ierr);
4071a929c220SStefano Zampini       ierr = MPI_Allgather(&rank_prec_comm,1,MPIU_INT,old_ranks,1,MPIU_INT,test_coarse_comm);CHKERRQ(ierr);
4072*2fa5cd67SKarl Rupp       for (i=0; i<size_prec_comm; i++)
4073a929c220SStefano Zampini         new_ranks[i] = -1;
4074*2fa5cd67SKarl Rupp       for (i=0; i<n_subdomains; i++)
4075a929c220SStefano Zampini         new_ranks[old_ranks[i]] = i;
4076a929c220SStefano Zampini       ierr = PetscViewerASCIIOpen(test_coarse_comm,"test_mat_part.out",&viewer_test);CHKERRQ(ierr);
4077a929c220SStefano Zampini       k    = pcis->n_neigh-1;
4078a929c220SStefano Zampini       ierr = PetscMalloc(2*sizeof(PetscInt),&ii);
4079a929c220SStefano Zampini       ii[0]=0;
4080a929c220SStefano Zampini       ii[1]=k;
4081a929c220SStefano Zampini       ierr = PetscMalloc(k*sizeof(PetscInt),&jj);
4082*2fa5cd67SKarl Rupp       for (i=0; i<k; i++)
4083a929c220SStefano Zampini         jj[i]=new_ranks[pcis->neigh[i+1]];
4084a929c220SStefano Zampini       ierr = PetscSortInt(k,jj);CHKERRQ(ierr);
4085a929c220SStefano Zampini       ierr = MatCreateMPIAdj(test_coarse_comm,1,n_subdomains,ii,jj,PETSC_NULL,&mat_adj);CHKERRQ(ierr);
4086a929c220SStefano Zampini       ierr = MatView(mat_adj,viewer_test);CHKERRQ(ierr);
4087a929c220SStefano Zampini       ierr = MatPartitioningCreate(test_coarse_comm,&mat_part);CHKERRQ(ierr);
4088a929c220SStefano Zampini       ierr = MatPartitioningSetAdjacency(mat_part,mat_adj);CHKERRQ(ierr);
4089a929c220SStefano Zampini       ierr = MatPartitioningSetFromOptions(mat_part);CHKERRQ(ierr);
4090a929c220SStefano Zampini       printf("Setting Nparts %d\n",n_parts);
4091a929c220SStefano Zampini       ierr = MatPartitioningSetNParts(mat_part,n_parts);CHKERRQ(ierr);
4092a929c220SStefano Zampini       ierr = MatPartitioningView(mat_part,viewer_test);CHKERRQ(ierr);
4093a929c220SStefano Zampini       ierr = MatPartitioningApply(mat_part,&coarse_new_decomposition);CHKERRQ(ierr);
4094a929c220SStefano Zampini       ierr = ISView(coarse_new_decomposition,viewer_test);CHKERRQ(ierr);
4095a929c220SStefano Zampini       ierr = ISPartitioningToNumbering(coarse_new_decomposition,&is_numbering);CHKERRQ(ierr);
4096a929c220SStefano Zampini       ierr = ISView(is_numbering,viewer_test);CHKERRQ(ierr);
4097a929c220SStefano Zampini       ierr = PetscViewerDestroy(&viewer_test);CHKERRQ(ierr);
4098a929c220SStefano Zampini       ierr = ISDestroy(&coarse_new_decomposition);CHKERRQ(ierr);
4099a929c220SStefano Zampini       ierr = ISDestroy(&is_numbering);CHKERRQ(ierr);
4100a929c220SStefano Zampini       ierr = MatPartitioningDestroy(&mat_part);CHKERRQ(ierr);
4101a929c220SStefano Zampini       ierr = PetscFree(old_ranks);CHKERRQ(ierr);
4102a929c220SStefano Zampini       ierr = PetscFree(new_ranks);CHKERRQ(ierr);
4103a929c220SStefano Zampini       ierr = MPI_Comm_free(&test_coarse_comm);CHKERRQ(ierr);
4104a929c220SStefano Zampini     }
4105a929c220SStefano Zampini #endif
4106a929c220SStefano Zampini 
41074fad6a16SStefano Zampini     /* build CSR graph of subdomains' connectivity */
41080c7d97c5SJed Brown     ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&array_int);CHKERRQ(ierr);
41093828260eSStefano Zampini     ierr = PetscMemzero(array_int,pcis->n*sizeof(PetscInt));CHKERRQ(ierr);
41100c7d97c5SJed Brown     for (i=1;i<pcis->n_neigh;i++) {/* i=1 so I don't count myself -> faces nodes counts to 1 */
41110c7d97c5SJed Brown       for (j=0;j<pcis->n_shared[i];j++) {
41120c7d97c5SJed Brown         array_int[pcis->shared[i][j]]+=1;
41130c7d97c5SJed Brown       }
41140c7d97c5SJed Brown     }
41150c7d97c5SJed Brown     for (i=1;i<pcis->n_neigh;i++) {
41160c7d97c5SJed Brown       for (j=0;j<pcis->n_shared[i];j++) {
41177cf533a6SStefano Zampini         if (array_int[pcis->shared[i][j]] > 0) {
41180c7d97c5SJed Brown           my_faces++;
41190c7d97c5SJed Brown           break;
41200c7d97c5SJed Brown         }
41210c7d97c5SJed Brown       }
41220c7d97c5SJed Brown     }
41230c7d97c5SJed Brown 
412453cdbc3dSStefano Zampini     ierr = MPI_Reduce(&my_faces,&total_faces,1,MPIU_INT,MPI_SUM,master_proc,prec_comm);CHKERRQ(ierr);
41250c7d97c5SJed Brown     ierr = PetscMalloc (my_faces*sizeof(PetscInt),&my_faces_connectivity);CHKERRQ(ierr);
41260c7d97c5SJed Brown     my_faces=0;
41270c7d97c5SJed Brown     for (i=1;i<pcis->n_neigh;i++) {
41280c7d97c5SJed Brown       for (j=0;j<pcis->n_shared[i];j++) {
41297cf533a6SStefano Zampini         if (array_int[pcis->shared[i][j]] > 0) {
41300c7d97c5SJed Brown           my_faces_connectivity[my_faces]=pcis->neigh[i];
41310c7d97c5SJed Brown           my_faces++;
41320c7d97c5SJed Brown           break;
41330c7d97c5SJed Brown         }
41340c7d97c5SJed Brown       }
41350c7d97c5SJed Brown     }
41360c7d97c5SJed Brown     if (rank_prec_comm == master_proc) {
41370c7d97c5SJed Brown       ierr = PetscMalloc (total_faces*sizeof(PetscMPIInt),&petsc_faces_adjncy);CHKERRQ(ierr);
41380c7d97c5SJed Brown       ierr = PetscMalloc (size_prec_comm*sizeof(PetscMPIInt),&number_of_faces);CHKERRQ(ierr);
41390c7d97c5SJed Brown       ierr = PetscMalloc (total_faces*sizeof(MetisInt),&faces_adjncy);CHKERRQ(ierr);
41400c7d97c5SJed Brown       ierr = PetscMalloc ((n_subdomains+1)*sizeof(MetisInt),&faces_xadj);CHKERRQ(ierr);
41410c7d97c5SJed Brown       ierr = PetscMalloc ((size_prec_comm+1)*sizeof(PetscMPIInt),&faces_displacements);CHKERRQ(ierr);
41420c7d97c5SJed Brown     }
414353cdbc3dSStefano Zampini     ierr = MPI_Gather(&my_faces,1,MPIU_INT,&number_of_faces[0],1,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
41440c7d97c5SJed Brown     if (rank_prec_comm == master_proc) {
41450c7d97c5SJed Brown       faces_xadj[0]          = 0;
41460c7d97c5SJed Brown       faces_displacements[0] = 0;
4147*2fa5cd67SKarl Rupp 
41480c7d97c5SJed Brown       j=0;
41490c7d97c5SJed Brown       for (i=1;i<size_prec_comm+1;i++) {
41500c7d97c5SJed Brown         faces_displacements[i]=faces_displacements[i-1]+number_of_faces[i-1];
41510c7d97c5SJed Brown         if (number_of_faces[i-1]) {
41520c7d97c5SJed Brown           j++;
41530c7d97c5SJed Brown           faces_xadj[j]=faces_xadj[j-1]+number_of_faces[i-1];
41540c7d97c5SJed Brown         }
41550c7d97c5SJed Brown       }
41560c7d97c5SJed Brown     }
415753cdbc3dSStefano Zampini     ierr = MPI_Gatherv(&my_faces_connectivity[0],my_faces,MPIU_INT,&petsc_faces_adjncy[0],number_of_faces,faces_displacements,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
41580c7d97c5SJed Brown     ierr = PetscFree(my_faces_connectivity);CHKERRQ(ierr);
41590c7d97c5SJed Brown     ierr = PetscFree(array_int);CHKERRQ(ierr);
41600c7d97c5SJed Brown     if (rank_prec_comm == master_proc) {
41613828260eSStefano Zampini       for (i=0; i<total_faces; i++) faces_adjncy[i]=(MetisInt)(petsc_faces_adjncy[i]/ranks_stretching_ratio); /* cast to MetisInt */
41620c7d97c5SJed Brown       ierr = PetscFree(faces_displacements);CHKERRQ(ierr);
41630c7d97c5SJed Brown       ierr = PetscFree(number_of_faces);CHKERRQ(ierr);
41640c7d97c5SJed Brown       ierr = PetscFree(petsc_faces_adjncy);CHKERRQ(ierr);
41650c7d97c5SJed Brown     }
41660c7d97c5SJed Brown 
41670c7d97c5SJed Brown     if (rank_prec_comm == master_proc) {
41683828260eSStefano Zampini       PetscInt heuristic_for_metis=3;
41690c7d97c5SJed Brown       ncon       =1;
41700c7d97c5SJed Brown       faces_nvtxs=n_subdomains;
41710c7d97c5SJed Brown       /* partition graph induced by face connectivity */
41720c7d97c5SJed Brown       ierr = PetscMalloc (n_subdomains*sizeof(MetisInt),&metis_coarse_subdivision);CHKERRQ(ierr);
41730c7d97c5SJed Brown       ierr = METIS_SetDefaultOptions(options);
41740c7d97c5SJed Brown       /* we need a contiguous partition of the coarse mesh */
41750c7d97c5SJed Brown       options[METIS_OPTION_CONTIG]=1;
41760c7d97c5SJed Brown       options[METIS_OPTION_NITER] =30;
41774fad6a16SStefano Zampini       if (pcbddc->coarsening_ratio > 1) {
41783828260eSStefano Zampini         if (n_subdomains>n_parts*heuristic_for_metis) {
41793828260eSStefano Zampini           options[METIS_OPTION_IPTYPE] =METIS_IPTYPE_EDGE;
41803828260eSStefano Zampini           options[METIS_OPTION_OBJTYPE]=METIS_OBJTYPE_CUT;
4181*2fa5cd67SKarl Rupp 
41820c7d97c5SJed Brown           ierr = METIS_PartGraphKway(&faces_nvtxs,&ncon,faces_xadj,faces_adjncy,NULL,NULL,NULL,&n_parts,NULL,NULL,options,&objval,metis_coarse_subdivision);
4183142dfd88SStefano Zampini           if (ierr != METIS_OK) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in METIS_PartGraphKway (metis error code %D) called from PCBDDCSetupCoarseEnvironment\n",ierr);
41843828260eSStefano Zampini         } else {
41853828260eSStefano Zampini           ierr = METIS_PartGraphRecursive(&faces_nvtxs,&ncon,faces_xadj,faces_adjncy,NULL,NULL,NULL,&n_parts,NULL,NULL,options,&objval,metis_coarse_subdivision);
4186142dfd88SStefano Zampini           if (ierr != METIS_OK) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in METIS_PartGraphRecursive (metis error code %D) called from PCBDDCSetupCoarseEnvironment\n",ierr);
41873828260eSStefano Zampini         }
41884fad6a16SStefano Zampini       } else {
4189*2fa5cd67SKarl Rupp         for (i=0;i<n_subdomains;i++) metis_coarse_subdivision[i]=i;
41904fad6a16SStefano Zampini       }
41910c7d97c5SJed Brown       ierr = PetscFree(faces_xadj);CHKERRQ(ierr);
41920c7d97c5SJed Brown       ierr = PetscFree(faces_adjncy);CHKERRQ(ierr);
41930bdf917eSStefano Zampini       ierr = PetscMalloc(size_prec_comm*sizeof(PetscMPIInt),&coarse_subdivision);CHKERRQ(ierr);
4194*2fa5cd67SKarl Rupp 
41950c7d97c5SJed Brown       /* copy/cast values avoiding possible type conflicts between PETSc, MPI and METIS */
4196*2fa5cd67SKarl Rupp       for (i=0;i<size_prec_comm;i++) coarse_subdivision[i]=MPI_PROC_NULL;
4197*2fa5cd67SKarl Rupp       for (i=0;i<n_subdomains;i++) coarse_subdivision[ranks_stretching_ratio*i]=(PetscInt)(metis_coarse_subdivision[i]);
41980c7d97c5SJed Brown       ierr = PetscFree(metis_coarse_subdivision);CHKERRQ(ierr);
41990c7d97c5SJed Brown     }
42000c7d97c5SJed Brown 
42010c7d97c5SJed Brown     /* Create new communicator for coarse problem splitting the old one */
42020c7d97c5SJed Brown     if (!(rank_prec_comm%procs_jumps_coarse_comm) && rank_prec_comm < procs_jumps_coarse_comm*n_parts) {
4203da1bb401SStefano Zampini       coarse_color=0;                /* for communicator splitting */
4204da1bb401SStefano Zampini       active_rank =rank_prec_comm;   /* for insertion of matrix values */
42050c7d97c5SJed Brown     }
4206da1bb401SStefano Zampini     /* procs with coarse_color = MPI_UNDEFINED will have coarse_comm = MPI_COMM_NULL (from mpi standards)
4207da1bb401SStefano Zampini        key = rank_prec_comm -> keep same ordering of ranks from the old to the new communicator */
420853cdbc3dSStefano Zampini     ierr = MPI_Comm_split(prec_comm,coarse_color,rank_prec_comm,&coarse_comm);CHKERRQ(ierr);
42090c7d97c5SJed Brown 
42100c7d97c5SJed Brown     if (coarse_color == 0) {
421153cdbc3dSStefano Zampini       ierr = MPI_Comm_size(coarse_comm,&size_coarse_comm);CHKERRQ(ierr);
421253cdbc3dSStefano Zampini       ierr = MPI_Comm_rank(coarse_comm,&rank_coarse_comm);CHKERRQ(ierr);
42130c7d97c5SJed Brown     } else {
42140c7d97c5SJed Brown       rank_coarse_comm = MPI_PROC_NULL;
42150c7d97c5SJed Brown     }
42160c7d97c5SJed Brown 
42177cf533a6SStefano Zampini     /* master proc takes care of arranging and distributing coarse information */
42180c7d97c5SJed Brown     if (rank_coarse_comm == master_proc) {
42190c7d97c5SJed Brown       ierr = PetscMalloc (size_coarse_comm*sizeof(PetscMPIInt),&displacements_recv);CHKERRQ(ierr);
42200bdf917eSStefano Zampini       ierr = PetscMalloc (size_coarse_comm*sizeof(PetscMPIInt),&total_count_recv);CHKERRQ(ierr);
42210bdf917eSStefano Zampini       ierr = PetscMalloc (n_subdomains*sizeof(PetscMPIInt),&total_ranks_recv);CHKERRQ(ierr);
42220c7d97c5SJed Brown       /* some initializations */
42230c7d97c5SJed Brown       displacements_recv[0]=0;
42240bdf917eSStefano Zampini       ierr = PetscMemzero(total_count_recv,size_coarse_comm*sizeof(PetscMPIInt));CHKERRQ(ierr);
42250c7d97c5SJed Brown       /* count from how many processes the j-th process of the coarse decomposition will receive data */
42260bdf917eSStefano Zampini       for (j=0; j<size_coarse_comm; j++) {
42270bdf917eSStefano Zampini         for (i=0; i<size_prec_comm; i++) {
4228*2fa5cd67SKarl Rupp           if (coarse_subdivision[i]==j) total_count_recv[j]++;
42290bdf917eSStefano Zampini         }
42300bdf917eSStefano Zampini       }
42310c7d97c5SJed Brown       /* displacements needed for scatterv of total_ranks_recv */
4232*2fa5cd67SKarl Rupp       for (i=1; i<size_coarse_comm; i++) displacements_recv[i]=displacements_recv[i-1]+total_count_recv[i-1];
4233*2fa5cd67SKarl Rupp 
42340c7d97c5SJed Brown       /* Now fill properly total_ranks_recv -> each coarse process will receive the ranks (in prec_comm communicator) of its friend (sending) processes */
42350c7d97c5SJed Brown       ierr = PetscMemzero(total_count_recv,size_coarse_comm*sizeof(PetscMPIInt));CHKERRQ(ierr);
42360c7d97c5SJed Brown       for (j=0; j<size_coarse_comm; j++) {
42373828260eSStefano Zampini         for (i=0; i<size_prec_comm; i++) {
42380c7d97c5SJed Brown           if (coarse_subdivision[i]==j) {
42390c7d97c5SJed Brown             total_ranks_recv[displacements_recv[j]+total_count_recv[j]] = i;
4240*2fa5cd67SKarl Rupp 
42413828260eSStefano Zampini             total_count_recv[j] += 1;
42420c7d97c5SJed Brown           }
42430c7d97c5SJed Brown         }
42440c7d97c5SJed Brown       }
4245da1bb401SStefano Zampini       /* for (j=0;j<size_coarse_comm;j++) {
42463828260eSStefano Zampini         printf("process %d in new rank will receive from %d processes (original ranks follows)\n",j,total_count_recv[j]);
42473828260eSStefano Zampini         for (i=0;i<total_count_recv[j];i++) {
42483828260eSStefano Zampini           printf("%d ",total_ranks_recv[displacements_recv[j]+i]);
42493828260eSStefano Zampini         }
42503828260eSStefano Zampini         printf("\n");
4251da1bb401SStefano Zampini       } */
42520c7d97c5SJed Brown 
42530c7d97c5SJed Brown       /* identify new decomposition in terms of ranks in the old communicator */
42540bdf917eSStefano Zampini       for (i=0; i<n_subdomains; i++) {
42550bdf917eSStefano Zampini         coarse_subdivision[ranks_stretching_ratio*i]=coarse_subdivision[ranks_stretching_ratio*i]*procs_jumps_coarse_comm;
42560bdf917eSStefano Zampini       }
4257da1bb401SStefano Zampini       /* printf("coarse_subdivision in old end new ranks\n");
4258*2fa5cd67SKarl Rupp       for (i=0;i<size_prec_comm;i++) {
42593828260eSStefano Zampini         if (coarse_subdivision[i]!=MPI_PROC_NULL) {
42603828260eSStefano Zampini           printf("%d=(%d %d), ",i,coarse_subdivision[i],coarse_subdivision[i]/procs_jumps_coarse_comm);
42613828260eSStefano Zampini         } else {
42623828260eSStefano Zampini           printf("%d=(%d %d), ",i,coarse_subdivision[i],coarse_subdivision[i]);
42633828260eSStefano Zampini         }
4264*2fa5cd67SKarl Rupp       }
4265da1bb401SStefano Zampini       printf("\n"); */
42660c7d97c5SJed Brown     }
42670c7d97c5SJed Brown 
42680c7d97c5SJed Brown     /* Scatter new decomposition for send details */
426953cdbc3dSStefano Zampini     ierr = MPI_Scatter(&coarse_subdivision[0],1,MPIU_INT,&rank_coarse_proc_send_to,1,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
42700c7d97c5SJed Brown     /* Scatter receiving details to members of coarse decomposition */
42710c7d97c5SJed Brown     if (coarse_color == 0) {
427253cdbc3dSStefano Zampini       ierr = MPI_Scatter(&total_count_recv[0],1,MPIU_INT,&count_recv,1,MPIU_INT,master_proc,coarse_comm);CHKERRQ(ierr);
42730c7d97c5SJed Brown       ierr = PetscMalloc (count_recv*sizeof(PetscMPIInt),&ranks_recv);CHKERRQ(ierr);
427453cdbc3dSStefano Zampini       ierr = MPI_Scatterv(&total_ranks_recv[0],total_count_recv,displacements_recv,MPIU_INT,&ranks_recv[0],count_recv,MPIU_INT,master_proc,coarse_comm);CHKERRQ(ierr);
42750c7d97c5SJed Brown     }
42760c7d97c5SJed Brown 
4277da1bb401SStefano Zampini     /* printf("I will send my matrix data to proc  %d\n",rank_coarse_proc_send_to);
4278da1bb401SStefano Zampini     if (coarse_color == 0) {
4279da1bb401SStefano Zampini       printf("I will receive some matrix data from %d processes (ranks follows)\n",count_recv);
4280da1bb401SStefano Zampini       for (i=0;i<count_recv;i++)
4281da1bb401SStefano Zampini         printf("%d ",ranks_recv[i]);
4282da1bb401SStefano Zampini       printf("\n");
4283da1bb401SStefano Zampini     } */
42840c7d97c5SJed Brown 
42850c7d97c5SJed Brown     if (rank_prec_comm == master_proc) {
42860bdf917eSStefano Zampini       ierr = PetscFree(coarse_subdivision);CHKERRQ(ierr);
4287da1bb401SStefano Zampini       ierr = PetscFree(total_count_recv);CHKERRQ(ierr);
42880bdf917eSStefano Zampini       ierr = PetscFree(total_ranks_recv);CHKERRQ(ierr);
42890c7d97c5SJed Brown       ierr = PetscFree(displacements_recv);CHKERRQ(ierr);
42900c7d97c5SJed Brown     }
42910c7d97c5SJed Brown     break;
42920c7d97c5SJed Brown   }
42930c7d97c5SJed Brown 
42940c7d97c5SJed Brown   case (REPLICATED_BDDC):
42950c7d97c5SJed Brown 
42960c7d97c5SJed Brown     pcbddc->coarse_communications_type = GATHERS_BDDC;
42970c7d97c5SJed Brown     coarse_mat_type                    = MATSEQAIJ;
42980c7d97c5SJed Brown     coarse_pc_type                     = PCLU;
429953cdbc3dSStefano Zampini     coarse_ksp_type                    = KSPPREONLY;
43000c7d97c5SJed Brown     coarse_comm                        = PETSC_COMM_SELF;
43010c7d97c5SJed Brown     active_rank                        = rank_prec_comm;
43020c7d97c5SJed Brown     break;
43030c7d97c5SJed Brown 
43040c7d97c5SJed Brown   case (PARALLEL_BDDC):
43050c7d97c5SJed Brown 
43060c7d97c5SJed Brown     pcbddc->coarse_communications_type = SCATTERS_BDDC;
43070c7d97c5SJed Brown     coarse_mat_type                    = MATMPIAIJ;
43080c7d97c5SJed Brown     coarse_pc_type                     = PCREDUNDANT;
430953cdbc3dSStefano Zampini     coarse_ksp_type                    = KSPPREONLY;
43100c7d97c5SJed Brown     coarse_comm                        = prec_comm;
43110c7d97c5SJed Brown     active_rank                        = rank_prec_comm;
43120c7d97c5SJed Brown     break;
43130c7d97c5SJed Brown 
43140c7d97c5SJed Brown   case (SEQUENTIAL_BDDC):
43150c7d97c5SJed Brown     pcbddc->coarse_communications_type = GATHERS_BDDC;
43160c7d97c5SJed Brown     coarse_mat_type                    = MATSEQAIJ;
43170c7d97c5SJed Brown     coarse_pc_type                     = PCLU;
431853cdbc3dSStefano Zampini     coarse_ksp_type                    = KSPPREONLY;
43190c7d97c5SJed Brown     coarse_comm                        = PETSC_COMM_SELF;
43200c7d97c5SJed Brown     active_rank                        = master_proc;
43210c7d97c5SJed Brown     break;
43220c7d97c5SJed Brown   }
43230c7d97c5SJed Brown 
43240c7d97c5SJed Brown   switch (pcbddc->coarse_communications_type) {
43250c7d97c5SJed Brown 
43260c7d97c5SJed Brown   case(SCATTERS_BDDC):
43270c7d97c5SJed Brown   {
43280c7d97c5SJed Brown     if (pcbddc->coarse_problem_type==MULTILEVEL_BDDC) {
43290c7d97c5SJed Brown 
43302e8d2280SStefano Zampini       IS coarse_IS;
43312e8d2280SStefano Zampini 
4332523858cfSStefano Zampini       if (pcbddc->coarsening_ratio == 1) {
4333523858cfSStefano Zampini         ins_local_primal_size = pcbddc->local_primal_size;
4334523858cfSStefano Zampini         ins_local_primal_indices = pcbddc->local_primal_indices;
4335523858cfSStefano Zampini         if (coarse_color == 0) { ierr = PetscFree(ranks_recv);CHKERRQ(ierr); }
4336523858cfSStefano Zampini         /* nonzeros */
4337523858cfSStefano Zampini         ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&dnz);CHKERRQ(ierr);
4338523858cfSStefano Zampini         ierr = PetscMemzero(dnz,ins_local_primal_size*sizeof(PetscInt));CHKERRQ(ierr);
4339523858cfSStefano Zampini         for (i=0;i<ins_local_primal_size;i++) {
4340523858cfSStefano Zampini           dnz[i] = ins_local_primal_size;
4341523858cfSStefano Zampini         }
4342523858cfSStefano Zampini       } else {
43430c7d97c5SJed Brown         PetscMPIInt send_size;
4344ef028eecSStefano Zampini         PetscMPIInt *send_buffer;
43450c7d97c5SJed Brown         PetscInt    *aux_ins_indices;
43460c7d97c5SJed Brown         PetscInt    ii,jj;
43470c7d97c5SJed Brown         MPI_Request *requests;
4348ef028eecSStefano Zampini 
4349523858cfSStefano Zampini         ierr = PetscMalloc(count_recv*sizeof(PetscMPIInt),&localdispl2);CHKERRQ(ierr);
4350523858cfSStefano Zampini         /* reusing pcbddc->local_primal_displacements and pcbddc->replicated_primal_size */
4351523858cfSStefano Zampini         ierr = PetscFree(pcbddc->local_primal_displacements);CHKERRQ(ierr);
4352523858cfSStefano Zampini         ierr = PetscMalloc((count_recv+1)*sizeof(PetscMPIInt),&pcbddc->local_primal_displacements);CHKERRQ(ierr);
4353523858cfSStefano Zampini         pcbddc->replicated_primal_size = count_recv;
4354523858cfSStefano Zampini         j = 0;
4355523858cfSStefano Zampini         for (i=0;i<count_recv;i++) {
4356523858cfSStefano Zampini           pcbddc->local_primal_displacements[i] = j;
4357523858cfSStefano Zampini           j += pcbddc->local_primal_sizes[ranks_recv[i]];
4358523858cfSStefano Zampini         }
4359523858cfSStefano Zampini         pcbddc->local_primal_displacements[count_recv] = j;
4360523858cfSStefano Zampini         ierr = PetscMalloc(j*sizeof(PetscMPIInt),&pcbddc->replicated_local_primal_indices);CHKERRQ(ierr);
43610c7d97c5SJed Brown         /* allocate auxiliary space */
4362523858cfSStefano Zampini         ierr = PetscMalloc(count_recv*sizeof(PetscMPIInt),&localsizes2);CHKERRQ(ierr);
43630c7d97c5SJed Brown         ierr = PetscMalloc(pcbddc->coarse_size*sizeof(PetscInt),&aux_ins_indices);CHKERRQ(ierr);
43640c7d97c5SJed Brown         ierr = PetscMemzero(aux_ins_indices,pcbddc->coarse_size*sizeof(PetscInt));CHKERRQ(ierr);
43650c7d97c5SJed Brown         /* allocate request storage for message passing */
43660c7d97c5SJed Brown         ierr = PetscMalloc((count_recv+1)*sizeof(MPI_Request),&requests);CHKERRQ(ierr);
4367523858cfSStefano Zampini         for (i=0;i<count_recv+1;i++) { requests[i]=MPI_REQUEST_NULL; }
4368523858cfSStefano Zampini         /* send indices to be inserted */
4369523858cfSStefano Zampini         for (i=0;i<count_recv;i++) {
4370523858cfSStefano Zampini           send_size = pcbddc->local_primal_sizes[ranks_recv[i]];
4371523858cfSStefano Zampini           ierr = MPI_Irecv(&pcbddc->replicated_local_primal_indices[pcbddc->local_primal_displacements[i]],send_size,MPIU_INT,ranks_recv[i],999,prec_comm,&requests[i]);CHKERRQ(ierr);
4372523858cfSStefano Zampini         }
4373523858cfSStefano Zampini         if (rank_coarse_proc_send_to != MPI_PROC_NULL) {
4374523858cfSStefano Zampini           send_size = pcbddc->local_primal_size;
4375ef028eecSStefano Zampini           ierr = PetscMalloc(send_size*sizeof(PetscMPIInt),&send_buffer);CHKERRQ(ierr);
4376ef028eecSStefano Zampini           for (i=0;i<send_size;i++) {
4377ef028eecSStefano Zampini             send_buffer[i]=(PetscMPIInt)pcbddc->local_primal_indices[i];
4378ef028eecSStefano Zampini           }
4379ef028eecSStefano Zampini           ierr = MPI_Isend(send_buffer,send_size,MPIU_INT,rank_coarse_proc_send_to,999,prec_comm,&requests[count_recv]);CHKERRQ(ierr);
4380523858cfSStefano Zampini         }
4381523858cfSStefano Zampini         ierr = MPI_Waitall(count_recv+1,requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4382ef028eecSStefano Zampini         if (rank_coarse_proc_send_to != MPI_PROC_NULL) {
4383ef028eecSStefano Zampini           ierr = PetscFree(send_buffer);CHKERRQ(ierr);
4384ef028eecSStefano Zampini         }
43850c7d97c5SJed Brown         j = 0;
43860c7d97c5SJed Brown         for (i=0;i<count_recv;i++) {
43872e8d2280SStefano Zampini           ii = pcbddc->local_primal_displacements[i+1]-pcbddc->local_primal_displacements[i];
43882e8d2280SStefano Zampini           localsizes2[i] = ii*ii;
43890c7d97c5SJed Brown           localdispl2[i] = j;
43900c7d97c5SJed Brown           j += localsizes2[i];
4391523858cfSStefano Zampini           jj = pcbddc->local_primal_displacements[i];
43924fad6a16SStefano Zampini           /* it counts the coarse subdomains sharing the coarse node */
43932e8d2280SStefano Zampini           for (k=0;k<ii;k++) {
43944fad6a16SStefano Zampini             aux_ins_indices[pcbddc->replicated_local_primal_indices[jj+k]] += 1;
43950c7d97c5SJed Brown           }
43964fad6a16SStefano Zampini         }
4397523858cfSStefano Zampini         /* temp_coarse_mat_vals used to store matrix values to be received */
43980c7d97c5SJed Brown         ierr = PetscMalloc(j*sizeof(PetscScalar),&temp_coarse_mat_vals);CHKERRQ(ierr);
43990c7d97c5SJed Brown         /* evaluate how many values I will insert in coarse mat */
44000c7d97c5SJed Brown         ins_local_primal_size = 0;
4401ea7e1babSStefano Zampini         for (i=0;i<pcbddc->coarse_size;i++) {
4402ea7e1babSStefano Zampini           if (aux_ins_indices[i]) {
44030c7d97c5SJed Brown             ins_local_primal_size++;
4404ea7e1babSStefano Zampini           }
4405ea7e1babSStefano Zampini         }
44060c7d97c5SJed Brown         /* evaluate indices I will insert in coarse mat */
44070c7d97c5SJed Brown         ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr);
44080c7d97c5SJed Brown         j = 0;
4409ea7e1babSStefano Zampini         for (i=0;i<pcbddc->coarse_size;i++) {
4410ea7e1babSStefano Zampini           if (aux_ins_indices[i]) {
44112e8d2280SStefano Zampini             ins_local_primal_indices[j] = i;
44122e8d2280SStefano Zampini             j++;
4413ea7e1babSStefano Zampini           }
4414ea7e1babSStefano Zampini         }
4415523858cfSStefano Zampini         /* processes participating in coarse problem receive matrix data from their friends */
4416523858cfSStefano Zampini         for (i=0;i<count_recv;i++) {
4417523858cfSStefano Zampini           ierr = MPI_Irecv(&temp_coarse_mat_vals[localdispl2[i]],localsizes2[i],MPIU_SCALAR,ranks_recv[i],666,prec_comm,&requests[i]);CHKERRQ(ierr);
4418523858cfSStefano Zampini         }
4419523858cfSStefano Zampini         if (rank_coarse_proc_send_to != MPI_PROC_NULL) {
4420523858cfSStefano Zampini           send_size = pcbddc->local_primal_size*pcbddc->local_primal_size;
4421523858cfSStefano Zampini           ierr = MPI_Isend(&coarse_submat_vals[0],send_size,MPIU_SCALAR,rank_coarse_proc_send_to,666,prec_comm,&requests[count_recv]);CHKERRQ(ierr);
4422523858cfSStefano Zampini         }
4423523858cfSStefano Zampini         ierr = MPI_Waitall(count_recv+1,requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4424523858cfSStefano Zampini         /* nonzeros */
4425523858cfSStefano Zampini         ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&dnz);CHKERRQ(ierr);
4426523858cfSStefano Zampini         ierr = PetscMemzero(dnz,ins_local_primal_size*sizeof(PetscInt));CHKERRQ(ierr);
44270c7d97c5SJed Brown         /* use aux_ins_indices to realize a global to local mapping */
44280c7d97c5SJed Brown         j=0;
44290c7d97c5SJed Brown         for (i=0;i<pcbddc->coarse_size;i++) {
44300c7d97c5SJed Brown           if (aux_ins_indices[i]==0) {
44310c7d97c5SJed Brown             aux_ins_indices[i]=-1;
44320c7d97c5SJed Brown           } else {
44330c7d97c5SJed Brown             aux_ins_indices[i]=j;
44340c7d97c5SJed Brown             j++;
44350c7d97c5SJed Brown           }
44360c7d97c5SJed Brown         }
44374fad6a16SStefano Zampini         for (i=0;i<count_recv;i++) {
4438523858cfSStefano Zampini           j = pcbddc->local_primal_sizes[ranks_recv[i]];
4439523858cfSStefano Zampini           for (k=0;k<j;k++) {
4440523858cfSStefano Zampini             dnz[aux_ins_indices[pcbddc->replicated_local_primal_indices[pcbddc->local_primal_displacements[i]+k]]] += j;
44410c7d97c5SJed Brown           }
44420c7d97c5SJed Brown         }
4443523858cfSStefano Zampini         /* check */
4444523858cfSStefano Zampini         for (i=0;i<ins_local_primal_size;i++) {
4445523858cfSStefano Zampini           if (dnz[i] > ins_local_primal_size) {
4446523858cfSStefano Zampini             dnz[i] = ins_local_primal_size;
44470c7d97c5SJed Brown           }
44480c7d97c5SJed Brown         }
44490c7d97c5SJed Brown         ierr = PetscFree(requests);CHKERRQ(ierr);
44500c7d97c5SJed Brown         ierr = PetscFree(aux_ins_indices);CHKERRQ(ierr);
44510c7d97c5SJed Brown         if (coarse_color == 0) { ierr = PetscFree(ranks_recv);CHKERRQ(ierr); }
44524fad6a16SStefano Zampini       }
44530c7d97c5SJed Brown       /* create local to global mapping needed by coarse MATIS */
4454142dfd88SStefano Zampini       if (coarse_comm != MPI_COMM_NULL) {ierr = MPI_Comm_free(&coarse_comm);CHKERRQ(ierr);}
44550c7d97c5SJed Brown       coarse_comm = prec_comm;
44560c7d97c5SJed Brown       active_rank = rank_prec_comm;
44570c7d97c5SJed Brown       ierr = ISCreateGeneral(coarse_comm,ins_local_primal_size,ins_local_primal_indices,PETSC_COPY_VALUES,&coarse_IS);CHKERRQ(ierr);
44580c7d97c5SJed Brown       ierr = ISLocalToGlobalMappingCreateIS(coarse_IS,&coarse_ISLG);CHKERRQ(ierr);
44590c7d97c5SJed Brown       ierr = ISDestroy(&coarse_IS);CHKERRQ(ierr);
44602e8d2280SStefano Zampini     } else if (pcbddc->coarse_problem_type==PARALLEL_BDDC) {
44610c7d97c5SJed Brown       /* arrays for values insertion */
44620c7d97c5SJed Brown       ins_local_primal_size = pcbddc->local_primal_size;
44632e8d2280SStefano Zampini       ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr);
44640c7d97c5SJed Brown       ierr = PetscMalloc(ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar),&ins_coarse_mat_vals);CHKERRQ(ierr);
44650c7d97c5SJed Brown       for (j=0;j<ins_local_primal_size;j++) {
44660c7d97c5SJed Brown         ins_local_primal_indices[j]=pcbddc->local_primal_indices[j];
44674fad6a16SStefano Zampini         for (i=0;i<ins_local_primal_size;i++) {
44684fad6a16SStefano Zampini           ins_coarse_mat_vals[j*ins_local_primal_size+i]=coarse_submat_vals[j*ins_local_primal_size+i];
44694fad6a16SStefano Zampini         }
44700c7d97c5SJed Brown       }
44710c7d97c5SJed Brown     }
44720c7d97c5SJed Brown     break;
44730c7d97c5SJed Brown   }
44740c7d97c5SJed Brown 
44750c7d97c5SJed Brown   case (GATHERS_BDDC):
44760c7d97c5SJed Brown   {
44770c7d97c5SJed Brown     PetscMPIInt mysize,mysize2;
4478ef028eecSStefano Zampini     PetscMPIInt *send_buffer;
44790c7d97c5SJed Brown 
44800c7d97c5SJed Brown     if (rank_prec_comm==active_rank) {
44810c7d97c5SJed Brown       ierr = PetscMalloc (pcbddc->replicated_primal_size*sizeof(PetscMPIInt),&pcbddc->replicated_local_primal_indices);CHKERRQ(ierr);
44820bdf917eSStefano Zampini       ierr = PetscMalloc (pcbddc->replicated_primal_size*sizeof(PetscScalar),&pcbddc->replicated_local_primal_values);CHKERRQ(ierr);
44830c7d97c5SJed Brown       ierr = PetscMalloc (size_prec_comm*sizeof(PetscMPIInt),&localsizes2);CHKERRQ(ierr);
44840c7d97c5SJed Brown       ierr = PetscMalloc (size_prec_comm*sizeof(PetscMPIInt),&localdispl2);CHKERRQ(ierr);
44850c7d97c5SJed Brown       /* arrays for values insertion */
4486*2fa5cd67SKarl Rupp       for (i=0;i<size_prec_comm;i++) localsizes2[i]=pcbddc->local_primal_sizes[i]*pcbddc->local_primal_sizes[i];
44870c7d97c5SJed Brown       localdispl2[0]=0;
4488*2fa5cd67SKarl Rupp       for (i=1;i<size_prec_comm;i++) localdispl2[i]=localsizes2[i-1]+localdispl2[i-1];
44890c7d97c5SJed Brown       j = 0;
4490*2fa5cd67SKarl Rupp       for (i=0;i<size_prec_comm;i++) j+=localsizes2[i];
44910c7d97c5SJed Brown       ierr = PetscMalloc (j*sizeof(PetscScalar),&temp_coarse_mat_vals);CHKERRQ(ierr);
44920c7d97c5SJed Brown     }
44930c7d97c5SJed Brown 
44940c7d97c5SJed Brown     mysize =pcbddc->local_primal_size;
44950c7d97c5SJed Brown     mysize2=pcbddc->local_primal_size*pcbddc->local_primal_size;
4496ef028eecSStefano Zampini     ierr   = PetscMalloc(mysize*sizeof(PetscMPIInt),&send_buffer);CHKERRQ(ierr);
4497*2fa5cd67SKarl Rupp     for (i=0; i<mysize; i++) send_buffer[i]=(PetscMPIInt)pcbddc->local_primal_indices[i];
4498*2fa5cd67SKarl Rupp 
44990c7d97c5SJed Brown     if (pcbddc->coarse_problem_type == SEQUENTIAL_BDDC) {
4500ef028eecSStefano Zampini       ierr = MPI_Gatherv(send_buffer,mysize,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
450153cdbc3dSStefano Zampini       ierr = MPI_Gatherv(&coarse_submat_vals[0],mysize2,MPIU_SCALAR,&temp_coarse_mat_vals[0],localsizes2,localdispl2,MPIU_SCALAR,master_proc,prec_comm);CHKERRQ(ierr);
45020c7d97c5SJed Brown     } else {
4503ef028eecSStefano Zampini       ierr = MPI_Allgatherv(send_buffer,mysize,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,prec_comm);CHKERRQ(ierr);
450453cdbc3dSStefano Zampini       ierr = MPI_Allgatherv(&coarse_submat_vals[0],mysize2,MPIU_SCALAR,&temp_coarse_mat_vals[0],localsizes2,localdispl2,MPIU_SCALAR,prec_comm);CHKERRQ(ierr);
45050c7d97c5SJed Brown     }
4506ef028eecSStefano Zampini     ierr = PetscFree(send_buffer);CHKERRQ(ierr);
45070c7d97c5SJed Brown     break;
4508da1bb401SStefano Zampini   }/* switch on coarse problem and communications associated with finished */
45090c7d97c5SJed Brown   }
45100c7d97c5SJed Brown 
45110c7d97c5SJed Brown   /* Now create and fill up coarse matrix */
45120c7d97c5SJed Brown   if (rank_prec_comm == active_rank) {
4513142dfd88SStefano Zampini 
4514142dfd88SStefano Zampini     Mat matis_coarse_local_mat;
4515142dfd88SStefano Zampini 
45160c7d97c5SJed Brown     if (pcbddc->coarse_problem_type != MULTILEVEL_BDDC) {
45170c7d97c5SJed Brown       ierr = MatCreate(coarse_comm,&pcbddc->coarse_mat);CHKERRQ(ierr);
45180c7d97c5SJed Brown       ierr = MatSetSizes(pcbddc->coarse_mat,PETSC_DECIDE,PETSC_DECIDE,pcbddc->coarse_size,pcbddc->coarse_size);CHKERRQ(ierr);
45190c7d97c5SJed Brown       ierr = MatSetType(pcbddc->coarse_mat,coarse_mat_type);CHKERRQ(ierr);
45203b03a366Sstefano_zampini       ierr = MatSetUp(pcbddc->coarse_mat);CHKERRQ(ierr);
4521da1bb401SStefano Zampini       ierr = MatSetOption(pcbddc->coarse_mat,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr); /* local values stored in column major */
45223b03a366Sstefano_zampini       ierr = MatSetOption(pcbddc->coarse_mat,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr);
45230c7d97c5SJed Brown     } else {
45244fad6a16SStefano Zampini       ierr = MatCreateIS(coarse_comm,1,PETSC_DECIDE,PETSC_DECIDE,pcbddc->coarse_size,pcbddc->coarse_size,coarse_ISLG,&pcbddc->coarse_mat);CHKERRQ(ierr);
45253b03a366Sstefano_zampini       ierr = MatSetUp(pcbddc->coarse_mat);CHKERRQ(ierr);
45260c7d97c5SJed Brown       ierr = MatISGetLocalMat(pcbddc->coarse_mat,&matis_coarse_local_mat);CHKERRQ(ierr);
45273b03a366Sstefano_zampini       ierr = MatSetUp(matis_coarse_local_mat);CHKERRQ(ierr);
4528da1bb401SStefano Zampini       ierr = MatSetOption(matis_coarse_local_mat,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr); /* local values stored in column major */
4529a0ba757dSStefano Zampini       ierr = MatSetOption(matis_coarse_local_mat,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr);
45300c7d97c5SJed Brown     }
4531142dfd88SStefano Zampini     /* preallocation */
4532142dfd88SStefano Zampini     if (pcbddc->coarse_problem_type != MULTILEVEL_BDDC) {
4533ef028eecSStefano Zampini 
4534142dfd88SStefano Zampini       PetscInt lrows,lcols;
4535ef028eecSStefano Zampini 
4536142dfd88SStefano Zampini       ierr = MatGetLocalSize(pcbddc->coarse_mat,&lrows,&lcols);CHKERRQ(ierr);
4537142dfd88SStefano Zampini       ierr = MatPreallocateInitialize(coarse_comm,lrows,lcols,dnz,onz);CHKERRQ(ierr);
4538ef028eecSStefano Zampini 
4539142dfd88SStefano Zampini       if (pcbddc->coarse_problem_type == PARALLEL_BDDC) {
4540ef028eecSStefano Zampini 
4541ef028eecSStefano Zampini         Vec         vec_dnz,vec_onz;
4542ef028eecSStefano Zampini         PetscScalar *my_dnz,*my_onz,*array;
4543ef028eecSStefano Zampini         PetscInt    *mat_ranges,*row_ownership;
4544ef028eecSStefano Zampini         PetscInt    coarse_index_row,coarse_index_col,owner;
4545ef028eecSStefano Zampini 
4546ef028eecSStefano Zampini         ierr = VecCreate(prec_comm,&vec_dnz);CHKERRQ(ierr);
4547ef028eecSStefano Zampini         ierr = VecSetSizes(vec_dnz,PETSC_DECIDE,pcbddc->coarse_size);CHKERRQ(ierr);
4548ef028eecSStefano Zampini         ierr = VecSetType(vec_dnz,VECMPI);CHKERRQ(ierr);
4549ef028eecSStefano Zampini         ierr = VecDuplicate(vec_dnz,&vec_onz);CHKERRQ(ierr);
4550ef028eecSStefano Zampini 
4551ef028eecSStefano Zampini         ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscScalar),&my_dnz);CHKERRQ(ierr);
4552ef028eecSStefano Zampini         ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscScalar),&my_onz);CHKERRQ(ierr);
4553ef028eecSStefano Zampini         ierr = PetscMemzero(my_dnz,pcbddc->local_primal_size*sizeof(PetscScalar));CHKERRQ(ierr);
4554ef028eecSStefano Zampini         ierr = PetscMemzero(my_onz,pcbddc->local_primal_size*sizeof(PetscScalar));CHKERRQ(ierr);
4555ef028eecSStefano Zampini 
4556ef028eecSStefano Zampini         ierr = PetscMalloc(pcbddc->coarse_size*sizeof(PetscInt),&row_ownership);CHKERRQ(ierr);
4557ef028eecSStefano Zampini         ierr = MatGetOwnershipRanges(pcbddc->coarse_mat,(const PetscInt**)&mat_ranges);CHKERRQ(ierr);
4558142dfd88SStefano Zampini         for (i=0; i<size_prec_comm; i++) {
4559ef028eecSStefano Zampini           for (j=mat_ranges[i]; j<mat_ranges[i+1]; j++) {
4560ef028eecSStefano Zampini             row_ownership[j]=i;
4561142dfd88SStefano Zampini           }
4562142dfd88SStefano Zampini         }
4563ef028eecSStefano Zampini 
4564ef028eecSStefano Zampini         for (i=0; i<pcbddc->local_primal_size; i++) {
4565ef028eecSStefano Zampini           coarse_index_row = pcbddc->local_primal_indices[i];
4566ef028eecSStefano Zampini           owner = row_ownership[coarse_index_row];
4567ef028eecSStefano Zampini           for (j=i; j<pcbddc->local_primal_size; j++) {
4568ef028eecSStefano Zampini             owner = row_ownership[coarse_index_row];
4569ef028eecSStefano Zampini             coarse_index_col = pcbddc->local_primal_indices[j];
4570ef028eecSStefano Zampini             if (coarse_index_col > mat_ranges[owner]-1 && coarse_index_col < mat_ranges[owner+1]) {
4571ef028eecSStefano Zampini               my_dnz[i] += 1.0;
4572142dfd88SStefano Zampini             } else {
4573ef028eecSStefano Zampini               my_onz[i] += 1.0;
4574142dfd88SStefano Zampini             }
4575ef028eecSStefano Zampini             if (i != j) {
4576ef028eecSStefano Zampini               owner = row_ownership[coarse_index_col];
4577ef028eecSStefano Zampini               if (coarse_index_row > mat_ranges[owner]-1 && coarse_index_row < mat_ranges[owner+1]) {
4578ef028eecSStefano Zampini                 my_dnz[j] += 1.0;
4579142dfd88SStefano Zampini               } else {
4580ef028eecSStefano Zampini                 my_onz[j] += 1.0;
4581142dfd88SStefano Zampini               }
4582142dfd88SStefano Zampini             }
4583142dfd88SStefano Zampini           }
4584142dfd88SStefano Zampini         }
4585ef028eecSStefano Zampini         ierr = VecSet(vec_dnz,0.0);CHKERRQ(ierr);
4586ef028eecSStefano Zampini         ierr = VecSet(vec_onz,0.0);CHKERRQ(ierr);
4587a929c220SStefano Zampini         if (pcbddc->local_primal_size) {
4588ef028eecSStefano Zampini           ierr = VecSetValues(vec_dnz,pcbddc->local_primal_size,pcbddc->local_primal_indices,my_dnz,ADD_VALUES);CHKERRQ(ierr);
4589ef028eecSStefano Zampini           ierr = VecSetValues(vec_onz,pcbddc->local_primal_size,pcbddc->local_primal_indices,my_onz,ADD_VALUES);CHKERRQ(ierr);
4590a929c220SStefano Zampini         }
4591ef028eecSStefano Zampini         ierr = VecAssemblyBegin(vec_dnz);CHKERRQ(ierr);
4592ef028eecSStefano Zampini         ierr = VecAssemblyBegin(vec_onz);CHKERRQ(ierr);
4593ef028eecSStefano Zampini         ierr = VecAssemblyEnd(vec_dnz);CHKERRQ(ierr);
4594ef028eecSStefano Zampini         ierr = VecAssemblyEnd(vec_onz);CHKERRQ(ierr);
4595ef028eecSStefano Zampini         j    = mat_ranges[rank_prec_comm+1]-mat_ranges[rank_prec_comm];
4596ef028eecSStefano Zampini         ierr = VecGetArray(vec_dnz,&array);CHKERRQ(ierr);
4597*2fa5cd67SKarl Rupp         for (i=0; i<j; i++) dnz[i] = (PetscInt)array[i];
4598*2fa5cd67SKarl Rupp 
4599ef028eecSStefano Zampini         ierr = VecRestoreArray(vec_dnz,&array);CHKERRQ(ierr);
4600ef028eecSStefano Zampini         ierr = VecGetArray(vec_onz,&array);CHKERRQ(ierr);
4601*2fa5cd67SKarl Rupp         for (i=0;i<j;i++) onz[i] = (PetscInt)array[i];
4602*2fa5cd67SKarl Rupp 
4603ef028eecSStefano Zampini         ierr = VecRestoreArray(vec_onz,&array);CHKERRQ(ierr);
4604ef028eecSStefano Zampini         ierr = PetscFree(my_dnz);CHKERRQ(ierr);
4605ef028eecSStefano Zampini         ierr = PetscFree(my_onz);CHKERRQ(ierr);
4606ef028eecSStefano Zampini         ierr = PetscFree(row_ownership);CHKERRQ(ierr);
4607ef028eecSStefano Zampini         ierr = VecDestroy(&vec_dnz);CHKERRQ(ierr);
4608ef028eecSStefano Zampini         ierr = VecDestroy(&vec_onz);CHKERRQ(ierr);
4609142dfd88SStefano Zampini       } else {
4610142dfd88SStefano Zampini         for (k=0;k<size_prec_comm;k++) {
4611142dfd88SStefano Zampini           offset=pcbddc->local_primal_displacements[k];
4612142dfd88SStefano Zampini           offset2=localdispl2[k];
4613142dfd88SStefano Zampini           ins_local_primal_size = pcbddc->local_primal_sizes[k];
4614ef028eecSStefano Zampini           ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr);
4615ef028eecSStefano Zampini           for (j=0;j<ins_local_primal_size;j++) {
4616ef028eecSStefano Zampini             ins_local_primal_indices[j]=(PetscInt)pcbddc->replicated_local_primal_indices[offset+j];
4617ef028eecSStefano Zampini           }
4618142dfd88SStefano Zampini           for (j=0;j<ins_local_primal_size;j++) {
4619142dfd88SStefano Zampini             ierr = MatPreallocateSet(ins_local_primal_indices[j],ins_local_primal_size,ins_local_primal_indices,dnz,onz);CHKERRQ(ierr);
4620142dfd88SStefano Zampini           }
4621ef028eecSStefano Zampini           ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr);
4622142dfd88SStefano Zampini         }
4623142dfd88SStefano Zampini       }
4624*2fa5cd67SKarl Rupp 
4625142dfd88SStefano Zampini       /* check */
4626142dfd88SStefano Zampini       for (i=0;i<lrows;i++) {
4627*2fa5cd67SKarl Rupp         if (dnz[i]>lcols) dnz[i]=lcols;
4628*2fa5cd67SKarl Rupp         if (onz[i]>pcbddc->coarse_size-lcols) onz[i]=pcbddc->coarse_size-lcols;
4629142dfd88SStefano Zampini       }
4630142dfd88SStefano Zampini       ierr = MatSeqAIJSetPreallocation(pcbddc->coarse_mat,PETSC_NULL,dnz);CHKERRQ(ierr);
4631142dfd88SStefano Zampini       ierr = MatMPIAIJSetPreallocation(pcbddc->coarse_mat,PETSC_NULL,dnz,PETSC_NULL,onz);CHKERRQ(ierr);
4632142dfd88SStefano Zampini       ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr);
4633142dfd88SStefano Zampini     } else {
4634523858cfSStefano Zampini       ierr = MatSeqAIJSetPreallocation(matis_coarse_local_mat,0,dnz);CHKERRQ(ierr);
4635523858cfSStefano Zampini       ierr = PetscFree(dnz);CHKERRQ(ierr);
4636142dfd88SStefano Zampini     }
4637*2fa5cd67SKarl Rupp 
4638142dfd88SStefano Zampini     /* insert values */
4639523858cfSStefano Zampini     if (pcbddc->coarse_problem_type == PARALLEL_BDDC) {
46400c7d97c5SJed Brown       ierr = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,ADD_VALUES);CHKERRQ(ierr);
4641523858cfSStefano Zampini     } else if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
4642523858cfSStefano Zampini       if (pcbddc->coarsening_ratio == 1) {
4643523858cfSStefano Zampini         ins_coarse_mat_vals = coarse_submat_vals;
4644523858cfSStefano Zampini         ierr                = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,INSERT_VALUES);CHKERRQ(ierr);
4645523858cfSStefano Zampini       } else {
4646523858cfSStefano Zampini         ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr);
4647523858cfSStefano Zampini         for (k=0; k<pcbddc->replicated_primal_size; k++) {
4648523858cfSStefano Zampini           offset                = pcbddc->local_primal_displacements[k];
4649523858cfSStefano Zampini           offset2               = localdispl2[k];
4650523858cfSStefano Zampini           ins_local_primal_size = pcbddc->local_primal_displacements[k+1]-pcbddc->local_primal_displacements[k];
4651ef028eecSStefano Zampini           ierr                  = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr);
4652ef028eecSStefano Zampini           for (j=0; j<ins_local_primal_size; j++) {
4653ef028eecSStefano Zampini             ins_local_primal_indices[j]=(PetscInt)pcbddc->replicated_local_primal_indices[offset+j];
4654ef028eecSStefano Zampini           }
4655523858cfSStefano Zampini           ins_coarse_mat_vals = &temp_coarse_mat_vals[offset2];
4656523858cfSStefano Zampini           ierr                = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,ADD_VALUES);CHKERRQ(ierr);
4657ef028eecSStefano Zampini           ierr                = PetscFree(ins_local_primal_indices);CHKERRQ(ierr);
4658523858cfSStefano Zampini         }
4659523858cfSStefano Zampini       }
4660523858cfSStefano Zampini       ins_local_primal_indices = 0;
4661523858cfSStefano Zampini       ins_coarse_mat_vals      = 0;
4662ea7e1babSStefano Zampini     } else {
4663ea7e1babSStefano Zampini       for (k=0; k<size_prec_comm; k++) {
4664ea7e1babSStefano Zampini         offset                =pcbddc->local_primal_displacements[k];
4665ea7e1babSStefano Zampini         offset2               =localdispl2[k];
4666ea7e1babSStefano Zampini         ins_local_primal_size = pcbddc->local_primal_sizes[k];
4667ef028eecSStefano Zampini         ierr                  = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr);
4668ef028eecSStefano Zampini         for (j=0; j<ins_local_primal_size; j++) {
4669ef028eecSStefano Zampini           ins_local_primal_indices[j]=(PetscInt)pcbddc->replicated_local_primal_indices[offset+j];
4670ef028eecSStefano Zampini         }
4671ea7e1babSStefano Zampini         ins_coarse_mat_vals = &temp_coarse_mat_vals[offset2];
4672ea7e1babSStefano Zampini         ierr                = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,ADD_VALUES);CHKERRQ(ierr);
4673ef028eecSStefano Zampini         ierr                = PetscFree(ins_local_primal_indices);CHKERRQ(ierr);
4674ea7e1babSStefano Zampini       }
4675ea7e1babSStefano Zampini       ins_local_primal_indices = 0;
4676ea7e1babSStefano Zampini       ins_coarse_mat_vals      = 0;
4677ea7e1babSStefano Zampini     }
46780c7d97c5SJed Brown     ierr = MatAssemblyBegin(pcbddc->coarse_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
46790c7d97c5SJed Brown     ierr = MatAssemblyEnd(pcbddc->coarse_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
4680142dfd88SStefano Zampini     /* symmetry of coarse matrix */
4681142dfd88SStefano Zampini     if (issym) {
4682142dfd88SStefano Zampini       ierr = MatSetOption(pcbddc->coarse_mat,MAT_SYMMETRIC,PETSC_TRUE);CHKERRQ(ierr);
4683142dfd88SStefano Zampini     }
46840c7d97c5SJed Brown     ierr = MatGetVecs(pcbddc->coarse_mat,&pcbddc->coarse_vec,&pcbddc->coarse_rhs);CHKERRQ(ierr);
46850bdf917eSStefano Zampini   }
46860bdf917eSStefano Zampini 
46870bdf917eSStefano Zampini   /* create loc to glob scatters if needed */
46880bdf917eSStefano Zampini   if (pcbddc->coarse_communications_type == SCATTERS_BDDC) {
46890bdf917eSStefano Zampini     IS local_IS,global_IS;
46900bdf917eSStefano Zampini     ierr = ISCreateStride(PETSC_COMM_SELF,pcbddc->local_primal_size,0,1,&local_IS);CHKERRQ(ierr);
46910bdf917eSStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_indices,PETSC_COPY_VALUES,&global_IS);CHKERRQ(ierr);
46920bdf917eSStefano Zampini     ierr = VecScatterCreate(pcbddc->vec1_P,local_IS,pcbddc->coarse_vec,global_IS,&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr);
46930bdf917eSStefano Zampini     ierr = ISDestroy(&local_IS);CHKERRQ(ierr);
46940bdf917eSStefano Zampini     ierr = ISDestroy(&global_IS);CHKERRQ(ierr);
46950bdf917eSStefano Zampini   }
46960bdf917eSStefano Zampini 
4697a929c220SStefano Zampini   /* free memory no longer needed */
4698a929c220SStefano Zampini   if (coarse_ISLG)              { ierr = ISLocalToGlobalMappingDestroy(&coarse_ISLG);CHKERRQ(ierr); }
4699a929c220SStefano Zampini   if (ins_local_primal_indices) { ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr); }
4700a929c220SStefano Zampini   if (ins_coarse_mat_vals)      { ierr = PetscFree(ins_coarse_mat_vals);CHKERRQ(ierr); }
4701a929c220SStefano Zampini   if (localsizes2)              { ierr = PetscFree(localsizes2);CHKERRQ(ierr); }
4702a929c220SStefano Zampini   if (localdispl2)              { ierr = PetscFree(localdispl2);CHKERRQ(ierr); }
4703a929c220SStefano Zampini   if (temp_coarse_mat_vals)     { ierr = PetscFree(temp_coarse_mat_vals);CHKERRQ(ierr); }
4704a929c220SStefano Zampini 
47050bdf917eSStefano Zampini   /* Eval coarse null space */
47060bdf917eSStefano Zampini   if (pcbddc->NullSpace) {
47070bdf917eSStefano Zampini     const Vec *nsp_vecs;
47080bdf917eSStefano Zampini     PetscInt  nsp_size,coarse_nsp_size;
47090bdf917eSStefano Zampini     PetscBool nsp_has_cnst;
47100bdf917eSStefano Zampini     PetscReal test_null;
47110bdf917eSStefano Zampini     Vec       *coarse_nsp_vecs;
47120bdf917eSStefano Zampini 
47130bdf917eSStefano Zampini     coarse_nsp_size = 0;
47140bdf917eSStefano Zampini     coarse_nsp_vecs = 0;
47150bdf917eSStefano Zampini     ierr            = MatNullSpaceGetVecs(pcbddc->NullSpace,&nsp_has_cnst,&nsp_size,&nsp_vecs);CHKERRQ(ierr);
47160bdf917eSStefano Zampini     if (rank_prec_comm == active_rank) {
47170bdf917eSStefano Zampini       ierr = PetscMalloc((nsp_size+1)*sizeof(Vec),&coarse_nsp_vecs);CHKERRQ(ierr);
47180bdf917eSStefano Zampini       for (i=0; i<nsp_size+1; i++) {
47190bdf917eSStefano Zampini         ierr = VecDuplicate(pcbddc->coarse_vec,&coarse_nsp_vecs[i]);CHKERRQ(ierr);
47200bdf917eSStefano Zampini       }
47210bdf917eSStefano Zampini     }
47220bdf917eSStefano Zampini     if (nsp_has_cnst) {
47230bdf917eSStefano Zampini       ierr = VecSet(pcis->vec1_N,1.0);CHKERRQ(ierr);
47240bdf917eSStefano Zampini       ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr);
47250bdf917eSStefano Zampini       ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->vec1_P,pcbddc->coarse_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
47260bdf917eSStefano Zampini       ierr = PCBDDCScatterCoarseDataEnd(pc,pcbddc->vec1_P,pcbddc->coarse_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
47270bdf917eSStefano Zampini       if (rank_prec_comm == active_rank) {
47280bdf917eSStefano Zampini         ierr = MatMult(pcbddc->coarse_mat,pcbddc->coarse_vec,pcbddc->coarse_rhs);CHKERRQ(ierr);
47290bdf917eSStefano Zampini         ierr = VecNorm(pcbddc->coarse_rhs,NORM_INFINITY,&test_null);CHKERRQ(ierr);
47300bdf917eSStefano Zampini         if (test_null > 1.0e-12 && pcbddc->dbg_flag) {
47310bdf917eSStefano Zampini           ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Constant coarse null space error % 1.14e\n",test_null);CHKERRQ(ierr);
47320bdf917eSStefano Zampini         }
47330bdf917eSStefano Zampini         ierr = VecCopy(pcbddc->coarse_vec,coarse_nsp_vecs[coarse_nsp_size]);CHKERRQ(ierr);
47340bdf917eSStefano Zampini         coarse_nsp_size++;
47350bdf917eSStefano Zampini       }
47360bdf917eSStefano Zampini     }
47370bdf917eSStefano Zampini     for (i=0; i<nsp_size; i++)  {
47380bdf917eSStefano Zampini       ierr = VecScatterBegin(matis->ctx,nsp_vecs[i],pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
47390bdf917eSStefano Zampini       ierr = VecScatterEnd  (matis->ctx,nsp_vecs[i],pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
47400bdf917eSStefano Zampini       ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr);
47410bdf917eSStefano Zampini       ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->vec1_P,pcbddc->coarse_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
47420bdf917eSStefano Zampini       ierr = PCBDDCScatterCoarseDataEnd(pc,pcbddc->vec1_P,pcbddc->coarse_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
47430bdf917eSStefano Zampini       if (rank_prec_comm == active_rank) {
47440bdf917eSStefano Zampini         ierr = MatMult(pcbddc->coarse_mat,pcbddc->coarse_vec,pcbddc->coarse_rhs);CHKERRQ(ierr);
47450bdf917eSStefano Zampini         ierr = VecNorm(pcbddc->coarse_rhs,NORM_2,&test_null);CHKERRQ(ierr);
47460bdf917eSStefano Zampini         if (test_null > 1.0e-12 && pcbddc->dbg_flag) {
47470bdf917eSStefano Zampini           ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Vec %d coarse null space error % 1.14e\n",i,test_null);CHKERRQ(ierr);
47480bdf917eSStefano Zampini         }
47490bdf917eSStefano Zampini         ierr = VecCopy(pcbddc->coarse_vec,coarse_nsp_vecs[coarse_nsp_size]);CHKERRQ(ierr);
47500bdf917eSStefano Zampini         coarse_nsp_size++;
47510bdf917eSStefano Zampini       }
47520bdf917eSStefano Zampini     }
47530bdf917eSStefano Zampini     if (coarse_nsp_size > 0) {
47540bdf917eSStefano Zampini       /* TODO orthonormalize vecs */
47550bdf917eSStefano Zampini       ierr = VecNormalize(coarse_nsp_vecs[0],PETSC_NULL);CHKERRQ(ierr);
47560bdf917eSStefano Zampini       ierr = MatNullSpaceCreate(coarse_comm,PETSC_FALSE,coarse_nsp_size,coarse_nsp_vecs,&pcbddc->CoarseNullSpace);CHKERRQ(ierr);
47570bdf917eSStefano Zampini       for (i=0; i<nsp_size+1; i++) {
47580bdf917eSStefano Zampini         ierr = VecDestroy(&coarse_nsp_vecs[i]);CHKERRQ(ierr);
47590bdf917eSStefano Zampini       }
47600bdf917eSStefano Zampini     }
47610bdf917eSStefano Zampini     ierr = PetscFree(coarse_nsp_vecs);CHKERRQ(ierr);
47620bdf917eSStefano Zampini   }
47630bdf917eSStefano Zampini 
47640bdf917eSStefano Zampini   /* KSP for coarse problem */
47650bdf917eSStefano Zampini   if (rank_prec_comm == active_rank) {
47662e8d2280SStefano Zampini     PetscBool isbddc=PETSC_FALSE;
47670bdf917eSStefano Zampini 
476853cdbc3dSStefano Zampini     ierr = KSPCreate(coarse_comm,&pcbddc->coarse_ksp);CHKERRQ(ierr);
476953cdbc3dSStefano Zampini     ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->coarse_ksp,(PetscObject)pc,1);CHKERRQ(ierr);
477053cdbc3dSStefano Zampini     ierr = KSPSetOperators(pcbddc->coarse_ksp,pcbddc->coarse_mat,pcbddc->coarse_mat,SAME_PRECONDITIONER);CHKERRQ(ierr);
47713b03a366Sstefano_zampini     ierr = KSPSetTolerances(pcbddc->coarse_ksp,PETSC_DEFAULT,PETSC_DEFAULT,PETSC_DEFAULT,max_it_coarse_ksp);CHKERRQ(ierr);
477253cdbc3dSStefano Zampini     ierr = KSPSetType(pcbddc->coarse_ksp,coarse_ksp_type);CHKERRQ(ierr);
477353cdbc3dSStefano Zampini     ierr = KSPGetPC(pcbddc->coarse_ksp,&pc_temp);CHKERRQ(ierr);
477453cdbc3dSStefano Zampini     ierr = PCSetType(pc_temp,coarse_pc_type);CHKERRQ(ierr);
47750c7d97c5SJed Brown     /* Allow user's customization */
4776da1bb401SStefano Zampini     ierr = KSPSetOptionsPrefix(pcbddc->coarse_ksp,"coarse_");CHKERRQ(ierr);
47770c7d97c5SJed Brown     /* Set Up PC for coarse problem BDDC */
477853cdbc3dSStefano Zampini     if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
47794fad6a16SStefano Zampini       i    = pcbddc->current_level+1;
47804fad6a16SStefano Zampini       ierr = PCBDDCSetLevel(pc_temp,i);CHKERRQ(ierr);
47814fad6a16SStefano Zampini       ierr = PCBDDCSetCoarseningRatio(pc_temp,pcbddc->coarsening_ratio);CHKERRQ(ierr);
47824fad6a16SStefano Zampini       ierr = PCBDDCSetMaxLevels(pc_temp,pcbddc->max_levels);CHKERRQ(ierr);
478353cdbc3dSStefano Zampini       ierr = PCBDDCSetCoarseProblemType(pc_temp,MULTILEVEL_BDDC);CHKERRQ(ierr);
47840bdf917eSStefano Zampini       if (pcbddc->CoarseNullSpace) { ierr = PCBDDCSetNullSpace(pc_temp,pcbddc->CoarseNullSpace);CHKERRQ(ierr); }
47854fad6a16SStefano Zampini       if (dbg_flag) {
47864fad6a16SStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"----------------Level %d: Setting up level %d---------------\n",pcbddc->current_level,i);CHKERRQ(ierr);
47874fad6a16SStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
478853cdbc3dSStefano Zampini       }
47894fad6a16SStefano Zampini     }
47904fad6a16SStefano Zampini     ierr = KSPSetFromOptions(pcbddc->coarse_ksp);CHKERRQ(ierr);
479153cdbc3dSStefano Zampini     ierr = KSPSetUp(pcbddc->coarse_ksp);CHKERRQ(ierr);
4792142dfd88SStefano Zampini 
47932e8d2280SStefano Zampini     ierr = KSPGetTolerances(pcbddc->coarse_ksp,PETSC_NULL,PETSC_NULL,PETSC_NULL,&j);CHKERRQ(ierr);
47942e8d2280SStefano Zampini     ierr = KSPGetPC(pcbddc->coarse_ksp,&pc_temp);CHKERRQ(ierr);
47952e8d2280SStefano Zampini     ierr = PetscObjectTypeCompare((PetscObject)pc_temp,PCBDDC,&isbddc);CHKERRQ(ierr);
47962e8d2280SStefano Zampini     if (j == 1) {
47972e8d2280SStefano Zampini       ierr = KSPSetNormType(pcbddc->coarse_ksp,KSP_NORM_NONE);CHKERRQ(ierr);
47982e8d2280SStefano Zampini       if (isbddc) {
47992e8d2280SStefano Zampini         ierr = PCBDDCSetUseExactDirichlet(pc_temp,PETSC_FALSE);CHKERRQ(ierr);
48005619798eSStefano Zampini       }
48015619798eSStefano Zampini     }
48020c7d97c5SJed Brown   }
4803a929c220SStefano Zampini   /* Check coarse problem if requested */
4804142dfd88SStefano Zampini   if (dbg_flag && rank_prec_comm == active_rank) {
4805142dfd88SStefano Zampini     KSP       check_ksp;
4806142dfd88SStefano Zampini     PC        check_pc;
4807142dfd88SStefano Zampini     Vec       check_vec;
4808142dfd88SStefano Zampini     PetscReal abs_infty_error,infty_error,lambda_min,lambda_max;
480919fd82e9SBarry Smith     KSPType   check_ksp_type;
48100c7d97c5SJed Brown 
4811142dfd88SStefano Zampini     /* Create ksp object suitable for extreme eigenvalues' estimation */
4812142dfd88SStefano Zampini     ierr = KSPCreate(coarse_comm,&check_ksp);CHKERRQ(ierr);
4813142dfd88SStefano Zampini     ierr = KSPSetOperators(check_ksp,pcbddc->coarse_mat,pcbddc->coarse_mat,SAME_PRECONDITIONER);CHKERRQ(ierr);
48140bdf917eSStefano Zampini     ierr = KSPSetTolerances(check_ksp,1.e-12,1.e-12,PETSC_DEFAULT,pcbddc->coarse_size);CHKERRQ(ierr);
4815142dfd88SStefano Zampini     if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
4816*2fa5cd67SKarl Rupp       if (issym) check_ksp_type = KSPCG;
4817*2fa5cd67SKarl Rupp       else check_ksp_type = KSPGMRES;
4818142dfd88SStefano Zampini       ierr = KSPSetComputeSingularValues(check_ksp,PETSC_TRUE);CHKERRQ(ierr);
4819142dfd88SStefano Zampini     } else {
4820142dfd88SStefano Zampini       check_ksp_type = KSPPREONLY;
4821142dfd88SStefano Zampini     }
4822142dfd88SStefano Zampini     ierr = KSPSetType(check_ksp,check_ksp_type);CHKERRQ(ierr);
4823142dfd88SStefano Zampini     ierr = KSPGetPC(pcbddc->coarse_ksp,&check_pc);CHKERRQ(ierr);
4824142dfd88SStefano Zampini     ierr = KSPSetPC(check_ksp,check_pc);CHKERRQ(ierr);
4825142dfd88SStefano Zampini     ierr = KSPSetUp(check_ksp);CHKERRQ(ierr);
4826142dfd88SStefano Zampini     /* create random vec */
4827142dfd88SStefano Zampini     ierr = VecDuplicate(pcbddc->coarse_vec,&check_vec);CHKERRQ(ierr);
4828142dfd88SStefano Zampini     ierr = VecSetRandom(check_vec,PETSC_NULL);CHKERRQ(ierr);
48290bdf917eSStefano Zampini     if (pcbddc->CoarseNullSpace) { ierr = MatNullSpaceRemove(pcbddc->CoarseNullSpace,check_vec,PETSC_NULL);CHKERRQ(ierr); }
4830142dfd88SStefano Zampini     ierr = MatMult(pcbddc->coarse_mat,check_vec,pcbddc->coarse_rhs);CHKERRQ(ierr);
4831142dfd88SStefano Zampini     /* solve coarse problem */
4832142dfd88SStefano Zampini     ierr = KSPSolve(check_ksp,pcbddc->coarse_rhs,pcbddc->coarse_vec);CHKERRQ(ierr);
48330bdf917eSStefano Zampini     if (pcbddc->CoarseNullSpace) { ierr = MatNullSpaceRemove(pcbddc->CoarseNullSpace,pcbddc->coarse_vec,PETSC_NULL);CHKERRQ(ierr); }
4834142dfd88SStefano Zampini     /* check coarse problem residual error */
4835142dfd88SStefano Zampini     ierr = VecAXPY(check_vec,-1.0,pcbddc->coarse_vec);CHKERRQ(ierr);
4836142dfd88SStefano Zampini     ierr = VecNorm(check_vec,NORM_INFINITY,&infty_error);CHKERRQ(ierr);
4837142dfd88SStefano Zampini     ierr = MatMult(pcbddc->coarse_mat,check_vec,pcbddc->coarse_rhs);CHKERRQ(ierr);
4838142dfd88SStefano Zampini     ierr = VecNorm(pcbddc->coarse_rhs,NORM_INFINITY,&abs_infty_error);CHKERRQ(ierr);
4839142dfd88SStefano Zampini     ierr = VecDestroy(&check_vec);CHKERRQ(ierr);
4840142dfd88SStefano Zampini     /* get eigenvalue estimation if inexact */
4841142dfd88SStefano Zampini     if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
4842142dfd88SStefano Zampini       ierr = KSPComputeExtremeSingularValues(check_ksp,&lambda_max,&lambda_min);CHKERRQ(ierr);
4843142dfd88SStefano Zampini       ierr = KSPGetIterationNumber(check_ksp,&k);CHKERRQ(ierr);
4844142dfd88SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem eigenvalues estimated with %d iterations of %s.\n",k,check_ksp_type);CHKERRQ(ierr);
4845e269702eSStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem eigenvalues: % 1.14e %1.14e\n",lambda_min,lambda_max);CHKERRQ(ierr);
48463b03a366Sstefano_zampini     }
4847142dfd88SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem exact infty_error   : %1.14e\n",infty_error);CHKERRQ(ierr);
4848142dfd88SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem residual infty_error: %1.14e\n",abs_infty_error);CHKERRQ(ierr);
4849142dfd88SStefano Zampini     ierr = KSPDestroy(&check_ksp);CHKERRQ(ierr);
485053cdbc3dSStefano Zampini   }
4851142dfd88SStefano Zampini   if (dbg_flag) { ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); }
48520c7d97c5SJed Brown   PetscFunctionReturn(0);
48530c7d97c5SJed Brown }
48540c7d97c5SJed Brown 
48550c7d97c5SJed Brown #undef __FUNCT__
48560c7d97c5SJed Brown #define __FUNCT__ "PCBDDCManageLocalBoundaries"
485753cdbc3dSStefano Zampini static PetscErrorCode PCBDDCManageLocalBoundaries(PC pc)
48580c7d97c5SJed Brown {
48590c7d97c5SJed Brown   PC_BDDC        *pcbddc  = (PC_BDDC*)pc->data;
48600c7d97c5SJed Brown   PC_IS          *pcis    = (PC_IS*)pc->data;
48610c7d97c5SJed Brown   Mat_IS         *matis   = (Mat_IS*)pc->pmat->data;
4862da1bb401SStefano Zampini   PCBDDCGraph    mat_graph=pcbddc->mat_graph;
48637cf533a6SStefano Zampini   PetscInt       *is_indices,*auxis;
48643b03a366Sstefano_zampini   PetscInt       bs,ierr,i,j,s,k,iindex,neumann_bsize,dirichlet_bsize;
4865da1bb401SStefano Zampini   PetscInt       total_counts,nodes_touched,where_values=1,vertex_size;
4866534831adSStefano Zampini   PetscMPIInt    adapt_interface=0,adapt_interface_reduced=0,NEUMANNCNT=0;
4867da1bb401SStefano Zampini   PetscBool      same_set;
4868a0ba757dSStefano Zampini   MPI_Comm       interface_comm=((PetscObject)pc)->comm;
48693b03a366Sstefano_zampini   PetscBool      use_faces     =PETSC_FALSE,use_edges=PETSC_FALSE;
48703b03a366Sstefano_zampini   const PetscInt *neumann_nodes;
48713b03a366Sstefano_zampini   const PetscInt *dirichlet_nodes;
4872a81d60d8SStefano Zampini   IS             used_IS,*custom_ISForDofs;
4873da1bb401SStefano Zampini   PetscScalar    *array;
4874da1bb401SStefano Zampini   PetscScalar    *array2;
4875da1bb401SStefano Zampini   PetscViewer    viewer=pcbddc->dbg_viewer;
4876a929c220SStefano Zampini   PetscInt       *queue_in_global_numbering;
48770c7d97c5SJed Brown 
48780c7d97c5SJed Brown   PetscFunctionBegin;
4879da1bb401SStefano Zampini   /* Setup local adjacency graph */
4880da1bb401SStefano Zampini   mat_graph->nvtxs=pcis->n;
4881*2fa5cd67SKarl Rupp   if (!mat_graph->xadj) NEUMANNCNT = 1;
4882da1bb401SStefano Zampini   ierr = PCBDDCSetupLocalAdjacencyGraph(pc);CHKERRQ(ierr);
4883*2fa5cd67SKarl Rupp 
4884a0ba757dSStefano Zampini   i    = mat_graph->nvtxs;
4885a0ba757dSStefano Zampini   ierr = PetscMalloc4(i,PetscInt,&mat_graph->where,i,PetscInt,&mat_graph->count,i+1,PetscInt,&mat_graph->cptr,i,PetscInt,&mat_graph->queue);CHKERRQ(ierr);
48863972b0daSStefano Zampini   ierr = PetscMalloc2(i,PetscInt,&mat_graph->which_dof,i,PetscBool,&mat_graph->touched);CHKERRQ(ierr);
4887a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->where,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
4888a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->count,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
4889a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->which_dof,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
4890a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->queue,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
48913828260eSStefano Zampini   ierr = PetscMemzero(mat_graph->cptr,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr);
4892a0ba757dSStefano Zampini 
4893a81d60d8SStefano Zampini   /* Setting dofs splitting in mat_graph->which_dof
4894a81d60d8SStefano Zampini      Get information about dofs' splitting if provided by the user
4895a81d60d8SStefano Zampini      Otherwise it assumes a constant block size */
4896a81d60d8SStefano Zampini   vertex_size=0;
4897a81d60d8SStefano Zampini   if (!pcbddc->n_ISForDofs) {
4898a81d60d8SStefano Zampini     ierr = MatGetBlockSize(matis->A,&bs);CHKERRQ(ierr);
4899a81d60d8SStefano Zampini     ierr = PetscMalloc(bs*sizeof(IS),&custom_ISForDofs);CHKERRQ(ierr);
4900a81d60d8SStefano Zampini     for (i=0; i<bs; i++) {
4901a81d60d8SStefano Zampini       ierr = ISCreateStride(PETSC_COMM_SELF,pcis->n/bs,i,bs,&custom_ISForDofs[i]);CHKERRQ(ierr);
4902a81d60d8SStefano Zampini     }
4903a81d60d8SStefano Zampini     ierr = PCBDDCSetDofsSplitting(pc,bs,custom_ISForDofs);CHKERRQ(ierr);
4904a81d60d8SStefano Zampini     vertex_size=1;
4905a81d60d8SStefano Zampini     /* remove my references to IS objects */
4906a81d60d8SStefano Zampini     for (i=0; i<bs; i++) {
4907a81d60d8SStefano Zampini       ierr = ISDestroy(&custom_ISForDofs[i]);CHKERRQ(ierr);
4908a81d60d8SStefano Zampini     }
4909a81d60d8SStefano Zampini     ierr = PetscFree(custom_ISForDofs);CHKERRQ(ierr);
4910a81d60d8SStefano Zampini   }
49119c0446d6SStefano Zampini   for (i=0; i<pcbddc->n_ISForDofs; i++) {
4912a81d60d8SStefano Zampini     ierr = ISGetSize(pcbddc->ISForDofs[i],&k);CHKERRQ(ierr);
49139c0446d6SStefano Zampini     ierr = ISGetIndices(pcbddc->ISForDofs[i],(const PetscInt**)&is_indices);CHKERRQ(ierr);
4914*2fa5cd67SKarl Rupp     for (j=0; j<k; j++) mat_graph->which_dof[is_indices[j]]=i;
49159c0446d6SStefano Zampini     ierr = ISRestoreIndices(pcbddc->ISForDofs[i],(const PetscInt**)&is_indices);CHKERRQ(ierr);
49169c0446d6SStefano Zampini   }
4917a81d60d8SStefano Zampini   /* use mat block size as vertex size if it has not yet set */
4918a81d60d8SStefano Zampini   if (!vertex_size) {
49193b03a366Sstefano_zampini     ierr = MatGetBlockSize(matis->A,&vertex_size);CHKERRQ(ierr);
49200c7d97c5SJed Brown   }
4921a81d60d8SStefano Zampini 
49223b03a366Sstefano_zampini   /* count number of neigh per node */
49230c7d97c5SJed Brown   total_counts=0;
49243b03a366Sstefano_zampini   for (i=1; i<pcis->n_neigh; i++) {
49250c7d97c5SJed Brown     s             = pcis->n_shared[i];
49260c7d97c5SJed Brown     total_counts += s;
4927*2fa5cd67SKarl Rupp     for (j=0;j<s;j++) mat_graph->count[pcis->shared[i][j]] += 1;
49280c7d97c5SJed Brown   }
4929*2fa5cd67SKarl Rupp 
4930534831adSStefano Zampini   /* Take into account Neumann data -> it increments number of sharing subdomains for nodes lying on the interface */
493136e030ebSStefano Zampini   ierr = PCBDDCGetNeumannBoundaries(pc,&used_IS);CHKERRQ(ierr);
4932da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
4933da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
493436e030ebSStefano Zampini   if (used_IS) {
493536e030ebSStefano Zampini     ierr = ISGetSize(used_IS,&neumann_bsize);CHKERRQ(ierr);
493636e030ebSStefano Zampini     ierr = ISGetIndices(used_IS,&neumann_nodes);CHKERRQ(ierr);
493753cdbc3dSStefano Zampini     for (i=0; i<neumann_bsize; i++) {
493853cdbc3dSStefano Zampini       iindex = neumann_nodes[i];
4939534831adSStefano Zampini       if (mat_graph->count[iindex] > NEUMANNCNT && array[iindex]==0.0) {
494053cdbc3dSStefano Zampini         mat_graph->count[iindex]+=1;
49410c7d97c5SJed Brown         total_counts++;
4942da1bb401SStefano Zampini         array[iindex]=array[iindex]+1.0;
4943f23aa3ddSBarry Smith       } else if (array[iindex]>0.0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"Error for neumann nodes provided to BDDC! They must be uniquely listed! Found duplicate node %d\n",iindex);
49440c7d97c5SJed Brown     }
49450c7d97c5SJed Brown   }
4946da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4947da1bb401SStefano Zampini   /* allocate space for storing the set of neighbours for each node */
4948da1bb401SStefano Zampini   ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt*),&mat_graph->neighbours_set);CHKERRQ(ierr);
4949da1bb401SStefano Zampini   if (mat_graph->nvtxs) { ierr = PetscMalloc(total_counts*sizeof(PetscInt),&mat_graph->neighbours_set[0]);CHKERRQ(ierr); }
4950da1bb401SStefano Zampini   for (i=1; i<mat_graph->nvtxs; i++) mat_graph->neighbours_set[i]=mat_graph->neighbours_set[i-1]+mat_graph->count[i-1];
4951a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->count,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
49523b03a366Sstefano_zampini   for (i=1; i<pcis->n_neigh; i++) {
49530c7d97c5SJed Brown     s=pcis->n_shared[i];
49540c7d97c5SJed Brown     for (j=0; j<s; j++) {
49550c7d97c5SJed Brown       k=pcis->shared[i][j];
4956*2fa5cd67SKarl Rupp 
4957da1bb401SStefano Zampini       mat_graph->neighbours_set[k][mat_graph->count[k]] = pcis->neigh[i];
4958*2fa5cd67SKarl Rupp 
49590c7d97c5SJed Brown       mat_graph->count[k]+=1;
49600c7d97c5SJed Brown     }
49610c7d97c5SJed Brown   }
4962da1bb401SStefano Zampini   /* Check consistency of Neumann nodes */
4963da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
4964da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4965da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4966da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4967da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4968da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
49693b03a366Sstefano_zampini   /* set -1 fake neighbour to mimic Neumann boundary */
497036e030ebSStefano Zampini   if (used_IS) {
497153cdbc3dSStefano Zampini     for (i=0; i<neumann_bsize; i++) {
497253cdbc3dSStefano Zampini       iindex = neumann_nodes[i];
4973534831adSStefano Zampini       if (mat_graph->count[iindex] > NEUMANNCNT) {
4974*2fa5cd67SKarl Rupp         if (mat_graph->count[iindex]+1 != (PetscInt)array[iindex]) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_USER,"Neumann nodes provided to BDDC must be consistent among neighbours!\nNode %d: number of sharing subdomains %d != number of subdomains for which it is a neumann node %d\n",iindex,mat_graph->count[iindex]+1,(PetscInt)array[iindex]);
4975da1bb401SStefano Zampini         mat_graph->neighbours_set[iindex][mat_graph->count[iindex]] = -1;
4976*2fa5cd67SKarl Rupp 
497753cdbc3dSStefano Zampini         mat_graph->count[iindex]+=1;
49780c7d97c5SJed Brown       }
49790c7d97c5SJed Brown     }
498036e030ebSStefano Zampini     ierr = ISRestoreIndices(used_IS,&neumann_nodes);CHKERRQ(ierr);
49810c7d97c5SJed Brown   }
4982da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4983da1bb401SStefano Zampini   /* sort set of sharing subdomains */
4984*2fa5cd67SKarl Rupp   for (i=0;i<mat_graph->nvtxs;i++) {
4985*2fa5cd67SKarl Rupp     ierr = PetscSortInt(mat_graph->count[i],mat_graph->neighbours_set[i]);CHKERRQ(ierr);
4986*2fa5cd67SKarl Rupp   }
4987*2fa5cd67SKarl Rupp 
49883b03a366Sstefano_zampini   /* remove interior nodes and dirichlet boundary nodes from the next search into the graph */
4989*2fa5cd67SKarl Rupp   for (i=0;i<mat_graph->nvtxs;i++) mat_graph->touched[i]=PETSC_FALSE;
4990da1bb401SStefano Zampini   nodes_touched=0;
4991*2fa5cd67SKarl Rupp 
499236e030ebSStefano Zampini   ierr = PCBDDCGetDirichletBoundaries(pc,&used_IS);CHKERRQ(ierr);
4993da1bb401SStefano Zampini   ierr = VecSet(pcis->vec2_N,0.0);CHKERRQ(ierr);
4994da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4995da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
4996da1bb401SStefano Zampini   if (used_IS) {
4997da1bb401SStefano Zampini     ierr = ISGetSize(used_IS,&dirichlet_bsize);CHKERRQ(ierr);
4998f23aa3ddSBarry Smith     if (dirichlet_bsize && matis->pure_neumann) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"Dirichlet boundaries are intended to be used with matrices with zeroed rows!\n");
4999da1bb401SStefano Zampini     ierr = ISGetIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
5000da1bb401SStefano Zampini     for (i=0; i<dirichlet_bsize; i++) {
5001da1bb401SStefano Zampini       iindex = dirichlet_nodes[i];
5002da1bb401SStefano Zampini       if (mat_graph->count[iindex] && !mat_graph->touched[iindex]) {
5003f23aa3ddSBarry Smith         if (array[iindex]>0.0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"BDDC cannot have nodes which are marked as Neumann and Dirichlet at the same time! Wrong node %d\n",iindex);
5004da1bb401SStefano Zampini         mat_graph->touched[iindex] = PETSC_TRUE;
5005da1bb401SStefano Zampini         mat_graph->where[iindex]   = 0;
5006da1bb401SStefano Zampini         nodes_touched++;
5007da1bb401SStefano Zampini         array2[iindex] = array2[iindex]+1.0;
5008da1bb401SStefano Zampini       }
5009da1bb401SStefano Zampini     }
5010da1bb401SStefano Zampini     ierr = ISRestoreIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
5011da1bb401SStefano Zampini   }
5012da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
5013da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
5014*2fa5cd67SKarl Rupp 
5015da1bb401SStefano Zampini   /* Check consistency of Dirichlet nodes */
5016da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_N,1.0);CHKERRQ(ierr);
5017da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
5018da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
5019da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
5020da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5021da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5022da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
5023da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec2_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
5024da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec2_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
5025da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5026da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5027da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
5028da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
502936e030ebSStefano Zampini   if (used_IS) {
503036e030ebSStefano Zampini     ierr = ISGetSize(used_IS,&dirichlet_bsize);CHKERRQ(ierr);
503136e030ebSStefano Zampini     ierr = ISGetIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
50323b03a366Sstefano_zampini     for (i=0; i<dirichlet_bsize; i++) {
5033da1bb401SStefano Zampini       iindex=dirichlet_nodes[i];
5034*2fa5cd67SKarl Rupp       if (array[iindex]>1.0 && array[iindex]!=array2[iindex]) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_USER,"Dirichlet nodes provided to BDDC must be consistent among neighbours!\nNode %d: number of sharing subdomains %d != number of subdomains for which it is a neumann node %d\n",iindex,(PetscInt)array[iindex],(PetscInt)array2[iindex]);
50353b03a366Sstefano_zampini     }
503636e030ebSStefano Zampini     ierr = ISRestoreIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
50373b03a366Sstefano_zampini   }
5038da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
5039da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
5040da1bb401SStefano Zampini 
50410c7d97c5SJed Brown   for (i=0; i<mat_graph->nvtxs; i++) {
50423b03a366Sstefano_zampini     if (!mat_graph->count[i]) {  /* interior nodes */
50430c7d97c5SJed Brown       mat_graph->touched[i] = PETSC_TRUE;
50440c7d97c5SJed Brown       mat_graph->where[i]   = 0;
50450c7d97c5SJed Brown       nodes_touched++;
50460c7d97c5SJed Brown     }
50470c7d97c5SJed Brown   }
50480c7d97c5SJed Brown   mat_graph->ncmps = 0;
5049*2fa5cd67SKarl Rupp 
5050da1bb401SStefano Zampini   i=0;
50510c7d97c5SJed Brown   while (nodes_touched<mat_graph->nvtxs) {
5052a0ba757dSStefano Zampini     /*  find first untouched node in local ordering */
50530c7d97c5SJed Brown     while (mat_graph->touched[i]) i++;
50540c7d97c5SJed Brown     mat_graph->touched[i]=PETSC_TRUE;
5055a0ba757dSStefano Zampini     mat_graph->where[i]  =where_values;
50560c7d97c5SJed Brown     nodes_touched++;
5057a0ba757dSStefano Zampini     /* now find all other nodes having the same set of sharing subdomains */
50580c7d97c5SJed Brown     for (j=i+1; j<mat_graph->nvtxs; j++) {
5059a0ba757dSStefano Zampini       /* check for same number of sharing subdomains and dof number */
5060da1bb401SStefano Zampini       if (!mat_graph->touched[j] && mat_graph->count[i]==mat_graph->count[j] && mat_graph->which_dof[i] == mat_graph->which_dof[j]) {
5061a0ba757dSStefano Zampini         /* check for same set of sharing subdomains */
50620c7d97c5SJed Brown         same_set=PETSC_TRUE;
50630c7d97c5SJed Brown         for (k=0; k<mat_graph->count[j]; k++) {
5064da1bb401SStefano Zampini           if (mat_graph->neighbours_set[i][k] != mat_graph->neighbours_set[j][k]) {
50650c7d97c5SJed Brown             same_set=PETSC_FALSE;
50660c7d97c5SJed Brown           }
50670c7d97c5SJed Brown         }
5068a0ba757dSStefano Zampini         /* I found a friend of mine */
50690c7d97c5SJed Brown         if (same_set) {
5070a0ba757dSStefano Zampini           mat_graph->where[j]   = where_values;
50710c7d97c5SJed Brown           mat_graph->touched[j] = PETSC_TRUE;
50720c7d97c5SJed Brown           nodes_touched++;
50730c7d97c5SJed Brown         }
50740c7d97c5SJed Brown       }
50750c7d97c5SJed Brown     }
5076a0ba757dSStefano Zampini     where_values++;
50770c7d97c5SJed Brown   }
5078a0ba757dSStefano Zampini   where_values--; if (where_values<0) where_values=0;
5079a0ba757dSStefano Zampini   ierr = PetscMalloc(where_values*sizeof(PetscMPIInt),&mat_graph->where_ncmps);CHKERRQ(ierr);
5080a0ba757dSStefano Zampini   /* Find connected components defined on the shared interface */
5081a0ba757dSStefano Zampini   if (where_values) {
5082*2fa5cd67SKarl Rupp     ierr = PCBDDCFindConnectedComponents(mat_graph, where_values);CHKERRQ(ierr);
5083a0ba757dSStefano Zampini   }
5084a929c220SStefano Zampini   ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt),&queue_in_global_numbering);CHKERRQ(ierr);
5085a0ba757dSStefano Zampini   /* check consistency of connected components among neighbouring subdomains -> adapt them in case it is needed */
5086a0ba757dSStefano Zampini   for (i=0;i<where_values;i++) {
50877cf533a6SStefano Zampini     /* We are not sure that on a given subset of the local interface,
50887cf533a6SStefano Zampini        two connected components will be the same among sharing subdomains */
50893b03a366Sstefano_zampini     if (mat_graph->where_ncmps[i]>1) {
5090a0ba757dSStefano Zampini       adapt_interface=1;
5091a0ba757dSStefano Zampini       break;
5092a0ba757dSStefano Zampini     }
5093a0ba757dSStefano Zampini   }
5094*2fa5cd67SKarl Rupp 
5095a0ba757dSStefano Zampini   ierr = MPI_Allreduce(&adapt_interface,&adapt_interface_reduced,1,MPIU_INT,MPI_LOR,interface_comm);CHKERRQ(ierr);
5096da1bb401SStefano Zampini   if (pcbddc->dbg_flag && adapt_interface_reduced) {
5097d8923723SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"Adapting interface\n");CHKERRQ(ierr);
5098da1bb401SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
5099da1bb401SStefano Zampini   }
5100a0ba757dSStefano Zampini   if (where_values && adapt_interface_reduced) {
5101a0ba757dSStefano Zampini     PetscInt    sum_requests=0,my_rank;
5102a0ba757dSStefano Zampini     PetscInt    buffer_size,start_of_recv,size_of_recv,start_of_send;
5103a0ba757dSStefano Zampini     PetscInt    temp_buffer_size,ins_val,global_where_counter;
5104a0ba757dSStefano Zampini     PetscInt    *cum_recv_counts;
5105a0ba757dSStefano Zampini     PetscInt    *where_to_nodes_indices;
5106a0ba757dSStefano Zampini     PetscInt    *petsc_buffer;
5107a0ba757dSStefano Zampini     PetscMPIInt *recv_buffer;
5108a0ba757dSStefano Zampini     PetscMPIInt *recv_buffer_where;
5109a0ba757dSStefano Zampini     PetscMPIInt *send_buffer;
5110a0ba757dSStefano Zampini     PetscMPIInt size_of_send;
5111a0ba757dSStefano Zampini     PetscInt    *sizes_of_sends;
5112a0ba757dSStefano Zampini     MPI_Request *send_requests;
5113a0ba757dSStefano Zampini     MPI_Request *recv_requests;
5114a0ba757dSStefano Zampini     PetscInt    *where_cc_adapt;
5115a0ba757dSStefano Zampini     PetscInt    **temp_buffer;
5116a0ba757dSStefano Zampini     PetscInt    *nodes_to_temp_buffer_indices;
5117a0ba757dSStefano Zampini     PetscInt    *add_to_where;
51187cf533a6SStefano Zampini     PetscInt    *aux_new_xadj,*new_xadj,*new_adjncy;
5119a0ba757dSStefano Zampini 
51207cf533a6SStefano Zampini     /* Restrict adjacency graph using information from connected components */
51217cf533a6SStefano Zampini     ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt),&aux_new_xadj);CHKERRQ(ierr);
5122*2fa5cd67SKarl Rupp     for (i=0; i<mat_graph->nvtxs; i++) aux_new_xadj[i]=1;
51237cf533a6SStefano Zampini     for (i=0;i<mat_graph->ncmps;i++) {
51247cf533a6SStefano Zampini       k = mat_graph->cptr[i+1]-mat_graph->cptr[i];
5125*2fa5cd67SKarl Rupp       for (j=0;j<k;j++) aux_new_xadj[mat_graph->queue[mat_graph->cptr[i]+j]]=k;
51267cf533a6SStefano Zampini     }
51277cf533a6SStefano Zampini     j = 0;
5128*2fa5cd67SKarl Rupp     for (i=0;i<mat_graph->nvtxs;i++) j += aux_new_xadj[i];
5129*2fa5cd67SKarl Rupp 
51307cf533a6SStefano Zampini     ierr = PetscMalloc((mat_graph->nvtxs+1)*sizeof(PetscInt),&new_xadj);CHKERRQ(ierr);
51317cf533a6SStefano Zampini     ierr = PetscMalloc(j*sizeof(PetscInt),&new_adjncy);CHKERRQ(ierr);
51327cf533a6SStefano Zampini     new_xadj[0]=0;
51337cf533a6SStefano Zampini     for (i=0;i<mat_graph->nvtxs;i++) {
51347cf533a6SStefano Zampini       new_xadj[i+1]=new_xadj[i]+aux_new_xadj[i];
5135*2fa5cd67SKarl Rupp       if (aux_new_xadj[i]==1) new_adjncy[new_xadj[i]]=i;
51367cf533a6SStefano Zampini     }
5137354b9337SStefano Zampini     ierr = PetscFree(aux_new_xadj);CHKERRQ(ierr);
51387cf533a6SStefano Zampini     for (i=0; i<mat_graph->ncmps; i++) {
51397cf533a6SStefano Zampini       k = mat_graph->cptr[i+1]-mat_graph->cptr[i];
51407cf533a6SStefano Zampini       for (j=0; j<k; j++) {
51417cf533a6SStefano Zampini         ierr = PetscMemcpy(&new_adjncy[new_xadj[mat_graph->queue[mat_graph->cptr[i]+j]]],&mat_graph->queue[mat_graph->cptr[i]],k*sizeof(PetscInt));CHKERRQ(ierr);
51427cf533a6SStefano Zampini       }
51437cf533a6SStefano Zampini     }
51447cf533a6SStefano Zampini     ierr = PCBDDCSetLocalAdjacencyGraph(pc,mat_graph->nvtxs,new_xadj,new_adjncy,PETSC_OWN_POINTER);CHKERRQ(ierr);
51457cf533a6SStefano Zampini     /* For consistency among neighbouring procs, I need to sort (by global ordering) each connected component */
51467cf533a6SStefano Zampini     for (i=0; i<mat_graph->ncmps; i++) {
51477cf533a6SStefano Zampini       k    = mat_graph->cptr[i+1]-mat_graph->cptr[i];
51487cf533a6SStefano Zampini       ierr = ISLocalToGlobalMappingApply(matis->mapping,k,&mat_graph->queue[mat_graph->cptr[i]],&queue_in_global_numbering[mat_graph->cptr[i]]);CHKERRQ(ierr);
51497cf533a6SStefano Zampini       ierr = PetscSortIntWithArray(k,&queue_in_global_numbering[mat_graph->cptr[i]],&mat_graph->queue[mat_graph->cptr[i]]);CHKERRQ(ierr);
51507cf533a6SStefano Zampini     }
51517cf533a6SStefano Zampini     /* allocate some space */
5152a0ba757dSStefano Zampini     ierr = MPI_Comm_rank(interface_comm,&my_rank);CHKERRQ(ierr);
5153a0ba757dSStefano Zampini     ierr = PetscMalloc((where_values+1)*sizeof(PetscInt),&cum_recv_counts);CHKERRQ(ierr);
5154a0ba757dSStefano Zampini     ierr = PetscMemzero(cum_recv_counts,(where_values+1)*sizeof(PetscInt));CHKERRQ(ierr);
5155a0ba757dSStefano Zampini     ierr = PetscMalloc(where_values*sizeof(PetscInt),&where_to_nodes_indices);CHKERRQ(ierr);
5156a0ba757dSStefano Zampini     /* first count how many neighbours per connected component I will receive from */
5157a0ba757dSStefano Zampini     cum_recv_counts[0]=0;
5158a0ba757dSStefano Zampini     for (i=1; i<where_values+1; i++) {
5159a0ba757dSStefano Zampini       j=0;
5160*2fa5cd67SKarl Rupp       while (mat_graph->where[j] != i) j++;
5161a0ba757dSStefano Zampini       where_to_nodes_indices[i-1]=j;
5162*2fa5cd67SKarl Rupp       if (mat_graph->neighbours_set[j][0]!=-1) cum_recv_counts[i]=cum_recv_counts[i-1]+mat_graph->count[j]; /* We don't want sends/recvs_to/from_self -> here I don't count myself  */
5163*2fa5cd67SKarl Rupp       else cum_recv_counts[i]=cum_recv_counts[i-1]+mat_graph->count[j]-1;
5164a0ba757dSStefano Zampini     }
5165a0ba757dSStefano Zampini     ierr = PetscMalloc(2*cum_recv_counts[where_values]*sizeof(PetscMPIInt),&recv_buffer_where);CHKERRQ(ierr);
5166a0ba757dSStefano Zampini     ierr = PetscMalloc(cum_recv_counts[where_values]*sizeof(MPI_Request),&send_requests);CHKERRQ(ierr);
5167a0ba757dSStefano Zampini     ierr = PetscMalloc(cum_recv_counts[where_values]*sizeof(MPI_Request),&recv_requests);CHKERRQ(ierr);
5168a0ba757dSStefano Zampini     for (i=0; i<cum_recv_counts[where_values]; i++) {
5169a0ba757dSStefano Zampini       send_requests[i]=MPI_REQUEST_NULL;
5170a0ba757dSStefano Zampini       recv_requests[i]=MPI_REQUEST_NULL;
5171a0ba757dSStefano Zampini     }
5172a0ba757dSStefano Zampini     /* exchange with my neighbours the number of my connected components on the shared interface */
5173a0ba757dSStefano Zampini     for (i=0; i<where_values; i++) {
5174a0ba757dSStefano Zampini       j = where_to_nodes_indices[i];
5175da1bb401SStefano Zampini       k = (mat_graph->neighbours_set[j][0] == -1 ?  1 : 0);
5176a0ba757dSStefano Zampini       for (; k<mat_graph->count[j]; k++) {
5177da1bb401SStefano Zampini         ierr = MPI_Isend(&mat_graph->where_ncmps[i],1,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr);
5178da1bb401SStefano Zampini         ierr = MPI_Irecv(&recv_buffer_where[sum_requests],1,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr);
5179a0ba757dSStefano Zampini         sum_requests++;
5180a0ba757dSStefano Zampini       }
5181a0ba757dSStefano Zampini     }
5182a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
5183a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
5184a0ba757dSStefano Zampini     /* determine the connected component I need to adapt */
5185a0ba757dSStefano Zampini     ierr = PetscMalloc(where_values*sizeof(PetscInt),&where_cc_adapt);CHKERRQ(ierr);
5186a0ba757dSStefano Zampini     ierr = PetscMemzero(where_cc_adapt,where_values*sizeof(PetscInt));CHKERRQ(ierr);
5187a0ba757dSStefano Zampini     for (i=0; i<where_values; i++) {
5188a0ba757dSStefano Zampini       for (j=cum_recv_counts[i]; j<cum_recv_counts[i+1]; j++) {
51893b03a366Sstefano_zampini         /* The first condition is natural (i.e someone has a different number of cc than me), the second one is just to be safe */
51903b03a366Sstefano_zampini         if (mat_graph->where_ncmps[i]!=recv_buffer_where[j] || mat_graph->where_ncmps[i] > 1) {
5191a0ba757dSStefano Zampini           where_cc_adapt[i]=PETSC_TRUE;
5192a0ba757dSStefano Zampini           break;
5193a0ba757dSStefano Zampini         }
5194a0ba757dSStefano Zampini       }
5195a0ba757dSStefano Zampini     }
5196d8923723SStefano Zampini     buffer_size = 0;
5197d8923723SStefano Zampini     for (i=0; i<where_values; i++) {
5198d8923723SStefano Zampini       if (where_cc_adapt[i]) {
5199d8923723SStefano Zampini         for (j=i; j<mat_graph->ncmps; j++) {
5200d8923723SStefano Zampini           if (mat_graph->where[mat_graph->queue[mat_graph->cptr[j]]] == i+1) { /* WARNING -> where values goes from 1 to where_values included */
5201d8923723SStefano Zampini             buffer_size += 1 + mat_graph->cptr[j+1]-mat_graph->cptr[j];
5202d8923723SStefano Zampini           }
5203d8923723SStefano Zampini         }
5204d8923723SStefano Zampini       }
5205d8923723SStefano Zampini     }
5206d8923723SStefano Zampini     ierr = PetscMalloc(buffer_size*sizeof(PetscMPIInt),&send_buffer);CHKERRQ(ierr);
5207a0ba757dSStefano Zampini     /* now get from neighbours their ccs (in global numbering) and adapt them (in case it is needed) */
5208a0ba757dSStefano Zampini     /* first determine how much data to send (size of each queue plus the global indices) and communicate it to neighbours */
5209a0ba757dSStefano Zampini     ierr = PetscMalloc(where_values*sizeof(PetscInt),&sizes_of_sends);CHKERRQ(ierr);
5210a0ba757dSStefano Zampini     ierr = PetscMemzero(sizes_of_sends,where_values*sizeof(PetscInt));CHKERRQ(ierr);
5211*2fa5cd67SKarl Rupp 
5212a0ba757dSStefano Zampini     sum_requests  = 0;
5213a0ba757dSStefano Zampini     start_of_send = 0;
5214a0ba757dSStefano Zampini     start_of_recv = cum_recv_counts[where_values];
5215a0ba757dSStefano Zampini     for (i=0; i<where_values; i++) {
5216a0ba757dSStefano Zampini       if (where_cc_adapt[i]) {
5217a0ba757dSStefano Zampini         size_of_send=0;
5218a0ba757dSStefano Zampini         for (j=i; j<mat_graph->ncmps; j++) {
5219a0ba757dSStefano Zampini           if (mat_graph->where[mat_graph->queue[mat_graph->cptr[j]]] == i+1) { /* WARNING -> where values goes from 1 to where_values included */
5220a0ba757dSStefano Zampini             send_buffer[start_of_send+size_of_send]=mat_graph->cptr[j+1]-mat_graph->cptr[j];
5221a0ba757dSStefano Zampini             size_of_send += 1;
5222a0ba757dSStefano Zampini             for (k=0; k<mat_graph->cptr[j+1]-mat_graph->cptr[j]; k++) {
5223a0ba757dSStefano Zampini               send_buffer[start_of_send+size_of_send+k]=queue_in_global_numbering[mat_graph->cptr[j]+k];
5224a0ba757dSStefano Zampini             }
5225a0ba757dSStefano Zampini             size_of_send=size_of_send+mat_graph->cptr[j+1]-mat_graph->cptr[j];
5226a0ba757dSStefano Zampini           }
5227a0ba757dSStefano Zampini         }
5228a0ba757dSStefano Zampini         j = where_to_nodes_indices[i];
5229da1bb401SStefano Zampini         k = (mat_graph->neighbours_set[j][0] == -1 ?  1 : 0);
523011d8f4c2SStefano Zampini         sizes_of_sends[i]=size_of_send;
5231a0ba757dSStefano Zampini         for (; k<mat_graph->count[j]; k++) {
523211d8f4c2SStefano Zampini           ierr = MPI_Isend(&sizes_of_sends[i],1,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr);
5233da1bb401SStefano Zampini           ierr = MPI_Irecv(&recv_buffer_where[sum_requests+start_of_recv],1,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr);
5234a0ba757dSStefano Zampini           sum_requests++;
5235a0ba757dSStefano Zampini         }
5236a0ba757dSStefano Zampini         start_of_send+=size_of_send;
5237a0ba757dSStefano Zampini       }
5238a0ba757dSStefano Zampini     }
5239a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
5240a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
5241*2fa5cd67SKarl Rupp 
5242a0ba757dSStefano Zampini     buffer_size=0;
5243*2fa5cd67SKarl Rupp 
5244*2fa5cd67SKarl Rupp     for (k=0;k<sum_requests;k++) buffer_size += recv_buffer_where[start_of_recv+k];
5245a0ba757dSStefano Zampini     ierr = PetscMalloc(buffer_size*sizeof(PetscMPIInt),&recv_buffer);CHKERRQ(ierr);
5246a0ba757dSStefano Zampini     /* now exchange the data */
5247a0ba757dSStefano Zampini     start_of_recv = 0;
5248a0ba757dSStefano Zampini     start_of_send = 0;
5249a0ba757dSStefano Zampini     sum_requests  = 0;
5250a0ba757dSStefano Zampini     for (i=0; i<where_values; i++) {
5251a0ba757dSStefano Zampini       if (where_cc_adapt[i]) {
5252a0ba757dSStefano Zampini         size_of_send = sizes_of_sends[i];
5253*2fa5cd67SKarl Rupp 
5254a0ba757dSStefano Zampini         j = where_to_nodes_indices[i];
5255da1bb401SStefano Zampini         k = (mat_graph->neighbours_set[j][0] == -1 ?  1 : 0);
5256a0ba757dSStefano Zampini         for (; k<mat_graph->count[j]; k++) {
5257da1bb401SStefano Zampini           ierr          = MPI_Isend(&send_buffer[start_of_send],size_of_send,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr);
5258a0ba757dSStefano Zampini           size_of_recv  = recv_buffer_where[cum_recv_counts[where_values]+sum_requests];
5259da1bb401SStefano Zampini           ierr          = MPI_Irecv(&recv_buffer[start_of_recv],size_of_recv,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr);
5260a0ba757dSStefano Zampini           start_of_recv+=size_of_recv;
5261a0ba757dSStefano Zampini           sum_requests++;
5262a0ba757dSStefano Zampini         }
5263a0ba757dSStefano Zampini         start_of_send+=size_of_send;
5264a0ba757dSStefano Zampini       }
5265a0ba757dSStefano Zampini     }
5266a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
5267a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
5268a0ba757dSStefano Zampini     ierr = PetscMalloc(buffer_size*sizeof(PetscInt),&petsc_buffer);CHKERRQ(ierr);
5269*2fa5cd67SKarl Rupp     for (k=0;k<start_of_recv;k++) petsc_buffer[k]=(PetscInt)recv_buffer[k];
5270a0ba757dSStefano Zampini     for (j=0;j<buffer_size;) {
5271a0ba757dSStefano Zampini       ierr = ISGlobalToLocalMappingApply(matis->mapping,IS_GTOLM_MASK,petsc_buffer[j],&petsc_buffer[j+1],&petsc_buffer[j],&petsc_buffer[j+1]);CHKERRQ(ierr);
5272a0ba757dSStefano Zampini       k    = petsc_buffer[j]+1;
5273a0ba757dSStefano Zampini       j   += k;
5274a0ba757dSStefano Zampini     }
5275a0ba757dSStefano Zampini     sum_requests  = cum_recv_counts[where_values];
5276a0ba757dSStefano Zampini     start_of_recv = 0;
5277*2fa5cd67SKarl Rupp 
5278a0ba757dSStefano Zampini     ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt),&nodes_to_temp_buffer_indices);CHKERRQ(ierr);
5279a0ba757dSStefano Zampini     global_where_counter=0;
5280a0ba757dSStefano Zampini     for (i=0; i<where_values; i++) {
5281a0ba757dSStefano Zampini       if (where_cc_adapt[i]) {
5282a0ba757dSStefano Zampini         temp_buffer_size=0;
5283a0ba757dSStefano Zampini         /* find nodes on the shared interface we need to adapt */
5284a0ba757dSStefano Zampini         for (j=0; j<mat_graph->nvtxs; j++) {
5285a0ba757dSStefano Zampini           if (mat_graph->where[j]==i+1) {
5286a0ba757dSStefano Zampini             nodes_to_temp_buffer_indices[j]=temp_buffer_size;
5287a0ba757dSStefano Zampini             temp_buffer_size++;
5288a0ba757dSStefano Zampini           } else {
5289a0ba757dSStefano Zampini             nodes_to_temp_buffer_indices[j]=-1;
5290a0ba757dSStefano Zampini           }
5291a0ba757dSStefano Zampini         }
5292*2fa5cd67SKarl Rupp 
5293a0ba757dSStefano Zampini         /* allocate some temporary space */
5294a0ba757dSStefano Zampini         ierr = PetscMalloc(temp_buffer_size*sizeof(PetscInt*),&temp_buffer);CHKERRQ(ierr);
5295a0ba757dSStefano Zampini         ierr = PetscMalloc(temp_buffer_size*(cum_recv_counts[i+1]-cum_recv_counts[i])*sizeof(PetscInt),&temp_buffer[0]);CHKERRQ(ierr);
5296a0ba757dSStefano Zampini         ierr = PetscMemzero(temp_buffer[0],temp_buffer_size*(cum_recv_counts[i+1]-cum_recv_counts[i])*sizeof(PetscInt));CHKERRQ(ierr);
5297a0ba757dSStefano Zampini         for (j=1; j<temp_buffer_size; j++) {
5298a0ba757dSStefano Zampini           temp_buffer[j]=temp_buffer[j-1]+cum_recv_counts[i+1]-cum_recv_counts[i];
5299a0ba757dSStefano Zampini         }
5300a0ba757dSStefano Zampini         /* analyze contributions from neighbouring subdomains for i-th conn comp
5301a0ba757dSStefano Zampini            temp buffer structure:
5302a0ba757dSStefano Zampini            supposing part of the interface has dimension 5 (global nodes 0,1,2,3,4)
5303a0ba757dSStefano Zampini            3 neighs procs with structured connected components:
5304a0ba757dSStefano Zampini              neigh 0: [0 1 4], [2 3];  (2 connected components)
5305a0ba757dSStefano Zampini              neigh 1: [0 1], [2 3 4];  (2 connected components)
5306a0ba757dSStefano Zampini              neigh 2: [0 4], [1], [2 3]; (3 connected components)
5307a0ba757dSStefano Zampini            tempbuffer (row-oriented) should be filled as:
5308a0ba757dSStefano Zampini              [ 0, 0, 0;
5309a0ba757dSStefano Zampini                0, 0, 1;
5310a0ba757dSStefano Zampini                1, 1, 2;
5311a0ba757dSStefano Zampini                1, 1, 2;
5312a0ba757dSStefano Zampini                0, 1, 0; ];
5313a0ba757dSStefano Zampini            This way we can simply recover the resulting structure, accounting for possible intersections of ccs among neighs.
5314a0ba757dSStefano Zampini            The mat_graph->where array will be modified to reproduce the following 4 connected components [0], [1], [2 3], [4];
5315a0ba757dSStefano Zampini                                                                                                                                    */
5316a0ba757dSStefano Zampini         for (j=0;j<cum_recv_counts[i+1]-cum_recv_counts[i];j++) {
5317a0ba757dSStefano Zampini           ins_val=0;
5318a0ba757dSStefano Zampini           size_of_recv=recv_buffer_where[sum_requests];  /* total size of recv from neighs */
5319a0ba757dSStefano Zampini           for (buffer_size=0;buffer_size<size_of_recv;) {  /* loop until all data from neighs has been taken into account */
5320a0ba757dSStefano Zampini             for (k=1;k<petsc_buffer[buffer_size+start_of_recv]+1;k++) { /* filling properly temp_buffer using data from a single recv */
5321a0ba757dSStefano Zampini               temp_buffer[nodes_to_temp_buffer_indices[petsc_buffer[start_of_recv+buffer_size+k]]][j] = ins_val;
5322a0ba757dSStefano Zampini             }
5323a0ba757dSStefano Zampini             buffer_size+=k;
5324a0ba757dSStefano Zampini             ins_val++;
5325a0ba757dSStefano Zampini           }
5326a0ba757dSStefano Zampini           start_of_recv+=size_of_recv;
5327a0ba757dSStefano Zampini           sum_requests++;
5328a0ba757dSStefano Zampini         }
5329a0ba757dSStefano Zampini         ierr = PetscMalloc(temp_buffer_size*sizeof(PetscInt),&add_to_where);CHKERRQ(ierr);
5330a0ba757dSStefano Zampini         ierr = PetscMemzero(add_to_where,temp_buffer_size*sizeof(PetscInt));CHKERRQ(ierr);
5331a0ba757dSStefano Zampini         for (j=0; j<temp_buffer_size; j++) {
5332a0ba757dSStefano Zampini           if (!add_to_where[j]) { /* found a new cc  */
5333a0ba757dSStefano Zampini             global_where_counter++;
5334a0ba757dSStefano Zampini             add_to_where[j]=global_where_counter;
5335a0ba757dSStefano Zampini             for (k=j+1; k<temp_buffer_size; k++) { /* check for other nodes in new cc */
5336a0ba757dSStefano Zampini               same_set=PETSC_TRUE;
5337a0ba757dSStefano Zampini               for (s=0; s<cum_recv_counts[i+1]-cum_recv_counts[i]; s++) {
5338a0ba757dSStefano Zampini                 if (temp_buffer[j][s]!=temp_buffer[k][s]) {
5339a0ba757dSStefano Zampini                   same_set=PETSC_FALSE;
5340a0ba757dSStefano Zampini                   break;
5341a0ba757dSStefano Zampini                 }
5342a0ba757dSStefano Zampini               }
5343*2fa5cd67SKarl Rupp               if (same_set) add_to_where[k] = global_where_counter;
5344a0ba757dSStefano Zampini             }
5345a0ba757dSStefano Zampini           }
5346a0ba757dSStefano Zampini         }
5347a0ba757dSStefano Zampini         /* insert new data in where array */
5348a0ba757dSStefano Zampini         temp_buffer_size=0;
5349a0ba757dSStefano Zampini         for (j=0;j<mat_graph->nvtxs;j++) {
5350a0ba757dSStefano Zampini           if (mat_graph->where[j]==i+1) {
5351a0ba757dSStefano Zampini             mat_graph->where[j]=where_values+add_to_where[temp_buffer_size];
5352a0ba757dSStefano Zampini             temp_buffer_size++;
5353a0ba757dSStefano Zampini           }
5354a0ba757dSStefano Zampini         }
5355a0ba757dSStefano Zampini         ierr = PetscFree(temp_buffer[0]);CHKERRQ(ierr);
5356a0ba757dSStefano Zampini         ierr = PetscFree(temp_buffer);CHKERRQ(ierr);
5357a0ba757dSStefano Zampini         ierr = PetscFree(add_to_where);CHKERRQ(ierr);
5358a0ba757dSStefano Zampini       }
5359a0ba757dSStefano Zampini     }
5360a0ba757dSStefano Zampini     ierr = PetscFree(nodes_to_temp_buffer_indices);CHKERRQ(ierr);
5361a0ba757dSStefano Zampini     ierr = PetscFree(sizes_of_sends);CHKERRQ(ierr);
5362a0ba757dSStefano Zampini     ierr = PetscFree(send_requests);CHKERRQ(ierr);
5363a0ba757dSStefano Zampini     ierr = PetscFree(recv_requests);CHKERRQ(ierr);
5364a0ba757dSStefano Zampini     ierr = PetscFree(petsc_buffer);CHKERRQ(ierr);
5365a0ba757dSStefano Zampini     ierr = PetscFree(recv_buffer);CHKERRQ(ierr);
5366a0ba757dSStefano Zampini     ierr = PetscFree(recv_buffer_where);CHKERRQ(ierr);
5367a0ba757dSStefano Zampini     ierr = PetscFree(send_buffer);CHKERRQ(ierr);
5368a0ba757dSStefano Zampini     ierr = PetscFree(cum_recv_counts);CHKERRQ(ierr);
5369a0ba757dSStefano Zampini     ierr = PetscFree(where_to_nodes_indices);CHKERRQ(ierr);
537023d4d1a5SStefano Zampini     ierr = PetscFree(where_cc_adapt);CHKERRQ(ierr);
5371*2fa5cd67SKarl Rupp 
5372a0ba757dSStefano Zampini     /* We are ready to evaluate consistent connected components on each part of the shared interface */
5373a0ba757dSStefano Zampini     if (global_where_counter) {
5374*2fa5cd67SKarl Rupp       for (i=0;i<mat_graph->nvtxs;i++) mat_graph->touched[i]=PETSC_FALSE;
5375a0ba757dSStefano Zampini       global_where_counter=0;
5376a0ba757dSStefano Zampini       for (i=0;i<mat_graph->nvtxs;i++) {
5377a0ba757dSStefano Zampini         if (mat_graph->where[i] && !mat_graph->touched[i]) {
5378a0ba757dSStefano Zampini           global_where_counter++;
5379a0ba757dSStefano Zampini           for (j=i+1;j<mat_graph->nvtxs;j++) {
5380a0ba757dSStefano Zampini             if (!mat_graph->touched[j] && mat_graph->where[j]==mat_graph->where[i]) {
5381a0ba757dSStefano Zampini               mat_graph->where[j]   = global_where_counter;
5382a0ba757dSStefano Zampini               mat_graph->touched[j] = PETSC_TRUE;
5383a0ba757dSStefano Zampini             }
5384a0ba757dSStefano Zampini           }
5385a0ba757dSStefano Zampini           mat_graph->where[i]   = global_where_counter;
5386a0ba757dSStefano Zampini           mat_graph->touched[i] = PETSC_TRUE;
5387a0ba757dSStefano Zampini         }
5388a0ba757dSStefano Zampini       }
5389a0ba757dSStefano Zampini       where_values=global_where_counter;
5390a0ba757dSStefano Zampini     }
5391a0ba757dSStefano Zampini     if (global_where_counter) {
5392a0ba757dSStefano Zampini       ierr = PetscMemzero(mat_graph->cptr,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr);
5393a0ba757dSStefano Zampini       ierr = PetscMemzero(mat_graph->queue,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
5394a0ba757dSStefano Zampini       ierr = PetscFree(mat_graph->where_ncmps);CHKERRQ(ierr);
5395a0ba757dSStefano Zampini       ierr = PetscMalloc(where_values*sizeof(PetscMPIInt),&mat_graph->where_ncmps);CHKERRQ(ierr);
5396a0ba757dSStefano Zampini       ierr = PCBDDCFindConnectedComponents(mat_graph, where_values);
5397a0ba757dSStefano Zampini     }
53983b03a366Sstefano_zampini   } /* Finished adapting interface */
5399*2fa5cd67SKarl Rupp 
5400a929c220SStefano Zampini   /* For consistency among neighbouring procs, I need to sort (by global ordering) each connected component */
5401a929c220SStefano Zampini   for (i=0; i<mat_graph->ncmps; i++) {
5402a929c220SStefano Zampini     k    = mat_graph->cptr[i+1]-mat_graph->cptr[i];
5403a929c220SStefano Zampini     ierr = ISLocalToGlobalMappingApply(matis->mapping,k,&mat_graph->queue[mat_graph->cptr[i]],&queue_in_global_numbering[mat_graph->cptr[i]]);CHKERRQ(ierr);
5404a929c220SStefano Zampini     ierr = PetscSortIntWithArray(k,&queue_in_global_numbering[mat_graph->cptr[i]],&mat_graph->queue[mat_graph->cptr[i]]);CHKERRQ(ierr);
5405a929c220SStefano Zampini   }
5406a929c220SStefano Zampini 
54070c7d97c5SJed Brown   PetscInt  nfc         = 0;
54080c7d97c5SJed Brown   PetscInt  nec         = 0;
54090c7d97c5SJed Brown   PetscInt  nvc         = 0;
54103b03a366Sstefano_zampini   PetscBool twodim_flag = PETSC_FALSE;
54110c7d97c5SJed Brown   for (i=0; i<mat_graph->ncmps; i++) {
54123b03a366Sstefano_zampini     if (mat_graph->cptr[i+1]-mat_graph->cptr[i] > vertex_size) {
5413*2fa5cd67SKarl Rupp       if (mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]==1) nfc++; /* 1 neigh Neumann fake included */
5414*2fa5cd67SKarl Rupp       else nec++; /* note that nec will be zero in 2d */
54150c7d97c5SJed Brown     } else {
54163b03a366Sstefano_zampini       nvc+=mat_graph->cptr[i+1]-mat_graph->cptr[i];
54173b03a366Sstefano_zampini     }
54183b03a366Sstefano_zampini   }
54193b03a366Sstefano_zampini   if (!nec) { /* we are in a 2d case -> no faces, only edges */
54203b03a366Sstefano_zampini     nec         = nfc;
54213b03a366Sstefano_zampini     nfc         = 0;
54223b03a366Sstefano_zampini     twodim_flag = PETSC_TRUE;
54233b03a366Sstefano_zampini   }
54243972b0daSStefano Zampini   /* allocate IS arrays for faces, edges. Vertices need a single index set. */
54253972b0daSStefano Zampini   k=0;
54263972b0daSStefano Zampini   for (i=0; i<mat_graph->ncmps; i++) {
54273972b0daSStefano Zampini     j=mat_graph->cptr[i+1]-mat_graph->cptr[i];
5428*2fa5cd67SKarl Rupp     if (j > k) k=j;
5429*2fa5cd67SKarl Rupp 
5430*2fa5cd67SKarl Rupp     if (j<=vertex_size) k+=vertex_size;
54313972b0daSStefano Zampini   }
54323972b0daSStefano Zampini   ierr = PetscMalloc(k*sizeof(PetscInt),&auxis);CHKERRQ(ierr);
54333b03a366Sstefano_zampini   if (!pcbddc->vertices_flag && !pcbddc->edges_flag) {
54343b03a366Sstefano_zampini     ierr      = PetscMalloc(nfc*sizeof(IS),&pcbddc->ISForFaces);CHKERRQ(ierr);
54353b03a366Sstefano_zampini     use_faces = PETSC_TRUE;
54363b03a366Sstefano_zampini   }
54373b03a366Sstefano_zampini   if (!pcbddc->vertices_flag && !pcbddc->faces_flag) {
54383b03a366Sstefano_zampini     ierr      = PetscMalloc(nec*sizeof(IS),&pcbddc->ISForEdges);CHKERRQ(ierr);
54393b03a366Sstefano_zampini     use_edges = PETSC_TRUE;
54403b03a366Sstefano_zampini   }
54413b03a366Sstefano_zampini   nfc=0;
54423b03a366Sstefano_zampini   nec=0;
54433b03a366Sstefano_zampini   for (i=0; i<mat_graph->ncmps; i++) {
54443b03a366Sstefano_zampini     if (mat_graph->cptr[i+1]-mat_graph->cptr[i] > vertex_size) {
54453b03a366Sstefano_zampini       for (j=0; j<mat_graph->cptr[i+1]-mat_graph->cptr[i]; j++) {
54463972b0daSStefano Zampini         auxis[j]=mat_graph->queue[mat_graph->cptr[i]+j];
54473b03a366Sstefano_zampini       }
54483b03a366Sstefano_zampini       if (mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]==1) {
54493b03a366Sstefano_zampini         if (twodim_flag) {
54503b03a366Sstefano_zampini           if (use_edges) {
54513972b0daSStefano Zampini             ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForEdges[nec]);CHKERRQ(ierr);
54523b03a366Sstefano_zampini             nec++;
54533b03a366Sstefano_zampini           }
54543b03a366Sstefano_zampini         } else {
54553b03a366Sstefano_zampini           if (use_faces) {
54563972b0daSStefano Zampini             ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForFaces[nfc]);CHKERRQ(ierr);
54573b03a366Sstefano_zampini             nfc++;
54583b03a366Sstefano_zampini           }
54593b03a366Sstefano_zampini         }
54603b03a366Sstefano_zampini       } else {
54613b03a366Sstefano_zampini         if (use_edges) {
54623972b0daSStefano Zampini           ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForEdges[nec]);CHKERRQ(ierr);
54630c7d97c5SJed Brown           nec++;
54640c7d97c5SJed Brown         }
54650c7d97c5SJed Brown       }
54660c7d97c5SJed Brown     }
54673b03a366Sstefano_zampini   }
54683b03a366Sstefano_zampini   pcbddc->n_ISForFaces = nfc;
54693b03a366Sstefano_zampini   pcbddc->n_ISForEdges = nec;
5470*2fa5cd67SKarl Rupp 
54713b03a366Sstefano_zampini   nvc = 0;
54720c7d97c5SJed Brown   if (!pcbddc->constraints_flag) {
54733b03a366Sstefano_zampini     for (i=0; i<mat_graph->ncmps; i++) {
54743b03a366Sstefano_zampini       if (mat_graph->cptr[i+1]-mat_graph->cptr[i] <= vertex_size) {
54753b03a366Sstefano_zampini         for (j = mat_graph->cptr[i]; j<mat_graph->cptr[i+1]; j++) {
54763972b0daSStefano Zampini           auxis[nvc]=mat_graph->queue[j];
54770c7d97c5SJed Brown           nvc++;
54780c7d97c5SJed Brown         }
54790c7d97c5SJed Brown       }
54800c7d97c5SJed Brown     }
54810c7d97c5SJed Brown   }
5482*2fa5cd67SKarl Rupp 
5483a0ba757dSStefano Zampini   /* sort vertex set (by local ordering) */
54843972b0daSStefano Zampini   ierr = PetscSortInt(nvc,auxis);CHKERRQ(ierr);
54853972b0daSStefano Zampini   ierr = ISCreateGeneral(PETSC_COMM_SELF,nvc,auxis,PETSC_COPY_VALUES,&pcbddc->ISForVertices);CHKERRQ(ierr);
5486e269702eSStefano Zampini   if (pcbddc->dbg_flag) {
5487d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr);
5488d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Details from PCBDDCManageLocalBoundaries for subdomain %04d\n",PetscGlobalRank);CHKERRQ(ierr);
5489d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Matrix graph has %d connected components", mat_graph->ncmps);CHKERRQ(ierr);
54900c7d97c5SJed Brown     for (i=0; i<mat_graph->ncmps; i++) {
54913b03a366Sstefano_zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\nDetails for connected component number %02d: size %04d, count %01d. Nodes follow.\n",
54923b03a366Sstefano_zampini                                                 i,mat_graph->cptr[i+1]-mat_graph->cptr[i],mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]);CHKERRQ(ierr);
5493da1bb401SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"subdomains: ");
5494da1bb401SStefano Zampini       for (j=0; j<mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]; j++) {
5495*2fa5cd67SKarl Rupp         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d ",mat_graph->neighbours_set[mat_graph->queue[mat_graph->cptr[i]]][j]);CHKERRQ(ierr);
5496da1bb401SStefano Zampini       }
5497da1bb401SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n");
54980c7d97c5SJed Brown       for (j=mat_graph->cptr[i]; j<mat_graph->cptr[i+1]; j++) {
5499a929c220SStefano Zampini         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d (%d), ",mat_graph->queue[j],queue_in_global_numbering[j]);CHKERRQ(ierr);
55000c7d97c5SJed Brown       }
55010c7d97c5SJed Brown     }
5502da1bb401SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n--------------------------------------------------------------\n");CHKERRQ(ierr);
55033b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local vertices\n",PetscGlobalRank,nvc);CHKERRQ(ierr);
55043b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local faces\n",PetscGlobalRank,nfc);CHKERRQ(ierr);
55053b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local edges\n",PetscGlobalRank,nec);CHKERRQ(ierr);
5506d49ef151SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
55070c7d97c5SJed Brown   }
55083972b0daSStefano Zampini   ierr = PetscFree(auxis);CHKERRQ(ierr);
5509a929c220SStefano Zampini   ierr = PetscFree(queue_in_global_numbering);CHKERRQ(ierr);
55100c7d97c5SJed Brown   PetscFunctionReturn(0);
55110c7d97c5SJed Brown }
55120c7d97c5SJed Brown 
55130c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
55140c7d97c5SJed Brown 
55150c7d97c5SJed Brown /* The following code has been adapted from function IsConnectedSubdomain contained
5516da1bb401SStefano Zampini    in source file contig.c of METIS library (version 5.0.1)
5517da1bb401SStefano Zampini    It finds connected components of each partition labeled from 1 to n_dist  */
55180c7d97c5SJed Brown 
55190c7d97c5SJed Brown #undef __FUNCT__
55200c7d97c5SJed Brown #define __FUNCT__ "PCBDDCFindConnectedComponents"
55219c0446d6SStefano Zampini static PetscErrorCode PCBDDCFindConnectedComponents(PCBDDCGraph graph, PetscInt n_dist)
55220c7d97c5SJed Brown {
55230c7d97c5SJed Brown   PetscInt  i, j, k, nvtxs, first, last, nleft, ncmps,pid,cum_queue,n,ncmps_pid;
55240c7d97c5SJed Brown   PetscInt  *xadj, *adjncy, *where, *queue;
55250c7d97c5SJed Brown   PetscInt  *cptr;
55260c7d97c5SJed Brown   PetscBool *touched;
55270c7d97c5SJed Brown 
55280c7d97c5SJed Brown   PetscFunctionBegin;
55290c7d97c5SJed Brown   nvtxs   = graph->nvtxs;
55300c7d97c5SJed Brown   xadj    = graph->xadj;
55310c7d97c5SJed Brown   adjncy  = graph->adjncy;
55320c7d97c5SJed Brown   where   = graph->where;
55330c7d97c5SJed Brown   touched = graph->touched;
55340c7d97c5SJed Brown   queue   = graph->queue;
55350c7d97c5SJed Brown   cptr    = graph->cptr;
55360c7d97c5SJed Brown 
5537*2fa5cd67SKarl Rupp   for (i=0; i<nvtxs; i++) touched[i] = PETSC_FALSE;
55380c7d97c5SJed Brown 
55390c7d97c5SJed Brown   cum_queue = 0;
55400c7d97c5SJed Brown   ncmps     = 0;
55410c7d97c5SJed Brown 
55420c7d97c5SJed Brown   for (n=0; n<n_dist; n++) {
5543da1bb401SStefano Zampini     pid   = n+1; /* partition labeled by 0 is discarded */
55440c7d97c5SJed Brown     nleft = 0;
55450c7d97c5SJed Brown     for (i=0; i<nvtxs; i++) {
5546*2fa5cd67SKarl Rupp       if (where[i] == pid) nleft++;
55470c7d97c5SJed Brown     }
55480c7d97c5SJed Brown     for (i=0; i<nvtxs; i++) {
5549*2fa5cd67SKarl Rupp       if (where[i] == pid) break;
55500c7d97c5SJed Brown     }
55510c7d97c5SJed Brown     touched[i]       = PETSC_TRUE;
55520c7d97c5SJed Brown     queue[cum_queue] = i;
55530c7d97c5SJed Brown     first = 0; last = 1;
5554*2fa5cd67SKarl Rupp 
55550c7d97c5SJed Brown     cptr[ncmps] = cum_queue;  /* This actually points to queue */
55560c7d97c5SJed Brown     ncmps_pid   = 0;
5557*2fa5cd67SKarl Rupp 
55580c7d97c5SJed Brown     while (first != nleft) {
55590c7d97c5SJed Brown       if (first == last) { /* Find another starting vertex */
55600c7d97c5SJed Brown         cptr[++ncmps] = first+cum_queue;
55610c7d97c5SJed Brown         ncmps_pid++;
55620c7d97c5SJed Brown         for (i=0; i<nvtxs; i++) {
5563*2fa5cd67SKarl Rupp           if (where[i] == pid && !touched[i]) break;
55640c7d97c5SJed Brown         }
55650c7d97c5SJed Brown         queue[cum_queue+last] = i;
55660c7d97c5SJed Brown         last++;
55670c7d97c5SJed Brown         touched[i] = PETSC_TRUE;
55680c7d97c5SJed Brown       }
55690c7d97c5SJed Brown       i = queue[cum_queue+first];
55700c7d97c5SJed Brown       first++;
55710c7d97c5SJed Brown       for (j=xadj[i]; j<xadj[i+1]; j++) {
55720c7d97c5SJed Brown         k = adjncy[j];
55730c7d97c5SJed Brown         if (where[k] == pid && !touched[k]) {
55740c7d97c5SJed Brown           queue[cum_queue+last] = k;
55750c7d97c5SJed Brown           last++;
55760c7d97c5SJed Brown           touched[k] = PETSC_TRUE;
55770c7d97c5SJed Brown         }
55780c7d97c5SJed Brown       }
55790c7d97c5SJed Brown     }
55800c7d97c5SJed Brown     cptr[++ncmps] = first+cum_queue;
55810c7d97c5SJed Brown     ncmps_pid++;
55820c7d97c5SJed Brown     cum_queue             = cptr[ncmps];
5583a0ba757dSStefano Zampini     graph->where_ncmps[n] = ncmps_pid;
55840c7d97c5SJed Brown   }
55850c7d97c5SJed Brown   graph->ncmps = ncmps;
55860c7d97c5SJed Brown   PetscFunctionReturn(0);
55870c7d97c5SJed Brown }
5588