xref: /petsc/src/ksp/pc/impls/bddc/bddc.c (revision 1e6b0712040ec8365256c86ba1b999c3f2b9df53)
153cdbc3dSStefano Zampini /* TODOLIST
2da1bb401SStefano Zampini    DofSplitting and DM attached to pc?
3da1bb401SStefano Zampini    Change SetNeumannBoundaries to SetNeumannBoundariesLocal and provide new SetNeumannBoundaries (same Dirichlet)
4a0ba757dSStefano Zampini    change how to deal with the coarse problem (PCBDDCSetCoarseEnvironment):
5a0ba757dSStefano Zampini      - simplify coarse problem structure -> PCBDDC or PCREDUNDANT, nothing else -> same comm for all levels?
6a0ba757dSStefano Zampini      - remove coarse enums and allow use of PCBDDCGetCoarseKSP
7a0ba757dSStefano Zampini      - remove metis dependency -> use MatPartitioning for multilevel -> Assemble serial adjacency in ManageLocalBoundaries?
8a0ba757dSStefano Zampini    code refactoring:
9a0ba757dSStefano Zampini      - pick up better names for static functions
10a0ba757dSStefano Zampini    change options structure:
11a0ba757dSStefano Zampini      - insert BDDC into MG framework?
12a0ba757dSStefano Zampini    provide other ops? Ask to developers
13a0ba757dSStefano Zampini    remove all unused printf
14a0ba757dSStefano Zampini    man pages
1553cdbc3dSStefano Zampini */
160c7d97c5SJed Brown 
1753cdbc3dSStefano Zampini /* ----------------------------------------------------------------------------------------------------------------------------------------------
180c7d97c5SJed Brown    Implementation of BDDC preconditioner based on:
190c7d97c5SJed Brown    C. Dohrmann "An approximate BDDC preconditioner", Numerical Linear Algebra with Applications Volume 14, Issue 2, pages 149-168, March 2007
2053cdbc3dSStefano Zampini    ---------------------------------------------------------------------------------------------------------------------------------------------- */
2153cdbc3dSStefano Zampini 
2207475bc1SBarry Smith #include "bddc.h" /*I "petscpc.h" I*/
233b03a366Sstefano_zampini #include <petscblaslapack.h>
240c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
250c7d97c5SJed Brown #undef __FUNCT__
260c7d97c5SJed Brown #define __FUNCT__ "PCSetFromOptions_BDDC"
270c7d97c5SJed Brown PetscErrorCode PCSetFromOptions_BDDC(PC pc)
280c7d97c5SJed Brown {
290c7d97c5SJed Brown   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
300c7d97c5SJed Brown   PetscErrorCode ierr;
310c7d97c5SJed Brown 
320c7d97c5SJed Brown   PetscFunctionBegin;
330c7d97c5SJed Brown   ierr = PetscOptionsHead("BDDC options");CHKERRQ(ierr);
340c7d97c5SJed Brown   /* Verbose debugging of main data structures */
350298fd71SBarry Smith   ierr = PetscOptionsBool("-pc_bddc_check_all"       ,"Verbose (debugging) output for PCBDDC"                       ,"none",pcbddc->dbg_flag      ,&pcbddc->dbg_flag      ,NULL);CHKERRQ(ierr);
360c7d97c5SJed Brown   /* Some customization for default primal space */
370298fd71SBarry Smith   ierr = PetscOptionsBool("-pc_bddc_vertices_only"   ,"Use only vertices in coarse space (i.e. discard constraints)","none",pcbddc->vertices_flag   ,&pcbddc->vertices_flag   ,NULL);CHKERRQ(ierr);
380298fd71SBarry Smith   ierr = PetscOptionsBool("-pc_bddc_constraints_only","Use only constraints in coarse space (i.e. discard vertices)","none",pcbddc->constraints_flag,&pcbddc->constraints_flag,NULL);CHKERRQ(ierr);
390298fd71SBarry Smith   ierr = PetscOptionsBool("-pc_bddc_faces_only"      ,"Use only faces among constraints of coarse space (i.e. discard edges)"         ,"none",pcbddc->faces_flag      ,&pcbddc->faces_flag      ,NULL);CHKERRQ(ierr);
400298fd71SBarry Smith   ierr = PetscOptionsBool("-pc_bddc_edges_only"      ,"Use only edges among constraints of coarse space (i.e. discard faces)"         ,"none",pcbddc->edges_flag      ,&pcbddc->edges_flag      ,NULL);CHKERRQ(ierr);
412fa5cd67SKarl Rupp 
420c7d97c5SJed Brown   /* Coarse solver context */
436c667b0aSStefano Zampini   static const char * const avail_coarse_problems[] = {"sequential","replicated","parallel","multilevel","CoarseProblemType","PC_BDDC_",0}; /* order of choiches depends on ENUM defined in bddc.h */
440298fd71SBarry Smith   ierr = PetscOptionsEnum("-pc_bddc_coarse_problem_type","Set coarse problem type","none",avail_coarse_problems,(PetscEnum)pcbddc->coarse_problem_type,(PetscEnum*)&pcbddc->coarse_problem_type,NULL);CHKERRQ(ierr);
452fa5cd67SKarl Rupp 
460c7d97c5SJed Brown   /* Two different application of BDDC to the whole set of dofs, internal and interface */
470298fd71SBarry Smith   ierr = PetscOptionsBool("-pc_bddc_switch_preconditioning_type","Switch between M_2 (default) and M_3 preconditioners (as defined by Dohrmann)","none",pcbddc->inexact_prec_type,&pcbddc->inexact_prec_type,NULL);CHKERRQ(ierr);
480298fd71SBarry Smith   ierr = PetscOptionsBool("-pc_bddc_use_change_of_basis","Use change of basis approach for primal space","none",pcbddc->usechangeofbasis,&pcbddc->usechangeofbasis,NULL);CHKERRQ(ierr);
490298fd71SBarry Smith   ierr = PetscOptionsBool("-pc_bddc_use_change_on_faces","Use change of basis approach for face constraints","none",pcbddc->usechangeonfaces,&pcbddc->usechangeonfaces,NULL);CHKERRQ(ierr);
502fa5cd67SKarl Rupp 
51534831adSStefano Zampini   pcbddc->usechangeonfaces = pcbddc->usechangeonfaces && pcbddc->usechangeofbasis;
522fa5cd67SKarl Rupp 
530298fd71SBarry Smith   ierr = PetscOptionsInt("-pc_bddc_coarsening_ratio","Set coarsening ratio used in multilevel coarsening","none",pcbddc->coarsening_ratio,&pcbddc->coarsening_ratio,NULL);CHKERRQ(ierr);
540298fd71SBarry Smith   ierr = PetscOptionsInt("-pc_bddc_max_levels","Set maximum number of levels for multilevel","none",pcbddc->max_levels,&pcbddc->max_levels,NULL);CHKERRQ(ierr);
550c7d97c5SJed Brown   ierr = PetscOptionsTail();CHKERRQ(ierr);
560c7d97c5SJed Brown   PetscFunctionReturn(0);
570c7d97c5SJed Brown }
580c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
59*1e6b0712SBarry Smith 
600c7d97c5SJed Brown #undef __FUNCT__
610c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetCoarseProblemType_BDDC"
6253cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetCoarseProblemType_BDDC(PC pc, CoarseProblemType CPT)
630c7d97c5SJed Brown {
640c7d97c5SJed Brown   PC_BDDC *pcbddc = (PC_BDDC*)pc->data;
650c7d97c5SJed Brown 
660c7d97c5SJed Brown   PetscFunctionBegin;
670c7d97c5SJed Brown   pcbddc->coarse_problem_type = CPT;
680c7d97c5SJed Brown   PetscFunctionReturn(0);
690c7d97c5SJed Brown }
70*1e6b0712SBarry Smith 
710c7d97c5SJed Brown #undef __FUNCT__
720c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetCoarseProblemType"
7353cdbc3dSStefano Zampini /*@
749c0446d6SStefano Zampini  PCBDDCSetCoarseProblemType - Set coarse problem type in PCBDDC.
7553cdbc3dSStefano Zampini 
769c0446d6SStefano Zampini    Not collective
7753cdbc3dSStefano Zampini 
7853cdbc3dSStefano Zampini    Input Parameters:
7953cdbc3dSStefano Zampini +  pc - the preconditioning context
8053cdbc3dSStefano Zampini -  CoarseProblemType - pick a better name and explain what this is
8153cdbc3dSStefano Zampini 
8253cdbc3dSStefano Zampini    Level: intermediate
8353cdbc3dSStefano Zampini 
8453cdbc3dSStefano Zampini    Notes:
85da1bb401SStefano Zampini    Not collective but all procs must call with same arguments.
8653cdbc3dSStefano Zampini 
8753cdbc3dSStefano Zampini .seealso: PCBDDC
8853cdbc3dSStefano Zampini @*/
890c7d97c5SJed Brown PetscErrorCode PCBDDCSetCoarseProblemType(PC pc, CoarseProblemType CPT)
900c7d97c5SJed Brown {
910c7d97c5SJed Brown   PetscErrorCode ierr;
920c7d97c5SJed Brown 
930c7d97c5SJed Brown   PetscFunctionBegin;
940c7d97c5SJed Brown   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
950c7d97c5SJed Brown   ierr = PetscTryMethod(pc,"PCBDDCSetCoarseProblemType_C",(PC,CoarseProblemType),(pc,CPT));CHKERRQ(ierr);
960c7d97c5SJed Brown   PetscFunctionReturn(0);
970c7d97c5SJed Brown }
980c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
990c7d97c5SJed Brown #undef __FUNCT__
1004fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetCoarseningRatio_BDDC"
1014fad6a16SStefano Zampini static PetscErrorCode PCBDDCSetCoarseningRatio_BDDC(PC pc,PetscInt k)
1024fad6a16SStefano Zampini {
1034fad6a16SStefano Zampini   PC_BDDC *pcbddc = (PC_BDDC*)pc->data;
1044fad6a16SStefano Zampini 
1054fad6a16SStefano Zampini   PetscFunctionBegin;
1064fad6a16SStefano Zampini   pcbddc->coarsening_ratio=k;
1074fad6a16SStefano Zampini   PetscFunctionReturn(0);
1084fad6a16SStefano Zampini }
109*1e6b0712SBarry Smith 
1104fad6a16SStefano Zampini #undef __FUNCT__
1114fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetCoarseningRatio"
1124fad6a16SStefano Zampini /*@
1134fad6a16SStefano Zampini  PCBDDCSetCoarseningRatio - Set coarsening ratio used in multilevel coarsening
1144fad6a16SStefano Zampini 
1154fad6a16SStefano Zampini    Logically collective on PC
1164fad6a16SStefano Zampini 
1174fad6a16SStefano Zampini    Input Parameters:
1184fad6a16SStefano Zampini +  pc - the preconditioning context
1194fad6a16SStefano Zampini -  k - coarsening ratio
1204fad6a16SStefano Zampini 
1214fad6a16SStefano Zampini    Approximatively k subdomains at the finer level will be aggregated into a single subdomain at the coarser level.
1224fad6a16SStefano Zampini 
1234fad6a16SStefano Zampini    Level: intermediate
1244fad6a16SStefano Zampini 
1254fad6a16SStefano Zampini    Notes:
1264fad6a16SStefano Zampini 
1274fad6a16SStefano Zampini .seealso: PCBDDC
1284fad6a16SStefano Zampini @*/
1294fad6a16SStefano Zampini PetscErrorCode PCBDDCSetCoarseningRatio(PC pc,PetscInt k)
1304fad6a16SStefano Zampini {
1314fad6a16SStefano Zampini   PetscErrorCode ierr;
1324fad6a16SStefano Zampini 
1334fad6a16SStefano Zampini   PetscFunctionBegin;
1344fad6a16SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
1354fad6a16SStefano Zampini   ierr = PetscTryMethod(pc,"PCBDDCSetCoarseningRatio_C",(PC,PetscInt),(pc,k));CHKERRQ(ierr);
1364fad6a16SStefano Zampini   PetscFunctionReturn(0);
1374fad6a16SStefano Zampini }
1384fad6a16SStefano Zampini /* -------------------------------------------------------------------------- */
139*1e6b0712SBarry Smith 
1404fad6a16SStefano Zampini #undef __FUNCT__
1414fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetMaxLevels_BDDC"
1424fad6a16SStefano Zampini static PetscErrorCode PCBDDCSetMaxLevels_BDDC(PC pc,PetscInt max_levels)
1434fad6a16SStefano Zampini {
1444fad6a16SStefano Zampini   PC_BDDC *pcbddc = (PC_BDDC*)pc->data;
1454fad6a16SStefano Zampini 
1464fad6a16SStefano Zampini   PetscFunctionBegin;
1474fad6a16SStefano Zampini   pcbddc->max_levels=max_levels;
1484fad6a16SStefano Zampini   PetscFunctionReturn(0);
1494fad6a16SStefano Zampini }
150*1e6b0712SBarry Smith 
1514fad6a16SStefano Zampini #undef __FUNCT__
1524fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetMaxLevels"
1534fad6a16SStefano Zampini /*@
1544fad6a16SStefano Zampini  PCBDDCSetMaxLevels - Sets the maximum number of levels within the multilevel approach.
1554fad6a16SStefano Zampini 
1564fad6a16SStefano Zampini    Logically collective on PC
1574fad6a16SStefano Zampini 
1584fad6a16SStefano Zampini    Input Parameters:
1594fad6a16SStefano Zampini +  pc - the preconditioning context
1604fad6a16SStefano Zampini -  max_levels - the maximum number of levels
1614fad6a16SStefano Zampini 
1624fad6a16SStefano Zampini    Default value is 1, i.e. coarse problem will be solved inexactly with one application
1634fad6a16SStefano Zampini    of PCBDDC preconditioner if the multilevel approach is requested.
1644fad6a16SStefano Zampini 
1654fad6a16SStefano Zampini    Level: intermediate
1664fad6a16SStefano Zampini 
1674fad6a16SStefano Zampini    Notes:
1684fad6a16SStefano Zampini 
1694fad6a16SStefano Zampini .seealso: PCBDDC
1704fad6a16SStefano Zampini @*/
1714fad6a16SStefano Zampini PetscErrorCode PCBDDCSetMaxLevels(PC pc,PetscInt max_levels)
1724fad6a16SStefano Zampini {
1734fad6a16SStefano Zampini   PetscErrorCode ierr;
1744fad6a16SStefano Zampini 
1754fad6a16SStefano Zampini   PetscFunctionBegin;
1764fad6a16SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
1774fad6a16SStefano Zampini   ierr = PetscTryMethod(pc,"PCBDDCSetMaxLevels_C",(PC,PetscInt),(pc,max_levels));CHKERRQ(ierr);
1784fad6a16SStefano Zampini   PetscFunctionReturn(0);
1794fad6a16SStefano Zampini }
1804fad6a16SStefano Zampini /* -------------------------------------------------------------------------- */
181*1e6b0712SBarry Smith 
1824fad6a16SStefano Zampini #undef __FUNCT__
1830bdf917eSStefano Zampini #define __FUNCT__ "PCBDDCSetNullSpace_BDDC"
1840bdf917eSStefano Zampini static PetscErrorCode PCBDDCSetNullSpace_BDDC(PC pc,MatNullSpace NullSpace)
1850bdf917eSStefano Zampini {
1860bdf917eSStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
1870bdf917eSStefano Zampini   PetscErrorCode ierr;
1880bdf917eSStefano Zampini 
1890bdf917eSStefano Zampini   PetscFunctionBegin;
1900bdf917eSStefano Zampini   ierr = PetscObjectReference((PetscObject)NullSpace);CHKERRQ(ierr);
1910bdf917eSStefano Zampini   ierr = MatNullSpaceDestroy(&pcbddc->NullSpace);CHKERRQ(ierr);
1922fa5cd67SKarl Rupp 
1930bdf917eSStefano Zampini   pcbddc->NullSpace = NullSpace;
1940bdf917eSStefano Zampini   PetscFunctionReturn(0);
1950bdf917eSStefano Zampini }
196*1e6b0712SBarry Smith 
1970bdf917eSStefano Zampini #undef __FUNCT__
1980bdf917eSStefano Zampini #define __FUNCT__ "PCBDDCSetNullSpace"
1990bdf917eSStefano Zampini /*@
2000bdf917eSStefano Zampini  PCBDDCSetNullSpace - Set NullSpace of global operator of BDDC preconditioned mat.
2010bdf917eSStefano Zampini 
2020bdf917eSStefano Zampini    Logically collective on PC and MatNullSpace
2030bdf917eSStefano Zampini 
2040bdf917eSStefano Zampini    Input Parameters:
2050bdf917eSStefano Zampini +  pc - the preconditioning context
2060bdf917eSStefano Zampini -  NullSpace - Null space of the linear operator to be preconditioned.
2070bdf917eSStefano Zampini 
2080bdf917eSStefano Zampini    Level: intermediate
2090bdf917eSStefano Zampini 
2100bdf917eSStefano Zampini    Notes:
2110bdf917eSStefano Zampini 
2120bdf917eSStefano Zampini .seealso: PCBDDC
2130bdf917eSStefano Zampini @*/
2140bdf917eSStefano Zampini PetscErrorCode PCBDDCSetNullSpace(PC pc,MatNullSpace NullSpace)
2150bdf917eSStefano Zampini {
2160bdf917eSStefano Zampini   PetscErrorCode ierr;
2170bdf917eSStefano Zampini 
2180bdf917eSStefano Zampini   PetscFunctionBegin;
2190bdf917eSStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
2200bdf917eSStefano Zampini   ierr = PetscTryMethod(pc,"PCBDDCSetNullSpace_C",(PC,MatNullSpace),(pc,NullSpace));CHKERRQ(ierr);
2210bdf917eSStefano Zampini   PetscFunctionReturn(0);
2220bdf917eSStefano Zampini }
2230bdf917eSStefano Zampini /* -------------------------------------------------------------------------- */
224*1e6b0712SBarry Smith 
2250bdf917eSStefano Zampini #undef __FUNCT__
2263b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCSetDirichletBoundaries_BDDC"
2273b03a366Sstefano_zampini static PetscErrorCode PCBDDCSetDirichletBoundaries_BDDC(PC pc,IS DirichletBoundaries)
2283b03a366Sstefano_zampini {
2293b03a366Sstefano_zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
2303b03a366Sstefano_zampini   PetscErrorCode ierr;
2313b03a366Sstefano_zampini 
2323b03a366Sstefano_zampini   PetscFunctionBegin;
2333b03a366Sstefano_zampini   ierr = ISDestroy(&pcbddc->DirichletBoundaries);CHKERRQ(ierr);
23436e030ebSStefano Zampini   ierr = PetscObjectReference((PetscObject)DirichletBoundaries);CHKERRQ(ierr);
2352fa5cd67SKarl Rupp 
23636e030ebSStefano Zampini   pcbddc->DirichletBoundaries = DirichletBoundaries;
2373b03a366Sstefano_zampini   PetscFunctionReturn(0);
2383b03a366Sstefano_zampini }
239*1e6b0712SBarry Smith 
2403b03a366Sstefano_zampini #undef __FUNCT__
2413b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCSetDirichletBoundaries"
2423b03a366Sstefano_zampini /*@
243da1bb401SStefano Zampini  PCBDDCSetDirichletBoundaries - Set index set defining subdomain part (in local ordering)
244da1bb401SStefano Zampini                               of Dirichlet boundaries for the global problem.
2453b03a366Sstefano_zampini 
2463b03a366Sstefano_zampini    Not collective
2473b03a366Sstefano_zampini 
2483b03a366Sstefano_zampini    Input Parameters:
2493b03a366Sstefano_zampini +  pc - the preconditioning context
2500298fd71SBarry Smith -  DirichletBoundaries - sequential index set defining the subdomain part of Dirichlet boundaries (can be NULL)
2513b03a366Sstefano_zampini 
2523b03a366Sstefano_zampini    Level: intermediate
2533b03a366Sstefano_zampini 
2543b03a366Sstefano_zampini    Notes:
2553b03a366Sstefano_zampini 
2563b03a366Sstefano_zampini .seealso: PCBDDC
2573b03a366Sstefano_zampini @*/
2583b03a366Sstefano_zampini PetscErrorCode PCBDDCSetDirichletBoundaries(PC pc,IS DirichletBoundaries)
2593b03a366Sstefano_zampini {
2603b03a366Sstefano_zampini   PetscErrorCode ierr;
2613b03a366Sstefano_zampini 
2623b03a366Sstefano_zampini   PetscFunctionBegin;
2633b03a366Sstefano_zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
2643b03a366Sstefano_zampini   ierr = PetscTryMethod(pc,"PCBDDCSetDirichletBoundaries_C",(PC,IS),(pc,DirichletBoundaries));CHKERRQ(ierr);
2653b03a366Sstefano_zampini   PetscFunctionReturn(0);
2663b03a366Sstefano_zampini }
2673b03a366Sstefano_zampini /* -------------------------------------------------------------------------- */
268*1e6b0712SBarry Smith 
2693b03a366Sstefano_zampini #undef __FUNCT__
2700c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetNeumannBoundaries_BDDC"
27153cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetNeumannBoundaries_BDDC(PC pc,IS NeumannBoundaries)
2720c7d97c5SJed Brown {
2730c7d97c5SJed Brown   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
27453cdbc3dSStefano Zampini   PetscErrorCode ierr;
2750c7d97c5SJed Brown 
2760c7d97c5SJed Brown   PetscFunctionBegin;
27753cdbc3dSStefano Zampini   ierr = ISDestroy(&pcbddc->NeumannBoundaries);CHKERRQ(ierr);
27836e030ebSStefano Zampini   ierr = PetscObjectReference((PetscObject)NeumannBoundaries);CHKERRQ(ierr);
2792fa5cd67SKarl Rupp 
28036e030ebSStefano Zampini   pcbddc->NeumannBoundaries = NeumannBoundaries;
2810c7d97c5SJed Brown   PetscFunctionReturn(0);
2820c7d97c5SJed Brown }
283*1e6b0712SBarry Smith 
2840c7d97c5SJed Brown #undef __FUNCT__
2850c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetNeumannBoundaries"
28657527edcSJed Brown /*@
287da1bb401SStefano Zampini  PCBDDCSetNeumannBoundaries - Set index set defining subdomain part (in local ordering)
288da1bb401SStefano Zampini                               of Neumann boundaries for the global problem.
28957527edcSJed Brown 
2909c0446d6SStefano Zampini    Not collective
29157527edcSJed Brown 
29257527edcSJed Brown    Input Parameters:
29357527edcSJed Brown +  pc - the preconditioning context
2940298fd71SBarry Smith -  NeumannBoundaries - sequential index set defining the subdomain part of Neumann boundaries (can be NULL)
29557527edcSJed Brown 
29657527edcSJed Brown    Level: intermediate
29757527edcSJed Brown 
29857527edcSJed Brown    Notes:
29957527edcSJed Brown 
30057527edcSJed Brown .seealso: PCBDDC
30157527edcSJed Brown @*/
30253cdbc3dSStefano Zampini PetscErrorCode PCBDDCSetNeumannBoundaries(PC pc,IS NeumannBoundaries)
3030c7d97c5SJed Brown {
3040c7d97c5SJed Brown   PetscErrorCode ierr;
3050c7d97c5SJed Brown 
3060c7d97c5SJed Brown   PetscFunctionBegin;
3070c7d97c5SJed Brown   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
30853cdbc3dSStefano Zampini   ierr = PetscTryMethod(pc,"PCBDDCSetNeumannBoundaries_C",(PC,IS),(pc,NeumannBoundaries));CHKERRQ(ierr);
30953cdbc3dSStefano Zampini   PetscFunctionReturn(0);
31053cdbc3dSStefano Zampini }
31153cdbc3dSStefano Zampini /* -------------------------------------------------------------------------- */
312*1e6b0712SBarry Smith 
31353cdbc3dSStefano Zampini #undef __FUNCT__
314da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCGetDirichletBoundaries_BDDC"
315da1bb401SStefano Zampini static PetscErrorCode PCBDDCGetDirichletBoundaries_BDDC(PC pc,IS *DirichletBoundaries)
316da1bb401SStefano Zampini {
317da1bb401SStefano Zampini   PC_BDDC *pcbddc = (PC_BDDC*)pc->data;
318da1bb401SStefano Zampini 
319da1bb401SStefano Zampini   PetscFunctionBegin;
320da1bb401SStefano Zampini   *DirichletBoundaries = pcbddc->DirichletBoundaries;
321da1bb401SStefano Zampini   PetscFunctionReturn(0);
322da1bb401SStefano Zampini }
323*1e6b0712SBarry Smith 
324da1bb401SStefano Zampini #undef __FUNCT__
325da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCGetDirichletBoundaries"
326da1bb401SStefano Zampini /*@
327da1bb401SStefano Zampini  PCBDDCGetDirichletBoundaries - Get index set defining subdomain part (in local ordering)
328da1bb401SStefano Zampini                                 of Dirichlet boundaries for the global problem.
329da1bb401SStefano Zampini 
330da1bb401SStefano Zampini    Not collective
331da1bb401SStefano Zampini 
332da1bb401SStefano Zampini    Input Parameters:
333da1bb401SStefano Zampini +  pc - the preconditioning context
334da1bb401SStefano Zampini 
335da1bb401SStefano Zampini    Output Parameters:
336da1bb401SStefano Zampini +  DirichletBoundaries - index set defining the subdomain part of Dirichlet boundaries
337da1bb401SStefano Zampini 
338da1bb401SStefano Zampini    Level: intermediate
339da1bb401SStefano Zampini 
340da1bb401SStefano Zampini    Notes:
341da1bb401SStefano Zampini 
342da1bb401SStefano Zampini .seealso: PCBDDC
343da1bb401SStefano Zampini @*/
344da1bb401SStefano Zampini PetscErrorCode PCBDDCGetDirichletBoundaries(PC pc,IS *DirichletBoundaries)
345da1bb401SStefano Zampini {
346da1bb401SStefano Zampini   PetscErrorCode ierr;
347da1bb401SStefano Zampini 
348da1bb401SStefano Zampini   PetscFunctionBegin;
349da1bb401SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
350da1bb401SStefano Zampini   ierr = PetscUseMethod(pc,"PCBDDCGetDirichletBoundaries_C",(PC,IS*),(pc,DirichletBoundaries));CHKERRQ(ierr);
351da1bb401SStefano Zampini   PetscFunctionReturn(0);
352da1bb401SStefano Zampini }
353da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
354*1e6b0712SBarry Smith 
355da1bb401SStefano Zampini #undef __FUNCT__
35653cdbc3dSStefano Zampini #define __FUNCT__ "PCBDDCGetNeumannBoundaries_BDDC"
35753cdbc3dSStefano Zampini static PetscErrorCode PCBDDCGetNeumannBoundaries_BDDC(PC pc,IS *NeumannBoundaries)
35853cdbc3dSStefano Zampini {
35953cdbc3dSStefano Zampini   PC_BDDC *pcbddc = (PC_BDDC*)pc->data;
36053cdbc3dSStefano Zampini 
36153cdbc3dSStefano Zampini   PetscFunctionBegin;
36253cdbc3dSStefano Zampini   *NeumannBoundaries = pcbddc->NeumannBoundaries;
36353cdbc3dSStefano Zampini   PetscFunctionReturn(0);
36453cdbc3dSStefano Zampini }
365*1e6b0712SBarry Smith 
36653cdbc3dSStefano Zampini #undef __FUNCT__
36753cdbc3dSStefano Zampini #define __FUNCT__ "PCBDDCGetNeumannBoundaries"
36853cdbc3dSStefano Zampini /*@
369da1bb401SStefano Zampini  PCBDDCGetNeumannBoundaries - Get index set defining subdomain part (in local ordering)
370da1bb401SStefano Zampini                               of Neumann boundaries for the global problem.
37153cdbc3dSStefano Zampini 
3729c0446d6SStefano Zampini    Not collective
37353cdbc3dSStefano Zampini 
37453cdbc3dSStefano Zampini    Input Parameters:
37553cdbc3dSStefano Zampini +  pc - the preconditioning context
37653cdbc3dSStefano Zampini 
37753cdbc3dSStefano Zampini    Output Parameters:
37853cdbc3dSStefano Zampini +  NeumannBoundaries - index set defining the subdomain part of Neumann boundaries
37953cdbc3dSStefano Zampini 
38053cdbc3dSStefano Zampini    Level: intermediate
38153cdbc3dSStefano Zampini 
38253cdbc3dSStefano Zampini    Notes:
38353cdbc3dSStefano Zampini 
38453cdbc3dSStefano Zampini .seealso: PCBDDC
38553cdbc3dSStefano Zampini @*/
38653cdbc3dSStefano Zampini PetscErrorCode PCBDDCGetNeumannBoundaries(PC pc,IS *NeumannBoundaries)
38753cdbc3dSStefano Zampini {
38853cdbc3dSStefano Zampini   PetscErrorCode ierr;
38953cdbc3dSStefano Zampini 
39053cdbc3dSStefano Zampini   PetscFunctionBegin;
39153cdbc3dSStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
39253cdbc3dSStefano Zampini   ierr = PetscUseMethod(pc,"PCBDDCGetNeumannBoundaries_C",(PC,IS*),(pc,NeumannBoundaries));CHKERRQ(ierr);
3930c7d97c5SJed Brown   PetscFunctionReturn(0);
3940c7d97c5SJed Brown }
39536e030ebSStefano Zampini /* -------------------------------------------------------------------------- */
396*1e6b0712SBarry Smith 
39736e030ebSStefano Zampini #undef __FUNCT__
398da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetLocalAdjacencyGraph_BDDC"
3991a83f524SJed Brown static PetscErrorCode PCBDDCSetLocalAdjacencyGraph_BDDC(PC pc, PetscInt nvtxs,const PetscInt xadj[],const PetscInt adjncy[], PetscCopyMode copymode)
40036e030ebSStefano Zampini {
40136e030ebSStefano Zampini   PC_BDDC        *pcbddc  = (PC_BDDC*)pc->data;
402da1bb401SStefano Zampini   PCBDDCGraph    mat_graph=pcbddc->mat_graph;
403da1bb401SStefano Zampini   PetscErrorCode ierr;
40436e030ebSStefano Zampini 
40536e030ebSStefano Zampini   PetscFunctionBegin;
406da1bb401SStefano Zampini   mat_graph->nvtxs=nvtxs;
4072fa5cd67SKarl Rupp 
408da1bb401SStefano Zampini   ierr = PetscFree(mat_graph->xadj);CHKERRQ(ierr);
409da1bb401SStefano Zampini   ierr = PetscFree(mat_graph->adjncy);CHKERRQ(ierr);
410da1bb401SStefano Zampini   if (copymode == PETSC_COPY_VALUES) {
411da1bb401SStefano Zampini     ierr = PetscMalloc((mat_graph->nvtxs+1)*sizeof(PetscInt),&mat_graph->xadj);CHKERRQ(ierr);
412da1bb401SStefano Zampini     ierr = PetscMalloc(xadj[mat_graph->nvtxs]*sizeof(PetscInt),&mat_graph->adjncy);CHKERRQ(ierr);
413da1bb401SStefano Zampini     ierr = PetscMemcpy(mat_graph->xadj,xadj,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr);
414da1bb401SStefano Zampini     ierr = PetscMemcpy(mat_graph->adjncy,adjncy,xadj[mat_graph->nvtxs]*sizeof(PetscInt));CHKERRQ(ierr);
415da1bb401SStefano Zampini   } else if (copymode == PETSC_OWN_POINTER) {
4161a83f524SJed Brown     mat_graph->xadj   = (PetscInt*)xadj;
4171a83f524SJed Brown     mat_graph->adjncy = (PetscInt*)adjncy;
418acee19a7SJed Brown   } else SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"Unsupported copy mode %d\n",copymode);
41936e030ebSStefano Zampini   PetscFunctionReturn(0);
42036e030ebSStefano Zampini }
421*1e6b0712SBarry Smith 
42236e030ebSStefano Zampini #undef __FUNCT__
423da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetLocalAdjacencyGraph"
42436e030ebSStefano Zampini /*@
425da1bb401SStefano Zampini  PCBDDCSetLocalAdjacencyGraph - Set CSR graph of local matrix for use of PCBDDC.
42636e030ebSStefano Zampini 
42736e030ebSStefano Zampini    Not collective
42836e030ebSStefano Zampini 
42936e030ebSStefano Zampini    Input Parameters:
43036e030ebSStefano Zampini +  pc - the preconditioning context
431da1bb401SStefano Zampini -  nvtxs - number of local vertices of the graph
432da1bb401SStefano Zampini -  xadj, adjncy - the CSR graph
433da1bb401SStefano Zampini -  copymode - either PETSC_COPY_VALUES or PETSC_OWN_POINTER. In the former case the user must free the array passed in;
434da1bb401SStefano Zampini                                                              in the latter case, memory must be obtained with PetscMalloc.
43536e030ebSStefano Zampini 
43636e030ebSStefano Zampini    Level: intermediate
43736e030ebSStefano Zampini 
43836e030ebSStefano Zampini    Notes:
43936e030ebSStefano Zampini 
44036e030ebSStefano Zampini .seealso: PCBDDC
44136e030ebSStefano Zampini @*/
4421a83f524SJed Brown PetscErrorCode PCBDDCSetLocalAdjacencyGraph(PC pc,PetscInt nvtxs,const PetscInt xadj[],const PetscInt adjncy[], PetscCopyMode copymode)
44336e030ebSStefano Zampini {
444da1bb401SStefano Zampini   PetscInt       nrows,ncols;
445da1bb401SStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
44636e030ebSStefano Zampini   PetscErrorCode ierr;
44736e030ebSStefano Zampini 
44836e030ebSStefano Zampini   PetscFunctionBegin;
44936e030ebSStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
450da1bb401SStefano Zampini   ierr = MatGetSize(matis->A,&nrows,&ncols);CHKERRQ(ierr);
451f23aa3ddSBarry Smith   if (nvtxs != nrows) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Local adjacency size %d passed in %s differs from local problem size %d!\n",nvtxs,nrows);
452f23aa3ddSBarry Smith   else {
4531a83f524SJed Brown     ierr = PetscTryMethod(pc,"PCBDDCSetLocalAdjacencyGraph_C",(PC,PetscInt,const PetscInt[],const PetscInt[],PetscCopyMode),(pc,nvtxs,xadj,adjncy,copymode));CHKERRQ(ierr);
454da1bb401SStefano Zampini   }
45536e030ebSStefano Zampini   PetscFunctionReturn(0);
45636e030ebSStefano Zampini }
4579c0446d6SStefano Zampini /* -------------------------------------------------------------------------- */
458*1e6b0712SBarry Smith 
4599c0446d6SStefano Zampini #undef __FUNCT__
4609c0446d6SStefano Zampini #define __FUNCT__ "PCBDDCSetDofsSplitting_BDDC"
4619c0446d6SStefano Zampini static PetscErrorCode PCBDDCSetDofsSplitting_BDDC(PC pc,PetscInt n_is, IS ISForDofs[])
4629c0446d6SStefano Zampini {
4639c0446d6SStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
4649c0446d6SStefano Zampini   PetscInt       i;
4659c0446d6SStefano Zampini   PetscErrorCode ierr;
4669c0446d6SStefano Zampini 
4679c0446d6SStefano Zampini   PetscFunctionBegin;
468da1bb401SStefano Zampini   /* Destroy ISes if they were already set */
4699c0446d6SStefano Zampini   for (i=0; i<pcbddc->n_ISForDofs; i++) {
4709c0446d6SStefano Zampini     ierr = ISDestroy(&pcbddc->ISForDofs[i]);CHKERRQ(ierr);
4719c0446d6SStefano Zampini   }
472d11ae9bbSstefano_zampini   ierr = PetscFree(pcbddc->ISForDofs);CHKERRQ(ierr);
473da1bb401SStefano Zampini   /* allocate space then set */
4749c0446d6SStefano Zampini   ierr = PetscMalloc(n_is*sizeof(IS),&pcbddc->ISForDofs);CHKERRQ(ierr);
4759c0446d6SStefano Zampini   for (i=0; i<n_is; i++) {
476da1bb401SStefano Zampini     ierr = PetscObjectReference((PetscObject)ISForDofs[i]);CHKERRQ(ierr);
4772fa5cd67SKarl Rupp 
478da1bb401SStefano Zampini     pcbddc->ISForDofs[i]=ISForDofs[i];
4799c0446d6SStefano Zampini   }
4809c0446d6SStefano Zampini   pcbddc->n_ISForDofs=n_is;
4819c0446d6SStefano Zampini   PetscFunctionReturn(0);
4829c0446d6SStefano Zampini }
483*1e6b0712SBarry Smith 
4849c0446d6SStefano Zampini #undef __FUNCT__
4859c0446d6SStefano Zampini #define __FUNCT__ "PCBDDCSetDofsSplitting"
4869c0446d6SStefano Zampini /*@
487da1bb401SStefano Zampini  PCBDDCSetDofsSplitting - Set index sets defining fields of local mat.
4889c0446d6SStefano Zampini 
4899c0446d6SStefano Zampini    Not collective
4909c0446d6SStefano Zampini 
4919c0446d6SStefano Zampini    Input Parameters:
4929c0446d6SStefano Zampini +  pc - the preconditioning context
493da1bb401SStefano Zampini -  n - number of index sets defining the fields
494da1bb401SStefano Zampini -  IS[] - array of IS describing the fields
4959c0446d6SStefano Zampini 
4969c0446d6SStefano Zampini    Level: intermediate
4979c0446d6SStefano Zampini 
4989c0446d6SStefano Zampini    Notes:
4999c0446d6SStefano Zampini 
5009c0446d6SStefano Zampini .seealso: PCBDDC
5019c0446d6SStefano Zampini @*/
5029c0446d6SStefano Zampini PetscErrorCode PCBDDCSetDofsSplitting(PC pc,PetscInt n_is, IS ISForDofs[])
5039c0446d6SStefano Zampini {
5049c0446d6SStefano Zampini   PetscErrorCode ierr;
5059c0446d6SStefano Zampini 
5069c0446d6SStefano Zampini   PetscFunctionBegin;
5079c0446d6SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
5089c0446d6SStefano Zampini   ierr = PetscTryMethod(pc,"PCBDDCSetDofsSplitting_C",(PC,PetscInt,IS[]),(pc,n_is,ISForDofs));CHKERRQ(ierr);
5099c0446d6SStefano Zampini   PetscFunctionReturn(0);
5109c0446d6SStefano Zampini }
511da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
512534831adSStefano Zampini #undef __FUNCT__
513534831adSStefano Zampini #define __FUNCT__ "PCPreSolve_BDDC"
514534831adSStefano Zampini /* -------------------------------------------------------------------------- */
515534831adSStefano Zampini /*
516534831adSStefano Zampini    PCPreSolve_BDDC - Changes the right hand side and (if necessary) the initial
517534831adSStefano Zampini                      guess if a transformation of basis approach has been selected.
5189c0446d6SStefano Zampini 
519534831adSStefano Zampini    Input Parameter:
520534831adSStefano Zampini +  pc - the preconditioner contex
521534831adSStefano Zampini 
522534831adSStefano Zampini    Application Interface Routine: PCPreSolve()
523534831adSStefano Zampini 
524534831adSStefano Zampini    Notes:
525534831adSStefano Zampini    The interface routine PCPreSolve() is not usually called directly by
526534831adSStefano Zampini    the user, but instead is called by KSPSolve().
527534831adSStefano Zampini */
528534831adSStefano Zampini static PetscErrorCode PCPreSolve_BDDC(PC pc, KSP ksp, Vec rhs, Vec x)
529534831adSStefano Zampini {
530534831adSStefano Zampini   PetscErrorCode ierr;
531534831adSStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
532534831adSStefano Zampini   PC_IS          *pcis   = (PC_IS*)(pc->data);
533534831adSStefano Zampini   Mat_IS         *matis  = (Mat_IS*)pc->pmat->data;
534534831adSStefano Zampini   Mat            temp_mat;
5353972b0daSStefano Zampini   IS             dirIS;
5363972b0daSStefano Zampini   PetscInt       dirsize,i,*is_indices;
5373972b0daSStefano Zampini   PetscScalar    *array_x,*array_diagonal;
5383972b0daSStefano Zampini   Vec            used_vec;
5393972b0daSStefano Zampini   PetscBool      guess_nonzero;
540534831adSStefano Zampini 
541534831adSStefano Zampini   PetscFunctionBegin;
5423972b0daSStefano Zampini   if (x) {
5433972b0daSStefano Zampini     ierr     = PetscObjectReference((PetscObject)x);CHKERRQ(ierr);
5443972b0daSStefano Zampini     used_vec = x;
5453972b0daSStefano Zampini   } else {
5463972b0daSStefano Zampini     ierr     = PetscObjectReference((PetscObject)pcbddc->temp_solution);CHKERRQ(ierr);
5473972b0daSStefano Zampini     used_vec = pcbddc->temp_solution;
5483972b0daSStefano Zampini     ierr     = VecSet(used_vec,0.0);CHKERRQ(ierr);
5493972b0daSStefano Zampini   }
5503972b0daSStefano Zampini   /* hack into ksp data structure PCPreSolve comes earlier in src/ksp/ksp/interface/itfunc.c */
5513972b0daSStefano Zampini   if (ksp) {
5523972b0daSStefano Zampini     ierr = KSPGetInitialGuessNonzero(ksp,&guess_nonzero);CHKERRQ(ierr);
5533972b0daSStefano Zampini     if (!guess_nonzero) {
5543972b0daSStefano Zampini       ierr = VecSet(used_vec,0.0);CHKERRQ(ierr);
5553972b0daSStefano Zampini     }
5563972b0daSStefano Zampini   }
5573972b0daSStefano Zampini   /* store the original rhs */
5583972b0daSStefano Zampini   ierr = VecCopy(rhs,pcbddc->original_rhs);CHKERRQ(ierr);
5593972b0daSStefano Zampini 
5603972b0daSStefano Zampini   /* Take into account zeroed rows -> change rhs and store solution removed */
5613972b0daSStefano Zampini   ierr = MatGetDiagonal(pc->pmat,pcis->vec1_global);CHKERRQ(ierr);
5623972b0daSStefano Zampini   ierr = VecPointwiseDivide(pcis->vec1_global,rhs,pcis->vec1_global);CHKERRQ(ierr);
5633972b0daSStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5643972b0daSStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5653972b0daSStefano Zampini   ierr = VecScatterBegin(matis->ctx,used_vec,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5663972b0daSStefano Zampini   ierr = VecScatterEnd  (matis->ctx,used_vec,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5673972b0daSStefano Zampini   ierr = PCBDDCGetDirichletBoundaries(pc,&dirIS);CHKERRQ(ierr);
5683972b0daSStefano Zampini   if (dirIS) {
5693972b0daSStefano Zampini     ierr = ISGetSize(dirIS,&dirsize);CHKERRQ(ierr);
5703972b0daSStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array_x);CHKERRQ(ierr);
5713972b0daSStefano Zampini     ierr = VecGetArray(pcis->vec2_N,&array_diagonal);CHKERRQ(ierr);
5723972b0daSStefano Zampini     ierr = ISGetIndices(dirIS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
5732fa5cd67SKarl Rupp     for (i=0; i<dirsize; i++) array_x[is_indices[i]] = array_diagonal[is_indices[i]];
5742fa5cd67SKarl Rupp 
5753972b0daSStefano Zampini     ierr = ISRestoreIndices(dirIS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
5763972b0daSStefano Zampini     ierr = VecRestoreArray(pcis->vec2_N,&array_diagonal);CHKERRQ(ierr);
5773972b0daSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array_x);CHKERRQ(ierr);
5783972b0daSStefano Zampini   }
5793972b0daSStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
5803972b0daSStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
581b76ba322SStefano Zampini 
5823972b0daSStefano Zampini   /* remove the computed solution from the rhs */
5833972b0daSStefano Zampini   ierr = VecScale(used_vec,-1.0);CHKERRQ(ierr);
5843972b0daSStefano Zampini   ierr = MatMultAdd(pc->pmat,used_vec,rhs,rhs);CHKERRQ(ierr);
5853972b0daSStefano Zampini   ierr = VecScale(used_vec,-1.0);CHKERRQ(ierr);
586b76ba322SStefano Zampini 
587b76ba322SStefano Zampini   /* store partially computed solution and set initial guess */
5883972b0daSStefano Zampini   if (x) {
5893972b0daSStefano Zampini     ierr = VecCopy(used_vec,pcbddc->temp_solution);CHKERRQ(ierr);
5903972b0daSStefano Zampini     ierr = VecSet(used_vec,0.0);CHKERRQ(ierr);
591b76ba322SStefano Zampini     if (pcbddc->use_exact_dirichlet) {
592b76ba322SStefano Zampini       ierr = VecScatterBegin(pcis->global_to_D,rhs,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
593b76ba322SStefano Zampini       ierr = VecScatterEnd  (pcis->global_to_D,rhs,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
594b76ba322SStefano Zampini       ierr = KSPSolve(pcbddc->ksp_D,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
595b76ba322SStefano Zampini       ierr = VecScatterBegin(pcis->global_to_D,pcis->vec2_D,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
596b76ba322SStefano Zampini       ierr = VecScatterEnd  (pcis->global_to_D,pcis->vec2_D,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
597b76ba322SStefano Zampini       if (ksp) {
598b76ba322SStefano Zampini         ierr = KSPSetInitialGuessNonzero(ksp,PETSC_TRUE);CHKERRQ(ierr);
599b76ba322SStefano Zampini       }
600b76ba322SStefano Zampini     }
6013972b0daSStefano Zampini   }
602b76ba322SStefano Zampini 
603b76ba322SStefano Zampini   /* rhs change of basis */
604b76ba322SStefano Zampini   if (pcbddc->usechangeofbasis) {
605b76ba322SStefano Zampini     /* swap pointers for local matrices */
606b76ba322SStefano Zampini     temp_mat          = matis->A;
607b76ba322SStefano Zampini     matis->A          = pcbddc->local_mat;
608b76ba322SStefano Zampini     pcbddc->local_mat = temp_mat;
609b76ba322SStefano Zampini     /* Get local rhs and apply transformation of basis */
610b76ba322SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,rhs,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
611b76ba322SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,rhs,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
612b76ba322SStefano Zampini     /* from original basis to modified basis */
613b76ba322SStefano Zampini     ierr = MatMultTranspose(pcbddc->ChangeOfBasisMatrix,pcis->vec1_B,pcis->vec2_B);CHKERRQ(ierr);
614b76ba322SStefano Zampini     /* put back modified values into the global vec using INSERT_VALUES copy mode */
615b76ba322SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec2_B,rhs,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
616b76ba322SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec2_B,rhs,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
6170bdf917eSStefano Zampini     if (ksp && pcbddc->NullSpace) {
6180298fd71SBarry Smith       ierr = MatNullSpaceRemove(pcbddc->NullSpace,used_vec,NULL);CHKERRQ(ierr);
6190298fd71SBarry Smith       ierr = MatNullSpaceRemove(pcbddc->NullSpace,rhs,NULL);CHKERRQ(ierr);
620b76ba322SStefano Zampini     }
6210bdf917eSStefano Zampini   }
6220bdf917eSStefano Zampini   ierr = VecDestroy(&used_vec);CHKERRQ(ierr);
623534831adSStefano Zampini   PetscFunctionReturn(0);
624534831adSStefano Zampini }
625534831adSStefano Zampini /* -------------------------------------------------------------------------- */
626534831adSStefano Zampini #undef __FUNCT__
627534831adSStefano Zampini #define __FUNCT__ "PCPostSolve_BDDC"
628534831adSStefano Zampini /* -------------------------------------------------------------------------- */
629534831adSStefano Zampini /*
630534831adSStefano Zampini    PCPostSolve_BDDC - Changes the computed solution if a transformation of basis
631534831adSStefano Zampini                      approach has been selected. Also, restores rhs to its original state.
632534831adSStefano Zampini 
633534831adSStefano Zampini    Input Parameter:
634534831adSStefano Zampini +  pc - the preconditioner contex
635534831adSStefano Zampini 
636534831adSStefano Zampini    Application Interface Routine: PCPostSolve()
637534831adSStefano Zampini 
638534831adSStefano Zampini    Notes:
639534831adSStefano Zampini    The interface routine PCPostSolve() is not usually called directly by
640534831adSStefano Zampini    the user, but instead is called by KSPSolve().
641534831adSStefano Zampini */
642534831adSStefano Zampini static PetscErrorCode PCPostSolve_BDDC(PC pc, KSP ksp, Vec rhs, Vec x)
643534831adSStefano Zampini {
644534831adSStefano Zampini   PetscErrorCode ierr;
645534831adSStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
646534831adSStefano Zampini   PC_IS          *pcis   = (PC_IS*)(pc->data);
647534831adSStefano Zampini   Mat_IS         *matis  = (Mat_IS*)pc->pmat->data;
648534831adSStefano Zampini   Mat            temp_mat;
649534831adSStefano Zampini 
650534831adSStefano Zampini   PetscFunctionBegin;
651534831adSStefano Zampini   if (pcbddc->usechangeofbasis) {
652534831adSStefano Zampini     /* swap pointers for local matrices */
653534831adSStefano Zampini     temp_mat          = matis->A;
654534831adSStefano Zampini     matis->A          = pcbddc->local_mat;
655534831adSStefano Zampini     pcbddc->local_mat = temp_mat;
656534831adSStefano Zampini     /* restore rhs to its original state */
6573425bc38SStefano Zampini     if (rhs) {
6583425bc38SStefano Zampini       ierr = VecCopy(pcbddc->original_rhs,rhs);CHKERRQ(ierr);
6593425bc38SStefano Zampini     }
660534831adSStefano Zampini     /* Get Local boundary and apply transformation of basis to solution vector */
661534831adSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,x,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
662534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,x,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
663534831adSStefano Zampini     /* from modified basis to original basis */
664534831adSStefano Zampini     ierr = MatMult(pcbddc->ChangeOfBasisMatrix,pcis->vec1_B,pcis->vec2_B);CHKERRQ(ierr);
665534831adSStefano Zampini     /* put back modified values into the global vec using INSERT_VALUES copy mode */
666534831adSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec2_B,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
667534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec2_B,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
668534831adSStefano Zampini   }
6693972b0daSStefano Zampini   /* add solution removed in presolve */
6703425bc38SStefano Zampini   if (x) {
6713425bc38SStefano Zampini     ierr = VecAXPY(x,1.0,pcbddc->temp_solution);CHKERRQ(ierr);
6723425bc38SStefano Zampini   }
673534831adSStefano Zampini   PetscFunctionReturn(0);
674534831adSStefano Zampini }
675534831adSStefano Zampini /* -------------------------------------------------------------------------- */
67653cdbc3dSStefano Zampini #undef __FUNCT__
67753cdbc3dSStefano Zampini #define __FUNCT__ "PCSetUp_BDDC"
6780c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
6790c7d97c5SJed Brown /*
6800c7d97c5SJed Brown    PCSetUp_BDDC - Prepares for the use of the BDDC preconditioner
6810c7d97c5SJed Brown                   by setting data structures and options.
6820c7d97c5SJed Brown 
6830c7d97c5SJed Brown    Input Parameter:
68453cdbc3dSStefano Zampini +  pc - the preconditioner context
6850c7d97c5SJed Brown 
6860c7d97c5SJed Brown    Application Interface Routine: PCSetUp()
6870c7d97c5SJed Brown 
6880c7d97c5SJed Brown    Notes:
6890c7d97c5SJed Brown    The interface routine PCSetUp() is not usually called directly by
6900c7d97c5SJed Brown    the user, but instead is called by PCApply() if necessary.
6910c7d97c5SJed Brown */
69253cdbc3dSStefano Zampini PetscErrorCode PCSetUp_BDDC(PC pc)
6930c7d97c5SJed Brown {
6940c7d97c5SJed Brown   PetscErrorCode ierr;
6950c7d97c5SJed Brown   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
6960c7d97c5SJed Brown 
6970c7d97c5SJed Brown   PetscFunctionBegin;
6980c7d97c5SJed Brown   if (!pc->setupcalled) {
6993b03a366Sstefano_zampini     /* For BDDC we need to define a local "Neumann" problem different to that defined in PCISSetup
7009c0446d6SStefano Zampini        So, we set to pcnone the Neumann problem of pcis in order to avoid unneeded computation
7010c7d97c5SJed Brown        Also, we decide to directly build the (same) Dirichlet problem */
7020c7d97c5SJed Brown     ierr = PetscOptionsSetValue("-is_localN_pc_type","none");CHKERRQ(ierr);
7030c7d97c5SJed Brown     ierr = PetscOptionsSetValue("-is_localD_pc_type","none");CHKERRQ(ierr);
7040c7d97c5SJed Brown     /* Set up all the "iterative substructuring" common block */
7050bdf917eSStefano Zampini 
7060c7d97c5SJed Brown     ierr = PCISSetUp(pc);CHKERRQ(ierr);
7073b03a366Sstefano_zampini     /* Get stdout for dbg */
708e269702eSStefano Zampini     if (pcbddc->dbg_flag) {
709ce94432eSBarry Smith       ierr = PetscViewerASCIIGetStdout(PetscObjectComm((PetscObject)pc),&pcbddc->dbg_viewer);CHKERRQ(ierr);
710e269702eSStefano Zampini       ierr = PetscViewerASCIISynchronizedAllow(pcbddc->dbg_viewer,PETSC_TRUE);CHKERRQ(ierr);
711e269702eSStefano Zampini     }
7123b03a366Sstefano_zampini     /* Analyze local interface */
7130c7d97c5SJed Brown     ierr = PCBDDCManageLocalBoundaries(pc);CHKERRQ(ierr);
7143b03a366Sstefano_zampini     /* Set up local constraint matrix */
7153b03a366Sstefano_zampini     ierr = PCBDDCCreateConstraintMatrix(pc);CHKERRQ(ierr);
7160c7d97c5SJed Brown     /* Create coarse and local stuffs used for evaluating action of preconditioner */
7170c7d97c5SJed Brown     ierr = PCBDDCCoarseSetUp(pc);CHKERRQ(ierr);
7180c7d97c5SJed Brown   }
7190c7d97c5SJed Brown   PetscFunctionReturn(0);
7200c7d97c5SJed Brown }
7210c7d97c5SJed Brown 
7220c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
7230c7d97c5SJed Brown /*
7240c7d97c5SJed Brown    PCApply_BDDC - Applies the BDDC preconditioner to a vector.
7250c7d97c5SJed Brown 
7260c7d97c5SJed Brown    Input Parameters:
7270c7d97c5SJed Brown .  pc - the preconditioner context
7280c7d97c5SJed Brown .  r - input vector (global)
7290c7d97c5SJed Brown 
7300c7d97c5SJed Brown    Output Parameter:
7310c7d97c5SJed Brown .  z - output vector (global)
7320c7d97c5SJed Brown 
7330c7d97c5SJed Brown    Application Interface Routine: PCApply()
7340c7d97c5SJed Brown  */
7350c7d97c5SJed Brown #undef __FUNCT__
7360c7d97c5SJed Brown #define __FUNCT__ "PCApply_BDDC"
73753cdbc3dSStefano Zampini PetscErrorCode PCApply_BDDC(PC pc,Vec r,Vec z)
7380c7d97c5SJed Brown {
7390c7d97c5SJed Brown   PC_IS             *pcis   = (PC_IS*)(pc->data);
7400c7d97c5SJed Brown   PC_BDDC           *pcbddc = (PC_BDDC*)(pc->data);
7410c7d97c5SJed Brown   PetscErrorCode    ierr;
7423b03a366Sstefano_zampini   const PetscScalar one   = 1.0;
7433b03a366Sstefano_zampini   const PetscScalar m_one = -1.0;
7442617d88aSStefano Zampini   const PetscScalar zero  = 0.0;
7450c7d97c5SJed Brown 
7460c7d97c5SJed Brown /* This code is similar to that provided in nn.c for PCNN
7470c7d97c5SJed Brown    NN interface preconditioner changed to BDDC
74829622bf0SStefano Zampini    Added support for M_3 preconditioner in the reference article (code is active if pcbddc->inexact_prec_type = PETSC_TRUE) */
7490c7d97c5SJed Brown 
7500c7d97c5SJed Brown   PetscFunctionBegin;
751b76ba322SStefano Zampini   if (!pcbddc->use_exact_dirichlet) {
7520c7d97c5SJed Brown     /* First Dirichlet solve */
7530c7d97c5SJed Brown     ierr = VecScatterBegin(pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7540c7d97c5SJed Brown     ierr = VecScatterEnd  (pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
75553cdbc3dSStefano Zampini     ierr = KSPSolve(pcbddc->ksp_D,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
7560c7d97c5SJed Brown     /*
7570c7d97c5SJed Brown       Assembling right hand side for BDDC operator
7580c7d97c5SJed Brown       - vec1_D for the Dirichlet part (if needed, i.e. prec_flag=PETSC_TRUE)
7590c7d97c5SJed Brown       - the interface part of the global vector z
7600c7d97c5SJed Brown     */
7610c7d97c5SJed Brown     ierr = VecScale(pcis->vec2_D,m_one);CHKERRQ(ierr);
7620c7d97c5SJed Brown     ierr = MatMult(pcis->A_BI,pcis->vec2_D,pcis->vec1_B);CHKERRQ(ierr);
76329622bf0SStefano Zampini     if (pcbddc->inexact_prec_type) { ierr = MatMultAdd(pcis->A_II,pcis->vec2_D,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); }
7640c7d97c5SJed Brown     ierr = VecScale(pcis->vec2_D,m_one);CHKERRQ(ierr);
7650c7d97c5SJed Brown     ierr = VecCopy(r,z);CHKERRQ(ierr);
7660c7d97c5SJed Brown     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
7670c7d97c5SJed Brown     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
7682617d88aSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7692617d88aSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
770b76ba322SStefano Zampini   } else {
771b76ba322SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,r,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
772b76ba322SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,r,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7730bdf917eSStefano Zampini     ierr = VecSet(pcis->vec1_D,zero);CHKERRQ(ierr);
774b76ba322SStefano Zampini     ierr = VecSet(pcis->vec2_D,zero);CHKERRQ(ierr);
775b76ba322SStefano Zampini   }
776b76ba322SStefano Zampini 
777b76ba322SStefano Zampini   /* Apply partition of unity */
7782617d88aSStefano Zampini   ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr);
7792617d88aSStefano Zampini 
7802617d88aSStefano Zampini   /* Apply interface preconditioner
7812617d88aSStefano Zampini      input/output vecs: pcis->vec1_B and pcis->vec1_D */
7822617d88aSStefano Zampini   ierr = PCBDDCApplyInterfacePreconditioner(pc);CHKERRQ(ierr);
7832617d88aSStefano Zampini 
7842617d88aSStefano Zampini   /* Apply partition of unity and sum boundary values */
7852617d88aSStefano Zampini   ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr);
7862617d88aSStefano Zampini   ierr = VecSet(z,zero);CHKERRQ(ierr);
7872617d88aSStefano Zampini   ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
7882617d88aSStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
7890c7d97c5SJed Brown 
7903b03a366Sstefano_zampini   /* Second Dirichlet solve and assembling of output */
7910c7d97c5SJed Brown   ierr = VecScatterBegin(pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7920c7d97c5SJed Brown   ierr = VecScatterEnd  (pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7930c7d97c5SJed Brown   ierr = MatMult(pcis->A_IB,pcis->vec1_B,pcis->vec3_D);CHKERRQ(ierr);
79429622bf0SStefano Zampini   if (pcbddc->inexact_prec_type) { ierr = MatMultAdd(pcis->A_II,pcis->vec1_D,pcis->vec3_D,pcis->vec3_D);CHKERRQ(ierr); }
79553cdbc3dSStefano Zampini   ierr = KSPSolve(pcbddc->ksp_D,pcis->vec3_D,pcbddc->vec4_D);CHKERRQ(ierr);
7960c7d97c5SJed Brown   ierr = VecScale(pcbddc->vec4_D,m_one);CHKERRQ(ierr);
79729622bf0SStefano Zampini   if (pcbddc->inexact_prec_type) { ierr = VecAXPY (pcbddc->vec4_D,one,pcis->vec1_D);CHKERRQ(ierr); }
7980c7d97c5SJed Brown   ierr = VecAXPY (pcis->vec2_D,one,pcbddc->vec4_D);CHKERRQ(ierr);
7990c7d97c5SJed Brown   ierr = VecScatterBegin(pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8000c7d97c5SJed Brown   ierr = VecScatterEnd  (pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8010c7d97c5SJed Brown   PetscFunctionReturn(0);
8020c7d97c5SJed Brown 
8030c7d97c5SJed Brown }
804da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
805da1bb401SStefano Zampini #undef __FUNCT__
806da1bb401SStefano Zampini #define __FUNCT__ "PCDestroy_BDDC"
807da1bb401SStefano Zampini PetscErrorCode PCDestroy_BDDC(PC pc)
808da1bb401SStefano Zampini {
809da1bb401SStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
8100bdf917eSStefano Zampini   PetscInt       i;
811da1bb401SStefano Zampini   PetscErrorCode ierr;
812da1bb401SStefano Zampini 
813da1bb401SStefano Zampini   PetscFunctionBegin;
814da1bb401SStefano Zampini   /* free data created by PCIS */
815da1bb401SStefano Zampini   ierr = PCISDestroy(pc);CHKERRQ(ierr);
816da1bb401SStefano Zampini   /* free BDDC data  */
8170bdf917eSStefano Zampini   ierr = MatNullSpaceDestroy(&pcbddc->CoarseNullSpace);CHKERRQ(ierr);
8180bdf917eSStefano Zampini   ierr = MatNullSpaceDestroy(&pcbddc->NullSpace);CHKERRQ(ierr);
8193972b0daSStefano Zampini   ierr = VecDestroy(&pcbddc->temp_solution);CHKERRQ(ierr);
820534831adSStefano Zampini   ierr = VecDestroy(&pcbddc->original_rhs);CHKERRQ(ierr);
821534831adSStefano Zampini   ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr);
822534831adSStefano Zampini   ierr = MatDestroy(&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr);
823da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->coarse_vec);CHKERRQ(ierr);
824da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->coarse_rhs);CHKERRQ(ierr);
825da1bb401SStefano Zampini   ierr = KSPDestroy(&pcbddc->coarse_ksp);CHKERRQ(ierr);
826da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->coarse_mat);CHKERRQ(ierr);
827da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->coarse_phi_B);CHKERRQ(ierr);
828da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->coarse_phi_D);CHKERRQ(ierr);
829da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec1_P);CHKERRQ(ierr);
830da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec1_C);CHKERRQ(ierr);
831da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->local_auxmat1);CHKERRQ(ierr);
832da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->local_auxmat2);CHKERRQ(ierr);
833da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec1_R);CHKERRQ(ierr);
834da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec2_R);CHKERRQ(ierr);
835da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec4_D);CHKERRQ(ierr);
836da1bb401SStefano Zampini   ierr = VecScatterDestroy(&pcbddc->R_to_B);CHKERRQ(ierr);
837da1bb401SStefano Zampini   ierr = VecScatterDestroy(&pcbddc->R_to_D);CHKERRQ(ierr);
838da1bb401SStefano Zampini   ierr = VecScatterDestroy(&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr);
839da1bb401SStefano Zampini   ierr = KSPDestroy(&pcbddc->ksp_D);CHKERRQ(ierr);
840da1bb401SStefano Zampini   ierr = KSPDestroy(&pcbddc->ksp_R);CHKERRQ(ierr);
841da1bb401SStefano Zampini   ierr = ISDestroy(&pcbddc->NeumannBoundaries);CHKERRQ(ierr);
842da1bb401SStefano Zampini   ierr = ISDestroy(&pcbddc->DirichletBoundaries);CHKERRQ(ierr);
843da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->ConstraintMatrix);CHKERRQ(ierr);
844da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->local_primal_indices);CHKERRQ(ierr);
845da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->replicated_local_primal_indices);CHKERRQ(ierr);
8460bdf917eSStefano Zampini   ierr = PetscFree(pcbddc->replicated_local_primal_values);CHKERRQ(ierr);
847da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->local_primal_displacements);CHKERRQ(ierr);
848da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->local_primal_sizes);CHKERRQ(ierr);
8492fa5cd67SKarl Rupp   for (i=0; i<pcbddc->n_ISForDofs; i++) {
8502fa5cd67SKarl Rupp     ierr = ISDestroy(&pcbddc->ISForDofs[i]);CHKERRQ(ierr);
8512fa5cd67SKarl Rupp   }
852da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->ISForDofs);CHKERRQ(ierr);
8532fa5cd67SKarl Rupp   for (i=0; i<pcbddc->n_ISForFaces; i++) {
8542fa5cd67SKarl Rupp     ierr = ISDestroy(&pcbddc->ISForFaces[i]);CHKERRQ(ierr);
8552fa5cd67SKarl Rupp   }
856da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->ISForFaces);CHKERRQ(ierr);
8572fa5cd67SKarl Rupp   for (i=0; i<pcbddc->n_ISForEdges; i++) {
8582fa5cd67SKarl Rupp     ierr = ISDestroy(&pcbddc->ISForEdges[i]);CHKERRQ(ierr);
8592fa5cd67SKarl Rupp   }
860da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->ISForEdges);CHKERRQ(ierr);
861da1bb401SStefano Zampini   ierr = ISDestroy(&pcbddc->ISForVertices);CHKERRQ(ierr);
8623972b0daSStefano Zampini   /* Free graph structure */
863da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->xadj);CHKERRQ(ierr);
864da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->adjncy);CHKERRQ(ierr);
865142dfd88SStefano Zampini   if (pcbddc->mat_graph->nvtxs) {
866da1bb401SStefano Zampini     ierr = PetscFree(pcbddc->mat_graph->neighbours_set[0]);CHKERRQ(ierr);
867142dfd88SStefano Zampini   }
868da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->neighbours_set);CHKERRQ(ierr);
8693972b0daSStefano Zampini   ierr = PetscFree4(pcbddc->mat_graph->where,pcbddc->mat_graph->count,pcbddc->mat_graph->cptr,pcbddc->mat_graph->queue);CHKERRQ(ierr);
8703972b0daSStefano Zampini   ierr = PetscFree2(pcbddc->mat_graph->which_dof,pcbddc->mat_graph->touched);CHKERRQ(ierr);
8713972b0daSStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->where_ncmps);CHKERRQ(ierr);
872da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph);CHKERRQ(ierr);
8733425bc38SStefano Zampini   /* remove functions */
87400de8ff0SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCSetCoarseningRatio_C","",NULL);CHKERRQ(ierr);
87500de8ff0SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCSetMaxLevels_C","",NULL);CHKERRQ(ierr);
87600de8ff0SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCSetNullSpace_C","",NULL);CHKERRQ(ierr);
87700de8ff0SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCSetDirichletBoundaries_C","",NULL);CHKERRQ(ierr);
87800de8ff0SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCSetNeumannBoundaries_C","",NULL);CHKERRQ(ierr);
87900de8ff0SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCGetDirichletBoundaries_C","",NULL);CHKERRQ(ierr);
88000de8ff0SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCGetNeumannBoundaries_C","",NULL);CHKERRQ(ierr);
88100de8ff0SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCSetCoarseProblemType_C","",NULL);CHKERRQ(ierr);
88200de8ff0SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCSetDofsSplitting_C","",NULL);CHKERRQ(ierr);
88300de8ff0SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCSetLocalAdjacencyGraph_C","",NULL);CHKERRQ(ierr);
88400de8ff0SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)pc,"PCPreSolve_C","",NULL);CHKERRQ(ierr);
88500de8ff0SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)pc,"PCPostSolve_C","",NULL);CHKERRQ(ierr);
88600de8ff0SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCCreateFETIDPOperators_C","",NULL);CHKERRQ(ierr);
88700de8ff0SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCMatFETIDPGetRHS_C","",NULL);CHKERRQ(ierr);
88800de8ff0SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCMatFETIDPGetSolution_C","",NULL);CHKERRQ(ierr);
889da1bb401SStefano Zampini   /* Free the private data structure that was hanging off the PC */
890da1bb401SStefano Zampini   ierr = PetscFree(pcbddc);CHKERRQ(ierr);
891da1bb401SStefano Zampini   PetscFunctionReturn(0);
892da1bb401SStefano Zampini }
8933425bc38SStefano Zampini /* -------------------------------------------------------------------------- */
894*1e6b0712SBarry Smith 
8953425bc38SStefano Zampini #undef __FUNCT__
8963425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetRHS_BDDC"
8973425bc38SStefano Zampini static PetscErrorCode PCBDDCMatFETIDPGetRHS_BDDC(Mat fetidp_mat, Vec standard_rhs, Vec fetidp_flux_rhs)
8983425bc38SStefano Zampini {
8993425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
9003425bc38SStefano Zampini   PC_IS          * pcis;
9013425bc38SStefano Zampini   PC_BDDC        * pcbddc;
9023425bc38SStefano Zampini   PetscErrorCode ierr;
9030c7d97c5SJed Brown 
9043425bc38SStefano Zampini   PetscFunctionBegin;
9053425bc38SStefano Zampini   ierr   = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr);
9063425bc38SStefano Zampini   pcis   = (PC_IS*)mat_ctx->pc->data;
9073425bc38SStefano Zampini   pcbddc = (PC_BDDC*)mat_ctx->pc->data;
9083425bc38SStefano Zampini 
9093425bc38SStefano Zampini   /* change of basis for physical rhs if needed
9103425bc38SStefano Zampini      It also changes the rhs in case of dirichlet boundaries */
9110298fd71SBarry Smith   (*mat_ctx->pc->ops->presolve)(mat_ctx->pc,NULL,standard_rhs,NULL);
9123425bc38SStefano Zampini   /* store vectors for computation of fetidp final solution */
9133425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->global_to_D,standard_rhs,mat_ctx->temp_solution_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9143425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_D,standard_rhs,mat_ctx->temp_solution_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9153425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9163425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9173425bc38SStefano Zampini   /* scale rhs since it should be unassembled */
9183425bc38SStefano Zampini   ierr = VecPointwiseMult(mat_ctx->temp_solution_B,pcis->D,mat_ctx->temp_solution_B);CHKERRQ(ierr);
91929622bf0SStefano Zampini   if (!pcbddc->inexact_prec_type) {
9203425bc38SStefano Zampini     /* compute partially subassembled Schur complement right-hand side */
9213425bc38SStefano Zampini     ierr = KSPSolve(pcbddc->ksp_D,mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr);
9223425bc38SStefano Zampini     ierr = MatMult(pcis->A_BI,pcis->vec1_D,pcis->vec1_B);CHKERRQ(ierr);
9233425bc38SStefano Zampini     ierr = VecAXPY(mat_ctx->temp_solution_B,-1.0,pcis->vec1_B);CHKERRQ(ierr);
9243425bc38SStefano Zampini     ierr = VecSet(standard_rhs,0.0);CHKERRQ(ierr);
9253425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,mat_ctx->temp_solution_B,standard_rhs,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
9263425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,mat_ctx->temp_solution_B,standard_rhs,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
9273425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9283425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9293425bc38SStefano Zampini     ierr = VecPointwiseMult(mat_ctx->temp_solution_B,pcis->D,mat_ctx->temp_solution_B);CHKERRQ(ierr);
9303425bc38SStefano Zampini   }
9313425bc38SStefano Zampini   /* BDDC rhs */
9323425bc38SStefano Zampini   ierr = VecCopy(mat_ctx->temp_solution_B,pcis->vec1_B);CHKERRQ(ierr);
93329622bf0SStefano Zampini   if (pcbddc->inexact_prec_type) {
9343425bc38SStefano Zampini     ierr = VecCopy(mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr);
9353425bc38SStefano Zampini   }
9363425bc38SStefano Zampini   /* apply BDDC */
9373425bc38SStefano Zampini   ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr);
9383425bc38SStefano Zampini   /* Application of B_delta and assembling of rhs for fetidp fluxes */
9393425bc38SStefano Zampini   ierr = VecSet(fetidp_flux_rhs,0.0);CHKERRQ(ierr);
9403425bc38SStefano Zampini   ierr = MatMult(mat_ctx->B_delta,pcis->vec1_B,mat_ctx->lambda_local);CHKERRQ(ierr);
9413425bc38SStefano Zampini   ierr = VecScatterBegin(mat_ctx->l2g_lambda,mat_ctx->lambda_local,fetidp_flux_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9423425bc38SStefano Zampini   ierr = VecScatterEnd  (mat_ctx->l2g_lambda,mat_ctx->lambda_local,fetidp_flux_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9433425bc38SStefano Zampini   /* restore original rhs */
9443425bc38SStefano Zampini   ierr = VecCopy(pcbddc->original_rhs,standard_rhs);CHKERRQ(ierr);
9453425bc38SStefano Zampini   PetscFunctionReturn(0);
9463425bc38SStefano Zampini }
947*1e6b0712SBarry Smith 
9483425bc38SStefano Zampini #undef __FUNCT__
9493425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetRHS"
9503425bc38SStefano Zampini /*@
9513425bc38SStefano Zampini  PCBDDCMatFETIDPGetRHS - Get rhs for FETIDP linear system.
9523425bc38SStefano Zampini 
9533425bc38SStefano Zampini    Collective
9543425bc38SStefano Zampini 
9553425bc38SStefano Zampini    Input Parameters:
9563425bc38SStefano Zampini +  fetidp_mat   - the FETIDP mat obtained by a call to PCBDDCCreateFETIDPOperators
9573425bc38SStefano Zampini +  standard_rhs - the rhs of your linear system
9583425bc38SStefano Zampini 
9593425bc38SStefano Zampini    Output Parameters:
9603425bc38SStefano Zampini +  fetidp_flux_rhs   - the rhs of the FETIDP linear system
9613425bc38SStefano Zampini 
9623425bc38SStefano Zampini    Level: developer
9633425bc38SStefano Zampini 
9643425bc38SStefano Zampini    Notes:
9653425bc38SStefano Zampini 
9663425bc38SStefano Zampini .seealso: PCBDDC
9673425bc38SStefano Zampini @*/
9683425bc38SStefano Zampini PetscErrorCode PCBDDCMatFETIDPGetRHS(Mat fetidp_mat, Vec standard_rhs, Vec fetidp_flux_rhs)
9693425bc38SStefano Zampini {
9703425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
9713425bc38SStefano Zampini   PetscErrorCode ierr;
9723425bc38SStefano Zampini 
9733425bc38SStefano Zampini   PetscFunctionBegin;
9743425bc38SStefano Zampini   ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr);
9753425bc38SStefano Zampini   ierr = PetscTryMethod(mat_ctx->pc,"PCBDDCMatFETIDPGetRHS_C",(Mat,Vec,Vec),(fetidp_mat,standard_rhs,fetidp_flux_rhs));CHKERRQ(ierr);
9763425bc38SStefano Zampini   PetscFunctionReturn(0);
9773425bc38SStefano Zampini }
9783425bc38SStefano Zampini /* -------------------------------------------------------------------------- */
979*1e6b0712SBarry Smith 
9803425bc38SStefano Zampini #undef __FUNCT__
9813425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetSolution_BDDC"
9823425bc38SStefano Zampini static PetscErrorCode PCBDDCMatFETIDPGetSolution_BDDC(Mat fetidp_mat, Vec fetidp_flux_sol, Vec standard_sol)
9833425bc38SStefano Zampini {
9843425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
9853425bc38SStefano Zampini   PC_IS          *pcis;
9863425bc38SStefano Zampini   PC_BDDC        *pcbddc;
9873425bc38SStefano Zampini   PetscErrorCode ierr;
9883425bc38SStefano Zampini 
9893425bc38SStefano Zampini   PetscFunctionBegin;
9903425bc38SStefano Zampini   ierr   = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr);
9913425bc38SStefano Zampini   pcis   = (PC_IS*)mat_ctx->pc->data;
9923425bc38SStefano Zampini   pcbddc = (PC_BDDC*)mat_ctx->pc->data;
9933425bc38SStefano Zampini 
9943425bc38SStefano Zampini   /* apply B_delta^T */
9953425bc38SStefano Zampini   ierr = VecScatterBegin(mat_ctx->l2g_lambda,fetidp_flux_sol,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
9963425bc38SStefano Zampini   ierr = VecScatterEnd  (mat_ctx->l2g_lambda,fetidp_flux_sol,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
9973425bc38SStefano Zampini   ierr = MatMultTranspose(mat_ctx->B_delta,mat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
9983425bc38SStefano Zampini   /* compute rhs for BDDC application */
9993425bc38SStefano Zampini   ierr = VecAYPX(pcis->vec1_B,-1.0,mat_ctx->temp_solution_B);CHKERRQ(ierr);
100029622bf0SStefano Zampini   if (pcbddc->inexact_prec_type) {
10013425bc38SStefano Zampini     ierr = VecCopy(mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr);
10023425bc38SStefano Zampini   }
10033425bc38SStefano Zampini   /* apply BDDC */
10043425bc38SStefano Zampini   ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr);
10053425bc38SStefano Zampini   /* put values into standard global vector */
10063425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
10073425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
100829622bf0SStefano Zampini   if (!pcbddc->inexact_prec_type) {
10093425bc38SStefano Zampini     /* compute values into the interior if solved for the partially subassembled Schur complement */
10103425bc38SStefano Zampini     ierr = MatMult(pcis->A_IB,pcis->vec1_B,pcis->vec1_D);CHKERRQ(ierr);
10113425bc38SStefano Zampini     ierr = VecAXPY(mat_ctx->temp_solution_D,-1.0,pcis->vec1_D);CHKERRQ(ierr);
10123425bc38SStefano Zampini     ierr = KSPSolve(pcbddc->ksp_D,mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr);
10133425bc38SStefano Zampini   }
10143425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->global_to_D,pcis->vec1_D,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
10153425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_D,pcis->vec1_D,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
10163425bc38SStefano Zampini   /* final change of basis if needed
10173425bc38SStefano Zampini      Is also sums the dirichlet part removed during RHS assembling */
10180298fd71SBarry Smith   (*mat_ctx->pc->ops->postsolve)(mat_ctx->pc,NULL,NULL,standard_sol);
10193425bc38SStefano Zampini   PetscFunctionReturn(0);
10203425bc38SStefano Zampini 
10213425bc38SStefano Zampini }
1022*1e6b0712SBarry Smith 
10233425bc38SStefano Zampini #undef __FUNCT__
10243425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetSolution"
10253425bc38SStefano Zampini /*@
10263425bc38SStefano Zampini  PCBDDCMatFETIDPGetSolution - Get Solution for FETIDP linear system.
10273425bc38SStefano Zampini 
10283425bc38SStefano Zampini    Collective
10293425bc38SStefano Zampini 
10303425bc38SStefano Zampini    Input Parameters:
10313425bc38SStefano Zampini +  fetidp_mat        - the FETIDP mat obtained by a call to PCBDDCCreateFETIDPOperators
10323425bc38SStefano Zampini +  fetidp_flux_sol - the solution of the FETIDP linear system
10333425bc38SStefano Zampini 
10343425bc38SStefano Zampini    Output Parameters:
10353425bc38SStefano Zampini +  standard_sol      - the solution on the global domain
10363425bc38SStefano Zampini 
10373425bc38SStefano Zampini    Level: developer
10383425bc38SStefano Zampini 
10393425bc38SStefano Zampini    Notes:
10403425bc38SStefano Zampini 
10413425bc38SStefano Zampini .seealso: PCBDDC
10423425bc38SStefano Zampini @*/
10433425bc38SStefano Zampini PetscErrorCode PCBDDCMatFETIDPGetSolution(Mat fetidp_mat, Vec fetidp_flux_sol, Vec standard_sol)
10443425bc38SStefano Zampini {
10453425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
10463425bc38SStefano Zampini   PetscErrorCode ierr;
10473425bc38SStefano Zampini 
10483425bc38SStefano Zampini   PetscFunctionBegin;
10493425bc38SStefano Zampini   ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr);
10503425bc38SStefano Zampini   ierr = PetscTryMethod(mat_ctx->pc,"PCBDDCMatFETIDPGetSolution_C",(Mat,Vec,Vec),(fetidp_mat,fetidp_flux_sol,standard_sol));CHKERRQ(ierr);
10513425bc38SStefano Zampini   PetscFunctionReturn(0);
10523425bc38SStefano Zampini }
10533425bc38SStefano Zampini /* -------------------------------------------------------------------------- */
1054*1e6b0712SBarry Smith 
1055f23aa3ddSBarry Smith extern PetscErrorCode FETIDPMatMult(Mat,Vec,Vec);
1056f23aa3ddSBarry Smith extern PetscErrorCode PCBDDCDestroyFETIDPMat(Mat);
1057f23aa3ddSBarry Smith extern PetscErrorCode FETIDPPCApply(PC,Vec,Vec);
1058f23aa3ddSBarry Smith extern PetscErrorCode PCBDDCDestroyFETIDPPC(PC);
10593425bc38SStefano Zampini #undef __FUNCT__
10603425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPOperators_BDDC"
10613425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPOperators_BDDC(PC pc, Mat *fetidp_mat, PC *fetidp_pc)
10623425bc38SStefano Zampini {
10633425bc38SStefano Zampini   FETIDPMat_ctx  *fetidpmat_ctx;
10643425bc38SStefano Zampini   Mat            newmat;
10653425bc38SStefano Zampini   FETIDPPC_ctx   *fetidppc_ctx;
10663425bc38SStefano Zampini   PC             newpc;
1067ce94432eSBarry Smith   MPI_Comm       comm;
10683425bc38SStefano Zampini   PetscErrorCode ierr;
10693425bc38SStefano Zampini 
10703425bc38SStefano Zampini   PetscFunctionBegin;
1071ce94432eSBarry Smith   ierr = PetscObjectGetComm((PetscObject)pc,&comm);CHKERRQ(ierr);
10723425bc38SStefano Zampini   /* FETIDP linear matrix */
10733425bc38SStefano Zampini   ierr = PCBDDCCreateFETIDPMatContext(pc, &fetidpmat_ctx);CHKERRQ(ierr);
10743425bc38SStefano Zampini   ierr = PCBDDCSetupFETIDPMatContext(fetidpmat_ctx);CHKERRQ(ierr);
10753425bc38SStefano Zampini   ierr = MatCreateShell(comm,PETSC_DECIDE,PETSC_DECIDE,fetidpmat_ctx->n_lambda,fetidpmat_ctx->n_lambda,fetidpmat_ctx,&newmat);CHKERRQ(ierr);
10763425bc38SStefano Zampini   ierr = MatShellSetOperation(newmat,MATOP_MULT,(void (*)(void))FETIDPMatMult);CHKERRQ(ierr);
10773425bc38SStefano Zampini   ierr = MatShellSetOperation(newmat,MATOP_DESTROY,(void (*)(void))PCBDDCDestroyFETIDPMat);CHKERRQ(ierr);
10783425bc38SStefano Zampini   ierr = MatSetUp(newmat);CHKERRQ(ierr);
10793425bc38SStefano Zampini   /* FETIDP preconditioner */
10803425bc38SStefano Zampini   ierr = PCBDDCCreateFETIDPPCContext(pc, &fetidppc_ctx);CHKERRQ(ierr);
10813425bc38SStefano Zampini   ierr = PCBDDCSetupFETIDPPCContext(newmat,fetidppc_ctx);CHKERRQ(ierr);
10823425bc38SStefano Zampini   ierr = PCCreate(comm,&newpc);CHKERRQ(ierr);
10833425bc38SStefano Zampini   ierr = PCSetType(newpc,PCSHELL);CHKERRQ(ierr);
10843425bc38SStefano Zampini   ierr = PCShellSetContext(newpc,fetidppc_ctx);CHKERRQ(ierr);
10853425bc38SStefano Zampini   ierr = PCShellSetApply(newpc,FETIDPPCApply);CHKERRQ(ierr);
10863425bc38SStefano Zampini   ierr = PCShellSetDestroy(newpc,PCBDDCDestroyFETIDPPC);CHKERRQ(ierr);
10873425bc38SStefano Zampini   ierr = PCSetOperators(newpc,newmat,newmat,SAME_PRECONDITIONER);CHKERRQ(ierr);
10883425bc38SStefano Zampini   ierr = PCSetUp(newpc);CHKERRQ(ierr);
10892fa5cd67SKarl Rupp 
10903425bc38SStefano Zampini   /* return pointers for objects created */
10913425bc38SStefano Zampini   *fetidp_mat = newmat;
10923425bc38SStefano Zampini   *fetidp_pc  = newpc;
10933425bc38SStefano Zampini   PetscFunctionReturn(0);
10943425bc38SStefano Zampini }
1095*1e6b0712SBarry Smith 
10963425bc38SStefano Zampini #undef __FUNCT__
10973425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPOperators"
10983425bc38SStefano Zampini /*@
10993425bc38SStefano Zampini  PCBDDCCreateFETIDPOperators - Create operators for FETIDP.
11003425bc38SStefano Zampini 
11013425bc38SStefano Zampini    Collective
11023425bc38SStefano Zampini 
11033425bc38SStefano Zampini    Input Parameters:
11043425bc38SStefano Zampini +  pc - the BDDC preconditioning context (setup must be already called)
11053425bc38SStefano Zampini 
11063425bc38SStefano Zampini    Level: developer
11073425bc38SStefano Zampini 
11083425bc38SStefano Zampini    Notes:
11093425bc38SStefano Zampini 
11103425bc38SStefano Zampini .seealso: PCBDDC
11113425bc38SStefano Zampini @*/
11123425bc38SStefano Zampini PetscErrorCode PCBDDCCreateFETIDPOperators(PC pc, Mat *fetidp_mat, PC *fetidp_pc)
11133425bc38SStefano Zampini {
11143425bc38SStefano Zampini   PetscErrorCode ierr;
11153425bc38SStefano Zampini 
11163425bc38SStefano Zampini   PetscFunctionBegin;
11173425bc38SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
11183425bc38SStefano Zampini   if (pc->setupcalled) {
11193425bc38SStefano Zampini     ierr = PetscTryMethod(pc,"PCBDDCCreateFETIDPOperators_C",(PC,Mat*,PC*),(pc,fetidp_mat,fetidp_pc));CHKERRQ(ierr);
1120f23aa3ddSBarry Smith   } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"You must call PCSetup_BDDC() first \n");
11213425bc38SStefano Zampini   PetscFunctionReturn(0);
11223425bc38SStefano Zampini }
11230c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
1124da1bb401SStefano Zampini /*MC
1125da1bb401SStefano Zampini    PCBDDC - Balancing Domain Decomposition by Constraints.
11260c7d97c5SJed Brown 
1127da1bb401SStefano Zampini    Options Database Keys:
1128da1bb401SStefano Zampini .    -pcbddc ??? -
1129da1bb401SStefano Zampini 
1130da1bb401SStefano Zampini    Level: intermediate
1131da1bb401SStefano Zampini 
1132da1bb401SStefano Zampini    Notes: The matrix used with this preconditioner must be of type MATIS
1133da1bb401SStefano Zampini 
1134da1bb401SStefano Zampini           Unlike more 'conventional' interface preconditioners, this iterates over ALL the
1135da1bb401SStefano Zampini           degrees of freedom, NOT just those on the interface (this allows the use of approximate solvers
1136da1bb401SStefano Zampini           on the subdomains).
1137da1bb401SStefano Zampini 
1138da1bb401SStefano Zampini           Options for the coarse grid preconditioner can be set with -
1139da1bb401SStefano Zampini           Options for the Dirichlet subproblem can be set with -
1140da1bb401SStefano Zampini           Options for the Neumann subproblem can be set with -
1141da1bb401SStefano Zampini 
1142da1bb401SStefano Zampini    Contributed by Stefano Zampini
1143da1bb401SStefano Zampini 
1144da1bb401SStefano Zampini .seealso:  PCCreate(), PCSetType(), PCType (for list of available types), PC,  MATIS
1145da1bb401SStefano Zampini M*/
1146da1bb401SStefano Zampini EXTERN_C_BEGIN
1147da1bb401SStefano Zampini #undef __FUNCT__
1148da1bb401SStefano Zampini #define __FUNCT__ "PCCreate_BDDC"
1149da1bb401SStefano Zampini PetscErrorCode PCCreate_BDDC(PC pc)
1150da1bb401SStefano Zampini {
1151da1bb401SStefano Zampini   PetscErrorCode ierr;
1152da1bb401SStefano Zampini   PC_BDDC        *pcbddc;
1153da1bb401SStefano Zampini   PCBDDCGraph    mat_graph;
1154da1bb401SStefano Zampini 
1155da1bb401SStefano Zampini   PetscFunctionBegin;
1156da1bb401SStefano Zampini   /* Creates the private data structure for this preconditioner and attach it to the PC object. */
1157da1bb401SStefano Zampini   ierr     = PetscNewLog(pc,PC_BDDC,&pcbddc);CHKERRQ(ierr);
1158da1bb401SStefano Zampini   pc->data = (void*)pcbddc;
1159da1bb401SStefano Zampini 
1160da1bb401SStefano Zampini   /* create PCIS data structure */
1161da1bb401SStefano Zampini   ierr = PCISCreate(pc);CHKERRQ(ierr);
1162da1bb401SStefano Zampini 
1163da1bb401SStefano Zampini   /* BDDC specific */
11640bdf917eSStefano Zampini   pcbddc->CoarseNullSpace                 = 0;
11650bdf917eSStefano Zampini   pcbddc->NullSpace                       = 0;
11663972b0daSStefano Zampini   pcbddc->temp_solution                   = 0;
1167534831adSStefano Zampini   pcbddc->original_rhs                    = 0;
1168534831adSStefano Zampini   pcbddc->local_mat                       = 0;
1169534831adSStefano Zampini   pcbddc->ChangeOfBasisMatrix             = 0;
1170534831adSStefano Zampini   pcbddc->usechangeofbasis                = PETSC_TRUE;
1171534831adSStefano Zampini   pcbddc->usechangeonfaces                = PETSC_FALSE;
1172da1bb401SStefano Zampini   pcbddc->coarse_vec                      = 0;
1173da1bb401SStefano Zampini   pcbddc->coarse_rhs                      = 0;
1174da1bb401SStefano Zampini   pcbddc->coarse_ksp                      = 0;
1175da1bb401SStefano Zampini   pcbddc->coarse_phi_B                    = 0;
1176da1bb401SStefano Zampini   pcbddc->coarse_phi_D                    = 0;
1177da1bb401SStefano Zampini   pcbddc->vec1_P                          = 0;
1178da1bb401SStefano Zampini   pcbddc->vec1_R                          = 0;
1179da1bb401SStefano Zampini   pcbddc->vec2_R                          = 0;
1180da1bb401SStefano Zampini   pcbddc->local_auxmat1                   = 0;
1181da1bb401SStefano Zampini   pcbddc->local_auxmat2                   = 0;
1182da1bb401SStefano Zampini   pcbddc->R_to_B                          = 0;
1183da1bb401SStefano Zampini   pcbddc->R_to_D                          = 0;
1184da1bb401SStefano Zampini   pcbddc->ksp_D                           = 0;
1185da1bb401SStefano Zampini   pcbddc->ksp_R                           = 0;
1186da1bb401SStefano Zampini   pcbddc->local_primal_indices            = 0;
118729622bf0SStefano Zampini   pcbddc->inexact_prec_type               = PETSC_FALSE;
1188da1bb401SStefano Zampini   pcbddc->NeumannBoundaries               = 0;
1189da1bb401SStefano Zampini   pcbddc->ISForDofs                       = 0;
1190da1bb401SStefano Zampini   pcbddc->ISForVertices                   = 0;
1191da1bb401SStefano Zampini   pcbddc->n_ISForFaces                    = 0;
1192da1bb401SStefano Zampini   pcbddc->n_ISForEdges                    = 0;
1193da1bb401SStefano Zampini   pcbddc->ConstraintMatrix                = 0;
1194da1bb401SStefano Zampini   pcbddc->use_nnsp_true                   = PETSC_FALSE;
1195da1bb401SStefano Zampini   pcbddc->local_primal_sizes              = 0;
1196da1bb401SStefano Zampini   pcbddc->local_primal_displacements      = 0;
1197da1bb401SStefano Zampini   pcbddc->replicated_local_primal_indices = 0;
1198da1bb401SStefano Zampini   pcbddc->replicated_local_primal_values  = 0;
1199da1bb401SStefano Zampini   pcbddc->coarse_loc_to_glob              = 0;
1200da1bb401SStefano Zampini   pcbddc->dbg_flag                        = PETSC_FALSE;
1201da1bb401SStefano Zampini   pcbddc->coarsening_ratio                = 8;
1202b76ba322SStefano Zampini   pcbddc->use_exact_dirichlet             = PETSC_TRUE;
12034fad6a16SStefano Zampini   pcbddc->current_level                   = 0;
12044fad6a16SStefano Zampini   pcbddc->max_levels                      = 1;
1205da1bb401SStefano Zampini 
1206da1bb401SStefano Zampini   /* allocate and initialize needed graph structure */
1207da1bb401SStefano Zampini   ierr                      = PetscMalloc(sizeof(*mat_graph),&pcbddc->mat_graph);CHKERRQ(ierr);
1208da1bb401SStefano Zampini   pcbddc->mat_graph->xadj   = 0;
1209da1bb401SStefano Zampini   pcbddc->mat_graph->adjncy = 0;
1210da1bb401SStefano Zampini 
1211da1bb401SStefano Zampini   /* function pointers */
1212da1bb401SStefano Zampini   pc->ops->apply               = PCApply_BDDC;
1213da1bb401SStefano Zampini   pc->ops->applytranspose      = 0;
1214da1bb401SStefano Zampini   pc->ops->setup               = PCSetUp_BDDC;
1215da1bb401SStefano Zampini   pc->ops->destroy             = PCDestroy_BDDC;
1216da1bb401SStefano Zampini   pc->ops->setfromoptions      = PCSetFromOptions_BDDC;
1217da1bb401SStefano Zampini   pc->ops->view                = 0;
1218da1bb401SStefano Zampini   pc->ops->applyrichardson     = 0;
1219da1bb401SStefano Zampini   pc->ops->applysymmetricleft  = 0;
1220da1bb401SStefano Zampini   pc->ops->applysymmetricright = 0;
1221534831adSStefano Zampini   pc->ops->presolve            = PCPreSolve_BDDC;
1222534831adSStefano Zampini   pc->ops->postsolve           = PCPostSolve_BDDC;
1223da1bb401SStefano Zampini 
1224da1bb401SStefano Zampini   /* composing function */
122500de8ff0SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCSetCoarseningRatio_C","PCBDDCSetCoarseningRatio_BDDC",PCBDDCSetCoarseningRatio_BDDC);CHKERRQ(ierr);
122600de8ff0SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCSetMaxLevels_C","PCBDDCSetMaxLevels_BDDC",PCBDDCSetMaxLevels_BDDC);CHKERRQ(ierr);
122700de8ff0SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCSetNullSpace_C","PCBDDCSetNullSpace_BDDC",PCBDDCSetNullSpace_BDDC);CHKERRQ(ierr);
122800de8ff0SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCSetDirichletBoundaries_C","PCBDDCSetDirichletBoundaries_BDDC",PCBDDCSetDirichletBoundaries_BDDC);CHKERRQ(ierr);
122900de8ff0SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCSetNeumannBoundaries_C","PCBDDCSetNeumannBoundaries_BDDC",PCBDDCSetNeumannBoundaries_BDDC);CHKERRQ(ierr);
123000de8ff0SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCGetDirichletBoundaries_C","PCBDDCGetDirichletBoundaries_BDDC",PCBDDCGetDirichletBoundaries_BDDC);CHKERRQ(ierr);
123100de8ff0SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCGetNeumannBoundaries_C","PCBDDCGetNeumannBoundaries_BDDC",PCBDDCGetNeumannBoundaries_BDDC);CHKERRQ(ierr);
123200de8ff0SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCSetCoarseProblemType_C","PCBDDCSetCoarseProblemType_BDDC",PCBDDCSetCoarseProblemType_BDDC);CHKERRQ(ierr);
123300de8ff0SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCSetDofsSplitting_C","PCBDDCSetDofsSplitting_BDDC",PCBDDCSetDofsSplitting_BDDC);CHKERRQ(ierr);
123400de8ff0SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCSetLocalAdjacencyGraph_C","PCBDDCSetLocalAdjacencyGraph_BDDC",PCBDDCSetLocalAdjacencyGraph_BDDC);CHKERRQ(ierr);
123500de8ff0SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)pc,"PCPreSolve_C","PCPreSolve_BDDC",PCPreSolve_BDDC);CHKERRQ(ierr);
123600de8ff0SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)pc,"PCPostSolve_C","PCPostSolve_BDDC",PCPostSolve_BDDC);CHKERRQ(ierr);
123700de8ff0SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCCreateFETIDPOperators_C","PCBDDCCreateFETIDPOperators_BDDC",PCBDDCCreateFETIDPOperators_BDDC);CHKERRQ(ierr);
123800de8ff0SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCMatFETIDPGetRHS_C","PCBDDCMatFETIDPGetRHS_BDDC",PCBDDCMatFETIDPGetRHS_BDDC);CHKERRQ(ierr);
123900de8ff0SBarry Smith   ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCMatFETIDPGetSolution_C","PCBDDCMatFETIDPGetSolution_BDDC",PCBDDCMatFETIDPGetSolution_BDDC);CHKERRQ(ierr);
1240da1bb401SStefano Zampini   PetscFunctionReturn(0);
1241da1bb401SStefano Zampini }
1242da1bb401SStefano Zampini EXTERN_C_END
12433425bc38SStefano Zampini 
1244da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
1245da1bb401SStefano Zampini /* All static functions from now on                                           */
1246da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
12474fad6a16SStefano Zampini #undef __FUNCT__
124829622bf0SStefano Zampini #define __FUNCT__ "PCBDDCApplyNullSpaceCorrectionPC"
124929622bf0SStefano Zampini static PetscErrorCode PCBDDCApplyNullSpaceCorrectionPC(PC pc,Vec x,Vec y)
125029622bf0SStefano Zampini {
125129622bf0SStefano Zampini   NullSpaceCorrection_ctx *pc_ctx;
125229622bf0SStefano Zampini   PetscErrorCode          ierr;
125329622bf0SStefano Zampini 
125429622bf0SStefano Zampini   PetscFunctionBegin;
125529622bf0SStefano Zampini   ierr = PCShellGetContext(pc,(void**)&pc_ctx);CHKERRQ(ierr);
125629622bf0SStefano Zampini   /* E */
125729622bf0SStefano Zampini   ierr = MatMultTranspose(pc_ctx->Lbasis_mat,x,pc_ctx->work_small_2);CHKERRQ(ierr);
125829622bf0SStefano Zampini   ierr = MatMultAdd(pc_ctx->Kbasis_mat,pc_ctx->work_small_2,x,pc_ctx->work_full_1);CHKERRQ(ierr);
125929622bf0SStefano Zampini   /* P^-1 */
126029622bf0SStefano Zampini   ierr = PCApply(pc_ctx->local_pc,pc_ctx->work_full_1,pc_ctx->work_full_2);CHKERRQ(ierr);
126129622bf0SStefano Zampini   /* E^T */
126229622bf0SStefano Zampini   ierr = MatMultTranspose(pc_ctx->Kbasis_mat,pc_ctx->work_full_2,pc_ctx->work_small_1);CHKERRQ(ierr);
126329622bf0SStefano Zampini   ierr = VecScale(pc_ctx->work_small_1,-1.0);CHKERRQ(ierr);
126429622bf0SStefano Zampini   ierr = MatMultAdd(pc_ctx->Lbasis_mat,pc_ctx->work_small_1,pc_ctx->work_full_2,pc_ctx->work_full_1);CHKERRQ(ierr);
126529622bf0SStefano Zampini   /* Sum contributions */
126629622bf0SStefano Zampini   ierr = MatMultAdd(pc_ctx->basis_mat,pc_ctx->work_small_2,pc_ctx->work_full_1,y);CHKERRQ(ierr);
126729622bf0SStefano Zampini   PetscFunctionReturn(0);
126829622bf0SStefano Zampini }
126929622bf0SStefano Zampini 
127029622bf0SStefano Zampini #undef __FUNCT__
127129622bf0SStefano Zampini #define __FUNCT__ "PCBDDCDestroyNullSpaceCorrectionPC"
127229622bf0SStefano Zampini static PetscErrorCode PCBDDCDestroyNullSpaceCorrectionPC(PC pc)
127329622bf0SStefano Zampini {
127429622bf0SStefano Zampini   NullSpaceCorrection_ctx *pc_ctx;
127529622bf0SStefano Zampini   PetscErrorCode          ierr;
127629622bf0SStefano Zampini 
127729622bf0SStefano Zampini   PetscFunctionBegin;
127829622bf0SStefano Zampini   ierr = PCShellGetContext(pc,(void**)&pc_ctx);CHKERRQ(ierr);
127929622bf0SStefano Zampini   ierr = VecDestroy(&pc_ctx->work_small_1);CHKERRQ(ierr);
128029622bf0SStefano Zampini   ierr = VecDestroy(&pc_ctx->work_small_2);CHKERRQ(ierr);
128129622bf0SStefano Zampini   ierr = VecDestroy(&pc_ctx->work_full_1);CHKERRQ(ierr);
128229622bf0SStefano Zampini   ierr = VecDestroy(&pc_ctx->work_full_2);CHKERRQ(ierr);
128329622bf0SStefano Zampini   ierr = MatDestroy(&pc_ctx->basis_mat);CHKERRQ(ierr);
128429622bf0SStefano Zampini   ierr = MatDestroy(&pc_ctx->Lbasis_mat);CHKERRQ(ierr);
128529622bf0SStefano Zampini   ierr = MatDestroy(&pc_ctx->Kbasis_mat);CHKERRQ(ierr);
128629622bf0SStefano Zampini   ierr = PCDestroy(&pc_ctx->local_pc);CHKERRQ(ierr);
128729622bf0SStefano Zampini   ierr = PetscFree(pc_ctx);CHKERRQ(ierr);
128829622bf0SStefano Zampini   PetscFunctionReturn(0);
128929622bf0SStefano Zampini }
129029622bf0SStefano Zampini 
129129622bf0SStefano Zampini #undef __FUNCT__
129229622bf0SStefano Zampini #define __FUNCT__ "PCBDDCAdaptLocalProblem"
129329622bf0SStefano Zampini static PetscErrorCode PCBDDCAdaptLocalProblem(PC pc,IS local_dofs)
129429622bf0SStefano Zampini {
1295f23aa3ddSBarry Smith   extern PetscErrorCode PCBDDCApplyNullSpaceCorrectionPC(PC,Vec,Vec);
1296f23aa3ddSBarry Smith   extern PetscErrorCode PCBDDCDestroyNullSpaceCorrectionPC(PC);
129729622bf0SStefano Zampini 
129829622bf0SStefano Zampini   PC_BDDC                 *pcbddc = (PC_BDDC*)pc->data;
129929622bf0SStefano Zampini   PC_IS                   *pcis   = (PC_IS*)pc->data;
130029622bf0SStefano Zampini   Mat_IS                  * matis = (Mat_IS*)pc->pmat->data;
130129622bf0SStefano Zampini   KSP                     *local_ksp;
130229622bf0SStefano Zampini   PC                      newpc;
130329622bf0SStefano Zampini   NullSpaceCorrection_ctx *shell_ctx;
130429622bf0SStefano Zampini   Mat                     local_mat,local_pmat,small_mat,inv_small_mat;
130529622bf0SStefano Zampini   MatStructure            local_mat_struct;
130629622bf0SStefano Zampini   Vec                     work1,work2,work3;
130729622bf0SStefano Zampini   const Vec               *nullvecs;
130829622bf0SStefano Zampini   VecScatter              scatter_ctx;
130929622bf0SStefano Zampini   IS                      is_aux;
131029622bf0SStefano Zampini   MatFactorInfo           matinfo;
131129622bf0SStefano Zampini   PetscScalar             *basis_mat,*Kbasis_mat,*array,*array_mat;
131229622bf0SStefano Zampini   PetscScalar             one = 1.0,zero = 0.0, m_one = -1.0;
131329622bf0SStefano Zampini   PetscInt                basis_dofs,basis_size,nnsp_size,i,k,n_I,n_R;
131429622bf0SStefano Zampini   PetscBool               nnsp_has_cnst;
131529622bf0SStefano Zampini   PetscErrorCode          ierr;
131629622bf0SStefano Zampini 
131729622bf0SStefano Zampini   PetscFunctionBegin;
131829622bf0SStefano Zampini   /* Infer the local solver */
131929622bf0SStefano Zampini   ierr = ISGetSize(local_dofs,&basis_dofs);CHKERRQ(ierr);
132029622bf0SStefano Zampini   ierr = VecGetSize(pcis->vec1_D,&n_I);CHKERRQ(ierr);
132129622bf0SStefano Zampini   ierr = VecGetSize(pcbddc->vec1_R,&n_R);CHKERRQ(ierr);
132229622bf0SStefano Zampini   if (basis_dofs == n_I) {
132329622bf0SStefano Zampini     /* Dirichlet solver */
132429622bf0SStefano Zampini     local_ksp = &pcbddc->ksp_D;
132529622bf0SStefano Zampini   } else if (basis_dofs == n_R) {
132629622bf0SStefano Zampini     /* Neumann solver */
132729622bf0SStefano Zampini     local_ksp = &pcbddc->ksp_R;
1328f23aa3ddSBarry Smith   } else SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in %s: unknown local IS size %d. n_I=%d, n_R=%d)\n",basis_dofs,n_I,n_R);
132929622bf0SStefano Zampini   ierr = KSPGetOperators(*local_ksp,&local_mat,&local_pmat,&local_mat_struct);CHKERRQ(ierr);
133029622bf0SStefano Zampini 
133129622bf0SStefano Zampini   /* Get null space vecs */
133229622bf0SStefano Zampini   ierr = MatNullSpaceGetVecs(pcbddc->NullSpace,&nnsp_has_cnst,&nnsp_size,&nullvecs);CHKERRQ(ierr);
133329622bf0SStefano Zampini   basis_size = nnsp_size;
13342fa5cd67SKarl Rupp   if (nnsp_has_cnst) basis_size++;
133529622bf0SStefano Zampini 
133629622bf0SStefano Zampini   /* Create shell ctx */
133729622bf0SStefano Zampini   ierr = PetscMalloc(sizeof(*shell_ctx),&shell_ctx);CHKERRQ(ierr);
133829622bf0SStefano Zampini 
133929622bf0SStefano Zampini   /* Create work vectors in shell context */
134029622bf0SStefano Zampini   ierr = VecCreate(PETSC_COMM_SELF,&shell_ctx->work_small_1);CHKERRQ(ierr);
134129622bf0SStefano Zampini   ierr = VecSetSizes(shell_ctx->work_small_1,basis_size,basis_size);CHKERRQ(ierr);
134229622bf0SStefano Zampini   ierr = VecSetType(shell_ctx->work_small_1,VECSEQ);CHKERRQ(ierr);
134329622bf0SStefano Zampini   ierr = VecDuplicate(shell_ctx->work_small_1,&shell_ctx->work_small_2);CHKERRQ(ierr);
134429622bf0SStefano Zampini   ierr = VecCreate(PETSC_COMM_SELF,&shell_ctx->work_full_1);CHKERRQ(ierr);
134529622bf0SStefano Zampini   ierr = VecSetSizes(shell_ctx->work_full_1,basis_dofs,basis_dofs);CHKERRQ(ierr);
134629622bf0SStefano Zampini   ierr = VecSetType(shell_ctx->work_full_1,VECSEQ);CHKERRQ(ierr);
134729622bf0SStefano Zampini   ierr = VecDuplicate(shell_ctx->work_full_1,&shell_ctx->work_full_2);CHKERRQ(ierr);
134829622bf0SStefano Zampini 
134929622bf0SStefano Zampini   /* Allocate workspace */
13500298fd71SBarry Smith   ierr = MatCreateSeqDense(PETSC_COMM_SELF,basis_dofs,basis_size,NULL,&shell_ctx->basis_mat);CHKERRQ(ierr);
13510298fd71SBarry Smith   ierr = MatCreateSeqDense(PETSC_COMM_SELF,basis_dofs,basis_size,NULL,&shell_ctx->Kbasis_mat);CHKERRQ(ierr);
135229622bf0SStefano Zampini   ierr = MatDenseGetArray(shell_ctx->basis_mat,&basis_mat);CHKERRQ(ierr);
135329622bf0SStefano Zampini   ierr = MatDenseGetArray(shell_ctx->Kbasis_mat,&Kbasis_mat);CHKERRQ(ierr);
135429622bf0SStefano Zampini 
135529622bf0SStefano Zampini   /* Restrict local null space on selected dofs (Dirichlet or Neumann)
135629622bf0SStefano Zampini      and compute matrices N and K*N */
135729622bf0SStefano Zampini   ierr = VecDuplicate(shell_ctx->work_full_1,&work1);CHKERRQ(ierr);
135829622bf0SStefano Zampini   ierr = VecDuplicate(shell_ctx->work_full_1,&work2);CHKERRQ(ierr);
135929622bf0SStefano Zampini   ierr = VecScatterCreate(pcis->vec1_N,local_dofs,work1,(IS)0,&scatter_ctx);CHKERRQ(ierr);
136029622bf0SStefano Zampini   k    = 0;
136129622bf0SStefano Zampini   for (; k<nnsp_size; k++) {
136229622bf0SStefano Zampini     ierr = VecScatterBegin(matis->ctx,nullvecs[k],pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
136329622bf0SStefano Zampini     ierr = VecScatterEnd(matis->ctx,nullvecs[k],pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
136429622bf0SStefano Zampini     ierr = VecPlaceArray(work1,(const PetscScalar*)&basis_mat[k*basis_dofs]);CHKERRQ(ierr);
136529622bf0SStefano Zampini     ierr = VecScatterBegin(scatter_ctx,pcis->vec1_N,work1,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
136629622bf0SStefano Zampini     ierr = VecScatterEnd(scatter_ctx,pcis->vec1_N,work1,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
136729622bf0SStefano Zampini     ierr = VecPlaceArray(work2,(const PetscScalar*)&Kbasis_mat[k*basis_dofs]);CHKERRQ(ierr);
136829622bf0SStefano Zampini     ierr = MatMult(local_mat,work1,work2);CHKERRQ(ierr);
136929622bf0SStefano Zampini     ierr = VecResetArray(work1);CHKERRQ(ierr);
137029622bf0SStefano Zampini     ierr = VecResetArray(work2);CHKERRQ(ierr);
137129622bf0SStefano Zampini   }
137229622bf0SStefano Zampini   if (nnsp_has_cnst) {
137329622bf0SStefano Zampini     ierr = VecPlaceArray(work1,(const PetscScalar*)&basis_mat[k*basis_dofs]);CHKERRQ(ierr);
137429622bf0SStefano Zampini     ierr = VecSet(work1,one);CHKERRQ(ierr);
137529622bf0SStefano Zampini     ierr = VecPlaceArray(work2,(const PetscScalar*)&Kbasis_mat[k*basis_dofs]);CHKERRQ(ierr);
137629622bf0SStefano Zampini     ierr = MatMult(local_mat,work1,work2);CHKERRQ(ierr);
137729622bf0SStefano Zampini     ierr = VecResetArray(work1);CHKERRQ(ierr);
137829622bf0SStefano Zampini     ierr = VecResetArray(work2);CHKERRQ(ierr);
137929622bf0SStefano Zampini   }
138029622bf0SStefano Zampini   ierr = VecDestroy(&work1);CHKERRQ(ierr);
138129622bf0SStefano Zampini   ierr = VecDestroy(&work2);CHKERRQ(ierr);
138229622bf0SStefano Zampini   ierr = VecScatterDestroy(&scatter_ctx);CHKERRQ(ierr);
138329622bf0SStefano Zampini   ierr = MatDenseRestoreArray(shell_ctx->basis_mat,&basis_mat);CHKERRQ(ierr);
138429622bf0SStefano Zampini   ierr = MatDenseRestoreArray(shell_ctx->Kbasis_mat,&Kbasis_mat);CHKERRQ(ierr);
138529622bf0SStefano Zampini 
138629622bf0SStefano Zampini   /* Assemble another Mat object in shell context */
138729622bf0SStefano Zampini   ierr = MatTransposeMatMult(shell_ctx->basis_mat,shell_ctx->Kbasis_mat,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&small_mat);CHKERRQ(ierr);
138829622bf0SStefano Zampini   ierr = MatFactorInfoInitialize(&matinfo);CHKERRQ(ierr);
138929622bf0SStefano Zampini   ierr = ISCreateStride(PETSC_COMM_SELF,basis_size,0,1,&is_aux);CHKERRQ(ierr);
139029622bf0SStefano Zampini   ierr = MatLUFactor(small_mat,is_aux,is_aux,&matinfo);CHKERRQ(ierr);
139129622bf0SStefano Zampini   ierr = ISDestroy(&is_aux);CHKERRQ(ierr);
139229622bf0SStefano Zampini   ierr = PetscMalloc(basis_size*basis_size*sizeof(PetscScalar),&array_mat);CHKERRQ(ierr);
139329622bf0SStefano Zampini   for (k=0; k<basis_size; k++) {
139429622bf0SStefano Zampini     ierr = VecSet(shell_ctx->work_small_1,zero);CHKERRQ(ierr);
139529622bf0SStefano Zampini     ierr = VecSetValue(shell_ctx->work_small_1,k,one,INSERT_VALUES);CHKERRQ(ierr);
139629622bf0SStefano Zampini     ierr = VecAssemblyBegin(shell_ctx->work_small_1);CHKERRQ(ierr);
139729622bf0SStefano Zampini     ierr = VecAssemblyEnd(shell_ctx->work_small_1);CHKERRQ(ierr);
139829622bf0SStefano Zampini     ierr = MatSolve(small_mat,shell_ctx->work_small_1,shell_ctx->work_small_2);CHKERRQ(ierr);
139929622bf0SStefano Zampini     ierr = VecGetArray(shell_ctx->work_small_2,&array);CHKERRQ(ierr);
14002fa5cd67SKarl Rupp     for (i=0; i<basis_size; i++) array_mat[i*basis_size+k]=array[i];
140129622bf0SStefano Zampini     ierr = VecRestoreArray(shell_ctx->work_small_2,&array);CHKERRQ(ierr);
140229622bf0SStefano Zampini   }
140329622bf0SStefano Zampini   ierr = MatCreateSeqDense(PETSC_COMM_SELF,basis_size,basis_size,array_mat,&inv_small_mat);CHKERRQ(ierr);
140429622bf0SStefano Zampini   ierr = MatMatMult(shell_ctx->basis_mat,inv_small_mat,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&shell_ctx->Lbasis_mat);CHKERRQ(ierr);
140529622bf0SStefano Zampini   ierr = PetscFree(array_mat);CHKERRQ(ierr);
140629622bf0SStefano Zampini   ierr = MatDestroy(&inv_small_mat);CHKERRQ(ierr);
140729622bf0SStefano Zampini   ierr = MatDestroy(&small_mat);CHKERRQ(ierr);
140829622bf0SStefano Zampini   ierr = MatScale(shell_ctx->Kbasis_mat,m_one);CHKERRQ(ierr);
140929622bf0SStefano Zampini 
141029622bf0SStefano Zampini   /* Rebuild local PC */
141129622bf0SStefano Zampini   ierr = KSPGetPC(*local_ksp,&shell_ctx->local_pc);CHKERRQ(ierr);
141229622bf0SStefano Zampini   ierr = PetscObjectReference((PetscObject)shell_ctx->local_pc);CHKERRQ(ierr);
141329622bf0SStefano Zampini   ierr = PCCreate(PETSC_COMM_SELF,&newpc);CHKERRQ(ierr);
141429622bf0SStefano Zampini   ierr = PCSetOperators(newpc,local_mat,local_mat,SAME_PRECONDITIONER);CHKERRQ(ierr);
141529622bf0SStefano Zampini   ierr = PCSetType(newpc,PCSHELL);CHKERRQ(ierr);
141629622bf0SStefano Zampini   ierr = PCShellSetContext(newpc,shell_ctx);CHKERRQ(ierr);
141729622bf0SStefano Zampini   ierr = PCShellSetApply(newpc,PCBDDCApplyNullSpaceCorrectionPC);CHKERRQ(ierr);
141829622bf0SStefano Zampini   ierr = PCShellSetDestroy(newpc,PCBDDCDestroyNullSpaceCorrectionPC);CHKERRQ(ierr);
141929622bf0SStefano Zampini   ierr = PCSetUp(newpc);CHKERRQ(ierr);
142029622bf0SStefano Zampini   ierr = KSPSetPC(*local_ksp,newpc);CHKERRQ(ierr);
142129622bf0SStefano Zampini   ierr = PCDestroy(&newpc);CHKERRQ(ierr);
142229622bf0SStefano Zampini   ierr = KSPSetUp(*local_ksp);CHKERRQ(ierr);
142329622bf0SStefano Zampini 
142429622bf0SStefano Zampini   /* test */
142529622bf0SStefano Zampini   if (pcbddc->dbg_flag) {
142629622bf0SStefano Zampini     PetscReal   test_err;
142729622bf0SStefano Zampini     KSP         check_ksp;
142829622bf0SStefano Zampini     PC          check_pc;
142929622bf0SStefano Zampini     PetscReal   lambda_min,lambda_max;
143029622bf0SStefano Zampini     Mat         test_mat;
143129622bf0SStefano Zampini     PetscViewer viewer=pcbddc->dbg_viewer;
143229622bf0SStefano Zampini     PetscBool   setsym,issym=PETSC_FALSE;
143329622bf0SStefano Zampini 
143429622bf0SStefano Zampini     ierr = KSPGetPC(*local_ksp,&check_pc);CHKERRQ(ierr);
143529622bf0SStefano Zampini     ierr = VecDuplicate(shell_ctx->work_full_1,&work1);CHKERRQ(ierr);
143629622bf0SStefano Zampini     ierr = VecDuplicate(shell_ctx->work_full_1,&work2);CHKERRQ(ierr);
143729622bf0SStefano Zampini     ierr = VecDuplicate(shell_ctx->work_full_1,&work3);CHKERRQ(ierr);
14380298fd71SBarry Smith     ierr = VecSetRandom(shell_ctx->work_small_1,NULL);CHKERRQ(ierr);
143929622bf0SStefano Zampini     ierr = MatMult(shell_ctx->basis_mat,shell_ctx->work_small_1,work1);CHKERRQ(ierr);
144029622bf0SStefano Zampini     ierr = VecCopy(work1,work2);CHKERRQ(ierr);
144129622bf0SStefano Zampini     ierr = MatMult(local_mat,work1,work3);CHKERRQ(ierr);
144229622bf0SStefano Zampini     ierr = PCApply(check_pc,work3,work1);CHKERRQ(ierr);
144329622bf0SStefano Zampini     ierr = VecAXPY(work1,m_one,work2);CHKERRQ(ierr);
144429622bf0SStefano Zampini     ierr = VecNorm(work1,NORM_INFINITY,&test_err);CHKERRQ(ierr);
144529622bf0SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d error for nullspace correction for ",PetscGlobalRank);
144629622bf0SStefano Zampini     if (basis_dofs == n_I) {
14472fa5cd67SKarl Rupp       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Dirichlet ");CHKERRQ(ierr);
144829622bf0SStefano Zampini     } else {
14492fa5cd67SKarl Rupp       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Neumann ");CHKERRQ(ierr);
145029622bf0SStefano Zampini     }
145129622bf0SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"solver is :%1.14e\n",test_err);
145229622bf0SStefano Zampini 
145329622bf0SStefano Zampini     ierr = MatTransposeMatMult(shell_ctx->Lbasis_mat,shell_ctx->Kbasis_mat,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&test_mat);CHKERRQ(ierr);
145429622bf0SStefano Zampini     ierr = MatShift(test_mat,one);CHKERRQ(ierr);
145529622bf0SStefano Zampini     ierr = MatNorm(test_mat,NORM_INFINITY,&test_err);CHKERRQ(ierr);
145629622bf0SStefano Zampini     ierr = MatDestroy(&test_mat);CHKERRQ(ierr);
145729622bf0SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d error for nullspace matrices is :%1.14e\n",PetscGlobalRank,test_err);
145829622bf0SStefano Zampini 
145929622bf0SStefano Zampini     /* Create ksp object suitable for extreme eigenvalues' estimation */
146029622bf0SStefano Zampini     ierr = KSPCreate(PETSC_COMM_SELF,&check_ksp);CHKERRQ(ierr);
146129622bf0SStefano Zampini     ierr = KSPSetOperators(check_ksp,local_mat,local_mat,SAME_PRECONDITIONER);CHKERRQ(ierr);
146229622bf0SStefano Zampini     ierr = KSPSetTolerances(check_ksp,1.e-8,1.e-8,PETSC_DEFAULT,basis_dofs);CHKERRQ(ierr);
146329622bf0SStefano Zampini     ierr = KSPSetComputeSingularValues(check_ksp,PETSC_TRUE);CHKERRQ(ierr);
146429622bf0SStefano Zampini     ierr = MatIsSymmetricKnown(pc->pmat,&setsym,&issym);CHKERRQ(ierr);
146529622bf0SStefano Zampini     if (issym) {
146629622bf0SStefano Zampini       ierr = KSPSetType(check_ksp,KSPCG);CHKERRQ(ierr);
146729622bf0SStefano Zampini     }
146829622bf0SStefano Zampini     ierr = KSPSetPC(check_ksp,check_pc);CHKERRQ(ierr);
146929622bf0SStefano Zampini     ierr = KSPSetUp(check_ksp);CHKERRQ(ierr);
14700298fd71SBarry Smith     ierr = VecSetRandom(work1,NULL);CHKERRQ(ierr);
147129622bf0SStefano Zampini     ierr = MatMult(local_mat,work1,work2);CHKERRQ(ierr);
147229622bf0SStefano Zampini     ierr = KSPSolve(check_ksp,work2,work2);CHKERRQ(ierr);
147329622bf0SStefano Zampini     ierr = VecAXPY(work2,m_one,work1);CHKERRQ(ierr);
147429622bf0SStefano Zampini     ierr = VecNorm(work2,NORM_INFINITY,&test_err);CHKERRQ(ierr);
147529622bf0SStefano Zampini     ierr = KSPComputeExtremeSingularValues(check_ksp,&lambda_max,&lambda_min);CHKERRQ(ierr);
147629622bf0SStefano Zampini     ierr = KSPGetIterationNumber(check_ksp,&k);CHKERRQ(ierr);
147729622bf0SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d error for adapted KSP %1.14e (it %d, eigs %1.6e %1.6e)\n",PetscGlobalRank,test_err,k,lambda_min,lambda_max);
147829622bf0SStefano Zampini     ierr = KSPDestroy(&check_ksp);CHKERRQ(ierr);
147929622bf0SStefano Zampini     ierr = VecDestroy(&work1);CHKERRQ(ierr);
148029622bf0SStefano Zampini     ierr = VecDestroy(&work2);CHKERRQ(ierr);
148129622bf0SStefano Zampini     ierr = VecDestroy(&work3);CHKERRQ(ierr);
148229622bf0SStefano Zampini   }
148329622bf0SStefano Zampini   PetscFunctionReturn(0);
148429622bf0SStefano Zampini }
148529622bf0SStefano Zampini 
148629622bf0SStefano Zampini #undef __FUNCT__
14872e8d2280SStefano Zampini #define __FUNCT__ "PCBDDCSetUseExactDirichlet"
14882e8d2280SStefano Zampini static PetscErrorCode PCBDDCSetUseExactDirichlet(PC pc,PetscBool use)
14892e8d2280SStefano Zampini {
14902e8d2280SStefano Zampini   PC_BDDC *pcbddc = (PC_BDDC*)pc->data;
14912e8d2280SStefano Zampini 
14922e8d2280SStefano Zampini   PetscFunctionBegin;
14932e8d2280SStefano Zampini   pcbddc->use_exact_dirichlet=use;
14942e8d2280SStefano Zampini   PetscFunctionReturn(0);
14952e8d2280SStefano Zampini }
14962e8d2280SStefano Zampini 
14972e8d2280SStefano Zampini #undef __FUNCT__
14984fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetLevel"
14994fad6a16SStefano Zampini static PetscErrorCode PCBDDCSetLevel(PC pc,PetscInt level)
15004fad6a16SStefano Zampini {
15014fad6a16SStefano Zampini   PC_BDDC *pcbddc = (PC_BDDC*)pc->data;
15024fad6a16SStefano Zampini 
15034fad6a16SStefano Zampini   PetscFunctionBegin;
15044fad6a16SStefano Zampini   pcbddc->current_level=level;
15054fad6a16SStefano Zampini   PetscFunctionReturn(0);
15064fad6a16SStefano Zampini }
15073425bc38SStefano Zampini 
15083425bc38SStefano Zampini #undef __FUNCT__
15090bdf917eSStefano Zampini #define __FUNCT__ "PCBDDCAdaptNullSpace"
15100bdf917eSStefano Zampini static PetscErrorCode PCBDDCAdaptNullSpace(PC pc)
15110bdf917eSStefano Zampini {
15120bdf917eSStefano Zampini   PC_IS          *pcis   = (PC_IS*)  (pc->data);
15130bdf917eSStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)(pc->data);
15140bdf917eSStefano Zampini   KSP            inv_change;
15150bdf917eSStefano Zampini   PC             pc_change;
15160bdf917eSStefano Zampini   const Vec      *nsp_vecs;
15170bdf917eSStefano Zampini   Vec            *new_nsp_vecs;
15180bdf917eSStefano Zampini   PetscInt       i,nsp_size,new_nsp_size,start_new;
15190bdf917eSStefano Zampini   PetscBool      nsp_has_cnst;
15200bdf917eSStefano Zampini   MatNullSpace   new_nsp;
15210bdf917eSStefano Zampini   PetscErrorCode ierr;
15220bdf917eSStefano Zampini 
15230bdf917eSStefano Zampini   PetscFunctionBegin;
15240bdf917eSStefano Zampini   ierr = MatNullSpaceGetVecs(pcbddc->NullSpace,&nsp_has_cnst,&nsp_size,&nsp_vecs);CHKERRQ(ierr);
15250bdf917eSStefano Zampini   ierr = KSPCreate(PETSC_COMM_SELF,&inv_change);CHKERRQ(ierr);
15260bdf917eSStefano Zampini   ierr = KSPSetOperators(inv_change,pcbddc->ChangeOfBasisMatrix,pcbddc->ChangeOfBasisMatrix,SAME_PRECONDITIONER);CHKERRQ(ierr);
15270bdf917eSStefano Zampini   ierr = KSPSetType(inv_change,KSPPREONLY);CHKERRQ(ierr);
15280bdf917eSStefano Zampini   ierr = KSPGetPC(inv_change,&pc_change);CHKERRQ(ierr);
15290bdf917eSStefano Zampini   ierr = PCSetType(pc_change,PCLU);CHKERRQ(ierr);
15300bdf917eSStefano Zampini   ierr = KSPSetUp(inv_change);CHKERRQ(ierr);
15312fa5cd67SKarl Rupp 
15320bdf917eSStefano Zampini   new_nsp_size = nsp_size;
15332fa5cd67SKarl Rupp   if (nsp_has_cnst) new_nsp_size++;
15340bdf917eSStefano Zampini   ierr = PetscMalloc(new_nsp_size*sizeof(Vec),&new_nsp_vecs);CHKERRQ(ierr);
15350bdf917eSStefano Zampini   for (i=0;i<new_nsp_size;i++) { ierr = VecDuplicate(pcis->vec1_global,&new_nsp_vecs[i]);CHKERRQ(ierr); }
15360bdf917eSStefano Zampini   start_new = 0;
15370bdf917eSStefano Zampini   if (nsp_has_cnst) {
15380bdf917eSStefano Zampini     start_new = 1;
15390bdf917eSStefano Zampini     ierr      = VecSet(new_nsp_vecs[0],1.0);CHKERRQ(ierr);
15400bdf917eSStefano Zampini     ierr      = VecSet(pcis->vec1_B,1.0);CHKERRQ(ierr);
15410bdf917eSStefano Zampini     ierr      = KSPSolve(inv_change,pcis->vec1_B,pcis->vec1_B);
15420bdf917eSStefano Zampini     ierr      = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,new_nsp_vecs[0],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
15430bdf917eSStefano Zampini     ierr      = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,new_nsp_vecs[0],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
15440bdf917eSStefano Zampini   }
15450bdf917eSStefano Zampini   for (i=0; i<nsp_size; i++) {
15460bdf917eSStefano Zampini     ierr = VecCopy(nsp_vecs[i],new_nsp_vecs[i+start_new]);CHKERRQ(ierr);
15470bdf917eSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,nsp_vecs[i],pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
15480bdf917eSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,nsp_vecs[i],pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
15490bdf917eSStefano Zampini     ierr = KSPSolve(inv_change,pcis->vec1_B,pcis->vec1_B);
15500bdf917eSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,new_nsp_vecs[i+start_new],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
15510bdf917eSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,new_nsp_vecs[i+start_new],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
15520bdf917eSStefano Zampini   }
15530298fd71SBarry Smith   ierr = VecNormalize(new_nsp_vecs[0],NULL);CHKERRQ(ierr);
15540bdf917eSStefano Zampini   /* TODO : Orthonormalize vecs when new_nsp_size > 0! */
15550bdf917eSStefano Zampini 
15560bdf917eSStefano Zampini   ierr = KSPDestroy(&inv_change);CHKERRQ(ierr);
1557ce94432eSBarry Smith   ierr = MatNullSpaceCreate(PetscObjectComm((PetscObject)pc),PETSC_FALSE,new_nsp_size,new_nsp_vecs,&new_nsp);CHKERRQ(ierr);
15580bdf917eSStefano Zampini   ierr = PCBDDCSetNullSpace(pc,new_nsp);CHKERRQ(ierr);
15590bdf917eSStefano Zampini   ierr = MatNullSpaceDestroy(&new_nsp);CHKERRQ(ierr);
15600bdf917eSStefano Zampini   /*
15610bdf917eSStefano Zampini   ierr = MatNullSpaceTest(pcbddc->NullSpace,pc->pmat,&nsp_t);CHKERRQ(ierr);
15620bdf917eSStefano Zampini   printf("New Null Space, mat changed: %d\n",nsp_t);
15630bdf917eSStefano Zampini     temp_mat = matis->A;
15640bdf917eSStefano Zampini     matis->A = pcbddc->local_mat;
15650bdf917eSStefano Zampini     pcbddc->local_mat = temp_mat;
15660bdf917eSStefano Zampini   ierr = MatNullSpaceTest(pcbddc->NullSpace,pc->pmat,&nsp_t);CHKERRQ(ierr);
15670bdf917eSStefano Zampini   printf("New Null Space, mat original: %d\n",nsp_t);*/
15680bdf917eSStefano Zampini 
15690bdf917eSStefano Zampini   for (i=0; i<new_nsp_size; i++) { ierr = VecDestroy(&new_nsp_vecs[i]);CHKERRQ(ierr); }
15700bdf917eSStefano Zampini   ierr = PetscFree(new_nsp_vecs);CHKERRQ(ierr);
15710bdf917eSStefano Zampini   PetscFunctionReturn(0);
15720bdf917eSStefano Zampini }
15730bdf917eSStefano Zampini 
15740bdf917eSStefano Zampini #undef __FUNCT__
15753425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPMatContext"
15763425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPMatContext(PC pc, FETIDPMat_ctx **fetidpmat_ctx)
15773425bc38SStefano Zampini {
15783425bc38SStefano Zampini   FETIDPMat_ctx  *newctx;
15793425bc38SStefano Zampini   PetscErrorCode ierr;
15803425bc38SStefano Zampini 
15813425bc38SStefano Zampini   PetscFunctionBegin;
15823425bc38SStefano Zampini   ierr = PetscMalloc(sizeof(*newctx),&newctx);CHKERRQ(ierr);
15832fa5cd67SKarl Rupp 
15843425bc38SStefano Zampini   newctx->lambda_local    = 0;
15853425bc38SStefano Zampini   newctx->temp_solution_B = 0;
15863425bc38SStefano Zampini   newctx->temp_solution_D = 0;
15873425bc38SStefano Zampini   newctx->B_delta         = 0;
15883425bc38SStefano Zampini   newctx->B_Ddelta        = 0; /* theoretically belongs to the FETIDP preconditioner */
15893425bc38SStefano Zampini   newctx->l2g_lambda      = 0;
15902fa5cd67SKarl Rupp 
15913425bc38SStefano Zampini   /* increase the reference count for BDDC preconditioner */
15923425bc38SStefano Zampini   ierr           = PetscObjectReference((PetscObject)pc);CHKERRQ(ierr);
15933425bc38SStefano Zampini   newctx->pc     = pc;
15943425bc38SStefano Zampini   *fetidpmat_ctx = newctx;
15953425bc38SStefano Zampini   PetscFunctionReturn(0);
15963425bc38SStefano Zampini }
15973425bc38SStefano Zampini 
15983425bc38SStefano Zampini #undef __FUNCT__
15993425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPPCContext"
16003425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPPCContext(PC pc, FETIDPPC_ctx **fetidppc_ctx)
16013425bc38SStefano Zampini {
16023425bc38SStefano Zampini   FETIDPPC_ctx   *newctx;
16033425bc38SStefano Zampini   PetscErrorCode ierr;
16043425bc38SStefano Zampini 
16053425bc38SStefano Zampini   PetscFunctionBegin;
16063425bc38SStefano Zampini   ierr = PetscMalloc(sizeof(*newctx),&newctx);CHKERRQ(ierr);
16072fa5cd67SKarl Rupp 
16083425bc38SStefano Zampini   newctx->lambda_local = 0;
16093425bc38SStefano Zampini   newctx->B_Ddelta     = 0;
16103425bc38SStefano Zampini   newctx->l2g_lambda   = 0;
16112fa5cd67SKarl Rupp 
16123425bc38SStefano Zampini   /* increase the reference count for BDDC preconditioner */
16133425bc38SStefano Zampini   ierr          = PetscObjectReference((PetscObject)pc);CHKERRQ(ierr);
16143425bc38SStefano Zampini   newctx->pc    = pc;
16153425bc38SStefano Zampini   *fetidppc_ctx = newctx;
16163425bc38SStefano Zampini   PetscFunctionReturn(0);
16173425bc38SStefano Zampini }
16183425bc38SStefano Zampini 
16193425bc38SStefano Zampini #undef __FUNCT__
16203425bc38SStefano Zampini #define __FUNCT__ "PCBDDCDestroyFETIDPMat"
16213425bc38SStefano Zampini static PetscErrorCode PCBDDCDestroyFETIDPMat(Mat A)
16223425bc38SStefano Zampini {
16233425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
16243425bc38SStefano Zampini   PetscErrorCode ierr;
16253425bc38SStefano Zampini 
16263425bc38SStefano Zampini   PetscFunctionBegin;
16273425bc38SStefano Zampini   ierr = MatShellGetContext(A,(void**)&mat_ctx);CHKERRQ(ierr);
16283425bc38SStefano Zampini   ierr = VecDestroy(&mat_ctx->lambda_local);CHKERRQ(ierr);
16293425bc38SStefano Zampini   ierr = VecDestroy(&mat_ctx->temp_solution_D);CHKERRQ(ierr);
16303425bc38SStefano Zampini   ierr = VecDestroy(&mat_ctx->temp_solution_B);CHKERRQ(ierr);
16313425bc38SStefano Zampini   ierr = MatDestroy(&mat_ctx->B_delta);CHKERRQ(ierr);
16323425bc38SStefano Zampini   ierr = MatDestroy(&mat_ctx->B_Ddelta);CHKERRQ(ierr);
16333425bc38SStefano Zampini   ierr = VecScatterDestroy(&mat_ctx->l2g_lambda);CHKERRQ(ierr);
16343425bc38SStefano Zampini   ierr = PCDestroy(&mat_ctx->pc);CHKERRQ(ierr); /* actually it does not destroy BDDC, only decrease its reference count */
16353425bc38SStefano Zampini   ierr = PetscFree(mat_ctx);CHKERRQ(ierr);
16363425bc38SStefano Zampini   PetscFunctionReturn(0);
16373425bc38SStefano Zampini }
16383425bc38SStefano Zampini 
16393425bc38SStefano Zampini #undef __FUNCT__
16403425bc38SStefano Zampini #define __FUNCT__ "PCBDDCDestroyFETIDPPC"
16413425bc38SStefano Zampini static PetscErrorCode PCBDDCDestroyFETIDPPC(PC pc)
16423425bc38SStefano Zampini {
16433425bc38SStefano Zampini   FETIDPPC_ctx   *pc_ctx;
16443425bc38SStefano Zampini   PetscErrorCode ierr;
16453425bc38SStefano Zampini 
16463425bc38SStefano Zampini   PetscFunctionBegin;
16473425bc38SStefano Zampini   ierr = PCShellGetContext(pc,(void**)&pc_ctx);CHKERRQ(ierr);
16483425bc38SStefano Zampini   ierr = VecDestroy(&pc_ctx->lambda_local);CHKERRQ(ierr);
16493425bc38SStefano Zampini   ierr = MatDestroy(&pc_ctx->B_Ddelta);CHKERRQ(ierr);
16503425bc38SStefano Zampini   ierr = VecScatterDestroy(&pc_ctx->l2g_lambda);CHKERRQ(ierr);
16513425bc38SStefano Zampini   ierr = PCDestroy(&pc_ctx->pc);CHKERRQ(ierr); /* actually it does not destroy BDDC, only decrease its reference count */
16523425bc38SStefano Zampini   ierr = PetscFree(pc_ctx);CHKERRQ(ierr);
16533425bc38SStefano Zampini   PetscFunctionReturn(0);
16543425bc38SStefano Zampini }
16553425bc38SStefano Zampini 
16563425bc38SStefano Zampini #undef __FUNCT__
16573425bc38SStefano Zampini #define __FUNCT__ "PCBDDCSetupFETIDPMatContext"
16583425bc38SStefano Zampini static PetscErrorCode PCBDDCSetupFETIDPMatContext(FETIDPMat_ctx *fetidpmat_ctx)
16593425bc38SStefano Zampini {
16603425bc38SStefano Zampini   PetscErrorCode ierr;
16613425bc38SStefano Zampini   PC_IS          *pcis    =(PC_IS*)fetidpmat_ctx->pc->data;
16623425bc38SStefano Zampini   PC_BDDC        *pcbddc  =(PC_BDDC*)fetidpmat_ctx->pc->data;
16633425bc38SStefano Zampini   PCBDDCGraph    mat_graph=pcbddc->mat_graph;
16643425bc38SStefano Zampini   Mat_IS         *matis   = (Mat_IS*)fetidpmat_ctx->pc->pmat->data;
16653425bc38SStefano Zampini   MPI_Comm       comm     = ((PetscObject)(fetidpmat_ctx->pc))->comm;
16663425bc38SStefano Zampini 
16673425bc38SStefano Zampini   Mat ScalingMat;
16683425bc38SStefano Zampini   Vec lambda_global;
16693425bc38SStefano Zampini   IS  IS_l2g_lambda;
16703425bc38SStefano Zampini 
16713425bc38SStefano Zampini   PetscBool   skip_node,fully_redundant;
1672ef028eecSStefano Zampini   PetscInt    i,j,k,s,n_boundary_dofs,n_global_lambda,n_vertices,partial_sum;
16733425bc38SStefano Zampini   PetscInt    n_local_lambda,n_lambda_for_dof,dual_size,n_neg_values,n_pos_values;
1674ef028eecSStefano Zampini   PetscMPIInt rank,nprocs;
16753425bc38SStefano Zampini   PetscScalar scalar_value;
16763425bc38SStefano Zampini 
16773425bc38SStefano Zampini   PetscInt    *vertex_indices,*temp_indices;
16783425bc38SStefano Zampini   PetscInt    *dual_dofs_boundary_indices,*aux_local_numbering_1,*aux_global_numbering;
16793425bc38SStefano Zampini   PetscInt    *aux_sums,*cols_B_delta,*l2g_indices;
16803425bc38SStefano Zampini   PetscScalar *array,*scaling_factors,*vals_B_delta;
1681ef028eecSStefano Zampini   PetscInt    *aux_local_numbering_2,*dof_sizes,*dof_displs;
1682ef028eecSStefano Zampini   PetscInt    first_index,old_index;
1683ef028eecSStefano Zampini   PetscBool   first_found = PETSC_FALSE;
16843425bc38SStefano Zampini 
16853425bc38SStefano Zampini   /* For communication of scaling factors */
16863425bc38SStefano Zampini   PetscInt    *ptrs_buffer,neigh_position;
16873425bc38SStefano Zampini   PetscScalar **all_factors,*send_buffer,*recv_buffer;
16883425bc38SStefano Zampini   MPI_Request *send_reqs,*recv_reqs;
16893425bc38SStefano Zampini 
16903425bc38SStefano Zampini   /* tests */
16913425bc38SStefano Zampini   Vec         test_vec;
16923425bc38SStefano Zampini   PetscBool   test_fetidp;
16933425bc38SStefano Zampini   PetscViewer viewer;
16943425bc38SStefano Zampini 
16953425bc38SStefano Zampini   PetscFunctionBegin;
16963425bc38SStefano Zampini   ierr = MPI_Comm_rank(comm,&rank);CHKERRQ(ierr);
16973425bc38SStefano Zampini   ierr = MPI_Comm_size(comm,&nprocs);CHKERRQ(ierr);
16983425bc38SStefano Zampini 
16993425bc38SStefano Zampini   /* Default type of lagrange multipliers is non-redundant */
17003425bc38SStefano Zampini   fully_redundant = PETSC_FALSE;
17010298fd71SBarry Smith   ierr            = PetscOptionsGetBool(NULL,"-fetidp_fullyredundant",&fully_redundant,NULL);CHKERRQ(ierr);
17023425bc38SStefano Zampini 
17033425bc38SStefano Zampini   /* Evaluate local and global number of lagrange multipliers */
17043425bc38SStefano Zampini   ierr            = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
17053425bc38SStefano Zampini   n_local_lambda  = 0;
17063425bc38SStefano Zampini   partial_sum     = 0;
17073425bc38SStefano Zampini   n_boundary_dofs = 0;
17083425bc38SStefano Zampini   s               = 0;
17093425bc38SStefano Zampini   n_vertices      = 0;
17103425bc38SStefano Zampini   /* Get Vertices used to define the BDDC */
17113425bc38SStefano Zampini   ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(*vertex_indices),&vertex_indices);CHKERRQ(ierr);
17123425bc38SStefano Zampini   for (i=0; i<pcbddc->local_primal_size; i++) {
17130298fd71SBarry Smith     ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&j,(const PetscInt**)&temp_indices,NULL);CHKERRQ(ierr);
17143425bc38SStefano Zampini     if (j == 1) {
17153425bc38SStefano Zampini       vertex_indices[n_vertices]=temp_indices[0];
17163425bc38SStefano Zampini       n_vertices++;
17173425bc38SStefano Zampini     }
17180298fd71SBarry Smith     ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&j,(const PetscInt**)&temp_indices,NULL);CHKERRQ(ierr);
17193425bc38SStefano Zampini   }
17203425bc38SStefano Zampini   dual_size = pcis->n_B-n_vertices;
17212fa5cd67SKarl Rupp 
1722f0474715SStefano Zampini   ierr = PetscSortInt(n_vertices,vertex_indices);CHKERRQ(ierr);
17233425bc38SStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*dual_dofs_boundary_indices),&dual_dofs_boundary_indices);CHKERRQ(ierr);
17243425bc38SStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*aux_local_numbering_1),&aux_local_numbering_1);CHKERRQ(ierr);
17253425bc38SStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*aux_local_numbering_2),&aux_local_numbering_2);CHKERRQ(ierr);
17263425bc38SStefano Zampini 
17273425bc38SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
17283425bc38SStefano Zampini   for (i=0; i<pcis->n; i++) {
17293425bc38SStefano Zampini     j = mat_graph->count[i]; /* RECALL: mat_graph->count[i] does not count myself */
1730c6582918SStefano Zampini     k = 0;
17312fa5cd67SKarl Rupp     if (j > 0) k = (mat_graph->neighbours_set[i][0] == -1 ?  1 : 0);
17323425bc38SStefano Zampini     j = j - k;
17332fa5cd67SKarl Rupp     if (j > 0) n_boundary_dofs++;
17343425bc38SStefano Zampini 
17353425bc38SStefano Zampini     skip_node = PETSC_FALSE;
1736c6582918SStefano Zampini     if (s < n_vertices && vertex_indices[s]==i) { /* it works for a sorted set of vertices */
17373425bc38SStefano Zampini       skip_node = PETSC_TRUE;
17383425bc38SStefano Zampini       s++;
17393425bc38SStefano Zampini     }
17402fa5cd67SKarl Rupp     if (j < 1) skip_node = PETSC_TRUE;
17413425bc38SStefano Zampini     if (!skip_node) {
17423425bc38SStefano Zampini       if (fully_redundant) {
17433425bc38SStefano Zampini         /* fully redundant set of lagrange multipliers */
17443425bc38SStefano Zampini         n_lambda_for_dof = (j*(j+1))/2;
17453425bc38SStefano Zampini       } else {
17463425bc38SStefano Zampini         n_lambda_for_dof = j;
17473425bc38SStefano Zampini       }
17483425bc38SStefano Zampini       n_local_lambda += j;
17493425bc38SStefano Zampini       /* needed to evaluate global number of lagrange multipliers */
17503425bc38SStefano Zampini       array[i]=(1.0*n_lambda_for_dof)/(j+1.0); /* already scaled for the next global sum */
17513425bc38SStefano Zampini       /* store some data needed */
17523425bc38SStefano Zampini       dual_dofs_boundary_indices[partial_sum] = n_boundary_dofs-1;
17533425bc38SStefano Zampini       aux_local_numbering_1[partial_sum]      = i;
1754ef028eecSStefano Zampini       aux_local_numbering_2[partial_sum]      = n_lambda_for_dof;
17553425bc38SStefano Zampini       partial_sum++;
17563425bc38SStefano Zampini     }
17573425bc38SStefano Zampini   }
17583425bc38SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1759ef028eecSStefano Zampini 
17603425bc38SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
17613425bc38SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
17623425bc38SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
17633425bc38SStefano Zampini   ierr = VecSum(pcis->vec1_global,&scalar_value);CHKERRQ(ierr);
17642fa5cd67SKarl Rupp 
17653425bc38SStefano Zampini   fetidpmat_ctx->n_lambda = (PetscInt) scalar_value;
17663425bc38SStefano Zampini   /* printf("I found %d global multipliers (%f)\n",fetidpmat_ctx->n_lambda,scalar_value); */
17673425bc38SStefano Zampini 
17683425bc38SStefano Zampini   /* compute global ordering of lagrange multipliers and associate l2g map */
1769ef028eecSStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
1770ef028eecSStefano Zampini   ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
1771ef028eecSStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
17722fa5cd67SKarl Rupp   for (i=0;i<dual_size;i++) array[aux_local_numbering_1[i]] = aux_local_numbering_2[i];
1773ef028eecSStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1774ef028eecSStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
1775ef028eecSStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
1776ef028eecSStefano Zampini   ierr = VecSum(pcis->vec1_global,&scalar_value);CHKERRQ(ierr);
1777ef028eecSStefano Zampini   if (pcbddc->dbg_flag && (PetscInt)scalar_value != fetidpmat_ctx->n_lambda) {
1778acee19a7SJed Brown     SETERRQ2(PETSC_COMM_WORLD,PETSC_ERR_PLIB,"Global number of multipliers mismatch! (%d!=%d)\n",(PetscInt)scalar_value,fetidpmat_ctx->n_lambda);
1779ef028eecSStefano Zampini   }
17803425bc38SStefano Zampini 
1781ef028eecSStefano Zampini   /* Fill pcis->vec1_global with cumulative function for global numbering */
1782ef028eecSStefano Zampini   ierr        = VecGetArray(pcis->vec1_global,&array);CHKERRQ(ierr);
1783ef028eecSStefano Zampini   ierr        = VecGetLocalSize(pcis->vec1_global,&s);CHKERRQ(ierr);
1784ef028eecSStefano Zampini   k           = 0;
1785ef028eecSStefano Zampini   first_index = -1;
1786ef028eecSStefano Zampini   for (i=0; i<s; i++) {
1787ef028eecSStefano Zampini     if (!first_found && array[i] > 0.0) {
1788ef028eecSStefano Zampini       first_found = PETSC_TRUE;
1789ef028eecSStefano Zampini       first_index = i;
1790ef028eecSStefano Zampini     }
1791ef028eecSStefano Zampini     k += (PetscInt)array[i];
1792ef028eecSStefano Zampini   }
1793ef028eecSStefano Zampini   j    = (!rank ? nprocs : 0);
17943425bc38SStefano Zampini   ierr = PetscMalloc(j*sizeof(*dof_sizes),&dof_sizes);CHKERRQ(ierr);
17953425bc38SStefano Zampini   ierr = PetscMalloc(j*sizeof(*dof_displs),&dof_displs);CHKERRQ(ierr);
1796ef028eecSStefano Zampini   ierr = MPI_Gather(&k,1,MPIU_INT,dof_sizes,1,MPIU_INT,0,comm);CHKERRQ(ierr);
1797ef028eecSStefano Zampini   if (!rank) {
17983425bc38SStefano Zampini     dof_displs[0]=0;
17992fa5cd67SKarl Rupp     for (i=1; i<nprocs; i++) dof_displs[i] = dof_displs[i-1]+dof_sizes[i-1];
18003425bc38SStefano Zampini   }
1801ef028eecSStefano Zampini   ierr = MPI_Scatter(dof_displs,1,MPIU_INT,&k,1,MPIU_INT,0,comm);CHKERRQ(ierr);
1802ef028eecSStefano Zampini   if (first_found) {
1803ef028eecSStefano Zampini     array[first_index] += k;
18042fa5cd67SKarl Rupp 
1805ef028eecSStefano Zampini     old_index = first_index;
1806ef028eecSStefano Zampini     for (i=first_index+1; i<s; i++) {
1807ef028eecSStefano Zampini       if (array[i] > 0.0) {
1808ef028eecSStefano Zampini         array[i] += array[old_index];
1809ef028eecSStefano Zampini         old_index = i;
1810ef028eecSStefano Zampini       }
1811ef028eecSStefano Zampini     }
1812ef028eecSStefano Zampini   }
1813ef028eecSStefano Zampini   ierr = VecRestoreArray(pcis->vec1_global,&array);CHKERRQ(ierr);
1814ef028eecSStefano Zampini   ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
1815ef028eecSStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1816ef028eecSStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1817ef028eecSStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*aux_global_numbering),&aux_global_numbering);CHKERRQ(ierr);
1818ef028eecSStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
18193425bc38SStefano Zampini   for (i=0; i<dual_size; i++) {
1820ef028eecSStefano Zampini     aux_global_numbering[i] = (PetscInt)array[aux_local_numbering_1[i]]-aux_local_numbering_2[i];
18213425bc38SStefano Zampini   }
1822ef028eecSStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1823f0474715SStefano Zampini   ierr = PetscFree(aux_local_numbering_2);CHKERRQ(ierr);
1824f0474715SStefano Zampini   ierr = PetscFree(dof_displs);CHKERRQ(ierr);
1825f0474715SStefano Zampini   ierr = PetscFree(dof_sizes);CHKERRQ(ierr);
18263425bc38SStefano Zampini 
18273425bc38SStefano Zampini   /* init data for scaling factors exchange */
18283425bc38SStefano Zampini   partial_sum = 0;
18293425bc38SStefano Zampini   j           = 0;
18302fa5cd67SKarl Rupp 
18313425bc38SStefano Zampini   ierr = PetscMalloc(pcis->n_neigh*sizeof(PetscInt),&ptrs_buffer);CHKERRQ(ierr);
18323425bc38SStefano Zampini   ierr = PetscMalloc((pcis->n_neigh-1)*sizeof(MPI_Request),&send_reqs);CHKERRQ(ierr);
18333425bc38SStefano Zampini   ierr = PetscMalloc((pcis->n_neigh-1)*sizeof(MPI_Request),&recv_reqs);CHKERRQ(ierr);
18343425bc38SStefano Zampini   ierr = PetscMalloc(pcis->n*sizeof(PetscScalar*),&all_factors);CHKERRQ(ierr);
18352fa5cd67SKarl Rupp 
18363425bc38SStefano Zampini   ptrs_buffer[0] = 0;
18373425bc38SStefano Zampini   for (i=1; i<pcis->n_neigh; i++) {
18383425bc38SStefano Zampini     partial_sum += pcis->n_shared[i];
18393425bc38SStefano Zampini     ptrs_buffer[i] = ptrs_buffer[i-1]+pcis->n_shared[i];
18403425bc38SStefano Zampini   }
18413425bc38SStefano Zampini   ierr = PetscMalloc(partial_sum*sizeof(PetscScalar),&send_buffer);CHKERRQ(ierr);
18423425bc38SStefano Zampini   ierr = PetscMalloc(partial_sum*sizeof(PetscScalar),&recv_buffer);CHKERRQ(ierr);
18433425bc38SStefano Zampini   ierr = PetscMalloc(partial_sum*sizeof(PetscScalar),&all_factors[0]);CHKERRQ(ierr);
18443425bc38SStefano Zampini   for (i=0; i<pcis->n-1; i++) {
18453425bc38SStefano Zampini     j = mat_graph->count[i];
18463425bc38SStefano Zampini     if (j>0) {
18473425bc38SStefano Zampini       k = (mat_graph->neighbours_set[i][0] == -1 ?  1 : 0);
18483425bc38SStefano Zampini       j = j - k;
18493425bc38SStefano Zampini     }
18503425bc38SStefano Zampini     all_factors[i+1]=all_factors[i]+j;
18513425bc38SStefano Zampini   }
18523425bc38SStefano Zampini   /* scatter B scaling to N vec */
18533425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->N_to_B,pcis->D,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18543425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->N_to_B,pcis->D,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18553425bc38SStefano Zampini   /* communications */
18563425bc38SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
18573425bc38SStefano Zampini   for (i=1; i<pcis->n_neigh; i++) {
18582fa5cd67SKarl Rupp     for (j=0; j<pcis->n_shared[i]; j++)  send_buffer[ptrs_buffer[i-1]+j] = array[pcis->shared[i][j]];
18592fa5cd67SKarl Rupp 
18603425bc38SStefano Zampini     j    = ptrs_buffer[i]-ptrs_buffer[i-1];
1861ea7e1babSStefano Zampini     ierr = MPI_Isend(&send_buffer[ptrs_buffer[i-1]],j,MPIU_SCALAR,pcis->neigh[i],0,comm,&send_reqs[i-1]);CHKERRQ(ierr);
1862ea7e1babSStefano Zampini     ierr = MPI_Irecv(&recv_buffer[ptrs_buffer[i-1]],j,MPIU_SCALAR,pcis->neigh[i],0,comm,&recv_reqs[i-1]);CHKERRQ(ierr);
18633425bc38SStefano Zampini   }
18643425bc38SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1865ea7e1babSStefano Zampini   ierr = MPI_Waitall((pcis->n_neigh-1),recv_reqs,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
18663425bc38SStefano Zampini   /* put values in correct places */
18673425bc38SStefano Zampini   for (i=1; i<pcis->n_neigh; i++) {
18683425bc38SStefano Zampini     for (j=0; j<pcis->n_shared[i]; j++) {
18693425bc38SStefano Zampini       k = pcis->shared[i][j];
18702fa5cd67SKarl Rupp 
18713425bc38SStefano Zampini       neigh_position = 0;
18722fa5cd67SKarl Rupp       while (mat_graph->neighbours_set[k][neigh_position] != pcis->neigh[i]) neigh_position++;
18733425bc38SStefano Zampini       s = (mat_graph->neighbours_set[k][0] == -1 ? 1 : 0);
18742fa5cd67SKarl Rupp 
18753425bc38SStefano Zampini       neigh_position = neigh_position - s;
18762fa5cd67SKarl Rupp 
18773425bc38SStefano Zampini       all_factors[k][neigh_position]=recv_buffer[ptrs_buffer[i-1]+j];
18783425bc38SStefano Zampini     }
18793425bc38SStefano Zampini   }
1880ea7e1babSStefano Zampini   ierr = MPI_Waitall((pcis->n_neigh-1),send_reqs,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
18813425bc38SStefano Zampini   ierr = PetscFree(send_reqs);CHKERRQ(ierr);
18823425bc38SStefano Zampini   ierr = PetscFree(recv_reqs);CHKERRQ(ierr);
18833425bc38SStefano Zampini   ierr = PetscFree(send_buffer);CHKERRQ(ierr);
18843425bc38SStefano Zampini   ierr = PetscFree(recv_buffer);CHKERRQ(ierr);
18853425bc38SStefano Zampini   ierr = PetscFree(ptrs_buffer);CHKERRQ(ierr);
18863425bc38SStefano Zampini 
18873425bc38SStefano Zampini   /* Compute B and B_delta (local actions) */
18883425bc38SStefano Zampini   ierr = PetscMalloc(pcis->n_neigh*sizeof(*aux_sums),&aux_sums);CHKERRQ(ierr);
18893425bc38SStefano Zampini   ierr = PetscMalloc(n_local_lambda*sizeof(*l2g_indices),&l2g_indices);CHKERRQ(ierr);
18903425bc38SStefano Zampini   ierr = PetscMalloc(n_local_lambda*sizeof(*vals_B_delta),&vals_B_delta);CHKERRQ(ierr);
18913425bc38SStefano Zampini   ierr = PetscMalloc(n_local_lambda*sizeof(*cols_B_delta),&cols_B_delta);CHKERRQ(ierr);
18923425bc38SStefano Zampini   ierr = PetscMalloc(n_local_lambda*sizeof(*scaling_factors),&scaling_factors);CHKERRQ(ierr);
18932fa5cd67SKarl Rupp 
18943425bc38SStefano Zampini   n_global_lambda = 0;
18953425bc38SStefano Zampini   partial_sum     = 0;
18962fa5cd67SKarl Rupp 
18973425bc38SStefano Zampini   for (i=0;i<dual_size;i++) {
1898ef028eecSStefano Zampini     n_global_lambda = aux_global_numbering[i];
18993425bc38SStefano Zampini     j               = mat_graph->count[aux_local_numbering_1[i]];
19003425bc38SStefano Zampini     k               = (mat_graph->neighbours_set[aux_local_numbering_1[i]][0] == -1 ?  1 : 0);
19013425bc38SStefano Zampini     j               = j - k;
19023425bc38SStefano Zampini     aux_sums[0]     = 0;
19032fa5cd67SKarl Rupp     for (s=1; s<j; s++) aux_sums[s]=aux_sums[s-1]+j-s+1;
19042fa5cd67SKarl Rupp 
19053425bc38SStefano Zampini     array        = all_factors[aux_local_numbering_1[i]];
19063425bc38SStefano Zampini     n_neg_values = 0;
19072fa5cd67SKarl Rupp 
19082fa5cd67SKarl Rupp     while (n_neg_values < j && mat_graph->neighbours_set[aux_local_numbering_1[i]][n_neg_values+k] < rank) n_neg_values++;
19093425bc38SStefano Zampini     n_pos_values = j - n_neg_values;
19102fa5cd67SKarl Rupp 
19113425bc38SStefano Zampini     if (fully_redundant) {
19123425bc38SStefano Zampini       for (s=0; s<n_neg_values; s++) {
19133425bc38SStefano Zampini         l2g_indices    [partial_sum+s]=aux_sums[s]+n_neg_values-s-1+n_global_lambda;
19143425bc38SStefano Zampini         cols_B_delta   [partial_sum+s]=dual_dofs_boundary_indices[i];
19153425bc38SStefano Zampini         vals_B_delta   [partial_sum+s]=-1.0;
19163425bc38SStefano Zampini         scaling_factors[partial_sum+s]=array[s];
19173425bc38SStefano Zampini       }
19183425bc38SStefano Zampini       for (s=0; s<n_pos_values; s++) {
19193425bc38SStefano Zampini         l2g_indices    [partial_sum+s+n_neg_values]=aux_sums[n_neg_values]+s+n_global_lambda;
19203425bc38SStefano Zampini         cols_B_delta   [partial_sum+s+n_neg_values]=dual_dofs_boundary_indices[i];
19213425bc38SStefano Zampini         vals_B_delta   [partial_sum+s+n_neg_values]=1.0;
19223425bc38SStefano Zampini         scaling_factors[partial_sum+s+n_neg_values]=array[s+n_neg_values];
19233425bc38SStefano Zampini       }
19243425bc38SStefano Zampini       partial_sum += j;
19253425bc38SStefano Zampini     } else {
19263425bc38SStefano Zampini       /* l2g_indices and default cols and vals of B_delta */
19273425bc38SStefano Zampini       for (s=0; s<j; s++) {
19283425bc38SStefano Zampini         l2g_indices    [partial_sum+s]=n_global_lambda+s;
19293425bc38SStefano Zampini         cols_B_delta   [partial_sum+s]=dual_dofs_boundary_indices[i];
19303425bc38SStefano Zampini         vals_B_delta   [partial_sum+s]=0.0;
19313425bc38SStefano Zampini       }
19323425bc38SStefano Zampini       /* B_delta */
19332fa5cd67SKarl Rupp       if (n_neg_values > 0) vals_B_delta[partial_sum+n_neg_values-1] = -1.0; /* there's a rank next to me to the left */
19342fa5cd67SKarl Rupp       if (n_neg_values < j) vals_B_delta[partial_sum+n_neg_values] = 1.0; /* there's a rank next to me to the right */
19352fa5cd67SKarl Rupp 
19363425bc38SStefano Zampini       /* scaling as in Klawonn-Widlund 1999*/
19373425bc38SStefano Zampini       for (s=0;s<n_neg_values;s++) {
19383425bc38SStefano Zampini         scalar_value = 0.0;
19392fa5cd67SKarl Rupp         for (k=0;k<s+1;k++) scalar_value += array[k];
1940ef028eecSStefano Zampini         scaling_factors[partial_sum+s] = -scalar_value;
19413425bc38SStefano Zampini       }
19423425bc38SStefano Zampini       for (s=0;s<n_pos_values;s++) {
19433425bc38SStefano Zampini         scalar_value = 0.0;
19442fa5cd67SKarl Rupp         for (k=s+n_neg_values;k<j;k++) scalar_value += array[k];
19453425bc38SStefano Zampini         scaling_factors[partial_sum+s+n_neg_values] = scalar_value;
19463425bc38SStefano Zampini       }
19473425bc38SStefano Zampini       partial_sum += j;
19483425bc38SStefano Zampini     }
19493425bc38SStefano Zampini   }
1950ef028eecSStefano Zampini   ierr = PetscFree(aux_global_numbering);CHKERRQ(ierr);
1951f0474715SStefano Zampini   ierr = PetscFree(aux_sums);CHKERRQ(ierr);
1952f0474715SStefano Zampini   ierr = PetscFree(aux_local_numbering_1);CHKERRQ(ierr);
1953f0474715SStefano Zampini   ierr = PetscFree(dual_dofs_boundary_indices);CHKERRQ(ierr);
19543425bc38SStefano Zampini   ierr = PetscFree(all_factors[0]);CHKERRQ(ierr);
19553425bc38SStefano Zampini   ierr = PetscFree(all_factors);CHKERRQ(ierr);
19563425bc38SStefano Zampini   /* printf("I found %d local lambda dofs when numbering them (should be %d)\n",partial_sum,n_local_lambda); */
1957f0474715SStefano Zampini 
1958f0474715SStefano Zampini   /* Local to global mapping of fetidpmat */
1959f0474715SStefano Zampini   ierr = VecCreate(PETSC_COMM_SELF,&fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
1960f0474715SStefano Zampini   ierr = VecSetSizes(fetidpmat_ctx->lambda_local,n_local_lambda,n_local_lambda);CHKERRQ(ierr);
1961f0474715SStefano Zampini   ierr = VecSetType(fetidpmat_ctx->lambda_local,VECSEQ);CHKERRQ(ierr);
1962f0474715SStefano Zampini   ierr = VecCreate(comm,&lambda_global);CHKERRQ(ierr);
1963f0474715SStefano Zampini   ierr = VecSetSizes(lambda_global,PETSC_DECIDE,fetidpmat_ctx->n_lambda);CHKERRQ(ierr);
1964f0474715SStefano Zampini   ierr = VecSetType(lambda_global,VECMPI);CHKERRQ(ierr);
19653425bc38SStefano Zampini   ierr = ISCreateGeneral(comm,n_local_lambda,l2g_indices,PETSC_OWN_POINTER,&IS_l2g_lambda);CHKERRQ(ierr);
19663425bc38SStefano Zampini   ierr = VecScatterCreate(fetidpmat_ctx->lambda_local,(IS)0,lambda_global,IS_l2g_lambda,&fetidpmat_ctx->l2g_lambda);CHKERRQ(ierr);
1967f0474715SStefano Zampini   ierr = ISDestroy(&IS_l2g_lambda);CHKERRQ(ierr);
19683425bc38SStefano Zampini 
19693425bc38SStefano Zampini   /* Create local part of B_delta */
19703425bc38SStefano Zampini   ierr = MatCreate(PETSC_COMM_SELF,&fetidpmat_ctx->B_delta);
19713425bc38SStefano Zampini   ierr = MatSetSizes(fetidpmat_ctx->B_delta,n_local_lambda,pcis->n_B,n_local_lambda,pcis->n_B);CHKERRQ(ierr);
19723425bc38SStefano Zampini   ierr = MatSetType(fetidpmat_ctx->B_delta,MATSEQAIJ);CHKERRQ(ierr);
19730298fd71SBarry Smith   ierr = MatSeqAIJSetPreallocation(fetidpmat_ctx->B_delta,1,NULL);CHKERRQ(ierr);
19743425bc38SStefano Zampini   ierr = MatSetOption(fetidpmat_ctx->B_delta,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr);
19753425bc38SStefano Zampini   for (i=0; i<n_local_lambda; i++) {
19763425bc38SStefano Zampini     ierr = MatSetValue(fetidpmat_ctx->B_delta,i,cols_B_delta[i],vals_B_delta[i],INSERT_VALUES);CHKERRQ(ierr);
19773425bc38SStefano Zampini   }
1978f0474715SStefano Zampini   ierr = PetscFree(vals_B_delta);CHKERRQ(ierr);
19793425bc38SStefano Zampini   ierr = MatAssemblyBegin(fetidpmat_ctx->B_delta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
19803425bc38SStefano Zampini   ierr = MatAssemblyEnd  (fetidpmat_ctx->B_delta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
19813425bc38SStefano Zampini 
19823425bc38SStefano Zampini   if (fully_redundant) {
19833425bc38SStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&ScalingMat);
19843425bc38SStefano Zampini     ierr = MatSetSizes(ScalingMat,n_local_lambda,n_local_lambda,n_local_lambda,n_local_lambda);CHKERRQ(ierr);
19853425bc38SStefano Zampini     ierr = MatSetType(ScalingMat,MATSEQAIJ);CHKERRQ(ierr);
19860298fd71SBarry Smith     ierr = MatSeqAIJSetPreallocation(ScalingMat,1,NULL);CHKERRQ(ierr);
19873425bc38SStefano Zampini     for (i=0; i<n_local_lambda; i++) {
19883425bc38SStefano Zampini       ierr = MatSetValue(ScalingMat,i,i,scaling_factors[i],INSERT_VALUES);CHKERRQ(ierr);
19893425bc38SStefano Zampini     }
19903425bc38SStefano Zampini     ierr = MatAssemblyBegin(ScalingMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
19913425bc38SStefano Zampini     ierr = MatAssemblyEnd  (ScalingMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
19923425bc38SStefano Zampini     ierr = MatMatMult(ScalingMat,fetidpmat_ctx->B_delta,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&fetidpmat_ctx->B_Ddelta);CHKERRQ(ierr);
19933425bc38SStefano Zampini     ierr = MatDestroy(&ScalingMat);CHKERRQ(ierr);
19943425bc38SStefano Zampini   } else {
19953425bc38SStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&fetidpmat_ctx->B_Ddelta);
19963425bc38SStefano Zampini     ierr = MatSetSizes(fetidpmat_ctx->B_Ddelta,n_local_lambda,pcis->n_B,n_local_lambda,pcis->n_B);CHKERRQ(ierr);
19973425bc38SStefano Zampini     ierr = MatSetType(fetidpmat_ctx->B_Ddelta,MATSEQAIJ);CHKERRQ(ierr);
19980298fd71SBarry Smith     ierr = MatSeqAIJSetPreallocation(fetidpmat_ctx->B_Ddelta,1,NULL);CHKERRQ(ierr);
19993425bc38SStefano Zampini     for (i=0; i<n_local_lambda; i++) {
20003425bc38SStefano Zampini       ierr = MatSetValue(fetidpmat_ctx->B_Ddelta,i,cols_B_delta[i],scaling_factors[i],INSERT_VALUES);CHKERRQ(ierr);
20013425bc38SStefano Zampini     }
20023425bc38SStefano Zampini     ierr = MatAssemblyBegin(fetidpmat_ctx->B_Ddelta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
20033425bc38SStefano Zampini     ierr = MatAssemblyEnd  (fetidpmat_ctx->B_Ddelta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
20043425bc38SStefano Zampini   }
2005f0474715SStefano Zampini   ierr = PetscFree(scaling_factors);CHKERRQ(ierr);
2006f0474715SStefano Zampini   ierr = PetscFree(cols_B_delta);CHKERRQ(ierr);
20073425bc38SStefano Zampini 
20083425bc38SStefano Zampini   /* Create some vectors needed by fetidp */
20093425bc38SStefano Zampini   ierr = VecDuplicate(pcis->vec1_B,&fetidpmat_ctx->temp_solution_B);CHKERRQ(ierr);
20103425bc38SStefano Zampini   ierr = VecDuplicate(pcis->vec1_D,&fetidpmat_ctx->temp_solution_D);CHKERRQ(ierr);
20113425bc38SStefano Zampini 
20123425bc38SStefano Zampini   test_fetidp = PETSC_FALSE;
20132fa5cd67SKarl Rupp 
20140298fd71SBarry Smith   ierr = PetscOptionsGetBool(NULL,"-fetidp_check",&test_fetidp,NULL);CHKERRQ(ierr);
20153425bc38SStefano Zampini 
20163425bc38SStefano Zampini   if (test_fetidp) {
20173425bc38SStefano Zampini 
20183425bc38SStefano Zampini     ierr = PetscViewerASCIIGetStdout(((PetscObject)(fetidpmat_ctx->pc))->comm,&viewer);CHKERRQ(ierr);
20193425bc38SStefano Zampini     ierr = PetscViewerASCIISynchronizedAllow(viewer,PETSC_TRUE);CHKERRQ(ierr);
20203425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"----------FETI_DP TESTS--------------\n");CHKERRQ(ierr);
20213425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"All tests should return zero!\n");CHKERRQ(ierr);
20223425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"FETIDP MAT context in the ");CHKERRQ(ierr);
20233425bc38SStefano Zampini     if (fully_redundant) {
20243425bc38SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"fully redundant case for lagrange multipliers.\n");CHKERRQ(ierr);
20253425bc38SStefano Zampini     } else {
20263425bc38SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Non-fully redundant case for lagrange multiplier.\n");CHKERRQ(ierr);
20273425bc38SStefano Zampini     }
20283425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
20293425bc38SStefano Zampini 
20303425bc38SStefano Zampini     /* TEST A/B: Test numbering of global lambda dofs             */
20313425bc38SStefano Zampini 
20323425bc38SStefano Zampini     ierr         = VecDuplicate(fetidpmat_ctx->lambda_local,&test_vec);CHKERRQ(ierr);
20333425bc38SStefano Zampini     ierr         = VecSet(lambda_global,1.0);CHKERRQ(ierr);
20343425bc38SStefano Zampini     ierr         = VecSet(test_vec,1.0);CHKERRQ(ierr);
20353425bc38SStefano Zampini     ierr         = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
20363425bc38SStefano Zampini     ierr         = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
20373425bc38SStefano Zampini     scalar_value = -1.0;
20383425bc38SStefano Zampini     ierr         = VecAXPY(test_vec,scalar_value,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
20393425bc38SStefano Zampini     ierr         = VecNorm(test_vec,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
20403425bc38SStefano Zampini     ierr         = VecDestroy(&test_vec);CHKERRQ(ierr);
20413425bc38SStefano Zampini     ierr         = PetscViewerASCIISynchronizedPrintf(viewer,"A[%04d]: CHECK glob to loc: % 1.14e\n",rank,scalar_value);CHKERRQ(ierr);
20423425bc38SStefano Zampini     ierr         = PetscViewerFlush(viewer);CHKERRQ(ierr);
20433425bc38SStefano Zampini     if (fully_redundant) {
20443425bc38SStefano Zampini       ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr);
20453425bc38SStefano Zampini       ierr = VecSet(fetidpmat_ctx->lambda_local,0.5);CHKERRQ(ierr);
20463425bc38SStefano Zampini       ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20473425bc38SStefano Zampini       ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20483425bc38SStefano Zampini       ierr = VecSum(lambda_global,&scalar_value);CHKERRQ(ierr);
20493425bc38SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"B[%04d]: CHECK loc to glob: % 1.14e\n",rank,scalar_value-fetidpmat_ctx->n_lambda);CHKERRQ(ierr);
20503425bc38SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
20513425bc38SStefano Zampini     }
20523425bc38SStefano Zampini 
20533425bc38SStefano Zampini     /* TEST C: It should hold B_delta*w=0, w\in\widehat{W}            */
20543425bc38SStefano Zampini     /* This is the meaning of the B matrix                            */
20553425bc38SStefano Zampini 
20560298fd71SBarry Smith     ierr = VecSetRandom(pcis->vec1_N,NULL);CHKERRQ(ierr);
20573425bc38SStefano Zampini     ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
20583425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
20593425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
20603425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20613425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20623425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20633425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20643425bc38SStefano Zampini     /* Action of B_delta */
20653425bc38SStefano Zampini     ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
20663425bc38SStefano Zampini     ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr);
20673425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20683425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20693425bc38SStefano Zampini     ierr = VecNorm(lambda_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
20703425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"C[coll]: CHECK infty norm of B_delta*w (w continuous): % 1.14e\n",scalar_value);CHKERRQ(ierr);
20713425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
20723425bc38SStefano Zampini 
20733425bc38SStefano Zampini     /* TEST D: It should hold E_Dw = w - P_Dw, w\in\widetilde{W}     */
20743425bc38SStefano Zampini     /* E_D = R_D^TR                                                   */
20753425bc38SStefano Zampini     /* P_D = B_{D,delta}^T B_{delta}                                  */
20763425bc38SStefano Zampini     /* eq.44 Mandel Tezaur and Dohrmann 2005                          */
20773425bc38SStefano Zampini 
20783425bc38SStefano Zampini     /* compute a random vector in \widetilde{W} */
20790298fd71SBarry Smith     ierr = VecSetRandom(pcis->vec1_N,NULL);CHKERRQ(ierr);
20802fa5cd67SKarl Rupp 
20813425bc38SStefano Zampini     scalar_value = 0.0; /* set zero at vertices */
20823425bc38SStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
20832fa5cd67SKarl Rupp     for (i=0;i<n_vertices;i++) array[vertex_indices[i]] = scalar_value;
20843425bc38SStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
20852fa5cd67SKarl Rupp 
20863425bc38SStefano Zampini     /* store w for final comparison */
20873425bc38SStefano Zampini     ierr = VecDuplicate(pcis->vec1_B,&test_vec);CHKERRQ(ierr);
20883425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,test_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20893425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,test_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20903425bc38SStefano Zampini 
20913425bc38SStefano Zampini     /* Jump operator P_D : results stored in pcis->vec1_B */
20923425bc38SStefano Zampini 
20933425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20943425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20953425bc38SStefano Zampini     /* Action of B_delta */
20963425bc38SStefano Zampini     ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
20973425bc38SStefano Zampini     ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr);
20983425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20993425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21003425bc38SStefano Zampini     /* Action of B_Ddelta^T */
21013425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21023425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21033425bc38SStefano Zampini     ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
21043425bc38SStefano Zampini 
21053425bc38SStefano Zampini     /* Average operator E_D : results stored in pcis->vec2_B */
21063425bc38SStefano Zampini 
21073425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21083425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21093425bc38SStefano Zampini     ierr = VecPointwiseMult(pcis->vec2_B,pcis->D,pcis->vec2_B);CHKERRQ(ierr);
21103425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec2_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21113425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec2_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21123425bc38SStefano Zampini     ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
21133425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21143425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21153425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21163425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21173425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21183425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21193425bc38SStefano Zampini 
21203425bc38SStefano Zampini     /* test E_D=I-P_D */
21213425bc38SStefano Zampini     scalar_value = 1.0;
21223425bc38SStefano Zampini     ierr         = VecAXPY(pcis->vec1_B,scalar_value,pcis->vec2_B);CHKERRQ(ierr);
21233425bc38SStefano Zampini     scalar_value = -1.0;
21243425bc38SStefano Zampini     ierr         = VecAXPY(pcis->vec1_B,scalar_value,test_vec);CHKERRQ(ierr);
21253425bc38SStefano Zampini     ierr         = VecNorm(pcis->vec1_B,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
21263425bc38SStefano Zampini     ierr         = VecDestroy(&test_vec);CHKERRQ(ierr);
21273425bc38SStefano Zampini     ierr         = PetscViewerASCIISynchronizedPrintf(viewer,"D[%04d] CHECK infty norm of E_D + P_D - I: % 1.14e\n",rank,scalar_value);CHKERRQ(ierr);
21283425bc38SStefano Zampini     ierr         = PetscViewerFlush(viewer);CHKERRQ(ierr);
21293425bc38SStefano Zampini 
21303425bc38SStefano Zampini     /* TEST E: It should hold R_D^TP_Dw=0, w\in\widetilde{W}          */
21313425bc38SStefano Zampini     /* eq.48 Mandel Tezaur and Dohrmann 2005                          */
21323425bc38SStefano Zampini 
21330298fd71SBarry Smith     ierr = VecSetRandom(pcis->vec1_N,NULL);CHKERRQ(ierr);
21343425bc38SStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
21352fa5cd67SKarl Rupp 
21363425bc38SStefano Zampini     scalar_value = 0.0; /* set zero at vertices */
21372fa5cd67SKarl Rupp     for (i=0;i<n_vertices;i++) array[vertex_indices[i]]=scalar_value;
21383425bc38SStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
21393425bc38SStefano Zampini 
21403425bc38SStefano Zampini     /* Jump operator P_D : results stored in pcis->vec1_B */
21413425bc38SStefano Zampini 
21423425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21433425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21443425bc38SStefano Zampini     /* Action of B_delta */
21453425bc38SStefano Zampini     ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
21463425bc38SStefano Zampini     ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr);
21473425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21483425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21493425bc38SStefano Zampini     /* Action of B_Ddelta^T */
21503425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21513425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21523425bc38SStefano Zampini     ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
21533425bc38SStefano Zampini     /* diagonal scaling */
21543425bc38SStefano Zampini     ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr);
21553425bc38SStefano Zampini     /* sum on the interface */
21563425bc38SStefano Zampini     ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
21573425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21583425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21593425bc38SStefano Zampini     ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
21603425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21613425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21623425bc38SStefano Zampini     ierr = VecNorm(pcis->vec1_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
21633425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"E[coll]: CHECK infty norm of R^T_D P_D: % 1.14e\n",scalar_value);CHKERRQ(ierr);
21643425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
21653425bc38SStefano Zampini 
21663425bc38SStefano Zampini     if (!fully_redundant) {
21673425bc38SStefano Zampini       /* TEST F: It should holds B_{delta}B^T_{D,delta}=I               */
21683425bc38SStefano Zampini       /* Corollary thm 14 Mandel Tezaur and Dohrmann 2005               */
21693425bc38SStefano Zampini       ierr = VecDuplicate(lambda_global,&test_vec);CHKERRQ(ierr);
21700298fd71SBarry Smith       ierr = VecSetRandom(lambda_global,NULL);CHKERRQ(ierr);
21713425bc38SStefano Zampini       /* Action of B_Ddelta^T */
21723425bc38SStefano Zampini       ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21733425bc38SStefano Zampini       ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
21743425bc38SStefano Zampini       ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
21753425bc38SStefano Zampini       /* Action of B_delta */
21763425bc38SStefano Zampini       ierr         = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
21773425bc38SStefano Zampini       ierr         = VecSet(test_vec,0.0);CHKERRQ(ierr);
21783425bc38SStefano Zampini       ierr         = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,test_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21793425bc38SStefano Zampini       ierr         = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,test_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21803425bc38SStefano Zampini       scalar_value = -1.0;
21813425bc38SStefano Zampini       ierr         = VecAXPY(lambda_global,scalar_value,test_vec);CHKERRQ(ierr);
21823425bc38SStefano Zampini       ierr         = VecNorm(lambda_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
21833425bc38SStefano Zampini       ierr         = PetscViewerASCIIPrintf(viewer,"E[coll]: CHECK infty norm of P^T_D - I: % 1.14e\n",scalar_value);CHKERRQ(ierr);
21843425bc38SStefano Zampini       ierr         = PetscViewerFlush(viewer);CHKERRQ(ierr);
21853425bc38SStefano Zampini       ierr         = PetscViewerFlush(viewer);CHKERRQ(ierr);
21863425bc38SStefano Zampini       ierr         = VecDestroy(&test_vec);CHKERRQ(ierr);
21873425bc38SStefano Zampini     }
21883425bc38SStefano Zampini   }
21893425bc38SStefano Zampini   /* final cleanup */
21903425bc38SStefano Zampini   ierr = PetscFree(vertex_indices);CHKERRQ(ierr);
21913425bc38SStefano Zampini   ierr = VecDestroy(&lambda_global);CHKERRQ(ierr);
21923425bc38SStefano Zampini   PetscFunctionReturn(0);
21933425bc38SStefano Zampini }
21943425bc38SStefano Zampini 
21953425bc38SStefano Zampini #undef __FUNCT__
21963425bc38SStefano Zampini #define __FUNCT__ "PCBDDCSetupFETIDPPCContext"
21973425bc38SStefano Zampini static PetscErrorCode PCBDDCSetupFETIDPPCContext(Mat fetimat, FETIDPPC_ctx *fetidppc_ctx)
21983425bc38SStefano Zampini {
21993425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
22003425bc38SStefano Zampini   PetscErrorCode ierr;
22013425bc38SStefano Zampini 
22023425bc38SStefano Zampini   PetscFunctionBegin;
22033425bc38SStefano Zampini   ierr = MatShellGetContext(fetimat,&mat_ctx);CHKERRQ(ierr);
22043425bc38SStefano Zampini   /* get references from objects created when setting up feti mat context */
22053425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)mat_ctx->lambda_local);CHKERRQ(ierr);
22062fa5cd67SKarl Rupp 
22073425bc38SStefano Zampini   fetidppc_ctx->lambda_local = mat_ctx->lambda_local;
22082fa5cd67SKarl Rupp 
22093425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)mat_ctx->B_Ddelta);CHKERRQ(ierr);
22102fa5cd67SKarl Rupp 
22113425bc38SStefano Zampini   fetidppc_ctx->B_Ddelta = mat_ctx->B_Ddelta;
22122fa5cd67SKarl Rupp 
22133425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)mat_ctx->l2g_lambda);CHKERRQ(ierr);
22142fa5cd67SKarl Rupp 
22153425bc38SStefano Zampini   fetidppc_ctx->l2g_lambda = mat_ctx->l2g_lambda;
22163425bc38SStefano Zampini   PetscFunctionReturn(0);
22173425bc38SStefano Zampini }
22183425bc38SStefano Zampini 
22193425bc38SStefano Zampini #undef __FUNCT__
22203425bc38SStefano Zampini #define __FUNCT__ "FETIDPMatMult"
22213425bc38SStefano Zampini static PetscErrorCode FETIDPMatMult(Mat fetimat, Vec x, Vec y)
22223425bc38SStefano Zampini {
22233425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
22243425bc38SStefano Zampini   PC_IS          *pcis;
22253425bc38SStefano Zampini   PetscErrorCode ierr;
22263425bc38SStefano Zampini 
22273425bc38SStefano Zampini   PetscFunctionBegin;
22283425bc38SStefano Zampini   ierr = MatShellGetContext(fetimat,&mat_ctx);CHKERRQ(ierr);
22293425bc38SStefano Zampini   pcis = (PC_IS*)mat_ctx->pc->data;
22303425bc38SStefano Zampini   /* Application of B_delta^T */
22313425bc38SStefano Zampini   ierr = VecScatterBegin(mat_ctx->l2g_lambda,x,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
22323425bc38SStefano Zampini   ierr = VecScatterEnd(mat_ctx->l2g_lambda,x,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
22333425bc38SStefano Zampini   ierr = MatMultTranspose(mat_ctx->B_delta,mat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
22343425bc38SStefano Zampini   /* Application of \widetilde{S}^-1 */
22353425bc38SStefano Zampini   ierr = VecSet(pcis->vec1_D,0.0);CHKERRQ(ierr);
22363425bc38SStefano Zampini   ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr);
22373425bc38SStefano Zampini   /* Application of B_delta */
22383425bc38SStefano Zampini   ierr = MatMult(mat_ctx->B_delta,pcis->vec1_B,mat_ctx->lambda_local);CHKERRQ(ierr);
22393425bc38SStefano Zampini   ierr = VecSet(y,0.0);CHKERRQ(ierr);
22403425bc38SStefano Zampini   ierr = VecScatterBegin(mat_ctx->l2g_lambda,mat_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
22413425bc38SStefano Zampini   ierr = VecScatterEnd(mat_ctx->l2g_lambda,mat_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
22423425bc38SStefano Zampini   PetscFunctionReturn(0);
22433425bc38SStefano Zampini }
22443425bc38SStefano Zampini 
22453425bc38SStefano Zampini #undef __FUNCT__
22463425bc38SStefano Zampini #define __FUNCT__ "FETIDPPCApply"
22473425bc38SStefano Zampini static PetscErrorCode FETIDPPCApply(PC fetipc, Vec x, Vec y)
22483425bc38SStefano Zampini {
22493425bc38SStefano Zampini   FETIDPPC_ctx   *pc_ctx;
22503425bc38SStefano Zampini   PC_IS          *pcis;
22513425bc38SStefano Zampini   PetscErrorCode ierr;
22523425bc38SStefano Zampini 
22533425bc38SStefano Zampini   PetscFunctionBegin;
22543425bc38SStefano Zampini   ierr = PCShellGetContext(fetipc,(void**)&pc_ctx);
22553425bc38SStefano Zampini   pcis = (PC_IS*)pc_ctx->pc->data;
22563425bc38SStefano Zampini   /* Application of B_Ddelta^T */
22573425bc38SStefano Zampini   ierr = VecScatterBegin(pc_ctx->l2g_lambda,x,pc_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
22583425bc38SStefano Zampini   ierr = VecScatterEnd(pc_ctx->l2g_lambda,x,pc_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
22593425bc38SStefano Zampini   ierr = VecSet(pcis->vec2_B,0.0);CHKERRQ(ierr);
22603425bc38SStefano Zampini   ierr = MatMultTranspose(pc_ctx->B_Ddelta,pc_ctx->lambda_local,pcis->vec2_B);CHKERRQ(ierr);
22613425bc38SStefano Zampini   /* Application of S */
22623425bc38SStefano Zampini   ierr = PCISApplySchur(pc_ctx->pc,pcis->vec2_B,pcis->vec1_B,(Vec)0,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
22633425bc38SStefano Zampini   /* Application of B_Ddelta */
22643425bc38SStefano Zampini   ierr = MatMult(pc_ctx->B_Ddelta,pcis->vec1_B,pc_ctx->lambda_local);CHKERRQ(ierr);
22653425bc38SStefano Zampini   ierr = VecSet(y,0.0);CHKERRQ(ierr);
22663425bc38SStefano Zampini   ierr = VecScatterBegin(pc_ctx->l2g_lambda,pc_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
22673425bc38SStefano Zampini   ierr = VecScatterEnd(pc_ctx->l2g_lambda,pc_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
22683425bc38SStefano Zampini   PetscFunctionReturn(0);
22693425bc38SStefano Zampini }
22703425bc38SStefano Zampini 
2271da1bb401SStefano Zampini #undef __FUNCT__
2272da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetupLocalAdjacencyGraph"
2273da1bb401SStefano Zampini static PetscErrorCode PCBDDCSetupLocalAdjacencyGraph(PC pc)
2274da1bb401SStefano Zampini {
2275da1bb401SStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
2276da1bb401SStefano Zampini   Mat_IS         *matis  = (Mat_IS*)pc->pmat->data;
22771a83f524SJed Brown   PetscInt       nvtxs;
22781a83f524SJed Brown   const PetscInt *xadj,*adjncy;
2279da1bb401SStefano Zampini   Mat            mat_adj;
2280da1bb401SStefano Zampini   PetscBool      symmetrize_rowij=PETSC_TRUE,compressed_rowij=PETSC_FALSE,flg_row=PETSC_TRUE;
2281da1bb401SStefano Zampini   PCBDDCGraph    mat_graph       =pcbddc->mat_graph;
2282da1bb401SStefano Zampini   PetscErrorCode ierr;
2283da1bb401SStefano Zampini 
2284da1bb401SStefano Zampini   PetscFunctionBegin;
2285da1bb401SStefano Zampini   /* get CSR adjacency from local matrix if user has not yet provided local graph using PCBDDCSetLocalAdjacencyGraph function */
2286da1bb401SStefano Zampini   if (!mat_graph->xadj) {
2287da1bb401SStefano Zampini     ierr = MatConvert(matis->A,MATMPIADJ,MAT_INITIAL_MATRIX,&mat_adj);CHKERRQ(ierr);
2288da1bb401SStefano Zampini     ierr = MatGetRowIJ(mat_adj,0,symmetrize_rowij,compressed_rowij,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr);
2289acee19a7SJed Brown     if (!flg_row) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in MatGetRowIJ()\n");
2290da1bb401SStefano Zampini     /* Get adjacency into BDDC workspace */
2291da1bb401SStefano Zampini     ierr = PCBDDCSetLocalAdjacencyGraph(pc,nvtxs,xadj,adjncy,PETSC_COPY_VALUES);CHKERRQ(ierr);
2292da1bb401SStefano Zampini     ierr = MatRestoreRowIJ(mat_adj,0,symmetrize_rowij,compressed_rowij,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr);
2293acee19a7SJed Brown     if (!flg_row) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in MatRestoreRowIJ()\n");
2294da1bb401SStefano Zampini     ierr = MatDestroy(&mat_adj);CHKERRQ(ierr);
2295da1bb401SStefano Zampini   }
2296da1bb401SStefano Zampini   PetscFunctionReturn(0);
2297da1bb401SStefano Zampini }
2298da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
22990c7d97c5SJed Brown #undef __FUNCT__
23000c7d97c5SJed Brown #define __FUNCT__ "PCBDDCApplyInterfacePreconditioner"
23012617d88aSStefano Zampini static PetscErrorCode  PCBDDCApplyInterfacePreconditioner(PC pc)
23020c7d97c5SJed Brown {
23030c7d97c5SJed Brown   PetscErrorCode    ierr;
23040c7d97c5SJed Brown   PC_BDDC           *pcbddc = (PC_BDDC*)(pc->data);
23050c7d97c5SJed Brown   PC_IS             *pcis   = (PC_IS*)(pc->data);
23063b03a366Sstefano_zampini   const PetscScalar zero     = 0.0;
23070c7d97c5SJed Brown 
23080c7d97c5SJed Brown   PetscFunctionBegin;
23090c7d97c5SJed Brown   /* Application of PHI^T  */
23100c7d97c5SJed Brown   ierr = MatMultTranspose(pcbddc->coarse_phi_B,pcis->vec1_B,pcbddc->vec1_P);CHKERRQ(ierr);
231129622bf0SStefano Zampini   if (pcbddc->inexact_prec_type) { ierr = MatMultTransposeAdd(pcbddc->coarse_phi_D,pcis->vec1_D,pcbddc->vec1_P,pcbddc->vec1_P);CHKERRQ(ierr); }
23120c7d97c5SJed Brown 
23130c7d97c5SJed Brown   /* Scatter data of coarse_rhs */
2314142dfd88SStefano Zampini   if (pcbddc->coarse_rhs) { ierr = VecSet(pcbddc->coarse_rhs,zero);CHKERRQ(ierr); }
23150c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->vec1_P,pcbddc->coarse_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
23160c7d97c5SJed Brown 
23170c7d97c5SJed Brown   /* Local solution on R nodes */
23180c7d97c5SJed Brown   ierr = VecSet(pcbddc->vec1_R,zero);CHKERRQ(ierr);
23190c7d97c5SJed Brown   ierr = VecScatterBegin(pcbddc->R_to_B,pcis->vec1_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
23200c7d97c5SJed Brown   ierr = VecScatterEnd  (pcbddc->R_to_B,pcis->vec1_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
232129622bf0SStefano Zampini   if (pcbddc->inexact_prec_type) {
23220c7d97c5SJed Brown     ierr = VecScatterBegin(pcbddc->R_to_D,pcis->vec1_D,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
23230c7d97c5SJed Brown     ierr = VecScatterEnd  (pcbddc->R_to_D,pcis->vec1_D,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
23240c7d97c5SJed Brown   }
23250c7d97c5SJed Brown   ierr = PCBDDCSolveSaddlePoint(pc);CHKERRQ(ierr);
23260c7d97c5SJed Brown   ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr);
23270c7d97c5SJed Brown   ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec2_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
23280c7d97c5SJed Brown   ierr = VecScatterEnd  (pcbddc->R_to_B,pcbddc->vec2_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
232929622bf0SStefano Zampini   if (pcbddc->inexact_prec_type) {
23300c7d97c5SJed Brown     ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec2_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
23310c7d97c5SJed Brown     ierr = VecScatterEnd  (pcbddc->R_to_D,pcbddc->vec2_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
23320c7d97c5SJed Brown   }
23330c7d97c5SJed Brown 
23340c7d97c5SJed Brown   /* Coarse solution */
23350c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataEnd(pc,pcbddc->vec1_P,pcbddc->coarse_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
23360bdf917eSStefano Zampini   if (pcbddc->coarse_rhs) {
23370bdf917eSStefano Zampini     if (pcbddc->CoarseNullSpace) {
23380298fd71SBarry Smith       ierr = MatNullSpaceRemove(pcbddc->CoarseNullSpace,pcbddc->coarse_rhs,NULL);CHKERRQ(ierr);
23390bdf917eSStefano Zampini     }
23400bdf917eSStefano Zampini     ierr = KSPSolve(pcbddc->coarse_ksp,pcbddc->coarse_rhs,pcbddc->coarse_vec);CHKERRQ(ierr);
23410bdf917eSStefano Zampini     if (pcbddc->CoarseNullSpace) {
23420298fd71SBarry Smith       ierr = MatNullSpaceRemove(pcbddc->CoarseNullSpace,pcbddc->coarse_vec,NULL);CHKERRQ(ierr);
23430bdf917eSStefano Zampini     }
23440bdf917eSStefano Zampini   }
23450c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
23460c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataEnd  (pc,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
23470c7d97c5SJed Brown 
23480c7d97c5SJed Brown   /* Sum contributions from two levels */
23490c7d97c5SJed Brown   ierr = MatMultAdd(pcbddc->coarse_phi_B,pcbddc->vec1_P,pcis->vec1_B,pcis->vec1_B);CHKERRQ(ierr);
235029622bf0SStefano Zampini   if (pcbddc->inexact_prec_type) { ierr = MatMultAdd(pcbddc->coarse_phi_D,pcbddc->vec1_P,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); }
23510c7d97c5SJed Brown   PetscFunctionReturn(0);
23520c7d97c5SJed Brown }
23530c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
23540c7d97c5SJed Brown #undef __FUNCT__
23550c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSolveSaddlePoint"
235653cdbc3dSStefano Zampini static PetscErrorCode  PCBDDCSolveSaddlePoint(PC pc)
23570c7d97c5SJed Brown {
23580c7d97c5SJed Brown   PetscErrorCode ierr;
23590c7d97c5SJed Brown   PC_BDDC        *pcbddc = (PC_BDDC*)(pc->data);
23600c7d97c5SJed Brown 
23610c7d97c5SJed Brown   PetscFunctionBegin;
236253cdbc3dSStefano Zampini   ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
2363534831adSStefano Zampini   if (pcbddc->local_auxmat1) {
23640c7d97c5SJed Brown     ierr = MatMult(pcbddc->local_auxmat1,pcbddc->vec2_R,pcbddc->vec1_C);CHKERRQ(ierr);
23650c7d97c5SJed Brown     ierr = MatMultAdd(pcbddc->local_auxmat2,pcbddc->vec1_C,pcbddc->vec2_R,pcbddc->vec2_R);CHKERRQ(ierr);
23660c7d97c5SJed Brown   }
23670c7d97c5SJed Brown   PetscFunctionReturn(0);
23680c7d97c5SJed Brown }
23690c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
23700c7d97c5SJed Brown #undef __FUNCT__
23710c7d97c5SJed Brown #define __FUNCT__ "PCBDDCScatterCoarseDataBegin"
237253cdbc3dSStefano Zampini static PetscErrorCode  PCBDDCScatterCoarseDataBegin(PC pc,Vec vec_from, Vec vec_to, InsertMode imode, ScatterMode smode)
23730c7d97c5SJed Brown {
23740c7d97c5SJed Brown   PetscErrorCode ierr;
23750c7d97c5SJed Brown   PC_BDDC        *pcbddc = (PC_BDDC*)(pc->data);
23760c7d97c5SJed Brown 
23770c7d97c5SJed Brown   PetscFunctionBegin;
23780c7d97c5SJed Brown   switch (pcbddc->coarse_communications_type) {
23790c7d97c5SJed Brown   case SCATTERS_BDDC:
23800c7d97c5SJed Brown     ierr = VecScatterBegin(pcbddc->coarse_loc_to_glob,vec_from,vec_to,imode,smode);CHKERRQ(ierr);
23810c7d97c5SJed Brown     break;
23820c7d97c5SJed Brown   case GATHERS_BDDC:
23830c7d97c5SJed Brown     break;
23840c7d97c5SJed Brown   }
23850c7d97c5SJed Brown   PetscFunctionReturn(0);
23860c7d97c5SJed Brown }
23870c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
23880c7d97c5SJed Brown #undef __FUNCT__
23890c7d97c5SJed Brown #define __FUNCT__ "PCBDDCScatterCoarseDataEnd"
239053cdbc3dSStefano Zampini static PetscErrorCode  PCBDDCScatterCoarseDataEnd(PC pc,Vec vec_from, Vec vec_to, InsertMode imode, ScatterMode smode)
23910c7d97c5SJed Brown {
23920c7d97c5SJed Brown   PetscErrorCode ierr;
23930c7d97c5SJed Brown   PC_BDDC        *pcbddc = (PC_BDDC*)(pc->data);
23940c7d97c5SJed Brown   PetscScalar    *array_to;
23950c7d97c5SJed Brown   PetscScalar    *array_from;
2396ce94432eSBarry Smith   MPI_Comm       comm;
23970c7d97c5SJed Brown   PetscInt       i;
23980c7d97c5SJed Brown 
23990c7d97c5SJed Brown   PetscFunctionBegin;
2400ce94432eSBarry Smith   ierr = PetscObjectGetComm((PetscObject)pc,&comm);CHKERRQ(ierr);
24010c7d97c5SJed Brown   switch (pcbddc->coarse_communications_type) {
24020c7d97c5SJed Brown   case SCATTERS_BDDC:
24030c7d97c5SJed Brown     ierr = VecScatterEnd(pcbddc->coarse_loc_to_glob,vec_from,vec_to,imode,smode);CHKERRQ(ierr);
24040c7d97c5SJed Brown     break;
24050c7d97c5SJed Brown   case GATHERS_BDDC:
24060c7d97c5SJed Brown     if (vec_from) VecGetArray(vec_from,&array_from);
24070c7d97c5SJed Brown     if (vec_to) VecGetArray(vec_to,&array_to);
24080c7d97c5SJed Brown     switch (pcbddc->coarse_problem_type) {
24090c7d97c5SJed Brown     case SEQUENTIAL_BDDC:
24100c7d97c5SJed Brown       if (smode == SCATTER_FORWARD) {
241153cdbc3dSStefano Zampini         ierr = MPI_Gatherv(&array_from[0],pcbddc->local_primal_size,MPIU_SCALAR,&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,0,comm);CHKERRQ(ierr);
24120c7d97c5SJed Brown         if (vec_to) {
24130bdf917eSStefano Zampini           if (imode == ADD_VALUES) {
24140bdf917eSStefano Zampini             for (i=0;i<pcbddc->replicated_primal_size;i++) {
24150c7d97c5SJed Brown               array_to[pcbddc->replicated_local_primal_indices[i]]+=pcbddc->replicated_local_primal_values[i];
24160c7d97c5SJed Brown             }
24170c7d97c5SJed Brown           } else {
24180bdf917eSStefano Zampini             for (i=0;i<pcbddc->replicated_primal_size;i++) {
24190bdf917eSStefano Zampini               array_to[pcbddc->replicated_local_primal_indices[i]]=pcbddc->replicated_local_primal_values[i];
24200bdf917eSStefano Zampini             }
24210bdf917eSStefano Zampini           }
24220bdf917eSStefano Zampini         }
24230bdf917eSStefano Zampini       } else {
24240bdf917eSStefano Zampini         if (vec_from) {
24250bdf917eSStefano Zampini           if (imode == ADD_VALUES) {
24260bdf917eSStefano Zampini             printf("Scatter mode %d, insert mode %d for case %d not implemented!\n",smode,imode,pcbddc->coarse_problem_type);
24270bdf917eSStefano Zampini           }
24280bdf917eSStefano Zampini           for (i=0;i<pcbddc->replicated_primal_size;i++) {
24290c7d97c5SJed Brown             pcbddc->replicated_local_primal_values[i]=array_from[pcbddc->replicated_local_primal_indices[i]];
24300bdf917eSStefano Zampini           }
24310bdf917eSStefano Zampini         }
243253cdbc3dSStefano Zampini         ierr = MPI_Scatterv(&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,&array_to[0],pcbddc->local_primal_size,MPIU_SCALAR,0,comm);CHKERRQ(ierr);
24330c7d97c5SJed Brown       }
24340c7d97c5SJed Brown       break;
24350c7d97c5SJed Brown     case REPLICATED_BDDC:
24360c7d97c5SJed Brown       if (smode == SCATTER_FORWARD) {
243753cdbc3dSStefano Zampini         ierr = MPI_Allgatherv(&array_from[0],pcbddc->local_primal_size,MPIU_SCALAR,&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,comm);CHKERRQ(ierr);
24380bdf917eSStefano Zampini         if (imode == ADD_VALUES) {
24390bdf917eSStefano Zampini           for (i=0;i<pcbddc->replicated_primal_size;i++) {
24400c7d97c5SJed Brown             array_to[pcbddc->replicated_local_primal_indices[i]]+=pcbddc->replicated_local_primal_values[i];
24410bdf917eSStefano Zampini           }
24420bdf917eSStefano Zampini         } else {
24430bdf917eSStefano Zampini           for (i=0;i<pcbddc->replicated_primal_size;i++) {
24440bdf917eSStefano Zampini             array_to[pcbddc->replicated_local_primal_indices[i]]=pcbddc->replicated_local_primal_values[i];
24450bdf917eSStefano Zampini           }
24460bdf917eSStefano Zampini         }
24470c7d97c5SJed Brown       } else { /* no communications needed for SCATTER_REVERSE since needed data is already present */
24480bdf917eSStefano Zampini         if (imode == ADD_VALUES) {
24490bdf917eSStefano Zampini           for (i=0;i<pcbddc->local_primal_size;i++) {
24500bdf917eSStefano Zampini             array_to[i]+=array_from[pcbddc->local_primal_indices[i]];
24510bdf917eSStefano Zampini           }
24520bdf917eSStefano Zampini         } else {
24530bdf917eSStefano Zampini           for (i=0;i<pcbddc->local_primal_size;i++) {
24540c7d97c5SJed Brown             array_to[i]=array_from[pcbddc->local_primal_indices[i]];
24550c7d97c5SJed Brown           }
24560bdf917eSStefano Zampini         }
24570bdf917eSStefano Zampini       }
24580c7d97c5SJed Brown       break;
245953cdbc3dSStefano Zampini     case MULTILEVEL_BDDC:
246053cdbc3dSStefano Zampini       break;
246153cdbc3dSStefano Zampini     case PARALLEL_BDDC:
246253cdbc3dSStefano Zampini       break;
24630c7d97c5SJed Brown     }
24640c7d97c5SJed Brown     if (vec_from) VecRestoreArray(vec_from,&array_from);
24650c7d97c5SJed Brown     if (vec_to) VecRestoreArray(vec_to,&array_to);
24660c7d97c5SJed Brown     break;
24670c7d97c5SJed Brown   }
24680c7d97c5SJed Brown   PetscFunctionReturn(0);
24690c7d97c5SJed Brown }
24700c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
24713b03a366Sstefano_zampini #undef __FUNCT__
24723b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCCreateConstraintMatrix"
24733b03a366Sstefano_zampini static PetscErrorCode PCBDDCCreateConstraintMatrix(PC pc)
24743b03a366Sstefano_zampini {
24753b03a366Sstefano_zampini   PetscErrorCode ierr;
24763b03a366Sstefano_zampini   PC_IS          *pcis    = (PC_IS*)(pc->data);
24773b03a366Sstefano_zampini   PC_BDDC        *pcbddc  = (PC_BDDC*)pc->data;
24783b03a366Sstefano_zampini   Mat_IS         *matis   = (Mat_IS*)pc->pmat->data;
247923d4d1a5SStefano Zampini   PetscInt       *nnz,*is_indices;
24803b03a366Sstefano_zampini   PetscScalar    *temp_quadrature_constraint;
2481534831adSStefano Zampini   PetscInt       *temp_indices,*temp_indices_to_constraint,*temp_indices_to_constraint_B,*local_to_B;
24823b03a366Sstefano_zampini   PetscInt       local_primal_size,i,j,k,total_counts,max_size_of_constraint;
24833b03a366Sstefano_zampini   PetscInt       n_constraints,n_vertices,size_of_constraint;
2484534831adSStefano Zampini   PetscScalar    quad_value;
24853b03a366Sstefano_zampini   PetscBool      nnsp_has_cnst=PETSC_FALSE,use_nnsp_true=pcbddc->use_nnsp_true;
24863b03a366Sstefano_zampini   PetscInt       nnsp_size    =0,nnsp_addone=0,temp_constraints,temp_start_ptr;
24873b03a366Sstefano_zampini   IS             *used_IS;
248819fd82e9SBarry Smith   MatType        impMatType=MATSEQAIJ;
24893b03a366Sstefano_zampini   PetscBLASInt   Bs,Bt,lwork,lierr;
24903b03a366Sstefano_zampini   PetscReal      tol=1.0e-8;
2491fcda91b4SJed Brown   MatNullSpace   nearnullsp;
2492fcda91b4SJed Brown   const Vec      *nearnullvecs;
24933b03a366Sstefano_zampini   Vec            *localnearnullsp;
24943b03a366Sstefano_zampini   PetscScalar    *work,*temp_basis,*array_vector,*correlation_mat;
24953b03a366Sstefano_zampini   PetscReal      *rwork,*singular_vals;
2496534831adSStefano Zampini   PetscBLASInt   Bone=1,*ipiv;
2497534831adSStefano Zampini   Vec            temp_vec;
2498534831adSStefano Zampini   Mat            temp_mat;
2499534831adSStefano Zampini   KSP            temp_ksp;
2500ffe5efe1SStefano Zampini   PC             temp_pc;
2501534831adSStefano Zampini   PetscInt       s,start_constraint,dual_dofs;
2502534831adSStefano Zampini   PetscBool      compute_submatrix,useksp=PETSC_FALSE;
2503534831adSStefano Zampini   PetscInt       *aux_primal_permutation,*aux_primal_numbering;
2504534831adSStefano Zampini   PetscBool      boolforface,*change_basis;
25052fa5cd67SKarl Rupp 
2506de534f79Sstefano_zampini /* some ugly conditional declarations */
25073b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
25083b03a366Sstefano_zampini   PetscScalar  dot_result;
25093b03a366Sstefano_zampini   PetscScalar  one=1.0,zero=0.0;
25103b03a366Sstefano_zampini   PetscInt     ii;
25113425bc38SStefano Zampini   PetscScalar  *singular_vectors;
25123425bc38SStefano Zampini   PetscBLASInt *iwork,*ifail;
25133425bc38SStefano Zampini   PetscReal    dummy_real,abs_tol;
25143425bc38SStefano Zampini   PetscBLASInt eigs_found;
25153b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
25163b03a366Sstefano_zampini   PetscScalar val1,val2;
25173b03a366Sstefano_zampini #endif
25183425bc38SStefano Zampini #endif
25193b03a366Sstefano_zampini   PetscBLASInt dummy_int;
25203b03a366Sstefano_zampini   PetscScalar  dummy_scalar;
25213b03a366Sstefano_zampini 
25223b03a366Sstefano_zampini   PetscFunctionBegin;
25233b03a366Sstefano_zampini   /* check if near null space is attached to global mat */
2524fcda91b4SJed Brown   ierr = MatGetNearNullSpace(pc->pmat,&nearnullsp);CHKERRQ(ierr);
2525fcda91b4SJed Brown   if (nearnullsp) {
2526fcda91b4SJed Brown     ierr = MatNullSpaceGetVecs(nearnullsp,&nnsp_has_cnst,&nnsp_size,&nearnullvecs);CHKERRQ(ierr);
25273b03a366Sstefano_zampini   } else { /* if near null space is not provided it uses constants */
25283b03a366Sstefano_zampini     nnsp_has_cnst = PETSC_TRUE;
25293b03a366Sstefano_zampini     use_nnsp_true = PETSC_TRUE;
25303b03a366Sstefano_zampini   }
25312fa5cd67SKarl Rupp   if (nnsp_has_cnst) nnsp_addone = 1;
25322fa5cd67SKarl Rupp 
25333b03a366Sstefano_zampini   /*
25343b03a366Sstefano_zampini        Evaluate maximum storage size needed by the procedure
25353b03a366Sstefano_zampini        - temp_indices will contain start index of each constraint stored as follows
25363b03a366Sstefano_zampini        - temp_indices_to_constraint  [temp_indices[i],...,temp[indices[i+1]-1] will contain the indices (in local numbering) on which the constraint acts
2537534831adSStefano Zampini        - temp_indices_to_constraint_B[temp_indices[i],...,temp[indices[i+1]-1] will contain the indices (in boundary numbering) on which the constraint acts
25383b03a366Sstefano_zampini        - temp_quadrature_constraint  [temp_indices[i],...,temp[indices[i+1]-1] will contain the scalars representing the constraint itself
25393b03a366Sstefano_zampini                                                                                                                                                          */
2540da1bb401SStefano Zampini 
25413b03a366Sstefano_zampini   total_counts  = pcbddc->n_ISForFaces+pcbddc->n_ISForEdges;
25423b03a366Sstefano_zampini   total_counts *= (nnsp_addone+nnsp_size);
25432fa5cd67SKarl Rupp 
2544da1bb401SStefano Zampini   ierr = ISGetSize(pcbddc->ISForVertices,&n_vertices);CHKERRQ(ierr);
25452fa5cd67SKarl Rupp 
2546da1bb401SStefano Zampini   total_counts += n_vertices;
25472fa5cd67SKarl Rupp 
25483b03a366Sstefano_zampini   ierr = PetscMalloc((total_counts+1)*sizeof(PetscInt),&temp_indices);CHKERRQ(ierr);
2549534831adSStefano Zampini   ierr = PetscMalloc((total_counts+1)*sizeof(PetscBool),&change_basis);CHKERRQ(ierr);
25502fa5cd67SKarl Rupp 
25513b03a366Sstefano_zampini   total_counts           = 0;
25523b03a366Sstefano_zampini   max_size_of_constraint = 0;
25533b03a366Sstefano_zampini   for (i=0;i<pcbddc->n_ISForEdges+pcbddc->n_ISForFaces;i++) {
25542fa5cd67SKarl Rupp     if (i<pcbddc->n_ISForEdges) used_IS = &pcbddc->ISForEdges[i];
25552fa5cd67SKarl Rupp     else used_IS = &pcbddc->ISForFaces[i-pcbddc->n_ISForEdges];
25563b03a366Sstefano_zampini     ierr = ISGetSize(*used_IS,&j);CHKERRQ(ierr);
25573b03a366Sstefano_zampini     total_counts += j;
25583b03a366Sstefano_zampini     if (j>max_size_of_constraint) max_size_of_constraint=j;
25593b03a366Sstefano_zampini   }
25603b03a366Sstefano_zampini   total_counts *= (nnsp_addone+nnsp_size);
2561da1bb401SStefano Zampini   total_counts += n_vertices;
25622fa5cd67SKarl Rupp 
25633b03a366Sstefano_zampini   ierr = PetscMalloc(total_counts*sizeof(PetscScalar),&temp_quadrature_constraint);CHKERRQ(ierr);
25643b03a366Sstefano_zampini   ierr = PetscMalloc(total_counts*sizeof(PetscInt),&temp_indices_to_constraint);CHKERRQ(ierr);
2565534831adSStefano Zampini   ierr = PetscMalloc(total_counts*sizeof(PetscInt),&temp_indices_to_constraint_B);CHKERRQ(ierr);
2566534831adSStefano Zampini   ierr = PetscMalloc(pcis->n*sizeof(PetscInt),&local_to_B);CHKERRQ(ierr);
2567534831adSStefano Zampini   ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
25682fa5cd67SKarl Rupp 
25692fa5cd67SKarl Rupp   for (i=0;i<pcis->n;i++) local_to_B[i]=-1;
25702fa5cd67SKarl Rupp   for (i=0;i<pcis->n_B;i++) local_to_B[is_indices[i]]=i;
2571534831adSStefano Zampini   ierr = ISRestoreIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2572534831adSStefano Zampini 
25733b03a366Sstefano_zampini   /* First we issue queries to allocate optimal workspace for LAPACKgesvd or LAPACKsyev/LAPACKheev */
25743b03a366Sstefano_zampini   rwork           = 0;
25753b03a366Sstefano_zampini   work            = 0;
25763b03a366Sstefano_zampini   singular_vals   = 0;
25773b03a366Sstefano_zampini   temp_basis      = 0;
25783b03a366Sstefano_zampini   correlation_mat = 0;
25793b03a366Sstefano_zampini   if (!pcbddc->use_nnsp_true) {
25803b03a366Sstefano_zampini     PetscScalar temp_work;
25813b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
25823b03a366Sstefano_zampini     /* POD */
25833b03a366Sstefano_zampini     PetscInt max_n;
25843b03a366Sstefano_zampini     max_n = nnsp_addone+nnsp_size;
25853b03a366Sstefano_zampini     /* using some techniques borrowed from Proper Orthogonal Decomposition */
25863b03a366Sstefano_zampini     ierr = PetscMalloc(max_n*max_n*sizeof(PetscScalar),&correlation_mat);CHKERRQ(ierr);
25873425bc38SStefano Zampini     ierr = PetscMalloc(max_n*max_n*sizeof(PetscScalar),&singular_vectors);CHKERRQ(ierr);
25883b03a366Sstefano_zampini     ierr = PetscMalloc(max_n*sizeof(PetscReal),&singular_vals);CHKERRQ(ierr);
25893b03a366Sstefano_zampini     ierr = PetscMalloc(max_size_of_constraint*(nnsp_addone+nnsp_size)*sizeof(PetscScalar),&temp_basis);CHKERRQ(ierr);
25903b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
25913b03a366Sstefano_zampini     ierr = PetscMalloc(3*max_n*sizeof(PetscReal),&rwork);CHKERRQ(ierr);
25923b03a366Sstefano_zampini #endif
25933425bc38SStefano Zampini     ierr = PetscMalloc(5*max_n*sizeof(PetscBLASInt),&iwork);CHKERRQ(ierr);
25943425bc38SStefano Zampini     ierr = PetscMalloc(max_n*sizeof(PetscBLASInt),&ifail);CHKERRQ(ierr);
25953b03a366Sstefano_zampini     /* now we evaluate the optimal workspace using query with lwork=-1 */
2596c5df96a5SBarry Smith     ierr  = PetscBLASIntCast(max_n,&Bt);CHKERRQ(ierr);
25973b03a366Sstefano_zampini     lwork =-1;
25983425bc38SStefano Zampini     ierr  = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
25993b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
26003425bc38SStefano Zampini     abs_tol=1.e-8;
2601f75e95b9SBarry Smith     PetscStackCall("LAPACKsyevx",LAPACKsyevx_("V","A","U",&Bt,correlation_mat,&Bt,&dummy_real,&dummy_real,&dummy_int,&dummy_int,&abs_tol,&eigs_found,singular_vals,singular_vectors,&Bt,&temp_work,&lwork,iwork,ifail,&lierr));
26023b03a366Sstefano_zampini #else
260382f516ccSBarry Smith     SETERRQ(PetscObjectComm((PetscObject)pc), PETSC_ERR_SUP, "Not yet implemented for complexes when PETSC_MISSING_GESVD = 1");
26043b03a366Sstefano_zampini #endif
26053425bc38SStefano Zampini     if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SYEVX Lapack routine %d",(int)lierr);
26063425bc38SStefano Zampini     ierr = PetscFPTrapPop();CHKERRQ(ierr);
26073b03a366Sstefano_zampini #else /* on missing GESVD */
26083b03a366Sstefano_zampini       /* SVD */
26093b03a366Sstefano_zampini     PetscInt max_n,min_n;
26103b03a366Sstefano_zampini     max_n = max_size_of_constraint;
26113b03a366Sstefano_zampini     min_n = nnsp_addone+nnsp_size;
26123b03a366Sstefano_zampini     if (max_size_of_constraint < (nnsp_addone+nnsp_size)) {
26133b03a366Sstefano_zampini       min_n = max_size_of_constraint;
26143b03a366Sstefano_zampini       max_n = nnsp_addone+nnsp_size;
26153b03a366Sstefano_zampini     }
26163b03a366Sstefano_zampini     ierr = PetscMalloc(min_n*sizeof(PetscReal),&singular_vals);CHKERRQ(ierr);
26173b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
26183b03a366Sstefano_zampini     ierr = PetscMalloc(5*min_n*sizeof(PetscReal),&rwork);CHKERRQ(ierr);
26193b03a366Sstefano_zampini #endif
26203b03a366Sstefano_zampini     /* now we evaluate the optimal workspace using query with lwork=-1 */
26213b03a366Sstefano_zampini     lwork     =-1;
2622c5df96a5SBarry Smith     ierr      = PetscBLASIntCast(max_n,&Bs);CHKERRQ(ierr);
2623c5df96a5SBarry Smith     ierr      = PetscBLASIntCast(min_n,&Bt);CHKERRQ(ierr);
26243b03a366Sstefano_zampini     dummy_int = Bs;
2625670f3ff9SJed Brown     ierr      = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
26263b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
2627f75e95b9SBarry Smith     PetscStackCall("LAPACKgesvd",LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[0],&Bs,singular_vals,&dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,&temp_work,&lwork,&lierr));
26283b03a366Sstefano_zampini #else
2629f75e95b9SBarry Smith     PetscStackCall("LAPACKgesvd",LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[0],&Bs,singular_vals,&dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,&temp_work,&lwork,rwork,&lierr);
26303b03a366Sstefano_zampini #endif
26313b03a366Sstefano_zampini     if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SVD Lapack routine %d",(int)lierr);
2632670f3ff9SJed Brown     ierr = PetscFPTrapPop();CHKERRQ(ierr);
26333b03a366Sstefano_zampini #endif
26343b03a366Sstefano_zampini     /* Allocate optimal workspace */
2635c5df96a5SBarry Smith     ierr         = PetscBLASIntCast((PetscInt)PetscRealPart(temp_work),&lwork);CHKERRQ(ierr);
26363b03a366Sstefano_zampini     total_counts = (PetscInt)lwork;
26373b03a366Sstefano_zampini     ierr         = PetscMalloc(total_counts*sizeof(PetscScalar),&work);CHKERRQ(ierr);
26383b03a366Sstefano_zampini   }
26393b03a366Sstefano_zampini   /* get local part of global near null space vectors */
26403b03a366Sstefano_zampini   ierr = PetscMalloc(nnsp_size*sizeof(Vec),&localnearnullsp);CHKERRQ(ierr);
26413b03a366Sstefano_zampini   for (k=0; k<nnsp_size; k++) {
26423b03a366Sstefano_zampini     ierr = VecDuplicate(pcis->vec1_N,&localnearnullsp[k]);CHKERRQ(ierr);
2643fcda91b4SJed Brown     ierr = VecScatterBegin(matis->ctx,nearnullvecs[k],localnearnullsp[k],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
2644fcda91b4SJed Brown     ierr = VecScatterEnd  (matis->ctx,nearnullvecs[k],localnearnullsp[k],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
26453b03a366Sstefano_zampini   }
26463b03a366Sstefano_zampini   /* Now we can loop on constraining sets */
26473b03a366Sstefano_zampini   total_counts   =0;
26483b03a366Sstefano_zampini   temp_indices[0]=0;
2649da1bb401SStefano Zampini   /* vertices */
2650da1bb401SStefano Zampini   PetscBool used_vertex;
2651da1bb401SStefano Zampini   ierr = ISGetIndices(pcbddc->ISForVertices,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2652da1bb401SStefano Zampini   if (nnsp_has_cnst) { /* consider all vertices */
2653da1bb401SStefano Zampini     for (i=0; i<n_vertices; i++) {
2654da1bb401SStefano Zampini       temp_indices_to_constraint[temp_indices[total_counts]]  = is_indices[i];
2655534831adSStefano Zampini       temp_indices_to_constraint_B[temp_indices[total_counts]]= local_to_B[is_indices[i]];
2656da1bb401SStefano Zampini       temp_quadrature_constraint[temp_indices[total_counts]]  = 1.0;
2657da1bb401SStefano Zampini       temp_indices[total_counts+1]                            = temp_indices[total_counts]+1;
2658534831adSStefano Zampini       change_basis[total_counts]                              = PETSC_FALSE;
2659da1bb401SStefano Zampini       total_counts++;
2660da1bb401SStefano Zampini     }
2661da1bb401SStefano Zampini   } else { /* consider vertices for which exist at least a localnearnullsp which is not null there */
2662da1bb401SStefano Zampini     for (i=0; i<n_vertices; i++) {
2663da1bb401SStefano Zampini       used_vertex = PETSC_FALSE;
2664da1bb401SStefano Zampini       k           = 0;
2665da1bb401SStefano Zampini       while (!used_vertex && k<nnsp_size) {
2666da1bb401SStefano Zampini         ierr = VecGetArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
2667da1bb401SStefano Zampini         if (PetscAbsScalar(array_vector[is_indices[i]])>0.0) {
2668da1bb401SStefano Zampini           temp_indices_to_constraint[temp_indices[total_counts]]  =is_indices[i];
2669534831adSStefano Zampini           temp_indices_to_constraint_B[temp_indices[total_counts]]=local_to_B[is_indices[i]];
2670da1bb401SStefano Zampini           temp_quadrature_constraint[temp_indices[total_counts]]  =1.0;
2671da1bb401SStefano Zampini           temp_indices[total_counts+1]                            =temp_indices[total_counts]+1;
2672534831adSStefano Zampini           change_basis[total_counts]                              =PETSC_FALSE;
2673da1bb401SStefano Zampini           total_counts++;
2674da1bb401SStefano Zampini           used_vertex=PETSC_TRUE;
2675da1bb401SStefano Zampini         }
2676da1bb401SStefano Zampini         ierr = VecRestoreArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
2677da1bb401SStefano Zampini         k++;
2678da1bb401SStefano Zampini       }
2679da1bb401SStefano Zampini     }
2680da1bb401SStefano Zampini   }
2681da1bb401SStefano Zampini   ierr       = ISRestoreIndices(pcbddc->ISForVertices,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2682da1bb401SStefano Zampini   n_vertices = total_counts;
26832fa5cd67SKarl Rupp 
2684da1bb401SStefano Zampini   /* edges and faces */
26853b03a366Sstefano_zampini   for (i=0; i<pcbddc->n_ISForEdges+pcbddc->n_ISForFaces; i++) {
26863b03a366Sstefano_zampini     if (i<pcbddc->n_ISForEdges) {
26873b03a366Sstefano_zampini       used_IS     = &pcbddc->ISForEdges[i];
2688534831adSStefano Zampini       boolforface = pcbddc->usechangeofbasis;
26893b03a366Sstefano_zampini     } else {
26903b03a366Sstefano_zampini       used_IS     = &pcbddc->ISForFaces[i-pcbddc->n_ISForEdges];
2691534831adSStefano Zampini       boolforface = pcbddc->usechangeonfaces;
26923b03a366Sstefano_zampini     }
26933b03a366Sstefano_zampini     temp_constraints = 0;          /* zero the number of constraints I have on this conn comp */
26943b03a366Sstefano_zampini     temp_start_ptr   = total_counts; /* need to know the starting index of constraints stored */
26953b03a366Sstefano_zampini     ierr             = ISGetSize(*used_IS,&size_of_constraint);CHKERRQ(ierr);
26963b03a366Sstefano_zampini     ierr             = ISGetIndices(*used_IS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
26973b03a366Sstefano_zampini     if (nnsp_has_cnst) {
26983b03a366Sstefano_zampini       temp_constraints++;
2699534831adSStefano Zampini       quad_value = (PetscScalar) (1.0/PetscSqrtReal((PetscReal)size_of_constraint));
27003b03a366Sstefano_zampini       for (j=0; j<size_of_constraint; j++) {
27013b03a366Sstefano_zampini         temp_indices_to_constraint[temp_indices[total_counts]+j]  =is_indices[j];
2702534831adSStefano Zampini         temp_indices_to_constraint_B[temp_indices[total_counts]+j]=local_to_B[is_indices[j]];
27033b03a366Sstefano_zampini         temp_quadrature_constraint[temp_indices[total_counts]+j]  =quad_value;
27043b03a366Sstefano_zampini       }
27053b03a366Sstefano_zampini       temp_indices[total_counts+1]=temp_indices[total_counts]+size_of_constraint;  /* store new starting point */
2706534831adSStefano Zampini       change_basis[total_counts]  =boolforface;
27073b03a366Sstefano_zampini       total_counts++;
27083b03a366Sstefano_zampini     }
27093b03a366Sstefano_zampini     for (k=0; k<nnsp_size; k++) {
27103b03a366Sstefano_zampini       ierr = VecGetArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
27113b03a366Sstefano_zampini       for (j=0; j<size_of_constraint; j++) {
27123b03a366Sstefano_zampini         temp_indices_to_constraint[temp_indices[total_counts]+j]  =is_indices[j];
2713534831adSStefano Zampini         temp_indices_to_constraint_B[temp_indices[total_counts]+j]=local_to_B[is_indices[j]];
27143b03a366Sstefano_zampini         temp_quadrature_constraint[temp_indices[total_counts]+j]  =array_vector[is_indices[j]];
27153b03a366Sstefano_zampini       }
27163b03a366Sstefano_zampini       ierr       = VecRestoreArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
2717de534f79Sstefano_zampini       quad_value = 1.0;
2718de534f79Sstefano_zampini       if (use_nnsp_true) { /* check if array is null on the connected component in case use_nnsp_true has been requested */
2719c5df96a5SBarry Smith         ierr       = PetscBLASIntCast(size_of_constraint,&Bs);CHKERRQ(ierr);
2720a83cb05cSBarry Smith         PetscStackCall("BLASasum",quad_value = BLASasum_(&Bs,&temp_quadrature_constraint[temp_indices[total_counts]],&Bone));
2721de534f79Sstefano_zampini       }
2722de534f79Sstefano_zampini       if (quad_value > 0.0) { /* keep indices and values */
2723de534f79Sstefano_zampini         temp_constraints++;
27243b03a366Sstefano_zampini         temp_indices[total_counts+1]=temp_indices[total_counts]+size_of_constraint;  /* store new starting point */
2725534831adSStefano Zampini         change_basis[total_counts]  =boolforface;
27263b03a366Sstefano_zampini         total_counts++;
27273b03a366Sstefano_zampini       }
2728de534f79Sstefano_zampini     }
27293b03a366Sstefano_zampini     ierr = ISRestoreIndices(*used_IS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2730de534f79Sstefano_zampini     /* perform SVD on the constraint if use_nnsp_true has not be requested by the user */
27313b03a366Sstefano_zampini     if (!use_nnsp_true) {
2732c5df96a5SBarry Smith       ierr = PetscBLASIntCast(size_of_constraint,&Bs);CHKERRQ(ierr);
2733c5df96a5SBarry Smith       ierr = PetscBLASIntCast(temp_constraints,&Bt);CHKERRQ(ierr);
2734de534f79Sstefano_zampini 
27353b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
27363b03a366Sstefano_zampini       ierr = PetscMemzero(correlation_mat,Bt*Bt*sizeof(PetscScalar));CHKERRQ(ierr);
27373b03a366Sstefano_zampini       /* Store upper triangular part of correlation matrix */
27383b03a366Sstefano_zampini       for (j=0; j<temp_constraints; j++) {
27393b03a366Sstefano_zampini         for (k=0; k<j+1; k++) {
27403b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
27413425bc38SStefano Zampini           /* hand made complex dot product -> replace */
27423b03a366Sstefano_zampini           dot_result = 0.0;
27433b03a366Sstefano_zampini           for (ii=0; ii<size_of_constraint; ii++) {
27443b03a366Sstefano_zampini             val1        = temp_quadrature_constraint[temp_indices[temp_start_ptr+j]+ii];
27453b03a366Sstefano_zampini             val2        = temp_quadrature_constraint[temp_indices[temp_start_ptr+k]+ii];
27463b03a366Sstefano_zampini             dot_result += val1*PetscConj(val2);
27473b03a366Sstefano_zampini           }
27483b03a366Sstefano_zampini #else
2749a83cb05cSBarry Smith           PetscStackCall("BLASdot",dot_result = BLASdot_(&Bs,&temp_quadrature_constraint[temp_indices[temp_start_ptr+j]],&Bone,&temp_quadrature_constraint[temp_indices[temp_start_ptr+k]],&Bone));
27503b03a366Sstefano_zampini #endif
27513b03a366Sstefano_zampini           correlation_mat[j*temp_constraints+k]=dot_result;
27523b03a366Sstefano_zampini         }
27533b03a366Sstefano_zampini       }
27543425bc38SStefano Zampini       ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
27553b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
2756f75e95b9SBarry Smith       PetscStackCall("LAPACKsyevx",LAPACKsyevx_("V","A","U",&Bt,correlation_mat,&Bt,&dummy_real,&dummy_real,&dummy_int,&dummy_int,&abs_tol,&eigs_found,singular_vals,singular_vectors,&Bt,work,&lwork,iwork,ifail,&lierr));
27573b03a366Sstefano_zampini #else
275882f516ccSBarry Smith       SETERRQ(PetscObjectComm((PetscObject)pc), PETSC_ERR_SUP, "Not yet implemented for complexes when PETSC_MISSING_GESVD = 1");
27593b03a366Sstefano_zampini #endif
27603425bc38SStefano Zampini       if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYEVX Lapack routine %d",(int)lierr);
27613425bc38SStefano Zampini       ierr = PetscFPTrapPop();CHKERRQ(ierr);
27623b03a366Sstefano_zampini       /* retain eigenvalues greater than tol: note that lapack SYEV gives eigs in ascending order */
27633b03a366Sstefano_zampini       j=0;
27643b03a366Sstefano_zampini       while (j < Bt && singular_vals[j] < tol) j++;
27653b03a366Sstefano_zampini       total_counts=total_counts-j;
27663b03a366Sstefano_zampini       if (j<temp_constraints) {
27672fa5cd67SKarl Rupp         for (k=j;k<Bt;k++) singular_vals[k]=1.0/PetscSqrtReal(singular_vals[k]);
27683425bc38SStefano Zampini         ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
2769a83cb05cSBarry Smith         PetscStackCall("BLASgemm",BLASgemm_("N","N",&Bs,&Bt,&Bt,&one,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,correlation_mat,&Bt,&zero,temp_basis,&Bs));
27703425bc38SStefano Zampini         ierr = PetscFPTrapPop();CHKERRQ(ierr);
27713b03a366Sstefano_zampini         /* copy POD basis into used quadrature memory */
27723b03a366Sstefano_zampini         for (k=0;k<Bt-j;k++) {
27733b03a366Sstefano_zampini           for (ii=0;ii<size_of_constraint;ii++) {
27743b03a366Sstefano_zampini             temp_quadrature_constraint[temp_indices[temp_start_ptr+k]+ii]=singular_vals[Bt-1-k]*temp_basis[(Bt-1-k)*size_of_constraint+ii];
27753b03a366Sstefano_zampini           }
27763b03a366Sstefano_zampini         }
27773b03a366Sstefano_zampini       }
2778de534f79Sstefano_zampini 
27793b03a366Sstefano_zampini #else  /* on missing GESVD */
27803b03a366Sstefano_zampini       PetscInt min_n = temp_constraints;
27813b03a366Sstefano_zampini       if (min_n > size_of_constraint) min_n = size_of_constraint;
27823b03a366Sstefano_zampini       dummy_int = Bs;
2783670f3ff9SJed Brown       ierr      = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
27843b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
2785f75e95b9SBarry Smith       PetscStackCall("LAPACKgesvd",LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,singular_vals,&dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,work,&lwork,&lierr));
27863b03a366Sstefano_zampini #else
2787f75e95b9SBarry Smith       PetscStackCall("LAPACKgesvd",LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,singular_vals,&dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,work,&lwork,rwork,&lierr);
27883b03a366Sstefano_zampini #endif
27893b03a366Sstefano_zampini       if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SVD Lapack routine %d",(int)lierr);
2790670f3ff9SJed Brown       ierr = PetscFPTrapPop();CHKERRQ(ierr);
27913b03a366Sstefano_zampini       /* retain eigenvalues greater than tol: note that lapack SVD gives eigs in descending order */
27923b03a366Sstefano_zampini       j=0;
27933b03a366Sstefano_zampini       while (j < min_n && singular_vals[min_n-j-1] < tol) j++;
27943b03a366Sstefano_zampini       total_counts = total_counts-(PetscInt)Bt+(min_n-j);
27953b03a366Sstefano_zampini #endif
27963b03a366Sstefano_zampini     }
27973b03a366Sstefano_zampini   }
2798534831adSStefano Zampini 
2799da1bb401SStefano Zampini   n_constraints     =total_counts-n_vertices;
2800da1bb401SStefano Zampini   local_primal_size = total_counts;
28013b03a366Sstefano_zampini   /* set quantities in pcbddc data structure */
28023b03a366Sstefano_zampini   pcbddc->n_vertices        = n_vertices;
28033b03a366Sstefano_zampini   pcbddc->n_constraints     = n_constraints;
2804da1bb401SStefano Zampini   pcbddc->local_primal_size = local_primal_size;
2805534831adSStefano Zampini 
2806534831adSStefano Zampini   /* Create constraint matrix */
2807534831adSStefano Zampini   /* The constraint matrix is used to compute the l2g map of primal dofs */
2808534831adSStefano Zampini   /* so we need to set it up properly either with or without change of basis */
2809534831adSStefano Zampini   ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->ConstraintMatrix);CHKERRQ(ierr);
2810534831adSStefano Zampini   ierr = MatSetType(pcbddc->ConstraintMatrix,impMatType);CHKERRQ(ierr);
2811534831adSStefano Zampini   ierr = MatSetSizes(pcbddc->ConstraintMatrix,local_primal_size,pcis->n,local_primal_size,pcis->n);CHKERRQ(ierr);
28122fa5cd67SKarl Rupp 
2813534831adSStefano Zampini   /* compute a local numbering of constraints : vertices first then constraints */
2814534831adSStefano Zampini   ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
2815534831adSStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array_vector);CHKERRQ(ierr);
2816534831adSStefano Zampini   ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&aux_primal_numbering);CHKERRQ(ierr);
2817534831adSStefano Zampini   ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&aux_primal_permutation);CHKERRQ(ierr);
28182fa5cd67SKarl Rupp 
2819534831adSStefano Zampini   total_counts=0;
28202fa5cd67SKarl Rupp 
2821534831adSStefano Zampini   /* find vertices: subdomain corners plus dofs with basis changed */
2822534831adSStefano Zampini   for (i=0; i<local_primal_size; i++) {
2823534831adSStefano Zampini     size_of_constraint=temp_indices[i+1]-temp_indices[i];
2824534831adSStefano Zampini     if (change_basis[i] || size_of_constraint == 1) {
2825534831adSStefano Zampini       k=0;
2826534831adSStefano Zampini       while (k < size_of_constraint && array_vector[temp_indices_to_constraint[temp_indices[i]+size_of_constraint-k-1]] != 0.0) {
2827534831adSStefano Zampini         k=k+1;
2828534831adSStefano Zampini       }
2829534831adSStefano Zampini       j = temp_indices_to_constraint[temp_indices[i]+size_of_constraint-k-1];
28302fa5cd67SKarl Rupp 
2831534831adSStefano Zampini       array_vector[j]                      = 1.0;
2832534831adSStefano Zampini       aux_primal_numbering[total_counts]   = j;
2833534831adSStefano Zampini       aux_primal_permutation[total_counts] = total_counts;
2834534831adSStefano Zampini       total_counts++;
2835534831adSStefano Zampini     }
2836534831adSStefano Zampini   }
2837534831adSStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array_vector);CHKERRQ(ierr);
2838534831adSStefano Zampini   /* permute indices in order to have a sorted set of vertices */
2839534831adSStefano Zampini   ierr = PetscSortIntWithPermutation(total_counts,aux_primal_numbering,aux_primal_permutation);
2840534831adSStefano Zampini   /* nonzero structure */
2841534831adSStefano Zampini   ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
28422fa5cd67SKarl Rupp   for (i=0;i<total_counts;i++) nnz[i]=1;
28432fa5cd67SKarl Rupp 
2844534831adSStefano Zampini   j=total_counts;
2845534831adSStefano Zampini   for (i=n_vertices; i<local_primal_size; i++) {
2846534831adSStefano Zampini     if (!change_basis[i]) {
2847534831adSStefano Zampini       nnz[j]=temp_indices[i+1]-temp_indices[i];
2848534831adSStefano Zampini       j++;
2849534831adSStefano Zampini     }
2850534831adSStefano Zampini   }
2851534831adSStefano Zampini   ierr = MatSeqAIJSetPreallocation(pcbddc->ConstraintMatrix,0,nnz);CHKERRQ(ierr);
2852534831adSStefano Zampini   ierr = PetscFree(nnz);CHKERRQ(ierr);
2853534831adSStefano Zampini   /* set values in constraint matrix */
2854534831adSStefano Zampini   for (i=0; i<total_counts; i++) {
2855534831adSStefano Zampini     j    = aux_primal_permutation[i];
2856534831adSStefano Zampini     k    = aux_primal_numbering[j];
2857534831adSStefano Zampini     ierr = MatSetValue(pcbddc->ConstraintMatrix,i,k,1.0,INSERT_VALUES);CHKERRQ(ierr);
2858534831adSStefano Zampini   }
2859534831adSStefano Zampini   for (i=n_vertices; i<local_primal_size; i++) {
2860534831adSStefano Zampini     if (!change_basis[i]) {
2861534831adSStefano Zampini       size_of_constraint = temp_indices[i+1]-temp_indices[i];
2862534831adSStefano Zampini       ierr               = MatSetValues(pcbddc->ConstraintMatrix,1,&total_counts,size_of_constraint,&temp_indices_to_constraint[temp_indices[i]],&temp_quadrature_constraint[temp_indices[i]],INSERT_VALUES);CHKERRQ(ierr);
2863534831adSStefano Zampini       total_counts++;
2864534831adSStefano Zampini     }
2865534831adSStefano Zampini   }
2866534831adSStefano Zampini   ierr = PetscFree(aux_primal_numbering);CHKERRQ(ierr);
2867534831adSStefano Zampini   ierr = PetscFree(aux_primal_permutation);CHKERRQ(ierr);
2868534831adSStefano Zampini   /* assembling */
2869534831adSStefano Zampini   ierr = MatAssemblyBegin(pcbddc->ConstraintMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2870534831adSStefano Zampini   ierr = MatAssemblyEnd(pcbddc->ConstraintMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2871534831adSStefano Zampini 
2872534831adSStefano Zampini   /* Create matrix for change of basis. We don't need it in case pcbddc->usechangeofbasis is FALSE */
2873534831adSStefano Zampini   if (pcbddc->usechangeofbasis) {
2874534831adSStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr);
2875534831adSStefano Zampini     ierr = MatSetType(pcbddc->ChangeOfBasisMatrix,impMatType);CHKERRQ(ierr);
2876534831adSStefano Zampini     ierr = MatSetSizes(pcbddc->ChangeOfBasisMatrix,pcis->n_B,pcis->n_B,pcis->n_B,pcis->n_B);CHKERRQ(ierr);
2877534831adSStefano Zampini     /* work arrays */
2878534831adSStefano Zampini     /* we need to reuse these arrays, so we free them */
2879534831adSStefano Zampini     ierr = PetscFree(temp_basis);CHKERRQ(ierr);
2880534831adSStefano Zampini     ierr = PetscFree(work);CHKERRQ(ierr);
2881534831adSStefano Zampini     ierr = PetscMalloc(pcis->n_B*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
2882534831adSStefano Zampini     ierr = PetscMalloc((nnsp_addone+nnsp_size)*(nnsp_addone+nnsp_size)*sizeof(PetscScalar),&temp_basis);CHKERRQ(ierr);
2883534831adSStefano Zampini     ierr = PetscMalloc((nnsp_addone+nnsp_size)*sizeof(PetscScalar),&work);CHKERRQ(ierr);
2884534831adSStefano Zampini     ierr = PetscMalloc((nnsp_addone+nnsp_size)*sizeof(PetscBLASInt),&ipiv);CHKERRQ(ierr);
28852fa5cd67SKarl Rupp     for (i=0;i<pcis->n_B;i++) nnz[i]=1;
28862fa5cd67SKarl Rupp 
2887534831adSStefano Zampini     /* Overestimated nonzeros per row */
2888534831adSStefano Zampini     k=1;
2889534831adSStefano Zampini     for (i=pcbddc->n_vertices;i<local_primal_size;i++) {
2890534831adSStefano Zampini       if (change_basis[i]) {
2891534831adSStefano Zampini         size_of_constraint = temp_indices[i+1]-temp_indices[i];
28922fa5cd67SKarl Rupp         if (k < size_of_constraint) k = size_of_constraint;
28932fa5cd67SKarl Rupp 
2894534831adSStefano Zampini         for (j=0;j<size_of_constraint;j++) {
2895534831adSStefano Zampini           nnz[temp_indices_to_constraint_B[temp_indices[i]+j]] = size_of_constraint;
2896534831adSStefano Zampini         }
2897534831adSStefano Zampini       }
2898534831adSStefano Zampini     }
2899534831adSStefano Zampini     ierr = MatSeqAIJSetPreallocation(pcbddc->ChangeOfBasisMatrix,0,nnz);CHKERRQ(ierr);
2900534831adSStefano Zampini     ierr = PetscFree(nnz);CHKERRQ(ierr);
2901534831adSStefano Zampini     /* Temporary array to store indices */
2902534831adSStefano Zampini     ierr = PetscMalloc(k*sizeof(PetscInt),&is_indices);CHKERRQ(ierr);
2903534831adSStefano Zampini     /* Set initial identity in the matrix */
2904534831adSStefano Zampini     for (i=0; i<pcis->n_B; i++) {
2905534831adSStefano Zampini       ierr = MatSetValue(pcbddc->ChangeOfBasisMatrix,i,i,1.0,INSERT_VALUES);CHKERRQ(ierr);
2906534831adSStefano Zampini     }
2907534831adSStefano Zampini     /* Now we loop on the constraints which need a change of basis */
2908534831adSStefano Zampini     /* Change of basis matrix is evaluated as the FIRST APPROACH in */
2909534831adSStefano Zampini     /* Klawonn and Widlund, Dual-primal FETI-DP methods for linear elasticity, (6.2.1) */
2910534831adSStefano Zampini     temp_constraints = 0;
291193dc3b60SStefano Zampini     if (pcbddc->n_vertices < local_primal_size) {
2912534831adSStefano Zampini       temp_start_ptr = temp_indices_to_constraint_B[temp_indices[pcbddc->n_vertices]];
291393dc3b60SStefano Zampini     }
2914534831adSStefano Zampini     for (i=pcbddc->n_vertices; i<local_primal_size; i++) {
2915534831adSStefano Zampini       if (change_basis[i]) {
2916534831adSStefano Zampini         compute_submatrix = PETSC_FALSE;
2917534831adSStefano Zampini         useksp            = PETSC_FALSE;
2918534831adSStefano Zampini         if (temp_start_ptr == temp_indices_to_constraint_B[temp_indices[i]]) {
2919534831adSStefano Zampini           temp_constraints++;
292004eaf177SStefano Zampini           if (i == local_primal_size -1 ||  temp_start_ptr != temp_indices_to_constraint_B[temp_indices[i+1]]) {
2921534831adSStefano Zampini             compute_submatrix = PETSC_TRUE;
2922534831adSStefano Zampini           }
2923534831adSStefano Zampini         }
2924534831adSStefano Zampini         if (compute_submatrix) {
29252fa5cd67SKarl Rupp           if (temp_constraints > 1 || pcbddc->use_nnsp_true) useksp = PETSC_TRUE;
2926534831adSStefano Zampini           size_of_constraint = temp_indices[i+1]-temp_indices[i];
2927534831adSStefano Zampini           if (useksp) { /* experimental */
2928534831adSStefano Zampini             ierr = MatCreate(PETSC_COMM_SELF,&temp_mat);CHKERRQ(ierr);
2929534831adSStefano Zampini             ierr = MatSetType(temp_mat,impMatType);CHKERRQ(ierr);
2930534831adSStefano Zampini             ierr = MatSetSizes(temp_mat,size_of_constraint,size_of_constraint,size_of_constraint,size_of_constraint);CHKERRQ(ierr);
29310298fd71SBarry Smith             ierr = MatSeqAIJSetPreallocation(temp_mat,size_of_constraint,NULL);CHKERRQ(ierr);
2932534831adSStefano Zampini           }
2933534831adSStefano Zampini           /* First _size_of_constraint-temp_constraints_ columns */
2934534831adSStefano Zampini           dual_dofs        = size_of_constraint-temp_constraints;
2935534831adSStefano Zampini           start_constraint = i+1-temp_constraints;
2936534831adSStefano Zampini           for (s=0; s<dual_dofs; s++) {
2937534831adSStefano Zampini             is_indices[0] = s;
2938534831adSStefano Zampini             for (j=0;j<temp_constraints;j++) {
2939534831adSStefano Zampini               for (k=0;k<temp_constraints;k++) {
2940534831adSStefano Zampini                 temp_basis[j*temp_constraints+k]=temp_quadrature_constraint[temp_indices[start_constraint+k]+s+j+1];
2941534831adSStefano Zampini               }
2942534831adSStefano Zampini               work[j]         = -temp_quadrature_constraint[temp_indices[start_constraint+j]+s];
2943534831adSStefano Zampini               is_indices[j+1] = s+j+1;
2944534831adSStefano Zampini             }
2945534831adSStefano Zampini             Bt   = temp_constraints;
2946534831adSStefano Zampini             ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
2947f75e95b9SBarry Smith             PetscStackCall("LAPACKgesvd",LAPACKgesv_(&Bt,&Bone,temp_basis,&Bt,ipiv,work,&Bt,&lierr));
2948534831adSStefano Zampini             if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GESV Lapack routine %d",(int)lierr);
2949534831adSStefano Zampini             ierr = PetscFPTrapPop();CHKERRQ(ierr);
2950534831adSStefano Zampini             j    = temp_indices_to_constraint_B[temp_indices[start_constraint]+s];
2951534831adSStefano Zampini             ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,temp_constraints,&temp_indices_to_constraint_B[temp_indices[start_constraint]+s+1],1,&j,work,INSERT_VALUES);CHKERRQ(ierr);
2952534831adSStefano Zampini             if (useksp) {
2953534831adSStefano Zampini               /* temp mat with transposed rows and columns */
2954534831adSStefano Zampini               ierr = MatSetValues(temp_mat,1,&s,temp_constraints,&is_indices[1],work,INSERT_VALUES);CHKERRQ(ierr);
2955534831adSStefano Zampini               ierr = MatSetValue(temp_mat,is_indices[0],is_indices[0],1.0,INSERT_VALUES);CHKERRQ(ierr);
2956534831adSStefano Zampini             }
2957534831adSStefano Zampini           }
2958534831adSStefano Zampini           if (useksp) {
2959534831adSStefano Zampini             /* last rows of temp_mat */
29602fa5cd67SKarl Rupp             for (j=0;j<size_of_constraint;j++) is_indices[j] = j;
29612fa5cd67SKarl Rupp 
2962534831adSStefano Zampini             for (s=0;s<temp_constraints;s++) {
2963534831adSStefano Zampini               k = s + dual_dofs;
2964534831adSStefano Zampini               ierr = MatSetValues(temp_mat,1,&k,size_of_constraint,is_indices,&temp_quadrature_constraint[temp_indices[start_constraint+s]],INSERT_VALUES);CHKERRQ(ierr);
2965534831adSStefano Zampini             }
2966534831adSStefano Zampini             ierr = MatAssemblyBegin(temp_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2967534831adSStefano Zampini             ierr = MatAssemblyEnd(temp_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
29680298fd71SBarry Smith             ierr = MatGetVecs(temp_mat,&temp_vec,NULL);CHKERRQ(ierr);
2969534831adSStefano Zampini             ierr = KSPCreate(PETSC_COMM_SELF,&temp_ksp);CHKERRQ(ierr);
2970534831adSStefano Zampini             ierr = KSPSetOperators(temp_ksp,temp_mat,temp_mat,SAME_PRECONDITIONER);CHKERRQ(ierr);
2971534831adSStefano Zampini             ierr = KSPSetType(temp_ksp,KSPPREONLY);CHKERRQ(ierr);
2972ffe5efe1SStefano Zampini             ierr = KSPGetPC(temp_ksp,&temp_pc);CHKERRQ(ierr);
2973ffe5efe1SStefano Zampini             ierr = PCSetType(temp_pc,PCLU);CHKERRQ(ierr);
2974534831adSStefano Zampini             ierr = KSPSetUp(temp_ksp);CHKERRQ(ierr);
2975534831adSStefano Zampini             for (s=0; s<temp_constraints; s++) {
2976534831adSStefano Zampini               ierr = VecSet(temp_vec,0.0);CHKERRQ(ierr);
2977534831adSStefano Zampini               ierr = VecSetValue(temp_vec,s+dual_dofs,1.0,INSERT_VALUES);CHKERRQ(ierr);
2978534831adSStefano Zampini               ierr = VecAssemblyBegin(temp_vec);CHKERRQ(ierr);
2979534831adSStefano Zampini               ierr = VecAssemblyEnd(temp_vec);CHKERRQ(ierr);
2980534831adSStefano Zampini               ierr = KSPSolve(temp_ksp,temp_vec,temp_vec);CHKERRQ(ierr);
2981534831adSStefano Zampini               ierr = VecGetArray(temp_vec,&array_vector);CHKERRQ(ierr);
2982534831adSStefano Zampini               j    = temp_indices_to_constraint_B[temp_indices[start_constraint+s]+size_of_constraint-s-1];
2983534831adSStefano Zampini               /* last columns of change of basis matrix associated to new primal dofs */
2984534831adSStefano Zampini               ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,size_of_constraint,&temp_indices_to_constraint_B[temp_indices[start_constraint+s]],1,&j,array_vector,INSERT_VALUES);CHKERRQ(ierr);
2985534831adSStefano Zampini               ierr = VecRestoreArray(temp_vec,&array_vector);CHKERRQ(ierr);
2986534831adSStefano Zampini             }
2987534831adSStefano Zampini             ierr = MatDestroy(&temp_mat);CHKERRQ(ierr);
2988534831adSStefano Zampini             ierr = KSPDestroy(&temp_ksp);CHKERRQ(ierr);
2989534831adSStefano Zampini             ierr = VecDestroy(&temp_vec);CHKERRQ(ierr);
2990534831adSStefano Zampini           } else {
2991534831adSStefano Zampini             /* last columns of change of basis matrix associated to new primal dofs */
2992534831adSStefano Zampini             for (s=0; s<temp_constraints; s++) {
2993534831adSStefano Zampini               j    = temp_indices_to_constraint_B[temp_indices[start_constraint+s]+size_of_constraint-s-1];
2994534831adSStefano Zampini               ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,size_of_constraint,&temp_indices_to_constraint_B[temp_indices[start_constraint+s]],1,&j,&temp_quadrature_constraint[temp_indices[start_constraint+s]],INSERT_VALUES);CHKERRQ(ierr);
2995534831adSStefano Zampini             }
2996534831adSStefano Zampini           }
2997534831adSStefano Zampini           /* prepare for the next cycle */
2998534831adSStefano Zampini           temp_constraints = 0;
29992fa5cd67SKarl Rupp           if (i != local_primal_size -1) temp_start_ptr = temp_indices_to_constraint_B[temp_indices[i+1]];
3000534831adSStefano Zampini         }
3001534831adSStefano Zampini       }
300204eaf177SStefano Zampini     }
3003534831adSStefano Zampini     /* assembling */
3004534831adSStefano Zampini     ierr = MatAssemblyBegin(pcbddc->ChangeOfBasisMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
3005534831adSStefano Zampini     ierr = MatAssemblyEnd(pcbddc->ChangeOfBasisMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
3006534831adSStefano Zampini     ierr = PetscFree(ipiv);CHKERRQ(ierr);
3007534831adSStefano Zampini     ierr = PetscFree(is_indices);CHKERRQ(ierr);
3008534831adSStefano Zampini   }
30093b03a366Sstefano_zampini   /* free workspace no longer needed */
30103b03a366Sstefano_zampini   ierr = PetscFree(rwork);CHKERRQ(ierr);
30113b03a366Sstefano_zampini   ierr = PetscFree(work);CHKERRQ(ierr);
30123b03a366Sstefano_zampini   ierr = PetscFree(temp_basis);CHKERRQ(ierr);
30133b03a366Sstefano_zampini   ierr = PetscFree(singular_vals);CHKERRQ(ierr);
30143b03a366Sstefano_zampini   ierr = PetscFree(correlation_mat);CHKERRQ(ierr);
30153b03a366Sstefano_zampini   ierr = PetscFree(temp_indices);CHKERRQ(ierr);
3016534831adSStefano Zampini   ierr = PetscFree(change_basis);CHKERRQ(ierr);
30173b03a366Sstefano_zampini   ierr = PetscFree(temp_indices_to_constraint);CHKERRQ(ierr);
3018534831adSStefano Zampini   ierr = PetscFree(temp_indices_to_constraint_B);CHKERRQ(ierr);
3019534831adSStefano Zampini   ierr = PetscFree(local_to_B);CHKERRQ(ierr);
30203b03a366Sstefano_zampini   ierr = PetscFree(temp_quadrature_constraint);CHKERRQ(ierr);
30213425bc38SStefano Zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
30223425bc38SStefano Zampini   ierr = PetscFree(iwork);CHKERRQ(ierr);
30233425bc38SStefano Zampini   ierr = PetscFree(ifail);CHKERRQ(ierr);
30243425bc38SStefano Zampini   ierr = PetscFree(singular_vectors);CHKERRQ(ierr);
30253425bc38SStefano Zampini #endif
3026da1bb401SStefano Zampini   for (k=0; k<nnsp_size; k++) {
3027da1bb401SStefano Zampini     ierr = VecDestroy(&localnearnullsp[k]);CHKERRQ(ierr);
3028da1bb401SStefano Zampini   }
30293b03a366Sstefano_zampini   ierr = PetscFree(localnearnullsp);CHKERRQ(ierr);
30303b03a366Sstefano_zampini   PetscFunctionReturn(0);
30313b03a366Sstefano_zampini }
30323b03a366Sstefano_zampini /* -------------------------------------------------------------------------- */
30330c7d97c5SJed Brown #undef __FUNCT__
30340c7d97c5SJed Brown #define __FUNCT__ "PCBDDCCoarseSetUp"
303553cdbc3dSStefano Zampini static PetscErrorCode PCBDDCCoarseSetUp(PC pc)
30360c7d97c5SJed Brown {
30370c7d97c5SJed Brown   PetscErrorCode ierr;
30380c7d97c5SJed Brown   PC_IS          *pcis    = (PC_IS*)(pc->data);
30390c7d97c5SJed Brown   PC_BDDC        *pcbddc  = (PC_BDDC*)pc->data;
30400c7d97c5SJed Brown   Mat_IS         *matis   = (Mat_IS*)pc->pmat->data;
3041534831adSStefano Zampini   Mat            change_mat_all;
30420c7d97c5SJed Brown   IS             is_R_local;
30430c7d97c5SJed Brown   IS             is_V_local;
30440c7d97c5SJed Brown   IS             is_C_local;
30450c7d97c5SJed Brown   IS             is_aux1;
30460c7d97c5SJed Brown   IS             is_aux2;
304719fd82e9SBarry Smith   VecType        impVecType;
304819fd82e9SBarry Smith   MatType        impMatType;
30490c7d97c5SJed Brown   PetscInt       n_R  =0;
30500c7d97c5SJed Brown   PetscInt       n_D  =0;
30510c7d97c5SJed Brown   PetscInt       n_B  =0;
30520c7d97c5SJed Brown   PetscScalar    zero =0.0;
30530c7d97c5SJed Brown   PetscScalar    one  =1.0;
30540c7d97c5SJed Brown   PetscScalar    m_one=-1.0;
30550c7d97c5SJed Brown   PetscScalar    * array;
30560c7d97c5SJed Brown   PetscScalar    *coarse_submat_vals;
30570c7d97c5SJed Brown   PetscInt       *idx_R_local;
30580c7d97c5SJed Brown   PetscInt       *idx_V_B;
30590c7d97c5SJed Brown   PetscScalar    *coarsefunctions_errors;
30600c7d97c5SJed Brown   PetscScalar    *constraints_errors;
30612fa5cd67SKarl Rupp 
30620c7d97c5SJed Brown   /* auxiliary indices */
3063534831adSStefano Zampini   PetscInt i,j,k;
30642fa5cd67SKarl Rupp 
3065e269702eSStefano Zampini   /* for verbose output of bddc */
3066e269702eSStefano Zampini   PetscViewer viewer  =pcbddc->dbg_viewer;
3067e269702eSStefano Zampini   PetscBool   dbg_flag=pcbddc->dbg_flag;
30682fa5cd67SKarl Rupp 
3069a0ba757dSStefano Zampini   /* for counting coarse dofs */
3070534831adSStefano Zampini   PetscInt    n_vertices,n_constraints;
30713b03a366Sstefano_zampini   PetscInt    size_of_constraint;
30723b03a366Sstefano_zampini   PetscInt    *row_cmat_indices;
30733b03a366Sstefano_zampini   PetscScalar *row_cmat_values;
3074534831adSStefano Zampini   PetscInt    *vertices,*nnz,*is_indices,*temp_indices;
30750c7d97c5SJed Brown 
30760c7d97c5SJed Brown   PetscFunctionBegin;
30770c7d97c5SJed Brown   /* Set Non-overlapping dimensions */
30780c7d97c5SJed Brown   n_B = pcis->n_B; n_D = pcis->n - n_B;
3079534831adSStefano Zampini   /* Set types for local objects needed by BDDC preconditioner */
3080534831adSStefano Zampini   impMatType = MATSEQDENSE;
3081534831adSStefano Zampini   impVecType = VECSEQ;
30822fa5cd67SKarl Rupp 
3083da1bb401SStefano Zampini   /* get vertex indices from constraint matrix */
3084534831adSStefano Zampini   ierr      = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscInt),&vertices);CHKERRQ(ierr);
3085534831adSStefano Zampini   n_vertices=0;
3086da1bb401SStefano Zampini   for (i=0; i<pcbddc->local_primal_size; i++) {
30870298fd71SBarry Smith     ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,NULL);CHKERRQ(ierr);
3088da1bb401SStefano Zampini     if (size_of_constraint == 1) {
3089534831adSStefano Zampini       vertices[n_vertices]=row_cmat_indices[0];
3090534831adSStefano Zampini       n_vertices++;
3091a0ba757dSStefano Zampini     }
30920298fd71SBarry Smith     ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,NULL);CHKERRQ(ierr);
3093a0ba757dSStefano Zampini   }
3094534831adSStefano Zampini   /* Set number of constraints */
3095534831adSStefano Zampini   n_constraints = pcbddc->local_primal_size-n_vertices;
3096534831adSStefano Zampini 
3097534831adSStefano Zampini   /* vertices in boundary numbering */
3098534831adSStefano Zampini   if (n_vertices) {
3099534831adSStefano Zampini     ierr = VecSet(pcis->vec1_N,m_one);CHKERRQ(ierr);
3100534831adSStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
31012fa5cd67SKarl Rupp     for (i=0; i<n_vertices; i++) array[vertices[i]] = i;
3102534831adSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3103534831adSStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3104534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3105534831adSStefano Zampini     ierr = PetscMalloc(n_vertices*sizeof(PetscInt),&idx_V_B);CHKERRQ(ierr);
3106534831adSStefano Zampini     ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
3107534831adSStefano Zampini     for (i=0; i<n_vertices; i++) {
3108534831adSStefano Zampini       j=0;
31092fa5cd67SKarl Rupp       while (array[j] != i) j++;
3110534831adSStefano Zampini       idx_V_B[i]=j;
3111534831adSStefano Zampini     }
3112534831adSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
3113534831adSStefano Zampini   }
3114534831adSStefano Zampini 
3115534831adSStefano Zampini   /* transform local matrices if needed */
3116534831adSStefano Zampini   if (pcbddc->usechangeofbasis) {
3117534831adSStefano Zampini     ierr = PetscMalloc(pcis->n*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
3118534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
31192fa5cd67SKarl Rupp     for (i=0;i<n_D;i++) nnz[is_indices[i]] = 1;
3120534831adSStefano Zampini     ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
3121534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
3122534831adSStefano Zampini     k=1;
3123534831adSStefano Zampini     for (i=0;i<n_B;i++) {
31240298fd71SBarry Smith       ierr = MatGetRow(pcbddc->ChangeOfBasisMatrix,i,&j,NULL,NULL);CHKERRQ(ierr);
3125534831adSStefano Zampini       nnz[is_indices[i]]=j;
31262fa5cd67SKarl Rupp       if (k < j) k = j;
31270298fd71SBarry Smith       ierr = MatRestoreRow(pcbddc->ChangeOfBasisMatrix,i,&j,NULL,NULL);CHKERRQ(ierr);
3128534831adSStefano Zampini     }
3129534831adSStefano Zampini     ierr = ISRestoreIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
3130534831adSStefano Zampini     /* assemble change of basis matrix on the whole set of local dofs */
3131534831adSStefano Zampini     ierr = PetscMalloc(k*sizeof(PetscInt),&temp_indices);CHKERRQ(ierr);
3132534831adSStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&change_mat_all);CHKERRQ(ierr);
3133534831adSStefano Zampini     ierr = MatSetSizes(change_mat_all,pcis->n,pcis->n,pcis->n,pcis->n);CHKERRQ(ierr);
3134534831adSStefano Zampini     ierr = MatSetType(change_mat_all,MATSEQAIJ);CHKERRQ(ierr);
3135534831adSStefano Zampini     ierr = MatSeqAIJSetPreallocation(change_mat_all,0,nnz);CHKERRQ(ierr);
3136534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
3137534831adSStefano Zampini     for (i=0; i<n_D; i++) {
3138534831adSStefano Zampini       ierr = MatSetValue(change_mat_all,is_indices[i],is_indices[i],1.0,INSERT_VALUES);CHKERRQ(ierr);
3139534831adSStefano Zampini     }
3140534831adSStefano Zampini     ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
3141534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
3142534831adSStefano Zampini     for (i=0; i<n_B; i++) {
3143534831adSStefano Zampini       ierr = MatGetRow(pcbddc->ChangeOfBasisMatrix,i,&j,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
31442fa5cd67SKarl Rupp       for (k=0; k<j; k++) temp_indices[k]=is_indices[row_cmat_indices[k]];
3145534831adSStefano Zampini       ierr = MatSetValues(change_mat_all,1,&is_indices[i],j,temp_indices,row_cmat_values,INSERT_VALUES);CHKERRQ(ierr);
3146534831adSStefano Zampini       ierr = MatRestoreRow(pcbddc->ChangeOfBasisMatrix,i,&j,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
3147534831adSStefano Zampini     }
3148534831adSStefano Zampini     ierr = MatAssemblyBegin(change_mat_all,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
3149534831adSStefano Zampini     ierr = MatAssemblyEnd(change_mat_all,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
3150534831adSStefano Zampini     ierr = MatPtAP(matis->A,change_mat_all,MAT_INITIAL_MATRIX,1.0,&pcbddc->local_mat);CHKERRQ(ierr);
3151534831adSStefano Zampini     ierr = MatDestroy(&pcis->A_IB);CHKERRQ(ierr);
3152534831adSStefano Zampini     ierr = MatDestroy(&pcis->A_BI);CHKERRQ(ierr);
3153534831adSStefano Zampini     ierr = MatDestroy(&pcis->A_BB);CHKERRQ(ierr);
3154534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_I_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&pcis->A_IB);CHKERRQ(ierr);
3155534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_B_local,pcis->is_I_local,MAT_INITIAL_MATRIX,&pcis->A_BI);CHKERRQ(ierr);
3156534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_B_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&pcis->A_BB);CHKERRQ(ierr);
3157534831adSStefano Zampini     ierr = MatDestroy(&change_mat_all);CHKERRQ(ierr);
3158534831adSStefano Zampini     ierr = PetscFree(nnz);CHKERRQ(ierr);
3159534831adSStefano Zampini     ierr = PetscFree(temp_indices);CHKERRQ(ierr);
3160534831adSStefano Zampini   } else {
3161534831adSStefano Zampini     /* without change of basis, the local matrix is unchanged */
3162534831adSStefano Zampini     ierr = PetscObjectReference((PetscObject)matis->A);CHKERRQ(ierr);
31632fa5cd67SKarl Rupp 
3164534831adSStefano Zampini     pcbddc->local_mat = matis->A;
3165534831adSStefano Zampini   }
31660bdf917eSStefano Zampini   /* Change global null space passed in by the user if change of basis has been performed */
31670bdf917eSStefano Zampini   if (pcbddc->NullSpace && pcbddc->usechangeofbasis) {
31680bdf917eSStefano Zampini     ierr = PCBDDCAdaptNullSpace(pc);CHKERRQ(ierr);
31690bdf917eSStefano Zampini   }
3170a0ba757dSStefano Zampini 
31710c7d97c5SJed Brown   /* Dohrmann's notation: dofs split into R (Remaining: all dofs but the vertices) and V (Vertices) */
31720c7d97c5SJed Brown   ierr = VecSet(pcis->vec1_N,one);CHKERRQ(ierr);
31730c7d97c5SJed Brown   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
31742fa5cd67SKarl Rupp   for (i=0;i<n_vertices;i++) array[vertices[i]] = zero;
31753b03a366Sstefano_zampini   ierr = PetscMalloc((pcis->n - n_vertices)*sizeof(PetscInt),&idx_R_local);CHKERRQ(ierr);
31762fa5cd67SKarl Rupp   for (i=0, n_R=0; i<pcis->n; i++) {
31772fa5cd67SKarl Rupp     if (array[i] == one) {
31782fa5cd67SKarl Rupp       idx_R_local[n_R] = i;
31792fa5cd67SKarl Rupp       n_R++;
31802fa5cd67SKarl Rupp     }
31812fa5cd67SKarl Rupp   }
31820c7d97c5SJed Brown   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3183e269702eSStefano Zampini   if (dbg_flag) {
31840c7d97c5SJed Brown     ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
31850c7d97c5SJed Brown     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
31860c7d97c5SJed Brown     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d local dimensions\n",PetscGlobalRank);CHKERRQ(ierr);
31870c7d97c5SJed Brown     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local_size = %d, dirichlet_size = %d, boundary_size = %d\n",pcis->n,n_D,n_B);CHKERRQ(ierr);
31883b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"r_size = %d, v_size = %d, constraints = %d, local_primal_size = %d\n",n_R,n_vertices,n_constraints,pcbddc->local_primal_size);CHKERRQ(ierr);
3189534831adSStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"pcbddc->n_vertices = %d, pcbddc->n_constraints = %d\n",pcbddc->n_vertices,pcbddc->n_constraints);CHKERRQ(ierr);
31900c7d97c5SJed Brown     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
31910c7d97c5SJed Brown   }
3192534831adSStefano Zampini 
31930c7d97c5SJed Brown   /* Allocate needed vectors */
3194534831adSStefano Zampini   ierr = VecDuplicate(pcis->vec1_global,&pcbddc->original_rhs);CHKERRQ(ierr);
31953972b0daSStefano Zampini   ierr = VecDuplicate(pcis->vec1_global,&pcbddc->temp_solution);CHKERRQ(ierr);
31960c7d97c5SJed Brown   ierr = VecDuplicate(pcis->vec1_D,&pcbddc->vec4_D);CHKERRQ(ierr);
31970c7d97c5SJed Brown   ierr = VecCreate(PETSC_COMM_SELF,&pcbddc->vec1_R);CHKERRQ(ierr);
31980c7d97c5SJed Brown   ierr = VecSetSizes(pcbddc->vec1_R,n_R,n_R);CHKERRQ(ierr);
31990c7d97c5SJed Brown   ierr = VecSetType(pcbddc->vec1_R,impVecType);CHKERRQ(ierr);
3200d49ef151SStefano Zampini   ierr = VecDuplicate(pcbddc->vec1_R,&pcbddc->vec2_R);CHKERRQ(ierr);
32010c7d97c5SJed Brown   ierr = VecCreate(PETSC_COMM_SELF,&pcbddc->vec1_P);CHKERRQ(ierr);
32020c7d97c5SJed Brown   ierr = VecSetSizes(pcbddc->vec1_P,pcbddc->local_primal_size,pcbddc->local_primal_size);CHKERRQ(ierr);
32030c7d97c5SJed Brown   ierr = VecSetType(pcbddc->vec1_P,impVecType);CHKERRQ(ierr);
32040c7d97c5SJed Brown 
32050c7d97c5SJed Brown   /* Creating some index sets needed  */
32060c7d97c5SJed Brown   /* For submatrices */
3207da1bb401SStefano Zampini   ierr = ISCreateGeneral(PETSC_COMM_SELF,n_R,idx_R_local,PETSC_OWN_POINTER,&is_R_local);CHKERRQ(ierr);
32083b03a366Sstefano_zampini   if (n_vertices) {
3209da1bb401SStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,n_vertices,vertices,PETSC_OWN_POINTER,&is_V_local);CHKERRQ(ierr);
32103b03a366Sstefano_zampini   }
3211da1bb401SStefano Zampini   if (n_constraints) {
3212da1bb401SStefano Zampini     ierr = ISCreateStride(PETSC_COMM_SELF,n_constraints,n_vertices,1,&is_C_local);CHKERRQ(ierr);
3213da1bb401SStefano Zampini   }
3214da1bb401SStefano Zampini 
32150c7d97c5SJed Brown   /* For VecScatters pcbddc->R_to_B and (optionally) pcbddc->R_to_D */
32160c7d97c5SJed Brown   {
32170c7d97c5SJed Brown     PetscInt *aux_array1;
32180c7d97c5SJed Brown     PetscInt *aux_array2;
32192e8d2280SStefano Zampini     PetscInt *idx_I_local;
32200c7d97c5SJed Brown 
32213b03a366Sstefano_zampini     ierr = PetscMalloc((pcis->n_B-n_vertices)*sizeof(PetscInt),&aux_array1);CHKERRQ(ierr);
32223b03a366Sstefano_zampini     ierr = PetscMalloc((pcis->n_B-n_vertices)*sizeof(PetscInt),&aux_array2);CHKERRQ(ierr);
32230c7d97c5SJed Brown 
32242e8d2280SStefano Zampini     ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&idx_I_local);CHKERRQ(ierr);
32250c7d97c5SJed Brown     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
32262fa5cd67SKarl Rupp     for (i=0; i<n_D; i++) array[idx_I_local[i]] = 0;
32272e8d2280SStefano Zampini     ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&idx_I_local);CHKERRQ(ierr);
32282fa5cd67SKarl Rupp     for (i=0, j=0; i<n_R; i++) {
32292fa5cd67SKarl Rupp       if (array[idx_R_local[i]] == one) {
32302fa5cd67SKarl Rupp         aux_array1[j] = i;
32312fa5cd67SKarl Rupp         j++;
32322fa5cd67SKarl Rupp       }
32332fa5cd67SKarl Rupp     }
32340c7d97c5SJed Brown     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3235da1bb401SStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_COPY_VALUES,&is_aux1);CHKERRQ(ierr);
32362e8d2280SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
32372e8d2280SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
32380c7d97c5SJed Brown     ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
32392fa5cd67SKarl Rupp     for (i=0, j=0; i<n_B; i++) {
32402fa5cd67SKarl Rupp       if (array[i] == one) {
32412fa5cd67SKarl Rupp         aux_array2[j] = i; j++;
32422fa5cd67SKarl Rupp       }
32432fa5cd67SKarl Rupp     }
32443828260eSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
3245da1bb401SStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array2,PETSC_COPY_VALUES,&is_aux2);CHKERRQ(ierr);
32460c7d97c5SJed Brown     ierr = VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_B,is_aux2,&pcbddc->R_to_B);CHKERRQ(ierr);
32470c7d97c5SJed Brown     ierr = PetscFree(aux_array1);CHKERRQ(ierr);
32480c7d97c5SJed Brown     ierr = PetscFree(aux_array2);CHKERRQ(ierr);
32490c7d97c5SJed Brown     ierr = ISDestroy(&is_aux1);CHKERRQ(ierr);
32500c7d97c5SJed Brown     ierr = ISDestroy(&is_aux2);CHKERRQ(ierr);
32510c7d97c5SJed Brown 
325229622bf0SStefano Zampini     if (pcbddc->inexact_prec_type || dbg_flag) {
32530c7d97c5SJed Brown       ierr = PetscMalloc(n_D*sizeof(PetscInt),&aux_array1);CHKERRQ(ierr);
32540c7d97c5SJed Brown       ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
32552fa5cd67SKarl Rupp       for (i=0, j=0; i<n_R; i++) {
32562fa5cd67SKarl Rupp         if (array[idx_R_local[i]] == zero) {
32572fa5cd67SKarl Rupp           aux_array1[j] = i;
32582fa5cd67SKarl Rupp           j++;
32592fa5cd67SKarl Rupp         }
32602fa5cd67SKarl Rupp       }
32610c7d97c5SJed Brown       ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3262da1bb401SStefano Zampini       ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_COPY_VALUES,&is_aux1);CHKERRQ(ierr);
32630c7d97c5SJed Brown       ierr = VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_D,(IS)0,&pcbddc->R_to_D);CHKERRQ(ierr);
32640c7d97c5SJed Brown       ierr = PetscFree(aux_array1);CHKERRQ(ierr);
32650c7d97c5SJed Brown       ierr = ISDestroy(&is_aux1);CHKERRQ(ierr);
32660c7d97c5SJed Brown     }
32670c7d97c5SJed Brown   }
32680c7d97c5SJed Brown 
32690c7d97c5SJed Brown   /* Creating PC contexts for local Dirichlet and Neumann problems */
32700c7d97c5SJed Brown   {
32710c7d97c5SJed Brown     Mat A_RR;
327253cdbc3dSStefano Zampini     PC  pc_temp;
32732fa5cd67SKarl Rupp 
32740c7d97c5SJed Brown     /* Matrix for Dirichlet problem is A_II -> we already have it from pcis.c code */
327553cdbc3dSStefano Zampini     ierr = KSPCreate(PETSC_COMM_SELF,&pcbddc->ksp_D);CHKERRQ(ierr);
327653cdbc3dSStefano Zampini     ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->ksp_D,(PetscObject)pc,1);CHKERRQ(ierr);
327753cdbc3dSStefano Zampini     ierr = KSPSetOperators(pcbddc->ksp_D,pcis->A_II,pcis->A_II,SAME_PRECONDITIONER);CHKERRQ(ierr);
327853cdbc3dSStefano Zampini     ierr = KSPSetType(pcbddc->ksp_D,KSPPREONLY);CHKERRQ(ierr);
3279da1bb401SStefano Zampini     ierr = KSPSetOptionsPrefix(pcbddc->ksp_D,"dirichlet_");CHKERRQ(ierr);
32802fa5cd67SKarl Rupp 
32810c7d97c5SJed Brown     /* default */
328253cdbc3dSStefano Zampini     ierr = KSPGetPC(pcbddc->ksp_D,&pc_temp);CHKERRQ(ierr);
328353cdbc3dSStefano Zampini     ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr);
32842fa5cd67SKarl Rupp 
32850c7d97c5SJed Brown     /* Allow user's customization */
328653cdbc3dSStefano Zampini     ierr = KSPSetFromOptions(pcbddc->ksp_D);CHKERRQ(ierr);
32872fa5cd67SKarl Rupp 
3288950d796eSStefano Zampini     /* umfpack interface has a bug when matrix dimension is zero */
3289950d796eSStefano Zampini     if (!n_D) {
32902e8d2280SStefano Zampini       ierr = PCSetType(pc_temp,PCNONE);CHKERRQ(ierr);
3291950d796eSStefano Zampini     }
32922fa5cd67SKarl Rupp 
329353cdbc3dSStefano Zampini     /* Set Up KSP for Dirichlet problem of BDDC */
329453cdbc3dSStefano Zampini     ierr = KSPSetUp(pcbddc->ksp_D);CHKERRQ(ierr);
32952fa5cd67SKarl Rupp 
32963972b0daSStefano Zampini     /* set ksp_D into pcis data */
32973972b0daSStefano Zampini     ierr        = KSPDestroy(&pcis->ksp_D);CHKERRQ(ierr);
32983972b0daSStefano Zampini     ierr        = PetscObjectReference((PetscObject)pcbddc->ksp_D);CHKERRQ(ierr);
32993972b0daSStefano Zampini     pcis->ksp_D = pcbddc->ksp_D;
33002fa5cd67SKarl Rupp 
33010c7d97c5SJed Brown     /* Matrix for Neumann problem is A_RR -> we need to create it */
3302534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,is_R_local,is_R_local,MAT_INITIAL_MATRIX,&A_RR);CHKERRQ(ierr);
330353cdbc3dSStefano Zampini     ierr = KSPCreate(PETSC_COMM_SELF,&pcbddc->ksp_R);CHKERRQ(ierr);
330453cdbc3dSStefano Zampini     ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->ksp_R,(PetscObject)pc,1);CHKERRQ(ierr);
330553cdbc3dSStefano Zampini     ierr = KSPSetOperators(pcbddc->ksp_R,A_RR,A_RR,SAME_PRECONDITIONER);CHKERRQ(ierr);
330653cdbc3dSStefano Zampini     ierr = KSPSetType(pcbddc->ksp_R,KSPPREONLY);CHKERRQ(ierr);
3307da1bb401SStefano Zampini     ierr = KSPSetOptionsPrefix(pcbddc->ksp_R,"neumann_");CHKERRQ(ierr);
33082fa5cd67SKarl Rupp 
33090c7d97c5SJed Brown     /* default */
331053cdbc3dSStefano Zampini     ierr = KSPGetPC(pcbddc->ksp_R,&pc_temp);CHKERRQ(ierr);
331153cdbc3dSStefano Zampini     ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr);
33122fa5cd67SKarl Rupp 
33130c7d97c5SJed Brown     /* Allow user's customization */
331453cdbc3dSStefano Zampini     ierr = KSPSetFromOptions(pcbddc->ksp_R);CHKERRQ(ierr);
33152fa5cd67SKarl Rupp 
3316950d796eSStefano Zampini     /* umfpack interface has a bug when matrix dimension is zero */
3317950d796eSStefano Zampini     if (!pcis->n) {
33182e8d2280SStefano Zampini       ierr = PCSetType(pc_temp,PCNONE);CHKERRQ(ierr);
3319950d796eSStefano Zampini     }
33202fa5cd67SKarl Rupp 
332153cdbc3dSStefano Zampini     /* Set Up KSP for Neumann problem of BDDC */
332253cdbc3dSStefano Zampini     ierr = KSPSetUp(pcbddc->ksp_R);CHKERRQ(ierr);
33232fa5cd67SKarl Rupp 
332429622bf0SStefano Zampini     /* check Dirichlet and Neumann solvers and adapt them if a nullspace correction is needed */
3325b76ba322SStefano Zampini     {
33260c7d97c5SJed Brown       Vec         temp_vec;
3327b76ba322SStefano Zampini       PetscReal   value;
3328b76ba322SStefano Zampini       PetscMPIInt use_exact,use_exact_reduced;
33290c7d97c5SJed Brown 
3330a0ba757dSStefano Zampini       ierr = VecDuplicate(pcis->vec1_D,&temp_vec);CHKERRQ(ierr);
33310298fd71SBarry Smith       ierr = VecSetRandom(pcis->vec1_D,NULL);CHKERRQ(ierr);
3332a0ba757dSStefano Zampini       ierr = MatMult(pcis->A_II,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
3333a0ba757dSStefano Zampini       ierr = KSPSolve(pcbddc->ksp_D,pcis->vec2_D,temp_vec);CHKERRQ(ierr);
3334a0ba757dSStefano Zampini       ierr = VecAXPY(temp_vec,m_one,pcis->vec1_D);CHKERRQ(ierr);
3335a0ba757dSStefano Zampini       ierr = VecNorm(temp_vec,NORM_INFINITY,&value);CHKERRQ(ierr);
333629622bf0SStefano Zampini       ierr = VecDestroy(&temp_vec);CHKERRQ(ierr);
3337b76ba322SStefano Zampini       use_exact = 1;
33382fa5cd67SKarl Rupp       if (PetscAbsReal(value) > 1.e-4) use_exact = 0;
33392fa5cd67SKarl Rupp 
3340ce94432eSBarry Smith       ierr = MPI_Allreduce(&use_exact,&use_exact_reduced,1,MPIU_INT,MPI_LAND,PetscObjectComm((PetscObject)pc));CHKERRQ(ierr);
3341b76ba322SStefano Zampini       pcbddc->use_exact_dirichlet = (PetscBool) use_exact_reduced;
3342b76ba322SStefano Zampini       if (dbg_flag) {
3343a0ba757dSStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
3344a0ba757dSStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
3345a0ba757dSStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"Checking solution of Dirichlet and Neumann problems\n");CHKERRQ(ierr);
3346a0ba757dSStefano Zampini         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d infinity error for Dirichlet solve = % 1.14e \n",PetscGlobalRank,value);CHKERRQ(ierr);
334729622bf0SStefano Zampini       }
334829622bf0SStefano Zampini       if (pcbddc->NullSpace && !use_exact_reduced && !pcbddc->inexact_prec_type) {
334929622bf0SStefano Zampini         ierr = PCBDDCAdaptLocalProblem(pc,pcis->is_I_local);
335029622bf0SStefano Zampini       }
3351d49ef151SStefano Zampini       ierr = VecDuplicate(pcbddc->vec1_R,&temp_vec);CHKERRQ(ierr);
33520298fd71SBarry Smith       ierr = VecSetRandom(pcbddc->vec1_R,NULL);CHKERRQ(ierr);
3353d49ef151SStefano Zampini       ierr = MatMult(A_RR,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
3354d49ef151SStefano Zampini       ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec2_R,temp_vec);CHKERRQ(ierr);
3355d49ef151SStefano Zampini       ierr = VecAXPY(temp_vec,m_one,pcbddc->vec1_R);CHKERRQ(ierr);
3356d49ef151SStefano Zampini       ierr = VecNorm(temp_vec,NORM_INFINITY,&value);CHKERRQ(ierr);
3357e269702eSStefano Zampini       ierr = VecDestroy(&temp_vec);CHKERRQ(ierr);
33582fa5cd67SKarl Rupp 
335929622bf0SStefano Zampini       use_exact = 1;
33602fa5cd67SKarl Rupp       if (PetscAbsReal(value) > 1.e-4) use_exact = 0;
3361ce94432eSBarry Smith       ierr = MPI_Allreduce(&use_exact,&use_exact_reduced,1,MPIU_INT,MPI_LAND,PetscObjectComm((PetscObject)pc));CHKERRQ(ierr);
336229622bf0SStefano Zampini       if (dbg_flag) {
33630c7d97c5SJed Brown         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d infinity error for  Neumann  solve = % 1.14e \n",PetscGlobalRank,value);CHKERRQ(ierr);
3364d49ef151SStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
33650c7d97c5SJed Brown       }
336629622bf0SStefano Zampini       if (pcbddc->NullSpace && !use_exact_reduced) {
336729622bf0SStefano Zampini         ierr = PCBDDCAdaptLocalProblem(pc,is_R_local);
336829622bf0SStefano Zampini       }
3369b76ba322SStefano Zampini     }
33700c7d97c5SJed Brown     /* free Neumann problem's matrix */
33710c7d97c5SJed Brown     ierr = MatDestroy(&A_RR);CHKERRQ(ierr);
33720c7d97c5SJed Brown   }
33730c7d97c5SJed Brown 
33740c7d97c5SJed Brown   /* Assemble all remaining stuff needed to apply BDDC  */
33750c7d97c5SJed Brown   {
33760c7d97c5SJed Brown     Mat           A_RV,A_VR,A_VV;
33770bdf917eSStefano Zampini     Mat           M1;
33780c7d97c5SJed Brown     Mat           C_CR;
33793b03a366Sstefano_zampini     Mat           AUXMAT;
33800c7d97c5SJed Brown     Vec           vec1_C;
33810c7d97c5SJed Brown     Vec           vec2_C;
33820c7d97c5SJed Brown     Vec           vec1_V;
33830c7d97c5SJed Brown     Vec           vec2_V;
33840c7d97c5SJed Brown     PetscInt      *nnz;
33850c7d97c5SJed Brown     PetscInt      *auxindices;
338653cdbc3dSStefano Zampini     PetscInt      index;
33870c7d97c5SJed Brown     PetscScalar   *array2;
33880c7d97c5SJed Brown     MatFactorInfo matinfo;
33890c7d97c5SJed Brown 
33900c7d97c5SJed Brown     /* Allocating some extra storage just to be safe */
33910c7d97c5SJed Brown     ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
33920c7d97c5SJed Brown     ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&auxindices);CHKERRQ(ierr);
33932fa5cd67SKarl Rupp     for (i=0;i<pcis->n;i++) auxindices[i]=i;
33940c7d97c5SJed Brown 
33950c7d97c5SJed Brown     /* some work vectors on vertices and/or constraints */
33963b03a366Sstefano_zampini     if (n_vertices) {
33970c7d97c5SJed Brown       ierr = VecCreate(PETSC_COMM_SELF,&vec1_V);CHKERRQ(ierr);
33983b03a366Sstefano_zampini       ierr = VecSetSizes(vec1_V,n_vertices,n_vertices);CHKERRQ(ierr);
33990c7d97c5SJed Brown       ierr = VecSetType(vec1_V,impVecType);CHKERRQ(ierr);
34000c7d97c5SJed Brown       ierr = VecDuplicate(vec1_V,&vec2_V);CHKERRQ(ierr);
34010c7d97c5SJed Brown     }
3402534831adSStefano Zampini     if (n_constraints) {
34030c7d97c5SJed Brown       ierr = VecCreate(PETSC_COMM_SELF,&vec1_C);CHKERRQ(ierr);
3404534831adSStefano Zampini       ierr = VecSetSizes(vec1_C,n_constraints,n_constraints);CHKERRQ(ierr);
34050c7d97c5SJed Brown       ierr = VecSetType(vec1_C,impVecType);CHKERRQ(ierr);
34060c7d97c5SJed Brown       ierr = VecDuplicate(vec1_C,&vec2_C);CHKERRQ(ierr);
34070c7d97c5SJed Brown       ierr = VecDuplicate(vec1_C,&pcbddc->vec1_C);CHKERRQ(ierr);
34080c7d97c5SJed Brown     }
34090c7d97c5SJed Brown     /* Precompute data needed for preprocessing and application of BDDC */
34103b03a366Sstefano_zampini     if (n_constraints) {
34110c7d97c5SJed Brown       ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->local_auxmat2);CHKERRQ(ierr);
34123b03a366Sstefano_zampini       ierr = MatSetSizes(pcbddc->local_auxmat2,n_R,n_constraints,n_R,n_constraints);CHKERRQ(ierr);
34130c7d97c5SJed Brown       ierr = MatSetType(pcbddc->local_auxmat2,impMatType);CHKERRQ(ierr);
34140298fd71SBarry Smith       ierr = MatSeqDenseSetPreallocation(pcbddc->local_auxmat2,NULL);CHKERRQ(ierr);
34150c7d97c5SJed Brown 
341657a90decSStefano Zampini       /* Create Constraint matrix on R nodes: C_{CR}  */
341757a90decSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->ConstraintMatrix,is_C_local,is_R_local,MAT_INITIAL_MATRIX,&C_CR);CHKERRQ(ierr);
341857a90decSStefano Zampini       ierr = ISDestroy(&is_C_local);CHKERRQ(ierr);
341957a90decSStefano Zampini 
34200c7d97c5SJed Brown       /* Assemble local_auxmat2 = - A_{RR}^{-1} C^T_{CR} needed by BDDC application */
34213b03a366Sstefano_zampini       for (i=0; i<n_constraints; i++) {
34223b03a366Sstefano_zampini         ierr = VecSet(pcbddc->vec1_R,zero);CHKERRQ(ierr);
34232fa5cd67SKarl Rupp 
34243b03a366Sstefano_zampini         /* Get row of constraint matrix in R numbering */
342557a90decSStefano Zampini         ierr = VecGetArray(pcbddc->vec1_R,&array);CHKERRQ(ierr);
342657a90decSStefano Zampini         ierr = MatGetRow(C_CR,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
34272fa5cd67SKarl Rupp         for (j=0;j<size_of_constraint;j++) array[row_cmat_indices[j]] = -row_cmat_values[j];
342857a90decSStefano Zampini         ierr = MatRestoreRow(C_CR,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
342957a90decSStefano Zampini         ierr = VecRestoreArray(pcbddc->vec1_R,&array);CHKERRQ(ierr);
34302fa5cd67SKarl Rupp 
34313b03a366Sstefano_zampini         /* Solve for row of constraint matrix in R numbering */
343253cdbc3dSStefano Zampini         ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
34332fa5cd67SKarl Rupp 
34343b03a366Sstefano_zampini         /* Set values */
34350c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec2_R,&array);CHKERRQ(ierr);
34363b03a366Sstefano_zampini         ierr = MatSetValues(pcbddc->local_auxmat2,n_R,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
34370c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec2_R,&array);CHKERRQ(ierr);
34380c7d97c5SJed Brown       }
34390c7d97c5SJed Brown       ierr = MatAssemblyBegin(pcbddc->local_auxmat2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
34400c7d97c5SJed Brown       ierr = MatAssemblyEnd(pcbddc->local_auxmat2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
34410c7d97c5SJed Brown 
34420c7d97c5SJed Brown       /* Assemble AUXMAT = (LUFactor)(-C_{CR} A_{RR}^{-1} C^T_{CR})^{-1} */
34430c7d97c5SJed Brown       ierr = MatMatMult(C_CR,pcbddc->local_auxmat2,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&AUXMAT);CHKERRQ(ierr);
3444d49ef151SStefano Zampini       ierr = MatFactorInfoInitialize(&matinfo);CHKERRQ(ierr);
34453b03a366Sstefano_zampini       ierr = ISCreateStride(PETSC_COMM_SELF,n_constraints,0,1,&is_aux1);CHKERRQ(ierr);
34460c7d97c5SJed Brown       ierr = MatLUFactor(AUXMAT,is_aux1,is_aux1,&matinfo);CHKERRQ(ierr);
34470c7d97c5SJed Brown       ierr = ISDestroy(&is_aux1);CHKERRQ(ierr);
34480c7d97c5SJed Brown 
34493b03a366Sstefano_zampini       /* Assemble explicitly M1 = (C_{CR} A_{RR}^{-1} C^T_{CR})^{-1} needed in preproc  */
3450d49ef151SStefano Zampini       ierr = MatCreate(PETSC_COMM_SELF,&M1);CHKERRQ(ierr);
34513b03a366Sstefano_zampini       ierr = MatSetSizes(M1,n_constraints,n_constraints,n_constraints,n_constraints);CHKERRQ(ierr);
34520c7d97c5SJed Brown       ierr = MatSetType(M1,impMatType);CHKERRQ(ierr);
34530298fd71SBarry Smith       ierr = MatSeqDenseSetPreallocation(M1,NULL);CHKERRQ(ierr);
34543b03a366Sstefano_zampini       for (i=0; i<n_constraints; i++) {
34550c7d97c5SJed Brown         ierr = VecSet(vec1_C,zero);CHKERRQ(ierr);
34560c7d97c5SJed Brown         ierr = VecSetValue(vec1_C,i,one,INSERT_VALUES);CHKERRQ(ierr);
34570c7d97c5SJed Brown         ierr = VecAssemblyBegin(vec1_C);CHKERRQ(ierr);
34580c7d97c5SJed Brown         ierr = VecAssemblyEnd(vec1_C);CHKERRQ(ierr);
34590c7d97c5SJed Brown         ierr = MatSolve(AUXMAT,vec1_C,vec2_C);CHKERRQ(ierr);
34600c7d97c5SJed Brown         ierr = VecScale(vec2_C,m_one);CHKERRQ(ierr);
34610c7d97c5SJed Brown         ierr = VecGetArray(vec2_C,&array);CHKERRQ(ierr);
34623b03a366Sstefano_zampini         ierr = MatSetValues(M1,n_constraints,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
34630c7d97c5SJed Brown         ierr = VecRestoreArray(vec2_C,&array);CHKERRQ(ierr);
34640c7d97c5SJed Brown       }
34650c7d97c5SJed Brown       ierr = MatAssemblyBegin(M1,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
34660c7d97c5SJed Brown       ierr = MatAssemblyEnd(M1,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
34670c7d97c5SJed Brown       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
34680c7d97c5SJed Brown       /* Assemble local_auxmat1 = M1*C_{CR} needed by BDDC application in KSP and in preproc */
34690c7d97c5SJed Brown       ierr = MatMatMult(M1,C_CR,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&pcbddc->local_auxmat1);CHKERRQ(ierr);
34700c7d97c5SJed Brown 
34710c7d97c5SJed Brown     }
34720c7d97c5SJed Brown 
34730c7d97c5SJed Brown     /* Get submatrices from subdomain matrix */
34743b03a366Sstefano_zampini     if (n_vertices) {
3475534831adSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->local_mat,is_R_local,is_V_local,MAT_INITIAL_MATRIX,&A_RV);CHKERRQ(ierr);
3476534831adSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->local_mat,is_V_local,is_R_local,MAT_INITIAL_MATRIX,&A_VR);CHKERRQ(ierr);
3477534831adSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->local_mat,is_V_local,is_V_local,MAT_INITIAL_MATRIX,&A_VV);CHKERRQ(ierr);
34780c7d97c5SJed Brown     }
34790c7d97c5SJed Brown 
34800c7d97c5SJed Brown     /* Matrix of coarse basis functions (local) */
3481d49ef151SStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->coarse_phi_B);CHKERRQ(ierr);
34820c7d97c5SJed Brown     ierr = MatSetSizes(pcbddc->coarse_phi_B,n_B,pcbddc->local_primal_size,n_B,pcbddc->local_primal_size);CHKERRQ(ierr);
34830c7d97c5SJed Brown     ierr = MatSetType(pcbddc->coarse_phi_B,impMatType);CHKERRQ(ierr);
34840298fd71SBarry Smith     ierr = MatSeqDenseSetPreallocation(pcbddc->coarse_phi_B,NULL);CHKERRQ(ierr);
348529622bf0SStefano Zampini     if (pcbddc->inexact_prec_type || dbg_flag) {
3486d49ef151SStefano Zampini       ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->coarse_phi_D);CHKERRQ(ierr);
34870c7d97c5SJed Brown       ierr = MatSetSizes(pcbddc->coarse_phi_D,n_D,pcbddc->local_primal_size,n_D,pcbddc->local_primal_size);CHKERRQ(ierr);
34880c7d97c5SJed Brown       ierr = MatSetType(pcbddc->coarse_phi_D,impMatType);CHKERRQ(ierr);
34890298fd71SBarry Smith       ierr = MatSeqDenseSetPreallocation(pcbddc->coarse_phi_D,NULL);CHKERRQ(ierr);
34900c7d97c5SJed Brown     }
34910c7d97c5SJed Brown 
3492e269702eSStefano Zampini     if (dbg_flag) {
34930c7d97c5SJed Brown       ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscScalar),&coarsefunctions_errors);CHKERRQ(ierr);
34940c7d97c5SJed Brown       ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscScalar),&constraints_errors);CHKERRQ(ierr);
34950c7d97c5SJed Brown     }
34963b03a366Sstefano_zampini     /* Subdomain contribution (Non-overlapping) to coarse matrix  */
34970c7d97c5SJed Brown     ierr = PetscMalloc ((pcbddc->local_primal_size)*(pcbddc->local_primal_size)*sizeof(PetscScalar),&coarse_submat_vals);CHKERRQ(ierr);
34980c7d97c5SJed Brown 
34990c7d97c5SJed Brown     /* We are now ready to evaluate coarse basis functions and subdomain contribution to coarse problem */
35003b03a366Sstefano_zampini     for (i=0; i<n_vertices; i++) {
35010c7d97c5SJed Brown       ierr = VecSet(vec1_V,zero);CHKERRQ(ierr);
35020c7d97c5SJed Brown       ierr = VecSetValue(vec1_V,i,one,INSERT_VALUES);CHKERRQ(ierr);
35030c7d97c5SJed Brown       ierr = VecAssemblyBegin(vec1_V);CHKERRQ(ierr);
35040c7d97c5SJed Brown       ierr = VecAssemblyEnd(vec1_V);CHKERRQ(ierr);
35050c7d97c5SJed Brown       /* solution of saddle point problem */
35060bdf917eSStefano Zampini       ierr = MatMult(A_RV,vec1_V,pcbddc->vec1_R);CHKERRQ(ierr);
35070bdf917eSStefano Zampini       ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec1_R);CHKERRQ(ierr);
35080c7d97c5SJed Brown       ierr = VecScale(pcbddc->vec1_R,m_one);CHKERRQ(ierr);
35093b03a366Sstefano_zampini       if (n_constraints) {
35100c7d97c5SJed Brown         ierr = MatMult(pcbddc->local_auxmat1,pcbddc->vec1_R,vec1_C);CHKERRQ(ierr);
35110c7d97c5SJed Brown         ierr = MatMultAdd(pcbddc->local_auxmat2,vec1_C,pcbddc->vec1_R,pcbddc->vec1_R);CHKERRQ(ierr);
35120c7d97c5SJed Brown         ierr = VecScale(vec1_C,m_one);CHKERRQ(ierr);
35130c7d97c5SJed Brown       }
35140c7d97c5SJed Brown       ierr = MatMult(A_VR,pcbddc->vec1_R,vec2_V);CHKERRQ(ierr);
35150c7d97c5SJed Brown       ierr = MatMultAdd(A_VV,vec1_V,vec2_V,vec2_V);CHKERRQ(ierr);
35160c7d97c5SJed Brown 
35170c7d97c5SJed Brown       /* Set values in coarse basis function and subdomain part of coarse_mat */
35180c7d97c5SJed Brown       /* coarse basis functions */
35190c7d97c5SJed Brown       ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr);
35200c7d97c5SJed Brown       ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
35210c7d97c5SJed Brown       ierr = VecScatterEnd  (pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
35220c7d97c5SJed Brown       ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
35233b03a366Sstefano_zampini       ierr = MatSetValues(pcbddc->coarse_phi_B,n_B,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
35240c7d97c5SJed Brown       ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
35250c7d97c5SJed Brown       ierr = MatSetValue(pcbddc->coarse_phi_B,idx_V_B[i],i,one,INSERT_VALUES);CHKERRQ(ierr);
352629622bf0SStefano Zampini       if (pcbddc->inexact_prec_type || dbg_flag) {
35270c7d97c5SJed Brown         ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
35280c7d97c5SJed Brown         ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
35290c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_D,&array);CHKERRQ(ierr);
35303b03a366Sstefano_zampini         ierr = MatSetValues(pcbddc->coarse_phi_D,n_D,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
35310c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_D,&array);CHKERRQ(ierr);
35320c7d97c5SJed Brown       }
35330c7d97c5SJed Brown       /* subdomain contribution to coarse matrix */
35340c7d97c5SJed Brown       ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
35352fa5cd67SKarl Rupp       for (j=0; j<n_vertices; j++) coarse_submat_vals[i*pcbddc->local_primal_size+j] = array[j];   /* WARNING -> column major ordering */
35360c7d97c5SJed Brown       ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
35373b03a366Sstefano_zampini       if (n_constraints) {
35380c7d97c5SJed Brown         ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
35392fa5cd67SKarl Rupp         for (j=0; j<n_constraints; j++) coarse_submat_vals[i*pcbddc->local_primal_size+j+n_vertices] = array[j];   /* WARNING -> column major ordering */
35400c7d97c5SJed Brown         ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
35410c7d97c5SJed Brown       }
35420c7d97c5SJed Brown 
3543e269702eSStefano Zampini       if (dbg_flag) {
35440c7d97c5SJed Brown         /* assemble subdomain vector on nodes */
3545d49ef151SStefano Zampini         ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr);
35460c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
35470c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
35482fa5cd67SKarl Rupp         for (j=0;j<n_R;j++) array[idx_R_local[j]] = array2[j];
35493b03a366Sstefano_zampini         array[vertices[i]] = one;
35500c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
35510c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
35522fa5cd67SKarl Rupp 
35530c7d97c5SJed Brown         /* assemble subdomain vector of lagrange multipliers (i.e. primal nodes) */
3554d49ef151SStefano Zampini         ierr = VecSet(pcbddc->vec1_P,zero);CHKERRQ(ierr);
35550c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
35560c7d97c5SJed Brown         ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
35572fa5cd67SKarl Rupp         for (j=0;j<n_vertices;j++) array2[j]=array[j];
35580c7d97c5SJed Brown         ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
35593b03a366Sstefano_zampini         if (n_constraints) {
35600c7d97c5SJed Brown           ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
35612fa5cd67SKarl Rupp           for (j=0;j<n_constraints;j++) array2[j+n_vertices]=array[j];
35620c7d97c5SJed Brown           ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
35630c7d97c5SJed Brown         }
35640c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
35650c7d97c5SJed Brown         ierr = VecScale(pcbddc->vec1_P,m_one);CHKERRQ(ierr);
35662fa5cd67SKarl Rupp 
35670c7d97c5SJed Brown         /* check saddle point solution */
3568534831adSStefano Zampini         ierr    = MatMult(pcbddc->local_mat,pcis->vec1_N,pcis->vec2_N);CHKERRQ(ierr);
35693b03a366Sstefano_zampini         ierr    = MatMultTransposeAdd(pcbddc->ConstraintMatrix,pcbddc->vec1_P,pcis->vec2_N,pcis->vec2_N);CHKERRQ(ierr);
35703b03a366Sstefano_zampini         ierr    = VecNorm(pcis->vec2_N,NORM_INFINITY,&coarsefunctions_errors[i]);CHKERRQ(ierr);
35713b03a366Sstefano_zampini         ierr    = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr);
35720c7d97c5SJed Brown         ierr    = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
35733b03a366Sstefano_zampini         array[i]=array[i]+m_one;  /* shift by the identity matrix */
35740c7d97c5SJed Brown         ierr    = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
35753b03a366Sstefano_zampini         ierr    = VecNorm(pcbddc->vec1_P,NORM_INFINITY,&constraints_errors[i]);CHKERRQ(ierr);
35760c7d97c5SJed Brown       }
35770c7d97c5SJed Brown     }
35780c7d97c5SJed Brown 
35793b03a366Sstefano_zampini     for (i=0; i<n_constraints; i++) {
3580d49ef151SStefano Zampini       ierr = VecSet(vec2_C,zero);CHKERRQ(ierr);
35810c7d97c5SJed Brown       ierr = VecSetValue(vec2_C,i,m_one,INSERT_VALUES);CHKERRQ(ierr);
35820c7d97c5SJed Brown       ierr = VecAssemblyBegin(vec2_C);CHKERRQ(ierr);
35830c7d97c5SJed Brown       ierr = VecAssemblyEnd(vec2_C);CHKERRQ(ierr);
35842fa5cd67SKarl Rupp 
35850c7d97c5SJed Brown       /* solution of saddle point problem */
35860c7d97c5SJed Brown       ierr = MatMult(M1,vec2_C,vec1_C);CHKERRQ(ierr);
35870c7d97c5SJed Brown       ierr = MatMult(pcbddc->local_auxmat2,vec1_C,pcbddc->vec1_R);CHKERRQ(ierr);
35880c7d97c5SJed Brown       ierr = VecScale(vec1_C,m_one);CHKERRQ(ierr);
35893b03a366Sstefano_zampini       if (n_vertices) { ierr = MatMult(A_VR,pcbddc->vec1_R,vec2_V);CHKERRQ(ierr); }
35902fa5cd67SKarl Rupp 
35910c7d97c5SJed Brown       /* Set values in coarse basis function and subdomain part of coarse_mat */
35920c7d97c5SJed Brown       /* coarse basis functions */
35933b03a366Sstefano_zampini       index=i+n_vertices;
35940c7d97c5SJed Brown       ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr);
35950c7d97c5SJed Brown       ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
35960c7d97c5SJed Brown       ierr = VecScatterEnd  (pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
35970c7d97c5SJed Brown       ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
359853cdbc3dSStefano Zampini       ierr = MatSetValues(pcbddc->coarse_phi_B,n_B,auxindices,1,&index,array,INSERT_VALUES);CHKERRQ(ierr);
35990c7d97c5SJed Brown       ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
360029622bf0SStefano Zampini       if (pcbddc->inexact_prec_type || dbg_flag) {
36010c7d97c5SJed Brown         ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
36020c7d97c5SJed Brown         ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
36030c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_D,&array);CHKERRQ(ierr);
360453cdbc3dSStefano Zampini         ierr = MatSetValues(pcbddc->coarse_phi_D,n_D,auxindices,1,&index,array,INSERT_VALUES);CHKERRQ(ierr);
36050c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_D,&array);CHKERRQ(ierr);
36060c7d97c5SJed Brown       }
36072fa5cd67SKarl Rupp 
36080c7d97c5SJed Brown       /* subdomain contribution to coarse matrix */
36093b03a366Sstefano_zampini       if (n_vertices) {
36100c7d97c5SJed Brown         ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
36112fa5cd67SKarl Rupp         for (j=0; j<n_vertices; j++) coarse_submat_vals[index*pcbddc->local_primal_size+j]=array[j]; /* WARNING -> column major ordering */
36120c7d97c5SJed Brown         ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
36130c7d97c5SJed Brown       }
36140c7d97c5SJed Brown       ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
36152fa5cd67SKarl Rupp       for (j=0; j<n_constraints; j++) coarse_submat_vals[index*pcbddc->local_primal_size+j+n_vertices]=array[j]; /* WARNING -> column major ordering */
36160c7d97c5SJed Brown       ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
36170c7d97c5SJed Brown 
3618e269702eSStefano Zampini       if (dbg_flag) {
36190c7d97c5SJed Brown         /* assemble subdomain vector on nodes */
362053cdbc3dSStefano Zampini         ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr);
36210c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
36220c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
36232fa5cd67SKarl Rupp         for (j=0;j<n_R;j++) array[idx_R_local[j]] = array2[j];
36240c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
36250c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
36262fa5cd67SKarl Rupp 
36270c7d97c5SJed Brown         /* assemble subdomain vector of lagrange multipliers */
362853cdbc3dSStefano Zampini         ierr = VecSet(pcbddc->vec1_P,zero);CHKERRQ(ierr);
36290c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
36303b03a366Sstefano_zampini         if (n_vertices) {
36310c7d97c5SJed Brown           ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
36322fa5cd67SKarl Rupp           for (j=0;j<n_vertices;j++) array2[j]=-array[j];
36330c7d97c5SJed Brown           ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
36340c7d97c5SJed Brown         }
36350c7d97c5SJed Brown         ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
36363b03a366Sstefano_zampini         for (j=0;j<n_constraints;j++) {array2[j+n_vertices]=-array[j];}
36370c7d97c5SJed Brown         ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
36380c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
36392fa5cd67SKarl Rupp 
36403972b0daSStefano Zampini         /* check saddle point solution */
3641534831adSStefano Zampini         ierr         = MatMult(pcbddc->local_mat,pcis->vec1_N,pcis->vec2_N);CHKERRQ(ierr);
36423b03a366Sstefano_zampini         ierr         = MatMultTransposeAdd(pcbddc->ConstraintMatrix,pcbddc->vec1_P,pcis->vec2_N,pcis->vec2_N);CHKERRQ(ierr);
364353cdbc3dSStefano Zampini         ierr         = VecNorm(pcis->vec2_N,NORM_INFINITY,&coarsefunctions_errors[index]);CHKERRQ(ierr);
36443b03a366Sstefano_zampini         ierr         = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr);
36450c7d97c5SJed Brown         ierr         = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
364653cdbc3dSStefano Zampini         array[index] = array[index]+m_one; /* shift by the identity matrix */
36470c7d97c5SJed Brown         ierr         = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
364853cdbc3dSStefano Zampini         ierr         = VecNorm(pcbddc->vec1_P,NORM_INFINITY,&constraints_errors[index]);CHKERRQ(ierr);
36490c7d97c5SJed Brown       }
36500c7d97c5SJed Brown     }
36510c7d97c5SJed Brown     ierr = MatAssemblyBegin(pcbddc->coarse_phi_B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
36520c7d97c5SJed Brown     ierr = MatAssemblyEnd  (pcbddc->coarse_phi_B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
365329622bf0SStefano Zampini     if (pcbddc->inexact_prec_type || dbg_flag) {
36540c7d97c5SJed Brown       ierr = MatAssemblyBegin(pcbddc->coarse_phi_D,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
36550c7d97c5SJed Brown       ierr = MatAssemblyEnd  (pcbddc->coarse_phi_D,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
36560c7d97c5SJed Brown     }
36570c7d97c5SJed Brown     /* Checking coarse_sub_mat and coarse basis functions */
36580c7d97c5SJed Brown     /* It should be \Phi^{(j)^T} A^{(j)} \Phi^{(j)}=coarse_sub_mat */
36599d2fce94SStefano Zampini     if (dbg_flag) {
36600c7d97c5SJed Brown       Mat         coarse_sub_mat;
36610c7d97c5SJed Brown       Mat         TM1,TM2,TM3,TM4;
36620c7d97c5SJed Brown       Mat         coarse_phi_D,coarse_phi_B,A_II,A_BB,A_IB,A_BI;
366319fd82e9SBarry Smith       MatType     checkmattype=MATSEQAIJ;
36640c7d97c5SJed Brown       PetscScalar value;
36650c7d97c5SJed Brown 
3666c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_II,checkmattype,MAT_INITIAL_MATRIX,&A_II);CHKERRQ(ierr);
3667c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_IB,checkmattype,MAT_INITIAL_MATRIX,&A_IB);CHKERRQ(ierr);
3668c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_BI,checkmattype,MAT_INITIAL_MATRIX,&A_BI);CHKERRQ(ierr);
3669c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_BB,checkmattype,MAT_INITIAL_MATRIX,&A_BB);CHKERRQ(ierr);
3670c042a7c3SStefano Zampini       ierr = MatConvert(pcbddc->coarse_phi_D,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_D);CHKERRQ(ierr);
3671c042a7c3SStefano Zampini       ierr = MatConvert(pcbddc->coarse_phi_B,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_B);CHKERRQ(ierr);
3672c042a7c3SStefano Zampini       ierr = MatCreateSeqDense(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_size,coarse_submat_vals,&coarse_sub_mat);CHKERRQ(ierr);
3673c042a7c3SStefano Zampini       ierr = MatConvert(coarse_sub_mat,checkmattype,MAT_REUSE_MATRIX,&coarse_sub_mat);CHKERRQ(ierr);
36740c7d97c5SJed Brown 
36750c7d97c5SJed Brown       ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
36760c7d97c5SJed Brown       ierr = PetscViewerASCIIPrintf(viewer,"Check coarse sub mat and local basis functions\n");CHKERRQ(ierr);
36770c7d97c5SJed Brown       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
367853cdbc3dSStefano Zampini       ierr = MatPtAP(A_II,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&TM1);CHKERRQ(ierr);
367953cdbc3dSStefano Zampini       ierr = MatPtAP(A_BB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&TM2);CHKERRQ(ierr);
368053cdbc3dSStefano Zampini       ierr = MatMatMult(A_IB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr);
3681c042a7c3SStefano Zampini       ierr = MatTransposeMatMult(coarse_phi_D,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM3);CHKERRQ(ierr);
368253cdbc3dSStefano Zampini       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
368353cdbc3dSStefano Zampini       ierr = MatMatMult(A_BI,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr);
3684c042a7c3SStefano Zampini       ierr = MatTransposeMatMult(coarse_phi_B,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM4);CHKERRQ(ierr);
368553cdbc3dSStefano Zampini       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
368653cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,one,TM2,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
368753cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,one,TM3,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
368853cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,one,TM4,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
368953cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,m_one,coarse_sub_mat,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
369053cdbc3dSStefano Zampini       ierr = MatNorm(TM1,NORM_INFINITY,&value);CHKERRQ(ierr);
36910c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"----------------------------------\n");CHKERRQ(ierr);
36920c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d \n",PetscGlobalRank);CHKERRQ(ierr);
36930c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"matrix error = % 1.14e\n",value);CHKERRQ(ierr);
36940c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"coarse functions errors\n");CHKERRQ(ierr);
369553cdbc3dSStefano Zampini       for (i=0; i<pcbddc->local_primal_size; i++) { ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local %02d-th function error = % 1.14e\n",i,coarsefunctions_errors[i]);CHKERRQ(ierr); }
36960c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"constraints errors\n");CHKERRQ(ierr);
369753cdbc3dSStefano Zampini       for (i=0; i<pcbddc->local_primal_size; i++) { ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local %02d-th function error = % 1.14e\n",i,constraints_errors[i]);CHKERRQ(ierr); }
36980c7d97c5SJed Brown       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
369953cdbc3dSStefano Zampini       ierr = MatDestroy(&A_II);CHKERRQ(ierr);
370053cdbc3dSStefano Zampini       ierr = MatDestroy(&A_BB);CHKERRQ(ierr);
370153cdbc3dSStefano Zampini       ierr = MatDestroy(&A_IB);CHKERRQ(ierr);
370253cdbc3dSStefano Zampini       ierr = MatDestroy(&A_BI);CHKERRQ(ierr);
370353cdbc3dSStefano Zampini       ierr = MatDestroy(&TM1);CHKERRQ(ierr);
370453cdbc3dSStefano Zampini       ierr = MatDestroy(&TM2);CHKERRQ(ierr);
370553cdbc3dSStefano Zampini       ierr = MatDestroy(&TM3);CHKERRQ(ierr);
370653cdbc3dSStefano Zampini       ierr = MatDestroy(&TM4);CHKERRQ(ierr);
370753cdbc3dSStefano Zampini       ierr = MatDestroy(&coarse_phi_D);CHKERRQ(ierr);
370853cdbc3dSStefano Zampini       ierr = MatDestroy(&coarse_sub_mat);CHKERRQ(ierr);
370953cdbc3dSStefano Zampini       ierr = MatDestroy(&coarse_phi_B);CHKERRQ(ierr);
37100c7d97c5SJed Brown       ierr = PetscFree(coarsefunctions_errors);CHKERRQ(ierr);
37110c7d97c5SJed Brown       ierr = PetscFree(constraints_errors);CHKERRQ(ierr);
37120c7d97c5SJed Brown     }
37130c7d97c5SJed Brown     /* free memory */
37143b03a366Sstefano_zampini     if (n_vertices) {
37150c7d97c5SJed Brown       ierr = VecDestroy(&vec1_V);CHKERRQ(ierr);
37160c7d97c5SJed Brown       ierr = VecDestroy(&vec2_V);CHKERRQ(ierr);
37170c7d97c5SJed Brown       ierr = MatDestroy(&A_RV);CHKERRQ(ierr);
37180c7d97c5SJed Brown       ierr = MatDestroy(&A_VR);CHKERRQ(ierr);
37190c7d97c5SJed Brown       ierr = MatDestroy(&A_VV);CHKERRQ(ierr);
37200c7d97c5SJed Brown     }
3721534831adSStefano Zampini     if (n_constraints) {
37220c7d97c5SJed Brown       ierr = VecDestroy(&vec1_C);CHKERRQ(ierr);
37230c7d97c5SJed Brown       ierr = VecDestroy(&vec2_C);CHKERRQ(ierr);
37240c7d97c5SJed Brown       ierr = MatDestroy(&M1);CHKERRQ(ierr);
37250c7d97c5SJed Brown       ierr = MatDestroy(&C_CR);CHKERRQ(ierr);
37260c7d97c5SJed Brown     }
3727a929c220SStefano Zampini     ierr = PetscFree(auxindices);CHKERRQ(ierr);
3728a929c220SStefano Zampini     ierr = PetscFree(nnz);CHKERRQ(ierr);
3729a929c220SStefano Zampini     /* create coarse matrix and data structures for message passing associated with the actual choice of coarse problem type */
3730a929c220SStefano Zampini     ierr = PCBDDCSetupCoarseEnvironment(pc,coarse_submat_vals);CHKERRQ(ierr);
3731a929c220SStefano Zampini     ierr = PetscFree(coarse_submat_vals);CHKERRQ(ierr);
37320c7d97c5SJed Brown   }
37330c7d97c5SJed Brown   /* free memory */
37343b03a366Sstefano_zampini   if (n_vertices) {
37350c7d97c5SJed Brown     ierr = PetscFree(idx_V_B);CHKERRQ(ierr);
37360c7d97c5SJed Brown     ierr = ISDestroy(&is_V_local);CHKERRQ(ierr);
37370c7d97c5SJed Brown   }
37380c7d97c5SJed Brown   ierr = ISDestroy(&is_R_local);CHKERRQ(ierr);
37390c7d97c5SJed Brown   PetscFunctionReturn(0);
37400c7d97c5SJed Brown }
37410c7d97c5SJed Brown 
37420c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
37430c7d97c5SJed Brown 
37440c7d97c5SJed Brown #undef __FUNCT__
37450c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetupCoarseEnvironment"
374653cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetupCoarseEnvironment(PC pc,PetscScalar* coarse_submat_vals)
37470c7d97c5SJed Brown {
37480c7d97c5SJed Brown   Mat_IS   *matis    = (Mat_IS*)pc->pmat->data;
37490c7d97c5SJed Brown   PC_BDDC  *pcbddc   = (PC_BDDC*)pc->data;
37500c7d97c5SJed Brown   PC_IS    *pcis     = (PC_IS*)pc->data;
3751ce94432eSBarry Smith   MPI_Comm prec_comm;
37520c7d97c5SJed Brown   MPI_Comm coarse_comm;
37530c7d97c5SJed Brown 
37540c7d97c5SJed Brown   /* common to all choices */
37550c7d97c5SJed Brown   PetscScalar *temp_coarse_mat_vals;
37560c7d97c5SJed Brown   PetscScalar *ins_coarse_mat_vals;
37570c7d97c5SJed Brown   PetscInt    *ins_local_primal_indices;
37580c7d97c5SJed Brown   PetscMPIInt *localsizes2,*localdispl2;
37590c7d97c5SJed Brown   PetscMPIInt size_prec_comm;
37600c7d97c5SJed Brown   PetscMPIInt rank_prec_comm;
37610c7d97c5SJed Brown   PetscMPIInt active_rank=MPI_PROC_NULL;
37620c7d97c5SJed Brown   PetscMPIInt master_proc=0;
37630c7d97c5SJed Brown   PetscInt    ins_local_primal_size;
37642fa5cd67SKarl Rupp 
37650c7d97c5SJed Brown   /* specific to MULTILEVEL_BDDC */
37660c7d97c5SJed Brown   PetscMPIInt            *ranks_recv;
37670c7d97c5SJed Brown   PetscMPIInt            count_recv=0;
37680c7d97c5SJed Brown   PetscMPIInt            rank_coarse_proc_send_to;
37690c7d97c5SJed Brown   PetscMPIInt            coarse_color = MPI_UNDEFINED;
37700c7d97c5SJed Brown   ISLocalToGlobalMapping coarse_ISLG;
37712fa5cd67SKarl Rupp 
37720c7d97c5SJed Brown   /* some other variables */
37730c7d97c5SJed Brown   PetscErrorCode ierr;
377419fd82e9SBarry Smith   MatType        coarse_mat_type;
377519fd82e9SBarry Smith   PCType         coarse_pc_type;
377619fd82e9SBarry Smith   KSPType        coarse_ksp_type;
377753cdbc3dSStefano Zampini   PC             pc_temp;
37784fad6a16SStefano Zampini   PetscInt       i,j,k;
37793b03a366Sstefano_zampini   PetscInt       max_it_coarse_ksp=1;          /* don't increase this value */
37802fa5cd67SKarl Rupp 
3781e269702eSStefano Zampini   /* verbose output viewer */
3782e269702eSStefano Zampini   PetscViewer viewer   = pcbddc->dbg_viewer;
3783e269702eSStefano Zampini   PetscBool   dbg_flag = pcbddc->dbg_flag;
3784142dfd88SStefano Zampini 
3785ea7e1babSStefano Zampini   PetscInt    offset,offset2;
3786a929c220SStefano Zampini   PetscMPIInt im_active,active_procs;
3787523858cfSStefano Zampini   PetscInt    *dnz,*onz;
3788142dfd88SStefano Zampini 
3789142dfd88SStefano Zampini   PetscBool setsym,issym=PETSC_FALSE;
37900c7d97c5SJed Brown 
37910c7d97c5SJed Brown   PetscFunctionBegin;
37924b2d0b89SJed Brown   ierr = PetscObjectGetComm((PetscObject)pc,&prec_comm);CHKERRQ(ierr);
37930c7d97c5SJed Brown   ins_local_primal_indices = 0;
37940c7d97c5SJed Brown   ins_coarse_mat_vals      = 0;
37950c7d97c5SJed Brown   localsizes2              = 0;
37960c7d97c5SJed Brown   localdispl2              = 0;
37970c7d97c5SJed Brown   temp_coarse_mat_vals     = 0;
37980c7d97c5SJed Brown   coarse_ISLG              = 0;
37990c7d97c5SJed Brown 
380053cdbc3dSStefano Zampini   ierr = MPI_Comm_size(prec_comm,&size_prec_comm);CHKERRQ(ierr);
380153cdbc3dSStefano Zampini   ierr = MPI_Comm_rank(prec_comm,&rank_prec_comm);CHKERRQ(ierr);
3802142dfd88SStefano Zampini   ierr = MatIsSymmetricKnown(pc->pmat,&setsym,&issym);CHKERRQ(ierr);
3803142dfd88SStefano Zampini 
3804beed3852SStefano Zampini   /* Assign global numbering to coarse dofs */
3805beed3852SStefano Zampini   {
3806ef028eecSStefano Zampini     PetscInt    *auxlocal_primal;
3807da1bb401SStefano Zampini     PetscInt    *row_cmat_indices;
38082e8d2280SStefano Zampini     PetscInt    *aux_ordering;
38092e8d2280SStefano Zampini     PetscInt    *row_cmat_global_indices;
3810ef028eecSStefano Zampini     PetscInt    *dof_sizes,*dof_displs;
38113b03a366Sstefano_zampini     PetscInt    size_of_constraint;
38122e8d2280SStefano Zampini     PetscBool   *array_bool;
3813ef028eecSStefano Zampini     PetscBool   first_found;
3814ef028eecSStefano Zampini     PetscInt    first_index,old_index,s;
3815ef028eecSStefano Zampini     PetscMPIInt mpi_local_primal_size;
3816ef028eecSStefano Zampini     PetscScalar coarsesum,*array;
3817ef028eecSStefano Zampini 
3818ef028eecSStefano Zampini     mpi_local_primal_size = (PetscMPIInt)pcbddc->local_primal_size;
3819beed3852SStefano Zampini 
3820beed3852SStefano Zampini     /* Construct needed data structures for message passing */
3821ef028eecSStefano Zampini     ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscInt),&pcbddc->local_primal_indices);CHKERRQ(ierr);
3822ffe5efe1SStefano Zampini     j = 0;
3823142dfd88SStefano Zampini     if (rank_prec_comm == 0 || pcbddc->coarse_problem_type == REPLICATED_BDDC || pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
3824ffe5efe1SStefano Zampini       j = size_prec_comm;
3825ffe5efe1SStefano Zampini     }
3826ffe5efe1SStefano Zampini     ierr = PetscMalloc(j*sizeof(PetscMPIInt),&pcbddc->local_primal_sizes);CHKERRQ(ierr);
3827ffe5efe1SStefano Zampini     ierr = PetscMalloc(j*sizeof(PetscMPIInt),&pcbddc->local_primal_displacements);CHKERRQ(ierr);
3828beed3852SStefano Zampini     /* Gather local_primal_size information for all processes  */
3829142dfd88SStefano Zampini     if (pcbddc->coarse_problem_type == REPLICATED_BDDC || pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
38305619798eSStefano Zampini       ierr = MPI_Allgather(&mpi_local_primal_size,1,MPIU_INT,&pcbddc->local_primal_sizes[0],1,MPIU_INT,prec_comm);CHKERRQ(ierr);
3831ffe5efe1SStefano Zampini     } else {
3832ffe5efe1SStefano Zampini       ierr = MPI_Gather(&mpi_local_primal_size,1,MPIU_INT,&pcbddc->local_primal_sizes[0],1,MPIU_INT,0,prec_comm);CHKERRQ(ierr);
3833ffe5efe1SStefano Zampini     }
3834beed3852SStefano Zampini     pcbddc->replicated_primal_size = 0;
3835ffe5efe1SStefano Zampini     for (i=0; i<j; i++) {
3836beed3852SStefano Zampini       pcbddc->local_primal_displacements[i] = pcbddc->replicated_primal_size;
3837beed3852SStefano Zampini       pcbddc->replicated_primal_size       += pcbddc->local_primal_sizes[i];
3838beed3852SStefano Zampini     }
3839beed3852SStefano Zampini 
3840da1bb401SStefano Zampini     /* First let's count coarse dofs.
3841beed3852SStefano Zampini        This code fragment assumes that the number of local constraints per connected component
3842beed3852SStefano Zampini        is not greater than the number of nodes defined for the connected component
3843beed3852SStefano Zampini        (otherwise we will surely have linear dependence between constraints and thus a singular coarse problem) */
3844ef028eecSStefano Zampini     ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscInt),&auxlocal_primal);CHKERRQ(ierr);
38452e8d2280SStefano Zampini     j    = 0;
38462e8d2280SStefano Zampini     for (i=0; i<pcbddc->local_primal_size; i++) {
38470298fd71SBarry Smith       ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,NULL,NULL);CHKERRQ(ierr);
38482fa5cd67SKarl Rupp       if (j < size_of_constraint) j = size_of_constraint;
38490298fd71SBarry Smith       ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,NULL,NULL);CHKERRQ(ierr);
38502e8d2280SStefano Zampini     }
38512e8d2280SStefano Zampini     ierr = PetscMalloc(j*sizeof(PetscInt),&aux_ordering);CHKERRQ(ierr);
38522e8d2280SStefano Zampini     ierr = PetscMalloc(j*sizeof(PetscInt),&row_cmat_global_indices);CHKERRQ(ierr);
38532e8d2280SStefano Zampini     ierr = PetscMalloc(pcis->n*sizeof(PetscBool),&array_bool);CHKERRQ(ierr);
38542fa5cd67SKarl Rupp     for (i=0;i<pcis->n;i++) array_bool[i] = PETSC_FALSE;
38552fa5cd67SKarl Rupp 
3856da1bb401SStefano Zampini     for (i=0;i<pcbddc->local_primal_size;i++) {
38570298fd71SBarry Smith       ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,NULL);CHKERRQ(ierr);
38582fa5cd67SKarl Rupp       for (j=0; j<size_of_constraint; j++) aux_ordering[j] = j;
38592fa5cd67SKarl Rupp 
38602e8d2280SStefano Zampini       ierr = ISLocalToGlobalMappingApply(matis->mapping,size_of_constraint,row_cmat_indices,row_cmat_global_indices);CHKERRQ(ierr);
38612e8d2280SStefano Zampini       ierr = PetscSortIntWithPermutation(size_of_constraint,row_cmat_global_indices,aux_ordering);CHKERRQ(ierr);
38622e8d2280SStefano Zampini       for (j=0; j<size_of_constraint; j++) {
38632e8d2280SStefano Zampini         k = row_cmat_indices[aux_ordering[j]];
38642e8d2280SStefano Zampini         if (!array_bool[k]) {
38652e8d2280SStefano Zampini           array_bool[k]      = PETSC_TRUE;
3866da1bb401SStefano Zampini           auxlocal_primal[i] = k;
3867beed3852SStefano Zampini           break;
3868beed3852SStefano Zampini         }
3869beed3852SStefano Zampini       }
38700298fd71SBarry Smith       ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,NULL);CHKERRQ(ierr);
3871beed3852SStefano Zampini     }
38722e8d2280SStefano Zampini     ierr = PetscFree(aux_ordering);CHKERRQ(ierr);
3873ef028eecSStefano Zampini     ierr = PetscFree(array_bool);CHKERRQ(ierr);
3874ef028eecSStefano Zampini     ierr = PetscFree(row_cmat_global_indices);CHKERRQ(ierr);
38752e8d2280SStefano Zampini 
3876ef028eecSStefano Zampini     /* Compute number of coarse dofs */
3877ef028eecSStefano Zampini     ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
3878ef028eecSStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
38792fa5cd67SKarl Rupp     for (i=0;i<pcbddc->local_primal_size;i++) array[auxlocal_primal[i]] = 1.0;
3880ef028eecSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3881ef028eecSStefano Zampini     ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
3882ef028eecSStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3883ef028eecSStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3884ef028eecSStefano Zampini     ierr = VecSum(pcis->vec1_global,&coarsesum);CHKERRQ(ierr);
3885ef028eecSStefano Zampini     pcbddc->coarse_size = (PetscInt)coarsesum;
3886ef028eecSStefano Zampini 
3887ef028eecSStefano Zampini     /* Fill pcis->vec1_global with cumulative function for global numbering */
3888ef028eecSStefano Zampini     ierr        = VecGetArray(pcis->vec1_global,&array);CHKERRQ(ierr);
3889ef028eecSStefano Zampini     ierr        = VecGetLocalSize(pcis->vec1_global,&s);CHKERRQ(ierr);
3890ef028eecSStefano Zampini     k           = 0;
3891ef028eecSStefano Zampini     first_index = -1;
3892ef028eecSStefano Zampini     first_found = PETSC_FALSE;
3893ef028eecSStefano Zampini     for (i=0; i<s; i++) {
3894ef028eecSStefano Zampini       if (!first_found && array[i] > 0.0) {
3895ef028eecSStefano Zampini         first_found = PETSC_TRUE;
3896ef028eecSStefano Zampini         first_index = i;
3897ef028eecSStefano Zampini       }
3898ef028eecSStefano Zampini       k += (PetscInt)array[i];
3899ef028eecSStefano Zampini     }
3900ef028eecSStefano Zampini     j    = (!rank_prec_comm ? size_prec_comm : 0);
3901ef028eecSStefano Zampini     ierr = PetscMalloc(j*sizeof(*dof_sizes),&dof_sizes);CHKERRQ(ierr);
3902ef028eecSStefano Zampini     ierr = PetscMalloc(j*sizeof(*dof_displs),&dof_displs);CHKERRQ(ierr);
3903ef028eecSStefano Zampini     ierr = MPI_Gather(&k,1,MPIU_INT,dof_sizes,1,MPIU_INT,0,prec_comm);CHKERRQ(ierr);
3904ef028eecSStefano Zampini     if (!rank_prec_comm) {
3905ef028eecSStefano Zampini       dof_displs[0]=0;
39062fa5cd67SKarl Rupp       for (i=1;i<size_prec_comm;i++) dof_displs[i] = dof_displs[i-1]+dof_sizes[i-1];
3907ef028eecSStefano Zampini     }
3908ef028eecSStefano Zampini     ierr = MPI_Scatter(dof_displs,1,MPIU_INT,&k,1,MPIU_INT,0,prec_comm);CHKERRQ(ierr);
3909ef028eecSStefano Zampini     if (first_found) {
3910ef028eecSStefano Zampini       array[first_index] += k;
3911ef028eecSStefano Zampini       old_index = first_index;
3912ef028eecSStefano Zampini       for (i=first_index+1;i<s;i++) {
3913ef028eecSStefano Zampini         if (array[i] > 0.0) {
3914ef028eecSStefano Zampini           array[i] += array[old_index];
3915ef028eecSStefano Zampini           old_index = i;
3916ef028eecSStefano Zampini         }
3917ef028eecSStefano Zampini       }
3918ef028eecSStefano Zampini     }
3919ef028eecSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_global,&array);CHKERRQ(ierr);
3920ef028eecSStefano Zampini     ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
3921ef028eecSStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3922ef028eecSStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3923ef028eecSStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
39242fa5cd67SKarl Rupp     for (i=0;i<pcbddc->local_primal_size;i++) pcbddc->local_primal_indices[i] = (PetscInt)array[auxlocal_primal[i]]-1;
3925ef028eecSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3926ef028eecSStefano Zampini     ierr = PetscFree(dof_displs);CHKERRQ(ierr);
3927ef028eecSStefano Zampini     ierr = PetscFree(dof_sizes);CHKERRQ(ierr);
3928ef028eecSStefano Zampini 
3929ef028eecSStefano Zampini     if (dbg_flag) {
39302e8d2280SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
39312e8d2280SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
39322e8d2280SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Check coarse indices\n");CHKERRQ(ierr);
39332e8d2280SStefano Zampini       ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
39342e8d2280SStefano Zampini       ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
39352fa5cd67SKarl Rupp       for (i=0;i<pcbddc->local_primal_size;i++) array[auxlocal_primal[i]]=1.0;
3936beed3852SStefano Zampini       ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
39372e8d2280SStefano Zampini       ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
3938da1bb401SStefano Zampini       ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3939da1bb401SStefano Zampini       ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3940da1bb401SStefano Zampini       ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3941da1bb401SStefano Zampini       ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3942da1bb401SStefano Zampini       ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
39432e8d2280SStefano Zampini       for (i=0;i<pcis->n;i++) {
39442e8d2280SStefano Zampini         if (array[i] == 1.0) {
39452e8d2280SStefano Zampini           ierr = ISLocalToGlobalMappingApply(matis->mapping,1,&i,&j);CHKERRQ(ierr);
39462e8d2280SStefano Zampini           ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d: WRONG COARSE INDEX %d (local %d)\n",PetscGlobalRank,j,i);CHKERRQ(ierr);
39472e8d2280SStefano Zampini         }
39482e8d2280SStefano Zampini       }
39492e8d2280SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
39502e8d2280SStefano Zampini       for (i=0;i<pcis->n;i++) {
39512fa5cd67SKarl Rupp         if (array[i] > 0.0) array[i] = 1.0/array[i];
39522e8d2280SStefano Zampini       }
3953da1bb401SStefano Zampini       ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
39542e8d2280SStefano Zampini       ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
3955da1bb401SStefano Zampini       ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3956da1bb401SStefano Zampini       ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3957da1bb401SStefano Zampini       ierr = VecSum(pcis->vec1_global,&coarsesum);CHKERRQ(ierr);
39582e8d2280SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Size of coarse problem SHOULD be %lf\n",coarsesum);CHKERRQ(ierr);
39592e8d2280SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
39602e8d2280SStefano Zampini     }
3961142dfd88SStefano Zampini     ierr = PetscFree(auxlocal_primal);CHKERRQ(ierr);
39620bdf917eSStefano Zampini   }
39630bdf917eSStefano Zampini 
39642e8d2280SStefano Zampini   if (dbg_flag) {
39657cf533a6SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"Size of coarse problem is %d\n",pcbddc->coarse_size);CHKERRQ(ierr);
39662e8d2280SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
39672e8d2280SStefano Zampini   }
39682e8d2280SStefano Zampini 
3969a929c220SStefano Zampini   im_active = 0;
39702fa5cd67SKarl Rupp   if (pcis->n) im_active = 1;
3971a929c220SStefano Zampini   ierr = MPI_Allreduce(&im_active,&active_procs,1,MPIU_INT,MPI_SUM,prec_comm);CHKERRQ(ierr);
39720bdf917eSStefano Zampini 
39730bdf917eSStefano Zampini   /* adapt coarse problem type */
39744fad6a16SStefano Zampini   if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
39754fad6a16SStefano Zampini     if (pcbddc->current_level < pcbddc->max_levels) {
3976a929c220SStefano Zampini       if ((active_procs/pcbddc->coarsening_ratio) < 2) {
39770bdf917eSStefano Zampini         if (dbg_flag) {
3978a929c220SStefano Zampini           ierr = PetscViewerASCIIPrintf(viewer,"Not enough active processes on level %d (active %d,ratio %d). Parallel direct solve for coarse problem\n",pcbddc->current_level,active_procs,pcbddc->coarsening_ratio);CHKERRQ(ierr);
39790bdf917eSStefano Zampini           ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
39800bdf917eSStefano Zampini         }
39810bdf917eSStefano Zampini         pcbddc->coarse_problem_type = PARALLEL_BDDC;
3982142dfd88SStefano Zampini       }
39834fad6a16SStefano Zampini     } else {
39844fad6a16SStefano Zampini       if (dbg_flag) {
3985a929c220SStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"Max number of levels reached. Using parallel direct solve for coarse problem\n",pcbddc->max_levels,active_procs,pcbddc->coarsening_ratio);CHKERRQ(ierr);
39864fad6a16SStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
39874fad6a16SStefano Zampini       }
39884fad6a16SStefano Zampini       pcbddc->coarse_problem_type = PARALLEL_BDDC;
39894fad6a16SStefano Zampini     }
39904fad6a16SStefano Zampini   }
3991beed3852SStefano Zampini 
39920c7d97c5SJed Brown   switch (pcbddc->coarse_problem_type) {
39930c7d97c5SJed Brown 
3994da1bb401SStefano Zampini   case (MULTILEVEL_BDDC):    /* we define a coarse mesh where subdomains are elements */
39950c7d97c5SJed Brown   {
39960c7d97c5SJed Brown     /* we need additional variables */
39970c7d97c5SJed Brown     MetisInt    n_subdomains,n_parts,objval,ncon,faces_nvtxs;
39980c7d97c5SJed Brown     MetisInt    *metis_coarse_subdivision;
39990c7d97c5SJed Brown     MetisInt    options[METIS_NOPTIONS];
40000c7d97c5SJed Brown     PetscMPIInt size_coarse_comm,rank_coarse_comm;
40010c7d97c5SJed Brown     PetscMPIInt procs_jumps_coarse_comm;
40020c7d97c5SJed Brown     PetscMPIInt *coarse_subdivision;
40030c7d97c5SJed Brown     PetscMPIInt *total_count_recv;
40040c7d97c5SJed Brown     PetscMPIInt *total_ranks_recv;
40050c7d97c5SJed Brown     PetscMPIInt *displacements_recv;
40060c7d97c5SJed Brown     PetscMPIInt *my_faces_connectivity;
40070c7d97c5SJed Brown     PetscMPIInt *petsc_faces_adjncy;
40080c7d97c5SJed Brown     MetisInt    *faces_adjncy;
40090c7d97c5SJed Brown     MetisInt    *faces_xadj;
40100c7d97c5SJed Brown     PetscMPIInt *number_of_faces;
40110c7d97c5SJed Brown     PetscMPIInt *faces_displacements;
40120c7d97c5SJed Brown     PetscInt    *array_int;
40130c7d97c5SJed Brown     PetscMPIInt my_faces   =0;
40140c7d97c5SJed Brown     PetscMPIInt total_faces=0;
40153828260eSStefano Zampini     PetscInt    ranks_stretching_ratio;
40160c7d97c5SJed Brown 
40170c7d97c5SJed Brown     /* define some quantities */
40180c7d97c5SJed Brown     pcbddc->coarse_communications_type = SCATTERS_BDDC;
40190c7d97c5SJed Brown     coarse_mat_type                    = MATIS;
40200c7d97c5SJed Brown     coarse_pc_type                     = PCBDDC;
4021142dfd88SStefano Zampini     coarse_ksp_type                    = KSPRICHARDSON;
40220c7d97c5SJed Brown 
40230c7d97c5SJed Brown     /* details of coarse decomposition */
4024a929c220SStefano Zampini     n_subdomains            = active_procs;
40250c7d97c5SJed Brown     n_parts                 = n_subdomains/pcbddc->coarsening_ratio;
4026a929c220SStefano Zampini     ranks_stretching_ratio  = size_prec_comm/active_procs;
40273828260eSStefano Zampini     procs_jumps_coarse_comm = pcbddc->coarsening_ratio*ranks_stretching_ratio;
40283828260eSStefano Zampini 
4029a929c220SStefano Zampini #if 0
4030a929c220SStefano Zampini     PetscMPIInt     *old_ranks;
4031a929c220SStefano Zampini     PetscInt        *new_ranks,*jj,*ii;
4032a929c220SStefano Zampini     MatPartitioning mat_part;
4033a929c220SStefano Zampini     IS              coarse_new_decomposition,is_numbering;
4034a929c220SStefano Zampini     PetscViewer     viewer_test;
4035a929c220SStefano Zampini     MPI_Comm        test_coarse_comm;
4036a929c220SStefano Zampini     PetscMPIInt     test_coarse_color;
4037a929c220SStefano Zampini     Mat             mat_adj;
4038a929c220SStefano Zampini     /* Create new communicator for coarse problem splitting the old one */
4039a929c220SStefano Zampini     /* procs with coarse_color = MPI_UNDEFINED will have coarse_comm = MPI_COMM_NULL (from mpi standards)
4040a929c220SStefano Zampini        key = rank_prec_comm -> keep same ordering of ranks from the old to the new communicator */
4041a929c220SStefano Zampini     test_coarse_color = (im_active ? 0 : MPI_UNDEFINED);
4042a929c220SStefano Zampini     test_coarse_comm  = MPI_COMM_NULL;
4043a929c220SStefano Zampini     ierr              = MPI_Comm_split(prec_comm,test_coarse_color,rank_prec_comm,&test_coarse_comm);CHKERRQ(ierr);
4044a929c220SStefano Zampini     if (im_active) {
4045a929c220SStefano Zampini       ierr = PetscMalloc(n_subdomains*sizeof(PetscMPIInt),&old_ranks);
4046a929c220SStefano Zampini       ierr = PetscMalloc(size_prec_comm*sizeof(PetscInt),&new_ranks);
4047a929c220SStefano Zampini       ierr = MPI_Comm_rank(test_coarse_comm,&rank_coarse_comm);CHKERRQ(ierr);
4048a929c220SStefano Zampini       ierr = MPI_Comm_size(test_coarse_comm,&j);CHKERRQ(ierr);
4049a929c220SStefano Zampini       ierr = MPI_Allgather(&rank_prec_comm,1,MPIU_INT,old_ranks,1,MPIU_INT,test_coarse_comm);CHKERRQ(ierr);
40502fa5cd67SKarl Rupp       for (i=0; i<size_prec_comm; i++)
4051a929c220SStefano Zampini         new_ranks[i] = -1;
40522fa5cd67SKarl Rupp       for (i=0; i<n_subdomains; i++)
4053a929c220SStefano Zampini         new_ranks[old_ranks[i]] = i;
4054a929c220SStefano Zampini       ierr = PetscViewerASCIIOpen(test_coarse_comm,"test_mat_part.out",&viewer_test);CHKERRQ(ierr);
4055a929c220SStefano Zampini       k    = pcis->n_neigh-1;
4056a929c220SStefano Zampini       ierr = PetscMalloc(2*sizeof(PetscInt),&ii);
4057a929c220SStefano Zampini       ii[0]=0;
4058a929c220SStefano Zampini       ii[1]=k;
4059a929c220SStefano Zampini       ierr = PetscMalloc(k*sizeof(PetscInt),&jj);
40602fa5cd67SKarl Rupp       for (i=0; i<k; i++)
4061a929c220SStefano Zampini         jj[i]=new_ranks[pcis->neigh[i+1]];
4062a929c220SStefano Zampini       ierr = PetscSortInt(k,jj);CHKERRQ(ierr);
40630298fd71SBarry Smith       ierr = MatCreateMPIAdj(test_coarse_comm,1,n_subdomains,ii,jj,NULL,&mat_adj);CHKERRQ(ierr);
4064a929c220SStefano Zampini       ierr = MatView(mat_adj,viewer_test);CHKERRQ(ierr);
4065a929c220SStefano Zampini       ierr = MatPartitioningCreate(test_coarse_comm,&mat_part);CHKERRQ(ierr);
4066a929c220SStefano Zampini       ierr = MatPartitioningSetAdjacency(mat_part,mat_adj);CHKERRQ(ierr);
4067a929c220SStefano Zampini       ierr = MatPartitioningSetFromOptions(mat_part);CHKERRQ(ierr);
4068a929c220SStefano Zampini       printf("Setting Nparts %d\n",n_parts);
4069a929c220SStefano Zampini       ierr = MatPartitioningSetNParts(mat_part,n_parts);CHKERRQ(ierr);
4070a929c220SStefano Zampini       ierr = MatPartitioningView(mat_part,viewer_test);CHKERRQ(ierr);
4071a929c220SStefano Zampini       ierr = MatPartitioningApply(mat_part,&coarse_new_decomposition);CHKERRQ(ierr);
4072a929c220SStefano Zampini       ierr = ISView(coarse_new_decomposition,viewer_test);CHKERRQ(ierr);
4073a929c220SStefano Zampini       ierr = ISPartitioningToNumbering(coarse_new_decomposition,&is_numbering);CHKERRQ(ierr);
4074a929c220SStefano Zampini       ierr = ISView(is_numbering,viewer_test);CHKERRQ(ierr);
4075a929c220SStefano Zampini       ierr = PetscViewerDestroy(&viewer_test);CHKERRQ(ierr);
4076a929c220SStefano Zampini       ierr = ISDestroy(&coarse_new_decomposition);CHKERRQ(ierr);
4077a929c220SStefano Zampini       ierr = ISDestroy(&is_numbering);CHKERRQ(ierr);
4078a929c220SStefano Zampini       ierr = MatPartitioningDestroy(&mat_part);CHKERRQ(ierr);
4079a929c220SStefano Zampini       ierr = PetscFree(old_ranks);CHKERRQ(ierr);
4080a929c220SStefano Zampini       ierr = PetscFree(new_ranks);CHKERRQ(ierr);
4081a929c220SStefano Zampini       ierr = MPI_Comm_free(&test_coarse_comm);CHKERRQ(ierr);
4082a929c220SStefano Zampini     }
4083a929c220SStefano Zampini #endif
4084a929c220SStefano Zampini 
40854fad6a16SStefano Zampini     /* build CSR graph of subdomains' connectivity */
40860c7d97c5SJed Brown     ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&array_int);CHKERRQ(ierr);
40873828260eSStefano Zampini     ierr = PetscMemzero(array_int,pcis->n*sizeof(PetscInt));CHKERRQ(ierr);
40880c7d97c5SJed Brown     for (i=1;i<pcis->n_neigh;i++) {/* i=1 so I don't count myself -> faces nodes counts to 1 */
40890c7d97c5SJed Brown       for (j=0;j<pcis->n_shared[i];j++) {
40900c7d97c5SJed Brown         array_int[pcis->shared[i][j]]+=1;
40910c7d97c5SJed Brown       }
40920c7d97c5SJed Brown     }
40930c7d97c5SJed Brown     for (i=1;i<pcis->n_neigh;i++) {
40940c7d97c5SJed Brown       for (j=0;j<pcis->n_shared[i];j++) {
40957cf533a6SStefano Zampini         if (array_int[pcis->shared[i][j]] > 0) {
40960c7d97c5SJed Brown           my_faces++;
40970c7d97c5SJed Brown           break;
40980c7d97c5SJed Brown         }
40990c7d97c5SJed Brown       }
41000c7d97c5SJed Brown     }
41010c7d97c5SJed Brown 
410253cdbc3dSStefano Zampini     ierr = MPI_Reduce(&my_faces,&total_faces,1,MPIU_INT,MPI_SUM,master_proc,prec_comm);CHKERRQ(ierr);
41030c7d97c5SJed Brown     ierr = PetscMalloc (my_faces*sizeof(PetscInt),&my_faces_connectivity);CHKERRQ(ierr);
41040c7d97c5SJed Brown     my_faces=0;
41050c7d97c5SJed Brown     for (i=1;i<pcis->n_neigh;i++) {
41060c7d97c5SJed Brown       for (j=0;j<pcis->n_shared[i];j++) {
41077cf533a6SStefano Zampini         if (array_int[pcis->shared[i][j]] > 0) {
41080c7d97c5SJed Brown           my_faces_connectivity[my_faces]=pcis->neigh[i];
41090c7d97c5SJed Brown           my_faces++;
41100c7d97c5SJed Brown           break;
41110c7d97c5SJed Brown         }
41120c7d97c5SJed Brown       }
41130c7d97c5SJed Brown     }
41140c7d97c5SJed Brown     if (rank_prec_comm == master_proc) {
41150c7d97c5SJed Brown       ierr = PetscMalloc (total_faces*sizeof(PetscMPIInt),&petsc_faces_adjncy);CHKERRQ(ierr);
41160c7d97c5SJed Brown       ierr = PetscMalloc (size_prec_comm*sizeof(PetscMPIInt),&number_of_faces);CHKERRQ(ierr);
41170c7d97c5SJed Brown       ierr = PetscMalloc (total_faces*sizeof(MetisInt),&faces_adjncy);CHKERRQ(ierr);
41180c7d97c5SJed Brown       ierr = PetscMalloc ((n_subdomains+1)*sizeof(MetisInt),&faces_xadj);CHKERRQ(ierr);
41190c7d97c5SJed Brown       ierr = PetscMalloc ((size_prec_comm+1)*sizeof(PetscMPIInt),&faces_displacements);CHKERRQ(ierr);
41200c7d97c5SJed Brown     }
412153cdbc3dSStefano Zampini     ierr = MPI_Gather(&my_faces,1,MPIU_INT,&number_of_faces[0],1,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
41220c7d97c5SJed Brown     if (rank_prec_comm == master_proc) {
41230c7d97c5SJed Brown       faces_xadj[0]          = 0;
41240c7d97c5SJed Brown       faces_displacements[0] = 0;
41252fa5cd67SKarl Rupp 
41260c7d97c5SJed Brown       j=0;
41270c7d97c5SJed Brown       for (i=1;i<size_prec_comm+1;i++) {
41280c7d97c5SJed Brown         faces_displacements[i]=faces_displacements[i-1]+number_of_faces[i-1];
41290c7d97c5SJed Brown         if (number_of_faces[i-1]) {
41300c7d97c5SJed Brown           j++;
41310c7d97c5SJed Brown           faces_xadj[j]=faces_xadj[j-1]+number_of_faces[i-1];
41320c7d97c5SJed Brown         }
41330c7d97c5SJed Brown       }
41340c7d97c5SJed Brown     }
413553cdbc3dSStefano Zampini     ierr = MPI_Gatherv(&my_faces_connectivity[0],my_faces,MPIU_INT,&petsc_faces_adjncy[0],number_of_faces,faces_displacements,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
41360c7d97c5SJed Brown     ierr = PetscFree(my_faces_connectivity);CHKERRQ(ierr);
41370c7d97c5SJed Brown     ierr = PetscFree(array_int);CHKERRQ(ierr);
41380c7d97c5SJed Brown     if (rank_prec_comm == master_proc) {
41393828260eSStefano Zampini       for (i=0; i<total_faces; i++) faces_adjncy[i]=(MetisInt)(petsc_faces_adjncy[i]/ranks_stretching_ratio); /* cast to MetisInt */
41400c7d97c5SJed Brown       ierr = PetscFree(faces_displacements);CHKERRQ(ierr);
41410c7d97c5SJed Brown       ierr = PetscFree(number_of_faces);CHKERRQ(ierr);
41420c7d97c5SJed Brown       ierr = PetscFree(petsc_faces_adjncy);CHKERRQ(ierr);
41430c7d97c5SJed Brown     }
41440c7d97c5SJed Brown 
41450c7d97c5SJed Brown     if (rank_prec_comm == master_proc) {
41463828260eSStefano Zampini       PetscInt heuristic_for_metis=3;
41470c7d97c5SJed Brown       ncon       =1;
41480c7d97c5SJed Brown       faces_nvtxs=n_subdomains;
41490c7d97c5SJed Brown       /* partition graoh induced by face connectivity */
41500c7d97c5SJed Brown       ierr = PetscMalloc (n_subdomains*sizeof(MetisInt),&metis_coarse_subdivision);CHKERRQ(ierr);
41510c7d97c5SJed Brown       ierr = METIS_SetDefaultOptions(options);
41520c7d97c5SJed Brown       /* we need a contiguous partition of the coarse mesh */
41530c7d97c5SJed Brown       options[METIS_OPTION_CONTIG]=1;
41540c7d97c5SJed Brown       options[METIS_OPTION_NITER] =30;
41554fad6a16SStefano Zampini       if (pcbddc->coarsening_ratio > 1) {
41563828260eSStefano Zampini         if (n_subdomains>n_parts*heuristic_for_metis) {
41573828260eSStefano Zampini           options[METIS_OPTION_IPTYPE] =METIS_IPTYPE_EDGE;
41583828260eSStefano Zampini           options[METIS_OPTION_OBJTYPE]=METIS_OBJTYPE_CUT;
41592fa5cd67SKarl Rupp 
41600c7d97c5SJed Brown           ierr = METIS_PartGraphKway(&faces_nvtxs,&ncon,faces_xadj,faces_adjncy,NULL,NULL,NULL,&n_parts,NULL,NULL,options,&objval,metis_coarse_subdivision);
4161142dfd88SStefano Zampini           if (ierr != METIS_OK) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in METIS_PartGraphKway (metis error code %D) called from PCBDDCSetupCoarseEnvironment\n",ierr);
41623828260eSStefano Zampini         } else {
41633828260eSStefano Zampini           ierr = METIS_PartGraphRecursive(&faces_nvtxs,&ncon,faces_xadj,faces_adjncy,NULL,NULL,NULL,&n_parts,NULL,NULL,options,&objval,metis_coarse_subdivision);
4164142dfd88SStefano Zampini           if (ierr != METIS_OK) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in METIS_PartGraphRecursive (metis error code %D) called from PCBDDCSetupCoarseEnvironment\n",ierr);
41653828260eSStefano Zampini         }
41664fad6a16SStefano Zampini       } else {
41672fa5cd67SKarl Rupp         for (i=0;i<n_subdomains;i++) metis_coarse_subdivision[i]=i;
41684fad6a16SStefano Zampini       }
41690c7d97c5SJed Brown       ierr = PetscFree(faces_xadj);CHKERRQ(ierr);
41700c7d97c5SJed Brown       ierr = PetscFree(faces_adjncy);CHKERRQ(ierr);
41710bdf917eSStefano Zampini       ierr = PetscMalloc(size_prec_comm*sizeof(PetscMPIInt),&coarse_subdivision);CHKERRQ(ierr);
41722fa5cd67SKarl Rupp 
41730c7d97c5SJed Brown       /* copy/cast values avoiding possible type conflicts between PETSc, MPI and METIS */
41742fa5cd67SKarl Rupp       for (i=0;i<size_prec_comm;i++) coarse_subdivision[i]=MPI_PROC_NULL;
41752fa5cd67SKarl Rupp       for (i=0;i<n_subdomains;i++) coarse_subdivision[ranks_stretching_ratio*i]=(PetscInt)(metis_coarse_subdivision[i]);
41760c7d97c5SJed Brown       ierr = PetscFree(metis_coarse_subdivision);CHKERRQ(ierr);
41770c7d97c5SJed Brown     }
41780c7d97c5SJed Brown 
41790c7d97c5SJed Brown     /* Create new communicator for coarse problem splitting the old one */
41800c7d97c5SJed Brown     if (!(rank_prec_comm%procs_jumps_coarse_comm) && rank_prec_comm < procs_jumps_coarse_comm*n_parts) {
4181da1bb401SStefano Zampini       coarse_color=0;                /* for communicator splitting */
4182da1bb401SStefano Zampini       active_rank =rank_prec_comm;   /* for insertion of matrix values */
41830c7d97c5SJed Brown     }
4184da1bb401SStefano Zampini     /* procs with coarse_color = MPI_UNDEFINED will have coarse_comm = MPI_COMM_NULL (from mpi standards)
4185da1bb401SStefano Zampini        key = rank_prec_comm -> keep same ordering of ranks from the old to the new communicator */
418653cdbc3dSStefano Zampini     ierr = MPI_Comm_split(prec_comm,coarse_color,rank_prec_comm,&coarse_comm);CHKERRQ(ierr);
41870c7d97c5SJed Brown 
41880c7d97c5SJed Brown     if (coarse_color == 0) {
418953cdbc3dSStefano Zampini       ierr = MPI_Comm_size(coarse_comm,&size_coarse_comm);CHKERRQ(ierr);
419053cdbc3dSStefano Zampini       ierr = MPI_Comm_rank(coarse_comm,&rank_coarse_comm);CHKERRQ(ierr);
41910c7d97c5SJed Brown     } else {
41920c7d97c5SJed Brown       rank_coarse_comm = MPI_PROC_NULL;
41930c7d97c5SJed Brown     }
41940c7d97c5SJed Brown 
41957cf533a6SStefano Zampini     /* master proc take care of arranging and distributing coarse information */
41960c7d97c5SJed Brown     if (rank_coarse_comm == master_proc) {
41970c7d97c5SJed Brown       ierr = PetscMalloc (size_coarse_comm*sizeof(PetscMPIInt),&displacements_recv);CHKERRQ(ierr);
41980bdf917eSStefano Zampini       ierr = PetscMalloc (size_coarse_comm*sizeof(PetscMPIInt),&total_count_recv);CHKERRQ(ierr);
41990bdf917eSStefano Zampini       ierr = PetscMalloc (n_subdomains*sizeof(PetscMPIInt),&total_ranks_recv);CHKERRQ(ierr);
42000c7d97c5SJed Brown       /* some initializations */
42010c7d97c5SJed Brown       displacements_recv[0]=0;
42020bdf917eSStefano Zampini       ierr = PetscMemzero(total_count_recv,size_coarse_comm*sizeof(PetscMPIInt));CHKERRQ(ierr);
42030c7d97c5SJed Brown       /* count from how many processes the j-th process of the coarse decomposition will receive data */
42040bdf917eSStefano Zampini       for (j=0; j<size_coarse_comm; j++) {
42050bdf917eSStefano Zampini         for (i=0; i<size_prec_comm; i++) {
42062fa5cd67SKarl Rupp           if (coarse_subdivision[i]==j) total_count_recv[j]++;
42070bdf917eSStefano Zampini         }
42080bdf917eSStefano Zampini       }
42090c7d97c5SJed Brown       /* displacements needed for scatterv of total_ranks_recv */
42102fa5cd67SKarl Rupp       for (i=1; i<size_coarse_comm; i++) displacements_recv[i]=displacements_recv[i-1]+total_count_recv[i-1];
42112fa5cd67SKarl Rupp 
42120c7d97c5SJed Brown       /* Now fill properly total_ranks_recv -> each coarse process will receive the ranks (in prec_comm communicator) of its friend (sending) processes */
42130c7d97c5SJed Brown       ierr = PetscMemzero(total_count_recv,size_coarse_comm*sizeof(PetscMPIInt));CHKERRQ(ierr);
42140c7d97c5SJed Brown       for (j=0; j<size_coarse_comm; j++) {
42153828260eSStefano Zampini         for (i=0; i<size_prec_comm; i++) {
42160c7d97c5SJed Brown           if (coarse_subdivision[i]==j) {
42170c7d97c5SJed Brown             total_ranks_recv[displacements_recv[j]+total_count_recv[j]] = i;
42182fa5cd67SKarl Rupp 
42193828260eSStefano Zampini             total_count_recv[j] += 1;
42200c7d97c5SJed Brown           }
42210c7d97c5SJed Brown         }
42220c7d97c5SJed Brown       }
4223da1bb401SStefano Zampini       /* for (j=0;j<size_coarse_comm;j++) {
42243828260eSStefano Zampini         printf("process %d in new rank will receive from %d processes (original ranks follows)\n",j,total_count_recv[j]);
42253828260eSStefano Zampini         for (i=0;i<total_count_recv[j];i++) {
42263828260eSStefano Zampini           printf("%d ",total_ranks_recv[displacements_recv[j]+i]);
42273828260eSStefano Zampini         }
42283828260eSStefano Zampini         printf("\n");
4229da1bb401SStefano Zampini       } */
42300c7d97c5SJed Brown 
42310c7d97c5SJed Brown       /* identify new decomposition in terms of ranks in the old communicator */
42320bdf917eSStefano Zampini       for (i=0; i<n_subdomains; i++) {
42330bdf917eSStefano Zampini         coarse_subdivision[ranks_stretching_ratio*i]=coarse_subdivision[ranks_stretching_ratio*i]*procs_jumps_coarse_comm;
42340bdf917eSStefano Zampini       }
4235da1bb401SStefano Zampini       /* printf("coarse_subdivision in old end new ranks\n");
42362fa5cd67SKarl Rupp       for (i=0;i<size_prec_comm;i++) {
42373828260eSStefano Zampini         if (coarse_subdivision[i]!=MPI_PROC_NULL) {
42383828260eSStefano Zampini           printf("%d=(%d %d), ",i,coarse_subdivision[i],coarse_subdivision[i]/procs_jumps_coarse_comm);
42393828260eSStefano Zampini         } else {
42403828260eSStefano Zampini           printf("%d=(%d %d), ",i,coarse_subdivision[i],coarse_subdivision[i]);
42413828260eSStefano Zampini         }
42422fa5cd67SKarl Rupp       }
4243da1bb401SStefano Zampini       printf("\n"); */
42440c7d97c5SJed Brown     }
42450c7d97c5SJed Brown 
42460c7d97c5SJed Brown     /* Scatter new decomposition for send details */
424753cdbc3dSStefano Zampini     ierr = MPI_Scatter(&coarse_subdivision[0],1,MPIU_INT,&rank_coarse_proc_send_to,1,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
42480c7d97c5SJed Brown     /* Scatter receiving details to members of coarse decomposition */
42490c7d97c5SJed Brown     if (coarse_color == 0) {
425053cdbc3dSStefano Zampini       ierr = MPI_Scatter(&total_count_recv[0],1,MPIU_INT,&count_recv,1,MPIU_INT,master_proc,coarse_comm);CHKERRQ(ierr);
42510c7d97c5SJed Brown       ierr = PetscMalloc (count_recv*sizeof(PetscMPIInt),&ranks_recv);CHKERRQ(ierr);
425253cdbc3dSStefano Zampini       ierr = MPI_Scatterv(&total_ranks_recv[0],total_count_recv,displacements_recv,MPIU_INT,&ranks_recv[0],count_recv,MPIU_INT,master_proc,coarse_comm);CHKERRQ(ierr);
42530c7d97c5SJed Brown     }
42540c7d97c5SJed Brown 
4255da1bb401SStefano Zampini     /* printf("I will send my matrix data to proc  %d\n",rank_coarse_proc_send_to);
4256da1bb401SStefano Zampini     if (coarse_color == 0) {
4257da1bb401SStefano Zampini       printf("I will receive some matrix data from %d processes (ranks follows)\n",count_recv);
4258da1bb401SStefano Zampini       for (i=0;i<count_recv;i++)
4259da1bb401SStefano Zampini         printf("%d ",ranks_recv[i]);
4260da1bb401SStefano Zampini       printf("\n");
4261da1bb401SStefano Zampini     } */
42620c7d97c5SJed Brown 
42630c7d97c5SJed Brown     if (rank_prec_comm == master_proc) {
42640bdf917eSStefano Zampini       ierr = PetscFree(coarse_subdivision);CHKERRQ(ierr);
4265da1bb401SStefano Zampini       ierr = PetscFree(total_count_recv);CHKERRQ(ierr);
42660bdf917eSStefano Zampini       ierr = PetscFree(total_ranks_recv);CHKERRQ(ierr);
42670c7d97c5SJed Brown       ierr = PetscFree(displacements_recv);CHKERRQ(ierr);
42680c7d97c5SJed Brown     }
42690c7d97c5SJed Brown     break;
42700c7d97c5SJed Brown   }
42710c7d97c5SJed Brown 
42720c7d97c5SJed Brown   case (REPLICATED_BDDC):
42730c7d97c5SJed Brown 
42740c7d97c5SJed Brown     pcbddc->coarse_communications_type = GATHERS_BDDC;
42750c7d97c5SJed Brown     coarse_mat_type                    = MATSEQAIJ;
42760c7d97c5SJed Brown     coarse_pc_type                     = PCLU;
427753cdbc3dSStefano Zampini     coarse_ksp_type                    = KSPPREONLY;
42780c7d97c5SJed Brown     coarse_comm                        = PETSC_COMM_SELF;
42790c7d97c5SJed Brown     active_rank                        = rank_prec_comm;
42800c7d97c5SJed Brown     break;
42810c7d97c5SJed Brown 
42820c7d97c5SJed Brown   case (PARALLEL_BDDC):
42830c7d97c5SJed Brown 
42840c7d97c5SJed Brown     pcbddc->coarse_communications_type = SCATTERS_BDDC;
42850c7d97c5SJed Brown     coarse_mat_type                    = MATMPIAIJ;
42860c7d97c5SJed Brown     coarse_pc_type                     = PCREDUNDANT;
428753cdbc3dSStefano Zampini     coarse_ksp_type                    = KSPPREONLY;
42880c7d97c5SJed Brown     coarse_comm                        = prec_comm;
42890c7d97c5SJed Brown     active_rank                        = rank_prec_comm;
42900c7d97c5SJed Brown     break;
42910c7d97c5SJed Brown 
42920c7d97c5SJed Brown   case (SEQUENTIAL_BDDC):
42930c7d97c5SJed Brown     pcbddc->coarse_communications_type = GATHERS_BDDC;
42940c7d97c5SJed Brown     coarse_mat_type                    = MATSEQAIJ;
42950c7d97c5SJed Brown     coarse_pc_type                     = PCLU;
429653cdbc3dSStefano Zampini     coarse_ksp_type                    = KSPPREONLY;
42970c7d97c5SJed Brown     coarse_comm                        = PETSC_COMM_SELF;
42980c7d97c5SJed Brown     active_rank                        = master_proc;
42990c7d97c5SJed Brown     break;
43000c7d97c5SJed Brown   }
43010c7d97c5SJed Brown 
43020c7d97c5SJed Brown   switch (pcbddc->coarse_communications_type) {
43030c7d97c5SJed Brown 
43040c7d97c5SJed Brown   case(SCATTERS_BDDC):
43050c7d97c5SJed Brown   {
43060c7d97c5SJed Brown     if (pcbddc->coarse_problem_type==MULTILEVEL_BDDC) {
43070c7d97c5SJed Brown 
43082e8d2280SStefano Zampini       IS coarse_IS;
43092e8d2280SStefano Zampini 
4310523858cfSStefano Zampini       if (pcbddc->coarsening_ratio == 1) {
4311523858cfSStefano Zampini         ins_local_primal_size = pcbddc->local_primal_size;
4312523858cfSStefano Zampini         ins_local_primal_indices = pcbddc->local_primal_indices;
4313523858cfSStefano Zampini         if (coarse_color == 0) { ierr = PetscFree(ranks_recv);CHKERRQ(ierr); }
4314523858cfSStefano Zampini         /* nonzeros */
4315523858cfSStefano Zampini         ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&dnz);CHKERRQ(ierr);
4316523858cfSStefano Zampini         ierr = PetscMemzero(dnz,ins_local_primal_size*sizeof(PetscInt));CHKERRQ(ierr);
4317523858cfSStefano Zampini         for (i=0;i<ins_local_primal_size;i++) {
4318523858cfSStefano Zampini           dnz[i] = ins_local_primal_size;
4319523858cfSStefano Zampini         }
4320523858cfSStefano Zampini       } else {
43210c7d97c5SJed Brown         PetscMPIInt send_size;
4322ef028eecSStefano Zampini         PetscMPIInt *send_buffer;
43230c7d97c5SJed Brown         PetscInt    *aux_ins_indices;
43240c7d97c5SJed Brown         PetscInt    ii,jj;
43250c7d97c5SJed Brown         MPI_Request *requests;
4326ef028eecSStefano Zampini 
4327523858cfSStefano Zampini         ierr = PetscMalloc(count_recv*sizeof(PetscMPIInt),&localdispl2);CHKERRQ(ierr);
4328523858cfSStefano Zampini         /* reusing pcbddc->local_primal_displacements and pcbddc->replicated_primal_size */
4329523858cfSStefano Zampini         ierr = PetscFree(pcbddc->local_primal_displacements);CHKERRQ(ierr);
4330523858cfSStefano Zampini         ierr = PetscMalloc((count_recv+1)*sizeof(PetscMPIInt),&pcbddc->local_primal_displacements);CHKERRQ(ierr);
4331523858cfSStefano Zampini         pcbddc->replicated_primal_size = count_recv;
4332523858cfSStefano Zampini         j = 0;
4333523858cfSStefano Zampini         for (i=0;i<count_recv;i++) {
4334523858cfSStefano Zampini           pcbddc->local_primal_displacements[i] = j;
4335523858cfSStefano Zampini           j += pcbddc->local_primal_sizes[ranks_recv[i]];
4336523858cfSStefano Zampini         }
4337523858cfSStefano Zampini         pcbddc->local_primal_displacements[count_recv] = j;
4338523858cfSStefano Zampini         ierr = PetscMalloc(j*sizeof(PetscMPIInt),&pcbddc->replicated_local_primal_indices);CHKERRQ(ierr);
43390c7d97c5SJed Brown         /* allocate auxiliary space */
4340523858cfSStefano Zampini         ierr = PetscMalloc(count_recv*sizeof(PetscMPIInt),&localsizes2);CHKERRQ(ierr);
43410c7d97c5SJed Brown         ierr = PetscMalloc(pcbddc->coarse_size*sizeof(PetscInt),&aux_ins_indices);CHKERRQ(ierr);
43420c7d97c5SJed Brown         ierr = PetscMemzero(aux_ins_indices,pcbddc->coarse_size*sizeof(PetscInt));CHKERRQ(ierr);
43430c7d97c5SJed Brown         /* allocate storage for message passing */
43440c7d97c5SJed Brown         ierr = PetscMalloc((count_recv+1)*sizeof(MPI_Request),&requests);CHKERRQ(ierr);
4345523858cfSStefano Zampini         for (i=0;i<count_recv+1;i++) { requests[i]=MPI_REQUEST_NULL; }
4346523858cfSStefano Zampini         /* send indices to be inserted */
4347523858cfSStefano Zampini         for (i=0;i<count_recv;i++) {
4348523858cfSStefano Zampini           send_size = pcbddc->local_primal_sizes[ranks_recv[i]];
4349523858cfSStefano Zampini           ierr = MPI_Irecv(&pcbddc->replicated_local_primal_indices[pcbddc->local_primal_displacements[i]],send_size,MPIU_INT,ranks_recv[i],999,prec_comm,&requests[i]);CHKERRQ(ierr);
4350523858cfSStefano Zampini         }
4351523858cfSStefano Zampini         if (rank_coarse_proc_send_to != MPI_PROC_NULL) {
4352523858cfSStefano Zampini           send_size = pcbddc->local_primal_size;
4353ef028eecSStefano Zampini           ierr = PetscMalloc(send_size*sizeof(PetscMPIInt),&send_buffer);CHKERRQ(ierr);
4354ef028eecSStefano Zampini           for (i=0;i<send_size;i++) {
4355ef028eecSStefano Zampini             send_buffer[i]=(PetscMPIInt)pcbddc->local_primal_indices[i];
4356ef028eecSStefano Zampini           }
4357ef028eecSStefano Zampini           ierr = MPI_Isend(send_buffer,send_size,MPIU_INT,rank_coarse_proc_send_to,999,prec_comm,&requests[count_recv]);CHKERRQ(ierr);
4358523858cfSStefano Zampini         }
4359523858cfSStefano Zampini         ierr = MPI_Waitall(count_recv+1,requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4360ef028eecSStefano Zampini         if (rank_coarse_proc_send_to != MPI_PROC_NULL) {
4361ef028eecSStefano Zampini           ierr = PetscFree(send_buffer);CHKERRQ(ierr);
4362ef028eecSStefano Zampini         }
43630c7d97c5SJed Brown         j = 0;
43640c7d97c5SJed Brown         for (i=0;i<count_recv;i++) {
43652e8d2280SStefano Zampini           ii = pcbddc->local_primal_displacements[i+1]-pcbddc->local_primal_displacements[i];
43662e8d2280SStefano Zampini           localsizes2[i] = ii*ii;
43670c7d97c5SJed Brown           localdispl2[i] = j;
43680c7d97c5SJed Brown           j += localsizes2[i];
4369523858cfSStefano Zampini           jj = pcbddc->local_primal_displacements[i];
43704fad6a16SStefano Zampini           /* it counts the coarse subdomains sharing the coarse node */
43712e8d2280SStefano Zampini           for (k=0;k<ii;k++) {
43724fad6a16SStefano Zampini             aux_ins_indices[pcbddc->replicated_local_primal_indices[jj+k]] += 1;
43730c7d97c5SJed Brown           }
43744fad6a16SStefano Zampini         }
4375523858cfSStefano Zampini         /* temp_coarse_mat_vals used to store matrix values to be received */
43760c7d97c5SJed Brown         ierr = PetscMalloc(j*sizeof(PetscScalar),&temp_coarse_mat_vals);CHKERRQ(ierr);
43770c7d97c5SJed Brown         /* evaluate how many values I will insert in coarse mat */
43780c7d97c5SJed Brown         ins_local_primal_size = 0;
4379ea7e1babSStefano Zampini         for (i=0;i<pcbddc->coarse_size;i++) {
4380ea7e1babSStefano Zampini           if (aux_ins_indices[i]) {
43810c7d97c5SJed Brown             ins_local_primal_size++;
4382ea7e1babSStefano Zampini           }
4383ea7e1babSStefano Zampini         }
43840c7d97c5SJed Brown         /* evaluate indices I will insert in coarse mat */
43850c7d97c5SJed Brown         ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr);
43860c7d97c5SJed Brown         j = 0;
4387ea7e1babSStefano Zampini         for (i=0;i<pcbddc->coarse_size;i++) {
4388ea7e1babSStefano Zampini           if (aux_ins_indices[i]) {
43892e8d2280SStefano Zampini             ins_local_primal_indices[j] = i;
43902e8d2280SStefano Zampini             j++;
4391ea7e1babSStefano Zampini           }
4392ea7e1babSStefano Zampini         }
4393523858cfSStefano Zampini         /* processes participating in the coarse problem receive matrix data from their friends */
4394523858cfSStefano Zampini         for (i=0;i<count_recv;i++) {
4395523858cfSStefano Zampini           ierr = MPI_Irecv(&temp_coarse_mat_vals[localdispl2[i]],localsizes2[i],MPIU_SCALAR,ranks_recv[i],666,prec_comm,&requests[i]);CHKERRQ(ierr);
4396523858cfSStefano Zampini         }
4397523858cfSStefano Zampini         if (rank_coarse_proc_send_to != MPI_PROC_NULL) {
4398523858cfSStefano Zampini           send_size = pcbddc->local_primal_size*pcbddc->local_primal_size;
4399523858cfSStefano Zampini           ierr = MPI_Isend(&coarse_submat_vals[0],send_size,MPIU_SCALAR,rank_coarse_proc_send_to,666,prec_comm,&requests[count_recv]);CHKERRQ(ierr);
4400523858cfSStefano Zampini         }
4401523858cfSStefano Zampini         ierr = MPI_Waitall(count_recv+1,requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4402523858cfSStefano Zampini         /* nonzeros */
4403523858cfSStefano Zampini         ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&dnz);CHKERRQ(ierr);
4404523858cfSStefano Zampini         ierr = PetscMemzero(dnz,ins_local_primal_size*sizeof(PetscInt));CHKERRQ(ierr);
44050c7d97c5SJed Brown         /* use aux_ins_indices to realize a global to local mapping */
44060c7d97c5SJed Brown         j=0;
44070c7d97c5SJed Brown         for (i=0;i<pcbddc->coarse_size;i++) {
44080c7d97c5SJed Brown           if (aux_ins_indices[i]==0) {
44090c7d97c5SJed Brown             aux_ins_indices[i]=-1;
44100c7d97c5SJed Brown           } else {
44110c7d97c5SJed Brown             aux_ins_indices[i]=j;
44120c7d97c5SJed Brown             j++;
44130c7d97c5SJed Brown           }
44140c7d97c5SJed Brown         }
44154fad6a16SStefano Zampini         for (i=0;i<count_recv;i++) {
4416523858cfSStefano Zampini           j = pcbddc->local_primal_sizes[ranks_recv[i]];
4417523858cfSStefano Zampini           for (k=0;k<j;k++) {
4418523858cfSStefano Zampini             dnz[aux_ins_indices[pcbddc->replicated_local_primal_indices[pcbddc->local_primal_displacements[i]+k]]] += j;
44190c7d97c5SJed Brown           }
44200c7d97c5SJed Brown         }
4421523858cfSStefano Zampini         /* check */
4422523858cfSStefano Zampini         for (i=0;i<ins_local_primal_size;i++) {
4423523858cfSStefano Zampini           if (dnz[i] > ins_local_primal_size) {
4424523858cfSStefano Zampini             dnz[i] = ins_local_primal_size;
44250c7d97c5SJed Brown           }
44260c7d97c5SJed Brown         }
44270c7d97c5SJed Brown         ierr = PetscFree(requests);CHKERRQ(ierr);
44280c7d97c5SJed Brown         ierr = PetscFree(aux_ins_indices);CHKERRQ(ierr);
44290c7d97c5SJed Brown         if (coarse_color == 0) { ierr = PetscFree(ranks_recv);CHKERRQ(ierr); }
44304fad6a16SStefano Zampini       }
44310c7d97c5SJed Brown       /* create local to global mapping needed by coarse MATIS */
4432142dfd88SStefano Zampini       if (coarse_comm != MPI_COMM_NULL) {ierr = MPI_Comm_free(&coarse_comm);CHKERRQ(ierr);}
44330c7d97c5SJed Brown       coarse_comm = prec_comm;
44340c7d97c5SJed Brown       active_rank = rank_prec_comm;
44350c7d97c5SJed Brown       ierr = ISCreateGeneral(coarse_comm,ins_local_primal_size,ins_local_primal_indices,PETSC_COPY_VALUES,&coarse_IS);CHKERRQ(ierr);
44360c7d97c5SJed Brown       ierr = ISLocalToGlobalMappingCreateIS(coarse_IS,&coarse_ISLG);CHKERRQ(ierr);
44370c7d97c5SJed Brown       ierr = ISDestroy(&coarse_IS);CHKERRQ(ierr);
44382e8d2280SStefano Zampini     } else if (pcbddc->coarse_problem_type==PARALLEL_BDDC) {
44390c7d97c5SJed Brown       /* arrays for values insertion */
44400c7d97c5SJed Brown       ins_local_primal_size = pcbddc->local_primal_size;
44412e8d2280SStefano Zampini       ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr);
44420c7d97c5SJed Brown       ierr = PetscMalloc(ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar),&ins_coarse_mat_vals);CHKERRQ(ierr);
44430c7d97c5SJed Brown       for (j=0;j<ins_local_primal_size;j++) {
44440c7d97c5SJed Brown         ins_local_primal_indices[j]=pcbddc->local_primal_indices[j];
44454fad6a16SStefano Zampini         for (i=0;i<ins_local_primal_size;i++) {
44464fad6a16SStefano Zampini           ins_coarse_mat_vals[j*ins_local_primal_size+i]=coarse_submat_vals[j*ins_local_primal_size+i];
44474fad6a16SStefano Zampini         }
44480c7d97c5SJed Brown       }
44490c7d97c5SJed Brown     }
44500c7d97c5SJed Brown     break;
44510c7d97c5SJed Brown   }
44520c7d97c5SJed Brown 
44530c7d97c5SJed Brown   case (GATHERS_BDDC):
44540c7d97c5SJed Brown   {
44550c7d97c5SJed Brown     PetscMPIInt mysize,mysize2;
4456ef028eecSStefano Zampini     PetscMPIInt *send_buffer;
44570c7d97c5SJed Brown 
44580c7d97c5SJed Brown     if (rank_prec_comm==active_rank) {
44590c7d97c5SJed Brown       ierr = PetscMalloc (pcbddc->replicated_primal_size*sizeof(PetscMPIInt),&pcbddc->replicated_local_primal_indices);CHKERRQ(ierr);
44600bdf917eSStefano Zampini       ierr = PetscMalloc (pcbddc->replicated_primal_size*sizeof(PetscScalar),&pcbddc->replicated_local_primal_values);CHKERRQ(ierr);
44610c7d97c5SJed Brown       ierr = PetscMalloc (size_prec_comm*sizeof(PetscMPIInt),&localsizes2);CHKERRQ(ierr);
44620c7d97c5SJed Brown       ierr = PetscMalloc (size_prec_comm*sizeof(PetscMPIInt),&localdispl2);CHKERRQ(ierr);
44630c7d97c5SJed Brown       /* arrays for values insertion */
44642fa5cd67SKarl Rupp       for (i=0;i<size_prec_comm;i++) localsizes2[i]=pcbddc->local_primal_sizes[i]*pcbddc->local_primal_sizes[i];
44650c7d97c5SJed Brown       localdispl2[0]=0;
44662fa5cd67SKarl Rupp       for (i=1;i<size_prec_comm;i++) localdispl2[i]=localsizes2[i-1]+localdispl2[i-1];
44670c7d97c5SJed Brown       j = 0;
44682fa5cd67SKarl Rupp       for (i=0;i<size_prec_comm;i++) j+=localsizes2[i];
44690c7d97c5SJed Brown       ierr = PetscMalloc (j*sizeof(PetscScalar),&temp_coarse_mat_vals);CHKERRQ(ierr);
44700c7d97c5SJed Brown     }
44710c7d97c5SJed Brown 
44720c7d97c5SJed Brown     mysize =pcbddc->local_primal_size;
44730c7d97c5SJed Brown     mysize2=pcbddc->local_primal_size*pcbddc->local_primal_size;
4474ef028eecSStefano Zampini     ierr   = PetscMalloc(mysize*sizeof(PetscMPIInt),&send_buffer);CHKERRQ(ierr);
44752fa5cd67SKarl Rupp     for (i=0; i<mysize; i++) send_buffer[i]=(PetscMPIInt)pcbddc->local_primal_indices[i];
44762fa5cd67SKarl Rupp 
44770c7d97c5SJed Brown     if (pcbddc->coarse_problem_type == SEQUENTIAL_BDDC) {
4478ef028eecSStefano Zampini       ierr = MPI_Gatherv(send_buffer,mysize,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
447953cdbc3dSStefano Zampini       ierr = MPI_Gatherv(&coarse_submat_vals[0],mysize2,MPIU_SCALAR,&temp_coarse_mat_vals[0],localsizes2,localdispl2,MPIU_SCALAR,master_proc,prec_comm);CHKERRQ(ierr);
44800c7d97c5SJed Brown     } else {
4481ef028eecSStefano Zampini       ierr = MPI_Allgatherv(send_buffer,mysize,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,prec_comm);CHKERRQ(ierr);
448253cdbc3dSStefano Zampini       ierr = MPI_Allgatherv(&coarse_submat_vals[0],mysize2,MPIU_SCALAR,&temp_coarse_mat_vals[0],localsizes2,localdispl2,MPIU_SCALAR,prec_comm);CHKERRQ(ierr);
44830c7d97c5SJed Brown     }
4484ef028eecSStefano Zampini     ierr = PetscFree(send_buffer);CHKERRQ(ierr);
44850c7d97c5SJed Brown     break;
4486da1bb401SStefano Zampini   }/* switch on coarse problem and communications associated with finished */
44870c7d97c5SJed Brown   }
44880c7d97c5SJed Brown 
44890c7d97c5SJed Brown   /* Now create and fill up coarse matrix */
44900c7d97c5SJed Brown   if (rank_prec_comm == active_rank) {
4491142dfd88SStefano Zampini 
4492142dfd88SStefano Zampini     Mat matis_coarse_local_mat;
4493142dfd88SStefano Zampini 
44940c7d97c5SJed Brown     if (pcbddc->coarse_problem_type != MULTILEVEL_BDDC) {
44950c7d97c5SJed Brown       ierr = MatCreate(coarse_comm,&pcbddc->coarse_mat);CHKERRQ(ierr);
44960c7d97c5SJed Brown       ierr = MatSetSizes(pcbddc->coarse_mat,PETSC_DECIDE,PETSC_DECIDE,pcbddc->coarse_size,pcbddc->coarse_size);CHKERRQ(ierr);
44970c7d97c5SJed Brown       ierr = MatSetType(pcbddc->coarse_mat,coarse_mat_type);CHKERRQ(ierr);
44983b03a366Sstefano_zampini       ierr = MatSetUp(pcbddc->coarse_mat);CHKERRQ(ierr);
4499da1bb401SStefano Zampini       ierr = MatSetOption(pcbddc->coarse_mat,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr); /* local values stored in column major */
45003b03a366Sstefano_zampini       ierr = MatSetOption(pcbddc->coarse_mat,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr);
45010c7d97c5SJed Brown     } else {
45024fad6a16SStefano Zampini       ierr = MatCreateIS(coarse_comm,1,PETSC_DECIDE,PETSC_DECIDE,pcbddc->coarse_size,pcbddc->coarse_size,coarse_ISLG,&pcbddc->coarse_mat);CHKERRQ(ierr);
45033b03a366Sstefano_zampini       ierr = MatSetUp(pcbddc->coarse_mat);CHKERRQ(ierr);
45040c7d97c5SJed Brown       ierr = MatISGetLocalMat(pcbddc->coarse_mat,&matis_coarse_local_mat);CHKERRQ(ierr);
45053b03a366Sstefano_zampini       ierr = MatSetUp(matis_coarse_local_mat);CHKERRQ(ierr);
4506da1bb401SStefano Zampini       ierr = MatSetOption(matis_coarse_local_mat,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr); /* local values stored in column major */
4507a0ba757dSStefano Zampini       ierr = MatSetOption(matis_coarse_local_mat,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr);
45080c7d97c5SJed Brown     }
4509142dfd88SStefano Zampini     /* preallocation */
4510142dfd88SStefano Zampini     if (pcbddc->coarse_problem_type != MULTILEVEL_BDDC) {
4511ef028eecSStefano Zampini 
4512142dfd88SStefano Zampini       PetscInt lrows,lcols;
4513ef028eecSStefano Zampini 
4514142dfd88SStefano Zampini       ierr = MatGetLocalSize(pcbddc->coarse_mat,&lrows,&lcols);CHKERRQ(ierr);
4515142dfd88SStefano Zampini       ierr = MatPreallocateInitialize(coarse_comm,lrows,lcols,dnz,onz);CHKERRQ(ierr);
4516ef028eecSStefano Zampini 
4517142dfd88SStefano Zampini       if (pcbddc->coarse_problem_type == PARALLEL_BDDC) {
4518ef028eecSStefano Zampini 
4519ef028eecSStefano Zampini         Vec         vec_dnz,vec_onz;
4520ef028eecSStefano Zampini         PetscScalar *my_dnz,*my_onz,*array;
4521ef028eecSStefano Zampini         PetscInt    *mat_ranges,*row_ownership;
4522ef028eecSStefano Zampini         PetscInt    coarse_index_row,coarse_index_col,owner;
4523ef028eecSStefano Zampini 
4524ef028eecSStefano Zampini         ierr = VecCreate(prec_comm,&vec_dnz);CHKERRQ(ierr);
4525ef028eecSStefano Zampini         ierr = VecSetSizes(vec_dnz,PETSC_DECIDE,pcbddc->coarse_size);CHKERRQ(ierr);
4526ef028eecSStefano Zampini         ierr = VecSetType(vec_dnz,VECMPI);CHKERRQ(ierr);
4527ef028eecSStefano Zampini         ierr = VecDuplicate(vec_dnz,&vec_onz);CHKERRQ(ierr);
4528ef028eecSStefano Zampini 
4529ef028eecSStefano Zampini         ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscScalar),&my_dnz);CHKERRQ(ierr);
4530ef028eecSStefano Zampini         ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscScalar),&my_onz);CHKERRQ(ierr);
4531ef028eecSStefano Zampini         ierr = PetscMemzero(my_dnz,pcbddc->local_primal_size*sizeof(PetscScalar));CHKERRQ(ierr);
4532ef028eecSStefano Zampini         ierr = PetscMemzero(my_onz,pcbddc->local_primal_size*sizeof(PetscScalar));CHKERRQ(ierr);
4533ef028eecSStefano Zampini 
4534ef028eecSStefano Zampini         ierr = PetscMalloc(pcbddc->coarse_size*sizeof(PetscInt),&row_ownership);CHKERRQ(ierr);
4535ef028eecSStefano Zampini         ierr = MatGetOwnershipRanges(pcbddc->coarse_mat,(const PetscInt**)&mat_ranges);CHKERRQ(ierr);
4536142dfd88SStefano Zampini         for (i=0; i<size_prec_comm; i++) {
4537ef028eecSStefano Zampini           for (j=mat_ranges[i]; j<mat_ranges[i+1]; j++) {
4538ef028eecSStefano Zampini             row_ownership[j]=i;
4539142dfd88SStefano Zampini           }
4540142dfd88SStefano Zampini         }
4541ef028eecSStefano Zampini 
4542ef028eecSStefano Zampini         for (i=0; i<pcbddc->local_primal_size; i++) {
4543ef028eecSStefano Zampini           coarse_index_row = pcbddc->local_primal_indices[i];
4544ef028eecSStefano Zampini           owner = row_ownership[coarse_index_row];
4545ef028eecSStefano Zampini           for (j=i; j<pcbddc->local_primal_size; j++) {
4546ef028eecSStefano Zampini             owner = row_ownership[coarse_index_row];
4547ef028eecSStefano Zampini             coarse_index_col = pcbddc->local_primal_indices[j];
4548ef028eecSStefano Zampini             if (coarse_index_col > mat_ranges[owner]-1 && coarse_index_col < mat_ranges[owner+1]) {
4549ef028eecSStefano Zampini               my_dnz[i] += 1.0;
4550142dfd88SStefano Zampini             } else {
4551ef028eecSStefano Zampini               my_onz[i] += 1.0;
4552142dfd88SStefano Zampini             }
4553ef028eecSStefano Zampini             if (i != j) {
4554ef028eecSStefano Zampini               owner = row_ownership[coarse_index_col];
4555ef028eecSStefano Zampini               if (coarse_index_row > mat_ranges[owner]-1 && coarse_index_row < mat_ranges[owner+1]) {
4556ef028eecSStefano Zampini                 my_dnz[j] += 1.0;
4557142dfd88SStefano Zampini               } else {
4558ef028eecSStefano Zampini                 my_onz[j] += 1.0;
4559142dfd88SStefano Zampini               }
4560142dfd88SStefano Zampini             }
4561142dfd88SStefano Zampini           }
4562142dfd88SStefano Zampini         }
4563ef028eecSStefano Zampini         ierr = VecSet(vec_dnz,0.0);CHKERRQ(ierr);
4564ef028eecSStefano Zampini         ierr = VecSet(vec_onz,0.0);CHKERRQ(ierr);
4565a929c220SStefano Zampini         if (pcbddc->local_primal_size) {
4566ef028eecSStefano Zampini           ierr = VecSetValues(vec_dnz,pcbddc->local_primal_size,pcbddc->local_primal_indices,my_dnz,ADD_VALUES);CHKERRQ(ierr);
4567ef028eecSStefano Zampini           ierr = VecSetValues(vec_onz,pcbddc->local_primal_size,pcbddc->local_primal_indices,my_onz,ADD_VALUES);CHKERRQ(ierr);
4568a929c220SStefano Zampini         }
4569ef028eecSStefano Zampini         ierr = VecAssemblyBegin(vec_dnz);CHKERRQ(ierr);
4570ef028eecSStefano Zampini         ierr = VecAssemblyBegin(vec_onz);CHKERRQ(ierr);
4571ef028eecSStefano Zampini         ierr = VecAssemblyEnd(vec_dnz);CHKERRQ(ierr);
4572ef028eecSStefano Zampini         ierr = VecAssemblyEnd(vec_onz);CHKERRQ(ierr);
4573ef028eecSStefano Zampini         j    = mat_ranges[rank_prec_comm+1]-mat_ranges[rank_prec_comm];
4574ef028eecSStefano Zampini         ierr = VecGetArray(vec_dnz,&array);CHKERRQ(ierr);
45752fa5cd67SKarl Rupp         for (i=0; i<j; i++) dnz[i] = (PetscInt)array[i];
45762fa5cd67SKarl Rupp 
4577ef028eecSStefano Zampini         ierr = VecRestoreArray(vec_dnz,&array);CHKERRQ(ierr);
4578ef028eecSStefano Zampini         ierr = VecGetArray(vec_onz,&array);CHKERRQ(ierr);
45792fa5cd67SKarl Rupp         for (i=0;i<j;i++) onz[i] = (PetscInt)array[i];
45802fa5cd67SKarl Rupp 
4581ef028eecSStefano Zampini         ierr = VecRestoreArray(vec_onz,&array);CHKERRQ(ierr);
4582ef028eecSStefano Zampini         ierr = PetscFree(my_dnz);CHKERRQ(ierr);
4583ef028eecSStefano Zampini         ierr = PetscFree(my_onz);CHKERRQ(ierr);
4584ef028eecSStefano Zampini         ierr = PetscFree(row_ownership);CHKERRQ(ierr);
4585ef028eecSStefano Zampini         ierr = VecDestroy(&vec_dnz);CHKERRQ(ierr);
4586ef028eecSStefano Zampini         ierr = VecDestroy(&vec_onz);CHKERRQ(ierr);
4587142dfd88SStefano Zampini       } else {
4588142dfd88SStefano Zampini         for (k=0;k<size_prec_comm;k++) {
4589142dfd88SStefano Zampini           offset=pcbddc->local_primal_displacements[k];
4590142dfd88SStefano Zampini           offset2=localdispl2[k];
4591142dfd88SStefano Zampini           ins_local_primal_size = pcbddc->local_primal_sizes[k];
4592ef028eecSStefano Zampini           ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr);
4593ef028eecSStefano Zampini           for (j=0;j<ins_local_primal_size;j++) {
4594ef028eecSStefano Zampini             ins_local_primal_indices[j]=(PetscInt)pcbddc->replicated_local_primal_indices[offset+j];
4595ef028eecSStefano Zampini           }
4596142dfd88SStefano Zampini           for (j=0;j<ins_local_primal_size;j++) {
4597142dfd88SStefano Zampini             ierr = MatPreallocateSet(ins_local_primal_indices[j],ins_local_primal_size,ins_local_primal_indices,dnz,onz);CHKERRQ(ierr);
4598142dfd88SStefano Zampini           }
4599ef028eecSStefano Zampini           ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr);
4600142dfd88SStefano Zampini         }
4601142dfd88SStefano Zampini       }
46022fa5cd67SKarl Rupp 
4603142dfd88SStefano Zampini       /* check */
4604142dfd88SStefano Zampini       for (i=0;i<lrows;i++) {
46052fa5cd67SKarl Rupp         if (dnz[i]>lcols) dnz[i]=lcols;
46062fa5cd67SKarl Rupp         if (onz[i]>pcbddc->coarse_size-lcols) onz[i]=pcbddc->coarse_size-lcols;
4607142dfd88SStefano Zampini       }
4608d9a4edebSJed Brown       ierr = MatSeqAIJSetPreallocation(pcbddc->coarse_mat,0,dnz);CHKERRQ(ierr);
4609d9a4edebSJed Brown       ierr = MatMPIAIJSetPreallocation(pcbddc->coarse_mat,0,dnz,0,onz);CHKERRQ(ierr);
4610142dfd88SStefano Zampini       ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr);
4611142dfd88SStefano Zampini     } else {
4612523858cfSStefano Zampini       ierr = MatSeqAIJSetPreallocation(matis_coarse_local_mat,0,dnz);CHKERRQ(ierr);
4613523858cfSStefano Zampini       ierr = PetscFree(dnz);CHKERRQ(ierr);
4614142dfd88SStefano Zampini     }
46152fa5cd67SKarl Rupp 
4616142dfd88SStefano Zampini     /* insert values */
4617523858cfSStefano Zampini     if (pcbddc->coarse_problem_type == PARALLEL_BDDC) {
46180c7d97c5SJed Brown       ierr = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,ADD_VALUES);CHKERRQ(ierr);
4619523858cfSStefano Zampini     } else if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
4620523858cfSStefano Zampini       if (pcbddc->coarsening_ratio == 1) {
4621523858cfSStefano Zampini         ins_coarse_mat_vals = coarse_submat_vals;
4622523858cfSStefano Zampini         ierr                = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,INSERT_VALUES);CHKERRQ(ierr);
4623523858cfSStefano Zampini       } else {
4624523858cfSStefano Zampini         ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr);
4625523858cfSStefano Zampini         for (k=0; k<pcbddc->replicated_primal_size; k++) {
4626523858cfSStefano Zampini           offset                = pcbddc->local_primal_displacements[k];
4627523858cfSStefano Zampini           offset2               = localdispl2[k];
4628523858cfSStefano Zampini           ins_local_primal_size = pcbddc->local_primal_displacements[k+1]-pcbddc->local_primal_displacements[k];
4629ef028eecSStefano Zampini           ierr                  = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr);
4630ef028eecSStefano Zampini           for (j=0; j<ins_local_primal_size; j++) {
4631ef028eecSStefano Zampini             ins_local_primal_indices[j]=(PetscInt)pcbddc->replicated_local_primal_indices[offset+j];
4632ef028eecSStefano Zampini           }
4633523858cfSStefano Zampini           ins_coarse_mat_vals = &temp_coarse_mat_vals[offset2];
4634523858cfSStefano Zampini           ierr                = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,ADD_VALUES);CHKERRQ(ierr);
4635ef028eecSStefano Zampini           ierr                = PetscFree(ins_local_primal_indices);CHKERRQ(ierr);
4636523858cfSStefano Zampini         }
4637523858cfSStefano Zampini       }
4638523858cfSStefano Zampini       ins_local_primal_indices = 0;
4639523858cfSStefano Zampini       ins_coarse_mat_vals      = 0;
4640ea7e1babSStefano Zampini     } else {
4641ea7e1babSStefano Zampini       for (k=0; k<size_prec_comm; k++) {
4642ea7e1babSStefano Zampini         offset                =pcbddc->local_primal_displacements[k];
4643ea7e1babSStefano Zampini         offset2               =localdispl2[k];
4644ea7e1babSStefano Zampini         ins_local_primal_size = pcbddc->local_primal_sizes[k];
4645ef028eecSStefano Zampini         ierr                  = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr);
4646ef028eecSStefano Zampini         for (j=0; j<ins_local_primal_size; j++) {
4647ef028eecSStefano Zampini           ins_local_primal_indices[j]=(PetscInt)pcbddc->replicated_local_primal_indices[offset+j];
4648ef028eecSStefano Zampini         }
4649ea7e1babSStefano Zampini         ins_coarse_mat_vals = &temp_coarse_mat_vals[offset2];
4650ea7e1babSStefano Zampini         ierr                = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,ADD_VALUES);CHKERRQ(ierr);
4651ef028eecSStefano Zampini         ierr                = PetscFree(ins_local_primal_indices);CHKERRQ(ierr);
4652ea7e1babSStefano Zampini       }
4653ea7e1babSStefano Zampini       ins_local_primal_indices = 0;
4654ea7e1babSStefano Zampini       ins_coarse_mat_vals      = 0;
4655ea7e1babSStefano Zampini     }
46560c7d97c5SJed Brown     ierr = MatAssemblyBegin(pcbddc->coarse_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
46570c7d97c5SJed Brown     ierr = MatAssemblyEnd(pcbddc->coarse_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
4658142dfd88SStefano Zampini     /* symmetry of coarse matrix */
4659142dfd88SStefano Zampini     if (issym) {
4660142dfd88SStefano Zampini       ierr = MatSetOption(pcbddc->coarse_mat,MAT_SYMMETRIC,PETSC_TRUE);CHKERRQ(ierr);
4661142dfd88SStefano Zampini     }
46620c7d97c5SJed Brown     ierr = MatGetVecs(pcbddc->coarse_mat,&pcbddc->coarse_vec,&pcbddc->coarse_rhs);CHKERRQ(ierr);
46630bdf917eSStefano Zampini   }
46640bdf917eSStefano Zampini 
46650bdf917eSStefano Zampini   /* create loc to glob scatters if needed */
46660bdf917eSStefano Zampini   if (pcbddc->coarse_communications_type == SCATTERS_BDDC) {
46670bdf917eSStefano Zampini     IS local_IS,global_IS;
46680bdf917eSStefano Zampini     ierr = ISCreateStride(PETSC_COMM_SELF,pcbddc->local_primal_size,0,1,&local_IS);CHKERRQ(ierr);
46690bdf917eSStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_indices,PETSC_COPY_VALUES,&global_IS);CHKERRQ(ierr);
46700bdf917eSStefano Zampini     ierr = VecScatterCreate(pcbddc->vec1_P,local_IS,pcbddc->coarse_vec,global_IS,&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr);
46710bdf917eSStefano Zampini     ierr = ISDestroy(&local_IS);CHKERRQ(ierr);
46720bdf917eSStefano Zampini     ierr = ISDestroy(&global_IS);CHKERRQ(ierr);
46730bdf917eSStefano Zampini   }
46740bdf917eSStefano Zampini 
4675a929c220SStefano Zampini   /* free memory no longer needed */
4676a929c220SStefano Zampini   if (coarse_ISLG)              { ierr = ISLocalToGlobalMappingDestroy(&coarse_ISLG);CHKERRQ(ierr); }
4677a929c220SStefano Zampini   if (ins_local_primal_indices) { ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr); }
4678a929c220SStefano Zampini   if (ins_coarse_mat_vals)      { ierr = PetscFree(ins_coarse_mat_vals);CHKERRQ(ierr); }
4679a929c220SStefano Zampini   if (localsizes2)              { ierr = PetscFree(localsizes2);CHKERRQ(ierr); }
4680a929c220SStefano Zampini   if (localdispl2)              { ierr = PetscFree(localdispl2);CHKERRQ(ierr); }
4681a929c220SStefano Zampini   if (temp_coarse_mat_vals)     { ierr = PetscFree(temp_coarse_mat_vals);CHKERRQ(ierr); }
4682a929c220SStefano Zampini 
46830bdf917eSStefano Zampini   /* Eval coarse null space */
46840bdf917eSStefano Zampini   if (pcbddc->NullSpace) {
46850bdf917eSStefano Zampini     const Vec *nsp_vecs;
46860bdf917eSStefano Zampini     PetscInt  nsp_size,coarse_nsp_size;
46870bdf917eSStefano Zampini     PetscBool nsp_has_cnst;
46880bdf917eSStefano Zampini     PetscReal test_null;
46890bdf917eSStefano Zampini     Vec       *coarse_nsp_vecs;
46900bdf917eSStefano Zampini 
46910bdf917eSStefano Zampini     coarse_nsp_size = 0;
46920bdf917eSStefano Zampini     coarse_nsp_vecs = 0;
46930bdf917eSStefano Zampini     ierr            = MatNullSpaceGetVecs(pcbddc->NullSpace,&nsp_has_cnst,&nsp_size,&nsp_vecs);CHKERRQ(ierr);
46940bdf917eSStefano Zampini     if (rank_prec_comm == active_rank) {
46950bdf917eSStefano Zampini       ierr = PetscMalloc((nsp_size+1)*sizeof(Vec),&coarse_nsp_vecs);CHKERRQ(ierr);
46960bdf917eSStefano Zampini       for (i=0; i<nsp_size+1; i++) {
46970bdf917eSStefano Zampini         ierr = VecDuplicate(pcbddc->coarse_vec,&coarse_nsp_vecs[i]);CHKERRQ(ierr);
46980bdf917eSStefano Zampini       }
46990bdf917eSStefano Zampini     }
47000bdf917eSStefano Zampini     if (nsp_has_cnst) {
47010bdf917eSStefano Zampini       ierr = VecSet(pcis->vec1_N,1.0);CHKERRQ(ierr);
47020bdf917eSStefano Zampini       ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr);
47030bdf917eSStefano Zampini       ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->vec1_P,pcbddc->coarse_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
47040bdf917eSStefano Zampini       ierr = PCBDDCScatterCoarseDataEnd(pc,pcbddc->vec1_P,pcbddc->coarse_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
47050bdf917eSStefano Zampini       if (rank_prec_comm == active_rank) {
47060bdf917eSStefano Zampini         ierr = MatMult(pcbddc->coarse_mat,pcbddc->coarse_vec,pcbddc->coarse_rhs);CHKERRQ(ierr);
47070bdf917eSStefano Zampini         ierr = VecNorm(pcbddc->coarse_rhs,NORM_INFINITY,&test_null);CHKERRQ(ierr);
47080bdf917eSStefano Zampini         if (test_null > 1.0e-12 && pcbddc->dbg_flag) {
47090bdf917eSStefano Zampini           ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Constant coarse null space error % 1.14e\n",test_null);CHKERRQ(ierr);
47100bdf917eSStefano Zampini         }
47110bdf917eSStefano Zampini         ierr = VecCopy(pcbddc->coarse_vec,coarse_nsp_vecs[coarse_nsp_size]);CHKERRQ(ierr);
47120bdf917eSStefano Zampini         coarse_nsp_size++;
47130bdf917eSStefano Zampini       }
47140bdf917eSStefano Zampini     }
47150bdf917eSStefano Zampini     for (i=0; i<nsp_size; i++)  {
47160bdf917eSStefano Zampini       ierr = VecScatterBegin(matis->ctx,nsp_vecs[i],pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
47170bdf917eSStefano Zampini       ierr = VecScatterEnd  (matis->ctx,nsp_vecs[i],pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
47180bdf917eSStefano Zampini       ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr);
47190bdf917eSStefano Zampini       ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->vec1_P,pcbddc->coarse_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
47200bdf917eSStefano Zampini       ierr = PCBDDCScatterCoarseDataEnd(pc,pcbddc->vec1_P,pcbddc->coarse_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
47210bdf917eSStefano Zampini       if (rank_prec_comm == active_rank) {
47220bdf917eSStefano Zampini         ierr = MatMult(pcbddc->coarse_mat,pcbddc->coarse_vec,pcbddc->coarse_rhs);CHKERRQ(ierr);
47230bdf917eSStefano Zampini         ierr = VecNorm(pcbddc->coarse_rhs,NORM_2,&test_null);CHKERRQ(ierr);
47240bdf917eSStefano Zampini         if (test_null > 1.0e-12 && pcbddc->dbg_flag) {
47250bdf917eSStefano Zampini           ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Vec %d coarse null space error % 1.14e\n",i,test_null);CHKERRQ(ierr);
47260bdf917eSStefano Zampini         }
47270bdf917eSStefano Zampini         ierr = VecCopy(pcbddc->coarse_vec,coarse_nsp_vecs[coarse_nsp_size]);CHKERRQ(ierr);
47280bdf917eSStefano Zampini         coarse_nsp_size++;
47290bdf917eSStefano Zampini       }
47300bdf917eSStefano Zampini     }
47310bdf917eSStefano Zampini     if (coarse_nsp_size > 0) {
47320bdf917eSStefano Zampini       /* TODO orthonormalize vecs */
47330298fd71SBarry Smith       ierr = VecNormalize(coarse_nsp_vecs[0],NULL);CHKERRQ(ierr);
47340bdf917eSStefano Zampini       ierr = MatNullSpaceCreate(coarse_comm,PETSC_FALSE,coarse_nsp_size,coarse_nsp_vecs,&pcbddc->CoarseNullSpace);CHKERRQ(ierr);
47350bdf917eSStefano Zampini       for (i=0; i<nsp_size+1; i++) {
47360bdf917eSStefano Zampini         ierr = VecDestroy(&coarse_nsp_vecs[i]);CHKERRQ(ierr);
47370bdf917eSStefano Zampini       }
47380bdf917eSStefano Zampini     }
47390bdf917eSStefano Zampini     ierr = PetscFree(coarse_nsp_vecs);CHKERRQ(ierr);
47400bdf917eSStefano Zampini   }
47410bdf917eSStefano Zampini 
47420bdf917eSStefano Zampini   /* KSP for coarse problem */
47430bdf917eSStefano Zampini   if (rank_prec_comm == active_rank) {
47442e8d2280SStefano Zampini     PetscBool isbddc=PETSC_FALSE;
47450bdf917eSStefano Zampini 
474653cdbc3dSStefano Zampini     ierr = KSPCreate(coarse_comm,&pcbddc->coarse_ksp);CHKERRQ(ierr);
474753cdbc3dSStefano Zampini     ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->coarse_ksp,(PetscObject)pc,1);CHKERRQ(ierr);
474853cdbc3dSStefano Zampini     ierr = KSPSetOperators(pcbddc->coarse_ksp,pcbddc->coarse_mat,pcbddc->coarse_mat,SAME_PRECONDITIONER);CHKERRQ(ierr);
47493b03a366Sstefano_zampini     ierr = KSPSetTolerances(pcbddc->coarse_ksp,PETSC_DEFAULT,PETSC_DEFAULT,PETSC_DEFAULT,max_it_coarse_ksp);CHKERRQ(ierr);
475053cdbc3dSStefano Zampini     ierr = KSPSetType(pcbddc->coarse_ksp,coarse_ksp_type);CHKERRQ(ierr);
475153cdbc3dSStefano Zampini     ierr = KSPGetPC(pcbddc->coarse_ksp,&pc_temp);CHKERRQ(ierr);
475253cdbc3dSStefano Zampini     ierr = PCSetType(pc_temp,coarse_pc_type);CHKERRQ(ierr);
47530c7d97c5SJed Brown     /* Allow user's customization */
4754da1bb401SStefano Zampini     ierr = KSPSetOptionsPrefix(pcbddc->coarse_ksp,"coarse_");CHKERRQ(ierr);
47550c7d97c5SJed Brown     /* Set Up PC for coarse problem BDDC */
475653cdbc3dSStefano Zampini     if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
47574fad6a16SStefano Zampini       i    = pcbddc->current_level+1;
47584fad6a16SStefano Zampini       ierr = PCBDDCSetLevel(pc_temp,i);CHKERRQ(ierr);
47594fad6a16SStefano Zampini       ierr = PCBDDCSetCoarseningRatio(pc_temp,pcbddc->coarsening_ratio);CHKERRQ(ierr);
47604fad6a16SStefano Zampini       ierr = PCBDDCSetMaxLevels(pc_temp,pcbddc->max_levels);CHKERRQ(ierr);
476153cdbc3dSStefano Zampini       ierr = PCBDDCSetCoarseProblemType(pc_temp,MULTILEVEL_BDDC);CHKERRQ(ierr);
47620bdf917eSStefano Zampini       if (pcbddc->CoarseNullSpace) { ierr = PCBDDCSetNullSpace(pc_temp,pcbddc->CoarseNullSpace);CHKERRQ(ierr); }
47634fad6a16SStefano Zampini       if (dbg_flag) {
47644fad6a16SStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"----------------Level %d: Setting up level %d---------------\n",pcbddc->current_level,i);CHKERRQ(ierr);
47654fad6a16SStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
476653cdbc3dSStefano Zampini       }
47674fad6a16SStefano Zampini     }
47684fad6a16SStefano Zampini     ierr = KSPSetFromOptions(pcbddc->coarse_ksp);CHKERRQ(ierr);
476953cdbc3dSStefano Zampini     ierr = KSPSetUp(pcbddc->coarse_ksp);CHKERRQ(ierr);
4770142dfd88SStefano Zampini 
47710298fd71SBarry Smith     ierr = KSPGetTolerances(pcbddc->coarse_ksp,NULL,NULL,NULL,&j);CHKERRQ(ierr);
47722e8d2280SStefano Zampini     ierr = KSPGetPC(pcbddc->coarse_ksp,&pc_temp);CHKERRQ(ierr);
47732e8d2280SStefano Zampini     ierr = PetscObjectTypeCompare((PetscObject)pc_temp,PCBDDC,&isbddc);CHKERRQ(ierr);
47742e8d2280SStefano Zampini     if (j == 1) {
47752e8d2280SStefano Zampini       ierr = KSPSetNormType(pcbddc->coarse_ksp,KSP_NORM_NONE);CHKERRQ(ierr);
47762e8d2280SStefano Zampini       if (isbddc) {
47772e8d2280SStefano Zampini         ierr = PCBDDCSetUseExactDirichlet(pc_temp,PETSC_FALSE);CHKERRQ(ierr);
47785619798eSStefano Zampini       }
47795619798eSStefano Zampini     }
47800c7d97c5SJed Brown   }
4781a929c220SStefano Zampini   /* Check coarse problem if requested */
4782142dfd88SStefano Zampini   if (dbg_flag && rank_prec_comm == active_rank) {
4783142dfd88SStefano Zampini     KSP       check_ksp;
4784142dfd88SStefano Zampini     PC        check_pc;
4785142dfd88SStefano Zampini     Vec       check_vec;
4786142dfd88SStefano Zampini     PetscReal abs_infty_error,infty_error,lambda_min,lambda_max;
478719fd82e9SBarry Smith     KSPType   check_ksp_type;
47880c7d97c5SJed Brown 
4789142dfd88SStefano Zampini     /* Create ksp object suitable for extreme eigenvalues' estimation */
4790142dfd88SStefano Zampini     ierr = KSPCreate(coarse_comm,&check_ksp);CHKERRQ(ierr);
4791142dfd88SStefano Zampini     ierr = KSPSetOperators(check_ksp,pcbddc->coarse_mat,pcbddc->coarse_mat,SAME_PRECONDITIONER);CHKERRQ(ierr);
47920bdf917eSStefano Zampini     ierr = KSPSetTolerances(check_ksp,1.e-12,1.e-12,PETSC_DEFAULT,pcbddc->coarse_size);CHKERRQ(ierr);
4793142dfd88SStefano Zampini     if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
47942fa5cd67SKarl Rupp       if (issym) check_ksp_type = KSPCG;
47952fa5cd67SKarl Rupp       else check_ksp_type = KSPGMRES;
4796142dfd88SStefano Zampini       ierr = KSPSetComputeSingularValues(check_ksp,PETSC_TRUE);CHKERRQ(ierr);
4797142dfd88SStefano Zampini     } else {
4798142dfd88SStefano Zampini       check_ksp_type = KSPPREONLY;
4799142dfd88SStefano Zampini     }
4800142dfd88SStefano Zampini     ierr = KSPSetType(check_ksp,check_ksp_type);CHKERRQ(ierr);
4801142dfd88SStefano Zampini     ierr = KSPGetPC(pcbddc->coarse_ksp,&check_pc);CHKERRQ(ierr);
4802142dfd88SStefano Zampini     ierr = KSPSetPC(check_ksp,check_pc);CHKERRQ(ierr);
4803142dfd88SStefano Zampini     ierr = KSPSetUp(check_ksp);CHKERRQ(ierr);
4804142dfd88SStefano Zampini     /* create random vec */
4805142dfd88SStefano Zampini     ierr = VecDuplicate(pcbddc->coarse_vec,&check_vec);CHKERRQ(ierr);
48060298fd71SBarry Smith     ierr = VecSetRandom(check_vec,NULL);CHKERRQ(ierr);
48070298fd71SBarry Smith     if (pcbddc->CoarseNullSpace) { ierr = MatNullSpaceRemove(pcbddc->CoarseNullSpace,check_vec,NULL);CHKERRQ(ierr); }
4808142dfd88SStefano Zampini     ierr = MatMult(pcbddc->coarse_mat,check_vec,pcbddc->coarse_rhs);CHKERRQ(ierr);
4809142dfd88SStefano Zampini     /* solve coarse problem */
4810142dfd88SStefano Zampini     ierr = KSPSolve(check_ksp,pcbddc->coarse_rhs,pcbddc->coarse_vec);CHKERRQ(ierr);
48110298fd71SBarry Smith     if (pcbddc->CoarseNullSpace) { ierr = MatNullSpaceRemove(pcbddc->CoarseNullSpace,pcbddc->coarse_vec,NULL);CHKERRQ(ierr); }
4812142dfd88SStefano Zampini     /* check coarse problem residual error */
4813142dfd88SStefano Zampini     ierr = VecAXPY(check_vec,-1.0,pcbddc->coarse_vec);CHKERRQ(ierr);
4814142dfd88SStefano Zampini     ierr = VecNorm(check_vec,NORM_INFINITY,&infty_error);CHKERRQ(ierr);
4815142dfd88SStefano Zampini     ierr = MatMult(pcbddc->coarse_mat,check_vec,pcbddc->coarse_rhs);CHKERRQ(ierr);
4816142dfd88SStefano Zampini     ierr = VecNorm(pcbddc->coarse_rhs,NORM_INFINITY,&abs_infty_error);CHKERRQ(ierr);
4817142dfd88SStefano Zampini     ierr = VecDestroy(&check_vec);CHKERRQ(ierr);
4818142dfd88SStefano Zampini     /* get eigenvalue estimation if inexact */
4819142dfd88SStefano Zampini     if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
4820142dfd88SStefano Zampini       ierr = KSPComputeExtremeSingularValues(check_ksp,&lambda_max,&lambda_min);CHKERRQ(ierr);
4821142dfd88SStefano Zampini       ierr = KSPGetIterationNumber(check_ksp,&k);CHKERRQ(ierr);
4822142dfd88SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem eigenvalues estimated with %d iterations of %s.\n",k,check_ksp_type);CHKERRQ(ierr);
4823e269702eSStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem eigenvalues: % 1.14e %1.14e\n",lambda_min,lambda_max);CHKERRQ(ierr);
48243b03a366Sstefano_zampini     }
4825142dfd88SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem exact infty_error   : %1.14e\n",infty_error);CHKERRQ(ierr);
4826142dfd88SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem residual infty_error: %1.14e\n",abs_infty_error);CHKERRQ(ierr);
4827142dfd88SStefano Zampini     ierr = KSPDestroy(&check_ksp);CHKERRQ(ierr);
482853cdbc3dSStefano Zampini   }
4829142dfd88SStefano Zampini   if (dbg_flag) { ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); }
48300c7d97c5SJed Brown   PetscFunctionReturn(0);
48310c7d97c5SJed Brown }
48320c7d97c5SJed Brown 
48330c7d97c5SJed Brown #undef __FUNCT__
48340c7d97c5SJed Brown #define __FUNCT__ "PCBDDCManageLocalBoundaries"
483553cdbc3dSStefano Zampini static PetscErrorCode PCBDDCManageLocalBoundaries(PC pc)
48360c7d97c5SJed Brown {
48370c7d97c5SJed Brown   PC_BDDC        *pcbddc  = (PC_BDDC*)pc->data;
48380c7d97c5SJed Brown   PC_IS          *pcis    = (PC_IS*)pc->data;
48390c7d97c5SJed Brown   Mat_IS         *matis   = (Mat_IS*)pc->pmat->data;
4840da1bb401SStefano Zampini   PCBDDCGraph    mat_graph=pcbddc->mat_graph;
48417cf533a6SStefano Zampini   PetscInt       *is_indices,*auxis;
48423b03a366Sstefano_zampini   PetscInt       bs,ierr,i,j,s,k,iindex,neumann_bsize,dirichlet_bsize;
4843da1bb401SStefano Zampini   PetscInt       total_counts,nodes_touched,where_values=1,vertex_size;
4844534831adSStefano Zampini   PetscMPIInt    adapt_interface=0,adapt_interface_reduced=0,NEUMANNCNT=0;
4845da1bb401SStefano Zampini   PetscBool      same_set;
4846ce94432eSBarry Smith   MPI_Comm       interface_comm;
48473b03a366Sstefano_zampini   PetscBool      use_faces = PETSC_FALSE,use_edges = PETSC_FALSE;
48483b03a366Sstefano_zampini   const PetscInt *neumann_nodes;
48493b03a366Sstefano_zampini   const PetscInt *dirichlet_nodes;
4850a81d60d8SStefano Zampini   IS             used_IS,*custom_ISForDofs;
4851da1bb401SStefano Zampini   PetscScalar    *array;
4852da1bb401SStefano Zampini   PetscScalar    *array2;
4853da1bb401SStefano Zampini   PetscViewer    viewer=pcbddc->dbg_viewer;
4854a929c220SStefano Zampini   PetscInt       *queue_in_global_numbering;
48550c7d97c5SJed Brown 
48560c7d97c5SJed Brown   PetscFunctionBegin;
4857ce94432eSBarry Smith   ierr = PetscObjectGetComm((PetscObject)pc,&interface_comm);CHKERRQ(ierr);
4858da1bb401SStefano Zampini   /* Setup local adjacency graph */
4859da1bb401SStefano Zampini   mat_graph->nvtxs=pcis->n;
48602fa5cd67SKarl Rupp   if (!mat_graph->xadj) NEUMANNCNT = 1;
4861da1bb401SStefano Zampini   ierr = PCBDDCSetupLocalAdjacencyGraph(pc);CHKERRQ(ierr);
48622fa5cd67SKarl Rupp 
4863a0ba757dSStefano Zampini   i    = mat_graph->nvtxs;
4864a0ba757dSStefano Zampini   ierr = PetscMalloc4(i,PetscInt,&mat_graph->where,i,PetscInt,&mat_graph->count,i+1,PetscInt,&mat_graph->cptr,i,PetscInt,&mat_graph->queue);CHKERRQ(ierr);
48653972b0daSStefano Zampini   ierr = PetscMalloc2(i,PetscInt,&mat_graph->which_dof,i,PetscBool,&mat_graph->touched);CHKERRQ(ierr);
4866a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->where,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
4867a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->count,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
4868a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->which_dof,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
4869a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->queue,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
48703828260eSStefano Zampini   ierr = PetscMemzero(mat_graph->cptr,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr);
4871a0ba757dSStefano Zampini 
4872a81d60d8SStefano Zampini   /* Set the dofs splitting in mat_graph->which_dof.
4873a81d60d8SStefano Zampini      Use the dofs splitting provided by the user, if any;
4874a81d60d8SStefano Zampini      otherwise assume a constant block size (taken from the local matrix) */
4875a81d60d8SStefano Zampini   vertex_size=0;
4876a81d60d8SStefano Zampini   if (!pcbddc->n_ISForDofs) {
4877a81d60d8SStefano Zampini     ierr = MatGetBlockSize(matis->A,&bs);CHKERRQ(ierr);
4878a81d60d8SStefano Zampini     ierr = PetscMalloc(bs*sizeof(IS),&custom_ISForDofs);CHKERRQ(ierr);
4879a81d60d8SStefano Zampini     for (i=0; i<bs; i++) {
4880a81d60d8SStefano Zampini       ierr = ISCreateStride(PETSC_COMM_SELF,pcis->n/bs,i,bs,&custom_ISForDofs[i]);CHKERRQ(ierr);
4881a81d60d8SStefano Zampini     }
4882a81d60d8SStefano Zampini     ierr = PCBDDCSetDofsSplitting(pc,bs,custom_ISForDofs);CHKERRQ(ierr);
4883a81d60d8SStefano Zampini     vertex_size=1;
4884a81d60d8SStefano Zampini     /* remove my references to IS objects */
4885a81d60d8SStefano Zampini     for (i=0; i<bs; i++) {
4886a81d60d8SStefano Zampini       ierr = ISDestroy(&custom_ISForDofs[i]);CHKERRQ(ierr);
4887a81d60d8SStefano Zampini     }
4888a81d60d8SStefano Zampini     ierr = PetscFree(custom_ISForDofs);CHKERRQ(ierr);
4889a81d60d8SStefano Zampini   }
48909c0446d6SStefano Zampini   for (i=0; i<pcbddc->n_ISForDofs; i++) {
4891a81d60d8SStefano Zampini     ierr = ISGetSize(pcbddc->ISForDofs[i],&k);CHKERRQ(ierr);
48929c0446d6SStefano Zampini     ierr = ISGetIndices(pcbddc->ISForDofs[i],(const PetscInt**)&is_indices);CHKERRQ(ierr);
48932fa5cd67SKarl Rupp     for (j=0; j<k; j++) mat_graph->which_dof[is_indices[j]]=i;
48949c0446d6SStefano Zampini     ierr = ISRestoreIndices(pcbddc->ISForDofs[i],(const PetscInt**)&is_indices);CHKERRQ(ierr);
48959c0446d6SStefano Zampini   }
4896a81d60d8SStefano Zampini   /* use mat block size as vertex size if it has not yet been set */
4897a81d60d8SStefano Zampini   if (!vertex_size) {
48983b03a366Sstefano_zampini     ierr = MatGetBlockSize(matis->A,&vertex_size);CHKERRQ(ierr);
48990c7d97c5SJed Brown   }
4900a81d60d8SStefano Zampini 
49013b03a366Sstefano_zampini   /* count number of neigh per node */
49020c7d97c5SJed Brown   total_counts=0;
49033b03a366Sstefano_zampini   for (i=1; i<pcis->n_neigh; i++) {
49040c7d97c5SJed Brown     s             = pcis->n_shared[i];
49050c7d97c5SJed Brown     total_counts += s;
49062fa5cd67SKarl Rupp     for (j=0;j<s;j++) mat_graph->count[pcis->shared[i][j]] += 1;
49070c7d97c5SJed Brown   }
49082fa5cd67SKarl Rupp 
4909534831adSStefano Zampini   /* Take into account Neumann data -> it increments number of sharing subdomains for nodes lying on the interface */
491036e030ebSStefano Zampini   ierr = PCBDDCGetNeumannBoundaries(pc,&used_IS);CHKERRQ(ierr);
4911da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
4912da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
491336e030ebSStefano Zampini   if (used_IS) {
491436e030ebSStefano Zampini     ierr = ISGetSize(used_IS,&neumann_bsize);CHKERRQ(ierr);
491536e030ebSStefano Zampini     ierr = ISGetIndices(used_IS,&neumann_nodes);CHKERRQ(ierr);
491653cdbc3dSStefano Zampini     for (i=0; i<neumann_bsize; i++) {
491753cdbc3dSStefano Zampini       iindex = neumann_nodes[i];
4918534831adSStefano Zampini       if (mat_graph->count[iindex] > NEUMANNCNT && array[iindex]==0.0) {
491953cdbc3dSStefano Zampini         mat_graph->count[iindex]+=1;
49200c7d97c5SJed Brown         total_counts++;
4921da1bb401SStefano Zampini         array[iindex]=array[iindex]+1.0;
4922f23aa3ddSBarry Smith       } else if (array[iindex]>0.0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"Error for neumann nodes provided to BDDC! They must be uniquely listed! Found duplicate node %d\n",iindex);
49230c7d97c5SJed Brown     }
49240c7d97c5SJed Brown   }
4925da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4926da1bb401SStefano Zampini   /* allocate space for storing the set of neighbours for each node */
4927da1bb401SStefano Zampini   ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt*),&mat_graph->neighbours_set);CHKERRQ(ierr);
4928da1bb401SStefano Zampini   if (mat_graph->nvtxs) { ierr = PetscMalloc(total_counts*sizeof(PetscInt),&mat_graph->neighbours_set[0]);CHKERRQ(ierr); }
4929da1bb401SStefano Zampini   for (i=1; i<mat_graph->nvtxs; i++) mat_graph->neighbours_set[i]=mat_graph->neighbours_set[i-1]+mat_graph->count[i-1];
4930a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->count,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
49313b03a366Sstefano_zampini   for (i=1; i<pcis->n_neigh; i++) {
49320c7d97c5SJed Brown     s=pcis->n_shared[i];
49330c7d97c5SJed Brown     for (j=0; j<s; j++) {
49340c7d97c5SJed Brown       k=pcis->shared[i][j];
49352fa5cd67SKarl Rupp 
4936da1bb401SStefano Zampini       mat_graph->neighbours_set[k][mat_graph->count[k]] = pcis->neigh[i];
49372fa5cd67SKarl Rupp 
49380c7d97c5SJed Brown       mat_graph->count[k]+=1;
49390c7d97c5SJed Brown     }
49400c7d97c5SJed Brown   }
4941da1bb401SStefano Zampini   /* Check consistency of Neumann nodes */
4942da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
4943da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4944da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4945da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4946da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4947da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
49483b03a366Sstefano_zampini   /* set -1 fake neighbour to mimic Neumann boundary */
494936e030ebSStefano Zampini   if (used_IS) {
495053cdbc3dSStefano Zampini     for (i=0; i<neumann_bsize; i++) {
495153cdbc3dSStefano Zampini       iindex = neumann_nodes[i];
4952534831adSStefano Zampini       if (mat_graph->count[iindex] > NEUMANNCNT) {
49532fa5cd67SKarl Rupp         if (mat_graph->count[iindex]+1 != (PetscInt)array[iindex]) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_USER,"Neumann nodes provided to BDDC must be consistent among neighbours!\nNode %d: number of sharing subdomains %d != number of subdomains for which it is a neumann node %d\n",iindex,mat_graph->count[iindex]+1,(PetscInt)array[iindex]);
4954da1bb401SStefano Zampini         mat_graph->neighbours_set[iindex][mat_graph->count[iindex]] = -1;
49552fa5cd67SKarl Rupp 
495653cdbc3dSStefano Zampini         mat_graph->count[iindex]+=1;
49570c7d97c5SJed Brown       }
49580c7d97c5SJed Brown     }
495936e030ebSStefano Zampini     ierr = ISRestoreIndices(used_IS,&neumann_nodes);CHKERRQ(ierr);
49600c7d97c5SJed Brown   }
4961da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4962da1bb401SStefano Zampini   /* sort set of sharing subdomains */
49632fa5cd67SKarl Rupp   for (i=0;i<mat_graph->nvtxs;i++) {
49642fa5cd67SKarl Rupp     ierr = PetscSortInt(mat_graph->count[i],mat_graph->neighbours_set[i]);CHKERRQ(ierr);
49652fa5cd67SKarl Rupp   }
49662fa5cd67SKarl Rupp 
49673b03a366Sstefano_zampini   /* remove interior nodes and dirichlet boundary nodes from the next search into the graph */
49682fa5cd67SKarl Rupp   for (i=0;i<mat_graph->nvtxs;i++) mat_graph->touched[i]=PETSC_FALSE;
4969da1bb401SStefano Zampini   nodes_touched=0;
49702fa5cd67SKarl Rupp 
497136e030ebSStefano Zampini   ierr = PCBDDCGetDirichletBoundaries(pc,&used_IS);CHKERRQ(ierr);
4972da1bb401SStefano Zampini   ierr = VecSet(pcis->vec2_N,0.0);CHKERRQ(ierr);
4973da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4974da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
4975da1bb401SStefano Zampini   if (used_IS) {
4976da1bb401SStefano Zampini     ierr = ISGetSize(used_IS,&dirichlet_bsize);CHKERRQ(ierr);
4977f23aa3ddSBarry Smith     if (dirichlet_bsize && matis->pure_neumann) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"Dirichlet boundaries are intended to be used with matrices with zeroed rows!\n");
4978da1bb401SStefano Zampini     ierr = ISGetIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
4979da1bb401SStefano Zampini     for (i=0; i<dirichlet_bsize; i++) {
4980da1bb401SStefano Zampini       iindex = dirichlet_nodes[i];
4981da1bb401SStefano Zampini       if (mat_graph->count[iindex] && !mat_graph->touched[iindex]) {
4982f23aa3ddSBarry Smith         if (array[iindex]>0.0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"BDDC cannot have nodes which are marked as Neumann and Dirichlet at the same time! Wrong node %d\n",iindex);
4983da1bb401SStefano Zampini         mat_graph->touched[iindex] = PETSC_TRUE;
4984da1bb401SStefano Zampini         mat_graph->where[iindex]   = 0;
4985da1bb401SStefano Zampini         nodes_touched++;
4986da1bb401SStefano Zampini         array2[iindex] = array2[iindex]+1.0;
4987da1bb401SStefano Zampini       }
4988da1bb401SStefano Zampini     }
4989da1bb401SStefano Zampini     ierr = ISRestoreIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
4990da1bb401SStefano Zampini   }
4991da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4992da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
49932fa5cd67SKarl Rupp 
4994da1bb401SStefano Zampini   /* Check consistency of Dirichlet nodes */
4995da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_N,1.0);CHKERRQ(ierr);
4996da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
4997da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4998da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4999da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5000da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5001da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
5002da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec2_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
5003da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec2_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
5004da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5005da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5006da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
5007da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
500836e030ebSStefano Zampini   if (used_IS) {
500936e030ebSStefano Zampini     ierr = ISGetSize(used_IS,&dirichlet_bsize);CHKERRQ(ierr);
501036e030ebSStefano Zampini     ierr = ISGetIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
50113b03a366Sstefano_zampini     for (i=0; i<dirichlet_bsize; i++) {
5012da1bb401SStefano Zampini       iindex=dirichlet_nodes[i];
50132fa5cd67SKarl Rupp       if (array[iindex]>1.0 && array[iindex]!=array2[iindex]) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_USER,"Dirichlet nodes provided to BDDC must be consistent among neighbours!\nNode %d: number of sharing subdomains %d != number of subdomains for which it is a neumann node %d\n",iindex,(PetscInt)array[iindex],(PetscInt)array2[iindex]);
50143b03a366Sstefano_zampini     }
501536e030ebSStefano Zampini     ierr = ISRestoreIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
50163b03a366Sstefano_zampini   }
5017da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
5018da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
5019da1bb401SStefano Zampini 
50200c7d97c5SJed Brown   for (i=0; i<mat_graph->nvtxs; i++) {
50213b03a366Sstefano_zampini     if (!mat_graph->count[i]) {  /* interior nodes */
50220c7d97c5SJed Brown       mat_graph->touched[i] = PETSC_TRUE;
50230c7d97c5SJed Brown       mat_graph->where[i]   = 0;
50240c7d97c5SJed Brown       nodes_touched++;
50250c7d97c5SJed Brown     }
50260c7d97c5SJed Brown   }
50270c7d97c5SJed Brown   mat_graph->ncmps = 0;
50282fa5cd67SKarl Rupp 
5029da1bb401SStefano Zampini   i=0;
50300c7d97c5SJed Brown   while (nodes_touched<mat_graph->nvtxs) {
5031a0ba757dSStefano Zampini     /*  find first untouched node in local ordering */
50320c7d97c5SJed Brown     while (mat_graph->touched[i]) i++;
50330c7d97c5SJed Brown     mat_graph->touched[i]=PETSC_TRUE;
5034a0ba757dSStefano Zampini     mat_graph->where[i]  =where_values;
50350c7d97c5SJed Brown     nodes_touched++;
5036a0ba757dSStefano Zampini     /* now find all other nodes having the same set of sharing subdomains */
50370c7d97c5SJed Brown     for (j=i+1; j<mat_graph->nvtxs; j++) {
5038a0ba757dSStefano Zampini       /* check for same number of sharing subdomains and dof number */
5039da1bb401SStefano Zampini       if (!mat_graph->touched[j] && mat_graph->count[i]==mat_graph->count[j] && mat_graph->which_dof[i] == mat_graph->which_dof[j]) {
5040a0ba757dSStefano Zampini         /* check for same set of sharing subdomains */
50410c7d97c5SJed Brown         same_set=PETSC_TRUE;
50420c7d97c5SJed Brown         for (k=0; k<mat_graph->count[j]; k++) {
5043da1bb401SStefano Zampini           if (mat_graph->neighbours_set[i][k] != mat_graph->neighbours_set[j][k]) {
50440c7d97c5SJed Brown             same_set=PETSC_FALSE;
50450c7d97c5SJed Brown           }
50460c7d97c5SJed Brown         }
5047a0ba757dSStefano Zampini         /* I found a friend of mine */
50480c7d97c5SJed Brown         if (same_set) {
5049a0ba757dSStefano Zampini           mat_graph->where[j]   = where_values;
50500c7d97c5SJed Brown           mat_graph->touched[j] = PETSC_TRUE;
50510c7d97c5SJed Brown           nodes_touched++;
50520c7d97c5SJed Brown         }
50530c7d97c5SJed Brown       }
50540c7d97c5SJed Brown     }
5055a0ba757dSStefano Zampini     where_values++;
50560c7d97c5SJed Brown   }
5057a0ba757dSStefano Zampini   where_values--; if (where_values<0) where_values=0;
5058a0ba757dSStefano Zampini   ierr = PetscMalloc(where_values*sizeof(PetscMPIInt),&mat_graph->where_ncmps);CHKERRQ(ierr);
5059a0ba757dSStefano Zampini   /* Find connected components defined on the shared interface */
5060a0ba757dSStefano Zampini   if (where_values) {
50612fa5cd67SKarl Rupp     ierr = PCBDDCFindConnectedComponents(mat_graph, where_values);CHKERRQ(ierr);
5062a0ba757dSStefano Zampini   }
5063a929c220SStefano Zampini   ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt),&queue_in_global_numbering);CHKERRQ(ierr);
5064a0ba757dSStefano Zampini   /* check consistency of connected components among neighbouring subdomains -> adapt them if needed */
5065a0ba757dSStefano Zampini   for (i=0;i<where_values;i++) {
50667cf533a6SStefano Zampini     /* We are not sure that on a given subset of the local interface,
50677cf533a6SStefano Zampini        two connected components will be the same among sharing subdomains */
50683b03a366Sstefano_zampini     if (mat_graph->where_ncmps[i]>1) {
5069a0ba757dSStefano Zampini       adapt_interface=1;
5070a0ba757dSStefano Zampini       break;
5071a0ba757dSStefano Zampini     }
5072a0ba757dSStefano Zampini   }
50732fa5cd67SKarl Rupp 
5074a0ba757dSStefano Zampini   ierr = MPI_Allreduce(&adapt_interface,&adapt_interface_reduced,1,MPIU_INT,MPI_LOR,interface_comm);CHKERRQ(ierr);
5075da1bb401SStefano Zampini   if (pcbddc->dbg_flag && adapt_interface_reduced) {
5076d8923723SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"Adapting interface\n");CHKERRQ(ierr);
5077da1bb401SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
5078da1bb401SStefano Zampini   }
5079a0ba757dSStefano Zampini   if (where_values && adapt_interface_reduced) {
5080a0ba757dSStefano Zampini     PetscInt    sum_requests=0,my_rank;
5081a0ba757dSStefano Zampini     PetscInt    buffer_size,start_of_recv,size_of_recv,start_of_send;
5082a0ba757dSStefano Zampini     PetscInt    temp_buffer_size,ins_val,global_where_counter;
5083a0ba757dSStefano Zampini     PetscInt    *cum_recv_counts;
5084a0ba757dSStefano Zampini     PetscInt    *where_to_nodes_indices;
5085a0ba757dSStefano Zampini     PetscInt    *petsc_buffer;
5086a0ba757dSStefano Zampini     PetscMPIInt *recv_buffer;
5087a0ba757dSStefano Zampini     PetscMPIInt *recv_buffer_where;
5088a0ba757dSStefano Zampini     PetscMPIInt *send_buffer;
5089a0ba757dSStefano Zampini     PetscMPIInt size_of_send;
5090a0ba757dSStefano Zampini     PetscInt    *sizes_of_sends;
5091a0ba757dSStefano Zampini     MPI_Request *send_requests;
5092a0ba757dSStefano Zampini     MPI_Request *recv_requests;
5093a0ba757dSStefano Zampini     PetscInt    *where_cc_adapt;
5094a0ba757dSStefano Zampini     PetscInt    **temp_buffer;
5095a0ba757dSStefano Zampini     PetscInt    *nodes_to_temp_buffer_indices;
5096a0ba757dSStefano Zampini     PetscInt    *add_to_where;
50977cf533a6SStefano Zampini     PetscInt    *aux_new_xadj,*new_xadj,*new_adjncy;
5098a0ba757dSStefano Zampini 
50997cf533a6SStefano Zampini     /* Restrict adjacency graph using information from connected components */
51007cf533a6SStefano Zampini     ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt),&aux_new_xadj);CHKERRQ(ierr);
51012fa5cd67SKarl Rupp     for (i=0; i<mat_graph->nvtxs; i++) aux_new_xadj[i]=1;
51027cf533a6SStefano Zampini     for (i=0;i<mat_graph->ncmps;i++) {
51037cf533a6SStefano Zampini       k = mat_graph->cptr[i+1]-mat_graph->cptr[i];
51042fa5cd67SKarl Rupp       for (j=0;j<k;j++) aux_new_xadj[mat_graph->queue[mat_graph->cptr[i]+j]]=k;
51057cf533a6SStefano Zampini     }
51067cf533a6SStefano Zampini     j = 0;
51072fa5cd67SKarl Rupp     for (i=0;i<mat_graph->nvtxs;i++) j += aux_new_xadj[i];
51082fa5cd67SKarl Rupp 
51097cf533a6SStefano Zampini     ierr = PetscMalloc((mat_graph->nvtxs+1)*sizeof(PetscInt),&new_xadj);CHKERRQ(ierr);
51107cf533a6SStefano Zampini     ierr = PetscMalloc(j*sizeof(PetscInt),&new_adjncy);CHKERRQ(ierr);
51117cf533a6SStefano Zampini     new_xadj[0]=0;
51127cf533a6SStefano Zampini     for (i=0;i<mat_graph->nvtxs;i++) {
51137cf533a6SStefano Zampini       new_xadj[i+1]=new_xadj[i]+aux_new_xadj[i];
51142fa5cd67SKarl Rupp       if (aux_new_xadj[i]==1) new_adjncy[new_xadj[i]]=i;
51157cf533a6SStefano Zampini     }
5116354b9337SStefano Zampini     ierr = PetscFree(aux_new_xadj);CHKERRQ(ierr);
51177cf533a6SStefano Zampini     for (i=0; i<mat_graph->ncmps; i++) {
51187cf533a6SStefano Zampini       k = mat_graph->cptr[i+1]-mat_graph->cptr[i];
51197cf533a6SStefano Zampini       for (j=0; j<k; j++) {
51207cf533a6SStefano Zampini         ierr = PetscMemcpy(&new_adjncy[new_xadj[mat_graph->queue[mat_graph->cptr[i]+j]]],&mat_graph->queue[mat_graph->cptr[i]],k*sizeof(PetscInt));CHKERRQ(ierr);
51217cf533a6SStefano Zampini       }
51227cf533a6SStefano Zampini     }
51237cf533a6SStefano Zampini     ierr = PCBDDCSetLocalAdjacencyGraph(pc,mat_graph->nvtxs,new_xadj,new_adjncy,PETSC_OWN_POINTER);CHKERRQ(ierr);
51247cf533a6SStefano Zampini     /* For consistency among neighbouring procs, I need to sort (by global ordering) each connected component */
51257cf533a6SStefano Zampini     for (i=0; i<mat_graph->ncmps; i++) {
51267cf533a6SStefano Zampini       k    = mat_graph->cptr[i+1]-mat_graph->cptr[i];
51277cf533a6SStefano Zampini       ierr = ISLocalToGlobalMappingApply(matis->mapping,k,&mat_graph->queue[mat_graph->cptr[i]],&queue_in_global_numbering[mat_graph->cptr[i]]);CHKERRQ(ierr);
51287cf533a6SStefano Zampini       ierr = PetscSortIntWithArray(k,&queue_in_global_numbering[mat_graph->cptr[i]],&mat_graph->queue[mat_graph->cptr[i]]);CHKERRQ(ierr);
51297cf533a6SStefano Zampini     }
51307cf533a6SStefano Zampini     /* allocate some space */
5131a0ba757dSStefano Zampini     ierr = MPI_Comm_rank(interface_comm,&my_rank);CHKERRQ(ierr);
5132a0ba757dSStefano Zampini     ierr = PetscMalloc((where_values+1)*sizeof(PetscInt),&cum_recv_counts);CHKERRQ(ierr);
5133a0ba757dSStefano Zampini     ierr = PetscMemzero(cum_recv_counts,(where_values+1)*sizeof(PetscInt));CHKERRQ(ierr);
5134a0ba757dSStefano Zampini     ierr = PetscMalloc(where_values*sizeof(PetscInt),&where_to_nodes_indices);CHKERRQ(ierr);
5135a0ba757dSStefano Zampini     /* first count how many neighbours per connected component I will receive from */
5136a0ba757dSStefano Zampini     cum_recv_counts[0]=0;
5137a0ba757dSStefano Zampini     for (i=1; i<where_values+1; i++) {
5138a0ba757dSStefano Zampini       j=0;
51392fa5cd67SKarl Rupp       while (mat_graph->where[j] != i) j++;
5140a0ba757dSStefano Zampini       where_to_nodes_indices[i-1]=j;
51412fa5cd67SKarl Rupp       if (mat_graph->neighbours_set[j][0]!=-1) cum_recv_counts[i]=cum_recv_counts[i-1]+mat_graph->count[j]; /* We don't want sends/recvs_to/from_self -> here I don't count myself  */
51422fa5cd67SKarl Rupp       else cum_recv_counts[i]=cum_recv_counts[i-1]+mat_graph->count[j]-1;
5143a0ba757dSStefano Zampini     }
5144a0ba757dSStefano Zampini     ierr = PetscMalloc(2*cum_recv_counts[where_values]*sizeof(PetscMPIInt),&recv_buffer_where);CHKERRQ(ierr);
5145a0ba757dSStefano Zampini     ierr = PetscMalloc(cum_recv_counts[where_values]*sizeof(MPI_Request),&send_requests);CHKERRQ(ierr);
5146a0ba757dSStefano Zampini     ierr = PetscMalloc(cum_recv_counts[where_values]*sizeof(MPI_Request),&recv_requests);CHKERRQ(ierr);
5147a0ba757dSStefano Zampini     for (i=0; i<cum_recv_counts[where_values]; i++) {
5148a0ba757dSStefano Zampini       send_requests[i]=MPI_REQUEST_NULL;
5149a0ba757dSStefano Zampini       recv_requests[i]=MPI_REQUEST_NULL;
5150a0ba757dSStefano Zampini     }
5151a0ba757dSStefano Zampini     /* exchange with my neighbours the number of my connected components on the shared interface */
5152a0ba757dSStefano Zampini     for (i=0; i<where_values; i++) {
5153a0ba757dSStefano Zampini       j = where_to_nodes_indices[i];
5154da1bb401SStefano Zampini       k = (mat_graph->neighbours_set[j][0] == -1 ?  1 : 0);
5155a0ba757dSStefano Zampini       for (; k<mat_graph->count[j]; k++) {
5156da1bb401SStefano Zampini         ierr = MPI_Isend(&mat_graph->where_ncmps[i],1,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr);
5157da1bb401SStefano Zampini         ierr = MPI_Irecv(&recv_buffer_where[sum_requests],1,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr);
5158a0ba757dSStefano Zampini         sum_requests++;
5159a0ba757dSStefano Zampini       }
5160a0ba757dSStefano Zampini     }
5161a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
5162a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
5163a0ba757dSStefano Zampini     /* determine the connected component I need to adapt */
5164a0ba757dSStefano Zampini     ierr = PetscMalloc(where_values*sizeof(PetscInt),&where_cc_adapt);CHKERRQ(ierr);
5165a0ba757dSStefano Zampini     ierr = PetscMemzero(where_cc_adapt,where_values*sizeof(PetscInt));CHKERRQ(ierr);
5166a0ba757dSStefano Zampini     for (i=0; i<where_values; i++) {
5167a0ba757dSStefano Zampini       for (j=cum_recv_counts[i]; j<cum_recv_counts[i+1]; j++) {
51683b03a366Sstefano_zampini         /* The first condition is natural (i.e someone has a different number of cc than me), the second one is just to be safe */
51693b03a366Sstefano_zampini         if (mat_graph->where_ncmps[i]!=recv_buffer_where[j] || mat_graph->where_ncmps[i] > 1) {
5170a0ba757dSStefano Zampini           where_cc_adapt[i]=PETSC_TRUE;
5171a0ba757dSStefano Zampini           break;
5172a0ba757dSStefano Zampini         }
5173a0ba757dSStefano Zampini       }
5174a0ba757dSStefano Zampini     }
5175d8923723SStefano Zampini     buffer_size = 0;
5176d8923723SStefano Zampini     for (i=0; i<where_values; i++) {
5177d8923723SStefano Zampini       if (where_cc_adapt[i]) {
5178d8923723SStefano Zampini         for (j=i; j<mat_graph->ncmps; j++) {
5179d8923723SStefano Zampini           if (mat_graph->where[mat_graph->queue[mat_graph->cptr[j]]] == i+1) { /* WARNING -> where values goes from 1 to where_values included */
5180d8923723SStefano Zampini             buffer_size += 1 + mat_graph->cptr[j+1]-mat_graph->cptr[j];
5181d8923723SStefano Zampini           }
5182d8923723SStefano Zampini         }
5183d8923723SStefano Zampini       }
5184d8923723SStefano Zampini     }
5185d8923723SStefano Zampini     ierr = PetscMalloc(buffer_size*sizeof(PetscMPIInt),&send_buffer);CHKERRQ(ierr);
5186a0ba757dSStefano Zampini     /* now get from neighbours their ccs (in global numbering) and adapt them (in case it is needed) */
5187a0ba757dSStefano Zampini     /* first determine how much data to send (size of each queue plus the global indices) and communicate it to neighbours */
5188a0ba757dSStefano Zampini     ierr = PetscMalloc(where_values*sizeof(PetscInt),&sizes_of_sends);CHKERRQ(ierr);
5189a0ba757dSStefano Zampini     ierr = PetscMemzero(sizes_of_sends,where_values*sizeof(PetscInt));CHKERRQ(ierr);
51902fa5cd67SKarl Rupp 
5191a0ba757dSStefano Zampini     sum_requests  = 0;
5192a0ba757dSStefano Zampini     start_of_send = 0;
5193a0ba757dSStefano Zampini     start_of_recv = cum_recv_counts[where_values];
5194a0ba757dSStefano Zampini     for (i=0; i<where_values; i++) {
5195a0ba757dSStefano Zampini       if (where_cc_adapt[i]) {
5196a0ba757dSStefano Zampini         size_of_send=0;
5197a0ba757dSStefano Zampini         for (j=i; j<mat_graph->ncmps; j++) {
5198a0ba757dSStefano Zampini           if (mat_graph->where[mat_graph->queue[mat_graph->cptr[j]]] == i+1) { /* WARNING -> where values goes from 1 to where_values included */
5199a0ba757dSStefano Zampini             send_buffer[start_of_send+size_of_send]=mat_graph->cptr[j+1]-mat_graph->cptr[j];
5200a0ba757dSStefano Zampini             size_of_send += 1;
5201a0ba757dSStefano Zampini             for (k=0; k<mat_graph->cptr[j+1]-mat_graph->cptr[j]; k++) {
5202a0ba757dSStefano Zampini               send_buffer[start_of_send+size_of_send+k]=queue_in_global_numbering[mat_graph->cptr[j]+k];
5203a0ba757dSStefano Zampini             }
5204a0ba757dSStefano Zampini             size_of_send=size_of_send+mat_graph->cptr[j+1]-mat_graph->cptr[j];
5205a0ba757dSStefano Zampini           }
5206a0ba757dSStefano Zampini         }
5207a0ba757dSStefano Zampini         j = where_to_nodes_indices[i];
5208da1bb401SStefano Zampini         k = (mat_graph->neighbours_set[j][0] == -1 ?  1 : 0);
520911d8f4c2SStefano Zampini         sizes_of_sends[i]=size_of_send;
5210a0ba757dSStefano Zampini         for (; k<mat_graph->count[j]; k++) {
521111d8f4c2SStefano Zampini           ierr = MPI_Isend(&sizes_of_sends[i],1,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr);
5212da1bb401SStefano Zampini           ierr = MPI_Irecv(&recv_buffer_where[sum_requests+start_of_recv],1,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr);
5213a0ba757dSStefano Zampini           sum_requests++;
5214a0ba757dSStefano Zampini         }
5215a0ba757dSStefano Zampini         start_of_send+=size_of_send;
5216a0ba757dSStefano Zampini       }
5217a0ba757dSStefano Zampini     }
5218a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
5219a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
52202fa5cd67SKarl Rupp 
5221a0ba757dSStefano Zampini     buffer_size=0;
52222fa5cd67SKarl Rupp 
52232fa5cd67SKarl Rupp     for (k=0;k<sum_requests;k++) buffer_size += recv_buffer_where[start_of_recv+k];
5224a0ba757dSStefano Zampini     ierr = PetscMalloc(buffer_size*sizeof(PetscMPIInt),&recv_buffer);CHKERRQ(ierr);
5225a0ba757dSStefano Zampini     /* now exchange the data */
5226a0ba757dSStefano Zampini     start_of_recv = 0;
5227a0ba757dSStefano Zampini     start_of_send = 0;
5228a0ba757dSStefano Zampini     sum_requests  = 0;
5229a0ba757dSStefano Zampini     for (i=0; i<where_values; i++) {
5230a0ba757dSStefano Zampini       if (where_cc_adapt[i]) {
5231a0ba757dSStefano Zampini         size_of_send = sizes_of_sends[i];
52322fa5cd67SKarl Rupp 
5233a0ba757dSStefano Zampini         j = where_to_nodes_indices[i];
5234da1bb401SStefano Zampini         k = (mat_graph->neighbours_set[j][0] == -1 ?  1 : 0);
5235a0ba757dSStefano Zampini         for (; k<mat_graph->count[j]; k++) {
5236da1bb401SStefano Zampini           ierr          = MPI_Isend(&send_buffer[start_of_send],size_of_send,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr);
5237a0ba757dSStefano Zampini           size_of_recv  = recv_buffer_where[cum_recv_counts[where_values]+sum_requests];
5238da1bb401SStefano Zampini           ierr          = MPI_Irecv(&recv_buffer[start_of_recv],size_of_recv,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr);
5239a0ba757dSStefano Zampini           start_of_recv+=size_of_recv;
5240a0ba757dSStefano Zampini           sum_requests++;
5241a0ba757dSStefano Zampini         }
5242a0ba757dSStefano Zampini         start_of_send+=size_of_send;
5243a0ba757dSStefano Zampini       }
5244a0ba757dSStefano Zampini     }
5245a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
5246a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
5247a0ba757dSStefano Zampini     ierr = PetscMalloc(buffer_size*sizeof(PetscInt),&petsc_buffer);CHKERRQ(ierr);
52482fa5cd67SKarl Rupp     for (k=0;k<start_of_recv;k++) petsc_buffer[k]=(PetscInt)recv_buffer[k];
5249a0ba757dSStefano Zampini     for (j=0;j<buffer_size;) {
5250a0ba757dSStefano Zampini       ierr = ISGlobalToLocalMappingApply(matis->mapping,IS_GTOLM_MASK,petsc_buffer[j],&petsc_buffer[j+1],&petsc_buffer[j],&petsc_buffer[j+1]);CHKERRQ(ierr);
5251a0ba757dSStefano Zampini       k    = petsc_buffer[j]+1;
5252a0ba757dSStefano Zampini       j   += k;
5253a0ba757dSStefano Zampini     }
5254a0ba757dSStefano Zampini     sum_requests  = cum_recv_counts[where_values];
5255a0ba757dSStefano Zampini     start_of_recv = 0;
52562fa5cd67SKarl Rupp 
5257a0ba757dSStefano Zampini     ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt),&nodes_to_temp_buffer_indices);CHKERRQ(ierr);
5258a0ba757dSStefano Zampini     global_where_counter=0;
5259a0ba757dSStefano Zampini     for (i=0; i<where_values; i++) {
5260a0ba757dSStefano Zampini       if (where_cc_adapt[i]) {
5261a0ba757dSStefano Zampini         temp_buffer_size=0;
5262a0ba757dSStefano Zampini         /* find nodes on the shared interface we need to adapt */
5263a0ba757dSStefano Zampini         for (j=0; j<mat_graph->nvtxs; j++) {
5264a0ba757dSStefano Zampini           if (mat_graph->where[j]==i+1) {
5265a0ba757dSStefano Zampini             nodes_to_temp_buffer_indices[j]=temp_buffer_size;
5266a0ba757dSStefano Zampini             temp_buffer_size++;
5267a0ba757dSStefano Zampini           } else {
5268a0ba757dSStefano Zampini             nodes_to_temp_buffer_indices[j]=-1;
5269a0ba757dSStefano Zampini           }
5270a0ba757dSStefano Zampini         }
52712fa5cd67SKarl Rupp 
5272a0ba757dSStefano Zampini         /* allocate some temporary space */
5273a0ba757dSStefano Zampini         ierr = PetscMalloc(temp_buffer_size*sizeof(PetscInt*),&temp_buffer);CHKERRQ(ierr);
5274a0ba757dSStefano Zampini         ierr = PetscMalloc(temp_buffer_size*(cum_recv_counts[i+1]-cum_recv_counts[i])*sizeof(PetscInt),&temp_buffer[0]);CHKERRQ(ierr);
5275a0ba757dSStefano Zampini         ierr = PetscMemzero(temp_buffer[0],temp_buffer_size*(cum_recv_counts[i+1]-cum_recv_counts[i])*sizeof(PetscInt));CHKERRQ(ierr);
5276a0ba757dSStefano Zampini         for (j=1; j<temp_buffer_size; j++) {
5277a0ba757dSStefano Zampini           temp_buffer[j]=temp_buffer[j-1]+cum_recv_counts[i+1]-cum_recv_counts[i];
5278a0ba757dSStefano Zampini         }
5279a0ba757dSStefano Zampini         /* analyze contributions from neighbouring subdomains for i-th conn comp
5280a0ba757dSStefano Zampini            temp buffer structure:
5281a0ba757dSStefano Zampini            supposing part of the interface has dimension 5 (global nodes 0,1,2,3,4)
5282a0ba757dSStefano Zampini            3 neighs procs with structured connected components:
5283a0ba757dSStefano Zampini              neigh 0: [0 1 4], [2 3];  (2 connected components)
5284a0ba757dSStefano Zampini              neigh 1: [0 1], [2 3 4];  (2 connected components)
5285a0ba757dSStefano Zampini              neigh 2: [0 4], [1], [2 3]; (3 connected components)
5286a0ba757dSStefano Zampini            tempbuffer (row-oriented) should be filled as:
5287a0ba757dSStefano Zampini              [ 0, 0, 0;
5288a0ba757dSStefano Zampini                0, 0, 1;
5289a0ba757dSStefano Zampini                1, 1, 2;
5290a0ba757dSStefano Zampini                1, 1, 2;
5291a0ba757dSStefano Zampini                0, 1, 0; ];
5292a0ba757dSStefano Zampini            This way we can simply recover the resulting structure, accounting for possible intersections of ccs among neighs.
5293a0ba757dSStefano Zampini            The mat_graph->where array will be modified to reproduce the following 4 connected components [0], [1], [2 3], [4];
5294a0ba757dSStefano Zampini                                                                                                                                    */
5295a0ba757dSStefano Zampini         for (j=0;j<cum_recv_counts[i+1]-cum_recv_counts[i];j++) {
5296a0ba757dSStefano Zampini           ins_val=0;
5297a0ba757dSStefano Zampini           size_of_recv=recv_buffer_where[sum_requests];  /* total size of recv from neighs */
5298a0ba757dSStefano Zampini           for (buffer_size=0;buffer_size<size_of_recv;) {  /* loop until all data from neighs has been taken into account */
5299a0ba757dSStefano Zampini             for (k=1;k<petsc_buffer[buffer_size+start_of_recv]+1;k++) { /* filling properly temp_buffer using data from a single recv */
5300a0ba757dSStefano Zampini               temp_buffer[nodes_to_temp_buffer_indices[petsc_buffer[start_of_recv+buffer_size+k]]][j] = ins_val;
5301a0ba757dSStefano Zampini             }
5302a0ba757dSStefano Zampini             buffer_size+=k;
5303a0ba757dSStefano Zampini             ins_val++;
5304a0ba757dSStefano Zampini           }
5305a0ba757dSStefano Zampini           start_of_recv+=size_of_recv;
5306a0ba757dSStefano Zampini           sum_requests++;
5307a0ba757dSStefano Zampini         }
5308a0ba757dSStefano Zampini         ierr = PetscMalloc(temp_buffer_size*sizeof(PetscInt),&add_to_where);CHKERRQ(ierr);
5309a0ba757dSStefano Zampini         ierr = PetscMemzero(add_to_where,temp_buffer_size*sizeof(PetscInt));CHKERRQ(ierr);
5310a0ba757dSStefano Zampini         for (j=0; j<temp_buffer_size; j++) {
5311a0ba757dSStefano Zampini           if (!add_to_where[j]) { /* found a new cc  */
5312a0ba757dSStefano Zampini             global_where_counter++;
5313a0ba757dSStefano Zampini             add_to_where[j]=global_where_counter;
5314a0ba757dSStefano Zampini             for (k=j+1; k<temp_buffer_size; k++) { /* check for other nodes in new cc */
5315a0ba757dSStefano Zampini               same_set=PETSC_TRUE;
5316a0ba757dSStefano Zampini               for (s=0; s<cum_recv_counts[i+1]-cum_recv_counts[i]; s++) {
5317a0ba757dSStefano Zampini                 if (temp_buffer[j][s]!=temp_buffer[k][s]) {
5318a0ba757dSStefano Zampini                   same_set=PETSC_FALSE;
5319a0ba757dSStefano Zampini                   break;
5320a0ba757dSStefano Zampini                 }
5321a0ba757dSStefano Zampini               }
53222fa5cd67SKarl Rupp               if (same_set) add_to_where[k] = global_where_counter;
5323a0ba757dSStefano Zampini             }
5324a0ba757dSStefano Zampini           }
5325a0ba757dSStefano Zampini         }
5326a0ba757dSStefano Zampini         /* insert new data in where array */
5327a0ba757dSStefano Zampini         temp_buffer_size=0;
5328a0ba757dSStefano Zampini         for (j=0;j<mat_graph->nvtxs;j++) {
5329a0ba757dSStefano Zampini           if (mat_graph->where[j]==i+1) {
5330a0ba757dSStefano Zampini             mat_graph->where[j]=where_values+add_to_where[temp_buffer_size];
5331a0ba757dSStefano Zampini             temp_buffer_size++;
5332a0ba757dSStefano Zampini           }
5333a0ba757dSStefano Zampini         }
5334a0ba757dSStefano Zampini         ierr = PetscFree(temp_buffer[0]);CHKERRQ(ierr);
5335a0ba757dSStefano Zampini         ierr = PetscFree(temp_buffer);CHKERRQ(ierr);
5336a0ba757dSStefano Zampini         ierr = PetscFree(add_to_where);CHKERRQ(ierr);
5337a0ba757dSStefano Zampini       }
5338a0ba757dSStefano Zampini     }
5339a0ba757dSStefano Zampini     ierr = PetscFree(nodes_to_temp_buffer_indices);CHKERRQ(ierr);
5340a0ba757dSStefano Zampini     ierr = PetscFree(sizes_of_sends);CHKERRQ(ierr);
5341a0ba757dSStefano Zampini     ierr = PetscFree(send_requests);CHKERRQ(ierr);
5342a0ba757dSStefano Zampini     ierr = PetscFree(recv_requests);CHKERRQ(ierr);
5343a0ba757dSStefano Zampini     ierr = PetscFree(petsc_buffer);CHKERRQ(ierr);
5344a0ba757dSStefano Zampini     ierr = PetscFree(recv_buffer);CHKERRQ(ierr);
5345a0ba757dSStefano Zampini     ierr = PetscFree(recv_buffer_where);CHKERRQ(ierr);
5346a0ba757dSStefano Zampini     ierr = PetscFree(send_buffer);CHKERRQ(ierr);
5347a0ba757dSStefano Zampini     ierr = PetscFree(cum_recv_counts);CHKERRQ(ierr);
5348a0ba757dSStefano Zampini     ierr = PetscFree(where_to_nodes_indices);CHKERRQ(ierr);
534923d4d1a5SStefano Zampini     ierr = PetscFree(where_cc_adapt);CHKERRQ(ierr);
53502fa5cd67SKarl Rupp 
5351a0ba757dSStefano Zampini     /* We are ready to evaluate consistent connected components on each part of the shared interface */
5352a0ba757dSStefano Zampini     if (global_where_counter) {
53532fa5cd67SKarl Rupp       for (i=0;i<mat_graph->nvtxs;i++) mat_graph->touched[i]=PETSC_FALSE;
5354a0ba757dSStefano Zampini       global_where_counter=0;
5355a0ba757dSStefano Zampini       for (i=0;i<mat_graph->nvtxs;i++) {
5356a0ba757dSStefano Zampini         if (mat_graph->where[i] && !mat_graph->touched[i]) {
5357a0ba757dSStefano Zampini           global_where_counter++;
5358a0ba757dSStefano Zampini           for (j=i+1;j<mat_graph->nvtxs;j++) {
5359a0ba757dSStefano Zampini             if (!mat_graph->touched[j] && mat_graph->where[j]==mat_graph->where[i]) {
5360a0ba757dSStefano Zampini               mat_graph->where[j]   = global_where_counter;
5361a0ba757dSStefano Zampini               mat_graph->touched[j] = PETSC_TRUE;
5362a0ba757dSStefano Zampini             }
5363a0ba757dSStefano Zampini           }
5364a0ba757dSStefano Zampini           mat_graph->where[i]   = global_where_counter;
5365a0ba757dSStefano Zampini           mat_graph->touched[i] = PETSC_TRUE;
5366a0ba757dSStefano Zampini         }
5367a0ba757dSStefano Zampini       }
5368a0ba757dSStefano Zampini       where_values=global_where_counter;
5369a0ba757dSStefano Zampini     }
5370a0ba757dSStefano Zampini     if (global_where_counter) {
5371a0ba757dSStefano Zampini       ierr = PetscMemzero(mat_graph->cptr,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr);
5372a0ba757dSStefano Zampini       ierr = PetscMemzero(mat_graph->queue,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
5373a0ba757dSStefano Zampini       ierr = PetscFree(mat_graph->where_ncmps);CHKERRQ(ierr);
5374a0ba757dSStefano Zampini       ierr = PetscMalloc(where_values*sizeof(PetscMPIInt),&mat_graph->where_ncmps);CHKERRQ(ierr);
5375a0ba757dSStefano Zampini       ierr = PCBDDCFindConnectedComponents(mat_graph, where_values);
5376a0ba757dSStefano Zampini     }
53773b03a366Sstefano_zampini   } /* Finished adapting interface */
53782fa5cd67SKarl Rupp 
5379a929c220SStefano Zampini   /* For consistency among neighbouring procs, I need to sort (by global ordering) each connected component */
5380a929c220SStefano Zampini   for (i=0; i<mat_graph->ncmps; i++) {
5381a929c220SStefano Zampini     k    = mat_graph->cptr[i+1]-mat_graph->cptr[i];
5382a929c220SStefano Zampini     ierr = ISLocalToGlobalMappingApply(matis->mapping,k,&mat_graph->queue[mat_graph->cptr[i]],&queue_in_global_numbering[mat_graph->cptr[i]]);CHKERRQ(ierr);
5383a929c220SStefano Zampini     ierr = PetscSortIntWithArray(k,&queue_in_global_numbering[mat_graph->cptr[i]],&mat_graph->queue[mat_graph->cptr[i]]);CHKERRQ(ierr);
5384a929c220SStefano Zampini   }
5385a929c220SStefano Zampini 
53860c7d97c5SJed Brown   PetscInt  nfc         = 0;
53870c7d97c5SJed Brown   PetscInt  nec         = 0;
53880c7d97c5SJed Brown   PetscInt  nvc         = 0;
53893b03a366Sstefano_zampini   PetscBool twodim_flag = PETSC_FALSE;
53900c7d97c5SJed Brown   for (i=0; i<mat_graph->ncmps; i++) {
53913b03a366Sstefano_zampini     if (mat_graph->cptr[i+1]-mat_graph->cptr[i] > vertex_size) {
53922fa5cd67SKarl Rupp       if (mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]==1) nfc++; /* 1 neigh Neumann fake included */
53932fa5cd67SKarl Rupp       else nec++; /* note that nec will be zero in 2d */
53940c7d97c5SJed Brown     } else {
53953b03a366Sstefano_zampini       nvc+=mat_graph->cptr[i+1]-mat_graph->cptr[i];
53963b03a366Sstefano_zampini     }
53973b03a366Sstefano_zampini   }
53983b03a366Sstefano_zampini   if (!nec) { /* we are in a 2d case -> no faces, only edges */
53993b03a366Sstefano_zampini     nec         = nfc;
54003b03a366Sstefano_zampini     nfc         = 0;
54013b03a366Sstefano_zampini     twodim_flag = PETSC_TRUE;
54023b03a366Sstefano_zampini   }
54033972b0daSStefano Zampini   /* allocate IS arrays for faces, edges. Vertices need a single index set. */
54043972b0daSStefano Zampini   k=0;
54053972b0daSStefano Zampini   for (i=0; i<mat_graph->ncmps; i++) {
54063972b0daSStefano Zampini     j=mat_graph->cptr[i+1]-mat_graph->cptr[i];
54072fa5cd67SKarl Rupp     if (j > k) k=j;
54082fa5cd67SKarl Rupp 
54092fa5cd67SKarl Rupp     if (j<=vertex_size) k+=vertex_size;
54103972b0daSStefano Zampini   }
54113972b0daSStefano Zampini   ierr = PetscMalloc(k*sizeof(PetscInt),&auxis);CHKERRQ(ierr);
54123b03a366Sstefano_zampini   if (!pcbddc->vertices_flag && !pcbddc->edges_flag) {
54133b03a366Sstefano_zampini     ierr      = PetscMalloc(nfc*sizeof(IS),&pcbddc->ISForFaces);CHKERRQ(ierr);
54143b03a366Sstefano_zampini     use_faces = PETSC_TRUE;
54153b03a366Sstefano_zampini   }
54163b03a366Sstefano_zampini   if (!pcbddc->vertices_flag && !pcbddc->faces_flag) {
54173b03a366Sstefano_zampini     ierr      = PetscMalloc(nec*sizeof(IS),&pcbddc->ISForEdges);CHKERRQ(ierr);
54183b03a366Sstefano_zampini     use_edges = PETSC_TRUE;
54193b03a366Sstefano_zampini   }
54203b03a366Sstefano_zampini   nfc=0;
54213b03a366Sstefano_zampini   nec=0;
54223b03a366Sstefano_zampini   for (i=0; i<mat_graph->ncmps; i++) {
54233b03a366Sstefano_zampini     if (mat_graph->cptr[i+1]-mat_graph->cptr[i] > vertex_size) {
54243b03a366Sstefano_zampini       for (j=0; j<mat_graph->cptr[i+1]-mat_graph->cptr[i]; j++) {
54253972b0daSStefano Zampini         auxis[j]=mat_graph->queue[mat_graph->cptr[i]+j];
54263b03a366Sstefano_zampini       }
54273b03a366Sstefano_zampini       if (mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]==1) {
54283b03a366Sstefano_zampini         if (twodim_flag) {
54293b03a366Sstefano_zampini           if (use_edges) {
54303972b0daSStefano Zampini             ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForEdges[nec]);CHKERRQ(ierr);
54313b03a366Sstefano_zampini             nec++;
54323b03a366Sstefano_zampini           }
54333b03a366Sstefano_zampini         } else {
54343b03a366Sstefano_zampini           if (use_faces) {
54353972b0daSStefano Zampini             ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForFaces[nfc]);CHKERRQ(ierr);
54363b03a366Sstefano_zampini             nfc++;
54373b03a366Sstefano_zampini           }
54383b03a366Sstefano_zampini         }
54393b03a366Sstefano_zampini       } else {
54403b03a366Sstefano_zampini         if (use_edges) {
54413972b0daSStefano Zampini           ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForEdges[nec]);CHKERRQ(ierr);
54420c7d97c5SJed Brown           nec++;
54430c7d97c5SJed Brown         }
54440c7d97c5SJed Brown       }
54450c7d97c5SJed Brown     }
54463b03a366Sstefano_zampini   }
54473b03a366Sstefano_zampini   pcbddc->n_ISForFaces = nfc;
54483b03a366Sstefano_zampini   pcbddc->n_ISForEdges = nec;
54492fa5cd67SKarl Rupp 
54503b03a366Sstefano_zampini   nvc = 0;
54510c7d97c5SJed Brown   if (!pcbddc->constraints_flag) {
54523b03a366Sstefano_zampini     for (i=0; i<mat_graph->ncmps; i++) {
54533b03a366Sstefano_zampini       if (mat_graph->cptr[i+1]-mat_graph->cptr[i] <= vertex_size) {
54543b03a366Sstefano_zampini         for (j = mat_graph->cptr[i]; j<mat_graph->cptr[i+1]; j++) {
54553972b0daSStefano Zampini           auxis[nvc]=mat_graph->queue[j];
54560c7d97c5SJed Brown           nvc++;
54570c7d97c5SJed Brown         }
54580c7d97c5SJed Brown       }
54590c7d97c5SJed Brown     }
54600c7d97c5SJed Brown   }
54612fa5cd67SKarl Rupp 
5462a0ba757dSStefano Zampini   /* sort vertex set (by local ordering) */
54633972b0daSStefano Zampini   ierr = PetscSortInt(nvc,auxis);CHKERRQ(ierr);
54643972b0daSStefano Zampini   ierr = ISCreateGeneral(PETSC_COMM_SELF,nvc,auxis,PETSC_COPY_VALUES,&pcbddc->ISForVertices);CHKERRQ(ierr);
5465e269702eSStefano Zampini   if (pcbddc->dbg_flag) {
5466d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr);
5467d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Details from PCBDDCManageLocalBoundaries for subdomain %04d\n",PetscGlobalRank);CHKERRQ(ierr);
5468d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Matrix graph has %d connected components", mat_graph->ncmps);CHKERRQ(ierr);
54690c7d97c5SJed Brown     for (i=0; i<mat_graph->ncmps; i++) {
54703b03a366Sstefano_zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\nDetails for connected component number %02d: size %04d, count %01d. Nodes follow.\n",
54713b03a366Sstefano_zampini                                                 i,mat_graph->cptr[i+1]-mat_graph->cptr[i],mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]);CHKERRQ(ierr);
5472da1bb401SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"subdomains: ");
5473da1bb401SStefano Zampini       for (j=0; j<mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]; j++) {
54742fa5cd67SKarl Rupp         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d ",mat_graph->neighbours_set[mat_graph->queue[mat_graph->cptr[i]]][j]);CHKERRQ(ierr);
5475da1bb401SStefano Zampini       }
5476da1bb401SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n");
54770c7d97c5SJed Brown       for (j=mat_graph->cptr[i]; j<mat_graph->cptr[i+1]; j++) {
5478a929c220SStefano Zampini         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d (%d), ",mat_graph->queue[j],queue_in_global_numbering[j]);CHKERRQ(ierr);
54790c7d97c5SJed Brown       }
54800c7d97c5SJed Brown     }
5481da1bb401SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n--------------------------------------------------------------\n");CHKERRQ(ierr);
54823b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local vertices\n",PetscGlobalRank,nvc);CHKERRQ(ierr);
54833b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local faces\n",PetscGlobalRank,nfc);CHKERRQ(ierr);
54843b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local edges\n",PetscGlobalRank,nec);CHKERRQ(ierr);
5485d49ef151SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
54860c7d97c5SJed Brown   }
54873972b0daSStefano Zampini   ierr = PetscFree(auxis);CHKERRQ(ierr);
5488a929c220SStefano Zampini   ierr = PetscFree(queue_in_global_numbering);CHKERRQ(ierr);
54890c7d97c5SJed Brown   PetscFunctionReturn(0);
54900c7d97c5SJed Brown }
54910c7d97c5SJed Brown 
54920c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
54930c7d97c5SJed Brown 
54940c7d97c5SJed Brown /* The following code has been adapted from function IsConnectedSubdomain contained
5495da1bb401SStefano Zampini    in source file contig.c of METIS library (version 5.0.1)
5496da1bb401SStefano Zampini    It finds connected components of each partition labeled from 1 to n_dist  */
54970c7d97c5SJed Brown 
54980c7d97c5SJed Brown #undef __FUNCT__
54990c7d97c5SJed Brown #define __FUNCT__ "PCBDDCFindConnectedComponents"
55009c0446d6SStefano Zampini static PetscErrorCode PCBDDCFindConnectedComponents(PCBDDCGraph graph, PetscInt n_dist)
55010c7d97c5SJed Brown {
55020c7d97c5SJed Brown   PetscInt  i, j, k, nvtxs, first, last, nleft, ncmps,pid,cum_queue,n,ncmps_pid;
55030c7d97c5SJed Brown   PetscInt  *xadj, *adjncy, *where, *queue;
55040c7d97c5SJed Brown   PetscInt  *cptr;
55050c7d97c5SJed Brown   PetscBool *touched;
55060c7d97c5SJed Brown 
55070c7d97c5SJed Brown   PetscFunctionBegin;
55080c7d97c5SJed Brown   nvtxs   = graph->nvtxs;
55090c7d97c5SJed Brown   xadj    = graph->xadj;
55100c7d97c5SJed Brown   adjncy  = graph->adjncy;
55110c7d97c5SJed Brown   where   = graph->where;
55120c7d97c5SJed Brown   touched = graph->touched;
55130c7d97c5SJed Brown   queue   = graph->queue;
55140c7d97c5SJed Brown   cptr    = graph->cptr;
55150c7d97c5SJed Brown 
55162fa5cd67SKarl Rupp   for (i=0; i<nvtxs; i++) touched[i] = PETSC_FALSE;
55170c7d97c5SJed Brown 
55180c7d97c5SJed Brown   cum_queue = 0;
55190c7d97c5SJed Brown   ncmps     = 0;
55200c7d97c5SJed Brown 
55210c7d97c5SJed Brown   for (n=0; n<n_dist; n++) {
5522da1bb401SStefano Zampini     pid   = n+1; /* partition labeled by 0 is discarded */
55230c7d97c5SJed Brown     nleft = 0;
55240c7d97c5SJed Brown     for (i=0; i<nvtxs; i++) {
55252fa5cd67SKarl Rupp       if (where[i] == pid) nleft++;
55260c7d97c5SJed Brown     }
55270c7d97c5SJed Brown     for (i=0; i<nvtxs; i++) {
55282fa5cd67SKarl Rupp       if (where[i] == pid) break;
55290c7d97c5SJed Brown     }
55300c7d97c5SJed Brown     touched[i]       = PETSC_TRUE;
55310c7d97c5SJed Brown     queue[cum_queue] = i;
55320c7d97c5SJed Brown     first = 0; last = 1;
55332fa5cd67SKarl Rupp 
55340c7d97c5SJed Brown     cptr[ncmps] = cum_queue;  /* This actually points to queue */
55350c7d97c5SJed Brown     ncmps_pid   = 0;
55362fa5cd67SKarl Rupp 
55370c7d97c5SJed Brown     while (first != nleft) {
55380c7d97c5SJed Brown       if (first == last) { /* Find another starting vertex */
55390c7d97c5SJed Brown         cptr[++ncmps] = first+cum_queue;
55400c7d97c5SJed Brown         ncmps_pid++;
55410c7d97c5SJed Brown         for (i=0; i<nvtxs; i++) {
55422fa5cd67SKarl Rupp           if (where[i] == pid && !touched[i]) break;
55430c7d97c5SJed Brown         }
55440c7d97c5SJed Brown         queue[cum_queue+last] = i;
55450c7d97c5SJed Brown         last++;
55460c7d97c5SJed Brown         touched[i] = PETSC_TRUE;
55470c7d97c5SJed Brown       }
55480c7d97c5SJed Brown       i = queue[cum_queue+first];
55490c7d97c5SJed Brown       first++;
55500c7d97c5SJed Brown       for (j=xadj[i]; j<xadj[i+1]; j++) {
55510c7d97c5SJed Brown         k = adjncy[j];
55520c7d97c5SJed Brown         if (where[k] == pid && !touched[k]) {
55530c7d97c5SJed Brown           queue[cum_queue+last] = k;
55540c7d97c5SJed Brown           last++;
55550c7d97c5SJed Brown           touched[k] = PETSC_TRUE;
55560c7d97c5SJed Brown         }
55570c7d97c5SJed Brown       }
55580c7d97c5SJed Brown     }
55590c7d97c5SJed Brown     cptr[++ncmps] = first+cum_queue;
55600c7d97c5SJed Brown     ncmps_pid++;
55610c7d97c5SJed Brown     cum_queue             = cptr[ncmps];
5562a0ba757dSStefano Zampini     graph->where_ncmps[n] = ncmps_pid;
55630c7d97c5SJed Brown   }
55640c7d97c5SJed Brown   graph->ncmps = ncmps;
55650c7d97c5SJed Brown   PetscFunctionReturn(0);
55660c7d97c5SJed Brown }
5567