/* TODOLIST
   DofSplitting and DM attached to pc?
   Change SetNeumannBoundaries to SetNeumannBoundariesLocal and provide new SetNeumannBoundaries (same for Dirichlet)
     - change prec_type to switch_inexact_prec_type
   Inexact solvers: global preconditioner application is ready, ask developers (Jed?) how to best implement Dohrmann's approach (PCSHELL?)
   change how to deal with the coarse problem (PCBDDCSetCoarseEnvironment):
     - simplify coarse problem structure -> PCBDDC or PCREDUNDANT, nothing else -> same comm for all levels?
     - remove coarse enums and allow use of PCBDDCGetCoarseKSP
     - remove metis dependency -> use MatPartitioning for multilevel -> Assemble serial adjacency in ManageLocalBoundaries?
   code refactoring:
     - pick up better names for static functions
   change options structure:
     - insert BDDC into MG framework?
   provide other ops? Ask developers
   remove all unused printf
   man pages
*/

/* ----------------------------------------------------------------------------------------------------------------------------------------------
   Implementation of BDDC preconditioner based on:
   C.
Dohrmann "An approximate BDDC preconditioner", Numerical Linear Algebra with Applications Volume 14, Issue 2, pages 149-168, March 2007 2253cdbc3dSStefano Zampini ---------------------------------------------------------------------------------------------------------------------------------------------- */ 2353cdbc3dSStefano Zampini 2453cdbc3dSStefano Zampini #include "bddc.h" /*I "petscpc.h" I*/ /* includes for fortran wrappers */ 253b03a366Sstefano_zampini #include <petscblaslapack.h> 260c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 270c7d97c5SJed Brown #undef __FUNCT__ 280c7d97c5SJed Brown #define __FUNCT__ "PCSetFromOptions_BDDC" 290c7d97c5SJed Brown PetscErrorCode PCSetFromOptions_BDDC(PC pc) 300c7d97c5SJed Brown { 310c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 320c7d97c5SJed Brown PetscErrorCode ierr; 330c7d97c5SJed Brown 340c7d97c5SJed Brown PetscFunctionBegin; 350c7d97c5SJed Brown ierr = PetscOptionsHead("BDDC options");CHKERRQ(ierr); 360c7d97c5SJed Brown /* Verbose debugging of main data structures */ 37e269702eSStefano Zampini ierr = PetscOptionsBool("-pc_bddc_check_all" ,"Verbose (debugging) output for PCBDDC" ,"none",pcbddc->dbg_flag ,&pcbddc->dbg_flag ,PETSC_NULL);CHKERRQ(ierr); 380c7d97c5SJed Brown /* Some customization for default primal space */ 39da1bb401SStefano Zampini ierr = PetscOptionsBool("-pc_bddc_vertices_only" ,"Use only vertices in coarse space (i.e. discard constraints)","none",pcbddc->vertices_flag ,&pcbddc->vertices_flag ,PETSC_NULL);CHKERRQ(ierr); 40da1bb401SStefano Zampini ierr = PetscOptionsBool("-pc_bddc_constraints_only","Use only constraints in coarse space (i.e. discard vertices)","none",pcbddc->constraints_flag,&pcbddc->constraints_flag,PETSC_NULL);CHKERRQ(ierr); 41da1bb401SStefano Zampini ierr = PetscOptionsBool("-pc_bddc_faces_only" ,"Use only faces among constraints of coarse space (i.e. 
discard edges)" ,"none",pcbddc->faces_flag ,&pcbddc->faces_flag ,PETSC_NULL);CHKERRQ(ierr); 42da1bb401SStefano Zampini ierr = PetscOptionsBool("-pc_bddc_edges_only" ,"Use only edges among constraints of coarse space (i.e. discard faces)" ,"none",pcbddc->edges_flag ,&pcbddc->edges_flag ,PETSC_NULL);CHKERRQ(ierr); 430c7d97c5SJed Brown /* Coarse solver context */ 446c667b0aSStefano Zampini static const char * const avail_coarse_problems[] = {"sequential","replicated","parallel","multilevel","CoarseProblemType","PC_BDDC_",0}; /*order of choiches depends on ENUM defined in bddc.h */ 450c7d97c5SJed Brown ierr = PetscOptionsEnum("-pc_bddc_coarse_problem_type","Set coarse problem type","none",avail_coarse_problems,(PetscEnum)pcbddc->coarse_problem_type,(PetscEnum*)&pcbddc->coarse_problem_type,PETSC_NULL);CHKERRQ(ierr); 460c7d97c5SJed Brown /* Two different application of BDDC to the whole set of dofs, internal and interface */ 470c7d97c5SJed Brown ierr = PetscOptionsBool("-pc_bddc_switch_preconditioning_type","Switch between M_2 (default) and M_3 preconditioners (as defined by Dohrmann)","none",pcbddc->prec_type,&pcbddc->prec_type,PETSC_NULL);CHKERRQ(ierr); 48534831adSStefano Zampini ierr = PetscOptionsBool("-pc_bddc_use_change_of_basis","Use change of basis approach for primal space","none",pcbddc->usechangeofbasis,&pcbddc->usechangeofbasis,PETSC_NULL);CHKERRQ(ierr); 49534831adSStefano Zampini ierr = PetscOptionsBool("-pc_bddc_use_change_on_faces","Use change of basis approach for face constraints","none",pcbddc->usechangeonfaces,&pcbddc->usechangeonfaces,PETSC_NULL);CHKERRQ(ierr); 50534831adSStefano Zampini pcbddc->usechangeonfaces = pcbddc->usechangeonfaces && pcbddc->usechangeofbasis; 510c7d97c5SJed Brown ierr = PetscOptionsInt("-pc_bddc_coarsening_ratio","Set coarsening ratio used in multilevel coarsening","none",pcbddc->coarsening_ratio,&pcbddc->coarsening_ratio,PETSC_NULL);CHKERRQ(ierr); 524fad6a16SStefano Zampini ierr = PetscOptionsInt("-pc_bddc_max_levels","Set 
maximum number of levels for multilevel","none",pcbddc->max_levels,&pcbddc->max_levels,PETSC_NULL);CHKERRQ(ierr); 530c7d97c5SJed Brown ierr = PetscOptionsTail();CHKERRQ(ierr); 540c7d97c5SJed Brown PetscFunctionReturn(0); 550c7d97c5SJed Brown } 560c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 570c7d97c5SJed Brown EXTERN_C_BEGIN 580c7d97c5SJed Brown #undef __FUNCT__ 590c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetCoarseProblemType_BDDC" 6053cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetCoarseProblemType_BDDC(PC pc, CoarseProblemType CPT) 610c7d97c5SJed Brown { 620c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 630c7d97c5SJed Brown 640c7d97c5SJed Brown PetscFunctionBegin; 650c7d97c5SJed Brown pcbddc->coarse_problem_type = CPT; 660c7d97c5SJed Brown PetscFunctionReturn(0); 670c7d97c5SJed Brown } 680c7d97c5SJed Brown EXTERN_C_END 690c7d97c5SJed Brown #undef __FUNCT__ 700c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetCoarseProblemType" 7153cdbc3dSStefano Zampini /*@ 729c0446d6SStefano Zampini PCBDDCSetCoarseProblemType - Set coarse problem type in PCBDDC. 7353cdbc3dSStefano Zampini 749c0446d6SStefano Zampini Not collective 7553cdbc3dSStefano Zampini 7653cdbc3dSStefano Zampini Input Parameters: 7753cdbc3dSStefano Zampini + pc - the preconditioning context 7853cdbc3dSStefano Zampini - CoarseProblemType - pick a better name and explain what this is 7953cdbc3dSStefano Zampini 8053cdbc3dSStefano Zampini Level: intermediate 8153cdbc3dSStefano Zampini 8253cdbc3dSStefano Zampini Notes: 83da1bb401SStefano Zampini Not collective but all procs must call with same arguments. 
8453cdbc3dSStefano Zampini 8553cdbc3dSStefano Zampini .seealso: PCBDDC 8653cdbc3dSStefano Zampini @*/ 870c7d97c5SJed Brown PetscErrorCode PCBDDCSetCoarseProblemType(PC pc, CoarseProblemType CPT) 880c7d97c5SJed Brown { 890c7d97c5SJed Brown PetscErrorCode ierr; 900c7d97c5SJed Brown 910c7d97c5SJed Brown PetscFunctionBegin; 920c7d97c5SJed Brown PetscValidHeaderSpecific(pc,PC_CLASSID,1); 930c7d97c5SJed Brown ierr = PetscTryMethod(pc,"PCBDDCSetCoarseProblemType_C",(PC,CoarseProblemType),(pc,CPT));CHKERRQ(ierr); 940c7d97c5SJed Brown PetscFunctionReturn(0); 950c7d97c5SJed Brown } 960c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 970c7d97c5SJed Brown EXTERN_C_BEGIN 980c7d97c5SJed Brown #undef __FUNCT__ 994fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetCoarseningRatio_BDDC" 1004fad6a16SStefano Zampini static PetscErrorCode PCBDDCSetCoarseningRatio_BDDC(PC pc,PetscInt k) 1014fad6a16SStefano Zampini { 1024fad6a16SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 1034fad6a16SStefano Zampini 1044fad6a16SStefano Zampini PetscFunctionBegin; 1054fad6a16SStefano Zampini pcbddc->coarsening_ratio=k; 1064fad6a16SStefano Zampini PetscFunctionReturn(0); 1074fad6a16SStefano Zampini } 1084fad6a16SStefano Zampini EXTERN_C_END 1094fad6a16SStefano Zampini #undef __FUNCT__ 1104fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetCoarseningRatio" 1114fad6a16SStefano Zampini /*@ 1124fad6a16SStefano Zampini PCBDDCSetCoarseningRatio - Set coarsening ratio used in multilevel coarsening 1134fad6a16SStefano Zampini 1144fad6a16SStefano Zampini Logically collective on PC 1154fad6a16SStefano Zampini 1164fad6a16SStefano Zampini Input Parameters: 1174fad6a16SStefano Zampini + pc - the preconditioning context 1184fad6a16SStefano Zampini - k - coarsening ratio 1194fad6a16SStefano Zampini 1204fad6a16SStefano Zampini Approximatively k subdomains at the finer level will be aggregated into a single subdomain at the coarser level. 
1214fad6a16SStefano Zampini 1224fad6a16SStefano Zampini Level: intermediate 1234fad6a16SStefano Zampini 1244fad6a16SStefano Zampini Notes: 1254fad6a16SStefano Zampini 1264fad6a16SStefano Zampini .seealso: PCBDDC 1274fad6a16SStefano Zampini @*/ 1284fad6a16SStefano Zampini PetscErrorCode PCBDDCSetCoarseningRatio(PC pc,PetscInt k) 1294fad6a16SStefano Zampini { 1304fad6a16SStefano Zampini PetscErrorCode ierr; 1314fad6a16SStefano Zampini 1324fad6a16SStefano Zampini PetscFunctionBegin; 1334fad6a16SStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 1344fad6a16SStefano Zampini ierr = PetscTryMethod(pc,"PCBDDCSetCoarseningRatio_C",(PC,PetscInt),(pc,k));CHKERRQ(ierr); 1354fad6a16SStefano Zampini PetscFunctionReturn(0); 1364fad6a16SStefano Zampini } 1374fad6a16SStefano Zampini /* -------------------------------------------------------------------------- */ 1384fad6a16SStefano Zampini EXTERN_C_BEGIN 1394fad6a16SStefano Zampini #undef __FUNCT__ 1404fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetMaxLevels_BDDC" 1414fad6a16SStefano Zampini static PetscErrorCode PCBDDCSetMaxLevels_BDDC(PC pc,PetscInt max_levels) 1424fad6a16SStefano Zampini { 1434fad6a16SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 1444fad6a16SStefano Zampini 1454fad6a16SStefano Zampini PetscFunctionBegin; 1464fad6a16SStefano Zampini pcbddc->max_levels=max_levels; 1474fad6a16SStefano Zampini PetscFunctionReturn(0); 1484fad6a16SStefano Zampini } 1494fad6a16SStefano Zampini EXTERN_C_END 1504fad6a16SStefano Zampini #undef __FUNCT__ 1514fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetMaxLevels" 1524fad6a16SStefano Zampini /*@ 1534fad6a16SStefano Zampini PCBDDCSetMaxLevels - Sets the maximum number of levels within the multilevel approach. 
1544fad6a16SStefano Zampini 1554fad6a16SStefano Zampini Logically collective on PC 1564fad6a16SStefano Zampini 1574fad6a16SStefano Zampini Input Parameters: 1584fad6a16SStefano Zampini + pc - the preconditioning context 1594fad6a16SStefano Zampini - max_levels - the maximum number of levels 1604fad6a16SStefano Zampini 1614fad6a16SStefano Zampini Default value is 1, i.e. coarse problem will be solved inexactly with one application 1624fad6a16SStefano Zampini of PCBDDC preconditioner if the multilevel approach is requested. 1634fad6a16SStefano Zampini 1644fad6a16SStefano Zampini Level: intermediate 1654fad6a16SStefano Zampini 1664fad6a16SStefano Zampini Notes: 1674fad6a16SStefano Zampini 1684fad6a16SStefano Zampini .seealso: PCBDDC 1694fad6a16SStefano Zampini @*/ 1704fad6a16SStefano Zampini PetscErrorCode PCBDDCSetMaxLevels(PC pc,PetscInt max_levels) 1714fad6a16SStefano Zampini { 1724fad6a16SStefano Zampini PetscErrorCode ierr; 1734fad6a16SStefano Zampini 1744fad6a16SStefano Zampini PetscFunctionBegin; 1754fad6a16SStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 1764fad6a16SStefano Zampini ierr = PetscTryMethod(pc,"PCBDDCSetMaxLevels_C",(PC,PetscInt),(pc,max_levels));CHKERRQ(ierr); 1774fad6a16SStefano Zampini PetscFunctionReturn(0); 1784fad6a16SStefano Zampini } 1794fad6a16SStefano Zampini /* -------------------------------------------------------------------------- */ 1804fad6a16SStefano Zampini EXTERN_C_BEGIN 1814fad6a16SStefano Zampini #undef __FUNCT__ 1820bdf917eSStefano Zampini #define __FUNCT__ "PCBDDCSetNullSpace_BDDC" 1830bdf917eSStefano Zampini static PetscErrorCode PCBDDCSetNullSpace_BDDC(PC pc,MatNullSpace NullSpace) 1840bdf917eSStefano Zampini { 1850bdf917eSStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 1860bdf917eSStefano Zampini PetscErrorCode ierr; 1870bdf917eSStefano Zampini 1880bdf917eSStefano Zampini PetscFunctionBegin; 1890bdf917eSStefano Zampini ierr = PetscObjectReference((PetscObject)NullSpace);CHKERRQ(ierr); 1900bdf917eSStefano 
Zampini ierr = MatNullSpaceDestroy(&pcbddc->NullSpace);CHKERRQ(ierr); 1910bdf917eSStefano Zampini pcbddc->NullSpace=NullSpace; 1920bdf917eSStefano Zampini PetscFunctionReturn(0); 1930bdf917eSStefano Zampini } 1940bdf917eSStefano Zampini EXTERN_C_END 1950bdf917eSStefano Zampini #undef __FUNCT__ 1960bdf917eSStefano Zampini #define __FUNCT__ "PCBDDCSetNullSpace" 1970bdf917eSStefano Zampini /*@ 1980bdf917eSStefano Zampini PCBDDCSetNullSpace - Set NullSpace of global operator of BDDC preconditioned mat. 1990bdf917eSStefano Zampini 2000bdf917eSStefano Zampini Logically collective on PC and MatNullSpace 2010bdf917eSStefano Zampini 2020bdf917eSStefano Zampini Input Parameters: 2030bdf917eSStefano Zampini + pc - the preconditioning context 2040bdf917eSStefano Zampini - NullSpace - Null space of the linear operator to be preconditioned. 2050bdf917eSStefano Zampini 2060bdf917eSStefano Zampini Level: intermediate 2070bdf917eSStefano Zampini 2080bdf917eSStefano Zampini Notes: 2090bdf917eSStefano Zampini 2100bdf917eSStefano Zampini .seealso: PCBDDC 2110bdf917eSStefano Zampini @*/ 2120bdf917eSStefano Zampini PetscErrorCode PCBDDCSetNullSpace(PC pc,MatNullSpace NullSpace) 2130bdf917eSStefano Zampini { 2140bdf917eSStefano Zampini PetscErrorCode ierr; 2150bdf917eSStefano Zampini 2160bdf917eSStefano Zampini PetscFunctionBegin; 2170bdf917eSStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 2180bdf917eSStefano Zampini ierr = PetscTryMethod(pc,"PCBDDCSetNullSpace_C",(PC,MatNullSpace),(pc,NullSpace));CHKERRQ(ierr); 2190bdf917eSStefano Zampini PetscFunctionReturn(0); 2200bdf917eSStefano Zampini } 2210bdf917eSStefano Zampini /* -------------------------------------------------------------------------- */ 2220bdf917eSStefano Zampini EXTERN_C_BEGIN 2230bdf917eSStefano Zampini #undef __FUNCT__ 2243b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCSetDirichletBoundaries_BDDC" 2253b03a366Sstefano_zampini static PetscErrorCode PCBDDCSetDirichletBoundaries_BDDC(PC pc,IS 
DirichletBoundaries) 2263b03a366Sstefano_zampini { 2273b03a366Sstefano_zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 2283b03a366Sstefano_zampini PetscErrorCode ierr; 2293b03a366Sstefano_zampini 2303b03a366Sstefano_zampini PetscFunctionBegin; 2313b03a366Sstefano_zampini ierr = ISDestroy(&pcbddc->DirichletBoundaries);CHKERRQ(ierr); 23236e030ebSStefano Zampini ierr = PetscObjectReference((PetscObject)DirichletBoundaries);CHKERRQ(ierr); 23336e030ebSStefano Zampini pcbddc->DirichletBoundaries=DirichletBoundaries; 2343b03a366Sstefano_zampini PetscFunctionReturn(0); 2353b03a366Sstefano_zampini } 2363b03a366Sstefano_zampini EXTERN_C_END 2373b03a366Sstefano_zampini #undef __FUNCT__ 2383b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCSetDirichletBoundaries" 2393b03a366Sstefano_zampini /*@ 240da1bb401SStefano Zampini PCBDDCSetDirichletBoundaries - Set index set defining subdomain part (in local ordering) 241da1bb401SStefano Zampini of Dirichlet boundaries for the global problem. 2423b03a366Sstefano_zampini 2433b03a366Sstefano_zampini Not collective 2443b03a366Sstefano_zampini 2453b03a366Sstefano_zampini Input Parameters: 2463b03a366Sstefano_zampini + pc - the preconditioning context 2473b03a366Sstefano_zampini - DirichletBoundaries - sequential index set defining the subdomain part of Dirichlet boundaries (can be PETSC_NULL) 2483b03a366Sstefano_zampini 2493b03a366Sstefano_zampini Level: intermediate 2503b03a366Sstefano_zampini 2513b03a366Sstefano_zampini Notes: 2523b03a366Sstefano_zampini 2533b03a366Sstefano_zampini .seealso: PCBDDC 2543b03a366Sstefano_zampini @*/ 2553b03a366Sstefano_zampini PetscErrorCode PCBDDCSetDirichletBoundaries(PC pc,IS DirichletBoundaries) 2563b03a366Sstefano_zampini { 2573b03a366Sstefano_zampini PetscErrorCode ierr; 2583b03a366Sstefano_zampini 2593b03a366Sstefano_zampini PetscFunctionBegin; 2603b03a366Sstefano_zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 2613b03a366Sstefano_zampini ierr = 
PetscTryMethod(pc,"PCBDDCSetDirichletBoundaries_C",(PC,IS),(pc,DirichletBoundaries));CHKERRQ(ierr); 2623b03a366Sstefano_zampini PetscFunctionReturn(0); 2633b03a366Sstefano_zampini } 2643b03a366Sstefano_zampini /* -------------------------------------------------------------------------- */ 2653b03a366Sstefano_zampini EXTERN_C_BEGIN 2663b03a366Sstefano_zampini #undef __FUNCT__ 2670c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetNeumannBoundaries_BDDC" 26853cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetNeumannBoundaries_BDDC(PC pc,IS NeumannBoundaries) 2690c7d97c5SJed Brown { 2700c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 27153cdbc3dSStefano Zampini PetscErrorCode ierr; 2720c7d97c5SJed Brown 2730c7d97c5SJed Brown PetscFunctionBegin; 27453cdbc3dSStefano Zampini ierr = ISDestroy(&pcbddc->NeumannBoundaries);CHKERRQ(ierr); 27536e030ebSStefano Zampini ierr = PetscObjectReference((PetscObject)NeumannBoundaries);CHKERRQ(ierr); 27636e030ebSStefano Zampini pcbddc->NeumannBoundaries=NeumannBoundaries; 2770c7d97c5SJed Brown PetscFunctionReturn(0); 2780c7d97c5SJed Brown } 2790c7d97c5SJed Brown EXTERN_C_END 2800c7d97c5SJed Brown #undef __FUNCT__ 2810c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetNeumannBoundaries" 28257527edcSJed Brown /*@ 283da1bb401SStefano Zampini PCBDDCSetNeumannBoundaries - Set index set defining subdomain part (in local ordering) 284da1bb401SStefano Zampini of Neumann boundaries for the global problem. 
28557527edcSJed Brown 2869c0446d6SStefano Zampini Not collective 28757527edcSJed Brown 28857527edcSJed Brown Input Parameters: 28957527edcSJed Brown + pc - the preconditioning context 2909c0446d6SStefano Zampini - NeumannBoundaries - sequential index set defining the subdomain part of Neumann boundaries (can be PETSC_NULL) 29157527edcSJed Brown 29257527edcSJed Brown Level: intermediate 29357527edcSJed Brown 29457527edcSJed Brown Notes: 29557527edcSJed Brown 29657527edcSJed Brown .seealso: PCBDDC 29757527edcSJed Brown @*/ 29853cdbc3dSStefano Zampini PetscErrorCode PCBDDCSetNeumannBoundaries(PC pc,IS NeumannBoundaries) 2990c7d97c5SJed Brown { 3000c7d97c5SJed Brown PetscErrorCode ierr; 3010c7d97c5SJed Brown 3020c7d97c5SJed Brown PetscFunctionBegin; 3030c7d97c5SJed Brown PetscValidHeaderSpecific(pc,PC_CLASSID,1); 30453cdbc3dSStefano Zampini ierr = PetscTryMethod(pc,"PCBDDCSetNeumannBoundaries_C",(PC,IS),(pc,NeumannBoundaries));CHKERRQ(ierr); 30553cdbc3dSStefano Zampini PetscFunctionReturn(0); 30653cdbc3dSStefano Zampini } 30753cdbc3dSStefano Zampini /* -------------------------------------------------------------------------- */ 30853cdbc3dSStefano Zampini EXTERN_C_BEGIN 30953cdbc3dSStefano Zampini #undef __FUNCT__ 310da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCGetDirichletBoundaries_BDDC" 311da1bb401SStefano Zampini static PetscErrorCode PCBDDCGetDirichletBoundaries_BDDC(PC pc,IS *DirichletBoundaries) 312da1bb401SStefano Zampini { 313da1bb401SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 314da1bb401SStefano Zampini 315da1bb401SStefano Zampini PetscFunctionBegin; 316da1bb401SStefano Zampini *DirichletBoundaries = pcbddc->DirichletBoundaries; 317da1bb401SStefano Zampini PetscFunctionReturn(0); 318da1bb401SStefano Zampini } 319da1bb401SStefano Zampini EXTERN_C_END 320da1bb401SStefano Zampini #undef __FUNCT__ 321da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCGetDirichletBoundaries" 322da1bb401SStefano Zampini /*@ 323da1bb401SStefano Zampini 
PCBDDCGetDirichletBoundaries - Get index set defining subdomain part (in local ordering) 324da1bb401SStefano Zampini of Dirichlet boundaries for the global problem. 325da1bb401SStefano Zampini 326da1bb401SStefano Zampini Not collective 327da1bb401SStefano Zampini 328da1bb401SStefano Zampini Input Parameters: 329da1bb401SStefano Zampini + pc - the preconditioning context 330da1bb401SStefano Zampini 331da1bb401SStefano Zampini Output Parameters: 332da1bb401SStefano Zampini + DirichletBoundaries - index set defining the subdomain part of Dirichlet boundaries 333da1bb401SStefano Zampini 334da1bb401SStefano Zampini Level: intermediate 335da1bb401SStefano Zampini 336da1bb401SStefano Zampini Notes: 337da1bb401SStefano Zampini 338da1bb401SStefano Zampini .seealso: PCBDDC 339da1bb401SStefano Zampini @*/ 340da1bb401SStefano Zampini PetscErrorCode PCBDDCGetDirichletBoundaries(PC pc,IS *DirichletBoundaries) 341da1bb401SStefano Zampini { 342da1bb401SStefano Zampini PetscErrorCode ierr; 343da1bb401SStefano Zampini 344da1bb401SStefano Zampini PetscFunctionBegin; 345da1bb401SStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 346da1bb401SStefano Zampini ierr = PetscUseMethod(pc,"PCBDDCGetDirichletBoundaries_C",(PC,IS*),(pc,DirichletBoundaries));CHKERRQ(ierr); 347da1bb401SStefano Zampini PetscFunctionReturn(0); 348da1bb401SStefano Zampini } 349da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */ 350da1bb401SStefano Zampini EXTERN_C_BEGIN 351da1bb401SStefano Zampini #undef __FUNCT__ 35253cdbc3dSStefano Zampini #define __FUNCT__ "PCBDDCGetNeumannBoundaries_BDDC" 35353cdbc3dSStefano Zampini static PetscErrorCode PCBDDCGetNeumannBoundaries_BDDC(PC pc,IS *NeumannBoundaries) 35453cdbc3dSStefano Zampini { 35553cdbc3dSStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 35653cdbc3dSStefano Zampini 35753cdbc3dSStefano Zampini PetscFunctionBegin; 35853cdbc3dSStefano Zampini *NeumannBoundaries = pcbddc->NeumannBoundaries; 
35953cdbc3dSStefano Zampini PetscFunctionReturn(0); 36053cdbc3dSStefano Zampini } 36153cdbc3dSStefano Zampini EXTERN_C_END 36253cdbc3dSStefano Zampini #undef __FUNCT__ 36353cdbc3dSStefano Zampini #define __FUNCT__ "PCBDDCGetNeumannBoundaries" 36453cdbc3dSStefano Zampini /*@ 365da1bb401SStefano Zampini PCBDDCGetNeumannBoundaries - Get index set defining subdomain part (in local ordering) 366da1bb401SStefano Zampini of Neumann boundaries for the global problem. 36753cdbc3dSStefano Zampini 3689c0446d6SStefano Zampini Not collective 36953cdbc3dSStefano Zampini 37053cdbc3dSStefano Zampini Input Parameters: 37153cdbc3dSStefano Zampini + pc - the preconditioning context 37253cdbc3dSStefano Zampini 37353cdbc3dSStefano Zampini Output Parameters: 37453cdbc3dSStefano Zampini + NeumannBoundaries - index set defining the subdomain part of Neumann boundaries 37553cdbc3dSStefano Zampini 37653cdbc3dSStefano Zampini Level: intermediate 37753cdbc3dSStefano Zampini 37853cdbc3dSStefano Zampini Notes: 37953cdbc3dSStefano Zampini 38053cdbc3dSStefano Zampini .seealso: PCBDDC 38153cdbc3dSStefano Zampini @*/ 38253cdbc3dSStefano Zampini PetscErrorCode PCBDDCGetNeumannBoundaries(PC pc,IS *NeumannBoundaries) 38353cdbc3dSStefano Zampini { 38453cdbc3dSStefano Zampini PetscErrorCode ierr; 38553cdbc3dSStefano Zampini 38653cdbc3dSStefano Zampini PetscFunctionBegin; 38753cdbc3dSStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 38853cdbc3dSStefano Zampini ierr = PetscUseMethod(pc,"PCBDDCGetNeumannBoundaries_C",(PC,IS*),(pc,NeumannBoundaries));CHKERRQ(ierr); 3890c7d97c5SJed Brown PetscFunctionReturn(0); 3900c7d97c5SJed Brown } 39136e030ebSStefano Zampini /* -------------------------------------------------------------------------- */ 39236e030ebSStefano Zampini EXTERN_C_BEGIN 39336e030ebSStefano Zampini #undef __FUNCT__ 394da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetLocalAdjacencyGraph_BDDC" 395da1bb401SStefano Zampini static PetscErrorCode PCBDDCSetLocalAdjacencyGraph_BDDC(PC pc, 
PetscInt nvtxs, PetscInt xadj[], PetscInt adjncy[], PetscCopyMode copymode) 39636e030ebSStefano Zampini { 39736e030ebSStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 398da1bb401SStefano Zampini PCBDDCGraph mat_graph=pcbddc->mat_graph; 399da1bb401SStefano Zampini PetscErrorCode ierr; 40036e030ebSStefano Zampini 40136e030ebSStefano Zampini PetscFunctionBegin; 402da1bb401SStefano Zampini mat_graph->nvtxs=nvtxs; 403da1bb401SStefano Zampini ierr = PetscFree(mat_graph->xadj);CHKERRQ(ierr); 404da1bb401SStefano Zampini ierr = PetscFree(mat_graph->adjncy);CHKERRQ(ierr); 405da1bb401SStefano Zampini if (copymode == PETSC_COPY_VALUES) { 406da1bb401SStefano Zampini ierr = PetscMalloc((mat_graph->nvtxs+1)*sizeof(PetscInt),&mat_graph->xadj);CHKERRQ(ierr); 407da1bb401SStefano Zampini ierr = PetscMalloc(xadj[mat_graph->nvtxs]*sizeof(PetscInt),&mat_graph->adjncy);CHKERRQ(ierr); 408da1bb401SStefano Zampini ierr = PetscMemcpy(mat_graph->xadj,xadj,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr); 409da1bb401SStefano Zampini ierr = PetscMemcpy(mat_graph->adjncy,adjncy,xadj[mat_graph->nvtxs]*sizeof(PetscInt));CHKERRQ(ierr); 410da1bb401SStefano Zampini } else if (copymode == PETSC_OWN_POINTER) { 411da1bb401SStefano Zampini mat_graph->xadj=xadj; 412da1bb401SStefano Zampini mat_graph->adjncy=adjncy; 413da1bb401SStefano Zampini } else { 414da1bb401SStefano Zampini SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_SUP,"Unsupported copy mode %d in %s\n",copymode,__FUNCT__); 415da1bb401SStefano Zampini } 41636e030ebSStefano Zampini PetscFunctionReturn(0); 41736e030ebSStefano Zampini } 41836e030ebSStefano Zampini EXTERN_C_END 41936e030ebSStefano Zampini #undef __FUNCT__ 420da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetLocalAdjacencyGraph" 42136e030ebSStefano Zampini /*@ 422da1bb401SStefano Zampini PCBDDCSetLocalAdjacencyGraph - Set CSR graph of local matrix for use of PCBDDC. 
42336e030ebSStefano Zampini 42436e030ebSStefano Zampini Not collective 42536e030ebSStefano Zampini 42636e030ebSStefano Zampini Input Parameters: 42736e030ebSStefano Zampini + pc - the preconditioning context 428da1bb401SStefano Zampini - nvtxs - number of local vertices of the graph 429da1bb401SStefano Zampini - xadj, adjncy - the CSR graph 430da1bb401SStefano Zampini - copymode - either PETSC_COPY_VALUES or PETSC_OWN_POINTER. In the former case the user must free the array passed in; 431da1bb401SStefano Zampini in the latter case, memory must be obtained with PetscMalloc. 43236e030ebSStefano Zampini 43336e030ebSStefano Zampini Level: intermediate 43436e030ebSStefano Zampini 43536e030ebSStefano Zampini Notes: 43636e030ebSStefano Zampini 43736e030ebSStefano Zampini .seealso: PCBDDC 43836e030ebSStefano Zampini @*/ 439da1bb401SStefano Zampini PetscErrorCode PCBDDCSetLocalAdjacencyGraph(PC pc,PetscInt nvtxs,PetscInt xadj[],PetscInt adjncy[], PetscCopyMode copymode) 44036e030ebSStefano Zampini { 441da1bb401SStefano Zampini PetscInt nrows,ncols; 442da1bb401SStefano Zampini Mat_IS *matis = (Mat_IS*)pc->pmat->data; 44336e030ebSStefano Zampini PetscErrorCode ierr; 44436e030ebSStefano Zampini 44536e030ebSStefano Zampini PetscFunctionBegin; 44636e030ebSStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 447da1bb401SStefano Zampini ierr = MatGetSize(matis->A,&nrows,&ncols);CHKERRQ(ierr); 448da1bb401SStefano Zampini if (nvtxs != nrows) { 449da1bb401SStefano Zampini SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Local adjacency size %d passed in %s differs from local problem size %d!\n",nvtxs,__FUNCT__,nrows); 450da1bb401SStefano Zampini } else { 451da1bb401SStefano Zampini ierr = PetscTryMethod(pc,"PCBDDCSetLocalAdjacencyGraph_C",(PC,PetscInt,PetscInt[],PetscInt[],PetscCopyMode),(pc,nvtxs,xadj,adjncy,copymode));CHKERRQ(ierr); 452da1bb401SStefano Zampini } 45336e030ebSStefano Zampini PetscFunctionReturn(0); 45436e030ebSStefano Zampini } 4559c0446d6SStefano Zampini /* 
-------------------------------------------------------------------------- */ 4569c0446d6SStefano Zampini EXTERN_C_BEGIN 4579c0446d6SStefano Zampini #undef __FUNCT__ 4589c0446d6SStefano Zampini #define __FUNCT__ "PCBDDCSetDofsSplitting_BDDC" 4599c0446d6SStefano Zampini static PetscErrorCode PCBDDCSetDofsSplitting_BDDC(PC pc,PetscInt n_is, IS ISForDofs[]) 4609c0446d6SStefano Zampini { 4619c0446d6SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 4629c0446d6SStefano Zampini PetscInt i; 4639c0446d6SStefano Zampini PetscErrorCode ierr; 4649c0446d6SStefano Zampini 4659c0446d6SStefano Zampini PetscFunctionBegin; 466da1bb401SStefano Zampini /* Destroy ISes if they were already set */ 4679c0446d6SStefano Zampini for (i=0;i<pcbddc->n_ISForDofs;i++) { 4689c0446d6SStefano Zampini ierr = ISDestroy(&pcbddc->ISForDofs[i]);CHKERRQ(ierr); 4699c0446d6SStefano Zampini } 470d11ae9bbSstefano_zampini ierr = PetscFree(pcbddc->ISForDofs);CHKERRQ(ierr); 471da1bb401SStefano Zampini /* allocate space then set */ 4729c0446d6SStefano Zampini ierr = PetscMalloc(n_is*sizeof(IS),&pcbddc->ISForDofs);CHKERRQ(ierr); 4739c0446d6SStefano Zampini for (i=0;i<n_is;i++) { 474da1bb401SStefano Zampini ierr = PetscObjectReference((PetscObject)ISForDofs[i]);CHKERRQ(ierr); 475da1bb401SStefano Zampini pcbddc->ISForDofs[i]=ISForDofs[i]; 4769c0446d6SStefano Zampini } 4779c0446d6SStefano Zampini pcbddc->n_ISForDofs=n_is; 4789c0446d6SStefano Zampini PetscFunctionReturn(0); 4799c0446d6SStefano Zampini } 4809c0446d6SStefano Zampini EXTERN_C_END 4819c0446d6SStefano Zampini #undef __FUNCT__ 4829c0446d6SStefano Zampini #define __FUNCT__ "PCBDDCSetDofsSplitting" 4839c0446d6SStefano Zampini /*@ 484da1bb401SStefano Zampini PCBDDCSetDofsSplitting - Set index sets defining fields of local mat. 
4859c0446d6SStefano Zampini 4869c0446d6SStefano Zampini Not collective 4879c0446d6SStefano Zampini 4889c0446d6SStefano Zampini Input Parameters: 4899c0446d6SStefano Zampini + pc - the preconditioning context 490da1bb401SStefano Zampini - n - number of index sets defining the fields 491da1bb401SStefano Zampini - IS[] - array of IS describing the fields 4929c0446d6SStefano Zampini 4939c0446d6SStefano Zampini Level: intermediate 4949c0446d6SStefano Zampini 4959c0446d6SStefano Zampini Notes: 4969c0446d6SStefano Zampini 4979c0446d6SStefano Zampini .seealso: PCBDDC 4989c0446d6SStefano Zampini @*/ 4999c0446d6SStefano Zampini PetscErrorCode PCBDDCSetDofsSplitting(PC pc,PetscInt n_is, IS ISForDofs[]) 5009c0446d6SStefano Zampini { 5019c0446d6SStefano Zampini PetscErrorCode ierr; 5029c0446d6SStefano Zampini 5039c0446d6SStefano Zampini PetscFunctionBegin; 5049c0446d6SStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 5059c0446d6SStefano Zampini ierr = PetscTryMethod(pc,"PCBDDCSetDofsSplitting_C",(PC,PetscInt,IS[]),(pc,n_is,ISForDofs));CHKERRQ(ierr); 5069c0446d6SStefano Zampini PetscFunctionReturn(0); 5079c0446d6SStefano Zampini } 508da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */ 509534831adSStefano Zampini #undef __FUNCT__ 510534831adSStefano Zampini #define __FUNCT__ "PCPreSolve_BDDC" 511534831adSStefano Zampini /* -------------------------------------------------------------------------- */ 512534831adSStefano Zampini /* 513534831adSStefano Zampini PCPreSolve_BDDC - Changes the right hand side and (if necessary) the initial 514534831adSStefano Zampini guess if a transformation of basis approach has been selected. 
5159c0446d6SStefano Zampini 516534831adSStefano Zampini Input Parameter: 517534831adSStefano Zampini + pc - the preconditioner contex 518534831adSStefano Zampini 519534831adSStefano Zampini Application Interface Routine: PCPreSolve() 520534831adSStefano Zampini 521534831adSStefano Zampini Notes: 522534831adSStefano Zampini The interface routine PCPreSolve() is not usually called directly by 523534831adSStefano Zampini the user, but instead is called by KSPSolve(). 524534831adSStefano Zampini */ 525534831adSStefano Zampini static PetscErrorCode PCPreSolve_BDDC(PC pc, KSP ksp, Vec rhs, Vec x) 526534831adSStefano Zampini { 527534831adSStefano Zampini PetscErrorCode ierr; 528534831adSStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 529534831adSStefano Zampini PC_IS *pcis = (PC_IS*)(pc->data); 530534831adSStefano Zampini Mat_IS *matis = (Mat_IS*)pc->pmat->data; 531534831adSStefano Zampini Mat temp_mat; 5323972b0daSStefano Zampini IS dirIS; 5333972b0daSStefano Zampini PetscInt dirsize,i,*is_indices; 5343972b0daSStefano Zampini PetscScalar *array_x,*array_diagonal; 5353972b0daSStefano Zampini Vec used_vec; 5363972b0daSStefano Zampini PetscBool guess_nonzero; 537534831adSStefano Zampini 538534831adSStefano Zampini PetscFunctionBegin; 5393972b0daSStefano Zampini if (x) { 5403972b0daSStefano Zampini ierr = PetscObjectReference((PetscObject)x);CHKERRQ(ierr); 5413972b0daSStefano Zampini used_vec = x; 5423972b0daSStefano Zampini } else { 5433972b0daSStefano Zampini ierr = PetscObjectReference((PetscObject)pcbddc->temp_solution);CHKERRQ(ierr); 5443972b0daSStefano Zampini used_vec = pcbddc->temp_solution; 5453972b0daSStefano Zampini ierr = VecSet(used_vec,0.0);CHKERRQ(ierr); 5463972b0daSStefano Zampini } 5473972b0daSStefano Zampini /* hack into ksp data structure PCPreSolve comes earlier in src/ksp/ksp/interface/itfunc.c */ 5483972b0daSStefano Zampini if (ksp) { 5493972b0daSStefano Zampini ierr = KSPGetInitialGuessNonzero(ksp,&guess_nonzero);CHKERRQ(ierr); 
5503972b0daSStefano Zampini if ( !guess_nonzero ) { 5513972b0daSStefano Zampini ierr = VecSet(used_vec,0.0);CHKERRQ(ierr); 5523972b0daSStefano Zampini } 5533972b0daSStefano Zampini } 5543972b0daSStefano Zampini /* store the original rhs */ 5553972b0daSStefano Zampini ierr = VecCopy(rhs,pcbddc->original_rhs);CHKERRQ(ierr); 5563972b0daSStefano Zampini 5573972b0daSStefano Zampini /* Take into account zeroed rows -> change rhs and store solution removed */ 5583972b0daSStefano Zampini ierr = MatGetDiagonal(pc->pmat,pcis->vec1_global);CHKERRQ(ierr); 5593972b0daSStefano Zampini ierr = VecPointwiseDivide(pcis->vec1_global,rhs,pcis->vec1_global);CHKERRQ(ierr); 5603972b0daSStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 5613972b0daSStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 5623972b0daSStefano Zampini ierr = VecScatterBegin(matis->ctx,used_vec,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 5633972b0daSStefano Zampini ierr = VecScatterEnd (matis->ctx,used_vec,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 5643972b0daSStefano Zampini ierr = PCBDDCGetDirichletBoundaries(pc,&dirIS);CHKERRQ(ierr); 5653972b0daSStefano Zampini if (dirIS) { 5663972b0daSStefano Zampini ierr = ISGetSize(dirIS,&dirsize);CHKERRQ(ierr); 5673972b0daSStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array_x);CHKERRQ(ierr); 5683972b0daSStefano Zampini ierr = VecGetArray(pcis->vec2_N,&array_diagonal);CHKERRQ(ierr); 5693972b0daSStefano Zampini ierr = ISGetIndices(dirIS,(const PetscInt**)&is_indices);CHKERRQ(ierr); 5703972b0daSStefano Zampini for (i=0;i<dirsize;i++) { 5713972b0daSStefano Zampini array_x[is_indices[i]]=array_diagonal[is_indices[i]]; 5723972b0daSStefano Zampini } 5733972b0daSStefano Zampini ierr = ISRestoreIndices(dirIS,(const PetscInt**)&is_indices);CHKERRQ(ierr); 5743972b0daSStefano Zampini ierr = 
VecRestoreArray(pcis->vec2_N,&array_diagonal);CHKERRQ(ierr); 5753972b0daSStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array_x);CHKERRQ(ierr); 5763972b0daSStefano Zampini } 5773972b0daSStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 5783972b0daSStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 579b76ba322SStefano Zampini 5803972b0daSStefano Zampini /* remove the computed solution from the rhs */ 5813972b0daSStefano Zampini ierr = VecScale(used_vec,-1.0);CHKERRQ(ierr); 5823972b0daSStefano Zampini ierr = MatMultAdd(pc->pmat,used_vec,rhs,rhs);CHKERRQ(ierr); 5833972b0daSStefano Zampini ierr = VecScale(used_vec,-1.0);CHKERRQ(ierr); 584b76ba322SStefano Zampini 585b76ba322SStefano Zampini /* store partially computed solution and set initial guess */ 5863972b0daSStefano Zampini if (x) { 5873972b0daSStefano Zampini ierr = VecCopy(used_vec,pcbddc->temp_solution);CHKERRQ(ierr); 5883972b0daSStefano Zampini ierr = VecSet(used_vec,0.0);CHKERRQ(ierr); 589b76ba322SStefano Zampini if (pcbddc->use_exact_dirichlet) { 590b76ba322SStefano Zampini ierr = VecScatterBegin(pcis->global_to_D,rhs,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 591b76ba322SStefano Zampini ierr = VecScatterEnd (pcis->global_to_D,rhs,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 592b76ba322SStefano Zampini ierr = KSPSolve(pcbddc->ksp_D,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr); 593b76ba322SStefano Zampini ierr = VecScatterBegin(pcis->global_to_D,pcis->vec2_D,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 594b76ba322SStefano Zampini ierr = VecScatterEnd (pcis->global_to_D,pcis->vec2_D,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 595b76ba322SStefano Zampini if (ksp) { 596b76ba322SStefano Zampini ierr = KSPSetInitialGuessNonzero(ksp,PETSC_TRUE);CHKERRQ(ierr); 597b76ba322SStefano Zampini } 598b76ba322SStefano Zampini } 
5993972b0daSStefano Zampini } 600b76ba322SStefano Zampini 601b76ba322SStefano Zampini /* rhs change of basis */ 602b76ba322SStefano Zampini if (pcbddc->usechangeofbasis) { 603b76ba322SStefano Zampini /* swap pointers for local matrices */ 604b76ba322SStefano Zampini temp_mat = matis->A; 605b76ba322SStefano Zampini matis->A = pcbddc->local_mat; 606b76ba322SStefano Zampini pcbddc->local_mat = temp_mat; 607b76ba322SStefano Zampini /* Get local rhs and apply transformation of basis */ 608b76ba322SStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,rhs,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 609b76ba322SStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,rhs,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 610b76ba322SStefano Zampini /* from original basis to modified basis */ 611b76ba322SStefano Zampini ierr = MatMultTranspose(pcbddc->ChangeOfBasisMatrix,pcis->vec1_B,pcis->vec2_B);CHKERRQ(ierr); 612b76ba322SStefano Zampini /* put back modified values into the global vec using INSERT_VALUES copy mode */ 613b76ba322SStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,pcis->vec2_B,rhs,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 614b76ba322SStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,pcis->vec2_B,rhs,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 6150bdf917eSStefano Zampini if (ksp && pcbddc->NullSpace) { 6160bdf917eSStefano Zampini ierr = MatNullSpaceRemove(pcbddc->NullSpace,used_vec,PETSC_NULL);CHKERRQ(ierr); 6170bdf917eSStefano Zampini ierr = MatNullSpaceRemove(pcbddc->NullSpace,rhs,PETSC_NULL);CHKERRQ(ierr); 618b76ba322SStefano Zampini } 6190bdf917eSStefano Zampini } 6200bdf917eSStefano Zampini ierr = VecDestroy(&used_vec);CHKERRQ(ierr); 621534831adSStefano Zampini PetscFunctionReturn(0); 622534831adSStefano Zampini } 623534831adSStefano Zampini /* -------------------------------------------------------------------------- */ 624534831adSStefano Zampini #undef __FUNCT__ 625534831adSStefano Zampini #define __FUNCT__ 
"PCPostSolve_BDDC" 626534831adSStefano Zampini /* -------------------------------------------------------------------------- */ 627534831adSStefano Zampini /* 628534831adSStefano Zampini PCPostSolve_BDDC - Changes the computed solution if a transformation of basis 629534831adSStefano Zampini approach has been selected. Also, restores rhs to its original state. 630534831adSStefano Zampini 631534831adSStefano Zampini Input Parameter: 632534831adSStefano Zampini + pc - the preconditioner contex 633534831adSStefano Zampini 634534831adSStefano Zampini Application Interface Routine: PCPostSolve() 635534831adSStefano Zampini 636534831adSStefano Zampini Notes: 637534831adSStefano Zampini The interface routine PCPostSolve() is not usually called directly by 638534831adSStefano Zampini the user, but instead is called by KSPSolve(). 639534831adSStefano Zampini */ 640534831adSStefano Zampini static PetscErrorCode PCPostSolve_BDDC(PC pc, KSP ksp, Vec rhs, Vec x) 641534831adSStefano Zampini { 642534831adSStefano Zampini PetscErrorCode ierr; 643534831adSStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 644534831adSStefano Zampini PC_IS *pcis = (PC_IS*)(pc->data); 645534831adSStefano Zampini Mat_IS *matis = (Mat_IS*)pc->pmat->data; 646534831adSStefano Zampini Mat temp_mat; 647534831adSStefano Zampini 648534831adSStefano Zampini PetscFunctionBegin; 649534831adSStefano Zampini if (pcbddc->usechangeofbasis) { 650534831adSStefano Zampini /* swap pointers for local matrices */ 651534831adSStefano Zampini temp_mat = matis->A; 652534831adSStefano Zampini matis->A = pcbddc->local_mat; 653534831adSStefano Zampini pcbddc->local_mat = temp_mat; 654534831adSStefano Zampini /* restore rhs to its original state */ 6553425bc38SStefano Zampini if (rhs) { 6563425bc38SStefano Zampini ierr = VecCopy(pcbddc->original_rhs,rhs);CHKERRQ(ierr); 6573425bc38SStefano Zampini } 658534831adSStefano Zampini /* Get Local boundary and apply transformation of basis to solution vector */ 659534831adSStefano 
Zampini ierr = VecScatterBegin(pcis->global_to_B,x,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 660534831adSStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,x,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 661534831adSStefano Zampini /* from modified basis to original basis */ 662534831adSStefano Zampini ierr = MatMult(pcbddc->ChangeOfBasisMatrix,pcis->vec1_B,pcis->vec2_B);CHKERRQ(ierr); 663534831adSStefano Zampini /* put back modified values into the global vec using INSERT_VALUES copy mode */ 664534831adSStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,pcis->vec2_B,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 665534831adSStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,pcis->vec2_B,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 666534831adSStefano Zampini } 6673972b0daSStefano Zampini /* add solution removed in presolve */ 6683425bc38SStefano Zampini if (x) { 6693425bc38SStefano Zampini ierr = VecAXPY(x,1.0,pcbddc->temp_solution);CHKERRQ(ierr); 6703425bc38SStefano Zampini } 671534831adSStefano Zampini PetscFunctionReturn(0); 672534831adSStefano Zampini } 673534831adSStefano Zampini /* -------------------------------------------------------------------------- */ 67453cdbc3dSStefano Zampini #undef __FUNCT__ 67553cdbc3dSStefano Zampini #define __FUNCT__ "PCSetUp_BDDC" 6760c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 6770c7d97c5SJed Brown /* 6780c7d97c5SJed Brown PCSetUp_BDDC - Prepares for the use of the BDDC preconditioner 6790c7d97c5SJed Brown by setting data structures and options. 
6800c7d97c5SJed Brown 6810c7d97c5SJed Brown Input Parameter: 68253cdbc3dSStefano Zampini + pc - the preconditioner context 6830c7d97c5SJed Brown 6840c7d97c5SJed Brown Application Interface Routine: PCSetUp() 6850c7d97c5SJed Brown 6860c7d97c5SJed Brown Notes: 6870c7d97c5SJed Brown The interface routine PCSetUp() is not usually called directly by 6880c7d97c5SJed Brown the user, but instead is called by PCApply() if necessary. 6890c7d97c5SJed Brown */ 69053cdbc3dSStefano Zampini PetscErrorCode PCSetUp_BDDC(PC pc) 6910c7d97c5SJed Brown { 6920c7d97c5SJed Brown PetscErrorCode ierr; 6930c7d97c5SJed Brown PC_BDDC* pcbddc = (PC_BDDC*)pc->data; 6940c7d97c5SJed Brown 6950c7d97c5SJed Brown PetscFunctionBegin; 6960c7d97c5SJed Brown if (!pc->setupcalled) { 6973b03a366Sstefano_zampini /* For BDDC we need to define a local "Neumann" problem different to that defined in PCISSetup 6989c0446d6SStefano Zampini So, we set to pcnone the Neumann problem of pcis in order to avoid unneeded computation 6990c7d97c5SJed Brown Also, we decide to directly build the (same) Dirichlet problem */ 7000c7d97c5SJed Brown ierr = PetscOptionsSetValue("-is_localN_pc_type","none");CHKERRQ(ierr); 7010c7d97c5SJed Brown ierr = PetscOptionsSetValue("-is_localD_pc_type","none");CHKERRQ(ierr); 7020c7d97c5SJed Brown /* Set up all the "iterative substructuring" common block */ 7030bdf917eSStefano Zampini 7040c7d97c5SJed Brown ierr = PCISSetUp(pc);CHKERRQ(ierr); 7053b03a366Sstefano_zampini /* Get stdout for dbg */ 706e269702eSStefano Zampini if (pcbddc->dbg_flag) { 707e269702eSStefano Zampini ierr = PetscViewerASCIIGetStdout(((PetscObject)pc)->comm,&pcbddc->dbg_viewer);CHKERRQ(ierr); 708e269702eSStefano Zampini ierr = PetscViewerASCIISynchronizedAllow(pcbddc->dbg_viewer,PETSC_TRUE);CHKERRQ(ierr); 709e269702eSStefano Zampini } 7103b03a366Sstefano_zampini /* Analyze local interface */ 7110c7d97c5SJed Brown ierr = PCBDDCManageLocalBoundaries(pc);CHKERRQ(ierr); 7123b03a366Sstefano_zampini /* Set up local constraint 
matrix */ 7133b03a366Sstefano_zampini ierr = PCBDDCCreateConstraintMatrix(pc);CHKERRQ(ierr); 7140c7d97c5SJed Brown /* Create coarse and local stuffs used for evaluating action of preconditioner */ 7150c7d97c5SJed Brown ierr = PCBDDCCoarseSetUp(pc);CHKERRQ(ierr); 7160c7d97c5SJed Brown } 7170c7d97c5SJed Brown PetscFunctionReturn(0); 7180c7d97c5SJed Brown } 7190c7d97c5SJed Brown 7200c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 7210c7d97c5SJed Brown /* 7220c7d97c5SJed Brown PCApply_BDDC - Applies the BDDC preconditioner to a vector. 7230c7d97c5SJed Brown 7240c7d97c5SJed Brown Input Parameters: 7250c7d97c5SJed Brown . pc - the preconditioner context 7260c7d97c5SJed Brown . r - input vector (global) 7270c7d97c5SJed Brown 7280c7d97c5SJed Brown Output Parameter: 7290c7d97c5SJed Brown . z - output vector (global) 7300c7d97c5SJed Brown 7310c7d97c5SJed Brown Application Interface Routine: PCApply() 7320c7d97c5SJed Brown */ 7330c7d97c5SJed Brown #undef __FUNCT__ 7340c7d97c5SJed Brown #define __FUNCT__ "PCApply_BDDC" 73553cdbc3dSStefano Zampini PetscErrorCode PCApply_BDDC(PC pc,Vec r,Vec z) 7360c7d97c5SJed Brown { 7370c7d97c5SJed Brown PC_IS *pcis = (PC_IS*)(pc->data); 7380c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)(pc->data); 7390c7d97c5SJed Brown PetscErrorCode ierr; 7403b03a366Sstefano_zampini const PetscScalar one = 1.0; 7413b03a366Sstefano_zampini const PetscScalar m_one = -1.0; 7422617d88aSStefano Zampini const PetscScalar zero = 0.0; 7430c7d97c5SJed Brown 7440c7d97c5SJed Brown /* This code is similar to that provided in nn.c for PCNN 7450c7d97c5SJed Brown NN interface preconditioner changed to BDDC 7460c7d97c5SJed Brown Added support for M_3 preconditioenr in the reference article (code is active if pcbddc->prec_type = PETSC_TRUE) */ 7470c7d97c5SJed Brown 7480c7d97c5SJed Brown PetscFunctionBegin; 749b76ba322SStefano Zampini if (!pcbddc->use_exact_dirichlet) { 7500c7d97c5SJed Brown /* First Dirichlet solve */ 
7510c7d97c5SJed Brown ierr = VecScatterBegin(pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 7520c7d97c5SJed Brown ierr = VecScatterEnd (pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 75353cdbc3dSStefano Zampini ierr = KSPSolve(pcbddc->ksp_D,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr); 7540c7d97c5SJed Brown /* 7550c7d97c5SJed Brown Assembling right hand side for BDDC operator 7560c7d97c5SJed Brown - vec1_D for the Dirichlet part (if needed, i.e. prec_flag=PETSC_TRUE) 7570c7d97c5SJed Brown - the interface part of the global vector z 7580c7d97c5SJed Brown */ 7590c7d97c5SJed Brown ierr = VecScale(pcis->vec2_D,m_one);CHKERRQ(ierr); 7600c7d97c5SJed Brown ierr = MatMult(pcis->A_BI,pcis->vec2_D,pcis->vec1_B);CHKERRQ(ierr); 7610c7d97c5SJed Brown if (pcbddc->prec_type) { ierr = MatMultAdd(pcis->A_II,pcis->vec2_D,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); } 7620c7d97c5SJed Brown ierr = VecScale(pcis->vec2_D,m_one);CHKERRQ(ierr); 7630c7d97c5SJed Brown ierr = VecCopy(r,z);CHKERRQ(ierr); 7640c7d97c5SJed Brown ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 7650c7d97c5SJed Brown ierr = VecScatterEnd (pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 7662617d88aSStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 7672617d88aSStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 768b76ba322SStefano Zampini } else { 769b76ba322SStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,r,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 770b76ba322SStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,r,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 7710bdf917eSStefano Zampini ierr = VecSet(pcis->vec1_D,zero);CHKERRQ(ierr); 772b76ba322SStefano Zampini ierr = VecSet(pcis->vec2_D,zero);CHKERRQ(ierr); 
773b76ba322SStefano Zampini } 774b76ba322SStefano Zampini 775b76ba322SStefano Zampini /* Apply partition of unity */ 7762617d88aSStefano Zampini ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr); 7772617d88aSStefano Zampini 7782617d88aSStefano Zampini /* Apply interface preconditioner 7792617d88aSStefano Zampini input/output vecs: pcis->vec1_B and pcis->vec1_D */ 7802617d88aSStefano Zampini ierr = PCBDDCApplyInterfacePreconditioner(pc);CHKERRQ(ierr); 7812617d88aSStefano Zampini 7822617d88aSStefano Zampini /* Apply partition of unity and sum boundary values */ 7832617d88aSStefano Zampini ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr); 7842617d88aSStefano Zampini ierr = VecSet(z,zero);CHKERRQ(ierr); 7852617d88aSStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 7862617d88aSStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 7870c7d97c5SJed Brown 7883b03a366Sstefano_zampini /* Second Dirichlet solve and assembling of output */ 7890c7d97c5SJed Brown ierr = VecScatterBegin(pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 7900c7d97c5SJed Brown ierr = VecScatterEnd (pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 7910c7d97c5SJed Brown ierr = MatMult(pcis->A_IB,pcis->vec1_B,pcis->vec3_D);CHKERRQ(ierr); 7920c7d97c5SJed Brown if (pcbddc->prec_type) { ierr = MatMultAdd(pcis->A_II,pcis->vec1_D,pcis->vec3_D,pcis->vec3_D);CHKERRQ(ierr); } 79353cdbc3dSStefano Zampini ierr = KSPSolve(pcbddc->ksp_D,pcis->vec3_D,pcbddc->vec4_D);CHKERRQ(ierr); 7940c7d97c5SJed Brown ierr = VecScale(pcbddc->vec4_D,m_one);CHKERRQ(ierr); 7950c7d97c5SJed Brown if (pcbddc->prec_type) { ierr = VecAXPY (pcbddc->vec4_D,one,pcis->vec1_D);CHKERRQ(ierr); } 7960c7d97c5SJed Brown ierr = VecAXPY (pcis->vec2_D,one,pcbddc->vec4_D);CHKERRQ(ierr); 7970c7d97c5SJed Brown ierr = 
VecScatterBegin(pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 7980c7d97c5SJed Brown ierr = VecScatterEnd (pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 7990c7d97c5SJed Brown PetscFunctionReturn(0); 8000c7d97c5SJed Brown 8010c7d97c5SJed Brown } 802da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */ 803da1bb401SStefano Zampini #undef __FUNCT__ 804da1bb401SStefano Zampini #define __FUNCT__ "PCDestroy_BDDC" 805da1bb401SStefano Zampini PetscErrorCode PCDestroy_BDDC(PC pc) 806da1bb401SStefano Zampini { 807da1bb401SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 8080bdf917eSStefano Zampini PetscInt i; 809da1bb401SStefano Zampini PetscErrorCode ierr; 810da1bb401SStefano Zampini 811da1bb401SStefano Zampini PetscFunctionBegin; 812da1bb401SStefano Zampini /* free data created by PCIS */ 813da1bb401SStefano Zampini ierr = PCISDestroy(pc);CHKERRQ(ierr); 814da1bb401SStefano Zampini /* free BDDC data */ 8150bdf917eSStefano Zampini ierr = MatNullSpaceDestroy(&pcbddc->CoarseNullSpace);CHKERRQ(ierr); 8160bdf917eSStefano Zampini ierr = MatNullSpaceDestroy(&pcbddc->NullSpace);CHKERRQ(ierr); 8173972b0daSStefano Zampini ierr = VecDestroy(&pcbddc->temp_solution);CHKERRQ(ierr); 818534831adSStefano Zampini ierr = VecDestroy(&pcbddc->original_rhs);CHKERRQ(ierr); 819534831adSStefano Zampini ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr); 820534831adSStefano Zampini ierr = MatDestroy(&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr); 821da1bb401SStefano Zampini ierr = VecDestroy(&pcbddc->coarse_vec);CHKERRQ(ierr); 822da1bb401SStefano Zampini ierr = VecDestroy(&pcbddc->coarse_rhs);CHKERRQ(ierr); 823da1bb401SStefano Zampini ierr = KSPDestroy(&pcbddc->coarse_ksp);CHKERRQ(ierr); 824da1bb401SStefano Zampini ierr = MatDestroy(&pcbddc->coarse_mat);CHKERRQ(ierr); 825da1bb401SStefano Zampini ierr = MatDestroy(&pcbddc->coarse_phi_B);CHKERRQ(ierr); 826da1bb401SStefano Zampini ierr 
= MatDestroy(&pcbddc->coarse_phi_D);CHKERRQ(ierr); 827da1bb401SStefano Zampini ierr = VecDestroy(&pcbddc->vec1_P);CHKERRQ(ierr); 828da1bb401SStefano Zampini ierr = VecDestroy(&pcbddc->vec1_C);CHKERRQ(ierr); 829da1bb401SStefano Zampini ierr = MatDestroy(&pcbddc->local_auxmat1);CHKERRQ(ierr); 830da1bb401SStefano Zampini ierr = MatDestroy(&pcbddc->local_auxmat2);CHKERRQ(ierr); 831da1bb401SStefano Zampini ierr = VecDestroy(&pcbddc->vec1_R);CHKERRQ(ierr); 832da1bb401SStefano Zampini ierr = VecDestroy(&pcbddc->vec2_R);CHKERRQ(ierr); 833da1bb401SStefano Zampini ierr = VecDestroy(&pcbddc->vec4_D);CHKERRQ(ierr); 834da1bb401SStefano Zampini ierr = VecScatterDestroy(&pcbddc->R_to_B);CHKERRQ(ierr); 835da1bb401SStefano Zampini ierr = VecScatterDestroy(&pcbddc->R_to_D);CHKERRQ(ierr); 836da1bb401SStefano Zampini ierr = VecScatterDestroy(&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr); 837da1bb401SStefano Zampini ierr = KSPDestroy(&pcbddc->ksp_D);CHKERRQ(ierr); 838da1bb401SStefano Zampini ierr = KSPDestroy(&pcbddc->ksp_R);CHKERRQ(ierr); 839da1bb401SStefano Zampini ierr = ISDestroy(&pcbddc->NeumannBoundaries);CHKERRQ(ierr); 840da1bb401SStefano Zampini ierr = ISDestroy(&pcbddc->DirichletBoundaries);CHKERRQ(ierr); 841da1bb401SStefano Zampini ierr = MatDestroy(&pcbddc->ConstraintMatrix);CHKERRQ(ierr); 842da1bb401SStefano Zampini ierr = PetscFree(pcbddc->local_primal_indices);CHKERRQ(ierr); 843da1bb401SStefano Zampini ierr = PetscFree(pcbddc->replicated_local_primal_indices);CHKERRQ(ierr); 8440bdf917eSStefano Zampini ierr = PetscFree(pcbddc->replicated_local_primal_values);CHKERRQ(ierr); 845da1bb401SStefano Zampini ierr = PetscFree(pcbddc->local_primal_displacements);CHKERRQ(ierr); 846da1bb401SStefano Zampini ierr = PetscFree(pcbddc->local_primal_sizes);CHKERRQ(ierr); 847da1bb401SStefano Zampini for (i=0;i<pcbddc->n_ISForDofs;i++) { ierr = ISDestroy(&pcbddc->ISForDofs[i]);CHKERRQ(ierr); } 848da1bb401SStefano Zampini ierr = PetscFree(pcbddc->ISForDofs);CHKERRQ(ierr); 849da1bb401SStefano 
Zampini for (i=0;i<pcbddc->n_ISForFaces;i++) { ierr = ISDestroy(&pcbddc->ISForFaces[i]);CHKERRQ(ierr); } 850da1bb401SStefano Zampini ierr = PetscFree(pcbddc->ISForFaces);CHKERRQ(ierr); 851da1bb401SStefano Zampini for (i=0;i<pcbddc->n_ISForEdges;i++) { ierr = ISDestroy(&pcbddc->ISForEdges[i]);CHKERRQ(ierr); } 852da1bb401SStefano Zampini ierr = PetscFree(pcbddc->ISForEdges);CHKERRQ(ierr); 853da1bb401SStefano Zampini ierr = ISDestroy(&pcbddc->ISForVertices);CHKERRQ(ierr); 8543972b0daSStefano Zampini /* Free graph structure */ 855da1bb401SStefano Zampini ierr = PetscFree(pcbddc->mat_graph->xadj);CHKERRQ(ierr); 856da1bb401SStefano Zampini ierr = PetscFree(pcbddc->mat_graph->adjncy);CHKERRQ(ierr); 857142dfd88SStefano Zampini if (pcbddc->mat_graph->nvtxs) { 858da1bb401SStefano Zampini ierr = PetscFree(pcbddc->mat_graph->neighbours_set[0]);CHKERRQ(ierr); 859142dfd88SStefano Zampini } 860da1bb401SStefano Zampini ierr = PetscFree(pcbddc->mat_graph->neighbours_set);CHKERRQ(ierr); 8613972b0daSStefano Zampini ierr = PetscFree4(pcbddc->mat_graph->where,pcbddc->mat_graph->count,pcbddc->mat_graph->cptr,pcbddc->mat_graph->queue);CHKERRQ(ierr); 8623972b0daSStefano Zampini ierr = PetscFree2(pcbddc->mat_graph->which_dof,pcbddc->mat_graph->touched);CHKERRQ(ierr); 8633972b0daSStefano Zampini ierr = PetscFree(pcbddc->mat_graph->where_ncmps);CHKERRQ(ierr); 864da1bb401SStefano Zampini ierr = PetscFree(pcbddc->mat_graph);CHKERRQ(ierr); 8653425bc38SStefano Zampini /* remove functions */ 8664fad6a16SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseningRatio_C","",PETSC_NULL);CHKERRQ(ierr); 8674fad6a16SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetMaxLevels_C","",PETSC_NULL);CHKERRQ(ierr); 8680bdf917eSStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNullSpace_C","",PETSC_NULL);CHKERRQ(ierr); 8693425bc38SStefano Zampini ierr = 
PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDirichletBoundaries_C","",PETSC_NULL);CHKERRQ(ierr); 8703425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNeumannBoundaries_C","",PETSC_NULL);CHKERRQ(ierr); 8713425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetDirichletBoundaries_C","",PETSC_NULL);CHKERRQ(ierr); 8723425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetNeumannBoundaries_C","",PETSC_NULL);CHKERRQ(ierr); 8733425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseProblemType_C","",PETSC_NULL);CHKERRQ(ierr); 8743425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDofsSplitting_C","",PETSC_NULL);CHKERRQ(ierr); 8753425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetLocalAdjacencyGraph_C","",PETSC_NULL);CHKERRQ(ierr); 8763425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPreSolve_C","",PETSC_NULL);CHKERRQ(ierr); 8773425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPostSolve_C","",PETSC_NULL);CHKERRQ(ierr); 8783425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCCreateFETIDPOperators_C","",PETSC_NULL);CHKERRQ(ierr); 8793425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetRHS_C","",PETSC_NULL);CHKERRQ(ierr); 8803425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetSolution_C","",PETSC_NULL);CHKERRQ(ierr); 881da1bb401SStefano Zampini /* Free the private data structure that was hanging off the PC */ 882da1bb401SStefano Zampini ierr = PetscFree(pcbddc);CHKERRQ(ierr); 883da1bb401SStefano Zampini PetscFunctionReturn(0); 884da1bb401SStefano Zampini } 8853425bc38SStefano Zampini /* 
-------------------------------------------------------------------------- */ 8863425bc38SStefano Zampini EXTERN_C_BEGIN 8873425bc38SStefano Zampini #undef __FUNCT__ 8883425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetRHS_BDDC" 8893425bc38SStefano Zampini static PetscErrorCode PCBDDCMatFETIDPGetRHS_BDDC(Mat fetidp_mat, Vec standard_rhs, Vec fetidp_flux_rhs) 8903425bc38SStefano Zampini { 8913425bc38SStefano Zampini FETIDPMat_ctx *mat_ctx; 8923425bc38SStefano Zampini PC_IS* pcis; 8933425bc38SStefano Zampini PC_BDDC* pcbddc; 8943425bc38SStefano Zampini Mat_IS* matis; 8953425bc38SStefano Zampini PetscErrorCode ierr; 8960c7d97c5SJed Brown 8973425bc38SStefano Zampini PetscFunctionBegin; 8983425bc38SStefano Zampini ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr); 8993425bc38SStefano Zampini pcis = (PC_IS*)mat_ctx->pc->data; 9003425bc38SStefano Zampini pcbddc = (PC_BDDC*)mat_ctx->pc->data; 9013425bc38SStefano Zampini matis = (Mat_IS*)mat_ctx->pc->pmat->data; 9023425bc38SStefano Zampini 9033425bc38SStefano Zampini /* change of basis for physical rhs if needed 9043425bc38SStefano Zampini It also changes the rhs in case of dirichlet boundaries */ 9053425bc38SStefano Zampini (*mat_ctx->pc->ops->presolve)(mat_ctx->pc,PETSC_NULL,standard_rhs,PETSC_NULL); 9063425bc38SStefano Zampini /* store vectors for computation of fetidp final solution */ 9073425bc38SStefano Zampini ierr = VecScatterBegin(pcis->global_to_D,standard_rhs,mat_ctx->temp_solution_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 9083425bc38SStefano Zampini ierr = VecScatterEnd (pcis->global_to_D,standard_rhs,mat_ctx->temp_solution_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 9093425bc38SStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 9103425bc38SStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 
9113425bc38SStefano Zampini /* scale rhs since it should be unassembled */ 9123425bc38SStefano Zampini ierr = VecPointwiseMult(mat_ctx->temp_solution_B,pcis->D,mat_ctx->temp_solution_B);CHKERRQ(ierr); 9133425bc38SStefano Zampini if (!pcbddc->prec_type) { 9143425bc38SStefano Zampini /* compute partially subassembled Schur complement right-hand side */ 9153425bc38SStefano Zampini ierr = KSPSolve(pcbddc->ksp_D,mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr); 9163425bc38SStefano Zampini ierr = MatMult(pcis->A_BI,pcis->vec1_D,pcis->vec1_B);CHKERRQ(ierr); 9173425bc38SStefano Zampini ierr = VecAXPY(mat_ctx->temp_solution_B,-1.0,pcis->vec1_B);CHKERRQ(ierr); 9183425bc38SStefano Zampini ierr = VecSet(standard_rhs,0.0);CHKERRQ(ierr); 9193425bc38SStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,mat_ctx->temp_solution_B,standard_rhs,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 9203425bc38SStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,mat_ctx->temp_solution_B,standard_rhs,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 9213425bc38SStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 9223425bc38SStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 9233425bc38SStefano Zampini ierr = VecPointwiseMult(mat_ctx->temp_solution_B,pcis->D,mat_ctx->temp_solution_B);CHKERRQ(ierr); 9243425bc38SStefano Zampini } 9253425bc38SStefano Zampini /* BDDC rhs */ 9263425bc38SStefano Zampini ierr = VecCopy(mat_ctx->temp_solution_B,pcis->vec1_B);CHKERRQ(ierr); 9273425bc38SStefano Zampini if (pcbddc->prec_type) { 9283425bc38SStefano Zampini ierr = VecCopy(mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr); 9293425bc38SStefano Zampini } 9303425bc38SStefano Zampini /* apply BDDC */ 9313425bc38SStefano Zampini ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr); 9323425bc38SStefano Zampini /* 
Application of B_delta and assembling of rhs for fetidp fluxes */ 9333425bc38SStefano Zampini ierr = VecSet(fetidp_flux_rhs,0.0);CHKERRQ(ierr); 9343425bc38SStefano Zampini ierr = MatMult(mat_ctx->B_delta,pcis->vec1_B,mat_ctx->lambda_local);CHKERRQ(ierr); 9353425bc38SStefano Zampini ierr = VecScatterBegin(mat_ctx->l2g_lambda,mat_ctx->lambda_local,fetidp_flux_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 9363425bc38SStefano Zampini ierr = VecScatterEnd (mat_ctx->l2g_lambda,mat_ctx->lambda_local,fetidp_flux_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 9373425bc38SStefano Zampini /* restore original rhs */ 9383425bc38SStefano Zampini ierr = VecCopy(pcbddc->original_rhs,standard_rhs);CHKERRQ(ierr); 9393425bc38SStefano Zampini PetscFunctionReturn(0); 9403425bc38SStefano Zampini } 9413425bc38SStefano Zampini EXTERN_C_END 9423425bc38SStefano Zampini #undef __FUNCT__ 9433425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetRHS" 9443425bc38SStefano Zampini /*@ 9453425bc38SStefano Zampini PCBDDCMatFETIDPGetRHS - Get rhs for FETIDP linear system. 
9463425bc38SStefano Zampini 9473425bc38SStefano Zampini Collective 9483425bc38SStefano Zampini 9493425bc38SStefano Zampini Input Parameters: 9503425bc38SStefano Zampini + fetidp_mat - the FETIDP mat obtained by a call to PCBDDCCreateFETIDPOperators 9513425bc38SStefano Zampini + standard_rhs - the rhs of your linear system 9523425bc38SStefano Zampini 9533425bc38SStefano Zampini Output Parameters: 9543425bc38SStefano Zampini + fetidp_flux_rhs - the rhs of the FETIDP linear system 9553425bc38SStefano Zampini 9563425bc38SStefano Zampini Level: developer 9573425bc38SStefano Zampini 9583425bc38SStefano Zampini Notes: 9593425bc38SStefano Zampini 9603425bc38SStefano Zampini .seealso: PCBDDC 9613425bc38SStefano Zampini @*/ 9623425bc38SStefano Zampini PetscErrorCode PCBDDCMatFETIDPGetRHS(Mat fetidp_mat, Vec standard_rhs, Vec fetidp_flux_rhs) 9633425bc38SStefano Zampini { 9643425bc38SStefano Zampini FETIDPMat_ctx *mat_ctx; 9653425bc38SStefano Zampini PetscErrorCode ierr; 9663425bc38SStefano Zampini 9673425bc38SStefano Zampini PetscFunctionBegin; 9683425bc38SStefano Zampini ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr); 9693425bc38SStefano Zampini ierr = PetscTryMethod(mat_ctx->pc,"PCBDDCMatFETIDPGetRHS_C",(Mat,Vec,Vec),(fetidp_mat,standard_rhs,fetidp_flux_rhs));CHKERRQ(ierr); 9703425bc38SStefano Zampini PetscFunctionReturn(0); 9713425bc38SStefano Zampini } 9723425bc38SStefano Zampini /* -------------------------------------------------------------------------- */ 9733425bc38SStefano Zampini EXTERN_C_BEGIN 9743425bc38SStefano Zampini #undef __FUNCT__ 9753425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetSolution_BDDC" 9763425bc38SStefano Zampini static PetscErrorCode PCBDDCMatFETIDPGetSolution_BDDC(Mat fetidp_mat, Vec fetidp_flux_sol, Vec standard_sol) 9773425bc38SStefano Zampini { 9783425bc38SStefano Zampini FETIDPMat_ctx *mat_ctx; 9793425bc38SStefano Zampini PC_IS* pcis; 9803425bc38SStefano Zampini PC_BDDC* pcbddc; 9813425bc38SStefano Zampini 
Mat_IS* matis; 9823425bc38SStefano Zampini PetscErrorCode ierr; 9833425bc38SStefano Zampini 9843425bc38SStefano Zampini PetscFunctionBegin; 9853425bc38SStefano Zampini ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr); 9863425bc38SStefano Zampini pcis = (PC_IS*)mat_ctx->pc->data; 9873425bc38SStefano Zampini pcbddc = (PC_BDDC*)mat_ctx->pc->data; 9883425bc38SStefano Zampini matis = (Mat_IS*)mat_ctx->pc->pmat->data; 9893425bc38SStefano Zampini 9903425bc38SStefano Zampini /* apply B_delta^T */ 9913425bc38SStefano Zampini ierr = VecScatterBegin(mat_ctx->l2g_lambda,fetidp_flux_sol,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 9923425bc38SStefano Zampini ierr = VecScatterEnd (mat_ctx->l2g_lambda,fetidp_flux_sol,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 9933425bc38SStefano Zampini ierr = MatMultTranspose(mat_ctx->B_delta,mat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr); 9943425bc38SStefano Zampini /* compute rhs for BDDC application */ 9953425bc38SStefano Zampini ierr = VecAYPX(pcis->vec1_B,-1.0,mat_ctx->temp_solution_B);CHKERRQ(ierr); 9963425bc38SStefano Zampini if (pcbddc->prec_type) { 9973425bc38SStefano Zampini ierr = VecCopy(mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr); 9983425bc38SStefano Zampini } 9993425bc38SStefano Zampini /* apply BDDC */ 10003425bc38SStefano Zampini ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr); 10013425bc38SStefano Zampini /* put values into standard global vector */ 10023425bc38SStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 10033425bc38SStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,pcis->vec1_B,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 10043425bc38SStefano Zampini if (!pcbddc->prec_type) { 10053425bc38SStefano Zampini /* compute values into the interior if solved for the partially subassembled Schur complement */ 10063425bc38SStefano Zampini ierr 
= MatMult(pcis->A_IB,pcis->vec1_B,pcis->vec1_D);CHKERRQ(ierr); 10073425bc38SStefano Zampini ierr = VecAXPY(mat_ctx->temp_solution_D,-1.0,pcis->vec1_D);CHKERRQ(ierr); 10083425bc38SStefano Zampini ierr = KSPSolve(pcbddc->ksp_D,mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr); 10093425bc38SStefano Zampini } 10103425bc38SStefano Zampini ierr = VecScatterBegin(pcis->global_to_D,pcis->vec1_D,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 10113425bc38SStefano Zampini ierr = VecScatterEnd (pcis->global_to_D,pcis->vec1_D,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 10123425bc38SStefano Zampini /* final change of basis if needed 10133425bc38SStefano Zampini Is also sums the dirichlet part removed during RHS assembling */ 10143425bc38SStefano Zampini (*mat_ctx->pc->ops->postsolve)(mat_ctx->pc,PETSC_NULL,PETSC_NULL,standard_sol); 10153425bc38SStefano Zampini PetscFunctionReturn(0); 10163425bc38SStefano Zampini 10173425bc38SStefano Zampini } 10183425bc38SStefano Zampini EXTERN_C_END 10193425bc38SStefano Zampini #undef __FUNCT__ 10203425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetSolution" 10213425bc38SStefano Zampini /*@ 10223425bc38SStefano Zampini PCBDDCMatFETIDPGetSolution - Get Solution for FETIDP linear system. 
10233425bc38SStefano Zampini 10243425bc38SStefano Zampini Collective 10253425bc38SStefano Zampini 10263425bc38SStefano Zampini Input Parameters: 10273425bc38SStefano Zampini + fetidp_mat - the FETIDP mat obtained by a call to PCBDDCCreateFETIDPOperators 10283425bc38SStefano Zampini + fetidp_flux_sol - the solution of the FETIDP linear system 10293425bc38SStefano Zampini 10303425bc38SStefano Zampini Output Parameters: 10313425bc38SStefano Zampini + standard_sol - the solution on the global domain 10323425bc38SStefano Zampini 10333425bc38SStefano Zampini Level: developer 10343425bc38SStefano Zampini 10353425bc38SStefano Zampini Notes: 10363425bc38SStefano Zampini 10373425bc38SStefano Zampini .seealso: PCBDDC 10383425bc38SStefano Zampini @*/ 10393425bc38SStefano Zampini PetscErrorCode PCBDDCMatFETIDPGetSolution(Mat fetidp_mat, Vec fetidp_flux_sol, Vec standard_sol) 10403425bc38SStefano Zampini { 10413425bc38SStefano Zampini FETIDPMat_ctx *mat_ctx; 10423425bc38SStefano Zampini PetscErrorCode ierr; 10433425bc38SStefano Zampini 10443425bc38SStefano Zampini PetscFunctionBegin; 10453425bc38SStefano Zampini ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr); 10463425bc38SStefano Zampini ierr = PetscTryMethod(mat_ctx->pc,"PCBDDCMatFETIDPGetSolution_C",(Mat,Vec,Vec),(fetidp_mat,fetidp_flux_sol,standard_sol));CHKERRQ(ierr); 10473425bc38SStefano Zampini PetscFunctionReturn(0); 10483425bc38SStefano Zampini } 10493425bc38SStefano Zampini /* -------------------------------------------------------------------------- */ 10503425bc38SStefano Zampini EXTERN_C_BEGIN 10513425bc38SStefano Zampini #undef __FUNCT__ 10523425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPOperators_BDDC" 10533425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPOperators_BDDC(PC pc, Mat *fetidp_mat, PC *fetidp_pc) 10543425bc38SStefano Zampini { 10553425bc38SStefano Zampini PETSC_EXTERN PetscErrorCode FETIDPMatMult(Mat,Vec,Vec); 10563425bc38SStefano Zampini PETSC_EXTERN 
PetscErrorCode PCBDDCDestroyFETIDPMat(Mat); 10573425bc38SStefano Zampini PETSC_EXTERN PetscErrorCode FETIDPPCApply(PC,Vec,Vec); 10583425bc38SStefano Zampini PETSC_EXTERN PetscErrorCode PCBDDCDestroyFETIDPPC(PC); 10593425bc38SStefano Zampini 10603425bc38SStefano Zampini FETIDPMat_ctx *fetidpmat_ctx; 10613425bc38SStefano Zampini Mat newmat; 10623425bc38SStefano Zampini FETIDPPC_ctx *fetidppc_ctx; 10633425bc38SStefano Zampini PC newpc; 10643425bc38SStefano Zampini MPI_Comm comm = ((PetscObject)pc)->comm; 10653425bc38SStefano Zampini PetscErrorCode ierr; 10663425bc38SStefano Zampini 10673425bc38SStefano Zampini PetscFunctionBegin; 10683425bc38SStefano Zampini /* FETIDP linear matrix */ 10693425bc38SStefano Zampini ierr = PCBDDCCreateFETIDPMatContext(pc, &fetidpmat_ctx);CHKERRQ(ierr); 10703425bc38SStefano Zampini ierr = PCBDDCSetupFETIDPMatContext(fetidpmat_ctx);CHKERRQ(ierr); 10713425bc38SStefano Zampini ierr = MatCreateShell(comm,PETSC_DECIDE,PETSC_DECIDE,fetidpmat_ctx->n_lambda,fetidpmat_ctx->n_lambda,fetidpmat_ctx,&newmat);CHKERRQ(ierr); 10723425bc38SStefano Zampini ierr = MatShellSetOperation(newmat,MATOP_MULT,(void (*)(void))FETIDPMatMult);CHKERRQ(ierr); 10733425bc38SStefano Zampini ierr = MatShellSetOperation(newmat,MATOP_DESTROY,(void (*)(void))PCBDDCDestroyFETIDPMat);CHKERRQ(ierr); 10743425bc38SStefano Zampini ierr = MatSetUp(newmat);CHKERRQ(ierr); 10753425bc38SStefano Zampini /* FETIDP preconditioner */ 10763425bc38SStefano Zampini ierr = PCBDDCCreateFETIDPPCContext(pc, &fetidppc_ctx);CHKERRQ(ierr); 10773425bc38SStefano Zampini ierr = PCBDDCSetupFETIDPPCContext(newmat,fetidppc_ctx);CHKERRQ(ierr); 10783425bc38SStefano Zampini ierr = PCCreate(comm,&newpc);CHKERRQ(ierr); 10793425bc38SStefano Zampini ierr = PCSetType(newpc,PCSHELL);CHKERRQ(ierr); 10803425bc38SStefano Zampini ierr = PCShellSetContext(newpc,fetidppc_ctx);CHKERRQ(ierr); 10813425bc38SStefano Zampini ierr = PCShellSetApply(newpc,FETIDPPCApply);CHKERRQ(ierr); 10823425bc38SStefano Zampini ierr = 
PCShellSetDestroy(newpc,PCBDDCDestroyFETIDPPC);CHKERRQ(ierr); 10833425bc38SStefano Zampini ierr = PCSetOperators(newpc,newmat,newmat,SAME_PRECONDITIONER);CHKERRQ(ierr); 10843425bc38SStefano Zampini ierr = PCSetUp(newpc);CHKERRQ(ierr); 10853425bc38SStefano Zampini /* return pointers for objects created */ 10863425bc38SStefano Zampini *fetidp_mat=newmat; 10873425bc38SStefano Zampini *fetidp_pc=newpc; 10883425bc38SStefano Zampini 10893425bc38SStefano Zampini PetscFunctionReturn(0); 10903425bc38SStefano Zampini } 10913425bc38SStefano Zampini EXTERN_C_END 10923425bc38SStefano Zampini #undef __FUNCT__ 10933425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPOperators" 10943425bc38SStefano Zampini /*@ 10953425bc38SStefano Zampini PCBDDCCreateFETIDPOperators - Create operators for FETIDP. 10963425bc38SStefano Zampini 10973425bc38SStefano Zampini Collective 10983425bc38SStefano Zampini 10993425bc38SStefano Zampini Input Parameters: 11003425bc38SStefano Zampini + pc - the BDDC preconditioning context (setup must be already called) 11013425bc38SStefano Zampini 11023425bc38SStefano Zampini Level: developer 11033425bc38SStefano Zampini 11043425bc38SStefano Zampini Notes: 11053425bc38SStefano Zampini 11063425bc38SStefano Zampini .seealso: PCBDDC 11073425bc38SStefano Zampini @*/ 11083425bc38SStefano Zampini PetscErrorCode PCBDDCCreateFETIDPOperators(PC pc, Mat *fetidp_mat, PC *fetidp_pc) 11093425bc38SStefano Zampini { 11103425bc38SStefano Zampini PetscErrorCode ierr; 11113425bc38SStefano Zampini 11123425bc38SStefano Zampini PetscFunctionBegin; 11133425bc38SStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 11143425bc38SStefano Zampini if (pc->setupcalled) { 11153425bc38SStefano Zampini ierr = PetscTryMethod(pc,"PCBDDCCreateFETIDPOperators_C",(PC,Mat*,PC*),(pc,fetidp_mat,fetidp_pc));CHKERRQ(ierr); 11163425bc38SStefano Zampini } else { 11173425bc38SStefano Zampini SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"You must call PCSetup_BDDC before calling %s\n",__FUNCT__); 
11183425bc38SStefano Zampini } 11193425bc38SStefano Zampini PetscFunctionReturn(0); 11203425bc38SStefano Zampini } 11210c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 1122da1bb401SStefano Zampini /*MC 1123da1bb401SStefano Zampini PCBDDC - Balancing Domain Decomposition by Constraints. 11240c7d97c5SJed Brown 1125da1bb401SStefano Zampini Options Database Keys: 1126da1bb401SStefano Zampini . -pcbddc ??? - 1127da1bb401SStefano Zampini 1128da1bb401SStefano Zampini Level: intermediate 1129da1bb401SStefano Zampini 1130da1bb401SStefano Zampini Notes: The matrix used with this preconditioner must be of type MATIS 1131da1bb401SStefano Zampini 1132da1bb401SStefano Zampini Unlike more 'conventional' interface preconditioners, this iterates over ALL the 1133da1bb401SStefano Zampini degrees of freedom, NOT just those on the interface (this allows the use of approximate solvers 1134da1bb401SStefano Zampini on the subdomains). 1135da1bb401SStefano Zampini 1136da1bb401SStefano Zampini Options for the coarse grid preconditioner can be set with - 1137da1bb401SStefano Zampini Options for the Dirichlet subproblem can be set with - 1138da1bb401SStefano Zampini Options for the Neumann subproblem can be set with - 1139da1bb401SStefano Zampini 1140da1bb401SStefano Zampini Contributed by Stefano Zampini 1141da1bb401SStefano Zampini 1142da1bb401SStefano Zampini .seealso: PCCreate(), PCSetType(), PCType (for list of available types), PC, MATIS 1143da1bb401SStefano Zampini M*/ 1144da1bb401SStefano Zampini EXTERN_C_BEGIN 1145da1bb401SStefano Zampini #undef __FUNCT__ 1146da1bb401SStefano Zampini #define __FUNCT__ "PCCreate_BDDC" 1147da1bb401SStefano Zampini PetscErrorCode PCCreate_BDDC(PC pc) 1148da1bb401SStefano Zampini { 1149da1bb401SStefano Zampini PetscErrorCode ierr; 1150da1bb401SStefano Zampini PC_BDDC *pcbddc; 1151da1bb401SStefano Zampini PCBDDCGraph mat_graph; 1152da1bb401SStefano Zampini 1153da1bb401SStefano Zampini PetscFunctionBegin; 
1154da1bb401SStefano Zampini /* Creates the private data structure for this preconditioner and attach it to the PC object. */ 1155da1bb401SStefano Zampini ierr = PetscNewLog(pc,PC_BDDC,&pcbddc);CHKERRQ(ierr); 1156da1bb401SStefano Zampini pc->data = (void*)pcbddc; 1157da1bb401SStefano Zampini 1158da1bb401SStefano Zampini /* create PCIS data structure */ 1159da1bb401SStefano Zampini ierr = PCISCreate(pc);CHKERRQ(ierr); 1160da1bb401SStefano Zampini 1161da1bb401SStefano Zampini /* BDDC specific */ 11620bdf917eSStefano Zampini pcbddc->CoarseNullSpace = 0; 11630bdf917eSStefano Zampini pcbddc->NullSpace = 0; 11643972b0daSStefano Zampini pcbddc->temp_solution = 0; 1165534831adSStefano Zampini pcbddc->original_rhs = 0; 1166534831adSStefano Zampini pcbddc->local_mat = 0; 1167534831adSStefano Zampini pcbddc->ChangeOfBasisMatrix = 0; 1168534831adSStefano Zampini pcbddc->usechangeofbasis = PETSC_TRUE; 1169534831adSStefano Zampini pcbddc->usechangeonfaces = PETSC_FALSE; 1170da1bb401SStefano Zampini pcbddc->coarse_vec = 0; 1171da1bb401SStefano Zampini pcbddc->coarse_rhs = 0; 1172da1bb401SStefano Zampini pcbddc->coarse_ksp = 0; 1173da1bb401SStefano Zampini pcbddc->coarse_phi_B = 0; 1174da1bb401SStefano Zampini pcbddc->coarse_phi_D = 0; 1175da1bb401SStefano Zampini pcbddc->vec1_P = 0; 1176da1bb401SStefano Zampini pcbddc->vec1_R = 0; 1177da1bb401SStefano Zampini pcbddc->vec2_R = 0; 1178da1bb401SStefano Zampini pcbddc->local_auxmat1 = 0; 1179da1bb401SStefano Zampini pcbddc->local_auxmat2 = 0; 1180da1bb401SStefano Zampini pcbddc->R_to_B = 0; 1181da1bb401SStefano Zampini pcbddc->R_to_D = 0; 1182da1bb401SStefano Zampini pcbddc->ksp_D = 0; 1183da1bb401SStefano Zampini pcbddc->ksp_R = 0; 1184da1bb401SStefano Zampini pcbddc->local_primal_indices = 0; 1185da1bb401SStefano Zampini pcbddc->prec_type = PETSC_FALSE; 1186da1bb401SStefano Zampini pcbddc->NeumannBoundaries = 0; 1187da1bb401SStefano Zampini pcbddc->ISForDofs = 0; 1188da1bb401SStefano Zampini pcbddc->ISForVertices = 0; 
1189da1bb401SStefano Zampini pcbddc->n_ISForFaces = 0; 1190da1bb401SStefano Zampini pcbddc->n_ISForEdges = 0; 1191da1bb401SStefano Zampini pcbddc->ConstraintMatrix = 0; 1192da1bb401SStefano Zampini pcbddc->use_nnsp_true = PETSC_FALSE; 1193da1bb401SStefano Zampini pcbddc->local_primal_sizes = 0; 1194da1bb401SStefano Zampini pcbddc->local_primal_displacements = 0; 1195da1bb401SStefano Zampini pcbddc->replicated_local_primal_indices = 0; 1196da1bb401SStefano Zampini pcbddc->replicated_local_primal_values = 0; 1197da1bb401SStefano Zampini pcbddc->coarse_loc_to_glob = 0; 1198da1bb401SStefano Zampini pcbddc->dbg_flag = PETSC_FALSE; 1199da1bb401SStefano Zampini pcbddc->coarsening_ratio = 8; 1200b76ba322SStefano Zampini pcbddc->use_exact_dirichlet = PETSC_TRUE; 12014fad6a16SStefano Zampini pcbddc->current_level = 0; 12024fad6a16SStefano Zampini pcbddc->max_levels = 1; 1203da1bb401SStefano Zampini 1204da1bb401SStefano Zampini /* allocate and initialize needed graph structure */ 1205da1bb401SStefano Zampini ierr = PetscMalloc(sizeof(*mat_graph),&pcbddc->mat_graph);CHKERRQ(ierr); 1206da1bb401SStefano Zampini pcbddc->mat_graph->xadj = 0; 1207da1bb401SStefano Zampini pcbddc->mat_graph->adjncy = 0; 1208da1bb401SStefano Zampini 1209da1bb401SStefano Zampini /* function pointers */ 1210da1bb401SStefano Zampini pc->ops->apply = PCApply_BDDC; 1211da1bb401SStefano Zampini pc->ops->applytranspose = 0; 1212da1bb401SStefano Zampini pc->ops->setup = PCSetUp_BDDC; 1213da1bb401SStefano Zampini pc->ops->destroy = PCDestroy_BDDC; 1214da1bb401SStefano Zampini pc->ops->setfromoptions = PCSetFromOptions_BDDC; 1215da1bb401SStefano Zampini pc->ops->view = 0; 1216da1bb401SStefano Zampini pc->ops->applyrichardson = 0; 1217da1bb401SStefano Zampini pc->ops->applysymmetricleft = 0; 1218da1bb401SStefano Zampini pc->ops->applysymmetricright = 0; 1219534831adSStefano Zampini pc->ops->presolve = PCPreSolve_BDDC; 1220534831adSStefano Zampini pc->ops->postsolve = PCPostSolve_BDDC; 1221da1bb401SStefano 
Zampini 1222da1bb401SStefano Zampini /* composing function */ 12234fad6a16SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseningRatio_C","PCBDDCSetCoarseningRatio_BDDC", 12244fad6a16SStefano Zampini PCBDDCSetCoarseningRatio_BDDC);CHKERRQ(ierr); 12254fad6a16SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetMaxLevels_C","PCBDDCSetMaxLevels_BDDC", 12264fad6a16SStefano Zampini PCBDDCSetMaxLevels_BDDC);CHKERRQ(ierr); 12270bdf917eSStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNullSpace_C","PCBDDCSetNullSpace_BDDC", 12280bdf917eSStefano Zampini PCBDDCSetNullSpace_BDDC);CHKERRQ(ierr); 1229da1bb401SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDirichletBoundaries_C","PCBDDCSetDirichletBoundaries_BDDC", 1230da1bb401SStefano Zampini PCBDDCSetDirichletBoundaries_BDDC);CHKERRQ(ierr); 1231da1bb401SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNeumannBoundaries_C","PCBDDCSetNeumannBoundaries_BDDC", 1232da1bb401SStefano Zampini PCBDDCSetNeumannBoundaries_BDDC);CHKERRQ(ierr); 1233da1bb401SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetDirichletBoundaries_C","PCBDDCGetDirichletBoundaries_BDDC", 1234da1bb401SStefano Zampini PCBDDCGetDirichletBoundaries_BDDC);CHKERRQ(ierr); 1235da1bb401SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetNeumannBoundaries_C","PCBDDCGetNeumannBoundaries_BDDC", 1236da1bb401SStefano Zampini PCBDDCGetNeumannBoundaries_BDDC);CHKERRQ(ierr); 1237da1bb401SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseProblemType_C","PCBDDCSetCoarseProblemType_BDDC", 1238da1bb401SStefano Zampini PCBDDCSetCoarseProblemType_BDDC);CHKERRQ(ierr); 1239da1bb401SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDofsSplitting_C","PCBDDCSetDofsSplitting_BDDC", 
1240da1bb401SStefano Zampini PCBDDCSetDofsSplitting_BDDC);CHKERRQ(ierr); 1241da1bb401SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetLocalAdjacencyGraph_C","PCBDDCSetLocalAdjacencyGraph_BDDC", 1242da1bb401SStefano Zampini PCBDDCSetLocalAdjacencyGraph_BDDC);CHKERRQ(ierr); 1243534831adSStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPreSolve_C","PCPreSolve_BDDC", 1244534831adSStefano Zampini PCPreSolve_BDDC);CHKERRQ(ierr); 1245534831adSStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPostSolve_C","PCPostSolve_BDDC", 1246534831adSStefano Zampini PCPostSolve_BDDC);CHKERRQ(ierr); 12473425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCCreateFETIDPOperators_C","PCBDDCCreateFETIDPOperators_BDDC", 12483425bc38SStefano Zampini PCBDDCCreateFETIDPOperators_BDDC);CHKERRQ(ierr); 12493425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetRHS_C","PCBDDCMatFETIDPGetRHS_BDDC", 12503425bc38SStefano Zampini PCBDDCMatFETIDPGetRHS_BDDC);CHKERRQ(ierr); 12513425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetSolution_C","PCBDDCMatFETIDPGetSolution_BDDC", 12523425bc38SStefano Zampini PCBDDCMatFETIDPGetSolution_BDDC);CHKERRQ(ierr); 1253da1bb401SStefano Zampini PetscFunctionReturn(0); 1254da1bb401SStefano Zampini } 1255da1bb401SStefano Zampini EXTERN_C_END 12563425bc38SStefano Zampini 1257da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */ 1258da1bb401SStefano Zampini /* All static functions from now on */ 1259da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */ 12604fad6a16SStefano Zampini #undef __FUNCT__ 12612e8d2280SStefano Zampini #define __FUNCT__ "PCBDDCSetUseExactDirichlet" 12622e8d2280SStefano Zampini static PetscErrorCode PCBDDCSetUseExactDirichlet(PC 
pc,PetscBool use) 12632e8d2280SStefano Zampini { 12642e8d2280SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 12652e8d2280SStefano Zampini 12662e8d2280SStefano Zampini PetscFunctionBegin; 12672e8d2280SStefano Zampini pcbddc->use_exact_dirichlet=use; 12682e8d2280SStefano Zampini PetscFunctionReturn(0); 12692e8d2280SStefano Zampini } 12702e8d2280SStefano Zampini 12712e8d2280SStefano Zampini #undef __FUNCT__ 12724fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetLevel" 12734fad6a16SStefano Zampini static PetscErrorCode PCBDDCSetLevel(PC pc,PetscInt level) 12744fad6a16SStefano Zampini { 12754fad6a16SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 12764fad6a16SStefano Zampini 12774fad6a16SStefano Zampini PetscFunctionBegin; 12784fad6a16SStefano Zampini pcbddc->current_level=level; 12794fad6a16SStefano Zampini PetscFunctionReturn(0); 12804fad6a16SStefano Zampini } 12813425bc38SStefano Zampini 12823425bc38SStefano Zampini #undef __FUNCT__ 12830bdf917eSStefano Zampini #define __FUNCT__ "PCBDDCAdaptNullSpace" 12840bdf917eSStefano Zampini static PetscErrorCode PCBDDCAdaptNullSpace(PC pc) 12850bdf917eSStefano Zampini { 12860bdf917eSStefano Zampini PC_IS* pcis = (PC_IS*) (pc->data); 12870bdf917eSStefano Zampini PC_BDDC* pcbddc = (PC_BDDC*)(pc->data); 12880bdf917eSStefano Zampini KSP inv_change; 12890bdf917eSStefano Zampini PC pc_change; 12900bdf917eSStefano Zampini const Vec *nsp_vecs; 12910bdf917eSStefano Zampini Vec *new_nsp_vecs; 12920bdf917eSStefano Zampini PetscInt i,nsp_size,new_nsp_size,start_new; 12930bdf917eSStefano Zampini PetscBool nsp_has_cnst; 12940bdf917eSStefano Zampini MatNullSpace new_nsp; 12950bdf917eSStefano Zampini PetscErrorCode ierr; 12960bdf917eSStefano Zampini 12970bdf917eSStefano Zampini PetscFunctionBegin; 12980bdf917eSStefano Zampini ierr = MatNullSpaceGetVecs(pcbddc->NullSpace,&nsp_has_cnst,&nsp_size,&nsp_vecs);CHKERRQ(ierr); 12990bdf917eSStefano Zampini ierr = KSPCreate(PETSC_COMM_SELF,&inv_change);CHKERRQ(ierr); 13000bdf917eSStefano 
Zampini ierr = KSPSetOperators(inv_change,pcbddc->ChangeOfBasisMatrix,pcbddc->ChangeOfBasisMatrix,SAME_PRECONDITIONER);CHKERRQ(ierr); 13010bdf917eSStefano Zampini ierr = KSPSetType(inv_change,KSPPREONLY);CHKERRQ(ierr); 13020bdf917eSStefano Zampini ierr = KSPGetPC(inv_change,&pc_change);CHKERRQ(ierr); 13030bdf917eSStefano Zampini ierr = PCSetType(pc_change,PCLU);CHKERRQ(ierr); 13040bdf917eSStefano Zampini ierr = KSPSetUp(inv_change);CHKERRQ(ierr); 13050bdf917eSStefano Zampini new_nsp_size = nsp_size; 13060bdf917eSStefano Zampini if (nsp_has_cnst) { new_nsp_size++; } 13070bdf917eSStefano Zampini ierr = PetscMalloc(new_nsp_size*sizeof(Vec),&new_nsp_vecs);CHKERRQ(ierr); 13080bdf917eSStefano Zampini for (i=0;i<new_nsp_size;i++) { ierr = VecDuplicate(pcis->vec1_global,&new_nsp_vecs[i]);CHKERRQ(ierr); } 13090bdf917eSStefano Zampini start_new = 0; 13100bdf917eSStefano Zampini if (nsp_has_cnst) { 13110bdf917eSStefano Zampini start_new = 1; 13120bdf917eSStefano Zampini ierr = VecSet(new_nsp_vecs[0],1.0);CHKERRQ(ierr); 13130bdf917eSStefano Zampini ierr = VecSet(pcis->vec1_B,1.0);CHKERRQ(ierr); 13140bdf917eSStefano Zampini ierr = KSPSolve(inv_change,pcis->vec1_B,pcis->vec1_B); 13150bdf917eSStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,new_nsp_vecs[0],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 13160bdf917eSStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,pcis->vec1_B,new_nsp_vecs[0],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 13170bdf917eSStefano Zampini } 13180bdf917eSStefano Zampini for (i=0;i<nsp_size;i++) { 13190bdf917eSStefano Zampini ierr = VecCopy(nsp_vecs[i],new_nsp_vecs[i+start_new]);CHKERRQ(ierr); 13200bdf917eSStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,nsp_vecs[i],pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 13210bdf917eSStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,nsp_vecs[i],pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 13220bdf917eSStefano Zampini ierr = 
KSPSolve(inv_change,pcis->vec1_B,pcis->vec1_B); 13230bdf917eSStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,new_nsp_vecs[i+start_new],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 13240bdf917eSStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,pcis->vec1_B,new_nsp_vecs[i+start_new],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 13250bdf917eSStefano Zampini } 13260bdf917eSStefano Zampini ierr = VecNormalize(new_nsp_vecs[0],PETSC_NULL);CHKERRQ(ierr); 13270bdf917eSStefano Zampini /* TODO : Orthonormalize vecs when new_nsp_size > 0! */ 13280bdf917eSStefano Zampini 13290bdf917eSStefano Zampini /*PetscBool nsp_t=PETSC_FALSE; 13300bdf917eSStefano Zampini ierr = MatNullSpaceTest(pcbddc->NullSpace,pc->pmat,&nsp_t);CHKERRQ(ierr); 13310bdf917eSStefano Zampini printf("Original Null Space test: %d\n",nsp_t); 13320bdf917eSStefano Zampini Mat temp_mat; 13330bdf917eSStefano Zampini Mat_IS* matis = (Mat_IS*)pc->pmat->data; 13340bdf917eSStefano Zampini temp_mat = matis->A; 13350bdf917eSStefano Zampini matis->A = pcbddc->local_mat; 13360bdf917eSStefano Zampini pcbddc->local_mat = temp_mat; 13370bdf917eSStefano Zampini ierr = MatNullSpaceTest(pcbddc->NullSpace,pc->pmat,&nsp_t);CHKERRQ(ierr); 13380bdf917eSStefano Zampini printf("Original Null Space, mat changed test: %d\n",nsp_t); 13390bdf917eSStefano Zampini { 13400bdf917eSStefano Zampini PetscReal test_norm; 13410bdf917eSStefano Zampini for (i=0;i<new_nsp_size;i++) { 13420bdf917eSStefano Zampini ierr = MatMult(pc->pmat,new_nsp_vecs[i],pcis->vec1_global);CHKERRQ(ierr); 13430bdf917eSStefano Zampini ierr = VecNorm(pcis->vec1_global,NORM_2,&test_norm);CHKERRQ(ierr); 13440bdf917eSStefano Zampini if (test_norm > 1.e-12) { 13450bdf917eSStefano Zampini printf("------------ERROR VEC %d------------------\n",i); 13460bdf917eSStefano Zampini ierr = VecView(pcis->vec1_global,PETSC_VIEWER_STDOUT_WORLD); 13470bdf917eSStefano Zampini printf("------------------------------------------\n"); 13480bdf917eSStefano Zampini } 
13490bdf917eSStefano Zampini } 13500bdf917eSStefano Zampini }*/ 13510bdf917eSStefano Zampini 13520bdf917eSStefano Zampini ierr = KSPDestroy(&inv_change);CHKERRQ(ierr); 13530bdf917eSStefano Zampini ierr = MatNullSpaceCreate(((PetscObject)pc)->comm,PETSC_FALSE,new_nsp_size,new_nsp_vecs,&new_nsp);CHKERRQ(ierr); 13540bdf917eSStefano Zampini ierr = PCBDDCSetNullSpace(pc,new_nsp);CHKERRQ(ierr); 13550bdf917eSStefano Zampini ierr = MatNullSpaceDestroy(&new_nsp);CHKERRQ(ierr); 13560bdf917eSStefano Zampini /* 13570bdf917eSStefano Zampini ierr = MatNullSpaceTest(pcbddc->NullSpace,pc->pmat,&nsp_t);CHKERRQ(ierr); 13580bdf917eSStefano Zampini printf("New Null Space, mat changed: %d\n",nsp_t); 13590bdf917eSStefano Zampini temp_mat = matis->A; 13600bdf917eSStefano Zampini matis->A = pcbddc->local_mat; 13610bdf917eSStefano Zampini pcbddc->local_mat = temp_mat; 13620bdf917eSStefano Zampini ierr = MatNullSpaceTest(pcbddc->NullSpace,pc->pmat,&nsp_t);CHKERRQ(ierr); 13630bdf917eSStefano Zampini printf("New Null Space, mat original: %d\n",nsp_t);*/ 13640bdf917eSStefano Zampini 13650bdf917eSStefano Zampini for (i=0;i<new_nsp_size;i++) { ierr = VecDestroy(&new_nsp_vecs[i]);CHKERRQ(ierr); } 13660bdf917eSStefano Zampini ierr = PetscFree(new_nsp_vecs);CHKERRQ(ierr); 13670bdf917eSStefano Zampini PetscFunctionReturn(0); 13680bdf917eSStefano Zampini } 13690bdf917eSStefano Zampini 13700bdf917eSStefano Zampini #undef __FUNCT__ 13713425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPMatContext" 13723425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPMatContext(PC pc, FETIDPMat_ctx **fetidpmat_ctx) 13733425bc38SStefano Zampini { 13743425bc38SStefano Zampini FETIDPMat_ctx *newctx; 13753425bc38SStefano Zampini PetscErrorCode ierr; 13763425bc38SStefano Zampini 13773425bc38SStefano Zampini PetscFunctionBegin; 13783425bc38SStefano Zampini ierr = PetscMalloc(sizeof(*newctx),&newctx);CHKERRQ(ierr); 13793425bc38SStefano Zampini newctx->lambda_local = 0; 13803425bc38SStefano Zampini 
newctx->temp_solution_B = 0; 13813425bc38SStefano Zampini newctx->temp_solution_D = 0; 13823425bc38SStefano Zampini newctx->B_delta = 0; 13833425bc38SStefano Zampini newctx->B_Ddelta = 0; /* theoretically belongs to the FETIDP preconditioner */ 13843425bc38SStefano Zampini newctx->l2g_lambda = 0; 13853425bc38SStefano Zampini /* increase the reference count for BDDC preconditioner */ 13863425bc38SStefano Zampini ierr = PetscObjectReference((PetscObject)pc);CHKERRQ(ierr); 13873425bc38SStefano Zampini newctx->pc = pc; 13883425bc38SStefano Zampini *fetidpmat_ctx = newctx; 13893425bc38SStefano Zampini PetscFunctionReturn(0); 13903425bc38SStefano Zampini } 13913425bc38SStefano Zampini 13923425bc38SStefano Zampini #undef __FUNCT__ 13933425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPPCContext" 13943425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPPCContext(PC pc, FETIDPPC_ctx **fetidppc_ctx) 13953425bc38SStefano Zampini { 13963425bc38SStefano Zampini FETIDPPC_ctx *newctx; 13973425bc38SStefano Zampini PetscErrorCode ierr; 13983425bc38SStefano Zampini 13993425bc38SStefano Zampini PetscFunctionBegin; 14003425bc38SStefano Zampini ierr = PetscMalloc(sizeof(*newctx),&newctx);CHKERRQ(ierr); 14013425bc38SStefano Zampini newctx->lambda_local = 0; 14023425bc38SStefano Zampini newctx->B_Ddelta = 0; 14033425bc38SStefano Zampini newctx->l2g_lambda = 0; 14043425bc38SStefano Zampini /* increase the reference count for BDDC preconditioner */ 14053425bc38SStefano Zampini ierr = PetscObjectReference((PetscObject)pc);CHKERRQ(ierr); 14063425bc38SStefano Zampini newctx->pc = pc; 14073425bc38SStefano Zampini *fetidppc_ctx = newctx; 14083425bc38SStefano Zampini PetscFunctionReturn(0); 14093425bc38SStefano Zampini } 14103425bc38SStefano Zampini 14113425bc38SStefano Zampini #undef __FUNCT__ 14123425bc38SStefano Zampini #define __FUNCT__ "PCBDDCDestroyFETIDPMat" 14133425bc38SStefano Zampini static PetscErrorCode PCBDDCDestroyFETIDPMat(Mat A) 14143425bc38SStefano Zampini 
{ 14153425bc38SStefano Zampini FETIDPMat_ctx *mat_ctx; 14163425bc38SStefano Zampini PetscErrorCode ierr; 14173425bc38SStefano Zampini 14183425bc38SStefano Zampini PetscFunctionBegin; 14193425bc38SStefano Zampini ierr = MatShellGetContext(A,(void**)&mat_ctx);CHKERRQ(ierr); 14203425bc38SStefano Zampini ierr = VecDestroy(&mat_ctx->lambda_local);CHKERRQ(ierr); 14213425bc38SStefano Zampini ierr = VecDestroy(&mat_ctx->temp_solution_D);CHKERRQ(ierr); 14223425bc38SStefano Zampini ierr = VecDestroy(&mat_ctx->temp_solution_B);CHKERRQ(ierr); 14233425bc38SStefano Zampini ierr = MatDestroy(&mat_ctx->B_delta);CHKERRQ(ierr); 14243425bc38SStefano Zampini ierr = MatDestroy(&mat_ctx->B_Ddelta);CHKERRQ(ierr); 14253425bc38SStefano Zampini ierr = VecScatterDestroy(&mat_ctx->l2g_lambda);CHKERRQ(ierr); 14263425bc38SStefano Zampini ierr = PCDestroy(&mat_ctx->pc);CHKERRQ(ierr); /* actually it does not destroy BDDC, only decrease its reference count */ 14273425bc38SStefano Zampini ierr = PetscFree(mat_ctx);CHKERRQ(ierr); 14283425bc38SStefano Zampini PetscFunctionReturn(0); 14293425bc38SStefano Zampini } 14303425bc38SStefano Zampini 14313425bc38SStefano Zampini #undef __FUNCT__ 14323425bc38SStefano Zampini #define __FUNCT__ "PCBDDCDestroyFETIDPPC" 14333425bc38SStefano Zampini static PetscErrorCode PCBDDCDestroyFETIDPPC(PC pc) 14343425bc38SStefano Zampini { 14353425bc38SStefano Zampini FETIDPPC_ctx *pc_ctx; 14363425bc38SStefano Zampini PetscErrorCode ierr; 14373425bc38SStefano Zampini 14383425bc38SStefano Zampini PetscFunctionBegin; 14393425bc38SStefano Zampini ierr = PCShellGetContext(pc,(void**)&pc_ctx);CHKERRQ(ierr); 14403425bc38SStefano Zampini ierr = VecDestroy(&pc_ctx->lambda_local);CHKERRQ(ierr); 14413425bc38SStefano Zampini ierr = MatDestroy(&pc_ctx->B_Ddelta);CHKERRQ(ierr); 14423425bc38SStefano Zampini ierr = VecScatterDestroy(&pc_ctx->l2g_lambda);CHKERRQ(ierr); 14433425bc38SStefano Zampini ierr = PCDestroy(&pc_ctx->pc);CHKERRQ(ierr); /* actually it does not destroy BDDC, only 
decrease its reference count */ 14443425bc38SStefano Zampini ierr = PetscFree(pc_ctx);CHKERRQ(ierr); 14453425bc38SStefano Zampini PetscFunctionReturn(0); 14463425bc38SStefano Zampini } 14473425bc38SStefano Zampini 14483425bc38SStefano Zampini #undef __FUNCT__ 14493425bc38SStefano Zampini #define __FUNCT__ "PCBDDCSetupFETIDPMatContext" 14503425bc38SStefano Zampini static PetscErrorCode PCBDDCSetupFETIDPMatContext(FETIDPMat_ctx *fetidpmat_ctx ) 14513425bc38SStefano Zampini { 14523425bc38SStefano Zampini PetscErrorCode ierr; 14533425bc38SStefano Zampini PC_IS *pcis=(PC_IS*)fetidpmat_ctx->pc->data; 14543425bc38SStefano Zampini PC_BDDC *pcbddc=(PC_BDDC*)fetidpmat_ctx->pc->data; 14553425bc38SStefano Zampini PCBDDCGraph mat_graph=pcbddc->mat_graph; 14563425bc38SStefano Zampini Mat_IS *matis = (Mat_IS*)fetidpmat_ctx->pc->pmat->data; 14573425bc38SStefano Zampini MPI_Comm comm = ((PetscObject)(fetidpmat_ctx->pc))->comm; 14583425bc38SStefano Zampini 14593425bc38SStefano Zampini Mat ScalingMat; 14603425bc38SStefano Zampini Vec lambda_global; 14613425bc38SStefano Zampini IS IS_l2g_lambda; 14623425bc38SStefano Zampini 14633425bc38SStefano Zampini PetscBool skip_node,fully_redundant; 1464*ef028eecSStefano Zampini PetscInt i,j,k,s,n_boundary_dofs,n_global_lambda,n_vertices,partial_sum; 14653425bc38SStefano Zampini PetscInt n_local_lambda,n_lambda_for_dof,dual_size,n_neg_values,n_pos_values; 1466*ef028eecSStefano Zampini PetscMPIInt rank,nprocs; 14673425bc38SStefano Zampini PetscScalar scalar_value; 14683425bc38SStefano Zampini 14693425bc38SStefano Zampini PetscInt *vertex_indices,*temp_indices; 14703425bc38SStefano Zampini PetscInt *dual_dofs_boundary_indices,*aux_local_numbering_1,*aux_global_numbering; 14713425bc38SStefano Zampini PetscInt *aux_sums,*cols_B_delta,*l2g_indices; 14723425bc38SStefano Zampini PetscScalar *array,*scaling_factors,*vals_B_delta; 1473*ef028eecSStefano Zampini PetscInt *aux_local_numbering_2,*dof_sizes,*dof_displs; 1474*ef028eecSStefano Zampini PetscInt 
first_index,old_index; 1475*ef028eecSStefano Zampini PetscBool first_found = PETSC_FALSE; 14763425bc38SStefano Zampini 14773425bc38SStefano Zampini /* For communication of scaling factors */ 14783425bc38SStefano Zampini PetscInt *ptrs_buffer,neigh_position; 14793425bc38SStefano Zampini PetscScalar **all_factors,*send_buffer,*recv_buffer; 14803425bc38SStefano Zampini MPI_Request *send_reqs,*recv_reqs; 14813425bc38SStefano Zampini 14823425bc38SStefano Zampini /* tests */ 14833425bc38SStefano Zampini Vec test_vec; 14843425bc38SStefano Zampini PetscBool test_fetidp; 14853425bc38SStefano Zampini PetscViewer viewer; 14863425bc38SStefano Zampini 14873425bc38SStefano Zampini PetscFunctionBegin; 14883425bc38SStefano Zampini ierr = MPI_Comm_rank(comm,&rank);CHKERRQ(ierr); 14893425bc38SStefano Zampini ierr = MPI_Comm_size(comm,&nprocs);CHKERRQ(ierr); 14903425bc38SStefano Zampini 14913425bc38SStefano Zampini /* Default type of lagrange multipliers is non-redundant */ 14923425bc38SStefano Zampini fully_redundant = PETSC_FALSE; 14933425bc38SStefano Zampini ierr = PetscOptionsGetBool(PETSC_NULL,"-fetidp_fullyredundant",&fully_redundant,PETSC_NULL);CHKERRQ(ierr); 14943425bc38SStefano Zampini 14953425bc38SStefano Zampini /* Evaluate local and global number of lagrange multipliers */ 14963425bc38SStefano Zampini ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr); 14973425bc38SStefano Zampini n_local_lambda = 0; 14983425bc38SStefano Zampini partial_sum = 0; 14993425bc38SStefano Zampini n_boundary_dofs = 0; 15003425bc38SStefano Zampini s = 0; 15013425bc38SStefano Zampini n_vertices = 0; 15023425bc38SStefano Zampini /* Get Vertices used to define the BDDC */ 15033425bc38SStefano Zampini ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(*vertex_indices),&vertex_indices);CHKERRQ(ierr); 15043425bc38SStefano Zampini for (i=0;i<pcbddc->local_primal_size;i++) { 15053425bc38SStefano Zampini ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&j,(const PetscInt**)&temp_indices,PETSC_NULL);CHKERRQ(ierr); 
15063425bc38SStefano Zampini if (j == 1) { 15073425bc38SStefano Zampini vertex_indices[n_vertices]=temp_indices[0]; 15083425bc38SStefano Zampini n_vertices++; 15093425bc38SStefano Zampini } 15103425bc38SStefano Zampini ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&j,(const PetscInt**)&temp_indices,PETSC_NULL);CHKERRQ(ierr); 15113425bc38SStefano Zampini } 15123425bc38SStefano Zampini dual_size = pcis->n_B-n_vertices; 1513f0474715SStefano Zampini ierr = PetscSortInt(n_vertices,vertex_indices);CHKERRQ(ierr); 15143425bc38SStefano Zampini ierr = PetscMalloc(dual_size*sizeof(*dual_dofs_boundary_indices),&dual_dofs_boundary_indices);CHKERRQ(ierr); 15153425bc38SStefano Zampini ierr = PetscMalloc(dual_size*sizeof(*aux_local_numbering_1),&aux_local_numbering_1);CHKERRQ(ierr); 15163425bc38SStefano Zampini ierr = PetscMalloc(dual_size*sizeof(*aux_local_numbering_2),&aux_local_numbering_2);CHKERRQ(ierr); 15173425bc38SStefano Zampini 15183425bc38SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 15193425bc38SStefano Zampini for (i=0;i<pcis->n;i++){ 15203425bc38SStefano Zampini j = mat_graph->count[i]; /* RECALL: mat_graph->count[i] does not count myself */ 1521c6582918SStefano Zampini k = 0; 1522c6582918SStefano Zampini if (j > 0) { 15233425bc38SStefano Zampini k = (mat_graph->neighbours_set[i][0] == -1 ? 
1 : 0); 1524c6582918SStefano Zampini } 15253425bc38SStefano Zampini j = j - k ; 15263425bc38SStefano Zampini if ( j > 0 ) { n_boundary_dofs++; } 15273425bc38SStefano Zampini 15283425bc38SStefano Zampini skip_node = PETSC_FALSE; 1529c6582918SStefano Zampini if ( s < n_vertices && vertex_indices[s]==i) { /* it works for a sorted set of vertices */ 15303425bc38SStefano Zampini skip_node = PETSC_TRUE; 15313425bc38SStefano Zampini s++; 15323425bc38SStefano Zampini } 15333425bc38SStefano Zampini if (j < 1) {skip_node = PETSC_TRUE;} 15343425bc38SStefano Zampini if ( !skip_node ) { 15353425bc38SStefano Zampini if (fully_redundant) { 15363425bc38SStefano Zampini /* fully redundant set of lagrange multipliers */ 15373425bc38SStefano Zampini n_lambda_for_dof = (j*(j+1))/2; 15383425bc38SStefano Zampini } else { 15393425bc38SStefano Zampini n_lambda_for_dof = j; 15403425bc38SStefano Zampini } 15413425bc38SStefano Zampini n_local_lambda += j; 15423425bc38SStefano Zampini /* needed to evaluate global number of lagrange multipliers */ 15433425bc38SStefano Zampini array[i]=(1.0*n_lambda_for_dof)/(j+1.0); /* already scaled for the next global sum */ 15443425bc38SStefano Zampini /* store some data needed */ 15453425bc38SStefano Zampini dual_dofs_boundary_indices[partial_sum] = n_boundary_dofs-1; 15463425bc38SStefano Zampini aux_local_numbering_1[partial_sum] = i; 1547*ef028eecSStefano Zampini aux_local_numbering_2[partial_sum] = n_lambda_for_dof; 15483425bc38SStefano Zampini partial_sum++; 15493425bc38SStefano Zampini } 15503425bc38SStefano Zampini } 15513425bc38SStefano Zampini /*printf("I found %d local lambda dofs\n",n_local_lambda); 15523425bc38SStefano Zampini printf("I found %d boundary dofs (should be %d)\n",n_boundary_dofs,pcis->n_B); 15533425bc38SStefano Zampini printf("Partial sum %d should be %d\n",partial_sum,dual_size);*/ 15543425bc38SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 1555*ef028eecSStefano Zampini 15563425bc38SStefano Zampini ierr 
= VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 15573425bc38SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 15583425bc38SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 15593425bc38SStefano Zampini ierr = VecSum(pcis->vec1_global,&scalar_value);CHKERRQ(ierr); 15603425bc38SStefano Zampini fetidpmat_ctx->n_lambda = (PetscInt) scalar_value; 15613425bc38SStefano Zampini /* printf("I found %d global multipliers (%f)\n",fetidpmat_ctx->n_lambda,scalar_value); */ 15623425bc38SStefano Zampini 15633425bc38SStefano Zampini /* compute global ordering of lagrange multipliers and associate l2g map */ 1564*ef028eecSStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 1565*ef028eecSStefano Zampini ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr); 1566*ef028eecSStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 1567*ef028eecSStefano Zampini for (i=0;i<dual_size;i++) { 1568*ef028eecSStefano Zampini array[aux_local_numbering_1[i]] = aux_local_numbering_2[i]; 1569*ef028eecSStefano Zampini } 1570*ef028eecSStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 1571*ef028eecSStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 1572*ef028eecSStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 1573*ef028eecSStefano Zampini ierr = VecSum(pcis->vec1_global,&scalar_value);CHKERRQ(ierr); 1574*ef028eecSStefano Zampini if (pcbddc->dbg_flag && (PetscInt)scalar_value != fetidpmat_ctx->n_lambda) { 1575*ef028eecSStefano Zampini SETERRQ3(PETSC_COMM_WORLD,PETSC_ERR_PLIB,"Error in %s: global number of multipliers mismatch! 
(%d!=%d)\n",__FUNCT__,(PetscInt)scalar_value,fetidpmat_ctx->n_lambda); 1576*ef028eecSStefano Zampini } 15773425bc38SStefano Zampini 1578*ef028eecSStefano Zampini /* Fill pcis->vec1_global with cumulative function for global numbering */ 1579*ef028eecSStefano Zampini ierr = VecGetArray(pcis->vec1_global,&array);CHKERRQ(ierr); 1580*ef028eecSStefano Zampini ierr = VecGetLocalSize(pcis->vec1_global,&s);CHKERRQ(ierr); 1581*ef028eecSStefano Zampini k = 0; 1582*ef028eecSStefano Zampini first_index = -1; 1583*ef028eecSStefano Zampini for (i=0;i<s;i++) { 1584*ef028eecSStefano Zampini if (!first_found && array[i] > 0.0) { 1585*ef028eecSStefano Zampini first_found = PETSC_TRUE; 1586*ef028eecSStefano Zampini first_index = i; 1587*ef028eecSStefano Zampini } 1588*ef028eecSStefano Zampini k += (PetscInt)array[i]; 1589*ef028eecSStefano Zampini } 1590*ef028eecSStefano Zampini j = ( !rank ? nprocs : 0); 15913425bc38SStefano Zampini ierr = PetscMalloc(j*sizeof(*dof_sizes),&dof_sizes);CHKERRQ(ierr); 15923425bc38SStefano Zampini ierr = PetscMalloc(j*sizeof(*dof_displs),&dof_displs);CHKERRQ(ierr); 1593*ef028eecSStefano Zampini ierr = MPI_Gather(&k,1,MPIU_INT,dof_sizes,1,MPIU_INT,0,comm);CHKERRQ(ierr); 1594*ef028eecSStefano Zampini if (!rank) { 15953425bc38SStefano Zampini dof_displs[0]=0; 15963425bc38SStefano Zampini for (i=1;i<nprocs;i++) { 15973425bc38SStefano Zampini dof_displs[i] = dof_displs[i-1]+dof_sizes[i-1]; 15983425bc38SStefano Zampini } 15993425bc38SStefano Zampini } 1600*ef028eecSStefano Zampini ierr = MPI_Scatter(dof_displs,1,MPIU_INT,&k,1,MPIU_INT,0,comm);CHKERRQ(ierr); 1601*ef028eecSStefano Zampini if (first_found) { 1602*ef028eecSStefano Zampini array[first_index] += k; 1603*ef028eecSStefano Zampini old_index = first_index; 1604*ef028eecSStefano Zampini for (i=first_index+1;i<s;i++) { 1605*ef028eecSStefano Zampini if (array[i] > 0.0) { 1606*ef028eecSStefano Zampini array[i] += array[old_index]; 1607*ef028eecSStefano Zampini old_index = i; 1608*ef028eecSStefano Zampini } 
1609*ef028eecSStefano Zampini } 1610*ef028eecSStefano Zampini } 1611*ef028eecSStefano Zampini ierr = VecRestoreArray(pcis->vec1_global,&array);CHKERRQ(ierr); 1612*ef028eecSStefano Zampini ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr); 1613*ef028eecSStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1614*ef028eecSStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1615*ef028eecSStefano Zampini ierr = PetscMalloc(dual_size*sizeof(*aux_global_numbering),&aux_global_numbering);CHKERRQ(ierr); 1616*ef028eecSStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 16173425bc38SStefano Zampini for (i=0;i<dual_size;i++) { 1618*ef028eecSStefano Zampini aux_global_numbering[i] = (PetscInt)array[aux_local_numbering_1[i]]-aux_local_numbering_2[i]; 16193425bc38SStefano Zampini } 1620*ef028eecSStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 1621f0474715SStefano Zampini ierr = PetscFree(aux_local_numbering_2);CHKERRQ(ierr); 1622f0474715SStefano Zampini ierr = PetscFree(dof_displs);CHKERRQ(ierr); 1623f0474715SStefano Zampini ierr = PetscFree(dof_sizes);CHKERRQ(ierr); 16243425bc38SStefano Zampini 16253425bc38SStefano Zampini /* init data for scaling factors exchange */ 16263425bc38SStefano Zampini partial_sum = 0; 16273425bc38SStefano Zampini j = 0; 16283425bc38SStefano Zampini ierr = PetscMalloc(pcis->n_neigh*sizeof(PetscInt),&ptrs_buffer);CHKERRQ(ierr); 16293425bc38SStefano Zampini ierr = PetscMalloc((pcis->n_neigh-1)*sizeof(MPI_Request),&send_reqs);CHKERRQ(ierr); 16303425bc38SStefano Zampini ierr = PetscMalloc((pcis->n_neigh-1)*sizeof(MPI_Request),&recv_reqs);CHKERRQ(ierr); 16313425bc38SStefano Zampini ierr = PetscMalloc(pcis->n*sizeof(PetscScalar*),&all_factors);CHKERRQ(ierr); 16323425bc38SStefano Zampini ptrs_buffer[0]=0; 16333425bc38SStefano Zampini for (i=1;i<pcis->n_neigh;i++) { 
16343425bc38SStefano Zampini partial_sum += pcis->n_shared[i]; 16353425bc38SStefano Zampini ptrs_buffer[i] = ptrs_buffer[i-1]+pcis->n_shared[i]; 16363425bc38SStefano Zampini } 16373425bc38SStefano Zampini ierr = PetscMalloc( partial_sum*sizeof(PetscScalar),&send_buffer);CHKERRQ(ierr); 16383425bc38SStefano Zampini ierr = PetscMalloc( partial_sum*sizeof(PetscScalar),&recv_buffer);CHKERRQ(ierr); 16393425bc38SStefano Zampini ierr = PetscMalloc( partial_sum*sizeof(PetscScalar),&all_factors[0]);CHKERRQ(ierr); 16403425bc38SStefano Zampini for (i=0;i<pcis->n-1;i++) { 16413425bc38SStefano Zampini j = mat_graph->count[i]; 16423425bc38SStefano Zampini if (j>0) { 16433425bc38SStefano Zampini k = (mat_graph->neighbours_set[i][0] == -1 ? 1 : 0); 16443425bc38SStefano Zampini j = j - k; 16453425bc38SStefano Zampini } 16463425bc38SStefano Zampini all_factors[i+1]=all_factors[i]+j; 16473425bc38SStefano Zampini } 16483425bc38SStefano Zampini /* scatter B scaling to N vec */ 16493425bc38SStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->D,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 16503425bc38SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->D,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 16513425bc38SStefano Zampini /* communications */ 16523425bc38SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 16533425bc38SStefano Zampini for (i=1;i<pcis->n_neigh;i++) { 16543425bc38SStefano Zampini for (j=0;j<pcis->n_shared[i];j++) { 16553425bc38SStefano Zampini send_buffer[ptrs_buffer[i-1]+j]=array[pcis->shared[i][j]]; 16563425bc38SStefano Zampini } 16573425bc38SStefano Zampini j = ptrs_buffer[i]-ptrs_buffer[i-1]; 1658ea7e1babSStefano Zampini ierr = MPI_Isend(&send_buffer[ptrs_buffer[i-1]],j,MPIU_SCALAR,pcis->neigh[i],0,comm,&send_reqs[i-1]);CHKERRQ(ierr); 1659ea7e1babSStefano Zampini ierr = MPI_Irecv(&recv_buffer[ptrs_buffer[i-1]],j,MPIU_SCALAR,pcis->neigh[i],0,comm,&recv_reqs[i-1]);CHKERRQ(ierr); 16603425bc38SStefano Zampini } 
16613425bc38SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 1662ea7e1babSStefano Zampini ierr = MPI_Waitall((pcis->n_neigh-1),recv_reqs,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 16633425bc38SStefano Zampini /* put values in correct places */ 16643425bc38SStefano Zampini for (i=1;i<pcis->n_neigh;i++) { 16653425bc38SStefano Zampini for (j=0;j<pcis->n_shared[i];j++) { 16663425bc38SStefano Zampini k = pcis->shared[i][j]; 16673425bc38SStefano Zampini neigh_position = 0; 16683425bc38SStefano Zampini while(mat_graph->neighbours_set[k][neigh_position] != pcis->neigh[i]) {neigh_position++;} 16693425bc38SStefano Zampini s = (mat_graph->neighbours_set[k][0] == -1 ? 1 : 0); 16703425bc38SStefano Zampini neigh_position = neigh_position - s; 16713425bc38SStefano Zampini all_factors[k][neigh_position]=recv_buffer[ptrs_buffer[i-1]+j]; 16723425bc38SStefano Zampini } 16733425bc38SStefano Zampini } 1674ea7e1babSStefano Zampini ierr = MPI_Waitall((pcis->n_neigh-1),send_reqs,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 16753425bc38SStefano Zampini ierr = PetscFree(send_reqs);CHKERRQ(ierr); 16763425bc38SStefano Zampini ierr = PetscFree(recv_reqs);CHKERRQ(ierr); 16773425bc38SStefano Zampini ierr = PetscFree(send_buffer);CHKERRQ(ierr); 16783425bc38SStefano Zampini ierr = PetscFree(recv_buffer);CHKERRQ(ierr); 16793425bc38SStefano Zampini ierr = PetscFree(ptrs_buffer);CHKERRQ(ierr); 16803425bc38SStefano Zampini 16813425bc38SStefano Zampini /* Compute B and B_delta (local actions) */ 16823425bc38SStefano Zampini ierr = PetscMalloc(pcis->n_neigh*sizeof(*aux_sums),&aux_sums);CHKERRQ(ierr); 16833425bc38SStefano Zampini ierr = PetscMalloc(n_local_lambda*sizeof(*l2g_indices),&l2g_indices);CHKERRQ(ierr); 16843425bc38SStefano Zampini ierr = PetscMalloc(n_local_lambda*sizeof(*vals_B_delta),&vals_B_delta);CHKERRQ(ierr); 16853425bc38SStefano Zampini ierr = PetscMalloc(n_local_lambda*sizeof(*cols_B_delta),&cols_B_delta);CHKERRQ(ierr); 16863425bc38SStefano Zampini ierr = 
PetscMalloc(n_local_lambda*sizeof(*scaling_factors),&scaling_factors);CHKERRQ(ierr); 16873425bc38SStefano Zampini n_global_lambda=0; 16883425bc38SStefano Zampini partial_sum=0; 16893425bc38SStefano Zampini for (i=0;i<dual_size;i++) { 1690*ef028eecSStefano Zampini n_global_lambda = aux_global_numbering[i]; 16913425bc38SStefano Zampini j = mat_graph->count[aux_local_numbering_1[i]]; 16923425bc38SStefano Zampini k = (mat_graph->neighbours_set[aux_local_numbering_1[i]][0] == -1 ? 1 : 0); 16933425bc38SStefano Zampini j = j - k; 16943425bc38SStefano Zampini aux_sums[0]=0; 16953425bc38SStefano Zampini for (s=1;s<j;s++) { 16963425bc38SStefano Zampini aux_sums[s]=aux_sums[s-1]+j-s+1; 16973425bc38SStefano Zampini } 16983425bc38SStefano Zampini array = all_factors[aux_local_numbering_1[i]]; 16993425bc38SStefano Zampini n_neg_values = 0; 17003425bc38SStefano Zampini while(n_neg_values < j && mat_graph->neighbours_set[aux_local_numbering_1[i]][n_neg_values+k] < rank) {n_neg_values++;} 17013425bc38SStefano Zampini n_pos_values = j - n_neg_values; 17023425bc38SStefano Zampini if (fully_redundant) { 17033425bc38SStefano Zampini for (s=0;s<n_neg_values;s++) { 17043425bc38SStefano Zampini l2g_indices [partial_sum+s]=aux_sums[s]+n_neg_values-s-1+n_global_lambda; 17053425bc38SStefano Zampini cols_B_delta [partial_sum+s]=dual_dofs_boundary_indices[i]; 17063425bc38SStefano Zampini vals_B_delta [partial_sum+s]=-1.0; 17073425bc38SStefano Zampini scaling_factors[partial_sum+s]=array[s]; 17083425bc38SStefano Zampini } 17093425bc38SStefano Zampini for (s=0;s<n_pos_values;s++) { 17103425bc38SStefano Zampini l2g_indices [partial_sum+s+n_neg_values]=aux_sums[n_neg_values]+s+n_global_lambda; 17113425bc38SStefano Zampini cols_B_delta [partial_sum+s+n_neg_values]=dual_dofs_boundary_indices[i]; 17123425bc38SStefano Zampini vals_B_delta [partial_sum+s+n_neg_values]=1.0; 17133425bc38SStefano Zampini scaling_factors[partial_sum+s+n_neg_values]=array[s+n_neg_values]; 17143425bc38SStefano Zampini } 
17153425bc38SStefano Zampini partial_sum += j; 17163425bc38SStefano Zampini } else { 17173425bc38SStefano Zampini /* l2g_indices and default cols and vals of B_delta */ 17183425bc38SStefano Zampini for (s=0;s<j;s++) { 17193425bc38SStefano Zampini l2g_indices [partial_sum+s]=n_global_lambda+s; 17203425bc38SStefano Zampini cols_B_delta [partial_sum+s]=dual_dofs_boundary_indices[i]; 17213425bc38SStefano Zampini vals_B_delta [partial_sum+s]=0.0; 17223425bc38SStefano Zampini } 17233425bc38SStefano Zampini /* B_delta */ 17243425bc38SStefano Zampini if ( n_neg_values > 0 ) { /* there's a rank next to me to the left */ 17253425bc38SStefano Zampini vals_B_delta [partial_sum+n_neg_values-1]=-1.0; 17263425bc38SStefano Zampini } 17273425bc38SStefano Zampini if ( n_neg_values < j ) { /* there's a rank next to me to the right */ 17283425bc38SStefano Zampini vals_B_delta [partial_sum+n_neg_values]=1.0; 17293425bc38SStefano Zampini } 17303425bc38SStefano Zampini /* scaling as in Klawonn-Widlund 1999*/ 17313425bc38SStefano Zampini for (s=0;s<n_neg_values;s++) { 17323425bc38SStefano Zampini scalar_value = 0.0; 17333425bc38SStefano Zampini for (k=0;k<s+1;k++) { 17343425bc38SStefano Zampini scalar_value += array[k]; 17353425bc38SStefano Zampini } 1736*ef028eecSStefano Zampini scaling_factors[partial_sum+s] = -scalar_value; 17373425bc38SStefano Zampini } 17383425bc38SStefano Zampini for (s=0;s<n_pos_values;s++) { 17393425bc38SStefano Zampini scalar_value = 0.0; 17403425bc38SStefano Zampini for (k=s+n_neg_values;k<j;k++) { 17413425bc38SStefano Zampini scalar_value += array[k]; 17423425bc38SStefano Zampini } 17433425bc38SStefano Zampini scaling_factors[partial_sum+s+n_neg_values] = scalar_value; 17443425bc38SStefano Zampini } 17453425bc38SStefano Zampini partial_sum += j; 17463425bc38SStefano Zampini } 17473425bc38SStefano Zampini } 1748*ef028eecSStefano Zampini ierr = PetscFree(aux_global_numbering);CHKERRQ(ierr); 1749f0474715SStefano Zampini ierr = PetscFree(aux_sums);CHKERRQ(ierr); 
1750f0474715SStefano Zampini ierr = PetscFree(aux_local_numbering_1);CHKERRQ(ierr); 1751f0474715SStefano Zampini ierr = PetscFree(dual_dofs_boundary_indices);CHKERRQ(ierr); 17523425bc38SStefano Zampini ierr = PetscFree(all_factors[0]);CHKERRQ(ierr); 17533425bc38SStefano Zampini ierr = PetscFree(all_factors);CHKERRQ(ierr); 17543425bc38SStefano Zampini /* printf("I found %d local lambda dofs when numbering them (should be %d)\n",partial_sum,n_local_lambda); */ 1755f0474715SStefano Zampini 1756f0474715SStefano Zampini /* Local to global mapping of fetidpmat */ 1757f0474715SStefano Zampini ierr = VecCreate(PETSC_COMM_SELF,&fetidpmat_ctx->lambda_local);CHKERRQ(ierr); 1758f0474715SStefano Zampini ierr = VecSetSizes(fetidpmat_ctx->lambda_local,n_local_lambda,n_local_lambda);CHKERRQ(ierr); 1759f0474715SStefano Zampini ierr = VecSetType(fetidpmat_ctx->lambda_local,VECSEQ);CHKERRQ(ierr); 1760f0474715SStefano Zampini ierr = VecCreate(comm,&lambda_global);CHKERRQ(ierr); 1761f0474715SStefano Zampini ierr = VecSetSizes(lambda_global,PETSC_DECIDE,fetidpmat_ctx->n_lambda);CHKERRQ(ierr); 1762f0474715SStefano Zampini ierr = VecSetType(lambda_global,VECMPI);CHKERRQ(ierr); 17633425bc38SStefano Zampini ierr = ISCreateGeneral(comm,n_local_lambda,l2g_indices,PETSC_OWN_POINTER,&IS_l2g_lambda);CHKERRQ(ierr); 17643425bc38SStefano Zampini ierr = VecScatterCreate(fetidpmat_ctx->lambda_local,(IS)0,lambda_global,IS_l2g_lambda,&fetidpmat_ctx->l2g_lambda);CHKERRQ(ierr); 1765f0474715SStefano Zampini ierr = ISDestroy(&IS_l2g_lambda);CHKERRQ(ierr); 17663425bc38SStefano Zampini 17673425bc38SStefano Zampini /* Create local part of B_delta */ 17683425bc38SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&fetidpmat_ctx->B_delta); 17693425bc38SStefano Zampini ierr = MatSetSizes(fetidpmat_ctx->B_delta,n_local_lambda,pcis->n_B,n_local_lambda,pcis->n_B);CHKERRQ(ierr); 17703425bc38SStefano Zampini ierr = MatSetType(fetidpmat_ctx->B_delta,MATSEQAIJ);CHKERRQ(ierr); 17713425bc38SStefano Zampini ierr = 
MatSeqAIJSetPreallocation(fetidpmat_ctx->B_delta,1,PETSC_NULL);CHKERRQ(ierr); 17723425bc38SStefano Zampini ierr = MatSetOption(fetidpmat_ctx->B_delta,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr); 17733425bc38SStefano Zampini for (i=0;i<n_local_lambda;i++) { 17743425bc38SStefano Zampini ierr = MatSetValue(fetidpmat_ctx->B_delta,i,cols_B_delta[i],vals_B_delta[i],INSERT_VALUES);CHKERRQ(ierr); 17753425bc38SStefano Zampini } 1776f0474715SStefano Zampini ierr = PetscFree(vals_B_delta);CHKERRQ(ierr); 17773425bc38SStefano Zampini ierr = MatAssemblyBegin(fetidpmat_ctx->B_delta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 17783425bc38SStefano Zampini ierr = MatAssemblyEnd (fetidpmat_ctx->B_delta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 17793425bc38SStefano Zampini 17803425bc38SStefano Zampini if (fully_redundant) { 17813425bc38SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&ScalingMat); 17823425bc38SStefano Zampini ierr = MatSetSizes(ScalingMat,n_local_lambda,n_local_lambda,n_local_lambda,n_local_lambda);CHKERRQ(ierr); 17833425bc38SStefano Zampini ierr = MatSetType(ScalingMat,MATSEQAIJ);CHKERRQ(ierr); 17843425bc38SStefano Zampini ierr = MatSeqAIJSetPreallocation(ScalingMat,1,PETSC_NULL);CHKERRQ(ierr); 17853425bc38SStefano Zampini for (i=0;i<n_local_lambda;i++) { 17863425bc38SStefano Zampini ierr = MatSetValue(ScalingMat,i,i,scaling_factors[i],INSERT_VALUES);CHKERRQ(ierr); 17873425bc38SStefano Zampini } 17883425bc38SStefano Zampini ierr = MatAssemblyBegin(ScalingMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 17893425bc38SStefano Zampini ierr = MatAssemblyEnd (ScalingMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 17903425bc38SStefano Zampini ierr = MatMatMult(ScalingMat,fetidpmat_ctx->B_delta,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&fetidpmat_ctx->B_Ddelta);CHKERRQ(ierr); 17913425bc38SStefano Zampini ierr = MatDestroy(&ScalingMat);CHKERRQ(ierr); 17923425bc38SStefano Zampini } else { 17933425bc38SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&fetidpmat_ctx->B_Ddelta); 17943425bc38SStefano Zampini ierr = 
MatSetSizes(fetidpmat_ctx->B_Ddelta,n_local_lambda,pcis->n_B,n_local_lambda,pcis->n_B);CHKERRQ(ierr); 17953425bc38SStefano Zampini ierr = MatSetType(fetidpmat_ctx->B_Ddelta,MATSEQAIJ);CHKERRQ(ierr); 17963425bc38SStefano Zampini ierr = MatSeqAIJSetPreallocation(fetidpmat_ctx->B_Ddelta,1,PETSC_NULL);CHKERRQ(ierr); 17973425bc38SStefano Zampini for (i=0;i<n_local_lambda;i++) { 17983425bc38SStefano Zampini ierr = MatSetValue(fetidpmat_ctx->B_Ddelta,i,cols_B_delta[i],scaling_factors[i],INSERT_VALUES);CHKERRQ(ierr); 17993425bc38SStefano Zampini } 18003425bc38SStefano Zampini ierr = MatAssemblyBegin(fetidpmat_ctx->B_Ddelta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 18013425bc38SStefano Zampini ierr = MatAssemblyEnd (fetidpmat_ctx->B_Ddelta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 18023425bc38SStefano Zampini } 1803f0474715SStefano Zampini ierr = PetscFree(scaling_factors);CHKERRQ(ierr); 1804f0474715SStefano Zampini ierr = PetscFree(cols_B_delta);CHKERRQ(ierr); 18053425bc38SStefano Zampini 18063425bc38SStefano Zampini /* Create some vectors needed by fetidp */ 18073425bc38SStefano Zampini ierr = VecDuplicate(pcis->vec1_B,&fetidpmat_ctx->temp_solution_B);CHKERRQ(ierr); 18083425bc38SStefano Zampini ierr = VecDuplicate(pcis->vec1_D,&fetidpmat_ctx->temp_solution_D);CHKERRQ(ierr); 18093425bc38SStefano Zampini 18103425bc38SStefano Zampini test_fetidp = PETSC_FALSE; 18113425bc38SStefano Zampini ierr = PetscOptionsGetBool(PETSC_NULL,"-fetidp_check",&test_fetidp,PETSC_NULL);CHKERRQ(ierr); 18123425bc38SStefano Zampini 18133425bc38SStefano Zampini if (test_fetidp) { 18143425bc38SStefano Zampini 18153425bc38SStefano Zampini ierr = PetscViewerASCIIGetStdout(((PetscObject)(fetidpmat_ctx->pc))->comm,&viewer);CHKERRQ(ierr); 18163425bc38SStefano Zampini ierr = PetscViewerASCIISynchronizedAllow(viewer,PETSC_TRUE);CHKERRQ(ierr); 18173425bc38SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"----------FETI_DP TESTS--------------\n");CHKERRQ(ierr); 18183425bc38SStefano Zampini ierr = 
PetscViewerASCIIPrintf(viewer,"All tests should return zero!\n");CHKERRQ(ierr); 18193425bc38SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"FETIDP MAT context in the ");CHKERRQ(ierr); 18203425bc38SStefano Zampini if (fully_redundant) { 18213425bc38SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"fully redundant case for lagrange multipliers.\n");CHKERRQ(ierr); 18223425bc38SStefano Zampini } else { 18233425bc38SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Non-fully redundant case for lagrange multiplier.\n");CHKERRQ(ierr); 18243425bc38SStefano Zampini } 18253425bc38SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 18263425bc38SStefano Zampini 18273425bc38SStefano Zampini /******************************************************************/ 18283425bc38SStefano Zampini /* TEST A/B: Test numbering of global lambda dofs */ 18293425bc38SStefano Zampini /******************************************************************/ 18303425bc38SStefano Zampini 18313425bc38SStefano Zampini ierr = VecDuplicate(fetidpmat_ctx->lambda_local,&test_vec);CHKERRQ(ierr); 18323425bc38SStefano Zampini ierr = VecSet(lambda_global,1.0);CHKERRQ(ierr); 18333425bc38SStefano Zampini ierr = VecSet(test_vec,1.0);CHKERRQ(ierr); 18343425bc38SStefano Zampini ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 18353425bc38SStefano Zampini ierr = VecScatterEnd (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 18363425bc38SStefano Zampini scalar_value = -1.0; 18373425bc38SStefano Zampini ierr = VecAXPY(test_vec,scalar_value,fetidpmat_ctx->lambda_local);CHKERRQ(ierr); 18383425bc38SStefano Zampini ierr = VecNorm(test_vec,NORM_INFINITY,&scalar_value);CHKERRQ(ierr); 18393425bc38SStefano Zampini ierr = VecDestroy(&test_vec);CHKERRQ(ierr); 18403425bc38SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"A[%04d]: CHECK 
glob to loc: % 1.14e\n",rank,scalar_value);CHKERRQ(ierr); 18413425bc38SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 18423425bc38SStefano Zampini if (fully_redundant) { 18433425bc38SStefano Zampini ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr); 18443425bc38SStefano Zampini ierr = VecSet(fetidpmat_ctx->lambda_local,0.5);CHKERRQ(ierr); 18453425bc38SStefano Zampini ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 18463425bc38SStefano Zampini ierr = VecScatterEnd (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 18473425bc38SStefano Zampini ierr = VecSum(lambda_global,&scalar_value);CHKERRQ(ierr); 18483425bc38SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"B[%04d]: CHECK loc to glob: % 1.14e\n",rank,scalar_value-fetidpmat_ctx->n_lambda);CHKERRQ(ierr); 18493425bc38SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 18503425bc38SStefano Zampini } 18513425bc38SStefano Zampini 18523425bc38SStefano Zampini /******************************************************************/ 18533425bc38SStefano Zampini /* TEST C: It should holds B_delta*w=0, w\in\widehat{W} */ 18543425bc38SStefano Zampini /* This is the meaning of the B matrix */ 18553425bc38SStefano Zampini /******************************************************************/ 18563425bc38SStefano Zampini 18573425bc38SStefano Zampini ierr = VecSetRandom(pcis->vec1_N,PETSC_NULL);CHKERRQ(ierr); 18583425bc38SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 18593425bc38SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 18603425bc38SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 18613425bc38SStefano Zampini ierr = 
VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 18623425bc38SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 18633425bc38SStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 18643425bc38SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 18653425bc38SStefano Zampini /* Action of B_delta */ 18663425bc38SStefano Zampini ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr); 18673425bc38SStefano Zampini ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr); 18683425bc38SStefano Zampini ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 18693425bc38SStefano Zampini ierr = VecScatterEnd (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 18703425bc38SStefano Zampini ierr = VecNorm(lambda_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr); 18713425bc38SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"C[coll]: CHECK infty norm of B_delta*w (w continuous): % 1.14e\n",scalar_value);CHKERRQ(ierr); 18723425bc38SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 18733425bc38SStefano Zampini 18743425bc38SStefano Zampini /******************************************************************/ 18753425bc38SStefano Zampini /* TEST D: It should holds E_Dw = w - P_Dw w\in\widetilde{W} */ 18763425bc38SStefano Zampini /* E_D = R_D^TR */ 18773425bc38SStefano Zampini /* P_D = B_{D,delta}^T B_{delta} */ 18783425bc38SStefano Zampini /* eq.44 Mandel Tezaur and Dohrmann 2005 */ 18793425bc38SStefano Zampini /******************************************************************/ 18803425bc38SStefano Zampini 18813425bc38SStefano Zampini /* 
compute a random vector in \widetilde{W} */ 18823425bc38SStefano Zampini ierr = VecSetRandom(pcis->vec1_N,PETSC_NULL);CHKERRQ(ierr); 18833425bc38SStefano Zampini scalar_value = 0.0; /* set zero at vertices */ 18843425bc38SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 18853425bc38SStefano Zampini for (i=0;i<n_vertices;i++) { array[vertex_indices[i]]=scalar_value; } 18863425bc38SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 18873425bc38SStefano Zampini /* store w for final comparison */ 18883425bc38SStefano Zampini ierr = VecDuplicate(pcis->vec1_B,&test_vec);CHKERRQ(ierr); 18893425bc38SStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,test_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 18903425bc38SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_N,test_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 18913425bc38SStefano Zampini 18923425bc38SStefano Zampini /* Jump operator P_D : results stored in pcis->vec1_B */ 18933425bc38SStefano Zampini 18943425bc38SStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 18953425bc38SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 18963425bc38SStefano Zampini /* Action of B_delta */ 18973425bc38SStefano Zampini ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr); 18983425bc38SStefano Zampini ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr); 18993425bc38SStefano Zampini ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 19003425bc38SStefano Zampini ierr = VecScatterEnd (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 19013425bc38SStefano Zampini /* Action of B_Ddelta^T */ 19023425bc38SStefano Zampini ierr = 
VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 19033425bc38SStefano Zampini ierr = VecScatterEnd (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 19043425bc38SStefano Zampini ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr); 19053425bc38SStefano Zampini 19063425bc38SStefano Zampini /* Average operator E_D : results stored in pcis->vec2_B */ 19073425bc38SStefano Zampini 19083425bc38SStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 19093425bc38SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 19103425bc38SStefano Zampini ierr = VecPointwiseMult(pcis->vec2_B,pcis->D,pcis->vec2_B);CHKERRQ(ierr); 19113425bc38SStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec2_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 19123425bc38SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec2_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 19133425bc38SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 19143425bc38SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 19153425bc38SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 19163425bc38SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 19173425bc38SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 19183425bc38SStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 
19193425bc38SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 19203425bc38SStefano Zampini 19213425bc38SStefano Zampini /* test E_D=I-P_D */ 19223425bc38SStefano Zampini scalar_value = 1.0; 19233425bc38SStefano Zampini ierr = VecAXPY(pcis->vec1_B,scalar_value,pcis->vec2_B);CHKERRQ(ierr); 19243425bc38SStefano Zampini scalar_value = -1.0; 19253425bc38SStefano Zampini ierr = VecAXPY(pcis->vec1_B,scalar_value,test_vec);CHKERRQ(ierr); 19263425bc38SStefano Zampini ierr = VecNorm(pcis->vec1_B,NORM_INFINITY,&scalar_value);CHKERRQ(ierr); 19273425bc38SStefano Zampini ierr = VecDestroy(&test_vec);CHKERRQ(ierr); 19283425bc38SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"D[%04d] CHECK infty norm of E_D + P_D - I: % 1.14e\n",rank,scalar_value);CHKERRQ(ierr); 19293425bc38SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 19303425bc38SStefano Zampini 19313425bc38SStefano Zampini /******************************************************************/ 19323425bc38SStefano Zampini /* TEST E: It should holds R_D^TP_Dw=0 w\in\widetilde{W} */ 19333425bc38SStefano Zampini /* eq.48 Mandel Tezaur and Dohrmann 2005 */ 19343425bc38SStefano Zampini /******************************************************************/ 19353425bc38SStefano Zampini 19363425bc38SStefano Zampini ierr = VecSetRandom(pcis->vec1_N,PETSC_NULL);CHKERRQ(ierr); 19373425bc38SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 19383425bc38SStefano Zampini scalar_value = 0.0; /* set zero at vertices */ 19393425bc38SStefano Zampini for (i=0;i<n_vertices;i++) { array[vertex_indices[i]]=scalar_value; } 19403425bc38SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 19413425bc38SStefano Zampini 19423425bc38SStefano Zampini /* Jump operator P_D : results stored in pcis->vec1_B */ 19433425bc38SStefano Zampini 19443425bc38SStefano Zampini ierr = 
VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 19453425bc38SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 19463425bc38SStefano Zampini /* Action of B_delta */ 19473425bc38SStefano Zampini ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr); 19483425bc38SStefano Zampini ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr); 19493425bc38SStefano Zampini ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 19503425bc38SStefano Zampini ierr = VecScatterEnd (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 19513425bc38SStefano Zampini /* Action of B_Ddelta^T */ 19523425bc38SStefano Zampini ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 19533425bc38SStefano Zampini ierr = VecScatterEnd (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 19543425bc38SStefano Zampini ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr); 19553425bc38SStefano Zampini /* diagonal scaling */ 19563425bc38SStefano Zampini ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr); 19573425bc38SStefano Zampini /* sum on the interface */ 19583425bc38SStefano Zampini ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr); 19593425bc38SStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 19603425bc38SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 19613425bc38SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 19623425bc38SStefano 
Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 19633425bc38SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 19643425bc38SStefano Zampini ierr = VecNorm(pcis->vec1_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr); 19653425bc38SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"E[coll]: CHECK infty norm of R^T_D P_D: % 1.14e\n",scalar_value);CHKERRQ(ierr); 19663425bc38SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 19673425bc38SStefano Zampini 19683425bc38SStefano Zampini if (!fully_redundant) { 19693425bc38SStefano Zampini /******************************************************************/ 19703425bc38SStefano Zampini /* TEST F: It should holds B_{delta}B^T_{D,delta}=I */ 19713425bc38SStefano Zampini /* Corollary thm 14 Mandel Tezaur and Dohrmann 2005 */ 19723425bc38SStefano Zampini /******************************************************************/ 19733425bc38SStefano Zampini ierr = VecDuplicate(lambda_global,&test_vec);CHKERRQ(ierr); 19743425bc38SStefano Zampini ierr = VecSetRandom(lambda_global,PETSC_NULL);CHKERRQ(ierr); 19753425bc38SStefano Zampini /* Action of B_Ddelta^T */ 19763425bc38SStefano Zampini ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 19773425bc38SStefano Zampini ierr = VecScatterEnd (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 19783425bc38SStefano Zampini ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr); 19793425bc38SStefano Zampini /* Action of B_delta */ 19803425bc38SStefano Zampini ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr); 19813425bc38SStefano Zampini ierr = VecSet(test_vec,0.0);CHKERRQ(ierr); 19823425bc38SStefano 
Zampini ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,test_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 19833425bc38SStefano Zampini ierr = VecScatterEnd (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,test_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 19843425bc38SStefano Zampini scalar_value = -1.0; 19853425bc38SStefano Zampini ierr = VecAXPY(lambda_global,scalar_value,test_vec);CHKERRQ(ierr); 19863425bc38SStefano Zampini ierr = VecNorm(lambda_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr); 19873425bc38SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"E[coll]: CHECK infty norm of P^T_D - I: % 1.14e\n",scalar_value);CHKERRQ(ierr); 19883425bc38SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 19893425bc38SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 19903425bc38SStefano Zampini ierr = VecDestroy(&test_vec);CHKERRQ(ierr); 19913425bc38SStefano Zampini } 19923425bc38SStefano Zampini } 19933425bc38SStefano Zampini /* final cleanup */ 19943425bc38SStefano Zampini ierr = PetscFree(vertex_indices);CHKERRQ(ierr); 19953425bc38SStefano Zampini ierr = VecDestroy(&lambda_global);CHKERRQ(ierr); 19963425bc38SStefano Zampini 19973425bc38SStefano Zampini PetscFunctionReturn(0); 19983425bc38SStefano Zampini } 19993425bc38SStefano Zampini 20003425bc38SStefano Zampini #undef __FUNCT__ 20013425bc38SStefano Zampini #define __FUNCT__ "PCBDDCSetupFETIDPPCContext" 20023425bc38SStefano Zampini static PetscErrorCode PCBDDCSetupFETIDPPCContext(Mat fetimat, FETIDPPC_ctx *fetidppc_ctx) 20033425bc38SStefano Zampini { 20043425bc38SStefano Zampini FETIDPMat_ctx *mat_ctx; 20053425bc38SStefano Zampini PetscErrorCode ierr; 20063425bc38SStefano Zampini 20073425bc38SStefano Zampini PetscFunctionBegin; 20083425bc38SStefano Zampini ierr = MatShellGetContext(fetimat,&mat_ctx);CHKERRQ(ierr); 20093425bc38SStefano Zampini /* get references from objects created when setting up feti mat context */ 20103425bc38SStefano Zampini 
ierr = PetscObjectReference((PetscObject)mat_ctx->lambda_local);CHKERRQ(ierr); 20113425bc38SStefano Zampini fetidppc_ctx->lambda_local = mat_ctx->lambda_local; 20123425bc38SStefano Zampini ierr = PetscObjectReference((PetscObject)mat_ctx->B_Ddelta);CHKERRQ(ierr); 20133425bc38SStefano Zampini fetidppc_ctx->B_Ddelta = mat_ctx->B_Ddelta; 20143425bc38SStefano Zampini ierr = PetscObjectReference((PetscObject)mat_ctx->l2g_lambda);CHKERRQ(ierr); 20153425bc38SStefano Zampini fetidppc_ctx->l2g_lambda = mat_ctx->l2g_lambda; 20163425bc38SStefano Zampini PetscFunctionReturn(0); 20173425bc38SStefano Zampini } 20183425bc38SStefano Zampini 20193425bc38SStefano Zampini #undef __FUNCT__ 20203425bc38SStefano Zampini #define __FUNCT__ "FETIDPMatMult" 20213425bc38SStefano Zampini static PetscErrorCode FETIDPMatMult(Mat fetimat, Vec x, Vec y) 20223425bc38SStefano Zampini { 20233425bc38SStefano Zampini FETIDPMat_ctx *mat_ctx; 20243425bc38SStefano Zampini PC_IS *pcis; 20253425bc38SStefano Zampini PetscErrorCode ierr; 20263425bc38SStefano Zampini 20273425bc38SStefano Zampini PetscFunctionBegin; 20283425bc38SStefano Zampini ierr = MatShellGetContext(fetimat,&mat_ctx);CHKERRQ(ierr); 20293425bc38SStefano Zampini pcis = (PC_IS*)mat_ctx->pc->data; 20303425bc38SStefano Zampini /* Application of B_delta^T */ 20313425bc38SStefano Zampini ierr = VecScatterBegin(mat_ctx->l2g_lambda,x,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 20323425bc38SStefano Zampini ierr = VecScatterEnd(mat_ctx->l2g_lambda,x,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 20333425bc38SStefano Zampini ierr = MatMultTranspose(mat_ctx->B_delta,mat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr); 20343425bc38SStefano Zampini /* Application of \widetilde{S}^-1 */ 20353425bc38SStefano Zampini ierr = VecSet(pcis->vec1_D,0.0);CHKERRQ(ierr); 20363425bc38SStefano Zampini ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr); 20373425bc38SStefano Zampini /* Application of B_delta 
*/ 20383425bc38SStefano Zampini ierr = MatMult(mat_ctx->B_delta,pcis->vec1_B,mat_ctx->lambda_local);CHKERRQ(ierr); 20393425bc38SStefano Zampini ierr = VecSet(y,0.0);CHKERRQ(ierr); 20403425bc38SStefano Zampini ierr = VecScatterBegin(mat_ctx->l2g_lambda,mat_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 20413425bc38SStefano Zampini ierr = VecScatterEnd(mat_ctx->l2g_lambda,mat_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 20423425bc38SStefano Zampini PetscFunctionReturn(0); 20433425bc38SStefano Zampini } 20443425bc38SStefano Zampini 20453425bc38SStefano Zampini #undef __FUNCT__ 20463425bc38SStefano Zampini #define __FUNCT__ "FETIDPPCApply" 20473425bc38SStefano Zampini static PetscErrorCode FETIDPPCApply(PC fetipc, Vec x, Vec y) 20483425bc38SStefano Zampini { 20493425bc38SStefano Zampini FETIDPPC_ctx *pc_ctx; 20503425bc38SStefano Zampini PC_IS *pcis; 20513425bc38SStefano Zampini PetscErrorCode ierr; 20523425bc38SStefano Zampini 20533425bc38SStefano Zampini PetscFunctionBegin; 20543425bc38SStefano Zampini ierr = PCShellGetContext(fetipc,(void**)&pc_ctx); 20553425bc38SStefano Zampini pcis = (PC_IS*)pc_ctx->pc->data; 20563425bc38SStefano Zampini /* Application of B_Ddelta^T */ 20573425bc38SStefano Zampini ierr = VecScatterBegin(pc_ctx->l2g_lambda,x,pc_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 20583425bc38SStefano Zampini ierr = VecScatterEnd(pc_ctx->l2g_lambda,x,pc_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 20593425bc38SStefano Zampini ierr = VecSet(pcis->vec2_B,0.0);CHKERRQ(ierr); 20603425bc38SStefano Zampini ierr = MatMultTranspose(pc_ctx->B_Ddelta,pc_ctx->lambda_local,pcis->vec2_B);CHKERRQ(ierr); 20613425bc38SStefano Zampini /* Application of S */ 20623425bc38SStefano Zampini ierr = PCISApplySchur(pc_ctx->pc,pcis->vec2_B,pcis->vec1_B,(Vec)0,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr); 20633425bc38SStefano Zampini /* Application of B_Ddelta */ 20643425bc38SStefano Zampini ierr = 
MatMult(pc_ctx->B_Ddelta,pcis->vec1_B,pc_ctx->lambda_local);CHKERRQ(ierr); 20653425bc38SStefano Zampini ierr = VecSet(y,0.0);CHKERRQ(ierr); 20663425bc38SStefano Zampini ierr = VecScatterBegin(pc_ctx->l2g_lambda,pc_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 20673425bc38SStefano Zampini ierr = VecScatterEnd(pc_ctx->l2g_lambda,pc_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 20683425bc38SStefano Zampini PetscFunctionReturn(0); 20693425bc38SStefano Zampini } 20703425bc38SStefano Zampini 2071da1bb401SStefano Zampini #undef __FUNCT__ 2072da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetupLocalAdjacencyGraph" 2073da1bb401SStefano Zampini static PetscErrorCode PCBDDCSetupLocalAdjacencyGraph(PC pc) 2074da1bb401SStefano Zampini { 2075da1bb401SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 2076da1bb401SStefano Zampini Mat_IS *matis = (Mat_IS*)pc->pmat->data; 2077da1bb401SStefano Zampini PetscInt nvtxs,*xadj,*adjncy; 2078da1bb401SStefano Zampini Mat mat_adj; 2079da1bb401SStefano Zampini PetscBool symmetrize_rowij=PETSC_TRUE,compressed_rowij=PETSC_FALSE,flg_row=PETSC_TRUE; 2080da1bb401SStefano Zampini PCBDDCGraph mat_graph=pcbddc->mat_graph; 2081da1bb401SStefano Zampini PetscErrorCode ierr; 2082da1bb401SStefano Zampini 2083da1bb401SStefano Zampini PetscFunctionBegin; 2084da1bb401SStefano Zampini /* get CSR adjacency from local matrix if user has not yet provided local graph using PCBDDCSetLocalAdjacencyGraph function */ 2085da1bb401SStefano Zampini if (!mat_graph->xadj) { 2086da1bb401SStefano Zampini ierr = MatConvert(matis->A,MATMPIADJ,MAT_INITIAL_MATRIX,&mat_adj);CHKERRQ(ierr); 2087da1bb401SStefano Zampini ierr = MatGetRowIJ(mat_adj,0,symmetrize_rowij,compressed_rowij,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr); 2088da1bb401SStefano Zampini if (!flg_row) { 2089da1bb401SStefano Zampini SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in MatGetRowIJ called in %s\n",__FUNCT__); 2090da1bb401SStefano Zampini } 2091da1bb401SStefano 
Zampini /* Get adjacency into BDDC workspace */ 2092da1bb401SStefano Zampini ierr = PCBDDCSetLocalAdjacencyGraph(pc,nvtxs,xadj,adjncy,PETSC_COPY_VALUES);CHKERRQ(ierr); 2093da1bb401SStefano Zampini ierr = MatRestoreRowIJ(mat_adj,0,symmetrize_rowij,compressed_rowij,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr); 2094da1bb401SStefano Zampini if (!flg_row) { 2095da1bb401SStefano Zampini SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in MatRestoreRowIJ called in %s\n",__FUNCT__); 2096da1bb401SStefano Zampini } 2097da1bb401SStefano Zampini ierr = MatDestroy(&mat_adj);CHKERRQ(ierr); 2098da1bb401SStefano Zampini } 2099da1bb401SStefano Zampini PetscFunctionReturn(0); 2100da1bb401SStefano Zampini } 2101da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */ 21020c7d97c5SJed Brown #undef __FUNCT__ 21030c7d97c5SJed Brown #define __FUNCT__ "PCBDDCApplyInterfacePreconditioner" 21042617d88aSStefano Zampini static PetscErrorCode PCBDDCApplyInterfacePreconditioner(PC pc) 21050c7d97c5SJed Brown { 21060c7d97c5SJed Brown PetscErrorCode ierr; 21070c7d97c5SJed Brown PC_BDDC* pcbddc = (PC_BDDC*)(pc->data); 21080c7d97c5SJed Brown PC_IS* pcis = (PC_IS*) (pc->data); 21093b03a366Sstefano_zampini const PetscScalar zero = 0.0; 21100c7d97c5SJed Brown 21110c7d97c5SJed Brown PetscFunctionBegin; 21120c7d97c5SJed Brown /* Application of PHI^T */ 21130c7d97c5SJed Brown ierr = MatMultTranspose(pcbddc->coarse_phi_B,pcis->vec1_B,pcbddc->vec1_P);CHKERRQ(ierr); 21140c7d97c5SJed Brown if (pcbddc->prec_type) { ierr = MatMultTransposeAdd(pcbddc->coarse_phi_D,pcis->vec1_D,pcbddc->vec1_P,pcbddc->vec1_P);CHKERRQ(ierr); } 21150c7d97c5SJed Brown 21160c7d97c5SJed Brown /* Scatter data of coarse_rhs */ 2117142dfd88SStefano Zampini if (pcbddc->coarse_rhs) { ierr = VecSet(pcbddc->coarse_rhs,zero);CHKERRQ(ierr); } 21180c7d97c5SJed Brown ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->vec1_P,pcbddc->coarse_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 21190c7d97c5SJed 
Brown 21200c7d97c5SJed Brown /* Local solution on R nodes */ 21210c7d97c5SJed Brown ierr = VecSet(pcbddc->vec1_R,zero);CHKERRQ(ierr); 21220c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_B,pcis->vec1_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 21230c7d97c5SJed Brown ierr = VecScatterEnd (pcbddc->R_to_B,pcis->vec1_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 21240c7d97c5SJed Brown if (pcbddc->prec_type) { 21250c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_D,pcis->vec1_D,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 21260c7d97c5SJed Brown ierr = VecScatterEnd (pcbddc->R_to_D,pcis->vec1_D,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 21270c7d97c5SJed Brown } 21280c7d97c5SJed Brown ierr = PCBDDCSolveSaddlePoint(pc);CHKERRQ(ierr); 21290c7d97c5SJed Brown ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr); 21300c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec2_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 21310c7d97c5SJed Brown ierr = VecScatterEnd (pcbddc->R_to_B,pcbddc->vec2_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 21320c7d97c5SJed Brown if (pcbddc->prec_type) { 21330c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec2_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 21340c7d97c5SJed Brown ierr = VecScatterEnd (pcbddc->R_to_D,pcbddc->vec2_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 21350c7d97c5SJed Brown } 21360c7d97c5SJed Brown 21370c7d97c5SJed Brown /* Coarse solution */ 21380c7d97c5SJed Brown ierr = PCBDDCScatterCoarseDataEnd(pc,pcbddc->vec1_P,pcbddc->coarse_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 21390bdf917eSStefano Zampini if (pcbddc->coarse_rhs) { 21400bdf917eSStefano Zampini if (pcbddc->CoarseNullSpace) { 21410bdf917eSStefano Zampini ierr = MatNullSpaceRemove(pcbddc->CoarseNullSpace,pcbddc->coarse_rhs,PETSC_NULL);CHKERRQ(ierr); 21420bdf917eSStefano Zampini } 21430bdf917eSStefano 
Zampini ierr = KSPSolve(pcbddc->coarse_ksp,pcbddc->coarse_rhs,pcbddc->coarse_vec);CHKERRQ(ierr); 21440bdf917eSStefano Zampini if (pcbddc->CoarseNullSpace) { 21450bdf917eSStefano Zampini ierr = MatNullSpaceRemove(pcbddc->CoarseNullSpace,pcbddc->coarse_vec,PETSC_NULL);CHKERRQ(ierr); 21460bdf917eSStefano Zampini } 21470bdf917eSStefano Zampini } 21480c7d97c5SJed Brown ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 21490c7d97c5SJed Brown ierr = PCBDDCScatterCoarseDataEnd (pc,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 21500c7d97c5SJed Brown 21510c7d97c5SJed Brown /* Sum contributions from two levels */ 21520c7d97c5SJed Brown ierr = MatMultAdd(pcbddc->coarse_phi_B,pcbddc->vec1_P,pcis->vec1_B,pcis->vec1_B);CHKERRQ(ierr); 21530c7d97c5SJed Brown if (pcbddc->prec_type) { ierr = MatMultAdd(pcbddc->coarse_phi_D,pcbddc->vec1_P,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); } 21540c7d97c5SJed Brown PetscFunctionReturn(0); 21550c7d97c5SJed Brown } 21560c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 21570c7d97c5SJed Brown #undef __FUNCT__ 21580c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSolveSaddlePoint" 215953cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSolveSaddlePoint(PC pc) 21600c7d97c5SJed Brown { 21610c7d97c5SJed Brown PetscErrorCode ierr; 21620c7d97c5SJed Brown PC_BDDC* pcbddc = (PC_BDDC*)(pc->data); 21630c7d97c5SJed Brown 21640c7d97c5SJed Brown PetscFunctionBegin; 216553cdbc3dSStefano Zampini ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr); 2166534831adSStefano Zampini if (pcbddc->local_auxmat1) { 21670c7d97c5SJed Brown ierr = MatMult(pcbddc->local_auxmat1,pcbddc->vec2_R,pcbddc->vec1_C);CHKERRQ(ierr); 21680c7d97c5SJed Brown ierr = MatMultAdd(pcbddc->local_auxmat2,pcbddc->vec1_C,pcbddc->vec2_R,pcbddc->vec2_R);CHKERRQ(ierr); 21690c7d97c5SJed Brown } 21700c7d97c5SJed Brown 
PetscFunctionReturn(0); 21710c7d97c5SJed Brown } 21720c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 21730c7d97c5SJed Brown #undef __FUNCT__ 21740c7d97c5SJed Brown #define __FUNCT__ "PCBDDCScatterCoarseDataBegin" 217553cdbc3dSStefano Zampini static PetscErrorCode PCBDDCScatterCoarseDataBegin(PC pc,Vec vec_from, Vec vec_to, InsertMode imode, ScatterMode smode) 21760c7d97c5SJed Brown { 21770c7d97c5SJed Brown PetscErrorCode ierr; 21780c7d97c5SJed Brown PC_BDDC* pcbddc = (PC_BDDC*)(pc->data); 21790c7d97c5SJed Brown 21800c7d97c5SJed Brown PetscFunctionBegin; 21810c7d97c5SJed Brown switch(pcbddc->coarse_communications_type){ 21820c7d97c5SJed Brown case SCATTERS_BDDC: 21830c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->coarse_loc_to_glob,vec_from,vec_to,imode,smode);CHKERRQ(ierr); 21840c7d97c5SJed Brown break; 21850c7d97c5SJed Brown case GATHERS_BDDC: 21860c7d97c5SJed Brown break; 21870c7d97c5SJed Brown } 21880c7d97c5SJed Brown PetscFunctionReturn(0); 21890c7d97c5SJed Brown } 21900c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 21910c7d97c5SJed Brown #undef __FUNCT__ 21920c7d97c5SJed Brown #define __FUNCT__ "PCBDDCScatterCoarseDataEnd" 219353cdbc3dSStefano Zampini static PetscErrorCode PCBDDCScatterCoarseDataEnd(PC pc,Vec vec_from, Vec vec_to, InsertMode imode, ScatterMode smode) 21940c7d97c5SJed Brown { 21950c7d97c5SJed Brown PetscErrorCode ierr; 21960c7d97c5SJed Brown PC_BDDC* pcbddc = (PC_BDDC*)(pc->data); 21970c7d97c5SJed Brown PetscScalar* array_to; 21980c7d97c5SJed Brown PetscScalar* array_from; 21990c7d97c5SJed Brown MPI_Comm comm=((PetscObject)pc)->comm; 22000c7d97c5SJed Brown PetscInt i; 22010c7d97c5SJed Brown 22020c7d97c5SJed Brown PetscFunctionBegin; 22030c7d97c5SJed Brown 22040c7d97c5SJed Brown switch(pcbddc->coarse_communications_type){ 22050c7d97c5SJed Brown case SCATTERS_BDDC: 22060c7d97c5SJed Brown ierr = 
VecScatterEnd(pcbddc->coarse_loc_to_glob,vec_from,vec_to,imode,smode);CHKERRQ(ierr); 22070c7d97c5SJed Brown break; 22080c7d97c5SJed Brown case GATHERS_BDDC: 22090c7d97c5SJed Brown if (vec_from) VecGetArray(vec_from,&array_from); 22100c7d97c5SJed Brown if (vec_to) VecGetArray(vec_to,&array_to); 22110c7d97c5SJed Brown switch(pcbddc->coarse_problem_type){ 22120c7d97c5SJed Brown case SEQUENTIAL_BDDC: 22130c7d97c5SJed Brown if (smode == SCATTER_FORWARD) { 221453cdbc3dSStefano Zampini ierr = MPI_Gatherv(&array_from[0],pcbddc->local_primal_size,MPIU_SCALAR,&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,0,comm);CHKERRQ(ierr); 22150c7d97c5SJed Brown if (vec_to) { 22160bdf917eSStefano Zampini if (imode == ADD_VALUES) { 22170bdf917eSStefano Zampini for (i=0;i<pcbddc->replicated_primal_size;i++) { 22180c7d97c5SJed Brown array_to[pcbddc->replicated_local_primal_indices[i]]+=pcbddc->replicated_local_primal_values[i]; 22190c7d97c5SJed Brown } 22200c7d97c5SJed Brown } else { 22210bdf917eSStefano Zampini for (i=0;i<pcbddc->replicated_primal_size;i++) { 22220bdf917eSStefano Zampini array_to[pcbddc->replicated_local_primal_indices[i]]=pcbddc->replicated_local_primal_values[i]; 22230bdf917eSStefano Zampini } 22240bdf917eSStefano Zampini } 22250bdf917eSStefano Zampini } 22260bdf917eSStefano Zampini } else { 22270bdf917eSStefano Zampini if (vec_from) { 22280bdf917eSStefano Zampini if (imode == ADD_VALUES) { 22290bdf917eSStefano Zampini printf("Scatter mode %d, insert mode %d for case %d not implemented!\n",smode,imode,pcbddc->coarse_problem_type); 22300bdf917eSStefano Zampini } 22310bdf917eSStefano Zampini for (i=0;i<pcbddc->replicated_primal_size;i++) { 22320c7d97c5SJed Brown pcbddc->replicated_local_primal_values[i]=array_from[pcbddc->replicated_local_primal_indices[i]]; 22330bdf917eSStefano Zampini } 22340bdf917eSStefano Zampini } 223553cdbc3dSStefano Zampini ierr = 
MPI_Scatterv(&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,&array_to[0],pcbddc->local_primal_size,MPIU_SCALAR,0,comm);CHKERRQ(ierr); 22360c7d97c5SJed Brown } 22370c7d97c5SJed Brown break; 22380c7d97c5SJed Brown case REPLICATED_BDDC: 22390c7d97c5SJed Brown if (smode == SCATTER_FORWARD) { 224053cdbc3dSStefano Zampini ierr = MPI_Allgatherv(&array_from[0],pcbddc->local_primal_size,MPIU_SCALAR,&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,comm);CHKERRQ(ierr); 22410bdf917eSStefano Zampini if (imode == ADD_VALUES) { 22420bdf917eSStefano Zampini for (i=0;i<pcbddc->replicated_primal_size;i++) { 22430c7d97c5SJed Brown array_to[pcbddc->replicated_local_primal_indices[i]]+=pcbddc->replicated_local_primal_values[i]; 22440bdf917eSStefano Zampini } 22450bdf917eSStefano Zampini } else { 22460bdf917eSStefano Zampini for (i=0;i<pcbddc->replicated_primal_size;i++) { 22470bdf917eSStefano Zampini array_to[pcbddc->replicated_local_primal_indices[i]]=pcbddc->replicated_local_primal_values[i]; 22480bdf917eSStefano Zampini } 22490bdf917eSStefano Zampini } 22500c7d97c5SJed Brown } else { /* no communications needed for SCATTER_REVERSE since needed data is already present */ 22510bdf917eSStefano Zampini if (imode == ADD_VALUES) { 22520bdf917eSStefano Zampini for (i=0;i<pcbddc->local_primal_size;i++) { 22530bdf917eSStefano Zampini array_to[i]+=array_from[pcbddc->local_primal_indices[i]]; 22540bdf917eSStefano Zampini } 22550bdf917eSStefano Zampini } else { 22560bdf917eSStefano Zampini for (i=0;i<pcbddc->local_primal_size;i++) { 22570c7d97c5SJed Brown array_to[i]=array_from[pcbddc->local_primal_indices[i]]; 22580c7d97c5SJed Brown } 22590bdf917eSStefano Zampini } 22600bdf917eSStefano Zampini } 22610c7d97c5SJed Brown break; 226253cdbc3dSStefano Zampini case MULTILEVEL_BDDC: 226353cdbc3dSStefano Zampini break; 226453cdbc3dSStefano Zampini case PARALLEL_BDDC: 
226553cdbc3dSStefano Zampini break; 22660c7d97c5SJed Brown } 22670c7d97c5SJed Brown if (vec_from) VecRestoreArray(vec_from,&array_from); 22680c7d97c5SJed Brown if (vec_to) VecRestoreArray(vec_to,&array_to); 22690c7d97c5SJed Brown break; 22700c7d97c5SJed Brown } 22710c7d97c5SJed Brown PetscFunctionReturn(0); 22720c7d97c5SJed Brown } 22730c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 22743b03a366Sstefano_zampini #undef __FUNCT__ 22753b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCCreateConstraintMatrix" 22763b03a366Sstefano_zampini static PetscErrorCode PCBDDCCreateConstraintMatrix(PC pc) 22773b03a366Sstefano_zampini { 22783b03a366Sstefano_zampini PetscErrorCode ierr; 22793b03a366Sstefano_zampini PC_IS* pcis = (PC_IS*)(pc->data); 22803b03a366Sstefano_zampini PC_BDDC* pcbddc = (PC_BDDC*)pc->data; 22813b03a366Sstefano_zampini Mat_IS *matis = (Mat_IS*)pc->pmat->data; 228223d4d1a5SStefano Zampini PetscInt *nnz,*is_indices; 22833b03a366Sstefano_zampini PetscScalar *temp_quadrature_constraint; 2284534831adSStefano Zampini PetscInt *temp_indices,*temp_indices_to_constraint,*temp_indices_to_constraint_B,*local_to_B; 22853b03a366Sstefano_zampini PetscInt local_primal_size,i,j,k,total_counts,max_size_of_constraint; 22863b03a366Sstefano_zampini PetscInt n_constraints,n_vertices,size_of_constraint; 2287534831adSStefano Zampini PetscScalar quad_value; 22883b03a366Sstefano_zampini PetscBool nnsp_has_cnst=PETSC_FALSE,use_nnsp_true=pcbddc->use_nnsp_true; 22893b03a366Sstefano_zampini PetscInt nnsp_size=0,nnsp_addone=0,temp_constraints,temp_start_ptr; 22903b03a366Sstefano_zampini IS *used_IS; 229119fd82e9SBarry Smith MatType impMatType=MATSEQAIJ; 22923b03a366Sstefano_zampini PetscBLASInt Bs,Bt,lwork,lierr; 22933b03a366Sstefano_zampini PetscReal tol=1.0e-8; 2294fcda91b4SJed Brown MatNullSpace nearnullsp; 2295fcda91b4SJed Brown const Vec *nearnullvecs; 22963b03a366Sstefano_zampini Vec *localnearnullsp; 22973b03a366Sstefano_zampini 
PetscScalar *work,*temp_basis,*array_vector,*correlation_mat; 22983b03a366Sstefano_zampini PetscReal *rwork,*singular_vals; 2299534831adSStefano Zampini PetscBLASInt Bone=1,*ipiv; 2300534831adSStefano Zampini Vec temp_vec; 2301534831adSStefano Zampini Mat temp_mat; 2302534831adSStefano Zampini KSP temp_ksp; 2303ffe5efe1SStefano Zampini PC temp_pc; 2304534831adSStefano Zampini PetscInt s,start_constraint,dual_dofs; 2305534831adSStefano Zampini PetscBool compute_submatrix,useksp=PETSC_FALSE; 2306534831adSStefano Zampini PetscInt *aux_primal_permutation,*aux_primal_numbering; 2307534831adSStefano Zampini PetscBool boolforface,*change_basis; 2308de534f79Sstefano_zampini /* some ugly conditional declarations */ 23093b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD) 23103b03a366Sstefano_zampini PetscScalar dot_result; 23113b03a366Sstefano_zampini PetscScalar one=1.0,zero=0.0; 23123b03a366Sstefano_zampini PetscInt ii; 23133425bc38SStefano Zampini PetscScalar *singular_vectors; 23143425bc38SStefano Zampini PetscBLASInt *iwork,*ifail; 23153425bc38SStefano Zampini PetscReal dummy_real,abs_tol; 23163425bc38SStefano Zampini PetscBLASInt eigs_found; 23173b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX) 23183b03a366Sstefano_zampini PetscScalar val1,val2; 23193b03a366Sstefano_zampini #endif 23203425bc38SStefano Zampini #endif 23213b03a366Sstefano_zampini PetscBLASInt dummy_int; 23223b03a366Sstefano_zampini PetscScalar dummy_scalar; 23233b03a366Sstefano_zampini 23243b03a366Sstefano_zampini PetscFunctionBegin; 23253b03a366Sstefano_zampini /* check if near null space is attached to global mat */ 2326fcda91b4SJed Brown ierr = MatGetNearNullSpace(pc->pmat,&nearnullsp);CHKERRQ(ierr); 2327fcda91b4SJed Brown if (nearnullsp) { 2328fcda91b4SJed Brown ierr = MatNullSpaceGetVecs(nearnullsp,&nnsp_has_cnst,&nnsp_size,&nearnullvecs);CHKERRQ(ierr); 23293b03a366Sstefano_zampini } else { /* if near null space is not provided it uses constants */ 23303b03a366Sstefano_zampini 
nnsp_has_cnst = PETSC_TRUE; 23313b03a366Sstefano_zampini use_nnsp_true = PETSC_TRUE; 23323b03a366Sstefano_zampini } 23333b03a366Sstefano_zampini if (nnsp_has_cnst) { 23343b03a366Sstefano_zampini nnsp_addone = 1; 23353b03a366Sstefano_zampini } 23363b03a366Sstefano_zampini /* 23373b03a366Sstefano_zampini Evaluate maximum storage size needed by the procedure 23383b03a366Sstefano_zampini - temp_indices will contain start index of each constraint stored as follows 23393b03a366Sstefano_zampini - temp_indices_to_constraint [temp_indices[i],...,temp[indices[i+1]-1] will contain the indices (in local numbering) on which the constraint acts 2340534831adSStefano Zampini - temp_indices_to_constraint_B[temp_indices[i],...,temp[indices[i+1]-1] will contain the indices (in boundary numbering) on which the constraint acts 23413b03a366Sstefano_zampini - temp_quadrature_constraint [temp_indices[i],...,temp[indices[i+1]-1] will contain the scalars representing the constraint itself 23423b03a366Sstefano_zampini */ 2343da1bb401SStefano Zampini 23443b03a366Sstefano_zampini total_counts = pcbddc->n_ISForFaces+pcbddc->n_ISForEdges; 23453b03a366Sstefano_zampini total_counts *= (nnsp_addone+nnsp_size); 2346da1bb401SStefano Zampini ierr = ISGetSize(pcbddc->ISForVertices,&n_vertices);CHKERRQ(ierr); 2347da1bb401SStefano Zampini total_counts += n_vertices; 23483b03a366Sstefano_zampini ierr = PetscMalloc((total_counts+1)*sizeof(PetscInt),&temp_indices);CHKERRQ(ierr); 2349534831adSStefano Zampini ierr = PetscMalloc((total_counts+1)*sizeof(PetscBool),&change_basis);CHKERRQ(ierr); 23503b03a366Sstefano_zampini total_counts = 0; 23513b03a366Sstefano_zampini max_size_of_constraint = 0; 23523b03a366Sstefano_zampini for (i=0;i<pcbddc->n_ISForEdges+pcbddc->n_ISForFaces;i++){ 23533b03a366Sstefano_zampini if (i<pcbddc->n_ISForEdges){ 23543b03a366Sstefano_zampini used_IS = &pcbddc->ISForEdges[i]; 23553b03a366Sstefano_zampini } else { 23563b03a366Sstefano_zampini used_IS = 
&pcbddc->ISForFaces[i-pcbddc->n_ISForEdges]; 23573b03a366Sstefano_zampini } 23583b03a366Sstefano_zampini ierr = ISGetSize(*used_IS,&j);CHKERRQ(ierr); 23593b03a366Sstefano_zampini total_counts += j; 23603b03a366Sstefano_zampini if (j>max_size_of_constraint) max_size_of_constraint=j; 23613b03a366Sstefano_zampini } 23623b03a366Sstefano_zampini total_counts *= (nnsp_addone+nnsp_size); 2363da1bb401SStefano Zampini total_counts += n_vertices; 23643b03a366Sstefano_zampini ierr = PetscMalloc(total_counts*sizeof(PetscScalar),&temp_quadrature_constraint);CHKERRQ(ierr); 23653b03a366Sstefano_zampini ierr = PetscMalloc(total_counts*sizeof(PetscInt),&temp_indices_to_constraint);CHKERRQ(ierr); 2366534831adSStefano Zampini ierr = PetscMalloc(total_counts*sizeof(PetscInt),&temp_indices_to_constraint_B);CHKERRQ(ierr); 2367534831adSStefano Zampini ierr = PetscMalloc(pcis->n*sizeof(PetscInt),&local_to_B);CHKERRQ(ierr); 2368534831adSStefano Zampini ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 2369534831adSStefano Zampini for (i=0;i<pcis->n;i++) { 2370534831adSStefano Zampini local_to_B[i]=-1; 2371534831adSStefano Zampini } 2372534831adSStefano Zampini for (i=0;i<pcis->n_B;i++) { 2373534831adSStefano Zampini local_to_B[is_indices[i]]=i; 2374534831adSStefano Zampini } 2375534831adSStefano Zampini ierr = ISRestoreIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 2376534831adSStefano Zampini 23773b03a366Sstefano_zampini /* First we issue queries to allocate optimal workspace for LAPACKgesvd or LAPACKsyev/LAPACKheev */ 23783b03a366Sstefano_zampini rwork = 0; 23793b03a366Sstefano_zampini work = 0; 23803b03a366Sstefano_zampini singular_vals = 0; 23813b03a366Sstefano_zampini temp_basis = 0; 23823b03a366Sstefano_zampini correlation_mat = 0; 23833b03a366Sstefano_zampini if (!pcbddc->use_nnsp_true) { 23843b03a366Sstefano_zampini PetscScalar temp_work; 23853b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD) 
23863b03a366Sstefano_zampini /* POD */ 23873b03a366Sstefano_zampini PetscInt max_n; 23883b03a366Sstefano_zampini max_n = nnsp_addone+nnsp_size; 23893b03a366Sstefano_zampini /* using some techniques borrowed from Proper Orthogonal Decomposition */ 23903b03a366Sstefano_zampini ierr = PetscMalloc(max_n*max_n*sizeof(PetscScalar),&correlation_mat);CHKERRQ(ierr); 23913425bc38SStefano Zampini ierr = PetscMalloc(max_n*max_n*sizeof(PetscScalar),&singular_vectors);CHKERRQ(ierr); 23923b03a366Sstefano_zampini ierr = PetscMalloc(max_n*sizeof(PetscReal),&singular_vals);CHKERRQ(ierr); 23933b03a366Sstefano_zampini ierr = PetscMalloc(max_size_of_constraint*(nnsp_addone+nnsp_size)*sizeof(PetscScalar),&temp_basis);CHKERRQ(ierr); 23943b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX) 23953b03a366Sstefano_zampini ierr = PetscMalloc(3*max_n*sizeof(PetscReal),&rwork);CHKERRQ(ierr); 23963b03a366Sstefano_zampini #endif 23973425bc38SStefano Zampini ierr = PetscMalloc(5*max_n*sizeof(PetscBLASInt),&iwork);CHKERRQ(ierr); 23983425bc38SStefano Zampini ierr = PetscMalloc(max_n*sizeof(PetscBLASInt),&ifail);CHKERRQ(ierr); 23993b03a366Sstefano_zampini /* now we evaluate the optimal workspace using query with lwork=-1 */ 24003b03a366Sstefano_zampini Bt = PetscBLASIntCast(max_n); 24013b03a366Sstefano_zampini lwork=-1; 24023425bc38SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 24033b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX) 24043425bc38SStefano Zampini abs_tol=1.e-8; 24053425bc38SStefano Zampini /* LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,&temp_work,&lwork,&lierr); */ 24063425bc38SStefano Zampini LAPACKsyevx_("V","A","U",&Bt,correlation_mat,&Bt,&dummy_real,&dummy_real,&dummy_int,&dummy_int, 24073425bc38SStefano Zampini &abs_tol,&eigs_found,singular_vals,singular_vectors,&Bt,&temp_work,&lwork,iwork,ifail,&lierr); 24083b03a366Sstefano_zampini #else 24093425bc38SStefano Zampini /* 
LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,&temp_work,&lwork,rwork,&lierr); */ 24103425bc38SStefano Zampini /* LAPACK call is missing here! TODO */ 24113425bc38SStefano Zampini SETERRQ(((PetscObject) pc)->comm, PETSC_ERR_SUP, "Not yet implemented for complexes when PETSC_MISSING_GESVD = 1"); 24123b03a366Sstefano_zampini #endif 24133425bc38SStefano Zampini if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SYEVX Lapack routine %d",(int)lierr); 24143425bc38SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 24153b03a366Sstefano_zampini #else /* on missing GESVD */ 24163b03a366Sstefano_zampini /* SVD */ 24173b03a366Sstefano_zampini PetscInt max_n,min_n; 24183b03a366Sstefano_zampini max_n = max_size_of_constraint; 24193b03a366Sstefano_zampini min_n = nnsp_addone+nnsp_size; 24203b03a366Sstefano_zampini if (max_size_of_constraint < ( nnsp_addone+nnsp_size ) ) { 24213b03a366Sstefano_zampini min_n = max_size_of_constraint; 24223b03a366Sstefano_zampini max_n = nnsp_addone+nnsp_size; 24233b03a366Sstefano_zampini } 24243b03a366Sstefano_zampini ierr = PetscMalloc(min_n*sizeof(PetscReal),&singular_vals);CHKERRQ(ierr); 24253b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX) 24263b03a366Sstefano_zampini ierr = PetscMalloc(5*min_n*sizeof(PetscReal),&rwork);CHKERRQ(ierr); 24273b03a366Sstefano_zampini #endif 24283b03a366Sstefano_zampini /* now we evaluate the optimal workspace using query with lwork=-1 */ 24293b03a366Sstefano_zampini lwork=-1; 24303b03a366Sstefano_zampini Bs = PetscBLASIntCast(max_n); 24313b03a366Sstefano_zampini Bt = PetscBLASIntCast(min_n); 24323b03a366Sstefano_zampini dummy_int = Bs; 2433670f3ff9SJed Brown ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 24343b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX) 24353b03a366Sstefano_zampini LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[0],&Bs,singular_vals, 24363b03a366Sstefano_zampini 
&dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,&temp_work,&lwork,&lierr); 24373b03a366Sstefano_zampini #else 24383b03a366Sstefano_zampini LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[0],&Bs,singular_vals, 24393b03a366Sstefano_zampini &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,&temp_work,&lwork,rwork,&lierr); 24403b03a366Sstefano_zampini #endif 24413b03a366Sstefano_zampini if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SVD Lapack routine %d",(int)lierr); 2442670f3ff9SJed Brown ierr = PetscFPTrapPop();CHKERRQ(ierr); 24433b03a366Sstefano_zampini #endif 24443b03a366Sstefano_zampini /* Allocate optimal workspace */ 24453b03a366Sstefano_zampini lwork = PetscBLASIntCast((PetscInt)PetscRealPart(temp_work)); 24463b03a366Sstefano_zampini total_counts = (PetscInt)lwork; 24473b03a366Sstefano_zampini ierr = PetscMalloc(total_counts*sizeof(PetscScalar),&work);CHKERRQ(ierr); 24483b03a366Sstefano_zampini } 24493b03a366Sstefano_zampini /* get local part of global near null space vectors */ 24503b03a366Sstefano_zampini ierr = PetscMalloc(nnsp_size*sizeof(Vec),&localnearnullsp);CHKERRQ(ierr); 24513b03a366Sstefano_zampini for (k=0;k<nnsp_size;k++) { 24523b03a366Sstefano_zampini ierr = VecDuplicate(pcis->vec1_N,&localnearnullsp[k]);CHKERRQ(ierr); 2453fcda91b4SJed Brown ierr = VecScatterBegin(matis->ctx,nearnullvecs[k],localnearnullsp[k],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 2454fcda91b4SJed Brown ierr = VecScatterEnd (matis->ctx,nearnullvecs[k],localnearnullsp[k],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 24553b03a366Sstefano_zampini } 24563b03a366Sstefano_zampini /* Now we can loop on constraining sets */ 24573b03a366Sstefano_zampini total_counts=0; 24583b03a366Sstefano_zampini temp_indices[0]=0; 2459da1bb401SStefano Zampini /* vertices */ 2460da1bb401SStefano Zampini PetscBool used_vertex; 2461da1bb401SStefano Zampini ierr = ISGetIndices(pcbddc->ISForVertices,(const PetscInt**)&is_indices);CHKERRQ(ierr); 2462da1bb401SStefano 
Zampini if (nnsp_has_cnst) { /* consider all vertices */ 2463da1bb401SStefano Zampini for (i=0;i<n_vertices;i++) { 2464da1bb401SStefano Zampini temp_indices_to_constraint[temp_indices[total_counts]]=is_indices[i]; 2465534831adSStefano Zampini temp_indices_to_constraint_B[temp_indices[total_counts]]=local_to_B[is_indices[i]]; 2466da1bb401SStefano Zampini temp_quadrature_constraint[temp_indices[total_counts]]=1.0; 2467da1bb401SStefano Zampini temp_indices[total_counts+1]=temp_indices[total_counts]+1; 2468534831adSStefano Zampini change_basis[total_counts]=PETSC_FALSE; 2469da1bb401SStefano Zampini total_counts++; 2470da1bb401SStefano Zampini } 2471da1bb401SStefano Zampini } else { /* consider vertices for which exist at least a localnearnullsp which is not null there */ 2472da1bb401SStefano Zampini for (i=0;i<n_vertices;i++) { 2473da1bb401SStefano Zampini used_vertex=PETSC_FALSE; 2474da1bb401SStefano Zampini k=0; 2475da1bb401SStefano Zampini while(!used_vertex && k<nnsp_size) { 2476da1bb401SStefano Zampini ierr = VecGetArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr); 2477da1bb401SStefano Zampini if (PetscAbsScalar(array_vector[is_indices[i]])>0.0) { 2478da1bb401SStefano Zampini temp_indices_to_constraint[temp_indices[total_counts]]=is_indices[i]; 2479534831adSStefano Zampini temp_indices_to_constraint_B[temp_indices[total_counts]]=local_to_B[is_indices[i]]; 2480da1bb401SStefano Zampini temp_quadrature_constraint[temp_indices[total_counts]]=1.0; 2481da1bb401SStefano Zampini temp_indices[total_counts+1]=temp_indices[total_counts]+1; 2482534831adSStefano Zampini change_basis[total_counts]=PETSC_FALSE; 2483da1bb401SStefano Zampini total_counts++; 2484da1bb401SStefano Zampini used_vertex=PETSC_TRUE; 2485da1bb401SStefano Zampini } 2486da1bb401SStefano Zampini ierr = VecRestoreArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr); 2487da1bb401SStefano Zampini k++; 2488da1bb401SStefano Zampini } 2489da1bb401SStefano 
Zampini } 2490da1bb401SStefano Zampini } 2491da1bb401SStefano Zampini ierr = ISRestoreIndices(pcbddc->ISForVertices,(const PetscInt**)&is_indices);CHKERRQ(ierr); 2492da1bb401SStefano Zampini n_vertices=total_counts; 2493da1bb401SStefano Zampini /* edges and faces */ 24943b03a366Sstefano_zampini for (i=0;i<pcbddc->n_ISForEdges+pcbddc->n_ISForFaces;i++){ 24953b03a366Sstefano_zampini if (i<pcbddc->n_ISForEdges){ 24963b03a366Sstefano_zampini used_IS = &pcbddc->ISForEdges[i]; 2497534831adSStefano Zampini boolforface = pcbddc->usechangeofbasis; 24983b03a366Sstefano_zampini } else { 24993b03a366Sstefano_zampini used_IS = &pcbddc->ISForFaces[i-pcbddc->n_ISForEdges]; 2500534831adSStefano Zampini boolforface = pcbddc->usechangeonfaces; 25013b03a366Sstefano_zampini } 25023b03a366Sstefano_zampini temp_constraints = 0; /* zero the number of constraints I have on this conn comp */ 25033b03a366Sstefano_zampini temp_start_ptr = total_counts; /* need to know the starting index of constraints stored */ 25043b03a366Sstefano_zampini ierr = ISGetSize(*used_IS,&size_of_constraint);CHKERRQ(ierr); 25053b03a366Sstefano_zampini ierr = ISGetIndices(*used_IS,(const PetscInt**)&is_indices);CHKERRQ(ierr); 25063b03a366Sstefano_zampini if (nnsp_has_cnst) { 25073b03a366Sstefano_zampini temp_constraints++; 2508534831adSStefano Zampini quad_value = (PetscScalar) (1.0/PetscSqrtReal((PetscReal)size_of_constraint)); 25093b03a366Sstefano_zampini for (j=0;j<size_of_constraint;j++) { 25103b03a366Sstefano_zampini temp_indices_to_constraint[temp_indices[total_counts]+j]=is_indices[j]; 2511534831adSStefano Zampini temp_indices_to_constraint_B[temp_indices[total_counts]+j]=local_to_B[is_indices[j]]; 25123b03a366Sstefano_zampini temp_quadrature_constraint[temp_indices[total_counts]+j]=quad_value; 25133b03a366Sstefano_zampini } 25143b03a366Sstefano_zampini temp_indices[total_counts+1]=temp_indices[total_counts]+size_of_constraint; /* store new starting point */ 2515534831adSStefano Zampini 
change_basis[total_counts]=boolforface; 25163b03a366Sstefano_zampini total_counts++; 25173b03a366Sstefano_zampini } 25183b03a366Sstefano_zampini for (k=0;k<nnsp_size;k++) { 25193b03a366Sstefano_zampini ierr = VecGetArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr); 25203b03a366Sstefano_zampini for (j=0;j<size_of_constraint;j++) { 25213b03a366Sstefano_zampini temp_indices_to_constraint[temp_indices[total_counts]+j]=is_indices[j]; 2522534831adSStefano Zampini temp_indices_to_constraint_B[temp_indices[total_counts]+j]=local_to_B[is_indices[j]]; 25233b03a366Sstefano_zampini temp_quadrature_constraint[temp_indices[total_counts]+j]=array_vector[is_indices[j]]; 25243b03a366Sstefano_zampini } 25253b03a366Sstefano_zampini ierr = VecRestoreArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr); 2526de534f79Sstefano_zampini quad_value = 1.0; 2527de534f79Sstefano_zampini if ( use_nnsp_true ) { /* check if array is null on the connected component in case use_nnsp_true has been requested */ 2528de534f79Sstefano_zampini Bs = PetscBLASIntCast(size_of_constraint); 2529de534f79Sstefano_zampini quad_value = BLASasum_(&Bs,&temp_quadrature_constraint[temp_indices[total_counts]],&Bone); 2530de534f79Sstefano_zampini } 2531de534f79Sstefano_zampini if ( quad_value > 0.0 ) { /* keep indices and values */ 2532de534f79Sstefano_zampini temp_constraints++; 25333b03a366Sstefano_zampini temp_indices[total_counts+1]=temp_indices[total_counts]+size_of_constraint; /* store new starting point */ 2534534831adSStefano Zampini change_basis[total_counts]=boolforface; 25353b03a366Sstefano_zampini total_counts++; 25363b03a366Sstefano_zampini } 2537de534f79Sstefano_zampini } 25383b03a366Sstefano_zampini ierr = ISRestoreIndices(*used_IS,(const PetscInt**)&is_indices);CHKERRQ(ierr); 2539de534f79Sstefano_zampini /* perform SVD on the constraint if use_nnsp_true has not be requested by the user */ 25403b03a366Sstefano_zampini if (!use_nnsp_true) { 
2541de534f79Sstefano_zampini 25423b03a366Sstefano_zampini Bs = PetscBLASIntCast(size_of_constraint); 25433b03a366Sstefano_zampini Bt = PetscBLASIntCast(temp_constraints); 2544de534f79Sstefano_zampini 25453b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD) 25463b03a366Sstefano_zampini ierr = PetscMemzero(correlation_mat,Bt*Bt*sizeof(PetscScalar));CHKERRQ(ierr); 25473b03a366Sstefano_zampini /* Store upper triangular part of correlation matrix */ 25483b03a366Sstefano_zampini for (j=0;j<temp_constraints;j++) { 25493b03a366Sstefano_zampini for (k=0;k<j+1;k++) { 25503b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX) 25513425bc38SStefano Zampini /* hand made complex dot product -> replace */ 25523b03a366Sstefano_zampini dot_result = 0.0; 25533b03a366Sstefano_zampini for (ii=0; ii<size_of_constraint; ii++) { 25543b03a366Sstefano_zampini val1 = temp_quadrature_constraint[temp_indices[temp_start_ptr+j]+ii]; 25553b03a366Sstefano_zampini val2 = temp_quadrature_constraint[temp_indices[temp_start_ptr+k]+ii]; 25563b03a366Sstefano_zampini dot_result += val1*PetscConj(val2); 25573b03a366Sstefano_zampini } 25583b03a366Sstefano_zampini #else 25593b03a366Sstefano_zampini dot_result = BLASdot_(&Bs,&temp_quadrature_constraint[temp_indices[temp_start_ptr+j]],&Bone, 25603b03a366Sstefano_zampini &temp_quadrature_constraint[temp_indices[temp_start_ptr+k]],&Bone); 25613b03a366Sstefano_zampini #endif 25623b03a366Sstefano_zampini correlation_mat[j*temp_constraints+k]=dot_result; 25633b03a366Sstefano_zampini } 25643b03a366Sstefano_zampini } 25653425bc38SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 25663b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX) 25673425bc38SStefano Zampini /* LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,work,&lwork,&lierr); */ 25683425bc38SStefano Zampini LAPACKsyevx_("V","A","U",&Bt,correlation_mat,&Bt,&dummy_real,&dummy_real,&dummy_int,&dummy_int, 25693425bc38SStefano Zampini 
&abs_tol,&eigs_found,singular_vals,singular_vectors,&Bt,work,&lwork,iwork,ifail,&lierr); 25703b03a366Sstefano_zampini #else 25713425bc38SStefano Zampini /* LAPACK call is missing here! TODO */ 25723425bc38SStefano Zampini SETERRQ(((PetscObject) pc)->comm, PETSC_ERR_SUP, "Not yet implemented for complexes when PETSC_MISSING_GESVD = 1"); 25733b03a366Sstefano_zampini #endif 25743425bc38SStefano Zampini if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYEVX Lapack routine %d",(int)lierr); 25753425bc38SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 25763b03a366Sstefano_zampini /* retain eigenvalues greater than tol: note that lapack SYEV gives eigs in ascending order */ 25773b03a366Sstefano_zampini j=0; 25783b03a366Sstefano_zampini while( j < Bt && singular_vals[j] < tol) j++; 25793b03a366Sstefano_zampini total_counts=total_counts-j; 25803b03a366Sstefano_zampini if (j<temp_constraints) { 25813b03a366Sstefano_zampini for (k=j;k<Bt;k++) { singular_vals[k]=1.0/PetscSqrtReal(singular_vals[k]); } 25823425bc38SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 25833b03a366Sstefano_zampini BLASgemm_("N","N",&Bs,&Bt,&Bt,&one,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,correlation_mat,&Bt,&zero,temp_basis,&Bs); 25843425bc38SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 25853b03a366Sstefano_zampini /* copy POD basis into used quadrature memory */ 25863b03a366Sstefano_zampini for (k=0;k<Bt-j;k++) { 25873b03a366Sstefano_zampini for (ii=0;ii<size_of_constraint;ii++) { 25883b03a366Sstefano_zampini temp_quadrature_constraint[temp_indices[temp_start_ptr+k]+ii]=singular_vals[Bt-1-k]*temp_basis[(Bt-1-k)*size_of_constraint+ii]; 25893b03a366Sstefano_zampini } 25903b03a366Sstefano_zampini } 25913b03a366Sstefano_zampini } 2592de534f79Sstefano_zampini 25933b03a366Sstefano_zampini #else /* on missing GESVD */ 25943b03a366Sstefano_zampini PetscInt min_n = temp_constraints; 25953b03a366Sstefano_zampini if (min_n > 
size_of_constraint) min_n = size_of_constraint; 25963b03a366Sstefano_zampini dummy_int = Bs; 2597670f3ff9SJed Brown ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 25983b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX) 25993b03a366Sstefano_zampini LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,singular_vals, 26003b03a366Sstefano_zampini &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,work,&lwork,&lierr); 26013b03a366Sstefano_zampini #else 26023b03a366Sstefano_zampini LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,singular_vals, 26033b03a366Sstefano_zampini &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,work,&lwork,rwork,&lierr); 26043b03a366Sstefano_zampini #endif 26053b03a366Sstefano_zampini if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SVD Lapack routine %d",(int)lierr); 2606670f3ff9SJed Brown ierr = PetscFPTrapPop();CHKERRQ(ierr); 26073b03a366Sstefano_zampini /* retain eigenvalues greater than tol: note that lapack SVD gives eigs in descending order */ 26083b03a366Sstefano_zampini j=0; 26093b03a366Sstefano_zampini while( j < min_n && singular_vals[min_n-j-1] < tol) j++; 26103b03a366Sstefano_zampini total_counts = total_counts-(PetscInt)Bt+(min_n-j); 26113b03a366Sstefano_zampini #endif 26123b03a366Sstefano_zampini } 26133b03a366Sstefano_zampini } 2614534831adSStefano Zampini 2615da1bb401SStefano Zampini n_constraints=total_counts-n_vertices; 2616da1bb401SStefano Zampini local_primal_size = total_counts; 26173b03a366Sstefano_zampini /* set quantities in pcbddc data structure */ 26183b03a366Sstefano_zampini pcbddc->n_vertices = n_vertices; 26193b03a366Sstefano_zampini pcbddc->n_constraints = n_constraints; 2620da1bb401SStefano Zampini pcbddc->local_primal_size = local_primal_size; 2621534831adSStefano Zampini 2622534831adSStefano Zampini /* Create constraint matrix */ 2623534831adSStefano Zampini /* The constraint matrix is used to compute the 
l2g map of primal dofs */ 2624534831adSStefano Zampini /* so we need to set it up properly either with or without change of basis */ 2625534831adSStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->ConstraintMatrix);CHKERRQ(ierr); 2626534831adSStefano Zampini ierr = MatSetType(pcbddc->ConstraintMatrix,impMatType);CHKERRQ(ierr); 2627534831adSStefano Zampini ierr = MatSetSizes(pcbddc->ConstraintMatrix,local_primal_size,pcis->n,local_primal_size,pcis->n);CHKERRQ(ierr); 2628534831adSStefano Zampini /* compute a local numbering of constraints : vertices first then constraints */ 2629534831adSStefano Zampini ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr); 2630534831adSStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array_vector);CHKERRQ(ierr); 2631534831adSStefano Zampini ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&aux_primal_numbering);CHKERRQ(ierr); 2632534831adSStefano Zampini ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&aux_primal_permutation);CHKERRQ(ierr); 2633534831adSStefano Zampini total_counts=0; 2634534831adSStefano Zampini /* find vertices: subdomain corners plus dofs with basis changed */ 2635534831adSStefano Zampini for (i=0;i<local_primal_size;i++) { 2636534831adSStefano Zampini size_of_constraint=temp_indices[i+1]-temp_indices[i]; 2637534831adSStefano Zampini if (change_basis[i] || size_of_constraint == 1) { 2638534831adSStefano Zampini k=0; 2639534831adSStefano Zampini while(k < size_of_constraint && array_vector[temp_indices_to_constraint[temp_indices[i]+size_of_constraint-k-1]] != 0.0) { 2640534831adSStefano Zampini k=k+1; 2641534831adSStefano Zampini } 2642534831adSStefano Zampini j=temp_indices_to_constraint[temp_indices[i]+size_of_constraint-k-1]; 2643534831adSStefano Zampini array_vector[j] = 1.0; 2644534831adSStefano Zampini aux_primal_numbering[total_counts]=j; 2645534831adSStefano Zampini aux_primal_permutation[total_counts]=total_counts; 2646534831adSStefano Zampini total_counts++; 2647534831adSStefano Zampini } 
2648534831adSStefano Zampini } 2649534831adSStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array_vector);CHKERRQ(ierr); 2650534831adSStefano Zampini /* permute indices in order to have a sorted set of vertices */ 2651534831adSStefano Zampini ierr = PetscSortIntWithPermutation(total_counts,aux_primal_numbering,aux_primal_permutation); 2652534831adSStefano Zampini /* nonzero structure */ 2653534831adSStefano Zampini ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&nnz);CHKERRQ(ierr); 2654534831adSStefano Zampini for (i=0;i<total_counts;i++) { 2655534831adSStefano Zampini nnz[i]=1; 2656534831adSStefano Zampini } 2657534831adSStefano Zampini j=total_counts; 2658534831adSStefano Zampini for (i=n_vertices;i<local_primal_size;i++) { 2659534831adSStefano Zampini if (!change_basis[i]) { 2660534831adSStefano Zampini nnz[j]=temp_indices[i+1]-temp_indices[i]; 2661534831adSStefano Zampini j++; 2662534831adSStefano Zampini } 2663534831adSStefano Zampini } 2664534831adSStefano Zampini ierr = MatSeqAIJSetPreallocation(pcbddc->ConstraintMatrix,0,nnz);CHKERRQ(ierr); 2665534831adSStefano Zampini ierr = PetscFree(nnz);CHKERRQ(ierr); 2666534831adSStefano Zampini /* set values in constraint matrix */ 2667534831adSStefano Zampini for (i=0;i<total_counts;i++) { 2668534831adSStefano Zampini j = aux_primal_permutation[i]; 2669534831adSStefano Zampini k = aux_primal_numbering[j]; 2670534831adSStefano Zampini ierr = MatSetValue(pcbddc->ConstraintMatrix,i,k,1.0,INSERT_VALUES);CHKERRQ(ierr); 2671534831adSStefano Zampini } 2672534831adSStefano Zampini for (i=n_vertices;i<local_primal_size;i++) { 2673534831adSStefano Zampini if (!change_basis[i]) { 2674534831adSStefano Zampini size_of_constraint=temp_indices[i+1]-temp_indices[i]; 2675534831adSStefano Zampini ierr = MatSetValues(pcbddc->ConstraintMatrix,1,&total_counts,size_of_constraint,&temp_indices_to_constraint[temp_indices[i]],&temp_quadrature_constraint[temp_indices[i]],INSERT_VALUES);CHKERRQ(ierr); 2676534831adSStefano Zampini 
total_counts++; 2677534831adSStefano Zampini } 2678534831adSStefano Zampini } 2679534831adSStefano Zampini ierr = PetscFree(aux_primal_numbering);CHKERRQ(ierr); 2680534831adSStefano Zampini ierr = PetscFree(aux_primal_permutation);CHKERRQ(ierr); 2681534831adSStefano Zampini /* assembling */ 2682534831adSStefano Zampini ierr = MatAssemblyBegin(pcbddc->ConstraintMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2683534831adSStefano Zampini ierr = MatAssemblyEnd(pcbddc->ConstraintMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2684534831adSStefano Zampini 2685534831adSStefano Zampini /* Create matrix for change of basis. We don't need it in case pcbddc->usechangeofbasis is FALSE */ 2686534831adSStefano Zampini if (pcbddc->usechangeofbasis) { 2687534831adSStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr); 2688534831adSStefano Zampini ierr = MatSetType(pcbddc->ChangeOfBasisMatrix,impMatType);CHKERRQ(ierr); 2689534831adSStefano Zampini ierr = MatSetSizes(pcbddc->ChangeOfBasisMatrix,pcis->n_B,pcis->n_B,pcis->n_B,pcis->n_B);CHKERRQ(ierr); 2690534831adSStefano Zampini /* work arrays */ 2691534831adSStefano Zampini /* we need to reuse these arrays, so we free them */ 2692534831adSStefano Zampini ierr = PetscFree(temp_basis);CHKERRQ(ierr); 2693534831adSStefano Zampini ierr = PetscFree(work);CHKERRQ(ierr); 2694534831adSStefano Zampini ierr = PetscMalloc(pcis->n_B*sizeof(PetscInt),&nnz);CHKERRQ(ierr); 2695534831adSStefano Zampini ierr = PetscMalloc((nnsp_addone+nnsp_size)*(nnsp_addone+nnsp_size)*sizeof(PetscScalar),&temp_basis);CHKERRQ(ierr); 2696534831adSStefano Zampini ierr = PetscMalloc((nnsp_addone+nnsp_size)*sizeof(PetscScalar),&work);CHKERRQ(ierr); 2697534831adSStefano Zampini ierr = PetscMalloc((nnsp_addone+nnsp_size)*sizeof(PetscBLASInt),&ipiv);CHKERRQ(ierr); 2698534831adSStefano Zampini for (i=0;i<pcis->n_B;i++) { 2699534831adSStefano Zampini nnz[i]=1; 2700534831adSStefano Zampini } 2701534831adSStefano Zampini /* Overestimated nonzeros per 
row */ 2702534831adSStefano Zampini k=1; 2703534831adSStefano Zampini for (i=pcbddc->n_vertices;i<local_primal_size;i++) { 2704534831adSStefano Zampini if (change_basis[i]) { 2705534831adSStefano Zampini size_of_constraint = temp_indices[i+1]-temp_indices[i]; 2706534831adSStefano Zampini if (k < size_of_constraint) { 2707534831adSStefano Zampini k = size_of_constraint; 2708534831adSStefano Zampini } 2709534831adSStefano Zampini for (j=0;j<size_of_constraint;j++) { 2710534831adSStefano Zampini nnz[temp_indices_to_constraint_B[temp_indices[i]+j]] = size_of_constraint; 2711534831adSStefano Zampini } 2712534831adSStefano Zampini } 2713534831adSStefano Zampini } 2714534831adSStefano Zampini ierr = MatSeqAIJSetPreallocation(pcbddc->ChangeOfBasisMatrix,0,nnz);CHKERRQ(ierr); 2715534831adSStefano Zampini ierr = PetscFree(nnz);CHKERRQ(ierr); 2716534831adSStefano Zampini /* Temporary array to store indices */ 2717534831adSStefano Zampini ierr = PetscMalloc(k*sizeof(PetscInt),&is_indices);CHKERRQ(ierr); 2718534831adSStefano Zampini /* Set initial identity in the matrix */ 2719534831adSStefano Zampini for (i=0;i<pcis->n_B;i++) { 2720534831adSStefano Zampini ierr = MatSetValue(pcbddc->ChangeOfBasisMatrix,i,i,1.0,INSERT_VALUES);CHKERRQ(ierr); 2721534831adSStefano Zampini } 2722534831adSStefano Zampini /* Now we loop on the constraints which need a change of basis */ 2723534831adSStefano Zampini /* Change of basis matrix is evaluated as the FIRST APPROACH in */ 2724534831adSStefano Zampini /* Klawonn and Widlund, Dual-primal FETI-DP methods for linear elasticity, (6.2.1) */ 2725534831adSStefano Zampini temp_constraints = 0; 272693dc3b60SStefano Zampini if (pcbddc->n_vertices < local_primal_size) { 2727534831adSStefano Zampini temp_start_ptr = temp_indices_to_constraint_B[temp_indices[pcbddc->n_vertices]]; 272893dc3b60SStefano Zampini } 2729534831adSStefano Zampini for (i=pcbddc->n_vertices;i<local_primal_size;i++) { 2730534831adSStefano Zampini if (change_basis[i]) { 
2731534831adSStefano Zampini compute_submatrix = PETSC_FALSE; 2732534831adSStefano Zampini useksp = PETSC_FALSE; 2733534831adSStefano Zampini if (temp_start_ptr == temp_indices_to_constraint_B[temp_indices[i]]) { 2734534831adSStefano Zampini temp_constraints++; 273504eaf177SStefano Zampini if (i == local_primal_size -1 || temp_start_ptr != temp_indices_to_constraint_B[temp_indices[i+1]]) { 2736534831adSStefano Zampini compute_submatrix = PETSC_TRUE; 2737534831adSStefano Zampini } 2738534831adSStefano Zampini } 2739534831adSStefano Zampini if (compute_submatrix) { 2740534831adSStefano Zampini if (temp_constraints > 1 || pcbddc->use_nnsp_true) { 2741534831adSStefano Zampini useksp = PETSC_TRUE; 2742534831adSStefano Zampini } 2743534831adSStefano Zampini size_of_constraint = temp_indices[i+1]-temp_indices[i]; 2744534831adSStefano Zampini if (useksp) { /* experimental */ 2745534831adSStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&temp_mat);CHKERRQ(ierr); 2746534831adSStefano Zampini ierr = MatSetType(temp_mat,impMatType);CHKERRQ(ierr); 2747534831adSStefano Zampini ierr = MatSetSizes(temp_mat,size_of_constraint,size_of_constraint,size_of_constraint,size_of_constraint);CHKERRQ(ierr); 2748534831adSStefano Zampini ierr = MatSeqAIJSetPreallocation(temp_mat,size_of_constraint,PETSC_NULL);CHKERRQ(ierr); 2749534831adSStefano Zampini } 2750534831adSStefano Zampini /* First _size_of_constraint-temp_constraints_ columns */ 2751534831adSStefano Zampini dual_dofs = size_of_constraint-temp_constraints; 2752534831adSStefano Zampini start_constraint = i+1-temp_constraints; 2753534831adSStefano Zampini for (s=0;s<dual_dofs;s++) { 2754534831adSStefano Zampini is_indices[0] = s; 2755534831adSStefano Zampini for (j=0;j<temp_constraints;j++) { 2756534831adSStefano Zampini for (k=0;k<temp_constraints;k++) { 2757534831adSStefano Zampini temp_basis[j*temp_constraints+k]=temp_quadrature_constraint[temp_indices[start_constraint+k]+s+j+1]; 2758534831adSStefano Zampini } 2759534831adSStefano 
Zampini work[j]=-temp_quadrature_constraint[temp_indices[start_constraint+j]+s]; 2760534831adSStefano Zampini is_indices[j+1]=s+j+1; 2761534831adSStefano Zampini } 2762534831adSStefano Zampini Bt = temp_constraints; 2763534831adSStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 2764534831adSStefano Zampini LAPACKgesv_(&Bt,&Bone,temp_basis,&Bt,ipiv,work,&Bt,&lierr); 2765534831adSStefano Zampini if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GESV Lapack routine %d",(int)lierr); 2766534831adSStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 2767534831adSStefano Zampini j = temp_indices_to_constraint_B[temp_indices[start_constraint]+s]; 2768534831adSStefano Zampini ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,temp_constraints,&temp_indices_to_constraint_B[temp_indices[start_constraint]+s+1],1,&j,work,INSERT_VALUES);CHKERRQ(ierr); 2769534831adSStefano Zampini if (useksp) { 2770534831adSStefano Zampini /* temp mat with transposed rows and columns */ 2771534831adSStefano Zampini ierr = MatSetValues(temp_mat,1,&s,temp_constraints,&is_indices[1],work,INSERT_VALUES);CHKERRQ(ierr); 2772534831adSStefano Zampini ierr = MatSetValue(temp_mat,is_indices[0],is_indices[0],1.0,INSERT_VALUES);CHKERRQ(ierr); 2773534831adSStefano Zampini } 2774534831adSStefano Zampini } 2775534831adSStefano Zampini if (useksp) { 2776534831adSStefano Zampini /* last rows of temp_mat */ 2777534831adSStefano Zampini for (j=0;j<size_of_constraint;j++) { 2778534831adSStefano Zampini is_indices[j] = j; 2779534831adSStefano Zampini } 2780534831adSStefano Zampini for (s=0;s<temp_constraints;s++) { 2781534831adSStefano Zampini k = s + dual_dofs; 2782534831adSStefano Zampini ierr = MatSetValues(temp_mat,1,&k,size_of_constraint,is_indices,&temp_quadrature_constraint[temp_indices[start_constraint+s]],INSERT_VALUES);CHKERRQ(ierr); 2783534831adSStefano Zampini } 2784534831adSStefano Zampini ierr = MatAssemblyBegin(temp_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 
2785534831adSStefano Zampini ierr = MatAssemblyEnd(temp_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2786534831adSStefano Zampini ierr = MatGetVecs(temp_mat,&temp_vec,PETSC_NULL);CHKERRQ(ierr); 2787534831adSStefano Zampini ierr = KSPCreate(PETSC_COMM_SELF,&temp_ksp);CHKERRQ(ierr); 2788534831adSStefano Zampini ierr = KSPSetOperators(temp_ksp,temp_mat,temp_mat,SAME_PRECONDITIONER);CHKERRQ(ierr); 2789534831adSStefano Zampini ierr = KSPSetType(temp_ksp,KSPPREONLY);CHKERRQ(ierr); 2790ffe5efe1SStefano Zampini ierr = KSPGetPC(temp_ksp,&temp_pc);CHKERRQ(ierr); 2791ffe5efe1SStefano Zampini ierr = PCSetType(temp_pc,PCLU);CHKERRQ(ierr); 2792534831adSStefano Zampini ierr = KSPSetUp(temp_ksp);CHKERRQ(ierr); 2793534831adSStefano Zampini for (s=0;s<temp_constraints;s++) { 2794534831adSStefano Zampini ierr = VecSet(temp_vec,0.0);CHKERRQ(ierr); 2795534831adSStefano Zampini ierr = VecSetValue(temp_vec,s+dual_dofs,1.0,INSERT_VALUES);CHKERRQ(ierr); 2796534831adSStefano Zampini ierr = VecAssemblyBegin(temp_vec);CHKERRQ(ierr); 2797534831adSStefano Zampini ierr = VecAssemblyEnd(temp_vec);CHKERRQ(ierr); 2798534831adSStefano Zampini ierr = KSPSolve(temp_ksp,temp_vec,temp_vec);CHKERRQ(ierr); 2799534831adSStefano Zampini ierr = VecGetArray(temp_vec,&array_vector);CHKERRQ(ierr); 2800534831adSStefano Zampini j = temp_indices_to_constraint_B[temp_indices[start_constraint+s]+size_of_constraint-s-1]; 2801534831adSStefano Zampini /* last columns of change of basis matrix associated to new primal dofs */ 2802534831adSStefano Zampini ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,size_of_constraint,&temp_indices_to_constraint_B[temp_indices[start_constraint+s]],1,&j,array_vector,INSERT_VALUES);CHKERRQ(ierr); 2803534831adSStefano Zampini ierr = VecRestoreArray(temp_vec,&array_vector);CHKERRQ(ierr); 2804534831adSStefano Zampini } 2805534831adSStefano Zampini ierr = MatDestroy(&temp_mat);CHKERRQ(ierr); 2806534831adSStefano Zampini ierr = KSPDestroy(&temp_ksp);CHKERRQ(ierr); 2807534831adSStefano Zampini ierr 
= VecDestroy(&temp_vec);CHKERRQ(ierr); 2808534831adSStefano Zampini } else { 2809534831adSStefano Zampini /* last columns of change of basis matrix associated to new primal dofs */ 2810534831adSStefano Zampini for (s=0;s<temp_constraints;s++) { 2811534831adSStefano Zampini j = temp_indices_to_constraint_B[temp_indices[start_constraint+s]+size_of_constraint-s-1]; 2812534831adSStefano Zampini ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,size_of_constraint,&temp_indices_to_constraint_B[temp_indices[start_constraint+s]],1,&j,&temp_quadrature_constraint[temp_indices[start_constraint+s]],INSERT_VALUES);CHKERRQ(ierr); 2813534831adSStefano Zampini } 2814534831adSStefano Zampini } 2815534831adSStefano Zampini /* prepare for the next cycle */ 2816534831adSStefano Zampini temp_constraints = 0; 281704eaf177SStefano Zampini if (i != local_primal_size -1 ) { 2818534831adSStefano Zampini temp_start_ptr = temp_indices_to_constraint_B[temp_indices[i+1]]; 2819534831adSStefano Zampini } 2820534831adSStefano Zampini } 2821534831adSStefano Zampini } 282204eaf177SStefano Zampini } 2823534831adSStefano Zampini /* assembling */ 2824534831adSStefano Zampini ierr = MatAssemblyBegin(pcbddc->ChangeOfBasisMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2825534831adSStefano Zampini ierr = MatAssemblyEnd(pcbddc->ChangeOfBasisMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2826534831adSStefano Zampini ierr = PetscFree(ipiv);CHKERRQ(ierr); 2827534831adSStefano Zampini ierr = PetscFree(is_indices);CHKERRQ(ierr); 2828534831adSStefano Zampini } 28293b03a366Sstefano_zampini /* free workspace no longer needed */ 28303b03a366Sstefano_zampini ierr = PetscFree(rwork);CHKERRQ(ierr); 28313b03a366Sstefano_zampini ierr = PetscFree(work);CHKERRQ(ierr); 28323b03a366Sstefano_zampini ierr = PetscFree(temp_basis);CHKERRQ(ierr); 28333b03a366Sstefano_zampini ierr = PetscFree(singular_vals);CHKERRQ(ierr); 28343b03a366Sstefano_zampini ierr = PetscFree(correlation_mat);CHKERRQ(ierr); 28353b03a366Sstefano_zampini ierr = 
PetscFree(temp_indices);CHKERRQ(ierr); 2836534831adSStefano Zampini ierr = PetscFree(change_basis);CHKERRQ(ierr); 28373b03a366Sstefano_zampini ierr = PetscFree(temp_indices_to_constraint);CHKERRQ(ierr); 2838534831adSStefano Zampini ierr = PetscFree(temp_indices_to_constraint_B);CHKERRQ(ierr); 2839534831adSStefano Zampini ierr = PetscFree(local_to_B);CHKERRQ(ierr); 28403b03a366Sstefano_zampini ierr = PetscFree(temp_quadrature_constraint);CHKERRQ(ierr); 28413425bc38SStefano Zampini #if defined(PETSC_MISSING_LAPACK_GESVD) 28423425bc38SStefano Zampini ierr = PetscFree(iwork);CHKERRQ(ierr); 28433425bc38SStefano Zampini ierr = PetscFree(ifail);CHKERRQ(ierr); 28443425bc38SStefano Zampini ierr = PetscFree(singular_vectors);CHKERRQ(ierr); 28453425bc38SStefano Zampini #endif 2846da1bb401SStefano Zampini for (k=0;k<nnsp_size;k++) { 2847da1bb401SStefano Zampini ierr = VecDestroy(&localnearnullsp[k]);CHKERRQ(ierr); 2848da1bb401SStefano Zampini } 28493b03a366Sstefano_zampini ierr = PetscFree(localnearnullsp);CHKERRQ(ierr); 28503b03a366Sstefano_zampini PetscFunctionReturn(0); 28513b03a366Sstefano_zampini } 28523b03a366Sstefano_zampini /* -------------------------------------------------------------------------- */ 28530c7d97c5SJed Brown #undef __FUNCT__ 28540c7d97c5SJed Brown #define __FUNCT__ "PCBDDCCoarseSetUp" 285553cdbc3dSStefano Zampini static PetscErrorCode PCBDDCCoarseSetUp(PC pc) 28560c7d97c5SJed Brown { 28570c7d97c5SJed Brown PetscErrorCode ierr; 28580c7d97c5SJed Brown 28590c7d97c5SJed Brown PC_IS* pcis = (PC_IS*)(pc->data); 28600c7d97c5SJed Brown PC_BDDC* pcbddc = (PC_BDDC*)pc->data; 28610c7d97c5SJed Brown Mat_IS *matis = (Mat_IS*)pc->pmat->data; 2862534831adSStefano Zampini Mat change_mat_all; 28630c7d97c5SJed Brown IS is_R_local; 28640c7d97c5SJed Brown IS is_V_local; 28650c7d97c5SJed Brown IS is_C_local; 28660c7d97c5SJed Brown IS is_aux1; 28670c7d97c5SJed Brown IS is_aux2; 286819fd82e9SBarry Smith VecType impVecType; 286919fd82e9SBarry Smith MatType impMatType; 
28700c7d97c5SJed Brown PetscInt n_R=0; 28710c7d97c5SJed Brown PetscInt n_D=0; 28720c7d97c5SJed Brown PetscInt n_B=0; 28730c7d97c5SJed Brown PetscScalar zero=0.0; 28740c7d97c5SJed Brown PetscScalar one=1.0; 28750c7d97c5SJed Brown PetscScalar m_one=-1.0; 28760c7d97c5SJed Brown PetscScalar* array; 28770c7d97c5SJed Brown PetscScalar *coarse_submat_vals; 28780c7d97c5SJed Brown PetscInt *idx_R_local; 28790c7d97c5SJed Brown PetscInt *idx_V_B; 28800c7d97c5SJed Brown PetscScalar *coarsefunctions_errors; 28810c7d97c5SJed Brown PetscScalar *constraints_errors; 28820c7d97c5SJed Brown /* auxiliary indices */ 2883534831adSStefano Zampini PetscInt i,j,k; 2884e269702eSStefano Zampini /* for verbose output of bddc */ 2885e269702eSStefano Zampini PetscViewer viewer=pcbddc->dbg_viewer; 2886e269702eSStefano Zampini PetscBool dbg_flag=pcbddc->dbg_flag; 2887a0ba757dSStefano Zampini /* for counting coarse dofs */ 2888534831adSStefano Zampini PetscInt n_vertices,n_constraints; 28893b03a366Sstefano_zampini PetscInt size_of_constraint; 28903b03a366Sstefano_zampini PetscInt *row_cmat_indices; 28913b03a366Sstefano_zampini PetscScalar *row_cmat_values; 2892534831adSStefano Zampini PetscInt *vertices,*nnz,*is_indices,*temp_indices; 28930c7d97c5SJed Brown 28940c7d97c5SJed Brown PetscFunctionBegin; 28950c7d97c5SJed Brown /* Set Non-overlapping dimensions */ 28960c7d97c5SJed Brown n_B = pcis->n_B; n_D = pcis->n - n_B; 2897534831adSStefano Zampini /* Set types for local objects needed by BDDC precondtioner */ 2898534831adSStefano Zampini impMatType = MATSEQDENSE; 2899534831adSStefano Zampini impVecType = VECSEQ; 2900da1bb401SStefano Zampini /* get vertex indices from constraint matrix */ 2901534831adSStefano Zampini ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscInt),&vertices);CHKERRQ(ierr); 2902534831adSStefano Zampini n_vertices=0; 2903da1bb401SStefano Zampini for (i=0;i<pcbddc->local_primal_size;i++) { 2904da1bb401SStefano Zampini ierr = 
MatGetRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr); 2905da1bb401SStefano Zampini if (size_of_constraint == 1) { 2906534831adSStefano Zampini vertices[n_vertices]=row_cmat_indices[0]; 2907534831adSStefano Zampini n_vertices++; 2908a0ba757dSStefano Zampini } 2909da1bb401SStefano Zampini ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr); 2910a0ba757dSStefano Zampini } 2911534831adSStefano Zampini /* Set number of constraints */ 2912534831adSStefano Zampini n_constraints = pcbddc->local_primal_size-n_vertices; 2913534831adSStefano Zampini 2914534831adSStefano Zampini /* vertices in boundary numbering */ 2915534831adSStefano Zampini if (n_vertices) { 2916534831adSStefano Zampini ierr = VecSet(pcis->vec1_N,m_one);CHKERRQ(ierr); 2917534831adSStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 2918534831adSStefano Zampini for (i=0; i<n_vertices; i++) { array[ vertices[i] ] = i; } 2919534831adSStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 2920534831adSStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 2921534831adSStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 2922534831adSStefano Zampini ierr = PetscMalloc(n_vertices*sizeof(PetscInt),&idx_V_B);CHKERRQ(ierr); 2923534831adSStefano Zampini ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr); 2924534831adSStefano Zampini for (i=0; i<n_vertices; i++) { 2925534831adSStefano Zampini j=0; 2926534831adSStefano Zampini while (array[j] != i ) {j++;} 2927534831adSStefano Zampini idx_V_B[i]=j; 2928534831adSStefano Zampini } 2929534831adSStefano Zampini ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr); 2930534831adSStefano Zampini } 2931534831adSStefano Zampini 2932534831adSStefano 
Zampini /* transform local matrices if needed */ 2933534831adSStefano Zampini if (pcbddc->usechangeofbasis) { 2934534831adSStefano Zampini ierr = PetscMalloc(pcis->n*sizeof(PetscInt),&nnz);CHKERRQ(ierr); 2935534831adSStefano Zampini ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 2936534831adSStefano Zampini for (i=0;i<n_D;i++) { 2937534831adSStefano Zampini nnz[is_indices[i]]=1; 2938534831adSStefano Zampini } 2939534831adSStefano Zampini ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 2940534831adSStefano Zampini ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 2941534831adSStefano Zampini k=1; 2942534831adSStefano Zampini for (i=0;i<n_B;i++) { 2943534831adSStefano Zampini ierr = MatGetRow(pcbddc->ChangeOfBasisMatrix,i,&j,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr); 2944534831adSStefano Zampini nnz[is_indices[i]]=j; 2945534831adSStefano Zampini if ( k < j) { 2946534831adSStefano Zampini k = j; 2947534831adSStefano Zampini } 2948534831adSStefano Zampini ierr = MatRestoreRow(pcbddc->ChangeOfBasisMatrix,i,&j,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr); 2949534831adSStefano Zampini } 2950534831adSStefano Zampini ierr = ISRestoreIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 2951534831adSStefano Zampini /* assemble change of basis matrix on the whole set of local dofs */ 2952534831adSStefano Zampini ierr = PetscMalloc(k*sizeof(PetscInt),&temp_indices);CHKERRQ(ierr); 2953534831adSStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&change_mat_all);CHKERRQ(ierr); 2954534831adSStefano Zampini ierr = MatSetSizes(change_mat_all,pcis->n,pcis->n,pcis->n,pcis->n);CHKERRQ(ierr); 2955534831adSStefano Zampini ierr = MatSetType(change_mat_all,MATSEQAIJ);CHKERRQ(ierr); 2956534831adSStefano Zampini ierr = MatSeqAIJSetPreallocation(change_mat_all,0,nnz);CHKERRQ(ierr); 2957534831adSStefano Zampini ierr = ISGetIndices(pcis->is_I_local,(const 
PetscInt**)&is_indices);CHKERRQ(ierr); 2958534831adSStefano Zampini for (i=0;i<n_D;i++) { 2959534831adSStefano Zampini ierr = MatSetValue(change_mat_all,is_indices[i],is_indices[i],1.0,INSERT_VALUES);CHKERRQ(ierr); 2960534831adSStefano Zampini } 2961534831adSStefano Zampini ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 2962534831adSStefano Zampini ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 2963534831adSStefano Zampini for (i=0;i<n_B;i++) { 2964534831adSStefano Zampini ierr = MatGetRow(pcbddc->ChangeOfBasisMatrix,i,&j,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr); 2965534831adSStefano Zampini for (k=0;k<j;k++) { 2966534831adSStefano Zampini temp_indices[k]=is_indices[row_cmat_indices[k]]; 2967534831adSStefano Zampini } 2968534831adSStefano Zampini ierr = MatSetValues(change_mat_all,1,&is_indices[i],j,temp_indices,row_cmat_values,INSERT_VALUES);CHKERRQ(ierr); 2969534831adSStefano Zampini ierr = MatRestoreRow(pcbddc->ChangeOfBasisMatrix,i,&j,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr); 2970534831adSStefano Zampini } 2971534831adSStefano Zampini ierr = MatAssemblyBegin(change_mat_all,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2972534831adSStefano Zampini ierr = MatAssemblyEnd(change_mat_all,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2973534831adSStefano Zampini ierr = MatPtAP(matis->A,change_mat_all,MAT_INITIAL_MATRIX,1.0,&pcbddc->local_mat);CHKERRQ(ierr); 2974534831adSStefano Zampini ierr = MatDestroy(&pcis->A_IB);CHKERRQ(ierr); 2975534831adSStefano Zampini ierr = MatDestroy(&pcis->A_BI);CHKERRQ(ierr); 2976534831adSStefano Zampini ierr = MatDestroy(&pcis->A_BB);CHKERRQ(ierr); 2977534831adSStefano Zampini ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_I_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&pcis->A_IB);CHKERRQ(ierr); 2978534831adSStefano Zampini ierr = 
MatGetSubMatrix(pcbddc->local_mat,pcis->is_B_local,pcis->is_I_local,MAT_INITIAL_MATRIX,&pcis->A_BI);CHKERRQ(ierr); 2979534831adSStefano Zampini ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_B_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&pcis->A_BB);CHKERRQ(ierr); 2980534831adSStefano Zampini ierr = MatDestroy(&change_mat_all);CHKERRQ(ierr); 2981534831adSStefano Zampini ierr = PetscFree(nnz);CHKERRQ(ierr); 2982534831adSStefano Zampini ierr = PetscFree(temp_indices);CHKERRQ(ierr); 2983534831adSStefano Zampini } else { 2984534831adSStefano Zampini /* without change of basis, the local matrix is unchanged */ 2985534831adSStefano Zampini ierr = PetscObjectReference((PetscObject)matis->A);CHKERRQ(ierr); 2986534831adSStefano Zampini pcbddc->local_mat = matis->A; 2987534831adSStefano Zampini } 29880bdf917eSStefano Zampini /* Change global null space passed in by the user if change of basis has been performed */ 29890bdf917eSStefano Zampini if (pcbddc->NullSpace && pcbddc->usechangeofbasis) { 29900bdf917eSStefano Zampini ierr = PCBDDCAdaptNullSpace(pc);CHKERRQ(ierr); 29910bdf917eSStefano Zampini } 2992a0ba757dSStefano Zampini 29930c7d97c5SJed Brown /* Dohrmann's notation: dofs splitted in R (Remaining: all dofs but the vertices) and V (Vertices) */ 29940c7d97c5SJed Brown ierr = VecSet(pcis->vec1_N,one);CHKERRQ(ierr); 29950c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 29963b03a366Sstefano_zampini for (i=0;i<n_vertices;i++) { array[ vertices[i] ] = zero; } 29973b03a366Sstefano_zampini ierr = PetscMalloc(( pcis->n - n_vertices )*sizeof(PetscInt),&idx_R_local);CHKERRQ(ierr); 29980c7d97c5SJed Brown for (i=0, n_R=0; i<pcis->n; i++) { if (array[i] == one) { idx_R_local[n_R] = i; n_R++; } } 29990c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 3000e269702eSStefano Zampini if (dbg_flag) { 30010c7d97c5SJed Brown ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr); 
30020c7d97c5SJed Brown ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 30030c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d local dimensions\n",PetscGlobalRank);CHKERRQ(ierr); 30040c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local_size = %d, dirichlet_size = %d, boundary_size = %d\n",pcis->n,n_D,n_B);CHKERRQ(ierr); 30053b03a366Sstefano_zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"r_size = %d, v_size = %d, constraints = %d, local_primal_size = %d\n",n_R,n_vertices,n_constraints,pcbddc->local_primal_size);CHKERRQ(ierr); 3006534831adSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"pcbddc->n_vertices = %d, pcbddc->n_constraints = %d\n",pcbddc->n_vertices,pcbddc->n_constraints);CHKERRQ(ierr); 30070c7d97c5SJed Brown ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 30080c7d97c5SJed Brown } 3009534831adSStefano Zampini 30100c7d97c5SJed Brown /* Allocate needed vectors */ 3011534831adSStefano Zampini ierr = VecDuplicate(pcis->vec1_global,&pcbddc->original_rhs);CHKERRQ(ierr); 30123972b0daSStefano Zampini ierr = VecDuplicate(pcis->vec1_global,&pcbddc->temp_solution);CHKERRQ(ierr); 30130c7d97c5SJed Brown ierr = VecDuplicate(pcis->vec1_D,&pcbddc->vec4_D);CHKERRQ(ierr); 30140c7d97c5SJed Brown ierr = VecCreate(PETSC_COMM_SELF,&pcbddc->vec1_R);CHKERRQ(ierr); 30150c7d97c5SJed Brown ierr = VecSetSizes(pcbddc->vec1_R,n_R,n_R);CHKERRQ(ierr); 30160c7d97c5SJed Brown ierr = VecSetType(pcbddc->vec1_R,impVecType);CHKERRQ(ierr); 3017d49ef151SStefano Zampini ierr = VecDuplicate(pcbddc->vec1_R,&pcbddc->vec2_R);CHKERRQ(ierr); 30180c7d97c5SJed Brown ierr = VecCreate(PETSC_COMM_SELF,&pcbddc->vec1_P);CHKERRQ(ierr); 30190c7d97c5SJed Brown ierr = VecSetSizes(pcbddc->vec1_P,pcbddc->local_primal_size,pcbddc->local_primal_size);CHKERRQ(ierr); 30200c7d97c5SJed Brown ierr = VecSetType(pcbddc->vec1_P,impVecType);CHKERRQ(ierr); 30210c7d97c5SJed Brown 30220c7d97c5SJed Brown /* Creating some index sets needed */ 
30230c7d97c5SJed Brown /* For submatrices */ 3024da1bb401SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,n_R,idx_R_local,PETSC_OWN_POINTER,&is_R_local);CHKERRQ(ierr); 30253b03a366Sstefano_zampini if (n_vertices) { 3026da1bb401SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,n_vertices,vertices,PETSC_OWN_POINTER,&is_V_local);CHKERRQ(ierr); 30273b03a366Sstefano_zampini } 3028da1bb401SStefano Zampini if (n_constraints) { 3029da1bb401SStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,n_constraints,n_vertices,1,&is_C_local);CHKERRQ(ierr); 3030da1bb401SStefano Zampini } 3031da1bb401SStefano Zampini 30320c7d97c5SJed Brown /* For VecScatters pcbddc->R_to_B and (optionally) pcbddc->R_to_D */ 30330c7d97c5SJed Brown { 30340c7d97c5SJed Brown PetscInt *aux_array1; 30350c7d97c5SJed Brown PetscInt *aux_array2; 30362e8d2280SStefano Zampini PetscInt *idx_I_local; 30370c7d97c5SJed Brown 30383b03a366Sstefano_zampini ierr = PetscMalloc( (pcis->n_B-n_vertices)*sizeof(PetscInt),&aux_array1);CHKERRQ(ierr); 30393b03a366Sstefano_zampini ierr = PetscMalloc( (pcis->n_B-n_vertices)*sizeof(PetscInt),&aux_array2);CHKERRQ(ierr); 30400c7d97c5SJed Brown 30412e8d2280SStefano Zampini ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&idx_I_local);CHKERRQ(ierr); 30420c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 30432e8d2280SStefano Zampini for (i=0; i<n_D; i++) { array[idx_I_local[i]] = 0; } 30442e8d2280SStefano Zampini ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&idx_I_local);CHKERRQ(ierr); 30452e8d2280SStefano Zampini for (i=0, j=0; i<n_R; i++) { if ( array[idx_R_local[i]] == one ) { aux_array1[j] = i; j++; } } 30460c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 3047da1bb401SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_COPY_VALUES,&is_aux1);CHKERRQ(ierr); 30482e8d2280SStefano Zampini ierr = 
VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 30492e8d2280SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 30500c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr); 30512e8d2280SStefano Zampini for (i=0, j=0; i<n_B; i++) { if ( array[i] == one ) { aux_array2[j] = i; j++; } } 30523828260eSStefano Zampini ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr); 3053da1bb401SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array2,PETSC_COPY_VALUES,&is_aux2);CHKERRQ(ierr); 30540c7d97c5SJed Brown ierr = VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_B,is_aux2,&pcbddc->R_to_B);CHKERRQ(ierr); 30550c7d97c5SJed Brown ierr = PetscFree(aux_array1);CHKERRQ(ierr); 30560c7d97c5SJed Brown ierr = PetscFree(aux_array2);CHKERRQ(ierr); 30570c7d97c5SJed Brown ierr = ISDestroy(&is_aux1);CHKERRQ(ierr); 30580c7d97c5SJed Brown ierr = ISDestroy(&is_aux2);CHKERRQ(ierr); 30590c7d97c5SJed Brown 3060e269702eSStefano Zampini if (pcbddc->prec_type || dbg_flag ) { 30610c7d97c5SJed Brown ierr = PetscMalloc(n_D*sizeof(PetscInt),&aux_array1);CHKERRQ(ierr); 30620c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 30632e8d2280SStefano Zampini for (i=0, j=0; i<n_R; i++) { if (array[idx_R_local[i]] == zero) { aux_array1[j] = i; j++; } } 30640c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 3065da1bb401SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_COPY_VALUES,&is_aux1);CHKERRQ(ierr); 30660c7d97c5SJed Brown ierr = VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_D,(IS)0,&pcbddc->R_to_D);CHKERRQ(ierr); 30670c7d97c5SJed Brown ierr = PetscFree(aux_array1);CHKERRQ(ierr); 30680c7d97c5SJed Brown ierr = ISDestroy(&is_aux1);CHKERRQ(ierr); 30690c7d97c5SJed Brown } 30700c7d97c5SJed Brown } 30710c7d97c5SJed Brown 30720c7d97c5SJed Brown /* Creating PC contexts for local 
Dirichlet and Neumann problems */ 30730c7d97c5SJed Brown { 30740c7d97c5SJed Brown Mat A_RR; 307553cdbc3dSStefano Zampini PC pc_temp; 30760c7d97c5SJed Brown /* Matrix for Dirichlet problem is A_II -> we already have it from pcis.c code */ 307753cdbc3dSStefano Zampini ierr = KSPCreate(PETSC_COMM_SELF,&pcbddc->ksp_D);CHKERRQ(ierr); 307853cdbc3dSStefano Zampini ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->ksp_D,(PetscObject)pc,1);CHKERRQ(ierr); 307953cdbc3dSStefano Zampini ierr = KSPSetOperators(pcbddc->ksp_D,pcis->A_II,pcis->A_II,SAME_PRECONDITIONER);CHKERRQ(ierr); 308053cdbc3dSStefano Zampini ierr = KSPSetType(pcbddc->ksp_D,KSPPREONLY);CHKERRQ(ierr); 3081da1bb401SStefano Zampini ierr = KSPSetOptionsPrefix(pcbddc->ksp_D,"dirichlet_");CHKERRQ(ierr); 30820c7d97c5SJed Brown /* default */ 308353cdbc3dSStefano Zampini ierr = KSPGetPC(pcbddc->ksp_D,&pc_temp);CHKERRQ(ierr); 308453cdbc3dSStefano Zampini ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr); 30850c7d97c5SJed Brown /* Allow user's customization */ 308653cdbc3dSStefano Zampini ierr = KSPSetFromOptions(pcbddc->ksp_D);CHKERRQ(ierr); 3087950d796eSStefano Zampini /* umfpack interface has a bug when matrix dimension is zero */ 3088950d796eSStefano Zampini if (!n_D) { 30892e8d2280SStefano Zampini ierr = PCSetType(pc_temp,PCNONE);CHKERRQ(ierr); 3090950d796eSStefano Zampini } 309153cdbc3dSStefano Zampini /* Set Up KSP for Dirichlet problem of BDDC */ 309253cdbc3dSStefano Zampini ierr = KSPSetUp(pcbddc->ksp_D);CHKERRQ(ierr); 30933972b0daSStefano Zampini /* set ksp_D into pcis data */ 30943972b0daSStefano Zampini ierr = KSPDestroy(&pcis->ksp_D);CHKERRQ(ierr); 30953972b0daSStefano Zampini ierr = PetscObjectReference((PetscObject)pcbddc->ksp_D);CHKERRQ(ierr); 30963972b0daSStefano Zampini pcis->ksp_D = pcbddc->ksp_D; 30970c7d97c5SJed Brown /* Matrix for Neumann problem is A_RR -> we need to create it */ 3098534831adSStefano Zampini ierr = 
MatGetSubMatrix(pcbddc->local_mat,is_R_local,is_R_local,MAT_INITIAL_MATRIX,&A_RR);CHKERRQ(ierr); 309953cdbc3dSStefano Zampini ierr = KSPCreate(PETSC_COMM_SELF,&pcbddc->ksp_R);CHKERRQ(ierr); 310053cdbc3dSStefano Zampini ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->ksp_R,(PetscObject)pc,1);CHKERRQ(ierr); 310153cdbc3dSStefano Zampini ierr = KSPSetOperators(pcbddc->ksp_R,A_RR,A_RR,SAME_PRECONDITIONER);CHKERRQ(ierr); 310253cdbc3dSStefano Zampini ierr = KSPSetType(pcbddc->ksp_R,KSPPREONLY);CHKERRQ(ierr); 3103da1bb401SStefano Zampini ierr = KSPSetOptionsPrefix(pcbddc->ksp_R,"neumann_");CHKERRQ(ierr); 31040c7d97c5SJed Brown /* default */ 310553cdbc3dSStefano Zampini ierr = KSPGetPC(pcbddc->ksp_R,&pc_temp);CHKERRQ(ierr); 310653cdbc3dSStefano Zampini ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr); 31070c7d97c5SJed Brown /* Allow user's customization */ 310853cdbc3dSStefano Zampini ierr = KSPSetFromOptions(pcbddc->ksp_R);CHKERRQ(ierr); 3109950d796eSStefano Zampini /* umfpack interface has a bug when matrix dimension is zero */ 3110950d796eSStefano Zampini if (!pcis->n) { 31112e8d2280SStefano Zampini ierr = PCSetType(pc_temp,PCNONE);CHKERRQ(ierr); 3112950d796eSStefano Zampini } 311353cdbc3dSStefano Zampini /* Set Up KSP for Neumann problem of BDDC */ 311453cdbc3dSStefano Zampini ierr = KSPSetUp(pcbddc->ksp_R);CHKERRQ(ierr); 3115a0ba757dSStefano Zampini /* check Dirichlet and Neumann solvers */ 3116b76ba322SStefano Zampini { 31170c7d97c5SJed Brown Vec temp_vec; 3118b76ba322SStefano Zampini PetscReal value; 3119b76ba322SStefano Zampini PetscMPIInt use_exact,use_exact_reduced; 31200c7d97c5SJed Brown 3121a0ba757dSStefano Zampini ierr = VecDuplicate(pcis->vec1_D,&temp_vec);CHKERRQ(ierr); 3122a0ba757dSStefano Zampini ierr = VecSetRandom(pcis->vec1_D,PETSC_NULL);CHKERRQ(ierr); 3123a0ba757dSStefano Zampini ierr = MatMult(pcis->A_II,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr); 3124a0ba757dSStefano Zampini ierr = KSPSolve(pcbddc->ksp_D,pcis->vec2_D,temp_vec);CHKERRQ(ierr); 
3125a0ba757dSStefano Zampini ierr = VecAXPY(temp_vec,m_one,pcis->vec1_D);CHKERRQ(ierr); 3126a0ba757dSStefano Zampini ierr = VecNorm(temp_vec,NORM_INFINITY,&value);CHKERRQ(ierr); 3127b76ba322SStefano Zampini use_exact = 1; 3128b76ba322SStefano Zampini if (PetscAbsReal(value) > 1.e-4) { 3129b76ba322SStefano Zampini use_exact = 0; 3130b76ba322SStefano Zampini } 3131b76ba322SStefano Zampini ierr = MPI_Allreduce(&use_exact,&use_exact_reduced,1,MPIU_INT,MPI_LAND,((PetscObject)pc)->comm);CHKERRQ(ierr); 3132b76ba322SStefano Zampini pcbddc->use_exact_dirichlet = (PetscBool) use_exact_reduced; 3133a0ba757dSStefano Zampini ierr = VecDestroy(&temp_vec);CHKERRQ(ierr); 3134b76ba322SStefano Zampini if (dbg_flag) { 3135a0ba757dSStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 3136a0ba757dSStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr); 3137a0ba757dSStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Checking solution of Dirichlet and Neumann problems\n");CHKERRQ(ierr); 3138a0ba757dSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d infinity error for Dirichlet solve = % 1.14e \n",PetscGlobalRank,value);CHKERRQ(ierr); 3139d49ef151SStefano Zampini ierr = VecDuplicate(pcbddc->vec1_R,&temp_vec);CHKERRQ(ierr); 3140d49ef151SStefano Zampini ierr = VecSetRandom(pcbddc->vec1_R,PETSC_NULL);CHKERRQ(ierr); 3141d49ef151SStefano Zampini ierr = MatMult(A_RR,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr); 3142d49ef151SStefano Zampini ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec2_R,temp_vec);CHKERRQ(ierr); 3143d49ef151SStefano Zampini ierr = VecAXPY(temp_vec,m_one,pcbddc->vec1_R);CHKERRQ(ierr); 3144d49ef151SStefano Zampini ierr = VecNorm(temp_vec,NORM_INFINITY,&value);CHKERRQ(ierr); 3145e269702eSStefano Zampini ierr = VecDestroy(&temp_vec);CHKERRQ(ierr); 31460c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d infinity error for Neumann solve = % 1.14e 
\n",PetscGlobalRank,value);CHKERRQ(ierr); 3147d49ef151SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 31480c7d97c5SJed Brown } 3149b76ba322SStefano Zampini } 31500c7d97c5SJed Brown /* free Neumann problem's matrix */ 31510c7d97c5SJed Brown ierr = MatDestroy(&A_RR);CHKERRQ(ierr); 31520c7d97c5SJed Brown } 31530c7d97c5SJed Brown 31540c7d97c5SJed Brown /* Assemble all remaining stuff needed to apply BDDC */ 31550c7d97c5SJed Brown { 31560c7d97c5SJed Brown Mat A_RV,A_VR,A_VV; 31570bdf917eSStefano Zampini Mat M1; 31580c7d97c5SJed Brown Mat C_CR; 31593b03a366Sstefano_zampini Mat AUXMAT; 31600c7d97c5SJed Brown Vec vec1_C; 31610c7d97c5SJed Brown Vec vec2_C; 31620c7d97c5SJed Brown Vec vec1_V; 31630c7d97c5SJed Brown Vec vec2_V; 31640c7d97c5SJed Brown PetscInt *nnz; 31650c7d97c5SJed Brown PetscInt *auxindices; 316653cdbc3dSStefano Zampini PetscInt index; 31670c7d97c5SJed Brown PetscScalar* array2; 31680c7d97c5SJed Brown MatFactorInfo matinfo; 31690c7d97c5SJed Brown 31700c7d97c5SJed Brown /* Allocating some extra storage just to be safe */ 31710c7d97c5SJed Brown ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&nnz);CHKERRQ(ierr); 31720c7d97c5SJed Brown ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&auxindices);CHKERRQ(ierr); 31730c7d97c5SJed Brown for (i=0;i<pcis->n;i++) {auxindices[i]=i;} 31740c7d97c5SJed Brown 31750c7d97c5SJed Brown /* some work vectors on vertices and/or constraints */ 31763b03a366Sstefano_zampini if (n_vertices) { 31770c7d97c5SJed Brown ierr = VecCreate(PETSC_COMM_SELF,&vec1_V);CHKERRQ(ierr); 31783b03a366Sstefano_zampini ierr = VecSetSizes(vec1_V,n_vertices,n_vertices);CHKERRQ(ierr); 31790c7d97c5SJed Brown ierr = VecSetType(vec1_V,impVecType);CHKERRQ(ierr); 31800c7d97c5SJed Brown ierr = VecDuplicate(vec1_V,&vec2_V);CHKERRQ(ierr); 31810c7d97c5SJed Brown } 3182534831adSStefano Zampini if (n_constraints) { 31830c7d97c5SJed Brown ierr = VecCreate(PETSC_COMM_SELF,&vec1_C);CHKERRQ(ierr); 3184534831adSStefano Zampini ierr = 
VecSetSizes(vec1_C,n_constraints,n_constraints);CHKERRQ(ierr); 31850c7d97c5SJed Brown ierr = VecSetType(vec1_C,impVecType);CHKERRQ(ierr); 31860c7d97c5SJed Brown ierr = VecDuplicate(vec1_C,&vec2_C);CHKERRQ(ierr); 31870c7d97c5SJed Brown ierr = VecDuplicate(vec1_C,&pcbddc->vec1_C);CHKERRQ(ierr); 31880c7d97c5SJed Brown } 31890c7d97c5SJed Brown /* Precompute stuffs needed for preprocessing and application of BDDC*/ 31903b03a366Sstefano_zampini if (n_constraints) { 31910c7d97c5SJed Brown ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->local_auxmat2);CHKERRQ(ierr); 31923b03a366Sstefano_zampini ierr = MatSetSizes(pcbddc->local_auxmat2,n_R,n_constraints,n_R,n_constraints);CHKERRQ(ierr); 31930c7d97c5SJed Brown ierr = MatSetType(pcbddc->local_auxmat2,impMatType);CHKERRQ(ierr); 31943b03a366Sstefano_zampini ierr = MatSeqDenseSetPreallocation(pcbddc->local_auxmat2,PETSC_NULL);CHKERRQ(ierr); 31950c7d97c5SJed Brown 319657a90decSStefano Zampini /* Create Constraint matrix on R nodes: C_{CR} */ 319757a90decSStefano Zampini ierr = MatGetSubMatrix(pcbddc->ConstraintMatrix,is_C_local,is_R_local,MAT_INITIAL_MATRIX,&C_CR);CHKERRQ(ierr); 319857a90decSStefano Zampini ierr = ISDestroy(&is_C_local);CHKERRQ(ierr); 319957a90decSStefano Zampini 32000c7d97c5SJed Brown /* Assemble local_auxmat2 = - A_{RR}^{-1} C^T_{CR} needed by BDDC application */ 32013b03a366Sstefano_zampini for (i=0;i<n_constraints;i++) { 32023b03a366Sstefano_zampini ierr = VecSet(pcbddc->vec1_R,zero);CHKERRQ(ierr); 32033b03a366Sstefano_zampini /* Get row of constraint matrix in R numbering */ 320457a90decSStefano Zampini ierr = VecGetArray(pcbddc->vec1_R,&array);CHKERRQ(ierr); 320557a90decSStefano Zampini ierr = MatGetRow(C_CR,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr); 32063b03a366Sstefano_zampini for (j=0;j<size_of_constraint;j++) { array[ row_cmat_indices[j] ] = - row_cmat_values[j]; } 320757a90decSStefano Zampini ierr = 
MatRestoreRow(C_CR,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr); 320857a90decSStefano Zampini ierr = VecRestoreArray(pcbddc->vec1_R,&array);CHKERRQ(ierr); 32093b03a366Sstefano_zampini /* Solve for row of constraint matrix in R numbering */ 321053cdbc3dSStefano Zampini ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr); 32113b03a366Sstefano_zampini /* Set values */ 32120c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec2_R,&array);CHKERRQ(ierr); 32133b03a366Sstefano_zampini ierr = MatSetValues(pcbddc->local_auxmat2,n_R,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr); 32140c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec2_R,&array);CHKERRQ(ierr); 32150c7d97c5SJed Brown } 32160c7d97c5SJed Brown ierr = MatAssemblyBegin(pcbddc->local_auxmat2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 32170c7d97c5SJed Brown ierr = MatAssemblyEnd(pcbddc->local_auxmat2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 32180c7d97c5SJed Brown 32190c7d97c5SJed Brown /* Assemble AUXMAT = ( LUFactor )( -C_{CR} A_{RR}^{-1} C^T_{CR} )^{-1} */ 32200c7d97c5SJed Brown ierr = MatMatMult(C_CR,pcbddc->local_auxmat2,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&AUXMAT);CHKERRQ(ierr); 3221d49ef151SStefano Zampini ierr = MatFactorInfoInitialize(&matinfo);CHKERRQ(ierr); 32223b03a366Sstefano_zampini ierr = ISCreateStride(PETSC_COMM_SELF,n_constraints,0,1,&is_aux1);CHKERRQ(ierr); 32230c7d97c5SJed Brown ierr = MatLUFactor(AUXMAT,is_aux1,is_aux1,&matinfo);CHKERRQ(ierr); 32240c7d97c5SJed Brown ierr = ISDestroy(&is_aux1);CHKERRQ(ierr); 32250c7d97c5SJed Brown 32263b03a366Sstefano_zampini /* Assemble explicitly M1 = ( C_{CR} A_{RR}^{-1} C^T_{CR} )^{-1} needed in preproc */ 3227d49ef151SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&M1);CHKERRQ(ierr); 32283b03a366Sstefano_zampini ierr = MatSetSizes(M1,n_constraints,n_constraints,n_constraints,n_constraints);CHKERRQ(ierr); 32290c7d97c5SJed Brown ierr = MatSetType(M1,impMatType);CHKERRQ(ierr); 
32303b03a366Sstefano_zampini ierr = MatSeqDenseSetPreallocation(M1,PETSC_NULL);CHKERRQ(ierr); 32313b03a366Sstefano_zampini for (i=0;i<n_constraints;i++) { 32320c7d97c5SJed Brown ierr = VecSet(vec1_C,zero);CHKERRQ(ierr); 32330c7d97c5SJed Brown ierr = VecSetValue(vec1_C,i,one,INSERT_VALUES);CHKERRQ(ierr); 32340c7d97c5SJed Brown ierr = VecAssemblyBegin(vec1_C);CHKERRQ(ierr); 32350c7d97c5SJed Brown ierr = VecAssemblyEnd(vec1_C);CHKERRQ(ierr); 32360c7d97c5SJed Brown ierr = MatSolve(AUXMAT,vec1_C,vec2_C);CHKERRQ(ierr); 32370c7d97c5SJed Brown ierr = VecScale(vec2_C,m_one);CHKERRQ(ierr); 32380c7d97c5SJed Brown ierr = VecGetArray(vec2_C,&array);CHKERRQ(ierr); 32393b03a366Sstefano_zampini ierr = MatSetValues(M1,n_constraints,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr); 32400c7d97c5SJed Brown ierr = VecRestoreArray(vec2_C,&array);CHKERRQ(ierr); 32410c7d97c5SJed Brown } 32420c7d97c5SJed Brown ierr = MatAssemblyBegin(M1,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 32430c7d97c5SJed Brown ierr = MatAssemblyEnd(M1,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 32440c7d97c5SJed Brown ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr); 32450c7d97c5SJed Brown /* Assemble local_auxmat1 = M1*C_{CR} needed by BDDC application in KSP and in preproc */ 32460c7d97c5SJed Brown ierr = MatMatMult(M1,C_CR,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&pcbddc->local_auxmat1);CHKERRQ(ierr); 32470c7d97c5SJed Brown 32480c7d97c5SJed Brown } 32490c7d97c5SJed Brown 32500c7d97c5SJed Brown /* Get submatrices from subdomain matrix */ 32513b03a366Sstefano_zampini if (n_vertices){ 3252534831adSStefano Zampini ierr = MatGetSubMatrix(pcbddc->local_mat,is_R_local,is_V_local,MAT_INITIAL_MATRIX,&A_RV);CHKERRQ(ierr); 3253534831adSStefano Zampini ierr = MatGetSubMatrix(pcbddc->local_mat,is_V_local,is_R_local,MAT_INITIAL_MATRIX,&A_VR);CHKERRQ(ierr); 3254534831adSStefano Zampini ierr = MatGetSubMatrix(pcbddc->local_mat,is_V_local,is_V_local,MAT_INITIAL_MATRIX,&A_VV);CHKERRQ(ierr); 32550c7d97c5SJed Brown } 32560c7d97c5SJed Brown 32570c7d97c5SJed Brown 
/* Matrix of coarse basis functions (local) */ 3258d49ef151SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->coarse_phi_B);CHKERRQ(ierr); 32590c7d97c5SJed Brown ierr = MatSetSizes(pcbddc->coarse_phi_B,n_B,pcbddc->local_primal_size,n_B,pcbddc->local_primal_size);CHKERRQ(ierr); 32600c7d97c5SJed Brown ierr = MatSetType(pcbddc->coarse_phi_B,impMatType);CHKERRQ(ierr); 32613b03a366Sstefano_zampini ierr = MatSeqDenseSetPreallocation(pcbddc->coarse_phi_B,PETSC_NULL);CHKERRQ(ierr); 3262e269702eSStefano Zampini if (pcbddc->prec_type || dbg_flag ) { 3263d49ef151SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->coarse_phi_D);CHKERRQ(ierr); 32640c7d97c5SJed Brown ierr = MatSetSizes(pcbddc->coarse_phi_D,n_D,pcbddc->local_primal_size,n_D,pcbddc->local_primal_size);CHKERRQ(ierr); 32650c7d97c5SJed Brown ierr = MatSetType(pcbddc->coarse_phi_D,impMatType);CHKERRQ(ierr); 32663b03a366Sstefano_zampini ierr = MatSeqDenseSetPreallocation(pcbddc->coarse_phi_D,PETSC_NULL);CHKERRQ(ierr); 32670c7d97c5SJed Brown } 32680c7d97c5SJed Brown 3269e269702eSStefano Zampini if (dbg_flag) { 32700c7d97c5SJed Brown ierr = PetscMalloc( pcbddc->local_primal_size*sizeof(PetscScalar),&coarsefunctions_errors);CHKERRQ(ierr); 32710c7d97c5SJed Brown ierr = PetscMalloc( pcbddc->local_primal_size*sizeof(PetscScalar),&constraints_errors);CHKERRQ(ierr); 32720c7d97c5SJed Brown } 32733b03a366Sstefano_zampini /* Subdomain contribution (Non-overlapping) to coarse matrix */ 32740c7d97c5SJed Brown ierr = PetscMalloc ((pcbddc->local_primal_size)*(pcbddc->local_primal_size)*sizeof(PetscScalar),&coarse_submat_vals);CHKERRQ(ierr); 32750c7d97c5SJed Brown 32760c7d97c5SJed Brown /* We are now ready to evaluate coarse basis functions and subdomain contribution to coarse problem */ 32773b03a366Sstefano_zampini for (i=0;i<n_vertices;i++){ 32780c7d97c5SJed Brown ierr = VecSet(vec1_V,zero);CHKERRQ(ierr); 32790c7d97c5SJed Brown ierr = VecSetValue(vec1_V,i,one,INSERT_VALUES);CHKERRQ(ierr); 32800c7d97c5SJed Brown ierr = 
VecAssemblyBegin(vec1_V);CHKERRQ(ierr); 32810c7d97c5SJed Brown ierr = VecAssemblyEnd(vec1_V);CHKERRQ(ierr); 32820c7d97c5SJed Brown /* solution of saddle point problem */ 32830bdf917eSStefano Zampini ierr = MatMult(A_RV,vec1_V,pcbddc->vec1_R);CHKERRQ(ierr); 32840bdf917eSStefano Zampini ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec1_R);CHKERRQ(ierr); 32850c7d97c5SJed Brown ierr = VecScale(pcbddc->vec1_R,m_one);CHKERRQ(ierr); 32863b03a366Sstefano_zampini if (n_constraints) { 32870c7d97c5SJed Brown ierr = MatMult(pcbddc->local_auxmat1,pcbddc->vec1_R,vec1_C);CHKERRQ(ierr); 32880c7d97c5SJed Brown ierr = MatMultAdd(pcbddc->local_auxmat2,vec1_C,pcbddc->vec1_R,pcbddc->vec1_R);CHKERRQ(ierr); 32890c7d97c5SJed Brown ierr = VecScale(vec1_C,m_one);CHKERRQ(ierr); 32900c7d97c5SJed Brown } 32910c7d97c5SJed Brown ierr = MatMult(A_VR,pcbddc->vec1_R,vec2_V);CHKERRQ(ierr); 32920c7d97c5SJed Brown ierr = MatMultAdd(A_VV,vec1_V,vec2_V,vec2_V);CHKERRQ(ierr); 32930c7d97c5SJed Brown 32940c7d97c5SJed Brown /* Set values in coarse basis function and subdomain part of coarse_mat */ 32950c7d97c5SJed Brown /* coarse basis functions */ 32960c7d97c5SJed Brown ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr); 32970c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 32980c7d97c5SJed Brown ierr = VecScatterEnd (pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 32990c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr); 33003b03a366Sstefano_zampini ierr = MatSetValues(pcbddc->coarse_phi_B,n_B,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr); 33010c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr); 33020c7d97c5SJed Brown ierr = MatSetValue(pcbddc->coarse_phi_B,idx_V_B[i],i,one,INSERT_VALUES);CHKERRQ(ierr); 3303e269702eSStefano Zampini if ( pcbddc->prec_type || dbg_flag ) { 33040c7d97c5SJed Brown ierr = 
VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 33050c7d97c5SJed Brown ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 33060c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_D,&array);CHKERRQ(ierr); 33073b03a366Sstefano_zampini ierr = MatSetValues(pcbddc->coarse_phi_D,n_D,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr); 33080c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_D,&array);CHKERRQ(ierr); 33090c7d97c5SJed Brown } 33100c7d97c5SJed Brown /* subdomain contribution to coarse matrix */ 33110c7d97c5SJed Brown ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr); 3312da1bb401SStefano Zampini for (j=0;j<n_vertices;j++) { coarse_submat_vals[i*pcbddc->local_primal_size+j] = array[j]; } /* WARNING -> column major ordering */ 33130c7d97c5SJed Brown ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr); 33143b03a366Sstefano_zampini if (n_constraints) { 33150c7d97c5SJed Brown ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr); 3316da1bb401SStefano Zampini for (j=0;j<n_constraints;j++) { coarse_submat_vals[i*pcbddc->local_primal_size+j+n_vertices] = array[j]; } /* WARNING -> column major ordering */ 33170c7d97c5SJed Brown ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr); 33180c7d97c5SJed Brown } 33190c7d97c5SJed Brown 3320e269702eSStefano Zampini if ( dbg_flag ) { 33210c7d97c5SJed Brown /* assemble subdomain vector on nodes */ 3322d49ef151SStefano Zampini ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr); 33230c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 33240c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr); 33250c7d97c5SJed Brown for (j=0;j<n_R;j++) { array[idx_R_local[j]] = array2[j]; } 33263b03a366Sstefano_zampini array[ vertices[i] ] = one; 33270c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr); 33280c7d97c5SJed Brown ierr = 
VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 33290c7d97c5SJed Brown /* assemble subdomain vector of lagrange multipliers (i.e. primal nodes) */ 3330d49ef151SStefano Zampini ierr = VecSet(pcbddc->vec1_P,zero);CHKERRQ(ierr); 33310c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr); 33320c7d97c5SJed Brown ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr); 33333b03a366Sstefano_zampini for (j=0;j<n_vertices;j++) { array2[j]=array[j]; } 33340c7d97c5SJed Brown ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr); 33353b03a366Sstefano_zampini if (n_constraints) { 33360c7d97c5SJed Brown ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr); 33373b03a366Sstefano_zampini for (j=0;j<n_constraints;j++) { array2[j+n_vertices]=array[j]; } 33380c7d97c5SJed Brown ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr); 33390c7d97c5SJed Brown } 33400c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr); 33410c7d97c5SJed Brown ierr = VecScale(pcbddc->vec1_P,m_one);CHKERRQ(ierr); 33420c7d97c5SJed Brown /* check saddle point solution */ 3343534831adSStefano Zampini ierr = MatMult(pcbddc->local_mat,pcis->vec1_N,pcis->vec2_N);CHKERRQ(ierr); 33443b03a366Sstefano_zampini ierr = MatMultTransposeAdd(pcbddc->ConstraintMatrix,pcbddc->vec1_P,pcis->vec2_N,pcis->vec2_N);CHKERRQ(ierr); 33453b03a366Sstefano_zampini ierr = VecNorm(pcis->vec2_N,NORM_INFINITY,&coarsefunctions_errors[i]);CHKERRQ(ierr); 33463b03a366Sstefano_zampini ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr); 33470c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 33483b03a366Sstefano_zampini array[i]=array[i]+m_one; /* shift by the identity matrix */ 33490c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 33503b03a366Sstefano_zampini ierr = VecNorm(pcbddc->vec1_P,NORM_INFINITY,&constraints_errors[i]);CHKERRQ(ierr); 33510c7d97c5SJed Brown } 33520c7d97c5SJed Brown } 33530c7d97c5SJed Brown 
33543b03a366Sstefano_zampini for (i=0;i<n_constraints;i++){ 3355d49ef151SStefano Zampini ierr = VecSet(vec2_C,zero);CHKERRQ(ierr); 33560c7d97c5SJed Brown ierr = VecSetValue(vec2_C,i,m_one,INSERT_VALUES);CHKERRQ(ierr); 33570c7d97c5SJed Brown ierr = VecAssemblyBegin(vec2_C);CHKERRQ(ierr); 33580c7d97c5SJed Brown ierr = VecAssemblyEnd(vec2_C);CHKERRQ(ierr); 33590c7d97c5SJed Brown /* solution of saddle point problem */ 33600c7d97c5SJed Brown ierr = MatMult(M1,vec2_C,vec1_C);CHKERRQ(ierr); 33610c7d97c5SJed Brown ierr = MatMult(pcbddc->local_auxmat2,vec1_C,pcbddc->vec1_R);CHKERRQ(ierr); 33620c7d97c5SJed Brown ierr = VecScale(vec1_C,m_one);CHKERRQ(ierr); 33633b03a366Sstefano_zampini if (n_vertices) { ierr = MatMult(A_VR,pcbddc->vec1_R,vec2_V);CHKERRQ(ierr); } 33640c7d97c5SJed Brown /* Set values in coarse basis function and subdomain part of coarse_mat */ 33650c7d97c5SJed Brown /* coarse basis functions */ 33663b03a366Sstefano_zampini index=i+n_vertices; 33670c7d97c5SJed Brown ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr); 33680c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 33690c7d97c5SJed Brown ierr = VecScatterEnd (pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 33700c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr); 337153cdbc3dSStefano Zampini ierr = MatSetValues(pcbddc->coarse_phi_B,n_B,auxindices,1,&index,array,INSERT_VALUES);CHKERRQ(ierr); 33720c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr); 3373e269702eSStefano Zampini if ( pcbddc->prec_type || dbg_flag ) { 33740c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 33750c7d97c5SJed Brown ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 33760c7d97c5SJed Brown ierr = 
VecGetArray(pcis->vec1_D,&array);CHKERRQ(ierr); 337753cdbc3dSStefano Zampini ierr = MatSetValues(pcbddc->coarse_phi_D,n_D,auxindices,1,&index,array,INSERT_VALUES);CHKERRQ(ierr); 33780c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_D,&array);CHKERRQ(ierr); 33790c7d97c5SJed Brown } 33800c7d97c5SJed Brown /* subdomain contribution to coarse matrix */ 33813b03a366Sstefano_zampini if (n_vertices) { 33820c7d97c5SJed Brown ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr); 3383da1bb401SStefano Zampini for (j=0;j<n_vertices;j++) {coarse_submat_vals[index*pcbddc->local_primal_size+j]=array[j];} /* WARNING -> column major ordering */ 33840c7d97c5SJed Brown ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr); 33850c7d97c5SJed Brown } 33860c7d97c5SJed Brown ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr); 3387da1bb401SStefano Zampini for (j=0;j<n_constraints;j++) {coarse_submat_vals[index*pcbddc->local_primal_size+j+n_vertices]=array[j];} /* WARNING -> column major ordering */ 33880c7d97c5SJed Brown ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr); 33890c7d97c5SJed Brown 3390e269702eSStefano Zampini if ( dbg_flag ) { 33910c7d97c5SJed Brown /* assemble subdomain vector on nodes */ 339253cdbc3dSStefano Zampini ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr); 33930c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 33940c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr); 33950c7d97c5SJed Brown for (j=0;j<n_R;j++){ array[ idx_R_local[j] ] = array2[j]; } 33960c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr); 33970c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 33980c7d97c5SJed Brown /* assemble subdomain vector of lagrange multipliers */ 339953cdbc3dSStefano Zampini ierr = VecSet(pcbddc->vec1_P,zero);CHKERRQ(ierr); 34000c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr); 34013b03a366Sstefano_zampini if ( n_vertices) { 34020c7d97c5SJed Brown ierr = 
VecGetArray(vec2_V,&array);CHKERRQ(ierr); 34033b03a366Sstefano_zampini for (j=0;j<n_vertices;j++) {array2[j]=-array[j];} 34040c7d97c5SJed Brown ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr); 34050c7d97c5SJed Brown } 34060c7d97c5SJed Brown ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr); 34073b03a366Sstefano_zampini for (j=0;j<n_constraints;j++) {array2[j+n_vertices]=-array[j];} 34080c7d97c5SJed Brown ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr); 34090c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr); 34103972b0daSStefano Zampini /* check saddle point solution */ 3411534831adSStefano Zampini ierr = MatMult(pcbddc->local_mat,pcis->vec1_N,pcis->vec2_N);CHKERRQ(ierr); 34123b03a366Sstefano_zampini ierr = MatMultTransposeAdd(pcbddc->ConstraintMatrix,pcbddc->vec1_P,pcis->vec2_N,pcis->vec2_N);CHKERRQ(ierr); 341353cdbc3dSStefano Zampini ierr = VecNorm(pcis->vec2_N,NORM_INFINITY,&coarsefunctions_errors[index]);CHKERRQ(ierr); 34143b03a366Sstefano_zampini ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr); 34150c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 341653cdbc3dSStefano Zampini array[index]=array[index]+m_one; /* shift by the identity matrix */ 34170c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 341853cdbc3dSStefano Zampini ierr = VecNorm(pcbddc->vec1_P,NORM_INFINITY,&constraints_errors[index]);CHKERRQ(ierr); 34190c7d97c5SJed Brown } 34200c7d97c5SJed Brown } 34210c7d97c5SJed Brown ierr = MatAssemblyBegin(pcbddc->coarse_phi_B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 34220c7d97c5SJed Brown ierr = MatAssemblyEnd (pcbddc->coarse_phi_B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 3423e269702eSStefano Zampini if ( pcbddc->prec_type || dbg_flag ) { 34240c7d97c5SJed Brown ierr = MatAssemblyBegin(pcbddc->coarse_phi_D,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 34250c7d97c5SJed Brown ierr = MatAssemblyEnd (pcbddc->coarse_phi_D,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 
34260c7d97c5SJed Brown } 34270c7d97c5SJed Brown /* Checking coarse_sub_mat and coarse basis functios */ 34280c7d97c5SJed Brown /* It shuld be \Phi^{(j)^T} A^{(j)} \Phi^{(j)}=coarse_sub_mat */ 34299d2fce94SStefano Zampini if (dbg_flag) { 34300c7d97c5SJed Brown Mat coarse_sub_mat; 34310c7d97c5SJed Brown Mat TM1,TM2,TM3,TM4; 34320c7d97c5SJed Brown Mat coarse_phi_D,coarse_phi_B,A_II,A_BB,A_IB,A_BI; 343319fd82e9SBarry Smith MatType checkmattype=MATSEQAIJ; 34340c7d97c5SJed Brown PetscScalar value; 34350c7d97c5SJed Brown 3436c042a7c3SStefano Zampini ierr = MatConvert(pcis->A_II,checkmattype,MAT_INITIAL_MATRIX,&A_II);CHKERRQ(ierr); 3437c042a7c3SStefano Zampini ierr = MatConvert(pcis->A_IB,checkmattype,MAT_INITIAL_MATRIX,&A_IB);CHKERRQ(ierr); 3438c042a7c3SStefano Zampini ierr = MatConvert(pcis->A_BI,checkmattype,MAT_INITIAL_MATRIX,&A_BI);CHKERRQ(ierr); 3439c042a7c3SStefano Zampini ierr = MatConvert(pcis->A_BB,checkmattype,MAT_INITIAL_MATRIX,&A_BB);CHKERRQ(ierr); 3440c042a7c3SStefano Zampini ierr = MatConvert(pcbddc->coarse_phi_D,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_D);CHKERRQ(ierr); 3441c042a7c3SStefano Zampini ierr = MatConvert(pcbddc->coarse_phi_B,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_B);CHKERRQ(ierr); 3442c042a7c3SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_size,coarse_submat_vals,&coarse_sub_mat);CHKERRQ(ierr); 3443c042a7c3SStefano Zampini ierr = MatConvert(coarse_sub_mat,checkmattype,MAT_REUSE_MATRIX,&coarse_sub_mat);CHKERRQ(ierr); 34440c7d97c5SJed Brown 3445da1bb401SStefano Zampini /*PetscViewer view_out; 3446da1bb401SStefano Zampini PetscMPIInt myrank; 3447da1bb401SStefano Zampini char filename[256]; 3448da1bb401SStefano Zampini MPI_Comm_rank(((PetscObject)pc)->comm,&myrank); 3449da1bb401SStefano Zampini sprintf(filename,"coarsesubmat_%04d.m",myrank); 3450da1bb401SStefano Zampini ierr = PetscViewerASCIIOpen(PETSC_COMM_SELF,filename,&view_out);CHKERRQ(ierr); 3451da1bb401SStefano Zampini ierr = 
PetscViewerSetFormat(view_out,PETSC_VIEWER_ASCII_MATLAB);CHKERRQ(ierr); 3452da1bb401SStefano Zampini ierr = MatView(coarse_sub_mat,view_out);CHKERRQ(ierr); 3453da1bb401SStefano Zampini ierr = PetscViewerDestroy(&view_out);CHKERRQ(ierr);*/ 3454da1bb401SStefano Zampini 34550c7d97c5SJed Brown ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr); 34560c7d97c5SJed Brown ierr = PetscViewerASCIIPrintf(viewer,"Check coarse sub mat and local basis functions\n");CHKERRQ(ierr); 34570c7d97c5SJed Brown ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 345853cdbc3dSStefano Zampini ierr = MatPtAP(A_II,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&TM1);CHKERRQ(ierr); 345953cdbc3dSStefano Zampini ierr = MatPtAP(A_BB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&TM2);CHKERRQ(ierr); 346053cdbc3dSStefano Zampini ierr = MatMatMult(A_IB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr); 3461c042a7c3SStefano Zampini ierr = MatTransposeMatMult(coarse_phi_D,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM3);CHKERRQ(ierr); 346253cdbc3dSStefano Zampini ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr); 346353cdbc3dSStefano Zampini ierr = MatMatMult(A_BI,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr); 3464c042a7c3SStefano Zampini ierr = MatTransposeMatMult(coarse_phi_B,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM4);CHKERRQ(ierr); 346553cdbc3dSStefano Zampini ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr); 346653cdbc3dSStefano Zampini ierr = MatAXPY(TM1,one,TM2,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr); 346753cdbc3dSStefano Zampini ierr = MatAXPY(TM1,one,TM3,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr); 346853cdbc3dSStefano Zampini ierr = MatAXPY(TM1,one,TM4,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr); 346953cdbc3dSStefano Zampini ierr = MatAXPY(TM1,m_one,coarse_sub_mat,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr); 347053cdbc3dSStefano Zampini ierr = MatNorm(TM1,NORM_INFINITY,&value);CHKERRQ(ierr); 34710c7d97c5SJed Brown ierr = 
PetscViewerASCIISynchronizedPrintf(viewer,"----------------------------------\n");CHKERRQ(ierr); 34720c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d \n",PetscGlobalRank);CHKERRQ(ierr); 34730c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"matrix error = % 1.14e\n",value);CHKERRQ(ierr); 34740c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"coarse functions errors\n");CHKERRQ(ierr); 347553cdbc3dSStefano Zampini for (i=0;i<pcbddc->local_primal_size;i++) { ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local %02d-th function error = % 1.14e\n",i,coarsefunctions_errors[i]);CHKERRQ(ierr); } 34760c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"constraints errors\n");CHKERRQ(ierr); 347753cdbc3dSStefano Zampini for (i=0;i<pcbddc->local_primal_size;i++) { ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local %02d-th function error = % 1.14e\n",i,constraints_errors[i]);CHKERRQ(ierr); } 34780c7d97c5SJed Brown ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 347953cdbc3dSStefano Zampini ierr = MatDestroy(&A_II);CHKERRQ(ierr); 348053cdbc3dSStefano Zampini ierr = MatDestroy(&A_BB);CHKERRQ(ierr); 348153cdbc3dSStefano Zampini ierr = MatDestroy(&A_IB);CHKERRQ(ierr); 348253cdbc3dSStefano Zampini ierr = MatDestroy(&A_BI);CHKERRQ(ierr); 348353cdbc3dSStefano Zampini ierr = MatDestroy(&TM1);CHKERRQ(ierr); 348453cdbc3dSStefano Zampini ierr = MatDestroy(&TM2);CHKERRQ(ierr); 348553cdbc3dSStefano Zampini ierr = MatDestroy(&TM3);CHKERRQ(ierr); 348653cdbc3dSStefano Zampini ierr = MatDestroy(&TM4);CHKERRQ(ierr); 348753cdbc3dSStefano Zampini ierr = MatDestroy(&coarse_phi_D);CHKERRQ(ierr); 348853cdbc3dSStefano Zampini ierr = MatDestroy(&coarse_sub_mat);CHKERRQ(ierr); 348953cdbc3dSStefano Zampini ierr = MatDestroy(&coarse_phi_B);CHKERRQ(ierr); 34900c7d97c5SJed Brown ierr = PetscFree(coarsefunctions_errors);CHKERRQ(ierr); 34910c7d97c5SJed Brown ierr = PetscFree(constraints_errors);CHKERRQ(ierr); 
34920c7d97c5SJed Brown } 34930c7d97c5SJed Brown 34940c7d97c5SJed Brown /* create coarse matrix and data structures for message passing associated actual choice of coarse problem type */ 34950c7d97c5SJed Brown ierr = PCBDDCSetupCoarseEnvironment(pc,coarse_submat_vals);CHKERRQ(ierr); 34960c7d97c5SJed Brown /* free memory */ 34970c7d97c5SJed Brown ierr = PetscFree(coarse_submat_vals);CHKERRQ(ierr); 34980c7d97c5SJed Brown ierr = PetscFree(auxindices);CHKERRQ(ierr); 34990c7d97c5SJed Brown ierr = PetscFree(nnz);CHKERRQ(ierr); 35003b03a366Sstefano_zampini if (n_vertices) { 35010c7d97c5SJed Brown ierr = VecDestroy(&vec1_V);CHKERRQ(ierr); 35020c7d97c5SJed Brown ierr = VecDestroy(&vec2_V);CHKERRQ(ierr); 35030c7d97c5SJed Brown ierr = MatDestroy(&A_RV);CHKERRQ(ierr); 35040c7d97c5SJed Brown ierr = MatDestroy(&A_VR);CHKERRQ(ierr); 35050c7d97c5SJed Brown ierr = MatDestroy(&A_VV);CHKERRQ(ierr); 35060c7d97c5SJed Brown } 3507534831adSStefano Zampini if (n_constraints) { 35080c7d97c5SJed Brown ierr = VecDestroy(&vec1_C);CHKERRQ(ierr); 35090c7d97c5SJed Brown ierr = VecDestroy(&vec2_C);CHKERRQ(ierr); 35100c7d97c5SJed Brown ierr = MatDestroy(&M1);CHKERRQ(ierr); 35110c7d97c5SJed Brown ierr = MatDestroy(&C_CR);CHKERRQ(ierr); 35120c7d97c5SJed Brown } 35130c7d97c5SJed Brown } 35140c7d97c5SJed Brown /* free memory */ 35153b03a366Sstefano_zampini if (n_vertices) { 35160c7d97c5SJed Brown ierr = PetscFree(idx_V_B);CHKERRQ(ierr); 35170c7d97c5SJed Brown ierr = ISDestroy(&is_V_local);CHKERRQ(ierr); 35180c7d97c5SJed Brown } 35190c7d97c5SJed Brown ierr = ISDestroy(&is_R_local);CHKERRQ(ierr); 35200c7d97c5SJed Brown 35210c7d97c5SJed Brown PetscFunctionReturn(0); 35220c7d97c5SJed Brown } 35230c7d97c5SJed Brown 35240c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 35250c7d97c5SJed Brown 35260c7d97c5SJed Brown #undef __FUNCT__ 35270c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetupCoarseEnvironment" 352853cdbc3dSStefano Zampini static PetscErrorCode 
PCBDDCSetupCoarseEnvironment(PC pc,PetscScalar* coarse_submat_vals) 35290c7d97c5SJed Brown { 35300c7d97c5SJed Brown 35310c7d97c5SJed Brown 35320c7d97c5SJed Brown Mat_IS *matis = (Mat_IS*)pc->pmat->data; 35330c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 35340c7d97c5SJed Brown PC_IS *pcis = (PC_IS*)pc->data; 35350c7d97c5SJed Brown MPI_Comm prec_comm = ((PetscObject)pc)->comm; 35360c7d97c5SJed Brown MPI_Comm coarse_comm; 35370c7d97c5SJed Brown 35380c7d97c5SJed Brown /* common to all choiches */ 35390c7d97c5SJed Brown PetscScalar *temp_coarse_mat_vals; 35400c7d97c5SJed Brown PetscScalar *ins_coarse_mat_vals; 35410c7d97c5SJed Brown PetscInt *ins_local_primal_indices; 35420c7d97c5SJed Brown PetscMPIInt *localsizes2,*localdispl2; 35430c7d97c5SJed Brown PetscMPIInt size_prec_comm; 35440c7d97c5SJed Brown PetscMPIInt rank_prec_comm; 35450c7d97c5SJed Brown PetscMPIInt active_rank=MPI_PROC_NULL; 35460c7d97c5SJed Brown PetscMPIInt master_proc=0; 35470c7d97c5SJed Brown PetscInt ins_local_primal_size; 35480c7d97c5SJed Brown /* specific to MULTILEVEL_BDDC */ 35490c7d97c5SJed Brown PetscMPIInt *ranks_recv; 35500c7d97c5SJed Brown PetscMPIInt count_recv=0; 35510c7d97c5SJed Brown PetscMPIInt rank_coarse_proc_send_to; 35520c7d97c5SJed Brown PetscMPIInt coarse_color = MPI_UNDEFINED; 35530c7d97c5SJed Brown ISLocalToGlobalMapping coarse_ISLG; 35540c7d97c5SJed Brown /* some other variables */ 35550c7d97c5SJed Brown PetscErrorCode ierr; 355619fd82e9SBarry Smith MatType coarse_mat_type; 355719fd82e9SBarry Smith PCType coarse_pc_type; 355819fd82e9SBarry Smith KSPType coarse_ksp_type; 355953cdbc3dSStefano Zampini PC pc_temp; 35604fad6a16SStefano Zampini PetscInt i,j,k; 35613b03a366Sstefano_zampini PetscInt max_it_coarse_ksp=1; /* don't increase this value */ 3562e269702eSStefano Zampini /* verbose output viewer */ 3563e269702eSStefano Zampini PetscViewer viewer=pcbddc->dbg_viewer; 3564e269702eSStefano Zampini PetscBool dbg_flag=pcbddc->dbg_flag; 3565142dfd88SStefano Zampini 
3566ea7e1babSStefano Zampini PetscInt offset,offset2; 3567142dfd88SStefano Zampini PetscMPIInt im_active=0; 3568523858cfSStefano Zampini PetscInt *dnz,*onz; 3569142dfd88SStefano Zampini 3570142dfd88SStefano Zampini PetscBool setsym,issym=PETSC_FALSE; 35710c7d97c5SJed Brown 35720c7d97c5SJed Brown PetscFunctionBegin; 35730c7d97c5SJed Brown ins_local_primal_indices = 0; 35740c7d97c5SJed Brown ins_coarse_mat_vals = 0; 35750c7d97c5SJed Brown localsizes2 = 0; 35760c7d97c5SJed Brown localdispl2 = 0; 35770c7d97c5SJed Brown temp_coarse_mat_vals = 0; 35780c7d97c5SJed Brown coarse_ISLG = 0; 35790c7d97c5SJed Brown 358053cdbc3dSStefano Zampini ierr = MPI_Comm_size(prec_comm,&size_prec_comm);CHKERRQ(ierr); 358153cdbc3dSStefano Zampini ierr = MPI_Comm_rank(prec_comm,&rank_prec_comm);CHKERRQ(ierr); 3582142dfd88SStefano Zampini ierr = MatIsSymmetricKnown(pc->pmat,&setsym,&issym);CHKERRQ(ierr); 3583142dfd88SStefano Zampini 3584beed3852SStefano Zampini /* Assign global numbering to coarse dofs */ 3585beed3852SStefano Zampini { 3586*ef028eecSStefano Zampini PetscInt *auxlocal_primal; 3587da1bb401SStefano Zampini PetscInt *row_cmat_indices; 35882e8d2280SStefano Zampini PetscInt *aux_ordering; 35892e8d2280SStefano Zampini PetscInt *row_cmat_global_indices; 3590*ef028eecSStefano Zampini PetscInt *dof_sizes,*dof_displs; 35913b03a366Sstefano_zampini PetscInt size_of_constraint; 35922e8d2280SStefano Zampini PetscBool *array_bool; 3593*ef028eecSStefano Zampini PetscBool first_found; 3594*ef028eecSStefano Zampini PetscInt first_index,old_index,s; 3595*ef028eecSStefano Zampini PetscMPIInt mpi_local_primal_size; 3596*ef028eecSStefano Zampini PetscScalar coarsesum,*array; 3597*ef028eecSStefano Zampini 3598*ef028eecSStefano Zampini mpi_local_primal_size = (PetscMPIInt)pcbddc->local_primal_size; 3599beed3852SStefano Zampini 3600beed3852SStefano Zampini /* Construct needed data structures for message passing */ 3601*ef028eecSStefano Zampini ierr = 
PetscMalloc(pcbddc->local_primal_size*sizeof(PetscInt),&pcbddc->local_primal_indices);CHKERRQ(ierr); 3602ffe5efe1SStefano Zampini j = 0; 3603142dfd88SStefano Zampini if (rank_prec_comm == 0 || pcbddc->coarse_problem_type == REPLICATED_BDDC || pcbddc->coarse_problem_type == MULTILEVEL_BDDC) { 3604ffe5efe1SStefano Zampini j = size_prec_comm; 3605ffe5efe1SStefano Zampini } 3606ffe5efe1SStefano Zampini ierr = PetscMalloc(j*sizeof(PetscMPIInt),&pcbddc->local_primal_sizes);CHKERRQ(ierr); 3607ffe5efe1SStefano Zampini ierr = PetscMalloc(j*sizeof(PetscMPIInt),&pcbddc->local_primal_displacements);CHKERRQ(ierr); 3608beed3852SStefano Zampini /* Gather local_primal_size information for all processes */ 3609142dfd88SStefano Zampini if (pcbddc->coarse_problem_type == REPLICATED_BDDC || pcbddc->coarse_problem_type == MULTILEVEL_BDDC) { 36105619798eSStefano Zampini ierr = MPI_Allgather(&mpi_local_primal_size,1,MPIU_INT,&pcbddc->local_primal_sizes[0],1,MPIU_INT,prec_comm);CHKERRQ(ierr); 3611ffe5efe1SStefano Zampini } else { 3612ffe5efe1SStefano Zampini ierr = MPI_Gather(&mpi_local_primal_size,1,MPIU_INT,&pcbddc->local_primal_sizes[0],1,MPIU_INT,0,prec_comm);CHKERRQ(ierr); 3613ffe5efe1SStefano Zampini } 3614beed3852SStefano Zampini pcbddc->replicated_primal_size = 0; 3615ffe5efe1SStefano Zampini for (i=0; i<j; i++) { 3616beed3852SStefano Zampini pcbddc->local_primal_displacements[i] = pcbddc->replicated_primal_size ; 3617beed3852SStefano Zampini pcbddc->replicated_primal_size += pcbddc->local_primal_sizes[i]; 3618beed3852SStefano Zampini } 3619beed3852SStefano Zampini 3620da1bb401SStefano Zampini /* First let's count coarse dofs. 
3621beed3852SStefano Zampini This code fragment assumes that the number of local constraints per connected component 3622beed3852SStefano Zampini is not greater than the number of nodes defined for the connected component 3623beed3852SStefano Zampini (otherwise we will surely have linear dependence between constraints and thus a singular coarse problem) */ 3624*ef028eecSStefano Zampini ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscInt),&auxlocal_primal);CHKERRQ(ierr); 36252e8d2280SStefano Zampini j = 0; 36262e8d2280SStefano Zampini for (i=0;i<pcbddc->local_primal_size;i++) { 36272e8d2280SStefano Zampini ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr); 36282e8d2280SStefano Zampini if ( j < size_of_constraint ) { 36292e8d2280SStefano Zampini j = size_of_constraint; 36302e8d2280SStefano Zampini } 36312e8d2280SStefano Zampini ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr); 36322e8d2280SStefano Zampini } 36332e8d2280SStefano Zampini ierr = PetscMalloc(j*sizeof(PetscInt),&aux_ordering);CHKERRQ(ierr); 36342e8d2280SStefano Zampini ierr = PetscMalloc(j*sizeof(PetscInt),&row_cmat_global_indices);CHKERRQ(ierr); 36352e8d2280SStefano Zampini ierr = PetscMalloc(pcis->n*sizeof(PetscBool),&array_bool);CHKERRQ(ierr); 36362e8d2280SStefano Zampini for (i=0;i<pcis->n;i++) { 36372e8d2280SStefano Zampini array_bool[i] = PETSC_FALSE; 36382e8d2280SStefano Zampini } 3639da1bb401SStefano Zampini for (i=0;i<pcbddc->local_primal_size;i++) { 3640da1bb401SStefano Zampini ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr); 36413b03a366Sstefano_zampini for (j=0; j<size_of_constraint; j++) { 36422e8d2280SStefano Zampini aux_ordering[j] = j; 36432e8d2280SStefano Zampini } 36442e8d2280SStefano Zampini ierr = 
ISLocalToGlobalMappingApply(matis->mapping,size_of_constraint,row_cmat_indices,row_cmat_global_indices);CHKERRQ(ierr); 36452e8d2280SStefano Zampini ierr = PetscSortIntWithPermutation(size_of_constraint,row_cmat_global_indices,aux_ordering);CHKERRQ(ierr); 36462e8d2280SStefano Zampini for (j=0; j<size_of_constraint; j++) { 36472e8d2280SStefano Zampini k = row_cmat_indices[aux_ordering[j]]; 36482e8d2280SStefano Zampini if ( !array_bool[k] ) { 36492e8d2280SStefano Zampini array_bool[k] = PETSC_TRUE; 3650da1bb401SStefano Zampini auxlocal_primal[i] = k; 3651beed3852SStefano Zampini break; 3652beed3852SStefano Zampini } 3653beed3852SStefano Zampini } 3654da1bb401SStefano Zampini ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr); 3655beed3852SStefano Zampini } 36562e8d2280SStefano Zampini ierr = PetscFree(aux_ordering);CHKERRQ(ierr); 3657*ef028eecSStefano Zampini ierr = PetscFree(array_bool);CHKERRQ(ierr); 3658*ef028eecSStefano Zampini ierr = PetscFree(row_cmat_global_indices);CHKERRQ(ierr); 36592e8d2280SStefano Zampini 3660*ef028eecSStefano Zampini /* Compute number of coarse dofs */ 3661*ef028eecSStefano Zampini ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr); 3662*ef028eecSStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 3663*ef028eecSStefano Zampini for (i=0;i<pcbddc->local_primal_size;i++) { 3664*ef028eecSStefano Zampini array[auxlocal_primal[i]]=1.0; 3665*ef028eecSStefano Zampini } 3666*ef028eecSStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 3667*ef028eecSStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 3668*ef028eecSStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 3669*ef028eecSStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 3670*ef028eecSStefano Zampini ierr = 
VecSum(pcis->vec1_global,&coarsesum);CHKERRQ(ierr); 3671*ef028eecSStefano Zampini pcbddc->coarse_size = (PetscInt)coarsesum; 3672*ef028eecSStefano Zampini 3673*ef028eecSStefano Zampini /* Fill pcis->vec1_global with cumulative function for global numbering */ 3674*ef028eecSStefano Zampini ierr = VecGetArray(pcis->vec1_global,&array);CHKERRQ(ierr); 3675*ef028eecSStefano Zampini ierr = VecGetLocalSize(pcis->vec1_global,&s);CHKERRQ(ierr); 3676*ef028eecSStefano Zampini k = 0; 3677*ef028eecSStefano Zampini first_index = -1; 3678*ef028eecSStefano Zampini first_found = PETSC_FALSE; 3679*ef028eecSStefano Zampini for (i=0;i<s;i++) { 3680*ef028eecSStefano Zampini if (!first_found && array[i] > 0.0) { 3681*ef028eecSStefano Zampini first_found = PETSC_TRUE; 3682*ef028eecSStefano Zampini first_index = i; 3683*ef028eecSStefano Zampini } 3684*ef028eecSStefano Zampini k += (PetscInt)array[i]; 3685*ef028eecSStefano Zampini } 3686*ef028eecSStefano Zampini j = ( !rank_prec_comm ? size_prec_comm : 0); 3687*ef028eecSStefano Zampini ierr = PetscMalloc(j*sizeof(*dof_sizes),&dof_sizes);CHKERRQ(ierr); 3688*ef028eecSStefano Zampini ierr = PetscMalloc(j*sizeof(*dof_displs),&dof_displs);CHKERRQ(ierr); 3689*ef028eecSStefano Zampini ierr = MPI_Gather(&k,1,MPIU_INT,dof_sizes,1,MPIU_INT,0,prec_comm);CHKERRQ(ierr); 3690*ef028eecSStefano Zampini if (!rank_prec_comm) { 3691*ef028eecSStefano Zampini dof_displs[0]=0; 3692*ef028eecSStefano Zampini for (i=1;i<size_prec_comm;i++) { 3693*ef028eecSStefano Zampini dof_displs[i] = dof_displs[i-1]+dof_sizes[i-1]; 3694*ef028eecSStefano Zampini } 3695*ef028eecSStefano Zampini } 3696*ef028eecSStefano Zampini ierr = MPI_Scatter(dof_displs,1,MPIU_INT,&k,1,MPIU_INT,0,prec_comm);CHKERRQ(ierr); 3697*ef028eecSStefano Zampini if (first_found) { 3698*ef028eecSStefano Zampini array[first_index] += k; 3699*ef028eecSStefano Zampini old_index = first_index; 3700*ef028eecSStefano Zampini for (i=first_index+1;i<s;i++) { 3701*ef028eecSStefano Zampini if (array[i] > 0.0) { 
3702*ef028eecSStefano Zampini array[i] += array[old_index]; 3703*ef028eecSStefano Zampini old_index = i; 3704*ef028eecSStefano Zampini } 3705*ef028eecSStefano Zampini } 3706*ef028eecSStefano Zampini } 3707*ef028eecSStefano Zampini ierr = VecRestoreArray(pcis->vec1_global,&array);CHKERRQ(ierr); 3708*ef028eecSStefano Zampini ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr); 3709*ef028eecSStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 3710*ef028eecSStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 3711*ef028eecSStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 3712*ef028eecSStefano Zampini for (i=0;i<pcbddc->local_primal_size;i++) { 3713*ef028eecSStefano Zampini pcbddc->local_primal_indices[i] = (PetscInt)array[auxlocal_primal[i]]-1; 3714*ef028eecSStefano Zampini } 3715*ef028eecSStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 3716*ef028eecSStefano Zampini ierr = PetscFree(dof_displs);CHKERRQ(ierr); 3717*ef028eecSStefano Zampini ierr = PetscFree(dof_sizes);CHKERRQ(ierr); 3718*ef028eecSStefano Zampini 3719*ef028eecSStefano Zampini if (dbg_flag) { 37202e8d2280SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 37212e8d2280SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr); 37222e8d2280SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Check coarse indices\n");CHKERRQ(ierr); 37232e8d2280SStefano Zampini ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr); 37242e8d2280SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 3725*ef028eecSStefano Zampini for (i=0;i<pcbddc->local_primal_size;i++) { 3726*ef028eecSStefano Zampini array[auxlocal_primal[i]]=1.0; 37272e8d2280SStefano Zampini } 3728beed3852SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 
37292e8d2280SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 3730da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 3731da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 3732da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 3733da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 3734da1bb401SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 37352e8d2280SStefano Zampini for (i=0;i<pcis->n;i++) { 37362e8d2280SStefano Zampini if (array[i] == 1.0) { 37372e8d2280SStefano Zampini ierr = ISLocalToGlobalMappingApply(matis->mapping,1,&i,&j);CHKERRQ(ierr); 37382e8d2280SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d: WRONG COARSE INDEX %d (local %d)\n",PetscGlobalRank,j,i);CHKERRQ(ierr); 37392e8d2280SStefano Zampini } 37402e8d2280SStefano Zampini } 37412e8d2280SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 37422e8d2280SStefano Zampini for (i=0;i<pcis->n;i++) { 37432e8d2280SStefano Zampini if( array[i] > 0.0) { 37442e8d2280SStefano Zampini array[i] = 1.0/array[i]; 37452e8d2280SStefano Zampini } 37462e8d2280SStefano Zampini } 3747da1bb401SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 37482e8d2280SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 3749da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 3750da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 3751da1bb401SStefano Zampini ierr = VecSum(pcis->vec1_global,&coarsesum);CHKERRQ(ierr); 
37522e8d2280SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Size of coarse problem SHOULD be %lf\n",coarsesum);CHKERRQ(ierr); 37532e8d2280SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 37542e8d2280SStefano Zampini } 3755142dfd88SStefano Zampini ierr = PetscFree(auxlocal_primal);CHKERRQ(ierr); 37560bdf917eSStefano Zampini } 37570bdf917eSStefano Zampini 37582e8d2280SStefano Zampini if (dbg_flag) { 37597cf533a6SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Size of coarse problem is %d\n",pcbddc->coarse_size);CHKERRQ(ierr); 37602e8d2280SStefano Zampini /*ierr = PetscViewerASCIIPrintf(viewer,"Distribution of local primal indices\n");CHKERRQ(ierr); 37612e8d2280SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 37622e8d2280SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d\n",PetscGlobalRank);CHKERRQ(ierr); 37632e8d2280SStefano Zampini for (i=0;i<pcbddc->local_primal_size;i++) { 37642e8d2280SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local_primal_indices[%d]=%d \n",i,pcbddc->local_primal_indices[i]); 37652e8d2280SStefano Zampini }*/ 37662e8d2280SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 37672e8d2280SStefano Zampini } 37682e8d2280SStefano Zampini 37690bdf917eSStefano Zampini if (pcis->n) { im_active = 1; } 37700bdf917eSStefano Zampini ierr = MPI_Allreduce(&im_active,&pcbddc->active_procs,1,MPIU_INT,MPI_SUM,prec_comm);CHKERRQ(ierr); 37710bdf917eSStefano Zampini 37720bdf917eSStefano Zampini /* adapt coarse problem type */ 37734fad6a16SStefano Zampini if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) { 37744fad6a16SStefano Zampini if (pcbddc->current_level < pcbddc->max_levels) { 37754fad6a16SStefano Zampini if ( (pcbddc->active_procs/pcbddc->coarsening_ratio) < 2 ) { 37760bdf917eSStefano Zampini if (dbg_flag) { 37774fad6a16SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Not enough active processes on level %d (active %d,ratio %d). 
Parallel direct solve for coarse problem\n",pcbddc->current_level,pcbddc->active_procs,pcbddc->coarsening_ratio);CHKERRQ(ierr); 37780bdf917eSStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 37790bdf917eSStefano Zampini } 37800bdf917eSStefano Zampini pcbddc->coarse_problem_type = PARALLEL_BDDC; 3781142dfd88SStefano Zampini } 37824fad6a16SStefano Zampini } else { 37834fad6a16SStefano Zampini if (dbg_flag) { 37844fad6a16SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Max number of levels reached. Using parallel direct solve for coarse problem\n",pcbddc->max_levels,pcbddc->active_procs,pcbddc->coarsening_ratio);CHKERRQ(ierr); 37854fad6a16SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 37864fad6a16SStefano Zampini } 37874fad6a16SStefano Zampini pcbddc->coarse_problem_type = PARALLEL_BDDC; 37884fad6a16SStefano Zampini } 37894fad6a16SStefano Zampini } 3790beed3852SStefano Zampini 37910c7d97c5SJed Brown switch(pcbddc->coarse_problem_type){ 37920c7d97c5SJed Brown 3793da1bb401SStefano Zampini case(MULTILEVEL_BDDC): /* we define a coarse mesh where subdomains are elements */ 37940c7d97c5SJed Brown { 37950c7d97c5SJed Brown /* we need additional variables */ 37960c7d97c5SJed Brown MetisInt n_subdomains,n_parts,objval,ncon,faces_nvtxs; 37970c7d97c5SJed Brown MetisInt *metis_coarse_subdivision; 37980c7d97c5SJed Brown MetisInt options[METIS_NOPTIONS]; 37990c7d97c5SJed Brown PetscMPIInt size_coarse_comm,rank_coarse_comm; 38000c7d97c5SJed Brown PetscMPIInt procs_jumps_coarse_comm; 38010c7d97c5SJed Brown PetscMPIInt *coarse_subdivision; 38020c7d97c5SJed Brown PetscMPIInt *total_count_recv; 38030c7d97c5SJed Brown PetscMPIInt *total_ranks_recv; 38040c7d97c5SJed Brown PetscMPIInt *displacements_recv; 38050c7d97c5SJed Brown PetscMPIInt *my_faces_connectivity; 38060c7d97c5SJed Brown PetscMPIInt *petsc_faces_adjncy; 38070c7d97c5SJed Brown MetisInt *faces_adjncy; 38080c7d97c5SJed Brown MetisInt *faces_xadj; 38090c7d97c5SJed Brown PetscMPIInt 
*number_of_faces; 38100c7d97c5SJed Brown PetscMPIInt *faces_displacements; 38110c7d97c5SJed Brown PetscInt *array_int; 38120c7d97c5SJed Brown PetscMPIInt my_faces=0; 38130c7d97c5SJed Brown PetscMPIInt total_faces=0; 38143828260eSStefano Zampini PetscInt ranks_stretching_ratio; 38150c7d97c5SJed Brown 38160c7d97c5SJed Brown /* define some quantities */ 38170c7d97c5SJed Brown pcbddc->coarse_communications_type = SCATTERS_BDDC; 38180c7d97c5SJed Brown coarse_mat_type = MATIS; 38190c7d97c5SJed Brown coarse_pc_type = PCBDDC; 3820142dfd88SStefano Zampini coarse_ksp_type = KSPRICHARDSON; 38210c7d97c5SJed Brown 38220c7d97c5SJed Brown /* details of coarse decomposition */ 38230c7d97c5SJed Brown n_subdomains = pcbddc->active_procs; 38240c7d97c5SJed Brown n_parts = n_subdomains/pcbddc->coarsening_ratio; 38253828260eSStefano Zampini ranks_stretching_ratio = size_prec_comm/pcbddc->active_procs; 38263828260eSStefano Zampini procs_jumps_coarse_comm = pcbddc->coarsening_ratio*ranks_stretching_ratio; 38273828260eSStefano Zampini 38284fad6a16SStefano Zampini /* build CSR graph of subdomains' connectivity */ 38290c7d97c5SJed Brown ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&array_int);CHKERRQ(ierr); 38303828260eSStefano Zampini ierr = PetscMemzero(array_int,pcis->n*sizeof(PetscInt));CHKERRQ(ierr); 38310c7d97c5SJed Brown for (i=1;i<pcis->n_neigh;i++){/* i=1 so I don't count myself -> faces nodes counts to 1 */ 38320c7d97c5SJed Brown for (j=0;j<pcis->n_shared[i];j++){ 38330c7d97c5SJed Brown array_int[ pcis->shared[i][j] ]+=1; 38340c7d97c5SJed Brown } 38350c7d97c5SJed Brown } 38360c7d97c5SJed Brown for (i=1;i<pcis->n_neigh;i++){ 38370c7d97c5SJed Brown for (j=0;j<pcis->n_shared[i];j++){ 38387cf533a6SStefano Zampini if (array_int[ pcis->shared[i][j] ] > 0 ){ 38390c7d97c5SJed Brown my_faces++; 38400c7d97c5SJed Brown break; 38410c7d97c5SJed Brown } 38420c7d97c5SJed Brown } 38430c7d97c5SJed Brown } 38440c7d97c5SJed Brown 384553cdbc3dSStefano Zampini ierr = 
MPI_Reduce(&my_faces,&total_faces,1,MPIU_INT,MPI_SUM,master_proc,prec_comm);CHKERRQ(ierr); 38460c7d97c5SJed Brown ierr = PetscMalloc (my_faces*sizeof(PetscInt),&my_faces_connectivity);CHKERRQ(ierr); 38470c7d97c5SJed Brown my_faces=0; 38480c7d97c5SJed Brown for (i=1;i<pcis->n_neigh;i++){ 38490c7d97c5SJed Brown for (j=0;j<pcis->n_shared[i];j++){ 38507cf533a6SStefano Zampini if (array_int[ pcis->shared[i][j] ] > 0 ){ 38510c7d97c5SJed Brown my_faces_connectivity[my_faces]=pcis->neigh[i]; 38520c7d97c5SJed Brown my_faces++; 38530c7d97c5SJed Brown break; 38540c7d97c5SJed Brown } 38550c7d97c5SJed Brown } 38560c7d97c5SJed Brown } 38570c7d97c5SJed Brown if (rank_prec_comm == master_proc) { 38580c7d97c5SJed Brown ierr = PetscMalloc (total_faces*sizeof(PetscMPIInt),&petsc_faces_adjncy);CHKERRQ(ierr); 38590c7d97c5SJed Brown ierr = PetscMalloc (size_prec_comm*sizeof(PetscMPIInt),&number_of_faces);CHKERRQ(ierr); 38600c7d97c5SJed Brown ierr = PetscMalloc (total_faces*sizeof(MetisInt),&faces_adjncy);CHKERRQ(ierr); 38610c7d97c5SJed Brown ierr = PetscMalloc ((n_subdomains+1)*sizeof(MetisInt),&faces_xadj);CHKERRQ(ierr); 38620c7d97c5SJed Brown ierr = PetscMalloc ((size_prec_comm+1)*sizeof(PetscMPIInt),&faces_displacements);CHKERRQ(ierr); 38630c7d97c5SJed Brown } 386453cdbc3dSStefano Zampini ierr = MPI_Gather(&my_faces,1,MPIU_INT,&number_of_faces[0],1,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr); 38650c7d97c5SJed Brown if (rank_prec_comm == master_proc) { 38660c7d97c5SJed Brown faces_xadj[0]=0; 38670c7d97c5SJed Brown faces_displacements[0]=0; 38680c7d97c5SJed Brown j=0; 38690c7d97c5SJed Brown for (i=1;i<size_prec_comm+1;i++) { 38700c7d97c5SJed Brown faces_displacements[i]=faces_displacements[i-1]+number_of_faces[i-1]; 38710c7d97c5SJed Brown if (number_of_faces[i-1]) { 38720c7d97c5SJed Brown j++; 38730c7d97c5SJed Brown faces_xadj[j]=faces_xadj[j-1]+number_of_faces[i-1]; 38740c7d97c5SJed Brown } 38750c7d97c5SJed Brown } 38760c7d97c5SJed Brown } 387753cdbc3dSStefano Zampini ierr = 
MPI_Gatherv(&my_faces_connectivity[0],my_faces,MPIU_INT,&petsc_faces_adjncy[0],number_of_faces,faces_displacements,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr); 38780c7d97c5SJed Brown ierr = PetscFree(my_faces_connectivity);CHKERRQ(ierr); 38790c7d97c5SJed Brown ierr = PetscFree(array_int);CHKERRQ(ierr); 38800c7d97c5SJed Brown if (rank_prec_comm == master_proc) { 38813828260eSStefano Zampini for (i=0;i<total_faces;i++) faces_adjncy[i]=(MetisInt)(petsc_faces_adjncy[i]/ranks_stretching_ratio); /* cast to MetisInt */ 3882da1bb401SStefano Zampini /*printf("This is the face connectivity (actual ranks)\n"); 38830c7d97c5SJed Brown for (i=0;i<n_subdomains;i++){ 38840c7d97c5SJed Brown printf("proc %d is connected with \n",i); 38850c7d97c5SJed Brown for (j=faces_xadj[i];j<faces_xadj[i+1];j++) 38860c7d97c5SJed Brown printf("%d ",faces_adjncy[j]); 38870c7d97c5SJed Brown printf("\n"); 3888da1bb401SStefano Zampini }*/ 38890c7d97c5SJed Brown ierr = PetscFree(faces_displacements);CHKERRQ(ierr); 38900c7d97c5SJed Brown ierr = PetscFree(number_of_faces);CHKERRQ(ierr); 38910c7d97c5SJed Brown ierr = PetscFree(petsc_faces_adjncy);CHKERRQ(ierr); 38920c7d97c5SJed Brown } 38930c7d97c5SJed Brown 38940c7d97c5SJed Brown if ( rank_prec_comm == master_proc ) { 38950c7d97c5SJed Brown 38963828260eSStefano Zampini PetscInt heuristic_for_metis=3; 38973828260eSStefano Zampini 38980c7d97c5SJed Brown ncon=1; 38990c7d97c5SJed Brown faces_nvtxs=n_subdomains; 39000c7d97c5SJed Brown /* partition graoh induced by face connectivity */ 39010c7d97c5SJed Brown ierr = PetscMalloc (n_subdomains*sizeof(MetisInt),&metis_coarse_subdivision);CHKERRQ(ierr); 39020c7d97c5SJed Brown ierr = METIS_SetDefaultOptions(options); 39030c7d97c5SJed Brown /* we need a contiguous partition of the coarse mesh */ 39040c7d97c5SJed Brown options[METIS_OPTION_CONTIG]=1; 39050c7d97c5SJed Brown options[METIS_OPTION_NITER]=30; 39064fad6a16SStefano Zampini if (pcbddc->coarsening_ratio > 1) { 39073828260eSStefano Zampini if 
(n_subdomains>n_parts*heuristic_for_metis) { 39083828260eSStefano Zampini options[METIS_OPTION_IPTYPE]=METIS_IPTYPE_EDGE; 39093828260eSStefano Zampini options[METIS_OPTION_OBJTYPE]=METIS_OBJTYPE_CUT; 39100c7d97c5SJed Brown ierr = METIS_PartGraphKway(&faces_nvtxs,&ncon,faces_xadj,faces_adjncy,NULL,NULL,NULL,&n_parts,NULL,NULL,options,&objval,metis_coarse_subdivision); 3911142dfd88SStefano Zampini if (ierr != METIS_OK) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in METIS_PartGraphKway (metis error code %D) called from PCBDDCSetupCoarseEnvironment\n",ierr); 39123828260eSStefano Zampini } else { 39133828260eSStefano Zampini ierr = METIS_PartGraphRecursive(&faces_nvtxs,&ncon,faces_xadj,faces_adjncy,NULL,NULL,NULL,&n_parts,NULL,NULL,options,&objval,metis_coarse_subdivision); 3914142dfd88SStefano Zampini if (ierr != METIS_OK) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in METIS_PartGraphRecursive (metis error code %D) called from PCBDDCSetupCoarseEnvironment\n",ierr); 39153828260eSStefano Zampini } 39164fad6a16SStefano Zampini } else { 39174fad6a16SStefano Zampini for (i=0;i<n_subdomains;i++) { 39184fad6a16SStefano Zampini metis_coarse_subdivision[i]=i; 39194fad6a16SStefano Zampini } 39204fad6a16SStefano Zampini } 39210c7d97c5SJed Brown ierr = PetscFree(faces_xadj);CHKERRQ(ierr); 39220c7d97c5SJed Brown ierr = PetscFree(faces_adjncy);CHKERRQ(ierr); 39230bdf917eSStefano Zampini ierr = PetscMalloc(size_prec_comm*sizeof(PetscMPIInt),&coarse_subdivision);CHKERRQ(ierr); 39240c7d97c5SJed Brown /* copy/cast values avoiding possible type conflicts between PETSc, MPI and METIS */ 39250bdf917eSStefano Zampini for (i=0;i<size_prec_comm;i++) { coarse_subdivision[i]=MPI_PROC_NULL; } 39260bdf917eSStefano Zampini for (i=0;i<n_subdomains;i++) { coarse_subdivision[ranks_stretching_ratio*i]=(PetscInt)(metis_coarse_subdivision[i]); } 39270c7d97c5SJed Brown ierr = PetscFree(metis_coarse_subdivision);CHKERRQ(ierr); 39280c7d97c5SJed Brown } 39290c7d97c5SJed Brown 39300c7d97c5SJed Brown /* 
Create new communicator for coarse problem splitting the old one */ 39310c7d97c5SJed Brown if ( !(rank_prec_comm%procs_jumps_coarse_comm) && rank_prec_comm < procs_jumps_coarse_comm*n_parts ){ 3932da1bb401SStefano Zampini coarse_color=0; /* for communicator splitting */ 3933da1bb401SStefano Zampini active_rank=rank_prec_comm; /* for insertion of matrix values */ 39340c7d97c5SJed Brown } 3935da1bb401SStefano Zampini /* procs with coarse_color = MPI_UNDEFINED will have coarse_comm = MPI_COMM_NULL (from mpi standards) 3936da1bb401SStefano Zampini key = rank_prec_comm -> keep same ordering of ranks from the old to the new communicator */ 393753cdbc3dSStefano Zampini ierr = MPI_Comm_split(prec_comm,coarse_color,rank_prec_comm,&coarse_comm);CHKERRQ(ierr); 39380c7d97c5SJed Brown 39390c7d97c5SJed Brown if ( coarse_color == 0 ) { 394053cdbc3dSStefano Zampini ierr = MPI_Comm_size(coarse_comm,&size_coarse_comm);CHKERRQ(ierr); 394153cdbc3dSStefano Zampini ierr = MPI_Comm_rank(coarse_comm,&rank_coarse_comm);CHKERRQ(ierr); 39420c7d97c5SJed Brown } else { 39430c7d97c5SJed Brown rank_coarse_comm = MPI_PROC_NULL; 39440c7d97c5SJed Brown } 39450c7d97c5SJed Brown 39467cf533a6SStefano Zampini /* master proc take care of arranging and distributing coarse information */ 39470c7d97c5SJed Brown if (rank_coarse_comm == master_proc) { 39480c7d97c5SJed Brown ierr = PetscMalloc (size_coarse_comm*sizeof(PetscMPIInt),&displacements_recv);CHKERRQ(ierr); 39490bdf917eSStefano Zampini ierr = PetscMalloc (size_coarse_comm*sizeof(PetscMPIInt),&total_count_recv);CHKERRQ(ierr); 39500bdf917eSStefano Zampini ierr = PetscMalloc (n_subdomains*sizeof(PetscMPIInt),&total_ranks_recv);CHKERRQ(ierr); 39510c7d97c5SJed Brown /* some initializations */ 39520c7d97c5SJed Brown displacements_recv[0]=0; 39530bdf917eSStefano Zampini ierr = PetscMemzero(total_count_recv,size_coarse_comm*sizeof(PetscMPIInt));CHKERRQ(ierr); 39540c7d97c5SJed Brown /* count from how many processes the j-th process of the coarse decomposition 
will receive data */ 39550bdf917eSStefano Zampini for (j=0;j<size_coarse_comm;j++) { 39560bdf917eSStefano Zampini for (i=0;i<size_prec_comm;i++) { 39570bdf917eSStefano Zampini if (coarse_subdivision[i]==j) { 39580c7d97c5SJed Brown total_count_recv[j]++; 39590bdf917eSStefano Zampini } 39600bdf917eSStefano Zampini } 39610bdf917eSStefano Zampini } 39620c7d97c5SJed Brown /* displacements needed for scatterv of total_ranks_recv */ 39630bdf917eSStefano Zampini for (i=1;i<size_coarse_comm;i++) { displacements_recv[i]=displacements_recv[i-1]+total_count_recv[i-1]; } 39640c7d97c5SJed Brown /* Now fill properly total_ranks_recv -> each coarse process will receive the ranks (in prec_comm communicator) of its friend (sending) processes */ 39650c7d97c5SJed Brown ierr = PetscMemzero(total_count_recv,size_coarse_comm*sizeof(PetscMPIInt));CHKERRQ(ierr); 39660c7d97c5SJed Brown for (j=0;j<size_coarse_comm;j++) { 39673828260eSStefano Zampini for (i=0;i<size_prec_comm;i++) { 39680c7d97c5SJed Brown if (coarse_subdivision[i]==j) { 39690c7d97c5SJed Brown total_ranks_recv[displacements_recv[j]+total_count_recv[j]]=i; 39703828260eSStefano Zampini total_count_recv[j]+=1; 39710c7d97c5SJed Brown } 39720c7d97c5SJed Brown } 39730c7d97c5SJed Brown } 3974da1bb401SStefano Zampini /*for (j=0;j<size_coarse_comm;j++) { 39753828260eSStefano Zampini printf("process %d in new rank will receive from %d processes (original ranks follows)\n",j,total_count_recv[j]); 39763828260eSStefano Zampini for (i=0;i<total_count_recv[j];i++) { 39773828260eSStefano Zampini printf("%d ",total_ranks_recv[displacements_recv[j]+i]); 39783828260eSStefano Zampini } 39793828260eSStefano Zampini printf("\n"); 3980da1bb401SStefano Zampini }*/ 39810c7d97c5SJed Brown 39820c7d97c5SJed Brown /* identify new decomposition in terms of ranks in the old communicator */ 39830bdf917eSStefano Zampini for (i=0;i<n_subdomains;i++) { 39840bdf917eSStefano Zampini 
coarse_subdivision[ranks_stretching_ratio*i]=coarse_subdivision[ranks_stretching_ratio*i]*procs_jumps_coarse_comm; 39850bdf917eSStefano Zampini } 3986da1bb401SStefano Zampini /*printf("coarse_subdivision in old end new ranks\n"); 39870c7d97c5SJed Brown for (i=0;i<size_prec_comm;i++) 39883828260eSStefano Zampini if (coarse_subdivision[i]!=MPI_PROC_NULL) { 39893828260eSStefano Zampini printf("%d=(%d %d), ",i,coarse_subdivision[i],coarse_subdivision[i]/procs_jumps_coarse_comm); 39903828260eSStefano Zampini } else { 39913828260eSStefano Zampini printf("%d=(%d %d), ",i,coarse_subdivision[i],coarse_subdivision[i]); 39923828260eSStefano Zampini } 3993da1bb401SStefano Zampini printf("\n");*/ 39940c7d97c5SJed Brown } 39950c7d97c5SJed Brown 39960c7d97c5SJed Brown /* Scatter new decomposition for send details */ 399753cdbc3dSStefano Zampini ierr = MPI_Scatter(&coarse_subdivision[0],1,MPIU_INT,&rank_coarse_proc_send_to,1,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr); 39980c7d97c5SJed Brown /* Scatter receiving details to members of coarse decomposition */ 39990c7d97c5SJed Brown if ( coarse_color == 0) { 400053cdbc3dSStefano Zampini ierr = MPI_Scatter(&total_count_recv[0],1,MPIU_INT,&count_recv,1,MPIU_INT,master_proc,coarse_comm);CHKERRQ(ierr); 40010c7d97c5SJed Brown ierr = PetscMalloc (count_recv*sizeof(PetscMPIInt),&ranks_recv);CHKERRQ(ierr); 400253cdbc3dSStefano Zampini ierr = MPI_Scatterv(&total_ranks_recv[0],total_count_recv,displacements_recv,MPIU_INT,&ranks_recv[0],count_recv,MPIU_INT,master_proc,coarse_comm);CHKERRQ(ierr); 40030c7d97c5SJed Brown } 40040c7d97c5SJed Brown 4005da1bb401SStefano Zampini /*printf("I will send my matrix data to proc %d\n",rank_coarse_proc_send_to); 4006da1bb401SStefano Zampini if (coarse_color == 0) { 4007da1bb401SStefano Zampini printf("I will receive some matrix data from %d processes (ranks follows)\n",count_recv); 4008da1bb401SStefano Zampini for (i=0;i<count_recv;i++) 4009da1bb401SStefano Zampini printf("%d ",ranks_recv[i]); 
4010da1bb401SStefano Zampini printf("\n"); 4011da1bb401SStefano Zampini }*/ 40120c7d97c5SJed Brown 40130c7d97c5SJed Brown if (rank_prec_comm == master_proc) { 40140bdf917eSStefano Zampini ierr = PetscFree(coarse_subdivision);CHKERRQ(ierr); 4015da1bb401SStefano Zampini ierr = PetscFree(total_count_recv);CHKERRQ(ierr); 40160bdf917eSStefano Zampini ierr = PetscFree(total_ranks_recv);CHKERRQ(ierr); 40170c7d97c5SJed Brown ierr = PetscFree(displacements_recv);CHKERRQ(ierr); 40180c7d97c5SJed Brown } 40190c7d97c5SJed Brown break; 40200c7d97c5SJed Brown } 40210c7d97c5SJed Brown 40220c7d97c5SJed Brown case(REPLICATED_BDDC): 40230c7d97c5SJed Brown 40240c7d97c5SJed Brown pcbddc->coarse_communications_type = GATHERS_BDDC; 40250c7d97c5SJed Brown coarse_mat_type = MATSEQAIJ; 40260c7d97c5SJed Brown coarse_pc_type = PCLU; 402753cdbc3dSStefano Zampini coarse_ksp_type = KSPPREONLY; 40280c7d97c5SJed Brown coarse_comm = PETSC_COMM_SELF; 40290c7d97c5SJed Brown active_rank = rank_prec_comm; 40300c7d97c5SJed Brown break; 40310c7d97c5SJed Brown 40320c7d97c5SJed Brown case(PARALLEL_BDDC): 40330c7d97c5SJed Brown 40340c7d97c5SJed Brown pcbddc->coarse_communications_type = SCATTERS_BDDC; 40350c7d97c5SJed Brown coarse_mat_type = MATMPIAIJ; 40360c7d97c5SJed Brown coarse_pc_type = PCREDUNDANT; 403753cdbc3dSStefano Zampini coarse_ksp_type = KSPPREONLY; 40380c7d97c5SJed Brown coarse_comm = prec_comm; 40390c7d97c5SJed Brown active_rank = rank_prec_comm; 40400c7d97c5SJed Brown break; 40410c7d97c5SJed Brown 40420c7d97c5SJed Brown case(SEQUENTIAL_BDDC): 40430c7d97c5SJed Brown pcbddc->coarse_communications_type = GATHERS_BDDC; 40440c7d97c5SJed Brown coarse_mat_type = MATSEQAIJ; 40450c7d97c5SJed Brown coarse_pc_type = PCLU; 404653cdbc3dSStefano Zampini coarse_ksp_type = KSPPREONLY; 40470c7d97c5SJed Brown coarse_comm = PETSC_COMM_SELF; 40480c7d97c5SJed Brown active_rank = master_proc; 40490c7d97c5SJed Brown break; 40500c7d97c5SJed Brown } 40510c7d97c5SJed Brown 40520c7d97c5SJed Brown 
switch(pcbddc->coarse_communications_type){ 40530c7d97c5SJed Brown 40540c7d97c5SJed Brown case(SCATTERS_BDDC): 40550c7d97c5SJed Brown { 40560c7d97c5SJed Brown if (pcbddc->coarse_problem_type==MULTILEVEL_BDDC) { 40570c7d97c5SJed Brown 40582e8d2280SStefano Zampini IS coarse_IS; 40592e8d2280SStefano Zampini 4060523858cfSStefano Zampini if(pcbddc->coarsening_ratio == 1) { 4061523858cfSStefano Zampini ins_local_primal_size = pcbddc->local_primal_size; 4062523858cfSStefano Zampini ins_local_primal_indices = pcbddc->local_primal_indices; 4063523858cfSStefano Zampini if (coarse_color == 0) { ierr = PetscFree(ranks_recv);CHKERRQ(ierr); } 4064523858cfSStefano Zampini /* nonzeros */ 4065523858cfSStefano Zampini ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&dnz);CHKERRQ(ierr); 4066523858cfSStefano Zampini ierr = PetscMemzero(dnz,ins_local_primal_size*sizeof(PetscInt));CHKERRQ(ierr); 4067523858cfSStefano Zampini for (i=0;i<ins_local_primal_size;i++) { 4068523858cfSStefano Zampini dnz[i] = ins_local_primal_size; 4069523858cfSStefano Zampini } 4070523858cfSStefano Zampini } else { 40710c7d97c5SJed Brown PetscMPIInt send_size; 4072*ef028eecSStefano Zampini PetscMPIInt *send_buffer; 40730c7d97c5SJed Brown PetscInt *aux_ins_indices; 40740c7d97c5SJed Brown PetscInt ii,jj; 40750c7d97c5SJed Brown MPI_Request *requests; 4076*ef028eecSStefano Zampini 4077523858cfSStefano Zampini ierr = PetscMalloc(count_recv*sizeof(PetscMPIInt),&localdispl2);CHKERRQ(ierr); 4078523858cfSStefano Zampini /* reusing pcbddc->local_primal_displacements and pcbddc->replicated_primal_size */ 4079523858cfSStefano Zampini ierr = PetscFree(pcbddc->local_primal_displacements);CHKERRQ(ierr); 4080523858cfSStefano Zampini ierr = PetscMalloc((count_recv+1)*sizeof(PetscMPIInt),&pcbddc->local_primal_displacements);CHKERRQ(ierr); 4081523858cfSStefano Zampini pcbddc->replicated_primal_size = count_recv; 4082523858cfSStefano Zampini j = 0; 4083523858cfSStefano Zampini for (i=0;i<count_recv;i++) { 
4084523858cfSStefano Zampini pcbddc->local_primal_displacements[i] = j; 4085523858cfSStefano Zampini j += pcbddc->local_primal_sizes[ranks_recv[i]]; 4086523858cfSStefano Zampini } 4087523858cfSStefano Zampini pcbddc->local_primal_displacements[count_recv] = j; 4088523858cfSStefano Zampini ierr = PetscMalloc(j*sizeof(PetscMPIInt),&pcbddc->replicated_local_primal_indices);CHKERRQ(ierr); 40890c7d97c5SJed Brown /* allocate auxiliary space */ 4090523858cfSStefano Zampini ierr = PetscMalloc(count_recv*sizeof(PetscMPIInt),&localsizes2);CHKERRQ(ierr); 40910c7d97c5SJed Brown ierr = PetscMalloc(pcbddc->coarse_size*sizeof(PetscInt),&aux_ins_indices);CHKERRQ(ierr); 40920c7d97c5SJed Brown ierr = PetscMemzero(aux_ins_indices,pcbddc->coarse_size*sizeof(PetscInt));CHKERRQ(ierr); 40930c7d97c5SJed Brown /* allocate stuffs for message massing */ 40940c7d97c5SJed Brown ierr = PetscMalloc((count_recv+1)*sizeof(MPI_Request),&requests);CHKERRQ(ierr); 4095523858cfSStefano Zampini for (i=0;i<count_recv+1;i++) { requests[i]=MPI_REQUEST_NULL; } 4096523858cfSStefano Zampini /* send indices to be inserted */ 4097523858cfSStefano Zampini for (i=0;i<count_recv;i++) { 4098523858cfSStefano Zampini send_size = pcbddc->local_primal_sizes[ranks_recv[i]]; 4099523858cfSStefano Zampini ierr = MPI_Irecv(&pcbddc->replicated_local_primal_indices[pcbddc->local_primal_displacements[i]],send_size,MPIU_INT,ranks_recv[i],999,prec_comm,&requests[i]);CHKERRQ(ierr); 4100523858cfSStefano Zampini } 4101523858cfSStefano Zampini if (rank_coarse_proc_send_to != MPI_PROC_NULL ) { 4102523858cfSStefano Zampini send_size = pcbddc->local_primal_size; 4103*ef028eecSStefano Zampini ierr = PetscMalloc(send_size*sizeof(PetscMPIInt),&send_buffer);CHKERRQ(ierr); 4104*ef028eecSStefano Zampini for (i=0;i<send_size;i++) { 4105*ef028eecSStefano Zampini send_buffer[i]=(PetscMPIInt)pcbddc->local_primal_indices[i]; 4106*ef028eecSStefano Zampini } 4107*ef028eecSStefano Zampini ierr = 
MPI_Isend(send_buffer,send_size,MPIU_INT,rank_coarse_proc_send_to,999,prec_comm,&requests[count_recv]);CHKERRQ(ierr); 4108523858cfSStefano Zampini } 4109523858cfSStefano Zampini ierr = MPI_Waitall(count_recv+1,requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 4110*ef028eecSStefano Zampini if (rank_coarse_proc_send_to != MPI_PROC_NULL ) { 4111*ef028eecSStefano Zampini ierr = PetscFree(send_buffer);CHKERRQ(ierr); 4112*ef028eecSStefano Zampini } 41130c7d97c5SJed Brown j = 0; 41140c7d97c5SJed Brown for (i=0;i<count_recv;i++) { 41152e8d2280SStefano Zampini ii = pcbddc->local_primal_displacements[i+1]-pcbddc->local_primal_displacements[i]; 41162e8d2280SStefano Zampini localsizes2[i] = ii*ii; 41170c7d97c5SJed Brown localdispl2[i] = j; 41180c7d97c5SJed Brown j += localsizes2[i]; 4119523858cfSStefano Zampini jj = pcbddc->local_primal_displacements[i]; 41204fad6a16SStefano Zampini /* it counts the coarse subdomains sharing the coarse node */ 41212e8d2280SStefano Zampini for (k=0;k<ii;k++) { 41224fad6a16SStefano Zampini aux_ins_indices[pcbddc->replicated_local_primal_indices[jj+k]] += 1; 41230c7d97c5SJed Brown } 41244fad6a16SStefano Zampini } 4125523858cfSStefano Zampini /* temp_coarse_mat_vals used to store matrix values to be received */ 41260c7d97c5SJed Brown ierr = PetscMalloc(j*sizeof(PetscScalar),&temp_coarse_mat_vals);CHKERRQ(ierr); 41270c7d97c5SJed Brown /* evaluate how many values I will insert in coarse mat */ 41280c7d97c5SJed Brown ins_local_primal_size = 0; 4129ea7e1babSStefano Zampini for (i=0;i<pcbddc->coarse_size;i++) { 4130ea7e1babSStefano Zampini if (aux_ins_indices[i]) { 41310c7d97c5SJed Brown ins_local_primal_size++; 4132ea7e1babSStefano Zampini } 4133ea7e1babSStefano Zampini } 41340c7d97c5SJed Brown /* evaluate indices I will insert in coarse mat */ 41350c7d97c5SJed Brown ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr); 41360c7d97c5SJed Brown j = 0; 4137ea7e1babSStefano Zampini 
for(i=0;i<pcbddc->coarse_size;i++) { 4138ea7e1babSStefano Zampini if(aux_ins_indices[i]) { 41392e8d2280SStefano Zampini ins_local_primal_indices[j] = i; 41402e8d2280SStefano Zampini j++; 4141ea7e1babSStefano Zampini } 4142ea7e1babSStefano Zampini } 4143523858cfSStefano Zampini /* processes partecipating in coarse problem receive matrix data from their friends */ 4144523858cfSStefano Zampini for (i=0;i<count_recv;i++) { 4145523858cfSStefano Zampini ierr = MPI_Irecv(&temp_coarse_mat_vals[localdispl2[i]],localsizes2[i],MPIU_SCALAR,ranks_recv[i],666,prec_comm,&requests[i]);CHKERRQ(ierr); 4146523858cfSStefano Zampini } 4147523858cfSStefano Zampini if (rank_coarse_proc_send_to != MPI_PROC_NULL ) { 4148523858cfSStefano Zampini send_size = pcbddc->local_primal_size*pcbddc->local_primal_size; 4149523858cfSStefano Zampini ierr = MPI_Isend(&coarse_submat_vals[0],send_size,MPIU_SCALAR,rank_coarse_proc_send_to,666,prec_comm,&requests[count_recv]);CHKERRQ(ierr); 4150523858cfSStefano Zampini } 4151523858cfSStefano Zampini ierr = MPI_Waitall(count_recv+1,requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 4152523858cfSStefano Zampini /* nonzeros */ 4153523858cfSStefano Zampini ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&dnz);CHKERRQ(ierr); 4154523858cfSStefano Zampini ierr = PetscMemzero(dnz,ins_local_primal_size*sizeof(PetscInt));CHKERRQ(ierr); 41550c7d97c5SJed Brown /* use aux_ins_indices to realize a global to local mapping */ 41560c7d97c5SJed Brown j=0; 41570c7d97c5SJed Brown for(i=0;i<pcbddc->coarse_size;i++){ 41580c7d97c5SJed Brown if(aux_ins_indices[i]==0){ 41590c7d97c5SJed Brown aux_ins_indices[i]=-1; 41600c7d97c5SJed Brown } else { 41610c7d97c5SJed Brown aux_ins_indices[i]=j; 41620c7d97c5SJed Brown j++; 41630c7d97c5SJed Brown } 41640c7d97c5SJed Brown } 41654fad6a16SStefano Zampini for (i=0;i<count_recv;i++) { 4166523858cfSStefano Zampini j = pcbddc->local_primal_sizes[ranks_recv[i]]; 4167523858cfSStefano Zampini for (k=0;k<j;k++) { 4168523858cfSStefano Zampini 
dnz[aux_ins_indices[pcbddc->replicated_local_primal_indices[pcbddc->local_primal_displacements[i]+k]]] += j; 41690c7d97c5SJed Brown } 41700c7d97c5SJed Brown } 4171523858cfSStefano Zampini /* check */ 4172523858cfSStefano Zampini for (i=0;i<ins_local_primal_size;i++) { 4173523858cfSStefano Zampini if (dnz[i] > ins_local_primal_size) { 4174523858cfSStefano Zampini dnz[i] = ins_local_primal_size; 41750c7d97c5SJed Brown } 41760c7d97c5SJed Brown } 41770c7d97c5SJed Brown ierr = PetscFree(requests);CHKERRQ(ierr); 41780c7d97c5SJed Brown ierr = PetscFree(aux_ins_indices);CHKERRQ(ierr); 41790c7d97c5SJed Brown if (coarse_color == 0) { ierr = PetscFree(ranks_recv);CHKERRQ(ierr); } 41804fad6a16SStefano Zampini } 41810c7d97c5SJed Brown /* create local to global mapping needed by coarse MATIS */ 4182142dfd88SStefano Zampini if (coarse_comm != MPI_COMM_NULL ) {ierr = MPI_Comm_free(&coarse_comm);CHKERRQ(ierr);} 41830c7d97c5SJed Brown coarse_comm = prec_comm; 41840c7d97c5SJed Brown active_rank = rank_prec_comm; 41850c7d97c5SJed Brown ierr = ISCreateGeneral(coarse_comm,ins_local_primal_size,ins_local_primal_indices,PETSC_COPY_VALUES,&coarse_IS);CHKERRQ(ierr); 41860c7d97c5SJed Brown ierr = ISLocalToGlobalMappingCreateIS(coarse_IS,&coarse_ISLG);CHKERRQ(ierr); 41870c7d97c5SJed Brown ierr = ISDestroy(&coarse_IS);CHKERRQ(ierr); 41882e8d2280SStefano Zampini } else if (pcbddc->coarse_problem_type==PARALLEL_BDDC) { 41890c7d97c5SJed Brown /* arrays for values insertion */ 41900c7d97c5SJed Brown ins_local_primal_size = pcbddc->local_primal_size; 41912e8d2280SStefano Zampini ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr); 41920c7d97c5SJed Brown ierr = PetscMalloc(ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar),&ins_coarse_mat_vals);CHKERRQ(ierr); 41930c7d97c5SJed Brown for (j=0;j<ins_local_primal_size;j++){ 41940c7d97c5SJed Brown ins_local_primal_indices[j]=pcbddc->local_primal_indices[j]; 41954fad6a16SStefano Zampini for 
(i=0;i<ins_local_primal_size;i++) { 41964fad6a16SStefano Zampini ins_coarse_mat_vals[j*ins_local_primal_size+i]=coarse_submat_vals[j*ins_local_primal_size+i]; 41974fad6a16SStefano Zampini } 41980c7d97c5SJed Brown } 41990c7d97c5SJed Brown } 42000c7d97c5SJed Brown break; 42010c7d97c5SJed Brown 42020c7d97c5SJed Brown } 42030c7d97c5SJed Brown 42040c7d97c5SJed Brown case(GATHERS_BDDC): 42050c7d97c5SJed Brown { 42060c7d97c5SJed Brown 42070c7d97c5SJed Brown PetscMPIInt mysize,mysize2; 4208*ef028eecSStefano Zampini PetscMPIInt *send_buffer; 42090c7d97c5SJed Brown 42100c7d97c5SJed Brown if (rank_prec_comm==active_rank) { 42110c7d97c5SJed Brown ierr = PetscMalloc ( pcbddc->replicated_primal_size*sizeof(PetscMPIInt),&pcbddc->replicated_local_primal_indices);CHKERRQ(ierr); 42120bdf917eSStefano Zampini ierr = PetscMalloc ( pcbddc->replicated_primal_size*sizeof(PetscScalar),&pcbddc->replicated_local_primal_values);CHKERRQ(ierr); 42130c7d97c5SJed Brown ierr = PetscMalloc ( size_prec_comm*sizeof(PetscMPIInt),&localsizes2);CHKERRQ(ierr); 42140c7d97c5SJed Brown ierr = PetscMalloc ( size_prec_comm*sizeof(PetscMPIInt),&localdispl2);CHKERRQ(ierr); 42150c7d97c5SJed Brown /* arrays for values insertion */ 42164fad6a16SStefano Zampini for (i=0;i<size_prec_comm;i++) { localsizes2[i]=pcbddc->local_primal_sizes[i]*pcbddc->local_primal_sizes[i]; } 42170c7d97c5SJed Brown localdispl2[0]=0; 42184fad6a16SStefano Zampini for (i=1;i<size_prec_comm;i++) { localdispl2[i]=localsizes2[i-1]+localdispl2[i-1]; } 42190c7d97c5SJed Brown j=0; 42204fad6a16SStefano Zampini for (i=0;i<size_prec_comm;i++) { j+=localsizes2[i]; } 42210c7d97c5SJed Brown ierr = PetscMalloc ( j*sizeof(PetscScalar),&temp_coarse_mat_vals);CHKERRQ(ierr); 42220c7d97c5SJed Brown } 42230c7d97c5SJed Brown 42240c7d97c5SJed Brown mysize=pcbddc->local_primal_size; 42250c7d97c5SJed Brown mysize2=pcbddc->local_primal_size*pcbddc->local_primal_size; 4226*ef028eecSStefano Zampini ierr = 
PetscMalloc(mysize*sizeof(PetscMPIInt),&send_buffer);CHKERRQ(ierr); 4227*ef028eecSStefano Zampini for (i=0;i<mysize;i++) { 4228*ef028eecSStefano Zampini send_buffer[i]=(PetscMPIInt)pcbddc->local_primal_indices[i]; 4229*ef028eecSStefano Zampini } 42300c7d97c5SJed Brown if (pcbddc->coarse_problem_type == SEQUENTIAL_BDDC){ 4231*ef028eecSStefano Zampini ierr = MPI_Gatherv(send_buffer,mysize,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr); 423253cdbc3dSStefano Zampini ierr = MPI_Gatherv(&coarse_submat_vals[0],mysize2,MPIU_SCALAR,&temp_coarse_mat_vals[0],localsizes2,localdispl2,MPIU_SCALAR,master_proc,prec_comm);CHKERRQ(ierr); 42330c7d97c5SJed Brown } else { 4234*ef028eecSStefano Zampini ierr = MPI_Allgatherv(send_buffer,mysize,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,prec_comm);CHKERRQ(ierr); 423553cdbc3dSStefano Zampini ierr = MPI_Allgatherv(&coarse_submat_vals[0],mysize2,MPIU_SCALAR,&temp_coarse_mat_vals[0],localsizes2,localdispl2,MPIU_SCALAR,prec_comm);CHKERRQ(ierr); 42360c7d97c5SJed Brown } 4237*ef028eecSStefano Zampini ierr = PetscFree(send_buffer);CHKERRQ(ierr); 42380c7d97c5SJed Brown break; 4239da1bb401SStefano Zampini }/* switch on coarse problem and communications associated with finished */ 42400c7d97c5SJed Brown } 42410c7d97c5SJed Brown 42420c7d97c5SJed Brown /* Now create and fill up coarse matrix */ 42430c7d97c5SJed Brown if ( rank_prec_comm == active_rank ) { 4244142dfd88SStefano Zampini 4245142dfd88SStefano Zampini Mat matis_coarse_local_mat; 4246142dfd88SStefano Zampini 42470c7d97c5SJed Brown if (pcbddc->coarse_problem_type != MULTILEVEL_BDDC) { 42480c7d97c5SJed Brown ierr = MatCreate(coarse_comm,&pcbddc->coarse_mat);CHKERRQ(ierr); 42490c7d97c5SJed Brown ierr = 
MatSetSizes(pcbddc->coarse_mat,PETSC_DECIDE,PETSC_DECIDE,pcbddc->coarse_size,pcbddc->coarse_size);CHKERRQ(ierr); 42500c7d97c5SJed Brown ierr = MatSetType(pcbddc->coarse_mat,coarse_mat_type);CHKERRQ(ierr); 42513b03a366Sstefano_zampini ierr = MatSetUp(pcbddc->coarse_mat);CHKERRQ(ierr); 4252da1bb401SStefano Zampini ierr = MatSetOption(pcbddc->coarse_mat,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr); /* local values stored in column major */ 42533b03a366Sstefano_zampini ierr = MatSetOption(pcbddc->coarse_mat,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr); 42540c7d97c5SJed Brown } else { 42554fad6a16SStefano Zampini ierr = MatCreateIS(coarse_comm,1,PETSC_DECIDE,PETSC_DECIDE,pcbddc->coarse_size,pcbddc->coarse_size,coarse_ISLG,&pcbddc->coarse_mat);CHKERRQ(ierr); 42563b03a366Sstefano_zampini ierr = MatSetUp(pcbddc->coarse_mat);CHKERRQ(ierr); 42570c7d97c5SJed Brown ierr = MatISGetLocalMat(pcbddc->coarse_mat,&matis_coarse_local_mat);CHKERRQ(ierr); 42583b03a366Sstefano_zampini ierr = MatSetUp(matis_coarse_local_mat);CHKERRQ(ierr); 4259da1bb401SStefano Zampini ierr = MatSetOption(matis_coarse_local_mat,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr); /* local values stored in column major */ 4260a0ba757dSStefano Zampini ierr = MatSetOption(matis_coarse_local_mat,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr); 42610c7d97c5SJed Brown } 4262142dfd88SStefano Zampini /* preallocation */ 4263142dfd88SStefano Zampini if (pcbddc->coarse_problem_type != MULTILEVEL_BDDC) { 4264*ef028eecSStefano Zampini 4265142dfd88SStefano Zampini PetscInt lrows,lcols; 4266*ef028eecSStefano Zampini 4267142dfd88SStefano Zampini ierr = MatGetLocalSize(pcbddc->coarse_mat,&lrows,&lcols);CHKERRQ(ierr); 4268142dfd88SStefano Zampini ierr = MatPreallocateInitialize(coarse_comm,lrows,lcols,dnz,onz);CHKERRQ(ierr); 4269*ef028eecSStefano Zampini 4270142dfd88SStefano Zampini if (pcbddc->coarse_problem_type == PARALLEL_BDDC) { 4271*ef028eecSStefano Zampini 4272*ef028eecSStefano Zampini Vec vec_dnz,vec_onz; 
4273*ef028eecSStefano Zampini PetscScalar *my_dnz,*my_onz,*array; 4274*ef028eecSStefano Zampini PetscInt *mat_ranges,*row_ownership; 4275*ef028eecSStefano Zampini PetscInt coarse_index_row,coarse_index_col,owner; 4276*ef028eecSStefano Zampini 4277*ef028eecSStefano Zampini ierr = VecCreate(prec_comm,&vec_dnz);CHKERRQ(ierr); 4278*ef028eecSStefano Zampini ierr = VecSetSizes(vec_dnz,PETSC_DECIDE,pcbddc->coarse_size);CHKERRQ(ierr); 4279*ef028eecSStefano Zampini ierr = VecSetType(vec_dnz,VECMPI);CHKERRQ(ierr); 4280*ef028eecSStefano Zampini ierr = VecDuplicate(vec_dnz,&vec_onz);CHKERRQ(ierr); 4281*ef028eecSStefano Zampini 4282*ef028eecSStefano Zampini ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscScalar),&my_dnz);CHKERRQ(ierr); 4283*ef028eecSStefano Zampini ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscScalar),&my_onz);CHKERRQ(ierr); 4284*ef028eecSStefano Zampini ierr = PetscMemzero(my_dnz,pcbddc->local_primal_size*sizeof(PetscScalar));CHKERRQ(ierr); 4285*ef028eecSStefano Zampini ierr = PetscMemzero(my_onz,pcbddc->local_primal_size*sizeof(PetscScalar));CHKERRQ(ierr); 4286*ef028eecSStefano Zampini 4287*ef028eecSStefano Zampini ierr = PetscMalloc(pcbddc->coarse_size*sizeof(PetscInt),&row_ownership);CHKERRQ(ierr); 4288*ef028eecSStefano Zampini ierr = MatGetOwnershipRanges(pcbddc->coarse_mat,(const PetscInt**)&mat_ranges);CHKERRQ(ierr); 4289142dfd88SStefano Zampini for (i=0;i<size_prec_comm;i++) { 4290*ef028eecSStefano Zampini for (j=mat_ranges[i];j<mat_ranges[i+1];j++) { 4291*ef028eecSStefano Zampini row_ownership[j]=i; 4292142dfd88SStefano Zampini } 4293142dfd88SStefano Zampini } 4294*ef028eecSStefano Zampini 4295*ef028eecSStefano Zampini for (i=0;i<pcbddc->local_primal_size;i++) { 4296*ef028eecSStefano Zampini coarse_index_row = pcbddc->local_primal_indices[i]; 4297*ef028eecSStefano Zampini owner = row_ownership[coarse_index_row]; 4298*ef028eecSStefano Zampini for (j=i;j<pcbddc->local_primal_size;j++) { 4299*ef028eecSStefano Zampini owner = 
row_ownership[coarse_index_row]; 4300*ef028eecSStefano Zampini coarse_index_col = pcbddc->local_primal_indices[j]; 4301*ef028eecSStefano Zampini if (coarse_index_col > mat_ranges[owner]-1 && coarse_index_col < mat_ranges[owner+1] ) { 4302*ef028eecSStefano Zampini my_dnz[i] += 1.0; 4303142dfd88SStefano Zampini } else { 4304*ef028eecSStefano Zampini my_onz[i] += 1.0; 4305142dfd88SStefano Zampini } 4306*ef028eecSStefano Zampini if (i != j) { 4307*ef028eecSStefano Zampini owner = row_ownership[coarse_index_col]; 4308*ef028eecSStefano Zampini if (coarse_index_row > mat_ranges[owner]-1 && coarse_index_row < mat_ranges[owner+1] ) { 4309*ef028eecSStefano Zampini my_dnz[j] += 1.0; 4310142dfd88SStefano Zampini } else { 4311*ef028eecSStefano Zampini my_onz[j] += 1.0; 4312142dfd88SStefano Zampini } 4313142dfd88SStefano Zampini } 4314142dfd88SStefano Zampini } 4315142dfd88SStefano Zampini } 4316*ef028eecSStefano Zampini ierr = VecSet(vec_dnz,0.0);CHKERRQ(ierr); 4317*ef028eecSStefano Zampini ierr = VecSet(vec_onz,0.0);CHKERRQ(ierr); 4318*ef028eecSStefano Zampini ierr = VecSetValues(vec_dnz,pcbddc->local_primal_size,pcbddc->local_primal_indices,my_dnz,ADD_VALUES);CHKERRQ(ierr); 4319*ef028eecSStefano Zampini ierr = VecSetValues(vec_onz,pcbddc->local_primal_size,pcbddc->local_primal_indices,my_onz,ADD_VALUES);CHKERRQ(ierr); 4320*ef028eecSStefano Zampini ierr = VecAssemblyBegin(vec_dnz);CHKERRQ(ierr); 4321*ef028eecSStefano Zampini ierr = VecAssemblyBegin(vec_onz);CHKERRQ(ierr); 4322*ef028eecSStefano Zampini ierr = VecAssemblyEnd(vec_dnz);CHKERRQ(ierr); 4323*ef028eecSStefano Zampini ierr = VecAssemblyEnd(vec_onz);CHKERRQ(ierr); 4324*ef028eecSStefano Zampini j = mat_ranges[rank_prec_comm+1]-mat_ranges[rank_prec_comm]; 4325*ef028eecSStefano Zampini ierr = VecGetArray(vec_dnz,&array);CHKERRQ(ierr); 4326*ef028eecSStefano Zampini for (i=0;i<j;i++) { 4327*ef028eecSStefano Zampini dnz[i] = (PetscInt)array[i]; 4328142dfd88SStefano Zampini } 4329*ef028eecSStefano Zampini ierr = 
VecRestoreArray(vec_dnz,&array);CHKERRQ(ierr); 4330*ef028eecSStefano Zampini ierr = VecGetArray(vec_onz,&array);CHKERRQ(ierr); 4331*ef028eecSStefano Zampini for (i=0;i<j;i++) { 4332*ef028eecSStefano Zampini onz[i] = (PetscInt)array[i]; 4333142dfd88SStefano Zampini } 4334*ef028eecSStefano Zampini ierr = VecRestoreArray(vec_onz,&array);CHKERRQ(ierr); 4335*ef028eecSStefano Zampini ierr = PetscFree(my_dnz);CHKERRQ(ierr); 4336*ef028eecSStefano Zampini ierr = PetscFree(my_onz);CHKERRQ(ierr); 4337*ef028eecSStefano Zampini ierr = PetscFree(row_ownership);CHKERRQ(ierr); 4338*ef028eecSStefano Zampini ierr = VecDestroy(&vec_dnz);CHKERRQ(ierr); 4339*ef028eecSStefano Zampini ierr = VecDestroy(&vec_onz);CHKERRQ(ierr); 4340142dfd88SStefano Zampini } else { 4341142dfd88SStefano Zampini for (k=0;k<size_prec_comm;k++){ 4342142dfd88SStefano Zampini offset=pcbddc->local_primal_displacements[k]; 4343142dfd88SStefano Zampini offset2=localdispl2[k]; 4344142dfd88SStefano Zampini ins_local_primal_size = pcbddc->local_primal_sizes[k]; 4345*ef028eecSStefano Zampini ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr); 4346*ef028eecSStefano Zampini for (j=0;j<ins_local_primal_size;j++){ 4347*ef028eecSStefano Zampini ins_local_primal_indices[j]=(PetscInt)pcbddc->replicated_local_primal_indices[offset+j]; 4348*ef028eecSStefano Zampini } 4349142dfd88SStefano Zampini for (j=0;j<ins_local_primal_size;j++) { 4350142dfd88SStefano Zampini ierr = MatPreallocateSet(ins_local_primal_indices[j],ins_local_primal_size,ins_local_primal_indices,dnz,onz);CHKERRQ(ierr); 4351142dfd88SStefano Zampini } 4352*ef028eecSStefano Zampini ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr); 4353142dfd88SStefano Zampini } 4354142dfd88SStefano Zampini } 4355142dfd88SStefano Zampini /* check */ 4356142dfd88SStefano Zampini for (i=0;i<lrows;i++) { 4357142dfd88SStefano Zampini if (dnz[i]>lcols) { 4358142dfd88SStefano Zampini dnz[i]=lcols; 4359142dfd88SStefano Zampini } 
4360142dfd88SStefano Zampini if (onz[i]>pcbddc->coarse_size-lcols) { 4361142dfd88SStefano Zampini onz[i]=pcbddc->coarse_size-lcols; 4362142dfd88SStefano Zampini } 4363142dfd88SStefano Zampini } 4364142dfd88SStefano Zampini ierr = MatSeqAIJSetPreallocation(pcbddc->coarse_mat,PETSC_NULL,dnz);CHKERRQ(ierr); 4365142dfd88SStefano Zampini ierr = MatMPIAIJSetPreallocation(pcbddc->coarse_mat,PETSC_NULL,dnz,PETSC_NULL,onz);CHKERRQ(ierr); 4366142dfd88SStefano Zampini ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 4367142dfd88SStefano Zampini } else { 4368523858cfSStefano Zampini ierr = MatSeqAIJSetPreallocation(matis_coarse_local_mat,0,dnz);CHKERRQ(ierr); 4369523858cfSStefano Zampini ierr = PetscFree(dnz);CHKERRQ(ierr); 4370142dfd88SStefano Zampini } 4371142dfd88SStefano Zampini /* insert values */ 4372523858cfSStefano Zampini if (pcbddc->coarse_problem_type == PARALLEL_BDDC) { 43730c7d97c5SJed Brown ierr = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,ADD_VALUES);CHKERRQ(ierr); 4374523858cfSStefano Zampini } else if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) { 4375523858cfSStefano Zampini if (pcbddc->coarsening_ratio == 1) { 4376523858cfSStefano Zampini ins_coarse_mat_vals = coarse_submat_vals; 4377523858cfSStefano Zampini ierr = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,INSERT_VALUES);CHKERRQ(ierr); 4378523858cfSStefano Zampini } else { 4379523858cfSStefano Zampini ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr); 4380523858cfSStefano Zampini for (k=0;k<pcbddc->replicated_primal_size;k++) { 4381523858cfSStefano Zampini offset = pcbddc->local_primal_displacements[k]; 4382523858cfSStefano Zampini offset2 = localdispl2[k]; 4383523858cfSStefano Zampini ins_local_primal_size = pcbddc->local_primal_displacements[k+1]-pcbddc->local_primal_displacements[k]; 
4384*ef028eecSStefano Zampini ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr); 4385*ef028eecSStefano Zampini for (j=0;j<ins_local_primal_size;j++){ 4386*ef028eecSStefano Zampini ins_local_primal_indices[j]=(PetscInt)pcbddc->replicated_local_primal_indices[offset+j]; 4387*ef028eecSStefano Zampini } 4388523858cfSStefano Zampini ins_coarse_mat_vals = &temp_coarse_mat_vals[offset2]; 4389523858cfSStefano Zampini ierr = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,ADD_VALUES);CHKERRQ(ierr); 4390*ef028eecSStefano Zampini ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr); 4391523858cfSStefano Zampini } 4392523858cfSStefano Zampini } 4393523858cfSStefano Zampini ins_local_primal_indices = 0; 4394523858cfSStefano Zampini ins_coarse_mat_vals = 0; 4395ea7e1babSStefano Zampini } else { 4396ea7e1babSStefano Zampini for (k=0;k<size_prec_comm;k++){ 4397ea7e1babSStefano Zampini offset=pcbddc->local_primal_displacements[k]; 4398ea7e1babSStefano Zampini offset2=localdispl2[k]; 4399ea7e1babSStefano Zampini ins_local_primal_size = pcbddc->local_primal_sizes[k]; 4400*ef028eecSStefano Zampini ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr); 4401*ef028eecSStefano Zampini for (j=0;j<ins_local_primal_size;j++){ 4402*ef028eecSStefano Zampini ins_local_primal_indices[j]=(PetscInt)pcbddc->replicated_local_primal_indices[offset+j]; 4403*ef028eecSStefano Zampini } 4404ea7e1babSStefano Zampini ins_coarse_mat_vals = &temp_coarse_mat_vals[offset2]; 4405ea7e1babSStefano Zampini ierr = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,ADD_VALUES);CHKERRQ(ierr); 4406*ef028eecSStefano Zampini ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr); 4407ea7e1babSStefano Zampini } 4408ea7e1babSStefano 
Zampini ins_local_primal_indices = 0; 4409ea7e1babSStefano Zampini ins_coarse_mat_vals = 0; 4410ea7e1babSStefano Zampini } 44110c7d97c5SJed Brown ierr = MatAssemblyBegin(pcbddc->coarse_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 44120c7d97c5SJed Brown ierr = MatAssemblyEnd(pcbddc->coarse_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 4413142dfd88SStefano Zampini /* symmetry of coarse matrix */ 4414142dfd88SStefano Zampini if (issym) { 4415142dfd88SStefano Zampini ierr = MatSetOption(pcbddc->coarse_mat,MAT_SYMMETRIC,PETSC_TRUE);CHKERRQ(ierr); 4416142dfd88SStefano Zampini } 44170c7d97c5SJed Brown ierr = MatGetVecs(pcbddc->coarse_mat,&pcbddc->coarse_vec,&pcbddc->coarse_rhs);CHKERRQ(ierr); 44180bdf917eSStefano Zampini } 44190bdf917eSStefano Zampini 44200bdf917eSStefano Zampini /* create loc to glob scatters if needed */ 44210bdf917eSStefano Zampini if (pcbddc->coarse_communications_type == SCATTERS_BDDC) { 44220bdf917eSStefano Zampini IS local_IS,global_IS; 44230bdf917eSStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,pcbddc->local_primal_size,0,1,&local_IS);CHKERRQ(ierr); 44240bdf917eSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_indices,PETSC_COPY_VALUES,&global_IS);CHKERRQ(ierr); 44250bdf917eSStefano Zampini ierr = VecScatterCreate(pcbddc->vec1_P,local_IS,pcbddc->coarse_vec,global_IS,&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr); 44260bdf917eSStefano Zampini ierr = ISDestroy(&local_IS);CHKERRQ(ierr); 44270bdf917eSStefano Zampini ierr = ISDestroy(&global_IS);CHKERRQ(ierr); 44280bdf917eSStefano Zampini } 44290bdf917eSStefano Zampini 44300bdf917eSStefano Zampini /* Eval coarse null space */ 44310bdf917eSStefano Zampini if (pcbddc->NullSpace) { 44320bdf917eSStefano Zampini const Vec *nsp_vecs; 44330bdf917eSStefano Zampini PetscInt nsp_size,coarse_nsp_size; 44340bdf917eSStefano Zampini PetscBool nsp_has_cnst; 44350bdf917eSStefano Zampini PetscReal test_null; 44360bdf917eSStefano Zampini Vec *coarse_nsp_vecs; 
44370bdf917eSStefano Zampini 44380bdf917eSStefano Zampini coarse_nsp_size = 0; 44390bdf917eSStefano Zampini coarse_nsp_vecs = 0; 44400bdf917eSStefano Zampini ierr = MatNullSpaceGetVecs(pcbddc->NullSpace,&nsp_has_cnst,&nsp_size,&nsp_vecs);CHKERRQ(ierr); 44410bdf917eSStefano Zampini if (rank_prec_comm == active_rank) { 44420bdf917eSStefano Zampini ierr = PetscMalloc((nsp_size+1)*sizeof(Vec),&coarse_nsp_vecs);CHKERRQ(ierr); 44430bdf917eSStefano Zampini for (i=0;i<nsp_size+1;i++) { 44440bdf917eSStefano Zampini ierr = VecDuplicate(pcbddc->coarse_vec,&coarse_nsp_vecs[i]);CHKERRQ(ierr); 44450bdf917eSStefano Zampini } 44460bdf917eSStefano Zampini } 44470bdf917eSStefano Zampini if (nsp_has_cnst) { 44480bdf917eSStefano Zampini ierr = VecSet(pcis->vec1_N,1.0);CHKERRQ(ierr); 44490bdf917eSStefano Zampini ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr); 44500bdf917eSStefano Zampini ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->vec1_P,pcbddc->coarse_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 44510bdf917eSStefano Zampini ierr = PCBDDCScatterCoarseDataEnd(pc,pcbddc->vec1_P,pcbddc->coarse_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 44520bdf917eSStefano Zampini if (rank_prec_comm == active_rank) { 44530bdf917eSStefano Zampini ierr = MatMult(pcbddc->coarse_mat,pcbddc->coarse_vec,pcbddc->coarse_rhs);CHKERRQ(ierr); 44540bdf917eSStefano Zampini ierr = VecNorm(pcbddc->coarse_rhs,NORM_INFINITY,&test_null);CHKERRQ(ierr); 44550bdf917eSStefano Zampini if (test_null > 1.0e-12 && pcbddc->dbg_flag ) { 44560bdf917eSStefano Zampini ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Constant coarse null space error % 1.14e\n",test_null);CHKERRQ(ierr); 44570bdf917eSStefano Zampini } 44580bdf917eSStefano Zampini ierr = VecCopy(pcbddc->coarse_vec,coarse_nsp_vecs[coarse_nsp_size]);CHKERRQ(ierr); 44590bdf917eSStefano Zampini coarse_nsp_size++; 44600bdf917eSStefano Zampini } 44610bdf917eSStefano Zampini } 44620bdf917eSStefano Zampini for 
(i=0;i<nsp_size;i++) { 44630bdf917eSStefano Zampini ierr = VecScatterBegin(matis->ctx,nsp_vecs[i],pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 44640bdf917eSStefano Zampini ierr = VecScatterEnd (matis->ctx,nsp_vecs[i],pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 44650bdf917eSStefano Zampini ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr); 44660bdf917eSStefano Zampini ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->vec1_P,pcbddc->coarse_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 44670bdf917eSStefano Zampini ierr = PCBDDCScatterCoarseDataEnd(pc,pcbddc->vec1_P,pcbddc->coarse_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 44680bdf917eSStefano Zampini if (rank_prec_comm == active_rank) { 44690bdf917eSStefano Zampini ierr = MatMult(pcbddc->coarse_mat,pcbddc->coarse_vec,pcbddc->coarse_rhs);CHKERRQ(ierr); 44700bdf917eSStefano Zampini ierr = VecNorm(pcbddc->coarse_rhs,NORM_2,&test_null);CHKERRQ(ierr); 44710bdf917eSStefano Zampini if (test_null > 1.0e-12 && pcbddc->dbg_flag ) { 44720bdf917eSStefano Zampini ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Vec %d coarse null space error % 1.14e\n",i,test_null);CHKERRQ(ierr); 44730bdf917eSStefano Zampini } 44740bdf917eSStefano Zampini ierr = VecCopy(pcbddc->coarse_vec,coarse_nsp_vecs[coarse_nsp_size]);CHKERRQ(ierr); 44750bdf917eSStefano Zampini coarse_nsp_size++; 44760bdf917eSStefano Zampini } 44770bdf917eSStefano Zampini } 44780bdf917eSStefano Zampini if (coarse_nsp_size > 0) { 44790bdf917eSStefano Zampini /* TODO orthonormalize vecs */ 44800bdf917eSStefano Zampini ierr = VecNormalize(coarse_nsp_vecs[0],PETSC_NULL);CHKERRQ(ierr); 44810bdf917eSStefano Zampini ierr = MatNullSpaceCreate(coarse_comm,PETSC_FALSE,coarse_nsp_size,coarse_nsp_vecs,&pcbddc->CoarseNullSpace);CHKERRQ(ierr); 44820bdf917eSStefano Zampini for (i=0;i<nsp_size+1;i++) { 44830bdf917eSStefano Zampini ierr = VecDestroy(&coarse_nsp_vecs[i]);CHKERRQ(ierr); 44840bdf917eSStefano Zampini } 
44850bdf917eSStefano Zampini } 44860bdf917eSStefano Zampini ierr = PetscFree(coarse_nsp_vecs);CHKERRQ(ierr); 44870bdf917eSStefano Zampini } 44880bdf917eSStefano Zampini 44890bdf917eSStefano Zampini /* KSP for coarse problem */ 44900bdf917eSStefano Zampini if (rank_prec_comm == active_rank) { 44912e8d2280SStefano Zampini PetscBool isbddc=PETSC_FALSE; 44920bdf917eSStefano Zampini 449353cdbc3dSStefano Zampini ierr = KSPCreate(coarse_comm,&pcbddc->coarse_ksp);CHKERRQ(ierr); 449453cdbc3dSStefano Zampini ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->coarse_ksp,(PetscObject)pc,1);CHKERRQ(ierr); 449553cdbc3dSStefano Zampini ierr = KSPSetOperators(pcbddc->coarse_ksp,pcbddc->coarse_mat,pcbddc->coarse_mat,SAME_PRECONDITIONER);CHKERRQ(ierr); 44963b03a366Sstefano_zampini ierr = KSPSetTolerances(pcbddc->coarse_ksp,PETSC_DEFAULT,PETSC_DEFAULT,PETSC_DEFAULT,max_it_coarse_ksp);CHKERRQ(ierr); 449753cdbc3dSStefano Zampini ierr = KSPSetType(pcbddc->coarse_ksp,coarse_ksp_type);CHKERRQ(ierr); 449853cdbc3dSStefano Zampini ierr = KSPGetPC(pcbddc->coarse_ksp,&pc_temp);CHKERRQ(ierr); 449953cdbc3dSStefano Zampini ierr = PCSetType(pc_temp,coarse_pc_type);CHKERRQ(ierr); 45000c7d97c5SJed Brown /* Allow user's customization */ 4501da1bb401SStefano Zampini ierr = KSPSetOptionsPrefix(pcbddc->coarse_ksp,"coarse_");CHKERRQ(ierr); 45020c7d97c5SJed Brown /* Set Up PC for coarse problem BDDC */ 450353cdbc3dSStefano Zampini if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) { 45044fad6a16SStefano Zampini i = pcbddc->current_level+1; 45054fad6a16SStefano Zampini ierr = PCBDDCSetLevel(pc_temp,i);CHKERRQ(ierr); 45064fad6a16SStefano Zampini ierr = PCBDDCSetCoarseningRatio(pc_temp,pcbddc->coarsening_ratio);CHKERRQ(ierr); 45074fad6a16SStefano Zampini ierr = PCBDDCSetMaxLevels(pc_temp,pcbddc->max_levels);CHKERRQ(ierr); 450853cdbc3dSStefano Zampini ierr = PCBDDCSetCoarseProblemType(pc_temp,MULTILEVEL_BDDC);CHKERRQ(ierr); 45090bdf917eSStefano Zampini if (pcbddc->CoarseNullSpace) { ierr = 
PCBDDCSetNullSpace(pc_temp,pcbddc->CoarseNullSpace);CHKERRQ(ierr); } 45104fad6a16SStefano Zampini if (dbg_flag) { 45114fad6a16SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"----------------Level %d: Setting up level %d---------------\n",pcbddc->current_level,i);CHKERRQ(ierr); 45124fad6a16SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 451353cdbc3dSStefano Zampini } 45144fad6a16SStefano Zampini } 45154fad6a16SStefano Zampini ierr = KSPSetFromOptions(pcbddc->coarse_ksp);CHKERRQ(ierr); 451653cdbc3dSStefano Zampini ierr = KSPSetUp(pcbddc->coarse_ksp);CHKERRQ(ierr); 4517142dfd88SStefano Zampini 45182e8d2280SStefano Zampini ierr = KSPGetTolerances(pcbddc->coarse_ksp,PETSC_NULL,PETSC_NULL,PETSC_NULL,&j);CHKERRQ(ierr); 45192e8d2280SStefano Zampini ierr = KSPGetPC(pcbddc->coarse_ksp,&pc_temp);CHKERRQ(ierr); 45202e8d2280SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)pc_temp,PCBDDC,&isbddc);CHKERRQ(ierr); 45212e8d2280SStefano Zampini if (j == 1) { 45222e8d2280SStefano Zampini ierr = KSPSetNormType(pcbddc->coarse_ksp,KSP_NORM_NONE);CHKERRQ(ierr); 45232e8d2280SStefano Zampini if (isbddc) { 45242e8d2280SStefano Zampini ierr = PCBDDCSetUseExactDirichlet(pc_temp,PETSC_FALSE);CHKERRQ(ierr); 45255619798eSStefano Zampini } 45265619798eSStefano Zampini } 45270c7d97c5SJed Brown } 45283b03a366Sstefano_zampini /* Evaluate condition number of coarse problem for cheby (and verbose output if requested) */ 4529142dfd88SStefano Zampini if ( dbg_flag && rank_prec_comm == active_rank ) { 4530142dfd88SStefano Zampini KSP check_ksp; 4531142dfd88SStefano Zampini PC check_pc; 4532142dfd88SStefano Zampini Vec check_vec; 4533142dfd88SStefano Zampini PetscReal abs_infty_error,infty_error,lambda_min,lambda_max; 453419fd82e9SBarry Smith KSPType check_ksp_type; 45350c7d97c5SJed Brown 4536142dfd88SStefano Zampini /* Create ksp object suitable for extreme eigenvalues' estimation */ 4537142dfd88SStefano Zampini ierr = KSPCreate(coarse_comm,&check_ksp);CHKERRQ(ierr); 
4538142dfd88SStefano Zampini ierr = KSPSetOperators(check_ksp,pcbddc->coarse_mat,pcbddc->coarse_mat,SAME_PRECONDITIONER);CHKERRQ(ierr); 45390bdf917eSStefano Zampini ierr = KSPSetTolerances(check_ksp,1.e-12,1.e-12,PETSC_DEFAULT,pcbddc->coarse_size);CHKERRQ(ierr); 4540142dfd88SStefano Zampini if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) { 4541142dfd88SStefano Zampini if (issym) { 4542142dfd88SStefano Zampini check_ksp_type = KSPCG; 4543142dfd88SStefano Zampini } else { 4544142dfd88SStefano Zampini check_ksp_type = KSPGMRES; 4545142dfd88SStefano Zampini } 4546142dfd88SStefano Zampini ierr = KSPSetComputeSingularValues(check_ksp,PETSC_TRUE);CHKERRQ(ierr); 4547142dfd88SStefano Zampini } else { 4548142dfd88SStefano Zampini check_ksp_type = KSPPREONLY; 4549142dfd88SStefano Zampini } 4550142dfd88SStefano Zampini ierr = KSPSetType(check_ksp,check_ksp_type);CHKERRQ(ierr); 4551142dfd88SStefano Zampini ierr = KSPGetPC(pcbddc->coarse_ksp,&check_pc);CHKERRQ(ierr); 4552142dfd88SStefano Zampini ierr = KSPSetPC(check_ksp,check_pc);CHKERRQ(ierr); 4553142dfd88SStefano Zampini ierr = KSPSetUp(check_ksp);CHKERRQ(ierr); 4554142dfd88SStefano Zampini /* create random vec */ 4555142dfd88SStefano Zampini ierr = VecDuplicate(pcbddc->coarse_vec,&check_vec);CHKERRQ(ierr); 4556142dfd88SStefano Zampini ierr = VecSetRandom(check_vec,PETSC_NULL);CHKERRQ(ierr); 45570bdf917eSStefano Zampini if (pcbddc->CoarseNullSpace) { ierr = MatNullSpaceRemove(pcbddc->CoarseNullSpace,check_vec,PETSC_NULL);CHKERRQ(ierr); } 4558142dfd88SStefano Zampini ierr = MatMult(pcbddc->coarse_mat,check_vec,pcbddc->coarse_rhs);CHKERRQ(ierr); 4559142dfd88SStefano Zampini /* solve coarse problem */ 4560142dfd88SStefano Zampini ierr = KSPSolve(check_ksp,pcbddc->coarse_rhs,pcbddc->coarse_vec);CHKERRQ(ierr); 45610bdf917eSStefano Zampini if (pcbddc->CoarseNullSpace) { ierr = MatNullSpaceRemove(pcbddc->CoarseNullSpace,pcbddc->coarse_vec,PETSC_NULL);CHKERRQ(ierr); } 4562142dfd88SStefano Zampini /* check coarse problem residual 
error */ 4563142dfd88SStefano Zampini ierr = VecAXPY(check_vec,-1.0,pcbddc->coarse_vec);CHKERRQ(ierr); 4564142dfd88SStefano Zampini ierr = VecNorm(check_vec,NORM_INFINITY,&infty_error);CHKERRQ(ierr); 4565142dfd88SStefano Zampini ierr = MatMult(pcbddc->coarse_mat,check_vec,pcbddc->coarse_rhs);CHKERRQ(ierr); 4566142dfd88SStefano Zampini ierr = VecNorm(pcbddc->coarse_rhs,NORM_INFINITY,&abs_infty_error);CHKERRQ(ierr); 4567142dfd88SStefano Zampini ierr = VecDestroy(&check_vec);CHKERRQ(ierr); 4568142dfd88SStefano Zampini /* get eigenvalue estimation if inexact */ 4569142dfd88SStefano Zampini if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) { 4570142dfd88SStefano Zampini ierr = KSPComputeExtremeSingularValues(check_ksp,&lambda_max,&lambda_min);CHKERRQ(ierr); 4571142dfd88SStefano Zampini ierr = KSPGetIterationNumber(check_ksp,&k);CHKERRQ(ierr); 4572142dfd88SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem eigenvalues estimated with %d iterations of %s.\n",k,check_ksp_type);CHKERRQ(ierr); 4573e269702eSStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem eigenvalues: % 1.14e %1.14e\n",lambda_min,lambda_max);CHKERRQ(ierr); 45743b03a366Sstefano_zampini } 4575142dfd88SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem exact infty_error : %1.14e\n",infty_error);CHKERRQ(ierr); 4576142dfd88SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem residual infty_error: %1.14e\n",abs_infty_error);CHKERRQ(ierr); 4577142dfd88SStefano Zampini ierr = KSPDestroy(&check_ksp);CHKERRQ(ierr); 457853cdbc3dSStefano Zampini } 4579142dfd88SStefano Zampini if (dbg_flag) { ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); } 45800c7d97c5SJed Brown /* free data structures no longer needed */ 45810c7d97c5SJed Brown if (coarse_ISLG) { ierr = ISLocalToGlobalMappingDestroy(&coarse_ISLG);CHKERRQ(ierr); } 45820c7d97c5SJed Brown if (ins_local_primal_indices) { ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr); } 45830c7d97c5SJed Brown 
if (ins_coarse_mat_vals) { ierr = PetscFree(ins_coarse_mat_vals);CHKERRQ(ierr);} 45840c7d97c5SJed Brown if (localsizes2) { ierr = PetscFree(localsizes2);CHKERRQ(ierr);} 45850c7d97c5SJed Brown if (localdispl2) { ierr = PetscFree(localdispl2);CHKERRQ(ierr);} 45860c7d97c5SJed Brown if (temp_coarse_mat_vals) { ierr = PetscFree(temp_coarse_mat_vals);CHKERRQ(ierr);} 45870c7d97c5SJed Brown 45880c7d97c5SJed Brown PetscFunctionReturn(0); 45890c7d97c5SJed Brown } 45900c7d97c5SJed Brown 45910c7d97c5SJed Brown #undef __FUNCT__ 45920c7d97c5SJed Brown #define __FUNCT__ "PCBDDCManageLocalBoundaries" 459353cdbc3dSStefano Zampini static PetscErrorCode PCBDDCManageLocalBoundaries(PC pc) 45940c7d97c5SJed Brown { 45950c7d97c5SJed Brown 45960c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 45970c7d97c5SJed Brown PC_IS *pcis = (PC_IS*)pc->data; 45980c7d97c5SJed Brown Mat_IS *matis = (Mat_IS*)pc->pmat->data; 4599da1bb401SStefano Zampini PCBDDCGraph mat_graph=pcbddc->mat_graph; 46007cf533a6SStefano Zampini PetscInt *is_indices,*auxis; 46013b03a366Sstefano_zampini PetscInt bs,ierr,i,j,s,k,iindex,neumann_bsize,dirichlet_bsize; 4602da1bb401SStefano Zampini PetscInt total_counts,nodes_touched,where_values=1,vertex_size; 4603534831adSStefano Zampini PetscMPIInt adapt_interface=0,adapt_interface_reduced=0,NEUMANNCNT=0; 4604da1bb401SStefano Zampini PetscBool same_set; 4605a0ba757dSStefano Zampini MPI_Comm interface_comm=((PetscObject)pc)->comm; 46063b03a366Sstefano_zampini PetscBool use_faces=PETSC_FALSE,use_edges=PETSC_FALSE; 46073b03a366Sstefano_zampini const PetscInt *neumann_nodes; 46083b03a366Sstefano_zampini const PetscInt *dirichlet_nodes; 4609a81d60d8SStefano Zampini IS used_IS,*custom_ISForDofs; 4610da1bb401SStefano Zampini PetscScalar *array; 4611da1bb401SStefano Zampini PetscScalar *array2; 4612da1bb401SStefano Zampini PetscViewer viewer=pcbddc->dbg_viewer; 46130c7d97c5SJed Brown 46140c7d97c5SJed Brown PetscFunctionBegin; 4615da1bb401SStefano Zampini /* Setup local adjacency 
graph */ 4616da1bb401SStefano Zampini mat_graph->nvtxs=pcis->n; 4617534831adSStefano Zampini if (!mat_graph->xadj) { NEUMANNCNT = 1; } 4618da1bb401SStefano Zampini ierr = PCBDDCSetupLocalAdjacencyGraph(pc);CHKERRQ(ierr); 4619a0ba757dSStefano Zampini i = mat_graph->nvtxs; 4620a0ba757dSStefano Zampini ierr = PetscMalloc4(i,PetscInt,&mat_graph->where,i,PetscInt,&mat_graph->count,i+1,PetscInt,&mat_graph->cptr,i,PetscInt,&mat_graph->queue);CHKERRQ(ierr); 46213972b0daSStefano Zampini ierr = PetscMalloc2(i,PetscInt,&mat_graph->which_dof,i,PetscBool,&mat_graph->touched);CHKERRQ(ierr); 4622a0ba757dSStefano Zampini ierr = PetscMemzero(mat_graph->where,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr); 4623a0ba757dSStefano Zampini ierr = PetscMemzero(mat_graph->count,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr); 4624a0ba757dSStefano Zampini ierr = PetscMemzero(mat_graph->which_dof,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr); 4625a0ba757dSStefano Zampini ierr = PetscMemzero(mat_graph->queue,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr); 46263828260eSStefano Zampini ierr = PetscMemzero(mat_graph->cptr,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr); 4627a0ba757dSStefano Zampini 4628a81d60d8SStefano Zampini /* Setting dofs splitting in mat_graph->which_dof 4629a81d60d8SStefano Zampini Get information about dofs' splitting if provided by the user 4630a81d60d8SStefano Zampini Otherwise it assumes a constant block size */ 4631a81d60d8SStefano Zampini vertex_size=0; 4632a81d60d8SStefano Zampini if (!pcbddc->n_ISForDofs) { 4633a81d60d8SStefano Zampini ierr = MatGetBlockSize(matis->A,&bs);CHKERRQ(ierr); 4634a81d60d8SStefano Zampini ierr = PetscMalloc(bs*sizeof(IS),&custom_ISForDofs);CHKERRQ(ierr); 4635a81d60d8SStefano Zampini for (i=0;i<bs;i++) { 4636a81d60d8SStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,pcis->n/bs,i,bs,&custom_ISForDofs[i]);CHKERRQ(ierr); 4637a81d60d8SStefano Zampini } 4638a81d60d8SStefano Zampini ierr = 
PCBDDCSetDofsSplitting(pc,bs,custom_ISForDofs);CHKERRQ(ierr); 4639a81d60d8SStefano Zampini vertex_size=1; 4640a81d60d8SStefano Zampini /* remove my references to IS objects */ 4641a81d60d8SStefano Zampini for (i=0;i<bs;i++) { 4642a81d60d8SStefano Zampini ierr = ISDestroy(&custom_ISForDofs[i]);CHKERRQ(ierr); 4643a81d60d8SStefano Zampini } 4644a81d60d8SStefano Zampini ierr = PetscFree(custom_ISForDofs);CHKERRQ(ierr); 4645a81d60d8SStefano Zampini } 46469c0446d6SStefano Zampini for (i=0;i<pcbddc->n_ISForDofs;i++) { 4647a81d60d8SStefano Zampini ierr = ISGetSize(pcbddc->ISForDofs[i],&k);CHKERRQ(ierr); 46489c0446d6SStefano Zampini ierr = ISGetIndices(pcbddc->ISForDofs[i],(const PetscInt**)&is_indices);CHKERRQ(ierr); 4649a81d60d8SStefano Zampini for (j=0;j<k;j++) { 46509c0446d6SStefano Zampini mat_graph->which_dof[is_indices[j]]=i; 46519c0446d6SStefano Zampini } 46529c0446d6SStefano Zampini ierr = ISRestoreIndices(pcbddc->ISForDofs[i],(const PetscInt**)&is_indices);CHKERRQ(ierr); 46539c0446d6SStefano Zampini } 4654a81d60d8SStefano Zampini /* use mat block size as vertex size if it has not yet set */ 4655a81d60d8SStefano Zampini if (!vertex_size) { 46563b03a366Sstefano_zampini ierr = MatGetBlockSize(matis->A,&vertex_size);CHKERRQ(ierr); 46570c7d97c5SJed Brown } 4658a81d60d8SStefano Zampini 46593b03a366Sstefano_zampini /* count number of neigh per node */ 46600c7d97c5SJed Brown total_counts=0; 46613b03a366Sstefano_zampini for (i=1;i<pcis->n_neigh;i++){ 46620c7d97c5SJed Brown s=pcis->n_shared[i]; 46630c7d97c5SJed Brown total_counts+=s; 466453cdbc3dSStefano Zampini for (j=0;j<s;j++){ 46650c7d97c5SJed Brown mat_graph->count[pcis->shared[i][j]] += 1; 46660c7d97c5SJed Brown } 46670c7d97c5SJed Brown } 4668534831adSStefano Zampini /* Take into account Neumann data -> it increments number of sharing subdomains for nodes lying on the interface */ 466936e030ebSStefano Zampini ierr = PCBDDCGetNeumannBoundaries(pc,&used_IS);CHKERRQ(ierr); 4670da1bb401SStefano Zampini ierr = 
VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr); 4671da1bb401SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 467236e030ebSStefano Zampini if (used_IS) { 467336e030ebSStefano Zampini ierr = ISGetSize(used_IS,&neumann_bsize);CHKERRQ(ierr); 467436e030ebSStefano Zampini ierr = ISGetIndices(used_IS,&neumann_nodes);CHKERRQ(ierr); 467553cdbc3dSStefano Zampini for (i=0;i<neumann_bsize;i++){ 467653cdbc3dSStefano Zampini iindex = neumann_nodes[i]; 4677534831adSStefano Zampini if (mat_graph->count[iindex] > NEUMANNCNT && array[iindex]==0.0){ 467853cdbc3dSStefano Zampini mat_graph->count[iindex]+=1; 46790c7d97c5SJed Brown total_counts++; 4680da1bb401SStefano Zampini array[iindex]=array[iindex]+1.0; 4681da1bb401SStefano Zampini } else if (array[iindex]>0.0) { 4682da1bb401SStefano Zampini SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"Error for neumann nodes provided to BDDC! They must be uniquely listed! Found duplicate node %d\n",iindex); 46830c7d97c5SJed Brown } 46840c7d97c5SJed Brown } 46850c7d97c5SJed Brown } 4686da1bb401SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 4687da1bb401SStefano Zampini /* allocate space for storing the set of neighbours for each node */ 4688da1bb401SStefano Zampini ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt*),&mat_graph->neighbours_set);CHKERRQ(ierr); 4689da1bb401SStefano Zampini if (mat_graph->nvtxs) { ierr = PetscMalloc(total_counts*sizeof(PetscInt),&mat_graph->neighbours_set[0]);CHKERRQ(ierr); } 4690da1bb401SStefano Zampini for (i=1;i<mat_graph->nvtxs;i++) mat_graph->neighbours_set[i]=mat_graph->neighbours_set[i-1]+mat_graph->count[i-1]; 4691a0ba757dSStefano Zampini ierr = PetscMemzero(mat_graph->count,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr); 46923b03a366Sstefano_zampini for (i=1;i<pcis->n_neigh;i++){ 46930c7d97c5SJed Brown s=pcis->n_shared[i]; 46940c7d97c5SJed Brown for (j=0;j<s;j++) { 46950c7d97c5SJed Brown k=pcis->shared[i][j]; 4696da1bb401SStefano Zampini 
mat_graph->neighbours_set[k][mat_graph->count[k]] = pcis->neigh[i]; 46970c7d97c5SJed Brown mat_graph->count[k]+=1; 46980c7d97c5SJed Brown } 46990c7d97c5SJed Brown } 4700da1bb401SStefano Zampini /* Check consistency of Neumann nodes */ 4701da1bb401SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 4702da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 4703da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 4704da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 4705da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 4706da1bb401SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 47073b03a366Sstefano_zampini /* set -1 fake neighbour to mimic Neumann boundary */ 470836e030ebSStefano Zampini if (used_IS) { 470953cdbc3dSStefano Zampini for (i=0;i<neumann_bsize;i++){ 471053cdbc3dSStefano Zampini iindex = neumann_nodes[i]; 4711534831adSStefano Zampini if (mat_graph->count[iindex] > NEUMANNCNT){ 4712da1bb401SStefano Zampini if (mat_graph->count[iindex]+1 != (PetscInt)array[iindex]) { 4713da1bb401SStefano Zampini SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_USER,"Neumann nodes provided to BDDC must be consistent among neighbours!\nNode %d: number of sharing subdomains %d != number of subdomains for which it is a neumann node %d\n",iindex,mat_graph->count[iindex]+1,(PetscInt)array[iindex]); 4714da1bb401SStefano Zampini } 4715da1bb401SStefano Zampini mat_graph->neighbours_set[iindex][mat_graph->count[iindex]] = -1; 471653cdbc3dSStefano Zampini mat_graph->count[iindex]+=1; 47170c7d97c5SJed Brown } 47180c7d97c5SJed Brown } 471936e030ebSStefano Zampini ierr = ISRestoreIndices(used_IS,&neumann_nodes);CHKERRQ(ierr); 
47200c7d97c5SJed Brown } 4721da1bb401SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 4722da1bb401SStefano Zampini /* sort set of sharing subdomains */ 4723da1bb401SStefano Zampini for (i=0;i<mat_graph->nvtxs;i++) { ierr = PetscSortInt(mat_graph->count[i],mat_graph->neighbours_set[i]);CHKERRQ(ierr); } 47243b03a366Sstefano_zampini /* remove interior nodes and dirichlet boundary nodes from the next search into the graph */ 4725da1bb401SStefano Zampini for (i=0;i<mat_graph->nvtxs;i++){mat_graph->touched[i]=PETSC_FALSE;} 4726da1bb401SStefano Zampini nodes_touched=0; 472736e030ebSStefano Zampini ierr = PCBDDCGetDirichletBoundaries(pc,&used_IS);CHKERRQ(ierr); 4728da1bb401SStefano Zampini ierr = VecSet(pcis->vec2_N,0.0);CHKERRQ(ierr); 4729da1bb401SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 4730da1bb401SStefano Zampini ierr = VecGetArray(pcis->vec2_N,&array2);CHKERRQ(ierr); 4731da1bb401SStefano Zampini if (used_IS) { 4732da1bb401SStefano Zampini ierr = ISGetSize(used_IS,&dirichlet_bsize);CHKERRQ(ierr); 4733da1bb401SStefano Zampini if (dirichlet_bsize && matis->pure_neumann) { 4734da1bb401SStefano Zampini SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"Dirichlet boundaries are intended to be used with matrices with zeroed rows!\n"); 4735da1bb401SStefano Zampini } 4736da1bb401SStefano Zampini ierr = ISGetIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr); 4737da1bb401SStefano Zampini for (i=0;i<dirichlet_bsize;i++){ 4738da1bb401SStefano Zampini iindex=dirichlet_nodes[i]; 4739da1bb401SStefano Zampini if (mat_graph->count[iindex] && !mat_graph->touched[iindex]) { 4740da1bb401SStefano Zampini if (array[iindex]>0.0) { 4741da1bb401SStefano Zampini SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"BDDC cannot have nodes which are marked as Neumann and Dirichlet at the same time! 
Wrong node %d\n",iindex); 4742da1bb401SStefano Zampini } 4743da1bb401SStefano Zampini mat_graph->touched[iindex]=PETSC_TRUE; 4744da1bb401SStefano Zampini mat_graph->where[iindex]=0; 4745da1bb401SStefano Zampini nodes_touched++; 4746da1bb401SStefano Zampini array2[iindex]=array2[iindex]+1.0; 4747da1bb401SStefano Zampini } 4748da1bb401SStefano Zampini } 4749da1bb401SStefano Zampini ierr = ISRestoreIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr); 4750da1bb401SStefano Zampini } 4751da1bb401SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 4752da1bb401SStefano Zampini ierr = VecRestoreArray(pcis->vec2_N,&array2);CHKERRQ(ierr); 4753da1bb401SStefano Zampini /* Check consistency of Dirichlet nodes */ 4754da1bb401SStefano Zampini ierr = VecSet(pcis->vec1_N,1.0);CHKERRQ(ierr); 4755da1bb401SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 4756da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 4757da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 4758da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 4759da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 4760da1bb401SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 4761da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec2_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 4762da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec2_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 4763da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 4764da1bb401SStefano Zampini ierr = VecScatterEnd 
(matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 4765da1bb401SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 4766da1bb401SStefano Zampini ierr = VecGetArray(pcis->vec2_N,&array2);CHKERRQ(ierr); 476736e030ebSStefano Zampini if (used_IS) { 476836e030ebSStefano Zampini ierr = ISGetSize(used_IS,&dirichlet_bsize);CHKERRQ(ierr); 476936e030ebSStefano Zampini ierr = ISGetIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr); 47703b03a366Sstefano_zampini for (i=0;i<dirichlet_bsize;i++){ 4771da1bb401SStefano Zampini iindex=dirichlet_nodes[i]; 4772da1bb401SStefano Zampini if (array[iindex]>1.0 && array[iindex]!=array2[iindex] ) { 4773da1bb401SStefano Zampini SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_USER,"Dirichlet nodes provided to BDDC must be consistent among neighbours!\nNode %d: number of sharing subdomains %d != number of subdomains for which it is a neumann node %d\n",iindex,(PetscInt)array[iindex],(PetscInt)array2[iindex]); 4774da1bb401SStefano Zampini } 47753b03a366Sstefano_zampini } 477636e030ebSStefano Zampini ierr = ISRestoreIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr); 47773b03a366Sstefano_zampini } 4778da1bb401SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 4779da1bb401SStefano Zampini ierr = VecRestoreArray(pcis->vec2_N,&array2);CHKERRQ(ierr); 4780da1bb401SStefano Zampini 47810c7d97c5SJed Brown for (i=0;i<mat_graph->nvtxs;i++){ 47823b03a366Sstefano_zampini if (!mat_graph->count[i]){ /* interior nodes */ 47830c7d97c5SJed Brown mat_graph->touched[i]=PETSC_TRUE; 47840c7d97c5SJed Brown mat_graph->where[i]=0; 47850c7d97c5SJed Brown nodes_touched++; 47860c7d97c5SJed Brown } 47870c7d97c5SJed Brown } 47880c7d97c5SJed Brown mat_graph->ncmps = 0; 4789da1bb401SStefano Zampini i=0; 47900c7d97c5SJed Brown while(nodes_touched<mat_graph->nvtxs) { 4791a0ba757dSStefano Zampini /* find first untouched node in local ordering */ 47920c7d97c5SJed Brown while(mat_graph->touched[i]) i++; 
47930c7d97c5SJed Brown mat_graph->touched[i]=PETSC_TRUE; 4794a0ba757dSStefano Zampini mat_graph->where[i]=where_values; 47950c7d97c5SJed Brown nodes_touched++; 4796a0ba757dSStefano Zampini /* now find all other nodes having the same set of sharing subdomains */ 47970c7d97c5SJed Brown for (j=i+1;j<mat_graph->nvtxs;j++){ 4798a0ba757dSStefano Zampini /* check for same number of sharing subdomains and dof number */ 4799da1bb401SStefano Zampini if (!mat_graph->touched[j] && mat_graph->count[i]==mat_graph->count[j] && mat_graph->which_dof[i] == mat_graph->which_dof[j] ){ 4800a0ba757dSStefano Zampini /* check for same set of sharing subdomains */ 48010c7d97c5SJed Brown same_set=PETSC_TRUE; 48020c7d97c5SJed Brown for (k=0;k<mat_graph->count[j];k++){ 4803da1bb401SStefano Zampini if (mat_graph->neighbours_set[i][k]!=mat_graph->neighbours_set[j][k]) { 48040c7d97c5SJed Brown same_set=PETSC_FALSE; 48050c7d97c5SJed Brown } 48060c7d97c5SJed Brown } 4807a0ba757dSStefano Zampini /* I found a friend of mine */ 48080c7d97c5SJed Brown if (same_set) { 4809a0ba757dSStefano Zampini mat_graph->where[j]=where_values; 48100c7d97c5SJed Brown mat_graph->touched[j]=PETSC_TRUE; 48110c7d97c5SJed Brown nodes_touched++; 48120c7d97c5SJed Brown } 48130c7d97c5SJed Brown } 48140c7d97c5SJed Brown } 4815a0ba757dSStefano Zampini where_values++; 48160c7d97c5SJed Brown } 4817a0ba757dSStefano Zampini where_values--; if (where_values<0) where_values=0; 4818a0ba757dSStefano Zampini ierr = PetscMalloc(where_values*sizeof(PetscMPIInt),&mat_graph->where_ncmps);CHKERRQ(ierr); 4819a0ba757dSStefano Zampini /* Find connected components defined on the shared interface */ 4820a0ba757dSStefano Zampini if (where_values) { 4821a0ba757dSStefano Zampini ierr = PCBDDCFindConnectedComponents(mat_graph, where_values); 4822a0ba757dSStefano Zampini } 4823a0ba757dSStefano Zampini /* check consistency of connected components among neighbouring subdomains -> it adapt them in case it is needed */ 4824a0ba757dSStefano Zampini for 
(i=0;i<where_values;i++) { 48257cf533a6SStefano Zampini /* We are not sure that on a given subset of the local interface, 48267cf533a6SStefano Zampini two connected components will be the same among sharing subdomains */ 48273b03a366Sstefano_zampini if (mat_graph->where_ncmps[i]>1) { 4828a0ba757dSStefano Zampini adapt_interface=1; 4829a0ba757dSStefano Zampini break; 4830a0ba757dSStefano Zampini } 4831a0ba757dSStefano Zampini } 4832a0ba757dSStefano Zampini ierr = MPI_Allreduce(&adapt_interface,&adapt_interface_reduced,1,MPIU_INT,MPI_LOR,interface_comm);CHKERRQ(ierr); 4833da1bb401SStefano Zampini if (pcbddc->dbg_flag && adapt_interface_reduced) { 4834d8923723SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Adapting interface\n");CHKERRQ(ierr); 4835da1bb401SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 4836da1bb401SStefano Zampini } 4837a0ba757dSStefano Zampini if (where_values && adapt_interface_reduced) { 48380c7d97c5SJed Brown 4839a0ba757dSStefano Zampini PetscInt sum_requests=0,my_rank; 4840a0ba757dSStefano Zampini PetscInt buffer_size,start_of_recv,size_of_recv,start_of_send; 4841a0ba757dSStefano Zampini PetscInt temp_buffer_size,ins_val,global_where_counter; 4842a0ba757dSStefano Zampini PetscInt *cum_recv_counts; 4843a0ba757dSStefano Zampini PetscInt *where_to_nodes_indices; 4844a0ba757dSStefano Zampini PetscInt *petsc_buffer; 4845a0ba757dSStefano Zampini PetscMPIInt *recv_buffer; 4846a0ba757dSStefano Zampini PetscMPIInt *recv_buffer_where; 4847a0ba757dSStefano Zampini PetscMPIInt *send_buffer; 4848a0ba757dSStefano Zampini PetscMPIInt size_of_send; 4849a0ba757dSStefano Zampini PetscInt *sizes_of_sends; 4850a0ba757dSStefano Zampini MPI_Request *send_requests; 4851a0ba757dSStefano Zampini MPI_Request *recv_requests; 4852a0ba757dSStefano Zampini PetscInt *where_cc_adapt; 4853a0ba757dSStefano Zampini PetscInt **temp_buffer; 4854a0ba757dSStefano Zampini PetscInt *nodes_to_temp_buffer_indices; 4855a0ba757dSStefano Zampini PetscInt *add_to_where; 
48567cf533a6SStefano Zampini PetscInt *aux_new_xadj,*new_xadj,*new_adjncy; 48577cf533a6SStefano Zampini PetscInt *queue_in_global_numbering; 4858a0ba757dSStefano Zampini 48597cf533a6SStefano Zampini /* Retrict adjacency graph using information from connected components */ 48607cf533a6SStefano Zampini ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt),&aux_new_xadj);CHKERRQ(ierr); 48617cf533a6SStefano Zampini for (i=0;i<mat_graph->nvtxs;i++) { 48627cf533a6SStefano Zampini aux_new_xadj[i]=1; 48637cf533a6SStefano Zampini } 48647cf533a6SStefano Zampini for (i=0;i<mat_graph->ncmps;i++) { 48657cf533a6SStefano Zampini k = mat_graph->cptr[i+1]-mat_graph->cptr[i]; 48667cf533a6SStefano Zampini for (j=0;j<k;j++) { 48677cf533a6SStefano Zampini aux_new_xadj[mat_graph->queue[mat_graph->cptr[i]+j]]=k; 48687cf533a6SStefano Zampini } 48697cf533a6SStefano Zampini } 48707cf533a6SStefano Zampini j = 0; 48717cf533a6SStefano Zampini for (i=0;i<mat_graph->nvtxs;i++) { 48727cf533a6SStefano Zampini j += aux_new_xadj[i]; 48737cf533a6SStefano Zampini } 48747cf533a6SStefano Zampini ierr = PetscMalloc((mat_graph->nvtxs+1)*sizeof(PetscInt),&new_xadj);CHKERRQ(ierr); 48757cf533a6SStefano Zampini ierr = PetscMalloc(j*sizeof(PetscInt),&new_adjncy);CHKERRQ(ierr); 48767cf533a6SStefano Zampini new_xadj[0]=0; 48777cf533a6SStefano Zampini for (i=0;i<mat_graph->nvtxs;i++) { 48787cf533a6SStefano Zampini new_xadj[i+1]=new_xadj[i]+aux_new_xadj[i]; 48797cf533a6SStefano Zampini if (aux_new_xadj[i]==1) { 48807cf533a6SStefano Zampini new_adjncy[new_xadj[i]]=i; 48817cf533a6SStefano Zampini } 48827cf533a6SStefano Zampini } 4883354b9337SStefano Zampini ierr = PetscFree(aux_new_xadj);CHKERRQ(ierr); 48847cf533a6SStefano Zampini for (i=0;i<mat_graph->ncmps;i++) { 48857cf533a6SStefano Zampini k = mat_graph->cptr[i+1]-mat_graph->cptr[i]; 48867cf533a6SStefano Zampini for (j=0;j<k;j++) { 48877cf533a6SStefano Zampini ierr = 
PetscMemcpy(&new_adjncy[new_xadj[mat_graph->queue[mat_graph->cptr[i]+j]]],&mat_graph->queue[mat_graph->cptr[i]],k*sizeof(PetscInt));CHKERRQ(ierr); 48887cf533a6SStefano Zampini } 48897cf533a6SStefano Zampini } 48907cf533a6SStefano Zampini ierr = PCBDDCSetLocalAdjacencyGraph(pc,mat_graph->nvtxs,new_xadj,new_adjncy,PETSC_OWN_POINTER);CHKERRQ(ierr); 48917cf533a6SStefano Zampini /* For consistency among neughbouring procs, I need to sort (by global ordering) each connected component */ 48927cf533a6SStefano Zampini ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt),&queue_in_global_numbering);CHKERRQ(ierr); 48937cf533a6SStefano Zampini for (i=0;i<mat_graph->ncmps;i++) { 48947cf533a6SStefano Zampini k = mat_graph->cptr[i+1]-mat_graph->cptr[i]; 48957cf533a6SStefano Zampini ierr = ISLocalToGlobalMappingApply(matis->mapping,k,&mat_graph->queue[mat_graph->cptr[i]],&queue_in_global_numbering[mat_graph->cptr[i]]);CHKERRQ(ierr); 48967cf533a6SStefano Zampini ierr = PetscSortIntWithArray(k,&queue_in_global_numbering[mat_graph->cptr[i]],&mat_graph->queue[mat_graph->cptr[i]]);CHKERRQ(ierr); 48977cf533a6SStefano Zampini } 48987cf533a6SStefano Zampini /* allocate some space */ 4899a0ba757dSStefano Zampini ierr = MPI_Comm_rank(interface_comm,&my_rank);CHKERRQ(ierr); 4900a0ba757dSStefano Zampini ierr = PetscMalloc((where_values+1)*sizeof(PetscInt),&cum_recv_counts);CHKERRQ(ierr); 4901a0ba757dSStefano Zampini ierr = PetscMemzero(cum_recv_counts,(where_values+1)*sizeof(PetscInt));CHKERRQ(ierr); 4902a0ba757dSStefano Zampini ierr = PetscMalloc(where_values*sizeof(PetscInt),&where_to_nodes_indices);CHKERRQ(ierr); 4903a0ba757dSStefano Zampini /* first count how many neighbours per connected component I will receive from */ 4904a0ba757dSStefano Zampini cum_recv_counts[0]=0; 4905a0ba757dSStefano Zampini for (i=1;i<where_values+1;i++){ 4906a0ba757dSStefano Zampini j=0; 4907d8923723SStefano Zampini while(mat_graph->where[j] != i) { j++; } 4908a0ba757dSStefano Zampini 
where_to_nodes_indices[i-1]=j; 4909da1bb401SStefano Zampini if (mat_graph->neighbours_set[j][0]!=-1) { cum_recv_counts[i]=cum_recv_counts[i-1]+mat_graph->count[j]; } /* We don't want sends/recvs_to/from_self -> here I don't count myself */ 49103b03a366Sstefano_zampini else { cum_recv_counts[i]=cum_recv_counts[i-1]+mat_graph->count[j]-1; } 4911a0ba757dSStefano Zampini } 4912a0ba757dSStefano Zampini ierr = PetscMalloc(2*cum_recv_counts[where_values]*sizeof(PetscMPIInt),&recv_buffer_where);CHKERRQ(ierr); 4913a0ba757dSStefano Zampini ierr = PetscMalloc(cum_recv_counts[where_values]*sizeof(MPI_Request),&send_requests);CHKERRQ(ierr); 4914a0ba757dSStefano Zampini ierr = PetscMalloc(cum_recv_counts[where_values]*sizeof(MPI_Request),&recv_requests);CHKERRQ(ierr); 4915a0ba757dSStefano Zampini for (i=0;i<cum_recv_counts[where_values];i++) { 4916a0ba757dSStefano Zampini send_requests[i]=MPI_REQUEST_NULL; 4917a0ba757dSStefano Zampini recv_requests[i]=MPI_REQUEST_NULL; 4918a0ba757dSStefano Zampini } 4919a0ba757dSStefano Zampini /* exchange with my neighbours the number of my connected components on the shared interface */ 4920a0ba757dSStefano Zampini for (i=0;i<where_values;i++){ 4921a0ba757dSStefano Zampini j=where_to_nodes_indices[i]; 4922da1bb401SStefano Zampini k = (mat_graph->neighbours_set[j][0] == -1 ? 
1 : 0); 4923a0ba757dSStefano Zampini for (;k<mat_graph->count[j];k++){ 4924da1bb401SStefano Zampini ierr = MPI_Isend(&mat_graph->where_ncmps[i],1,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr); 4925da1bb401SStefano Zampini ierr = MPI_Irecv(&recv_buffer_where[sum_requests],1,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr); 4926a0ba757dSStefano Zampini sum_requests++; 4927a0ba757dSStefano Zampini } 4928a0ba757dSStefano Zampini } 4929a0ba757dSStefano Zampini ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 4930a0ba757dSStefano Zampini ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 4931a0ba757dSStefano Zampini /* determine the connected component I need to adapt */ 4932a0ba757dSStefano Zampini ierr = PetscMalloc(where_values*sizeof(PetscInt),&where_cc_adapt);CHKERRQ(ierr); 4933a0ba757dSStefano Zampini ierr = PetscMemzero(where_cc_adapt,where_values*sizeof(PetscInt));CHKERRQ(ierr); 4934a0ba757dSStefano Zampini for (i=0;i<where_values;i++){ 4935a0ba757dSStefano Zampini for (j=cum_recv_counts[i];j<cum_recv_counts[i+1];j++){ 49363b03a366Sstefano_zampini /* The first condition is natural (i.e someone has a different number of cc than me), the second one is just to be safe */ 49373b03a366Sstefano_zampini if ( mat_graph->where_ncmps[i]!=recv_buffer_where[j] || mat_graph->where_ncmps[i] > 1 ) { 4938a0ba757dSStefano Zampini where_cc_adapt[i]=PETSC_TRUE; 4939a0ba757dSStefano Zampini break; 4940a0ba757dSStefano Zampini } 4941a0ba757dSStefano Zampini } 4942a0ba757dSStefano Zampini } 4943d8923723SStefano Zampini buffer_size = 0; 4944d8923723SStefano Zampini for (i=0;i<where_values;i++) { 4945d8923723SStefano Zampini if (where_cc_adapt[i]) { 4946d8923723SStefano Zampini for (j=i;j<mat_graph->ncmps;j++) { 4947d8923723SStefano 
Zampini if (mat_graph->where[mat_graph->queue[mat_graph->cptr[j]]] == i+1) { /* WARNING -> where values goes from 1 to where_values included */ 4948d8923723SStefano Zampini buffer_size += 1 + mat_graph->cptr[j+1]-mat_graph->cptr[j]; 4949d8923723SStefano Zampini } 4950d8923723SStefano Zampini } 4951d8923723SStefano Zampini } 4952d8923723SStefano Zampini } 4953d8923723SStefano Zampini ierr = PetscMalloc(buffer_size*sizeof(PetscMPIInt),&send_buffer);CHKERRQ(ierr); 4954a0ba757dSStefano Zampini /* now get from neighbours their ccs (in global numbering) and adapt them (in case it is needed) */ 4955a0ba757dSStefano Zampini /* first determine how much data to send (size of each queue plus the global indices) and communicate it to neighbours */ 4956a0ba757dSStefano Zampini ierr = PetscMalloc(where_values*sizeof(PetscInt),&sizes_of_sends);CHKERRQ(ierr); 4957a0ba757dSStefano Zampini ierr = PetscMemzero(sizes_of_sends,where_values*sizeof(PetscInt));CHKERRQ(ierr); 4958a0ba757dSStefano Zampini sum_requests=0; 4959a0ba757dSStefano Zampini start_of_send=0; 4960a0ba757dSStefano Zampini start_of_recv=cum_recv_counts[where_values]; 4961a0ba757dSStefano Zampini for (i=0;i<where_values;i++) { 4962a0ba757dSStefano Zampini if (where_cc_adapt[i]) { 4963a0ba757dSStefano Zampini size_of_send=0; 4964a0ba757dSStefano Zampini for (j=i;j<mat_graph->ncmps;j++) { 4965a0ba757dSStefano Zampini if (mat_graph->where[mat_graph->queue[mat_graph->cptr[j]]] == i+1) { /* WARNING -> where values goes from 1 to where_values included */ 4966a0ba757dSStefano Zampini send_buffer[start_of_send+size_of_send]=mat_graph->cptr[j+1]-mat_graph->cptr[j]; 4967a0ba757dSStefano Zampini size_of_send+=1; 4968a0ba757dSStefano Zampini for (k=0;k<mat_graph->cptr[j+1]-mat_graph->cptr[j];k++) { 4969a0ba757dSStefano Zampini send_buffer[start_of_send+size_of_send+k]=queue_in_global_numbering[mat_graph->cptr[j]+k]; 4970a0ba757dSStefano Zampini } 4971a0ba757dSStefano Zampini 
size_of_send=size_of_send+mat_graph->cptr[j+1]-mat_graph->cptr[j]; 4972a0ba757dSStefano Zampini } 4973a0ba757dSStefano Zampini } 4974a0ba757dSStefano Zampini j = where_to_nodes_indices[i]; 4975da1bb401SStefano Zampini k = (mat_graph->neighbours_set[j][0] == -1 ? 1 : 0); 497611d8f4c2SStefano Zampini sizes_of_sends[i]=size_of_send; 4977a0ba757dSStefano Zampini for (;k<mat_graph->count[j];k++){ 497811d8f4c2SStefano Zampini ierr = MPI_Isend(&sizes_of_sends[i],1,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr); 4979da1bb401SStefano Zampini ierr = MPI_Irecv(&recv_buffer_where[sum_requests+start_of_recv],1,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr); 4980a0ba757dSStefano Zampini sum_requests++; 4981a0ba757dSStefano Zampini } 4982a0ba757dSStefano Zampini start_of_send+=size_of_send; 4983a0ba757dSStefano Zampini } 4984a0ba757dSStefano Zampini } 4985a0ba757dSStefano Zampini ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 4986a0ba757dSStefano Zampini ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 4987a0ba757dSStefano Zampini buffer_size=0; 4988a0ba757dSStefano Zampini for (k=0;k<sum_requests;k++) { buffer_size+=recv_buffer_where[start_of_recv+k]; } 4989a0ba757dSStefano Zampini ierr = PetscMalloc(buffer_size*sizeof(PetscMPIInt),&recv_buffer);CHKERRQ(ierr); 4990a0ba757dSStefano Zampini /* now exchange the data */ 4991a0ba757dSStefano Zampini start_of_recv=0; 4992a0ba757dSStefano Zampini start_of_send=0; 4993a0ba757dSStefano Zampini sum_requests=0; 4994a0ba757dSStefano Zampini for (i=0;i<where_values;i++) { 4995a0ba757dSStefano Zampini if (where_cc_adapt[i]) { 4996a0ba757dSStefano Zampini size_of_send = sizes_of_sends[i]; 4997a0ba757dSStefano Zampini j = where_to_nodes_indices[i]; 4998da1bb401SStefano Zampini k = 
(mat_graph->neighbours_set[j][0] == -1 ? 1 : 0); 4999a0ba757dSStefano Zampini for (;k<mat_graph->count[j];k++){ 5000da1bb401SStefano Zampini ierr = MPI_Isend(&send_buffer[start_of_send],size_of_send,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr); 5001a0ba757dSStefano Zampini size_of_recv=recv_buffer_where[cum_recv_counts[where_values]+sum_requests]; 5002da1bb401SStefano Zampini ierr = MPI_Irecv(&recv_buffer[start_of_recv],size_of_recv,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr); 5003a0ba757dSStefano Zampini start_of_recv+=size_of_recv; 5004a0ba757dSStefano Zampini sum_requests++; 5005a0ba757dSStefano Zampini } 5006a0ba757dSStefano Zampini start_of_send+=size_of_send; 5007a0ba757dSStefano Zampini } 5008a0ba757dSStefano Zampini } 5009a0ba757dSStefano Zampini ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 5010a0ba757dSStefano Zampini ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 5011a0ba757dSStefano Zampini ierr = PetscMalloc(buffer_size*sizeof(PetscInt),&petsc_buffer);CHKERRQ(ierr); 5012a0ba757dSStefano Zampini for (k=0;k<start_of_recv;k++) { petsc_buffer[k]=(PetscInt)recv_buffer[k]; } 5013a0ba757dSStefano Zampini for (j=0;j<buffer_size;) { 5014a0ba757dSStefano Zampini ierr = ISGlobalToLocalMappingApply(matis->mapping,IS_GTOLM_MASK,petsc_buffer[j],&petsc_buffer[j+1],&petsc_buffer[j],&petsc_buffer[j+1]);CHKERRQ(ierr); 5015a0ba757dSStefano Zampini k=petsc_buffer[j]+1; 5016a0ba757dSStefano Zampini j+=k; 5017a0ba757dSStefano Zampini } 5018a0ba757dSStefano Zampini sum_requests=cum_recv_counts[where_values]; 5019a0ba757dSStefano Zampini start_of_recv=0; 5020a0ba757dSStefano Zampini ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt),&nodes_to_temp_buffer_indices);CHKERRQ(ierr); 5021a0ba757dSStefano Zampini 
global_where_counter=0; 5022a0ba757dSStefano Zampini for (i=0;i<where_values;i++){ 5023a0ba757dSStefano Zampini if (where_cc_adapt[i]){ 5024a0ba757dSStefano Zampini temp_buffer_size=0; 5025a0ba757dSStefano Zampini /* find nodes on the shared interface we need to adapt */ 5026a0ba757dSStefano Zampini for (j=0;j<mat_graph->nvtxs;j++){ 5027a0ba757dSStefano Zampini if (mat_graph->where[j]==i+1) { 5028a0ba757dSStefano Zampini nodes_to_temp_buffer_indices[j]=temp_buffer_size; 5029a0ba757dSStefano Zampini temp_buffer_size++; 5030a0ba757dSStefano Zampini } else { 5031a0ba757dSStefano Zampini nodes_to_temp_buffer_indices[j]=-1; 5032a0ba757dSStefano Zampini } 5033a0ba757dSStefano Zampini } 5034a0ba757dSStefano Zampini /* allocate some temporary space */ 5035a0ba757dSStefano Zampini ierr = PetscMalloc(temp_buffer_size*sizeof(PetscInt*),&temp_buffer);CHKERRQ(ierr); 5036a0ba757dSStefano Zampini ierr = PetscMalloc(temp_buffer_size*(cum_recv_counts[i+1]-cum_recv_counts[i])*sizeof(PetscInt),&temp_buffer[0]);CHKERRQ(ierr); 5037a0ba757dSStefano Zampini ierr = PetscMemzero(temp_buffer[0],temp_buffer_size*(cum_recv_counts[i+1]-cum_recv_counts[i])*sizeof(PetscInt));CHKERRQ(ierr); 5038a0ba757dSStefano Zampini for (j=1;j<temp_buffer_size;j++){ 5039a0ba757dSStefano Zampini temp_buffer[j]=temp_buffer[j-1]+cum_recv_counts[i+1]-cum_recv_counts[i]; 5040a0ba757dSStefano Zampini } 5041a0ba757dSStefano Zampini /* analyze contributions from neighbouring subdomains for i-th conn comp 5042a0ba757dSStefano Zampini temp buffer structure: 5043a0ba757dSStefano Zampini supposing part of the interface has dimension 5 (global nodes 0,1,2,3,4) 5044a0ba757dSStefano Zampini 3 neighs procs with structured connected components: 5045a0ba757dSStefano Zampini neigh 0: [0 1 4], [2 3]; (2 connected components) 5046a0ba757dSStefano Zampini neigh 1: [0 1], [2 3 4]; (2 connected components) 5047a0ba757dSStefano Zampini neigh 2: [0 4], [1], [2 3]; (3 connected components) 5048a0ba757dSStefano Zampini tempbuffer 
(row-oriented) should be filled as: 5049a0ba757dSStefano Zampini [ 0, 0, 0; 5050a0ba757dSStefano Zampini 0, 0, 1; 5051a0ba757dSStefano Zampini 1, 1, 2; 5052a0ba757dSStefano Zampini 1, 1, 2; 5053a0ba757dSStefano Zampini 0, 1, 0; ]; 5054a0ba757dSStefano Zampini This way we can simply recover the resulting structure account for possible intersections of ccs among neighs. 5055a0ba757dSStefano Zampini The mat_graph->where array will be modified to reproduce the following 4 connected components [0], [1], [2 3], [4]; 5056a0ba757dSStefano Zampini */ 5057a0ba757dSStefano Zampini for (j=0;j<cum_recv_counts[i+1]-cum_recv_counts[i];j++) { 5058a0ba757dSStefano Zampini ins_val=0; 5059a0ba757dSStefano Zampini size_of_recv=recv_buffer_where[sum_requests]; /* total size of recv from neighs */ 5060a0ba757dSStefano Zampini for (buffer_size=0;buffer_size<size_of_recv;) { /* loop until all data from neighs has been taken into account */ 5061a0ba757dSStefano Zampini for (k=1;k<petsc_buffer[buffer_size+start_of_recv]+1;k++) { /* filling properly temp_buffer using data from a single recv */ 5062a0ba757dSStefano Zampini temp_buffer[ nodes_to_temp_buffer_indices[ petsc_buffer[ start_of_recv+buffer_size+k ] ] ][j]=ins_val; 5063a0ba757dSStefano Zampini } 5064a0ba757dSStefano Zampini buffer_size+=k; 5065a0ba757dSStefano Zampini ins_val++; 5066a0ba757dSStefano Zampini } 5067a0ba757dSStefano Zampini start_of_recv+=size_of_recv; 5068a0ba757dSStefano Zampini sum_requests++; 5069a0ba757dSStefano Zampini } 5070a0ba757dSStefano Zampini ierr = PetscMalloc(temp_buffer_size*sizeof(PetscInt),&add_to_where);CHKERRQ(ierr); 5071a0ba757dSStefano Zampini ierr = PetscMemzero(add_to_where,temp_buffer_size*sizeof(PetscInt));CHKERRQ(ierr); 5072a0ba757dSStefano Zampini for (j=0;j<temp_buffer_size;j++){ 5073a0ba757dSStefano Zampini if (!add_to_where[j]){ /* found a new cc */ 5074a0ba757dSStefano Zampini global_where_counter++; 5075a0ba757dSStefano Zampini add_to_where[j]=global_where_counter; 5076a0ba757dSStefano 
Zampini for (k=j+1;k<temp_buffer_size;k++){ /* check for other nodes in new cc */ 5077a0ba757dSStefano Zampini same_set=PETSC_TRUE; 5078a0ba757dSStefano Zampini for (s=0;s<cum_recv_counts[i+1]-cum_recv_counts[i];s++){ 5079a0ba757dSStefano Zampini if (temp_buffer[j][s]!=temp_buffer[k][s]) { 5080a0ba757dSStefano Zampini same_set=PETSC_FALSE; 5081a0ba757dSStefano Zampini break; 5082a0ba757dSStefano Zampini } 5083a0ba757dSStefano Zampini } 50842e8d2280SStefano Zampini if (same_set) { add_to_where[k]=global_where_counter; } 5085a0ba757dSStefano Zampini } 5086a0ba757dSStefano Zampini } 5087a0ba757dSStefano Zampini } 5088a0ba757dSStefano Zampini /* insert new data in where array */ 5089a0ba757dSStefano Zampini temp_buffer_size=0; 5090a0ba757dSStefano Zampini for (j=0;j<mat_graph->nvtxs;j++){ 5091a0ba757dSStefano Zampini if (mat_graph->where[j]==i+1) { 5092a0ba757dSStefano Zampini mat_graph->where[j]=where_values+add_to_where[temp_buffer_size]; 5093a0ba757dSStefano Zampini temp_buffer_size++; 5094a0ba757dSStefano Zampini } 5095a0ba757dSStefano Zampini } 5096a0ba757dSStefano Zampini ierr = PetscFree(temp_buffer[0]);CHKERRQ(ierr); 5097a0ba757dSStefano Zampini ierr = PetscFree(temp_buffer);CHKERRQ(ierr); 5098a0ba757dSStefano Zampini ierr = PetscFree(add_to_where);CHKERRQ(ierr); 5099a0ba757dSStefano Zampini } 5100a0ba757dSStefano Zampini } 5101a0ba757dSStefano Zampini ierr = PetscFree(nodes_to_temp_buffer_indices);CHKERRQ(ierr); 5102a0ba757dSStefano Zampini ierr = PetscFree(sizes_of_sends);CHKERRQ(ierr); 5103a0ba757dSStefano Zampini ierr = PetscFree(send_requests);CHKERRQ(ierr); 5104a0ba757dSStefano Zampini ierr = PetscFree(recv_requests);CHKERRQ(ierr); 5105a0ba757dSStefano Zampini ierr = PetscFree(petsc_buffer);CHKERRQ(ierr); 5106a0ba757dSStefano Zampini ierr = PetscFree(recv_buffer);CHKERRQ(ierr); 5107a0ba757dSStefano Zampini ierr = PetscFree(recv_buffer_where);CHKERRQ(ierr); 5108a0ba757dSStefano Zampini ierr = PetscFree(send_buffer);CHKERRQ(ierr); 5109a0ba757dSStefano 
Zampini ierr = PetscFree(cum_recv_counts);CHKERRQ(ierr); 5110a0ba757dSStefano Zampini ierr = PetscFree(where_to_nodes_indices);CHKERRQ(ierr); 511123d4d1a5SStefano Zampini ierr = PetscFree(where_cc_adapt);CHKERRQ(ierr); 5112a0ba757dSStefano Zampini /* We are ready to evaluate consistent connected components on each part of the shared interface */ 5113a0ba757dSStefano Zampini if (global_where_counter) { 5114a0ba757dSStefano Zampini for (i=0;i<mat_graph->nvtxs;i++){ mat_graph->touched[i]=PETSC_FALSE; } 5115a0ba757dSStefano Zampini global_where_counter=0; 5116a0ba757dSStefano Zampini for (i=0;i<mat_graph->nvtxs;i++){ 5117a0ba757dSStefano Zampini if (mat_graph->where[i] && !mat_graph->touched[i]) { 5118a0ba757dSStefano Zampini global_where_counter++; 5119a0ba757dSStefano Zampini for (j=i+1;j<mat_graph->nvtxs;j++){ 5120a0ba757dSStefano Zampini if (!mat_graph->touched[j] && mat_graph->where[j]==mat_graph->where[i]) { 5121a0ba757dSStefano Zampini mat_graph->where[j]=global_where_counter; 5122a0ba757dSStefano Zampini mat_graph->touched[j]=PETSC_TRUE; 5123a0ba757dSStefano Zampini } 5124a0ba757dSStefano Zampini } 5125a0ba757dSStefano Zampini mat_graph->where[i]=global_where_counter; 5126a0ba757dSStefano Zampini mat_graph->touched[i]=PETSC_TRUE; 5127a0ba757dSStefano Zampini } 5128a0ba757dSStefano Zampini } 5129a0ba757dSStefano Zampini where_values=global_where_counter; 5130a0ba757dSStefano Zampini } 5131a0ba757dSStefano Zampini if (global_where_counter) { 5132a0ba757dSStefano Zampini ierr = PetscMemzero(mat_graph->cptr,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr); 5133a0ba757dSStefano Zampini ierr = PetscMemzero(mat_graph->queue,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr); 5134a0ba757dSStefano Zampini ierr = PetscFree(mat_graph->where_ncmps);CHKERRQ(ierr); 5135a0ba757dSStefano Zampini ierr = PetscMalloc(where_values*sizeof(PetscMPIInt),&mat_graph->where_ncmps);CHKERRQ(ierr); 5136a0ba757dSStefano Zampini ierr = PCBDDCFindConnectedComponents(mat_graph, 
where_values); 5137a0ba757dSStefano Zampini } 51387cf533a6SStefano Zampini ierr = PetscFree(queue_in_global_numbering);CHKERRQ(ierr); 51393b03a366Sstefano_zampini } /* Finished adapting interface */ 51400c7d97c5SJed Brown PetscInt nfc=0; 51410c7d97c5SJed Brown PetscInt nec=0; 51420c7d97c5SJed Brown PetscInt nvc=0; 51433b03a366Sstefano_zampini PetscBool twodim_flag=PETSC_FALSE; 51440c7d97c5SJed Brown for (i=0; i<mat_graph->ncmps; i++) { 51453b03a366Sstefano_zampini if ( mat_graph->cptr[i+1]-mat_graph->cptr[i] > vertex_size ){ 5146534831adSStefano Zampini if (mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]==1){ /* 1 neigh Neumann fake included */ 51470c7d97c5SJed Brown nfc++; 51483b03a366Sstefano_zampini } else { /* note that nec will be zero in 2d */ 51493b03a366Sstefano_zampini nec++; 51503b03a366Sstefano_zampini } 51510c7d97c5SJed Brown } else { 51523b03a366Sstefano_zampini nvc+=mat_graph->cptr[i+1]-mat_graph->cptr[i]; 51533b03a366Sstefano_zampini } 51543b03a366Sstefano_zampini } 51553b03a366Sstefano_zampini if (!nec) { /* we are in a 2d case -> no faces, only edges */ 51563b03a366Sstefano_zampini nec = nfc; 51573b03a366Sstefano_zampini nfc = 0; 51583b03a366Sstefano_zampini twodim_flag = PETSC_TRUE; 51593b03a366Sstefano_zampini } 51603972b0daSStefano Zampini /* allocate IS arrays for faces, edges. Vertices need a single index set. 
*/ 51613972b0daSStefano Zampini k=0; 51623972b0daSStefano Zampini for (i=0; i<mat_graph->ncmps; i++) { 51633972b0daSStefano Zampini j=mat_graph->cptr[i+1]-mat_graph->cptr[i]; 51643972b0daSStefano Zampini if ( j > k) { 51653972b0daSStefano Zampini k=j; 51663972b0daSStefano Zampini } 5167ba1573a8SStefano Zampini if (j<=vertex_size) { 5168ba1573a8SStefano Zampini k+=vertex_size; 5169ba1573a8SStefano Zampini } 51703972b0daSStefano Zampini } 51713972b0daSStefano Zampini ierr = PetscMalloc(k*sizeof(PetscInt),&auxis);CHKERRQ(ierr); 51723b03a366Sstefano_zampini if (!pcbddc->vertices_flag && !pcbddc->edges_flag) { 51733b03a366Sstefano_zampini ierr = PetscMalloc(nfc*sizeof(IS),&pcbddc->ISForFaces);CHKERRQ(ierr); 51743b03a366Sstefano_zampini use_faces=PETSC_TRUE; 51753b03a366Sstefano_zampini } 51763b03a366Sstefano_zampini if (!pcbddc->vertices_flag && !pcbddc->faces_flag) { 51773b03a366Sstefano_zampini ierr = PetscMalloc(nec*sizeof(IS),&pcbddc->ISForEdges);CHKERRQ(ierr); 51783b03a366Sstefano_zampini use_edges=PETSC_TRUE; 51793b03a366Sstefano_zampini } 51803b03a366Sstefano_zampini nfc=0; 51813b03a366Sstefano_zampini nec=0; 51823b03a366Sstefano_zampini for (i=0; i<mat_graph->ncmps; i++) { 51833b03a366Sstefano_zampini if ( mat_graph->cptr[i+1]-mat_graph->cptr[i] > vertex_size ){ 51843b03a366Sstefano_zampini for (j=0;j<mat_graph->cptr[i+1]-mat_graph->cptr[i];j++) { 51853972b0daSStefano Zampini auxis[j]=mat_graph->queue[mat_graph->cptr[i]+j]; 51863b03a366Sstefano_zampini } 51873b03a366Sstefano_zampini if (mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]==1){ 51883b03a366Sstefano_zampini if (twodim_flag) { 51893b03a366Sstefano_zampini if (use_edges) { 51903972b0daSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForEdges[nec]);CHKERRQ(ierr); 51913b03a366Sstefano_zampini nec++; 51923b03a366Sstefano_zampini } 51933b03a366Sstefano_zampini } else { 51943b03a366Sstefano_zampini if (use_faces) { 51953972b0daSStefano Zampini ierr = 
ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForFaces[nfc]);CHKERRQ(ierr); 51963b03a366Sstefano_zampini nfc++; 51973b03a366Sstefano_zampini } 51983b03a366Sstefano_zampini } 51993b03a366Sstefano_zampini } else { 52003b03a366Sstefano_zampini if (use_edges) { 52013972b0daSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForEdges[nec]);CHKERRQ(ierr); 52020c7d97c5SJed Brown nec++; 52030c7d97c5SJed Brown } 52040c7d97c5SJed Brown } 52050c7d97c5SJed Brown } 52063b03a366Sstefano_zampini } 52073b03a366Sstefano_zampini pcbddc->n_ISForFaces=nfc; 52083b03a366Sstefano_zampini pcbddc->n_ISForEdges=nec; 52093b03a366Sstefano_zampini nvc=0; 52100c7d97c5SJed Brown if ( !pcbddc->constraints_flag ) { 52113b03a366Sstefano_zampini for (i=0; i<mat_graph->ncmps; i++) { 52123b03a366Sstefano_zampini if ( mat_graph->cptr[i+1]-mat_graph->cptr[i] <= vertex_size ){ 52133b03a366Sstefano_zampini for ( j=mat_graph->cptr[i];j<mat_graph->cptr[i+1];j++) { 52143972b0daSStefano Zampini auxis[nvc]=mat_graph->queue[j]; 52150c7d97c5SJed Brown nvc++; 52160c7d97c5SJed Brown } 52170c7d97c5SJed Brown } 52180c7d97c5SJed Brown } 52190c7d97c5SJed Brown } 5220a0ba757dSStefano Zampini /* sort vertex set (by local ordering) */ 52213972b0daSStefano Zampini ierr = PetscSortInt(nvc,auxis);CHKERRQ(ierr); 52223972b0daSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,nvc,auxis,PETSC_COPY_VALUES,&pcbddc->ISForVertices);CHKERRQ(ierr); 5223e269702eSStefano Zampini if (pcbddc->dbg_flag) { 5224d49ef151SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr); 5225d49ef151SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Details from PCBDDCManageLocalBoundaries for subdomain %04d\n",PetscGlobalRank);CHKERRQ(ierr); 5226d49ef151SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Matrix graph has %d connected components", 
mat_graph->ncmps);CHKERRQ(ierr); 52270c7d97c5SJed Brown for (i=0;i<mat_graph->ncmps;i++) { 52283b03a366Sstefano_zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\nDetails for connected component number %02d: size %04d, count %01d. Nodes follow.\n", 52293b03a366Sstefano_zampini i,mat_graph->cptr[i+1]-mat_graph->cptr[i],mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]);CHKERRQ(ierr); 5230da1bb401SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"subdomains: "); 5231da1bb401SStefano Zampini for (j=0;j<mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]; j++) { 5232da1bb401SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d ",mat_graph->neighbours_set[mat_graph->queue[mat_graph->cptr[i]]][j]); 5233da1bb401SStefano Zampini } 5234da1bb401SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n"); 52350c7d97c5SJed Brown for (j=mat_graph->cptr[i]; j<mat_graph->cptr[i+1]; j++){ 52367cf533a6SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d, ",mat_graph->queue[j]);CHKERRQ(ierr); 52370c7d97c5SJed Brown } 52380c7d97c5SJed Brown } 5239da1bb401SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n--------------------------------------------------------------\n");CHKERRQ(ierr); 52403b03a366Sstefano_zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local vertices\n",PetscGlobalRank,nvc);CHKERRQ(ierr); 52413b03a366Sstefano_zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local faces\n",PetscGlobalRank,nfc);CHKERRQ(ierr); 52423b03a366Sstefano_zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local edges\n",PetscGlobalRank,nec);CHKERRQ(ierr); 5243d49ef151SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 52440c7d97c5SJed Brown } 52453972b0daSStefano Zampini ierr = PetscFree(auxis);CHKERRQ(ierr); 52460c7d97c5SJed Brown PetscFunctionReturn(0); 52470c7d97c5SJed Brown 
} 52480c7d97c5SJed Brown 52490c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 52500c7d97c5SJed Brown 52510c7d97c5SJed Brown /* The following code has been adapted from function IsConnectedSubdomain contained 5252da1bb401SStefano Zampini in source file contig.c of METIS library (version 5.0.1) 5253da1bb401SStefano Zampini It finds connected components of each partition labeled from 1 to n_dist */ 52540c7d97c5SJed Brown 52550c7d97c5SJed Brown #undef __FUNCT__ 52560c7d97c5SJed Brown #define __FUNCT__ "PCBDDCFindConnectedComponents" 52579c0446d6SStefano Zampini static PetscErrorCode PCBDDCFindConnectedComponents(PCBDDCGraph graph, PetscInt n_dist ) 52580c7d97c5SJed Brown { 52590c7d97c5SJed Brown PetscInt i, j, k, nvtxs, first, last, nleft, ncmps,pid,cum_queue,n,ncmps_pid; 52600c7d97c5SJed Brown PetscInt *xadj, *adjncy, *where, *queue; 52610c7d97c5SJed Brown PetscInt *cptr; 52620c7d97c5SJed Brown PetscBool *touched; 52630c7d97c5SJed Brown 52640c7d97c5SJed Brown PetscFunctionBegin; 52650c7d97c5SJed Brown 52660c7d97c5SJed Brown nvtxs = graph->nvtxs; 52670c7d97c5SJed Brown xadj = graph->xadj; 52680c7d97c5SJed Brown adjncy = graph->adjncy; 52690c7d97c5SJed Brown where = graph->where; 52700c7d97c5SJed Brown touched = graph->touched; 52710c7d97c5SJed Brown queue = graph->queue; 52720c7d97c5SJed Brown cptr = graph->cptr; 52730c7d97c5SJed Brown 52742e8d2280SStefano Zampini for (i=0; i<nvtxs; i++) { 52750c7d97c5SJed Brown touched[i] = PETSC_FALSE; 52762e8d2280SStefano Zampini } 52770c7d97c5SJed Brown 52780c7d97c5SJed Brown cum_queue=0; 52790c7d97c5SJed Brown ncmps=0; 52800c7d97c5SJed Brown 52810c7d97c5SJed Brown for (n=0; n<n_dist; n++) { 5282da1bb401SStefano Zampini pid = n+1; /* partition labeled by 0 is discarded */ 52830c7d97c5SJed Brown nleft = 0; 52840c7d97c5SJed Brown for (i=0; i<nvtxs; i++) { 52850c7d97c5SJed Brown if (where[i] == pid) 52860c7d97c5SJed Brown nleft++; 52870c7d97c5SJed Brown } 52880c7d97c5SJed Brown for 
(i=0; i<nvtxs; i++) { 52890c7d97c5SJed Brown if (where[i] == pid) 52900c7d97c5SJed Brown break; 52910c7d97c5SJed Brown } 52920c7d97c5SJed Brown touched[i] = PETSC_TRUE; 52930c7d97c5SJed Brown queue[cum_queue] = i; 52940c7d97c5SJed Brown first = 0; last = 1; 52950c7d97c5SJed Brown cptr[ncmps] = cum_queue; /* This actually points to queue */ 52960c7d97c5SJed Brown ncmps_pid = 0; 52970c7d97c5SJed Brown while (first != nleft) { 52980c7d97c5SJed Brown if (first == last) { /* Find another starting vertex */ 52990c7d97c5SJed Brown cptr[++ncmps] = first+cum_queue; 53000c7d97c5SJed Brown ncmps_pid++; 53010c7d97c5SJed Brown for (i=0; i<nvtxs; i++) { 53020c7d97c5SJed Brown if (where[i] == pid && !touched[i]) 53030c7d97c5SJed Brown break; 53040c7d97c5SJed Brown } 53050c7d97c5SJed Brown queue[cum_queue+last] = i; 53060c7d97c5SJed Brown last++; 53070c7d97c5SJed Brown touched[i] = PETSC_TRUE; 53080c7d97c5SJed Brown } 53090c7d97c5SJed Brown i = queue[cum_queue+first]; 53100c7d97c5SJed Brown first++; 53110c7d97c5SJed Brown for (j=xadj[i]; j<xadj[i+1]; j++) { 53120c7d97c5SJed Brown k = adjncy[j]; 53130c7d97c5SJed Brown if (where[k] == pid && !touched[k]) { 53140c7d97c5SJed Brown queue[cum_queue+last] = k; 53150c7d97c5SJed Brown last++; 53160c7d97c5SJed Brown touched[k] = PETSC_TRUE; 53170c7d97c5SJed Brown } 53180c7d97c5SJed Brown } 53190c7d97c5SJed Brown } 53200c7d97c5SJed Brown cptr[++ncmps] = first+cum_queue; 53210c7d97c5SJed Brown ncmps_pid++; 53220c7d97c5SJed Brown cum_queue=cptr[ncmps]; 5323a0ba757dSStefano Zampini graph->where_ncmps[n] = ncmps_pid; 53240c7d97c5SJed Brown } 53250c7d97c5SJed Brown graph->ncmps = ncmps; 53260c7d97c5SJed Brown 53270c7d97c5SJed Brown PetscFunctionReturn(0); 53280c7d97c5SJed Brown } 5329