/* TODOLIST
   DofSplitting and DM attached to pc?
   Change SetNeumannBoundaries to SetNeumannBoundariesLocal and provide new SetNeumannBoundaries (same Dirichlet)
   change how to deal with the coarse problem (PCBDDCSetCoarseEnvironment):
     - simplify coarse problem structure -> PCBDDC or PCREDUNDANT, nothing else -> same comm for all levels?
     - remove coarse enums and allow use of PCBDDCGetCoarseKSP
     - remove metis dependency -> use MatPartitioning for multilevel -> Assemble serial adjacency in ManageLocalBoundaries?
   code refactoring:
     - pick up better names for static functions
   change options structure:
     - insert BDDC into MG framework?
   provide other ops? Ask to developers
   remove all unused printf
   man pages
*/

/* ----------------------------------------------------------------------------------------------------------------------------------------------
   Implementation of BDDC preconditioner based on:
   C.
Dohrmann "An approximate BDDC preconditioner", Numerical Linear Algebra with Applications Volume 14, Issue 2, pages 149-168, March 2007 2053cdbc3dSStefano Zampini ---------------------------------------------------------------------------------------------------------------------------------------------- */ 2153cdbc3dSStefano Zampini 2207475bc1SBarry Smith #include "bddc.h" /*I "petscpc.h" I*/ 233b03a366Sstefano_zampini #include <petscblaslapack.h> 240c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 250c7d97c5SJed Brown #undef __FUNCT__ 260c7d97c5SJed Brown #define __FUNCT__ "PCSetFromOptions_BDDC" 270c7d97c5SJed Brown PetscErrorCode PCSetFromOptions_BDDC(PC pc) 280c7d97c5SJed Brown { 290c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 300c7d97c5SJed Brown PetscErrorCode ierr; 310c7d97c5SJed Brown 320c7d97c5SJed Brown PetscFunctionBegin; 330c7d97c5SJed Brown ierr = PetscOptionsHead("BDDC options");CHKERRQ(ierr); 340c7d97c5SJed Brown /* Verbose debugging of main data structures */ 35e269702eSStefano Zampini ierr = PetscOptionsBool("-pc_bddc_check_all" ,"Verbose (debugging) output for PCBDDC" ,"none",pcbddc->dbg_flag ,&pcbddc->dbg_flag ,PETSC_NULL);CHKERRQ(ierr); 360c7d97c5SJed Brown /* Some customization for default primal space */ 37da1bb401SStefano Zampini ierr = PetscOptionsBool("-pc_bddc_vertices_only" ,"Use only vertices in coarse space (i.e. discard constraints)","none",pcbddc->vertices_flag ,&pcbddc->vertices_flag ,PETSC_NULL);CHKERRQ(ierr); 38da1bb401SStefano Zampini ierr = PetscOptionsBool("-pc_bddc_constraints_only","Use only constraints in coarse space (i.e. discard vertices)","none",pcbddc->constraints_flag,&pcbddc->constraints_flag,PETSC_NULL);CHKERRQ(ierr); 39da1bb401SStefano Zampini ierr = PetscOptionsBool("-pc_bddc_faces_only" ,"Use only faces among constraints of coarse space (i.e. 
discard edges)" ,"none",pcbddc->faces_flag ,&pcbddc->faces_flag ,PETSC_NULL);CHKERRQ(ierr); 40da1bb401SStefano Zampini ierr = PetscOptionsBool("-pc_bddc_edges_only" ,"Use only edges among constraints of coarse space (i.e. discard faces)" ,"none",pcbddc->edges_flag ,&pcbddc->edges_flag ,PETSC_NULL);CHKERRQ(ierr); 412fa5cd67SKarl Rupp 420c7d97c5SJed Brown /* Coarse solver context */ 436c667b0aSStefano Zampini static const char * const avail_coarse_problems[] = {"sequential","replicated","parallel","multilevel","CoarseProblemType","PC_BDDC_",0}; /* order of choiches depends on ENUM defined in bddc.h */ 440c7d97c5SJed Brown ierr = PetscOptionsEnum("-pc_bddc_coarse_problem_type","Set coarse problem type","none",avail_coarse_problems,(PetscEnum)pcbddc->coarse_problem_type,(PetscEnum*)&pcbddc->coarse_problem_type,PETSC_NULL);CHKERRQ(ierr); 452fa5cd67SKarl Rupp 460c7d97c5SJed Brown /* Two different application of BDDC to the whole set of dofs, internal and interface */ 4729622bf0SStefano Zampini ierr = PetscOptionsBool("-pc_bddc_switch_preconditioning_type","Switch between M_2 (default) and M_3 preconditioners (as defined by Dohrmann)","none",pcbddc->inexact_prec_type,&pcbddc->inexact_prec_type,PETSC_NULL);CHKERRQ(ierr); 48534831adSStefano Zampini ierr = PetscOptionsBool("-pc_bddc_use_change_of_basis","Use change of basis approach for primal space","none",pcbddc->usechangeofbasis,&pcbddc->usechangeofbasis,PETSC_NULL);CHKERRQ(ierr); 49534831adSStefano Zampini ierr = PetscOptionsBool("-pc_bddc_use_change_on_faces","Use change of basis approach for face constraints","none",pcbddc->usechangeonfaces,&pcbddc->usechangeonfaces,PETSC_NULL);CHKERRQ(ierr); 502fa5cd67SKarl Rupp 51534831adSStefano Zampini pcbddc->usechangeonfaces = pcbddc->usechangeonfaces && pcbddc->usechangeofbasis; 522fa5cd67SKarl Rupp 530c7d97c5SJed Brown ierr = PetscOptionsInt("-pc_bddc_coarsening_ratio","Set coarsening ratio used in multilevel 
coarsening","none",pcbddc->coarsening_ratio,&pcbddc->coarsening_ratio,PETSC_NULL);CHKERRQ(ierr); 544fad6a16SStefano Zampini ierr = PetscOptionsInt("-pc_bddc_max_levels","Set maximum number of levels for multilevel","none",pcbddc->max_levels,&pcbddc->max_levels,PETSC_NULL);CHKERRQ(ierr); 550c7d97c5SJed Brown ierr = PetscOptionsTail();CHKERRQ(ierr); 560c7d97c5SJed Brown PetscFunctionReturn(0); 570c7d97c5SJed Brown } 580c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 590c7d97c5SJed Brown EXTERN_C_BEGIN 600c7d97c5SJed Brown #undef __FUNCT__ 610c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetCoarseProblemType_BDDC" 6253cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetCoarseProblemType_BDDC(PC pc, CoarseProblemType CPT) 630c7d97c5SJed Brown { 640c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 650c7d97c5SJed Brown 660c7d97c5SJed Brown PetscFunctionBegin; 670c7d97c5SJed Brown pcbddc->coarse_problem_type = CPT; 680c7d97c5SJed Brown PetscFunctionReturn(0); 690c7d97c5SJed Brown } 700c7d97c5SJed Brown EXTERN_C_END 710c7d97c5SJed Brown #undef __FUNCT__ 720c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetCoarseProblemType" 7353cdbc3dSStefano Zampini /*@ 749c0446d6SStefano Zampini PCBDDCSetCoarseProblemType - Set coarse problem type in PCBDDC. 7553cdbc3dSStefano Zampini 769c0446d6SStefano Zampini Not collective 7753cdbc3dSStefano Zampini 7853cdbc3dSStefano Zampini Input Parameters: 7953cdbc3dSStefano Zampini + pc - the preconditioning context 8053cdbc3dSStefano Zampini - CoarseProblemType - pick a better name and explain what this is 8153cdbc3dSStefano Zampini 8253cdbc3dSStefano Zampini Level: intermediate 8353cdbc3dSStefano Zampini 8453cdbc3dSStefano Zampini Notes: 85da1bb401SStefano Zampini Not collective but all procs must call with same arguments. 
8653cdbc3dSStefano Zampini 8753cdbc3dSStefano Zampini .seealso: PCBDDC 8853cdbc3dSStefano Zampini @*/ 890c7d97c5SJed Brown PetscErrorCode PCBDDCSetCoarseProblemType(PC pc, CoarseProblemType CPT) 900c7d97c5SJed Brown { 910c7d97c5SJed Brown PetscErrorCode ierr; 920c7d97c5SJed Brown 930c7d97c5SJed Brown PetscFunctionBegin; 940c7d97c5SJed Brown PetscValidHeaderSpecific(pc,PC_CLASSID,1); 950c7d97c5SJed Brown ierr = PetscTryMethod(pc,"PCBDDCSetCoarseProblemType_C",(PC,CoarseProblemType),(pc,CPT));CHKERRQ(ierr); 960c7d97c5SJed Brown PetscFunctionReturn(0); 970c7d97c5SJed Brown } 980c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 990c7d97c5SJed Brown EXTERN_C_BEGIN 1000c7d97c5SJed Brown #undef __FUNCT__ 1014fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetCoarseningRatio_BDDC" 1024fad6a16SStefano Zampini static PetscErrorCode PCBDDCSetCoarseningRatio_BDDC(PC pc,PetscInt k) 1034fad6a16SStefano Zampini { 1044fad6a16SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 1054fad6a16SStefano Zampini 1064fad6a16SStefano Zampini PetscFunctionBegin; 1074fad6a16SStefano Zampini pcbddc->coarsening_ratio=k; 1084fad6a16SStefano Zampini PetscFunctionReturn(0); 1094fad6a16SStefano Zampini } 1104fad6a16SStefano Zampini EXTERN_C_END 1114fad6a16SStefano Zampini #undef __FUNCT__ 1124fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetCoarseningRatio" 1134fad6a16SStefano Zampini /*@ 1144fad6a16SStefano Zampini PCBDDCSetCoarseningRatio - Set coarsening ratio used in multilevel coarsening 1154fad6a16SStefano Zampini 1164fad6a16SStefano Zampini Logically collective on PC 1174fad6a16SStefano Zampini 1184fad6a16SStefano Zampini Input Parameters: 1194fad6a16SStefano Zampini + pc - the preconditioning context 1204fad6a16SStefano Zampini - k - coarsening ratio 1214fad6a16SStefano Zampini 1224fad6a16SStefano Zampini Approximatively k subdomains at the finer level will be aggregated into a single subdomain at the coarser level. 
1234fad6a16SStefano Zampini 1244fad6a16SStefano Zampini Level: intermediate 1254fad6a16SStefano Zampini 1264fad6a16SStefano Zampini Notes: 1274fad6a16SStefano Zampini 1284fad6a16SStefano Zampini .seealso: PCBDDC 1294fad6a16SStefano Zampini @*/ 1304fad6a16SStefano Zampini PetscErrorCode PCBDDCSetCoarseningRatio(PC pc,PetscInt k) 1314fad6a16SStefano Zampini { 1324fad6a16SStefano Zampini PetscErrorCode ierr; 1334fad6a16SStefano Zampini 1344fad6a16SStefano Zampini PetscFunctionBegin; 1354fad6a16SStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 1364fad6a16SStefano Zampini ierr = PetscTryMethod(pc,"PCBDDCSetCoarseningRatio_C",(PC,PetscInt),(pc,k));CHKERRQ(ierr); 1374fad6a16SStefano Zampini PetscFunctionReturn(0); 1384fad6a16SStefano Zampini } 1394fad6a16SStefano Zampini /* -------------------------------------------------------------------------- */ 1404fad6a16SStefano Zampini EXTERN_C_BEGIN 1414fad6a16SStefano Zampini #undef __FUNCT__ 1424fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetMaxLevels_BDDC" 1434fad6a16SStefano Zampini static PetscErrorCode PCBDDCSetMaxLevels_BDDC(PC pc,PetscInt max_levels) 1444fad6a16SStefano Zampini { 1454fad6a16SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 1464fad6a16SStefano Zampini 1474fad6a16SStefano Zampini PetscFunctionBegin; 1484fad6a16SStefano Zampini pcbddc->max_levels=max_levels; 1494fad6a16SStefano Zampini PetscFunctionReturn(0); 1504fad6a16SStefano Zampini } 1514fad6a16SStefano Zampini EXTERN_C_END 1524fad6a16SStefano Zampini #undef __FUNCT__ 1534fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetMaxLevels" 1544fad6a16SStefano Zampini /*@ 1554fad6a16SStefano Zampini PCBDDCSetMaxLevels - Sets the maximum number of levels within the multilevel approach. 
1564fad6a16SStefano Zampini 1574fad6a16SStefano Zampini Logically collective on PC 1584fad6a16SStefano Zampini 1594fad6a16SStefano Zampini Input Parameters: 1604fad6a16SStefano Zampini + pc - the preconditioning context 1614fad6a16SStefano Zampini - max_levels - the maximum number of levels 1624fad6a16SStefano Zampini 1634fad6a16SStefano Zampini Default value is 1, i.e. coarse problem will be solved inexactly with one application 1644fad6a16SStefano Zampini of PCBDDC preconditioner if the multilevel approach is requested. 1654fad6a16SStefano Zampini 1664fad6a16SStefano Zampini Level: intermediate 1674fad6a16SStefano Zampini 1684fad6a16SStefano Zampini Notes: 1694fad6a16SStefano Zampini 1704fad6a16SStefano Zampini .seealso: PCBDDC 1714fad6a16SStefano Zampini @*/ 1724fad6a16SStefano Zampini PetscErrorCode PCBDDCSetMaxLevels(PC pc,PetscInt max_levels) 1734fad6a16SStefano Zampini { 1744fad6a16SStefano Zampini PetscErrorCode ierr; 1754fad6a16SStefano Zampini 1764fad6a16SStefano Zampini PetscFunctionBegin; 1774fad6a16SStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 1784fad6a16SStefano Zampini ierr = PetscTryMethod(pc,"PCBDDCSetMaxLevels_C",(PC,PetscInt),(pc,max_levels));CHKERRQ(ierr); 1794fad6a16SStefano Zampini PetscFunctionReturn(0); 1804fad6a16SStefano Zampini } 1814fad6a16SStefano Zampini /* -------------------------------------------------------------------------- */ 1824fad6a16SStefano Zampini EXTERN_C_BEGIN 1834fad6a16SStefano Zampini #undef __FUNCT__ 1840bdf917eSStefano Zampini #define __FUNCT__ "PCBDDCSetNullSpace_BDDC" 1850bdf917eSStefano Zampini static PetscErrorCode PCBDDCSetNullSpace_BDDC(PC pc,MatNullSpace NullSpace) 1860bdf917eSStefano Zampini { 1870bdf917eSStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 1880bdf917eSStefano Zampini PetscErrorCode ierr; 1890bdf917eSStefano Zampini 1900bdf917eSStefano Zampini PetscFunctionBegin; 1910bdf917eSStefano Zampini ierr = PetscObjectReference((PetscObject)NullSpace);CHKERRQ(ierr); 1920bdf917eSStefano 
Zampini ierr = MatNullSpaceDestroy(&pcbddc->NullSpace);CHKERRQ(ierr); 1932fa5cd67SKarl Rupp 1940bdf917eSStefano Zampini pcbddc->NullSpace = NullSpace; 1950bdf917eSStefano Zampini PetscFunctionReturn(0); 1960bdf917eSStefano Zampini } 1970bdf917eSStefano Zampini EXTERN_C_END 1980bdf917eSStefano Zampini #undef __FUNCT__ 1990bdf917eSStefano Zampini #define __FUNCT__ "PCBDDCSetNullSpace" 2000bdf917eSStefano Zampini /*@ 2010bdf917eSStefano Zampini PCBDDCSetNullSpace - Set NullSpace of global operator of BDDC preconditioned mat. 2020bdf917eSStefano Zampini 2030bdf917eSStefano Zampini Logically collective on PC and MatNullSpace 2040bdf917eSStefano Zampini 2050bdf917eSStefano Zampini Input Parameters: 2060bdf917eSStefano Zampini + pc - the preconditioning context 2070bdf917eSStefano Zampini - NullSpace - Null space of the linear operator to be preconditioned. 2080bdf917eSStefano Zampini 2090bdf917eSStefano Zampini Level: intermediate 2100bdf917eSStefano Zampini 2110bdf917eSStefano Zampini Notes: 2120bdf917eSStefano Zampini 2130bdf917eSStefano Zampini .seealso: PCBDDC 2140bdf917eSStefano Zampini @*/ 2150bdf917eSStefano Zampini PetscErrorCode PCBDDCSetNullSpace(PC pc,MatNullSpace NullSpace) 2160bdf917eSStefano Zampini { 2170bdf917eSStefano Zampini PetscErrorCode ierr; 2180bdf917eSStefano Zampini 2190bdf917eSStefano Zampini PetscFunctionBegin; 2200bdf917eSStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 2210bdf917eSStefano Zampini ierr = PetscTryMethod(pc,"PCBDDCSetNullSpace_C",(PC,MatNullSpace),(pc,NullSpace));CHKERRQ(ierr); 2220bdf917eSStefano Zampini PetscFunctionReturn(0); 2230bdf917eSStefano Zampini } 2240bdf917eSStefano Zampini /* -------------------------------------------------------------------------- */ 2250bdf917eSStefano Zampini EXTERN_C_BEGIN 2260bdf917eSStefano Zampini #undef __FUNCT__ 2273b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCSetDirichletBoundaries_BDDC" 2283b03a366Sstefano_zampini static PetscErrorCode PCBDDCSetDirichletBoundaries_BDDC(PC 
pc,IS DirichletBoundaries) 2293b03a366Sstefano_zampini { 2303b03a366Sstefano_zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 2313b03a366Sstefano_zampini PetscErrorCode ierr; 2323b03a366Sstefano_zampini 2333b03a366Sstefano_zampini PetscFunctionBegin; 2343b03a366Sstefano_zampini ierr = ISDestroy(&pcbddc->DirichletBoundaries);CHKERRQ(ierr); 23536e030ebSStefano Zampini ierr = PetscObjectReference((PetscObject)DirichletBoundaries);CHKERRQ(ierr); 2362fa5cd67SKarl Rupp 23736e030ebSStefano Zampini pcbddc->DirichletBoundaries = DirichletBoundaries; 2383b03a366Sstefano_zampini PetscFunctionReturn(0); 2393b03a366Sstefano_zampini } 2403b03a366Sstefano_zampini EXTERN_C_END 2413b03a366Sstefano_zampini #undef __FUNCT__ 2423b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCSetDirichletBoundaries" 2433b03a366Sstefano_zampini /*@ 244da1bb401SStefano Zampini PCBDDCSetDirichletBoundaries - Set index set defining subdomain part (in local ordering) 245da1bb401SStefano Zampini of Dirichlet boundaries for the global problem. 
2463b03a366Sstefano_zampini 2473b03a366Sstefano_zampini Not collective 2483b03a366Sstefano_zampini 2493b03a366Sstefano_zampini Input Parameters: 2503b03a366Sstefano_zampini + pc - the preconditioning context 2513b03a366Sstefano_zampini - DirichletBoundaries - sequential index set defining the subdomain part of Dirichlet boundaries (can be PETSC_NULL) 2523b03a366Sstefano_zampini 2533b03a366Sstefano_zampini Level: intermediate 2543b03a366Sstefano_zampini 2553b03a366Sstefano_zampini Notes: 2563b03a366Sstefano_zampini 2573b03a366Sstefano_zampini .seealso: PCBDDC 2583b03a366Sstefano_zampini @*/ 2593b03a366Sstefano_zampini PetscErrorCode PCBDDCSetDirichletBoundaries(PC pc,IS DirichletBoundaries) 2603b03a366Sstefano_zampini { 2613b03a366Sstefano_zampini PetscErrorCode ierr; 2623b03a366Sstefano_zampini 2633b03a366Sstefano_zampini PetscFunctionBegin; 2643b03a366Sstefano_zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 2653b03a366Sstefano_zampini ierr = PetscTryMethod(pc,"PCBDDCSetDirichletBoundaries_C",(PC,IS),(pc,DirichletBoundaries));CHKERRQ(ierr); 2663b03a366Sstefano_zampini PetscFunctionReturn(0); 2673b03a366Sstefano_zampini } 2683b03a366Sstefano_zampini /* -------------------------------------------------------------------------- */ 2693b03a366Sstefano_zampini EXTERN_C_BEGIN 2703b03a366Sstefano_zampini #undef __FUNCT__ 2710c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetNeumannBoundaries_BDDC" 27253cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetNeumannBoundaries_BDDC(PC pc,IS NeumannBoundaries) 2730c7d97c5SJed Brown { 2740c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 27553cdbc3dSStefano Zampini PetscErrorCode ierr; 2760c7d97c5SJed Brown 2770c7d97c5SJed Brown PetscFunctionBegin; 27853cdbc3dSStefano Zampini ierr = ISDestroy(&pcbddc->NeumannBoundaries);CHKERRQ(ierr); 27936e030ebSStefano Zampini ierr = PetscObjectReference((PetscObject)NeumannBoundaries);CHKERRQ(ierr); 2802fa5cd67SKarl Rupp 28136e030ebSStefano Zampini pcbddc->NeumannBoundaries = 
NeumannBoundaries; 2820c7d97c5SJed Brown PetscFunctionReturn(0); 2830c7d97c5SJed Brown } 2840c7d97c5SJed Brown EXTERN_C_END 2850c7d97c5SJed Brown #undef __FUNCT__ 2860c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetNeumannBoundaries" 28757527edcSJed Brown /*@ 288da1bb401SStefano Zampini PCBDDCSetNeumannBoundaries - Set index set defining subdomain part (in local ordering) 289da1bb401SStefano Zampini of Neumann boundaries for the global problem. 29057527edcSJed Brown 2919c0446d6SStefano Zampini Not collective 29257527edcSJed Brown 29357527edcSJed Brown Input Parameters: 29457527edcSJed Brown + pc - the preconditioning context 2959c0446d6SStefano Zampini - NeumannBoundaries - sequential index set defining the subdomain part of Neumann boundaries (can be PETSC_NULL) 29657527edcSJed Brown 29757527edcSJed Brown Level: intermediate 29857527edcSJed Brown 29957527edcSJed Brown Notes: 30057527edcSJed Brown 30157527edcSJed Brown .seealso: PCBDDC 30257527edcSJed Brown @*/ 30353cdbc3dSStefano Zampini PetscErrorCode PCBDDCSetNeumannBoundaries(PC pc,IS NeumannBoundaries) 3040c7d97c5SJed Brown { 3050c7d97c5SJed Brown PetscErrorCode ierr; 3060c7d97c5SJed Brown 3070c7d97c5SJed Brown PetscFunctionBegin; 3080c7d97c5SJed Brown PetscValidHeaderSpecific(pc,PC_CLASSID,1); 30953cdbc3dSStefano Zampini ierr = PetscTryMethod(pc,"PCBDDCSetNeumannBoundaries_C",(PC,IS),(pc,NeumannBoundaries));CHKERRQ(ierr); 31053cdbc3dSStefano Zampini PetscFunctionReturn(0); 31153cdbc3dSStefano Zampini } 31253cdbc3dSStefano Zampini /* -------------------------------------------------------------------------- */ 31353cdbc3dSStefano Zampini EXTERN_C_BEGIN 31453cdbc3dSStefano Zampini #undef __FUNCT__ 315da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCGetDirichletBoundaries_BDDC" 316da1bb401SStefano Zampini static PetscErrorCode PCBDDCGetDirichletBoundaries_BDDC(PC pc,IS *DirichletBoundaries) 317da1bb401SStefano Zampini { 318da1bb401SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 319da1bb401SStefano Zampini 
320da1bb401SStefano Zampini PetscFunctionBegin; 321da1bb401SStefano Zampini *DirichletBoundaries = pcbddc->DirichletBoundaries; 322da1bb401SStefano Zampini PetscFunctionReturn(0); 323da1bb401SStefano Zampini } 324da1bb401SStefano Zampini EXTERN_C_END 325da1bb401SStefano Zampini #undef __FUNCT__ 326da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCGetDirichletBoundaries" 327da1bb401SStefano Zampini /*@ 328da1bb401SStefano Zampini PCBDDCGetDirichletBoundaries - Get index set defining subdomain part (in local ordering) 329da1bb401SStefano Zampini of Dirichlet boundaries for the global problem. 330da1bb401SStefano Zampini 331da1bb401SStefano Zampini Not collective 332da1bb401SStefano Zampini 333da1bb401SStefano Zampini Input Parameters: 334da1bb401SStefano Zampini + pc - the preconditioning context 335da1bb401SStefano Zampini 336da1bb401SStefano Zampini Output Parameters: 337da1bb401SStefano Zampini + DirichletBoundaries - index set defining the subdomain part of Dirichlet boundaries 338da1bb401SStefano Zampini 339da1bb401SStefano Zampini Level: intermediate 340da1bb401SStefano Zampini 341da1bb401SStefano Zampini Notes: 342da1bb401SStefano Zampini 343da1bb401SStefano Zampini .seealso: PCBDDC 344da1bb401SStefano Zampini @*/ 345da1bb401SStefano Zampini PetscErrorCode PCBDDCGetDirichletBoundaries(PC pc,IS *DirichletBoundaries) 346da1bb401SStefano Zampini { 347da1bb401SStefano Zampini PetscErrorCode ierr; 348da1bb401SStefano Zampini 349da1bb401SStefano Zampini PetscFunctionBegin; 350da1bb401SStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 351da1bb401SStefano Zampini ierr = PetscUseMethod(pc,"PCBDDCGetDirichletBoundaries_C",(PC,IS*),(pc,DirichletBoundaries));CHKERRQ(ierr); 352da1bb401SStefano Zampini PetscFunctionReturn(0); 353da1bb401SStefano Zampini } 354da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */ 355da1bb401SStefano Zampini EXTERN_C_BEGIN 356da1bb401SStefano Zampini #undef __FUNCT__ 
35753cdbc3dSStefano Zampini #define __FUNCT__ "PCBDDCGetNeumannBoundaries_BDDC" 35853cdbc3dSStefano Zampini static PetscErrorCode PCBDDCGetNeumannBoundaries_BDDC(PC pc,IS *NeumannBoundaries) 35953cdbc3dSStefano Zampini { 36053cdbc3dSStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 36153cdbc3dSStefano Zampini 36253cdbc3dSStefano Zampini PetscFunctionBegin; 36353cdbc3dSStefano Zampini *NeumannBoundaries = pcbddc->NeumannBoundaries; 36453cdbc3dSStefano Zampini PetscFunctionReturn(0); 36553cdbc3dSStefano Zampini } 36653cdbc3dSStefano Zampini EXTERN_C_END 36753cdbc3dSStefano Zampini #undef __FUNCT__ 36853cdbc3dSStefano Zampini #define __FUNCT__ "PCBDDCGetNeumannBoundaries" 36953cdbc3dSStefano Zampini /*@ 370da1bb401SStefano Zampini PCBDDCGetNeumannBoundaries - Get index set defining subdomain part (in local ordering) 371da1bb401SStefano Zampini of Neumann boundaries for the global problem. 37253cdbc3dSStefano Zampini 3739c0446d6SStefano Zampini Not collective 37453cdbc3dSStefano Zampini 37553cdbc3dSStefano Zampini Input Parameters: 37653cdbc3dSStefano Zampini + pc - the preconditioning context 37753cdbc3dSStefano Zampini 37853cdbc3dSStefano Zampini Output Parameters: 37953cdbc3dSStefano Zampini + NeumannBoundaries - index set defining the subdomain part of Neumann boundaries 38053cdbc3dSStefano Zampini 38153cdbc3dSStefano Zampini Level: intermediate 38253cdbc3dSStefano Zampini 38353cdbc3dSStefano Zampini Notes: 38453cdbc3dSStefano Zampini 38553cdbc3dSStefano Zampini .seealso: PCBDDC 38653cdbc3dSStefano Zampini @*/ 38753cdbc3dSStefano Zampini PetscErrorCode PCBDDCGetNeumannBoundaries(PC pc,IS *NeumannBoundaries) 38853cdbc3dSStefano Zampini { 38953cdbc3dSStefano Zampini PetscErrorCode ierr; 39053cdbc3dSStefano Zampini 39153cdbc3dSStefano Zampini PetscFunctionBegin; 39253cdbc3dSStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 39353cdbc3dSStefano Zampini ierr = PetscUseMethod(pc,"PCBDDCGetNeumannBoundaries_C",(PC,IS*),(pc,NeumannBoundaries));CHKERRQ(ierr); 
3940c7d97c5SJed Brown PetscFunctionReturn(0); 3950c7d97c5SJed Brown } 39636e030ebSStefano Zampini /* -------------------------------------------------------------------------- */ 39736e030ebSStefano Zampini EXTERN_C_BEGIN 39836e030ebSStefano Zampini #undef __FUNCT__ 399da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetLocalAdjacencyGraph_BDDC" 4001a83f524SJed Brown static PetscErrorCode PCBDDCSetLocalAdjacencyGraph_BDDC(PC pc, PetscInt nvtxs,const PetscInt xadj[],const PetscInt adjncy[], PetscCopyMode copymode) 40136e030ebSStefano Zampini { 40236e030ebSStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 403da1bb401SStefano Zampini PCBDDCGraph mat_graph=pcbddc->mat_graph; 404da1bb401SStefano Zampini PetscErrorCode ierr; 40536e030ebSStefano Zampini 40636e030ebSStefano Zampini PetscFunctionBegin; 407da1bb401SStefano Zampini mat_graph->nvtxs=nvtxs; 4082fa5cd67SKarl Rupp 409da1bb401SStefano Zampini ierr = PetscFree(mat_graph->xadj);CHKERRQ(ierr); 410da1bb401SStefano Zampini ierr = PetscFree(mat_graph->adjncy);CHKERRQ(ierr); 411da1bb401SStefano Zampini if (copymode == PETSC_COPY_VALUES) { 412da1bb401SStefano Zampini ierr = PetscMalloc((mat_graph->nvtxs+1)*sizeof(PetscInt),&mat_graph->xadj);CHKERRQ(ierr); 413da1bb401SStefano Zampini ierr = PetscMalloc(xadj[mat_graph->nvtxs]*sizeof(PetscInt),&mat_graph->adjncy);CHKERRQ(ierr); 414da1bb401SStefano Zampini ierr = PetscMemcpy(mat_graph->xadj,xadj,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr); 415da1bb401SStefano Zampini ierr = PetscMemcpy(mat_graph->adjncy,adjncy,xadj[mat_graph->nvtxs]*sizeof(PetscInt));CHKERRQ(ierr); 416da1bb401SStefano Zampini } else if (copymode == PETSC_OWN_POINTER) { 4171a83f524SJed Brown mat_graph->xadj = (PetscInt*)xadj; 4181a83f524SJed Brown mat_graph->adjncy = (PetscInt*)adjncy; 419acee19a7SJed Brown } else SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"Unsupported copy mode %d\n",copymode); 42036e030ebSStefano Zampini PetscFunctionReturn(0); 42136e030ebSStefano Zampini } 42236e030ebSStefano 
Zampini EXTERN_C_END 42336e030ebSStefano Zampini #undef __FUNCT__ 424da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetLocalAdjacencyGraph" 42536e030ebSStefano Zampini /*@ 426da1bb401SStefano Zampini PCBDDCSetLocalAdjacencyGraph - Set CSR graph of local matrix for use of PCBDDC. 42736e030ebSStefano Zampini 42836e030ebSStefano Zampini Not collective 42936e030ebSStefano Zampini 43036e030ebSStefano Zampini Input Parameters: 43136e030ebSStefano Zampini + pc - the preconditioning context 432da1bb401SStefano Zampini - nvtxs - number of local vertices of the graph 433da1bb401SStefano Zampini - xadj, adjncy - the CSR graph 434da1bb401SStefano Zampini - copymode - either PETSC_COPY_VALUES or PETSC_OWN_POINTER. In the former case the user must free the array passed in; 435da1bb401SStefano Zampini in the latter case, memory must be obtained with PetscMalloc. 43636e030ebSStefano Zampini 43736e030ebSStefano Zampini Level: intermediate 43836e030ebSStefano Zampini 43936e030ebSStefano Zampini Notes: 44036e030ebSStefano Zampini 44136e030ebSStefano Zampini .seealso: PCBDDC 44236e030ebSStefano Zampini @*/ 4431a83f524SJed Brown PetscErrorCode PCBDDCSetLocalAdjacencyGraph(PC pc,PetscInt nvtxs,const PetscInt xadj[],const PetscInt adjncy[], PetscCopyMode copymode) 44436e030ebSStefano Zampini { 445da1bb401SStefano Zampini PetscInt nrows,ncols; 446da1bb401SStefano Zampini Mat_IS *matis = (Mat_IS*)pc->pmat->data; 44736e030ebSStefano Zampini PetscErrorCode ierr; 44836e030ebSStefano Zampini 44936e030ebSStefano Zampini PetscFunctionBegin; 45036e030ebSStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 451da1bb401SStefano Zampini ierr = MatGetSize(matis->A,&nrows,&ncols);CHKERRQ(ierr); 452f23aa3ddSBarry Smith if (nvtxs != nrows) SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Local adjacency size %d passed in %s differs from local problem size %d!\n",nvtxs,nrows); 453f23aa3ddSBarry Smith else { 4541a83f524SJed Brown ierr = 
PetscTryMethod(pc,"PCBDDCSetLocalAdjacencyGraph_C",(PC,PetscInt,const PetscInt[],const PetscInt[],PetscCopyMode),(pc,nvtxs,xadj,adjncy,copymode));CHKERRQ(ierr); 455da1bb401SStefano Zampini } 45636e030ebSStefano Zampini PetscFunctionReturn(0); 45736e030ebSStefano Zampini } 4589c0446d6SStefano Zampini /* -------------------------------------------------------------------------- */ 4599c0446d6SStefano Zampini EXTERN_C_BEGIN 4609c0446d6SStefano Zampini #undef __FUNCT__ 4619c0446d6SStefano Zampini #define __FUNCT__ "PCBDDCSetDofsSplitting_BDDC" 4629c0446d6SStefano Zampini static PetscErrorCode PCBDDCSetDofsSplitting_BDDC(PC pc,PetscInt n_is, IS ISForDofs[]) 4639c0446d6SStefano Zampini { 4649c0446d6SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 4659c0446d6SStefano Zampini PetscInt i; 4669c0446d6SStefano Zampini PetscErrorCode ierr; 4679c0446d6SStefano Zampini 4689c0446d6SStefano Zampini PetscFunctionBegin; 469da1bb401SStefano Zampini /* Destroy ISes if they were already set */ 4709c0446d6SStefano Zampini for (i=0; i<pcbddc->n_ISForDofs; i++) { 4719c0446d6SStefano Zampini ierr = ISDestroy(&pcbddc->ISForDofs[i]);CHKERRQ(ierr); 4729c0446d6SStefano Zampini } 473d11ae9bbSstefano_zampini ierr = PetscFree(pcbddc->ISForDofs);CHKERRQ(ierr); 474da1bb401SStefano Zampini /* allocate space then set */ 4759c0446d6SStefano Zampini ierr = PetscMalloc(n_is*sizeof(IS),&pcbddc->ISForDofs);CHKERRQ(ierr); 4769c0446d6SStefano Zampini for (i=0; i<n_is; i++) { 477da1bb401SStefano Zampini ierr = PetscObjectReference((PetscObject)ISForDofs[i]);CHKERRQ(ierr); 4782fa5cd67SKarl Rupp 479da1bb401SStefano Zampini pcbddc->ISForDofs[i]=ISForDofs[i]; 4809c0446d6SStefano Zampini } 4819c0446d6SStefano Zampini pcbddc->n_ISForDofs=n_is; 4829c0446d6SStefano Zampini PetscFunctionReturn(0); 4839c0446d6SStefano Zampini } 4849c0446d6SStefano Zampini EXTERN_C_END 4859c0446d6SStefano Zampini #undef __FUNCT__ 4869c0446d6SStefano Zampini #define __FUNCT__ "PCBDDCSetDofsSplitting" 4879c0446d6SStefano Zampini 
/*@ 488da1bb401SStefano Zampini PCBDDCSetDofsSplitting - Set index sets defining fields of local mat. 4899c0446d6SStefano Zampini 4909c0446d6SStefano Zampini Not collective 4919c0446d6SStefano Zampini 4929c0446d6SStefano Zampini Input Parameters: 4939c0446d6SStefano Zampini + pc - the preconditioning context 494da1bb401SStefano Zampini - n - number of index sets defining the fields 495da1bb401SStefano Zampini - IS[] - array of IS describing the fields 4969c0446d6SStefano Zampini 4979c0446d6SStefano Zampini Level: intermediate 4989c0446d6SStefano Zampini 4999c0446d6SStefano Zampini Notes: 5009c0446d6SStefano Zampini 5019c0446d6SStefano Zampini .seealso: PCBDDC 5029c0446d6SStefano Zampini @*/ 5039c0446d6SStefano Zampini PetscErrorCode PCBDDCSetDofsSplitting(PC pc,PetscInt n_is, IS ISForDofs[]) 5049c0446d6SStefano Zampini { 5059c0446d6SStefano Zampini PetscErrorCode ierr; 5069c0446d6SStefano Zampini 5079c0446d6SStefano Zampini PetscFunctionBegin; 5089c0446d6SStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 5099c0446d6SStefano Zampini ierr = PetscTryMethod(pc,"PCBDDCSetDofsSplitting_C",(PC,PetscInt,IS[]),(pc,n_is,ISForDofs));CHKERRQ(ierr); 5109c0446d6SStefano Zampini PetscFunctionReturn(0); 5119c0446d6SStefano Zampini } 512da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */ 513534831adSStefano Zampini #undef __FUNCT__ 514534831adSStefano Zampini #define __FUNCT__ "PCPreSolve_BDDC" 515534831adSStefano Zampini /* -------------------------------------------------------------------------- */ 516534831adSStefano Zampini /* 517534831adSStefano Zampini PCPreSolve_BDDC - Changes the right hand side and (if necessary) the initial 518534831adSStefano Zampini guess if a transformation of basis approach has been selected. 
5199c0446d6SStefano Zampini 520534831adSStefano Zampini Input Parameter: 521534831adSStefano Zampini + pc - the preconditioner contex 522534831adSStefano Zampini 523534831adSStefano Zampini Application Interface Routine: PCPreSolve() 524534831adSStefano Zampini 525534831adSStefano Zampini Notes: 526534831adSStefano Zampini The interface routine PCPreSolve() is not usually called directly by 527534831adSStefano Zampini the user, but instead is called by KSPSolve(). 528534831adSStefano Zampini */ 529534831adSStefano Zampini static PetscErrorCode PCPreSolve_BDDC(PC pc, KSP ksp, Vec rhs, Vec x) 530534831adSStefano Zampini { 531534831adSStefano Zampini PetscErrorCode ierr; 532534831adSStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 533534831adSStefano Zampini PC_IS *pcis = (PC_IS*)(pc->data); 534534831adSStefano Zampini Mat_IS *matis = (Mat_IS*)pc->pmat->data; 535534831adSStefano Zampini Mat temp_mat; 5363972b0daSStefano Zampini IS dirIS; 5373972b0daSStefano Zampini PetscInt dirsize,i,*is_indices; 5383972b0daSStefano Zampini PetscScalar *array_x,*array_diagonal; 5393972b0daSStefano Zampini Vec used_vec; 5403972b0daSStefano Zampini PetscBool guess_nonzero; 541534831adSStefano Zampini 542534831adSStefano Zampini PetscFunctionBegin; 5433972b0daSStefano Zampini if (x) { 5443972b0daSStefano Zampini ierr = PetscObjectReference((PetscObject)x);CHKERRQ(ierr); 5453972b0daSStefano Zampini used_vec = x; 5463972b0daSStefano Zampini } else { 5473972b0daSStefano Zampini ierr = PetscObjectReference((PetscObject)pcbddc->temp_solution);CHKERRQ(ierr); 5483972b0daSStefano Zampini used_vec = pcbddc->temp_solution; 5493972b0daSStefano Zampini ierr = VecSet(used_vec,0.0);CHKERRQ(ierr); 5503972b0daSStefano Zampini } 5513972b0daSStefano Zampini /* hack into ksp data structure PCPreSolve comes earlier in src/ksp/ksp/interface/itfunc.c */ 5523972b0daSStefano Zampini if (ksp) { 5533972b0daSStefano Zampini ierr = KSPGetInitialGuessNonzero(ksp,&guess_nonzero);CHKERRQ(ierr); 
5543972b0daSStefano Zampini if (!guess_nonzero) { 5553972b0daSStefano Zampini ierr = VecSet(used_vec,0.0);CHKERRQ(ierr); 5563972b0daSStefano Zampini } 5573972b0daSStefano Zampini } 5583972b0daSStefano Zampini /* store the original rhs */ 5593972b0daSStefano Zampini ierr = VecCopy(rhs,pcbddc->original_rhs);CHKERRQ(ierr); 5603972b0daSStefano Zampini 5613972b0daSStefano Zampini /* Take into account zeroed rows -> change rhs and store solution removed */ 5623972b0daSStefano Zampini ierr = MatGetDiagonal(pc->pmat,pcis->vec1_global);CHKERRQ(ierr); 5633972b0daSStefano Zampini ierr = VecPointwiseDivide(pcis->vec1_global,rhs,pcis->vec1_global);CHKERRQ(ierr); 5643972b0daSStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 5653972b0daSStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 5663972b0daSStefano Zampini ierr = VecScatterBegin(matis->ctx,used_vec,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 5673972b0daSStefano Zampini ierr = VecScatterEnd (matis->ctx,used_vec,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 5683972b0daSStefano Zampini ierr = PCBDDCGetDirichletBoundaries(pc,&dirIS);CHKERRQ(ierr); 5693972b0daSStefano Zampini if (dirIS) { 5703972b0daSStefano Zampini ierr = ISGetSize(dirIS,&dirsize);CHKERRQ(ierr); 5713972b0daSStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array_x);CHKERRQ(ierr); 5723972b0daSStefano Zampini ierr = VecGetArray(pcis->vec2_N,&array_diagonal);CHKERRQ(ierr); 5733972b0daSStefano Zampini ierr = ISGetIndices(dirIS,(const PetscInt**)&is_indices);CHKERRQ(ierr); 5742fa5cd67SKarl Rupp for (i=0; i<dirsize; i++) array_x[is_indices[i]] = array_diagonal[is_indices[i]]; 5752fa5cd67SKarl Rupp 5763972b0daSStefano Zampini ierr = ISRestoreIndices(dirIS,(const PetscInt**)&is_indices);CHKERRQ(ierr); 5773972b0daSStefano Zampini ierr = 
VecRestoreArray(pcis->vec2_N,&array_diagonal);CHKERRQ(ierr); 5783972b0daSStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array_x);CHKERRQ(ierr); 5793972b0daSStefano Zampini } 5803972b0daSStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 5813972b0daSStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 582b76ba322SStefano Zampini 5833972b0daSStefano Zampini /* remove the computed solution from the rhs */ 5843972b0daSStefano Zampini ierr = VecScale(used_vec,-1.0);CHKERRQ(ierr); 5853972b0daSStefano Zampini ierr = MatMultAdd(pc->pmat,used_vec,rhs,rhs);CHKERRQ(ierr); 5863972b0daSStefano Zampini ierr = VecScale(used_vec,-1.0);CHKERRQ(ierr); 587b76ba322SStefano Zampini 588b76ba322SStefano Zampini /* store partially computed solution and set initial guess */ 5893972b0daSStefano Zampini if (x) { 5903972b0daSStefano Zampini ierr = VecCopy(used_vec,pcbddc->temp_solution);CHKERRQ(ierr); 5913972b0daSStefano Zampini ierr = VecSet(used_vec,0.0);CHKERRQ(ierr); 592b76ba322SStefano Zampini if (pcbddc->use_exact_dirichlet) { 593b76ba322SStefano Zampini ierr = VecScatterBegin(pcis->global_to_D,rhs,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 594b76ba322SStefano Zampini ierr = VecScatterEnd (pcis->global_to_D,rhs,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 595b76ba322SStefano Zampini ierr = KSPSolve(pcbddc->ksp_D,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr); 596b76ba322SStefano Zampini ierr = VecScatterBegin(pcis->global_to_D,pcis->vec2_D,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 597b76ba322SStefano Zampini ierr = VecScatterEnd (pcis->global_to_D,pcis->vec2_D,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 598b76ba322SStefano Zampini if (ksp) { 599b76ba322SStefano Zampini ierr = KSPSetInitialGuessNonzero(ksp,PETSC_TRUE);CHKERRQ(ierr); 600b76ba322SStefano Zampini } 601b76ba322SStefano Zampini } 
6023972b0daSStefano Zampini } 603b76ba322SStefano Zampini 604b76ba322SStefano Zampini /* rhs change of basis */ 605b76ba322SStefano Zampini if (pcbddc->usechangeofbasis) { 606b76ba322SStefano Zampini /* swap pointers for local matrices */ 607b76ba322SStefano Zampini temp_mat = matis->A; 608b76ba322SStefano Zampini matis->A = pcbddc->local_mat; 609b76ba322SStefano Zampini pcbddc->local_mat = temp_mat; 610b76ba322SStefano Zampini /* Get local rhs and apply transformation of basis */ 611b76ba322SStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,rhs,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 612b76ba322SStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,rhs,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 613b76ba322SStefano Zampini /* from original basis to modified basis */ 614b76ba322SStefano Zampini ierr = MatMultTranspose(pcbddc->ChangeOfBasisMatrix,pcis->vec1_B,pcis->vec2_B);CHKERRQ(ierr); 615b76ba322SStefano Zampini /* put back modified values into the global vec using INSERT_VALUES copy mode */ 616b76ba322SStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,pcis->vec2_B,rhs,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 617b76ba322SStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,pcis->vec2_B,rhs,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 6180bdf917eSStefano Zampini if (ksp && pcbddc->NullSpace) { 6190bdf917eSStefano Zampini ierr = MatNullSpaceRemove(pcbddc->NullSpace,used_vec,PETSC_NULL);CHKERRQ(ierr); 6200bdf917eSStefano Zampini ierr = MatNullSpaceRemove(pcbddc->NullSpace,rhs,PETSC_NULL);CHKERRQ(ierr); 621b76ba322SStefano Zampini } 6220bdf917eSStefano Zampini } 6230bdf917eSStefano Zampini ierr = VecDestroy(&used_vec);CHKERRQ(ierr); 624534831adSStefano Zampini PetscFunctionReturn(0); 625534831adSStefano Zampini } 626534831adSStefano Zampini /* -------------------------------------------------------------------------- */ 627534831adSStefano Zampini #undef __FUNCT__ 628534831adSStefano Zampini #define __FUNCT__ 
"PCPostSolve_BDDC" 629534831adSStefano Zampini /* -------------------------------------------------------------------------- */ 630534831adSStefano Zampini /* 631534831adSStefano Zampini PCPostSolve_BDDC - Changes the computed solution if a transformation of basis 632534831adSStefano Zampini approach has been selected. Also, restores rhs to its original state. 633534831adSStefano Zampini 634534831adSStefano Zampini Input Parameter: 635534831adSStefano Zampini + pc - the preconditioner contex 636534831adSStefano Zampini 637534831adSStefano Zampini Application Interface Routine: PCPostSolve() 638534831adSStefano Zampini 639534831adSStefano Zampini Notes: 640534831adSStefano Zampini The interface routine PCPostSolve() is not usually called directly by 641534831adSStefano Zampini the user, but instead is called by KSPSolve(). 642534831adSStefano Zampini */ 643534831adSStefano Zampini static PetscErrorCode PCPostSolve_BDDC(PC pc, KSP ksp, Vec rhs, Vec x) 644534831adSStefano Zampini { 645534831adSStefano Zampini PetscErrorCode ierr; 646534831adSStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 647534831adSStefano Zampini PC_IS *pcis = (PC_IS*)(pc->data); 648534831adSStefano Zampini Mat_IS *matis = (Mat_IS*)pc->pmat->data; 649534831adSStefano Zampini Mat temp_mat; 650534831adSStefano Zampini 651534831adSStefano Zampini PetscFunctionBegin; 652534831adSStefano Zampini if (pcbddc->usechangeofbasis) { 653534831adSStefano Zampini /* swap pointers for local matrices */ 654534831adSStefano Zampini temp_mat = matis->A; 655534831adSStefano Zampini matis->A = pcbddc->local_mat; 656534831adSStefano Zampini pcbddc->local_mat = temp_mat; 657534831adSStefano Zampini /* restore rhs to its original state */ 6583425bc38SStefano Zampini if (rhs) { 6593425bc38SStefano Zampini ierr = VecCopy(pcbddc->original_rhs,rhs);CHKERRQ(ierr); 6603425bc38SStefano Zampini } 661534831adSStefano Zampini /* Get Local boundary and apply transformation of basis to solution vector */ 662534831adSStefano 
Zampini ierr = VecScatterBegin(pcis->global_to_B,x,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 663534831adSStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,x,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 664534831adSStefano Zampini /* from modified basis to original basis */ 665534831adSStefano Zampini ierr = MatMult(pcbddc->ChangeOfBasisMatrix,pcis->vec1_B,pcis->vec2_B);CHKERRQ(ierr); 666534831adSStefano Zampini /* put back modified values into the global vec using INSERT_VALUES copy mode */ 667534831adSStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,pcis->vec2_B,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 668534831adSStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,pcis->vec2_B,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 669534831adSStefano Zampini } 6703972b0daSStefano Zampini /* add solution removed in presolve */ 6713425bc38SStefano Zampini if (x) { 6723425bc38SStefano Zampini ierr = VecAXPY(x,1.0,pcbddc->temp_solution);CHKERRQ(ierr); 6733425bc38SStefano Zampini } 674534831adSStefano Zampini PetscFunctionReturn(0); 675534831adSStefano Zampini } 676534831adSStefano Zampini /* -------------------------------------------------------------------------- */ 67753cdbc3dSStefano Zampini #undef __FUNCT__ 67853cdbc3dSStefano Zampini #define __FUNCT__ "PCSetUp_BDDC" 6790c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 6800c7d97c5SJed Brown /* 6810c7d97c5SJed Brown PCSetUp_BDDC - Prepares for the use of the BDDC preconditioner 6820c7d97c5SJed Brown by setting data structures and options. 
6830c7d97c5SJed Brown 6840c7d97c5SJed Brown Input Parameter: 68553cdbc3dSStefano Zampini + pc - the preconditioner context 6860c7d97c5SJed Brown 6870c7d97c5SJed Brown Application Interface Routine: PCSetUp() 6880c7d97c5SJed Brown 6890c7d97c5SJed Brown Notes: 6900c7d97c5SJed Brown The interface routine PCSetUp() is not usually called directly by 6910c7d97c5SJed Brown the user, but instead is called by PCApply() if necessary. 6920c7d97c5SJed Brown */ 69353cdbc3dSStefano Zampini PetscErrorCode PCSetUp_BDDC(PC pc) 6940c7d97c5SJed Brown { 6950c7d97c5SJed Brown PetscErrorCode ierr; 6960c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 6970c7d97c5SJed Brown 6980c7d97c5SJed Brown PetscFunctionBegin; 6990c7d97c5SJed Brown if (!pc->setupcalled) { 7003b03a366Sstefano_zampini /* For BDDC we need to define a local "Neumann" problem different to that defined in PCISSetup 7019c0446d6SStefano Zampini So, we set to pcnone the Neumann problem of pcis in order to avoid unneeded computation 7020c7d97c5SJed Brown Also, we decide to directly build the (same) Dirichlet problem */ 7030c7d97c5SJed Brown ierr = PetscOptionsSetValue("-is_localN_pc_type","none");CHKERRQ(ierr); 7040c7d97c5SJed Brown ierr = PetscOptionsSetValue("-is_localD_pc_type","none");CHKERRQ(ierr); 7050c7d97c5SJed Brown /* Set up all the "iterative substructuring" common block */ 7060bdf917eSStefano Zampini 7070c7d97c5SJed Brown ierr = PCISSetUp(pc);CHKERRQ(ierr); 7083b03a366Sstefano_zampini /* Get stdout for dbg */ 709e269702eSStefano Zampini if (pcbddc->dbg_flag) { 710e269702eSStefano Zampini ierr = PetscViewerASCIIGetStdout(((PetscObject)pc)->comm,&pcbddc->dbg_viewer);CHKERRQ(ierr); 711e269702eSStefano Zampini ierr = PetscViewerASCIISynchronizedAllow(pcbddc->dbg_viewer,PETSC_TRUE);CHKERRQ(ierr); 712e269702eSStefano Zampini } 7133b03a366Sstefano_zampini /* Analyze local interface */ 7140c7d97c5SJed Brown ierr = PCBDDCManageLocalBoundaries(pc);CHKERRQ(ierr); 7153b03a366Sstefano_zampini /* Set up local constraint 
matrix */ 7163b03a366Sstefano_zampini ierr = PCBDDCCreateConstraintMatrix(pc);CHKERRQ(ierr); 7170c7d97c5SJed Brown /* Create coarse and local stuffs used for evaluating action of preconditioner */ 7180c7d97c5SJed Brown ierr = PCBDDCCoarseSetUp(pc);CHKERRQ(ierr); 7190c7d97c5SJed Brown } 7200c7d97c5SJed Brown PetscFunctionReturn(0); 7210c7d97c5SJed Brown } 7220c7d97c5SJed Brown 7230c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 7240c7d97c5SJed Brown /* 7250c7d97c5SJed Brown PCApply_BDDC - Applies the BDDC preconditioner to a vector. 7260c7d97c5SJed Brown 7270c7d97c5SJed Brown Input Parameters: 7280c7d97c5SJed Brown . pc - the preconditioner context 7290c7d97c5SJed Brown . r - input vector (global) 7300c7d97c5SJed Brown 7310c7d97c5SJed Brown Output Parameter: 7320c7d97c5SJed Brown . z - output vector (global) 7330c7d97c5SJed Brown 7340c7d97c5SJed Brown Application Interface Routine: PCApply() 7350c7d97c5SJed Brown */ 7360c7d97c5SJed Brown #undef __FUNCT__ 7370c7d97c5SJed Brown #define __FUNCT__ "PCApply_BDDC" 73853cdbc3dSStefano Zampini PetscErrorCode PCApply_BDDC(PC pc,Vec r,Vec z) 7390c7d97c5SJed Brown { 7400c7d97c5SJed Brown PC_IS *pcis = (PC_IS*)(pc->data); 7410c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)(pc->data); 7420c7d97c5SJed Brown PetscErrorCode ierr; 7433b03a366Sstefano_zampini const PetscScalar one = 1.0; 7443b03a366Sstefano_zampini const PetscScalar m_one = -1.0; 7452617d88aSStefano Zampini const PetscScalar zero = 0.0; 7460c7d97c5SJed Brown 7470c7d97c5SJed Brown /* This code is similar to that provided in nn.c for PCNN 7480c7d97c5SJed Brown NN interface preconditioner changed to BDDC 74929622bf0SStefano Zampini Added support for M_3 preconditioner in the reference article (code is active if pcbddc->inexact_prec_type = PETSC_TRUE) */ 7500c7d97c5SJed Brown 7510c7d97c5SJed Brown PetscFunctionBegin; 752b76ba322SStefano Zampini if (!pcbddc->use_exact_dirichlet) { 7530c7d97c5SJed Brown /* First Dirichlet 
solve */ 7540c7d97c5SJed Brown ierr = VecScatterBegin(pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 7550c7d97c5SJed Brown ierr = VecScatterEnd (pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 75653cdbc3dSStefano Zampini ierr = KSPSolve(pcbddc->ksp_D,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr); 7570c7d97c5SJed Brown /* 7580c7d97c5SJed Brown Assembling right hand side for BDDC operator 7590c7d97c5SJed Brown - vec1_D for the Dirichlet part (if needed, i.e. prec_flag=PETSC_TRUE) 7600c7d97c5SJed Brown - the interface part of the global vector z 7610c7d97c5SJed Brown */ 7620c7d97c5SJed Brown ierr = VecScale(pcis->vec2_D,m_one);CHKERRQ(ierr); 7630c7d97c5SJed Brown ierr = MatMult(pcis->A_BI,pcis->vec2_D,pcis->vec1_B);CHKERRQ(ierr); 76429622bf0SStefano Zampini if (pcbddc->inexact_prec_type) { ierr = MatMultAdd(pcis->A_II,pcis->vec2_D,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); } 7650c7d97c5SJed Brown ierr = VecScale(pcis->vec2_D,m_one);CHKERRQ(ierr); 7660c7d97c5SJed Brown ierr = VecCopy(r,z);CHKERRQ(ierr); 7670c7d97c5SJed Brown ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 7680c7d97c5SJed Brown ierr = VecScatterEnd (pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 7692617d88aSStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 7702617d88aSStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 771b76ba322SStefano Zampini } else { 772b76ba322SStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,r,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 773b76ba322SStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,r,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 7740bdf917eSStefano Zampini ierr = VecSet(pcis->vec1_D,zero);CHKERRQ(ierr); 775b76ba322SStefano Zampini ierr = 
VecSet(pcis->vec2_D,zero);CHKERRQ(ierr); 776b76ba322SStefano Zampini } 777b76ba322SStefano Zampini 778b76ba322SStefano Zampini /* Apply partition of unity */ 7792617d88aSStefano Zampini ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr); 7802617d88aSStefano Zampini 7812617d88aSStefano Zampini /* Apply interface preconditioner 7822617d88aSStefano Zampini input/output vecs: pcis->vec1_B and pcis->vec1_D */ 7832617d88aSStefano Zampini ierr = PCBDDCApplyInterfacePreconditioner(pc);CHKERRQ(ierr); 7842617d88aSStefano Zampini 7852617d88aSStefano Zampini /* Apply partition of unity and sum boundary values */ 7862617d88aSStefano Zampini ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr); 7872617d88aSStefano Zampini ierr = VecSet(z,zero);CHKERRQ(ierr); 7882617d88aSStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 7892617d88aSStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 7900c7d97c5SJed Brown 7913b03a366Sstefano_zampini /* Second Dirichlet solve and assembling of output */ 7920c7d97c5SJed Brown ierr = VecScatterBegin(pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 7930c7d97c5SJed Brown ierr = VecScatterEnd (pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 7940c7d97c5SJed Brown ierr = MatMult(pcis->A_IB,pcis->vec1_B,pcis->vec3_D);CHKERRQ(ierr); 79529622bf0SStefano Zampini if (pcbddc->inexact_prec_type) { ierr = MatMultAdd(pcis->A_II,pcis->vec1_D,pcis->vec3_D,pcis->vec3_D);CHKERRQ(ierr); } 79653cdbc3dSStefano Zampini ierr = KSPSolve(pcbddc->ksp_D,pcis->vec3_D,pcbddc->vec4_D);CHKERRQ(ierr); 7970c7d97c5SJed Brown ierr = VecScale(pcbddc->vec4_D,m_one);CHKERRQ(ierr); 79829622bf0SStefano Zampini if (pcbddc->inexact_prec_type) { ierr = VecAXPY (pcbddc->vec4_D,one,pcis->vec1_D);CHKERRQ(ierr); } 7990c7d97c5SJed Brown ierr = VecAXPY 
(pcis->vec2_D,one,pcbddc->vec4_D);CHKERRQ(ierr); 8000c7d97c5SJed Brown ierr = VecScatterBegin(pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8010c7d97c5SJed Brown ierr = VecScatterEnd (pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8020c7d97c5SJed Brown PetscFunctionReturn(0); 8030c7d97c5SJed Brown 8040c7d97c5SJed Brown } 805da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */ 806da1bb401SStefano Zampini #undef __FUNCT__ 807da1bb401SStefano Zampini #define __FUNCT__ "PCDestroy_BDDC" 808da1bb401SStefano Zampini PetscErrorCode PCDestroy_BDDC(PC pc) 809da1bb401SStefano Zampini { 810da1bb401SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 8110bdf917eSStefano Zampini PetscInt i; 812da1bb401SStefano Zampini PetscErrorCode ierr; 813da1bb401SStefano Zampini 814da1bb401SStefano Zampini PetscFunctionBegin; 815da1bb401SStefano Zampini /* free data created by PCIS */ 816da1bb401SStefano Zampini ierr = PCISDestroy(pc);CHKERRQ(ierr); 817da1bb401SStefano Zampini /* free BDDC data */ 8180bdf917eSStefano Zampini ierr = MatNullSpaceDestroy(&pcbddc->CoarseNullSpace);CHKERRQ(ierr); 8190bdf917eSStefano Zampini ierr = MatNullSpaceDestroy(&pcbddc->NullSpace);CHKERRQ(ierr); 8203972b0daSStefano Zampini ierr = VecDestroy(&pcbddc->temp_solution);CHKERRQ(ierr); 821534831adSStefano Zampini ierr = VecDestroy(&pcbddc->original_rhs);CHKERRQ(ierr); 822534831adSStefano Zampini ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr); 823534831adSStefano Zampini ierr = MatDestroy(&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr); 824da1bb401SStefano Zampini ierr = VecDestroy(&pcbddc->coarse_vec);CHKERRQ(ierr); 825da1bb401SStefano Zampini ierr = VecDestroy(&pcbddc->coarse_rhs);CHKERRQ(ierr); 826da1bb401SStefano Zampini ierr = KSPDestroy(&pcbddc->coarse_ksp);CHKERRQ(ierr); 827da1bb401SStefano Zampini ierr = MatDestroy(&pcbddc->coarse_mat);CHKERRQ(ierr); 828da1bb401SStefano Zampini ierr = 
MatDestroy(&pcbddc->coarse_phi_B);CHKERRQ(ierr); 829da1bb401SStefano Zampini ierr = MatDestroy(&pcbddc->coarse_phi_D);CHKERRQ(ierr); 830da1bb401SStefano Zampini ierr = VecDestroy(&pcbddc->vec1_P);CHKERRQ(ierr); 831da1bb401SStefano Zampini ierr = VecDestroy(&pcbddc->vec1_C);CHKERRQ(ierr); 832da1bb401SStefano Zampini ierr = MatDestroy(&pcbddc->local_auxmat1);CHKERRQ(ierr); 833da1bb401SStefano Zampini ierr = MatDestroy(&pcbddc->local_auxmat2);CHKERRQ(ierr); 834da1bb401SStefano Zampini ierr = VecDestroy(&pcbddc->vec1_R);CHKERRQ(ierr); 835da1bb401SStefano Zampini ierr = VecDestroy(&pcbddc->vec2_R);CHKERRQ(ierr); 836da1bb401SStefano Zampini ierr = VecDestroy(&pcbddc->vec4_D);CHKERRQ(ierr); 837da1bb401SStefano Zampini ierr = VecScatterDestroy(&pcbddc->R_to_B);CHKERRQ(ierr); 838da1bb401SStefano Zampini ierr = VecScatterDestroy(&pcbddc->R_to_D);CHKERRQ(ierr); 839da1bb401SStefano Zampini ierr = VecScatterDestroy(&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr); 840da1bb401SStefano Zampini ierr = KSPDestroy(&pcbddc->ksp_D);CHKERRQ(ierr); 841da1bb401SStefano Zampini ierr = KSPDestroy(&pcbddc->ksp_R);CHKERRQ(ierr); 842da1bb401SStefano Zampini ierr = ISDestroy(&pcbddc->NeumannBoundaries);CHKERRQ(ierr); 843da1bb401SStefano Zampini ierr = ISDestroy(&pcbddc->DirichletBoundaries);CHKERRQ(ierr); 844da1bb401SStefano Zampini ierr = MatDestroy(&pcbddc->ConstraintMatrix);CHKERRQ(ierr); 845da1bb401SStefano Zampini ierr = PetscFree(pcbddc->local_primal_indices);CHKERRQ(ierr); 846da1bb401SStefano Zampini ierr = PetscFree(pcbddc->replicated_local_primal_indices);CHKERRQ(ierr); 8470bdf917eSStefano Zampini ierr = PetscFree(pcbddc->replicated_local_primal_values);CHKERRQ(ierr); 848da1bb401SStefano Zampini ierr = PetscFree(pcbddc->local_primal_displacements);CHKERRQ(ierr); 849da1bb401SStefano Zampini ierr = PetscFree(pcbddc->local_primal_sizes);CHKERRQ(ierr); 8502fa5cd67SKarl Rupp for (i=0; i<pcbddc->n_ISForDofs; i++) { 8512fa5cd67SKarl Rupp ierr = ISDestroy(&pcbddc->ISForDofs[i]);CHKERRQ(ierr); 
8522fa5cd67SKarl Rupp } 853da1bb401SStefano Zampini ierr = PetscFree(pcbddc->ISForDofs);CHKERRQ(ierr); 8542fa5cd67SKarl Rupp for (i=0; i<pcbddc->n_ISForFaces; i++) { 8552fa5cd67SKarl Rupp ierr = ISDestroy(&pcbddc->ISForFaces[i]);CHKERRQ(ierr); 8562fa5cd67SKarl Rupp } 857da1bb401SStefano Zampini ierr = PetscFree(pcbddc->ISForFaces);CHKERRQ(ierr); 8582fa5cd67SKarl Rupp for (i=0; i<pcbddc->n_ISForEdges; i++) { 8592fa5cd67SKarl Rupp ierr = ISDestroy(&pcbddc->ISForEdges[i]);CHKERRQ(ierr); 8602fa5cd67SKarl Rupp } 861da1bb401SStefano Zampini ierr = PetscFree(pcbddc->ISForEdges);CHKERRQ(ierr); 862da1bb401SStefano Zampini ierr = ISDestroy(&pcbddc->ISForVertices);CHKERRQ(ierr); 8633972b0daSStefano Zampini /* Free graph structure */ 864da1bb401SStefano Zampini ierr = PetscFree(pcbddc->mat_graph->xadj);CHKERRQ(ierr); 865da1bb401SStefano Zampini ierr = PetscFree(pcbddc->mat_graph->adjncy);CHKERRQ(ierr); 866142dfd88SStefano Zampini if (pcbddc->mat_graph->nvtxs) { 867da1bb401SStefano Zampini ierr = PetscFree(pcbddc->mat_graph->neighbours_set[0]);CHKERRQ(ierr); 868142dfd88SStefano Zampini } 869da1bb401SStefano Zampini ierr = PetscFree(pcbddc->mat_graph->neighbours_set);CHKERRQ(ierr); 8703972b0daSStefano Zampini ierr = PetscFree4(pcbddc->mat_graph->where,pcbddc->mat_graph->count,pcbddc->mat_graph->cptr,pcbddc->mat_graph->queue);CHKERRQ(ierr); 8713972b0daSStefano Zampini ierr = PetscFree2(pcbddc->mat_graph->which_dof,pcbddc->mat_graph->touched);CHKERRQ(ierr); 8723972b0daSStefano Zampini ierr = PetscFree(pcbddc->mat_graph->where_ncmps);CHKERRQ(ierr); 873da1bb401SStefano Zampini ierr = PetscFree(pcbddc->mat_graph);CHKERRQ(ierr); 8743425bc38SStefano Zampini /* remove functions */ 8754fad6a16SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseningRatio_C","",PETSC_NULL);CHKERRQ(ierr); 8764fad6a16SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetMaxLevels_C","",PETSC_NULL);CHKERRQ(ierr); 8770bdf917eSStefano Zampini 
ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNullSpace_C","",PETSC_NULL);CHKERRQ(ierr); 8783425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDirichletBoundaries_C","",PETSC_NULL);CHKERRQ(ierr); 8793425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNeumannBoundaries_C","",PETSC_NULL);CHKERRQ(ierr); 8803425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetDirichletBoundaries_C","",PETSC_NULL);CHKERRQ(ierr); 8813425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetNeumannBoundaries_C","",PETSC_NULL);CHKERRQ(ierr); 8823425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseProblemType_C","",PETSC_NULL);CHKERRQ(ierr); 8833425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDofsSplitting_C","",PETSC_NULL);CHKERRQ(ierr); 8843425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetLocalAdjacencyGraph_C","",PETSC_NULL);CHKERRQ(ierr); 8853425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPreSolve_C","",PETSC_NULL);CHKERRQ(ierr); 8863425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPostSolve_C","",PETSC_NULL);CHKERRQ(ierr); 8873425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCCreateFETIDPOperators_C","",PETSC_NULL);CHKERRQ(ierr); 8883425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetRHS_C","",PETSC_NULL);CHKERRQ(ierr); 8893425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetSolution_C","",PETSC_NULL);CHKERRQ(ierr); 890da1bb401SStefano Zampini /* Free the private data structure that was hanging off the PC */ 891da1bb401SStefano Zampini ierr = PetscFree(pcbddc);CHKERRQ(ierr); 
892da1bb401SStefano Zampini PetscFunctionReturn(0); 893da1bb401SStefano Zampini } 8943425bc38SStefano Zampini /* -------------------------------------------------------------------------- */ 8953425bc38SStefano Zampini EXTERN_C_BEGIN 8963425bc38SStefano Zampini #undef __FUNCT__ 8973425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetRHS_BDDC" 8983425bc38SStefano Zampini static PetscErrorCode PCBDDCMatFETIDPGetRHS_BDDC(Mat fetidp_mat, Vec standard_rhs, Vec fetidp_flux_rhs) 8993425bc38SStefano Zampini { 9003425bc38SStefano Zampini FETIDPMat_ctx *mat_ctx; 9013425bc38SStefano Zampini PC_IS * pcis; 9023425bc38SStefano Zampini PC_BDDC * pcbddc; 9033425bc38SStefano Zampini PetscErrorCode ierr; 9040c7d97c5SJed Brown 9053425bc38SStefano Zampini PetscFunctionBegin; 9063425bc38SStefano Zampini ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr); 9073425bc38SStefano Zampini pcis = (PC_IS*)mat_ctx->pc->data; 9083425bc38SStefano Zampini pcbddc = (PC_BDDC*)mat_ctx->pc->data; 9093425bc38SStefano Zampini 9103425bc38SStefano Zampini /* change of basis for physical rhs if needed 9113425bc38SStefano Zampini It also changes the rhs in case of dirichlet boundaries */ 9123425bc38SStefano Zampini (*mat_ctx->pc->ops->presolve)(mat_ctx->pc,PETSC_NULL,standard_rhs,PETSC_NULL); 9133425bc38SStefano Zampini /* store vectors for computation of fetidp final solution */ 9143425bc38SStefano Zampini ierr = VecScatterBegin(pcis->global_to_D,standard_rhs,mat_ctx->temp_solution_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 9153425bc38SStefano Zampini ierr = VecScatterEnd (pcis->global_to_D,standard_rhs,mat_ctx->temp_solution_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 9163425bc38SStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 9173425bc38SStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 
9183425bc38SStefano Zampini /* scale rhs since it should be unassembled */ 9193425bc38SStefano Zampini ierr = VecPointwiseMult(mat_ctx->temp_solution_B,pcis->D,mat_ctx->temp_solution_B);CHKERRQ(ierr); 92029622bf0SStefano Zampini if (!pcbddc->inexact_prec_type) { 9213425bc38SStefano Zampini /* compute partially subassembled Schur complement right-hand side */ 9223425bc38SStefano Zampini ierr = KSPSolve(pcbddc->ksp_D,mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr); 9233425bc38SStefano Zampini ierr = MatMult(pcis->A_BI,pcis->vec1_D,pcis->vec1_B);CHKERRQ(ierr); 9243425bc38SStefano Zampini ierr = VecAXPY(mat_ctx->temp_solution_B,-1.0,pcis->vec1_B);CHKERRQ(ierr); 9253425bc38SStefano Zampini ierr = VecSet(standard_rhs,0.0);CHKERRQ(ierr); 9263425bc38SStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,mat_ctx->temp_solution_B,standard_rhs,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 9273425bc38SStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,mat_ctx->temp_solution_B,standard_rhs,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 9283425bc38SStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 9293425bc38SStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 9303425bc38SStefano Zampini ierr = VecPointwiseMult(mat_ctx->temp_solution_B,pcis->D,mat_ctx->temp_solution_B);CHKERRQ(ierr); 9313425bc38SStefano Zampini } 9323425bc38SStefano Zampini /* BDDC rhs */ 9333425bc38SStefano Zampini ierr = VecCopy(mat_ctx->temp_solution_B,pcis->vec1_B);CHKERRQ(ierr); 93429622bf0SStefano Zampini if (pcbddc->inexact_prec_type) { 9353425bc38SStefano Zampini ierr = VecCopy(mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr); 9363425bc38SStefano Zampini } 9373425bc38SStefano Zampini /* apply BDDC */ 9383425bc38SStefano Zampini ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr); 9393425bc38SStefano 
Zampini /* Application of B_delta and assembling of rhs for fetidp fluxes */ 9403425bc38SStefano Zampini ierr = VecSet(fetidp_flux_rhs,0.0);CHKERRQ(ierr); 9413425bc38SStefano Zampini ierr = MatMult(mat_ctx->B_delta,pcis->vec1_B,mat_ctx->lambda_local);CHKERRQ(ierr); 9423425bc38SStefano Zampini ierr = VecScatterBegin(mat_ctx->l2g_lambda,mat_ctx->lambda_local,fetidp_flux_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 9433425bc38SStefano Zampini ierr = VecScatterEnd (mat_ctx->l2g_lambda,mat_ctx->lambda_local,fetidp_flux_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 9443425bc38SStefano Zampini /* restore original rhs */ 9453425bc38SStefano Zampini ierr = VecCopy(pcbddc->original_rhs,standard_rhs);CHKERRQ(ierr); 9463425bc38SStefano Zampini PetscFunctionReturn(0); 9473425bc38SStefano Zampini } 9483425bc38SStefano Zampini EXTERN_C_END 9493425bc38SStefano Zampini #undef __FUNCT__ 9503425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetRHS" 9513425bc38SStefano Zampini /*@ 9523425bc38SStefano Zampini PCBDDCMatFETIDPGetRHS - Get rhs for FETIDP linear system. 
9533425bc38SStefano Zampini 9543425bc38SStefano Zampini Collective 9553425bc38SStefano Zampini 9563425bc38SStefano Zampini Input Parameters: 9573425bc38SStefano Zampini + fetidp_mat - the FETIDP mat obtained by a call to PCBDDCCreateFETIDPOperators 9583425bc38SStefano Zampini + standard_rhs - the rhs of your linear system 9593425bc38SStefano Zampini 9603425bc38SStefano Zampini Output Parameters: 9613425bc38SStefano Zampini + fetidp_flux_rhs - the rhs of the FETIDP linear system 9623425bc38SStefano Zampini 9633425bc38SStefano Zampini Level: developer 9643425bc38SStefano Zampini 9653425bc38SStefano Zampini Notes: 9663425bc38SStefano Zampini 9673425bc38SStefano Zampini .seealso: PCBDDC 9683425bc38SStefano Zampini @*/ 9693425bc38SStefano Zampini PetscErrorCode PCBDDCMatFETIDPGetRHS(Mat fetidp_mat, Vec standard_rhs, Vec fetidp_flux_rhs) 9703425bc38SStefano Zampini { 9713425bc38SStefano Zampini FETIDPMat_ctx *mat_ctx; 9723425bc38SStefano Zampini PetscErrorCode ierr; 9733425bc38SStefano Zampini 9743425bc38SStefano Zampini PetscFunctionBegin; 9753425bc38SStefano Zampini ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr); 9763425bc38SStefano Zampini ierr = PetscTryMethod(mat_ctx->pc,"PCBDDCMatFETIDPGetRHS_C",(Mat,Vec,Vec),(fetidp_mat,standard_rhs,fetidp_flux_rhs));CHKERRQ(ierr); 9773425bc38SStefano Zampini PetscFunctionReturn(0); 9783425bc38SStefano Zampini } 9793425bc38SStefano Zampini /* -------------------------------------------------------------------------- */ 9803425bc38SStefano Zampini EXTERN_C_BEGIN 9813425bc38SStefano Zampini #undef __FUNCT__ 9823425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetSolution_BDDC" 9833425bc38SStefano Zampini static PetscErrorCode PCBDDCMatFETIDPGetSolution_BDDC(Mat fetidp_mat, Vec fetidp_flux_sol, Vec standard_sol) 9843425bc38SStefano Zampini { 9853425bc38SStefano Zampini FETIDPMat_ctx *mat_ctx; 9863425bc38SStefano Zampini PC_IS *pcis; 9873425bc38SStefano Zampini PC_BDDC *pcbddc; 9883425bc38SStefano Zampini 
PetscErrorCode ierr; 9893425bc38SStefano Zampini 9903425bc38SStefano Zampini PetscFunctionBegin; 9913425bc38SStefano Zampini ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr); 9923425bc38SStefano Zampini pcis = (PC_IS*)mat_ctx->pc->data; 9933425bc38SStefano Zampini pcbddc = (PC_BDDC*)mat_ctx->pc->data; 9943425bc38SStefano Zampini 9953425bc38SStefano Zampini /* apply B_delta^T */ 9963425bc38SStefano Zampini ierr = VecScatterBegin(mat_ctx->l2g_lambda,fetidp_flux_sol,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 9973425bc38SStefano Zampini ierr = VecScatterEnd (mat_ctx->l2g_lambda,fetidp_flux_sol,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 9983425bc38SStefano Zampini ierr = MatMultTranspose(mat_ctx->B_delta,mat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr); 9993425bc38SStefano Zampini /* compute rhs for BDDC application */ 10003425bc38SStefano Zampini ierr = VecAYPX(pcis->vec1_B,-1.0,mat_ctx->temp_solution_B);CHKERRQ(ierr); 100129622bf0SStefano Zampini if (pcbddc->inexact_prec_type) { 10023425bc38SStefano Zampini ierr = VecCopy(mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr); 10033425bc38SStefano Zampini } 10043425bc38SStefano Zampini /* apply BDDC */ 10053425bc38SStefano Zampini ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr); 10063425bc38SStefano Zampini /* put values into standard global vector */ 10073425bc38SStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 10083425bc38SStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,pcis->vec1_B,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 100929622bf0SStefano Zampini if (!pcbddc->inexact_prec_type) { 10103425bc38SStefano Zampini /* compute values into the interior if solved for the partially subassembled Schur complement */ 10113425bc38SStefano Zampini ierr = MatMult(pcis->A_IB,pcis->vec1_B,pcis->vec1_D);CHKERRQ(ierr); 10123425bc38SStefano Zampini 
ierr = VecAXPY(mat_ctx->temp_solution_D,-1.0,pcis->vec1_D);CHKERRQ(ierr); 10133425bc38SStefano Zampini ierr = KSPSolve(pcbddc->ksp_D,mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr); 10143425bc38SStefano Zampini } 10153425bc38SStefano Zampini ierr = VecScatterBegin(pcis->global_to_D,pcis->vec1_D,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 10163425bc38SStefano Zampini ierr = VecScatterEnd (pcis->global_to_D,pcis->vec1_D,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 10173425bc38SStefano Zampini /* final change of basis if needed 10183425bc38SStefano Zampini Is also sums the dirichlet part removed during RHS assembling */ 10193425bc38SStefano Zampini (*mat_ctx->pc->ops->postsolve)(mat_ctx->pc,PETSC_NULL,PETSC_NULL,standard_sol); 10203425bc38SStefano Zampini PetscFunctionReturn(0); 10213425bc38SStefano Zampini 10223425bc38SStefano Zampini } 10233425bc38SStefano Zampini EXTERN_C_END 10243425bc38SStefano Zampini #undef __FUNCT__ 10253425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetSolution" 10263425bc38SStefano Zampini /*@ 10273425bc38SStefano Zampini PCBDDCMatFETIDPGetSolution - Get Solution for FETIDP linear system. 
10283425bc38SStefano Zampini 10293425bc38SStefano Zampini Collective 10303425bc38SStefano Zampini 10313425bc38SStefano Zampini Input Parameters: 10323425bc38SStefano Zampini + fetidp_mat - the FETIDP mat obtained by a call to PCBDDCCreateFETIDPOperators 10333425bc38SStefano Zampini + fetidp_flux_sol - the solution of the FETIDP linear system 10343425bc38SStefano Zampini 10353425bc38SStefano Zampini Output Parameters: 10363425bc38SStefano Zampini + standard_sol - the solution on the global domain 10373425bc38SStefano Zampini 10383425bc38SStefano Zampini Level: developer 10393425bc38SStefano Zampini 10403425bc38SStefano Zampini Notes: 10413425bc38SStefano Zampini 10423425bc38SStefano Zampini .seealso: PCBDDC 10433425bc38SStefano Zampini @*/ 10443425bc38SStefano Zampini PetscErrorCode PCBDDCMatFETIDPGetSolution(Mat fetidp_mat, Vec fetidp_flux_sol, Vec standard_sol) 10453425bc38SStefano Zampini { 10463425bc38SStefano Zampini FETIDPMat_ctx *mat_ctx; 10473425bc38SStefano Zampini PetscErrorCode ierr; 10483425bc38SStefano Zampini 10493425bc38SStefano Zampini PetscFunctionBegin; 10503425bc38SStefano Zampini ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr); 10513425bc38SStefano Zampini ierr = PetscTryMethod(mat_ctx->pc,"PCBDDCMatFETIDPGetSolution_C",(Mat,Vec,Vec),(fetidp_mat,fetidp_flux_sol,standard_sol));CHKERRQ(ierr); 10523425bc38SStefano Zampini PetscFunctionReturn(0); 10533425bc38SStefano Zampini } 10543425bc38SStefano Zampini /* -------------------------------------------------------------------------- */ 10553425bc38SStefano Zampini EXTERN_C_BEGIN 1056f23aa3ddSBarry Smith extern PetscErrorCode FETIDPMatMult(Mat,Vec,Vec); 1057f23aa3ddSBarry Smith extern PetscErrorCode PCBDDCDestroyFETIDPMat(Mat); 1058f23aa3ddSBarry Smith extern PetscErrorCode FETIDPPCApply(PC,Vec,Vec); 1059f23aa3ddSBarry Smith extern PetscErrorCode PCBDDCDestroyFETIDPPC(PC); 10603425bc38SStefano Zampini #undef __FUNCT__ 10613425bc38SStefano Zampini #define __FUNCT__ 
"PCBDDCCreateFETIDPOperators_BDDC" 10623425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPOperators_BDDC(PC pc, Mat *fetidp_mat, PC *fetidp_pc) 10633425bc38SStefano Zampini { 10643425bc38SStefano Zampini FETIDPMat_ctx *fetidpmat_ctx; 10653425bc38SStefano Zampini Mat newmat; 10663425bc38SStefano Zampini FETIDPPC_ctx *fetidppc_ctx; 10673425bc38SStefano Zampini PC newpc; 10683425bc38SStefano Zampini MPI_Comm comm = ((PetscObject)pc)->comm; 10693425bc38SStefano Zampini PetscErrorCode ierr; 10703425bc38SStefano Zampini 10713425bc38SStefano Zampini PetscFunctionBegin; 10723425bc38SStefano Zampini /* FETIDP linear matrix */ 10733425bc38SStefano Zampini ierr = PCBDDCCreateFETIDPMatContext(pc, &fetidpmat_ctx);CHKERRQ(ierr); 10743425bc38SStefano Zampini ierr = PCBDDCSetupFETIDPMatContext(fetidpmat_ctx);CHKERRQ(ierr); 10753425bc38SStefano Zampini ierr = MatCreateShell(comm,PETSC_DECIDE,PETSC_DECIDE,fetidpmat_ctx->n_lambda,fetidpmat_ctx->n_lambda,fetidpmat_ctx,&newmat);CHKERRQ(ierr); 10763425bc38SStefano Zampini ierr = MatShellSetOperation(newmat,MATOP_MULT,(void (*)(void))FETIDPMatMult);CHKERRQ(ierr); 10773425bc38SStefano Zampini ierr = MatShellSetOperation(newmat,MATOP_DESTROY,(void (*)(void))PCBDDCDestroyFETIDPMat);CHKERRQ(ierr); 10783425bc38SStefano Zampini ierr = MatSetUp(newmat);CHKERRQ(ierr); 10793425bc38SStefano Zampini /* FETIDP preconditioner */ 10803425bc38SStefano Zampini ierr = PCBDDCCreateFETIDPPCContext(pc, &fetidppc_ctx);CHKERRQ(ierr); 10813425bc38SStefano Zampini ierr = PCBDDCSetupFETIDPPCContext(newmat,fetidppc_ctx);CHKERRQ(ierr); 10823425bc38SStefano Zampini ierr = PCCreate(comm,&newpc);CHKERRQ(ierr); 10833425bc38SStefano Zampini ierr = PCSetType(newpc,PCSHELL);CHKERRQ(ierr); 10843425bc38SStefano Zampini ierr = PCShellSetContext(newpc,fetidppc_ctx);CHKERRQ(ierr); 10853425bc38SStefano Zampini ierr = PCShellSetApply(newpc,FETIDPPCApply);CHKERRQ(ierr); 10863425bc38SStefano Zampini ierr = 
PCShellSetDestroy(newpc,PCBDDCDestroyFETIDPPC);CHKERRQ(ierr); 10873425bc38SStefano Zampini ierr = PCSetOperators(newpc,newmat,newmat,SAME_PRECONDITIONER);CHKERRQ(ierr); 10883425bc38SStefano Zampini ierr = PCSetUp(newpc);CHKERRQ(ierr); 10892fa5cd67SKarl Rupp 10903425bc38SStefano Zampini /* return pointers for objects created */ 10913425bc38SStefano Zampini *fetidp_mat = newmat; 10923425bc38SStefano Zampini *fetidp_pc = newpc; 10933425bc38SStefano Zampini PetscFunctionReturn(0); 10943425bc38SStefano Zampini } 10953425bc38SStefano Zampini EXTERN_C_END 10963425bc38SStefano Zampini #undef __FUNCT__ 10973425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPOperators" 10983425bc38SStefano Zampini /*@ 10993425bc38SStefano Zampini PCBDDCCreateFETIDPOperators - Create operators for FETIDP. 11003425bc38SStefano Zampini 11013425bc38SStefano Zampini Collective 11023425bc38SStefano Zampini 11033425bc38SStefano Zampini Input Parameters: 11043425bc38SStefano Zampini + pc - the BDDC preconditioning context (setup must be already called) 11053425bc38SStefano Zampini 11063425bc38SStefano Zampini Level: developer 11073425bc38SStefano Zampini 11083425bc38SStefano Zampini Notes: 11093425bc38SStefano Zampini 11103425bc38SStefano Zampini .seealso: PCBDDC 11113425bc38SStefano Zampini @*/ 11123425bc38SStefano Zampini PetscErrorCode PCBDDCCreateFETIDPOperators(PC pc, Mat *fetidp_mat, PC *fetidp_pc) 11133425bc38SStefano Zampini { 11143425bc38SStefano Zampini PetscErrorCode ierr; 11153425bc38SStefano Zampini 11163425bc38SStefano Zampini PetscFunctionBegin; 11173425bc38SStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 11183425bc38SStefano Zampini if (pc->setupcalled) { 11193425bc38SStefano Zampini ierr = PetscTryMethod(pc,"PCBDDCCreateFETIDPOperators_C",(PC,Mat*,PC*),(pc,fetidp_mat,fetidp_pc));CHKERRQ(ierr); 1120f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"You must call PCSetup_BDDC() first \n"); 11213425bc38SStefano Zampini PetscFunctionReturn(0); 
11223425bc38SStefano Zampini } 11230c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 1124da1bb401SStefano Zampini /*MC 1125da1bb401SStefano Zampini PCBDDC - Balancing Domain Decomposition by Constraints. 11260c7d97c5SJed Brown 1127da1bb401SStefano Zampini Options Database Keys: 1128da1bb401SStefano Zampini . -pcbddc ??? - 1129da1bb401SStefano Zampini 1130da1bb401SStefano Zampini Level: intermediate 1131da1bb401SStefano Zampini 1132da1bb401SStefano Zampini Notes: The matrix used with this preconditioner must be of type MATIS 1133da1bb401SStefano Zampini 1134da1bb401SStefano Zampini Unlike more 'conventional' interface preconditioners, this iterates over ALL the 1135da1bb401SStefano Zampini degrees of freedom, NOT just those on the interface (this allows the use of approximate solvers 1136da1bb401SStefano Zampini on the subdomains). 1137da1bb401SStefano Zampini 1138da1bb401SStefano Zampini Options for the coarse grid preconditioner can be set with - 1139da1bb401SStefano Zampini Options for the Dirichlet subproblem can be set with - 1140da1bb401SStefano Zampini Options for the Neumann subproblem can be set with - 1141da1bb401SStefano Zampini 1142da1bb401SStefano Zampini Contributed by Stefano Zampini 1143da1bb401SStefano Zampini 1144da1bb401SStefano Zampini .seealso: PCCreate(), PCSetType(), PCType (for list of available types), PC, MATIS 1145da1bb401SStefano Zampini M*/ 1146da1bb401SStefano Zampini EXTERN_C_BEGIN 1147da1bb401SStefano Zampini #undef __FUNCT__ 1148da1bb401SStefano Zampini #define __FUNCT__ "PCCreate_BDDC" 1149da1bb401SStefano Zampini PetscErrorCode PCCreate_BDDC(PC pc) 1150da1bb401SStefano Zampini { 1151da1bb401SStefano Zampini PetscErrorCode ierr; 1152da1bb401SStefano Zampini PC_BDDC *pcbddc; 1153da1bb401SStefano Zampini PCBDDCGraph mat_graph; 1154da1bb401SStefano Zampini 1155da1bb401SStefano Zampini PetscFunctionBegin; 1156da1bb401SStefano Zampini /* Creates the private data structure for this 
preconditioner and attach it to the PC object. */ 1157da1bb401SStefano Zampini ierr = PetscNewLog(pc,PC_BDDC,&pcbddc);CHKERRQ(ierr); 1158da1bb401SStefano Zampini pc->data = (void*)pcbddc; 1159da1bb401SStefano Zampini 1160da1bb401SStefano Zampini /* create PCIS data structure */ 1161da1bb401SStefano Zampini ierr = PCISCreate(pc);CHKERRQ(ierr); 1162da1bb401SStefano Zampini 1163da1bb401SStefano Zampini /* BDDC specific */ 11640bdf917eSStefano Zampini pcbddc->CoarseNullSpace = 0; 11650bdf917eSStefano Zampini pcbddc->NullSpace = 0; 11663972b0daSStefano Zampini pcbddc->temp_solution = 0; 1167534831adSStefano Zampini pcbddc->original_rhs = 0; 1168534831adSStefano Zampini pcbddc->local_mat = 0; 1169534831adSStefano Zampini pcbddc->ChangeOfBasisMatrix = 0; 1170534831adSStefano Zampini pcbddc->usechangeofbasis = PETSC_TRUE; 1171534831adSStefano Zampini pcbddc->usechangeonfaces = PETSC_FALSE; 1172da1bb401SStefano Zampini pcbddc->coarse_vec = 0; 1173da1bb401SStefano Zampini pcbddc->coarse_rhs = 0; 1174da1bb401SStefano Zampini pcbddc->coarse_ksp = 0; 1175da1bb401SStefano Zampini pcbddc->coarse_phi_B = 0; 1176da1bb401SStefano Zampini pcbddc->coarse_phi_D = 0; 1177da1bb401SStefano Zampini pcbddc->vec1_P = 0; 1178da1bb401SStefano Zampini pcbddc->vec1_R = 0; 1179da1bb401SStefano Zampini pcbddc->vec2_R = 0; 1180da1bb401SStefano Zampini pcbddc->local_auxmat1 = 0; 1181da1bb401SStefano Zampini pcbddc->local_auxmat2 = 0; 1182da1bb401SStefano Zampini pcbddc->R_to_B = 0; 1183da1bb401SStefano Zampini pcbddc->R_to_D = 0; 1184da1bb401SStefano Zampini pcbddc->ksp_D = 0; 1185da1bb401SStefano Zampini pcbddc->ksp_R = 0; 1186da1bb401SStefano Zampini pcbddc->local_primal_indices = 0; 118729622bf0SStefano Zampini pcbddc->inexact_prec_type = PETSC_FALSE; 1188da1bb401SStefano Zampini pcbddc->NeumannBoundaries = 0; 1189da1bb401SStefano Zampini pcbddc->ISForDofs = 0; 1190da1bb401SStefano Zampini pcbddc->ISForVertices = 0; 1191da1bb401SStefano Zampini pcbddc->n_ISForFaces = 0; 1192da1bb401SStefano 
Zampini pcbddc->n_ISForEdges = 0; 1193da1bb401SStefano Zampini pcbddc->ConstraintMatrix = 0; 1194da1bb401SStefano Zampini pcbddc->use_nnsp_true = PETSC_FALSE; 1195da1bb401SStefano Zampini pcbddc->local_primal_sizes = 0; 1196da1bb401SStefano Zampini pcbddc->local_primal_displacements = 0; 1197da1bb401SStefano Zampini pcbddc->replicated_local_primal_indices = 0; 1198da1bb401SStefano Zampini pcbddc->replicated_local_primal_values = 0; 1199da1bb401SStefano Zampini pcbddc->coarse_loc_to_glob = 0; 1200da1bb401SStefano Zampini pcbddc->dbg_flag = PETSC_FALSE; 1201da1bb401SStefano Zampini pcbddc->coarsening_ratio = 8; 1202b76ba322SStefano Zampini pcbddc->use_exact_dirichlet = PETSC_TRUE; 12034fad6a16SStefano Zampini pcbddc->current_level = 0; 12044fad6a16SStefano Zampini pcbddc->max_levels = 1; 1205da1bb401SStefano Zampini 1206da1bb401SStefano Zampini /* allocate and initialize needed graph structure */ 1207da1bb401SStefano Zampini ierr = PetscMalloc(sizeof(*mat_graph),&pcbddc->mat_graph);CHKERRQ(ierr); 1208da1bb401SStefano Zampini pcbddc->mat_graph->xadj = 0; 1209da1bb401SStefano Zampini pcbddc->mat_graph->adjncy = 0; 1210da1bb401SStefano Zampini 1211da1bb401SStefano Zampini /* function pointers */ 1212da1bb401SStefano Zampini pc->ops->apply = PCApply_BDDC; 1213da1bb401SStefano Zampini pc->ops->applytranspose = 0; 1214da1bb401SStefano Zampini pc->ops->setup = PCSetUp_BDDC; 1215da1bb401SStefano Zampini pc->ops->destroy = PCDestroy_BDDC; 1216da1bb401SStefano Zampini pc->ops->setfromoptions = PCSetFromOptions_BDDC; 1217da1bb401SStefano Zampini pc->ops->view = 0; 1218da1bb401SStefano Zampini pc->ops->applyrichardson = 0; 1219da1bb401SStefano Zampini pc->ops->applysymmetricleft = 0; 1220da1bb401SStefano Zampini pc->ops->applysymmetricright = 0; 1221534831adSStefano Zampini pc->ops->presolve = PCPreSolve_BDDC; 1222534831adSStefano Zampini pc->ops->postsolve = PCPostSolve_BDDC; 1223da1bb401SStefano Zampini 1224da1bb401SStefano Zampini /* composing function */ 12254fad6a16SStefano 
Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseningRatio_C","PCBDDCSetCoarseningRatio_BDDC", 12264fad6a16SStefano Zampini PCBDDCSetCoarseningRatio_BDDC);CHKERRQ(ierr); 12274fad6a16SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetMaxLevels_C","PCBDDCSetMaxLevels_BDDC", 12284fad6a16SStefano Zampini PCBDDCSetMaxLevels_BDDC);CHKERRQ(ierr); 12290bdf917eSStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNullSpace_C","PCBDDCSetNullSpace_BDDC", 12300bdf917eSStefano Zampini PCBDDCSetNullSpace_BDDC);CHKERRQ(ierr); 1231da1bb401SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDirichletBoundaries_C","PCBDDCSetDirichletBoundaries_BDDC", 1232da1bb401SStefano Zampini PCBDDCSetDirichletBoundaries_BDDC);CHKERRQ(ierr); 1233da1bb401SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNeumannBoundaries_C","PCBDDCSetNeumannBoundaries_BDDC", 1234da1bb401SStefano Zampini PCBDDCSetNeumannBoundaries_BDDC);CHKERRQ(ierr); 1235da1bb401SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetDirichletBoundaries_C","PCBDDCGetDirichletBoundaries_BDDC", 1236da1bb401SStefano Zampini PCBDDCGetDirichletBoundaries_BDDC);CHKERRQ(ierr); 1237da1bb401SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetNeumannBoundaries_C","PCBDDCGetNeumannBoundaries_BDDC", 1238da1bb401SStefano Zampini PCBDDCGetNeumannBoundaries_BDDC);CHKERRQ(ierr); 1239da1bb401SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseProblemType_C","PCBDDCSetCoarseProblemType_BDDC", 1240da1bb401SStefano Zampini PCBDDCSetCoarseProblemType_BDDC);CHKERRQ(ierr); 1241da1bb401SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDofsSplitting_C","PCBDDCSetDofsSplitting_BDDC", 1242da1bb401SStefano Zampini PCBDDCSetDofsSplitting_BDDC);CHKERRQ(ierr); 
1243da1bb401SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetLocalAdjacencyGraph_C","PCBDDCSetLocalAdjacencyGraph_BDDC", 1244da1bb401SStefano Zampini PCBDDCSetLocalAdjacencyGraph_BDDC);CHKERRQ(ierr); 1245534831adSStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPreSolve_C","PCPreSolve_BDDC", 1246534831adSStefano Zampini PCPreSolve_BDDC);CHKERRQ(ierr); 1247534831adSStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPostSolve_C","PCPostSolve_BDDC", 1248534831adSStefano Zampini PCPostSolve_BDDC);CHKERRQ(ierr); 12493425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCCreateFETIDPOperators_C","PCBDDCCreateFETIDPOperators_BDDC", 12503425bc38SStefano Zampini PCBDDCCreateFETIDPOperators_BDDC);CHKERRQ(ierr); 12513425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetRHS_C","PCBDDCMatFETIDPGetRHS_BDDC", 12523425bc38SStefano Zampini PCBDDCMatFETIDPGetRHS_BDDC);CHKERRQ(ierr); 12533425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetSolution_C","PCBDDCMatFETIDPGetSolution_BDDC", 12543425bc38SStefano Zampini PCBDDCMatFETIDPGetSolution_BDDC);CHKERRQ(ierr); 1255da1bb401SStefano Zampini PetscFunctionReturn(0); 1256da1bb401SStefano Zampini } 1257da1bb401SStefano Zampini EXTERN_C_END 12583425bc38SStefano Zampini 1259da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */ 1260da1bb401SStefano Zampini /* All static functions from now on */ 1261da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */ 12624fad6a16SStefano Zampini #undef __FUNCT__ 126329622bf0SStefano Zampini #define __FUNCT__ "PCBDDCApplyNullSpaceCorrectionPC" 126429622bf0SStefano Zampini static PetscErrorCode PCBDDCApplyNullSpaceCorrectionPC(PC pc,Vec x,Vec y) 126529622bf0SStefano Zampini { 
126629622bf0SStefano Zampini NullSpaceCorrection_ctx *pc_ctx; 126729622bf0SStefano Zampini PetscErrorCode ierr; 126829622bf0SStefano Zampini 126929622bf0SStefano Zampini PetscFunctionBegin; 127029622bf0SStefano Zampini ierr = PCShellGetContext(pc,(void**)&pc_ctx);CHKERRQ(ierr); 127129622bf0SStefano Zampini /* E */ 127229622bf0SStefano Zampini ierr = MatMultTranspose(pc_ctx->Lbasis_mat,x,pc_ctx->work_small_2);CHKERRQ(ierr); 127329622bf0SStefano Zampini ierr = MatMultAdd(pc_ctx->Kbasis_mat,pc_ctx->work_small_2,x,pc_ctx->work_full_1);CHKERRQ(ierr); 127429622bf0SStefano Zampini /* P^-1 */ 127529622bf0SStefano Zampini ierr = PCApply(pc_ctx->local_pc,pc_ctx->work_full_1,pc_ctx->work_full_2);CHKERRQ(ierr); 127629622bf0SStefano Zampini /* E^T */ 127729622bf0SStefano Zampini ierr = MatMultTranspose(pc_ctx->Kbasis_mat,pc_ctx->work_full_2,pc_ctx->work_small_1);CHKERRQ(ierr); 127829622bf0SStefano Zampini ierr = VecScale(pc_ctx->work_small_1,-1.0);CHKERRQ(ierr); 127929622bf0SStefano Zampini ierr = MatMultAdd(pc_ctx->Lbasis_mat,pc_ctx->work_small_1,pc_ctx->work_full_2,pc_ctx->work_full_1);CHKERRQ(ierr); 128029622bf0SStefano Zampini /* Sum contributions */ 128129622bf0SStefano Zampini ierr = MatMultAdd(pc_ctx->basis_mat,pc_ctx->work_small_2,pc_ctx->work_full_1,y);CHKERRQ(ierr); 128229622bf0SStefano Zampini PetscFunctionReturn(0); 128329622bf0SStefano Zampini } 128429622bf0SStefano Zampini 128529622bf0SStefano Zampini #undef __FUNCT__ 128629622bf0SStefano Zampini #define __FUNCT__ "PCBDDCDestroyNullSpaceCorrectionPC" 128729622bf0SStefano Zampini static PetscErrorCode PCBDDCDestroyNullSpaceCorrectionPC(PC pc) 128829622bf0SStefano Zampini { 128929622bf0SStefano Zampini NullSpaceCorrection_ctx *pc_ctx; 129029622bf0SStefano Zampini PetscErrorCode ierr; 129129622bf0SStefano Zampini 129229622bf0SStefano Zampini PetscFunctionBegin; 129329622bf0SStefano Zampini ierr = PCShellGetContext(pc,(void**)&pc_ctx);CHKERRQ(ierr); 129429622bf0SStefano Zampini ierr = 
VecDestroy(&pc_ctx->work_small_1);CHKERRQ(ierr); 129529622bf0SStefano Zampini ierr = VecDestroy(&pc_ctx->work_small_2);CHKERRQ(ierr); 129629622bf0SStefano Zampini ierr = VecDestroy(&pc_ctx->work_full_1);CHKERRQ(ierr); 129729622bf0SStefano Zampini ierr = VecDestroy(&pc_ctx->work_full_2);CHKERRQ(ierr); 129829622bf0SStefano Zampini ierr = MatDestroy(&pc_ctx->basis_mat);CHKERRQ(ierr); 129929622bf0SStefano Zampini ierr = MatDestroy(&pc_ctx->Lbasis_mat);CHKERRQ(ierr); 130029622bf0SStefano Zampini ierr = MatDestroy(&pc_ctx->Kbasis_mat);CHKERRQ(ierr); 130129622bf0SStefano Zampini ierr = PCDestroy(&pc_ctx->local_pc);CHKERRQ(ierr); 130229622bf0SStefano Zampini ierr = PetscFree(pc_ctx);CHKERRQ(ierr); 130329622bf0SStefano Zampini PetscFunctionReturn(0); 130429622bf0SStefano Zampini } 130529622bf0SStefano Zampini 130629622bf0SStefano Zampini #undef __FUNCT__ 130729622bf0SStefano Zampini #define __FUNCT__ "PCBDDCAdaptLocalProblem" 130829622bf0SStefano Zampini static PetscErrorCode PCBDDCAdaptLocalProblem(PC pc,IS local_dofs) 130929622bf0SStefano Zampini { 1310f23aa3ddSBarry Smith extern PetscErrorCode PCBDDCApplyNullSpaceCorrectionPC(PC,Vec,Vec); 1311f23aa3ddSBarry Smith extern PetscErrorCode PCBDDCDestroyNullSpaceCorrectionPC(PC); 131229622bf0SStefano Zampini 131329622bf0SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 131429622bf0SStefano Zampini PC_IS *pcis = (PC_IS*)pc->data; 131529622bf0SStefano Zampini Mat_IS * matis = (Mat_IS*)pc->pmat->data; 131629622bf0SStefano Zampini KSP *local_ksp; 131729622bf0SStefano Zampini PC newpc; 131829622bf0SStefano Zampini NullSpaceCorrection_ctx *shell_ctx; 131929622bf0SStefano Zampini Mat local_mat,local_pmat,small_mat,inv_small_mat; 132029622bf0SStefano Zampini MatStructure local_mat_struct; 132129622bf0SStefano Zampini Vec work1,work2,work3; 132229622bf0SStefano Zampini const Vec *nullvecs; 132329622bf0SStefano Zampini VecScatter scatter_ctx; 132429622bf0SStefano Zampini IS is_aux; 132529622bf0SStefano Zampini MatFactorInfo 
matinfo; 132629622bf0SStefano Zampini PetscScalar *basis_mat,*Kbasis_mat,*array,*array_mat; 132729622bf0SStefano Zampini PetscScalar one = 1.0,zero = 0.0, m_one = -1.0; 132829622bf0SStefano Zampini PetscInt basis_dofs,basis_size,nnsp_size,i,k,n_I,n_R; 132929622bf0SStefano Zampini PetscBool nnsp_has_cnst; 133029622bf0SStefano Zampini PetscErrorCode ierr; 133129622bf0SStefano Zampini 133229622bf0SStefano Zampini PetscFunctionBegin; 133329622bf0SStefano Zampini /* Infer the local solver */ 133429622bf0SStefano Zampini ierr = ISGetSize(local_dofs,&basis_dofs);CHKERRQ(ierr); 133529622bf0SStefano Zampini ierr = VecGetSize(pcis->vec1_D,&n_I);CHKERRQ(ierr); 133629622bf0SStefano Zampini ierr = VecGetSize(pcbddc->vec1_R,&n_R);CHKERRQ(ierr); 133729622bf0SStefano Zampini if (basis_dofs == n_I) { 133829622bf0SStefano Zampini /* Dirichlet solver */ 133929622bf0SStefano Zampini local_ksp = &pcbddc->ksp_D; 134029622bf0SStefano Zampini } else if (basis_dofs == n_R) { 134129622bf0SStefano Zampini /* Neumann solver */ 134229622bf0SStefano Zampini local_ksp = &pcbddc->ksp_R; 1343f23aa3ddSBarry Smith } else SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in %s: unknown local IS size %d. 
n_I=%d, n_R=%d)\n",basis_dofs,n_I,n_R); 134429622bf0SStefano Zampini ierr = KSPGetOperators(*local_ksp,&local_mat,&local_pmat,&local_mat_struct);CHKERRQ(ierr); 134529622bf0SStefano Zampini 134629622bf0SStefano Zampini /* Get null space vecs */ 134729622bf0SStefano Zampini ierr = MatNullSpaceGetVecs(pcbddc->NullSpace,&nnsp_has_cnst,&nnsp_size,&nullvecs);CHKERRQ(ierr); 134829622bf0SStefano Zampini basis_size = nnsp_size; 13492fa5cd67SKarl Rupp if (nnsp_has_cnst) basis_size++; 135029622bf0SStefano Zampini 135129622bf0SStefano Zampini /* Create shell ctx */ 135229622bf0SStefano Zampini ierr = PetscMalloc(sizeof(*shell_ctx),&shell_ctx);CHKERRQ(ierr); 135329622bf0SStefano Zampini 135429622bf0SStefano Zampini /* Create work vectors in shell context */ 135529622bf0SStefano Zampini ierr = VecCreate(PETSC_COMM_SELF,&shell_ctx->work_small_1);CHKERRQ(ierr); 135629622bf0SStefano Zampini ierr = VecSetSizes(shell_ctx->work_small_1,basis_size,basis_size);CHKERRQ(ierr); 135729622bf0SStefano Zampini ierr = VecSetType(shell_ctx->work_small_1,VECSEQ);CHKERRQ(ierr); 135829622bf0SStefano Zampini ierr = VecDuplicate(shell_ctx->work_small_1,&shell_ctx->work_small_2);CHKERRQ(ierr); 135929622bf0SStefano Zampini ierr = VecCreate(PETSC_COMM_SELF,&shell_ctx->work_full_1);CHKERRQ(ierr); 136029622bf0SStefano Zampini ierr = VecSetSizes(shell_ctx->work_full_1,basis_dofs,basis_dofs);CHKERRQ(ierr); 136129622bf0SStefano Zampini ierr = VecSetType(shell_ctx->work_full_1,VECSEQ);CHKERRQ(ierr); 136229622bf0SStefano Zampini ierr = VecDuplicate(shell_ctx->work_full_1,&shell_ctx->work_full_2);CHKERRQ(ierr); 136329622bf0SStefano Zampini 136429622bf0SStefano Zampini /* Allocate workspace */ 136529622bf0SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,basis_dofs,basis_size,PETSC_NULL,&shell_ctx->basis_mat);CHKERRQ(ierr); 136629622bf0SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,basis_dofs,basis_size,PETSC_NULL,&shell_ctx->Kbasis_mat);CHKERRQ(ierr); 136729622bf0SStefano Zampini ierr = 
MatDenseGetArray(shell_ctx->basis_mat,&basis_mat);CHKERRQ(ierr); 136829622bf0SStefano Zampini ierr = MatDenseGetArray(shell_ctx->Kbasis_mat,&Kbasis_mat);CHKERRQ(ierr); 136929622bf0SStefano Zampini 137029622bf0SStefano Zampini /* Restrict local null space on selected dofs (Dirichlet or Neumann) 137129622bf0SStefano Zampini and compute matrices N and K*N */ 137229622bf0SStefano Zampini ierr = VecDuplicate(shell_ctx->work_full_1,&work1);CHKERRQ(ierr); 137329622bf0SStefano Zampini ierr = VecDuplicate(shell_ctx->work_full_1,&work2);CHKERRQ(ierr); 137429622bf0SStefano Zampini ierr = VecScatterCreate(pcis->vec1_N,local_dofs,work1,(IS)0,&scatter_ctx);CHKERRQ(ierr); 137529622bf0SStefano Zampini k = 0; 137629622bf0SStefano Zampini for (; k<nnsp_size; k++) { 137729622bf0SStefano Zampini ierr = VecScatterBegin(matis->ctx,nullvecs[k],pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 137829622bf0SStefano Zampini ierr = VecScatterEnd(matis->ctx,nullvecs[k],pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 137929622bf0SStefano Zampini ierr = VecPlaceArray(work1,(const PetscScalar*)&basis_mat[k*basis_dofs]);CHKERRQ(ierr); 138029622bf0SStefano Zampini ierr = VecScatterBegin(scatter_ctx,pcis->vec1_N,work1,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 138129622bf0SStefano Zampini ierr = VecScatterEnd(scatter_ctx,pcis->vec1_N,work1,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 138229622bf0SStefano Zampini ierr = VecPlaceArray(work2,(const PetscScalar*)&Kbasis_mat[k*basis_dofs]);CHKERRQ(ierr); 138329622bf0SStefano Zampini ierr = MatMult(local_mat,work1,work2);CHKERRQ(ierr); 138429622bf0SStefano Zampini ierr = VecResetArray(work1);CHKERRQ(ierr); 138529622bf0SStefano Zampini ierr = VecResetArray(work2);CHKERRQ(ierr); 138629622bf0SStefano Zampini } 138729622bf0SStefano Zampini if (nnsp_has_cnst) { 138829622bf0SStefano Zampini ierr = VecPlaceArray(work1,(const PetscScalar*)&basis_mat[k*basis_dofs]);CHKERRQ(ierr); 138929622bf0SStefano Zampini ierr = 
VecSet(work1,one);CHKERRQ(ierr); 139029622bf0SStefano Zampini ierr = VecPlaceArray(work2,(const PetscScalar*)&Kbasis_mat[k*basis_dofs]);CHKERRQ(ierr); 139129622bf0SStefano Zampini ierr = MatMult(local_mat,work1,work2);CHKERRQ(ierr); 139229622bf0SStefano Zampini ierr = VecResetArray(work1);CHKERRQ(ierr); 139329622bf0SStefano Zampini ierr = VecResetArray(work2);CHKERRQ(ierr); 139429622bf0SStefano Zampini } 139529622bf0SStefano Zampini ierr = VecDestroy(&work1);CHKERRQ(ierr); 139629622bf0SStefano Zampini ierr = VecDestroy(&work2);CHKERRQ(ierr); 139729622bf0SStefano Zampini ierr = VecScatterDestroy(&scatter_ctx);CHKERRQ(ierr); 139829622bf0SStefano Zampini ierr = MatDenseRestoreArray(shell_ctx->basis_mat,&basis_mat);CHKERRQ(ierr); 139929622bf0SStefano Zampini ierr = MatDenseRestoreArray(shell_ctx->Kbasis_mat,&Kbasis_mat);CHKERRQ(ierr); 140029622bf0SStefano Zampini 140129622bf0SStefano Zampini /* Assemble another Mat object in shell context */ 140229622bf0SStefano Zampini ierr = MatTransposeMatMult(shell_ctx->basis_mat,shell_ctx->Kbasis_mat,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&small_mat);CHKERRQ(ierr); 140329622bf0SStefano Zampini ierr = MatFactorInfoInitialize(&matinfo);CHKERRQ(ierr); 140429622bf0SStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,basis_size,0,1,&is_aux);CHKERRQ(ierr); 140529622bf0SStefano Zampini ierr = MatLUFactor(small_mat,is_aux,is_aux,&matinfo);CHKERRQ(ierr); 140629622bf0SStefano Zampini ierr = ISDestroy(&is_aux);CHKERRQ(ierr); 140729622bf0SStefano Zampini ierr = PetscMalloc(basis_size*basis_size*sizeof(PetscScalar),&array_mat);CHKERRQ(ierr); 140829622bf0SStefano Zampini for (k=0; k<basis_size; k++) { 140929622bf0SStefano Zampini ierr = VecSet(shell_ctx->work_small_1,zero);CHKERRQ(ierr); 141029622bf0SStefano Zampini ierr = VecSetValue(shell_ctx->work_small_1,k,one,INSERT_VALUES);CHKERRQ(ierr); 141129622bf0SStefano Zampini ierr = VecAssemblyBegin(shell_ctx->work_small_1);CHKERRQ(ierr); 141229622bf0SStefano Zampini ierr = 
VecAssemblyEnd(shell_ctx->work_small_1);CHKERRQ(ierr); 141329622bf0SStefano Zampini ierr = MatSolve(small_mat,shell_ctx->work_small_1,shell_ctx->work_small_2);CHKERRQ(ierr); 141429622bf0SStefano Zampini ierr = VecGetArray(shell_ctx->work_small_2,&array);CHKERRQ(ierr); 14152fa5cd67SKarl Rupp for (i=0; i<basis_size; i++) array_mat[i*basis_size+k]=array[i]; 141629622bf0SStefano Zampini ierr = VecRestoreArray(shell_ctx->work_small_2,&array);CHKERRQ(ierr); 141729622bf0SStefano Zampini } 141829622bf0SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,basis_size,basis_size,array_mat,&inv_small_mat);CHKERRQ(ierr); 141929622bf0SStefano Zampini ierr = MatMatMult(shell_ctx->basis_mat,inv_small_mat,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&shell_ctx->Lbasis_mat);CHKERRQ(ierr); 142029622bf0SStefano Zampini ierr = PetscFree(array_mat);CHKERRQ(ierr); 142129622bf0SStefano Zampini ierr = MatDestroy(&inv_small_mat);CHKERRQ(ierr); 142229622bf0SStefano Zampini ierr = MatDestroy(&small_mat);CHKERRQ(ierr); 142329622bf0SStefano Zampini ierr = MatScale(shell_ctx->Kbasis_mat,m_one);CHKERRQ(ierr); 142429622bf0SStefano Zampini 142529622bf0SStefano Zampini /* Rebuild local PC */ 142629622bf0SStefano Zampini ierr = KSPGetPC(*local_ksp,&shell_ctx->local_pc);CHKERRQ(ierr); 142729622bf0SStefano Zampini ierr = PetscObjectReference((PetscObject)shell_ctx->local_pc);CHKERRQ(ierr); 142829622bf0SStefano Zampini ierr = PCCreate(PETSC_COMM_SELF,&newpc);CHKERRQ(ierr); 142929622bf0SStefano Zampini ierr = PCSetOperators(newpc,local_mat,local_mat,SAME_PRECONDITIONER);CHKERRQ(ierr); 143029622bf0SStefano Zampini ierr = PCSetType(newpc,PCSHELL);CHKERRQ(ierr); 143129622bf0SStefano Zampini ierr = PCShellSetContext(newpc,shell_ctx);CHKERRQ(ierr); 143229622bf0SStefano Zampini ierr = PCShellSetApply(newpc,PCBDDCApplyNullSpaceCorrectionPC);CHKERRQ(ierr); 143329622bf0SStefano Zampini ierr = PCShellSetDestroy(newpc,PCBDDCDestroyNullSpaceCorrectionPC);CHKERRQ(ierr); 143429622bf0SStefano Zampini ierr = 
PCSetUp(newpc);CHKERRQ(ierr); 143529622bf0SStefano Zampini ierr = KSPSetPC(*local_ksp,newpc);CHKERRQ(ierr); 143629622bf0SStefano Zampini ierr = PCDestroy(&newpc);CHKERRQ(ierr); 143729622bf0SStefano Zampini ierr = KSPSetUp(*local_ksp);CHKERRQ(ierr); 143829622bf0SStefano Zampini 143929622bf0SStefano Zampini /* test */ 144029622bf0SStefano Zampini if (pcbddc->dbg_flag) { 144129622bf0SStefano Zampini PetscReal test_err; 144229622bf0SStefano Zampini KSP check_ksp; 144329622bf0SStefano Zampini PC check_pc; 144429622bf0SStefano Zampini PetscReal lambda_min,lambda_max; 144529622bf0SStefano Zampini Mat test_mat; 144629622bf0SStefano Zampini PetscViewer viewer=pcbddc->dbg_viewer; 144729622bf0SStefano Zampini PetscBool setsym,issym=PETSC_FALSE; 144829622bf0SStefano Zampini 144929622bf0SStefano Zampini ierr = KSPGetPC(*local_ksp,&check_pc);CHKERRQ(ierr); 145029622bf0SStefano Zampini ierr = VecDuplicate(shell_ctx->work_full_1,&work1);CHKERRQ(ierr); 145129622bf0SStefano Zampini ierr = VecDuplicate(shell_ctx->work_full_1,&work2);CHKERRQ(ierr); 145229622bf0SStefano Zampini ierr = VecDuplicate(shell_ctx->work_full_1,&work3);CHKERRQ(ierr); 145329622bf0SStefano Zampini ierr = VecSetRandom(shell_ctx->work_small_1,PETSC_NULL);CHKERRQ(ierr); 145429622bf0SStefano Zampini ierr = MatMult(shell_ctx->basis_mat,shell_ctx->work_small_1,work1);CHKERRQ(ierr); 145529622bf0SStefano Zampini ierr = VecCopy(work1,work2);CHKERRQ(ierr); 145629622bf0SStefano Zampini ierr = MatMult(local_mat,work1,work3);CHKERRQ(ierr); 145729622bf0SStefano Zampini ierr = PCApply(check_pc,work3,work1);CHKERRQ(ierr); 145829622bf0SStefano Zampini ierr = VecAXPY(work1,m_one,work2);CHKERRQ(ierr); 145929622bf0SStefano Zampini ierr = VecNorm(work1,NORM_INFINITY,&test_err);CHKERRQ(ierr); 146029622bf0SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d error for nullspace correction for ",PetscGlobalRank); 146129622bf0SStefano Zampini if (basis_dofs == n_I) { 14622fa5cd67SKarl Rupp ierr = 
PetscViewerASCIISynchronizedPrintf(viewer,"Dirichlet ");CHKERRQ(ierr); 146329622bf0SStefano Zampini } else { 14642fa5cd67SKarl Rupp ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Neumann ");CHKERRQ(ierr); 146529622bf0SStefano Zampini } 146629622bf0SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"solver is :%1.14e\n",test_err); 146729622bf0SStefano Zampini 146829622bf0SStefano Zampini ierr = MatTransposeMatMult(shell_ctx->Lbasis_mat,shell_ctx->Kbasis_mat,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&test_mat);CHKERRQ(ierr); 146929622bf0SStefano Zampini ierr = MatShift(test_mat,one);CHKERRQ(ierr); 147029622bf0SStefano Zampini ierr = MatNorm(test_mat,NORM_INFINITY,&test_err);CHKERRQ(ierr); 147129622bf0SStefano Zampini ierr = MatDestroy(&test_mat);CHKERRQ(ierr); 147229622bf0SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d error for nullspace matrices is :%1.14e\n",PetscGlobalRank,test_err); 147329622bf0SStefano Zampini 147429622bf0SStefano Zampini /* Create ksp object suitable for extreme eigenvalues' estimation */ 147529622bf0SStefano Zampini ierr = KSPCreate(PETSC_COMM_SELF,&check_ksp);CHKERRQ(ierr); 147629622bf0SStefano Zampini ierr = KSPSetOperators(check_ksp,local_mat,local_mat,SAME_PRECONDITIONER);CHKERRQ(ierr); 147729622bf0SStefano Zampini ierr = KSPSetTolerances(check_ksp,1.e-8,1.e-8,PETSC_DEFAULT,basis_dofs);CHKERRQ(ierr); 147829622bf0SStefano Zampini ierr = KSPSetComputeSingularValues(check_ksp,PETSC_TRUE);CHKERRQ(ierr); 147929622bf0SStefano Zampini ierr = MatIsSymmetricKnown(pc->pmat,&setsym,&issym);CHKERRQ(ierr); 148029622bf0SStefano Zampini if (issym) { 148129622bf0SStefano Zampini ierr = KSPSetType(check_ksp,KSPCG);CHKERRQ(ierr); 148229622bf0SStefano Zampini } 148329622bf0SStefano Zampini ierr = KSPSetPC(check_ksp,check_pc);CHKERRQ(ierr); 148429622bf0SStefano Zampini ierr = KSPSetUp(check_ksp);CHKERRQ(ierr); 148529622bf0SStefano Zampini ierr = VecSetRandom(work1,PETSC_NULL);CHKERRQ(ierr); 148629622bf0SStefano 
Zampini ierr = MatMult(local_mat,work1,work2);CHKERRQ(ierr); 148729622bf0SStefano Zampini ierr = KSPSolve(check_ksp,work2,work2);CHKERRQ(ierr); 148829622bf0SStefano Zampini ierr = VecAXPY(work2,m_one,work1);CHKERRQ(ierr); 148929622bf0SStefano Zampini ierr = VecNorm(work2,NORM_INFINITY,&test_err);CHKERRQ(ierr); 149029622bf0SStefano Zampini ierr = KSPComputeExtremeSingularValues(check_ksp,&lambda_max,&lambda_min);CHKERRQ(ierr); 149129622bf0SStefano Zampini ierr = KSPGetIterationNumber(check_ksp,&k);CHKERRQ(ierr); 149229622bf0SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d error for adapted KSP %1.14e (it %d, eigs %1.6e %1.6e)\n",PetscGlobalRank,test_err,k,lambda_min,lambda_max); 149329622bf0SStefano Zampini ierr = KSPDestroy(&check_ksp);CHKERRQ(ierr); 149429622bf0SStefano Zampini ierr = VecDestroy(&work1);CHKERRQ(ierr); 149529622bf0SStefano Zampini ierr = VecDestroy(&work2);CHKERRQ(ierr); 149629622bf0SStefano Zampini ierr = VecDestroy(&work3);CHKERRQ(ierr); 149729622bf0SStefano Zampini } 149829622bf0SStefano Zampini PetscFunctionReturn(0); 149929622bf0SStefano Zampini } 150029622bf0SStefano Zampini 150129622bf0SStefano Zampini #undef __FUNCT__ 15022e8d2280SStefano Zampini #define __FUNCT__ "PCBDDCSetUseExactDirichlet" 15032e8d2280SStefano Zampini static PetscErrorCode PCBDDCSetUseExactDirichlet(PC pc,PetscBool use) 15042e8d2280SStefano Zampini { 15052e8d2280SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 15062e8d2280SStefano Zampini 15072e8d2280SStefano Zampini PetscFunctionBegin; 15082e8d2280SStefano Zampini pcbddc->use_exact_dirichlet=use; 15092e8d2280SStefano Zampini PetscFunctionReturn(0); 15102e8d2280SStefano Zampini } 15112e8d2280SStefano Zampini 15122e8d2280SStefano Zampini #undef __FUNCT__ 15134fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetLevel" 15144fad6a16SStefano Zampini static PetscErrorCode PCBDDCSetLevel(PC pc,PetscInt level) 15154fad6a16SStefano Zampini { 15164fad6a16SStefano Zampini PC_BDDC *pcbddc = 
(PC_BDDC*)pc->data; 15174fad6a16SStefano Zampini 15184fad6a16SStefano Zampini PetscFunctionBegin; 15194fad6a16SStefano Zampini pcbddc->current_level=level; 15204fad6a16SStefano Zampini PetscFunctionReturn(0); 15214fad6a16SStefano Zampini } 15223425bc38SStefano Zampini 15233425bc38SStefano Zampini #undef __FUNCT__ 15240bdf917eSStefano Zampini #define __FUNCT__ "PCBDDCAdaptNullSpace" 15250bdf917eSStefano Zampini static PetscErrorCode PCBDDCAdaptNullSpace(PC pc) 15260bdf917eSStefano Zampini { 15270bdf917eSStefano Zampini PC_IS *pcis = (PC_IS*) (pc->data); 15280bdf917eSStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)(pc->data); 15290bdf917eSStefano Zampini KSP inv_change; 15300bdf917eSStefano Zampini PC pc_change; 15310bdf917eSStefano Zampini const Vec *nsp_vecs; 15320bdf917eSStefano Zampini Vec *new_nsp_vecs; 15330bdf917eSStefano Zampini PetscInt i,nsp_size,new_nsp_size,start_new; 15340bdf917eSStefano Zampini PetscBool nsp_has_cnst; 15350bdf917eSStefano Zampini MatNullSpace new_nsp; 15360bdf917eSStefano Zampini PetscErrorCode ierr; 15370bdf917eSStefano Zampini 15380bdf917eSStefano Zampini PetscFunctionBegin; 15390bdf917eSStefano Zampini ierr = MatNullSpaceGetVecs(pcbddc->NullSpace,&nsp_has_cnst,&nsp_size,&nsp_vecs);CHKERRQ(ierr); 15400bdf917eSStefano Zampini ierr = KSPCreate(PETSC_COMM_SELF,&inv_change);CHKERRQ(ierr); 15410bdf917eSStefano Zampini ierr = KSPSetOperators(inv_change,pcbddc->ChangeOfBasisMatrix,pcbddc->ChangeOfBasisMatrix,SAME_PRECONDITIONER);CHKERRQ(ierr); 15420bdf917eSStefano Zampini ierr = KSPSetType(inv_change,KSPPREONLY);CHKERRQ(ierr); 15430bdf917eSStefano Zampini ierr = KSPGetPC(inv_change,&pc_change);CHKERRQ(ierr); 15440bdf917eSStefano Zampini ierr = PCSetType(pc_change,PCLU);CHKERRQ(ierr); 15450bdf917eSStefano Zampini ierr = KSPSetUp(inv_change);CHKERRQ(ierr); 15462fa5cd67SKarl Rupp 15470bdf917eSStefano Zampini new_nsp_size = nsp_size; 15482fa5cd67SKarl Rupp if (nsp_has_cnst) new_nsp_size++; 15490bdf917eSStefano Zampini ierr = 
PetscMalloc(new_nsp_size*sizeof(Vec),&new_nsp_vecs);CHKERRQ(ierr); 15500bdf917eSStefano Zampini for (i=0;i<new_nsp_size;i++) { ierr = VecDuplicate(pcis->vec1_global,&new_nsp_vecs[i]);CHKERRQ(ierr); } 15510bdf917eSStefano Zampini start_new = 0; 15520bdf917eSStefano Zampini if (nsp_has_cnst) { 15530bdf917eSStefano Zampini start_new = 1; 15540bdf917eSStefano Zampini ierr = VecSet(new_nsp_vecs[0],1.0);CHKERRQ(ierr); 15550bdf917eSStefano Zampini ierr = VecSet(pcis->vec1_B,1.0);CHKERRQ(ierr); 15560bdf917eSStefano Zampini ierr = KSPSolve(inv_change,pcis->vec1_B,pcis->vec1_B); 15570bdf917eSStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,new_nsp_vecs[0],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 15580bdf917eSStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,pcis->vec1_B,new_nsp_vecs[0],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 15590bdf917eSStefano Zampini } 15600bdf917eSStefano Zampini for (i=0; i<nsp_size; i++) { 15610bdf917eSStefano Zampini ierr = VecCopy(nsp_vecs[i],new_nsp_vecs[i+start_new]);CHKERRQ(ierr); 15620bdf917eSStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,nsp_vecs[i],pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 15630bdf917eSStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,nsp_vecs[i],pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 15640bdf917eSStefano Zampini ierr = KSPSolve(inv_change,pcis->vec1_B,pcis->vec1_B); 15650bdf917eSStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,new_nsp_vecs[i+start_new],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 15660bdf917eSStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,pcis->vec1_B,new_nsp_vecs[i+start_new],INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 15670bdf917eSStefano Zampini } 15680bdf917eSStefano Zampini ierr = VecNormalize(new_nsp_vecs[0],PETSC_NULL);CHKERRQ(ierr); 15690bdf917eSStefano Zampini /* TODO : Orthonormalize vecs when new_nsp_size > 0! 
*/ 15700bdf917eSStefano Zampini 15710bdf917eSStefano Zampini ierr = KSPDestroy(&inv_change);CHKERRQ(ierr); 15720bdf917eSStefano Zampini ierr = MatNullSpaceCreate(((PetscObject)pc)->comm,PETSC_FALSE,new_nsp_size,new_nsp_vecs,&new_nsp);CHKERRQ(ierr); 15730bdf917eSStefano Zampini ierr = PCBDDCSetNullSpace(pc,new_nsp);CHKERRQ(ierr); 15740bdf917eSStefano Zampini ierr = MatNullSpaceDestroy(&new_nsp);CHKERRQ(ierr); 15750bdf917eSStefano Zampini /* 15760bdf917eSStefano Zampini ierr = MatNullSpaceTest(pcbddc->NullSpace,pc->pmat,&nsp_t);CHKERRQ(ierr); 15770bdf917eSStefano Zampini printf("New Null Space, mat changed: %d\n",nsp_t); 15780bdf917eSStefano Zampini temp_mat = matis->A; 15790bdf917eSStefano Zampini matis->A = pcbddc->local_mat; 15800bdf917eSStefano Zampini pcbddc->local_mat = temp_mat; 15810bdf917eSStefano Zampini ierr = MatNullSpaceTest(pcbddc->NullSpace,pc->pmat,&nsp_t);CHKERRQ(ierr); 15820bdf917eSStefano Zampini printf("New Null Space, mat original: %d\n",nsp_t);*/ 15830bdf917eSStefano Zampini 15840bdf917eSStefano Zampini for (i=0; i<new_nsp_size; i++) { ierr = VecDestroy(&new_nsp_vecs[i]);CHKERRQ(ierr); } 15850bdf917eSStefano Zampini ierr = PetscFree(new_nsp_vecs);CHKERRQ(ierr); 15860bdf917eSStefano Zampini PetscFunctionReturn(0); 15870bdf917eSStefano Zampini } 15880bdf917eSStefano Zampini 15890bdf917eSStefano Zampini #undef __FUNCT__ 15903425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPMatContext" 15913425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPMatContext(PC pc, FETIDPMat_ctx **fetidpmat_ctx) 15923425bc38SStefano Zampini { 15933425bc38SStefano Zampini FETIDPMat_ctx *newctx; 15943425bc38SStefano Zampini PetscErrorCode ierr; 15953425bc38SStefano Zampini 15963425bc38SStefano Zampini PetscFunctionBegin; 15973425bc38SStefano Zampini ierr = PetscMalloc(sizeof(*newctx),&newctx);CHKERRQ(ierr); 15982fa5cd67SKarl Rupp 15993425bc38SStefano Zampini newctx->lambda_local = 0; 16003425bc38SStefano Zampini newctx->temp_solution_B = 0; 
16013425bc38SStefano Zampini newctx->temp_solution_D = 0; 16023425bc38SStefano Zampini newctx->B_delta = 0; 16033425bc38SStefano Zampini newctx->B_Ddelta = 0; /* theoretically belongs to the FETIDP preconditioner */ 16043425bc38SStefano Zampini newctx->l2g_lambda = 0; 16052fa5cd67SKarl Rupp 16063425bc38SStefano Zampini /* increase the reference count for BDDC preconditioner */ 16073425bc38SStefano Zampini ierr = PetscObjectReference((PetscObject)pc);CHKERRQ(ierr); 16083425bc38SStefano Zampini newctx->pc = pc; 16093425bc38SStefano Zampini *fetidpmat_ctx = newctx; 16103425bc38SStefano Zampini PetscFunctionReturn(0); 16113425bc38SStefano Zampini } 16123425bc38SStefano Zampini 16133425bc38SStefano Zampini #undef __FUNCT__ 16143425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPPCContext" 16153425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPPCContext(PC pc, FETIDPPC_ctx **fetidppc_ctx) 16163425bc38SStefano Zampini { 16173425bc38SStefano Zampini FETIDPPC_ctx *newctx; 16183425bc38SStefano Zampini PetscErrorCode ierr; 16193425bc38SStefano Zampini 16203425bc38SStefano Zampini PetscFunctionBegin; 16213425bc38SStefano Zampini ierr = PetscMalloc(sizeof(*newctx),&newctx);CHKERRQ(ierr); 16222fa5cd67SKarl Rupp 16233425bc38SStefano Zampini newctx->lambda_local = 0; 16243425bc38SStefano Zampini newctx->B_Ddelta = 0; 16253425bc38SStefano Zampini newctx->l2g_lambda = 0; 16262fa5cd67SKarl Rupp 16273425bc38SStefano Zampini /* increase the reference count for BDDC preconditioner */ 16283425bc38SStefano Zampini ierr = PetscObjectReference((PetscObject)pc);CHKERRQ(ierr); 16293425bc38SStefano Zampini newctx->pc = pc; 16303425bc38SStefano Zampini *fetidppc_ctx = newctx; 16313425bc38SStefano Zampini PetscFunctionReturn(0); 16323425bc38SStefano Zampini } 16333425bc38SStefano Zampini 16343425bc38SStefano Zampini #undef __FUNCT__ 16353425bc38SStefano Zampini #define __FUNCT__ "PCBDDCDestroyFETIDPMat" 16363425bc38SStefano Zampini static PetscErrorCode 
PCBDDCDestroyFETIDPMat(Mat A) 16373425bc38SStefano Zampini { 16383425bc38SStefano Zampini FETIDPMat_ctx *mat_ctx; 16393425bc38SStefano Zampini PetscErrorCode ierr; 16403425bc38SStefano Zampini 16413425bc38SStefano Zampini PetscFunctionBegin; 16423425bc38SStefano Zampini ierr = MatShellGetContext(A,(void**)&mat_ctx);CHKERRQ(ierr); 16433425bc38SStefano Zampini ierr = VecDestroy(&mat_ctx->lambda_local);CHKERRQ(ierr); 16443425bc38SStefano Zampini ierr = VecDestroy(&mat_ctx->temp_solution_D);CHKERRQ(ierr); 16453425bc38SStefano Zampini ierr = VecDestroy(&mat_ctx->temp_solution_B);CHKERRQ(ierr); 16463425bc38SStefano Zampini ierr = MatDestroy(&mat_ctx->B_delta);CHKERRQ(ierr); 16473425bc38SStefano Zampini ierr = MatDestroy(&mat_ctx->B_Ddelta);CHKERRQ(ierr); 16483425bc38SStefano Zampini ierr = VecScatterDestroy(&mat_ctx->l2g_lambda);CHKERRQ(ierr); 16493425bc38SStefano Zampini ierr = PCDestroy(&mat_ctx->pc);CHKERRQ(ierr); /* actually it does not destroy BDDC, only decrease its reference count */ 16503425bc38SStefano Zampini ierr = PetscFree(mat_ctx);CHKERRQ(ierr); 16513425bc38SStefano Zampini PetscFunctionReturn(0); 16523425bc38SStefano Zampini } 16533425bc38SStefano Zampini 16543425bc38SStefano Zampini #undef __FUNCT__ 16553425bc38SStefano Zampini #define __FUNCT__ "PCBDDCDestroyFETIDPPC" 16563425bc38SStefano Zampini static PetscErrorCode PCBDDCDestroyFETIDPPC(PC pc) 16573425bc38SStefano Zampini { 16583425bc38SStefano Zampini FETIDPPC_ctx *pc_ctx; 16593425bc38SStefano Zampini PetscErrorCode ierr; 16603425bc38SStefano Zampini 16613425bc38SStefano Zampini PetscFunctionBegin; 16623425bc38SStefano Zampini ierr = PCShellGetContext(pc,(void**)&pc_ctx);CHKERRQ(ierr); 16633425bc38SStefano Zampini ierr = VecDestroy(&pc_ctx->lambda_local);CHKERRQ(ierr); 16643425bc38SStefano Zampini ierr = MatDestroy(&pc_ctx->B_Ddelta);CHKERRQ(ierr); 16653425bc38SStefano Zampini ierr = VecScatterDestroy(&pc_ctx->l2g_lambda);CHKERRQ(ierr); 16663425bc38SStefano Zampini ierr = 
PCDestroy(&pc_ctx->pc);CHKERRQ(ierr); /* actually it does not destroy BDDC, only decrease its reference count */ 16673425bc38SStefano Zampini ierr = PetscFree(pc_ctx);CHKERRQ(ierr); 16683425bc38SStefano Zampini PetscFunctionReturn(0); 16693425bc38SStefano Zampini } 16703425bc38SStefano Zampini 16713425bc38SStefano Zampini #undef __FUNCT__ 16723425bc38SStefano Zampini #define __FUNCT__ "PCBDDCSetupFETIDPMatContext" 16733425bc38SStefano Zampini static PetscErrorCode PCBDDCSetupFETIDPMatContext(FETIDPMat_ctx *fetidpmat_ctx) 16743425bc38SStefano Zampini { 16753425bc38SStefano Zampini PetscErrorCode ierr; 16763425bc38SStefano Zampini PC_IS *pcis =(PC_IS*)fetidpmat_ctx->pc->data; 16773425bc38SStefano Zampini PC_BDDC *pcbddc =(PC_BDDC*)fetidpmat_ctx->pc->data; 16783425bc38SStefano Zampini PCBDDCGraph mat_graph=pcbddc->mat_graph; 16793425bc38SStefano Zampini Mat_IS *matis = (Mat_IS*)fetidpmat_ctx->pc->pmat->data; 16803425bc38SStefano Zampini MPI_Comm comm = ((PetscObject)(fetidpmat_ctx->pc))->comm; 16813425bc38SStefano Zampini 16823425bc38SStefano Zampini Mat ScalingMat; 16833425bc38SStefano Zampini Vec lambda_global; 16843425bc38SStefano Zampini IS IS_l2g_lambda; 16853425bc38SStefano Zampini 16863425bc38SStefano Zampini PetscBool skip_node,fully_redundant; 1687ef028eecSStefano Zampini PetscInt i,j,k,s,n_boundary_dofs,n_global_lambda,n_vertices,partial_sum; 16883425bc38SStefano Zampini PetscInt n_local_lambda,n_lambda_for_dof,dual_size,n_neg_values,n_pos_values; 1689ef028eecSStefano Zampini PetscMPIInt rank,nprocs; 16903425bc38SStefano Zampini PetscScalar scalar_value; 16913425bc38SStefano Zampini 16923425bc38SStefano Zampini PetscInt *vertex_indices,*temp_indices; 16933425bc38SStefano Zampini PetscInt *dual_dofs_boundary_indices,*aux_local_numbering_1,*aux_global_numbering; 16943425bc38SStefano Zampini PetscInt *aux_sums,*cols_B_delta,*l2g_indices; 16953425bc38SStefano Zampini PetscScalar *array,*scaling_factors,*vals_B_delta; 1696ef028eecSStefano Zampini PetscInt 
*aux_local_numbering_2,*dof_sizes,*dof_displs; 1697ef028eecSStefano Zampini PetscInt first_index,old_index; 1698ef028eecSStefano Zampini PetscBool first_found = PETSC_FALSE; 16993425bc38SStefano Zampini 17003425bc38SStefano Zampini /* For communication of scaling factors */ 17013425bc38SStefano Zampini PetscInt *ptrs_buffer,neigh_position; 17023425bc38SStefano Zampini PetscScalar **all_factors,*send_buffer,*recv_buffer; 17033425bc38SStefano Zampini MPI_Request *send_reqs,*recv_reqs; 17043425bc38SStefano Zampini 17053425bc38SStefano Zampini /* tests */ 17063425bc38SStefano Zampini Vec test_vec; 17073425bc38SStefano Zampini PetscBool test_fetidp; 17083425bc38SStefano Zampini PetscViewer viewer; 17093425bc38SStefano Zampini 17103425bc38SStefano Zampini PetscFunctionBegin; 17113425bc38SStefano Zampini ierr = MPI_Comm_rank(comm,&rank);CHKERRQ(ierr); 17123425bc38SStefano Zampini ierr = MPI_Comm_size(comm,&nprocs);CHKERRQ(ierr); 17133425bc38SStefano Zampini 17143425bc38SStefano Zampini /* Default type of lagrange multipliers is non-redundant */ 17153425bc38SStefano Zampini fully_redundant = PETSC_FALSE; 17163425bc38SStefano Zampini ierr = PetscOptionsGetBool(PETSC_NULL,"-fetidp_fullyredundant",&fully_redundant,PETSC_NULL);CHKERRQ(ierr); 17173425bc38SStefano Zampini 17183425bc38SStefano Zampini /* Evaluate local and global number of lagrange multipliers */ 17193425bc38SStefano Zampini ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr); 17203425bc38SStefano Zampini n_local_lambda = 0; 17213425bc38SStefano Zampini partial_sum = 0; 17223425bc38SStefano Zampini n_boundary_dofs = 0; 17233425bc38SStefano Zampini s = 0; 17243425bc38SStefano Zampini n_vertices = 0; 17253425bc38SStefano Zampini /* Get Vertices used to define the BDDC */ 17263425bc38SStefano Zampini ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(*vertex_indices),&vertex_indices);CHKERRQ(ierr); 17273425bc38SStefano Zampini for (i=0; i<pcbddc->local_primal_size; i++) { 17283425bc38SStefano Zampini ierr = 
MatGetRow(pcbddc->ConstraintMatrix,i,&j,(const PetscInt**)&temp_indices,PETSC_NULL);CHKERRQ(ierr); 17293425bc38SStefano Zampini if (j == 1) { 17303425bc38SStefano Zampini vertex_indices[n_vertices]=temp_indices[0]; 17313425bc38SStefano Zampini n_vertices++; 17323425bc38SStefano Zampini } 17333425bc38SStefano Zampini ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&j,(const PetscInt**)&temp_indices,PETSC_NULL);CHKERRQ(ierr); 17343425bc38SStefano Zampini } 17353425bc38SStefano Zampini dual_size = pcis->n_B-n_vertices; 17362fa5cd67SKarl Rupp 1737f0474715SStefano Zampini ierr = PetscSortInt(n_vertices,vertex_indices);CHKERRQ(ierr); 17383425bc38SStefano Zampini ierr = PetscMalloc(dual_size*sizeof(*dual_dofs_boundary_indices),&dual_dofs_boundary_indices);CHKERRQ(ierr); 17393425bc38SStefano Zampini ierr = PetscMalloc(dual_size*sizeof(*aux_local_numbering_1),&aux_local_numbering_1);CHKERRQ(ierr); 17403425bc38SStefano Zampini ierr = PetscMalloc(dual_size*sizeof(*aux_local_numbering_2),&aux_local_numbering_2);CHKERRQ(ierr); 17413425bc38SStefano Zampini 17423425bc38SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 17433425bc38SStefano Zampini for (i=0; i<pcis->n; i++) { 17443425bc38SStefano Zampini j = mat_graph->count[i]; /* RECALL: mat_graph->count[i] does not count myself */ 1745c6582918SStefano Zampini k = 0; 17462fa5cd67SKarl Rupp if (j > 0) k = (mat_graph->neighbours_set[i][0] == -1 ? 
1 : 0); 17473425bc38SStefano Zampini j = j - k; 17482fa5cd67SKarl Rupp if (j > 0) n_boundary_dofs++; 17493425bc38SStefano Zampini 17503425bc38SStefano Zampini skip_node = PETSC_FALSE; 1751c6582918SStefano Zampini if (s < n_vertices && vertex_indices[s]==i) { /* it works for a sorted set of vertices */ 17523425bc38SStefano Zampini skip_node = PETSC_TRUE; 17533425bc38SStefano Zampini s++; 17543425bc38SStefano Zampini } 17552fa5cd67SKarl Rupp if (j < 1) skip_node = PETSC_TRUE; 17563425bc38SStefano Zampini if (!skip_node) { 17573425bc38SStefano Zampini if (fully_redundant) { 17583425bc38SStefano Zampini /* fully redundant set of lagrange multipliers */ 17593425bc38SStefano Zampini n_lambda_for_dof = (j*(j+1))/2; 17603425bc38SStefano Zampini } else { 17613425bc38SStefano Zampini n_lambda_for_dof = j; 17623425bc38SStefano Zampini } 17633425bc38SStefano Zampini n_local_lambda += j; 17643425bc38SStefano Zampini /* needed to evaluate global number of lagrange multipliers */ 17653425bc38SStefano Zampini array[i]=(1.0*n_lambda_for_dof)/(j+1.0); /* already scaled for the next global sum */ 17663425bc38SStefano Zampini /* store some data needed */ 17673425bc38SStefano Zampini dual_dofs_boundary_indices[partial_sum] = n_boundary_dofs-1; 17683425bc38SStefano Zampini aux_local_numbering_1[partial_sum] = i; 1769ef028eecSStefano Zampini aux_local_numbering_2[partial_sum] = n_lambda_for_dof; 17703425bc38SStefano Zampini partial_sum++; 17713425bc38SStefano Zampini } 17723425bc38SStefano Zampini } 17733425bc38SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 1774ef028eecSStefano Zampini 17753425bc38SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 17763425bc38SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 17773425bc38SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 17783425bc38SStefano 
Zampini ierr = VecSum(pcis->vec1_global,&scalar_value);CHKERRQ(ierr); 17792fa5cd67SKarl Rupp 17803425bc38SStefano Zampini fetidpmat_ctx->n_lambda = (PetscInt) scalar_value; 17813425bc38SStefano Zampini /* printf("I found %d global multipliers (%f)\n",fetidpmat_ctx->n_lambda,scalar_value); */ 17823425bc38SStefano Zampini 17833425bc38SStefano Zampini /* compute global ordering of lagrange multipliers and associate l2g map */ 1784ef028eecSStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 1785ef028eecSStefano Zampini ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr); 1786ef028eecSStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 17872fa5cd67SKarl Rupp for (i=0;i<dual_size;i++) array[aux_local_numbering_1[i]] = aux_local_numbering_2[i]; 1788ef028eecSStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 1789ef028eecSStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 1790ef028eecSStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 1791ef028eecSStefano Zampini ierr = VecSum(pcis->vec1_global,&scalar_value);CHKERRQ(ierr); 1792ef028eecSStefano Zampini if (pcbddc->dbg_flag && (PetscInt)scalar_value != fetidpmat_ctx->n_lambda) { 1793acee19a7SJed Brown SETERRQ2(PETSC_COMM_WORLD,PETSC_ERR_PLIB,"Global number of multipliers mismatch! 
(%d!=%d)\n",(PetscInt)scalar_value,fetidpmat_ctx->n_lambda); 1794ef028eecSStefano Zampini } 17953425bc38SStefano Zampini 1796ef028eecSStefano Zampini /* Fill pcis->vec1_global with cumulative function for global numbering */ 1797ef028eecSStefano Zampini ierr = VecGetArray(pcis->vec1_global,&array);CHKERRQ(ierr); 1798ef028eecSStefano Zampini ierr = VecGetLocalSize(pcis->vec1_global,&s);CHKERRQ(ierr); 1799ef028eecSStefano Zampini k = 0; 1800ef028eecSStefano Zampini first_index = -1; 1801ef028eecSStefano Zampini for (i=0; i<s; i++) { 1802ef028eecSStefano Zampini if (!first_found && array[i] > 0.0) { 1803ef028eecSStefano Zampini first_found = PETSC_TRUE; 1804ef028eecSStefano Zampini first_index = i; 1805ef028eecSStefano Zampini } 1806ef028eecSStefano Zampini k += (PetscInt)array[i]; 1807ef028eecSStefano Zampini } 1808ef028eecSStefano Zampini j = (!rank ? nprocs : 0); 18093425bc38SStefano Zampini ierr = PetscMalloc(j*sizeof(*dof_sizes),&dof_sizes);CHKERRQ(ierr); 18103425bc38SStefano Zampini ierr = PetscMalloc(j*sizeof(*dof_displs),&dof_displs);CHKERRQ(ierr); 1811ef028eecSStefano Zampini ierr = MPI_Gather(&k,1,MPIU_INT,dof_sizes,1,MPIU_INT,0,comm);CHKERRQ(ierr); 1812ef028eecSStefano Zampini if (!rank) { 18133425bc38SStefano Zampini dof_displs[0]=0; 18142fa5cd67SKarl Rupp for (i=1; i<nprocs; i++) dof_displs[i] = dof_displs[i-1]+dof_sizes[i-1]; 18153425bc38SStefano Zampini } 1816ef028eecSStefano Zampini ierr = MPI_Scatter(dof_displs,1,MPIU_INT,&k,1,MPIU_INT,0,comm);CHKERRQ(ierr); 1817ef028eecSStefano Zampini if (first_found) { 1818ef028eecSStefano Zampini array[first_index] += k; 18192fa5cd67SKarl Rupp 1820ef028eecSStefano Zampini old_index = first_index; 1821ef028eecSStefano Zampini for (i=first_index+1; i<s; i++) { 1822ef028eecSStefano Zampini if (array[i] > 0.0) { 1823ef028eecSStefano Zampini array[i] += array[old_index]; 1824ef028eecSStefano Zampini old_index = i; 1825ef028eecSStefano Zampini } 1826ef028eecSStefano Zampini } 1827ef028eecSStefano Zampini } 
1828ef028eecSStefano Zampini ierr = VecRestoreArray(pcis->vec1_global,&array);CHKERRQ(ierr); 1829ef028eecSStefano Zampini ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr); 1830ef028eecSStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1831ef028eecSStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1832ef028eecSStefano Zampini ierr = PetscMalloc(dual_size*sizeof(*aux_global_numbering),&aux_global_numbering);CHKERRQ(ierr); 1833ef028eecSStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 18343425bc38SStefano Zampini for (i=0; i<dual_size; i++) { 1835ef028eecSStefano Zampini aux_global_numbering[i] = (PetscInt)array[aux_local_numbering_1[i]]-aux_local_numbering_2[i]; 18363425bc38SStefano Zampini } 1837ef028eecSStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 1838f0474715SStefano Zampini ierr = PetscFree(aux_local_numbering_2);CHKERRQ(ierr); 1839f0474715SStefano Zampini ierr = PetscFree(dof_displs);CHKERRQ(ierr); 1840f0474715SStefano Zampini ierr = PetscFree(dof_sizes);CHKERRQ(ierr); 18413425bc38SStefano Zampini 18423425bc38SStefano Zampini /* init data for scaling factors exchange */ 18433425bc38SStefano Zampini partial_sum = 0; 18443425bc38SStefano Zampini j = 0; 18452fa5cd67SKarl Rupp 18463425bc38SStefano Zampini ierr = PetscMalloc(pcis->n_neigh*sizeof(PetscInt),&ptrs_buffer);CHKERRQ(ierr); 18473425bc38SStefano Zampini ierr = PetscMalloc((pcis->n_neigh-1)*sizeof(MPI_Request),&send_reqs);CHKERRQ(ierr); 18483425bc38SStefano Zampini ierr = PetscMalloc((pcis->n_neigh-1)*sizeof(MPI_Request),&recv_reqs);CHKERRQ(ierr); 18493425bc38SStefano Zampini ierr = PetscMalloc(pcis->n*sizeof(PetscScalar*),&all_factors);CHKERRQ(ierr); 18502fa5cd67SKarl Rupp 18513425bc38SStefano Zampini ptrs_buffer[0] = 0; 18523425bc38SStefano Zampini for (i=1; i<pcis->n_neigh; i++) { 18533425bc38SStefano Zampini 
partial_sum += pcis->n_shared[i]; 18543425bc38SStefano Zampini ptrs_buffer[i] = ptrs_buffer[i-1]+pcis->n_shared[i]; 18553425bc38SStefano Zampini } 18563425bc38SStefano Zampini ierr = PetscMalloc(partial_sum*sizeof(PetscScalar),&send_buffer);CHKERRQ(ierr); 18573425bc38SStefano Zampini ierr = PetscMalloc(partial_sum*sizeof(PetscScalar),&recv_buffer);CHKERRQ(ierr); 18583425bc38SStefano Zampini ierr = PetscMalloc(partial_sum*sizeof(PetscScalar),&all_factors[0]);CHKERRQ(ierr); 18593425bc38SStefano Zampini for (i=0; i<pcis->n-1; i++) { 18603425bc38SStefano Zampini j = mat_graph->count[i]; 18613425bc38SStefano Zampini if (j>0) { 18623425bc38SStefano Zampini k = (mat_graph->neighbours_set[i][0] == -1 ? 1 : 0); 18633425bc38SStefano Zampini j = j - k; 18643425bc38SStefano Zampini } 18653425bc38SStefano Zampini all_factors[i+1]=all_factors[i]+j; 18663425bc38SStefano Zampini } 18673425bc38SStefano Zampini /* scatter B scaling to N vec */ 18683425bc38SStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->D,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 18693425bc38SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->D,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 18703425bc38SStefano Zampini /* communications */ 18713425bc38SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 18723425bc38SStefano Zampini for (i=1; i<pcis->n_neigh; i++) { 18732fa5cd67SKarl Rupp for (j=0; j<pcis->n_shared[i]; j++) send_buffer[ptrs_buffer[i-1]+j] = array[pcis->shared[i][j]]; 18742fa5cd67SKarl Rupp 18753425bc38SStefano Zampini j = ptrs_buffer[i]-ptrs_buffer[i-1]; 1876ea7e1babSStefano Zampini ierr = MPI_Isend(&send_buffer[ptrs_buffer[i-1]],j,MPIU_SCALAR,pcis->neigh[i],0,comm,&send_reqs[i-1]);CHKERRQ(ierr); 1877ea7e1babSStefano Zampini ierr = MPI_Irecv(&recv_buffer[ptrs_buffer[i-1]],j,MPIU_SCALAR,pcis->neigh[i],0,comm,&recv_reqs[i-1]);CHKERRQ(ierr); 18783425bc38SStefano Zampini } 18793425bc38SStefano Zampini ierr = 
VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 1880ea7e1babSStefano Zampini ierr = MPI_Waitall((pcis->n_neigh-1),recv_reqs,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 18813425bc38SStefano Zampini /* put values in correct places */ 18823425bc38SStefano Zampini for (i=1; i<pcis->n_neigh; i++) { 18833425bc38SStefano Zampini for (j=0; j<pcis->n_shared[i]; j++) { 18843425bc38SStefano Zampini k = pcis->shared[i][j]; 18852fa5cd67SKarl Rupp 18863425bc38SStefano Zampini neigh_position = 0; 18872fa5cd67SKarl Rupp while (mat_graph->neighbours_set[k][neigh_position] != pcis->neigh[i]) neigh_position++; 18883425bc38SStefano Zampini s = (mat_graph->neighbours_set[k][0] == -1 ? 1 : 0); 18892fa5cd67SKarl Rupp 18903425bc38SStefano Zampini neigh_position = neigh_position - s; 18912fa5cd67SKarl Rupp 18923425bc38SStefano Zampini all_factors[k][neigh_position]=recv_buffer[ptrs_buffer[i-1]+j]; 18933425bc38SStefano Zampini } 18943425bc38SStefano Zampini } 1895ea7e1babSStefano Zampini ierr = MPI_Waitall((pcis->n_neigh-1),send_reqs,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 18963425bc38SStefano Zampini ierr = PetscFree(send_reqs);CHKERRQ(ierr); 18973425bc38SStefano Zampini ierr = PetscFree(recv_reqs);CHKERRQ(ierr); 18983425bc38SStefano Zampini ierr = PetscFree(send_buffer);CHKERRQ(ierr); 18993425bc38SStefano Zampini ierr = PetscFree(recv_buffer);CHKERRQ(ierr); 19003425bc38SStefano Zampini ierr = PetscFree(ptrs_buffer);CHKERRQ(ierr); 19013425bc38SStefano Zampini 19023425bc38SStefano Zampini /* Compute B and B_delta (local actions) */ 19033425bc38SStefano Zampini ierr = PetscMalloc(pcis->n_neigh*sizeof(*aux_sums),&aux_sums);CHKERRQ(ierr); 19043425bc38SStefano Zampini ierr = PetscMalloc(n_local_lambda*sizeof(*l2g_indices),&l2g_indices);CHKERRQ(ierr); 19053425bc38SStefano Zampini ierr = PetscMalloc(n_local_lambda*sizeof(*vals_B_delta),&vals_B_delta);CHKERRQ(ierr); 19063425bc38SStefano Zampini ierr = PetscMalloc(n_local_lambda*sizeof(*cols_B_delta),&cols_B_delta);CHKERRQ(ierr); 19073425bc38SStefano 
Zampini ierr = PetscMalloc(n_local_lambda*sizeof(*scaling_factors),&scaling_factors);CHKERRQ(ierr); 19082fa5cd67SKarl Rupp 19093425bc38SStefano Zampini n_global_lambda = 0; 19103425bc38SStefano Zampini partial_sum = 0; 19112fa5cd67SKarl Rupp 19123425bc38SStefano Zampini for (i=0;i<dual_size;i++) { 1913ef028eecSStefano Zampini n_global_lambda = aux_global_numbering[i]; 19143425bc38SStefano Zampini j = mat_graph->count[aux_local_numbering_1[i]]; 19153425bc38SStefano Zampini k = (mat_graph->neighbours_set[aux_local_numbering_1[i]][0] == -1 ? 1 : 0); 19163425bc38SStefano Zampini j = j - k; 19173425bc38SStefano Zampini aux_sums[0] = 0; 19182fa5cd67SKarl Rupp for (s=1; s<j; s++) aux_sums[s]=aux_sums[s-1]+j-s+1; 19192fa5cd67SKarl Rupp 19203425bc38SStefano Zampini array = all_factors[aux_local_numbering_1[i]]; 19213425bc38SStefano Zampini n_neg_values = 0; 19222fa5cd67SKarl Rupp 19232fa5cd67SKarl Rupp while (n_neg_values < j && mat_graph->neighbours_set[aux_local_numbering_1[i]][n_neg_values+k] < rank) n_neg_values++; 19243425bc38SStefano Zampini n_pos_values = j - n_neg_values; 19252fa5cd67SKarl Rupp 19263425bc38SStefano Zampini if (fully_redundant) { 19273425bc38SStefano Zampini for (s=0; s<n_neg_values; s++) { 19283425bc38SStefano Zampini l2g_indices [partial_sum+s]=aux_sums[s]+n_neg_values-s-1+n_global_lambda; 19293425bc38SStefano Zampini cols_B_delta [partial_sum+s]=dual_dofs_boundary_indices[i]; 19303425bc38SStefano Zampini vals_B_delta [partial_sum+s]=-1.0; 19313425bc38SStefano Zampini scaling_factors[partial_sum+s]=array[s]; 19323425bc38SStefano Zampini } 19333425bc38SStefano Zampini for (s=0; s<n_pos_values; s++) { 19343425bc38SStefano Zampini l2g_indices [partial_sum+s+n_neg_values]=aux_sums[n_neg_values]+s+n_global_lambda; 19353425bc38SStefano Zampini cols_B_delta [partial_sum+s+n_neg_values]=dual_dofs_boundary_indices[i]; 19363425bc38SStefano Zampini vals_B_delta [partial_sum+s+n_neg_values]=1.0; 19373425bc38SStefano Zampini 
scaling_factors[partial_sum+s+n_neg_values]=array[s+n_neg_values]; 19383425bc38SStefano Zampini } 19393425bc38SStefano Zampini partial_sum += j; 19403425bc38SStefano Zampini } else { 19413425bc38SStefano Zampini /* l2g_indices and default cols and vals of B_delta */ 19423425bc38SStefano Zampini for (s=0; s<j; s++) { 19433425bc38SStefano Zampini l2g_indices [partial_sum+s]=n_global_lambda+s; 19443425bc38SStefano Zampini cols_B_delta [partial_sum+s]=dual_dofs_boundary_indices[i]; 19453425bc38SStefano Zampini vals_B_delta [partial_sum+s]=0.0; 19463425bc38SStefano Zampini } 19473425bc38SStefano Zampini /* B_delta */ 19482fa5cd67SKarl Rupp if (n_neg_values > 0) vals_B_delta[partial_sum+n_neg_values-1] = -1.0; /* there's a rank next to me to the left */ 19492fa5cd67SKarl Rupp if (n_neg_values < j) vals_B_delta[partial_sum+n_neg_values] = 1.0; /* there's a rank next to me to the right */ 19502fa5cd67SKarl Rupp 19513425bc38SStefano Zampini /* scaling as in Klawonn-Widlund 1999*/ 19523425bc38SStefano Zampini for (s=0;s<n_neg_values;s++) { 19533425bc38SStefano Zampini scalar_value = 0.0; 19542fa5cd67SKarl Rupp for (k=0;k<s+1;k++) scalar_value += array[k]; 1955ef028eecSStefano Zampini scaling_factors[partial_sum+s] = -scalar_value; 19563425bc38SStefano Zampini } 19573425bc38SStefano Zampini for (s=0;s<n_pos_values;s++) { 19583425bc38SStefano Zampini scalar_value = 0.0; 19592fa5cd67SKarl Rupp for (k=s+n_neg_values;k<j;k++) scalar_value += array[k]; 19603425bc38SStefano Zampini scaling_factors[partial_sum+s+n_neg_values] = scalar_value; 19613425bc38SStefano Zampini } 19623425bc38SStefano Zampini partial_sum += j; 19633425bc38SStefano Zampini } 19643425bc38SStefano Zampini } 1965ef028eecSStefano Zampini ierr = PetscFree(aux_global_numbering);CHKERRQ(ierr); 1966f0474715SStefano Zampini ierr = PetscFree(aux_sums);CHKERRQ(ierr); 1967f0474715SStefano Zampini ierr = PetscFree(aux_local_numbering_1);CHKERRQ(ierr); 1968f0474715SStefano Zampini ierr = 
PetscFree(dual_dofs_boundary_indices);CHKERRQ(ierr); 19693425bc38SStefano Zampini ierr = PetscFree(all_factors[0]);CHKERRQ(ierr); 19703425bc38SStefano Zampini ierr = PetscFree(all_factors);CHKERRQ(ierr); 19713425bc38SStefano Zampini /* printf("I found %d local lambda dofs when numbering them (should be %d)\n",partial_sum,n_local_lambda); */ 1972f0474715SStefano Zampini 1973f0474715SStefano Zampini /* Local to global mapping of fetidpmat */ 1974f0474715SStefano Zampini ierr = VecCreate(PETSC_COMM_SELF,&fetidpmat_ctx->lambda_local);CHKERRQ(ierr); 1975f0474715SStefano Zampini ierr = VecSetSizes(fetidpmat_ctx->lambda_local,n_local_lambda,n_local_lambda);CHKERRQ(ierr); 1976f0474715SStefano Zampini ierr = VecSetType(fetidpmat_ctx->lambda_local,VECSEQ);CHKERRQ(ierr); 1977f0474715SStefano Zampini ierr = VecCreate(comm,&lambda_global);CHKERRQ(ierr); 1978f0474715SStefano Zampini ierr = VecSetSizes(lambda_global,PETSC_DECIDE,fetidpmat_ctx->n_lambda);CHKERRQ(ierr); 1979f0474715SStefano Zampini ierr = VecSetType(lambda_global,VECMPI);CHKERRQ(ierr); 19803425bc38SStefano Zampini ierr = ISCreateGeneral(comm,n_local_lambda,l2g_indices,PETSC_OWN_POINTER,&IS_l2g_lambda);CHKERRQ(ierr); 19813425bc38SStefano Zampini ierr = VecScatterCreate(fetidpmat_ctx->lambda_local,(IS)0,lambda_global,IS_l2g_lambda,&fetidpmat_ctx->l2g_lambda);CHKERRQ(ierr); 1982f0474715SStefano Zampini ierr = ISDestroy(&IS_l2g_lambda);CHKERRQ(ierr); 19833425bc38SStefano Zampini 19843425bc38SStefano Zampini /* Create local part of B_delta */ 19853425bc38SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&fetidpmat_ctx->B_delta); 19863425bc38SStefano Zampini ierr = MatSetSizes(fetidpmat_ctx->B_delta,n_local_lambda,pcis->n_B,n_local_lambda,pcis->n_B);CHKERRQ(ierr); 19873425bc38SStefano Zampini ierr = MatSetType(fetidpmat_ctx->B_delta,MATSEQAIJ);CHKERRQ(ierr); 19883425bc38SStefano Zampini ierr = MatSeqAIJSetPreallocation(fetidpmat_ctx->B_delta,1,PETSC_NULL);CHKERRQ(ierr); 19893425bc38SStefano Zampini ierr = 
MatSetOption(fetidpmat_ctx->B_delta,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr); 19903425bc38SStefano Zampini for (i=0; i<n_local_lambda; i++) { 19913425bc38SStefano Zampini ierr = MatSetValue(fetidpmat_ctx->B_delta,i,cols_B_delta[i],vals_B_delta[i],INSERT_VALUES);CHKERRQ(ierr); 19923425bc38SStefano Zampini } 1993f0474715SStefano Zampini ierr = PetscFree(vals_B_delta);CHKERRQ(ierr); 19943425bc38SStefano Zampini ierr = MatAssemblyBegin(fetidpmat_ctx->B_delta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 19953425bc38SStefano Zampini ierr = MatAssemblyEnd (fetidpmat_ctx->B_delta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 19963425bc38SStefano Zampini 19973425bc38SStefano Zampini if (fully_redundant) { 19983425bc38SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&ScalingMat); 19993425bc38SStefano Zampini ierr = MatSetSizes(ScalingMat,n_local_lambda,n_local_lambda,n_local_lambda,n_local_lambda);CHKERRQ(ierr); 20003425bc38SStefano Zampini ierr = MatSetType(ScalingMat,MATSEQAIJ);CHKERRQ(ierr); 20013425bc38SStefano Zampini ierr = MatSeqAIJSetPreallocation(ScalingMat,1,PETSC_NULL);CHKERRQ(ierr); 20023425bc38SStefano Zampini for (i=0; i<n_local_lambda; i++) { 20033425bc38SStefano Zampini ierr = MatSetValue(ScalingMat,i,i,scaling_factors[i],INSERT_VALUES);CHKERRQ(ierr); 20043425bc38SStefano Zampini } 20053425bc38SStefano Zampini ierr = MatAssemblyBegin(ScalingMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 20063425bc38SStefano Zampini ierr = MatAssemblyEnd (ScalingMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 20073425bc38SStefano Zampini ierr = MatMatMult(ScalingMat,fetidpmat_ctx->B_delta,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&fetidpmat_ctx->B_Ddelta);CHKERRQ(ierr); 20083425bc38SStefano Zampini ierr = MatDestroy(&ScalingMat);CHKERRQ(ierr); 20093425bc38SStefano Zampini } else { 20103425bc38SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&fetidpmat_ctx->B_Ddelta); 20113425bc38SStefano Zampini ierr = MatSetSizes(fetidpmat_ctx->B_Ddelta,n_local_lambda,pcis->n_B,n_local_lambda,pcis->n_B);CHKERRQ(ierr); 
20123425bc38SStefano Zampini ierr = MatSetType(fetidpmat_ctx->B_Ddelta,MATSEQAIJ);CHKERRQ(ierr); 20133425bc38SStefano Zampini ierr = MatSeqAIJSetPreallocation(fetidpmat_ctx->B_Ddelta,1,PETSC_NULL);CHKERRQ(ierr); 20143425bc38SStefano Zampini for (i=0; i<n_local_lambda; i++) { 20153425bc38SStefano Zampini ierr = MatSetValue(fetidpmat_ctx->B_Ddelta,i,cols_B_delta[i],scaling_factors[i],INSERT_VALUES);CHKERRQ(ierr); 20163425bc38SStefano Zampini } 20173425bc38SStefano Zampini ierr = MatAssemblyBegin(fetidpmat_ctx->B_Ddelta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 20183425bc38SStefano Zampini ierr = MatAssemblyEnd (fetidpmat_ctx->B_Ddelta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 20193425bc38SStefano Zampini } 2020f0474715SStefano Zampini ierr = PetscFree(scaling_factors);CHKERRQ(ierr); 2021f0474715SStefano Zampini ierr = PetscFree(cols_B_delta);CHKERRQ(ierr); 20223425bc38SStefano Zampini 20233425bc38SStefano Zampini /* Create some vectors needed by fetidp */ 20243425bc38SStefano Zampini ierr = VecDuplicate(pcis->vec1_B,&fetidpmat_ctx->temp_solution_B);CHKERRQ(ierr); 20253425bc38SStefano Zampini ierr = VecDuplicate(pcis->vec1_D,&fetidpmat_ctx->temp_solution_D);CHKERRQ(ierr); 20263425bc38SStefano Zampini 20273425bc38SStefano Zampini test_fetidp = PETSC_FALSE; 20282fa5cd67SKarl Rupp 20293425bc38SStefano Zampini ierr = PetscOptionsGetBool(PETSC_NULL,"-fetidp_check",&test_fetidp,PETSC_NULL);CHKERRQ(ierr); 20303425bc38SStefano Zampini 20313425bc38SStefano Zampini if (test_fetidp) { 20323425bc38SStefano Zampini 20333425bc38SStefano Zampini ierr = PetscViewerASCIIGetStdout(((PetscObject)(fetidpmat_ctx->pc))->comm,&viewer);CHKERRQ(ierr); 20343425bc38SStefano Zampini ierr = PetscViewerASCIISynchronizedAllow(viewer,PETSC_TRUE);CHKERRQ(ierr); 20353425bc38SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"----------FETI_DP TESTS--------------\n");CHKERRQ(ierr); 20363425bc38SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"All tests should return zero!\n");CHKERRQ(ierr); 
20373425bc38SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"FETIDP MAT context in the ");CHKERRQ(ierr); 20383425bc38SStefano Zampini if (fully_redundant) { 20393425bc38SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"fully redundant case for lagrange multipliers.\n");CHKERRQ(ierr); 20403425bc38SStefano Zampini } else { 20413425bc38SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Non-fully redundant case for lagrange multiplier.\n");CHKERRQ(ierr); 20423425bc38SStefano Zampini } 20433425bc38SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 20443425bc38SStefano Zampini 20453425bc38SStefano Zampini /* TEST A/B: Test numbering of global lambda dofs */ 20463425bc38SStefano Zampini 20473425bc38SStefano Zampini ierr = VecDuplicate(fetidpmat_ctx->lambda_local,&test_vec);CHKERRQ(ierr); 20483425bc38SStefano Zampini ierr = VecSet(lambda_global,1.0);CHKERRQ(ierr); 20493425bc38SStefano Zampini ierr = VecSet(test_vec,1.0);CHKERRQ(ierr); 20503425bc38SStefano Zampini ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 20513425bc38SStefano Zampini ierr = VecScatterEnd (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 20523425bc38SStefano Zampini scalar_value = -1.0; 20533425bc38SStefano Zampini ierr = VecAXPY(test_vec,scalar_value,fetidpmat_ctx->lambda_local);CHKERRQ(ierr); 20543425bc38SStefano Zampini ierr = VecNorm(test_vec,NORM_INFINITY,&scalar_value);CHKERRQ(ierr); 20553425bc38SStefano Zampini ierr = VecDestroy(&test_vec);CHKERRQ(ierr); 20563425bc38SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"A[%04d]: CHECK glob to loc: % 1.14e\n",rank,scalar_value);CHKERRQ(ierr); 20573425bc38SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 20583425bc38SStefano Zampini if (fully_redundant) { 20593425bc38SStefano Zampini ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr); 
20603425bc38SStefano Zampini ierr = VecSet(fetidpmat_ctx->lambda_local,0.5);CHKERRQ(ierr); 20613425bc38SStefano Zampini ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 20623425bc38SStefano Zampini ierr = VecScatterEnd (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 20633425bc38SStefano Zampini ierr = VecSum(lambda_global,&scalar_value);CHKERRQ(ierr); 20643425bc38SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"B[%04d]: CHECK loc to glob: % 1.14e\n",rank,scalar_value-fetidpmat_ctx->n_lambda);CHKERRQ(ierr); 20653425bc38SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 20663425bc38SStefano Zampini } 20673425bc38SStefano Zampini 20683425bc38SStefano Zampini /* TEST C: It should holds B_delta*w=0, w\in\widehat{W} */ 20693425bc38SStefano Zampini /* This is the meaning of the B matrix */ 20703425bc38SStefano Zampini 20713425bc38SStefano Zampini ierr = VecSetRandom(pcis->vec1_N,PETSC_NULL);CHKERRQ(ierr); 20723425bc38SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 20733425bc38SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 20743425bc38SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 20753425bc38SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 20763425bc38SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 20773425bc38SStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 20783425bc38SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 
20793425bc38SStefano Zampini /* Action of B_delta */ 20803425bc38SStefano Zampini ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr); 20813425bc38SStefano Zampini ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr); 20823425bc38SStefano Zampini ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 20833425bc38SStefano Zampini ierr = VecScatterEnd (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 20843425bc38SStefano Zampini ierr = VecNorm(lambda_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr); 20853425bc38SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"C[coll]: CHECK infty norm of B_delta*w (w continuous): % 1.14e\n",scalar_value);CHKERRQ(ierr); 20863425bc38SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 20873425bc38SStefano Zampini 20883425bc38SStefano Zampini /* TEST D: It should holds E_Dw = w - P_Dw w\in\widetilde{W} */ 20893425bc38SStefano Zampini /* E_D = R_D^TR */ 20903425bc38SStefano Zampini /* P_D = B_{D,delta}^T B_{delta} */ 20913425bc38SStefano Zampini /* eq.44 Mandel Tezaur and Dohrmann 2005 */ 20923425bc38SStefano Zampini 20933425bc38SStefano Zampini /* compute a random vector in \widetilde{W} */ 20943425bc38SStefano Zampini ierr = VecSetRandom(pcis->vec1_N,PETSC_NULL);CHKERRQ(ierr); 20952fa5cd67SKarl Rupp 20963425bc38SStefano Zampini scalar_value = 0.0; /* set zero at vertices */ 20973425bc38SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 20982fa5cd67SKarl Rupp for (i=0;i<n_vertices;i++) array[vertex_indices[i]] = scalar_value; 20993425bc38SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 21002fa5cd67SKarl Rupp 21013425bc38SStefano Zampini /* store w for final comparison */ 21023425bc38SStefano Zampini ierr = VecDuplicate(pcis->vec1_B,&test_vec);CHKERRQ(ierr); 21033425bc38SStefano Zampini ierr = 
VecScatterBegin(pcis->N_to_B,pcis->vec1_N,test_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 21043425bc38SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_N,test_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 21053425bc38SStefano Zampini 21063425bc38SStefano Zampini /* Jump operator P_D : results stored in pcis->vec1_B */ 21073425bc38SStefano Zampini 21083425bc38SStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 21093425bc38SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 21103425bc38SStefano Zampini /* Action of B_delta */ 21113425bc38SStefano Zampini ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr); 21123425bc38SStefano Zampini ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr); 21133425bc38SStefano Zampini ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 21143425bc38SStefano Zampini ierr = VecScatterEnd (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 21153425bc38SStefano Zampini /* Action of B_Ddelta^T */ 21163425bc38SStefano Zampini ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 21173425bc38SStefano Zampini ierr = VecScatterEnd (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 21183425bc38SStefano Zampini ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr); 21193425bc38SStefano Zampini 21203425bc38SStefano Zampini /* Average operator E_D : results stored in pcis->vec2_B */ 21213425bc38SStefano Zampini 21223425bc38SStefano Zampini ierr = 
VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 21233425bc38SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 21243425bc38SStefano Zampini ierr = VecPointwiseMult(pcis->vec2_B,pcis->D,pcis->vec2_B);CHKERRQ(ierr); 21253425bc38SStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec2_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 21263425bc38SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec2_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 21273425bc38SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 21283425bc38SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 21293425bc38SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 21303425bc38SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 21313425bc38SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 21323425bc38SStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 21333425bc38SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 21343425bc38SStefano Zampini 21353425bc38SStefano Zampini /* test E_D=I-P_D */ 21363425bc38SStefano Zampini scalar_value = 1.0; 21373425bc38SStefano Zampini ierr = VecAXPY(pcis->vec1_B,scalar_value,pcis->vec2_B);CHKERRQ(ierr); 21383425bc38SStefano Zampini scalar_value = -1.0; 21393425bc38SStefano Zampini ierr = VecAXPY(pcis->vec1_B,scalar_value,test_vec);CHKERRQ(ierr); 21403425bc38SStefano Zampini ierr = VecNorm(pcis->vec1_B,NORM_INFINITY,&scalar_value);CHKERRQ(ierr); 
21413425bc38SStefano Zampini ierr = VecDestroy(&test_vec);CHKERRQ(ierr); 21423425bc38SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"D[%04d] CHECK infty norm of E_D + P_D - I: % 1.14e\n",rank,scalar_value);CHKERRQ(ierr); 21433425bc38SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 21443425bc38SStefano Zampini 21453425bc38SStefano Zampini /* TEST E: It should holds R_D^TP_Dw=0 w\in\widetilde{W} */ 21463425bc38SStefano Zampini /* eq.48 Mandel Tezaur and Dohrmann 2005 */ 21473425bc38SStefano Zampini 21483425bc38SStefano Zampini ierr = VecSetRandom(pcis->vec1_N,PETSC_NULL);CHKERRQ(ierr); 21493425bc38SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 21502fa5cd67SKarl Rupp 21513425bc38SStefano Zampini scalar_value = 0.0; /* set zero at vertices */ 21522fa5cd67SKarl Rupp for (i=0;i<n_vertices;i++) array[vertex_indices[i]]=scalar_value; 21533425bc38SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 21543425bc38SStefano Zampini 21553425bc38SStefano Zampini /* Jump operator P_D : results stored in pcis->vec1_B */ 21563425bc38SStefano Zampini 21573425bc38SStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 21583425bc38SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 21593425bc38SStefano Zampini /* Action of B_delta */ 21603425bc38SStefano Zampini ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr); 21613425bc38SStefano Zampini ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr); 21623425bc38SStefano Zampini ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 21633425bc38SStefano Zampini ierr = VecScatterEnd (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 
21643425bc38SStefano Zampini /* Action of B_Ddelta^T */ 21653425bc38SStefano Zampini ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 21663425bc38SStefano Zampini ierr = VecScatterEnd (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 21673425bc38SStefano Zampini ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr); 21683425bc38SStefano Zampini /* diagonal scaling */ 21693425bc38SStefano Zampini ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr); 21703425bc38SStefano Zampini /* sum on the interface */ 21713425bc38SStefano Zampini ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr); 21723425bc38SStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 21733425bc38SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 21743425bc38SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 21753425bc38SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 21763425bc38SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 21773425bc38SStefano Zampini ierr = VecNorm(pcis->vec1_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr); 21783425bc38SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"E[coll]: CHECK infty norm of R^T_D P_D: % 1.14e\n",scalar_value);CHKERRQ(ierr); 21793425bc38SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 21803425bc38SStefano Zampini 21813425bc38SStefano Zampini if (!fully_redundant) { 21823425bc38SStefano Zampini /* TEST F: It should holds B_{delta}B^T_{D,delta}=I */ 21833425bc38SStefano Zampini /* Corollary thm 14 Mandel Tezaur and 
Dohrmann 2005 */ 21843425bc38SStefano Zampini ierr = VecDuplicate(lambda_global,&test_vec);CHKERRQ(ierr); 21853425bc38SStefano Zampini ierr = VecSetRandom(lambda_global,PETSC_NULL);CHKERRQ(ierr); 21863425bc38SStefano Zampini /* Action of B_Ddelta^T */ 21873425bc38SStefano Zampini ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 21883425bc38SStefano Zampini ierr = VecScatterEnd (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 21893425bc38SStefano Zampini ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr); 21903425bc38SStefano Zampini /* Action of B_delta */ 21913425bc38SStefano Zampini ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr); 21923425bc38SStefano Zampini ierr = VecSet(test_vec,0.0);CHKERRQ(ierr); 21933425bc38SStefano Zampini ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,test_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 21943425bc38SStefano Zampini ierr = VecScatterEnd (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,test_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 21953425bc38SStefano Zampini scalar_value = -1.0; 21963425bc38SStefano Zampini ierr = VecAXPY(lambda_global,scalar_value,test_vec);CHKERRQ(ierr); 21973425bc38SStefano Zampini ierr = VecNorm(lambda_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr); 21983425bc38SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"E[coll]: CHECK infty norm of P^T_D - I: % 1.14e\n",scalar_value);CHKERRQ(ierr); 21993425bc38SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 22003425bc38SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 22013425bc38SStefano Zampini ierr = VecDestroy(&test_vec);CHKERRQ(ierr); 22023425bc38SStefano Zampini } 22033425bc38SStefano Zampini } 22043425bc38SStefano Zampini /* 
final cleanup */ 22053425bc38SStefano Zampini ierr = PetscFree(vertex_indices);CHKERRQ(ierr); 22063425bc38SStefano Zampini ierr = VecDestroy(&lambda_global);CHKERRQ(ierr); 22073425bc38SStefano Zampini PetscFunctionReturn(0); 22083425bc38SStefano Zampini } 22093425bc38SStefano Zampini 22103425bc38SStefano Zampini #undef __FUNCT__ 22113425bc38SStefano Zampini #define __FUNCT__ "PCBDDCSetupFETIDPPCContext" 22123425bc38SStefano Zampini static PetscErrorCode PCBDDCSetupFETIDPPCContext(Mat fetimat, FETIDPPC_ctx *fetidppc_ctx) 22133425bc38SStefano Zampini { 22143425bc38SStefano Zampini FETIDPMat_ctx *mat_ctx; 22153425bc38SStefano Zampini PetscErrorCode ierr; 22163425bc38SStefano Zampini 22173425bc38SStefano Zampini PetscFunctionBegin; 22183425bc38SStefano Zampini ierr = MatShellGetContext(fetimat,&mat_ctx);CHKERRQ(ierr); 22193425bc38SStefano Zampini /* get references from objects created when setting up feti mat context */ 22203425bc38SStefano Zampini ierr = PetscObjectReference((PetscObject)mat_ctx->lambda_local);CHKERRQ(ierr); 22212fa5cd67SKarl Rupp 22223425bc38SStefano Zampini fetidppc_ctx->lambda_local = mat_ctx->lambda_local; 22232fa5cd67SKarl Rupp 22243425bc38SStefano Zampini ierr = PetscObjectReference((PetscObject)mat_ctx->B_Ddelta);CHKERRQ(ierr); 22252fa5cd67SKarl Rupp 22263425bc38SStefano Zampini fetidppc_ctx->B_Ddelta = mat_ctx->B_Ddelta; 22272fa5cd67SKarl Rupp 22283425bc38SStefano Zampini ierr = PetscObjectReference((PetscObject)mat_ctx->l2g_lambda);CHKERRQ(ierr); 22292fa5cd67SKarl Rupp 22303425bc38SStefano Zampini fetidppc_ctx->l2g_lambda = mat_ctx->l2g_lambda; 22313425bc38SStefano Zampini PetscFunctionReturn(0); 22323425bc38SStefano Zampini } 22333425bc38SStefano Zampini 22343425bc38SStefano Zampini #undef __FUNCT__ 22353425bc38SStefano Zampini #define __FUNCT__ "FETIDPMatMult" 22363425bc38SStefano Zampini static PetscErrorCode FETIDPMatMult(Mat fetimat, Vec x, Vec y) 22373425bc38SStefano Zampini { 22383425bc38SStefano Zampini FETIDPMat_ctx *mat_ctx; 
22393425bc38SStefano Zampini PC_IS *pcis; 22403425bc38SStefano Zampini PetscErrorCode ierr; 22413425bc38SStefano Zampini 22423425bc38SStefano Zampini PetscFunctionBegin; 22433425bc38SStefano Zampini ierr = MatShellGetContext(fetimat,&mat_ctx);CHKERRQ(ierr); 22443425bc38SStefano Zampini pcis = (PC_IS*)mat_ctx->pc->data; 22453425bc38SStefano Zampini /* Application of B_delta^T */ 22463425bc38SStefano Zampini ierr = VecScatterBegin(mat_ctx->l2g_lambda,x,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 22473425bc38SStefano Zampini ierr = VecScatterEnd(mat_ctx->l2g_lambda,x,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 22483425bc38SStefano Zampini ierr = MatMultTranspose(mat_ctx->B_delta,mat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr); 22493425bc38SStefano Zampini /* Application of \widetilde{S}^-1 */ 22503425bc38SStefano Zampini ierr = VecSet(pcis->vec1_D,0.0);CHKERRQ(ierr); 22513425bc38SStefano Zampini ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr); 22523425bc38SStefano Zampini /* Application of B_delta */ 22533425bc38SStefano Zampini ierr = MatMult(mat_ctx->B_delta,pcis->vec1_B,mat_ctx->lambda_local);CHKERRQ(ierr); 22543425bc38SStefano Zampini ierr = VecSet(y,0.0);CHKERRQ(ierr); 22553425bc38SStefano Zampini ierr = VecScatterBegin(mat_ctx->l2g_lambda,mat_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 22563425bc38SStefano Zampini ierr = VecScatterEnd(mat_ctx->l2g_lambda,mat_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 22573425bc38SStefano Zampini PetscFunctionReturn(0); 22583425bc38SStefano Zampini } 22593425bc38SStefano Zampini 22603425bc38SStefano Zampini #undef __FUNCT__ 22613425bc38SStefano Zampini #define __FUNCT__ "FETIDPPCApply" 22623425bc38SStefano Zampini static PetscErrorCode FETIDPPCApply(PC fetipc, Vec x, Vec y) 22633425bc38SStefano Zampini { 22643425bc38SStefano Zampini FETIDPPC_ctx *pc_ctx; 22653425bc38SStefano Zampini PC_IS *pcis; 22663425bc38SStefano 
Zampini PetscErrorCode ierr; 22673425bc38SStefano Zampini 22683425bc38SStefano Zampini PetscFunctionBegin; 22693425bc38SStefano Zampini ierr = PCShellGetContext(fetipc,(void**)&pc_ctx); 22703425bc38SStefano Zampini pcis = (PC_IS*)pc_ctx->pc->data; 22713425bc38SStefano Zampini /* Application of B_Ddelta^T */ 22723425bc38SStefano Zampini ierr = VecScatterBegin(pc_ctx->l2g_lambda,x,pc_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 22733425bc38SStefano Zampini ierr = VecScatterEnd(pc_ctx->l2g_lambda,x,pc_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 22743425bc38SStefano Zampini ierr = VecSet(pcis->vec2_B,0.0);CHKERRQ(ierr); 22753425bc38SStefano Zampini ierr = MatMultTranspose(pc_ctx->B_Ddelta,pc_ctx->lambda_local,pcis->vec2_B);CHKERRQ(ierr); 22763425bc38SStefano Zampini /* Application of S */ 22773425bc38SStefano Zampini ierr = PCISApplySchur(pc_ctx->pc,pcis->vec2_B,pcis->vec1_B,(Vec)0,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr); 22783425bc38SStefano Zampini /* Application of B_Ddelta */ 22793425bc38SStefano Zampini ierr = MatMult(pc_ctx->B_Ddelta,pcis->vec1_B,pc_ctx->lambda_local);CHKERRQ(ierr); 22803425bc38SStefano Zampini ierr = VecSet(y,0.0);CHKERRQ(ierr); 22813425bc38SStefano Zampini ierr = VecScatterBegin(pc_ctx->l2g_lambda,pc_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 22823425bc38SStefano Zampini ierr = VecScatterEnd(pc_ctx->l2g_lambda,pc_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 22833425bc38SStefano Zampini PetscFunctionReturn(0); 22843425bc38SStefano Zampini } 22853425bc38SStefano Zampini 2286da1bb401SStefano Zampini #undef __FUNCT__ 2287da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetupLocalAdjacencyGraph" 2288da1bb401SStefano Zampini static PetscErrorCode PCBDDCSetupLocalAdjacencyGraph(PC pc) 2289da1bb401SStefano Zampini { 2290da1bb401SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 2291da1bb401SStefano Zampini Mat_IS *matis = (Mat_IS*)pc->pmat->data; 22921a83f524SJed Brown 
PetscInt nvtxs; 22931a83f524SJed Brown const PetscInt *xadj,*adjncy; 2294da1bb401SStefano Zampini Mat mat_adj; 2295da1bb401SStefano Zampini PetscBool symmetrize_rowij=PETSC_TRUE,compressed_rowij=PETSC_FALSE,flg_row=PETSC_TRUE; 2296da1bb401SStefano Zampini PCBDDCGraph mat_graph =pcbddc->mat_graph; 2297da1bb401SStefano Zampini PetscErrorCode ierr; 2298da1bb401SStefano Zampini 2299da1bb401SStefano Zampini PetscFunctionBegin; 2300da1bb401SStefano Zampini /* get CSR adjacency from local matrix if user has not yet provided local graph using PCBDDCSetLocalAdjacencyGraph function */ 2301da1bb401SStefano Zampini if (!mat_graph->xadj) { 2302da1bb401SStefano Zampini ierr = MatConvert(matis->A,MATMPIADJ,MAT_INITIAL_MATRIX,&mat_adj);CHKERRQ(ierr); 2303da1bb401SStefano Zampini ierr = MatGetRowIJ(mat_adj,0,symmetrize_rowij,compressed_rowij,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr); 2304acee19a7SJed Brown if (!flg_row) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in MatGetRowIJ()\n"); 2305da1bb401SStefano Zampini /* Get adjacency into BDDC workspace */ 2306da1bb401SStefano Zampini ierr = PCBDDCSetLocalAdjacencyGraph(pc,nvtxs,xadj,adjncy,PETSC_COPY_VALUES);CHKERRQ(ierr); 2307da1bb401SStefano Zampini ierr = MatRestoreRowIJ(mat_adj,0,symmetrize_rowij,compressed_rowij,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr); 2308acee19a7SJed Brown if (!flg_row) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in MatRestoreRowIJ()\n"); 2309da1bb401SStefano Zampini ierr = MatDestroy(&mat_adj);CHKERRQ(ierr); 2310da1bb401SStefano Zampini } 2311da1bb401SStefano Zampini PetscFunctionReturn(0); 2312da1bb401SStefano Zampini } 2313da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */ 23140c7d97c5SJed Brown #undef __FUNCT__ 23150c7d97c5SJed Brown #define __FUNCT__ "PCBDDCApplyInterfacePreconditioner" 23162617d88aSStefano Zampini static PetscErrorCode PCBDDCApplyInterfacePreconditioner(PC pc) 23170c7d97c5SJed Brown { 23180c7d97c5SJed Brown PetscErrorCode 
ierr; 23190c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)(pc->data); 23200c7d97c5SJed Brown PC_IS *pcis = (PC_IS*)(pc->data); 23213b03a366Sstefano_zampini const PetscScalar zero = 0.0; 23220c7d97c5SJed Brown 23230c7d97c5SJed Brown PetscFunctionBegin; 23240c7d97c5SJed Brown /* Application of PHI^T */ 23250c7d97c5SJed Brown ierr = MatMultTranspose(pcbddc->coarse_phi_B,pcis->vec1_B,pcbddc->vec1_P);CHKERRQ(ierr); 232629622bf0SStefano Zampini if (pcbddc->inexact_prec_type) { ierr = MatMultTransposeAdd(pcbddc->coarse_phi_D,pcis->vec1_D,pcbddc->vec1_P,pcbddc->vec1_P);CHKERRQ(ierr); } 23270c7d97c5SJed Brown 23280c7d97c5SJed Brown /* Scatter data of coarse_rhs */ 2329142dfd88SStefano Zampini if (pcbddc->coarse_rhs) { ierr = VecSet(pcbddc->coarse_rhs,zero);CHKERRQ(ierr); } 23300c7d97c5SJed Brown ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->vec1_P,pcbddc->coarse_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 23310c7d97c5SJed Brown 23320c7d97c5SJed Brown /* Local solution on R nodes */ 23330c7d97c5SJed Brown ierr = VecSet(pcbddc->vec1_R,zero);CHKERRQ(ierr); 23340c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_B,pcis->vec1_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 23350c7d97c5SJed Brown ierr = VecScatterEnd (pcbddc->R_to_B,pcis->vec1_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 233629622bf0SStefano Zampini if (pcbddc->inexact_prec_type) { 23370c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_D,pcis->vec1_D,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 23380c7d97c5SJed Brown ierr = VecScatterEnd (pcbddc->R_to_D,pcis->vec1_D,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 23390c7d97c5SJed Brown } 23400c7d97c5SJed Brown ierr = PCBDDCSolveSaddlePoint(pc);CHKERRQ(ierr); 23410c7d97c5SJed Brown ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr); 23420c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec2_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 23430c7d97c5SJed Brown ierr = 
VecScatterEnd (pcbddc->R_to_B,pcbddc->vec2_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 234429622bf0SStefano Zampini if (pcbddc->inexact_prec_type) { 23450c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec2_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 23460c7d97c5SJed Brown ierr = VecScatterEnd (pcbddc->R_to_D,pcbddc->vec2_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 23470c7d97c5SJed Brown } 23480c7d97c5SJed Brown 23490c7d97c5SJed Brown /* Coarse solution */ 23500c7d97c5SJed Brown ierr = PCBDDCScatterCoarseDataEnd(pc,pcbddc->vec1_P,pcbddc->coarse_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 23510bdf917eSStefano Zampini if (pcbddc->coarse_rhs) { 23520bdf917eSStefano Zampini if (pcbddc->CoarseNullSpace) { 23530bdf917eSStefano Zampini ierr = MatNullSpaceRemove(pcbddc->CoarseNullSpace,pcbddc->coarse_rhs,PETSC_NULL);CHKERRQ(ierr); 23540bdf917eSStefano Zampini } 23550bdf917eSStefano Zampini ierr = KSPSolve(pcbddc->coarse_ksp,pcbddc->coarse_rhs,pcbddc->coarse_vec);CHKERRQ(ierr); 23560bdf917eSStefano Zampini if (pcbddc->CoarseNullSpace) { 23570bdf917eSStefano Zampini ierr = MatNullSpaceRemove(pcbddc->CoarseNullSpace,pcbddc->coarse_vec,PETSC_NULL);CHKERRQ(ierr); 23580bdf917eSStefano Zampini } 23590bdf917eSStefano Zampini } 23600c7d97c5SJed Brown ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 23610c7d97c5SJed Brown ierr = PCBDDCScatterCoarseDataEnd (pc,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 23620c7d97c5SJed Brown 23630c7d97c5SJed Brown /* Sum contributions from two levels */ 23640c7d97c5SJed Brown ierr = MatMultAdd(pcbddc->coarse_phi_B,pcbddc->vec1_P,pcis->vec1_B,pcis->vec1_B);CHKERRQ(ierr); 236529622bf0SStefano Zampini if (pcbddc->inexact_prec_type) { ierr = MatMultAdd(pcbddc->coarse_phi_D,pcbddc->vec1_P,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); } 23660c7d97c5SJed Brown PetscFunctionReturn(0); 
23670c7d97c5SJed Brown } 23680c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 23690c7d97c5SJed Brown #undef __FUNCT__ 23700c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSolveSaddlePoint" 237153cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSolveSaddlePoint(PC pc) 23720c7d97c5SJed Brown { 23730c7d97c5SJed Brown PetscErrorCode ierr; 23740c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)(pc->data); 23750c7d97c5SJed Brown 23760c7d97c5SJed Brown PetscFunctionBegin; 237753cdbc3dSStefano Zampini ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr); 2378534831adSStefano Zampini if (pcbddc->local_auxmat1) { 23790c7d97c5SJed Brown ierr = MatMult(pcbddc->local_auxmat1,pcbddc->vec2_R,pcbddc->vec1_C);CHKERRQ(ierr); 23800c7d97c5SJed Brown ierr = MatMultAdd(pcbddc->local_auxmat2,pcbddc->vec1_C,pcbddc->vec2_R,pcbddc->vec2_R);CHKERRQ(ierr); 23810c7d97c5SJed Brown } 23820c7d97c5SJed Brown PetscFunctionReturn(0); 23830c7d97c5SJed Brown } 23840c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 23850c7d97c5SJed Brown #undef __FUNCT__ 23860c7d97c5SJed Brown #define __FUNCT__ "PCBDDCScatterCoarseDataBegin" 238753cdbc3dSStefano Zampini static PetscErrorCode PCBDDCScatterCoarseDataBegin(PC pc,Vec vec_from, Vec vec_to, InsertMode imode, ScatterMode smode) 23880c7d97c5SJed Brown { 23890c7d97c5SJed Brown PetscErrorCode ierr; 23900c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)(pc->data); 23910c7d97c5SJed Brown 23920c7d97c5SJed Brown PetscFunctionBegin; 23930c7d97c5SJed Brown switch (pcbddc->coarse_communications_type) { 23940c7d97c5SJed Brown case SCATTERS_BDDC: 23950c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->coarse_loc_to_glob,vec_from,vec_to,imode,smode);CHKERRQ(ierr); 23960c7d97c5SJed Brown break; 23970c7d97c5SJed Brown case GATHERS_BDDC: 23980c7d97c5SJed Brown break; 23990c7d97c5SJed Brown } 24000c7d97c5SJed Brown PetscFunctionReturn(0); 24010c7d97c5SJed Brown } 
24020c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 24030c7d97c5SJed Brown #undef __FUNCT__ 24040c7d97c5SJed Brown #define __FUNCT__ "PCBDDCScatterCoarseDataEnd" 240553cdbc3dSStefano Zampini static PetscErrorCode PCBDDCScatterCoarseDataEnd(PC pc,Vec vec_from, Vec vec_to, InsertMode imode, ScatterMode smode) 24060c7d97c5SJed Brown { 24070c7d97c5SJed Brown PetscErrorCode ierr; 24080c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)(pc->data); 24090c7d97c5SJed Brown PetscScalar *array_to; 24100c7d97c5SJed Brown PetscScalar *array_from; 24110c7d97c5SJed Brown MPI_Comm comm=((PetscObject)pc)->comm; 24120c7d97c5SJed Brown PetscInt i; 24130c7d97c5SJed Brown 24140c7d97c5SJed Brown PetscFunctionBegin; 24150c7d97c5SJed Brown switch (pcbddc->coarse_communications_type) { 24160c7d97c5SJed Brown case SCATTERS_BDDC: 24170c7d97c5SJed Brown ierr = VecScatterEnd(pcbddc->coarse_loc_to_glob,vec_from,vec_to,imode,smode);CHKERRQ(ierr); 24180c7d97c5SJed Brown break; 24190c7d97c5SJed Brown case GATHERS_BDDC: 24200c7d97c5SJed Brown if (vec_from) VecGetArray(vec_from,&array_from); 24210c7d97c5SJed Brown if (vec_to) VecGetArray(vec_to,&array_to); 24220c7d97c5SJed Brown switch (pcbddc->coarse_problem_type) { 24230c7d97c5SJed Brown case SEQUENTIAL_BDDC: 24240c7d97c5SJed Brown if (smode == SCATTER_FORWARD) { 242553cdbc3dSStefano Zampini ierr = MPI_Gatherv(&array_from[0],pcbddc->local_primal_size,MPIU_SCALAR,&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,0,comm);CHKERRQ(ierr); 24260c7d97c5SJed Brown if (vec_to) { 24270bdf917eSStefano Zampini if (imode == ADD_VALUES) { 24280bdf917eSStefano Zampini for (i=0;i<pcbddc->replicated_primal_size;i++) { 24290c7d97c5SJed Brown array_to[pcbddc->replicated_local_primal_indices[i]]+=pcbddc->replicated_local_primal_values[i]; 24300c7d97c5SJed Brown } 24310c7d97c5SJed Brown } else { 24320bdf917eSStefano Zampini for 
(i=0;i<pcbddc->replicated_primal_size;i++) { 24330bdf917eSStefano Zampini array_to[pcbddc->replicated_local_primal_indices[i]]=pcbddc->replicated_local_primal_values[i]; 24340bdf917eSStefano Zampini } 24350bdf917eSStefano Zampini } 24360bdf917eSStefano Zampini } 24370bdf917eSStefano Zampini } else { 24380bdf917eSStefano Zampini if (vec_from) { 24390bdf917eSStefano Zampini if (imode == ADD_VALUES) { 24400bdf917eSStefano Zampini printf("Scatter mode %d, insert mode %d for case %d not implemented!\n",smode,imode,pcbddc->coarse_problem_type); 24410bdf917eSStefano Zampini } 24420bdf917eSStefano Zampini for (i=0;i<pcbddc->replicated_primal_size;i++) { 24430c7d97c5SJed Brown pcbddc->replicated_local_primal_values[i]=array_from[pcbddc->replicated_local_primal_indices[i]]; 24440bdf917eSStefano Zampini } 24450bdf917eSStefano Zampini } 244653cdbc3dSStefano Zampini ierr = MPI_Scatterv(&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,&array_to[0],pcbddc->local_primal_size,MPIU_SCALAR,0,comm);CHKERRQ(ierr); 24470c7d97c5SJed Brown } 24480c7d97c5SJed Brown break; 24490c7d97c5SJed Brown case REPLICATED_BDDC: 24500c7d97c5SJed Brown if (smode == SCATTER_FORWARD) { 245153cdbc3dSStefano Zampini ierr = MPI_Allgatherv(&array_from[0],pcbddc->local_primal_size,MPIU_SCALAR,&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,comm);CHKERRQ(ierr); 24520bdf917eSStefano Zampini if (imode == ADD_VALUES) { 24530bdf917eSStefano Zampini for (i=0;i<pcbddc->replicated_primal_size;i++) { 24540c7d97c5SJed Brown array_to[pcbddc->replicated_local_primal_indices[i]]+=pcbddc->replicated_local_primal_values[i]; 24550bdf917eSStefano Zampini } 24560bdf917eSStefano Zampini } else { 24570bdf917eSStefano Zampini for (i=0;i<pcbddc->replicated_primal_size;i++) { 24580bdf917eSStefano Zampini array_to[pcbddc->replicated_local_primal_indices[i]]=pcbddc->replicated_local_primal_values[i]; 
24590bdf917eSStefano Zampini } 24600bdf917eSStefano Zampini } 24610c7d97c5SJed Brown } else { /* no communications needed for SCATTER_REVERSE since needed data is already present */ 24620bdf917eSStefano Zampini if (imode == ADD_VALUES) { 24630bdf917eSStefano Zampini for (i=0;i<pcbddc->local_primal_size;i++) { 24640bdf917eSStefano Zampini array_to[i]+=array_from[pcbddc->local_primal_indices[i]]; 24650bdf917eSStefano Zampini } 24660bdf917eSStefano Zampini } else { 24670bdf917eSStefano Zampini for (i=0;i<pcbddc->local_primal_size;i++) { 24680c7d97c5SJed Brown array_to[i]=array_from[pcbddc->local_primal_indices[i]]; 24690c7d97c5SJed Brown } 24700bdf917eSStefano Zampini } 24710bdf917eSStefano Zampini } 24720c7d97c5SJed Brown break; 247353cdbc3dSStefano Zampini case MULTILEVEL_BDDC: 247453cdbc3dSStefano Zampini break; 247553cdbc3dSStefano Zampini case PARALLEL_BDDC: 247653cdbc3dSStefano Zampini break; 24770c7d97c5SJed Brown } 24780c7d97c5SJed Brown if (vec_from) VecRestoreArray(vec_from,&array_from); 24790c7d97c5SJed Brown if (vec_to) VecRestoreArray(vec_to,&array_to); 24800c7d97c5SJed Brown break; 24810c7d97c5SJed Brown } 24820c7d97c5SJed Brown PetscFunctionReturn(0); 24830c7d97c5SJed Brown } 24840c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 24853b03a366Sstefano_zampini #undef __FUNCT__ 24863b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCCreateConstraintMatrix" 24873b03a366Sstefano_zampini static PetscErrorCode PCBDDCCreateConstraintMatrix(PC pc) 24883b03a366Sstefano_zampini { 24893b03a366Sstefano_zampini PetscErrorCode ierr; 24903b03a366Sstefano_zampini PC_IS *pcis = (PC_IS*)(pc->data); 24913b03a366Sstefano_zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 24923b03a366Sstefano_zampini Mat_IS *matis = (Mat_IS*)pc->pmat->data; 249323d4d1a5SStefano Zampini PetscInt *nnz,*is_indices; 24943b03a366Sstefano_zampini PetscScalar *temp_quadrature_constraint; 2495534831adSStefano Zampini PetscInt 
*temp_indices,*temp_indices_to_constraint,*temp_indices_to_constraint_B,*local_to_B; 24963b03a366Sstefano_zampini PetscInt local_primal_size,i,j,k,total_counts,max_size_of_constraint; 24973b03a366Sstefano_zampini PetscInt n_constraints,n_vertices,size_of_constraint; 2498534831adSStefano Zampini PetscScalar quad_value; 24993b03a366Sstefano_zampini PetscBool nnsp_has_cnst=PETSC_FALSE,use_nnsp_true=pcbddc->use_nnsp_true; 25003b03a366Sstefano_zampini PetscInt nnsp_size =0,nnsp_addone=0,temp_constraints,temp_start_ptr; 25013b03a366Sstefano_zampini IS *used_IS; 250219fd82e9SBarry Smith MatType impMatType=MATSEQAIJ; 25033b03a366Sstefano_zampini PetscBLASInt Bs,Bt,lwork,lierr; 25043b03a366Sstefano_zampini PetscReal tol=1.0e-8; 2505fcda91b4SJed Brown MatNullSpace nearnullsp; 2506fcda91b4SJed Brown const Vec *nearnullvecs; 25073b03a366Sstefano_zampini Vec *localnearnullsp; 25083b03a366Sstefano_zampini PetscScalar *work,*temp_basis,*array_vector,*correlation_mat; 25093b03a366Sstefano_zampini PetscReal *rwork,*singular_vals; 2510534831adSStefano Zampini PetscBLASInt Bone=1,*ipiv; 2511534831adSStefano Zampini Vec temp_vec; 2512534831adSStefano Zampini Mat temp_mat; 2513534831adSStefano Zampini KSP temp_ksp; 2514ffe5efe1SStefano Zampini PC temp_pc; 2515534831adSStefano Zampini PetscInt s,start_constraint,dual_dofs; 2516534831adSStefano Zampini PetscBool compute_submatrix,useksp=PETSC_FALSE; 2517534831adSStefano Zampini PetscInt *aux_primal_permutation,*aux_primal_numbering; 2518534831adSStefano Zampini PetscBool boolforface,*change_basis; 25192fa5cd67SKarl Rupp 2520de534f79Sstefano_zampini /* some ugly conditional declarations */ 25213b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD) 25223b03a366Sstefano_zampini PetscScalar dot_result; 25233b03a366Sstefano_zampini PetscScalar one=1.0,zero=0.0; 25243b03a366Sstefano_zampini PetscInt ii; 25253425bc38SStefano Zampini PetscScalar *singular_vectors; 25263425bc38SStefano Zampini PetscBLASInt *iwork,*ifail; 
25273425bc38SStefano Zampini PetscReal dummy_real,abs_tol; 25283425bc38SStefano Zampini PetscBLASInt eigs_found; 25293b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX) 25303b03a366Sstefano_zampini PetscScalar val1,val2; 25313b03a366Sstefano_zampini #endif 25323425bc38SStefano Zampini #endif 25333b03a366Sstefano_zampini PetscBLASInt dummy_int; 25343b03a366Sstefano_zampini PetscScalar dummy_scalar; 25353b03a366Sstefano_zampini 25363b03a366Sstefano_zampini PetscFunctionBegin; 25373b03a366Sstefano_zampini /* check if near null space is attached to global mat */ 2538fcda91b4SJed Brown ierr = MatGetNearNullSpace(pc->pmat,&nearnullsp);CHKERRQ(ierr); 2539fcda91b4SJed Brown if (nearnullsp) { 2540fcda91b4SJed Brown ierr = MatNullSpaceGetVecs(nearnullsp,&nnsp_has_cnst,&nnsp_size,&nearnullvecs);CHKERRQ(ierr); 25413b03a366Sstefano_zampini } else { /* if near null space is not provided it uses constants */ 25423b03a366Sstefano_zampini nnsp_has_cnst = PETSC_TRUE; 25433b03a366Sstefano_zampini use_nnsp_true = PETSC_TRUE; 25443b03a366Sstefano_zampini } 25452fa5cd67SKarl Rupp if (nnsp_has_cnst) nnsp_addone = 1; 25462fa5cd67SKarl Rupp 25473b03a366Sstefano_zampini /* 25483b03a366Sstefano_zampini Evaluate maximum storage size needed by the procedure 25493b03a366Sstefano_zampini - temp_indices will contain start index of each constraint stored as follows 25503b03a366Sstefano_zampini - temp_indices_to_constraint [temp_indices[i],...,temp[indices[i+1]-1] will contain the indices (in local numbering) on which the constraint acts 2551534831adSStefano Zampini - temp_indices_to_constraint_B[temp_indices[i],...,temp[indices[i+1]-1] will contain the indices (in boundary numbering) on which the constraint acts 25523b03a366Sstefano_zampini - temp_quadrature_constraint [temp_indices[i],...,temp[indices[i+1]-1] will contain the scalars representing the constraint itself 25533b03a366Sstefano_zampini */ 2554da1bb401SStefano Zampini 25553b03a366Sstefano_zampini total_counts = 
pcbddc->n_ISForFaces+pcbddc->n_ISForEdges; 25563b03a366Sstefano_zampini total_counts *= (nnsp_addone+nnsp_size); 25572fa5cd67SKarl Rupp 2558da1bb401SStefano Zampini ierr = ISGetSize(pcbddc->ISForVertices,&n_vertices);CHKERRQ(ierr); 25592fa5cd67SKarl Rupp 2560da1bb401SStefano Zampini total_counts += n_vertices; 25612fa5cd67SKarl Rupp 25623b03a366Sstefano_zampini ierr = PetscMalloc((total_counts+1)*sizeof(PetscInt),&temp_indices);CHKERRQ(ierr); 2563534831adSStefano Zampini ierr = PetscMalloc((total_counts+1)*sizeof(PetscBool),&change_basis);CHKERRQ(ierr); 25642fa5cd67SKarl Rupp 25653b03a366Sstefano_zampini total_counts = 0; 25663b03a366Sstefano_zampini max_size_of_constraint = 0; 25673b03a366Sstefano_zampini for (i=0;i<pcbddc->n_ISForEdges+pcbddc->n_ISForFaces;i++) { 25682fa5cd67SKarl Rupp if (i<pcbddc->n_ISForEdges) used_IS = &pcbddc->ISForEdges[i]; 25692fa5cd67SKarl Rupp else used_IS = &pcbddc->ISForFaces[i-pcbddc->n_ISForEdges]; 25703b03a366Sstefano_zampini ierr = ISGetSize(*used_IS,&j);CHKERRQ(ierr); 25713b03a366Sstefano_zampini total_counts += j; 25723b03a366Sstefano_zampini if (j>max_size_of_constraint) max_size_of_constraint=j; 25733b03a366Sstefano_zampini } 25743b03a366Sstefano_zampini total_counts *= (nnsp_addone+nnsp_size); 2575da1bb401SStefano Zampini total_counts += n_vertices; 25762fa5cd67SKarl Rupp 25773b03a366Sstefano_zampini ierr = PetscMalloc(total_counts*sizeof(PetscScalar),&temp_quadrature_constraint);CHKERRQ(ierr); 25783b03a366Sstefano_zampini ierr = PetscMalloc(total_counts*sizeof(PetscInt),&temp_indices_to_constraint);CHKERRQ(ierr); 2579534831adSStefano Zampini ierr = PetscMalloc(total_counts*sizeof(PetscInt),&temp_indices_to_constraint_B);CHKERRQ(ierr); 2580534831adSStefano Zampini ierr = PetscMalloc(pcis->n*sizeof(PetscInt),&local_to_B);CHKERRQ(ierr); 2581534831adSStefano Zampini ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 25822fa5cd67SKarl Rupp 25832fa5cd67SKarl Rupp for (i=0;i<pcis->n;i++) 
local_to_B[i]=-1; 25842fa5cd67SKarl Rupp for (i=0;i<pcis->n_B;i++) local_to_B[is_indices[i]]=i; 2585534831adSStefano Zampini ierr = ISRestoreIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 2586534831adSStefano Zampini 25873b03a366Sstefano_zampini /* First we issue queries to allocate optimal workspace for LAPACKgesvd or LAPACKsyev/LAPACKheev */ 25883b03a366Sstefano_zampini rwork = 0; 25893b03a366Sstefano_zampini work = 0; 25903b03a366Sstefano_zampini singular_vals = 0; 25913b03a366Sstefano_zampini temp_basis = 0; 25923b03a366Sstefano_zampini correlation_mat = 0; 25933b03a366Sstefano_zampini if (!pcbddc->use_nnsp_true) { 25943b03a366Sstefano_zampini PetscScalar temp_work; 25953b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD) 25963b03a366Sstefano_zampini /* POD */ 25973b03a366Sstefano_zampini PetscInt max_n; 25983b03a366Sstefano_zampini max_n = nnsp_addone+nnsp_size; 25993b03a366Sstefano_zampini /* using some techniques borrowed from Proper Orthogonal Decomposition */ 26003b03a366Sstefano_zampini ierr = PetscMalloc(max_n*max_n*sizeof(PetscScalar),&correlation_mat);CHKERRQ(ierr); 26013425bc38SStefano Zampini ierr = PetscMalloc(max_n*max_n*sizeof(PetscScalar),&singular_vectors);CHKERRQ(ierr); 26023b03a366Sstefano_zampini ierr = PetscMalloc(max_n*sizeof(PetscReal),&singular_vals);CHKERRQ(ierr); 26033b03a366Sstefano_zampini ierr = PetscMalloc(max_size_of_constraint*(nnsp_addone+nnsp_size)*sizeof(PetscScalar),&temp_basis);CHKERRQ(ierr); 26043b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX) 26053b03a366Sstefano_zampini ierr = PetscMalloc(3*max_n*sizeof(PetscReal),&rwork);CHKERRQ(ierr); 26063b03a366Sstefano_zampini #endif 26073425bc38SStefano Zampini ierr = PetscMalloc(5*max_n*sizeof(PetscBLASInt),&iwork);CHKERRQ(ierr); 26083425bc38SStefano Zampini ierr = PetscMalloc(max_n*sizeof(PetscBLASInt),&ifail);CHKERRQ(ierr); 26093b03a366Sstefano_zampini /* now we evaluate the optimal workspace using query with lwork=-1 */ 
2610c5df96a5SBarry Smith ierr = PetscBLASIntCast(max_n,&Bt);CHKERRQ(ierr); 26113b03a366Sstefano_zampini lwork =-1; 26123425bc38SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 26133b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX) 26143425bc38SStefano Zampini abs_tol=1.e-8; 26153425bc38SStefano Zampini LAPACKsyevx_("V","A","U",&Bt,correlation_mat,&Bt,&dummy_real,&dummy_real,&dummy_int,&dummy_int, 26163425bc38SStefano Zampini &abs_tol,&eigs_found,singular_vals,singular_vectors,&Bt,&temp_work,&lwork,iwork,ifail,&lierr); 26173b03a366Sstefano_zampini #else 26183425bc38SStefano Zampini SETERRQ(((PetscObject) pc)->comm, PETSC_ERR_SUP, "Not yet implemented for complexes when PETSC_MISSING_GESVD = 1"); 26193b03a366Sstefano_zampini #endif 26203425bc38SStefano Zampini if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SYEVX Lapack routine %d",(int)lierr); 26213425bc38SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 26223b03a366Sstefano_zampini #else /* on missing GESVD */ 26233b03a366Sstefano_zampini /* SVD */ 26243b03a366Sstefano_zampini PetscInt max_n,min_n; 26253b03a366Sstefano_zampini max_n = max_size_of_constraint; 26263b03a366Sstefano_zampini min_n = nnsp_addone+nnsp_size; 26273b03a366Sstefano_zampini if (max_size_of_constraint < (nnsp_addone+nnsp_size)) { 26283b03a366Sstefano_zampini min_n = max_size_of_constraint; 26293b03a366Sstefano_zampini max_n = nnsp_addone+nnsp_size; 26303b03a366Sstefano_zampini } 26313b03a366Sstefano_zampini ierr = PetscMalloc(min_n*sizeof(PetscReal),&singular_vals);CHKERRQ(ierr); 26323b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX) 26333b03a366Sstefano_zampini ierr = PetscMalloc(5*min_n*sizeof(PetscReal),&rwork);CHKERRQ(ierr); 26343b03a366Sstefano_zampini #endif 26353b03a366Sstefano_zampini /* now we evaluate the optimal workspace using query with lwork=-1 */ 26363b03a366Sstefano_zampini lwork =-1; 2637c5df96a5SBarry Smith ierr = PetscBLASIntCast(max_n,&Bs);CHKERRQ(ierr); 
2638c5df96a5SBarry Smith ierr = PetscBLASIntCast(min_n,&Bt);CHKERRQ(ierr); 26393b03a366Sstefano_zampini dummy_int = Bs; 2640670f3ff9SJed Brown ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 26413b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX) 26423b03a366Sstefano_zampini LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[0],&Bs,singular_vals, 26433b03a366Sstefano_zampini &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,&temp_work,&lwork,&lierr); 26443b03a366Sstefano_zampini #else 26453b03a366Sstefano_zampini LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[0],&Bs,singular_vals, 26463b03a366Sstefano_zampini &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,&temp_work,&lwork,rwork,&lierr); 26473b03a366Sstefano_zampini #endif 26483b03a366Sstefano_zampini if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SVD Lapack routine %d",(int)lierr); 2649670f3ff9SJed Brown ierr = PetscFPTrapPop();CHKERRQ(ierr); 26503b03a366Sstefano_zampini #endif 26513b03a366Sstefano_zampini /* Allocate optimal workspace */ 2652c5df96a5SBarry Smith ierr = PetscBLASIntCast((PetscInt)PetscRealPart(temp_work),&lwork);CHKERRQ(ierr); 26533b03a366Sstefano_zampini total_counts = (PetscInt)lwork; 26543b03a366Sstefano_zampini ierr = PetscMalloc(total_counts*sizeof(PetscScalar),&work);CHKERRQ(ierr); 26553b03a366Sstefano_zampini } 26563b03a366Sstefano_zampini /* get local part of global near null space vectors */ 26573b03a366Sstefano_zampini ierr = PetscMalloc(nnsp_size*sizeof(Vec),&localnearnullsp);CHKERRQ(ierr); 26583b03a366Sstefano_zampini for (k=0; k<nnsp_size; k++) { 26593b03a366Sstefano_zampini ierr = VecDuplicate(pcis->vec1_N,&localnearnullsp[k]);CHKERRQ(ierr); 2660fcda91b4SJed Brown ierr = VecScatterBegin(matis->ctx,nearnullvecs[k],localnearnullsp[k],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 2661fcda91b4SJed Brown ierr = VecScatterEnd (matis->ctx,nearnullvecs[k],localnearnullsp[k],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 
26623b03a366Sstefano_zampini } 26633b03a366Sstefano_zampini /* Now we can loop on constraining sets */ 26643b03a366Sstefano_zampini total_counts =0; 26653b03a366Sstefano_zampini temp_indices[0]=0; 2666da1bb401SStefano Zampini /* vertices */ 2667da1bb401SStefano Zampini PetscBool used_vertex; 2668da1bb401SStefano Zampini ierr = ISGetIndices(pcbddc->ISForVertices,(const PetscInt**)&is_indices);CHKERRQ(ierr); 2669da1bb401SStefano Zampini if (nnsp_has_cnst) { /* consider all vertices */ 2670da1bb401SStefano Zampini for (i=0; i<n_vertices; i++) { 2671da1bb401SStefano Zampini temp_indices_to_constraint[temp_indices[total_counts]] = is_indices[i]; 2672534831adSStefano Zampini temp_indices_to_constraint_B[temp_indices[total_counts]]= local_to_B[is_indices[i]]; 2673da1bb401SStefano Zampini temp_quadrature_constraint[temp_indices[total_counts]] = 1.0; 2674da1bb401SStefano Zampini temp_indices[total_counts+1] = temp_indices[total_counts]+1; 2675534831adSStefano Zampini change_basis[total_counts] = PETSC_FALSE; 2676da1bb401SStefano Zampini total_counts++; 2677da1bb401SStefano Zampini } 2678da1bb401SStefano Zampini } else { /* consider vertices for which exist at least a localnearnullsp which is not null there */ 2679da1bb401SStefano Zampini for (i=0; i<n_vertices; i++) { 2680da1bb401SStefano Zampini used_vertex = PETSC_FALSE; 2681da1bb401SStefano Zampini k = 0; 2682da1bb401SStefano Zampini while (!used_vertex && k<nnsp_size) { 2683da1bb401SStefano Zampini ierr = VecGetArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr); 2684da1bb401SStefano Zampini if (PetscAbsScalar(array_vector[is_indices[i]])>0.0) { 2685da1bb401SStefano Zampini temp_indices_to_constraint[temp_indices[total_counts]] =is_indices[i]; 2686534831adSStefano Zampini temp_indices_to_constraint_B[temp_indices[total_counts]]=local_to_B[is_indices[i]]; 2687da1bb401SStefano Zampini temp_quadrature_constraint[temp_indices[total_counts]] =1.0; 2688da1bb401SStefano Zampini 
temp_indices[total_counts+1] =temp_indices[total_counts]+1; 2689534831adSStefano Zampini change_basis[total_counts] =PETSC_FALSE; 2690da1bb401SStefano Zampini total_counts++; 2691da1bb401SStefano Zampini used_vertex=PETSC_TRUE; 2692da1bb401SStefano Zampini } 2693da1bb401SStefano Zampini ierr = VecRestoreArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr); 2694da1bb401SStefano Zampini k++; 2695da1bb401SStefano Zampini } 2696da1bb401SStefano Zampini } 2697da1bb401SStefano Zampini } 2698da1bb401SStefano Zampini ierr = ISRestoreIndices(pcbddc->ISForVertices,(const PetscInt**)&is_indices);CHKERRQ(ierr); 2699da1bb401SStefano Zampini n_vertices = total_counts; 27002fa5cd67SKarl Rupp 2701da1bb401SStefano Zampini /* edges and faces */ 27023b03a366Sstefano_zampini for (i=0; i<pcbddc->n_ISForEdges+pcbddc->n_ISForFaces; i++) { 27033b03a366Sstefano_zampini if (i<pcbddc->n_ISForEdges) { 27043b03a366Sstefano_zampini used_IS = &pcbddc->ISForEdges[i]; 2705534831adSStefano Zampini boolforface = pcbddc->usechangeofbasis; 27063b03a366Sstefano_zampini } else { 27073b03a366Sstefano_zampini used_IS = &pcbddc->ISForFaces[i-pcbddc->n_ISForEdges]; 2708534831adSStefano Zampini boolforface = pcbddc->usechangeonfaces; 27093b03a366Sstefano_zampini } 27103b03a366Sstefano_zampini temp_constraints = 0; /* zero the number of constraints I have on this conn comp */ 27113b03a366Sstefano_zampini temp_start_ptr = total_counts; /* need to know the starting index of constraints stored */ 27123b03a366Sstefano_zampini ierr = ISGetSize(*used_IS,&size_of_constraint);CHKERRQ(ierr); 27133b03a366Sstefano_zampini ierr = ISGetIndices(*used_IS,(const PetscInt**)&is_indices);CHKERRQ(ierr); 27143b03a366Sstefano_zampini if (nnsp_has_cnst) { 27153b03a366Sstefano_zampini temp_constraints++; 2716534831adSStefano Zampini quad_value = (PetscScalar) (1.0/PetscSqrtReal((PetscReal)size_of_constraint)); 27173b03a366Sstefano_zampini for (j=0; j<size_of_constraint; j++) { 27183b03a366Sstefano_zampini 
temp_indices_to_constraint[temp_indices[total_counts]+j] =is_indices[j]; 2719534831adSStefano Zampini temp_indices_to_constraint_B[temp_indices[total_counts]+j]=local_to_B[is_indices[j]]; 27203b03a366Sstefano_zampini temp_quadrature_constraint[temp_indices[total_counts]+j] =quad_value; 27213b03a366Sstefano_zampini } 27223b03a366Sstefano_zampini temp_indices[total_counts+1]=temp_indices[total_counts]+size_of_constraint; /* store new starting point */ 2723534831adSStefano Zampini change_basis[total_counts] =boolforface; 27243b03a366Sstefano_zampini total_counts++; 27253b03a366Sstefano_zampini } 27263b03a366Sstefano_zampini for (k=0; k<nnsp_size; k++) { 27273b03a366Sstefano_zampini ierr = VecGetArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr); 27283b03a366Sstefano_zampini for (j=0; j<size_of_constraint; j++) { 27293b03a366Sstefano_zampini temp_indices_to_constraint[temp_indices[total_counts]+j] =is_indices[j]; 2730534831adSStefano Zampini temp_indices_to_constraint_B[temp_indices[total_counts]+j]=local_to_B[is_indices[j]]; 27313b03a366Sstefano_zampini temp_quadrature_constraint[temp_indices[total_counts]+j] =array_vector[is_indices[j]]; 27323b03a366Sstefano_zampini } 27333b03a366Sstefano_zampini ierr = VecRestoreArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr); 2734de534f79Sstefano_zampini quad_value = 1.0; 2735de534f79Sstefano_zampini if (use_nnsp_true) { /* check if array is null on the connected component in case use_nnsp_true has been requested */ 2736c5df96a5SBarry Smith ierr = PetscBLASIntCast(size_of_constraint,&Bs);CHKERRQ(ierr); 2737*a83cb05cSBarry Smith PetscStackCall("BLASasum",quad_value = BLASasum_(&Bs,&temp_quadrature_constraint[temp_indices[total_counts]],&Bone)); 2738de534f79Sstefano_zampini } 2739de534f79Sstefano_zampini if (quad_value > 0.0) { /* keep indices and values */ 2740de534f79Sstefano_zampini temp_constraints++; 27413b03a366Sstefano_zampini 
temp_indices[total_counts+1]=temp_indices[total_counts]+size_of_constraint; /* store new starting point */ 2742534831adSStefano Zampini change_basis[total_counts] =boolforface; 27433b03a366Sstefano_zampini total_counts++; 27443b03a366Sstefano_zampini } 2745de534f79Sstefano_zampini } 27463b03a366Sstefano_zampini ierr = ISRestoreIndices(*used_IS,(const PetscInt**)&is_indices);CHKERRQ(ierr); 2747de534f79Sstefano_zampini /* perform SVD on the constraint if use_nnsp_true has not be requested by the user */ 27483b03a366Sstefano_zampini if (!use_nnsp_true) { 2749c5df96a5SBarry Smith ierr = PetscBLASIntCast(size_of_constraint,&Bs);CHKERRQ(ierr); 2750c5df96a5SBarry Smith ierr = PetscBLASIntCast(temp_constraints,&Bt);CHKERRQ(ierr); 2751de534f79Sstefano_zampini 27523b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD) 27533b03a366Sstefano_zampini ierr = PetscMemzero(correlation_mat,Bt*Bt*sizeof(PetscScalar));CHKERRQ(ierr); 27543b03a366Sstefano_zampini /* Store upper triangular part of correlation matrix */ 27553b03a366Sstefano_zampini for (j=0; j<temp_constraints; j++) { 27563b03a366Sstefano_zampini for (k=0; k<j+1; k++) { 27573b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX) 27583425bc38SStefano Zampini /* hand made complex dot product -> replace */ 27593b03a366Sstefano_zampini dot_result = 0.0; 27603b03a366Sstefano_zampini for (ii=0; ii<size_of_constraint; ii++) { 27613b03a366Sstefano_zampini val1 = temp_quadrature_constraint[temp_indices[temp_start_ptr+j]+ii]; 27623b03a366Sstefano_zampini val2 = temp_quadrature_constraint[temp_indices[temp_start_ptr+k]+ii]; 27633b03a366Sstefano_zampini dot_result += val1*PetscConj(val2); 27643b03a366Sstefano_zampini } 27653b03a366Sstefano_zampini #else 2766*a83cb05cSBarry Smith PetscStackCall("BLASdot",dot_result = BLASdot_(&Bs,&temp_quadrature_constraint[temp_indices[temp_start_ptr+j]],&Bone,&temp_quadrature_constraint[temp_indices[temp_start_ptr+k]],&Bone)); 27673b03a366Sstefano_zampini #endif 
27683b03a366Sstefano_zampini correlation_mat[j*temp_constraints+k]=dot_result; 27693b03a366Sstefano_zampini } 27703b03a366Sstefano_zampini } 27713425bc38SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 27723b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX) 27733425bc38SStefano Zampini /* LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,work,&lwork,&lierr); */ 27743425bc38SStefano Zampini LAPACKsyevx_("V","A","U",&Bt,correlation_mat,&Bt,&dummy_real,&dummy_real,&dummy_int,&dummy_int, 27753425bc38SStefano Zampini &abs_tol,&eigs_found,singular_vals,singular_vectors,&Bt,work,&lwork,iwork,ifail,&lierr); 27763b03a366Sstefano_zampini #else 27773425bc38SStefano Zampini /* LAPACK call is missing here! TODO */ 27783425bc38SStefano Zampini SETERRQ(((PetscObject) pc)->comm, PETSC_ERR_SUP, "Not yet implemented for complexes when PETSC_MISSING_GESVD = 1"); 27793b03a366Sstefano_zampini #endif 27803425bc38SStefano Zampini if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYEVX Lapack routine %d",(int)lierr); 27813425bc38SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 27823b03a366Sstefano_zampini /* retain eigenvalues greater than tol: note that lapack SYEV gives eigs in ascending order */ 27833b03a366Sstefano_zampini j=0; 27843b03a366Sstefano_zampini while (j < Bt && singular_vals[j] < tol) j++; 27853b03a366Sstefano_zampini total_counts=total_counts-j; 27863b03a366Sstefano_zampini if (j<temp_constraints) { 27872fa5cd67SKarl Rupp for (k=j;k<Bt;k++) singular_vals[k]=1.0/PetscSqrtReal(singular_vals[k]); 27883425bc38SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 2789*a83cb05cSBarry Smith PetscStackCall("BLASgemm",BLASgemm_("N","N",&Bs,&Bt,&Bt,&one,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,correlation_mat,&Bt,&zero,temp_basis,&Bs)); 27903425bc38SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 27913b03a366Sstefano_zampini /* copy POD basis into used quadrature memory */ 
27923b03a366Sstefano_zampini for (k=0;k<Bt-j;k++) { 27933b03a366Sstefano_zampini for (ii=0;ii<size_of_constraint;ii++) { 27943b03a366Sstefano_zampini temp_quadrature_constraint[temp_indices[temp_start_ptr+k]+ii]=singular_vals[Bt-1-k]*temp_basis[(Bt-1-k)*size_of_constraint+ii]; 27953b03a366Sstefano_zampini } 27963b03a366Sstefano_zampini } 27973b03a366Sstefano_zampini } 2798de534f79Sstefano_zampini 27993b03a366Sstefano_zampini #else /* on missing GESVD */ 28003b03a366Sstefano_zampini PetscInt min_n = temp_constraints; 28013b03a366Sstefano_zampini if (min_n > size_of_constraint) min_n = size_of_constraint; 28023b03a366Sstefano_zampini dummy_int = Bs; 2803670f3ff9SJed Brown ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 28043b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX) 28053b03a366Sstefano_zampini LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,singular_vals, 28063b03a366Sstefano_zampini &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,work,&lwork,&lierr); 28073b03a366Sstefano_zampini #else 28083b03a366Sstefano_zampini LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,singular_vals, 28093b03a366Sstefano_zampini &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,work,&lwork,rwork,&lierr); 28103b03a366Sstefano_zampini #endif 28113b03a366Sstefano_zampini if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SVD Lapack routine %d",(int)lierr); 2812670f3ff9SJed Brown ierr = PetscFPTrapPop();CHKERRQ(ierr); 28133b03a366Sstefano_zampini /* retain eigenvalues greater than tol: note that lapack SVD gives eigs in descending order */ 28143b03a366Sstefano_zampini j=0; 28153b03a366Sstefano_zampini while (j < min_n && singular_vals[min_n-j-1] < tol) j++; 28163b03a366Sstefano_zampini total_counts = total_counts-(PetscInt)Bt+(min_n-j); 28173b03a366Sstefano_zampini #endif 28183b03a366Sstefano_zampini } 28193b03a366Sstefano_zampini } 2820534831adSStefano Zampini 
2821da1bb401SStefano Zampini n_constraints =total_counts-n_vertices; 2822da1bb401SStefano Zampini local_primal_size = total_counts; 28233b03a366Sstefano_zampini /* set quantities in pcbddc data structure */ 28243b03a366Sstefano_zampini pcbddc->n_vertices = n_vertices; 28253b03a366Sstefano_zampini pcbddc->n_constraints = n_constraints; 2826da1bb401SStefano Zampini pcbddc->local_primal_size = local_primal_size; 2827534831adSStefano Zampini 2828534831adSStefano Zampini /* Create constraint matrix */ 2829534831adSStefano Zampini /* The constraint matrix is used to compute the l2g map of primal dofs */ 2830534831adSStefano Zampini /* so we need to set it up properly either with or without change of basis */ 2831534831adSStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->ConstraintMatrix);CHKERRQ(ierr); 2832534831adSStefano Zampini ierr = MatSetType(pcbddc->ConstraintMatrix,impMatType);CHKERRQ(ierr); 2833534831adSStefano Zampini ierr = MatSetSizes(pcbddc->ConstraintMatrix,local_primal_size,pcis->n,local_primal_size,pcis->n);CHKERRQ(ierr); 28342fa5cd67SKarl Rupp 2835534831adSStefano Zampini /* compute a local numbering of constraints : vertices first then constraints */ 2836534831adSStefano Zampini ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr); 2837534831adSStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array_vector);CHKERRQ(ierr); 2838534831adSStefano Zampini ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&aux_primal_numbering);CHKERRQ(ierr); 2839534831adSStefano Zampini ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&aux_primal_permutation);CHKERRQ(ierr); 28402fa5cd67SKarl Rupp 2841534831adSStefano Zampini total_counts=0; 28422fa5cd67SKarl Rupp 2843534831adSStefano Zampini /* find vertices: subdomain corners plus dofs with basis changed */ 2844534831adSStefano Zampini for (i=0; i<local_primal_size; i++) { 2845534831adSStefano Zampini size_of_constraint=temp_indices[i+1]-temp_indices[i]; 2846534831adSStefano Zampini if (change_basis[i] || 
size_of_constraint == 1) { 2847534831adSStefano Zampini k=0; 2848534831adSStefano Zampini while (k < size_of_constraint && array_vector[temp_indices_to_constraint[temp_indices[i]+size_of_constraint-k-1]] != 0.0) { 2849534831adSStefano Zampini k=k+1; 2850534831adSStefano Zampini } 2851534831adSStefano Zampini j = temp_indices_to_constraint[temp_indices[i]+size_of_constraint-k-1]; 28522fa5cd67SKarl Rupp 2853534831adSStefano Zampini array_vector[j] = 1.0; 2854534831adSStefano Zampini aux_primal_numbering[total_counts] = j; 2855534831adSStefano Zampini aux_primal_permutation[total_counts] = total_counts; 2856534831adSStefano Zampini total_counts++; 2857534831adSStefano Zampini } 2858534831adSStefano Zampini } 2859534831adSStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array_vector);CHKERRQ(ierr); 2860534831adSStefano Zampini /* permute indices in order to have a sorted set of vertices */ 2861534831adSStefano Zampini ierr = PetscSortIntWithPermutation(total_counts,aux_primal_numbering,aux_primal_permutation); 2862534831adSStefano Zampini /* nonzero structure */ 2863534831adSStefano Zampini ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&nnz);CHKERRQ(ierr); 28642fa5cd67SKarl Rupp for (i=0;i<total_counts;i++) nnz[i]=1; 28652fa5cd67SKarl Rupp 2866534831adSStefano Zampini j=total_counts; 2867534831adSStefano Zampini for (i=n_vertices; i<local_primal_size; i++) { 2868534831adSStefano Zampini if (!change_basis[i]) { 2869534831adSStefano Zampini nnz[j]=temp_indices[i+1]-temp_indices[i]; 2870534831adSStefano Zampini j++; 2871534831adSStefano Zampini } 2872534831adSStefano Zampini } 2873534831adSStefano Zampini ierr = MatSeqAIJSetPreallocation(pcbddc->ConstraintMatrix,0,nnz);CHKERRQ(ierr); 2874534831adSStefano Zampini ierr = PetscFree(nnz);CHKERRQ(ierr); 2875534831adSStefano Zampini /* set values in constraint matrix */ 2876534831adSStefano Zampini for (i=0; i<total_counts; i++) { 2877534831adSStefano Zampini j = aux_primal_permutation[i]; 2878534831adSStefano 
Zampini k = aux_primal_numbering[j]; 2879534831adSStefano Zampini ierr = MatSetValue(pcbddc->ConstraintMatrix,i,k,1.0,INSERT_VALUES);CHKERRQ(ierr); 2880534831adSStefano Zampini } 2881534831adSStefano Zampini for (i=n_vertices; i<local_primal_size; i++) { 2882534831adSStefano Zampini if (!change_basis[i]) { 2883534831adSStefano Zampini size_of_constraint = temp_indices[i+1]-temp_indices[i]; 2884534831adSStefano Zampini ierr = MatSetValues(pcbddc->ConstraintMatrix,1,&total_counts,size_of_constraint,&temp_indices_to_constraint[temp_indices[i]],&temp_quadrature_constraint[temp_indices[i]],INSERT_VALUES);CHKERRQ(ierr); 2885534831adSStefano Zampini total_counts++; 2886534831adSStefano Zampini } 2887534831adSStefano Zampini } 2888534831adSStefano Zampini ierr = PetscFree(aux_primal_numbering);CHKERRQ(ierr); 2889534831adSStefano Zampini ierr = PetscFree(aux_primal_permutation);CHKERRQ(ierr); 2890534831adSStefano Zampini /* assembling */ 2891534831adSStefano Zampini ierr = MatAssemblyBegin(pcbddc->ConstraintMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2892534831adSStefano Zampini ierr = MatAssemblyEnd(pcbddc->ConstraintMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2893534831adSStefano Zampini 2894534831adSStefano Zampini /* Create matrix for change of basis. 
We don't need it in case pcbddc->usechangeofbasis is FALSE */ 2895534831adSStefano Zampini if (pcbddc->usechangeofbasis) { 2896534831adSStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr); 2897534831adSStefano Zampini ierr = MatSetType(pcbddc->ChangeOfBasisMatrix,impMatType);CHKERRQ(ierr); 2898534831adSStefano Zampini ierr = MatSetSizes(pcbddc->ChangeOfBasisMatrix,pcis->n_B,pcis->n_B,pcis->n_B,pcis->n_B);CHKERRQ(ierr); 2899534831adSStefano Zampini /* work arrays */ 2900534831adSStefano Zampini /* we need to reuse these arrays, so we free them */ 2901534831adSStefano Zampini ierr = PetscFree(temp_basis);CHKERRQ(ierr); 2902534831adSStefano Zampini ierr = PetscFree(work);CHKERRQ(ierr); 2903534831adSStefano Zampini ierr = PetscMalloc(pcis->n_B*sizeof(PetscInt),&nnz);CHKERRQ(ierr); 2904534831adSStefano Zampini ierr = PetscMalloc((nnsp_addone+nnsp_size)*(nnsp_addone+nnsp_size)*sizeof(PetscScalar),&temp_basis);CHKERRQ(ierr); 2905534831adSStefano Zampini ierr = PetscMalloc((nnsp_addone+nnsp_size)*sizeof(PetscScalar),&work);CHKERRQ(ierr); 2906534831adSStefano Zampini ierr = PetscMalloc((nnsp_addone+nnsp_size)*sizeof(PetscBLASInt),&ipiv);CHKERRQ(ierr); 29072fa5cd67SKarl Rupp for (i=0;i<pcis->n_B;i++) nnz[i]=1; 29082fa5cd67SKarl Rupp 2909534831adSStefano Zampini /* Overestimated nonzeros per row */ 2910534831adSStefano Zampini k=1; 2911534831adSStefano Zampini for (i=pcbddc->n_vertices;i<local_primal_size;i++) { 2912534831adSStefano Zampini if (change_basis[i]) { 2913534831adSStefano Zampini size_of_constraint = temp_indices[i+1]-temp_indices[i]; 29142fa5cd67SKarl Rupp if (k < size_of_constraint) k = size_of_constraint; 29152fa5cd67SKarl Rupp 2916534831adSStefano Zampini for (j=0;j<size_of_constraint;j++) { 2917534831adSStefano Zampini nnz[temp_indices_to_constraint_B[temp_indices[i]+j]] = size_of_constraint; 2918534831adSStefano Zampini } 2919534831adSStefano Zampini } 2920534831adSStefano Zampini } 2921534831adSStefano Zampini ierr = 
MatSeqAIJSetPreallocation(pcbddc->ChangeOfBasisMatrix,0,nnz);CHKERRQ(ierr); 2922534831adSStefano Zampini ierr = PetscFree(nnz);CHKERRQ(ierr); 2923534831adSStefano Zampini /* Temporary array to store indices */ 2924534831adSStefano Zampini ierr = PetscMalloc(k*sizeof(PetscInt),&is_indices);CHKERRQ(ierr); 2925534831adSStefano Zampini /* Set initial identity in the matrix */ 2926534831adSStefano Zampini for (i=0; i<pcis->n_B; i++) { 2927534831adSStefano Zampini ierr = MatSetValue(pcbddc->ChangeOfBasisMatrix,i,i,1.0,INSERT_VALUES);CHKERRQ(ierr); 2928534831adSStefano Zampini } 2929534831adSStefano Zampini /* Now we loop on the constraints which need a change of basis */ 2930534831adSStefano Zampini /* Change of basis matrix is evaluated as the FIRST APPROACH in */ 2931534831adSStefano Zampini /* Klawonn and Widlund, Dual-primal FETI-DP methods for linear elasticity, (6.2.1) */ 2932534831adSStefano Zampini temp_constraints = 0; 293393dc3b60SStefano Zampini if (pcbddc->n_vertices < local_primal_size) { 2934534831adSStefano Zampini temp_start_ptr = temp_indices_to_constraint_B[temp_indices[pcbddc->n_vertices]]; 293593dc3b60SStefano Zampini } 2936534831adSStefano Zampini for (i=pcbddc->n_vertices; i<local_primal_size; i++) { 2937534831adSStefano Zampini if (change_basis[i]) { 2938534831adSStefano Zampini compute_submatrix = PETSC_FALSE; 2939534831adSStefano Zampini useksp = PETSC_FALSE; 2940534831adSStefano Zampini if (temp_start_ptr == temp_indices_to_constraint_B[temp_indices[i]]) { 2941534831adSStefano Zampini temp_constraints++; 294204eaf177SStefano Zampini if (i == local_primal_size -1 || temp_start_ptr != temp_indices_to_constraint_B[temp_indices[i+1]]) { 2943534831adSStefano Zampini compute_submatrix = PETSC_TRUE; 2944534831adSStefano Zampini } 2945534831adSStefano Zampini } 2946534831adSStefano Zampini if (compute_submatrix) { 29472fa5cd67SKarl Rupp if (temp_constraints > 1 || pcbddc->use_nnsp_true) useksp = PETSC_TRUE; 2948534831adSStefano Zampini 
size_of_constraint = temp_indices[i+1]-temp_indices[i]; 2949534831adSStefano Zampini if (useksp) { /* experimental */ 2950534831adSStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&temp_mat);CHKERRQ(ierr); 2951534831adSStefano Zampini ierr = MatSetType(temp_mat,impMatType);CHKERRQ(ierr); 2952534831adSStefano Zampini ierr = MatSetSizes(temp_mat,size_of_constraint,size_of_constraint,size_of_constraint,size_of_constraint);CHKERRQ(ierr); 2953534831adSStefano Zampini ierr = MatSeqAIJSetPreallocation(temp_mat,size_of_constraint,PETSC_NULL);CHKERRQ(ierr); 2954534831adSStefano Zampini } 2955534831adSStefano Zampini /* First _size_of_constraint-temp_constraints_ columns */ 2956534831adSStefano Zampini dual_dofs = size_of_constraint-temp_constraints; 2957534831adSStefano Zampini start_constraint = i+1-temp_constraints; 2958534831adSStefano Zampini for (s=0; s<dual_dofs; s++) { 2959534831adSStefano Zampini is_indices[0] = s; 2960534831adSStefano Zampini for (j=0;j<temp_constraints;j++) { 2961534831adSStefano Zampini for (k=0;k<temp_constraints;k++) { 2962534831adSStefano Zampini temp_basis[j*temp_constraints+k]=temp_quadrature_constraint[temp_indices[start_constraint+k]+s+j+1]; 2963534831adSStefano Zampini } 2964534831adSStefano Zampini work[j] = -temp_quadrature_constraint[temp_indices[start_constraint+j]+s]; 2965534831adSStefano Zampini is_indices[j+1] = s+j+1; 2966534831adSStefano Zampini } 2967534831adSStefano Zampini Bt = temp_constraints; 2968534831adSStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 2969534831adSStefano Zampini LAPACKgesv_(&Bt,&Bone,temp_basis,&Bt,ipiv,work,&Bt,&lierr); 2970534831adSStefano Zampini if (lierr) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GESV Lapack routine %d",(int)lierr); 2971534831adSStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 2972534831adSStefano Zampini j = temp_indices_to_constraint_B[temp_indices[start_constraint]+s]; 2973534831adSStefano Zampini ierr = 
MatSetValues(pcbddc->ChangeOfBasisMatrix,temp_constraints,&temp_indices_to_constraint_B[temp_indices[start_constraint]+s+1],1,&j,work,INSERT_VALUES);CHKERRQ(ierr); 2974534831adSStefano Zampini if (useksp) { 2975534831adSStefano Zampini /* temp mat with transposed rows and columns */ 2976534831adSStefano Zampini ierr = MatSetValues(temp_mat,1,&s,temp_constraints,&is_indices[1],work,INSERT_VALUES);CHKERRQ(ierr); 2977534831adSStefano Zampini ierr = MatSetValue(temp_mat,is_indices[0],is_indices[0],1.0,INSERT_VALUES);CHKERRQ(ierr); 2978534831adSStefano Zampini } 2979534831adSStefano Zampini } 2980534831adSStefano Zampini if (useksp) { 2981534831adSStefano Zampini /* last rows of temp_mat */ 29822fa5cd67SKarl Rupp for (j=0;j<size_of_constraint;j++) is_indices[j] = j; 29832fa5cd67SKarl Rupp 2984534831adSStefano Zampini for (s=0;s<temp_constraints;s++) { 2985534831adSStefano Zampini k = s + dual_dofs; 2986534831adSStefano Zampini ierr = MatSetValues(temp_mat,1,&k,size_of_constraint,is_indices,&temp_quadrature_constraint[temp_indices[start_constraint+s]],INSERT_VALUES);CHKERRQ(ierr); 2987534831adSStefano Zampini } 2988534831adSStefano Zampini ierr = MatAssemblyBegin(temp_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2989534831adSStefano Zampini ierr = MatAssemblyEnd(temp_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2990534831adSStefano Zampini ierr = MatGetVecs(temp_mat,&temp_vec,PETSC_NULL);CHKERRQ(ierr); 2991534831adSStefano Zampini ierr = KSPCreate(PETSC_COMM_SELF,&temp_ksp);CHKERRQ(ierr); 2992534831adSStefano Zampini ierr = KSPSetOperators(temp_ksp,temp_mat,temp_mat,SAME_PRECONDITIONER);CHKERRQ(ierr); 2993534831adSStefano Zampini ierr = KSPSetType(temp_ksp,KSPPREONLY);CHKERRQ(ierr); 2994ffe5efe1SStefano Zampini ierr = KSPGetPC(temp_ksp,&temp_pc);CHKERRQ(ierr); 2995ffe5efe1SStefano Zampini ierr = PCSetType(temp_pc,PCLU);CHKERRQ(ierr); 2996534831adSStefano Zampini ierr = KSPSetUp(temp_ksp);CHKERRQ(ierr); 2997534831adSStefano Zampini for (s=0; s<temp_constraints; s++) { 
2998534831adSStefano Zampini ierr = VecSet(temp_vec,0.0);CHKERRQ(ierr); 2999534831adSStefano Zampini ierr = VecSetValue(temp_vec,s+dual_dofs,1.0,INSERT_VALUES);CHKERRQ(ierr); 3000534831adSStefano Zampini ierr = VecAssemblyBegin(temp_vec);CHKERRQ(ierr); 3001534831adSStefano Zampini ierr = VecAssemblyEnd(temp_vec);CHKERRQ(ierr); 3002534831adSStefano Zampini ierr = KSPSolve(temp_ksp,temp_vec,temp_vec);CHKERRQ(ierr); 3003534831adSStefano Zampini ierr = VecGetArray(temp_vec,&array_vector);CHKERRQ(ierr); 3004534831adSStefano Zampini j = temp_indices_to_constraint_B[temp_indices[start_constraint+s]+size_of_constraint-s-1]; 3005534831adSStefano Zampini /* last columns of change of basis matrix associated to new primal dofs */ 3006534831adSStefano Zampini ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,size_of_constraint,&temp_indices_to_constraint_B[temp_indices[start_constraint+s]],1,&j,array_vector,INSERT_VALUES);CHKERRQ(ierr); 3007534831adSStefano Zampini ierr = VecRestoreArray(temp_vec,&array_vector);CHKERRQ(ierr); 3008534831adSStefano Zampini } 3009534831adSStefano Zampini ierr = MatDestroy(&temp_mat);CHKERRQ(ierr); 3010534831adSStefano Zampini ierr = KSPDestroy(&temp_ksp);CHKERRQ(ierr); 3011534831adSStefano Zampini ierr = VecDestroy(&temp_vec);CHKERRQ(ierr); 3012534831adSStefano Zampini } else { 3013534831adSStefano Zampini /* last columns of change of basis matrix associated to new primal dofs */ 3014534831adSStefano Zampini for (s=0; s<temp_constraints; s++) { 3015534831adSStefano Zampini j = temp_indices_to_constraint_B[temp_indices[start_constraint+s]+size_of_constraint-s-1]; 3016534831adSStefano Zampini ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,size_of_constraint,&temp_indices_to_constraint_B[temp_indices[start_constraint+s]],1,&j,&temp_quadrature_constraint[temp_indices[start_constraint+s]],INSERT_VALUES);CHKERRQ(ierr); 3017534831adSStefano Zampini } 3018534831adSStefano Zampini } 3019534831adSStefano Zampini /* prepare for the next cycle */ 
3020534831adSStefano Zampini temp_constraints = 0; 30212fa5cd67SKarl Rupp if (i != local_primal_size -1) temp_start_ptr = temp_indices_to_constraint_B[temp_indices[i+1]]; 3022534831adSStefano Zampini } 3023534831adSStefano Zampini } 302404eaf177SStefano Zampini } 3025534831adSStefano Zampini /* assembling */ 3026534831adSStefano Zampini ierr = MatAssemblyBegin(pcbddc->ChangeOfBasisMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 3027534831adSStefano Zampini ierr = MatAssemblyEnd(pcbddc->ChangeOfBasisMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 3028534831adSStefano Zampini ierr = PetscFree(ipiv);CHKERRQ(ierr); 3029534831adSStefano Zampini ierr = PetscFree(is_indices);CHKERRQ(ierr); 3030534831adSStefano Zampini } 30313b03a366Sstefano_zampini /* free workspace no longer needed */ 30323b03a366Sstefano_zampini ierr = PetscFree(rwork);CHKERRQ(ierr); 30333b03a366Sstefano_zampini ierr = PetscFree(work);CHKERRQ(ierr); 30343b03a366Sstefano_zampini ierr = PetscFree(temp_basis);CHKERRQ(ierr); 30353b03a366Sstefano_zampini ierr = PetscFree(singular_vals);CHKERRQ(ierr); 30363b03a366Sstefano_zampini ierr = PetscFree(correlation_mat);CHKERRQ(ierr); 30373b03a366Sstefano_zampini ierr = PetscFree(temp_indices);CHKERRQ(ierr); 3038534831adSStefano Zampini ierr = PetscFree(change_basis);CHKERRQ(ierr); 30393b03a366Sstefano_zampini ierr = PetscFree(temp_indices_to_constraint);CHKERRQ(ierr); 3040534831adSStefano Zampini ierr = PetscFree(temp_indices_to_constraint_B);CHKERRQ(ierr); 3041534831adSStefano Zampini ierr = PetscFree(local_to_B);CHKERRQ(ierr); 30423b03a366Sstefano_zampini ierr = PetscFree(temp_quadrature_constraint);CHKERRQ(ierr); 30433425bc38SStefano Zampini #if defined(PETSC_MISSING_LAPACK_GESVD) 30443425bc38SStefano Zampini ierr = PetscFree(iwork);CHKERRQ(ierr); 30453425bc38SStefano Zampini ierr = PetscFree(ifail);CHKERRQ(ierr); 30463425bc38SStefano Zampini ierr = PetscFree(singular_vectors);CHKERRQ(ierr); 30473425bc38SStefano Zampini #endif 3048da1bb401SStefano Zampini for (k=0; 
k<nnsp_size; k++) { 3049da1bb401SStefano Zampini ierr = VecDestroy(&localnearnullsp[k]);CHKERRQ(ierr); 3050da1bb401SStefano Zampini } 30513b03a366Sstefano_zampini ierr = PetscFree(localnearnullsp);CHKERRQ(ierr); 30523b03a366Sstefano_zampini PetscFunctionReturn(0); 30533b03a366Sstefano_zampini } 30543b03a366Sstefano_zampini /* -------------------------------------------------------------------------- */ 30550c7d97c5SJed Brown #undef __FUNCT__ 30560c7d97c5SJed Brown #define __FUNCT__ "PCBDDCCoarseSetUp" 305753cdbc3dSStefano Zampini static PetscErrorCode PCBDDCCoarseSetUp(PC pc) 30580c7d97c5SJed Brown { 30590c7d97c5SJed Brown PetscErrorCode ierr; 30600c7d97c5SJed Brown PC_IS *pcis = (PC_IS*)(pc->data); 30610c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 30620c7d97c5SJed Brown Mat_IS *matis = (Mat_IS*)pc->pmat->data; 3063534831adSStefano Zampini Mat change_mat_all; 30640c7d97c5SJed Brown IS is_R_local; 30650c7d97c5SJed Brown IS is_V_local; 30660c7d97c5SJed Brown IS is_C_local; 30670c7d97c5SJed Brown IS is_aux1; 30680c7d97c5SJed Brown IS is_aux2; 306919fd82e9SBarry Smith VecType impVecType; 307019fd82e9SBarry Smith MatType impMatType; 30710c7d97c5SJed Brown PetscInt n_R =0; 30720c7d97c5SJed Brown PetscInt n_D =0; 30730c7d97c5SJed Brown PetscInt n_B =0; 30740c7d97c5SJed Brown PetscScalar zero =0.0; 30750c7d97c5SJed Brown PetscScalar one =1.0; 30760c7d97c5SJed Brown PetscScalar m_one=-1.0; 30770c7d97c5SJed Brown PetscScalar * array; 30780c7d97c5SJed Brown PetscScalar *coarse_submat_vals; 30790c7d97c5SJed Brown PetscInt *idx_R_local; 30800c7d97c5SJed Brown PetscInt *idx_V_B; 30810c7d97c5SJed Brown PetscScalar *coarsefunctions_errors; 30820c7d97c5SJed Brown PetscScalar *constraints_errors; 30832fa5cd67SKarl Rupp 30840c7d97c5SJed Brown /* auxiliary indices */ 3085534831adSStefano Zampini PetscInt i,j,k; 30862fa5cd67SKarl Rupp 3087e269702eSStefano Zampini /* for verbose output of bddc */ 3088e269702eSStefano Zampini PetscViewer viewer =pcbddc->dbg_viewer; 
3089e269702eSStefano Zampini PetscBool dbg_flag=pcbddc->dbg_flag; 30902fa5cd67SKarl Rupp 3091a0ba757dSStefano Zampini /* for counting coarse dofs */ 3092534831adSStefano Zampini PetscInt n_vertices,n_constraints; 30933b03a366Sstefano_zampini PetscInt size_of_constraint; 30943b03a366Sstefano_zampini PetscInt *row_cmat_indices; 30953b03a366Sstefano_zampini PetscScalar *row_cmat_values; 3096534831adSStefano Zampini PetscInt *vertices,*nnz,*is_indices,*temp_indices; 30970c7d97c5SJed Brown 30980c7d97c5SJed Brown PetscFunctionBegin; 30990c7d97c5SJed Brown /* Set Non-overlapping dimensions */ 31000c7d97c5SJed Brown n_B = pcis->n_B; n_D = pcis->n - n_B; 3101534831adSStefano Zampini /* Set types for local objects needed by BDDC precondtioner */ 3102534831adSStefano Zampini impMatType = MATSEQDENSE; 3103534831adSStefano Zampini impVecType = VECSEQ; 31042fa5cd67SKarl Rupp 3105da1bb401SStefano Zampini /* get vertex indices from constraint matrix */ 3106534831adSStefano Zampini ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscInt),&vertices);CHKERRQ(ierr); 3107534831adSStefano Zampini n_vertices=0; 3108da1bb401SStefano Zampini for (i=0; i<pcbddc->local_primal_size; i++) { 3109da1bb401SStefano Zampini ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr); 3110da1bb401SStefano Zampini if (size_of_constraint == 1) { 3111534831adSStefano Zampini vertices[n_vertices]=row_cmat_indices[0]; 3112534831adSStefano Zampini n_vertices++; 3113a0ba757dSStefano Zampini } 3114da1bb401SStefano Zampini ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr); 3115a0ba757dSStefano Zampini } 3116534831adSStefano Zampini /* Set number of constraints */ 3117534831adSStefano Zampini n_constraints = pcbddc->local_primal_size-n_vertices; 3118534831adSStefano Zampini 3119534831adSStefano Zampini /* vertices in boundary numbering */ 3120534831adSStefano 
Zampini if (n_vertices) { 3121534831adSStefano Zampini ierr = VecSet(pcis->vec1_N,m_one);CHKERRQ(ierr); 3122534831adSStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 31232fa5cd67SKarl Rupp for (i=0; i<n_vertices; i++) array[vertices[i]] = i; 3124534831adSStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 3125534831adSStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 3126534831adSStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 3127534831adSStefano Zampini ierr = PetscMalloc(n_vertices*sizeof(PetscInt),&idx_V_B);CHKERRQ(ierr); 3128534831adSStefano Zampini ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr); 3129534831adSStefano Zampini for (i=0; i<n_vertices; i++) { 3130534831adSStefano Zampini j=0; 31312fa5cd67SKarl Rupp while (array[j] != i) j++; 3132534831adSStefano Zampini idx_V_B[i]=j; 3133534831adSStefano Zampini } 3134534831adSStefano Zampini ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr); 3135534831adSStefano Zampini } 3136534831adSStefano Zampini 3137534831adSStefano Zampini /* transform local matrices if needed */ 3138534831adSStefano Zampini if (pcbddc->usechangeofbasis) { 3139534831adSStefano Zampini ierr = PetscMalloc(pcis->n*sizeof(PetscInt),&nnz);CHKERRQ(ierr); 3140534831adSStefano Zampini ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 31412fa5cd67SKarl Rupp for (i=0;i<n_D;i++) nnz[is_indices[i]] = 1; 3142534831adSStefano Zampini ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 3143534831adSStefano Zampini ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 3144534831adSStefano Zampini k=1; 3145534831adSStefano Zampini for (i=0;i<n_B;i++) { 3146534831adSStefano Zampini ierr = 
MatGetRow(pcbddc->ChangeOfBasisMatrix,i,&j,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr); 3147534831adSStefano Zampini nnz[is_indices[i]]=j; 31482fa5cd67SKarl Rupp if (k < j) k = j; 3149534831adSStefano Zampini ierr = MatRestoreRow(pcbddc->ChangeOfBasisMatrix,i,&j,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr); 3150534831adSStefano Zampini } 3151534831adSStefano Zampini ierr = ISRestoreIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 3152534831adSStefano Zampini /* assemble change of basis matrix on the whole set of local dofs */ 3153534831adSStefano Zampini ierr = PetscMalloc(k*sizeof(PetscInt),&temp_indices);CHKERRQ(ierr); 3154534831adSStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&change_mat_all);CHKERRQ(ierr); 3155534831adSStefano Zampini ierr = MatSetSizes(change_mat_all,pcis->n,pcis->n,pcis->n,pcis->n);CHKERRQ(ierr); 3156534831adSStefano Zampini ierr = MatSetType(change_mat_all,MATSEQAIJ);CHKERRQ(ierr); 3157534831adSStefano Zampini ierr = MatSeqAIJSetPreallocation(change_mat_all,0,nnz);CHKERRQ(ierr); 3158534831adSStefano Zampini ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 3159534831adSStefano Zampini for (i=0; i<n_D; i++) { 3160534831adSStefano Zampini ierr = MatSetValue(change_mat_all,is_indices[i],is_indices[i],1.0,INSERT_VALUES);CHKERRQ(ierr); 3161534831adSStefano Zampini } 3162534831adSStefano Zampini ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 3163534831adSStefano Zampini ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 3164534831adSStefano Zampini for (i=0; i<n_B; i++) { 3165534831adSStefano Zampini ierr = MatGetRow(pcbddc->ChangeOfBasisMatrix,i,&j,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr); 31662fa5cd67SKarl Rupp for (k=0; k<j; k++) temp_indices[k]=is_indices[row_cmat_indices[k]]; 3167534831adSStefano Zampini ierr = 
MatSetValues(change_mat_all,1,&is_indices[i],j,temp_indices,row_cmat_values,INSERT_VALUES);CHKERRQ(ierr); 3168534831adSStefano Zampini ierr = MatRestoreRow(pcbddc->ChangeOfBasisMatrix,i,&j,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr); 3169534831adSStefano Zampini } 3170534831adSStefano Zampini ierr = MatAssemblyBegin(change_mat_all,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 3171534831adSStefano Zampini ierr = MatAssemblyEnd(change_mat_all,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 3172534831adSStefano Zampini ierr = MatPtAP(matis->A,change_mat_all,MAT_INITIAL_MATRIX,1.0,&pcbddc->local_mat);CHKERRQ(ierr); 3173534831adSStefano Zampini ierr = MatDestroy(&pcis->A_IB);CHKERRQ(ierr); 3174534831adSStefano Zampini ierr = MatDestroy(&pcis->A_BI);CHKERRQ(ierr); 3175534831adSStefano Zampini ierr = MatDestroy(&pcis->A_BB);CHKERRQ(ierr); 3176534831adSStefano Zampini ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_I_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&pcis->A_IB);CHKERRQ(ierr); 3177534831adSStefano Zampini ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_B_local,pcis->is_I_local,MAT_INITIAL_MATRIX,&pcis->A_BI);CHKERRQ(ierr); 3178534831adSStefano Zampini ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_B_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&pcis->A_BB);CHKERRQ(ierr); 3179534831adSStefano Zampini ierr = MatDestroy(&change_mat_all);CHKERRQ(ierr); 3180534831adSStefano Zampini ierr = PetscFree(nnz);CHKERRQ(ierr); 3181534831adSStefano Zampini ierr = PetscFree(temp_indices);CHKERRQ(ierr); 3182534831adSStefano Zampini } else { 3183534831adSStefano Zampini /* without change of basis, the local matrix is unchanged */ 3184534831adSStefano Zampini ierr = PetscObjectReference((PetscObject)matis->A);CHKERRQ(ierr); 31852fa5cd67SKarl Rupp 3186534831adSStefano Zampini pcbddc->local_mat = matis->A; 3187534831adSStefano Zampini } 31880bdf917eSStefano Zampini /* Change global null space passed in by the user if change of basis has been performed */ 
31890bdf917eSStefano Zampini if (pcbddc->NullSpace && pcbddc->usechangeofbasis) { 31900bdf917eSStefano Zampini ierr = PCBDDCAdaptNullSpace(pc);CHKERRQ(ierr); 31910bdf917eSStefano Zampini } 3192a0ba757dSStefano Zampini 31930c7d97c5SJed Brown /* Dohrmann's notation: dofs splitted in R (Remaining: all dofs but the vertices) and V (Vertices) */ 31940c7d97c5SJed Brown ierr = VecSet(pcis->vec1_N,one);CHKERRQ(ierr); 31950c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 31962fa5cd67SKarl Rupp for (i=0;i<n_vertices;i++) array[vertices[i]] = zero; 31973b03a366Sstefano_zampini ierr = PetscMalloc((pcis->n - n_vertices)*sizeof(PetscInt),&idx_R_local);CHKERRQ(ierr); 31982fa5cd67SKarl Rupp for (i=0, n_R=0; i<pcis->n; i++) { 31992fa5cd67SKarl Rupp if (array[i] == one) { 32002fa5cd67SKarl Rupp idx_R_local[n_R] = i; 32012fa5cd67SKarl Rupp n_R++; 32022fa5cd67SKarl Rupp } 32032fa5cd67SKarl Rupp } 32040c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 3205e269702eSStefano Zampini if (dbg_flag) { 32060c7d97c5SJed Brown ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr); 32070c7d97c5SJed Brown ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 32080c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d local dimensions\n",PetscGlobalRank);CHKERRQ(ierr); 32090c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local_size = %d, dirichlet_size = %d, boundary_size = %d\n",pcis->n,n_D,n_B);CHKERRQ(ierr); 32103b03a366Sstefano_zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"r_size = %d, v_size = %d, constraints = %d, local_primal_size = %d\n",n_R,n_vertices,n_constraints,pcbddc->local_primal_size);CHKERRQ(ierr); 3211534831adSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"pcbddc->n_vertices = %d, pcbddc->n_constraints = %d\n",pcbddc->n_vertices,pcbddc->n_constraints);CHKERRQ(ierr); 32120c7d97c5SJed Brown ierr = 
PetscViewerFlush(viewer);CHKERRQ(ierr); 32130c7d97c5SJed Brown } 3214534831adSStefano Zampini 32150c7d97c5SJed Brown /* Allocate needed vectors */ 3216534831adSStefano Zampini ierr = VecDuplicate(pcis->vec1_global,&pcbddc->original_rhs);CHKERRQ(ierr); 32173972b0daSStefano Zampini ierr = VecDuplicate(pcis->vec1_global,&pcbddc->temp_solution);CHKERRQ(ierr); 32180c7d97c5SJed Brown ierr = VecDuplicate(pcis->vec1_D,&pcbddc->vec4_D);CHKERRQ(ierr); 32190c7d97c5SJed Brown ierr = VecCreate(PETSC_COMM_SELF,&pcbddc->vec1_R);CHKERRQ(ierr); 32200c7d97c5SJed Brown ierr = VecSetSizes(pcbddc->vec1_R,n_R,n_R);CHKERRQ(ierr); 32210c7d97c5SJed Brown ierr = VecSetType(pcbddc->vec1_R,impVecType);CHKERRQ(ierr); 3222d49ef151SStefano Zampini ierr = VecDuplicate(pcbddc->vec1_R,&pcbddc->vec2_R);CHKERRQ(ierr); 32230c7d97c5SJed Brown ierr = VecCreate(PETSC_COMM_SELF,&pcbddc->vec1_P);CHKERRQ(ierr); 32240c7d97c5SJed Brown ierr = VecSetSizes(pcbddc->vec1_P,pcbddc->local_primal_size,pcbddc->local_primal_size);CHKERRQ(ierr); 32250c7d97c5SJed Brown ierr = VecSetType(pcbddc->vec1_P,impVecType);CHKERRQ(ierr); 32260c7d97c5SJed Brown 32270c7d97c5SJed Brown /* Creating some index sets needed */ 32280c7d97c5SJed Brown /* For submatrices */ 3229da1bb401SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,n_R,idx_R_local,PETSC_OWN_POINTER,&is_R_local);CHKERRQ(ierr); 32303b03a366Sstefano_zampini if (n_vertices) { 3231da1bb401SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,n_vertices,vertices,PETSC_OWN_POINTER,&is_V_local);CHKERRQ(ierr); 32323b03a366Sstefano_zampini } 3233da1bb401SStefano Zampini if (n_constraints) { 3234da1bb401SStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,n_constraints,n_vertices,1,&is_C_local);CHKERRQ(ierr); 3235da1bb401SStefano Zampini } 3236da1bb401SStefano Zampini 32370c7d97c5SJed Brown /* For VecScatters pcbddc->R_to_B and (optionally) pcbddc->R_to_D */ 32380c7d97c5SJed Brown { 32390c7d97c5SJed Brown PetscInt *aux_array1; 32400c7d97c5SJed Brown PetscInt *aux_array2; 
32412e8d2280SStefano Zampini PetscInt *idx_I_local; 32420c7d97c5SJed Brown 32433b03a366Sstefano_zampini ierr = PetscMalloc((pcis->n_B-n_vertices)*sizeof(PetscInt),&aux_array1);CHKERRQ(ierr); 32443b03a366Sstefano_zampini ierr = PetscMalloc((pcis->n_B-n_vertices)*sizeof(PetscInt),&aux_array2);CHKERRQ(ierr); 32450c7d97c5SJed Brown 32462e8d2280SStefano Zampini ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&idx_I_local);CHKERRQ(ierr); 32470c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 32482fa5cd67SKarl Rupp for (i=0; i<n_D; i++) array[idx_I_local[i]] = 0; 32492e8d2280SStefano Zampini ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&idx_I_local);CHKERRQ(ierr); 32502fa5cd67SKarl Rupp for (i=0, j=0; i<n_R; i++) { 32512fa5cd67SKarl Rupp if (array[idx_R_local[i]] == one) { 32522fa5cd67SKarl Rupp aux_array1[j] = i; 32532fa5cd67SKarl Rupp j++; 32542fa5cd67SKarl Rupp } 32552fa5cd67SKarl Rupp } 32560c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 3257da1bb401SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_COPY_VALUES,&is_aux1);CHKERRQ(ierr); 32582e8d2280SStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 32592e8d2280SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 32600c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr); 32612fa5cd67SKarl Rupp for (i=0, j=0; i<n_B; i++) { 32622fa5cd67SKarl Rupp if (array[i] == one) { 32632fa5cd67SKarl Rupp aux_array2[j] = i; j++; 32642fa5cd67SKarl Rupp } 32652fa5cd67SKarl Rupp } 32663828260eSStefano Zampini ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr); 3267da1bb401SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array2,PETSC_COPY_VALUES,&is_aux2);CHKERRQ(ierr); 32680c7d97c5SJed Brown ierr = 
VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_B,is_aux2,&pcbddc->R_to_B);CHKERRQ(ierr); 32690c7d97c5SJed Brown ierr = PetscFree(aux_array1);CHKERRQ(ierr); 32700c7d97c5SJed Brown ierr = PetscFree(aux_array2);CHKERRQ(ierr); 32710c7d97c5SJed Brown ierr = ISDestroy(&is_aux1);CHKERRQ(ierr); 32720c7d97c5SJed Brown ierr = ISDestroy(&is_aux2);CHKERRQ(ierr); 32730c7d97c5SJed Brown 327429622bf0SStefano Zampini if (pcbddc->inexact_prec_type || dbg_flag) { 32750c7d97c5SJed Brown ierr = PetscMalloc(n_D*sizeof(PetscInt),&aux_array1);CHKERRQ(ierr); 32760c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 32772fa5cd67SKarl Rupp for (i=0, j=0; i<n_R; i++) { 32782fa5cd67SKarl Rupp if (array[idx_R_local[i]] == zero) { 32792fa5cd67SKarl Rupp aux_array1[j] = i; 32802fa5cd67SKarl Rupp j++; 32812fa5cd67SKarl Rupp } 32822fa5cd67SKarl Rupp } 32830c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 3284da1bb401SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_COPY_VALUES,&is_aux1);CHKERRQ(ierr); 32850c7d97c5SJed Brown ierr = VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_D,(IS)0,&pcbddc->R_to_D);CHKERRQ(ierr); 32860c7d97c5SJed Brown ierr = PetscFree(aux_array1);CHKERRQ(ierr); 32870c7d97c5SJed Brown ierr = ISDestroy(&is_aux1);CHKERRQ(ierr); 32880c7d97c5SJed Brown } 32890c7d97c5SJed Brown } 32900c7d97c5SJed Brown 32910c7d97c5SJed Brown /* Creating PC contexts for local Dirichlet and Neumann problems */ 32920c7d97c5SJed Brown { 32930c7d97c5SJed Brown Mat A_RR; 329453cdbc3dSStefano Zampini PC pc_temp; 32952fa5cd67SKarl Rupp 32960c7d97c5SJed Brown /* Matrix for Dirichlet problem is A_II -> we already have it from pcis.c code */ 329753cdbc3dSStefano Zampini ierr = KSPCreate(PETSC_COMM_SELF,&pcbddc->ksp_D);CHKERRQ(ierr); 329853cdbc3dSStefano Zampini ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->ksp_D,(PetscObject)pc,1);CHKERRQ(ierr); 329953cdbc3dSStefano Zampini ierr = 
KSPSetOperators(pcbddc->ksp_D,pcis->A_II,pcis->A_II,SAME_PRECONDITIONER);CHKERRQ(ierr); 330053cdbc3dSStefano Zampini ierr = KSPSetType(pcbddc->ksp_D,KSPPREONLY);CHKERRQ(ierr); 3301da1bb401SStefano Zampini ierr = KSPSetOptionsPrefix(pcbddc->ksp_D,"dirichlet_");CHKERRQ(ierr); 33022fa5cd67SKarl Rupp 33030c7d97c5SJed Brown /* default */ 330453cdbc3dSStefano Zampini ierr = KSPGetPC(pcbddc->ksp_D,&pc_temp);CHKERRQ(ierr); 330553cdbc3dSStefano Zampini ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr); 33062fa5cd67SKarl Rupp 33070c7d97c5SJed Brown /* Allow user's customization */ 330853cdbc3dSStefano Zampini ierr = KSPSetFromOptions(pcbddc->ksp_D);CHKERRQ(ierr); 33092fa5cd67SKarl Rupp 3310950d796eSStefano Zampini /* umfpack interface has a bug when matrix dimension is zero */ 3311950d796eSStefano Zampini if (!n_D) { 33122e8d2280SStefano Zampini ierr = PCSetType(pc_temp,PCNONE);CHKERRQ(ierr); 3313950d796eSStefano Zampini } 33142fa5cd67SKarl Rupp 331553cdbc3dSStefano Zampini /* Set Up KSP for Dirichlet problem of BDDC */ 331653cdbc3dSStefano Zampini ierr = KSPSetUp(pcbddc->ksp_D);CHKERRQ(ierr); 33172fa5cd67SKarl Rupp 33183972b0daSStefano Zampini /* set ksp_D into pcis data */ 33193972b0daSStefano Zampini ierr = KSPDestroy(&pcis->ksp_D);CHKERRQ(ierr); 33203972b0daSStefano Zampini ierr = PetscObjectReference((PetscObject)pcbddc->ksp_D);CHKERRQ(ierr); 33213972b0daSStefano Zampini pcis->ksp_D = pcbddc->ksp_D; 33222fa5cd67SKarl Rupp 33230c7d97c5SJed Brown /* Matrix for Neumann problem is A_RR -> we need to create it */ 3324534831adSStefano Zampini ierr = MatGetSubMatrix(pcbddc->local_mat,is_R_local,is_R_local,MAT_INITIAL_MATRIX,&A_RR);CHKERRQ(ierr); 332553cdbc3dSStefano Zampini ierr = KSPCreate(PETSC_COMM_SELF,&pcbddc->ksp_R);CHKERRQ(ierr); 332653cdbc3dSStefano Zampini ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->ksp_R,(PetscObject)pc,1);CHKERRQ(ierr); 332753cdbc3dSStefano Zampini ierr = KSPSetOperators(pcbddc->ksp_R,A_RR,A_RR,SAME_PRECONDITIONER);CHKERRQ(ierr); 
332853cdbc3dSStefano Zampini ierr = KSPSetType(pcbddc->ksp_R,KSPPREONLY);CHKERRQ(ierr); 3329da1bb401SStefano Zampini ierr = KSPSetOptionsPrefix(pcbddc->ksp_R,"neumann_");CHKERRQ(ierr); 33302fa5cd67SKarl Rupp 33310c7d97c5SJed Brown /* default */ 333253cdbc3dSStefano Zampini ierr = KSPGetPC(pcbddc->ksp_R,&pc_temp);CHKERRQ(ierr); 333353cdbc3dSStefano Zampini ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr); 33342fa5cd67SKarl Rupp 33350c7d97c5SJed Brown /* Allow user's customization */ 333653cdbc3dSStefano Zampini ierr = KSPSetFromOptions(pcbddc->ksp_R);CHKERRQ(ierr); 33372fa5cd67SKarl Rupp 3338950d796eSStefano Zampini /* umfpack interface has a bug when matrix dimension is zero */ 3339950d796eSStefano Zampini if (!pcis->n) { 33402e8d2280SStefano Zampini ierr = PCSetType(pc_temp,PCNONE);CHKERRQ(ierr); 3341950d796eSStefano Zampini } 33422fa5cd67SKarl Rupp 334353cdbc3dSStefano Zampini /* Set Up KSP for Neumann problem of BDDC */ 334453cdbc3dSStefano Zampini ierr = KSPSetUp(pcbddc->ksp_R);CHKERRQ(ierr); 33452fa5cd67SKarl Rupp 334629622bf0SStefano Zampini /* check Dirichlet and Neumann solvers and adapt them is a nullspace correction is needed */ 3347b76ba322SStefano Zampini { 33480c7d97c5SJed Brown Vec temp_vec; 3349b76ba322SStefano Zampini PetscReal value; 3350b76ba322SStefano Zampini PetscMPIInt use_exact,use_exact_reduced; 33510c7d97c5SJed Brown 3352a0ba757dSStefano Zampini ierr = VecDuplicate(pcis->vec1_D,&temp_vec);CHKERRQ(ierr); 3353a0ba757dSStefano Zampini ierr = VecSetRandom(pcis->vec1_D,PETSC_NULL);CHKERRQ(ierr); 3354a0ba757dSStefano Zampini ierr = MatMult(pcis->A_II,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr); 3355a0ba757dSStefano Zampini ierr = KSPSolve(pcbddc->ksp_D,pcis->vec2_D,temp_vec);CHKERRQ(ierr); 3356a0ba757dSStefano Zampini ierr = VecAXPY(temp_vec,m_one,pcis->vec1_D);CHKERRQ(ierr); 3357a0ba757dSStefano Zampini ierr = VecNorm(temp_vec,NORM_INFINITY,&value);CHKERRQ(ierr); 335829622bf0SStefano Zampini ierr = VecDestroy(&temp_vec);CHKERRQ(ierr); 
3359b76ba322SStefano Zampini use_exact = 1; 33602fa5cd67SKarl Rupp if (PetscAbsReal(value) > 1.e-4) use_exact = 0; 33612fa5cd67SKarl Rupp 3362b76ba322SStefano Zampini ierr = MPI_Allreduce(&use_exact,&use_exact_reduced,1,MPIU_INT,MPI_LAND,((PetscObject)pc)->comm);CHKERRQ(ierr); 3363b76ba322SStefano Zampini pcbddc->use_exact_dirichlet = (PetscBool) use_exact_reduced; 3364b76ba322SStefano Zampini if (dbg_flag) { 3365a0ba757dSStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 3366a0ba757dSStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr); 3367a0ba757dSStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Checking solution of Dirichlet and Neumann problems\n");CHKERRQ(ierr); 3368a0ba757dSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d infinity error for Dirichlet solve = % 1.14e \n",PetscGlobalRank,value);CHKERRQ(ierr); 336929622bf0SStefano Zampini } 337029622bf0SStefano Zampini if (pcbddc->NullSpace && !use_exact_reduced && !pcbddc->inexact_prec_type) { 337129622bf0SStefano Zampini ierr = PCBDDCAdaptLocalProblem(pc,pcis->is_I_local); 337229622bf0SStefano Zampini } 3373d49ef151SStefano Zampini ierr = VecDuplicate(pcbddc->vec1_R,&temp_vec);CHKERRQ(ierr); 3374d49ef151SStefano Zampini ierr = VecSetRandom(pcbddc->vec1_R,PETSC_NULL);CHKERRQ(ierr); 3375d49ef151SStefano Zampini ierr = MatMult(A_RR,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr); 3376d49ef151SStefano Zampini ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec2_R,temp_vec);CHKERRQ(ierr); 3377d49ef151SStefano Zampini ierr = VecAXPY(temp_vec,m_one,pcbddc->vec1_R);CHKERRQ(ierr); 3378d49ef151SStefano Zampini ierr = VecNorm(temp_vec,NORM_INFINITY,&value);CHKERRQ(ierr); 3379e269702eSStefano Zampini ierr = VecDestroy(&temp_vec);CHKERRQ(ierr); 33802fa5cd67SKarl Rupp 338129622bf0SStefano Zampini use_exact = 1; 33822fa5cd67SKarl Rupp if (PetscAbsReal(value) > 1.e-4) use_exact = 0; 338329622bf0SStefano Zampini ierr = 
MPI_Allreduce(&use_exact,&use_exact_reduced,1,MPIU_INT,MPI_LAND,((PetscObject)pc)->comm);CHKERRQ(ierr); 338429622bf0SStefano Zampini if (dbg_flag) { 33850c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d infinity error for Neumann solve = % 1.14e \n",PetscGlobalRank,value);CHKERRQ(ierr); 3386d49ef151SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 33870c7d97c5SJed Brown } 338829622bf0SStefano Zampini if (pcbddc->NullSpace && !use_exact_reduced) { 338929622bf0SStefano Zampini ierr = PCBDDCAdaptLocalProblem(pc,is_R_local); 339029622bf0SStefano Zampini } 3391b76ba322SStefano Zampini } 33920c7d97c5SJed Brown /* free Neumann problem's matrix */ 33930c7d97c5SJed Brown ierr = MatDestroy(&A_RR);CHKERRQ(ierr); 33940c7d97c5SJed Brown } 33950c7d97c5SJed Brown 33960c7d97c5SJed Brown /* Assemble all remaining stuff needed to apply BDDC */ 33970c7d97c5SJed Brown { 33980c7d97c5SJed Brown Mat A_RV,A_VR,A_VV; 33990bdf917eSStefano Zampini Mat M1; 34000c7d97c5SJed Brown Mat C_CR; 34013b03a366Sstefano_zampini Mat AUXMAT; 34020c7d97c5SJed Brown Vec vec1_C; 34030c7d97c5SJed Brown Vec vec2_C; 34040c7d97c5SJed Brown Vec vec1_V; 34050c7d97c5SJed Brown Vec vec2_V; 34060c7d97c5SJed Brown PetscInt *nnz; 34070c7d97c5SJed Brown PetscInt *auxindices; 340853cdbc3dSStefano Zampini PetscInt index; 34090c7d97c5SJed Brown PetscScalar *array2; 34100c7d97c5SJed Brown MatFactorInfo matinfo; 34110c7d97c5SJed Brown 34120c7d97c5SJed Brown /* Allocating some extra storage just to be safe */ 34130c7d97c5SJed Brown ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&nnz);CHKERRQ(ierr); 34140c7d97c5SJed Brown ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&auxindices);CHKERRQ(ierr); 34152fa5cd67SKarl Rupp for (i=0;i<pcis->n;i++) auxindices[i]=i; 34160c7d97c5SJed Brown 34170c7d97c5SJed Brown /* some work vectors on vertices and/or constraints */ 34183b03a366Sstefano_zampini if (n_vertices) { 34190c7d97c5SJed Brown ierr = VecCreate(PETSC_COMM_SELF,&vec1_V);CHKERRQ(ierr); 
34203b03a366Sstefano_zampini ierr = VecSetSizes(vec1_V,n_vertices,n_vertices);CHKERRQ(ierr); 34210c7d97c5SJed Brown ierr = VecSetType(vec1_V,impVecType);CHKERRQ(ierr); 34220c7d97c5SJed Brown ierr = VecDuplicate(vec1_V,&vec2_V);CHKERRQ(ierr); 34230c7d97c5SJed Brown } 3424534831adSStefano Zampini if (n_constraints) { 34250c7d97c5SJed Brown ierr = VecCreate(PETSC_COMM_SELF,&vec1_C);CHKERRQ(ierr); 3426534831adSStefano Zampini ierr = VecSetSizes(vec1_C,n_constraints,n_constraints);CHKERRQ(ierr); 34270c7d97c5SJed Brown ierr = VecSetType(vec1_C,impVecType);CHKERRQ(ierr); 34280c7d97c5SJed Brown ierr = VecDuplicate(vec1_C,&vec2_C);CHKERRQ(ierr); 34290c7d97c5SJed Brown ierr = VecDuplicate(vec1_C,&pcbddc->vec1_C);CHKERRQ(ierr); 34300c7d97c5SJed Brown } 34310c7d97c5SJed Brown /* Precompute stuffs needed for preprocessing and application of BDDC*/ 34323b03a366Sstefano_zampini if (n_constraints) { 34330c7d97c5SJed Brown ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->local_auxmat2);CHKERRQ(ierr); 34343b03a366Sstefano_zampini ierr = MatSetSizes(pcbddc->local_auxmat2,n_R,n_constraints,n_R,n_constraints);CHKERRQ(ierr); 34350c7d97c5SJed Brown ierr = MatSetType(pcbddc->local_auxmat2,impMatType);CHKERRQ(ierr); 34363b03a366Sstefano_zampini ierr = MatSeqDenseSetPreallocation(pcbddc->local_auxmat2,PETSC_NULL);CHKERRQ(ierr); 34370c7d97c5SJed Brown 343857a90decSStefano Zampini /* Create Constraint matrix on R nodes: C_{CR} */ 343957a90decSStefano Zampini ierr = MatGetSubMatrix(pcbddc->ConstraintMatrix,is_C_local,is_R_local,MAT_INITIAL_MATRIX,&C_CR);CHKERRQ(ierr); 344057a90decSStefano Zampini ierr = ISDestroy(&is_C_local);CHKERRQ(ierr); 344157a90decSStefano Zampini 34420c7d97c5SJed Brown /* Assemble local_auxmat2 = - A_{RR}^{-1} C^T_{CR} needed by BDDC application */ 34433b03a366Sstefano_zampini for (i=0; i<n_constraints; i++) { 34443b03a366Sstefano_zampini ierr = VecSet(pcbddc->vec1_R,zero);CHKERRQ(ierr); 34452fa5cd67SKarl Rupp 34463b03a366Sstefano_zampini /* Get row of constraint matrix in R 
numbering */ 344757a90decSStefano Zampini ierr = VecGetArray(pcbddc->vec1_R,&array);CHKERRQ(ierr); 344857a90decSStefano Zampini ierr = MatGetRow(C_CR,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr); 34492fa5cd67SKarl Rupp for (j=0;j<size_of_constraint;j++) array[row_cmat_indices[j]] = -row_cmat_values[j]; 345057a90decSStefano Zampini ierr = MatRestoreRow(C_CR,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr); 345157a90decSStefano Zampini ierr = VecRestoreArray(pcbddc->vec1_R,&array);CHKERRQ(ierr); 34522fa5cd67SKarl Rupp 34533b03a366Sstefano_zampini /* Solve for row of constraint matrix in R numbering */ 345453cdbc3dSStefano Zampini ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr); 34552fa5cd67SKarl Rupp 34563b03a366Sstefano_zampini /* Set values */ 34570c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec2_R,&array);CHKERRQ(ierr); 34583b03a366Sstefano_zampini ierr = MatSetValues(pcbddc->local_auxmat2,n_R,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr); 34590c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec2_R,&array);CHKERRQ(ierr); 34600c7d97c5SJed Brown } 34610c7d97c5SJed Brown ierr = MatAssemblyBegin(pcbddc->local_auxmat2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 34620c7d97c5SJed Brown ierr = MatAssemblyEnd(pcbddc->local_auxmat2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 34630c7d97c5SJed Brown 34640c7d97c5SJed Brown /* Assemble AUXMAT = (LUFactor)(-C_{CR} A_{RR}^{-1} C^T_{CR})^{-1} */ 34650c7d97c5SJed Brown ierr = MatMatMult(C_CR,pcbddc->local_auxmat2,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&AUXMAT);CHKERRQ(ierr); 3466d49ef151SStefano Zampini ierr = MatFactorInfoInitialize(&matinfo);CHKERRQ(ierr); 34673b03a366Sstefano_zampini ierr = ISCreateStride(PETSC_COMM_SELF,n_constraints,0,1,&is_aux1);CHKERRQ(ierr); 34680c7d97c5SJed Brown ierr = MatLUFactor(AUXMAT,is_aux1,is_aux1,&matinfo);CHKERRQ(ierr); 34690c7d97c5SJed Brown ierr = 
ISDestroy(&is_aux1);CHKERRQ(ierr); 34700c7d97c5SJed Brown 34713b03a366Sstefano_zampini /* Assemble explicitly M1 = (C_{CR} A_{RR}^{-1} C^T_{CR})^{-1} needed in preproc */ 3472d49ef151SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&M1);CHKERRQ(ierr); 34733b03a366Sstefano_zampini ierr = MatSetSizes(M1,n_constraints,n_constraints,n_constraints,n_constraints);CHKERRQ(ierr); 34740c7d97c5SJed Brown ierr = MatSetType(M1,impMatType);CHKERRQ(ierr); 34753b03a366Sstefano_zampini ierr = MatSeqDenseSetPreallocation(M1,PETSC_NULL);CHKERRQ(ierr); 34763b03a366Sstefano_zampini for (i=0; i<n_constraints; i++) { 34770c7d97c5SJed Brown ierr = VecSet(vec1_C,zero);CHKERRQ(ierr); 34780c7d97c5SJed Brown ierr = VecSetValue(vec1_C,i,one,INSERT_VALUES);CHKERRQ(ierr); 34790c7d97c5SJed Brown ierr = VecAssemblyBegin(vec1_C);CHKERRQ(ierr); 34800c7d97c5SJed Brown ierr = VecAssemblyEnd(vec1_C);CHKERRQ(ierr); 34810c7d97c5SJed Brown ierr = MatSolve(AUXMAT,vec1_C,vec2_C);CHKERRQ(ierr); 34820c7d97c5SJed Brown ierr = VecScale(vec2_C,m_one);CHKERRQ(ierr); 34830c7d97c5SJed Brown ierr = VecGetArray(vec2_C,&array);CHKERRQ(ierr); 34843b03a366Sstefano_zampini ierr = MatSetValues(M1,n_constraints,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr); 34850c7d97c5SJed Brown ierr = VecRestoreArray(vec2_C,&array);CHKERRQ(ierr); 34860c7d97c5SJed Brown } 34870c7d97c5SJed Brown ierr = MatAssemblyBegin(M1,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 34880c7d97c5SJed Brown ierr = MatAssemblyEnd(M1,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 34890c7d97c5SJed Brown ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr); 34900c7d97c5SJed Brown /* Assemble local_auxmat1 = M1*C_{CR} needed by BDDC application in KSP and in preproc */ 34910c7d97c5SJed Brown ierr = MatMatMult(M1,C_CR,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&pcbddc->local_auxmat1);CHKERRQ(ierr); 34920c7d97c5SJed Brown 34930c7d97c5SJed Brown } 34940c7d97c5SJed Brown 34950c7d97c5SJed Brown /* Get submatrices from subdomain matrix */ 34963b03a366Sstefano_zampini if (n_vertices) { 3497534831adSStefano 
Zampini ierr = MatGetSubMatrix(pcbddc->local_mat,is_R_local,is_V_local,MAT_INITIAL_MATRIX,&A_RV);CHKERRQ(ierr); 3498534831adSStefano Zampini ierr = MatGetSubMatrix(pcbddc->local_mat,is_V_local,is_R_local,MAT_INITIAL_MATRIX,&A_VR);CHKERRQ(ierr); 3499534831adSStefano Zampini ierr = MatGetSubMatrix(pcbddc->local_mat,is_V_local,is_V_local,MAT_INITIAL_MATRIX,&A_VV);CHKERRQ(ierr); 35000c7d97c5SJed Brown } 35010c7d97c5SJed Brown 35020c7d97c5SJed Brown /* Matrix of coarse basis functions (local) */ 3503d49ef151SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->coarse_phi_B);CHKERRQ(ierr); 35040c7d97c5SJed Brown ierr = MatSetSizes(pcbddc->coarse_phi_B,n_B,pcbddc->local_primal_size,n_B,pcbddc->local_primal_size);CHKERRQ(ierr); 35050c7d97c5SJed Brown ierr = MatSetType(pcbddc->coarse_phi_B,impMatType);CHKERRQ(ierr); 35063b03a366Sstefano_zampini ierr = MatSeqDenseSetPreallocation(pcbddc->coarse_phi_B,PETSC_NULL);CHKERRQ(ierr); 350729622bf0SStefano Zampini if (pcbddc->inexact_prec_type || dbg_flag) { 3508d49ef151SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->coarse_phi_D);CHKERRQ(ierr); 35090c7d97c5SJed Brown ierr = MatSetSizes(pcbddc->coarse_phi_D,n_D,pcbddc->local_primal_size,n_D,pcbddc->local_primal_size);CHKERRQ(ierr); 35100c7d97c5SJed Brown ierr = MatSetType(pcbddc->coarse_phi_D,impMatType);CHKERRQ(ierr); 35113b03a366Sstefano_zampini ierr = MatSeqDenseSetPreallocation(pcbddc->coarse_phi_D,PETSC_NULL);CHKERRQ(ierr); 35120c7d97c5SJed Brown } 35130c7d97c5SJed Brown 3514e269702eSStefano Zampini if (dbg_flag) { 35150c7d97c5SJed Brown ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscScalar),&coarsefunctions_errors);CHKERRQ(ierr); 35160c7d97c5SJed Brown ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscScalar),&constraints_errors);CHKERRQ(ierr); 35170c7d97c5SJed Brown } 35183b03a366Sstefano_zampini /* Subdomain contribution (Non-overlapping) to coarse matrix */ 35190c7d97c5SJed Brown ierr = PetscMalloc 
((pcbddc->local_primal_size)*(pcbddc->local_primal_size)*sizeof(PetscScalar),&coarse_submat_vals);CHKERRQ(ierr); 35200c7d97c5SJed Brown 35210c7d97c5SJed Brown /* We are now ready to evaluate coarse basis functions and subdomain contribution to coarse problem */ 35223b03a366Sstefano_zampini for (i=0; i<n_vertices; i++) { 35230c7d97c5SJed Brown ierr = VecSet(vec1_V,zero);CHKERRQ(ierr); 35240c7d97c5SJed Brown ierr = VecSetValue(vec1_V,i,one,INSERT_VALUES);CHKERRQ(ierr); 35250c7d97c5SJed Brown ierr = VecAssemblyBegin(vec1_V);CHKERRQ(ierr); 35260c7d97c5SJed Brown ierr = VecAssemblyEnd(vec1_V);CHKERRQ(ierr); 35270c7d97c5SJed Brown /* solution of saddle point problem */ 35280bdf917eSStefano Zampini ierr = MatMult(A_RV,vec1_V,pcbddc->vec1_R);CHKERRQ(ierr); 35290bdf917eSStefano Zampini ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec1_R);CHKERRQ(ierr); 35300c7d97c5SJed Brown ierr = VecScale(pcbddc->vec1_R,m_one);CHKERRQ(ierr); 35313b03a366Sstefano_zampini if (n_constraints) { 35320c7d97c5SJed Brown ierr = MatMult(pcbddc->local_auxmat1,pcbddc->vec1_R,vec1_C);CHKERRQ(ierr); 35330c7d97c5SJed Brown ierr = MatMultAdd(pcbddc->local_auxmat2,vec1_C,pcbddc->vec1_R,pcbddc->vec1_R);CHKERRQ(ierr); 35340c7d97c5SJed Brown ierr = VecScale(vec1_C,m_one);CHKERRQ(ierr); 35350c7d97c5SJed Brown } 35360c7d97c5SJed Brown ierr = MatMult(A_VR,pcbddc->vec1_R,vec2_V);CHKERRQ(ierr); 35370c7d97c5SJed Brown ierr = MatMultAdd(A_VV,vec1_V,vec2_V,vec2_V);CHKERRQ(ierr); 35380c7d97c5SJed Brown 35390c7d97c5SJed Brown /* Set values in coarse basis function and subdomain part of coarse_mat */ 35400c7d97c5SJed Brown /* coarse basis functions */ 35410c7d97c5SJed Brown ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr); 35420c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 35430c7d97c5SJed Brown ierr = VecScatterEnd (pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 35440c7d97c5SJed Brown 
ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr); 35453b03a366Sstefano_zampini ierr = MatSetValues(pcbddc->coarse_phi_B,n_B,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr); 35460c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr); 35470c7d97c5SJed Brown ierr = MatSetValue(pcbddc->coarse_phi_B,idx_V_B[i],i,one,INSERT_VALUES);CHKERRQ(ierr); 354829622bf0SStefano Zampini if (pcbddc->inexact_prec_type || dbg_flag) { 35490c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 35500c7d97c5SJed Brown ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 35510c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_D,&array);CHKERRQ(ierr); 35523b03a366Sstefano_zampini ierr = MatSetValues(pcbddc->coarse_phi_D,n_D,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr); 35530c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_D,&array);CHKERRQ(ierr); 35540c7d97c5SJed Brown } 35550c7d97c5SJed Brown /* subdomain contribution to coarse matrix */ 35560c7d97c5SJed Brown ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr); 35572fa5cd67SKarl Rupp for (j=0; j<n_vertices; j++) coarse_submat_vals[i*pcbddc->local_primal_size+j] = array[j]; /* WARNING -> column major ordering */ 35580c7d97c5SJed Brown ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr); 35593b03a366Sstefano_zampini if (n_constraints) { 35600c7d97c5SJed Brown ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr); 35612fa5cd67SKarl Rupp for (j=0; j<n_constraints; j++) coarse_submat_vals[i*pcbddc->local_primal_size+j+n_vertices] = array[j]; /* WARNING -> column major ordering */ 35620c7d97c5SJed Brown ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr); 35630c7d97c5SJed Brown } 35640c7d97c5SJed Brown 3565e269702eSStefano Zampini if (dbg_flag) { 35660c7d97c5SJed Brown /* assemble subdomain vector on nodes */ 3567d49ef151SStefano Zampini ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr); 
35680c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 35690c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr); 35702fa5cd67SKarl Rupp for (j=0;j<n_R;j++) array[idx_R_local[j]] = array2[j]; 35713b03a366Sstefano_zampini array[vertices[i]] = one; 35720c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr); 35730c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 35742fa5cd67SKarl Rupp 35750c7d97c5SJed Brown /* assemble subdomain vector of lagrange multipliers (i.e. primal nodes) */ 3576d49ef151SStefano Zampini ierr = VecSet(pcbddc->vec1_P,zero);CHKERRQ(ierr); 35770c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr); 35780c7d97c5SJed Brown ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr); 35792fa5cd67SKarl Rupp for (j=0;j<n_vertices;j++) array2[j]=array[j]; 35800c7d97c5SJed Brown ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr); 35813b03a366Sstefano_zampini if (n_constraints) { 35820c7d97c5SJed Brown ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr); 35832fa5cd67SKarl Rupp for (j=0;j<n_constraints;j++) array2[j+n_vertices]=array[j]; 35840c7d97c5SJed Brown ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr); 35850c7d97c5SJed Brown } 35860c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr); 35870c7d97c5SJed Brown ierr = VecScale(pcbddc->vec1_P,m_one);CHKERRQ(ierr); 35882fa5cd67SKarl Rupp 35890c7d97c5SJed Brown /* check saddle point solution */ 3590534831adSStefano Zampini ierr = MatMult(pcbddc->local_mat,pcis->vec1_N,pcis->vec2_N);CHKERRQ(ierr); 35913b03a366Sstefano_zampini ierr = MatMultTransposeAdd(pcbddc->ConstraintMatrix,pcbddc->vec1_P,pcis->vec2_N,pcis->vec2_N);CHKERRQ(ierr); 35923b03a366Sstefano_zampini ierr = VecNorm(pcis->vec2_N,NORM_INFINITY,&coarsefunctions_errors[i]);CHKERRQ(ierr); 35933b03a366Sstefano_zampini ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr); 35940c7d97c5SJed Brown 
ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 35953b03a366Sstefano_zampini array[i]=array[i]+m_one; /* shift by the identity matrix */ 35960c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 35973b03a366Sstefano_zampini ierr = VecNorm(pcbddc->vec1_P,NORM_INFINITY,&constraints_errors[i]);CHKERRQ(ierr); 35980c7d97c5SJed Brown } 35990c7d97c5SJed Brown } 36000c7d97c5SJed Brown 36013b03a366Sstefano_zampini for (i=0; i<n_constraints; i++) { 3602d49ef151SStefano Zampini ierr = VecSet(vec2_C,zero);CHKERRQ(ierr); 36030c7d97c5SJed Brown ierr = VecSetValue(vec2_C,i,m_one,INSERT_VALUES);CHKERRQ(ierr); 36040c7d97c5SJed Brown ierr = VecAssemblyBegin(vec2_C);CHKERRQ(ierr); 36050c7d97c5SJed Brown ierr = VecAssemblyEnd(vec2_C);CHKERRQ(ierr); 36062fa5cd67SKarl Rupp 36070c7d97c5SJed Brown /* solution of saddle point problem */ 36080c7d97c5SJed Brown ierr = MatMult(M1,vec2_C,vec1_C);CHKERRQ(ierr); 36090c7d97c5SJed Brown ierr = MatMult(pcbddc->local_auxmat2,vec1_C,pcbddc->vec1_R);CHKERRQ(ierr); 36100c7d97c5SJed Brown ierr = VecScale(vec1_C,m_one);CHKERRQ(ierr); 36113b03a366Sstefano_zampini if (n_vertices) { ierr = MatMult(A_VR,pcbddc->vec1_R,vec2_V);CHKERRQ(ierr); } 36122fa5cd67SKarl Rupp 36130c7d97c5SJed Brown /* Set values in coarse basis function and subdomain part of coarse_mat */ 36140c7d97c5SJed Brown /* coarse basis functions */ 36153b03a366Sstefano_zampini index=i+n_vertices; 36160c7d97c5SJed Brown ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr); 36170c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 36180c7d97c5SJed Brown ierr = VecScatterEnd (pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 36190c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr); 362053cdbc3dSStefano Zampini ierr = MatSetValues(pcbddc->coarse_phi_B,n_B,auxindices,1,&index,array,INSERT_VALUES);CHKERRQ(ierr); 36210c7d97c5SJed Brown 
ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr); 362229622bf0SStefano Zampini if (pcbddc->inexact_prec_type || dbg_flag) { 36230c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 36240c7d97c5SJed Brown ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 36250c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_D,&array);CHKERRQ(ierr); 362653cdbc3dSStefano Zampini ierr = MatSetValues(pcbddc->coarse_phi_D,n_D,auxindices,1,&index,array,INSERT_VALUES);CHKERRQ(ierr); 36270c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_D,&array);CHKERRQ(ierr); 36280c7d97c5SJed Brown } 36292fa5cd67SKarl Rupp 36300c7d97c5SJed Brown /* subdomain contribution to coarse matrix */ 36313b03a366Sstefano_zampini if (n_vertices) { 36320c7d97c5SJed Brown ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr); 36332fa5cd67SKarl Rupp for (j=0; j<n_vertices; j++) coarse_submat_vals[index*pcbddc->local_primal_size+j]=array[j]; /* WARNING -> column major ordering */ 36340c7d97c5SJed Brown ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr); 36350c7d97c5SJed Brown } 36360c7d97c5SJed Brown ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr); 36372fa5cd67SKarl Rupp for (j=0; j<n_constraints; j++) coarse_submat_vals[index*pcbddc->local_primal_size+j+n_vertices]=array[j]; /* WARNING -> column major ordering */ 36380c7d97c5SJed Brown ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr); 36390c7d97c5SJed Brown 3640e269702eSStefano Zampini if (dbg_flag) { 36410c7d97c5SJed Brown /* assemble subdomain vector on nodes */ 364253cdbc3dSStefano Zampini ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr); 36430c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 36440c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr); 36452fa5cd67SKarl Rupp for (j=0;j<n_R;j++) array[idx_R_local[j]] = array2[j]; 36460c7d97c5SJed Brown ierr = 
VecRestoreArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr); 36470c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 36482fa5cd67SKarl Rupp 36490c7d97c5SJed Brown /* assemble subdomain vector of lagrange multipliers */ 365053cdbc3dSStefano Zampini ierr = VecSet(pcbddc->vec1_P,zero);CHKERRQ(ierr); 36510c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr); 36523b03a366Sstefano_zampini if (n_vertices) { 36530c7d97c5SJed Brown ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr); 36542fa5cd67SKarl Rupp for (j=0;j<n_vertices;j++) array2[j]=-array[j]; 36550c7d97c5SJed Brown ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr); 36560c7d97c5SJed Brown } 36570c7d97c5SJed Brown ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr); 36583b03a366Sstefano_zampini for (j=0;j<n_constraints;j++) {array2[j+n_vertices]=-array[j];} 36590c7d97c5SJed Brown ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr); 36600c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr); 36612fa5cd67SKarl Rupp 36623972b0daSStefano Zampini /* check saddle point solution */ 3663534831adSStefano Zampini ierr = MatMult(pcbddc->local_mat,pcis->vec1_N,pcis->vec2_N);CHKERRQ(ierr); 36643b03a366Sstefano_zampini ierr = MatMultTransposeAdd(pcbddc->ConstraintMatrix,pcbddc->vec1_P,pcis->vec2_N,pcis->vec2_N);CHKERRQ(ierr); 366553cdbc3dSStefano Zampini ierr = VecNorm(pcis->vec2_N,NORM_INFINITY,&coarsefunctions_errors[index]);CHKERRQ(ierr); 36663b03a366Sstefano_zampini ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr); 36670c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 366853cdbc3dSStefano Zampini array[index] = array[index]+m_one; /* shift by the identity matrix */ 36690c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 367053cdbc3dSStefano Zampini ierr = VecNorm(pcbddc->vec1_P,NORM_INFINITY,&constraints_errors[index]);CHKERRQ(ierr); 36710c7d97c5SJed Brown } 36720c7d97c5SJed 
Brown } 36730c7d97c5SJed Brown ierr = MatAssemblyBegin(pcbddc->coarse_phi_B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 36740c7d97c5SJed Brown ierr = MatAssemblyEnd (pcbddc->coarse_phi_B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 367529622bf0SStefano Zampini if (pcbddc->inexact_prec_type || dbg_flag) { 36760c7d97c5SJed Brown ierr = MatAssemblyBegin(pcbddc->coarse_phi_D,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 36770c7d97c5SJed Brown ierr = MatAssemblyEnd (pcbddc->coarse_phi_D,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 36780c7d97c5SJed Brown } 36790c7d97c5SJed Brown /* Checking coarse_sub_mat and coarse basis functios */ 36800c7d97c5SJed Brown /* It shuld be \Phi^{(j)^T} A^{(j)} \Phi^{(j)}=coarse_sub_mat */ 36819d2fce94SStefano Zampini if (dbg_flag) { 36820c7d97c5SJed Brown Mat coarse_sub_mat; 36830c7d97c5SJed Brown Mat TM1,TM2,TM3,TM4; 36840c7d97c5SJed Brown Mat coarse_phi_D,coarse_phi_B,A_II,A_BB,A_IB,A_BI; 368519fd82e9SBarry Smith MatType checkmattype=MATSEQAIJ; 36860c7d97c5SJed Brown PetscScalar value; 36870c7d97c5SJed Brown 3688c042a7c3SStefano Zampini ierr = MatConvert(pcis->A_II,checkmattype,MAT_INITIAL_MATRIX,&A_II);CHKERRQ(ierr); 3689c042a7c3SStefano Zampini ierr = MatConvert(pcis->A_IB,checkmattype,MAT_INITIAL_MATRIX,&A_IB);CHKERRQ(ierr); 3690c042a7c3SStefano Zampini ierr = MatConvert(pcis->A_BI,checkmattype,MAT_INITIAL_MATRIX,&A_BI);CHKERRQ(ierr); 3691c042a7c3SStefano Zampini ierr = MatConvert(pcis->A_BB,checkmattype,MAT_INITIAL_MATRIX,&A_BB);CHKERRQ(ierr); 3692c042a7c3SStefano Zampini ierr = MatConvert(pcbddc->coarse_phi_D,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_D);CHKERRQ(ierr); 3693c042a7c3SStefano Zampini ierr = MatConvert(pcbddc->coarse_phi_B,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_B);CHKERRQ(ierr); 3694c042a7c3SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_size,coarse_submat_vals,&coarse_sub_mat);CHKERRQ(ierr); 3695c042a7c3SStefano Zampini ierr = 
MatConvert(coarse_sub_mat,checkmattype,MAT_REUSE_MATRIX,&coarse_sub_mat);CHKERRQ(ierr); 36960c7d97c5SJed Brown 36970c7d97c5SJed Brown ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr); 36980c7d97c5SJed Brown ierr = PetscViewerASCIIPrintf(viewer,"Check coarse sub mat and local basis functions\n");CHKERRQ(ierr); 36990c7d97c5SJed Brown ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 370053cdbc3dSStefano Zampini ierr = MatPtAP(A_II,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&TM1);CHKERRQ(ierr); 370153cdbc3dSStefano Zampini ierr = MatPtAP(A_BB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&TM2);CHKERRQ(ierr); 370253cdbc3dSStefano Zampini ierr = MatMatMult(A_IB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr); 3703c042a7c3SStefano Zampini ierr = MatTransposeMatMult(coarse_phi_D,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM3);CHKERRQ(ierr); 370453cdbc3dSStefano Zampini ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr); 370553cdbc3dSStefano Zampini ierr = MatMatMult(A_BI,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr); 3706c042a7c3SStefano Zampini ierr = MatTransposeMatMult(coarse_phi_B,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM4);CHKERRQ(ierr); 370753cdbc3dSStefano Zampini ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr); 370853cdbc3dSStefano Zampini ierr = MatAXPY(TM1,one,TM2,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr); 370953cdbc3dSStefano Zampini ierr = MatAXPY(TM1,one,TM3,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr); 371053cdbc3dSStefano Zampini ierr = MatAXPY(TM1,one,TM4,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr); 371153cdbc3dSStefano Zampini ierr = MatAXPY(TM1,m_one,coarse_sub_mat,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr); 371253cdbc3dSStefano Zampini ierr = MatNorm(TM1,NORM_INFINITY,&value);CHKERRQ(ierr); 37130c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"----------------------------------\n");CHKERRQ(ierr); 37140c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d \n",PetscGlobalRank);CHKERRQ(ierr); 
37150c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"matrix error = % 1.14e\n",value);CHKERRQ(ierr); 37160c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"coarse functions errors\n");CHKERRQ(ierr); 371753cdbc3dSStefano Zampini for (i=0; i<pcbddc->local_primal_size; i++) { ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local %02d-th function error = % 1.14e\n",i,coarsefunctions_errors[i]);CHKERRQ(ierr); } 37180c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"constraints errors\n");CHKERRQ(ierr); 371953cdbc3dSStefano Zampini for (i=0; i<pcbddc->local_primal_size; i++) { ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local %02d-th function error = % 1.14e\n",i,constraints_errors[i]);CHKERRQ(ierr); } 37200c7d97c5SJed Brown ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 372153cdbc3dSStefano Zampini ierr = MatDestroy(&A_II);CHKERRQ(ierr); 372253cdbc3dSStefano Zampini ierr = MatDestroy(&A_BB);CHKERRQ(ierr); 372353cdbc3dSStefano Zampini ierr = MatDestroy(&A_IB);CHKERRQ(ierr); 372453cdbc3dSStefano Zampini ierr = MatDestroy(&A_BI);CHKERRQ(ierr); 372553cdbc3dSStefano Zampini ierr = MatDestroy(&TM1);CHKERRQ(ierr); 372653cdbc3dSStefano Zampini ierr = MatDestroy(&TM2);CHKERRQ(ierr); 372753cdbc3dSStefano Zampini ierr = MatDestroy(&TM3);CHKERRQ(ierr); 372853cdbc3dSStefano Zampini ierr = MatDestroy(&TM4);CHKERRQ(ierr); 372953cdbc3dSStefano Zampini ierr = MatDestroy(&coarse_phi_D);CHKERRQ(ierr); 373053cdbc3dSStefano Zampini ierr = MatDestroy(&coarse_sub_mat);CHKERRQ(ierr); 373153cdbc3dSStefano Zampini ierr = MatDestroy(&coarse_phi_B);CHKERRQ(ierr); 37320c7d97c5SJed Brown ierr = PetscFree(coarsefunctions_errors);CHKERRQ(ierr); 37330c7d97c5SJed Brown ierr = PetscFree(constraints_errors);CHKERRQ(ierr); 37340c7d97c5SJed Brown } 37350c7d97c5SJed Brown /* free memory */ 37363b03a366Sstefano_zampini if (n_vertices) { 37370c7d97c5SJed Brown ierr = VecDestroy(&vec1_V);CHKERRQ(ierr); 37380c7d97c5SJed Brown ierr = 
VecDestroy(&vec2_V);CHKERRQ(ierr); 37390c7d97c5SJed Brown ierr = MatDestroy(&A_RV);CHKERRQ(ierr); 37400c7d97c5SJed Brown ierr = MatDestroy(&A_VR);CHKERRQ(ierr); 37410c7d97c5SJed Brown ierr = MatDestroy(&A_VV);CHKERRQ(ierr); 37420c7d97c5SJed Brown } 3743534831adSStefano Zampini if (n_constraints) { 37440c7d97c5SJed Brown ierr = VecDestroy(&vec1_C);CHKERRQ(ierr); 37450c7d97c5SJed Brown ierr = VecDestroy(&vec2_C);CHKERRQ(ierr); 37460c7d97c5SJed Brown ierr = MatDestroy(&M1);CHKERRQ(ierr); 37470c7d97c5SJed Brown ierr = MatDestroy(&C_CR);CHKERRQ(ierr); 37480c7d97c5SJed Brown } 3749a929c220SStefano Zampini ierr = PetscFree(auxindices);CHKERRQ(ierr); 3750a929c220SStefano Zampini ierr = PetscFree(nnz);CHKERRQ(ierr); 3751a929c220SStefano Zampini /* create coarse matrix and data structures for message passing associated actual choice of coarse problem type */ 3752a929c220SStefano Zampini ierr = PCBDDCSetupCoarseEnvironment(pc,coarse_submat_vals);CHKERRQ(ierr); 3753a929c220SStefano Zampini ierr = PetscFree(coarse_submat_vals);CHKERRQ(ierr); 37540c7d97c5SJed Brown } 37550c7d97c5SJed Brown /* free memory */ 37563b03a366Sstefano_zampini if (n_vertices) { 37570c7d97c5SJed Brown ierr = PetscFree(idx_V_B);CHKERRQ(ierr); 37580c7d97c5SJed Brown ierr = ISDestroy(&is_V_local);CHKERRQ(ierr); 37590c7d97c5SJed Brown } 37600c7d97c5SJed Brown ierr = ISDestroy(&is_R_local);CHKERRQ(ierr); 37610c7d97c5SJed Brown PetscFunctionReturn(0); 37620c7d97c5SJed Brown } 37630c7d97c5SJed Brown 37640c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 37650c7d97c5SJed Brown 37660c7d97c5SJed Brown #undef __FUNCT__ 37670c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetupCoarseEnvironment" 376853cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetupCoarseEnvironment(PC pc,PetscScalar* coarse_submat_vals) 37690c7d97c5SJed Brown { 37700c7d97c5SJed Brown Mat_IS *matis = (Mat_IS*)pc->pmat->data; 37710c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 
37720c7d97c5SJed Brown PC_IS *pcis = (PC_IS*)pc->data; 37730c7d97c5SJed Brown MPI_Comm prec_comm = ((PetscObject)pc)->comm; 37740c7d97c5SJed Brown MPI_Comm coarse_comm; 37750c7d97c5SJed Brown 37760c7d97c5SJed Brown /* common to all choiches */ 37770c7d97c5SJed Brown PetscScalar *temp_coarse_mat_vals; 37780c7d97c5SJed Brown PetscScalar *ins_coarse_mat_vals; 37790c7d97c5SJed Brown PetscInt *ins_local_primal_indices; 37800c7d97c5SJed Brown PetscMPIInt *localsizes2,*localdispl2; 37810c7d97c5SJed Brown PetscMPIInt size_prec_comm; 37820c7d97c5SJed Brown PetscMPIInt rank_prec_comm; 37830c7d97c5SJed Brown PetscMPIInt active_rank=MPI_PROC_NULL; 37840c7d97c5SJed Brown PetscMPIInt master_proc=0; 37850c7d97c5SJed Brown PetscInt ins_local_primal_size; 37862fa5cd67SKarl Rupp 37870c7d97c5SJed Brown /* specific to MULTILEVEL_BDDC */ 37880c7d97c5SJed Brown PetscMPIInt *ranks_recv; 37890c7d97c5SJed Brown PetscMPIInt count_recv=0; 37900c7d97c5SJed Brown PetscMPIInt rank_coarse_proc_send_to; 37910c7d97c5SJed Brown PetscMPIInt coarse_color = MPI_UNDEFINED; 37920c7d97c5SJed Brown ISLocalToGlobalMapping coarse_ISLG; 37932fa5cd67SKarl Rupp 37940c7d97c5SJed Brown /* some other variables */ 37950c7d97c5SJed Brown PetscErrorCode ierr; 379619fd82e9SBarry Smith MatType coarse_mat_type; 379719fd82e9SBarry Smith PCType coarse_pc_type; 379819fd82e9SBarry Smith KSPType coarse_ksp_type; 379953cdbc3dSStefano Zampini PC pc_temp; 38004fad6a16SStefano Zampini PetscInt i,j,k; 38013b03a366Sstefano_zampini PetscInt max_it_coarse_ksp=1; /* don't increase this value */ 38022fa5cd67SKarl Rupp 3803e269702eSStefano Zampini /* verbose output viewer */ 3804e269702eSStefano Zampini PetscViewer viewer = pcbddc->dbg_viewer; 3805e269702eSStefano Zampini PetscBool dbg_flag = pcbddc->dbg_flag; 3806142dfd88SStefano Zampini 3807ea7e1babSStefano Zampini PetscInt offset,offset2; 3808a929c220SStefano Zampini PetscMPIInt im_active,active_procs; 3809523858cfSStefano Zampini PetscInt *dnz,*onz; 3810142dfd88SStefano Zampini 
3811142dfd88SStefano Zampini PetscBool setsym,issym=PETSC_FALSE; 38120c7d97c5SJed Brown 38130c7d97c5SJed Brown PetscFunctionBegin; 38140c7d97c5SJed Brown ins_local_primal_indices = 0; 38150c7d97c5SJed Brown ins_coarse_mat_vals = 0; 38160c7d97c5SJed Brown localsizes2 = 0; 38170c7d97c5SJed Brown localdispl2 = 0; 38180c7d97c5SJed Brown temp_coarse_mat_vals = 0; 38190c7d97c5SJed Brown coarse_ISLG = 0; 38200c7d97c5SJed Brown 382153cdbc3dSStefano Zampini ierr = MPI_Comm_size(prec_comm,&size_prec_comm);CHKERRQ(ierr); 382253cdbc3dSStefano Zampini ierr = MPI_Comm_rank(prec_comm,&rank_prec_comm);CHKERRQ(ierr); 3823142dfd88SStefano Zampini ierr = MatIsSymmetricKnown(pc->pmat,&setsym,&issym);CHKERRQ(ierr); 3824142dfd88SStefano Zampini 3825beed3852SStefano Zampini /* Assign global numbering to coarse dofs */ 3826beed3852SStefano Zampini { 3827ef028eecSStefano Zampini PetscInt *auxlocal_primal; 3828da1bb401SStefano Zampini PetscInt *row_cmat_indices; 38292e8d2280SStefano Zampini PetscInt *aux_ordering; 38302e8d2280SStefano Zampini PetscInt *row_cmat_global_indices; 3831ef028eecSStefano Zampini PetscInt *dof_sizes,*dof_displs; 38323b03a366Sstefano_zampini PetscInt size_of_constraint; 38332e8d2280SStefano Zampini PetscBool *array_bool; 3834ef028eecSStefano Zampini PetscBool first_found; 3835ef028eecSStefano Zampini PetscInt first_index,old_index,s; 3836ef028eecSStefano Zampini PetscMPIInt mpi_local_primal_size; 3837ef028eecSStefano Zampini PetscScalar coarsesum,*array; 3838ef028eecSStefano Zampini 3839ef028eecSStefano Zampini mpi_local_primal_size = (PetscMPIInt)pcbddc->local_primal_size; 3840beed3852SStefano Zampini 3841beed3852SStefano Zampini /* Construct needed data structures for message passing */ 3842ef028eecSStefano Zampini ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscInt),&pcbddc->local_primal_indices);CHKERRQ(ierr); 3843ffe5efe1SStefano Zampini j = 0; 3844142dfd88SStefano Zampini if (rank_prec_comm == 0 || pcbddc->coarse_problem_type == REPLICATED_BDDC || 
pcbddc->coarse_problem_type == MULTILEVEL_BDDC) { 3845ffe5efe1SStefano Zampini j = size_prec_comm; 3846ffe5efe1SStefano Zampini } 3847ffe5efe1SStefano Zampini ierr = PetscMalloc(j*sizeof(PetscMPIInt),&pcbddc->local_primal_sizes);CHKERRQ(ierr); 3848ffe5efe1SStefano Zampini ierr = PetscMalloc(j*sizeof(PetscMPIInt),&pcbddc->local_primal_displacements);CHKERRQ(ierr); 3849beed3852SStefano Zampini /* Gather local_primal_size information for all processes */ 3850142dfd88SStefano Zampini if (pcbddc->coarse_problem_type == REPLICATED_BDDC || pcbddc->coarse_problem_type == MULTILEVEL_BDDC) { 38515619798eSStefano Zampini ierr = MPI_Allgather(&mpi_local_primal_size,1,MPIU_INT,&pcbddc->local_primal_sizes[0],1,MPIU_INT,prec_comm);CHKERRQ(ierr); 3852ffe5efe1SStefano Zampini } else { 3853ffe5efe1SStefano Zampini ierr = MPI_Gather(&mpi_local_primal_size,1,MPIU_INT,&pcbddc->local_primal_sizes[0],1,MPIU_INT,0,prec_comm);CHKERRQ(ierr); 3854ffe5efe1SStefano Zampini } 3855beed3852SStefano Zampini pcbddc->replicated_primal_size = 0; 3856ffe5efe1SStefano Zampini for (i=0; i<j; i++) { 3857beed3852SStefano Zampini pcbddc->local_primal_displacements[i] = pcbddc->replicated_primal_size; 3858beed3852SStefano Zampini pcbddc->replicated_primal_size += pcbddc->local_primal_sizes[i]; 3859beed3852SStefano Zampini } 3860beed3852SStefano Zampini 3861da1bb401SStefano Zampini /* First let's count coarse dofs. 
3862beed3852SStefano Zampini This code fragment assumes that the number of local constraints per connected component 3863beed3852SStefano Zampini is not greater than the number of nodes defined for the connected component 3864beed3852SStefano Zampini (otherwise we will surely have linear dependence between constraints and thus a singular coarse problem) */ 3865ef028eecSStefano Zampini ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscInt),&auxlocal_primal);CHKERRQ(ierr); 38662e8d2280SStefano Zampini j = 0; 38672e8d2280SStefano Zampini for (i=0; i<pcbddc->local_primal_size; i++) { 38682e8d2280SStefano Zampini ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr); 38692fa5cd67SKarl Rupp if (j < size_of_constraint) j = size_of_constraint; 38702e8d2280SStefano Zampini ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr); 38712e8d2280SStefano Zampini } 38722e8d2280SStefano Zampini ierr = PetscMalloc(j*sizeof(PetscInt),&aux_ordering);CHKERRQ(ierr); 38732e8d2280SStefano Zampini ierr = PetscMalloc(j*sizeof(PetscInt),&row_cmat_global_indices);CHKERRQ(ierr); 38742e8d2280SStefano Zampini ierr = PetscMalloc(pcis->n*sizeof(PetscBool),&array_bool);CHKERRQ(ierr); 38752fa5cd67SKarl Rupp for (i=0;i<pcis->n;i++) array_bool[i] = PETSC_FALSE; 38762fa5cd67SKarl Rupp 3877da1bb401SStefano Zampini for (i=0;i<pcbddc->local_primal_size;i++) { 3878da1bb401SStefano Zampini ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr); 38792fa5cd67SKarl Rupp for (j=0; j<size_of_constraint; j++) aux_ordering[j] = j; 38802fa5cd67SKarl Rupp 38812e8d2280SStefano Zampini ierr = ISLocalToGlobalMappingApply(matis->mapping,size_of_constraint,row_cmat_indices,row_cmat_global_indices);CHKERRQ(ierr); 38822e8d2280SStefano Zampini ierr = PetscSortIntWithPermutation(size_of_constraint,row_cmat_global_indices,aux_ordering);CHKERRQ(ierr); 
38832e8d2280SStefano Zampini for (j=0; j<size_of_constraint; j++) { 38842e8d2280SStefano Zampini k = row_cmat_indices[aux_ordering[j]]; 38852e8d2280SStefano Zampini if (!array_bool[k]) { 38862e8d2280SStefano Zampini array_bool[k] = PETSC_TRUE; 3887da1bb401SStefano Zampini auxlocal_primal[i] = k; 3888beed3852SStefano Zampini break; 3889beed3852SStefano Zampini } 3890beed3852SStefano Zampini } 3891da1bb401SStefano Zampini ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr); 3892beed3852SStefano Zampini } 38932e8d2280SStefano Zampini ierr = PetscFree(aux_ordering);CHKERRQ(ierr); 3894ef028eecSStefano Zampini ierr = PetscFree(array_bool);CHKERRQ(ierr); 3895ef028eecSStefano Zampini ierr = PetscFree(row_cmat_global_indices);CHKERRQ(ierr); 38962e8d2280SStefano Zampini 3897ef028eecSStefano Zampini /* Compute number of coarse dofs */ 3898ef028eecSStefano Zampini ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr); 3899ef028eecSStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 39002fa5cd67SKarl Rupp for (i=0;i<pcbddc->local_primal_size;i++) array[auxlocal_primal[i]] = 1.0; 3901ef028eecSStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 3902ef028eecSStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 3903ef028eecSStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 3904ef028eecSStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 3905ef028eecSStefano Zampini ierr = VecSum(pcis->vec1_global,&coarsesum);CHKERRQ(ierr); 3906ef028eecSStefano Zampini pcbddc->coarse_size = (PetscInt)coarsesum; 3907ef028eecSStefano Zampini 3908ef028eecSStefano Zampini /* Fill pcis->vec1_global with cumulative function for global numbering */ 3909ef028eecSStefano Zampini ierr = 
VecGetArray(pcis->vec1_global,&array);CHKERRQ(ierr); 3910ef028eecSStefano Zampini ierr = VecGetLocalSize(pcis->vec1_global,&s);CHKERRQ(ierr); 3911ef028eecSStefano Zampini k = 0; 3912ef028eecSStefano Zampini first_index = -1; 3913ef028eecSStefano Zampini first_found = PETSC_FALSE; 3914ef028eecSStefano Zampini for (i=0; i<s; i++) { 3915ef028eecSStefano Zampini if (!first_found && array[i] > 0.0) { 3916ef028eecSStefano Zampini first_found = PETSC_TRUE; 3917ef028eecSStefano Zampini first_index = i; 3918ef028eecSStefano Zampini } 3919ef028eecSStefano Zampini k += (PetscInt)array[i]; 3920ef028eecSStefano Zampini } 3921ef028eecSStefano Zampini j = (!rank_prec_comm ? size_prec_comm : 0); 3922ef028eecSStefano Zampini ierr = PetscMalloc(j*sizeof(*dof_sizes),&dof_sizes);CHKERRQ(ierr); 3923ef028eecSStefano Zampini ierr = PetscMalloc(j*sizeof(*dof_displs),&dof_displs);CHKERRQ(ierr); 3924ef028eecSStefano Zampini ierr = MPI_Gather(&k,1,MPIU_INT,dof_sizes,1,MPIU_INT,0,prec_comm);CHKERRQ(ierr); 3925ef028eecSStefano Zampini if (!rank_prec_comm) { 3926ef028eecSStefano Zampini dof_displs[0]=0; 39272fa5cd67SKarl Rupp for (i=1;i<size_prec_comm;i++) dof_displs[i] = dof_displs[i-1]+dof_sizes[i-1]; 3928ef028eecSStefano Zampini } 3929ef028eecSStefano Zampini ierr = MPI_Scatter(dof_displs,1,MPIU_INT,&k,1,MPIU_INT,0,prec_comm);CHKERRQ(ierr); 3930ef028eecSStefano Zampini if (first_found) { 3931ef028eecSStefano Zampini array[first_index] += k; 3932ef028eecSStefano Zampini old_index = first_index; 3933ef028eecSStefano Zampini for (i=first_index+1;i<s;i++) { 3934ef028eecSStefano Zampini if (array[i] > 0.0) { 3935ef028eecSStefano Zampini array[i] += array[old_index]; 3936ef028eecSStefano Zampini old_index = i; 3937ef028eecSStefano Zampini } 3938ef028eecSStefano Zampini } 3939ef028eecSStefano Zampini } 3940ef028eecSStefano Zampini ierr = VecRestoreArray(pcis->vec1_global,&array);CHKERRQ(ierr); 3941ef028eecSStefano Zampini ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr); 3942ef028eecSStefano Zampini 
ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 3943ef028eecSStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 3944ef028eecSStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 39452fa5cd67SKarl Rupp for (i=0;i<pcbddc->local_primal_size;i++) pcbddc->local_primal_indices[i] = (PetscInt)array[auxlocal_primal[i]]-1; 3946ef028eecSStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 3947ef028eecSStefano Zampini ierr = PetscFree(dof_displs);CHKERRQ(ierr); 3948ef028eecSStefano Zampini ierr = PetscFree(dof_sizes);CHKERRQ(ierr); 3949ef028eecSStefano Zampini 3950ef028eecSStefano Zampini if (dbg_flag) { 39512e8d2280SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 39522e8d2280SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr); 39532e8d2280SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Check coarse indices\n");CHKERRQ(ierr); 39542e8d2280SStefano Zampini ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr); 39552e8d2280SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 39562fa5cd67SKarl Rupp for (i=0;i<pcbddc->local_primal_size;i++) array[auxlocal_primal[i]]=1.0; 3957beed3852SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 39582e8d2280SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 3959da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 3960da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 3961da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 3962da1bb401SStefano Zampini ierr = VecScatterEnd 
(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 3963da1bb401SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 39642e8d2280SStefano Zampini for (i=0;i<pcis->n;i++) { 39652e8d2280SStefano Zampini if (array[i] == 1.0) { 39662e8d2280SStefano Zampini ierr = ISLocalToGlobalMappingApply(matis->mapping,1,&i,&j);CHKERRQ(ierr); 39672e8d2280SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d: WRONG COARSE INDEX %d (local %d)\n",PetscGlobalRank,j,i);CHKERRQ(ierr); 39682e8d2280SStefano Zampini } 39692e8d2280SStefano Zampini } 39702e8d2280SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 39712e8d2280SStefano Zampini for (i=0;i<pcis->n;i++) { 39722fa5cd67SKarl Rupp if (array[i] > 0.0) array[i] = 1.0/array[i]; 39732e8d2280SStefano Zampini } 3974da1bb401SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 39752e8d2280SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 3976da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 3977da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 3978da1bb401SStefano Zampini ierr = VecSum(pcis->vec1_global,&coarsesum);CHKERRQ(ierr); 39792e8d2280SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Size of coarse problem SHOULD be %lf\n",coarsesum);CHKERRQ(ierr); 39802e8d2280SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 39812e8d2280SStefano Zampini } 3982142dfd88SStefano Zampini ierr = PetscFree(auxlocal_primal);CHKERRQ(ierr); 39830bdf917eSStefano Zampini } 39840bdf917eSStefano Zampini 39852e8d2280SStefano Zampini if (dbg_flag) { 39867cf533a6SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Size of coarse problem is %d\n",pcbddc->coarse_size);CHKERRQ(ierr); 39872e8d2280SStefano Zampini ierr = 
PetscViewerFlush(viewer);CHKERRQ(ierr); 39882e8d2280SStefano Zampini } 39892e8d2280SStefano Zampini 3990a929c220SStefano Zampini im_active = 0; 39912fa5cd67SKarl Rupp if (pcis->n) im_active = 1; 3992a929c220SStefano Zampini ierr = MPI_Allreduce(&im_active,&active_procs,1,MPIU_INT,MPI_SUM,prec_comm);CHKERRQ(ierr); 39930bdf917eSStefano Zampini 39940bdf917eSStefano Zampini /* adapt coarse problem type */ 39954fad6a16SStefano Zampini if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) { 39964fad6a16SStefano Zampini if (pcbddc->current_level < pcbddc->max_levels) { 3997a929c220SStefano Zampini if ((active_procs/pcbddc->coarsening_ratio) < 2) { 39980bdf917eSStefano Zampini if (dbg_flag) { 3999a929c220SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Not enough active processes on level %d (active %d,ratio %d). Parallel direct solve for coarse problem\n",pcbddc->current_level,active_procs,pcbddc->coarsening_ratio);CHKERRQ(ierr); 40000bdf917eSStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 40010bdf917eSStefano Zampini } 40020bdf917eSStefano Zampini pcbddc->coarse_problem_type = PARALLEL_BDDC; 4003142dfd88SStefano Zampini } 40044fad6a16SStefano Zampini } else { 40054fad6a16SStefano Zampini if (dbg_flag) { 4006a929c220SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Max number of levels reached. 
Using parallel direct solve for coarse problem\n",pcbddc->max_levels,active_procs,pcbddc->coarsening_ratio);CHKERRQ(ierr); 40074fad6a16SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 40084fad6a16SStefano Zampini } 40094fad6a16SStefano Zampini pcbddc->coarse_problem_type = PARALLEL_BDDC; 40104fad6a16SStefano Zampini } 40114fad6a16SStefano Zampini } 4012beed3852SStefano Zampini 40130c7d97c5SJed Brown switch (pcbddc->coarse_problem_type) { 40140c7d97c5SJed Brown 4015da1bb401SStefano Zampini case (MULTILEVEL_BDDC): /* we define a coarse mesh where subdomains are elements */ 40160c7d97c5SJed Brown { 40170c7d97c5SJed Brown /* we need additional variables */ 40180c7d97c5SJed Brown MetisInt n_subdomains,n_parts,objval,ncon,faces_nvtxs; 40190c7d97c5SJed Brown MetisInt *metis_coarse_subdivision; 40200c7d97c5SJed Brown MetisInt options[METIS_NOPTIONS]; 40210c7d97c5SJed Brown PetscMPIInt size_coarse_comm,rank_coarse_comm; 40220c7d97c5SJed Brown PetscMPIInt procs_jumps_coarse_comm; 40230c7d97c5SJed Brown PetscMPIInt *coarse_subdivision; 40240c7d97c5SJed Brown PetscMPIInt *total_count_recv; 40250c7d97c5SJed Brown PetscMPIInt *total_ranks_recv; 40260c7d97c5SJed Brown PetscMPIInt *displacements_recv; 40270c7d97c5SJed Brown PetscMPIInt *my_faces_connectivity; 40280c7d97c5SJed Brown PetscMPIInt *petsc_faces_adjncy; 40290c7d97c5SJed Brown MetisInt *faces_adjncy; 40300c7d97c5SJed Brown MetisInt *faces_xadj; 40310c7d97c5SJed Brown PetscMPIInt *number_of_faces; 40320c7d97c5SJed Brown PetscMPIInt *faces_displacements; 40330c7d97c5SJed Brown PetscInt *array_int; 40340c7d97c5SJed Brown PetscMPIInt my_faces =0; 40350c7d97c5SJed Brown PetscMPIInt total_faces=0; 40363828260eSStefano Zampini PetscInt ranks_stretching_ratio; 40370c7d97c5SJed Brown 40380c7d97c5SJed Brown /* define some quantities */ 40390c7d97c5SJed Brown pcbddc->coarse_communications_type = SCATTERS_BDDC; 40400c7d97c5SJed Brown coarse_mat_type = MATIS; 40410c7d97c5SJed Brown coarse_pc_type = PCBDDC; 
4042142dfd88SStefano Zampini coarse_ksp_type = KSPRICHARDSON; 40430c7d97c5SJed Brown 40440c7d97c5SJed Brown /* details of coarse decomposition */ 4045a929c220SStefano Zampini n_subdomains = active_procs; 40460c7d97c5SJed Brown n_parts = n_subdomains/pcbddc->coarsening_ratio; 4047a929c220SStefano Zampini ranks_stretching_ratio = size_prec_comm/active_procs; 40483828260eSStefano Zampini procs_jumps_coarse_comm = pcbddc->coarsening_ratio*ranks_stretching_ratio; 40493828260eSStefano Zampini 4050a929c220SStefano Zampini #if 0 4051a929c220SStefano Zampini PetscMPIInt *old_ranks; 4052a929c220SStefano Zampini PetscInt *new_ranks,*jj,*ii; 4053a929c220SStefano Zampini MatPartitioning mat_part; 4054a929c220SStefano Zampini IS coarse_new_decomposition,is_numbering; 4055a929c220SStefano Zampini PetscViewer viewer_test; 4056a929c220SStefano Zampini MPI_Comm test_coarse_comm; 4057a929c220SStefano Zampini PetscMPIInt test_coarse_color; 4058a929c220SStefano Zampini Mat mat_adj; 4059a929c220SStefano Zampini /* Create new communicator for coarse problem splitting the old one */ 4060a929c220SStefano Zampini /* procs with coarse_color = MPI_UNDEFINED will have coarse_comm = MPI_COMM_NULL (from mpi standards) 4061a929c220SStefano Zampini key = rank_prec_comm -> keep same ordering of ranks from the old to the new communicator */ 4062a929c220SStefano Zampini test_coarse_color = (im_active ? 
0 : MPI_UNDEFINED); 4063a929c220SStefano Zampini test_coarse_comm = MPI_COMM_NULL; 4064a929c220SStefano Zampini ierr = MPI_Comm_split(prec_comm,test_coarse_color,rank_prec_comm,&test_coarse_comm);CHKERRQ(ierr); 4065a929c220SStefano Zampini if (im_active) { 4066a929c220SStefano Zampini ierr = PetscMalloc(n_subdomains*sizeof(PetscMPIInt),&old_ranks); 4067a929c220SStefano Zampini ierr = PetscMalloc(size_prec_comm*sizeof(PetscInt),&new_ranks); 4068a929c220SStefano Zampini ierr = MPI_Comm_rank(test_coarse_comm,&rank_coarse_comm);CHKERRQ(ierr); 4069a929c220SStefano Zampini ierr = MPI_Comm_size(test_coarse_comm,&j);CHKERRQ(ierr); 4070a929c220SStefano Zampini ierr = MPI_Allgather(&rank_prec_comm,1,MPIU_INT,old_ranks,1,MPIU_INT,test_coarse_comm);CHKERRQ(ierr); 40712fa5cd67SKarl Rupp for (i=0; i<size_prec_comm; i++) 4072a929c220SStefano Zampini new_ranks[i] = -1; 40732fa5cd67SKarl Rupp for (i=0; i<n_subdomains; i++) 4074a929c220SStefano Zampini new_ranks[old_ranks[i]] = i; 4075a929c220SStefano Zampini ierr = PetscViewerASCIIOpen(test_coarse_comm,"test_mat_part.out",&viewer_test);CHKERRQ(ierr); 4076a929c220SStefano Zampini k = pcis->n_neigh-1; 4077a929c220SStefano Zampini ierr = PetscMalloc(2*sizeof(PetscInt),&ii); 4078a929c220SStefano Zampini ii[0]=0; 4079a929c220SStefano Zampini ii[1]=k; 4080a929c220SStefano Zampini ierr = PetscMalloc(k*sizeof(PetscInt),&jj); 40812fa5cd67SKarl Rupp for (i=0; i<k; i++) 4082a929c220SStefano Zampini jj[i]=new_ranks[pcis->neigh[i+1]]; 4083a929c220SStefano Zampini ierr = PetscSortInt(k,jj);CHKERRQ(ierr); 4084a929c220SStefano Zampini ierr = MatCreateMPIAdj(test_coarse_comm,1,n_subdomains,ii,jj,PETSC_NULL,&mat_adj);CHKERRQ(ierr); 4085a929c220SStefano Zampini ierr = MatView(mat_adj,viewer_test);CHKERRQ(ierr); 4086a929c220SStefano Zampini ierr = MatPartitioningCreate(test_coarse_comm,&mat_part);CHKERRQ(ierr); 4087a929c220SStefano Zampini ierr = MatPartitioningSetAdjacency(mat_part,mat_adj);CHKERRQ(ierr); 4088a929c220SStefano Zampini ierr = 
MatPartitioningSetFromOptions(mat_part);CHKERRQ(ierr); 4089a929c220SStefano Zampini printf("Setting Nparts %d\n",n_parts); 4090a929c220SStefano Zampini ierr = MatPartitioningSetNParts(mat_part,n_parts);CHKERRQ(ierr); 4091a929c220SStefano Zampini ierr = MatPartitioningView(mat_part,viewer_test);CHKERRQ(ierr); 4092a929c220SStefano Zampini ierr = MatPartitioningApply(mat_part,&coarse_new_decomposition);CHKERRQ(ierr); 4093a929c220SStefano Zampini ierr = ISView(coarse_new_decomposition,viewer_test);CHKERRQ(ierr); 4094a929c220SStefano Zampini ierr = ISPartitioningToNumbering(coarse_new_decomposition,&is_numbering);CHKERRQ(ierr); 4095a929c220SStefano Zampini ierr = ISView(is_numbering,viewer_test);CHKERRQ(ierr); 4096a929c220SStefano Zampini ierr = PetscViewerDestroy(&viewer_test);CHKERRQ(ierr); 4097a929c220SStefano Zampini ierr = ISDestroy(&coarse_new_decomposition);CHKERRQ(ierr); 4098a929c220SStefano Zampini ierr = ISDestroy(&is_numbering);CHKERRQ(ierr); 4099a929c220SStefano Zampini ierr = MatPartitioningDestroy(&mat_part);CHKERRQ(ierr); 4100a929c220SStefano Zampini ierr = PetscFree(old_ranks);CHKERRQ(ierr); 4101a929c220SStefano Zampini ierr = PetscFree(new_ranks);CHKERRQ(ierr); 4102a929c220SStefano Zampini ierr = MPI_Comm_free(&test_coarse_comm);CHKERRQ(ierr); 4103a929c220SStefano Zampini } 4104a929c220SStefano Zampini #endif 4105a929c220SStefano Zampini 41064fad6a16SStefano Zampini /* build CSR graph of subdomains' connectivity */ 41070c7d97c5SJed Brown ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&array_int);CHKERRQ(ierr); 41083828260eSStefano Zampini ierr = PetscMemzero(array_int,pcis->n*sizeof(PetscInt));CHKERRQ(ierr); 41090c7d97c5SJed Brown for (i=1;i<pcis->n_neigh;i++) {/* i=1 so I don't count myself -> faces nodes counts to 1 */ 41100c7d97c5SJed Brown for (j=0;j<pcis->n_shared[i];j++) { 41110c7d97c5SJed Brown array_int[pcis->shared[i][j]]+=1; 41120c7d97c5SJed Brown } 41130c7d97c5SJed Brown } 41140c7d97c5SJed Brown for (i=1;i<pcis->n_neigh;i++) { 41150c7d97c5SJed 
Brown for (j=0;j<pcis->n_shared[i];j++) { 41167cf533a6SStefano Zampini if (array_int[pcis->shared[i][j]] > 0) { 41170c7d97c5SJed Brown my_faces++; 41180c7d97c5SJed Brown break; 41190c7d97c5SJed Brown } 41200c7d97c5SJed Brown } 41210c7d97c5SJed Brown } 41220c7d97c5SJed Brown 412353cdbc3dSStefano Zampini ierr = MPI_Reduce(&my_faces,&total_faces,1,MPIU_INT,MPI_SUM,master_proc,prec_comm);CHKERRQ(ierr); 41240c7d97c5SJed Brown ierr = PetscMalloc (my_faces*sizeof(PetscInt),&my_faces_connectivity);CHKERRQ(ierr); 41250c7d97c5SJed Brown my_faces=0; 41260c7d97c5SJed Brown for (i=1;i<pcis->n_neigh;i++) { 41270c7d97c5SJed Brown for (j=0;j<pcis->n_shared[i];j++) { 41287cf533a6SStefano Zampini if (array_int[pcis->shared[i][j]] > 0) { 41290c7d97c5SJed Brown my_faces_connectivity[my_faces]=pcis->neigh[i]; 41300c7d97c5SJed Brown my_faces++; 41310c7d97c5SJed Brown break; 41320c7d97c5SJed Brown } 41330c7d97c5SJed Brown } 41340c7d97c5SJed Brown } 41350c7d97c5SJed Brown if (rank_prec_comm == master_proc) { 41360c7d97c5SJed Brown ierr = PetscMalloc (total_faces*sizeof(PetscMPIInt),&petsc_faces_adjncy);CHKERRQ(ierr); 41370c7d97c5SJed Brown ierr = PetscMalloc (size_prec_comm*sizeof(PetscMPIInt),&number_of_faces);CHKERRQ(ierr); 41380c7d97c5SJed Brown ierr = PetscMalloc (total_faces*sizeof(MetisInt),&faces_adjncy);CHKERRQ(ierr); 41390c7d97c5SJed Brown ierr = PetscMalloc ((n_subdomains+1)*sizeof(MetisInt),&faces_xadj);CHKERRQ(ierr); 41400c7d97c5SJed Brown ierr = PetscMalloc ((size_prec_comm+1)*sizeof(PetscMPIInt),&faces_displacements);CHKERRQ(ierr); 41410c7d97c5SJed Brown } 414253cdbc3dSStefano Zampini ierr = MPI_Gather(&my_faces,1,MPIU_INT,&number_of_faces[0],1,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr); 41430c7d97c5SJed Brown if (rank_prec_comm == master_proc) { 41440c7d97c5SJed Brown faces_xadj[0] = 0; 41450c7d97c5SJed Brown faces_displacements[0] = 0; 41462fa5cd67SKarl Rupp 41470c7d97c5SJed Brown j=0; 41480c7d97c5SJed Brown for (i=1;i<size_prec_comm+1;i++) { 41490c7d97c5SJed Brown 
faces_displacements[i]=faces_displacements[i-1]+number_of_faces[i-1]; 41500c7d97c5SJed Brown if (number_of_faces[i-1]) { 41510c7d97c5SJed Brown j++; 41520c7d97c5SJed Brown faces_xadj[j]=faces_xadj[j-1]+number_of_faces[i-1]; 41530c7d97c5SJed Brown } 41540c7d97c5SJed Brown } 41550c7d97c5SJed Brown } 415653cdbc3dSStefano Zampini ierr = MPI_Gatherv(&my_faces_connectivity[0],my_faces,MPIU_INT,&petsc_faces_adjncy[0],number_of_faces,faces_displacements,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr); 41570c7d97c5SJed Brown ierr = PetscFree(my_faces_connectivity);CHKERRQ(ierr); 41580c7d97c5SJed Brown ierr = PetscFree(array_int);CHKERRQ(ierr); 41590c7d97c5SJed Brown if (rank_prec_comm == master_proc) { 41603828260eSStefano Zampini for (i=0; i<total_faces; i++) faces_adjncy[i]=(MetisInt)(petsc_faces_adjncy[i]/ranks_stretching_ratio); /* cast to MetisInt */ 41610c7d97c5SJed Brown ierr = PetscFree(faces_displacements);CHKERRQ(ierr); 41620c7d97c5SJed Brown ierr = PetscFree(number_of_faces);CHKERRQ(ierr); 41630c7d97c5SJed Brown ierr = PetscFree(petsc_faces_adjncy);CHKERRQ(ierr); 41640c7d97c5SJed Brown } 41650c7d97c5SJed Brown 41660c7d97c5SJed Brown if (rank_prec_comm == master_proc) { 41673828260eSStefano Zampini PetscInt heuristic_for_metis=3; 41680c7d97c5SJed Brown ncon =1; 41690c7d97c5SJed Brown faces_nvtxs=n_subdomains; 41700c7d97c5SJed Brown /* partition graoh induced by face connectivity */ 41710c7d97c5SJed Brown ierr = PetscMalloc (n_subdomains*sizeof(MetisInt),&metis_coarse_subdivision);CHKERRQ(ierr); 41720c7d97c5SJed Brown ierr = METIS_SetDefaultOptions(options); 41730c7d97c5SJed Brown /* we need a contiguous partition of the coarse mesh */ 41740c7d97c5SJed Brown options[METIS_OPTION_CONTIG]=1; 41750c7d97c5SJed Brown options[METIS_OPTION_NITER] =30; 41764fad6a16SStefano Zampini if (pcbddc->coarsening_ratio > 1) { 41773828260eSStefano Zampini if (n_subdomains>n_parts*heuristic_for_metis) { 41783828260eSStefano Zampini options[METIS_OPTION_IPTYPE] =METIS_IPTYPE_EDGE; 
41793828260eSStefano Zampini options[METIS_OPTION_OBJTYPE]=METIS_OBJTYPE_CUT; 41802fa5cd67SKarl Rupp 41810c7d97c5SJed Brown ierr = METIS_PartGraphKway(&faces_nvtxs,&ncon,faces_xadj,faces_adjncy,NULL,NULL,NULL,&n_parts,NULL,NULL,options,&objval,metis_coarse_subdivision); 4182142dfd88SStefano Zampini if (ierr != METIS_OK) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in METIS_PartGraphKway (metis error code %D) called from PCBDDCSetupCoarseEnvironment\n",ierr); 41833828260eSStefano Zampini } else { 41843828260eSStefano Zampini ierr = METIS_PartGraphRecursive(&faces_nvtxs,&ncon,faces_xadj,faces_adjncy,NULL,NULL,NULL,&n_parts,NULL,NULL,options,&objval,metis_coarse_subdivision); 4185142dfd88SStefano Zampini if (ierr != METIS_OK) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in METIS_PartGraphRecursive (metis error code %D) called from PCBDDCSetupCoarseEnvironment\n",ierr); 41863828260eSStefano Zampini } 41874fad6a16SStefano Zampini } else { 41882fa5cd67SKarl Rupp for (i=0;i<n_subdomains;i++) metis_coarse_subdivision[i]=i; 41894fad6a16SStefano Zampini } 41900c7d97c5SJed Brown ierr = PetscFree(faces_xadj);CHKERRQ(ierr); 41910c7d97c5SJed Brown ierr = PetscFree(faces_adjncy);CHKERRQ(ierr); 41920bdf917eSStefano Zampini ierr = PetscMalloc(size_prec_comm*sizeof(PetscMPIInt),&coarse_subdivision);CHKERRQ(ierr); 41932fa5cd67SKarl Rupp 41940c7d97c5SJed Brown /* copy/cast values avoiding possible type conflicts between PETSc, MPI and METIS */ 41952fa5cd67SKarl Rupp for (i=0;i<size_prec_comm;i++) coarse_subdivision[i]=MPI_PROC_NULL; 41962fa5cd67SKarl Rupp for (i=0;i<n_subdomains;i++) coarse_subdivision[ranks_stretching_ratio*i]=(PetscInt)(metis_coarse_subdivision[i]); 41970c7d97c5SJed Brown ierr = PetscFree(metis_coarse_subdivision);CHKERRQ(ierr); 41980c7d97c5SJed Brown } 41990c7d97c5SJed Brown 42000c7d97c5SJed Brown /* Create new communicator for coarse problem splitting the old one */ 42010c7d97c5SJed Brown if (!(rank_prec_comm%procs_jumps_coarse_comm) && rank_prec_comm < 
procs_jumps_coarse_comm*n_parts) { 4202da1bb401SStefano Zampini coarse_color=0; /* for communicator splitting */ 4203da1bb401SStefano Zampini active_rank =rank_prec_comm; /* for insertion of matrix values */ 42040c7d97c5SJed Brown } 4205da1bb401SStefano Zampini /* procs with coarse_color = MPI_UNDEFINED will have coarse_comm = MPI_COMM_NULL (from mpi standards) 4206da1bb401SStefano Zampini key = rank_prec_comm -> keep same ordering of ranks from the old to the new communicator */ 420753cdbc3dSStefano Zampini ierr = MPI_Comm_split(prec_comm,coarse_color,rank_prec_comm,&coarse_comm);CHKERRQ(ierr); 42080c7d97c5SJed Brown 42090c7d97c5SJed Brown if (coarse_color == 0) { 421053cdbc3dSStefano Zampini ierr = MPI_Comm_size(coarse_comm,&size_coarse_comm);CHKERRQ(ierr); 421153cdbc3dSStefano Zampini ierr = MPI_Comm_rank(coarse_comm,&rank_coarse_comm);CHKERRQ(ierr); 42120c7d97c5SJed Brown } else { 42130c7d97c5SJed Brown rank_coarse_comm = MPI_PROC_NULL; 42140c7d97c5SJed Brown } 42150c7d97c5SJed Brown 42167cf533a6SStefano Zampini /* master proc take care of arranging and distributing coarse information */ 42170c7d97c5SJed Brown if (rank_coarse_comm == master_proc) { 42180c7d97c5SJed Brown ierr = PetscMalloc (size_coarse_comm*sizeof(PetscMPIInt),&displacements_recv);CHKERRQ(ierr); 42190bdf917eSStefano Zampini ierr = PetscMalloc (size_coarse_comm*sizeof(PetscMPIInt),&total_count_recv);CHKERRQ(ierr); 42200bdf917eSStefano Zampini ierr = PetscMalloc (n_subdomains*sizeof(PetscMPIInt),&total_ranks_recv);CHKERRQ(ierr); 42210c7d97c5SJed Brown /* some initializations */ 42220c7d97c5SJed Brown displacements_recv[0]=0; 42230bdf917eSStefano Zampini ierr = PetscMemzero(total_count_recv,size_coarse_comm*sizeof(PetscMPIInt));CHKERRQ(ierr); 42240c7d97c5SJed Brown /* count from how many processes the j-th process of the coarse decomposition will receive data */ 42250bdf917eSStefano Zampini for (j=0; j<size_coarse_comm; j++) { 42260bdf917eSStefano Zampini for (i=0; i<size_prec_comm; i++) { 
42272fa5cd67SKarl Rupp if (coarse_subdivision[i]==j) total_count_recv[j]++; 42280bdf917eSStefano Zampini } 42290bdf917eSStefano Zampini } 42300c7d97c5SJed Brown /* displacements needed for scatterv of total_ranks_recv */ 42312fa5cd67SKarl Rupp for (i=1; i<size_coarse_comm; i++) displacements_recv[i]=displacements_recv[i-1]+total_count_recv[i-1]; 42322fa5cd67SKarl Rupp 42330c7d97c5SJed Brown /* Now fill properly total_ranks_recv -> each coarse process will receive the ranks (in prec_comm communicator) of its friend (sending) processes */ 42340c7d97c5SJed Brown ierr = PetscMemzero(total_count_recv,size_coarse_comm*sizeof(PetscMPIInt));CHKERRQ(ierr); 42350c7d97c5SJed Brown for (j=0; j<size_coarse_comm; j++) { 42363828260eSStefano Zampini for (i=0; i<size_prec_comm; i++) { 42370c7d97c5SJed Brown if (coarse_subdivision[i]==j) { 42380c7d97c5SJed Brown total_ranks_recv[displacements_recv[j]+total_count_recv[j]] = i; 42392fa5cd67SKarl Rupp 42403828260eSStefano Zampini total_count_recv[j] += 1; 42410c7d97c5SJed Brown } 42420c7d97c5SJed Brown } 42430c7d97c5SJed Brown } 4244da1bb401SStefano Zampini /* for (j=0;j<size_coarse_comm;j++) { 42453828260eSStefano Zampini printf("process %d in new rank will receive from %d processes (original ranks follows)\n",j,total_count_recv[j]); 42463828260eSStefano Zampini for (i=0;i<total_count_recv[j];i++) { 42473828260eSStefano Zampini printf("%d ",total_ranks_recv[displacements_recv[j]+i]); 42483828260eSStefano Zampini } 42493828260eSStefano Zampini printf("\n"); 4250da1bb401SStefano Zampini } */ 42510c7d97c5SJed Brown 42520c7d97c5SJed Brown /* identify new decomposition in terms of ranks in the old communicator */ 42530bdf917eSStefano Zampini for (i=0; i<n_subdomains; i++) { 42540bdf917eSStefano Zampini coarse_subdivision[ranks_stretching_ratio*i]=coarse_subdivision[ranks_stretching_ratio*i]*procs_jumps_coarse_comm; 42550bdf917eSStefano Zampini } 4256da1bb401SStefano Zampini /* printf("coarse_subdivision in old end new ranks\n"); 
42572fa5cd67SKarl Rupp for (i=0;i<size_prec_comm;i++) { 42583828260eSStefano Zampini if (coarse_subdivision[i]!=MPI_PROC_NULL) { 42593828260eSStefano Zampini printf("%d=(%d %d), ",i,coarse_subdivision[i],coarse_subdivision[i]/procs_jumps_coarse_comm); 42603828260eSStefano Zampini } else { 42613828260eSStefano Zampini printf("%d=(%d %d), ",i,coarse_subdivision[i],coarse_subdivision[i]); 42623828260eSStefano Zampini } 42632fa5cd67SKarl Rupp } 4264da1bb401SStefano Zampini printf("\n"); */ 42650c7d97c5SJed Brown } 42660c7d97c5SJed Brown 42670c7d97c5SJed Brown /* Scatter new decomposition for send details */ 426853cdbc3dSStefano Zampini ierr = MPI_Scatter(&coarse_subdivision[0],1,MPIU_INT,&rank_coarse_proc_send_to,1,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr); 42690c7d97c5SJed Brown /* Scatter receiving details to members of coarse decomposition */ 42700c7d97c5SJed Brown if (coarse_color == 0) { 427153cdbc3dSStefano Zampini ierr = MPI_Scatter(&total_count_recv[0],1,MPIU_INT,&count_recv,1,MPIU_INT,master_proc,coarse_comm);CHKERRQ(ierr); 42720c7d97c5SJed Brown ierr = PetscMalloc (count_recv*sizeof(PetscMPIInt),&ranks_recv);CHKERRQ(ierr); 427353cdbc3dSStefano Zampini ierr = MPI_Scatterv(&total_ranks_recv[0],total_count_recv,displacements_recv,MPIU_INT,&ranks_recv[0],count_recv,MPIU_INT,master_proc,coarse_comm);CHKERRQ(ierr); 42740c7d97c5SJed Brown } 42750c7d97c5SJed Brown 4276da1bb401SStefano Zampini /* printf("I will send my matrix data to proc %d\n",rank_coarse_proc_send_to); 4277da1bb401SStefano Zampini if (coarse_color == 0) { 4278da1bb401SStefano Zampini printf("I will receive some matrix data from %d processes (ranks follows)\n",count_recv); 4279da1bb401SStefano Zampini for (i=0;i<count_recv;i++) 4280da1bb401SStefano Zampini printf("%d ",ranks_recv[i]); 4281da1bb401SStefano Zampini printf("\n"); 4282da1bb401SStefano Zampini } */ 42830c7d97c5SJed Brown 42840c7d97c5SJed Brown if (rank_prec_comm == master_proc) { 42850bdf917eSStefano Zampini ierr = 
PetscFree(coarse_subdivision);CHKERRQ(ierr); 4286da1bb401SStefano Zampini ierr = PetscFree(total_count_recv);CHKERRQ(ierr); 42870bdf917eSStefano Zampini ierr = PetscFree(total_ranks_recv);CHKERRQ(ierr); 42880c7d97c5SJed Brown ierr = PetscFree(displacements_recv);CHKERRQ(ierr); 42890c7d97c5SJed Brown } 42900c7d97c5SJed Brown break; 42910c7d97c5SJed Brown } 42920c7d97c5SJed Brown 42930c7d97c5SJed Brown case (REPLICATED_BDDC): 42940c7d97c5SJed Brown 42950c7d97c5SJed Brown pcbddc->coarse_communications_type = GATHERS_BDDC; 42960c7d97c5SJed Brown coarse_mat_type = MATSEQAIJ; 42970c7d97c5SJed Brown coarse_pc_type = PCLU; 429853cdbc3dSStefano Zampini coarse_ksp_type = KSPPREONLY; 42990c7d97c5SJed Brown coarse_comm = PETSC_COMM_SELF; 43000c7d97c5SJed Brown active_rank = rank_prec_comm; 43010c7d97c5SJed Brown break; 43020c7d97c5SJed Brown 43030c7d97c5SJed Brown case (PARALLEL_BDDC): 43040c7d97c5SJed Brown 43050c7d97c5SJed Brown pcbddc->coarse_communications_type = SCATTERS_BDDC; 43060c7d97c5SJed Brown coarse_mat_type = MATMPIAIJ; 43070c7d97c5SJed Brown coarse_pc_type = PCREDUNDANT; 430853cdbc3dSStefano Zampini coarse_ksp_type = KSPPREONLY; 43090c7d97c5SJed Brown coarse_comm = prec_comm; 43100c7d97c5SJed Brown active_rank = rank_prec_comm; 43110c7d97c5SJed Brown break; 43120c7d97c5SJed Brown 43130c7d97c5SJed Brown case (SEQUENTIAL_BDDC): 43140c7d97c5SJed Brown pcbddc->coarse_communications_type = GATHERS_BDDC; 43150c7d97c5SJed Brown coarse_mat_type = MATSEQAIJ; 43160c7d97c5SJed Brown coarse_pc_type = PCLU; 431753cdbc3dSStefano Zampini coarse_ksp_type = KSPPREONLY; 43180c7d97c5SJed Brown coarse_comm = PETSC_COMM_SELF; 43190c7d97c5SJed Brown active_rank = master_proc; 43200c7d97c5SJed Brown break; 43210c7d97c5SJed Brown } 43220c7d97c5SJed Brown 43230c7d97c5SJed Brown switch (pcbddc->coarse_communications_type) { 43240c7d97c5SJed Brown 43250c7d97c5SJed Brown case(SCATTERS_BDDC): 43260c7d97c5SJed Brown { 43270c7d97c5SJed Brown if (pcbddc->coarse_problem_type==MULTILEVEL_BDDC) { 
43280c7d97c5SJed Brown 43292e8d2280SStefano Zampini IS coarse_IS; 43302e8d2280SStefano Zampini 4331523858cfSStefano Zampini if (pcbddc->coarsening_ratio == 1) { 4332523858cfSStefano Zampini ins_local_primal_size = pcbddc->local_primal_size; 4333523858cfSStefano Zampini ins_local_primal_indices = pcbddc->local_primal_indices; 4334523858cfSStefano Zampini if (coarse_color == 0) { ierr = PetscFree(ranks_recv);CHKERRQ(ierr); } 4335523858cfSStefano Zampini /* nonzeros */ 4336523858cfSStefano Zampini ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&dnz);CHKERRQ(ierr); 4337523858cfSStefano Zampini ierr = PetscMemzero(dnz,ins_local_primal_size*sizeof(PetscInt));CHKERRQ(ierr); 4338523858cfSStefano Zampini for (i=0;i<ins_local_primal_size;i++) { 4339523858cfSStefano Zampini dnz[i] = ins_local_primal_size; 4340523858cfSStefano Zampini } 4341523858cfSStefano Zampini } else { 43420c7d97c5SJed Brown PetscMPIInt send_size; 4343ef028eecSStefano Zampini PetscMPIInt *send_buffer; 43440c7d97c5SJed Brown PetscInt *aux_ins_indices; 43450c7d97c5SJed Brown PetscInt ii,jj; 43460c7d97c5SJed Brown MPI_Request *requests; 4347ef028eecSStefano Zampini 4348523858cfSStefano Zampini ierr = PetscMalloc(count_recv*sizeof(PetscMPIInt),&localdispl2);CHKERRQ(ierr); 4349523858cfSStefano Zampini /* reusing pcbddc->local_primal_displacements and pcbddc->replicated_primal_size */ 4350523858cfSStefano Zampini ierr = PetscFree(pcbddc->local_primal_displacements);CHKERRQ(ierr); 4351523858cfSStefano Zampini ierr = PetscMalloc((count_recv+1)*sizeof(PetscMPIInt),&pcbddc->local_primal_displacements);CHKERRQ(ierr); 4352523858cfSStefano Zampini pcbddc->replicated_primal_size = count_recv; 4353523858cfSStefano Zampini j = 0; 4354523858cfSStefano Zampini for (i=0;i<count_recv;i++) { 4355523858cfSStefano Zampini pcbddc->local_primal_displacements[i] = j; 4356523858cfSStefano Zampini j += pcbddc->local_primal_sizes[ranks_recv[i]]; 4357523858cfSStefano Zampini } 4358523858cfSStefano Zampini 
pcbddc->local_primal_displacements[count_recv] = j; 4359523858cfSStefano Zampini ierr = PetscMalloc(j*sizeof(PetscMPIInt),&pcbddc->replicated_local_primal_indices);CHKERRQ(ierr); 43600c7d97c5SJed Brown /* allocate auxiliary space */ 4361523858cfSStefano Zampini ierr = PetscMalloc(count_recv*sizeof(PetscMPIInt),&localsizes2);CHKERRQ(ierr); 43620c7d97c5SJed Brown ierr = PetscMalloc(pcbddc->coarse_size*sizeof(PetscInt),&aux_ins_indices);CHKERRQ(ierr); 43630c7d97c5SJed Brown ierr = PetscMemzero(aux_ins_indices,pcbddc->coarse_size*sizeof(PetscInt));CHKERRQ(ierr); 43640c7d97c5SJed Brown /* allocate stuffs for message massing */ 43650c7d97c5SJed Brown ierr = PetscMalloc((count_recv+1)*sizeof(MPI_Request),&requests);CHKERRQ(ierr); 4366523858cfSStefano Zampini for (i=0;i<count_recv+1;i++) { requests[i]=MPI_REQUEST_NULL; } 4367523858cfSStefano Zampini /* send indices to be inserted */ 4368523858cfSStefano Zampini for (i=0;i<count_recv;i++) { 4369523858cfSStefano Zampini send_size = pcbddc->local_primal_sizes[ranks_recv[i]]; 4370523858cfSStefano Zampini ierr = MPI_Irecv(&pcbddc->replicated_local_primal_indices[pcbddc->local_primal_displacements[i]],send_size,MPIU_INT,ranks_recv[i],999,prec_comm,&requests[i]);CHKERRQ(ierr); 4371523858cfSStefano Zampini } 4372523858cfSStefano Zampini if (rank_coarse_proc_send_to != MPI_PROC_NULL) { 4373523858cfSStefano Zampini send_size = pcbddc->local_primal_size; 4374ef028eecSStefano Zampini ierr = PetscMalloc(send_size*sizeof(PetscMPIInt),&send_buffer);CHKERRQ(ierr); 4375ef028eecSStefano Zampini for (i=0;i<send_size;i++) { 4376ef028eecSStefano Zampini send_buffer[i]=(PetscMPIInt)pcbddc->local_primal_indices[i]; 4377ef028eecSStefano Zampini } 4378ef028eecSStefano Zampini ierr = MPI_Isend(send_buffer,send_size,MPIU_INT,rank_coarse_proc_send_to,999,prec_comm,&requests[count_recv]);CHKERRQ(ierr); 4379523858cfSStefano Zampini } 4380523858cfSStefano Zampini ierr = MPI_Waitall(count_recv+1,requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 
4381ef028eecSStefano Zampini if (rank_coarse_proc_send_to != MPI_PROC_NULL) { 4382ef028eecSStefano Zampini ierr = PetscFree(send_buffer);CHKERRQ(ierr); 4383ef028eecSStefano Zampini } 43840c7d97c5SJed Brown j = 0; 43850c7d97c5SJed Brown for (i=0;i<count_recv;i++) { 43862e8d2280SStefano Zampini ii = pcbddc->local_primal_displacements[i+1]-pcbddc->local_primal_displacements[i]; 43872e8d2280SStefano Zampini localsizes2[i] = ii*ii; 43880c7d97c5SJed Brown localdispl2[i] = j; 43890c7d97c5SJed Brown j += localsizes2[i]; 4390523858cfSStefano Zampini jj = pcbddc->local_primal_displacements[i]; 43914fad6a16SStefano Zampini /* it counts the coarse subdomains sharing the coarse node */ 43922e8d2280SStefano Zampini for (k=0;k<ii;k++) { 43934fad6a16SStefano Zampini aux_ins_indices[pcbddc->replicated_local_primal_indices[jj+k]] += 1; 43940c7d97c5SJed Brown } 43954fad6a16SStefano Zampini } 4396523858cfSStefano Zampini /* temp_coarse_mat_vals used to store matrix values to be received */ 43970c7d97c5SJed Brown ierr = PetscMalloc(j*sizeof(PetscScalar),&temp_coarse_mat_vals);CHKERRQ(ierr); 43980c7d97c5SJed Brown /* evaluate how many values I will insert in coarse mat */ 43990c7d97c5SJed Brown ins_local_primal_size = 0; 4400ea7e1babSStefano Zampini for (i=0;i<pcbddc->coarse_size;i++) { 4401ea7e1babSStefano Zampini if (aux_ins_indices[i]) { 44020c7d97c5SJed Brown ins_local_primal_size++; 4403ea7e1babSStefano Zampini } 4404ea7e1babSStefano Zampini } 44050c7d97c5SJed Brown /* evaluate indices I will insert in coarse mat */ 44060c7d97c5SJed Brown ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr); 44070c7d97c5SJed Brown j = 0; 4408ea7e1babSStefano Zampini for (i=0;i<pcbddc->coarse_size;i++) { 4409ea7e1babSStefano Zampini if (aux_ins_indices[i]) { 44102e8d2280SStefano Zampini ins_local_primal_indices[j] = i; 44112e8d2280SStefano Zampini j++; 4412ea7e1babSStefano Zampini } 4413ea7e1babSStefano Zampini } 4414523858cfSStefano Zampini /* processes 
partecipating in coarse problem receive matrix data from their friends */ 4415523858cfSStefano Zampini for (i=0;i<count_recv;i++) { 4416523858cfSStefano Zampini ierr = MPI_Irecv(&temp_coarse_mat_vals[localdispl2[i]],localsizes2[i],MPIU_SCALAR,ranks_recv[i],666,prec_comm,&requests[i]);CHKERRQ(ierr); 4417523858cfSStefano Zampini } 4418523858cfSStefano Zampini if (rank_coarse_proc_send_to != MPI_PROC_NULL) { 4419523858cfSStefano Zampini send_size = pcbddc->local_primal_size*pcbddc->local_primal_size; 4420523858cfSStefano Zampini ierr = MPI_Isend(&coarse_submat_vals[0],send_size,MPIU_SCALAR,rank_coarse_proc_send_to,666,prec_comm,&requests[count_recv]);CHKERRQ(ierr); 4421523858cfSStefano Zampini } 4422523858cfSStefano Zampini ierr = MPI_Waitall(count_recv+1,requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 4423523858cfSStefano Zampini /* nonzeros */ 4424523858cfSStefano Zampini ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&dnz);CHKERRQ(ierr); 4425523858cfSStefano Zampini ierr = PetscMemzero(dnz,ins_local_primal_size*sizeof(PetscInt));CHKERRQ(ierr); 44260c7d97c5SJed Brown /* use aux_ins_indices to realize a global to local mapping */ 44270c7d97c5SJed Brown j=0; 44280c7d97c5SJed Brown for (i=0;i<pcbddc->coarse_size;i++) { 44290c7d97c5SJed Brown if (aux_ins_indices[i]==0) { 44300c7d97c5SJed Brown aux_ins_indices[i]=-1; 44310c7d97c5SJed Brown } else { 44320c7d97c5SJed Brown aux_ins_indices[i]=j; 44330c7d97c5SJed Brown j++; 44340c7d97c5SJed Brown } 44350c7d97c5SJed Brown } 44364fad6a16SStefano Zampini for (i=0;i<count_recv;i++) { 4437523858cfSStefano Zampini j = pcbddc->local_primal_sizes[ranks_recv[i]]; 4438523858cfSStefano Zampini for (k=0;k<j;k++) { 4439523858cfSStefano Zampini dnz[aux_ins_indices[pcbddc->replicated_local_primal_indices[pcbddc->local_primal_displacements[i]+k]]] += j; 44400c7d97c5SJed Brown } 44410c7d97c5SJed Brown } 4442523858cfSStefano Zampini /* check */ 4443523858cfSStefano Zampini for (i=0;i<ins_local_primal_size;i++) { 4444523858cfSStefano 
Zampini if (dnz[i] > ins_local_primal_size) { 4445523858cfSStefano Zampini dnz[i] = ins_local_primal_size; 44460c7d97c5SJed Brown } 44470c7d97c5SJed Brown } 44480c7d97c5SJed Brown ierr = PetscFree(requests);CHKERRQ(ierr); 44490c7d97c5SJed Brown ierr = PetscFree(aux_ins_indices);CHKERRQ(ierr); 44500c7d97c5SJed Brown if (coarse_color == 0) { ierr = PetscFree(ranks_recv);CHKERRQ(ierr); } 44514fad6a16SStefano Zampini } 44520c7d97c5SJed Brown /* create local to global mapping needed by coarse MATIS */ 4453142dfd88SStefano Zampini if (coarse_comm != MPI_COMM_NULL) {ierr = MPI_Comm_free(&coarse_comm);CHKERRQ(ierr);} 44540c7d97c5SJed Brown coarse_comm = prec_comm; 44550c7d97c5SJed Brown active_rank = rank_prec_comm; 44560c7d97c5SJed Brown ierr = ISCreateGeneral(coarse_comm,ins_local_primal_size,ins_local_primal_indices,PETSC_COPY_VALUES,&coarse_IS);CHKERRQ(ierr); 44570c7d97c5SJed Brown ierr = ISLocalToGlobalMappingCreateIS(coarse_IS,&coarse_ISLG);CHKERRQ(ierr); 44580c7d97c5SJed Brown ierr = ISDestroy(&coarse_IS);CHKERRQ(ierr); 44592e8d2280SStefano Zampini } else if (pcbddc->coarse_problem_type==PARALLEL_BDDC) { 44600c7d97c5SJed Brown /* arrays for values insertion */ 44610c7d97c5SJed Brown ins_local_primal_size = pcbddc->local_primal_size; 44622e8d2280SStefano Zampini ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr); 44630c7d97c5SJed Brown ierr = PetscMalloc(ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar),&ins_coarse_mat_vals);CHKERRQ(ierr); 44640c7d97c5SJed Brown for (j=0;j<ins_local_primal_size;j++) { 44650c7d97c5SJed Brown ins_local_primal_indices[j]=pcbddc->local_primal_indices[j]; 44664fad6a16SStefano Zampini for (i=0;i<ins_local_primal_size;i++) { 44674fad6a16SStefano Zampini ins_coarse_mat_vals[j*ins_local_primal_size+i]=coarse_submat_vals[j*ins_local_primal_size+i]; 44684fad6a16SStefano Zampini } 44690c7d97c5SJed Brown } 44700c7d97c5SJed Brown } 44710c7d97c5SJed Brown break; 44720c7d97c5SJed Brown } 
44730c7d97c5SJed Brown 44740c7d97c5SJed Brown case (GATHERS_BDDC): 44750c7d97c5SJed Brown { 44760c7d97c5SJed Brown PetscMPIInt mysize,mysize2; 4477ef028eecSStefano Zampini PetscMPIInt *send_buffer; 44780c7d97c5SJed Brown 44790c7d97c5SJed Brown if (rank_prec_comm==active_rank) { 44800c7d97c5SJed Brown ierr = PetscMalloc (pcbddc->replicated_primal_size*sizeof(PetscMPIInt),&pcbddc->replicated_local_primal_indices);CHKERRQ(ierr); 44810bdf917eSStefano Zampini ierr = PetscMalloc (pcbddc->replicated_primal_size*sizeof(PetscScalar),&pcbddc->replicated_local_primal_values);CHKERRQ(ierr); 44820c7d97c5SJed Brown ierr = PetscMalloc (size_prec_comm*sizeof(PetscMPIInt),&localsizes2);CHKERRQ(ierr); 44830c7d97c5SJed Brown ierr = PetscMalloc (size_prec_comm*sizeof(PetscMPIInt),&localdispl2);CHKERRQ(ierr); 44840c7d97c5SJed Brown /* arrays for values insertion */ 44852fa5cd67SKarl Rupp for (i=0;i<size_prec_comm;i++) localsizes2[i]=pcbddc->local_primal_sizes[i]*pcbddc->local_primal_sizes[i]; 44860c7d97c5SJed Brown localdispl2[0]=0; 44872fa5cd67SKarl Rupp for (i=1;i<size_prec_comm;i++) localdispl2[i]=localsizes2[i-1]+localdispl2[i-1]; 44880c7d97c5SJed Brown j = 0; 44892fa5cd67SKarl Rupp for (i=0;i<size_prec_comm;i++) j+=localsizes2[i]; 44900c7d97c5SJed Brown ierr = PetscMalloc (j*sizeof(PetscScalar),&temp_coarse_mat_vals);CHKERRQ(ierr); 44910c7d97c5SJed Brown } 44920c7d97c5SJed Brown 44930c7d97c5SJed Brown mysize =pcbddc->local_primal_size; 44940c7d97c5SJed Brown mysize2=pcbddc->local_primal_size*pcbddc->local_primal_size; 4495ef028eecSStefano Zampini ierr = PetscMalloc(mysize*sizeof(PetscMPIInt),&send_buffer);CHKERRQ(ierr); 44962fa5cd67SKarl Rupp for (i=0; i<mysize; i++) send_buffer[i]=(PetscMPIInt)pcbddc->local_primal_indices[i]; 44972fa5cd67SKarl Rupp 44980c7d97c5SJed Brown if (pcbddc->coarse_problem_type == SEQUENTIAL_BDDC) { 4499ef028eecSStefano Zampini ierr = 
MPI_Gatherv(send_buffer,mysize,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr); 450053cdbc3dSStefano Zampini ierr = MPI_Gatherv(&coarse_submat_vals[0],mysize2,MPIU_SCALAR,&temp_coarse_mat_vals[0],localsizes2,localdispl2,MPIU_SCALAR,master_proc,prec_comm);CHKERRQ(ierr); 45010c7d97c5SJed Brown } else { 4502ef028eecSStefano Zampini ierr = MPI_Allgatherv(send_buffer,mysize,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,prec_comm);CHKERRQ(ierr); 450353cdbc3dSStefano Zampini ierr = MPI_Allgatherv(&coarse_submat_vals[0],mysize2,MPIU_SCALAR,&temp_coarse_mat_vals[0],localsizes2,localdispl2,MPIU_SCALAR,prec_comm);CHKERRQ(ierr); 45040c7d97c5SJed Brown } 4505ef028eecSStefano Zampini ierr = PetscFree(send_buffer);CHKERRQ(ierr); 45060c7d97c5SJed Brown break; 4507da1bb401SStefano Zampini }/* switch on coarse problem and communications associated with finished */ 45080c7d97c5SJed Brown } 45090c7d97c5SJed Brown 45100c7d97c5SJed Brown /* Now create and fill up coarse matrix */ 45110c7d97c5SJed Brown if (rank_prec_comm == active_rank) { 4512142dfd88SStefano Zampini 4513142dfd88SStefano Zampini Mat matis_coarse_local_mat; 4514142dfd88SStefano Zampini 45150c7d97c5SJed Brown if (pcbddc->coarse_problem_type != MULTILEVEL_BDDC) { 45160c7d97c5SJed Brown ierr = MatCreate(coarse_comm,&pcbddc->coarse_mat);CHKERRQ(ierr); 45170c7d97c5SJed Brown ierr = MatSetSizes(pcbddc->coarse_mat,PETSC_DECIDE,PETSC_DECIDE,pcbddc->coarse_size,pcbddc->coarse_size);CHKERRQ(ierr); 45180c7d97c5SJed Brown ierr = MatSetType(pcbddc->coarse_mat,coarse_mat_type);CHKERRQ(ierr); 45193b03a366Sstefano_zampini ierr = MatSetUp(pcbddc->coarse_mat);CHKERRQ(ierr); 4520da1bb401SStefano Zampini ierr = MatSetOption(pcbddc->coarse_mat,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr); /* local values stored in column major */ 
45213b03a366Sstefano_zampini ierr = MatSetOption(pcbddc->coarse_mat,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr); 45220c7d97c5SJed Brown } else { 45234fad6a16SStefano Zampini ierr = MatCreateIS(coarse_comm,1,PETSC_DECIDE,PETSC_DECIDE,pcbddc->coarse_size,pcbddc->coarse_size,coarse_ISLG,&pcbddc->coarse_mat);CHKERRQ(ierr); 45243b03a366Sstefano_zampini ierr = MatSetUp(pcbddc->coarse_mat);CHKERRQ(ierr); 45250c7d97c5SJed Brown ierr = MatISGetLocalMat(pcbddc->coarse_mat,&matis_coarse_local_mat);CHKERRQ(ierr); 45263b03a366Sstefano_zampini ierr = MatSetUp(matis_coarse_local_mat);CHKERRQ(ierr); 4527da1bb401SStefano Zampini ierr = MatSetOption(matis_coarse_local_mat,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr); /* local values stored in column major */ 4528a0ba757dSStefano Zampini ierr = MatSetOption(matis_coarse_local_mat,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr); 45290c7d97c5SJed Brown } 4530142dfd88SStefano Zampini /* preallocation */ 4531142dfd88SStefano Zampini if (pcbddc->coarse_problem_type != MULTILEVEL_BDDC) { 4532ef028eecSStefano Zampini 4533142dfd88SStefano Zampini PetscInt lrows,lcols; 4534ef028eecSStefano Zampini 4535142dfd88SStefano Zampini ierr = MatGetLocalSize(pcbddc->coarse_mat,&lrows,&lcols);CHKERRQ(ierr); 4536142dfd88SStefano Zampini ierr = MatPreallocateInitialize(coarse_comm,lrows,lcols,dnz,onz);CHKERRQ(ierr); 4537ef028eecSStefano Zampini 4538142dfd88SStefano Zampini if (pcbddc->coarse_problem_type == PARALLEL_BDDC) { 4539ef028eecSStefano Zampini 4540ef028eecSStefano Zampini Vec vec_dnz,vec_onz; 4541ef028eecSStefano Zampini PetscScalar *my_dnz,*my_onz,*array; 4542ef028eecSStefano Zampini PetscInt *mat_ranges,*row_ownership; 4543ef028eecSStefano Zampini PetscInt coarse_index_row,coarse_index_col,owner; 4544ef028eecSStefano Zampini 4545ef028eecSStefano Zampini ierr = VecCreate(prec_comm,&vec_dnz);CHKERRQ(ierr); 4546ef028eecSStefano Zampini ierr = VecSetSizes(vec_dnz,PETSC_DECIDE,pcbddc->coarse_size);CHKERRQ(ierr); 4547ef028eecSStefano Zampini 
ierr = VecSetType(vec_dnz,VECMPI);CHKERRQ(ierr); 4548ef028eecSStefano Zampini ierr = VecDuplicate(vec_dnz,&vec_onz);CHKERRQ(ierr); 4549ef028eecSStefano Zampini 4550ef028eecSStefano Zampini ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscScalar),&my_dnz);CHKERRQ(ierr); 4551ef028eecSStefano Zampini ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscScalar),&my_onz);CHKERRQ(ierr); 4552ef028eecSStefano Zampini ierr = PetscMemzero(my_dnz,pcbddc->local_primal_size*sizeof(PetscScalar));CHKERRQ(ierr); 4553ef028eecSStefano Zampini ierr = PetscMemzero(my_onz,pcbddc->local_primal_size*sizeof(PetscScalar));CHKERRQ(ierr); 4554ef028eecSStefano Zampini 4555ef028eecSStefano Zampini ierr = PetscMalloc(pcbddc->coarse_size*sizeof(PetscInt),&row_ownership);CHKERRQ(ierr); 4556ef028eecSStefano Zampini ierr = MatGetOwnershipRanges(pcbddc->coarse_mat,(const PetscInt**)&mat_ranges);CHKERRQ(ierr); 4557142dfd88SStefano Zampini for (i=0; i<size_prec_comm; i++) { 4558ef028eecSStefano Zampini for (j=mat_ranges[i]; j<mat_ranges[i+1]; j++) { 4559ef028eecSStefano Zampini row_ownership[j]=i; 4560142dfd88SStefano Zampini } 4561142dfd88SStefano Zampini } 4562ef028eecSStefano Zampini 4563ef028eecSStefano Zampini for (i=0; i<pcbddc->local_primal_size; i++) { 4564ef028eecSStefano Zampini coarse_index_row = pcbddc->local_primal_indices[i]; 4565ef028eecSStefano Zampini owner = row_ownership[coarse_index_row]; 4566ef028eecSStefano Zampini for (j=i; j<pcbddc->local_primal_size; j++) { 4567ef028eecSStefano Zampini owner = row_ownership[coarse_index_row]; 4568ef028eecSStefano Zampini coarse_index_col = pcbddc->local_primal_indices[j]; 4569ef028eecSStefano Zampini if (coarse_index_col > mat_ranges[owner]-1 && coarse_index_col < mat_ranges[owner+1]) { 4570ef028eecSStefano Zampini my_dnz[i] += 1.0; 4571142dfd88SStefano Zampini } else { 4572ef028eecSStefano Zampini my_onz[i] += 1.0; 4573142dfd88SStefano Zampini } 4574ef028eecSStefano Zampini if (i != j) { 4575ef028eecSStefano Zampini owner = 
row_ownership[coarse_index_col]; 4576ef028eecSStefano Zampini if (coarse_index_row > mat_ranges[owner]-1 && coarse_index_row < mat_ranges[owner+1]) { 4577ef028eecSStefano Zampini my_dnz[j] += 1.0; 4578142dfd88SStefano Zampini } else { 4579ef028eecSStefano Zampini my_onz[j] += 1.0; 4580142dfd88SStefano Zampini } 4581142dfd88SStefano Zampini } 4582142dfd88SStefano Zampini } 4583142dfd88SStefano Zampini } 4584ef028eecSStefano Zampini ierr = VecSet(vec_dnz,0.0);CHKERRQ(ierr); 4585ef028eecSStefano Zampini ierr = VecSet(vec_onz,0.0);CHKERRQ(ierr); 4586a929c220SStefano Zampini if (pcbddc->local_primal_size) { 4587ef028eecSStefano Zampini ierr = VecSetValues(vec_dnz,pcbddc->local_primal_size,pcbddc->local_primal_indices,my_dnz,ADD_VALUES);CHKERRQ(ierr); 4588ef028eecSStefano Zampini ierr = VecSetValues(vec_onz,pcbddc->local_primal_size,pcbddc->local_primal_indices,my_onz,ADD_VALUES);CHKERRQ(ierr); 4589a929c220SStefano Zampini } 4590ef028eecSStefano Zampini ierr = VecAssemblyBegin(vec_dnz);CHKERRQ(ierr); 4591ef028eecSStefano Zampini ierr = VecAssemblyBegin(vec_onz);CHKERRQ(ierr); 4592ef028eecSStefano Zampini ierr = VecAssemblyEnd(vec_dnz);CHKERRQ(ierr); 4593ef028eecSStefano Zampini ierr = VecAssemblyEnd(vec_onz);CHKERRQ(ierr); 4594ef028eecSStefano Zampini j = mat_ranges[rank_prec_comm+1]-mat_ranges[rank_prec_comm]; 4595ef028eecSStefano Zampini ierr = VecGetArray(vec_dnz,&array);CHKERRQ(ierr); 45962fa5cd67SKarl Rupp for (i=0; i<j; i++) dnz[i] = (PetscInt)array[i]; 45972fa5cd67SKarl Rupp 4598ef028eecSStefano Zampini ierr = VecRestoreArray(vec_dnz,&array);CHKERRQ(ierr); 4599ef028eecSStefano Zampini ierr = VecGetArray(vec_onz,&array);CHKERRQ(ierr); 46002fa5cd67SKarl Rupp for (i=0;i<j;i++) onz[i] = (PetscInt)array[i]; 46012fa5cd67SKarl Rupp 4602ef028eecSStefano Zampini ierr = VecRestoreArray(vec_onz,&array);CHKERRQ(ierr); 4603ef028eecSStefano Zampini ierr = PetscFree(my_dnz);CHKERRQ(ierr); 4604ef028eecSStefano Zampini ierr = PetscFree(my_onz);CHKERRQ(ierr); 4605ef028eecSStefano 
Zampini ierr = PetscFree(row_ownership);CHKERRQ(ierr); 4606ef028eecSStefano Zampini ierr = VecDestroy(&vec_dnz);CHKERRQ(ierr); 4607ef028eecSStefano Zampini ierr = VecDestroy(&vec_onz);CHKERRQ(ierr); 4608142dfd88SStefano Zampini } else { 4609142dfd88SStefano Zampini for (k=0;k<size_prec_comm;k++) { 4610142dfd88SStefano Zampini offset=pcbddc->local_primal_displacements[k]; 4611142dfd88SStefano Zampini offset2=localdispl2[k]; 4612142dfd88SStefano Zampini ins_local_primal_size = pcbddc->local_primal_sizes[k]; 4613ef028eecSStefano Zampini ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr); 4614ef028eecSStefano Zampini for (j=0;j<ins_local_primal_size;j++) { 4615ef028eecSStefano Zampini ins_local_primal_indices[j]=(PetscInt)pcbddc->replicated_local_primal_indices[offset+j]; 4616ef028eecSStefano Zampini } 4617142dfd88SStefano Zampini for (j=0;j<ins_local_primal_size;j++) { 4618142dfd88SStefano Zampini ierr = MatPreallocateSet(ins_local_primal_indices[j],ins_local_primal_size,ins_local_primal_indices,dnz,onz);CHKERRQ(ierr); 4619142dfd88SStefano Zampini } 4620ef028eecSStefano Zampini ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr); 4621142dfd88SStefano Zampini } 4622142dfd88SStefano Zampini } 46232fa5cd67SKarl Rupp 4624142dfd88SStefano Zampini /* check */ 4625142dfd88SStefano Zampini for (i=0;i<lrows;i++) { 46262fa5cd67SKarl Rupp if (dnz[i]>lcols) dnz[i]=lcols; 46272fa5cd67SKarl Rupp if (onz[i]>pcbddc->coarse_size-lcols) onz[i]=pcbddc->coarse_size-lcols; 4628142dfd88SStefano Zampini } 4629142dfd88SStefano Zampini ierr = MatSeqAIJSetPreallocation(pcbddc->coarse_mat,PETSC_NULL,dnz);CHKERRQ(ierr); 4630142dfd88SStefano Zampini ierr = MatMPIAIJSetPreallocation(pcbddc->coarse_mat,PETSC_NULL,dnz,PETSC_NULL,onz);CHKERRQ(ierr); 4631142dfd88SStefano Zampini ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 4632142dfd88SStefano Zampini } else { 4633523858cfSStefano Zampini ierr = 
MatSeqAIJSetPreallocation(matis_coarse_local_mat,0,dnz);CHKERRQ(ierr); 4634523858cfSStefano Zampini ierr = PetscFree(dnz);CHKERRQ(ierr); 4635142dfd88SStefano Zampini } 46362fa5cd67SKarl Rupp 4637142dfd88SStefano Zampini /* insert values */ 4638523858cfSStefano Zampini if (pcbddc->coarse_problem_type == PARALLEL_BDDC) { 46390c7d97c5SJed Brown ierr = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,ADD_VALUES);CHKERRQ(ierr); 4640523858cfSStefano Zampini } else if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) { 4641523858cfSStefano Zampini if (pcbddc->coarsening_ratio == 1) { 4642523858cfSStefano Zampini ins_coarse_mat_vals = coarse_submat_vals; 4643523858cfSStefano Zampini ierr = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,INSERT_VALUES);CHKERRQ(ierr); 4644523858cfSStefano Zampini } else { 4645523858cfSStefano Zampini ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr); 4646523858cfSStefano Zampini for (k=0; k<pcbddc->replicated_primal_size; k++) { 4647523858cfSStefano Zampini offset = pcbddc->local_primal_displacements[k]; 4648523858cfSStefano Zampini offset2 = localdispl2[k]; 4649523858cfSStefano Zampini ins_local_primal_size = pcbddc->local_primal_displacements[k+1]-pcbddc->local_primal_displacements[k]; 4650ef028eecSStefano Zampini ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr); 4651ef028eecSStefano Zampini for (j=0; j<ins_local_primal_size; j++) { 4652ef028eecSStefano Zampini ins_local_primal_indices[j]=(PetscInt)pcbddc->replicated_local_primal_indices[offset+j]; 4653ef028eecSStefano Zampini } 4654523858cfSStefano Zampini ins_coarse_mat_vals = &temp_coarse_mat_vals[offset2]; 4655523858cfSStefano Zampini ierr = 
MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,ADD_VALUES);CHKERRQ(ierr); 4656ef028eecSStefano Zampini ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr); 4657523858cfSStefano Zampini } 4658523858cfSStefano Zampini } 4659523858cfSStefano Zampini ins_local_primal_indices = 0; 4660523858cfSStefano Zampini ins_coarse_mat_vals = 0; 4661ea7e1babSStefano Zampini } else { 4662ea7e1babSStefano Zampini for (k=0; k<size_prec_comm; k++) { 4663ea7e1babSStefano Zampini offset =pcbddc->local_primal_displacements[k]; 4664ea7e1babSStefano Zampini offset2 =localdispl2[k]; 4665ea7e1babSStefano Zampini ins_local_primal_size = pcbddc->local_primal_sizes[k]; 4666ef028eecSStefano Zampini ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr); 4667ef028eecSStefano Zampini for (j=0; j<ins_local_primal_size; j++) { 4668ef028eecSStefano Zampini ins_local_primal_indices[j]=(PetscInt)pcbddc->replicated_local_primal_indices[offset+j]; 4669ef028eecSStefano Zampini } 4670ea7e1babSStefano Zampini ins_coarse_mat_vals = &temp_coarse_mat_vals[offset2]; 4671ea7e1babSStefano Zampini ierr = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,ADD_VALUES);CHKERRQ(ierr); 4672ef028eecSStefano Zampini ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr); 4673ea7e1babSStefano Zampini } 4674ea7e1babSStefano Zampini ins_local_primal_indices = 0; 4675ea7e1babSStefano Zampini ins_coarse_mat_vals = 0; 4676ea7e1babSStefano Zampini } 46770c7d97c5SJed Brown ierr = MatAssemblyBegin(pcbddc->coarse_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 46780c7d97c5SJed Brown ierr = MatAssemblyEnd(pcbddc->coarse_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 4679142dfd88SStefano Zampini /* symmetry of coarse matrix */ 4680142dfd88SStefano Zampini if (issym) { 4681142dfd88SStefano Zampini ierr = 
MatSetOption(pcbddc->coarse_mat,MAT_SYMMETRIC,PETSC_TRUE);CHKERRQ(ierr); 4682142dfd88SStefano Zampini } 46830c7d97c5SJed Brown ierr = MatGetVecs(pcbddc->coarse_mat,&pcbddc->coarse_vec,&pcbddc->coarse_rhs);CHKERRQ(ierr); 46840bdf917eSStefano Zampini } 46850bdf917eSStefano Zampini 46860bdf917eSStefano Zampini /* create loc to glob scatters if needed */ 46870bdf917eSStefano Zampini if (pcbddc->coarse_communications_type == SCATTERS_BDDC) { 46880bdf917eSStefano Zampini IS local_IS,global_IS; 46890bdf917eSStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,pcbddc->local_primal_size,0,1,&local_IS);CHKERRQ(ierr); 46900bdf917eSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_indices,PETSC_COPY_VALUES,&global_IS);CHKERRQ(ierr); 46910bdf917eSStefano Zampini ierr = VecScatterCreate(pcbddc->vec1_P,local_IS,pcbddc->coarse_vec,global_IS,&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr); 46920bdf917eSStefano Zampini ierr = ISDestroy(&local_IS);CHKERRQ(ierr); 46930bdf917eSStefano Zampini ierr = ISDestroy(&global_IS);CHKERRQ(ierr); 46940bdf917eSStefano Zampini } 46950bdf917eSStefano Zampini 4696a929c220SStefano Zampini /* free memory no longer needed */ 4697a929c220SStefano Zampini if (coarse_ISLG) { ierr = ISLocalToGlobalMappingDestroy(&coarse_ISLG);CHKERRQ(ierr); } 4698a929c220SStefano Zampini if (ins_local_primal_indices) { ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr); } 4699a929c220SStefano Zampini if (ins_coarse_mat_vals) { ierr = PetscFree(ins_coarse_mat_vals);CHKERRQ(ierr); } 4700a929c220SStefano Zampini if (localsizes2) { ierr = PetscFree(localsizes2);CHKERRQ(ierr); } 4701a929c220SStefano Zampini if (localdispl2) { ierr = PetscFree(localdispl2);CHKERRQ(ierr); } 4702a929c220SStefano Zampini if (temp_coarse_mat_vals) { ierr = PetscFree(temp_coarse_mat_vals);CHKERRQ(ierr); } 4703a929c220SStefano Zampini 47040bdf917eSStefano Zampini /* Eval coarse null space */ 47050bdf917eSStefano Zampini if (pcbddc->NullSpace) { 
47060bdf917eSStefano Zampini const Vec *nsp_vecs; 47070bdf917eSStefano Zampini PetscInt nsp_size,coarse_nsp_size; 47080bdf917eSStefano Zampini PetscBool nsp_has_cnst; 47090bdf917eSStefano Zampini PetscReal test_null; 47100bdf917eSStefano Zampini Vec *coarse_nsp_vecs; 47110bdf917eSStefano Zampini 47120bdf917eSStefano Zampini coarse_nsp_size = 0; 47130bdf917eSStefano Zampini coarse_nsp_vecs = 0; 47140bdf917eSStefano Zampini ierr = MatNullSpaceGetVecs(pcbddc->NullSpace,&nsp_has_cnst,&nsp_size,&nsp_vecs);CHKERRQ(ierr); 47150bdf917eSStefano Zampini if (rank_prec_comm == active_rank) { 47160bdf917eSStefano Zampini ierr = PetscMalloc((nsp_size+1)*sizeof(Vec),&coarse_nsp_vecs);CHKERRQ(ierr); 47170bdf917eSStefano Zampini for (i=0; i<nsp_size+1; i++) { 47180bdf917eSStefano Zampini ierr = VecDuplicate(pcbddc->coarse_vec,&coarse_nsp_vecs[i]);CHKERRQ(ierr); 47190bdf917eSStefano Zampini } 47200bdf917eSStefano Zampini } 47210bdf917eSStefano Zampini if (nsp_has_cnst) { 47220bdf917eSStefano Zampini ierr = VecSet(pcis->vec1_N,1.0);CHKERRQ(ierr); 47230bdf917eSStefano Zampini ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr); 47240bdf917eSStefano Zampini ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->vec1_P,pcbddc->coarse_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 47250bdf917eSStefano Zampini ierr = PCBDDCScatterCoarseDataEnd(pc,pcbddc->vec1_P,pcbddc->coarse_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 47260bdf917eSStefano Zampini if (rank_prec_comm == active_rank) { 47270bdf917eSStefano Zampini ierr = MatMult(pcbddc->coarse_mat,pcbddc->coarse_vec,pcbddc->coarse_rhs);CHKERRQ(ierr); 47280bdf917eSStefano Zampini ierr = VecNorm(pcbddc->coarse_rhs,NORM_INFINITY,&test_null);CHKERRQ(ierr); 47290bdf917eSStefano Zampini if (test_null > 1.0e-12 && pcbddc->dbg_flag) { 47300bdf917eSStefano Zampini ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Constant coarse null space error % 1.14e\n",test_null);CHKERRQ(ierr); 47310bdf917eSStefano Zampini } 
47320bdf917eSStefano Zampini ierr = VecCopy(pcbddc->coarse_vec,coarse_nsp_vecs[coarse_nsp_size]);CHKERRQ(ierr); 47330bdf917eSStefano Zampini coarse_nsp_size++; 47340bdf917eSStefano Zampini } 47350bdf917eSStefano Zampini } 47360bdf917eSStefano Zampini for (i=0; i<nsp_size; i++) { 47370bdf917eSStefano Zampini ierr = VecScatterBegin(matis->ctx,nsp_vecs[i],pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 47380bdf917eSStefano Zampini ierr = VecScatterEnd (matis->ctx,nsp_vecs[i],pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 47390bdf917eSStefano Zampini ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr); 47400bdf917eSStefano Zampini ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->vec1_P,pcbddc->coarse_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 47410bdf917eSStefano Zampini ierr = PCBDDCScatterCoarseDataEnd(pc,pcbddc->vec1_P,pcbddc->coarse_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 47420bdf917eSStefano Zampini if (rank_prec_comm == active_rank) { 47430bdf917eSStefano Zampini ierr = MatMult(pcbddc->coarse_mat,pcbddc->coarse_vec,pcbddc->coarse_rhs);CHKERRQ(ierr); 47440bdf917eSStefano Zampini ierr = VecNorm(pcbddc->coarse_rhs,NORM_2,&test_null);CHKERRQ(ierr); 47450bdf917eSStefano Zampini if (test_null > 1.0e-12 && pcbddc->dbg_flag) { 47460bdf917eSStefano Zampini ierr = PetscViewerASCIIPrintf(pcbddc->dbg_viewer,"Vec %d coarse null space error % 1.14e\n",i,test_null);CHKERRQ(ierr); 47470bdf917eSStefano Zampini } 47480bdf917eSStefano Zampini ierr = VecCopy(pcbddc->coarse_vec,coarse_nsp_vecs[coarse_nsp_size]);CHKERRQ(ierr); 47490bdf917eSStefano Zampini coarse_nsp_size++; 47500bdf917eSStefano Zampini } 47510bdf917eSStefano Zampini } 47520bdf917eSStefano Zampini if (coarse_nsp_size > 0) { 47530bdf917eSStefano Zampini /* TODO orthonormalize vecs */ 47540bdf917eSStefano Zampini ierr = VecNormalize(coarse_nsp_vecs[0],PETSC_NULL);CHKERRQ(ierr); 47550bdf917eSStefano Zampini ierr = 
MatNullSpaceCreate(coarse_comm,PETSC_FALSE,coarse_nsp_size,coarse_nsp_vecs,&pcbddc->CoarseNullSpace);CHKERRQ(ierr); 47560bdf917eSStefano Zampini for (i=0; i<nsp_size+1; i++) { 47570bdf917eSStefano Zampini ierr = VecDestroy(&coarse_nsp_vecs[i]);CHKERRQ(ierr); 47580bdf917eSStefano Zampini } 47590bdf917eSStefano Zampini } 47600bdf917eSStefano Zampini ierr = PetscFree(coarse_nsp_vecs);CHKERRQ(ierr); 47610bdf917eSStefano Zampini } 47620bdf917eSStefano Zampini 47630bdf917eSStefano Zampini /* KSP for coarse problem */ 47640bdf917eSStefano Zampini if (rank_prec_comm == active_rank) { 47652e8d2280SStefano Zampini PetscBool isbddc=PETSC_FALSE; 47660bdf917eSStefano Zampini 476753cdbc3dSStefano Zampini ierr = KSPCreate(coarse_comm,&pcbddc->coarse_ksp);CHKERRQ(ierr); 476853cdbc3dSStefano Zampini ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->coarse_ksp,(PetscObject)pc,1);CHKERRQ(ierr); 476953cdbc3dSStefano Zampini ierr = KSPSetOperators(pcbddc->coarse_ksp,pcbddc->coarse_mat,pcbddc->coarse_mat,SAME_PRECONDITIONER);CHKERRQ(ierr); 47703b03a366Sstefano_zampini ierr = KSPSetTolerances(pcbddc->coarse_ksp,PETSC_DEFAULT,PETSC_DEFAULT,PETSC_DEFAULT,max_it_coarse_ksp);CHKERRQ(ierr); 477153cdbc3dSStefano Zampini ierr = KSPSetType(pcbddc->coarse_ksp,coarse_ksp_type);CHKERRQ(ierr); 477253cdbc3dSStefano Zampini ierr = KSPGetPC(pcbddc->coarse_ksp,&pc_temp);CHKERRQ(ierr); 477353cdbc3dSStefano Zampini ierr = PCSetType(pc_temp,coarse_pc_type);CHKERRQ(ierr); 47740c7d97c5SJed Brown /* Allow user's customization */ 4775da1bb401SStefano Zampini ierr = KSPSetOptionsPrefix(pcbddc->coarse_ksp,"coarse_");CHKERRQ(ierr); 47760c7d97c5SJed Brown /* Set Up PC for coarse problem BDDC */ 477753cdbc3dSStefano Zampini if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) { 47784fad6a16SStefano Zampini i = pcbddc->current_level+1; 47794fad6a16SStefano Zampini ierr = PCBDDCSetLevel(pc_temp,i);CHKERRQ(ierr); 47804fad6a16SStefano Zampini ierr = 
PCBDDCSetCoarseningRatio(pc_temp,pcbddc->coarsening_ratio);CHKERRQ(ierr); 47814fad6a16SStefano Zampini ierr = PCBDDCSetMaxLevels(pc_temp,pcbddc->max_levels);CHKERRQ(ierr); 478253cdbc3dSStefano Zampini ierr = PCBDDCSetCoarseProblemType(pc_temp,MULTILEVEL_BDDC);CHKERRQ(ierr); 47830bdf917eSStefano Zampini if (pcbddc->CoarseNullSpace) { ierr = PCBDDCSetNullSpace(pc_temp,pcbddc->CoarseNullSpace);CHKERRQ(ierr); } 47844fad6a16SStefano Zampini if (dbg_flag) { 47854fad6a16SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"----------------Level %d: Setting up level %d---------------\n",pcbddc->current_level,i);CHKERRQ(ierr); 47864fad6a16SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 478753cdbc3dSStefano Zampini } 47884fad6a16SStefano Zampini } 47894fad6a16SStefano Zampini ierr = KSPSetFromOptions(pcbddc->coarse_ksp);CHKERRQ(ierr); 479053cdbc3dSStefano Zampini ierr = KSPSetUp(pcbddc->coarse_ksp);CHKERRQ(ierr); 4791142dfd88SStefano Zampini 47922e8d2280SStefano Zampini ierr = KSPGetTolerances(pcbddc->coarse_ksp,PETSC_NULL,PETSC_NULL,PETSC_NULL,&j);CHKERRQ(ierr); 47932e8d2280SStefano Zampini ierr = KSPGetPC(pcbddc->coarse_ksp,&pc_temp);CHKERRQ(ierr); 47942e8d2280SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)pc_temp,PCBDDC,&isbddc);CHKERRQ(ierr); 47952e8d2280SStefano Zampini if (j == 1) { 47962e8d2280SStefano Zampini ierr = KSPSetNormType(pcbddc->coarse_ksp,KSP_NORM_NONE);CHKERRQ(ierr); 47972e8d2280SStefano Zampini if (isbddc) { 47982e8d2280SStefano Zampini ierr = PCBDDCSetUseExactDirichlet(pc_temp,PETSC_FALSE);CHKERRQ(ierr); 47995619798eSStefano Zampini } 48005619798eSStefano Zampini } 48010c7d97c5SJed Brown } 4802a929c220SStefano Zampini /* Check coarse problem if requested */ 4803142dfd88SStefano Zampini if (dbg_flag && rank_prec_comm == active_rank) { 4804142dfd88SStefano Zampini KSP check_ksp; 4805142dfd88SStefano Zampini PC check_pc; 4806142dfd88SStefano Zampini Vec check_vec; 4807142dfd88SStefano Zampini PetscReal 
abs_infty_error,infty_error,lambda_min,lambda_max; 480819fd82e9SBarry Smith KSPType check_ksp_type; 48090c7d97c5SJed Brown 4810142dfd88SStefano Zampini /* Create ksp object suitable for extreme eigenvalues' estimation */ 4811142dfd88SStefano Zampini ierr = KSPCreate(coarse_comm,&check_ksp);CHKERRQ(ierr); 4812142dfd88SStefano Zampini ierr = KSPSetOperators(check_ksp,pcbddc->coarse_mat,pcbddc->coarse_mat,SAME_PRECONDITIONER);CHKERRQ(ierr); 48130bdf917eSStefano Zampini ierr = KSPSetTolerances(check_ksp,1.e-12,1.e-12,PETSC_DEFAULT,pcbddc->coarse_size);CHKERRQ(ierr); 4814142dfd88SStefano Zampini if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) { 48152fa5cd67SKarl Rupp if (issym) check_ksp_type = KSPCG; 48162fa5cd67SKarl Rupp else check_ksp_type = KSPGMRES; 4817142dfd88SStefano Zampini ierr = KSPSetComputeSingularValues(check_ksp,PETSC_TRUE);CHKERRQ(ierr); 4818142dfd88SStefano Zampini } else { 4819142dfd88SStefano Zampini check_ksp_type = KSPPREONLY; 4820142dfd88SStefano Zampini } 4821142dfd88SStefano Zampini ierr = KSPSetType(check_ksp,check_ksp_type);CHKERRQ(ierr); 4822142dfd88SStefano Zampini ierr = KSPGetPC(pcbddc->coarse_ksp,&check_pc);CHKERRQ(ierr); 4823142dfd88SStefano Zampini ierr = KSPSetPC(check_ksp,check_pc);CHKERRQ(ierr); 4824142dfd88SStefano Zampini ierr = KSPSetUp(check_ksp);CHKERRQ(ierr); 4825142dfd88SStefano Zampini /* create random vec */ 4826142dfd88SStefano Zampini ierr = VecDuplicate(pcbddc->coarse_vec,&check_vec);CHKERRQ(ierr); 4827142dfd88SStefano Zampini ierr = VecSetRandom(check_vec,PETSC_NULL);CHKERRQ(ierr); 48280bdf917eSStefano Zampini if (pcbddc->CoarseNullSpace) { ierr = MatNullSpaceRemove(pcbddc->CoarseNullSpace,check_vec,PETSC_NULL);CHKERRQ(ierr); } 4829142dfd88SStefano Zampini ierr = MatMult(pcbddc->coarse_mat,check_vec,pcbddc->coarse_rhs);CHKERRQ(ierr); 4830142dfd88SStefano Zampini /* solve coarse problem */ 4831142dfd88SStefano Zampini ierr = KSPSolve(check_ksp,pcbddc->coarse_rhs,pcbddc->coarse_vec);CHKERRQ(ierr); 48320bdf917eSStefano 
Zampini if (pcbddc->CoarseNullSpace) { ierr = MatNullSpaceRemove(pcbddc->CoarseNullSpace,pcbddc->coarse_vec,PETSC_NULL);CHKERRQ(ierr); } 4833142dfd88SStefano Zampini /* check coarse problem residual error */ 4834142dfd88SStefano Zampini ierr = VecAXPY(check_vec,-1.0,pcbddc->coarse_vec);CHKERRQ(ierr); 4835142dfd88SStefano Zampini ierr = VecNorm(check_vec,NORM_INFINITY,&infty_error);CHKERRQ(ierr); 4836142dfd88SStefano Zampini ierr = MatMult(pcbddc->coarse_mat,check_vec,pcbddc->coarse_rhs);CHKERRQ(ierr); 4837142dfd88SStefano Zampini ierr = VecNorm(pcbddc->coarse_rhs,NORM_INFINITY,&abs_infty_error);CHKERRQ(ierr); 4838142dfd88SStefano Zampini ierr = VecDestroy(&check_vec);CHKERRQ(ierr); 4839142dfd88SStefano Zampini /* get eigenvalue estimation if inexact */ 4840142dfd88SStefano Zampini if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) { 4841142dfd88SStefano Zampini ierr = KSPComputeExtremeSingularValues(check_ksp,&lambda_max,&lambda_min);CHKERRQ(ierr); 4842142dfd88SStefano Zampini ierr = KSPGetIterationNumber(check_ksp,&k);CHKERRQ(ierr); 4843142dfd88SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem eigenvalues estimated with %d iterations of %s.\n",k,check_ksp_type);CHKERRQ(ierr); 4844e269702eSStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem eigenvalues: % 1.14e %1.14e\n",lambda_min,lambda_max);CHKERRQ(ierr); 48453b03a366Sstefano_zampini } 4846142dfd88SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem exact infty_error : %1.14e\n",infty_error);CHKERRQ(ierr); 4847142dfd88SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem residual infty_error: %1.14e\n",abs_infty_error);CHKERRQ(ierr); 4848142dfd88SStefano Zampini ierr = KSPDestroy(&check_ksp);CHKERRQ(ierr); 484953cdbc3dSStefano Zampini } 4850142dfd88SStefano Zampini if (dbg_flag) { ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); } 48510c7d97c5SJed Brown PetscFunctionReturn(0); 48520c7d97c5SJed Brown } 48530c7d97c5SJed Brown 48540c7d97c5SJed 
Brown #undef __FUNCT__ 48550c7d97c5SJed Brown #define __FUNCT__ "PCBDDCManageLocalBoundaries" 485653cdbc3dSStefano Zampini static PetscErrorCode PCBDDCManageLocalBoundaries(PC pc) 48570c7d97c5SJed Brown { 48580c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 48590c7d97c5SJed Brown PC_IS *pcis = (PC_IS*)pc->data; 48600c7d97c5SJed Brown Mat_IS *matis = (Mat_IS*)pc->pmat->data; 4861da1bb401SStefano Zampini PCBDDCGraph mat_graph=pcbddc->mat_graph; 48627cf533a6SStefano Zampini PetscInt *is_indices,*auxis; 48633b03a366Sstefano_zampini PetscInt bs,ierr,i,j,s,k,iindex,neumann_bsize,dirichlet_bsize; 4864da1bb401SStefano Zampini PetscInt total_counts,nodes_touched,where_values=1,vertex_size; 4865534831adSStefano Zampini PetscMPIInt adapt_interface=0,adapt_interface_reduced=0,NEUMANNCNT=0; 4866da1bb401SStefano Zampini PetscBool same_set; 4867a0ba757dSStefano Zampini MPI_Comm interface_comm=((PetscObject)pc)->comm; 48683b03a366Sstefano_zampini PetscBool use_faces =PETSC_FALSE,use_edges=PETSC_FALSE; 48693b03a366Sstefano_zampini const PetscInt *neumann_nodes; 48703b03a366Sstefano_zampini const PetscInt *dirichlet_nodes; 4871a81d60d8SStefano Zampini IS used_IS,*custom_ISForDofs; 4872da1bb401SStefano Zampini PetscScalar *array; 4873da1bb401SStefano Zampini PetscScalar *array2; 4874da1bb401SStefano Zampini PetscViewer viewer=pcbddc->dbg_viewer; 4875a929c220SStefano Zampini PetscInt *queue_in_global_numbering; 48760c7d97c5SJed Brown 48770c7d97c5SJed Brown PetscFunctionBegin; 4878da1bb401SStefano Zampini /* Setup local adjacency graph */ 4879da1bb401SStefano Zampini mat_graph->nvtxs=pcis->n; 48802fa5cd67SKarl Rupp if (!mat_graph->xadj) NEUMANNCNT = 1; 4881da1bb401SStefano Zampini ierr = PCBDDCSetupLocalAdjacencyGraph(pc);CHKERRQ(ierr); 48822fa5cd67SKarl Rupp 4883a0ba757dSStefano Zampini i = mat_graph->nvtxs; 4884a0ba757dSStefano Zampini ierr = 
PetscMalloc4(i,PetscInt,&mat_graph->where,i,PetscInt,&mat_graph->count,i+1,PetscInt,&mat_graph->cptr,i,PetscInt,&mat_graph->queue);CHKERRQ(ierr); 48853972b0daSStefano Zampini ierr = PetscMalloc2(i,PetscInt,&mat_graph->which_dof,i,PetscBool,&mat_graph->touched);CHKERRQ(ierr); 4886a0ba757dSStefano Zampini ierr = PetscMemzero(mat_graph->where,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr); 4887a0ba757dSStefano Zampini ierr = PetscMemzero(mat_graph->count,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr); 4888a0ba757dSStefano Zampini ierr = PetscMemzero(mat_graph->which_dof,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr); 4889a0ba757dSStefano Zampini ierr = PetscMemzero(mat_graph->queue,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr); 48903828260eSStefano Zampini ierr = PetscMemzero(mat_graph->cptr,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr); 4891a0ba757dSStefano Zampini 4892a81d60d8SStefano Zampini /* Setting dofs splitting in mat_graph->which_dof 4893a81d60d8SStefano Zampini Get information about dofs' splitting if provided by the user 4894a81d60d8SStefano Zampini Otherwise it assumes a constant block size */ 4895a81d60d8SStefano Zampini vertex_size=0; 4896a81d60d8SStefano Zampini if (!pcbddc->n_ISForDofs) { 4897a81d60d8SStefano Zampini ierr = MatGetBlockSize(matis->A,&bs);CHKERRQ(ierr); 4898a81d60d8SStefano Zampini ierr = PetscMalloc(bs*sizeof(IS),&custom_ISForDofs);CHKERRQ(ierr); 4899a81d60d8SStefano Zampini for (i=0; i<bs; i++) { 4900a81d60d8SStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,pcis->n/bs,i,bs,&custom_ISForDofs[i]);CHKERRQ(ierr); 4901a81d60d8SStefano Zampini } 4902a81d60d8SStefano Zampini ierr = PCBDDCSetDofsSplitting(pc,bs,custom_ISForDofs);CHKERRQ(ierr); 4903a81d60d8SStefano Zampini vertex_size=1; 4904a81d60d8SStefano Zampini /* remove my references to IS objects */ 4905a81d60d8SStefano Zampini for (i=0; i<bs; i++) { 4906a81d60d8SStefano Zampini ierr = ISDestroy(&custom_ISForDofs[i]);CHKERRQ(ierr); 4907a81d60d8SStefano Zampini } 
4908a81d60d8SStefano Zampini ierr = PetscFree(custom_ISForDofs);CHKERRQ(ierr); 4909a81d60d8SStefano Zampini } 49109c0446d6SStefano Zampini for (i=0; i<pcbddc->n_ISForDofs; i++) { 4911a81d60d8SStefano Zampini ierr = ISGetSize(pcbddc->ISForDofs[i],&k);CHKERRQ(ierr); 49129c0446d6SStefano Zampini ierr = ISGetIndices(pcbddc->ISForDofs[i],(const PetscInt**)&is_indices);CHKERRQ(ierr); 49132fa5cd67SKarl Rupp for (j=0; j<k; j++) mat_graph->which_dof[is_indices[j]]=i; 49149c0446d6SStefano Zampini ierr = ISRestoreIndices(pcbddc->ISForDofs[i],(const PetscInt**)&is_indices);CHKERRQ(ierr); 49159c0446d6SStefano Zampini } 4916a81d60d8SStefano Zampini /* use mat block size as vertex size if it has not yet set */ 4917a81d60d8SStefano Zampini if (!vertex_size) { 49183b03a366Sstefano_zampini ierr = MatGetBlockSize(matis->A,&vertex_size);CHKERRQ(ierr); 49190c7d97c5SJed Brown } 4920a81d60d8SStefano Zampini 49213b03a366Sstefano_zampini /* count number of neigh per node */ 49220c7d97c5SJed Brown total_counts=0; 49233b03a366Sstefano_zampini for (i=1; i<pcis->n_neigh; i++) { 49240c7d97c5SJed Brown s = pcis->n_shared[i]; 49250c7d97c5SJed Brown total_counts += s; 49262fa5cd67SKarl Rupp for (j=0;j<s;j++) mat_graph->count[pcis->shared[i][j]] += 1; 49270c7d97c5SJed Brown } 49282fa5cd67SKarl Rupp 4929534831adSStefano Zampini /* Take into account Neumann data -> it increments number of sharing subdomains for nodes lying on the interface */ 493036e030ebSStefano Zampini ierr = PCBDDCGetNeumannBoundaries(pc,&used_IS);CHKERRQ(ierr); 4931da1bb401SStefano Zampini ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr); 4932da1bb401SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 493336e030ebSStefano Zampini if (used_IS) { 493436e030ebSStefano Zampini ierr = ISGetSize(used_IS,&neumann_bsize);CHKERRQ(ierr); 493536e030ebSStefano Zampini ierr = ISGetIndices(used_IS,&neumann_nodes);CHKERRQ(ierr); 493653cdbc3dSStefano Zampini for (i=0; i<neumann_bsize; i++) { 493753cdbc3dSStefano Zampini iindex = 
neumann_nodes[i]; 4938534831adSStefano Zampini if (mat_graph->count[iindex] > NEUMANNCNT && array[iindex]==0.0) { 493953cdbc3dSStefano Zampini mat_graph->count[iindex]+=1; 49400c7d97c5SJed Brown total_counts++; 4941da1bb401SStefano Zampini array[iindex]=array[iindex]+1.0; 4942f23aa3ddSBarry Smith } else if (array[iindex]>0.0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"Error for neumann nodes provided to BDDC! They must be uniquely listed! Found duplicate node %d\n",iindex); 49430c7d97c5SJed Brown } 49440c7d97c5SJed Brown } 4945da1bb401SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 4946da1bb401SStefano Zampini /* allocate space for storing the set of neighbours for each node */ 4947da1bb401SStefano Zampini ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt*),&mat_graph->neighbours_set);CHKERRQ(ierr); 4948da1bb401SStefano Zampini if (mat_graph->nvtxs) { ierr = PetscMalloc(total_counts*sizeof(PetscInt),&mat_graph->neighbours_set[0]);CHKERRQ(ierr); } 4949da1bb401SStefano Zampini for (i=1; i<mat_graph->nvtxs; i++) mat_graph->neighbours_set[i]=mat_graph->neighbours_set[i-1]+mat_graph->count[i-1]; 4950a0ba757dSStefano Zampini ierr = PetscMemzero(mat_graph->count,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr); 49513b03a366Sstefano_zampini for (i=1; i<pcis->n_neigh; i++) { 49520c7d97c5SJed Brown s=pcis->n_shared[i]; 49530c7d97c5SJed Brown for (j=0; j<s; j++) { 49540c7d97c5SJed Brown k=pcis->shared[i][j]; 49552fa5cd67SKarl Rupp 4956da1bb401SStefano Zampini mat_graph->neighbours_set[k][mat_graph->count[k]] = pcis->neigh[i]; 49572fa5cd67SKarl Rupp 49580c7d97c5SJed Brown mat_graph->count[k]+=1; 49590c7d97c5SJed Brown } 49600c7d97c5SJed Brown } 4961da1bb401SStefano Zampini /* Check consistency of Neumann nodes */ 4962da1bb401SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 4963da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 4964da1bb401SStefano 
Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 4965da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 4966da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 4967da1bb401SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 49683b03a366Sstefano_zampini /* set -1 fake neighbour to mimic Neumann boundary */ 496936e030ebSStefano Zampini if (used_IS) { 497053cdbc3dSStefano Zampini for (i=0; i<neumann_bsize; i++) { 497153cdbc3dSStefano Zampini iindex = neumann_nodes[i]; 4972534831adSStefano Zampini if (mat_graph->count[iindex] > NEUMANNCNT) { 49732fa5cd67SKarl Rupp if (mat_graph->count[iindex]+1 != (PetscInt)array[iindex]) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_USER,"Neumann nodes provided to BDDC must be consistent among neighbours!\nNode %d: number of sharing subdomains %d != number of subdomains for which it is a neumann node %d\n",iindex,mat_graph->count[iindex]+1,(PetscInt)array[iindex]); 4974da1bb401SStefano Zampini mat_graph->neighbours_set[iindex][mat_graph->count[iindex]] = -1; 49752fa5cd67SKarl Rupp 497653cdbc3dSStefano Zampini mat_graph->count[iindex]+=1; 49770c7d97c5SJed Brown } 49780c7d97c5SJed Brown } 497936e030ebSStefano Zampini ierr = ISRestoreIndices(used_IS,&neumann_nodes);CHKERRQ(ierr); 49800c7d97c5SJed Brown } 4981da1bb401SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 4982da1bb401SStefano Zampini /* sort set of sharing subdomains */ 49832fa5cd67SKarl Rupp for (i=0;i<mat_graph->nvtxs;i++) { 49842fa5cd67SKarl Rupp ierr = PetscSortInt(mat_graph->count[i],mat_graph->neighbours_set[i]);CHKERRQ(ierr); 49852fa5cd67SKarl Rupp } 49862fa5cd67SKarl Rupp 49873b03a366Sstefano_zampini /* remove interior nodes and dirichlet boundary nodes from the next search into the graph */ 
49882fa5cd67SKarl Rupp for (i=0;i<mat_graph->nvtxs;i++) mat_graph->touched[i]=PETSC_FALSE; 4989da1bb401SStefano Zampini nodes_touched=0; 49902fa5cd67SKarl Rupp 499136e030ebSStefano Zampini ierr = PCBDDCGetDirichletBoundaries(pc,&used_IS);CHKERRQ(ierr); 4992da1bb401SStefano Zampini ierr = VecSet(pcis->vec2_N,0.0);CHKERRQ(ierr); 4993da1bb401SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 4994da1bb401SStefano Zampini ierr = VecGetArray(pcis->vec2_N,&array2);CHKERRQ(ierr); 4995da1bb401SStefano Zampini if (used_IS) { 4996da1bb401SStefano Zampini ierr = ISGetSize(used_IS,&dirichlet_bsize);CHKERRQ(ierr); 4997f23aa3ddSBarry Smith if (dirichlet_bsize && matis->pure_neumann) SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"Dirichlet boundaries are intended to be used with matrices with zeroed rows!\n"); 4998da1bb401SStefano Zampini ierr = ISGetIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr); 4999da1bb401SStefano Zampini for (i=0; i<dirichlet_bsize; i++) { 5000da1bb401SStefano Zampini iindex = dirichlet_nodes[i]; 5001da1bb401SStefano Zampini if (mat_graph->count[iindex] && !mat_graph->touched[iindex]) { 5002f23aa3ddSBarry Smith if (array[iindex]>0.0) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"BDDC cannot have nodes which are marked as Neumann and Dirichlet at the same time! 
Wrong node %d\n",iindex); 5003da1bb401SStefano Zampini mat_graph->touched[iindex] = PETSC_TRUE; 5004da1bb401SStefano Zampini mat_graph->where[iindex] = 0; 5005da1bb401SStefano Zampini nodes_touched++; 5006da1bb401SStefano Zampini array2[iindex] = array2[iindex]+1.0; 5007da1bb401SStefano Zampini } 5008da1bb401SStefano Zampini } 5009da1bb401SStefano Zampini ierr = ISRestoreIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr); 5010da1bb401SStefano Zampini } 5011da1bb401SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 5012da1bb401SStefano Zampini ierr = VecRestoreArray(pcis->vec2_N,&array2);CHKERRQ(ierr); 50132fa5cd67SKarl Rupp 5014da1bb401SStefano Zampini /* Check consistency of Dirichlet nodes */ 5015da1bb401SStefano Zampini ierr = VecSet(pcis->vec1_N,1.0);CHKERRQ(ierr); 5016da1bb401SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 5017da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 5018da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 5019da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 5020da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 5021da1bb401SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 5022da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec2_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 5023da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec2_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 5024da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 5025da1bb401SStefano Zampini ierr = VecScatterEnd 
(matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 5026da1bb401SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 5027da1bb401SStefano Zampini ierr = VecGetArray(pcis->vec2_N,&array2);CHKERRQ(ierr); 502836e030ebSStefano Zampini if (used_IS) { 502936e030ebSStefano Zampini ierr = ISGetSize(used_IS,&dirichlet_bsize);CHKERRQ(ierr); 503036e030ebSStefano Zampini ierr = ISGetIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr); 50313b03a366Sstefano_zampini for (i=0; i<dirichlet_bsize; i++) { 5032da1bb401SStefano Zampini iindex=dirichlet_nodes[i]; 50332fa5cd67SKarl Rupp if (array[iindex]>1.0 && array[iindex]!=array2[iindex]) SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_USER,"Dirichlet nodes provided to BDDC must be consistent among neighbours!\nNode %d: number of sharing subdomains %d != number of subdomains for which it is a neumann node %d\n",iindex,(PetscInt)array[iindex],(PetscInt)array2[iindex]); 50343b03a366Sstefano_zampini } 503536e030ebSStefano Zampini ierr = ISRestoreIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr); 50363b03a366Sstefano_zampini } 5037da1bb401SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 5038da1bb401SStefano Zampini ierr = VecRestoreArray(pcis->vec2_N,&array2);CHKERRQ(ierr); 5039da1bb401SStefano Zampini 50400c7d97c5SJed Brown for (i=0; i<mat_graph->nvtxs; i++) { 50413b03a366Sstefano_zampini if (!mat_graph->count[i]) { /* interior nodes */ 50420c7d97c5SJed Brown mat_graph->touched[i] = PETSC_TRUE; 50430c7d97c5SJed Brown mat_graph->where[i] = 0; 50440c7d97c5SJed Brown nodes_touched++; 50450c7d97c5SJed Brown } 50460c7d97c5SJed Brown } 50470c7d97c5SJed Brown mat_graph->ncmps = 0; 50482fa5cd67SKarl Rupp 5049da1bb401SStefano Zampini i=0; 50500c7d97c5SJed Brown while (nodes_touched<mat_graph->nvtxs) { 5051a0ba757dSStefano Zampini /* find first untouched node in local ordering */ 50520c7d97c5SJed Brown while (mat_graph->touched[i]) i++; 50530c7d97c5SJed Brown 
mat_graph->touched[i]=PETSC_TRUE; 5054a0ba757dSStefano Zampini mat_graph->where[i] =where_values; 50550c7d97c5SJed Brown nodes_touched++; 5056a0ba757dSStefano Zampini /* now find all other nodes having the same set of sharing subdomains */ 50570c7d97c5SJed Brown for (j=i+1; j<mat_graph->nvtxs; j++) { 5058a0ba757dSStefano Zampini /* check for same number of sharing subdomains and dof number */ 5059da1bb401SStefano Zampini if (!mat_graph->touched[j] && mat_graph->count[i]==mat_graph->count[j] && mat_graph->which_dof[i] == mat_graph->which_dof[j]) { 5060a0ba757dSStefano Zampini /* check for same set of sharing subdomains */ 50610c7d97c5SJed Brown same_set=PETSC_TRUE; 50620c7d97c5SJed Brown for (k=0; k<mat_graph->count[j]; k++) { 5063da1bb401SStefano Zampini if (mat_graph->neighbours_set[i][k] != mat_graph->neighbours_set[j][k]) { 50640c7d97c5SJed Brown same_set=PETSC_FALSE; 50650c7d97c5SJed Brown } 50660c7d97c5SJed Brown } 5067a0ba757dSStefano Zampini /* I found a friend of mine */ 50680c7d97c5SJed Brown if (same_set) { 5069a0ba757dSStefano Zampini mat_graph->where[j] = where_values; 50700c7d97c5SJed Brown mat_graph->touched[j] = PETSC_TRUE; 50710c7d97c5SJed Brown nodes_touched++; 50720c7d97c5SJed Brown } 50730c7d97c5SJed Brown } 50740c7d97c5SJed Brown } 5075a0ba757dSStefano Zampini where_values++; 50760c7d97c5SJed Brown } 5077a0ba757dSStefano Zampini where_values--; if (where_values<0) where_values=0; 5078a0ba757dSStefano Zampini ierr = PetscMalloc(where_values*sizeof(PetscMPIInt),&mat_graph->where_ncmps);CHKERRQ(ierr); 5079a0ba757dSStefano Zampini /* Find connected components defined on the shared interface */ 5080a0ba757dSStefano Zampini if (where_values) { 50812fa5cd67SKarl Rupp ierr = PCBDDCFindConnectedComponents(mat_graph, where_values);CHKERRQ(ierr); 5082a0ba757dSStefano Zampini } 5083a929c220SStefano Zampini ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt),&queue_in_global_numbering);CHKERRQ(ierr); 5084a0ba757dSStefano Zampini /* check consistency of 
connected components among neighbouring subdomains -> it adapt them in case it is needed */ 5085a0ba757dSStefano Zampini for (i=0;i<where_values;i++) { 50867cf533a6SStefano Zampini /* We are not sure that on a given subset of the local interface, 50877cf533a6SStefano Zampini two connected components will be the same among sharing subdomains */ 50883b03a366Sstefano_zampini if (mat_graph->where_ncmps[i]>1) { 5089a0ba757dSStefano Zampini adapt_interface=1; 5090a0ba757dSStefano Zampini break; 5091a0ba757dSStefano Zampini } 5092a0ba757dSStefano Zampini } 50932fa5cd67SKarl Rupp 5094a0ba757dSStefano Zampini ierr = MPI_Allreduce(&adapt_interface,&adapt_interface_reduced,1,MPIU_INT,MPI_LOR,interface_comm);CHKERRQ(ierr); 5095da1bb401SStefano Zampini if (pcbddc->dbg_flag && adapt_interface_reduced) { 5096d8923723SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Adapting interface\n");CHKERRQ(ierr); 5097da1bb401SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 5098da1bb401SStefano Zampini } 5099a0ba757dSStefano Zampini if (where_values && adapt_interface_reduced) { 5100a0ba757dSStefano Zampini PetscInt sum_requests=0,my_rank; 5101a0ba757dSStefano Zampini PetscInt buffer_size,start_of_recv,size_of_recv,start_of_send; 5102a0ba757dSStefano Zampini PetscInt temp_buffer_size,ins_val,global_where_counter; 5103a0ba757dSStefano Zampini PetscInt *cum_recv_counts; 5104a0ba757dSStefano Zampini PetscInt *where_to_nodes_indices; 5105a0ba757dSStefano Zampini PetscInt *petsc_buffer; 5106a0ba757dSStefano Zampini PetscMPIInt *recv_buffer; 5107a0ba757dSStefano Zampini PetscMPIInt *recv_buffer_where; 5108a0ba757dSStefano Zampini PetscMPIInt *send_buffer; 5109a0ba757dSStefano Zampini PetscMPIInt size_of_send; 5110a0ba757dSStefano Zampini PetscInt *sizes_of_sends; 5111a0ba757dSStefano Zampini MPI_Request *send_requests; 5112a0ba757dSStefano Zampini MPI_Request *recv_requests; 5113a0ba757dSStefano Zampini PetscInt *where_cc_adapt; 5114a0ba757dSStefano Zampini PetscInt 
**temp_buffer; 5115a0ba757dSStefano Zampini PetscInt *nodes_to_temp_buffer_indices; 5116a0ba757dSStefano Zampini PetscInt *add_to_where; 51177cf533a6SStefano Zampini PetscInt *aux_new_xadj,*new_xadj,*new_adjncy; 5118a0ba757dSStefano Zampini 51197cf533a6SStefano Zampini /* Retrict adjacency graph using information from connected components */ 51207cf533a6SStefano Zampini ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt),&aux_new_xadj);CHKERRQ(ierr); 51212fa5cd67SKarl Rupp for (i=0; i<mat_graph->nvtxs; i++) aux_new_xadj[i]=1; 51227cf533a6SStefano Zampini for (i=0;i<mat_graph->ncmps;i++) { 51237cf533a6SStefano Zampini k = mat_graph->cptr[i+1]-mat_graph->cptr[i]; 51242fa5cd67SKarl Rupp for (j=0;j<k;j++) aux_new_xadj[mat_graph->queue[mat_graph->cptr[i]+j]]=k; 51257cf533a6SStefano Zampini } 51267cf533a6SStefano Zampini j = 0; 51272fa5cd67SKarl Rupp for (i=0;i<mat_graph->nvtxs;i++) j += aux_new_xadj[i]; 51282fa5cd67SKarl Rupp 51297cf533a6SStefano Zampini ierr = PetscMalloc((mat_graph->nvtxs+1)*sizeof(PetscInt),&new_xadj);CHKERRQ(ierr); 51307cf533a6SStefano Zampini ierr = PetscMalloc(j*sizeof(PetscInt),&new_adjncy);CHKERRQ(ierr); 51317cf533a6SStefano Zampini new_xadj[0]=0; 51327cf533a6SStefano Zampini for (i=0;i<mat_graph->nvtxs;i++) { 51337cf533a6SStefano Zampini new_xadj[i+1]=new_xadj[i]+aux_new_xadj[i]; 51342fa5cd67SKarl Rupp if (aux_new_xadj[i]==1) new_adjncy[new_xadj[i]]=i; 51357cf533a6SStefano Zampini } 5136354b9337SStefano Zampini ierr = PetscFree(aux_new_xadj);CHKERRQ(ierr); 51377cf533a6SStefano Zampini for (i=0; i<mat_graph->ncmps; i++) { 51387cf533a6SStefano Zampini k = mat_graph->cptr[i+1]-mat_graph->cptr[i]; 51397cf533a6SStefano Zampini for (j=0; j<k; j++) { 51407cf533a6SStefano Zampini ierr = PetscMemcpy(&new_adjncy[new_xadj[mat_graph->queue[mat_graph->cptr[i]+j]]],&mat_graph->queue[mat_graph->cptr[i]],k*sizeof(PetscInt));CHKERRQ(ierr); 51417cf533a6SStefano Zampini } 51427cf533a6SStefano Zampini } 51437cf533a6SStefano Zampini ierr = 
PCBDDCSetLocalAdjacencyGraph(pc,mat_graph->nvtxs,new_xadj,new_adjncy,PETSC_OWN_POINTER);CHKERRQ(ierr); 51447cf533a6SStefano Zampini /* For consistency among neughbouring procs, I need to sort (by global ordering) each connected component */ 51457cf533a6SStefano Zampini for (i=0; i<mat_graph->ncmps; i++) { 51467cf533a6SStefano Zampini k = mat_graph->cptr[i+1]-mat_graph->cptr[i]; 51477cf533a6SStefano Zampini ierr = ISLocalToGlobalMappingApply(matis->mapping,k,&mat_graph->queue[mat_graph->cptr[i]],&queue_in_global_numbering[mat_graph->cptr[i]]);CHKERRQ(ierr); 51487cf533a6SStefano Zampini ierr = PetscSortIntWithArray(k,&queue_in_global_numbering[mat_graph->cptr[i]],&mat_graph->queue[mat_graph->cptr[i]]);CHKERRQ(ierr); 51497cf533a6SStefano Zampini } 51507cf533a6SStefano Zampini /* allocate some space */ 5151a0ba757dSStefano Zampini ierr = MPI_Comm_rank(interface_comm,&my_rank);CHKERRQ(ierr); 5152a0ba757dSStefano Zampini ierr = PetscMalloc((where_values+1)*sizeof(PetscInt),&cum_recv_counts);CHKERRQ(ierr); 5153a0ba757dSStefano Zampini ierr = PetscMemzero(cum_recv_counts,(where_values+1)*sizeof(PetscInt));CHKERRQ(ierr); 5154a0ba757dSStefano Zampini ierr = PetscMalloc(where_values*sizeof(PetscInt),&where_to_nodes_indices);CHKERRQ(ierr); 5155a0ba757dSStefano Zampini /* first count how many neighbours per connected component I will receive from */ 5156a0ba757dSStefano Zampini cum_recv_counts[0]=0; 5157a0ba757dSStefano Zampini for (i=1; i<where_values+1; i++) { 5158a0ba757dSStefano Zampini j=0; 51592fa5cd67SKarl Rupp while (mat_graph->where[j] != i) j++; 5160a0ba757dSStefano Zampini where_to_nodes_indices[i-1]=j; 51612fa5cd67SKarl Rupp if (mat_graph->neighbours_set[j][0]!=-1) cum_recv_counts[i]=cum_recv_counts[i-1]+mat_graph->count[j]; /* We don't want sends/recvs_to/from_self -> here I don't count myself */ 51622fa5cd67SKarl Rupp else cum_recv_counts[i]=cum_recv_counts[i-1]+mat_graph->count[j]-1; 5163a0ba757dSStefano Zampini } 5164a0ba757dSStefano Zampini ierr = 
PetscMalloc(2*cum_recv_counts[where_values]*sizeof(PetscMPIInt),&recv_buffer_where);CHKERRQ(ierr); 5165a0ba757dSStefano Zampini ierr = PetscMalloc(cum_recv_counts[where_values]*sizeof(MPI_Request),&send_requests);CHKERRQ(ierr); 5166a0ba757dSStefano Zampini ierr = PetscMalloc(cum_recv_counts[where_values]*sizeof(MPI_Request),&recv_requests);CHKERRQ(ierr); 5167a0ba757dSStefano Zampini for (i=0; i<cum_recv_counts[where_values]; i++) { 5168a0ba757dSStefano Zampini send_requests[i]=MPI_REQUEST_NULL; 5169a0ba757dSStefano Zampini recv_requests[i]=MPI_REQUEST_NULL; 5170a0ba757dSStefano Zampini } 5171a0ba757dSStefano Zampini /* exchange with my neighbours the number of my connected components on the shared interface */ 5172a0ba757dSStefano Zampini for (i=0; i<where_values; i++) { 5173a0ba757dSStefano Zampini j = where_to_nodes_indices[i]; 5174da1bb401SStefano Zampini k = (mat_graph->neighbours_set[j][0] == -1 ? 1 : 0); 5175a0ba757dSStefano Zampini for (; k<mat_graph->count[j]; k++) { 5176da1bb401SStefano Zampini ierr = MPI_Isend(&mat_graph->where_ncmps[i],1,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr); 5177da1bb401SStefano Zampini ierr = MPI_Irecv(&recv_buffer_where[sum_requests],1,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr); 5178a0ba757dSStefano Zampini sum_requests++; 5179a0ba757dSStefano Zampini } 5180a0ba757dSStefano Zampini } 5181a0ba757dSStefano Zampini ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 5182a0ba757dSStefano Zampini ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 5183a0ba757dSStefano Zampini /* determine the connected component I need to adapt */ 5184a0ba757dSStefano Zampini ierr = PetscMalloc(where_values*sizeof(PetscInt),&where_cc_adapt);CHKERRQ(ierr); 5185a0ba757dSStefano Zampini ierr = 
PetscMemzero(where_cc_adapt,where_values*sizeof(PetscInt));CHKERRQ(ierr); 5186a0ba757dSStefano Zampini for (i=0; i<where_values; i++) { 5187a0ba757dSStefano Zampini for (j=cum_recv_counts[i]; j<cum_recv_counts[i+1]; j++) { 51883b03a366Sstefano_zampini /* The first condition is natural (i.e someone has a different number of cc than me), the second one is just to be safe */ 51893b03a366Sstefano_zampini if (mat_graph->where_ncmps[i]!=recv_buffer_where[j] || mat_graph->where_ncmps[i] > 1) { 5190a0ba757dSStefano Zampini where_cc_adapt[i]=PETSC_TRUE; 5191a0ba757dSStefano Zampini break; 5192a0ba757dSStefano Zampini } 5193a0ba757dSStefano Zampini } 5194a0ba757dSStefano Zampini } 5195d8923723SStefano Zampini buffer_size = 0; 5196d8923723SStefano Zampini for (i=0; i<where_values; i++) { 5197d8923723SStefano Zampini if (where_cc_adapt[i]) { 5198d8923723SStefano Zampini for (j=i; j<mat_graph->ncmps; j++) { 5199d8923723SStefano Zampini if (mat_graph->where[mat_graph->queue[mat_graph->cptr[j]]] == i+1) { /* WARNING -> where values goes from 1 to where_values included */ 5200d8923723SStefano Zampini buffer_size += 1 + mat_graph->cptr[j+1]-mat_graph->cptr[j]; 5201d8923723SStefano Zampini } 5202d8923723SStefano Zampini } 5203d8923723SStefano Zampini } 5204d8923723SStefano Zampini } 5205d8923723SStefano Zampini ierr = PetscMalloc(buffer_size*sizeof(PetscMPIInt),&send_buffer);CHKERRQ(ierr); 5206a0ba757dSStefano Zampini /* now get from neighbours their ccs (in global numbering) and adapt them (in case it is needed) */ 5207a0ba757dSStefano Zampini /* first determine how much data to send (size of each queue plus the global indices) and communicate it to neighbours */ 5208a0ba757dSStefano Zampini ierr = PetscMalloc(where_values*sizeof(PetscInt),&sizes_of_sends);CHKERRQ(ierr); 5209a0ba757dSStefano Zampini ierr = PetscMemzero(sizes_of_sends,where_values*sizeof(PetscInt));CHKERRQ(ierr); 52102fa5cd67SKarl Rupp 5211a0ba757dSStefano Zampini sum_requests = 0; 5212a0ba757dSStefano Zampini 
start_of_send = 0; 5213a0ba757dSStefano Zampini start_of_recv = cum_recv_counts[where_values]; 5214a0ba757dSStefano Zampini for (i=0; i<where_values; i++) { 5215a0ba757dSStefano Zampini if (where_cc_adapt[i]) { 5216a0ba757dSStefano Zampini size_of_send=0; 5217a0ba757dSStefano Zampini for (j=i; j<mat_graph->ncmps; j++) { 5218a0ba757dSStefano Zampini if (mat_graph->where[mat_graph->queue[mat_graph->cptr[j]]] == i+1) { /* WARNING -> where values goes from 1 to where_values included */ 5219a0ba757dSStefano Zampini send_buffer[start_of_send+size_of_send]=mat_graph->cptr[j+1]-mat_graph->cptr[j]; 5220a0ba757dSStefano Zampini size_of_send += 1; 5221a0ba757dSStefano Zampini for (k=0; k<mat_graph->cptr[j+1]-mat_graph->cptr[j]; k++) { 5222a0ba757dSStefano Zampini send_buffer[start_of_send+size_of_send+k]=queue_in_global_numbering[mat_graph->cptr[j]+k]; 5223a0ba757dSStefano Zampini } 5224a0ba757dSStefano Zampini size_of_send=size_of_send+mat_graph->cptr[j+1]-mat_graph->cptr[j]; 5225a0ba757dSStefano Zampini } 5226a0ba757dSStefano Zampini } 5227a0ba757dSStefano Zampini j = where_to_nodes_indices[i]; 5228da1bb401SStefano Zampini k = (mat_graph->neighbours_set[j][0] == -1 ? 
1 : 0); 522911d8f4c2SStefano Zampini sizes_of_sends[i]=size_of_send; 5230a0ba757dSStefano Zampini for (; k<mat_graph->count[j]; k++) { 523111d8f4c2SStefano Zampini ierr = MPI_Isend(&sizes_of_sends[i],1,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr); 5232da1bb401SStefano Zampini ierr = MPI_Irecv(&recv_buffer_where[sum_requests+start_of_recv],1,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr); 5233a0ba757dSStefano Zampini sum_requests++; 5234a0ba757dSStefano Zampini } 5235a0ba757dSStefano Zampini start_of_send+=size_of_send; 5236a0ba757dSStefano Zampini } 5237a0ba757dSStefano Zampini } 5238a0ba757dSStefano Zampini ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 5239a0ba757dSStefano Zampini ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 52402fa5cd67SKarl Rupp 5241a0ba757dSStefano Zampini buffer_size=0; 52422fa5cd67SKarl Rupp 52432fa5cd67SKarl Rupp for (k=0;k<sum_requests;k++) buffer_size += recv_buffer_where[start_of_recv+k]; 5244a0ba757dSStefano Zampini ierr = PetscMalloc(buffer_size*sizeof(PetscMPIInt),&recv_buffer);CHKERRQ(ierr); 5245a0ba757dSStefano Zampini /* now exchange the data */ 5246a0ba757dSStefano Zampini start_of_recv = 0; 5247a0ba757dSStefano Zampini start_of_send = 0; 5248a0ba757dSStefano Zampini sum_requests = 0; 5249a0ba757dSStefano Zampini for (i=0; i<where_values; i++) { 5250a0ba757dSStefano Zampini if (where_cc_adapt[i]) { 5251a0ba757dSStefano Zampini size_of_send = sizes_of_sends[i]; 52522fa5cd67SKarl Rupp 5253a0ba757dSStefano Zampini j = where_to_nodes_indices[i]; 5254da1bb401SStefano Zampini k = (mat_graph->neighbours_set[j][0] == -1 ? 
1 : 0); 5255a0ba757dSStefano Zampini for (; k<mat_graph->count[j]; k++) { 5256da1bb401SStefano Zampini ierr = MPI_Isend(&send_buffer[start_of_send],size_of_send,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr); 5257a0ba757dSStefano Zampini size_of_recv = recv_buffer_where[cum_recv_counts[where_values]+sum_requests]; 5258da1bb401SStefano Zampini ierr = MPI_Irecv(&recv_buffer[start_of_recv],size_of_recv,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr); 5259a0ba757dSStefano Zampini start_of_recv+=size_of_recv; 5260a0ba757dSStefano Zampini sum_requests++; 5261a0ba757dSStefano Zampini } 5262a0ba757dSStefano Zampini start_of_send+=size_of_send; 5263a0ba757dSStefano Zampini } 5264a0ba757dSStefano Zampini } 5265a0ba757dSStefano Zampini ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 5266a0ba757dSStefano Zampini ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 5267a0ba757dSStefano Zampini ierr = PetscMalloc(buffer_size*sizeof(PetscInt),&petsc_buffer);CHKERRQ(ierr); 52682fa5cd67SKarl Rupp for (k=0;k<start_of_recv;k++) petsc_buffer[k]=(PetscInt)recv_buffer[k]; 5269a0ba757dSStefano Zampini for (j=0;j<buffer_size;) { 5270a0ba757dSStefano Zampini ierr = ISGlobalToLocalMappingApply(matis->mapping,IS_GTOLM_MASK,petsc_buffer[j],&petsc_buffer[j+1],&petsc_buffer[j],&petsc_buffer[j+1]);CHKERRQ(ierr); 5271a0ba757dSStefano Zampini k = petsc_buffer[j]+1; 5272a0ba757dSStefano Zampini j += k; 5273a0ba757dSStefano Zampini } 5274a0ba757dSStefano Zampini sum_requests = cum_recv_counts[where_values]; 5275a0ba757dSStefano Zampini start_of_recv = 0; 52762fa5cd67SKarl Rupp 5277a0ba757dSStefano Zampini ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt),&nodes_to_temp_buffer_indices);CHKERRQ(ierr); 5278a0ba757dSStefano Zampini 
global_where_counter=0; 5279a0ba757dSStefano Zampini for (i=0; i<where_values; i++) { 5280a0ba757dSStefano Zampini if (where_cc_adapt[i]) { 5281a0ba757dSStefano Zampini temp_buffer_size=0; 5282a0ba757dSStefano Zampini /* find nodes on the shared interface we need to adapt */ 5283a0ba757dSStefano Zampini for (j=0; j<mat_graph->nvtxs; j++) { 5284a0ba757dSStefano Zampini if (mat_graph->where[j]==i+1) { 5285a0ba757dSStefano Zampini nodes_to_temp_buffer_indices[j]=temp_buffer_size; 5286a0ba757dSStefano Zampini temp_buffer_size++; 5287a0ba757dSStefano Zampini } else { 5288a0ba757dSStefano Zampini nodes_to_temp_buffer_indices[j]=-1; 5289a0ba757dSStefano Zampini } 5290a0ba757dSStefano Zampini } 52912fa5cd67SKarl Rupp 5292a0ba757dSStefano Zampini /* allocate some temporary space */ 5293a0ba757dSStefano Zampini ierr = PetscMalloc(temp_buffer_size*sizeof(PetscInt*),&temp_buffer);CHKERRQ(ierr); 5294a0ba757dSStefano Zampini ierr = PetscMalloc(temp_buffer_size*(cum_recv_counts[i+1]-cum_recv_counts[i])*sizeof(PetscInt),&temp_buffer[0]);CHKERRQ(ierr); 5295a0ba757dSStefano Zampini ierr = PetscMemzero(temp_buffer[0],temp_buffer_size*(cum_recv_counts[i+1]-cum_recv_counts[i])*sizeof(PetscInt));CHKERRQ(ierr); 5296a0ba757dSStefano Zampini for (j=1; j<temp_buffer_size; j++) { 5297a0ba757dSStefano Zampini temp_buffer[j]=temp_buffer[j-1]+cum_recv_counts[i+1]-cum_recv_counts[i]; 5298a0ba757dSStefano Zampini } 5299a0ba757dSStefano Zampini /* analyze contributions from neighbouring subdomains for i-th conn comp 5300a0ba757dSStefano Zampini temp buffer structure: 5301a0ba757dSStefano Zampini supposing part of the interface has dimension 5 (global nodes 0,1,2,3,4) 5302a0ba757dSStefano Zampini 3 neighs procs with structured connected components: 5303a0ba757dSStefano Zampini neigh 0: [0 1 4], [2 3]; (2 connected components) 5304a0ba757dSStefano Zampini neigh 1: [0 1], [2 3 4]; (2 connected components) 5305a0ba757dSStefano Zampini neigh 2: [0 4], [1], [2 3]; (3 connected components) 
5306a0ba757dSStefano Zampini tempbuffer (row-oriented) should be filled as: 5307a0ba757dSStefano Zampini [ 0, 0, 0; 5308a0ba757dSStefano Zampini 0, 0, 1; 5309a0ba757dSStefano Zampini 1, 1, 2; 5310a0ba757dSStefano Zampini 1, 1, 2; 5311a0ba757dSStefano Zampini 0, 1, 0; ]; 5312a0ba757dSStefano Zampini This way we can simply recover the resulting structure account for possible intersections of ccs among neighs. 5313a0ba757dSStefano Zampini The mat_graph->where array will be modified to reproduce the following 4 connected components [0], [1], [2 3], [4]; 5314a0ba757dSStefano Zampini */ 5315a0ba757dSStefano Zampini for (j=0;j<cum_recv_counts[i+1]-cum_recv_counts[i];j++) { 5316a0ba757dSStefano Zampini ins_val=0; 5317a0ba757dSStefano Zampini size_of_recv=recv_buffer_where[sum_requests]; /* total size of recv from neighs */ 5318a0ba757dSStefano Zampini for (buffer_size=0;buffer_size<size_of_recv;) { /* loop until all data from neighs has been taken into account */ 5319a0ba757dSStefano Zampini for (k=1;k<petsc_buffer[buffer_size+start_of_recv]+1;k++) { /* filling properly temp_buffer using data from a single recv */ 5320a0ba757dSStefano Zampini temp_buffer[nodes_to_temp_buffer_indices[petsc_buffer[start_of_recv+buffer_size+k]]][j] = ins_val; 5321a0ba757dSStefano Zampini } 5322a0ba757dSStefano Zampini buffer_size+=k; 5323a0ba757dSStefano Zampini ins_val++; 5324a0ba757dSStefano Zampini } 5325a0ba757dSStefano Zampini start_of_recv+=size_of_recv; 5326a0ba757dSStefano Zampini sum_requests++; 5327a0ba757dSStefano Zampini } 5328a0ba757dSStefano Zampini ierr = PetscMalloc(temp_buffer_size*sizeof(PetscInt),&add_to_where);CHKERRQ(ierr); 5329a0ba757dSStefano Zampini ierr = PetscMemzero(add_to_where,temp_buffer_size*sizeof(PetscInt));CHKERRQ(ierr); 5330a0ba757dSStefano Zampini for (j=0; j<temp_buffer_size; j++) { 5331a0ba757dSStefano Zampini if (!add_to_where[j]) { /* found a new cc */ 5332a0ba757dSStefano Zampini global_where_counter++; 5333a0ba757dSStefano Zampini 
add_to_where[j]=global_where_counter; 5334a0ba757dSStefano Zampini for (k=j+1; k<temp_buffer_size; k++) { /* check for other nodes in new cc */ 5335a0ba757dSStefano Zampini same_set=PETSC_TRUE; 5336a0ba757dSStefano Zampini for (s=0; s<cum_recv_counts[i+1]-cum_recv_counts[i]; s++) { 5337a0ba757dSStefano Zampini if (temp_buffer[j][s]!=temp_buffer[k][s]) { 5338a0ba757dSStefano Zampini same_set=PETSC_FALSE; 5339a0ba757dSStefano Zampini break; 5340a0ba757dSStefano Zampini } 5341a0ba757dSStefano Zampini } 53422fa5cd67SKarl Rupp if (same_set) add_to_where[k] = global_where_counter; 5343a0ba757dSStefano Zampini } 5344a0ba757dSStefano Zampini } 5345a0ba757dSStefano Zampini } 5346a0ba757dSStefano Zampini /* insert new data in where array */ 5347a0ba757dSStefano Zampini temp_buffer_size=0; 5348a0ba757dSStefano Zampini for (j=0;j<mat_graph->nvtxs;j++) { 5349a0ba757dSStefano Zampini if (mat_graph->where[j]==i+1) { 5350a0ba757dSStefano Zampini mat_graph->where[j]=where_values+add_to_where[temp_buffer_size]; 5351a0ba757dSStefano Zampini temp_buffer_size++; 5352a0ba757dSStefano Zampini } 5353a0ba757dSStefano Zampini } 5354a0ba757dSStefano Zampini ierr = PetscFree(temp_buffer[0]);CHKERRQ(ierr); 5355a0ba757dSStefano Zampini ierr = PetscFree(temp_buffer);CHKERRQ(ierr); 5356a0ba757dSStefano Zampini ierr = PetscFree(add_to_where);CHKERRQ(ierr); 5357a0ba757dSStefano Zampini } 5358a0ba757dSStefano Zampini } 5359a0ba757dSStefano Zampini ierr = PetscFree(nodes_to_temp_buffer_indices);CHKERRQ(ierr); 5360a0ba757dSStefano Zampini ierr = PetscFree(sizes_of_sends);CHKERRQ(ierr); 5361a0ba757dSStefano Zampini ierr = PetscFree(send_requests);CHKERRQ(ierr); 5362a0ba757dSStefano Zampini ierr = PetscFree(recv_requests);CHKERRQ(ierr); 5363a0ba757dSStefano Zampini ierr = PetscFree(petsc_buffer);CHKERRQ(ierr); 5364a0ba757dSStefano Zampini ierr = PetscFree(recv_buffer);CHKERRQ(ierr); 5365a0ba757dSStefano Zampini ierr = PetscFree(recv_buffer_where);CHKERRQ(ierr); 5366a0ba757dSStefano Zampini ierr = 
PetscFree(send_buffer);CHKERRQ(ierr); 5367a0ba757dSStefano Zampini ierr = PetscFree(cum_recv_counts);CHKERRQ(ierr); 5368a0ba757dSStefano Zampini ierr = PetscFree(where_to_nodes_indices);CHKERRQ(ierr); 536923d4d1a5SStefano Zampini ierr = PetscFree(where_cc_adapt);CHKERRQ(ierr); 53702fa5cd67SKarl Rupp 5371a0ba757dSStefano Zampini /* We are ready to evaluate consistent connected components on each part of the shared interface */ 5372a0ba757dSStefano Zampini if (global_where_counter) { 53732fa5cd67SKarl Rupp for (i=0;i<mat_graph->nvtxs;i++) mat_graph->touched[i]=PETSC_FALSE; 5374a0ba757dSStefano Zampini global_where_counter=0; 5375a0ba757dSStefano Zampini for (i=0;i<mat_graph->nvtxs;i++) { 5376a0ba757dSStefano Zampini if (mat_graph->where[i] && !mat_graph->touched[i]) { 5377a0ba757dSStefano Zampini global_where_counter++; 5378a0ba757dSStefano Zampini for (j=i+1;j<mat_graph->nvtxs;j++) { 5379a0ba757dSStefano Zampini if (!mat_graph->touched[j] && mat_graph->where[j]==mat_graph->where[i]) { 5380a0ba757dSStefano Zampini mat_graph->where[j] = global_where_counter; 5381a0ba757dSStefano Zampini mat_graph->touched[j] = PETSC_TRUE; 5382a0ba757dSStefano Zampini } 5383a0ba757dSStefano Zampini } 5384a0ba757dSStefano Zampini mat_graph->where[i] = global_where_counter; 5385a0ba757dSStefano Zampini mat_graph->touched[i] = PETSC_TRUE; 5386a0ba757dSStefano Zampini } 5387a0ba757dSStefano Zampini } 5388a0ba757dSStefano Zampini where_values=global_where_counter; 5389a0ba757dSStefano Zampini } 5390a0ba757dSStefano Zampini if (global_where_counter) { 5391a0ba757dSStefano Zampini ierr = PetscMemzero(mat_graph->cptr,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr); 5392a0ba757dSStefano Zampini ierr = PetscMemzero(mat_graph->queue,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr); 5393a0ba757dSStefano Zampini ierr = PetscFree(mat_graph->where_ncmps);CHKERRQ(ierr); 5394a0ba757dSStefano Zampini ierr = PetscMalloc(where_values*sizeof(PetscMPIInt),&mat_graph->where_ncmps);CHKERRQ(ierr); 
5395a0ba757dSStefano Zampini ierr = PCBDDCFindConnectedComponents(mat_graph, where_values); 5396a0ba757dSStefano Zampini } 53973b03a366Sstefano_zampini } /* Finished adapting interface */ 53982fa5cd67SKarl Rupp 5399a929c220SStefano Zampini /* For consistency among neughbouring procs, I need to sort (by global ordering) each connected component */ 5400a929c220SStefano Zampini for (i=0; i<mat_graph->ncmps; i++) { 5401a929c220SStefano Zampini k = mat_graph->cptr[i+1]-mat_graph->cptr[i]; 5402a929c220SStefano Zampini ierr = ISLocalToGlobalMappingApply(matis->mapping,k,&mat_graph->queue[mat_graph->cptr[i]],&queue_in_global_numbering[mat_graph->cptr[i]]);CHKERRQ(ierr); 5403a929c220SStefano Zampini ierr = PetscSortIntWithArray(k,&queue_in_global_numbering[mat_graph->cptr[i]],&mat_graph->queue[mat_graph->cptr[i]]);CHKERRQ(ierr); 5404a929c220SStefano Zampini } 5405a929c220SStefano Zampini 54060c7d97c5SJed Brown PetscInt nfc = 0; 54070c7d97c5SJed Brown PetscInt nec = 0; 54080c7d97c5SJed Brown PetscInt nvc = 0; 54093b03a366Sstefano_zampini PetscBool twodim_flag = PETSC_FALSE; 54100c7d97c5SJed Brown for (i=0; i<mat_graph->ncmps; i++) { 54113b03a366Sstefano_zampini if (mat_graph->cptr[i+1]-mat_graph->cptr[i] > vertex_size) { 54122fa5cd67SKarl Rupp if (mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]==1) nfc++; /* 1 neigh Neumann fake included */ 54132fa5cd67SKarl Rupp else nec++; /* note that nec will be zero in 2d */ 54140c7d97c5SJed Brown } else { 54153b03a366Sstefano_zampini nvc+=mat_graph->cptr[i+1]-mat_graph->cptr[i]; 54163b03a366Sstefano_zampini } 54173b03a366Sstefano_zampini } 54183b03a366Sstefano_zampini if (!nec) { /* we are in a 2d case -> no faces, only edges */ 54193b03a366Sstefano_zampini nec = nfc; 54203b03a366Sstefano_zampini nfc = 0; 54213b03a366Sstefano_zampini twodim_flag = PETSC_TRUE; 54223b03a366Sstefano_zampini } 54233972b0daSStefano Zampini /* allocate IS arrays for faces, edges. Vertices need a single index set. 
*/ 54243972b0daSStefano Zampini k=0; 54253972b0daSStefano Zampini for (i=0; i<mat_graph->ncmps; i++) { 54263972b0daSStefano Zampini j=mat_graph->cptr[i+1]-mat_graph->cptr[i]; 54272fa5cd67SKarl Rupp if (j > k) k=j; 54282fa5cd67SKarl Rupp 54292fa5cd67SKarl Rupp if (j<=vertex_size) k+=vertex_size; 54303972b0daSStefano Zampini } 54313972b0daSStefano Zampini ierr = PetscMalloc(k*sizeof(PetscInt),&auxis);CHKERRQ(ierr); 54323b03a366Sstefano_zampini if (!pcbddc->vertices_flag && !pcbddc->edges_flag) { 54333b03a366Sstefano_zampini ierr = PetscMalloc(nfc*sizeof(IS),&pcbddc->ISForFaces);CHKERRQ(ierr); 54343b03a366Sstefano_zampini use_faces = PETSC_TRUE; 54353b03a366Sstefano_zampini } 54363b03a366Sstefano_zampini if (!pcbddc->vertices_flag && !pcbddc->faces_flag) { 54373b03a366Sstefano_zampini ierr = PetscMalloc(nec*sizeof(IS),&pcbddc->ISForEdges);CHKERRQ(ierr); 54383b03a366Sstefano_zampini use_edges = PETSC_TRUE; 54393b03a366Sstefano_zampini } 54403b03a366Sstefano_zampini nfc=0; 54413b03a366Sstefano_zampini nec=0; 54423b03a366Sstefano_zampini for (i=0; i<mat_graph->ncmps; i++) { 54433b03a366Sstefano_zampini if (mat_graph->cptr[i+1]-mat_graph->cptr[i] > vertex_size) { 54443b03a366Sstefano_zampini for (j=0; j<mat_graph->cptr[i+1]-mat_graph->cptr[i]; j++) { 54453972b0daSStefano Zampini auxis[j]=mat_graph->queue[mat_graph->cptr[i]+j]; 54463b03a366Sstefano_zampini } 54473b03a366Sstefano_zampini if (mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]==1) { 54483b03a366Sstefano_zampini if (twodim_flag) { 54493b03a366Sstefano_zampini if (use_edges) { 54503972b0daSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForEdges[nec]);CHKERRQ(ierr); 54513b03a366Sstefano_zampini nec++; 54523b03a366Sstefano_zampini } 54533b03a366Sstefano_zampini } else { 54543b03a366Sstefano_zampini if (use_faces) { 54553972b0daSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForFaces[nfc]);CHKERRQ(ierr); 
54563b03a366Sstefano_zampini nfc++; 54573b03a366Sstefano_zampini } 54583b03a366Sstefano_zampini } 54593b03a366Sstefano_zampini } else { 54603b03a366Sstefano_zampini if (use_edges) { 54613972b0daSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForEdges[nec]);CHKERRQ(ierr); 54620c7d97c5SJed Brown nec++; 54630c7d97c5SJed Brown } 54640c7d97c5SJed Brown } 54650c7d97c5SJed Brown } 54663b03a366Sstefano_zampini } 54673b03a366Sstefano_zampini pcbddc->n_ISForFaces = nfc; 54683b03a366Sstefano_zampini pcbddc->n_ISForEdges = nec; 54692fa5cd67SKarl Rupp 54703b03a366Sstefano_zampini nvc = 0; 54710c7d97c5SJed Brown if (!pcbddc->constraints_flag) { 54723b03a366Sstefano_zampini for (i=0; i<mat_graph->ncmps; i++) { 54733b03a366Sstefano_zampini if (mat_graph->cptr[i+1]-mat_graph->cptr[i] <= vertex_size) { 54743b03a366Sstefano_zampini for (j = mat_graph->cptr[i]; j<mat_graph->cptr[i+1]; j++) { 54753972b0daSStefano Zampini auxis[nvc]=mat_graph->queue[j]; 54760c7d97c5SJed Brown nvc++; 54770c7d97c5SJed Brown } 54780c7d97c5SJed Brown } 54790c7d97c5SJed Brown } 54800c7d97c5SJed Brown } 54812fa5cd67SKarl Rupp 5482a0ba757dSStefano Zampini /* sort vertex set (by local ordering) */ 54833972b0daSStefano Zampini ierr = PetscSortInt(nvc,auxis);CHKERRQ(ierr); 54843972b0daSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,nvc,auxis,PETSC_COPY_VALUES,&pcbddc->ISForVertices);CHKERRQ(ierr); 5485e269702eSStefano Zampini if (pcbddc->dbg_flag) { 5486d49ef151SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr); 5487d49ef151SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Details from PCBDDCManageLocalBoundaries for subdomain %04d\n",PetscGlobalRank);CHKERRQ(ierr); 5488d49ef151SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Matrix graph has %d connected components", mat_graph->ncmps);CHKERRQ(ierr); 54890c7d97c5SJed Brown for 
(i=0; i<mat_graph->ncmps; i++) { 54903b03a366Sstefano_zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\nDetails for connected component number %02d: size %04d, count %01d. Nodes follow.\n", 54913b03a366Sstefano_zampini i,mat_graph->cptr[i+1]-mat_graph->cptr[i],mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]);CHKERRQ(ierr); 5492da1bb401SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"subdomains: "); 5493da1bb401SStefano Zampini for (j=0; j<mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]; j++) { 54942fa5cd67SKarl Rupp ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d ",mat_graph->neighbours_set[mat_graph->queue[mat_graph->cptr[i]]][j]);CHKERRQ(ierr); 5495da1bb401SStefano Zampini } 5496da1bb401SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n"); 54970c7d97c5SJed Brown for (j=mat_graph->cptr[i]; j<mat_graph->cptr[i+1]; j++) { 5498a929c220SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d (%d), ",mat_graph->queue[j],queue_in_global_numbering[j]);CHKERRQ(ierr); 54990c7d97c5SJed Brown } 55000c7d97c5SJed Brown } 5501da1bb401SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n--------------------------------------------------------------\n");CHKERRQ(ierr); 55023b03a366Sstefano_zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local vertices\n",PetscGlobalRank,nvc);CHKERRQ(ierr); 55033b03a366Sstefano_zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local faces\n",PetscGlobalRank,nfc);CHKERRQ(ierr); 55043b03a366Sstefano_zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local edges\n",PetscGlobalRank,nec);CHKERRQ(ierr); 5505d49ef151SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 55060c7d97c5SJed Brown } 55073972b0daSStefano Zampini ierr = PetscFree(auxis);CHKERRQ(ierr); 5508a929c220SStefano Zampini ierr = 
PetscFree(queue_in_global_numbering);CHKERRQ(ierr); 55090c7d97c5SJed Brown PetscFunctionReturn(0); 55100c7d97c5SJed Brown } 55110c7d97c5SJed Brown 55120c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 55130c7d97c5SJed Brown 55140c7d97c5SJed Brown /* The following code has been adapted from function IsConnectedSubdomain contained 5515da1bb401SStefano Zampini in source file contig.c of METIS library (version 5.0.1) 5516da1bb401SStefano Zampini It finds connected components of each partition labeled from 1 to n_dist */ 55170c7d97c5SJed Brown 55180c7d97c5SJed Brown #undef __FUNCT__ 55190c7d97c5SJed Brown #define __FUNCT__ "PCBDDCFindConnectedComponents" 55209c0446d6SStefano Zampini static PetscErrorCode PCBDDCFindConnectedComponents(PCBDDCGraph graph, PetscInt n_dist) 55210c7d97c5SJed Brown { 55220c7d97c5SJed Brown PetscInt i, j, k, nvtxs, first, last, nleft, ncmps,pid,cum_queue,n,ncmps_pid; 55230c7d97c5SJed Brown PetscInt *xadj, *adjncy, *where, *queue; 55240c7d97c5SJed Brown PetscInt *cptr; 55250c7d97c5SJed Brown PetscBool *touched; 55260c7d97c5SJed Brown 55270c7d97c5SJed Brown PetscFunctionBegin; 55280c7d97c5SJed Brown nvtxs = graph->nvtxs; 55290c7d97c5SJed Brown xadj = graph->xadj; 55300c7d97c5SJed Brown adjncy = graph->adjncy; 55310c7d97c5SJed Brown where = graph->where; 55320c7d97c5SJed Brown touched = graph->touched; 55330c7d97c5SJed Brown queue = graph->queue; 55340c7d97c5SJed Brown cptr = graph->cptr; 55350c7d97c5SJed Brown 55362fa5cd67SKarl Rupp for (i=0; i<nvtxs; i++) touched[i] = PETSC_FALSE; 55370c7d97c5SJed Brown 55380c7d97c5SJed Brown cum_queue = 0; 55390c7d97c5SJed Brown ncmps = 0; 55400c7d97c5SJed Brown 55410c7d97c5SJed Brown for (n=0; n<n_dist; n++) { 5542da1bb401SStefano Zampini pid = n+1; /* partition labeled by 0 is discarded */ 55430c7d97c5SJed Brown nleft = 0; 55440c7d97c5SJed Brown for (i=0; i<nvtxs; i++) { 55452fa5cd67SKarl Rupp if (where[i] == pid) nleft++; 55460c7d97c5SJed Brown } 
55470c7d97c5SJed Brown for (i=0; i<nvtxs; i++) { 55482fa5cd67SKarl Rupp if (where[i] == pid) break; 55490c7d97c5SJed Brown } 55500c7d97c5SJed Brown touched[i] = PETSC_TRUE; 55510c7d97c5SJed Brown queue[cum_queue] = i; 55520c7d97c5SJed Brown first = 0; last = 1; 55532fa5cd67SKarl Rupp 55540c7d97c5SJed Brown cptr[ncmps] = cum_queue; /* This actually points to queue */ 55550c7d97c5SJed Brown ncmps_pid = 0; 55562fa5cd67SKarl Rupp 55570c7d97c5SJed Brown while (first != nleft) { 55580c7d97c5SJed Brown if (first == last) { /* Find another starting vertex */ 55590c7d97c5SJed Brown cptr[++ncmps] = first+cum_queue; 55600c7d97c5SJed Brown ncmps_pid++; 55610c7d97c5SJed Brown for (i=0; i<nvtxs; i++) { 55622fa5cd67SKarl Rupp if (where[i] == pid && !touched[i]) break; 55630c7d97c5SJed Brown } 55640c7d97c5SJed Brown queue[cum_queue+last] = i; 55650c7d97c5SJed Brown last++; 55660c7d97c5SJed Brown touched[i] = PETSC_TRUE; 55670c7d97c5SJed Brown } 55680c7d97c5SJed Brown i = queue[cum_queue+first]; 55690c7d97c5SJed Brown first++; 55700c7d97c5SJed Brown for (j=xadj[i]; j<xadj[i+1]; j++) { 55710c7d97c5SJed Brown k = adjncy[j]; 55720c7d97c5SJed Brown if (where[k] == pid && !touched[k]) { 55730c7d97c5SJed Brown queue[cum_queue+last] = k; 55740c7d97c5SJed Brown last++; 55750c7d97c5SJed Brown touched[k] = PETSC_TRUE; 55760c7d97c5SJed Brown } 55770c7d97c5SJed Brown } 55780c7d97c5SJed Brown } 55790c7d97c5SJed Brown cptr[++ncmps] = first+cum_queue; 55800c7d97c5SJed Brown ncmps_pid++; 55810c7d97c5SJed Brown cum_queue = cptr[ncmps]; 5582a0ba757dSStefano Zampini graph->where_ncmps[n] = ncmps_pid; 55830c7d97c5SJed Brown } 55840c7d97c5SJed Brown graph->ncmps = ncmps; 55850c7d97c5SJed Brown PetscFunctionReturn(0); 55860c7d97c5SJed Brown } 5587