153cdbc3dSStefano Zampini /* TODOLIST 2da1bb401SStefano Zampini DofSplitting and DM attached to pc? 3da1bb401SStefano Zampini Change SetNeumannBoundaries to SetNeumannBoundariesLocal and provide new SetNeumannBoundaries (same Dirichlet) 4a0ba757dSStefano Zampini change how to deal with the coarse problem (PCBDDCSetCoarseEnvironment): 5a0ba757dSStefano Zampini - simplify coarse problem structure -> PCBDDC or PCREDUDANT, nothing else -> same comm for all levels? 6a0ba757dSStefano Zampini - remove coarse enums and allow use of PCBDDCGetCoarseKSP 7674ae819SStefano Zampini - remove metis dependency -> use MatPartitioning for multilevel -> Assemble serial adjacency in PCBDDCAnalyzeInterface? 8a0ba757dSStefano Zampini code refactoring: 9a0ba757dSStefano Zampini - pick up better names for static functions 10a0ba757dSStefano Zampini change options structure: 11a0ba757dSStefano Zampini - insert BDDC into MG framework? 12a0ba757dSStefano Zampini provide other ops? Ask to developers 13a0ba757dSStefano Zampini remove all unused printf 14a0ba757dSStefano Zampini man pages 1553cdbc3dSStefano Zampini */ 160c7d97c5SJed Brown 1753cdbc3dSStefano Zampini /* ---------------------------------------------------------------------------------------------------------------------------------------------- 180c7d97c5SJed Brown Implementation of BDDC preconditioner based on: 190c7d97c5SJed Brown C. Dohrmann "An approximate BDDC preconditioner", Numerical Linear Algebra with Applications Volume 14, Issue 2, pages 149-168, March 2007 2053cdbc3dSStefano Zampini ---------------------------------------------------------------------------------------------------------------------------------------------- */ 2153cdbc3dSStefano Zampini 22674ae819SStefano Zampini #include "bddc.h" /*I "petscpc.h" I*/ /* includes for fortran wrappers */ 23674ae819SStefano Zampini #include "bddcprivate.h" 243b03a366Sstefano_zampini #include <petscblaslapack.h> 25674ae819SStefano Zampini 26674ae819SStefano Zampini /* prototypes for static functions contained in bddc.c */ 27674ae819SStefano Zampini static PetscErrorCode PCBDDCSetLevel(PC,PetscInt); 28674ae819SStefano Zampini static PetscErrorCode PCBDDCCoarseSetUp(PC); 29674ae819SStefano Zampini static PetscErrorCode PCBDDCSetUpCoarseEnvironment(PC,PetscScalar*); 30674ae819SStefano Zampini 310c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 320c7d97c5SJed Brown #undef __FUNCT__ 330c7d97c5SJed Brown #define __FUNCT__ "PCSetFromOptions_BDDC" 340c7d97c5SJed Brown PetscErrorCode PCSetFromOptions_BDDC(PC pc) 350c7d97c5SJed Brown { 360c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 370c7d97c5SJed Brown PetscErrorCode ierr; 380c7d97c5SJed Brown 390c7d97c5SJed Brown PetscFunctionBegin; 400c7d97c5SJed Brown ierr = PetscOptionsHead("BDDC options");CHKERRQ(ierr); 410c7d97c5SJed Brown /* Verbose debugging of main data structures */ 429d9e44b6SStefano Zampini ierr = PetscOptionsInt("-pc_bddc_check_level" ,"Verbose (debugging) output for PCBDDC" ,"none",pcbddc->dbg_flag ,&pcbddc->dbg_flag ,NULL);CHKERRQ(ierr); 430c7d97c5SJed Brown /* Some customization for default primal space */ 440298fd71SBarry Smith ierr = PetscOptionsBool("-pc_bddc_vertices_only" ,"Use only vertices in coarse space (i.e. discard constraints)","none",pcbddc->vertices_flag ,&pcbddc->vertices_flag ,NULL);CHKERRQ(ierr); 450298fd71SBarry Smith ierr = PetscOptionsBool("-pc_bddc_constraints_only","Use only constraints in coarse space (i.e. discard vertices)","none",pcbddc->constraints_flag,&pcbddc->constraints_flag,NULL);CHKERRQ(ierr); 460298fd71SBarry Smith ierr = PetscOptionsBool("-pc_bddc_faces_only" ,"Use only faces among constraints of coarse space (i.e. discard edges)" ,"none",pcbddc->faces_flag ,&pcbddc->faces_flag ,NULL);CHKERRQ(ierr); 470298fd71SBarry Smith ierr = PetscOptionsBool("-pc_bddc_edges_only" ,"Use only edges among constraints of coarse space (i.e. discard faces)" ,"none",pcbddc->edges_flag ,&pcbddc->edges_flag ,NULL);CHKERRQ(ierr); 480c7d97c5SJed Brown /* Coarse solver context */ 496c667b0aSStefano Zampini static const char * const avail_coarse_problems[] = {"sequential","replicated","parallel","multilevel","CoarseProblemType","PC_BDDC_",0}; /*order of choiches depends on ENUM defined in bddc.h */ 500298fd71SBarry Smith ierr = PetscOptionsEnum("-pc_bddc_coarse_problem_type","Set coarse problem type","none",avail_coarse_problems,(PetscEnum)pcbddc->coarse_problem_type,(PetscEnum*)&pcbddc->coarse_problem_type,NULL);CHKERRQ(ierr); 510c7d97c5SJed Brown /* Two different application of BDDC to the whole set of dofs, internal and interface */ 520298fd71SBarry Smith ierr = PetscOptionsBool("-pc_bddc_switch_preconditioning_type","Switch between M_2 (default) and M_3 preconditioners (as defined by Dohrmann)","none",pcbddc->inexact_prec_type,&pcbddc->inexact_prec_type,NULL);CHKERRQ(ierr); 53674ae819SStefano Zampini ierr = PetscOptionsBool("-pc_bddc_use_change_of_basis","Use change of basis approach for primal space","none",pcbddc->use_change_of_basis,&pcbddc->use_change_of_basis,NULL);CHKERRQ(ierr); 54674ae819SStefano Zampini ierr = PetscOptionsBool("-pc_bddc_use_change_on_faces","Use change of basis approach for face constraints","none",pcbddc->use_change_on_faces,&pcbddc->use_change_on_faces,NULL);CHKERRQ(ierr); 55674ae819SStefano Zampini if (!pcbddc->use_change_of_basis) { 56674ae819SStefano Zampini pcbddc->use_change_on_faces = PETSC_FALSE; 57674ae819SStefano Zampini } 580298fd71SBarry Smith ierr = PetscOptionsInt("-pc_bddc_coarsening_ratio","Set coarsening ratio used in multilevel coarsening","none",pcbddc->coarsening_ratio,&pcbddc->coarsening_ratio,NULL);CHKERRQ(ierr); 590298fd71SBarry Smith ierr = PetscOptionsInt("-pc_bddc_max_levels","Set maximum number of levels for multilevel","none",pcbddc->max_levels,&pcbddc->max_levels,NULL);CHKERRQ(ierr); 60674ae819SStefano Zampini ierr = PetscOptionsBool("-pc_bddc_use_deluxe_scaling","Use deluxe scaling for BDDC","none",pcbddc->use_deluxe_scaling,&pcbddc->use_deluxe_scaling,NULL);CHKERRQ(ierr); 610c7d97c5SJed Brown ierr = PetscOptionsTail();CHKERRQ(ierr); 620c7d97c5SJed Brown PetscFunctionReturn(0); 630c7d97c5SJed Brown } 640c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 65674ae819SStefano Zampini #undef __FUNCT__ 66674ae819SStefano Zampini #define __FUNCT__ "PCBDDCSetPrimalVerticesLocalIS_BDDC" 67674ae819SStefano Zampini static PetscErrorCode PCBDDCSetPrimalVerticesLocalIS_BDDC(PC pc, IS PrimalVertices) 68674ae819SStefano Zampini { 69674ae819SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 70674ae819SStefano Zampini PetscErrorCode ierr; 711e6b0712SBarry Smith 72674ae819SStefano Zampini PetscFunctionBegin; 73674ae819SStefano Zampini ierr = ISDestroy(&pcbddc->user_primal_vertices);CHKERRQ(ierr); 74674ae819SStefano Zampini ierr = PetscObjectReference((PetscObject)PrimalVertices);CHKERRQ(ierr); 75674ae819SStefano Zampini pcbddc->user_primal_vertices = PrimalVertices; 76674ae819SStefano Zampini PetscFunctionReturn(0); 77674ae819SStefano Zampini } 78674ae819SStefano Zampini #undef __FUNCT__ 79674ae819SStefano Zampini #define __FUNCT__ "PCBDDCSetPrimalVerticesLocalIS" 80674ae819SStefano Zampini /*@ 81674ae819SStefano Zampini PCBDDCSetPrimalVerticesLocalIS - Set user defined primal vertices in PCBDDC. 82674ae819SStefano Zampini 83674ae819SStefano Zampini Not collective 84674ae819SStefano Zampini 85674ae819SStefano Zampini Input Parameters: 86674ae819SStefano Zampini + pc - the preconditioning context 87674ae819SStefano Zampini - PrimalVertices - index sets of primal vertices in local numbering 88674ae819SStefano Zampini 89674ae819SStefano Zampini Level: intermediate 90674ae819SStefano Zampini 91674ae819SStefano Zampini Notes: 92674ae819SStefano Zampini 93674ae819SStefano Zampini .seealso: PCBDDC 94674ae819SStefano Zampini @*/ 95674ae819SStefano Zampini PetscErrorCode PCBDDCSetPrimalVerticesLocalIS(PC pc, IS PrimalVertices) 96674ae819SStefano Zampini { 97674ae819SStefano Zampini PetscErrorCode ierr; 98674ae819SStefano Zampini 99674ae819SStefano Zampini PetscFunctionBegin; 100674ae819SStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 101674ae819SStefano Zampini PetscValidHeaderSpecific(PrimalVertices,IS_CLASSID,2); 102674ae819SStefano Zampini ierr = PetscTryMethod(pc,"PCBDDCSetPrimalVerticesLocalIS_C",(PC,IS),(pc,PrimalVertices));CHKERRQ(ierr); 103674ae819SStefano Zampini PetscFunctionReturn(0); 104674ae819SStefano Zampini } 105674ae819SStefano Zampini /* -------------------------------------------------------------------------- */ 1060c7d97c5SJed Brown #undef __FUNCT__ 1070c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetCoarseProblemType_BDDC" 10853cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetCoarseProblemType_BDDC(PC pc, CoarseProblemType CPT) 1090c7d97c5SJed Brown { 1100c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 1110c7d97c5SJed Brown 1120c7d97c5SJed Brown PetscFunctionBegin; 1130c7d97c5SJed Brown pcbddc->coarse_problem_type = CPT; 1140c7d97c5SJed Brown PetscFunctionReturn(0); 1150c7d97c5SJed Brown } 1161e6b0712SBarry Smith 1170c7d97c5SJed Brown #undef __FUNCT__ 1180c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetCoarseProblemType" 11953cdbc3dSStefano Zampini /*@ 1209c0446d6SStefano Zampini PCBDDCSetCoarseProblemType - Set coarse problem type in PCBDDC. 12153cdbc3dSStefano Zampini 1229c0446d6SStefano Zampini Not collective 12353cdbc3dSStefano Zampini 12453cdbc3dSStefano Zampini Input Parameters: 12553cdbc3dSStefano Zampini + pc - the preconditioning context 12653cdbc3dSStefano Zampini - CoarseProblemType - pick a better name and explain what this is 12753cdbc3dSStefano Zampini 12853cdbc3dSStefano Zampini Level: intermediate 12953cdbc3dSStefano Zampini 13053cdbc3dSStefano Zampini Notes: 131da1bb401SStefano Zampini Not collective but all procs must call with same arguments. 13253cdbc3dSStefano Zampini 13353cdbc3dSStefano Zampini .seealso: PCBDDC 13453cdbc3dSStefano Zampini @*/ 1350c7d97c5SJed Brown PetscErrorCode PCBDDCSetCoarseProblemType(PC pc, CoarseProblemType CPT) 1360c7d97c5SJed Brown { 1370c7d97c5SJed Brown PetscErrorCode ierr; 1380c7d97c5SJed Brown 1390c7d97c5SJed Brown PetscFunctionBegin; 1400c7d97c5SJed Brown PetscValidHeaderSpecific(pc,PC_CLASSID,1); 1410c7d97c5SJed Brown ierr = PetscTryMethod(pc,"PCBDDCSetCoarseProblemType_C",(PC,CoarseProblemType),(pc,CPT));CHKERRQ(ierr); 1420c7d97c5SJed Brown PetscFunctionReturn(0); 1430c7d97c5SJed Brown } 1440c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 1450c7d97c5SJed Brown #undef __FUNCT__ 1464fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetCoarseningRatio_BDDC" 1474fad6a16SStefano Zampini static PetscErrorCode PCBDDCSetCoarseningRatio_BDDC(PC pc,PetscInt k) 1484fad6a16SStefano Zampini { 1494fad6a16SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 1504fad6a16SStefano Zampini 1514fad6a16SStefano Zampini PetscFunctionBegin; 1524fad6a16SStefano Zampini pcbddc->coarsening_ratio=k; 1534fad6a16SStefano Zampini PetscFunctionReturn(0); 1544fad6a16SStefano Zampini } 1551e6b0712SBarry Smith 1564fad6a16SStefano Zampini #undef __FUNCT__ 1574fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetCoarseningRatio" 1584fad6a16SStefano Zampini /*@ 1594fad6a16SStefano Zampini PCBDDCSetCoarseningRatio - Set coarsening ratio used in multilevel coarsening 1604fad6a16SStefano Zampini 1614fad6a16SStefano Zampini Logically collective on PC 1624fad6a16SStefano Zampini 1634fad6a16SStefano Zampini Input Parameters: 1644fad6a16SStefano Zampini + pc - the preconditioning context 1654fad6a16SStefano Zampini - k - coarsening ratio 1664fad6a16SStefano Zampini 1674fad6a16SStefano Zampini Approximatively k subdomains at the finer level will be aggregated into a single subdomain at the coarser level. 1684fad6a16SStefano Zampini 1694fad6a16SStefano Zampini Level: intermediate 1704fad6a16SStefano Zampini 1714fad6a16SStefano Zampini Notes: 1724fad6a16SStefano Zampini 1734fad6a16SStefano Zampini .seealso: PCBDDC 1744fad6a16SStefano Zampini @*/ 1754fad6a16SStefano Zampini PetscErrorCode PCBDDCSetCoarseningRatio(PC pc,PetscInt k) 1764fad6a16SStefano Zampini { 1774fad6a16SStefano Zampini PetscErrorCode ierr; 1784fad6a16SStefano Zampini 1794fad6a16SStefano Zampini PetscFunctionBegin; 1804fad6a16SStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 1814fad6a16SStefano Zampini ierr = PetscTryMethod(pc,"PCBDDCSetCoarseningRatio_C",(PC,PetscInt),(pc,k));CHKERRQ(ierr); 1824fad6a16SStefano Zampini PetscFunctionReturn(0); 1834fad6a16SStefano Zampini } 1844fad6a16SStefano Zampini /* -------------------------------------------------------------------------- */ 1851e6b0712SBarry Smith 1864fad6a16SStefano Zampini #undef __FUNCT__ 1874fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetMaxLevels_BDDC" 1884fad6a16SStefano Zampini static PetscErrorCode PCBDDCSetMaxLevels_BDDC(PC pc,PetscInt max_levels) 1894fad6a16SStefano Zampini { 1904fad6a16SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 1914fad6a16SStefano Zampini 1924fad6a16SStefano Zampini PetscFunctionBegin; 1934fad6a16SStefano Zampini pcbddc->max_levels=max_levels; 1944fad6a16SStefano Zampini PetscFunctionReturn(0); 1954fad6a16SStefano Zampini } 1961e6b0712SBarry Smith 1974fad6a16SStefano Zampini #undef __FUNCT__ 1984fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetMaxLevels" 1994fad6a16SStefano Zampini /*@ 2004fad6a16SStefano Zampini PCBDDCSetMaxLevels - Sets the maximum number of levels within the multilevel approach. 2014fad6a16SStefano Zampini 2024fad6a16SStefano Zampini Logically collective on PC 2034fad6a16SStefano Zampini 2044fad6a16SStefano Zampini Input Parameters: 2054fad6a16SStefano Zampini + pc - the preconditioning context 2064fad6a16SStefano Zampini - max_levels - the maximum number of levels 2074fad6a16SStefano Zampini 2084fad6a16SStefano Zampini Default value is 1, i.e. coarse problem will be solved inexactly with one application 2094fad6a16SStefano Zampini of PCBDDC preconditioner if the multilevel approach is requested. 2104fad6a16SStefano Zampini 2114fad6a16SStefano Zampini Level: intermediate 2124fad6a16SStefano Zampini 2134fad6a16SStefano Zampini Notes: 2144fad6a16SStefano Zampini 2154fad6a16SStefano Zampini .seealso: PCBDDC 2164fad6a16SStefano Zampini @*/ 2174fad6a16SStefano Zampini PetscErrorCode PCBDDCSetMaxLevels(PC pc,PetscInt max_levels) 2184fad6a16SStefano Zampini { 2194fad6a16SStefano Zampini PetscErrorCode ierr; 2204fad6a16SStefano Zampini 2214fad6a16SStefano Zampini PetscFunctionBegin; 2224fad6a16SStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 2234fad6a16SStefano Zampini ierr = PetscTryMethod(pc,"PCBDDCSetMaxLevels_C",(PC,PetscInt),(pc,max_levels));CHKERRQ(ierr); 2244fad6a16SStefano Zampini PetscFunctionReturn(0); 2254fad6a16SStefano Zampini } 2264fad6a16SStefano Zampini /* -------------------------------------------------------------------------- */ 2271e6b0712SBarry Smith 2284fad6a16SStefano Zampini #undef __FUNCT__ 2290bdf917eSStefano Zampini #define __FUNCT__ "PCBDDCSetNullSpace_BDDC" 2300bdf917eSStefano Zampini static PetscErrorCode PCBDDCSetNullSpace_BDDC(PC pc,MatNullSpace NullSpace) 2310bdf917eSStefano Zampini { 2320bdf917eSStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 2330bdf917eSStefano Zampini PetscErrorCode ierr; 2340bdf917eSStefano Zampini 2350bdf917eSStefano Zampini PetscFunctionBegin; 2360bdf917eSStefano Zampini ierr = PetscObjectReference((PetscObject)NullSpace);CHKERRQ(ierr); 2370bdf917eSStefano Zampini ierr = MatNullSpaceDestroy(&pcbddc->NullSpace);CHKERRQ(ierr); 2380bdf917eSStefano Zampini pcbddc->NullSpace=NullSpace; 2390bdf917eSStefano Zampini PetscFunctionReturn(0); 2400bdf917eSStefano Zampini } 2411e6b0712SBarry Smith 2420bdf917eSStefano Zampini #undef __FUNCT__ 2430bdf917eSStefano Zampini #define __FUNCT__ "PCBDDCSetNullSpace" 2440bdf917eSStefano Zampini /*@ 2450bdf917eSStefano Zampini PCBDDCSetNullSpace - Set NullSpace of global operator of BDDC preconditioned mat. 2460bdf917eSStefano Zampini 2470bdf917eSStefano Zampini Logically collective on PC and MatNullSpace 2480bdf917eSStefano Zampini 2490bdf917eSStefano Zampini Input Parameters: 2500bdf917eSStefano Zampini + pc - the preconditioning context 2510bdf917eSStefano Zampini - NullSpace - Null space of the linear operator to be preconditioned. 2520bdf917eSStefano Zampini 2530bdf917eSStefano Zampini Level: intermediate 2540bdf917eSStefano Zampini 2550bdf917eSStefano Zampini Notes: 2560bdf917eSStefano Zampini 2570bdf917eSStefano Zampini .seealso: PCBDDC 2580bdf917eSStefano Zampini @*/ 2590bdf917eSStefano Zampini PetscErrorCode PCBDDCSetNullSpace(PC pc,MatNullSpace NullSpace) 2600bdf917eSStefano Zampini { 2610bdf917eSStefano Zampini PetscErrorCode ierr; 2620bdf917eSStefano Zampini 2630bdf917eSStefano Zampini PetscFunctionBegin; 2640bdf917eSStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 265674ae819SStefano Zampini PetscValidHeaderSpecific(NullSpace,MAT_NULLSPACE_CLASSID,2); 2660bdf917eSStefano Zampini ierr = PetscTryMethod(pc,"PCBDDCSetNullSpace_C",(PC,MatNullSpace),(pc,NullSpace));CHKERRQ(ierr); 2670bdf917eSStefano Zampini PetscFunctionReturn(0); 2680bdf917eSStefano Zampini } 2690bdf917eSStefano Zampini /* -------------------------------------------------------------------------- */ 2701e6b0712SBarry Smith 2710bdf917eSStefano Zampini #undef __FUNCT__ 2723b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCSetDirichletBoundaries_BDDC" 2733b03a366Sstefano_zampini static PetscErrorCode PCBDDCSetDirichletBoundaries_BDDC(PC pc,IS DirichletBoundaries) 2743b03a366Sstefano_zampini { 2753b03a366Sstefano_zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 2763b03a366Sstefano_zampini PetscErrorCode ierr; 2773b03a366Sstefano_zampini 2783b03a366Sstefano_zampini PetscFunctionBegin; 2793b03a366Sstefano_zampini ierr = ISDestroy(&pcbddc->DirichletBoundaries);CHKERRQ(ierr); 28036e030ebSStefano Zampini ierr = PetscObjectReference((PetscObject)DirichletBoundaries);CHKERRQ(ierr); 28136e030ebSStefano Zampini pcbddc->DirichletBoundaries=DirichletBoundaries; 2823b03a366Sstefano_zampini PetscFunctionReturn(0); 2833b03a366Sstefano_zampini } 2841e6b0712SBarry Smith 2853b03a366Sstefano_zampini #undef __FUNCT__ 2863b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCSetDirichletBoundaries" 2873b03a366Sstefano_zampini /*@ 288da1bb401SStefano Zampini PCBDDCSetDirichletBoundaries - Set index set defining subdomain part (in local ordering) 289da1bb401SStefano Zampini of Dirichlet boundaries for the global problem. 2903b03a366Sstefano_zampini 2913b03a366Sstefano_zampini Not collective 2923b03a366Sstefano_zampini 2933b03a366Sstefano_zampini Input Parameters: 2943b03a366Sstefano_zampini + pc - the preconditioning context 2950298fd71SBarry Smith - DirichletBoundaries - sequential index set defining the subdomain part of Dirichlet boundaries (can be NULL) 2963b03a366Sstefano_zampini 2973b03a366Sstefano_zampini Level: intermediate 2983b03a366Sstefano_zampini 2993b03a366Sstefano_zampini Notes: 3003b03a366Sstefano_zampini 3013b03a366Sstefano_zampini .seealso: PCBDDC 3023b03a366Sstefano_zampini @*/ 3033b03a366Sstefano_zampini PetscErrorCode PCBDDCSetDirichletBoundaries(PC pc,IS DirichletBoundaries) 3043b03a366Sstefano_zampini { 3053b03a366Sstefano_zampini PetscErrorCode ierr; 3063b03a366Sstefano_zampini 3073b03a366Sstefano_zampini PetscFunctionBegin; 3083b03a366Sstefano_zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 309674ae819SStefano Zampini PetscValidHeaderSpecific(DirichletBoundaries,IS_CLASSID,2); 3103b03a366Sstefano_zampini ierr = PetscTryMethod(pc,"PCBDDCSetDirichletBoundaries_C",(PC,IS),(pc,DirichletBoundaries));CHKERRQ(ierr); 3113b03a366Sstefano_zampini PetscFunctionReturn(0); 3123b03a366Sstefano_zampini } 3133b03a366Sstefano_zampini /* -------------------------------------------------------------------------- */ 3141e6b0712SBarry Smith 3153b03a366Sstefano_zampini #undef __FUNCT__ 3160c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetNeumannBoundaries_BDDC" 31753cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetNeumannBoundaries_BDDC(PC pc,IS NeumannBoundaries) 3180c7d97c5SJed Brown { 3190c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 32053cdbc3dSStefano Zampini PetscErrorCode ierr; 3210c7d97c5SJed Brown 3220c7d97c5SJed Brown PetscFunctionBegin; 32353cdbc3dSStefano Zampini ierr = ISDestroy(&pcbddc->NeumannBoundaries);CHKERRQ(ierr); 32436e030ebSStefano Zampini ierr = PetscObjectReference((PetscObject)NeumannBoundaries);CHKERRQ(ierr); 32536e030ebSStefano Zampini pcbddc->NeumannBoundaries=NeumannBoundaries; 3260c7d97c5SJed Brown PetscFunctionReturn(0); 3270c7d97c5SJed Brown } 3281e6b0712SBarry Smith 3290c7d97c5SJed Brown #undef __FUNCT__ 3300c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetNeumannBoundaries" 33157527edcSJed Brown /*@ 332da1bb401SStefano Zampini PCBDDCSetNeumannBoundaries - Set index set defining subdomain part (in local ordering) 333da1bb401SStefano Zampini of Neumann boundaries for the global problem. 33457527edcSJed Brown 3359c0446d6SStefano Zampini Not collective 33657527edcSJed Brown 33757527edcSJed Brown Input Parameters: 33857527edcSJed Brown + pc - the preconditioning context 3390298fd71SBarry Smith - NeumannBoundaries - sequential index set defining the subdomain part of Neumann boundaries (can be NULL) 34057527edcSJed Brown 34157527edcSJed Brown Level: intermediate 34257527edcSJed Brown 34357527edcSJed Brown Notes: 34457527edcSJed Brown 34557527edcSJed Brown .seealso: PCBDDC 34657527edcSJed Brown @*/ 34753cdbc3dSStefano Zampini PetscErrorCode PCBDDCSetNeumannBoundaries(PC pc,IS NeumannBoundaries) 3480c7d97c5SJed Brown { 3490c7d97c5SJed Brown PetscErrorCode ierr; 3500c7d97c5SJed Brown 3510c7d97c5SJed Brown PetscFunctionBegin; 3520c7d97c5SJed Brown PetscValidHeaderSpecific(pc,PC_CLASSID,1); 353674ae819SStefano Zampini PetscValidHeaderSpecific(NeumannBoundaries,IS_CLASSID,2); 35453cdbc3dSStefano Zampini ierr = PetscTryMethod(pc,"PCBDDCSetNeumannBoundaries_C",(PC,IS),(pc,NeumannBoundaries));CHKERRQ(ierr); 35553cdbc3dSStefano Zampini PetscFunctionReturn(0); 35653cdbc3dSStefano Zampini } 35753cdbc3dSStefano Zampini /* -------------------------------------------------------------------------- */ 3581e6b0712SBarry Smith 35953cdbc3dSStefano Zampini #undef __FUNCT__ 360da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCGetDirichletBoundaries_BDDC" 361da1bb401SStefano Zampini static PetscErrorCode PCBDDCGetDirichletBoundaries_BDDC(PC pc,IS *DirichletBoundaries) 362da1bb401SStefano Zampini { 363da1bb401SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 364da1bb401SStefano Zampini 365da1bb401SStefano Zampini PetscFunctionBegin; 366da1bb401SStefano Zampini *DirichletBoundaries = pcbddc->DirichletBoundaries; 367da1bb401SStefano Zampini PetscFunctionReturn(0); 368da1bb401SStefano Zampini } 3691e6b0712SBarry Smith 370da1bb401SStefano Zampini #undef __FUNCT__ 371da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCGetDirichletBoundaries" 372da1bb401SStefano Zampini /*@ 373da1bb401SStefano Zampini PCBDDCGetDirichletBoundaries - Get index set defining subdomain part (in local ordering) 374da1bb401SStefano Zampini of Dirichlet boundaries for the global problem. 375da1bb401SStefano Zampini 376da1bb401SStefano Zampini Not collective 377da1bb401SStefano Zampini 378da1bb401SStefano Zampini Input Parameters: 379da1bb401SStefano Zampini + pc - the preconditioning context 380da1bb401SStefano Zampini 381da1bb401SStefano Zampini Output Parameters: 382da1bb401SStefano Zampini + DirichletBoundaries - index set defining the subdomain part of Dirichlet boundaries 383da1bb401SStefano Zampini 384da1bb401SStefano Zampini Level: intermediate 385da1bb401SStefano Zampini 386da1bb401SStefano Zampini Notes: 387da1bb401SStefano Zampini 388da1bb401SStefano Zampini .seealso: PCBDDC 389da1bb401SStefano Zampini @*/ 390da1bb401SStefano Zampini PetscErrorCode PCBDDCGetDirichletBoundaries(PC pc,IS *DirichletBoundaries) 391da1bb401SStefano Zampini { 392da1bb401SStefano Zampini PetscErrorCode ierr; 393da1bb401SStefano Zampini 394da1bb401SStefano Zampini PetscFunctionBegin; 395da1bb401SStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 396da1bb401SStefano Zampini ierr = PetscUseMethod(pc,"PCBDDCGetDirichletBoundaries_C",(PC,IS*),(pc,DirichletBoundaries));CHKERRQ(ierr); 397da1bb401SStefano Zampini PetscFunctionReturn(0); 398da1bb401SStefano Zampini } 399da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */ 4001e6b0712SBarry Smith 401da1bb401SStefano Zampini #undef __FUNCT__ 40253cdbc3dSStefano Zampini #define __FUNCT__ "PCBDDCGetNeumannBoundaries_BDDC" 40353cdbc3dSStefano Zampini static PetscErrorCode PCBDDCGetNeumannBoundaries_BDDC(PC pc,IS *NeumannBoundaries) 40453cdbc3dSStefano Zampini { 40553cdbc3dSStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 40653cdbc3dSStefano Zampini 40753cdbc3dSStefano Zampini PetscFunctionBegin; 40853cdbc3dSStefano Zampini *NeumannBoundaries = pcbddc->NeumannBoundaries; 40953cdbc3dSStefano Zampini PetscFunctionReturn(0); 41053cdbc3dSStefano Zampini } 4111e6b0712SBarry Smith 41253cdbc3dSStefano Zampini #undef __FUNCT__ 41353cdbc3dSStefano Zampini #define __FUNCT__ "PCBDDCGetNeumannBoundaries" 41453cdbc3dSStefano Zampini /*@ 415da1bb401SStefano Zampini PCBDDCGetNeumannBoundaries - Get index set defining subdomain part (in local ordering) 416da1bb401SStefano Zampini of Neumann boundaries for the global problem. 41753cdbc3dSStefano Zampini 4189c0446d6SStefano Zampini Not collective 41953cdbc3dSStefano Zampini 42053cdbc3dSStefano Zampini Input Parameters: 42153cdbc3dSStefano Zampini + pc - the preconditioning context 42253cdbc3dSStefano Zampini 42353cdbc3dSStefano Zampini Output Parameters: 42453cdbc3dSStefano Zampini + NeumannBoundaries - index set defining the subdomain part of Neumann boundaries 42553cdbc3dSStefano Zampini 42653cdbc3dSStefano Zampini Level: intermediate 42753cdbc3dSStefano Zampini 42853cdbc3dSStefano Zampini Notes: 42953cdbc3dSStefano Zampini 43053cdbc3dSStefano Zampini .seealso: PCBDDC 43153cdbc3dSStefano Zampini @*/ 43253cdbc3dSStefano Zampini PetscErrorCode PCBDDCGetNeumannBoundaries(PC pc,IS *NeumannBoundaries) 43353cdbc3dSStefano Zampini { 43453cdbc3dSStefano Zampini PetscErrorCode ierr; 43553cdbc3dSStefano Zampini 43653cdbc3dSStefano Zampini PetscFunctionBegin; 43753cdbc3dSStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 43853cdbc3dSStefano Zampini ierr = PetscUseMethod(pc,"PCBDDCGetNeumannBoundaries_C",(PC,IS*),(pc,NeumannBoundaries));CHKERRQ(ierr); 4390c7d97c5SJed Brown PetscFunctionReturn(0); 4400c7d97c5SJed Brown } 44136e030ebSStefano Zampini /* -------------------------------------------------------------------------- */ 4421e6b0712SBarry Smith 44336e030ebSStefano Zampini #undef __FUNCT__ 444da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetLocalAdjacencyGraph_BDDC" 4451a83f524SJed Brown static PetscErrorCode PCBDDCSetLocalAdjacencyGraph_BDDC(PC pc, PetscInt nvtxs,const PetscInt xadj[],const PetscInt adjncy[], PetscCopyMode copymode) 44636e030ebSStefano Zampini { 44736e030ebSStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 448da1bb401SStefano Zampini PCBDDCGraph mat_graph = pcbddc->mat_graph; 449da1bb401SStefano Zampini PetscErrorCode ierr; 45036e030ebSStefano Zampini 45136e030ebSStefano Zampini PetscFunctionBegin; 452674ae819SStefano Zampini /* free old CSR */ 453674ae819SStefano Zampini ierr = PCBDDCGraphResetCSR(mat_graph);CHKERRQ(ierr); 454674ae819SStefano Zampini /* get CSR into graph structure */ 455da1bb401SStefano Zampini if (copymode == PETSC_COPY_VALUES) { 456674ae819SStefano Zampini ierr = PetscMalloc((nvtxs+1)*sizeof(PetscInt),&mat_graph->xadj);CHKERRQ(ierr); 457674ae819SStefano Zampini ierr = PetscMalloc(xadj[nvtxs]*sizeof(PetscInt),&mat_graph->adjncy);CHKERRQ(ierr); 458674ae819SStefano Zampini ierr = PetscMemcpy(mat_graph->xadj,xadj,(nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr); 459674ae819SStefano Zampini ierr = PetscMemcpy(mat_graph->adjncy,adjncy,xadj[nvtxs]*sizeof(PetscInt));CHKERRQ(ierr); 460da1bb401SStefano Zampini } else if (copymode == PETSC_OWN_POINTER) { 4611a83f524SJed Brown mat_graph->xadj = (PetscInt*)xadj; 4621a83f524SJed Brown mat_graph->adjncy = (PetscInt*)adjncy; 463674ae819SStefano Zampini } 464575ad6abSStefano Zampini mat_graph->nvtxs_csr = nvtxs; 46536e030ebSStefano Zampini PetscFunctionReturn(0); 46636e030ebSStefano Zampini } 4671e6b0712SBarry Smith 46836e030ebSStefano Zampini #undef __FUNCT__ 469da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetLocalAdjacencyGraph" 47036e030ebSStefano Zampini /*@ 471da1bb401SStefano Zampini PCBDDCSetLocalAdjacencyGraph - Set CSR graph of local matrix for use of PCBDDC. 47236e030ebSStefano Zampini 47336e030ebSStefano Zampini Not collective 47436e030ebSStefano Zampini 47536e030ebSStefano Zampini Input Parameters: 47636e030ebSStefano Zampini + pc - the preconditioning context 477da1bb401SStefano Zampini - nvtxs - number of local vertices of the graph 478da1bb401SStefano Zampini - xadj, adjncy - the CSR graph 479da1bb401SStefano Zampini - copymode - either PETSC_COPY_VALUES or PETSC_OWN_POINTER. In the former case the user must free the array passed in; 480da1bb401SStefano Zampini in the latter case, memory must be obtained with PetscMalloc. 48136e030ebSStefano Zampini 48236e030ebSStefano Zampini Level: intermediate 48336e030ebSStefano Zampini 48436e030ebSStefano Zampini Notes: 48536e030ebSStefano Zampini 48636e030ebSStefano Zampini .seealso: PCBDDC 48736e030ebSStefano Zampini @*/ 4881a83f524SJed Brown PetscErrorCode PCBDDCSetLocalAdjacencyGraph(PC pc,PetscInt nvtxs,const PetscInt xadj[],const PetscInt adjncy[], PetscCopyMode copymode) 48936e030ebSStefano Zampini { 490575ad6abSStefano Zampini void (*f)(void) = 0; 49136e030ebSStefano Zampini PetscErrorCode ierr; 49236e030ebSStefano Zampini 49336e030ebSStefano Zampini PetscFunctionBegin; 49436e030ebSStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 495674ae819SStefano Zampini PetscValidIntPointer(xadj,3); 496674ae819SStefano Zampini PetscValidIntPointer(xadj,4); 497674ae819SStefano Zampini if (copymode != PETSC_COPY_VALUES && copymode != PETSC_OWN_POINTER) { 498674ae819SStefano Zampini SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_SUP,"Unsupported copy mode %d in %s\n",copymode,__FUNCT__); 499da1bb401SStefano Zampini } 50036e030ebSStefano Zampini ierr = PetscTryMethod(pc,"PCBDDCSetLocalAdjacencyGraph_C",(PC,PetscInt,const PetscInt[],const PetscInt[],PetscCopyMode),(pc,nvtxs,xadj,adjncy,copymode));CHKERRQ(ierr); 501575ad6abSStefano Zampini /* free arrays if PCBDDC is not the PC type */ 502575ad6abSStefano Zampini ierr = PetscObjectQueryFunction((PetscObject)pc,"PCBDDCSetLocalAdjacencyGraph_C",&f);CHKERRQ(ierr); 503575ad6abSStefano Zampini if (!f && copymode == PETSC_OWN_POINTER) { 504575ad6abSStefano Zampini ierr = PetscFree(xadj);CHKERRQ(ierr); 505575ad6abSStefano Zampini ierr = PetscFree(adjncy);CHKERRQ(ierr); 50636e030ebSStefano Zampini } 50736e030ebSStefano Zampini PetscFunctionReturn(0); 50836e030ebSStefano Zampini } 5099c0446d6SStefano Zampini /* -------------------------------------------------------------------------- */ 5101e6b0712SBarry Smith 5119c0446d6SStefano Zampini #undef __FUNCT__ 5129c0446d6SStefano Zampini #define __FUNCT__ "PCBDDCSetDofsSplitting_BDDC" 5139c0446d6SStefano Zampini static PetscErrorCode PCBDDCSetDofsSplitting_BDDC(PC pc,PetscInt n_is, IS ISForDofs[]) 5149c0446d6SStefano Zampini { 5159c0446d6SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 5169c0446d6SStefano Zampini PetscInt i; 5179c0446d6SStefano Zampini PetscErrorCode ierr; 5189c0446d6SStefano Zampini 5199c0446d6SStefano Zampini PetscFunctionBegin; 520da1bb401SStefano Zampini /* Destroy ISes if they were already set */ 5219c0446d6SStefano Zampini for (i=0;i<pcbddc->n_ISForDofs;i++) { 5229c0446d6SStefano Zampini ierr = ISDestroy(&pcbddc->ISForDofs[i]);CHKERRQ(ierr); 5239c0446d6SStefano Zampini } 524d11ae9bbSstefano_zampini ierr = PetscFree(pcbddc->ISForDofs);CHKERRQ(ierr); 525da1bb401SStefano Zampini /* allocate space then set */ 5269c0446d6SStefano Zampini ierr = PetscMalloc(n_is*sizeof(IS),&pcbddc->ISForDofs);CHKERRQ(ierr); 5279c0446d6SStefano Zampini for (i=0;i<n_is;i++) { 528da1bb401SStefano Zampini ierr = PetscObjectReference((PetscObject)ISForDofs[i]);CHKERRQ(ierr); 529da1bb401SStefano Zampini pcbddc->ISForDofs[i]=ISForDofs[i]; 5309c0446d6SStefano Zampini } 5319c0446d6SStefano Zampini pcbddc->n_ISForDofs=n_is; 5329c0446d6SStefano Zampini PetscFunctionReturn(0); 5339c0446d6SStefano Zampini } 5341e6b0712SBarry Smith 5359c0446d6SStefano Zampini #undef __FUNCT__ 5369c0446d6SStefano Zampini #define __FUNCT__ "PCBDDCSetDofsSplitting" 5379c0446d6SStefano Zampini /*@ 538da1bb401SStefano Zampini PCBDDCSetDofsSplitting - Set index sets defining fields of local mat. 5399c0446d6SStefano Zampini 5409c0446d6SStefano Zampini Not collective 5419c0446d6SStefano Zampini 5429c0446d6SStefano Zampini Input Parameters: 5439c0446d6SStefano Zampini + pc - the preconditioning context 544da1bb401SStefano Zampini - n - number of index sets defining the fields 545da1bb401SStefano Zampini - IS[] - array of IS describing the fields 5469c0446d6SStefano Zampini 5479c0446d6SStefano Zampini Level: intermediate 5489c0446d6SStefano Zampini 5499c0446d6SStefano Zampini Notes: 5509c0446d6SStefano Zampini 5519c0446d6SStefano Zampini .seealso: PCBDDC 5529c0446d6SStefano Zampini @*/ 5539c0446d6SStefano Zampini PetscErrorCode PCBDDCSetDofsSplitting(PC pc,PetscInt n_is, IS ISForDofs[]) 5549c0446d6SStefano Zampini { 5559c0446d6SStefano Zampini PetscErrorCode ierr; 5569c0446d6SStefano Zampini 5579c0446d6SStefano Zampini PetscFunctionBegin; 5589c0446d6SStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 5599c0446d6SStefano Zampini ierr = PetscTryMethod(pc,"PCBDDCSetDofsSplitting_C",(PC,PetscInt,IS[]),(pc,n_is,ISForDofs));CHKERRQ(ierr); 5609c0446d6SStefano Zampini PetscFunctionReturn(0); 5619c0446d6SStefano Zampini } 562da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */ 563534831adSStefano Zampini #undef __FUNCT__ 564534831adSStefano Zampini #define __FUNCT__ "PCPreSolve_BDDC" 565534831adSStefano Zampini /* -------------------------------------------------------------------------- */ 566534831adSStefano Zampini /* 567534831adSStefano Zampini PCPreSolve_BDDC - Changes the right hand side and (if necessary) the initial 568534831adSStefano Zampini guess if a transformation of basis approach has been selected. 5699c0446d6SStefano Zampini 570534831adSStefano Zampini Input Parameter: 571534831adSStefano Zampini + pc - the preconditioner contex 572534831adSStefano Zampini 573534831adSStefano Zampini Application Interface Routine: PCPreSolve() 574534831adSStefano Zampini 575534831adSStefano Zampini Notes: 576534831adSStefano Zampini The interface routine PCPreSolve() is not usually called directly by 577534831adSStefano Zampini the user, but instead is called by KSPSolve(). 578534831adSStefano Zampini */ 579534831adSStefano Zampini static PetscErrorCode PCPreSolve_BDDC(PC pc, KSP ksp, Vec rhs, Vec x) 580534831adSStefano Zampini { 581534831adSStefano Zampini PetscErrorCode ierr; 582534831adSStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 583534831adSStefano Zampini PC_IS *pcis = (PC_IS*)(pc->data); 584534831adSStefano Zampini Mat_IS *matis = (Mat_IS*)pc->pmat->data; 585534831adSStefano Zampini Mat temp_mat; 5863972b0daSStefano Zampini IS dirIS; 5873972b0daSStefano Zampini PetscInt dirsize,i,*is_indices; 5883972b0daSStefano Zampini PetscScalar *array_x,*array_diagonal; 5893972b0daSStefano Zampini Vec used_vec; 5903972b0daSStefano Zampini PetscBool guess_nonzero; 591534831adSStefano Zampini 592534831adSStefano Zampini PetscFunctionBegin; 5933972b0daSStefano Zampini if (x) { 5943972b0daSStefano Zampini ierr = PetscObjectReference((PetscObject)x);CHKERRQ(ierr); 5953972b0daSStefano Zampini used_vec = x; 5963972b0daSStefano Zampini } else { 5973972b0daSStefano Zampini ierr = PetscObjectReference((PetscObject)pcbddc->temp_solution);CHKERRQ(ierr); 5983972b0daSStefano Zampini used_vec = pcbddc->temp_solution; 5993972b0daSStefano Zampini ierr = VecSet(used_vec,0.0);CHKERRQ(ierr); 6003972b0daSStefano Zampini } 6013972b0daSStefano Zampini /* hack into ksp data structure PCPreSolve comes earlier in src/ksp/ksp/interface/itfunc.c */ 6023972b0daSStefano Zampini if (ksp) { 6033972b0daSStefano Zampini ierr = KSPGetInitialGuessNonzero(ksp,&guess_nonzero);CHKERRQ(ierr); 6043972b0daSStefano Zampini if ( !guess_nonzero ) { 6053972b0daSStefano Zampini ierr = VecSet(used_vec,0.0);CHKERRQ(ierr); 6063972b0daSStefano Zampini } 6073972b0daSStefano Zampini } 6083972b0daSStefano Zampini /* store the original rhs */ 6093972b0daSStefano Zampini ierr = VecCopy(rhs,pcbddc->original_rhs);CHKERRQ(ierr); 6103972b0daSStefano Zampini 6113972b0daSStefano Zampini /* Take into account zeroed rows -> change rhs and store solution removed */ 6123972b0daSStefano Zampini ierr = MatGetDiagonal(pc->pmat,pcis->vec1_global);CHKERRQ(ierr); 6133972b0daSStefano Zampini ierr = VecPointwiseDivide(pcis->vec1_global,rhs,pcis->vec1_global);CHKERRQ(ierr); 6143972b0daSStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 6153972b0daSStefano Zampini ierr = VecScatterEnd(matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 6163972b0daSStefano Zampini ierr = VecScatterBegin(matis->ctx,used_vec,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 6173972b0daSStefano Zampini ierr = VecScatterEnd(matis->ctx,used_vec,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 6183972b0daSStefano Zampini ierr = PCBDDCGetDirichletBoundaries(pc,&dirIS);CHKERRQ(ierr); 6193972b0daSStefano Zampini if (dirIS) { 6203972b0daSStefano Zampini ierr = ISGetSize(dirIS,&dirsize);CHKERRQ(ierr); 6213972b0daSStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array_x);CHKERRQ(ierr); 6223972b0daSStefano Zampini ierr = VecGetArray(pcis->vec2_N,&array_diagonal);CHKERRQ(ierr); 6233972b0daSStefano Zampini ierr = ISGetIndices(dirIS,(const PetscInt**)&is_indices);CHKERRQ(ierr); 6242fa5cd67SKarl Rupp for (i=0; i<dirsize; i++) array_x[is_indices[i]] = array_diagonal[is_indices[i]]; 6253972b0daSStefano Zampini ierr = ISRestoreIndices(dirIS,(const PetscInt**)&is_indices);CHKERRQ(ierr); 6263972b0daSStefano Zampini ierr = VecRestoreArray(pcis->vec2_N,&array_diagonal);CHKERRQ(ierr); 6273972b0daSStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array_x);CHKERRQ(ierr); 6283972b0daSStefano Zampini } 6293972b0daSStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 6303972b0daSStefano Zampini ierr = VecScatterEnd(matis->ctx,pcis->vec1_N,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 631b76ba322SStefano Zampini 6323972b0daSStefano Zampini /* remove the computed solution from the rhs */ 6333972b0daSStefano Zampini ierr = VecScale(used_vec,-1.0);CHKERRQ(ierr); 6343972b0daSStefano Zampini ierr = MatMultAdd(pc->pmat,used_vec,rhs,rhs);CHKERRQ(ierr); 6353972b0daSStefano Zampini ierr = VecScale(used_vec,-1.0);CHKERRQ(ierr); 636b76ba322SStefano Zampini 637b76ba322SStefano Zampini /* store partially computed solution and set initial guess */ 6383972b0daSStefano Zampini if (x) { 6393972b0daSStefano Zampini ierr = VecCopy(used_vec,pcbddc->temp_solution);CHKERRQ(ierr); 6403972b0daSStefano Zampini ierr = VecSet(used_vec,0.0);CHKERRQ(ierr); 64115aaf578SStefano Zampini if (pcbddc->use_exact_dirichlet && !pcbddc->coarse_psi_B) { 642b76ba322SStefano Zampini ierr = VecScatterBegin(pcis->global_to_D,rhs,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 643b76ba322SStefano Zampini ierr = VecScatterEnd (pcis->global_to_D,rhs,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 644b76ba322SStefano Zampini ierr = KSPSolve(pcbddc->ksp_D,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr); 645b76ba322SStefano Zampini ierr = VecScatterBegin(pcis->global_to_D,pcis->vec2_D,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 646b76ba322SStefano Zampini ierr = VecScatterEnd (pcis->global_to_D,pcis->vec2_D,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 647b76ba322SStefano Zampini if (ksp) { 648b76ba322SStefano Zampini ierr = KSPSetInitialGuessNonzero(ksp,PETSC_TRUE);CHKERRQ(ierr); 649b76ba322SStefano Zampini } 650b76ba322SStefano Zampini } 6513972b0daSStefano Zampini } 652b76ba322SStefano Zampini 653b76ba322SStefano Zampini /* rhs change of basis */ 654674ae819SStefano Zampini if (pcbddc->use_change_of_basis) { 655b76ba322SStefano Zampini /* swap pointers for local matrices */ 656b76ba322SStefano Zampini temp_mat = matis->A; 657b76ba322SStefano Zampini matis->A = pcbddc->local_mat; 658b76ba322SStefano Zampini pcbddc->local_mat = temp_mat; 659b76ba322SStefano Zampini /* Get local rhs and apply transformation of basis */ 660b76ba322SStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,rhs,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 661b76ba322SStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,rhs,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 662b76ba322SStefano Zampini /* from original basis to modified basis */ 663b76ba322SStefano Zampini ierr = MatMultTranspose(pcbddc->ChangeOfBasisMatrix,pcis->vec1_B,pcis->vec2_B);CHKERRQ(ierr); 664b76ba322SStefano Zampini /* put back modified values into the global vec using INSERT_VALUES copy mode */ 665b76ba322SStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,pcis->vec2_B,rhs,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 666b76ba322SStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,pcis->vec2_B,rhs,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 667674ae819SStefano Zampini } 6680bdf917eSStefano Zampini if (ksp && pcbddc->NullSpace) { 669d0195637SJed Brown ierr = MatNullSpaceRemove(pcbddc->NullSpace,used_vec);CHKERRQ(ierr); 670d0195637SJed Brown ierr = MatNullSpaceRemove(pcbddc->NullSpace,rhs);CHKERRQ(ierr); 671b76ba322SStefano Zampini } 6720bdf917eSStefano Zampini ierr = VecDestroy(&used_vec);CHKERRQ(ierr); 673534831adSStefano Zampini PetscFunctionReturn(0); 674534831adSStefano Zampini } 675534831adSStefano Zampini /* -------------------------------------------------------------------------- */ 676534831adSStefano Zampini #undef __FUNCT__ 677534831adSStefano Zampini #define __FUNCT__ "PCPostSolve_BDDC" 678534831adSStefano Zampini /* -------------------------------------------------------------------------- */ 679534831adSStefano Zampini /* 680534831adSStefano Zampini PCPostSolve_BDDC - Changes the computed solution if a transformation of basis 681534831adSStefano Zampini approach has been selected. Also, restores rhs to its original state. 682534831adSStefano Zampini 683534831adSStefano Zampini Input Parameter: 684534831adSStefano Zampini + pc - the preconditioner contex 685534831adSStefano Zampini 686534831adSStefano Zampini Application Interface Routine: PCPostSolve() 687534831adSStefano Zampini 688534831adSStefano Zampini Notes: 689534831adSStefano Zampini The interface routine PCPostSolve() is not usually called directly by 690534831adSStefano Zampini the user, but instead is called by KSPSolve(). 691534831adSStefano Zampini */ 692534831adSStefano Zampini static PetscErrorCode PCPostSolve_BDDC(PC pc, KSP ksp, Vec rhs, Vec x) 693534831adSStefano Zampini { 694534831adSStefano Zampini PetscErrorCode ierr; 695534831adSStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 696534831adSStefano Zampini PC_IS *pcis = (PC_IS*)(pc->data); 697534831adSStefano Zampini Mat_IS *matis = (Mat_IS*)pc->pmat->data; 698534831adSStefano Zampini Mat temp_mat; 699534831adSStefano Zampini 700534831adSStefano Zampini PetscFunctionBegin; 701674ae819SStefano Zampini if (pcbddc->use_change_of_basis) { 702534831adSStefano Zampini /* swap pointers for local matrices */ 703534831adSStefano Zampini temp_mat = matis->A; 704534831adSStefano Zampini matis->A = pcbddc->local_mat; 705534831adSStefano Zampini pcbddc->local_mat = temp_mat; 706534831adSStefano Zampini /* restore rhs to its original state */ 7073425bc38SStefano Zampini if (rhs) { 7083425bc38SStefano Zampini ierr = VecCopy(pcbddc->original_rhs,rhs);CHKERRQ(ierr); 7093425bc38SStefano Zampini } 710534831adSStefano Zampini /* Get Local boundary and apply transformation of basis to solution vector */ 711534831adSStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,x,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 712534831adSStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,x,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 713534831adSStefano Zampini /* from modified basis to original basis */ 714534831adSStefano Zampini ierr = MatMult(pcbddc->ChangeOfBasisMatrix,pcis->vec1_B,pcis->vec2_B);CHKERRQ(ierr); 715534831adSStefano Zampini /* put back modified values into the global vec using INSERT_VALUES copy mode */ 716534831adSStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,pcis->vec2_B,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 717534831adSStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,pcis->vec2_B,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 718534831adSStefano Zampini } 7193972b0daSStefano Zampini /* add solution removed in presolve */ 7203425bc38SStefano Zampini if (x) { 7213425bc38SStefano Zampini ierr = VecAXPY(x,1.0,pcbddc->temp_solution);CHKERRQ(ierr); 7223425bc38SStefano Zampini } 723534831adSStefano Zampini PetscFunctionReturn(0); 724534831adSStefano Zampini } 725534831adSStefano Zampini /* -------------------------------------------------------------------------- */ 72653cdbc3dSStefano Zampini #undef __FUNCT__ 72753cdbc3dSStefano Zampini #define __FUNCT__ "PCSetUp_BDDC" 7280c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 7290c7d97c5SJed Brown /* 7300c7d97c5SJed Brown PCSetUp_BDDC - Prepares for the use of the BDDC preconditioner 7310c7d97c5SJed Brown by setting data structures and options. 7320c7d97c5SJed Brown 7330c7d97c5SJed Brown Input Parameter: 73453cdbc3dSStefano Zampini + pc - the preconditioner context 7350c7d97c5SJed Brown 7360c7d97c5SJed Brown Application Interface Routine: PCSetUp() 7370c7d97c5SJed Brown 7380c7d97c5SJed Brown Notes: 7390c7d97c5SJed Brown The interface routine PCSetUp() is not usually called directly by 7400c7d97c5SJed Brown the user, but instead is called by PCApply() if necessary. 7410c7d97c5SJed Brown */ 74253cdbc3dSStefano Zampini PetscErrorCode PCSetUp_BDDC(PC pc) 7430c7d97c5SJed Brown { 7440c7d97c5SJed Brown PetscErrorCode ierr; 7450c7d97c5SJed Brown PC_BDDC* pcbddc = (PC_BDDC*)pc->data; 746674ae819SStefano Zampini MatStructure flag; 747674ae819SStefano Zampini PetscBool computeis,computetopography,computesolvers; 7480c7d97c5SJed Brown 7490c7d97c5SJed Brown PetscFunctionBegin; 750674ae819SStefano Zampini /* the following lines of code should be replaced by a better logic between PCIS, PCNN, PCBDDC and other nonoverlapping preconditioners */ 7513b03a366Sstefano_zampini /* For BDDC we need to define a local "Neumann" problem different to that defined in PCISSetup 7529c0446d6SStefano Zampini So, we set to pcnone the Neumann problem of pcis in order to avoid unneeded computation 7530c7d97c5SJed Brown Also, we decide to directly build the (same) Dirichlet problem */ 7540c7d97c5SJed Brown ierr = PetscOptionsSetValue("-is_localN_pc_type","none");CHKERRQ(ierr); 7550c7d97c5SJed Brown ierr = PetscOptionsSetValue("-is_localD_pc_type","none");CHKERRQ(ierr); 7563b03a366Sstefano_zampini /* Get stdout for dbg */ 757674ae819SStefano Zampini if (pcbddc->dbg_flag && !pcbddc->dbg_viewer) { 758ce94432eSBarry Smith ierr = PetscViewerASCIIGetStdout(PetscObjectComm((PetscObject)pc),&pcbddc->dbg_viewer);CHKERRQ(ierr); 759e269702eSStefano Zampini ierr = PetscViewerASCIISynchronizedAllow(pcbddc->dbg_viewer,PETSC_TRUE);CHKERRQ(ierr); 760e269702eSStefano Zampini } 761674ae819SStefano Zampini /* first attempt to split work */ 762674ae819SStefano Zampini if (pc->setupcalled) { 763674ae819SStefano Zampini computeis = PETSC_FALSE; 764674ae819SStefano Zampini ierr = PCGetOperators(pc,NULL,NULL,&flag);CHKERRQ(ierr); 765674ae819SStefano Zampini if (flag == SAME_PRECONDITIONER) { 766674ae819SStefano Zampini computetopography = PETSC_FALSE; 767674ae819SStefano Zampini computesolvers = PETSC_FALSE; 768674ae819SStefano Zampini } else if (flag == SAME_NONZERO_PATTERN) { 769674ae819SStefano Zampini computetopography = PETSC_FALSE; 770674ae819SStefano Zampini computesolvers = PETSC_TRUE; 771674ae819SStefano Zampini } else { /* DIFFERENT_NONZERO_PATTERN */ 772674ae819SStefano Zampini computetopography = PETSC_TRUE; 773674ae819SStefano Zampini computesolvers = PETSC_TRUE; 774674ae819SStefano Zampini } 775674ae819SStefano Zampini } else { 776674ae819SStefano Zampini computeis = PETSC_TRUE; 777674ae819SStefano Zampini computetopography = PETSC_TRUE; 778674ae819SStefano Zampini computesolvers = PETSC_TRUE; 779674ae819SStefano Zampini } 780674ae819SStefano Zampini /* Set up all the "iterative substructuring" common block */ 781674ae819SStefano Zampini if (computeis) { 782674ae819SStefano Zampini ierr = PCISSetUp(pc);CHKERRQ(ierr); 783674ae819SStefano Zampini } 784674ae819SStefano Zampini /* Analyze interface and set up local constraint and change of basis matrices */ 785674ae819SStefano Zampini if (computetopography) { 786674ae819SStefano Zampini /* reset data */ 787674ae819SStefano Zampini ierr = PCBDDCResetTopography(pc);CHKERRQ(ierr); 788674ae819SStefano Zampini ierr = PCBDDCAnalyzeInterface(pc);CHKERRQ(ierr); 789674ae819SStefano Zampini ierr = PCBDDCConstraintsSetUp(pc);CHKERRQ(ierr); 790674ae819SStefano Zampini } 791674ae819SStefano Zampini if (computesolvers) { 792674ae819SStefano Zampini /* reset data */ 793674ae819SStefano Zampini ierr = PCBDDCResetSolvers(pc);CHKERRQ(ierr); 794674ae819SStefano Zampini ierr = PCBDDCScalingDestroy(pc);CHKERRQ(ierr); 7950c7d97c5SJed Brown /* Create coarse and local stuffs used for evaluating action of preconditioner */ 7960c7d97c5SJed Brown ierr = PCBDDCCoarseSetUp(pc);CHKERRQ(ierr); 797674ae819SStefano Zampini ierr = PCBDDCScalingSetUp(pc);CHKERRQ(ierr); 7980c7d97c5SJed Brown } 7990c7d97c5SJed Brown PetscFunctionReturn(0); 8000c7d97c5SJed Brown } 8010c7d97c5SJed Brown 8020c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 8030c7d97c5SJed Brown /* 8040c7d97c5SJed Brown PCApply_BDDC - Applies the BDDC preconditioner to a vector. 8050c7d97c5SJed Brown 8060c7d97c5SJed Brown Input Parameters: 8070c7d97c5SJed Brown . pc - the preconditioner context 8080c7d97c5SJed Brown . r - input vector (global) 8090c7d97c5SJed Brown 8100c7d97c5SJed Brown Output Parameter: 8110c7d97c5SJed Brown . z - output vector (global) 8120c7d97c5SJed Brown 8130c7d97c5SJed Brown Application Interface Routine: PCApply() 8140c7d97c5SJed Brown */ 8150c7d97c5SJed Brown #undef __FUNCT__ 8160c7d97c5SJed Brown #define __FUNCT__ "PCApply_BDDC" 81753cdbc3dSStefano Zampini PetscErrorCode PCApply_BDDC(PC pc,Vec r,Vec z) 8180c7d97c5SJed Brown { 8190c7d97c5SJed Brown PC_IS *pcis = (PC_IS*)(pc->data); 8200c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)(pc->data); 8210c7d97c5SJed Brown PetscErrorCode ierr; 8223b03a366Sstefano_zampini const PetscScalar one = 1.0; 8233b03a366Sstefano_zampini const PetscScalar m_one = -1.0; 8242617d88aSStefano Zampini const PetscScalar zero = 0.0; 8250c7d97c5SJed Brown 8260c7d97c5SJed Brown /* This code is similar to that provided in nn.c for PCNN 8270c7d97c5SJed Brown NN interface preconditioner changed to BDDC 82829622bf0SStefano Zampini Added support for M_3 preconditioner in the reference article (code is active if pcbddc->inexact_prec_type = PETSC_TRUE) */ 8290c7d97c5SJed Brown 8300c7d97c5SJed Brown PetscFunctionBegin; 83115aaf578SStefano Zampini if (!pcbddc->use_exact_dirichlet || pcbddc->coarse_psi_B) { 8320c7d97c5SJed Brown /* First Dirichlet solve */ 8330c7d97c5SJed Brown ierr = VecScatterBegin(pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8340c7d97c5SJed Brown ierr = VecScatterEnd (pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 83553cdbc3dSStefano Zampini ierr = KSPSolve(pcbddc->ksp_D,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr); 8360c7d97c5SJed Brown /* 8370c7d97c5SJed Brown Assembling right hand side for BDDC operator 838674ae819SStefano Zampini - pcis->vec1_D for the Dirichlet part (if needed, i.e. prec_flag=PETSC_TRUE) 839674ae819SStefano Zampini - pcis->vec1_B the interface part of the global vector z 8400c7d97c5SJed Brown */ 8410c7d97c5SJed Brown ierr = VecScale(pcis->vec2_D,m_one);CHKERRQ(ierr); 8420c7d97c5SJed Brown ierr = MatMult(pcis->A_BI,pcis->vec2_D,pcis->vec1_B);CHKERRQ(ierr); 84329622bf0SStefano Zampini if (pcbddc->inexact_prec_type) { ierr = MatMultAdd(pcis->A_II,pcis->vec2_D,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); } 8440c7d97c5SJed Brown ierr = VecScale(pcis->vec2_D,m_one);CHKERRQ(ierr); 8450c7d97c5SJed Brown ierr = VecCopy(r,z);CHKERRQ(ierr); 8460c7d97c5SJed Brown ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8470c7d97c5SJed Brown ierr = VecScatterEnd (pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 848674ae819SStefano Zampini ierr = PCBDDCScalingRestriction(pc,z,pcis->vec1_B);CHKERRQ(ierr); 849b76ba322SStefano Zampini } else { 8500bdf917eSStefano Zampini ierr = VecSet(pcis->vec1_D,zero);CHKERRQ(ierr); 851b76ba322SStefano Zampini ierr = VecSet(pcis->vec2_D,zero);CHKERRQ(ierr); 852674ae819SStefano Zampini ierr = PCBDDCScalingRestriction(pc,r,pcis->vec1_B);CHKERRQ(ierr); 853b76ba322SStefano Zampini } 854b76ba322SStefano Zampini 8552617d88aSStefano Zampini /* Apply interface preconditioner 8562617d88aSStefano Zampini input/output vecs: pcis->vec1_B and pcis->vec1_D */ 8572617d88aSStefano Zampini ierr = PCBDDCApplyInterfacePreconditioner(pc);CHKERRQ(ierr); 8582617d88aSStefano Zampini 859674ae819SStefano Zampini /* Apply transpose of partition of unity operator */ 860674ae819SStefano Zampini ierr = PCBDDCScalingExtension(pc,pcis->vec1_B,z);CHKERRQ(ierr); 8610c7d97c5SJed Brown 8623b03a366Sstefano_zampini /* Second Dirichlet solve and assembling of output */ 8630c7d97c5SJed Brown ierr = VecScatterBegin(pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8640c7d97c5SJed Brown ierr = VecScatterEnd (pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8650c7d97c5SJed Brown ierr = MatMult(pcis->A_IB,pcis->vec1_B,pcis->vec3_D);CHKERRQ(ierr); 86629622bf0SStefano Zampini if (pcbddc->inexact_prec_type) { ierr = MatMultAdd(pcis->A_II,pcis->vec1_D,pcis->vec3_D,pcis->vec3_D);CHKERRQ(ierr); } 86753cdbc3dSStefano Zampini ierr = KSPSolve(pcbddc->ksp_D,pcis->vec3_D,pcbddc->vec4_D);CHKERRQ(ierr); 8680c7d97c5SJed Brown ierr = VecScale(pcbddc->vec4_D,m_one);CHKERRQ(ierr); 86929622bf0SStefano Zampini if (pcbddc->inexact_prec_type) { ierr = VecAXPY (pcbddc->vec4_D,one,pcis->vec1_D);CHKERRQ(ierr); } 8700c7d97c5SJed Brown ierr = VecAXPY (pcis->vec2_D,one,pcbddc->vec4_D);CHKERRQ(ierr); 8710c7d97c5SJed Brown ierr = VecScatterBegin(pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8720c7d97c5SJed Brown ierr = VecScatterEnd (pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8730c7d97c5SJed Brown PetscFunctionReturn(0); 8740c7d97c5SJed Brown } 875da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */ 876674ae819SStefano Zampini 877da1bb401SStefano Zampini #undef __FUNCT__ 878da1bb401SStefano Zampini #define __FUNCT__ "PCDestroy_BDDC" 879da1bb401SStefano Zampini PetscErrorCode PCDestroy_BDDC(PC pc) 880da1bb401SStefano Zampini { 881da1bb401SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 882da1bb401SStefano Zampini PetscErrorCode ierr; 883da1bb401SStefano Zampini 884da1bb401SStefano Zampini PetscFunctionBegin; 885da1bb401SStefano Zampini /* free data created by PCIS */ 886da1bb401SStefano Zampini ierr = PCISDestroy(pc);CHKERRQ(ierr); 887674ae819SStefano Zampini /* free BDDC custom data */ 888674ae819SStefano Zampini ierr = PCBDDCResetCustomization(pc);CHKERRQ(ierr); 889674ae819SStefano Zampini /* destroy objects related to topography */ 890674ae819SStefano Zampini ierr = PCBDDCResetTopography(pc);CHKERRQ(ierr); 891674ae819SStefano Zampini /* free allocated graph structure */ 892da1bb401SStefano Zampini ierr = PetscFree(pcbddc->mat_graph);CHKERRQ(ierr); 893674ae819SStefano Zampini /* free data for scaling operator */ 894674ae819SStefano Zampini ierr = PCBDDCScalingDestroy(pc);CHKERRQ(ierr); 895674ae819SStefano Zampini /* free solvers stuff */ 896674ae819SStefano Zampini ierr = PCBDDCResetSolvers(pc);CHKERRQ(ierr); 89733bc96a4SStefano Zampini ierr = KSPDestroy(&pcbddc->ksp_D);CHKERRQ(ierr); 89833bc96a4SStefano Zampini ierr = KSPDestroy(&pcbddc->ksp_R);CHKERRQ(ierr); 8993425bc38SStefano Zampini /* remove functions */ 900674ae819SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCSetPrimalVerticesLocalIS_C",NULL);CHKERRQ(ierr); 901bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCSetCoarseningRatio_C",NULL);CHKERRQ(ierr); 902bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCSetMaxLevels_C",NULL);CHKERRQ(ierr); 903bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCSetNullSpace_C",NULL);CHKERRQ(ierr); 904bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCSetDirichletBoundaries_C",NULL);CHKERRQ(ierr); 905bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCSetNeumannBoundaries_C",NULL);CHKERRQ(ierr); 906bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCGetDirichletBoundaries_C",NULL);CHKERRQ(ierr); 907bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCGetNeumannBoundaries_C",NULL);CHKERRQ(ierr); 908bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCSetCoarseProblemType_C",NULL);CHKERRQ(ierr); 909bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCSetDofsSplitting_C",NULL);CHKERRQ(ierr); 910bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCSetLocalAdjacencyGraph_C",NULL);CHKERRQ(ierr); 911bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCCreateFETIDPOperators_C",NULL);CHKERRQ(ierr); 912bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCMatFETIDPGetRHS_C",NULL);CHKERRQ(ierr); 913bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCMatFETIDPGetSolution_C",NULL);CHKERRQ(ierr); 914674ae819SStefano Zampini /* Free the private data structure */ 915674ae819SStefano Zampini ierr = PetscFree(pc->data);CHKERRQ(ierr); 916da1bb401SStefano Zampini PetscFunctionReturn(0); 917da1bb401SStefano Zampini } 9183425bc38SStefano Zampini /* -------------------------------------------------------------------------- */ 9191e6b0712SBarry Smith 9203425bc38SStefano Zampini #undef __FUNCT__ 9213425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetRHS_BDDC" 9223425bc38SStefano Zampini static PetscErrorCode PCBDDCMatFETIDPGetRHS_BDDC(Mat fetidp_mat, Vec standard_rhs, Vec fetidp_flux_rhs) 9233425bc38SStefano Zampini { 924674ae819SStefano Zampini FETIDPMat_ctx mat_ctx; 9253425bc38SStefano Zampini PC_IS* pcis; 9263425bc38SStefano Zampini PC_BDDC* pcbddc; 9273425bc38SStefano Zampini PetscErrorCode ierr; 9280c7d97c5SJed Brown 9293425bc38SStefano Zampini PetscFunctionBegin; 9303425bc38SStefano Zampini ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr); 9313425bc38SStefano Zampini pcis = (PC_IS*)mat_ctx->pc->data; 9323425bc38SStefano Zampini pcbddc = (PC_BDDC*)mat_ctx->pc->data; 9333425bc38SStefano Zampini 9343425bc38SStefano Zampini /* change of basis for physical rhs if needed 9353425bc38SStefano Zampini It also changes the rhs in case of dirichlet boundaries */ 9360298fd71SBarry Smith (*mat_ctx->pc->ops->presolve)(mat_ctx->pc,NULL,standard_rhs,NULL); 9373425bc38SStefano Zampini /* store vectors for computation of fetidp final solution */ 9383425bc38SStefano Zampini ierr = VecScatterBegin(pcis->global_to_D,standard_rhs,mat_ctx->temp_solution_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 9393425bc38SStefano Zampini ierr = VecScatterEnd(pcis->global_to_D,standard_rhs,mat_ctx->temp_solution_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 940674ae819SStefano Zampini /* scale rhs since it should be unassembled : TODO use counter scaling? (also below) */ 9413425bc38SStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 9423425bc38SStefano Zampini ierr = VecScatterEnd(pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 943674ae819SStefano Zampini /* Apply partition of unity */ 9443425bc38SStefano Zampini ierr = VecPointwiseMult(mat_ctx->temp_solution_B,pcis->D,mat_ctx->temp_solution_B);CHKERRQ(ierr); 945674ae819SStefano Zampini /* ierr = PCBDDCScalingRestriction(mat_ctx->pc,standard_rhs,mat_ctx->temp_solution_B);CHKERRQ(ierr); */ 94629622bf0SStefano Zampini if (!pcbddc->inexact_prec_type) { 9473425bc38SStefano Zampini /* compute partially subassembled Schur complement right-hand side */ 9483425bc38SStefano Zampini ierr = KSPSolve(pcbddc->ksp_D,mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr); 9493425bc38SStefano Zampini ierr = MatMult(pcis->A_BI,pcis->vec1_D,pcis->vec1_B);CHKERRQ(ierr); 9503425bc38SStefano Zampini ierr = VecAXPY(mat_ctx->temp_solution_B,-1.0,pcis->vec1_B);CHKERRQ(ierr); 9513425bc38SStefano Zampini ierr = VecSet(standard_rhs,0.0);CHKERRQ(ierr); 9523425bc38SStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,mat_ctx->temp_solution_B,standard_rhs,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 9533425bc38SStefano Zampini ierr = VecScatterEnd(pcis->global_to_B,mat_ctx->temp_solution_B,standard_rhs,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 954674ae819SStefano Zampini /* ierr = PCBDDCScalingRestriction(mat_ctx->pc,standard_rhs,mat_ctx->temp_solution_B);CHKERRQ(ierr); */ 9553425bc38SStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 9563425bc38SStefano Zampini ierr = VecScatterEnd(pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 9573425bc38SStefano Zampini ierr = VecPointwiseMult(mat_ctx->temp_solution_B,pcis->D,mat_ctx->temp_solution_B);CHKERRQ(ierr); 9583425bc38SStefano Zampini } 9593425bc38SStefano Zampini /* BDDC rhs */ 9603425bc38SStefano Zampini ierr = VecCopy(mat_ctx->temp_solution_B,pcis->vec1_B);CHKERRQ(ierr); 96129622bf0SStefano Zampini if (pcbddc->inexact_prec_type) { 9623425bc38SStefano Zampini ierr = VecCopy(mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr); 9633425bc38SStefano Zampini } 9643425bc38SStefano Zampini /* apply BDDC */ 9653425bc38SStefano Zampini ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr); 9663425bc38SStefano Zampini /* Application of B_delta and assembling of rhs for fetidp fluxes */ 9673425bc38SStefano Zampini ierr = VecSet(fetidp_flux_rhs,0.0);CHKERRQ(ierr); 9683425bc38SStefano Zampini ierr = MatMult(mat_ctx->B_delta,pcis->vec1_B,mat_ctx->lambda_local);CHKERRQ(ierr); 9693425bc38SStefano Zampini ierr = VecScatterBegin(mat_ctx->l2g_lambda,mat_ctx->lambda_local,fetidp_flux_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 9703425bc38SStefano Zampini ierr = VecScatterEnd (mat_ctx->l2g_lambda,mat_ctx->lambda_local,fetidp_flux_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 9713425bc38SStefano Zampini /* restore original rhs */ 9723425bc38SStefano Zampini ierr = VecCopy(pcbddc->original_rhs,standard_rhs);CHKERRQ(ierr); 9733425bc38SStefano Zampini PetscFunctionReturn(0); 9743425bc38SStefano Zampini } 9751e6b0712SBarry Smith 9763425bc38SStefano Zampini #undef __FUNCT__ 9773425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetRHS" 9783425bc38SStefano Zampini /*@ 9793425bc38SStefano Zampini PCBDDCMatFETIDPGetRHS - Get rhs for FETIDP linear system. 9803425bc38SStefano Zampini 9813425bc38SStefano Zampini Collective 9823425bc38SStefano Zampini 9833425bc38SStefano Zampini Input Parameters: 9843425bc38SStefano Zampini + fetidp_mat - the FETIDP mat obtained by a call to PCBDDCCreateFETIDPOperators 9853425bc38SStefano Zampini + standard_rhs - the rhs of your linear system 9863425bc38SStefano Zampini 9873425bc38SStefano Zampini Output Parameters: 9883425bc38SStefano Zampini + fetidp_flux_rhs - the rhs of the FETIDP linear system 9893425bc38SStefano Zampini 9903425bc38SStefano Zampini Level: developer 9913425bc38SStefano Zampini 9923425bc38SStefano Zampini Notes: 9933425bc38SStefano Zampini 9943425bc38SStefano Zampini .seealso: PCBDDC 9953425bc38SStefano Zampini @*/ 9963425bc38SStefano Zampini PetscErrorCode PCBDDCMatFETIDPGetRHS(Mat fetidp_mat, Vec standard_rhs, Vec fetidp_flux_rhs) 9973425bc38SStefano Zampini { 998674ae819SStefano Zampini FETIDPMat_ctx mat_ctx; 9993425bc38SStefano Zampini PetscErrorCode ierr; 10003425bc38SStefano Zampini 10013425bc38SStefano Zampini PetscFunctionBegin; 10023425bc38SStefano Zampini ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr); 10033425bc38SStefano Zampini ierr = PetscTryMethod(mat_ctx->pc,"PCBDDCMatFETIDPGetRHS_C",(Mat,Vec,Vec),(fetidp_mat,standard_rhs,fetidp_flux_rhs));CHKERRQ(ierr); 10043425bc38SStefano Zampini PetscFunctionReturn(0); 10053425bc38SStefano Zampini } 10063425bc38SStefano Zampini /* -------------------------------------------------------------------------- */ 10071e6b0712SBarry Smith 10083425bc38SStefano Zampini #undef __FUNCT__ 10093425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetSolution_BDDC" 10103425bc38SStefano Zampini static PetscErrorCode PCBDDCMatFETIDPGetSolution_BDDC(Mat fetidp_mat, Vec fetidp_flux_sol, Vec standard_sol) 10113425bc38SStefano Zampini { 1012674ae819SStefano Zampini FETIDPMat_ctx mat_ctx; 10133425bc38SStefano Zampini PC_IS* pcis; 10143425bc38SStefano Zampini PC_BDDC* pcbddc; 10153425bc38SStefano Zampini PetscErrorCode ierr; 10163425bc38SStefano Zampini 10173425bc38SStefano Zampini PetscFunctionBegin; 10183425bc38SStefano Zampini ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr); 10193425bc38SStefano Zampini pcis = (PC_IS*)mat_ctx->pc->data; 10203425bc38SStefano Zampini pcbddc = (PC_BDDC*)mat_ctx->pc->data; 10213425bc38SStefano Zampini 10223425bc38SStefano Zampini /* apply B_delta^T */ 10233425bc38SStefano Zampini ierr = VecScatterBegin(mat_ctx->l2g_lambda,fetidp_flux_sol,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 10243425bc38SStefano Zampini ierr = VecScatterEnd (mat_ctx->l2g_lambda,fetidp_flux_sol,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 10253425bc38SStefano Zampini ierr = MatMultTranspose(mat_ctx->B_delta,mat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr); 10263425bc38SStefano Zampini /* compute rhs for BDDC application */ 10273425bc38SStefano Zampini ierr = VecAYPX(pcis->vec1_B,-1.0,mat_ctx->temp_solution_B);CHKERRQ(ierr); 102829622bf0SStefano Zampini if (pcbddc->inexact_prec_type) { 10293425bc38SStefano Zampini ierr = VecCopy(mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr); 10303425bc38SStefano Zampini } 10313425bc38SStefano Zampini /* apply BDDC */ 10323425bc38SStefano Zampini ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr); 10333425bc38SStefano Zampini /* put values into standard global vector */ 10343425bc38SStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 10353425bc38SStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,pcis->vec1_B,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 103629622bf0SStefano Zampini if (!pcbddc->inexact_prec_type) { 10373425bc38SStefano Zampini /* compute values into the interior if solved for the partially subassembled Schur complement */ 10383425bc38SStefano Zampini ierr = MatMult(pcis->A_IB,pcis->vec1_B,pcis->vec1_D);CHKERRQ(ierr); 10393425bc38SStefano Zampini ierr = VecAXPY(mat_ctx->temp_solution_D,-1.0,pcis->vec1_D);CHKERRQ(ierr); 10403425bc38SStefano Zampini ierr = KSPSolve(pcbddc->ksp_D,mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr); 10413425bc38SStefano Zampini } 10423425bc38SStefano Zampini ierr = VecScatterBegin(pcis->global_to_D,pcis->vec1_D,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 10433425bc38SStefano Zampini ierr = VecScatterEnd (pcis->global_to_D,pcis->vec1_D,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 10443425bc38SStefano Zampini /* final change of basis if needed 10453425bc38SStefano Zampini Is also sums the dirichlet part removed during RHS assembling */ 10460298fd71SBarry Smith (*mat_ctx->pc->ops->postsolve)(mat_ctx->pc,NULL,NULL,standard_sol); 10473425bc38SStefano Zampini PetscFunctionReturn(0); 10483425bc38SStefano Zampini 10493425bc38SStefano Zampini } 10501e6b0712SBarry Smith 10513425bc38SStefano Zampini #undef __FUNCT__ 10523425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetSolution" 10533425bc38SStefano Zampini /*@ 10543425bc38SStefano Zampini PCBDDCMatFETIDPGetSolution - Get Solution for FETIDP linear system. 10553425bc38SStefano Zampini 10563425bc38SStefano Zampini Collective 10573425bc38SStefano Zampini 10583425bc38SStefano Zampini Input Parameters: 10593425bc38SStefano Zampini + fetidp_mat - the FETIDP mat obtained by a call to PCBDDCCreateFETIDPOperators 10603425bc38SStefano Zampini + fetidp_flux_sol - the solution of the FETIDP linear system 10613425bc38SStefano Zampini 10623425bc38SStefano Zampini Output Parameters: 10633425bc38SStefano Zampini + standard_sol - the solution on the global domain 10643425bc38SStefano Zampini 10653425bc38SStefano Zampini Level: developer 10663425bc38SStefano Zampini 10673425bc38SStefano Zampini Notes: 10683425bc38SStefano Zampini 10693425bc38SStefano Zampini .seealso: PCBDDC 10703425bc38SStefano Zampini @*/ 10713425bc38SStefano Zampini PetscErrorCode PCBDDCMatFETIDPGetSolution(Mat fetidp_mat, Vec fetidp_flux_sol, Vec standard_sol) 10723425bc38SStefano Zampini { 1073674ae819SStefano Zampini FETIDPMat_ctx mat_ctx; 10743425bc38SStefano Zampini PetscErrorCode ierr; 10753425bc38SStefano Zampini 10763425bc38SStefano Zampini PetscFunctionBegin; 10773425bc38SStefano Zampini ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr); 10783425bc38SStefano Zampini ierr = PetscTryMethod(mat_ctx->pc,"PCBDDCMatFETIDPGetSolution_C",(Mat,Vec,Vec),(fetidp_mat,fetidp_flux_sol,standard_sol));CHKERRQ(ierr); 10793425bc38SStefano Zampini PetscFunctionReturn(0); 10803425bc38SStefano Zampini } 10813425bc38SStefano Zampini /* -------------------------------------------------------------------------- */ 10821e6b0712SBarry Smith 1083f23aa3ddSBarry Smith extern PetscErrorCode FETIDPMatMult(Mat,Vec,Vec); 1084f23aa3ddSBarry Smith extern PetscErrorCode PCBDDCDestroyFETIDPMat(Mat); 1085f23aa3ddSBarry Smith extern PetscErrorCode FETIDPPCApply(PC,Vec,Vec); 1086f23aa3ddSBarry Smith extern PetscErrorCode PCBDDCDestroyFETIDPPC(PC); 1087674ae819SStefano Zampini 10883425bc38SStefano Zampini #undef __FUNCT__ 10893425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPOperators_BDDC" 10903425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPOperators_BDDC(PC pc, Mat *fetidp_mat, PC *fetidp_pc) 10913425bc38SStefano Zampini { 1092674ae819SStefano Zampini 1093674ae819SStefano Zampini FETIDPMat_ctx fetidpmat_ctx; 10943425bc38SStefano Zampini Mat newmat; 1095674ae819SStefano Zampini FETIDPPC_ctx fetidppc_ctx; 10963425bc38SStefano Zampini PC newpc; 1097ce94432eSBarry Smith MPI_Comm comm; 10983425bc38SStefano Zampini PetscErrorCode ierr; 10993425bc38SStefano Zampini 11003425bc38SStefano Zampini PetscFunctionBegin; 1101ce94432eSBarry Smith ierr = PetscObjectGetComm((PetscObject)pc,&comm);CHKERRQ(ierr); 11023425bc38SStefano Zampini /* FETIDP linear matrix */ 11033425bc38SStefano Zampini ierr = PCBDDCCreateFETIDPMatContext(pc,&fetidpmat_ctx);CHKERRQ(ierr); 11043425bc38SStefano Zampini ierr = PCBDDCSetupFETIDPMatContext(fetidpmat_ctx);CHKERRQ(ierr); 11053425bc38SStefano Zampini ierr = MatCreateShell(comm,PETSC_DECIDE,PETSC_DECIDE,fetidpmat_ctx->n_lambda,fetidpmat_ctx->n_lambda,fetidpmat_ctx,&newmat);CHKERRQ(ierr); 11063425bc38SStefano Zampini ierr = MatShellSetOperation(newmat,MATOP_MULT,(void (*)(void))FETIDPMatMult);CHKERRQ(ierr); 11073425bc38SStefano Zampini ierr = MatShellSetOperation(newmat,MATOP_DESTROY,(void (*)(void))PCBDDCDestroyFETIDPMat);CHKERRQ(ierr); 11083425bc38SStefano Zampini ierr = MatSetUp(newmat);CHKERRQ(ierr); 11093425bc38SStefano Zampini /* FETIDP preconditioner */ 11103425bc38SStefano Zampini ierr = PCBDDCCreateFETIDPPCContext(pc,&fetidppc_ctx);CHKERRQ(ierr); 11113425bc38SStefano Zampini ierr = PCBDDCSetupFETIDPPCContext(newmat,fetidppc_ctx);CHKERRQ(ierr); 11123425bc38SStefano Zampini ierr = PCCreate(comm,&newpc);CHKERRQ(ierr); 11133425bc38SStefano Zampini ierr = PCSetType(newpc,PCSHELL);CHKERRQ(ierr); 11143425bc38SStefano Zampini ierr = PCShellSetContext(newpc,fetidppc_ctx);CHKERRQ(ierr); 11153425bc38SStefano Zampini ierr = PCShellSetApply(newpc,FETIDPPCApply);CHKERRQ(ierr); 11163425bc38SStefano Zampini ierr = PCShellSetDestroy(newpc,PCBDDCDestroyFETIDPPC);CHKERRQ(ierr); 11173425bc38SStefano Zampini ierr = PCSetOperators(newpc,newmat,newmat,SAME_PRECONDITIONER);CHKERRQ(ierr); 11183425bc38SStefano Zampini ierr = PCSetUp(newpc);CHKERRQ(ierr); 11193425bc38SStefano Zampini /* return pointers for objects created */ 11203425bc38SStefano Zampini *fetidp_mat=newmat; 11213425bc38SStefano Zampini *fetidp_pc=newpc; 11223425bc38SStefano Zampini PetscFunctionReturn(0); 11233425bc38SStefano Zampini } 11241e6b0712SBarry Smith 11253425bc38SStefano Zampini #undef __FUNCT__ 11263425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPOperators" 11273425bc38SStefano Zampini /*@ 11283425bc38SStefano Zampini PCBDDCCreateFETIDPOperators - Create operators for FETIDP. 11293425bc38SStefano Zampini 11303425bc38SStefano Zampini Collective 11313425bc38SStefano Zampini 11323425bc38SStefano Zampini Input Parameters: 11333425bc38SStefano Zampini + pc - the BDDC preconditioning context (setup must be already called) 11343425bc38SStefano Zampini 11353425bc38SStefano Zampini Level: developer 11363425bc38SStefano Zampini 11373425bc38SStefano Zampini Notes: 11383425bc38SStefano Zampini 11393425bc38SStefano Zampini .seealso: PCBDDC 11403425bc38SStefano Zampini @*/ 11413425bc38SStefano Zampini PetscErrorCode PCBDDCCreateFETIDPOperators(PC pc, Mat *fetidp_mat, PC *fetidp_pc) 11423425bc38SStefano Zampini { 11433425bc38SStefano Zampini PetscErrorCode ierr; 11443425bc38SStefano Zampini 11453425bc38SStefano Zampini PetscFunctionBegin; 11463425bc38SStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 11473425bc38SStefano Zampini if (pc->setupcalled) { 11483425bc38SStefano Zampini ierr = PetscTryMethod(pc,"PCBDDCCreateFETIDPOperators_C",(PC,Mat*,PC*),(pc,fetidp_mat,fetidp_pc));CHKERRQ(ierr); 1149f23aa3ddSBarry Smith } else SETERRQ(PETSC_COMM_SELF,PETSC_ERR_SUP,"You must call PCSetup_BDDC() first \n"); 11503425bc38SStefano Zampini PetscFunctionReturn(0); 11513425bc38SStefano Zampini } 11520c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 1153da1bb401SStefano Zampini /*MC 1154da1bb401SStefano Zampini PCBDDC - Balancing Domain Decomposition by Constraints. 11550c7d97c5SJed Brown 1156da1bb401SStefano Zampini Options Database Keys: 1157da1bb401SStefano Zampini . -pcbddc ??? - 1158da1bb401SStefano Zampini 1159da1bb401SStefano Zampini Level: intermediate 1160da1bb401SStefano Zampini 1161da1bb401SStefano Zampini Notes: The matrix used with this preconditioner must be of type MATIS 1162da1bb401SStefano Zampini 1163da1bb401SStefano Zampini Unlike more 'conventional' interface preconditioners, this iterates over ALL the 1164da1bb401SStefano Zampini degrees of freedom, NOT just those on the interface (this allows the use of approximate solvers 1165da1bb401SStefano Zampini on the subdomains). 1166da1bb401SStefano Zampini 1167da1bb401SStefano Zampini Options for the coarse grid preconditioner can be set with - 1168da1bb401SStefano Zampini Options for the Dirichlet subproblem can be set with - 1169da1bb401SStefano Zampini Options for the Neumann subproblem can be set with - 1170da1bb401SStefano Zampini 1171da1bb401SStefano Zampini Contributed by Stefano Zampini 1172da1bb401SStefano Zampini 1173da1bb401SStefano Zampini .seealso: PCCreate(), PCSetType(), PCType (for list of available types), PC, MATIS 1174da1bb401SStefano Zampini M*/ 1175b2573a8aSBarry Smith 1176da1bb401SStefano Zampini #undef __FUNCT__ 1177da1bb401SStefano Zampini #define __FUNCT__ "PCCreate_BDDC" 11788cc058d9SJed Brown PETSC_EXTERN PetscErrorCode PCCreate_BDDC(PC pc) 1179da1bb401SStefano Zampini { 1180da1bb401SStefano Zampini PetscErrorCode ierr; 1181da1bb401SStefano Zampini PC_BDDC *pcbddc; 1182da1bb401SStefano Zampini 1183da1bb401SStefano Zampini PetscFunctionBegin; 1184da1bb401SStefano Zampini /* Creates the private data structure for this preconditioner and attach it to the PC object. */ 1185da1bb401SStefano Zampini ierr = PetscNewLog(pc,PC_BDDC,&pcbddc);CHKERRQ(ierr); 1186da1bb401SStefano Zampini pc->data = (void*)pcbddc; 1187da1bb401SStefano Zampini 1188da1bb401SStefano Zampini /* create PCIS data structure */ 1189da1bb401SStefano Zampini ierr = PCISCreate(pc);CHKERRQ(ierr); 1190da1bb401SStefano Zampini 1191da1bb401SStefano Zampini /* BDDC specific */ 1192674ae819SStefano Zampini pcbddc->user_primal_vertices = 0; 11930bdf917eSStefano Zampini pcbddc->NullSpace = 0; 11943972b0daSStefano Zampini pcbddc->temp_solution = 0; 1195534831adSStefano Zampini pcbddc->original_rhs = 0; 1196534831adSStefano Zampini pcbddc->local_mat = 0; 1197534831adSStefano Zampini pcbddc->ChangeOfBasisMatrix = 0; 1198674ae819SStefano Zampini pcbddc->use_change_of_basis = PETSC_TRUE; 1199674ae819SStefano Zampini pcbddc->use_change_on_faces = PETSC_FALSE; 1200da1bb401SStefano Zampini pcbddc->coarse_vec = 0; 1201da1bb401SStefano Zampini pcbddc->coarse_rhs = 0; 1202da1bb401SStefano Zampini pcbddc->coarse_ksp = 0; 1203da1bb401SStefano Zampini pcbddc->coarse_phi_B = 0; 1204da1bb401SStefano Zampini pcbddc->coarse_phi_D = 0; 120515aaf578SStefano Zampini pcbddc->coarse_psi_B = 0; 120615aaf578SStefano Zampini pcbddc->coarse_psi_D = 0; 1207da1bb401SStefano Zampini pcbddc->vec1_P = 0; 1208da1bb401SStefano Zampini pcbddc->vec1_R = 0; 1209da1bb401SStefano Zampini pcbddc->vec2_R = 0; 1210da1bb401SStefano Zampini pcbddc->local_auxmat1 = 0; 1211da1bb401SStefano Zampini pcbddc->local_auxmat2 = 0; 1212da1bb401SStefano Zampini pcbddc->R_to_B = 0; 1213da1bb401SStefano Zampini pcbddc->R_to_D = 0; 1214da1bb401SStefano Zampini pcbddc->ksp_D = 0; 1215da1bb401SStefano Zampini pcbddc->ksp_R = 0; 1216da1bb401SStefano Zampini pcbddc->local_primal_indices = 0; 121729622bf0SStefano Zampini pcbddc->inexact_prec_type = PETSC_FALSE; 1218da1bb401SStefano Zampini pcbddc->NeumannBoundaries = 0; 1219da1bb401SStefano Zampini pcbddc->ISForDofs = 0; 1220da1bb401SStefano Zampini pcbddc->ConstraintMatrix = 0; 1221da1bb401SStefano Zampini pcbddc->use_nnsp_true = PETSC_FALSE; 1222da1bb401SStefano Zampini pcbddc->local_primal_sizes = 0; 1223da1bb401SStefano Zampini pcbddc->local_primal_displacements = 0; 1224da1bb401SStefano Zampini pcbddc->coarse_loc_to_glob = 0; 12259d9e44b6SStefano Zampini pcbddc->dbg_flag = 0; 1226da1bb401SStefano Zampini pcbddc->coarsening_ratio = 8; 1227b76ba322SStefano Zampini pcbddc->use_exact_dirichlet = PETSC_TRUE; 12284fad6a16SStefano Zampini pcbddc->current_level = 0; 12294fad6a16SStefano Zampini pcbddc->max_levels = 1; 1230674ae819SStefano Zampini pcbddc->replicated_local_primal_indices = 0; 1231674ae819SStefano Zampini pcbddc->replicated_local_primal_values = 0; 1232da1bb401SStefano Zampini 1233674ae819SStefano Zampini /* create local graph structure */ 1234674ae819SStefano Zampini ierr = PCBDDCGraphCreate(&pcbddc->mat_graph);CHKERRQ(ierr); 1235674ae819SStefano Zampini 1236674ae819SStefano Zampini /* scaling */ 1237674ae819SStefano Zampini pcbddc->use_deluxe_scaling = PETSC_FALSE; 1238674ae819SStefano Zampini pcbddc->work_scaling = 0; 1239da1bb401SStefano Zampini 1240da1bb401SStefano Zampini /* function pointers */ 1241da1bb401SStefano Zampini pc->ops->apply = PCApply_BDDC; 1242da1bb401SStefano Zampini pc->ops->applytranspose = 0; 1243da1bb401SStefano Zampini pc->ops->setup = PCSetUp_BDDC; 1244da1bb401SStefano Zampini pc->ops->destroy = PCDestroy_BDDC; 1245da1bb401SStefano Zampini pc->ops->setfromoptions = PCSetFromOptions_BDDC; 1246da1bb401SStefano Zampini pc->ops->view = 0; 1247da1bb401SStefano Zampini pc->ops->applyrichardson = 0; 1248da1bb401SStefano Zampini pc->ops->applysymmetricleft = 0; 1249da1bb401SStefano Zampini pc->ops->applysymmetricright = 0; 1250534831adSStefano Zampini pc->ops->presolve = PCPreSolve_BDDC; 1251534831adSStefano Zampini pc->ops->postsolve = PCPostSolve_BDDC; 1252da1bb401SStefano Zampini 1253da1bb401SStefano Zampini /* composing function */ 1254674ae819SStefano Zampini ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCSetPrimalVerticesLocalIS_C",PCBDDCSetPrimalVerticesLocalIS_BDDC);CHKERRQ(ierr); 1255bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCSetCoarseningRatio_C",PCBDDCSetCoarseningRatio_BDDC);CHKERRQ(ierr); 1256bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCSetMaxLevels_C",PCBDDCSetMaxLevels_BDDC);CHKERRQ(ierr); 1257bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCSetNullSpace_C",PCBDDCSetNullSpace_BDDC);CHKERRQ(ierr); 1258bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCSetDirichletBoundaries_C",PCBDDCSetDirichletBoundaries_BDDC);CHKERRQ(ierr); 1259bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCSetNeumannBoundaries_C",PCBDDCSetNeumannBoundaries_BDDC);CHKERRQ(ierr); 1260bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCGetDirichletBoundaries_C",PCBDDCGetDirichletBoundaries_BDDC);CHKERRQ(ierr); 1261bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCGetNeumannBoundaries_C",PCBDDCGetNeumannBoundaries_BDDC);CHKERRQ(ierr); 1262bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCSetCoarseProblemType_C",PCBDDCSetCoarseProblemType_BDDC);CHKERRQ(ierr); 1263bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCSetDofsSplitting_C",PCBDDCSetDofsSplitting_BDDC);CHKERRQ(ierr); 1264bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCSetLocalAdjacencyGraph_C",PCBDDCSetLocalAdjacencyGraph_BDDC);CHKERRQ(ierr); 1265bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCCreateFETIDPOperators_C",PCBDDCCreateFETIDPOperators_BDDC);CHKERRQ(ierr); 1266bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCMatFETIDPGetRHS_C",PCBDDCMatFETIDPGetRHS_BDDC);CHKERRQ(ierr); 1267bdf89e91SBarry Smith ierr = PetscObjectComposeFunction((PetscObject)pc,"PCBDDCMatFETIDPGetSolution_C",PCBDDCMatFETIDPGetSolution_BDDC);CHKERRQ(ierr); 1268da1bb401SStefano Zampini PetscFunctionReturn(0); 1269da1bb401SStefano Zampini } 12703425bc38SStefano Zampini 1271da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */ 1272da1bb401SStefano Zampini /* All static functions from now on */ 1273da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */ 127429622bf0SStefano Zampini 127529622bf0SStefano Zampini #undef __FUNCT__ 12764fad6a16SStefano Zampini #define __FUNCT__ "PCBDDCSetLevel" 12774fad6a16SStefano Zampini static PetscErrorCode PCBDDCSetLevel(PC pc,PetscInt level) 12784fad6a16SStefano Zampini { 12794fad6a16SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 12804fad6a16SStefano Zampini 12814fad6a16SStefano Zampini PetscFunctionBegin; 12824fad6a16SStefano Zampini pcbddc->current_level=level; 12834fad6a16SStefano Zampini PetscFunctionReturn(0); 12844fad6a16SStefano Zampini } 12853425bc38SStefano Zampini 12863b03a366Sstefano_zampini /* -------------------------------------------------------------------------- */ 12870c7d97c5SJed Brown #undef __FUNCT__ 12880c7d97c5SJed Brown #define __FUNCT__ "PCBDDCCoarseSetUp" 128953cdbc3dSStefano Zampini static PetscErrorCode PCBDDCCoarseSetUp(PC pc) 12900c7d97c5SJed Brown { 12910c7d97c5SJed Brown PetscErrorCode ierr; 1292674ae819SStefano Zampini 12930c7d97c5SJed Brown PC_IS* pcis = (PC_IS*)(pc->data); 12940c7d97c5SJed Brown PC_BDDC* pcbddc = (PC_BDDC*)pc->data; 12950c7d97c5SJed Brown Mat_IS *matis = (Mat_IS*)pc->pmat->data; 12960c7d97c5SJed Brown IS is_R_local; 129719fd82e9SBarry Smith VecType impVecType; 129819fd82e9SBarry Smith MatType impMatType; 12990c7d97c5SJed Brown PetscInt n_R=0; 13000c7d97c5SJed Brown PetscInt n_D=0; 13010c7d97c5SJed Brown PetscInt n_B=0; 13020c7d97c5SJed Brown PetscScalar zero=0.0; 13030c7d97c5SJed Brown PetscScalar one=1.0; 13040c7d97c5SJed Brown PetscScalar m_one=-1.0; 13050c7d97c5SJed Brown PetscScalar* array; 13060c7d97c5SJed Brown PetscScalar *coarse_submat_vals; 13070c7d97c5SJed Brown PetscInt *idx_R_local; 13085b08dc53SStefano Zampini PetscReal *coarsefunctions_errors,*constraints_errors; 13090c7d97c5SJed Brown /* auxiliary indices */ 1310534831adSStefano Zampini PetscInt i,j,k; 1311e269702eSStefano Zampini /* for verbose output of bddc */ 1312e269702eSStefano Zampini PetscViewer viewer=pcbddc->dbg_viewer; 13135b08dc53SStefano Zampini PetscInt dbg_flag=pcbddc->dbg_flag; 1314a0ba757dSStefano Zampini /* for counting coarse dofs */ 1315534831adSStefano Zampini PetscInt n_vertices,n_constraints; 13163b03a366Sstefano_zampini PetscInt size_of_constraint; 13173b03a366Sstefano_zampini PetscInt *row_cmat_indices; 13183b03a366Sstefano_zampini PetscScalar *row_cmat_values; 1319e6872a76SStefano Zampini PetscInt *vertices; 13200c7d97c5SJed Brown 13210c7d97c5SJed Brown PetscFunctionBegin; 13220c7d97c5SJed Brown /* Set Non-overlapping dimensions */ 13230c7d97c5SJed Brown n_B = pcis->n_B; n_D = pcis->n - n_B; 1324534831adSStefano Zampini 1325534831adSStefano Zampini /* transform local matrices if needed */ 1326674ae819SStefano Zampini if (pcbddc->use_change_of_basis) { 1327e6872a76SStefano Zampini Mat change_mat_all; 1328e6872a76SStefano Zampini PetscInt *nnz,*is_indices,*temp_indices; 1329e6872a76SStefano Zampini 1330534831adSStefano Zampini ierr = PetscMalloc(pcis->n*sizeof(PetscInt),&nnz);CHKERRQ(ierr); 1331534831adSStefano Zampini ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 13322fa5cd67SKarl Rupp for (i=0;i<n_D;i++) nnz[is_indices[i]] = 1; 1333534831adSStefano Zampini ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 1334534831adSStefano Zampini ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 1335534831adSStefano Zampini k=1; 1336534831adSStefano Zampini for (i=0;i<n_B;i++) { 13370298fd71SBarry Smith ierr = MatGetRow(pcbddc->ChangeOfBasisMatrix,i,&j,NULL,NULL);CHKERRQ(ierr); 1338534831adSStefano Zampini nnz[is_indices[i]]=j; 13392fa5cd67SKarl Rupp if (k < j) k = j; 13400298fd71SBarry Smith ierr = MatRestoreRow(pcbddc->ChangeOfBasisMatrix,i,&j,NULL,NULL);CHKERRQ(ierr); 1341534831adSStefano Zampini } 1342534831adSStefano Zampini ierr = ISRestoreIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 1343534831adSStefano Zampini /* assemble change of basis matrix on the whole set of local dofs */ 1344534831adSStefano Zampini ierr = PetscMalloc(k*sizeof(PetscInt),&temp_indices);CHKERRQ(ierr); 1345534831adSStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&change_mat_all);CHKERRQ(ierr); 1346534831adSStefano Zampini ierr = MatSetSizes(change_mat_all,pcis->n,pcis->n,pcis->n,pcis->n);CHKERRQ(ierr); 1347534831adSStefano Zampini ierr = MatSetType(change_mat_all,MATSEQAIJ);CHKERRQ(ierr); 1348534831adSStefano Zampini ierr = MatSeqAIJSetPreallocation(change_mat_all,0,nnz);CHKERRQ(ierr); 1349534831adSStefano Zampini ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 1350534831adSStefano Zampini for (i=0;i<n_D;i++) { 1351534831adSStefano Zampini ierr = MatSetValue(change_mat_all,is_indices[i],is_indices[i],1.0,INSERT_VALUES);CHKERRQ(ierr); 1352534831adSStefano Zampini } 1353534831adSStefano Zampini ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 1354534831adSStefano Zampini ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 1355534831adSStefano Zampini for (i=0;i<n_B;i++) { 1356534831adSStefano Zampini ierr = MatGetRow(pcbddc->ChangeOfBasisMatrix,i,&j,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr); 13572fa5cd67SKarl Rupp for (k=0; k<j; k++) temp_indices[k]=is_indices[row_cmat_indices[k]]; 1358534831adSStefano Zampini ierr = MatSetValues(change_mat_all,1,&is_indices[i],j,temp_indices,row_cmat_values,INSERT_VALUES);CHKERRQ(ierr); 1359534831adSStefano Zampini ierr = MatRestoreRow(pcbddc->ChangeOfBasisMatrix,i,&j,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr); 1360534831adSStefano Zampini } 1361534831adSStefano Zampini ierr = MatAssemblyBegin(change_mat_all,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1362534831adSStefano Zampini ierr = MatAssemblyEnd(change_mat_all,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 13635ce978abSStefano Zampini /* TODO: HOW TO WORK WITH BAIJ? PtAP not provided */ 13645ce978abSStefano Zampini ierr = MatGetBlockSize(matis->A,&i);CHKERRQ(ierr); 13655ce978abSStefano Zampini if (i==1) { 1366534831adSStefano Zampini ierr = MatPtAP(matis->A,change_mat_all,MAT_INITIAL_MATRIX,1.0,&pcbddc->local_mat);CHKERRQ(ierr); 13675ce978abSStefano Zampini } else { 13685ce978abSStefano Zampini Mat work_mat; 13695ce978abSStefano Zampini ierr = MatConvert(matis->A,MATSEQAIJ,MAT_INITIAL_MATRIX,&work_mat);CHKERRQ(ierr); 13705ce978abSStefano Zampini ierr = MatPtAP(work_mat,change_mat_all,MAT_INITIAL_MATRIX,1.0,&pcbddc->local_mat);CHKERRQ(ierr); 13715ce978abSStefano Zampini ierr = MatDestroy(&work_mat);CHKERRQ(ierr); 13725ce978abSStefano Zampini } 1373534831adSStefano Zampini ierr = MatDestroy(&change_mat_all);CHKERRQ(ierr); 1374534831adSStefano Zampini ierr = PetscFree(nnz);CHKERRQ(ierr); 1375534831adSStefano Zampini ierr = PetscFree(temp_indices);CHKERRQ(ierr); 1376534831adSStefano Zampini } else { 1377534831adSStefano Zampini /* without change of basis, the local matrix is unchanged */ 1378534831adSStefano Zampini ierr = PetscObjectReference((PetscObject)matis->A);CHKERRQ(ierr); 1379534831adSStefano Zampini pcbddc->local_mat = matis->A; 1380534831adSStefano Zampini } 138115aaf578SStefano Zampini /* need to rebuild PCIS matrices during SNES or TS -> TODO move this to PCIS code */ 138215aaf578SStefano Zampini ierr = MatDestroy(&pcis->A_IB);CHKERRQ(ierr); 138315aaf578SStefano Zampini ierr = MatDestroy(&pcis->A_BI);CHKERRQ(ierr); 138415aaf578SStefano Zampini ierr = MatDestroy(&pcis->A_BB);CHKERRQ(ierr); 138515aaf578SStefano Zampini ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_I_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&pcis->A_IB);CHKERRQ(ierr); 138615aaf578SStefano Zampini ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_B_local,pcis->is_I_local,MAT_INITIAL_MATRIX,&pcis->A_BI);CHKERRQ(ierr); 138715aaf578SStefano Zampini ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_B_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&pcis->A_BB);CHKERRQ(ierr); 1388674ae819SStefano Zampini /* Change global null space passed in by the user if change of basis has been requested */ 1389674ae819SStefano Zampini if (pcbddc->NullSpace && pcbddc->use_change_of_basis) { 1390674ae819SStefano Zampini ierr = PCBDDCNullSpaceAdaptGlobal(pc);CHKERRQ(ierr); 13910bdf917eSStefano Zampini } 1392a0ba757dSStefano Zampini 1393e6872a76SStefano Zampini /* Set types for local objects needed by BDDC precondtioner */ 1394e6872a76SStefano Zampini impMatType = MATSEQDENSE; 1395e6872a76SStefano Zampini impVecType = VECSEQ; 1396e6872a76SStefano Zampini /* get vertex indices from constraint matrix */ 1397e6872a76SStefano Zampini ierr = PCBDDCGetPrimalVerticesLocalIdx(pc,&n_vertices,&vertices);CHKERRQ(ierr); 1398e6872a76SStefano Zampini /* Set number of constraints */ 1399e6872a76SStefano Zampini n_constraints = pcbddc->local_primal_size-n_vertices; 14000c7d97c5SJed Brown /* Dohrmann's notation: dofs splitted in R (Remaining: all dofs but the vertices) and V (Vertices) */ 14010c7d97c5SJed Brown ierr = VecSet(pcis->vec1_N,one);CHKERRQ(ierr); 14020c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 14032fa5cd67SKarl Rupp for (i=0;i<n_vertices;i++) array[vertices[i]] = zero; 14043b03a366Sstefano_zampini ierr = PetscMalloc((pcis->n-n_vertices)*sizeof(PetscInt),&idx_R_local);CHKERRQ(ierr); 14052fa5cd67SKarl Rupp for (i=0, n_R=0; i<pcis->n; i++) { 14062fa5cd67SKarl Rupp if (array[i] == one) { 14072fa5cd67SKarl Rupp idx_R_local[n_R] = i; 14082fa5cd67SKarl Rupp n_R++; 14092fa5cd67SKarl Rupp } 14102fa5cd67SKarl Rupp } 14110c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 1412e6872a76SStefano Zampini ierr = PetscFree(vertices);CHKERRQ(ierr); 1413e269702eSStefano Zampini if (dbg_flag) { 14140c7d97c5SJed Brown ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr); 14150c7d97c5SJed Brown ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 14160c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d local dimensions\n",PetscGlobalRank);CHKERRQ(ierr); 14170c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local_size = %d, dirichlet_size = %d, boundary_size = %d\n",pcis->n,n_D,n_B);CHKERRQ(ierr); 14183b03a366Sstefano_zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"r_size = %d, v_size = %d, constraints = %d, local_primal_size = %d\n",n_R,n_vertices,n_constraints,pcbddc->local_primal_size);CHKERRQ(ierr); 1419534831adSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"pcbddc->n_vertices = %d, pcbddc->n_constraints = %d\n",pcbddc->n_vertices,pcbddc->n_constraints);CHKERRQ(ierr); 14200c7d97c5SJed Brown ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 14210c7d97c5SJed Brown } 1422534831adSStefano Zampini 14230c7d97c5SJed Brown /* Allocate needed vectors */ 1424534831adSStefano Zampini ierr = VecDuplicate(pcis->vec1_global,&pcbddc->original_rhs);CHKERRQ(ierr); 14253972b0daSStefano Zampini ierr = VecDuplicate(pcis->vec1_global,&pcbddc->temp_solution);CHKERRQ(ierr); 14260c7d97c5SJed Brown ierr = VecDuplicate(pcis->vec1_D,&pcbddc->vec4_D);CHKERRQ(ierr); 14270c7d97c5SJed Brown ierr = VecCreate(PETSC_COMM_SELF,&pcbddc->vec1_R);CHKERRQ(ierr); 14280c7d97c5SJed Brown ierr = VecSetSizes(pcbddc->vec1_R,n_R,n_R);CHKERRQ(ierr); 14290c7d97c5SJed Brown ierr = VecSetType(pcbddc->vec1_R,impVecType);CHKERRQ(ierr); 1430d49ef151SStefano Zampini ierr = VecDuplicate(pcbddc->vec1_R,&pcbddc->vec2_R);CHKERRQ(ierr); 14310c7d97c5SJed Brown ierr = VecCreate(PETSC_COMM_SELF,&pcbddc->vec1_P);CHKERRQ(ierr); 14320c7d97c5SJed Brown ierr = VecSetSizes(pcbddc->vec1_P,pcbddc->local_primal_size,pcbddc->local_primal_size);CHKERRQ(ierr); 14330c7d97c5SJed Brown ierr = VecSetType(pcbddc->vec1_P,impVecType);CHKERRQ(ierr); 14340c7d97c5SJed Brown 14350c7d97c5SJed Brown /* Creating some index sets needed */ 14360c7d97c5SJed Brown /* For submatrices */ 1437da1bb401SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,n_R,idx_R_local,PETSC_OWN_POINTER,&is_R_local);CHKERRQ(ierr); 1438da1bb401SStefano Zampini 14390c7d97c5SJed Brown /* For VecScatters pcbddc->R_to_B and (optionally) pcbddc->R_to_D */ 14400c7d97c5SJed Brown { 1441e6872a76SStefano Zampini IS is_aux1,is_aux2; 14420c7d97c5SJed Brown PetscInt *aux_array1; 14430c7d97c5SJed Brown PetscInt *aux_array2; 14442e8d2280SStefano Zampini PetscInt *idx_I_local; 14450c7d97c5SJed Brown 14463b03a366Sstefano_zampini ierr = PetscMalloc((pcis->n_B-n_vertices)*sizeof(PetscInt),&aux_array1);CHKERRQ(ierr); 14473b03a366Sstefano_zampini ierr = PetscMalloc((pcis->n_B-n_vertices)*sizeof(PetscInt),&aux_array2);CHKERRQ(ierr); 14480c7d97c5SJed Brown 14492e8d2280SStefano Zampini ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&idx_I_local);CHKERRQ(ierr); 14500c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 14512fa5cd67SKarl Rupp for (i=0; i<n_D; i++) array[idx_I_local[i]] = 0; 14522e8d2280SStefano Zampini ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&idx_I_local);CHKERRQ(ierr); 14532fa5cd67SKarl Rupp for (i=0, j=0; i<n_R; i++) { 14542fa5cd67SKarl Rupp if (array[idx_R_local[i]] == one) { 14552fa5cd67SKarl Rupp aux_array1[j] = i; 14562fa5cd67SKarl Rupp j++; 14572fa5cd67SKarl Rupp } 14582fa5cd67SKarl Rupp } 14590c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 1460da1bb401SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_COPY_VALUES,&is_aux1);CHKERRQ(ierr); 14612e8d2280SStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 14622e8d2280SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 14630c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr); 14642fa5cd67SKarl Rupp for (i=0, j=0; i<n_B; i++) { 14652fa5cd67SKarl Rupp if (array[i] == one) { 14662fa5cd67SKarl Rupp aux_array2[j] = i; j++; 14672fa5cd67SKarl Rupp } 14682fa5cd67SKarl Rupp } 14693828260eSStefano Zampini ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr); 1470da1bb401SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array2,PETSC_COPY_VALUES,&is_aux2);CHKERRQ(ierr); 14710c7d97c5SJed Brown ierr = VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_B,is_aux2,&pcbddc->R_to_B);CHKERRQ(ierr); 14720c7d97c5SJed Brown ierr = PetscFree(aux_array1);CHKERRQ(ierr); 14730c7d97c5SJed Brown ierr = PetscFree(aux_array2);CHKERRQ(ierr); 14740c7d97c5SJed Brown ierr = ISDestroy(&is_aux1);CHKERRQ(ierr); 14750c7d97c5SJed Brown ierr = ISDestroy(&is_aux2);CHKERRQ(ierr); 14760c7d97c5SJed Brown 147729622bf0SStefano Zampini if (pcbddc->inexact_prec_type || dbg_flag ) { 14780c7d97c5SJed Brown ierr = PetscMalloc(n_D*sizeof(PetscInt),&aux_array1);CHKERRQ(ierr); 14790c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 14802fa5cd67SKarl Rupp for (i=0, j=0; i<n_R; i++) { 14812fa5cd67SKarl Rupp if (array[idx_R_local[i]] == zero) { 14822fa5cd67SKarl Rupp aux_array1[j] = i; 14832fa5cd67SKarl Rupp j++; 14842fa5cd67SKarl Rupp } 14852fa5cd67SKarl Rupp } 14860c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 1487da1bb401SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_COPY_VALUES,&is_aux1);CHKERRQ(ierr); 14880c7d97c5SJed Brown ierr = VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_D,(IS)0,&pcbddc->R_to_D);CHKERRQ(ierr); 14890c7d97c5SJed Brown ierr = PetscFree(aux_array1);CHKERRQ(ierr); 14900c7d97c5SJed Brown ierr = ISDestroy(&is_aux1);CHKERRQ(ierr); 14910c7d97c5SJed Brown } 14920c7d97c5SJed Brown } 14930c7d97c5SJed Brown 1494*304d26faSStefano Zampini /* setup local solvers */ 1495*304d26faSStefano Zampini ierr = PCBDDCSetUpLocalSolvers(pc,pcis->is_I_local,is_R_local);CHKERRQ(ierr); 14960c7d97c5SJed Brown 14970c7d97c5SJed Brown /* Assemble all remaining stuff needed to apply BDDC */ 14980c7d97c5SJed Brown { 14990c7d97c5SJed Brown Mat A_RV,A_VR,A_VV; 15000bdf917eSStefano Zampini Mat M1; 15010c7d97c5SJed Brown Mat C_CR; 15023b03a366Sstefano_zampini Mat AUXMAT; 15030c7d97c5SJed Brown Vec vec1_C; 15040c7d97c5SJed Brown Vec vec2_C; 15050c7d97c5SJed Brown Vec vec1_V; 15060c7d97c5SJed Brown Vec vec2_V; 1507e6872a76SStefano Zampini IS is_C_local,is_V_local,is_aux1; 1508e6872a76SStefano Zampini ISLocalToGlobalMapping BtoNmap; 15090c7d97c5SJed Brown PetscInt *nnz; 1510e6872a76SStefano Zampini PetscInt *idx_V_B; 15110c7d97c5SJed Brown PetscInt *auxindices; 151253cdbc3dSStefano Zampini PetscInt index; 15130c7d97c5SJed Brown PetscScalar* array2; 15140c7d97c5SJed Brown MatFactorInfo matinfo; 151515aaf578SStefano Zampini PetscBool setsym=PETSC_FALSE,issym=PETSC_FALSE; 15160c7d97c5SJed Brown 15170c7d97c5SJed Brown /* Allocating some extra storage just to be safe */ 15180c7d97c5SJed Brown ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&nnz);CHKERRQ(ierr); 15190c7d97c5SJed Brown ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&auxindices);CHKERRQ(ierr); 15202fa5cd67SKarl Rupp for (i=0;i<pcis->n;i++) auxindices[i]=i; 15210c7d97c5SJed Brown 1522e6872a76SStefano Zampini ierr = PCBDDCGetPrimalVerticesLocalIdx(pc,&n_vertices,&vertices);CHKERRQ(ierr); 1523e6872a76SStefano Zampini /* vertices in boundary numbering */ 1524e6872a76SStefano Zampini ierr = PetscMalloc(n_vertices*sizeof(PetscInt),&idx_V_B);CHKERRQ(ierr); 1525e6872a76SStefano Zampini ierr = ISLocalToGlobalMappingCreateIS(pcis->is_B_local,&BtoNmap);CHKERRQ(ierr); 1526e6872a76SStefano Zampini ierr = ISGlobalToLocalMappingApply(BtoNmap,IS_GTOLM_DROP,n_vertices,vertices,&i,idx_V_B);CHKERRQ(ierr); 1527e6872a76SStefano Zampini ierr = ISLocalToGlobalMappingDestroy(&BtoNmap);CHKERRQ(ierr); 1528e6872a76SStefano Zampini if (i != n_vertices) { 1529e6872a76SStefano Zampini SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_SUP,"Error in boundary numbering for BDDC vertices! %d != %d\n",n_vertices,i); 1530e6872a76SStefano Zampini } 1531e6872a76SStefano Zampini 15320c7d97c5SJed Brown /* some work vectors on vertices and/or constraints */ 15333b03a366Sstefano_zampini if (n_vertices) { 15340c7d97c5SJed Brown ierr = VecCreate(PETSC_COMM_SELF,&vec1_V);CHKERRQ(ierr); 15353b03a366Sstefano_zampini ierr = VecSetSizes(vec1_V,n_vertices,n_vertices);CHKERRQ(ierr); 15360c7d97c5SJed Brown ierr = VecSetType(vec1_V,impVecType);CHKERRQ(ierr); 15370c7d97c5SJed Brown ierr = VecDuplicate(vec1_V,&vec2_V);CHKERRQ(ierr); 15380c7d97c5SJed Brown } 1539534831adSStefano Zampini if (n_constraints) { 15400c7d97c5SJed Brown ierr = VecCreate(PETSC_COMM_SELF,&vec1_C);CHKERRQ(ierr); 1541534831adSStefano Zampini ierr = VecSetSizes(vec1_C,n_constraints,n_constraints);CHKERRQ(ierr); 15420c7d97c5SJed Brown ierr = VecSetType(vec1_C,impVecType);CHKERRQ(ierr); 15430c7d97c5SJed Brown ierr = VecDuplicate(vec1_C,&vec2_C);CHKERRQ(ierr); 15440c7d97c5SJed Brown ierr = VecDuplicate(vec1_C,&pcbddc->vec1_C);CHKERRQ(ierr); 15450c7d97c5SJed Brown } 15460c7d97c5SJed Brown /* Precompute stuffs needed for preprocessing and application of BDDC*/ 15473b03a366Sstefano_zampini if (n_constraints) { 15480c7d97c5SJed Brown ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->local_auxmat2);CHKERRQ(ierr); 15493b03a366Sstefano_zampini ierr = MatSetSizes(pcbddc->local_auxmat2,n_R,n_constraints,n_R,n_constraints);CHKERRQ(ierr); 15500c7d97c5SJed Brown ierr = MatSetType(pcbddc->local_auxmat2,impMatType);CHKERRQ(ierr); 15510298fd71SBarry Smith ierr = MatSeqDenseSetPreallocation(pcbddc->local_auxmat2,NULL);CHKERRQ(ierr); 15520c7d97c5SJed Brown 155357a90decSStefano Zampini /* Create Constraint matrix on R nodes: C_{CR} */ 1554e6872a76SStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,n_constraints,n_vertices,1,&is_C_local);CHKERRQ(ierr); 155557a90decSStefano Zampini ierr = MatGetSubMatrix(pcbddc->ConstraintMatrix,is_C_local,is_R_local,MAT_INITIAL_MATRIX,&C_CR);CHKERRQ(ierr); 155657a90decSStefano Zampini ierr = ISDestroy(&is_C_local);CHKERRQ(ierr); 155757a90decSStefano Zampini 15580c7d97c5SJed Brown /* Assemble local_auxmat2 = - A_{RR}^{-1} C^T_{CR} needed by BDDC application */ 15593b03a366Sstefano_zampini for (i=0;i<n_constraints;i++) { 15603b03a366Sstefano_zampini ierr = VecSet(pcbddc->vec1_R,zero);CHKERRQ(ierr); 15613b03a366Sstefano_zampini /* Get row of constraint matrix in R numbering */ 156257a90decSStefano Zampini ierr = VecGetArray(pcbddc->vec1_R,&array);CHKERRQ(ierr); 156357a90decSStefano Zampini ierr = MatGetRow(C_CR,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr); 15642fa5cd67SKarl Rupp for (j=0;j<size_of_constraint;j++) array[row_cmat_indices[j]] = -row_cmat_values[j]; 156557a90decSStefano Zampini ierr = MatRestoreRow(C_CR,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr); 156657a90decSStefano Zampini ierr = VecRestoreArray(pcbddc->vec1_R,&array);CHKERRQ(ierr); 15672fa5cd67SKarl Rupp 15683b03a366Sstefano_zampini /* Solve for row of constraint matrix in R numbering */ 156953cdbc3dSStefano Zampini ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr); 15702fa5cd67SKarl Rupp 15713b03a366Sstefano_zampini /* Set values */ 15720c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec2_R,&array);CHKERRQ(ierr); 15733b03a366Sstefano_zampini ierr = MatSetValues(pcbddc->local_auxmat2,n_R,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr); 15740c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec2_R,&array);CHKERRQ(ierr); 15750c7d97c5SJed Brown } 15760c7d97c5SJed Brown ierr = MatAssemblyBegin(pcbddc->local_auxmat2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 15770c7d97c5SJed Brown ierr = MatAssemblyEnd(pcbddc->local_auxmat2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 15780c7d97c5SJed Brown 15790c7d97c5SJed Brown /* Assemble AUXMAT = ( LUFactor )( -C_{CR} A_{RR}^{-1} C^T_{CR} )^{-1} */ 15800c7d97c5SJed Brown ierr = MatMatMult(C_CR,pcbddc->local_auxmat2,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&AUXMAT);CHKERRQ(ierr); 1581d49ef151SStefano Zampini ierr = MatFactorInfoInitialize(&matinfo);CHKERRQ(ierr); 15823b03a366Sstefano_zampini ierr = ISCreateStride(PETSC_COMM_SELF,n_constraints,0,1,&is_aux1);CHKERRQ(ierr); 15830c7d97c5SJed Brown ierr = MatLUFactor(AUXMAT,is_aux1,is_aux1,&matinfo);CHKERRQ(ierr); 15840c7d97c5SJed Brown ierr = ISDestroy(&is_aux1);CHKERRQ(ierr); 15850c7d97c5SJed Brown 15863b03a366Sstefano_zampini /* Assemble explicitly M1 = ( C_{CR} A_{RR}^{-1} C^T_{CR} )^{-1} needed in preproc */ 1587d49ef151SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&M1);CHKERRQ(ierr); 15883b03a366Sstefano_zampini ierr = MatSetSizes(M1,n_constraints,n_constraints,n_constraints,n_constraints);CHKERRQ(ierr); 15890c7d97c5SJed Brown ierr = MatSetType(M1,impMatType);CHKERRQ(ierr); 15900298fd71SBarry Smith ierr = MatSeqDenseSetPreallocation(M1,NULL);CHKERRQ(ierr); 15913b03a366Sstefano_zampini for (i=0;i<n_constraints;i++) { 15920c7d97c5SJed Brown ierr = VecSet(vec1_C,zero);CHKERRQ(ierr); 15930c7d97c5SJed Brown ierr = VecSetValue(vec1_C,i,one,INSERT_VALUES);CHKERRQ(ierr); 15940c7d97c5SJed Brown ierr = VecAssemblyBegin(vec1_C);CHKERRQ(ierr); 15950c7d97c5SJed Brown ierr = VecAssemblyEnd(vec1_C);CHKERRQ(ierr); 15960c7d97c5SJed Brown ierr = MatSolve(AUXMAT,vec1_C,vec2_C);CHKERRQ(ierr); 15970c7d97c5SJed Brown ierr = VecScale(vec2_C,m_one);CHKERRQ(ierr); 15980c7d97c5SJed Brown ierr = VecGetArray(vec2_C,&array);CHKERRQ(ierr); 15993b03a366Sstefano_zampini ierr = MatSetValues(M1,n_constraints,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr); 16000c7d97c5SJed Brown ierr = VecRestoreArray(vec2_C,&array);CHKERRQ(ierr); 16010c7d97c5SJed Brown } 16020c7d97c5SJed Brown ierr = MatAssemblyBegin(M1,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 16030c7d97c5SJed Brown ierr = MatAssemblyEnd(M1,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 16040c7d97c5SJed Brown ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr); 16050c7d97c5SJed Brown /* Assemble local_auxmat1 = M1*C_{CR} needed by BDDC application in KSP and in preproc */ 16060c7d97c5SJed Brown ierr = MatMatMult(M1,C_CR,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&pcbddc->local_auxmat1);CHKERRQ(ierr); 16070c7d97c5SJed Brown 16080c7d97c5SJed Brown } 16090c7d97c5SJed Brown 16100c7d97c5SJed Brown /* Get submatrices from subdomain matrix */ 16113b03a366Sstefano_zampini if (n_vertices) { 161215aaf578SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,n_vertices,vertices,PETSC_COPY_VALUES,&is_V_local);CHKERRQ(ierr); 1613534831adSStefano Zampini ierr = MatGetSubMatrix(pcbddc->local_mat,is_R_local,is_V_local,MAT_INITIAL_MATRIX,&A_RV);CHKERRQ(ierr); 1614534831adSStefano Zampini ierr = MatGetSubMatrix(pcbddc->local_mat,is_V_local,is_R_local,MAT_INITIAL_MATRIX,&A_VR);CHKERRQ(ierr); 1615534831adSStefano Zampini ierr = MatGetSubMatrix(pcbddc->local_mat,is_V_local,is_V_local,MAT_INITIAL_MATRIX,&A_VV);CHKERRQ(ierr); 161615aaf578SStefano Zampini ierr = ISDestroy(&is_V_local);CHKERRQ(ierr); 16170c7d97c5SJed Brown } 16180c7d97c5SJed Brown 16190c7d97c5SJed Brown /* Matrix of coarse basis functions (local) */ 1620d49ef151SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->coarse_phi_B);CHKERRQ(ierr); 16210c7d97c5SJed Brown ierr = MatSetSizes(pcbddc->coarse_phi_B,n_B,pcbddc->local_primal_size,n_B,pcbddc->local_primal_size);CHKERRQ(ierr); 16220c7d97c5SJed Brown ierr = MatSetType(pcbddc->coarse_phi_B,impMatType);CHKERRQ(ierr); 16230298fd71SBarry Smith ierr = MatSeqDenseSetPreallocation(pcbddc->coarse_phi_B,NULL);CHKERRQ(ierr); 162429622bf0SStefano Zampini if (pcbddc->inexact_prec_type || dbg_flag ) { 1625d49ef151SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->coarse_phi_D);CHKERRQ(ierr); 16260c7d97c5SJed Brown ierr = MatSetSizes(pcbddc->coarse_phi_D,n_D,pcbddc->local_primal_size,n_D,pcbddc->local_primal_size);CHKERRQ(ierr); 16270c7d97c5SJed Brown ierr = MatSetType(pcbddc->coarse_phi_D,impMatType);CHKERRQ(ierr); 16280298fd71SBarry Smith ierr = MatSeqDenseSetPreallocation(pcbddc->coarse_phi_D,NULL);CHKERRQ(ierr); 16290c7d97c5SJed Brown } 16300c7d97c5SJed Brown 1631e269702eSStefano Zampini if (dbg_flag) { 16325b08dc53SStefano Zampini ierr = PetscMalloc(2*pcbddc->local_primal_size*sizeof(*coarsefunctions_errors),&coarsefunctions_errors);CHKERRQ(ierr); 16335b08dc53SStefano Zampini ierr = PetscMalloc(2*pcbddc->local_primal_size*sizeof(*constraints_errors),&constraints_errors);CHKERRQ(ierr); 16340c7d97c5SJed Brown } 16353b03a366Sstefano_zampini /* Subdomain contribution (Non-overlapping) to coarse matrix */ 16360c7d97c5SJed Brown ierr = PetscMalloc ((pcbddc->local_primal_size)*(pcbddc->local_primal_size)*sizeof(PetscScalar),&coarse_submat_vals);CHKERRQ(ierr); 16370c7d97c5SJed Brown 16380c7d97c5SJed Brown /* We are now ready to evaluate coarse basis functions and subdomain contribution to coarse problem */ 16393b03a366Sstefano_zampini for (i=0;i<n_vertices;i++){ 16400c7d97c5SJed Brown ierr = VecSet(vec1_V,zero);CHKERRQ(ierr); 16410c7d97c5SJed Brown ierr = VecSetValue(vec1_V,i,one,INSERT_VALUES);CHKERRQ(ierr); 16420c7d97c5SJed Brown ierr = VecAssemblyBegin(vec1_V);CHKERRQ(ierr); 16430c7d97c5SJed Brown ierr = VecAssemblyEnd(vec1_V);CHKERRQ(ierr); 16440c7d97c5SJed Brown /* solution of saddle point problem */ 16450bdf917eSStefano Zampini ierr = MatMult(A_RV,vec1_V,pcbddc->vec1_R);CHKERRQ(ierr); 16460bdf917eSStefano Zampini ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec1_R);CHKERRQ(ierr); 16470c7d97c5SJed Brown ierr = VecScale(pcbddc->vec1_R,m_one);CHKERRQ(ierr); 16483b03a366Sstefano_zampini if (n_constraints) { 16490c7d97c5SJed Brown ierr = MatMult(pcbddc->local_auxmat1,pcbddc->vec1_R,vec1_C);CHKERRQ(ierr); 16500c7d97c5SJed Brown ierr = MatMultAdd(pcbddc->local_auxmat2,vec1_C,pcbddc->vec1_R,pcbddc->vec1_R);CHKERRQ(ierr); 16510c7d97c5SJed Brown ierr = VecScale(vec1_C,m_one);CHKERRQ(ierr); 16520c7d97c5SJed Brown } 16530c7d97c5SJed Brown ierr = MatMult(A_VR,pcbddc->vec1_R,vec2_V);CHKERRQ(ierr); 16540c7d97c5SJed Brown ierr = MatMultAdd(A_VV,vec1_V,vec2_V,vec2_V);CHKERRQ(ierr); 16550c7d97c5SJed Brown 16560c7d97c5SJed Brown /* Set values in coarse basis function and subdomain part of coarse_mat */ 16570c7d97c5SJed Brown /* coarse basis functions */ 16580c7d97c5SJed Brown ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr); 16590c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 16600c7d97c5SJed Brown ierr = VecScatterEnd (pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 16610c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr); 16623b03a366Sstefano_zampini ierr = MatSetValues(pcbddc->coarse_phi_B,n_B,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr); 16630c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr); 16640c7d97c5SJed Brown ierr = MatSetValue(pcbddc->coarse_phi_B,idx_V_B[i],i,one,INSERT_VALUES);CHKERRQ(ierr); 166529622bf0SStefano Zampini if ( pcbddc->inexact_prec_type || dbg_flag ) { 16660c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 16670c7d97c5SJed Brown ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 16680c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_D,&array);CHKERRQ(ierr); 16693b03a366Sstefano_zampini ierr = MatSetValues(pcbddc->coarse_phi_D,n_D,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr); 16700c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_D,&array);CHKERRQ(ierr); 16710c7d97c5SJed Brown } 16720c7d97c5SJed Brown /* subdomain contribution to coarse matrix */ 16730c7d97c5SJed Brown ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr); 16742fa5cd67SKarl Rupp for (j=0; j<n_vertices; j++) coarse_submat_vals[i*pcbddc->local_primal_size+j] = array[j]; /* WARNING -> column major ordering */ 16750c7d97c5SJed Brown ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr); 16763b03a366Sstefano_zampini if (n_constraints) { 16770c7d97c5SJed Brown ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr); 16782fa5cd67SKarl Rupp for (j=0; j<n_constraints; j++) coarse_submat_vals[i*pcbddc->local_primal_size+j+n_vertices] = array[j]; /* WARNING -> column major ordering */ 16790c7d97c5SJed Brown ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr); 16800c7d97c5SJed Brown } 16810c7d97c5SJed Brown 1682e269702eSStefano Zampini if ( dbg_flag ) { 16830c7d97c5SJed Brown /* assemble subdomain vector on nodes */ 1684d49ef151SStefano Zampini ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr); 16850c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 16860c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr); 16872fa5cd67SKarl Rupp for (j=0;j<n_R;j++) array[idx_R_local[j]] = array2[j]; 16883b03a366Sstefano_zampini array[ vertices[i] ] = one; 16890c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr); 16900c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 16910c7d97c5SJed Brown /* assemble subdomain vector of lagrange multipliers (i.e. primal nodes) */ 1692d49ef151SStefano Zampini ierr = VecSet(pcbddc->vec1_P,zero);CHKERRQ(ierr); 16930c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr); 16940c7d97c5SJed Brown ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr); 16952fa5cd67SKarl Rupp for (j=0;j<n_vertices;j++) array2[j]=array[j]; 16960c7d97c5SJed Brown ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr); 16973b03a366Sstefano_zampini if (n_constraints) { 16980c7d97c5SJed Brown ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr); 16992fa5cd67SKarl Rupp for (j=0;j<n_constraints;j++) array2[j+n_vertices]=array[j]; 17000c7d97c5SJed Brown ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr); 17010c7d97c5SJed Brown } 17020c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr); 17030c7d97c5SJed Brown ierr = VecScale(pcbddc->vec1_P,m_one);CHKERRQ(ierr); 17040c7d97c5SJed Brown /* check saddle point solution */ 1705534831adSStefano Zampini ierr = MatMult(pcbddc->local_mat,pcis->vec1_N,pcis->vec2_N);CHKERRQ(ierr); 17063b03a366Sstefano_zampini ierr = MatMultTransposeAdd(pcbddc->ConstraintMatrix,pcbddc->vec1_P,pcis->vec2_N,pcis->vec2_N);CHKERRQ(ierr); 17073b03a366Sstefano_zampini ierr = VecNorm(pcis->vec2_N,NORM_INFINITY,&coarsefunctions_errors[i]);CHKERRQ(ierr); 17083b03a366Sstefano_zampini ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr); 17090c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 17103b03a366Sstefano_zampini array[i]=array[i]+m_one; /* shift by the identity matrix */ 17110c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 17123b03a366Sstefano_zampini ierr = VecNorm(pcbddc->vec1_P,NORM_INFINITY,&constraints_errors[i]);CHKERRQ(ierr); 17130c7d97c5SJed Brown } 17140c7d97c5SJed Brown } 17150c7d97c5SJed Brown 17163b03a366Sstefano_zampini for (i=0;i<n_constraints;i++){ 1717d49ef151SStefano Zampini ierr = VecSet(vec2_C,zero);CHKERRQ(ierr); 17180c7d97c5SJed Brown ierr = VecSetValue(vec2_C,i,m_one,INSERT_VALUES);CHKERRQ(ierr); 17190c7d97c5SJed Brown ierr = VecAssemblyBegin(vec2_C);CHKERRQ(ierr); 17200c7d97c5SJed Brown ierr = VecAssemblyEnd(vec2_C);CHKERRQ(ierr); 17210c7d97c5SJed Brown /* solution of saddle point problem */ 17220c7d97c5SJed Brown ierr = MatMult(M1,vec2_C,vec1_C);CHKERRQ(ierr); 17230c7d97c5SJed Brown ierr = MatMult(pcbddc->local_auxmat2,vec1_C,pcbddc->vec1_R);CHKERRQ(ierr); 17240c7d97c5SJed Brown ierr = VecScale(vec1_C,m_one);CHKERRQ(ierr); 17253b03a366Sstefano_zampini if (n_vertices) { ierr = MatMult(A_VR,pcbddc->vec1_R,vec2_V);CHKERRQ(ierr); } 17260c7d97c5SJed Brown /* Set values in coarse basis function and subdomain part of coarse_mat */ 17270c7d97c5SJed Brown /* coarse basis functions */ 17283b03a366Sstefano_zampini index=i+n_vertices; 17290c7d97c5SJed Brown ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr); 17300c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 17310c7d97c5SJed Brown ierr = VecScatterEnd(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 17320c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr); 173353cdbc3dSStefano Zampini ierr = MatSetValues(pcbddc->coarse_phi_B,n_B,auxindices,1,&index,array,INSERT_VALUES);CHKERRQ(ierr); 17340c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr); 173529622bf0SStefano Zampini if ( pcbddc->inexact_prec_type || dbg_flag ) { 17360c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 17370c7d97c5SJed Brown ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 17380c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_D,&array);CHKERRQ(ierr); 173953cdbc3dSStefano Zampini ierr = MatSetValues(pcbddc->coarse_phi_D,n_D,auxindices,1,&index,array,INSERT_VALUES);CHKERRQ(ierr); 17400c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_D,&array);CHKERRQ(ierr); 17410c7d97c5SJed Brown } 17420c7d97c5SJed Brown /* subdomain contribution to coarse matrix */ 17433b03a366Sstefano_zampini if (n_vertices) { 17440c7d97c5SJed Brown ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr); 17452fa5cd67SKarl Rupp for (j=0; j<n_vertices; j++) coarse_submat_vals[index*pcbddc->local_primal_size+j]=array[j]; /* WARNING -> column major ordering */ 17460c7d97c5SJed Brown ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr); 17470c7d97c5SJed Brown } 17480c7d97c5SJed Brown ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr); 17492fa5cd67SKarl Rupp for (j=0; j<n_constraints; j++) coarse_submat_vals[index*pcbddc->local_primal_size+j+n_vertices]=array[j]; /* WARNING -> column major ordering */ 17500c7d97c5SJed Brown ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr); 17510c7d97c5SJed Brown 1752e269702eSStefano Zampini if ( dbg_flag ) { 17530c7d97c5SJed Brown /* assemble subdomain vector on nodes */ 175453cdbc3dSStefano Zampini ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr); 17550c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 17560c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr); 17572fa5cd67SKarl Rupp for (j=0;j<n_R;j++) array[idx_R_local[j]] = array2[j]; 17580c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr); 17590c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 17600c7d97c5SJed Brown /* assemble subdomain vector of lagrange multipliers */ 176153cdbc3dSStefano Zampini ierr = VecSet(pcbddc->vec1_P,zero);CHKERRQ(ierr); 17620c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr); 17633b03a366Sstefano_zampini if ( n_vertices) { 17640c7d97c5SJed Brown ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr); 17652fa5cd67SKarl Rupp for (j=0;j<n_vertices;j++) array2[j]=-array[j]; 17660c7d97c5SJed Brown ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr); 17670c7d97c5SJed Brown } 17680c7d97c5SJed Brown ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr); 17693b03a366Sstefano_zampini for (j=0;j<n_constraints;j++) {array2[j+n_vertices]=-array[j];} 17700c7d97c5SJed Brown ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr); 17710c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr); 17723972b0daSStefano Zampini /* check saddle point solution */ 1773534831adSStefano Zampini ierr = MatMult(pcbddc->local_mat,pcis->vec1_N,pcis->vec2_N);CHKERRQ(ierr); 17743b03a366Sstefano_zampini ierr = MatMultTransposeAdd(pcbddc->ConstraintMatrix,pcbddc->vec1_P,pcis->vec2_N,pcis->vec2_N);CHKERRQ(ierr); 177553cdbc3dSStefano Zampini ierr = VecNorm(pcis->vec2_N,NORM_INFINITY,&coarsefunctions_errors[index]);CHKERRQ(ierr); 17763b03a366Sstefano_zampini ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr); 17770c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 177853cdbc3dSStefano Zampini array[index]=array[index]+m_one; /* shift by the identity matrix */ 17790c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 178053cdbc3dSStefano Zampini ierr = VecNorm(pcbddc->vec1_P,NORM_INFINITY,&constraints_errors[index]);CHKERRQ(ierr); 17810c7d97c5SJed Brown } 17820c7d97c5SJed Brown } 17830c7d97c5SJed Brown ierr = MatAssemblyBegin(pcbddc->coarse_phi_B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 17840c7d97c5SJed Brown ierr = MatAssemblyEnd(pcbddc->coarse_phi_B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 178529622bf0SStefano Zampini if ( pcbddc->inexact_prec_type || dbg_flag ) { 17860c7d97c5SJed Brown ierr = MatAssemblyBegin(pcbddc->coarse_phi_D,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 17870c7d97c5SJed Brown ierr = MatAssemblyEnd(pcbddc->coarse_phi_D,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 17880c7d97c5SJed Brown } 178915aaf578SStefano Zampini /* compute other basis functions for non-symmetric problems */ 179015aaf578SStefano Zampini ierr = MatIsSymmetricKnown(pc->pmat,&setsym,&issym);CHKERRQ(ierr); 179115aaf578SStefano Zampini if ( !setsym || (setsym && !issym) ) { 179215aaf578SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->coarse_psi_B);CHKERRQ(ierr); 179315aaf578SStefano Zampini ierr = MatSetSizes(pcbddc->coarse_psi_B,n_B,pcbddc->local_primal_size,n_B,pcbddc->local_primal_size);CHKERRQ(ierr); 179415aaf578SStefano Zampini ierr = MatSetType(pcbddc->coarse_psi_B,impMatType);CHKERRQ(ierr); 179515aaf578SStefano Zampini ierr = MatSeqDenseSetPreallocation(pcbddc->coarse_psi_B,NULL);CHKERRQ(ierr); 179615aaf578SStefano Zampini if (pcbddc->inexact_prec_type || dbg_flag ) { 179715aaf578SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->coarse_psi_D);CHKERRQ(ierr); 179815aaf578SStefano Zampini ierr = MatSetSizes(pcbddc->coarse_psi_D,n_D,pcbddc->local_primal_size,n_D,pcbddc->local_primal_size);CHKERRQ(ierr); 179915aaf578SStefano Zampini ierr = MatSetType(pcbddc->coarse_psi_D,impMatType);CHKERRQ(ierr); 180015aaf578SStefano Zampini ierr = MatSeqDenseSetPreallocation(pcbddc->coarse_psi_D,NULL);CHKERRQ(ierr); 180115aaf578SStefano Zampini } 180215aaf578SStefano Zampini for (i=0;i<pcbddc->local_primal_size;i++) { 180315aaf578SStefano Zampini if (n_constraints) { 180415aaf578SStefano Zampini ierr = VecSet(vec1_C,zero);CHKERRQ(ierr); 180515aaf578SStefano Zampini ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr); 180615aaf578SStefano Zampini for (j=0;j<n_constraints;j++) { 180715aaf578SStefano Zampini array[j]=coarse_submat_vals[(j+n_vertices)*pcbddc->local_primal_size+i]; 180815aaf578SStefano Zampini } 180915aaf578SStefano Zampini ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr); 181015aaf578SStefano Zampini } 181115aaf578SStefano Zampini if (i<n_vertices) { 181215aaf578SStefano Zampini ierr = VecSet(vec1_V,zero);CHKERRQ(ierr); 181315aaf578SStefano Zampini ierr = VecSetValue(vec1_V,i,m_one,INSERT_VALUES);CHKERRQ(ierr); 181415aaf578SStefano Zampini ierr = VecAssemblyBegin(vec1_V);CHKERRQ(ierr); 181515aaf578SStefano Zampini ierr = VecAssemblyEnd(vec1_V);CHKERRQ(ierr); 181615aaf578SStefano Zampini ierr = MatMultTranspose(A_VR,vec1_V,pcbddc->vec1_R);CHKERRQ(ierr); 181715aaf578SStefano Zampini if (n_constraints) { 181815aaf578SStefano Zampini ierr = MatMultTransposeAdd(C_CR,vec1_C,pcbddc->vec1_R,pcbddc->vec1_R);CHKERRQ(ierr); 181915aaf578SStefano Zampini } 182015aaf578SStefano Zampini } else { 182115aaf578SStefano Zampini ierr = MatMultTranspose(C_CR,vec1_C,pcbddc->vec1_R);CHKERRQ(ierr); 182215aaf578SStefano Zampini } 182315aaf578SStefano Zampini ierr = KSPSolveTranspose(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec1_R);CHKERRQ(ierr); 182415aaf578SStefano Zampini ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr); 182515aaf578SStefano Zampini ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 182615aaf578SStefano Zampini ierr = VecScatterEnd(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 182715aaf578SStefano Zampini ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr); 182815aaf578SStefano Zampini ierr = MatSetValues(pcbddc->coarse_psi_B,n_B,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr); 182915aaf578SStefano Zampini ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr); 183015aaf578SStefano Zampini if (i<n_vertices) { 183115aaf578SStefano Zampini ierr = MatSetValue(pcbddc->coarse_psi_B,idx_V_B[i],i,one,INSERT_VALUES);CHKERRQ(ierr); 183215aaf578SStefano Zampini } 183315aaf578SStefano Zampini if ( pcbddc->inexact_prec_type || dbg_flag ) { 183415aaf578SStefano Zampini ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 183515aaf578SStefano Zampini ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 183615aaf578SStefano Zampini ierr = VecGetArray(pcis->vec1_D,&array);CHKERRQ(ierr); 183715aaf578SStefano Zampini ierr = MatSetValues(pcbddc->coarse_psi_D,n_D,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr); 183815aaf578SStefano Zampini ierr = VecRestoreArray(pcis->vec1_D,&array);CHKERRQ(ierr); 183915aaf578SStefano Zampini } 184015aaf578SStefano Zampini 184115aaf578SStefano Zampini if ( dbg_flag ) { 184215aaf578SStefano Zampini /* assemble subdomain vector on nodes */ 184315aaf578SStefano Zampini ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr); 184415aaf578SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 184515aaf578SStefano Zampini ierr = VecGetArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr); 184615aaf578SStefano Zampini for (j=0;j<n_R;j++) array[idx_R_local[j]] = array2[j]; 184715aaf578SStefano Zampini if (i<n_vertices) array[vertices[i]] = one; 184815aaf578SStefano Zampini ierr = VecRestoreArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr); 184915aaf578SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 185015aaf578SStefano Zampini /* assemble subdomain vector of lagrange multipliers */ 185115aaf578SStefano Zampini ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 185215aaf578SStefano Zampini for (j=0;j<pcbddc->local_primal_size;j++) { 185315aaf578SStefano Zampini array[j]=-coarse_submat_vals[j*pcbddc->local_primal_size+i]; 185415aaf578SStefano Zampini } 185515aaf578SStefano Zampini ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 185615aaf578SStefano Zampini /* check saddle point solution */ 185715aaf578SStefano Zampini ierr = MatMultTranspose(pcbddc->local_mat,pcis->vec1_N,pcis->vec2_N);CHKERRQ(ierr); 185815aaf578SStefano Zampini ierr = MatMultTransposeAdd(pcbddc->ConstraintMatrix,pcbddc->vec1_P,pcis->vec2_N,pcis->vec2_N);CHKERRQ(ierr); 185915aaf578SStefano Zampini ierr = VecNorm(pcis->vec2_N,NORM_INFINITY,&coarsefunctions_errors[i+pcbddc->local_primal_size]);CHKERRQ(ierr); 186015aaf578SStefano Zampini ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr); 186115aaf578SStefano Zampini ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 186215aaf578SStefano Zampini array[i]=array[i]+m_one; /* shift by the identity matrix */ 186315aaf578SStefano Zampini ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 186415aaf578SStefano Zampini ierr = VecNorm(pcbddc->vec1_P,NORM_INFINITY,&constraints_errors[i+pcbddc->local_primal_size]);CHKERRQ(ierr); 186515aaf578SStefano Zampini } 186615aaf578SStefano Zampini } 186715aaf578SStefano Zampini ierr = MatAssemblyBegin(pcbddc->coarse_psi_B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 186815aaf578SStefano Zampini ierr = MatAssemblyEnd(pcbddc->coarse_psi_B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 186915aaf578SStefano Zampini if ( pcbddc->inexact_prec_type || dbg_flag ) { 187015aaf578SStefano Zampini ierr = MatAssemblyBegin(pcbddc->coarse_psi_D,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 187115aaf578SStefano Zampini ierr = MatAssemblyEnd(pcbddc->coarse_psi_D,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 187215aaf578SStefano Zampini } 187315aaf578SStefano Zampini } 187415aaf578SStefano Zampini ierr = PetscFree(idx_V_B);CHKERRQ(ierr); 18750c7d97c5SJed Brown /* Checking coarse_sub_mat and coarse basis functios */ 187615aaf578SStefano Zampini /* Symmetric case : It should be \Phi^{(j)^T} A^{(j)} \Phi^{(j)}=coarse_sub_mat */ 187715aaf578SStefano Zampini /* Non-symmetric case : It should be \Psi^{(j)^T} A^{(j)} \Phi^{(j)}=coarse_sub_mat */ 18789d2fce94SStefano Zampini if (dbg_flag) { 18790c7d97c5SJed Brown Mat coarse_sub_mat; 18800c7d97c5SJed Brown Mat TM1,TM2,TM3,TM4; 188115aaf578SStefano Zampini Mat coarse_phi_D,coarse_phi_B; 188215aaf578SStefano Zampini Mat coarse_psi_D,coarse_psi_B; 188315aaf578SStefano Zampini Mat A_II,A_BB,A_IB,A_BI; 188419fd82e9SBarry Smith MatType checkmattype=MATSEQAIJ; 18855b08dc53SStefano Zampini PetscReal real_value; 18860c7d97c5SJed Brown 1887c042a7c3SStefano Zampini ierr = MatConvert(pcis->A_II,checkmattype,MAT_INITIAL_MATRIX,&A_II);CHKERRQ(ierr); 1888c042a7c3SStefano Zampini ierr = MatConvert(pcis->A_IB,checkmattype,MAT_INITIAL_MATRIX,&A_IB);CHKERRQ(ierr); 1889c042a7c3SStefano Zampini ierr = MatConvert(pcis->A_BI,checkmattype,MAT_INITIAL_MATRIX,&A_BI);CHKERRQ(ierr); 1890c042a7c3SStefano Zampini ierr = MatConvert(pcis->A_BB,checkmattype,MAT_INITIAL_MATRIX,&A_BB);CHKERRQ(ierr); 1891c042a7c3SStefano Zampini ierr = MatConvert(pcbddc->coarse_phi_D,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_D);CHKERRQ(ierr); 1892c042a7c3SStefano Zampini ierr = MatConvert(pcbddc->coarse_phi_B,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_B);CHKERRQ(ierr); 189315aaf578SStefano Zampini if (pcbddc->coarse_psi_B) { 189415aaf578SStefano Zampini ierr = MatConvert(pcbddc->coarse_psi_D,checkmattype,MAT_INITIAL_MATRIX,&coarse_psi_D);CHKERRQ(ierr); 189515aaf578SStefano Zampini ierr = MatConvert(pcbddc->coarse_psi_B,checkmattype,MAT_INITIAL_MATRIX,&coarse_psi_B);CHKERRQ(ierr); 189615aaf578SStefano Zampini } 1897c042a7c3SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_size,coarse_submat_vals,&coarse_sub_mat);CHKERRQ(ierr); 18980c7d97c5SJed Brown 18990c7d97c5SJed Brown ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr); 19000c7d97c5SJed Brown ierr = PetscViewerASCIIPrintf(viewer,"Check coarse sub mat and local basis functions\n");CHKERRQ(ierr); 19010c7d97c5SJed Brown ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 190215aaf578SStefano Zampini if (pcbddc->coarse_psi_B) { 190315aaf578SStefano Zampini ierr = MatMatMult(A_II,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr); 190415aaf578SStefano Zampini ierr = MatTransposeMatMult(coarse_psi_D,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM1);CHKERRQ(ierr); 190515aaf578SStefano Zampini ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr); 190615aaf578SStefano Zampini ierr = MatMatMult(A_BB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr); 190715aaf578SStefano Zampini ierr = MatTransposeMatMult(coarse_psi_B,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM2);CHKERRQ(ierr); 190815aaf578SStefano Zampini ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr); 190915aaf578SStefano Zampini ierr = MatMatMult(A_IB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr); 191015aaf578SStefano Zampini ierr = MatTransposeMatMult(coarse_psi_D,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM3);CHKERRQ(ierr); 191115aaf578SStefano Zampini ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr); 191215aaf578SStefano Zampini ierr = MatMatMult(A_BI,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr); 191315aaf578SStefano Zampini ierr = MatTransposeMatMult(coarse_psi_B,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM4);CHKERRQ(ierr); 191415aaf578SStefano Zampini ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr); 191515aaf578SStefano Zampini } else { 191653cdbc3dSStefano Zampini ierr = MatPtAP(A_II,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&TM1);CHKERRQ(ierr); 191753cdbc3dSStefano Zampini ierr = MatPtAP(A_BB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&TM2);CHKERRQ(ierr); 191853cdbc3dSStefano Zampini ierr = MatMatMult(A_IB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr); 1919c042a7c3SStefano Zampini ierr = MatTransposeMatMult(coarse_phi_D,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM3);CHKERRQ(ierr); 192053cdbc3dSStefano Zampini ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr); 192153cdbc3dSStefano Zampini ierr = MatMatMult(A_BI,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr); 1922c042a7c3SStefano Zampini ierr = MatTransposeMatMult(coarse_phi_B,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM4);CHKERRQ(ierr); 192353cdbc3dSStefano Zampini ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr); 192415aaf578SStefano Zampini } 192553cdbc3dSStefano Zampini ierr = MatAXPY(TM1,one,TM2,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr); 192653cdbc3dSStefano Zampini ierr = MatAXPY(TM1,one,TM3,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr); 192753cdbc3dSStefano Zampini ierr = MatAXPY(TM1,one,TM4,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr); 192815aaf578SStefano Zampini ierr = MatConvert(TM1,MATSEQDENSE,MAT_REUSE_MATRIX,&TM1);CHKERRQ(ierr); 192915aaf578SStefano Zampini ierr = MatAXPY(TM1,m_one,coarse_sub_mat,SAME_NONZERO_PATTERN);CHKERRQ(ierr); 19305b08dc53SStefano Zampini ierr = MatNorm(TM1,NORM_INFINITY,&real_value);CHKERRQ(ierr); 19310c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"----------------------------------\n");CHKERRQ(ierr); 19320c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d \n",PetscGlobalRank);CHKERRQ(ierr); 19335b08dc53SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"matrix error = % 1.14e\n",real_value);CHKERRQ(ierr); 193415aaf578SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"coarse functions (phi) errors\n");CHKERRQ(ierr); 193515aaf578SStefano Zampini for (i=0;i<pcbddc->local_primal_size;i++) { 193615aaf578SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local %02d-th function error = % 1.14e\n",i,coarsefunctions_errors[i]);CHKERRQ(ierr); 193715aaf578SStefano Zampini } 193815aaf578SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"constraints (phi) errors\n");CHKERRQ(ierr); 193915aaf578SStefano Zampini for (i=0;i<pcbddc->local_primal_size;i++) { 194015aaf578SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local %02d-th function error = % 1.14e\n",i,constraints_errors[i]);CHKERRQ(ierr); 194115aaf578SStefano Zampini } 194215aaf578SStefano Zampini if (pcbddc->coarse_psi_B) { 194315aaf578SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"coarse functions (psi) errors\n");CHKERRQ(ierr); 194415aaf578SStefano Zampini for (i=pcbddc->local_primal_size;i<2*pcbddc->local_primal_size;i++) { 194515aaf578SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local %02d-th function error = % 1.14e\n",i-pcbddc->local_primal_size,coarsefunctions_errors[i]);CHKERRQ(ierr); 194615aaf578SStefano Zampini } 194715aaf578SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"constraints (psi) errors\n");CHKERRQ(ierr); 194815aaf578SStefano Zampini for (i=pcbddc->local_primal_size;i<2*pcbddc->local_primal_size;i++) { 194915aaf578SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local %02d-th function error = % 1.14e\n",i-pcbddc->local_primal_size,constraints_errors[i]);CHKERRQ(ierr); 195015aaf578SStefano Zampini } 195115aaf578SStefano Zampini } 19520c7d97c5SJed Brown ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 195353cdbc3dSStefano Zampini ierr = MatDestroy(&A_II);CHKERRQ(ierr); 195453cdbc3dSStefano Zampini ierr = MatDestroy(&A_BB);CHKERRQ(ierr); 195553cdbc3dSStefano Zampini ierr = MatDestroy(&A_IB);CHKERRQ(ierr); 195653cdbc3dSStefano Zampini ierr = MatDestroy(&A_BI);CHKERRQ(ierr); 195753cdbc3dSStefano Zampini ierr = MatDestroy(&TM1);CHKERRQ(ierr); 195853cdbc3dSStefano Zampini ierr = MatDestroy(&TM2);CHKERRQ(ierr); 195953cdbc3dSStefano Zampini ierr = MatDestroy(&TM3);CHKERRQ(ierr); 196053cdbc3dSStefano Zampini ierr = MatDestroy(&TM4);CHKERRQ(ierr); 196153cdbc3dSStefano Zampini ierr = MatDestroy(&coarse_phi_D);CHKERRQ(ierr); 196253cdbc3dSStefano Zampini ierr = MatDestroy(&coarse_phi_B);CHKERRQ(ierr); 196315aaf578SStefano Zampini if (pcbddc->coarse_psi_B) { 196415aaf578SStefano Zampini ierr = MatDestroy(&coarse_psi_D);CHKERRQ(ierr); 196515aaf578SStefano Zampini ierr = MatDestroy(&coarse_psi_B);CHKERRQ(ierr); 196615aaf578SStefano Zampini } 196715aaf578SStefano Zampini ierr = MatDestroy(&coarse_sub_mat);CHKERRQ(ierr); 19680c7d97c5SJed Brown ierr = PetscFree(coarsefunctions_errors);CHKERRQ(ierr); 19690c7d97c5SJed Brown ierr = PetscFree(constraints_errors);CHKERRQ(ierr); 19700c7d97c5SJed Brown } 19710c7d97c5SJed Brown /* free memory */ 19723b03a366Sstefano_zampini if (n_vertices) { 197315aaf578SStefano Zampini ierr = PetscFree(vertices);CHKERRQ(ierr); 19740c7d97c5SJed Brown ierr = VecDestroy(&vec1_V);CHKERRQ(ierr); 19750c7d97c5SJed Brown ierr = VecDestroy(&vec2_V);CHKERRQ(ierr); 19760c7d97c5SJed Brown ierr = MatDestroy(&A_RV);CHKERRQ(ierr); 19770c7d97c5SJed Brown ierr = MatDestroy(&A_VR);CHKERRQ(ierr); 19780c7d97c5SJed Brown ierr = MatDestroy(&A_VV);CHKERRQ(ierr); 19790c7d97c5SJed Brown } 1980534831adSStefano Zampini if (n_constraints) { 19810c7d97c5SJed Brown ierr = VecDestroy(&vec1_C);CHKERRQ(ierr); 19820c7d97c5SJed Brown ierr = VecDestroy(&vec2_C);CHKERRQ(ierr); 19830c7d97c5SJed Brown ierr = MatDestroy(&M1);CHKERRQ(ierr); 19840c7d97c5SJed Brown ierr = MatDestroy(&C_CR);CHKERRQ(ierr); 19850c7d97c5SJed Brown } 1986a929c220SStefano Zampini ierr = PetscFree(auxindices);CHKERRQ(ierr); 1987a929c220SStefano Zampini ierr = PetscFree(nnz);CHKERRQ(ierr); 1988a929c220SStefano Zampini /* create coarse matrix and data structures for message passing associated actual choice of coarse problem type */ 1989674ae819SStefano Zampini ierr = PCBDDCSetUpCoarseEnvironment(pc,coarse_submat_vals);CHKERRQ(ierr); 1990a929c220SStefano Zampini ierr = PetscFree(coarse_submat_vals);CHKERRQ(ierr); 19910c7d97c5SJed Brown } 19920c7d97c5SJed Brown /* free memory */ 19930c7d97c5SJed Brown ierr = ISDestroy(&is_R_local);CHKERRQ(ierr); 1994674ae819SStefano Zampini 19950c7d97c5SJed Brown PetscFunctionReturn(0); 19960c7d97c5SJed Brown } 19970c7d97c5SJed Brown 19980c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 19990c7d97c5SJed Brown 20007cbb387bSStefano Zampini /* BDDC requires metis 5.0.1 for multilevel */ 20017cbb387bSStefano Zampini #if defined(PETSC_HAVE_METIS) 20027cbb387bSStefano Zampini #include "metis.h" 20037cbb387bSStefano Zampini #define MetisInt idx_t 20047cbb387bSStefano Zampini #define MetisScalar real_t 20057cbb387bSStefano Zampini #endif 20067cbb387bSStefano Zampini 20070c7d97c5SJed Brown #undef __FUNCT__ 2008674ae819SStefano Zampini #define __FUNCT__ "PCBDDCSetUpCoarseEnvironment" 2009674ae819SStefano Zampini static PetscErrorCode PCBDDCSetUpCoarseEnvironment(PC pc,PetscScalar* coarse_submat_vals) 20100c7d97c5SJed Brown { 2011674ae819SStefano Zampini 2012674ae819SStefano Zampini 20130c7d97c5SJed Brown Mat_IS *matis = (Mat_IS*)pc->pmat->data; 20140c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 20150c7d97c5SJed Brown PC_IS *pcis = (PC_IS*)pc->data; 2016ce94432eSBarry Smith MPI_Comm prec_comm; 20170c7d97c5SJed Brown MPI_Comm coarse_comm; 20180c7d97c5SJed Brown 2019674ae819SStefano Zampini MatNullSpace CoarseNullSpace; 2020674ae819SStefano Zampini 20210c7d97c5SJed Brown /* common to all choiches */ 20220c7d97c5SJed Brown PetscScalar *temp_coarse_mat_vals; 20230c7d97c5SJed Brown PetscScalar *ins_coarse_mat_vals; 20240c7d97c5SJed Brown PetscInt *ins_local_primal_indices; 20250c7d97c5SJed Brown PetscMPIInt *localsizes2,*localdispl2; 20260c7d97c5SJed Brown PetscMPIInt size_prec_comm; 20270c7d97c5SJed Brown PetscMPIInt rank_prec_comm; 20280c7d97c5SJed Brown PetscMPIInt active_rank=MPI_PROC_NULL; 20290c7d97c5SJed Brown PetscMPIInt master_proc=0; 20300c7d97c5SJed Brown PetscInt ins_local_primal_size; 20310c7d97c5SJed Brown /* specific to MULTILEVEL_BDDC */ 20325b08dc53SStefano Zampini PetscMPIInt *ranks_recv=0; 20330c7d97c5SJed Brown PetscMPIInt count_recv=0; 20345b08dc53SStefano Zampini PetscMPIInt rank_coarse_proc_send_to=-1; 20350c7d97c5SJed Brown PetscMPIInt coarse_color = MPI_UNDEFINED; 20360c7d97c5SJed Brown ISLocalToGlobalMapping coarse_ISLG; 20370c7d97c5SJed Brown /* some other variables */ 20380c7d97c5SJed Brown PetscErrorCode ierr; 203919fd82e9SBarry Smith MatType coarse_mat_type; 204019fd82e9SBarry Smith PCType coarse_pc_type; 204119fd82e9SBarry Smith KSPType coarse_ksp_type; 204253cdbc3dSStefano Zampini PC pc_temp; 20434fad6a16SStefano Zampini PetscInt i,j,k; 20443b03a366Sstefano_zampini PetscInt max_it_coarse_ksp=1; /* don't increase this value */ 2045e269702eSStefano Zampini /* verbose output viewer */ 2046e269702eSStefano Zampini PetscViewer viewer=pcbddc->dbg_viewer; 20475b08dc53SStefano Zampini PetscInt dbg_flag=pcbddc->dbg_flag; 2048142dfd88SStefano Zampini 2049ea7e1babSStefano Zampini PetscInt offset,offset2; 2050a929c220SStefano Zampini PetscMPIInt im_active,active_procs; 2051523858cfSStefano Zampini PetscInt *dnz,*onz; 2052142dfd88SStefano Zampini 2053142dfd88SStefano Zampini PetscBool setsym,issym=PETSC_FALSE; 20540c7d97c5SJed Brown 20550c7d97c5SJed Brown PetscFunctionBegin; 20564b2d0b89SJed Brown ierr = PetscObjectGetComm((PetscObject)pc,&prec_comm);CHKERRQ(ierr); 20570c7d97c5SJed Brown ins_local_primal_indices = 0; 20580c7d97c5SJed Brown ins_coarse_mat_vals = 0; 20590c7d97c5SJed Brown localsizes2 = 0; 20600c7d97c5SJed Brown localdispl2 = 0; 20610c7d97c5SJed Brown temp_coarse_mat_vals = 0; 20620c7d97c5SJed Brown coarse_ISLG = 0; 20630c7d97c5SJed Brown 206453cdbc3dSStefano Zampini ierr = MPI_Comm_size(prec_comm,&size_prec_comm);CHKERRQ(ierr); 206553cdbc3dSStefano Zampini ierr = MPI_Comm_rank(prec_comm,&rank_prec_comm);CHKERRQ(ierr); 2066142dfd88SStefano Zampini ierr = MatIsSymmetricKnown(pc->pmat,&setsym,&issym);CHKERRQ(ierr); 2067142dfd88SStefano Zampini 2068beed3852SStefano Zampini /* Assign global numbering to coarse dofs */ 2069beed3852SStefano Zampini { 2070674ae819SStefano Zampini PetscInt *auxlocal_primal,*aux_idx; 2071ef028eecSStefano Zampini PetscMPIInt mpi_local_primal_size; 2072ef028eecSStefano Zampini PetscScalar coarsesum,*array; 2073ef028eecSStefano Zampini 2074ef028eecSStefano Zampini mpi_local_primal_size = (PetscMPIInt)pcbddc->local_primal_size; 2075beed3852SStefano Zampini 2076beed3852SStefano Zampini /* Construct needed data structures for message passing */ 2077ffe5efe1SStefano Zampini j = 0; 2078142dfd88SStefano Zampini if (rank_prec_comm == 0 || pcbddc->coarse_problem_type == REPLICATED_BDDC || pcbddc->coarse_problem_type == MULTILEVEL_BDDC) { 2079ffe5efe1SStefano Zampini j = size_prec_comm; 2080ffe5efe1SStefano Zampini } 2081ffe5efe1SStefano Zampini ierr = PetscMalloc(j*sizeof(PetscMPIInt),&pcbddc->local_primal_sizes);CHKERRQ(ierr); 2082ffe5efe1SStefano Zampini ierr = PetscMalloc(j*sizeof(PetscMPIInt),&pcbddc->local_primal_displacements);CHKERRQ(ierr); 2083beed3852SStefano Zampini /* Gather local_primal_size information for all processes */ 2084142dfd88SStefano Zampini if (pcbddc->coarse_problem_type == REPLICATED_BDDC || pcbddc->coarse_problem_type == MULTILEVEL_BDDC) { 20855619798eSStefano Zampini ierr = MPI_Allgather(&mpi_local_primal_size,1,MPIU_INT,&pcbddc->local_primal_sizes[0],1,MPIU_INT,prec_comm);CHKERRQ(ierr); 2086ffe5efe1SStefano Zampini } else { 2087ffe5efe1SStefano Zampini ierr = MPI_Gather(&mpi_local_primal_size,1,MPIU_INT,&pcbddc->local_primal_sizes[0],1,MPIU_INT,0,prec_comm);CHKERRQ(ierr); 2088ffe5efe1SStefano Zampini } 2089beed3852SStefano Zampini pcbddc->replicated_primal_size = 0; 2090ffe5efe1SStefano Zampini for (i=0; i<j; i++) { 2091beed3852SStefano Zampini pcbddc->local_primal_displacements[i] = pcbddc->replicated_primal_size ; 2092beed3852SStefano Zampini pcbddc->replicated_primal_size += pcbddc->local_primal_sizes[i]; 2093beed3852SStefano Zampini } 2094beed3852SStefano Zampini 2095da1bb401SStefano Zampini /* First let's count coarse dofs. 2096beed3852SStefano Zampini This code fragment assumes that the number of local constraints per connected component 2097beed3852SStefano Zampini is not greater than the number of nodes defined for the connected component 2098beed3852SStefano Zampini (otherwise we will surely have linear dependence between constraints and thus a singular coarse problem) */ 2099ef028eecSStefano Zampini ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscInt),&auxlocal_primal);CHKERRQ(ierr); 2100674ae819SStefano Zampini ierr = PCBDDCGetPrimalVerticesLocalIdx(pc,&i,&aux_idx);CHKERRQ(ierr); 2101674ae819SStefano Zampini ierr = PetscMemcpy(auxlocal_primal,aux_idx,i*sizeof(PetscInt));CHKERRQ(ierr); 2102674ae819SStefano Zampini ierr = PetscFree(aux_idx);CHKERRQ(ierr); 2103674ae819SStefano Zampini ierr = PCBDDCGetPrimalConstraintsLocalIdx(pc,&j,&aux_idx);CHKERRQ(ierr); 2104674ae819SStefano Zampini ierr = PetscMemcpy(&auxlocal_primal[i],aux_idx,j*sizeof(PetscInt));CHKERRQ(ierr); 2105674ae819SStefano Zampini ierr = PetscFree(aux_idx);CHKERRQ(ierr); 2106ef028eecSStefano Zampini /* Compute number of coarse dofs */ 2107674ae819SStefano Zampini ierr = PCBDDCSubsetNumbering(prec_comm,matis->mapping,pcbddc->local_primal_size,auxlocal_primal,NULL,&pcbddc->coarse_size,&pcbddc->local_primal_indices);CHKERRQ(ierr); 2108ef028eecSStefano Zampini 2109ef028eecSStefano Zampini if (dbg_flag) { 21102e8d2280SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 21112e8d2280SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr); 21122e8d2280SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Check coarse indices\n");CHKERRQ(ierr); 21132e8d2280SStefano Zampini ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr); 21142e8d2280SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 21152fa5cd67SKarl Rupp for (i=0;i<pcbddc->local_primal_size;i++) array[auxlocal_primal[i]]=1.0; 2116beed3852SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 21172e8d2280SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 2118da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 2119da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 2120da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 2121da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 2122da1bb401SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 21232e8d2280SStefano Zampini for (i=0;i<pcis->n;i++) { 21242e8d2280SStefano Zampini if (array[i] == 1.0) { 21252e8d2280SStefano Zampini ierr = ISLocalToGlobalMappingApply(matis->mapping,1,&i,&j);CHKERRQ(ierr); 21262e8d2280SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d: WRONG COARSE INDEX %d (local %d)\n",PetscGlobalRank,j,i);CHKERRQ(ierr); 21272e8d2280SStefano Zampini } 21282e8d2280SStefano Zampini } 21292e8d2280SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 21302e8d2280SStefano Zampini for (i=0;i<pcis->n;i++) { 21315b08dc53SStefano Zampini if (PetscRealPart(array[i]) > 0.0) array[i] = 1.0/PetscRealPart(array[i]); 21322e8d2280SStefano Zampini } 2133da1bb401SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 21342e8d2280SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 2135da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 2136da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 2137da1bb401SStefano Zampini ierr = VecSum(pcis->vec1_global,&coarsesum);CHKERRQ(ierr); 21382e8d2280SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Size of coarse problem SHOULD be %lf\n",coarsesum);CHKERRQ(ierr); 21392e8d2280SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 21402e8d2280SStefano Zampini } 2141142dfd88SStefano Zampini ierr = PetscFree(auxlocal_primal);CHKERRQ(ierr); 21420bdf917eSStefano Zampini } 21430bdf917eSStefano Zampini 21442e8d2280SStefano Zampini if (dbg_flag) { 21457cf533a6SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Size of coarse problem is %d\n",pcbddc->coarse_size);CHKERRQ(ierr); 21469d9e44b6SStefano Zampini if (dbg_flag > 1) { 2147674ae819SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Distribution of local primal indices\n");CHKERRQ(ierr); 21482e8d2280SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 2149674ae819SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d\n",PetscGlobalRank);CHKERRQ(ierr); 2150674ae819SStefano Zampini for (i=0;i<pcbddc->local_primal_size;i++) { 2151674ae819SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local_primal_indices[%d]=%d \n",i,pcbddc->local_primal_indices[i]); 2152674ae819SStefano Zampini } 21532e8d2280SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 21542e8d2280SStefano Zampini } 21552e8d2280SStefano Zampini } 21562e8d2280SStefano Zampini 2157a929c220SStefano Zampini im_active = 0; 21582fa5cd67SKarl Rupp if (pcis->n) im_active = 1; 2159a929c220SStefano Zampini ierr = MPI_Allreduce(&im_active,&active_procs,1,MPIU_INT,MPI_SUM,prec_comm);CHKERRQ(ierr); 21600bdf917eSStefano Zampini 21610bdf917eSStefano Zampini /* adapt coarse problem type */ 21627cbb387bSStefano Zampini #if defined(PETSC_HAVE_METIS) 21634fad6a16SStefano Zampini if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) { 21644fad6a16SStefano Zampini if (pcbddc->current_level < pcbddc->max_levels) { 2165a929c220SStefano Zampini if ( (active_procs/pcbddc->coarsening_ratio) < 2 ) { 21660bdf917eSStefano Zampini if (dbg_flag) { 2167a929c220SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Not enough active processes on level %d (active %d,ratio %d). Parallel direct solve for coarse problem\n",pcbddc->current_level,active_procs,pcbddc->coarsening_ratio);CHKERRQ(ierr); 21680bdf917eSStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 21690bdf917eSStefano Zampini } 21700bdf917eSStefano Zampini pcbddc->coarse_problem_type = PARALLEL_BDDC; 2171142dfd88SStefano Zampini } 21724fad6a16SStefano Zampini } else { 21734fad6a16SStefano Zampini if (dbg_flag) { 2174a929c220SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Max number of levels reached. Using parallel direct solve for coarse problem\n",pcbddc->max_levels,active_procs,pcbddc->coarsening_ratio);CHKERRQ(ierr); 21754fad6a16SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 21764fad6a16SStefano Zampini } 21774fad6a16SStefano Zampini pcbddc->coarse_problem_type = PARALLEL_BDDC; 21784fad6a16SStefano Zampini } 21794fad6a16SStefano Zampini } 21807cbb387bSStefano Zampini #else 21817cbb387bSStefano Zampini pcbddc->coarse_problem_type = PARALLEL_BDDC; 21827cbb387bSStefano Zampini #endif 2183beed3852SStefano Zampini 21840c7d97c5SJed Brown switch(pcbddc->coarse_problem_type){ 21850c7d97c5SJed Brown 2186da1bb401SStefano Zampini case(MULTILEVEL_BDDC): /* we define a coarse mesh where subdomains are elements */ 21870c7d97c5SJed Brown { 21887cbb387bSStefano Zampini #if defined(PETSC_HAVE_METIS) 21890c7d97c5SJed Brown /* we need additional variables */ 21900c7d97c5SJed Brown MetisInt n_subdomains,n_parts,objval,ncon,faces_nvtxs; 21910c7d97c5SJed Brown MetisInt *metis_coarse_subdivision; 21920c7d97c5SJed Brown MetisInt options[METIS_NOPTIONS]; 21930c7d97c5SJed Brown PetscMPIInt size_coarse_comm,rank_coarse_comm; 21940c7d97c5SJed Brown PetscMPIInt procs_jumps_coarse_comm; 21950c7d97c5SJed Brown PetscMPIInt *coarse_subdivision; 21960c7d97c5SJed Brown PetscMPIInt *total_count_recv; 21970c7d97c5SJed Brown PetscMPIInt *total_ranks_recv; 21980c7d97c5SJed Brown PetscMPIInt *displacements_recv; 21990c7d97c5SJed Brown PetscMPIInt *my_faces_connectivity; 22000c7d97c5SJed Brown PetscMPIInt *petsc_faces_adjncy; 22010c7d97c5SJed Brown MetisInt *faces_adjncy; 22020c7d97c5SJed Brown MetisInt *faces_xadj; 22030c7d97c5SJed Brown PetscMPIInt *number_of_faces; 22040c7d97c5SJed Brown PetscMPIInt *faces_displacements; 22050c7d97c5SJed Brown PetscInt *array_int; 22060c7d97c5SJed Brown PetscMPIInt my_faces=0; 22070c7d97c5SJed Brown PetscMPIInt total_faces=0; 22083828260eSStefano Zampini PetscInt ranks_stretching_ratio; 22090c7d97c5SJed Brown 22100c7d97c5SJed Brown /* define some quantities */ 22110c7d97c5SJed Brown pcbddc->coarse_communications_type = SCATTERS_BDDC; 22120c7d97c5SJed Brown coarse_mat_type = MATIS; 22130c7d97c5SJed Brown coarse_pc_type = PCBDDC; 2214142dfd88SStefano Zampini coarse_ksp_type = KSPRICHARDSON; 22150c7d97c5SJed Brown 22160c7d97c5SJed Brown /* details of coarse decomposition */ 2217a929c220SStefano Zampini n_subdomains = active_procs; 22180c7d97c5SJed Brown n_parts = n_subdomains/pcbddc->coarsening_ratio; 2219a929c220SStefano Zampini ranks_stretching_ratio = size_prec_comm/active_procs; 22203828260eSStefano Zampini procs_jumps_coarse_comm = pcbddc->coarsening_ratio*ranks_stretching_ratio; 22213828260eSStefano Zampini 2222a929c220SStefano Zampini #if 0 2223a929c220SStefano Zampini PetscMPIInt *old_ranks; 2224a929c220SStefano Zampini PetscInt *new_ranks,*jj,*ii; 2225a929c220SStefano Zampini MatPartitioning mat_part; 2226a929c220SStefano Zampini IS coarse_new_decomposition,is_numbering; 2227a929c220SStefano Zampini PetscViewer viewer_test; 2228a929c220SStefano Zampini MPI_Comm test_coarse_comm; 2229a929c220SStefano Zampini PetscMPIInt test_coarse_color; 2230a929c220SStefano Zampini Mat mat_adj; 2231a929c220SStefano Zampini /* Create new communicator for coarse problem splitting the old one */ 2232a929c220SStefano Zampini /* procs with coarse_color = MPI_UNDEFINED will have coarse_comm = MPI_COMM_NULL (from mpi standards) 2233a929c220SStefano Zampini key = rank_prec_comm -> keep same ordering of ranks from the old to the new communicator */ 2234a929c220SStefano Zampini test_coarse_color = ( im_active ? 0 : MPI_UNDEFINED ); 2235a929c220SStefano Zampini test_coarse_comm = MPI_COMM_NULL; 2236a929c220SStefano Zampini ierr = MPI_Comm_split(prec_comm,test_coarse_color,rank_prec_comm,&test_coarse_comm);CHKERRQ(ierr); 2237a929c220SStefano Zampini if (im_active) { 2238a929c220SStefano Zampini ierr = PetscMalloc(n_subdomains*sizeof(PetscMPIInt),&old_ranks); 2239a929c220SStefano Zampini ierr = PetscMalloc(size_prec_comm*sizeof(PetscInt),&new_ranks); 2240a929c220SStefano Zampini ierr = MPI_Comm_rank(test_coarse_comm,&rank_coarse_comm);CHKERRQ(ierr); 2241a929c220SStefano Zampini ierr = MPI_Comm_size(test_coarse_comm,&j);CHKERRQ(ierr); 2242a929c220SStefano Zampini ierr = MPI_Allgather(&rank_prec_comm,1,MPIU_INT,old_ranks,1,MPIU_INT,test_coarse_comm);CHKERRQ(ierr); 2243674ae819SStefano Zampini for (i=0; i<size_prec_comm; i++) new_ranks[i] = -1; 2244674ae819SStefano Zampini for (i=0; i<n_subdomains; i++) new_ranks[old_ranks[i]] = i; 2245a929c220SStefano Zampini ierr = PetscViewerASCIIOpen(test_coarse_comm,"test_mat_part.out",&viewer_test);CHKERRQ(ierr); 2246a929c220SStefano Zampini k = pcis->n_neigh-1; 2247a929c220SStefano Zampini ierr = PetscMalloc(2*sizeof(PetscInt),&ii); 2248a929c220SStefano Zampini ii[0]=0; 2249a929c220SStefano Zampini ii[1]=k; 2250a929c220SStefano Zampini ierr = PetscMalloc(k*sizeof(PetscInt),&jj); 2251674ae819SStefano Zampini for (i=0; i<k; i++) jj[i]=new_ranks[pcis->neigh[i+1]]; 2252a929c220SStefano Zampini ierr = PetscSortInt(k,jj);CHKERRQ(ierr); 22530298fd71SBarry Smith ierr = MatCreateMPIAdj(test_coarse_comm,1,n_subdomains,ii,jj,NULL,&mat_adj);CHKERRQ(ierr); 2254a929c220SStefano Zampini ierr = MatView(mat_adj,viewer_test);CHKERRQ(ierr); 2255a929c220SStefano Zampini ierr = MatPartitioningCreate(test_coarse_comm,&mat_part);CHKERRQ(ierr); 2256a929c220SStefano Zampini ierr = MatPartitioningSetAdjacency(mat_part,mat_adj);CHKERRQ(ierr); 2257a929c220SStefano Zampini ierr = MatPartitioningSetFromOptions(mat_part);CHKERRQ(ierr); 2258a929c220SStefano Zampini printf("Setting Nparts %d\n",n_parts); 2259a929c220SStefano Zampini ierr = MatPartitioningSetNParts(mat_part,n_parts);CHKERRQ(ierr); 2260a929c220SStefano Zampini ierr = MatPartitioningView(mat_part,viewer_test);CHKERRQ(ierr); 2261a929c220SStefano Zampini ierr = MatPartitioningApply(mat_part,&coarse_new_decomposition);CHKERRQ(ierr); 2262a929c220SStefano Zampini ierr = ISView(coarse_new_decomposition,viewer_test);CHKERRQ(ierr); 2263a929c220SStefano Zampini ierr = ISPartitioningToNumbering(coarse_new_decomposition,&is_numbering);CHKERRQ(ierr); 2264a929c220SStefano Zampini ierr = ISView(is_numbering,viewer_test);CHKERRQ(ierr); 2265a929c220SStefano Zampini ierr = PetscViewerDestroy(&viewer_test);CHKERRQ(ierr); 2266a929c220SStefano Zampini ierr = ISDestroy(&coarse_new_decomposition);CHKERRQ(ierr); 2267a929c220SStefano Zampini ierr = ISDestroy(&is_numbering);CHKERRQ(ierr); 2268a929c220SStefano Zampini ierr = MatPartitioningDestroy(&mat_part);CHKERRQ(ierr); 2269a929c220SStefano Zampini ierr = PetscFree(old_ranks);CHKERRQ(ierr); 2270a929c220SStefano Zampini ierr = PetscFree(new_ranks);CHKERRQ(ierr); 2271a929c220SStefano Zampini ierr = MPI_Comm_free(&test_coarse_comm);CHKERRQ(ierr); 2272a929c220SStefano Zampini } 2273a929c220SStefano Zampini #endif 2274a929c220SStefano Zampini 22754fad6a16SStefano Zampini /* build CSR graph of subdomains' connectivity */ 22760c7d97c5SJed Brown ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&array_int);CHKERRQ(ierr); 22773828260eSStefano Zampini ierr = PetscMemzero(array_int,pcis->n*sizeof(PetscInt));CHKERRQ(ierr); 22780c7d97c5SJed Brown for (i=1;i<pcis->n_neigh;i++){/* i=1 so I don't count myself -> faces nodes counts to 1 */ 22790c7d97c5SJed Brown for (j=0;j<pcis->n_shared[i];j++){ 22800c7d97c5SJed Brown array_int[ pcis->shared[i][j] ]+=1; 22810c7d97c5SJed Brown } 22820c7d97c5SJed Brown } 22830c7d97c5SJed Brown for (i=1;i<pcis->n_neigh;i++){ 22840c7d97c5SJed Brown for (j=0;j<pcis->n_shared[i];j++){ 22857cf533a6SStefano Zampini if (array_int[ pcis->shared[i][j] ] > 0 ){ 22860c7d97c5SJed Brown my_faces++; 22870c7d97c5SJed Brown break; 22880c7d97c5SJed Brown } 22890c7d97c5SJed Brown } 22900c7d97c5SJed Brown } 22910c7d97c5SJed Brown 229253cdbc3dSStefano Zampini ierr = MPI_Reduce(&my_faces,&total_faces,1,MPIU_INT,MPI_SUM,master_proc,prec_comm);CHKERRQ(ierr); 22930c7d97c5SJed Brown ierr = PetscMalloc (my_faces*sizeof(PetscInt),&my_faces_connectivity);CHKERRQ(ierr); 22940c7d97c5SJed Brown my_faces=0; 22950c7d97c5SJed Brown for (i=1;i<pcis->n_neigh;i++){ 22960c7d97c5SJed Brown for (j=0;j<pcis->n_shared[i];j++){ 22977cf533a6SStefano Zampini if (array_int[ pcis->shared[i][j] ] > 0 ){ 22980c7d97c5SJed Brown my_faces_connectivity[my_faces]=pcis->neigh[i]; 22990c7d97c5SJed Brown my_faces++; 23000c7d97c5SJed Brown break; 23010c7d97c5SJed Brown } 23020c7d97c5SJed Brown } 23030c7d97c5SJed Brown } 23040c7d97c5SJed Brown if (rank_prec_comm == master_proc) { 23050c7d97c5SJed Brown ierr = PetscMalloc (total_faces*sizeof(PetscMPIInt),&petsc_faces_adjncy);CHKERRQ(ierr); 23060c7d97c5SJed Brown ierr = PetscMalloc (size_prec_comm*sizeof(PetscMPIInt),&number_of_faces);CHKERRQ(ierr); 23070c7d97c5SJed Brown ierr = PetscMalloc (total_faces*sizeof(MetisInt),&faces_adjncy);CHKERRQ(ierr); 23080c7d97c5SJed Brown ierr = PetscMalloc ((n_subdomains+1)*sizeof(MetisInt),&faces_xadj);CHKERRQ(ierr); 23090c7d97c5SJed Brown ierr = PetscMalloc ((size_prec_comm+1)*sizeof(PetscMPIInt),&faces_displacements);CHKERRQ(ierr); 23100c7d97c5SJed Brown } 231153cdbc3dSStefano Zampini ierr = MPI_Gather(&my_faces,1,MPIU_INT,&number_of_faces[0],1,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr); 23120c7d97c5SJed Brown if (rank_prec_comm == master_proc) { 23130c7d97c5SJed Brown faces_xadj[0]=0; 23140c7d97c5SJed Brown faces_displacements[0]=0; 23150c7d97c5SJed Brown j=0; 23160c7d97c5SJed Brown for (i=1;i<size_prec_comm+1;i++) { 23170c7d97c5SJed Brown faces_displacements[i]=faces_displacements[i-1]+number_of_faces[i-1]; 23180c7d97c5SJed Brown if (number_of_faces[i-1]) { 23190c7d97c5SJed Brown j++; 23200c7d97c5SJed Brown faces_xadj[j]=faces_xadj[j-1]+number_of_faces[i-1]; 23210c7d97c5SJed Brown } 23220c7d97c5SJed Brown } 23230c7d97c5SJed Brown } 232453cdbc3dSStefano Zampini ierr = MPI_Gatherv(&my_faces_connectivity[0],my_faces,MPIU_INT,&petsc_faces_adjncy[0],number_of_faces,faces_displacements,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr); 23250c7d97c5SJed Brown ierr = PetscFree(my_faces_connectivity);CHKERRQ(ierr); 23260c7d97c5SJed Brown ierr = PetscFree(array_int);CHKERRQ(ierr); 23270c7d97c5SJed Brown if (rank_prec_comm == master_proc) { 23283828260eSStefano Zampini for (i=0;i<total_faces;i++) faces_adjncy[i]=(MetisInt)(petsc_faces_adjncy[i]/ranks_stretching_ratio); /* cast to MetisInt */ 23290c7d97c5SJed Brown ierr = PetscFree(faces_displacements);CHKERRQ(ierr); 23300c7d97c5SJed Brown ierr = PetscFree(number_of_faces);CHKERRQ(ierr); 23310c7d97c5SJed Brown ierr = PetscFree(petsc_faces_adjncy);CHKERRQ(ierr); 23320c7d97c5SJed Brown } 23330c7d97c5SJed Brown 23340c7d97c5SJed Brown if ( rank_prec_comm == master_proc ) { 2335674ae819SStefano Zampini 23363828260eSStefano Zampini PetscInt heuristic_for_metis=3; 2337674ae819SStefano Zampini 23380c7d97c5SJed Brown ncon=1; 23390c7d97c5SJed Brown faces_nvtxs=n_subdomains; 23400c7d97c5SJed Brown /* partition graoh induced by face connectivity */ 23410c7d97c5SJed Brown ierr = PetscMalloc (n_subdomains*sizeof(MetisInt),&metis_coarse_subdivision);CHKERRQ(ierr); 23420c7d97c5SJed Brown ierr = METIS_SetDefaultOptions(options); 23430c7d97c5SJed Brown /* we need a contiguous partition of the coarse mesh */ 23440c7d97c5SJed Brown options[METIS_OPTION_CONTIG]=1; 23450c7d97c5SJed Brown options[METIS_OPTION_NITER]=30; 23464fad6a16SStefano Zampini if (pcbddc->coarsening_ratio > 1) { 23473828260eSStefano Zampini if (n_subdomains>n_parts*heuristic_for_metis) { 23483828260eSStefano Zampini options[METIS_OPTION_IPTYPE]=METIS_IPTYPE_EDGE; 23493828260eSStefano Zampini options[METIS_OPTION_OBJTYPE]=METIS_OBJTYPE_CUT; 23500c7d97c5SJed Brown ierr = METIS_PartGraphKway(&faces_nvtxs,&ncon,faces_xadj,faces_adjncy,NULL,NULL,NULL,&n_parts,NULL,NULL,options,&objval,metis_coarse_subdivision); 2351674ae819SStefano Zampini if (ierr != METIS_OK) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in METIS_PartGraphKway (metis error code %D) called from PCBDDCSetUpCoarseEnvironment\n",ierr); 23523828260eSStefano Zampini } else { 23533828260eSStefano Zampini ierr = METIS_PartGraphRecursive(&faces_nvtxs,&ncon,faces_xadj,faces_adjncy,NULL,NULL,NULL,&n_parts,NULL,NULL,options,&objval,metis_coarse_subdivision); 2354674ae819SStefano Zampini if (ierr != METIS_OK) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in METIS_PartGraphRecursive (metis error code %D) called from PCBDDCSetUpCoarseEnvironment\n",ierr); 23553828260eSStefano Zampini } 23564fad6a16SStefano Zampini } else { 23572fa5cd67SKarl Rupp for (i=0;i<n_subdomains;i++) metis_coarse_subdivision[i]=i; 23584fad6a16SStefano Zampini } 23590c7d97c5SJed Brown ierr = PetscFree(faces_xadj);CHKERRQ(ierr); 23600c7d97c5SJed Brown ierr = PetscFree(faces_adjncy);CHKERRQ(ierr); 23610bdf917eSStefano Zampini ierr = PetscMalloc(size_prec_comm*sizeof(PetscMPIInt),&coarse_subdivision);CHKERRQ(ierr); 23622fa5cd67SKarl Rupp 23630c7d97c5SJed Brown /* copy/cast values avoiding possible type conflicts between PETSc, MPI and METIS */ 23642fa5cd67SKarl Rupp for (i=0;i<size_prec_comm;i++) coarse_subdivision[i]=MPI_PROC_NULL; 23652fa5cd67SKarl Rupp for (i=0;i<n_subdomains;i++) coarse_subdivision[ranks_stretching_ratio*i]=(PetscInt)(metis_coarse_subdivision[i]); 23660c7d97c5SJed Brown ierr = PetscFree(metis_coarse_subdivision);CHKERRQ(ierr); 23670c7d97c5SJed Brown } 23680c7d97c5SJed Brown 23690c7d97c5SJed Brown /* Create new communicator for coarse problem splitting the old one */ 23700c7d97c5SJed Brown if ( !(rank_prec_comm%procs_jumps_coarse_comm) && rank_prec_comm < procs_jumps_coarse_comm*n_parts ){ 2371da1bb401SStefano Zampini coarse_color=0; /* for communicator splitting */ 2372da1bb401SStefano Zampini active_rank=rank_prec_comm; /* for insertion of matrix values */ 23730c7d97c5SJed Brown } 2374da1bb401SStefano Zampini /* procs with coarse_color = MPI_UNDEFINED will have coarse_comm = MPI_COMM_NULL (from mpi standards) 2375da1bb401SStefano Zampini key = rank_prec_comm -> keep same ordering of ranks from the old to the new communicator */ 237653cdbc3dSStefano Zampini ierr = MPI_Comm_split(prec_comm,coarse_color,rank_prec_comm,&coarse_comm);CHKERRQ(ierr); 23770c7d97c5SJed Brown 23780c7d97c5SJed Brown if ( coarse_color == 0 ) { 237953cdbc3dSStefano Zampini ierr = MPI_Comm_size(coarse_comm,&size_coarse_comm);CHKERRQ(ierr); 238053cdbc3dSStefano Zampini ierr = MPI_Comm_rank(coarse_comm,&rank_coarse_comm);CHKERRQ(ierr); 23810c7d97c5SJed Brown } else { 23820c7d97c5SJed Brown rank_coarse_comm = MPI_PROC_NULL; 23830c7d97c5SJed Brown } 23840c7d97c5SJed Brown 23857cf533a6SStefano Zampini /* master proc take care of arranging and distributing coarse information */ 23860c7d97c5SJed Brown if (rank_coarse_comm == master_proc) { 23870c7d97c5SJed Brown ierr = PetscMalloc (size_coarse_comm*sizeof(PetscMPIInt),&displacements_recv);CHKERRQ(ierr); 23880bdf917eSStefano Zampini ierr = PetscMalloc (size_coarse_comm*sizeof(PetscMPIInt),&total_count_recv);CHKERRQ(ierr); 23890bdf917eSStefano Zampini ierr = PetscMalloc (n_subdomains*sizeof(PetscMPIInt),&total_ranks_recv);CHKERRQ(ierr); 23900c7d97c5SJed Brown /* some initializations */ 23910c7d97c5SJed Brown displacements_recv[0]=0; 23920bdf917eSStefano Zampini ierr = PetscMemzero(total_count_recv,size_coarse_comm*sizeof(PetscMPIInt));CHKERRQ(ierr); 23930c7d97c5SJed Brown /* count from how many processes the j-th process of the coarse decomposition will receive data */ 23940bdf917eSStefano Zampini for (j=0;j<size_coarse_comm;j++) { 23950bdf917eSStefano Zampini for (i=0;i<size_prec_comm;i++) { 23962fa5cd67SKarl Rupp if (coarse_subdivision[i]==j) total_count_recv[j]++; 23970bdf917eSStefano Zampini } 23980bdf917eSStefano Zampini } 23990c7d97c5SJed Brown /* displacements needed for scatterv of total_ranks_recv */ 24002fa5cd67SKarl Rupp for (i=1; i<size_coarse_comm; i++) displacements_recv[i]=displacements_recv[i-1]+total_count_recv[i-1]; 24012fa5cd67SKarl Rupp 24020c7d97c5SJed Brown /* Now fill properly total_ranks_recv -> each coarse process will receive the ranks (in prec_comm communicator) of its friend (sending) processes */ 24030c7d97c5SJed Brown ierr = PetscMemzero(total_count_recv,size_coarse_comm*sizeof(PetscMPIInt));CHKERRQ(ierr); 24040c7d97c5SJed Brown for (j=0;j<size_coarse_comm;j++) { 24053828260eSStefano Zampini for (i=0;i<size_prec_comm;i++) { 24060c7d97c5SJed Brown if (coarse_subdivision[i]==j) { 24070c7d97c5SJed Brown total_ranks_recv[displacements_recv[j]+total_count_recv[j]]=i; 24083828260eSStefano Zampini total_count_recv[j]+=1; 24090c7d97c5SJed Brown } 24100c7d97c5SJed Brown } 24110c7d97c5SJed Brown } 2412da1bb401SStefano Zampini /*for (j=0;j<size_coarse_comm;j++) { 24133828260eSStefano Zampini printf("process %d in new rank will receive from %d processes (original ranks follows)\n",j,total_count_recv[j]); 24143828260eSStefano Zampini for (i=0;i<total_count_recv[j];i++) { 24153828260eSStefano Zampini printf("%d ",total_ranks_recv[displacements_recv[j]+i]); 24163828260eSStefano Zampini } 24173828260eSStefano Zampini printf("\n"); 2418da1bb401SStefano Zampini }*/ 24190c7d97c5SJed Brown 24200c7d97c5SJed Brown /* identify new decomposition in terms of ranks in the old communicator */ 24210bdf917eSStefano Zampini for (i=0;i<n_subdomains;i++) { 24220bdf917eSStefano Zampini coarse_subdivision[ranks_stretching_ratio*i]=coarse_subdivision[ranks_stretching_ratio*i]*procs_jumps_coarse_comm; 24230bdf917eSStefano Zampini } 2424da1bb401SStefano Zampini /*printf("coarse_subdivision in old end new ranks\n"); 2425674ae819SStefano Zampini for (i=0;i<size_prec_comm;i++) 24263828260eSStefano Zampini if (coarse_subdivision[i]!=MPI_PROC_NULL) { 24273828260eSStefano Zampini printf("%d=(%d %d), ",i,coarse_subdivision[i],coarse_subdivision[i]/procs_jumps_coarse_comm); 24283828260eSStefano Zampini } else { 24293828260eSStefano Zampini printf("%d=(%d %d), ",i,coarse_subdivision[i],coarse_subdivision[i]); 24303828260eSStefano Zampini } 2431da1bb401SStefano Zampini printf("\n");*/ 24320c7d97c5SJed Brown } 24330c7d97c5SJed Brown 24340c7d97c5SJed Brown /* Scatter new decomposition for send details */ 243553cdbc3dSStefano Zampini ierr = MPI_Scatter(&coarse_subdivision[0],1,MPIU_INT,&rank_coarse_proc_send_to,1,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr); 24360c7d97c5SJed Brown /* Scatter receiving details to members of coarse decomposition */ 24370c7d97c5SJed Brown if ( coarse_color == 0) { 243853cdbc3dSStefano Zampini ierr = MPI_Scatter(&total_count_recv[0],1,MPIU_INT,&count_recv,1,MPIU_INT,master_proc,coarse_comm);CHKERRQ(ierr); 24390c7d97c5SJed Brown ierr = PetscMalloc (count_recv*sizeof(PetscMPIInt),&ranks_recv);CHKERRQ(ierr); 244053cdbc3dSStefano Zampini ierr = MPI_Scatterv(&total_ranks_recv[0],total_count_recv,displacements_recv,MPIU_INT,&ranks_recv[0],count_recv,MPIU_INT,master_proc,coarse_comm);CHKERRQ(ierr); 24410c7d97c5SJed Brown } 24420c7d97c5SJed Brown 2443da1bb401SStefano Zampini /*printf("I will send my matrix data to proc %d\n",rank_coarse_proc_send_to); 2444da1bb401SStefano Zampini if (coarse_color == 0) { 2445da1bb401SStefano Zampini printf("I will receive some matrix data from %d processes (ranks follows)\n",count_recv); 2446da1bb401SStefano Zampini for (i=0;i<count_recv;i++) 2447da1bb401SStefano Zampini printf("%d ",ranks_recv[i]); 2448da1bb401SStefano Zampini printf("\n"); 2449da1bb401SStefano Zampini }*/ 24500c7d97c5SJed Brown 24510c7d97c5SJed Brown if (rank_prec_comm == master_proc) { 24520bdf917eSStefano Zampini ierr = PetscFree(coarse_subdivision);CHKERRQ(ierr); 2453da1bb401SStefano Zampini ierr = PetscFree(total_count_recv);CHKERRQ(ierr); 24540bdf917eSStefano Zampini ierr = PetscFree(total_ranks_recv);CHKERRQ(ierr); 24550c7d97c5SJed Brown ierr = PetscFree(displacements_recv);CHKERRQ(ierr); 24560c7d97c5SJed Brown } 24577cbb387bSStefano Zampini #endif 24580c7d97c5SJed Brown break; 24590c7d97c5SJed Brown } 24600c7d97c5SJed Brown 24610c7d97c5SJed Brown case(REPLICATED_BDDC): 24620c7d97c5SJed Brown 24630c7d97c5SJed Brown pcbddc->coarse_communications_type = GATHERS_BDDC; 24640c7d97c5SJed Brown coarse_mat_type = MATSEQAIJ; 24650c7d97c5SJed Brown coarse_pc_type = PCLU; 246653cdbc3dSStefano Zampini coarse_ksp_type = KSPPREONLY; 24670c7d97c5SJed Brown coarse_comm = PETSC_COMM_SELF; 24680c7d97c5SJed Brown active_rank = rank_prec_comm; 24690c7d97c5SJed Brown break; 24700c7d97c5SJed Brown 24710c7d97c5SJed Brown case(PARALLEL_BDDC): 24720c7d97c5SJed Brown 24730c7d97c5SJed Brown pcbddc->coarse_communications_type = SCATTERS_BDDC; 2474674ae819SStefano Zampini coarse_mat_type = MATAIJ; 24750c7d97c5SJed Brown coarse_pc_type = PCREDUNDANT; 247653cdbc3dSStefano Zampini coarse_ksp_type = KSPPREONLY; 24770c7d97c5SJed Brown coarse_comm = prec_comm; 24780c7d97c5SJed Brown active_rank = rank_prec_comm; 24790c7d97c5SJed Brown break; 24800c7d97c5SJed Brown 24810c7d97c5SJed Brown case(SEQUENTIAL_BDDC): 24820c7d97c5SJed Brown pcbddc->coarse_communications_type = GATHERS_BDDC; 2483674ae819SStefano Zampini coarse_mat_type = MATAIJ; 24840c7d97c5SJed Brown coarse_pc_type = PCLU; 248553cdbc3dSStefano Zampini coarse_ksp_type = KSPPREONLY; 24860c7d97c5SJed Brown coarse_comm = PETSC_COMM_SELF; 24870c7d97c5SJed Brown active_rank = master_proc; 24880c7d97c5SJed Brown break; 24890c7d97c5SJed Brown } 24900c7d97c5SJed Brown 24910c7d97c5SJed Brown switch(pcbddc->coarse_communications_type){ 24920c7d97c5SJed Brown 24930c7d97c5SJed Brown case(SCATTERS_BDDC): 24940c7d97c5SJed Brown { 24950c7d97c5SJed Brown if (pcbddc->coarse_problem_type==MULTILEVEL_BDDC) { 24960c7d97c5SJed Brown 24972e8d2280SStefano Zampini IS coarse_IS; 24982e8d2280SStefano Zampini 2499523858cfSStefano Zampini if(pcbddc->coarsening_ratio == 1) { 2500523858cfSStefano Zampini ins_local_primal_size = pcbddc->local_primal_size; 2501523858cfSStefano Zampini ins_local_primal_indices = pcbddc->local_primal_indices; 2502523858cfSStefano Zampini if (coarse_color == 0) { ierr = PetscFree(ranks_recv);CHKERRQ(ierr); } 2503523858cfSStefano Zampini /* nonzeros */ 2504523858cfSStefano Zampini ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&dnz);CHKERRQ(ierr); 2505523858cfSStefano Zampini ierr = PetscMemzero(dnz,ins_local_primal_size*sizeof(PetscInt));CHKERRQ(ierr); 2506523858cfSStefano Zampini for (i=0;i<ins_local_primal_size;i++) { 2507523858cfSStefano Zampini dnz[i] = ins_local_primal_size; 2508523858cfSStefano Zampini } 2509523858cfSStefano Zampini } else { 25100c7d97c5SJed Brown PetscMPIInt send_size; 2511ef028eecSStefano Zampini PetscMPIInt *send_buffer; 25120c7d97c5SJed Brown PetscInt *aux_ins_indices; 25130c7d97c5SJed Brown PetscInt ii,jj; 25140c7d97c5SJed Brown MPI_Request *requests; 2515ef028eecSStefano Zampini 2516523858cfSStefano Zampini ierr = PetscMalloc(count_recv*sizeof(PetscMPIInt),&localdispl2);CHKERRQ(ierr); 2517523858cfSStefano Zampini /* reusing pcbddc->local_primal_displacements and pcbddc->replicated_primal_size */ 2518523858cfSStefano Zampini ierr = PetscFree(pcbddc->local_primal_displacements);CHKERRQ(ierr); 2519523858cfSStefano Zampini ierr = PetscMalloc((count_recv+1)*sizeof(PetscMPIInt),&pcbddc->local_primal_displacements);CHKERRQ(ierr); 2520523858cfSStefano Zampini pcbddc->replicated_primal_size = count_recv; 2521523858cfSStefano Zampini j = 0; 2522523858cfSStefano Zampini for (i=0;i<count_recv;i++) { 2523523858cfSStefano Zampini pcbddc->local_primal_displacements[i] = j; 2524523858cfSStefano Zampini j += pcbddc->local_primal_sizes[ranks_recv[i]]; 2525523858cfSStefano Zampini } 2526523858cfSStefano Zampini pcbddc->local_primal_displacements[count_recv] = j; 2527523858cfSStefano Zampini ierr = PetscMalloc(j*sizeof(PetscMPIInt),&pcbddc->replicated_local_primal_indices);CHKERRQ(ierr); 25280c7d97c5SJed Brown /* allocate auxiliary space */ 2529523858cfSStefano Zampini ierr = PetscMalloc(count_recv*sizeof(PetscMPIInt),&localsizes2);CHKERRQ(ierr); 25300c7d97c5SJed Brown ierr = PetscMalloc(pcbddc->coarse_size*sizeof(PetscInt),&aux_ins_indices);CHKERRQ(ierr); 25310c7d97c5SJed Brown ierr = PetscMemzero(aux_ins_indices,pcbddc->coarse_size*sizeof(PetscInt));CHKERRQ(ierr); 25320c7d97c5SJed Brown /* allocate stuffs for message massing */ 25330c7d97c5SJed Brown ierr = PetscMalloc((count_recv+1)*sizeof(MPI_Request),&requests);CHKERRQ(ierr); 2534523858cfSStefano Zampini for (i=0;i<count_recv+1;i++) { requests[i]=MPI_REQUEST_NULL; } 2535523858cfSStefano Zampini /* send indices to be inserted */ 2536523858cfSStefano Zampini for (i=0;i<count_recv;i++) { 2537523858cfSStefano Zampini send_size = pcbddc->local_primal_sizes[ranks_recv[i]]; 2538523858cfSStefano Zampini ierr = MPI_Irecv(&pcbddc->replicated_local_primal_indices[pcbddc->local_primal_displacements[i]],send_size,MPIU_INT,ranks_recv[i],999,prec_comm,&requests[i]);CHKERRQ(ierr); 2539523858cfSStefano Zampini } 2540523858cfSStefano Zampini if (rank_coarse_proc_send_to != MPI_PROC_NULL ) { 2541523858cfSStefano Zampini send_size = pcbddc->local_primal_size; 2542ef028eecSStefano Zampini ierr = PetscMalloc(send_size*sizeof(PetscMPIInt),&send_buffer);CHKERRQ(ierr); 2543ef028eecSStefano Zampini for (i=0;i<send_size;i++) { 2544ef028eecSStefano Zampini send_buffer[i]=(PetscMPIInt)pcbddc->local_primal_indices[i]; 2545ef028eecSStefano Zampini } 2546ef028eecSStefano Zampini ierr = MPI_Isend(send_buffer,send_size,MPIU_INT,rank_coarse_proc_send_to,999,prec_comm,&requests[count_recv]);CHKERRQ(ierr); 2547523858cfSStefano Zampini } 2548523858cfSStefano Zampini ierr = MPI_Waitall(count_recv+1,requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 2549ef028eecSStefano Zampini if (rank_coarse_proc_send_to != MPI_PROC_NULL ) { 2550ef028eecSStefano Zampini ierr = PetscFree(send_buffer);CHKERRQ(ierr); 2551ef028eecSStefano Zampini } 25520c7d97c5SJed Brown j = 0; 25530c7d97c5SJed Brown for (i=0;i<count_recv;i++) { 25542e8d2280SStefano Zampini ii = pcbddc->local_primal_displacements[i+1]-pcbddc->local_primal_displacements[i]; 25552e8d2280SStefano Zampini localsizes2[i] = ii*ii; 25560c7d97c5SJed Brown localdispl2[i] = j; 25570c7d97c5SJed Brown j += localsizes2[i]; 2558523858cfSStefano Zampini jj = pcbddc->local_primal_displacements[i]; 25594fad6a16SStefano Zampini /* it counts the coarse subdomains sharing the coarse node */ 25602e8d2280SStefano Zampini for (k=0;k<ii;k++) { 25614fad6a16SStefano Zampini aux_ins_indices[pcbddc->replicated_local_primal_indices[jj+k]] += 1; 25620c7d97c5SJed Brown } 25634fad6a16SStefano Zampini } 2564523858cfSStefano Zampini /* temp_coarse_mat_vals used to store matrix values to be received */ 25650c7d97c5SJed Brown ierr = PetscMalloc(j*sizeof(PetscScalar),&temp_coarse_mat_vals);CHKERRQ(ierr); 25660c7d97c5SJed Brown /* evaluate how many values I will insert in coarse mat */ 25670c7d97c5SJed Brown ins_local_primal_size = 0; 2568ea7e1babSStefano Zampini for (i=0;i<pcbddc->coarse_size;i++) { 2569ea7e1babSStefano Zampini if (aux_ins_indices[i]) { 25700c7d97c5SJed Brown ins_local_primal_size++; 2571ea7e1babSStefano Zampini } 2572ea7e1babSStefano Zampini } 25730c7d97c5SJed Brown /* evaluate indices I will insert in coarse mat */ 25740c7d97c5SJed Brown ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr); 25750c7d97c5SJed Brown j = 0; 2576ea7e1babSStefano Zampini for(i=0;i<pcbddc->coarse_size;i++) { 2577ea7e1babSStefano Zampini if(aux_ins_indices[i]) { 25782e8d2280SStefano Zampini ins_local_primal_indices[j] = i; 25792e8d2280SStefano Zampini j++; 2580ea7e1babSStefano Zampini } 2581ea7e1babSStefano Zampini } 2582523858cfSStefano Zampini /* processes partecipating in coarse problem receive matrix data from their friends */ 2583523858cfSStefano Zampini for (i=0;i<count_recv;i++) { 2584523858cfSStefano Zampini ierr = MPI_Irecv(&temp_coarse_mat_vals[localdispl2[i]],localsizes2[i],MPIU_SCALAR,ranks_recv[i],666,prec_comm,&requests[i]);CHKERRQ(ierr); 2585523858cfSStefano Zampini } 2586523858cfSStefano Zampini if (rank_coarse_proc_send_to != MPI_PROC_NULL ) { 2587523858cfSStefano Zampini send_size = pcbddc->local_primal_size*pcbddc->local_primal_size; 2588523858cfSStefano Zampini ierr = MPI_Isend(&coarse_submat_vals[0],send_size,MPIU_SCALAR,rank_coarse_proc_send_to,666,prec_comm,&requests[count_recv]);CHKERRQ(ierr); 2589523858cfSStefano Zampini } 2590523858cfSStefano Zampini ierr = MPI_Waitall(count_recv+1,requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 2591523858cfSStefano Zampini /* nonzeros */ 2592523858cfSStefano Zampini ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&dnz);CHKERRQ(ierr); 2593523858cfSStefano Zampini ierr = PetscMemzero(dnz,ins_local_primal_size*sizeof(PetscInt));CHKERRQ(ierr); 25940c7d97c5SJed Brown /* use aux_ins_indices to realize a global to local mapping */ 25950c7d97c5SJed Brown j=0; 25960c7d97c5SJed Brown for(i=0;i<pcbddc->coarse_size;i++){ 25970c7d97c5SJed Brown if(aux_ins_indices[i]==0){ 25980c7d97c5SJed Brown aux_ins_indices[i]=-1; 25990c7d97c5SJed Brown } else { 26000c7d97c5SJed Brown aux_ins_indices[i]=j; 26010c7d97c5SJed Brown j++; 26020c7d97c5SJed Brown } 26030c7d97c5SJed Brown } 26044fad6a16SStefano Zampini for (i=0;i<count_recv;i++) { 2605523858cfSStefano Zampini j = pcbddc->local_primal_sizes[ranks_recv[i]]; 2606523858cfSStefano Zampini for (k=0;k<j;k++) { 2607523858cfSStefano Zampini dnz[aux_ins_indices[pcbddc->replicated_local_primal_indices[pcbddc->local_primal_displacements[i]+k]]] += j; 26080c7d97c5SJed Brown } 26090c7d97c5SJed Brown } 2610523858cfSStefano Zampini /* check */ 2611523858cfSStefano Zampini for (i=0;i<ins_local_primal_size;i++) { 2612523858cfSStefano Zampini if (dnz[i] > ins_local_primal_size) { 2613523858cfSStefano Zampini dnz[i] = ins_local_primal_size; 26140c7d97c5SJed Brown } 26150c7d97c5SJed Brown } 26160c7d97c5SJed Brown ierr = PetscFree(requests);CHKERRQ(ierr); 26170c7d97c5SJed Brown ierr = PetscFree(aux_ins_indices);CHKERRQ(ierr); 26180c7d97c5SJed Brown if (coarse_color == 0) { ierr = PetscFree(ranks_recv);CHKERRQ(ierr); } 26194fad6a16SStefano Zampini } 26200c7d97c5SJed Brown /* create local to global mapping needed by coarse MATIS */ 2621142dfd88SStefano Zampini if (coarse_comm != MPI_COMM_NULL ) {ierr = MPI_Comm_free(&coarse_comm);CHKERRQ(ierr);} 26220c7d97c5SJed Brown coarse_comm = prec_comm; 26230c7d97c5SJed Brown active_rank = rank_prec_comm; 26240c7d97c5SJed Brown ierr = ISCreateGeneral(coarse_comm,ins_local_primal_size,ins_local_primal_indices,PETSC_COPY_VALUES,&coarse_IS);CHKERRQ(ierr); 26250c7d97c5SJed Brown ierr = ISLocalToGlobalMappingCreateIS(coarse_IS,&coarse_ISLG);CHKERRQ(ierr); 26260c7d97c5SJed Brown ierr = ISDestroy(&coarse_IS);CHKERRQ(ierr); 26272e8d2280SStefano Zampini } else if (pcbddc->coarse_problem_type==PARALLEL_BDDC) { 26280c7d97c5SJed Brown /* arrays for values insertion */ 26290c7d97c5SJed Brown ins_local_primal_size = pcbddc->local_primal_size; 26302e8d2280SStefano Zampini ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr); 26310c7d97c5SJed Brown ierr = PetscMalloc(ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar),&ins_coarse_mat_vals);CHKERRQ(ierr); 26320c7d97c5SJed Brown for (j=0;j<ins_local_primal_size;j++){ 26330c7d97c5SJed Brown ins_local_primal_indices[j]=pcbddc->local_primal_indices[j]; 26344fad6a16SStefano Zampini for (i=0;i<ins_local_primal_size;i++) { 26354fad6a16SStefano Zampini ins_coarse_mat_vals[j*ins_local_primal_size+i]=coarse_submat_vals[j*ins_local_primal_size+i]; 26364fad6a16SStefano Zampini } 26370c7d97c5SJed Brown } 26380c7d97c5SJed Brown } 26390c7d97c5SJed Brown break; 2640674ae819SStefano Zampini 26410c7d97c5SJed Brown } 26420c7d97c5SJed Brown 26430c7d97c5SJed Brown case(GATHERS_BDDC): 26440c7d97c5SJed Brown { 2645674ae819SStefano Zampini 26460c7d97c5SJed Brown PetscMPIInt mysize,mysize2; 2647ef028eecSStefano Zampini PetscMPIInt *send_buffer; 26480c7d97c5SJed Brown 26490c7d97c5SJed Brown if (rank_prec_comm==active_rank) { 26500c7d97c5SJed Brown ierr = PetscMalloc ( pcbddc->replicated_primal_size*sizeof(PetscMPIInt),&pcbddc->replicated_local_primal_indices);CHKERRQ(ierr); 26510bdf917eSStefano Zampini ierr = PetscMalloc ( pcbddc->replicated_primal_size*sizeof(PetscScalar),&pcbddc->replicated_local_primal_values);CHKERRQ(ierr); 26520c7d97c5SJed Brown ierr = PetscMalloc ( size_prec_comm*sizeof(PetscMPIInt),&localsizes2);CHKERRQ(ierr); 26530c7d97c5SJed Brown ierr = PetscMalloc ( size_prec_comm*sizeof(PetscMPIInt),&localdispl2);CHKERRQ(ierr); 26540c7d97c5SJed Brown /* arrays for values insertion */ 26552fa5cd67SKarl Rupp for (i=0;i<size_prec_comm;i++) localsizes2[i]=pcbddc->local_primal_sizes[i]*pcbddc->local_primal_sizes[i]; 26560c7d97c5SJed Brown localdispl2[0]=0; 26572fa5cd67SKarl Rupp for (i=1;i<size_prec_comm;i++) localdispl2[i]=localsizes2[i-1]+localdispl2[i-1]; 26580c7d97c5SJed Brown j=0; 26592fa5cd67SKarl Rupp for (i=0;i<size_prec_comm;i++) j+=localsizes2[i]; 26600c7d97c5SJed Brown ierr = PetscMalloc ( j*sizeof(PetscScalar),&temp_coarse_mat_vals);CHKERRQ(ierr); 26610c7d97c5SJed Brown } 26620c7d97c5SJed Brown 26630c7d97c5SJed Brown mysize=pcbddc->local_primal_size; 26640c7d97c5SJed Brown mysize2=pcbddc->local_primal_size*pcbddc->local_primal_size; 2665ef028eecSStefano Zampini ierr = PetscMalloc(mysize*sizeof(PetscMPIInt),&send_buffer);CHKERRQ(ierr); 26662fa5cd67SKarl Rupp for (i=0; i<mysize; i++) send_buffer[i]=(PetscMPIInt)pcbddc->local_primal_indices[i]; 26672fa5cd67SKarl Rupp 26680c7d97c5SJed Brown if (pcbddc->coarse_problem_type == SEQUENTIAL_BDDC){ 2669ef028eecSStefano Zampini ierr = MPI_Gatherv(send_buffer,mysize,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr); 267053cdbc3dSStefano Zampini ierr = MPI_Gatherv(&coarse_submat_vals[0],mysize2,MPIU_SCALAR,&temp_coarse_mat_vals[0],localsizes2,localdispl2,MPIU_SCALAR,master_proc,prec_comm);CHKERRQ(ierr); 26710c7d97c5SJed Brown } else { 2672ef028eecSStefano Zampini ierr = MPI_Allgatherv(send_buffer,mysize,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,prec_comm);CHKERRQ(ierr); 267353cdbc3dSStefano Zampini ierr = MPI_Allgatherv(&coarse_submat_vals[0],mysize2,MPIU_SCALAR,&temp_coarse_mat_vals[0],localsizes2,localdispl2,MPIU_SCALAR,prec_comm);CHKERRQ(ierr); 26740c7d97c5SJed Brown } 2675ef028eecSStefano Zampini ierr = PetscFree(send_buffer);CHKERRQ(ierr); 26760c7d97c5SJed Brown break; 2677da1bb401SStefano Zampini }/* switch on coarse problem and communications associated with finished */ 26780c7d97c5SJed Brown } 26790c7d97c5SJed Brown 26800c7d97c5SJed Brown /* Now create and fill up coarse matrix */ 26810c7d97c5SJed Brown if ( rank_prec_comm == active_rank ) { 2682142dfd88SStefano Zampini 2683142dfd88SStefano Zampini Mat matis_coarse_local_mat; 2684142dfd88SStefano Zampini 26850c7d97c5SJed Brown if (pcbddc->coarse_problem_type != MULTILEVEL_BDDC) { 26860c7d97c5SJed Brown ierr = MatCreate(coarse_comm,&pcbddc->coarse_mat);CHKERRQ(ierr); 26870c7d97c5SJed Brown ierr = MatSetSizes(pcbddc->coarse_mat,PETSC_DECIDE,PETSC_DECIDE,pcbddc->coarse_size,pcbddc->coarse_size);CHKERRQ(ierr); 26880c7d97c5SJed Brown ierr = MatSetType(pcbddc->coarse_mat,coarse_mat_type);CHKERRQ(ierr); 2689674ae819SStefano Zampini ierr = MatSetOptionsPrefix(pcbddc->coarse_mat,"coarse_");CHKERRQ(ierr); 2690674ae819SStefano Zampini ierr = MatSetFromOptions(pcbddc->coarse_mat);CHKERRQ(ierr); 26913b03a366Sstefano_zampini ierr = MatSetUp(pcbddc->coarse_mat);CHKERRQ(ierr); 2692da1bb401SStefano Zampini ierr = MatSetOption(pcbddc->coarse_mat,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr); /* local values stored in column major */ 26933b03a366Sstefano_zampini ierr = MatSetOption(pcbddc->coarse_mat,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr); 26940c7d97c5SJed Brown } else { 26954fad6a16SStefano Zampini ierr = MatCreateIS(coarse_comm,1,PETSC_DECIDE,PETSC_DECIDE,pcbddc->coarse_size,pcbddc->coarse_size,coarse_ISLG,&pcbddc->coarse_mat);CHKERRQ(ierr); 26963b03a366Sstefano_zampini ierr = MatSetUp(pcbddc->coarse_mat);CHKERRQ(ierr); 26970c7d97c5SJed Brown ierr = MatISGetLocalMat(pcbddc->coarse_mat,&matis_coarse_local_mat);CHKERRQ(ierr); 2698674ae819SStefano Zampini ierr = MatSetOptionsPrefix(pcbddc->coarse_mat,"coarse_");CHKERRQ(ierr); 2699674ae819SStefano Zampini ierr = MatSetFromOptions(pcbddc->coarse_mat);CHKERRQ(ierr); 27003b03a366Sstefano_zampini ierr = MatSetUp(matis_coarse_local_mat);CHKERRQ(ierr); 2701da1bb401SStefano Zampini ierr = MatSetOption(matis_coarse_local_mat,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr); /* local values stored in column major */ 2702a0ba757dSStefano Zampini ierr = MatSetOption(matis_coarse_local_mat,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr); 27030c7d97c5SJed Brown } 2704142dfd88SStefano Zampini /* preallocation */ 2705142dfd88SStefano Zampini if (pcbddc->coarse_problem_type != MULTILEVEL_BDDC) { 2706ef028eecSStefano Zampini 2707674ae819SStefano Zampini PetscInt lrows,lcols,bs; 2708ef028eecSStefano Zampini 2709142dfd88SStefano Zampini ierr = MatGetLocalSize(pcbddc->coarse_mat,&lrows,&lcols);CHKERRQ(ierr); 2710142dfd88SStefano Zampini ierr = MatPreallocateInitialize(coarse_comm,lrows,lcols,dnz,onz);CHKERRQ(ierr); 2711674ae819SStefano Zampini ierr = MatGetBlockSize(pcbddc->coarse_mat,&bs);CHKERRQ(ierr); 2712ef028eecSStefano Zampini 2713142dfd88SStefano Zampini if (pcbddc->coarse_problem_type == PARALLEL_BDDC) { 2714ef028eecSStefano Zampini 2715ef028eecSStefano Zampini Vec vec_dnz,vec_onz; 2716ef028eecSStefano Zampini PetscScalar *my_dnz,*my_onz,*array; 2717ef028eecSStefano Zampini PetscInt *mat_ranges,*row_ownership; 2718ef028eecSStefano Zampini PetscInt coarse_index_row,coarse_index_col,owner; 2719ef028eecSStefano Zampini 2720ef028eecSStefano Zampini ierr = VecCreate(prec_comm,&vec_dnz);CHKERRQ(ierr); 2721674ae819SStefano Zampini ierr = VecSetBlockSize(vec_dnz,bs);CHKERRQ(ierr); 2722ef028eecSStefano Zampini ierr = VecSetSizes(vec_dnz,PETSC_DECIDE,pcbddc->coarse_size);CHKERRQ(ierr); 2723ef028eecSStefano Zampini ierr = VecSetType(vec_dnz,VECMPI);CHKERRQ(ierr); 2724ef028eecSStefano Zampini ierr = VecDuplicate(vec_dnz,&vec_onz);CHKERRQ(ierr); 2725ef028eecSStefano Zampini 2726ef028eecSStefano Zampini ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscScalar),&my_dnz);CHKERRQ(ierr); 2727ef028eecSStefano Zampini ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscScalar),&my_onz);CHKERRQ(ierr); 2728ef028eecSStefano Zampini ierr = PetscMemzero(my_dnz,pcbddc->local_primal_size*sizeof(PetscScalar));CHKERRQ(ierr); 2729ef028eecSStefano Zampini ierr = PetscMemzero(my_onz,pcbddc->local_primal_size*sizeof(PetscScalar));CHKERRQ(ierr); 2730ef028eecSStefano Zampini 2731ef028eecSStefano Zampini ierr = PetscMalloc(pcbddc->coarse_size*sizeof(PetscInt),&row_ownership);CHKERRQ(ierr); 2732ef028eecSStefano Zampini ierr = MatGetOwnershipRanges(pcbddc->coarse_mat,(const PetscInt**)&mat_ranges);CHKERRQ(ierr); 2733142dfd88SStefano Zampini for (i=0;i<size_prec_comm;i++) { 2734ef028eecSStefano Zampini for (j=mat_ranges[i];j<mat_ranges[i+1];j++) { 2735ef028eecSStefano Zampini row_ownership[j]=i; 2736142dfd88SStefano Zampini } 2737142dfd88SStefano Zampini } 2738ef028eecSStefano Zampini 2739ef028eecSStefano Zampini for (i=0;i<pcbddc->local_primal_size;i++) { 2740ef028eecSStefano Zampini coarse_index_row = pcbddc->local_primal_indices[i]; 2741ef028eecSStefano Zampini owner = row_ownership[coarse_index_row]; 2742ef028eecSStefano Zampini for (j=i;j<pcbddc->local_primal_size;j++) { 2743ef028eecSStefano Zampini owner = row_ownership[coarse_index_row]; 2744ef028eecSStefano Zampini coarse_index_col = pcbddc->local_primal_indices[j]; 2745ef028eecSStefano Zampini if (coarse_index_col > mat_ranges[owner]-1 && coarse_index_col < mat_ranges[owner+1] ) { 2746ef028eecSStefano Zampini my_dnz[i] += 1.0; 2747142dfd88SStefano Zampini } else { 2748ef028eecSStefano Zampini my_onz[i] += 1.0; 2749142dfd88SStefano Zampini } 2750ef028eecSStefano Zampini if (i != j) { 2751ef028eecSStefano Zampini owner = row_ownership[coarse_index_col]; 2752ef028eecSStefano Zampini if (coarse_index_row > mat_ranges[owner]-1 && coarse_index_row < mat_ranges[owner+1] ) { 2753ef028eecSStefano Zampini my_dnz[j] += 1.0; 2754142dfd88SStefano Zampini } else { 2755ef028eecSStefano Zampini my_onz[j] += 1.0; 2756142dfd88SStefano Zampini } 2757142dfd88SStefano Zampini } 2758142dfd88SStefano Zampini } 2759142dfd88SStefano Zampini } 2760ef028eecSStefano Zampini ierr = VecSet(vec_dnz,0.0);CHKERRQ(ierr); 2761ef028eecSStefano Zampini ierr = VecSet(vec_onz,0.0);CHKERRQ(ierr); 2762a929c220SStefano Zampini if (pcbddc->local_primal_size) { 2763ef028eecSStefano Zampini ierr = VecSetValues(vec_dnz,pcbddc->local_primal_size,pcbddc->local_primal_indices,my_dnz,ADD_VALUES);CHKERRQ(ierr); 2764ef028eecSStefano Zampini ierr = VecSetValues(vec_onz,pcbddc->local_primal_size,pcbddc->local_primal_indices,my_onz,ADD_VALUES);CHKERRQ(ierr); 2765a929c220SStefano Zampini } 2766ef028eecSStefano Zampini ierr = VecAssemblyBegin(vec_dnz);CHKERRQ(ierr); 2767ef028eecSStefano Zampini ierr = VecAssemblyBegin(vec_onz);CHKERRQ(ierr); 2768ef028eecSStefano Zampini ierr = VecAssemblyEnd(vec_dnz);CHKERRQ(ierr); 2769ef028eecSStefano Zampini ierr = VecAssemblyEnd(vec_onz);CHKERRQ(ierr); 2770ef028eecSStefano Zampini j = mat_ranges[rank_prec_comm+1]-mat_ranges[rank_prec_comm]; 2771ef028eecSStefano Zampini ierr = VecGetArray(vec_dnz,&array);CHKERRQ(ierr); 27725b08dc53SStefano Zampini for (i=0; i<j; i++) dnz[i] = (PetscInt)PetscRealPart(array[i]); 27732fa5cd67SKarl Rupp 2774ef028eecSStefano Zampini ierr = VecRestoreArray(vec_dnz,&array);CHKERRQ(ierr); 2775ef028eecSStefano Zampini ierr = VecGetArray(vec_onz,&array);CHKERRQ(ierr); 27765b08dc53SStefano Zampini for (i=0;i<j;i++) onz[i] = (PetscInt)PetscRealPart(array[i]); 27772fa5cd67SKarl Rupp 2778ef028eecSStefano Zampini ierr = VecRestoreArray(vec_onz,&array);CHKERRQ(ierr); 2779ef028eecSStefano Zampini ierr = PetscFree(my_dnz);CHKERRQ(ierr); 2780ef028eecSStefano Zampini ierr = PetscFree(my_onz);CHKERRQ(ierr); 2781ef028eecSStefano Zampini ierr = PetscFree(row_ownership);CHKERRQ(ierr); 2782ef028eecSStefano Zampini ierr = VecDestroy(&vec_dnz);CHKERRQ(ierr); 2783ef028eecSStefano Zampini ierr = VecDestroy(&vec_onz);CHKERRQ(ierr); 2784142dfd88SStefano Zampini } else { 2785142dfd88SStefano Zampini for (k=0;k<size_prec_comm;k++){ 2786142dfd88SStefano Zampini offset=pcbddc->local_primal_displacements[k]; 2787142dfd88SStefano Zampini offset2=localdispl2[k]; 2788142dfd88SStefano Zampini ins_local_primal_size = pcbddc->local_primal_sizes[k]; 2789ef028eecSStefano Zampini ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr); 2790ef028eecSStefano Zampini for (j=0;j<ins_local_primal_size;j++){ 2791ef028eecSStefano Zampini ins_local_primal_indices[j]=(PetscInt)pcbddc->replicated_local_primal_indices[offset+j]; 2792ef028eecSStefano Zampini } 2793142dfd88SStefano Zampini for (j=0;j<ins_local_primal_size;j++) { 2794142dfd88SStefano Zampini ierr = MatPreallocateSet(ins_local_primal_indices[j],ins_local_primal_size,ins_local_primal_indices,dnz,onz);CHKERRQ(ierr); 2795142dfd88SStefano Zampini } 2796ef028eecSStefano Zampini ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr); 2797142dfd88SStefano Zampini } 2798142dfd88SStefano Zampini } 27992fa5cd67SKarl Rupp 2800142dfd88SStefano Zampini /* check */ 2801142dfd88SStefano Zampini for (i=0;i<lrows;i++) { 28022fa5cd67SKarl Rupp if (dnz[i]>lcols) dnz[i]=lcols; 28032fa5cd67SKarl Rupp if (onz[i]>pcbddc->coarse_size-lcols) onz[i]=pcbddc->coarse_size-lcols; 2804142dfd88SStefano Zampini } 2805d9a4edebSJed Brown ierr = MatSeqAIJSetPreallocation(pcbddc->coarse_mat,0,dnz);CHKERRQ(ierr); 2806d9a4edebSJed Brown ierr = MatMPIAIJSetPreallocation(pcbddc->coarse_mat,0,dnz,0,onz);CHKERRQ(ierr); 2807142dfd88SStefano Zampini ierr = MatPreallocateFinalize(dnz,onz);CHKERRQ(ierr); 2808142dfd88SStefano Zampini } else { 2809523858cfSStefano Zampini ierr = MatSeqAIJSetPreallocation(matis_coarse_local_mat,0,dnz);CHKERRQ(ierr); 2810523858cfSStefano Zampini ierr = PetscFree(dnz);CHKERRQ(ierr); 2811142dfd88SStefano Zampini } 2812142dfd88SStefano Zampini /* insert values */ 2813523858cfSStefano Zampini if (pcbddc->coarse_problem_type == PARALLEL_BDDC) { 28140c7d97c5SJed Brown ierr = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,ADD_VALUES);CHKERRQ(ierr); 2815523858cfSStefano Zampini } else if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) { 2816523858cfSStefano Zampini if (pcbddc->coarsening_ratio == 1) { 2817523858cfSStefano Zampini ins_coarse_mat_vals = coarse_submat_vals; 2818523858cfSStefano Zampini ierr = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,INSERT_VALUES);CHKERRQ(ierr); 2819523858cfSStefano Zampini } else { 2820523858cfSStefano Zampini ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr); 2821523858cfSStefano Zampini for (k=0;k<pcbddc->replicated_primal_size;k++) { 2822523858cfSStefano Zampini offset = pcbddc->local_primal_displacements[k]; 2823523858cfSStefano Zampini offset2 = localdispl2[k]; 2824523858cfSStefano Zampini ins_local_primal_size = pcbddc->local_primal_displacements[k+1]-pcbddc->local_primal_displacements[k]; 2825ef028eecSStefano Zampini ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr); 2826ef028eecSStefano Zampini for (j=0;j<ins_local_primal_size;j++){ 2827ef028eecSStefano Zampini ins_local_primal_indices[j]=(PetscInt)pcbddc->replicated_local_primal_indices[offset+j]; 2828ef028eecSStefano Zampini } 2829523858cfSStefano Zampini ins_coarse_mat_vals = &temp_coarse_mat_vals[offset2]; 2830523858cfSStefano Zampini ierr = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,ADD_VALUES);CHKERRQ(ierr); 2831ef028eecSStefano Zampini ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr); 2832523858cfSStefano Zampini } 2833523858cfSStefano Zampini } 2834523858cfSStefano Zampini ins_local_primal_indices = 0; 2835523858cfSStefano Zampini ins_coarse_mat_vals = 0; 2836ea7e1babSStefano Zampini } else { 2837ea7e1babSStefano Zampini for (k=0;k<size_prec_comm;k++){ 2838ea7e1babSStefano Zampini offset=pcbddc->local_primal_displacements[k]; 2839ea7e1babSStefano Zampini offset2=localdispl2[k]; 2840ea7e1babSStefano Zampini ins_local_primal_size = pcbddc->local_primal_sizes[k]; 2841ef028eecSStefano Zampini ierr = PetscMalloc(ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr); 2842ef028eecSStefano Zampini for (j=0;j<ins_local_primal_size;j++){ 2843ef028eecSStefano Zampini ins_local_primal_indices[j]=(PetscInt)pcbddc->replicated_local_primal_indices[offset+j]; 2844ef028eecSStefano Zampini } 2845ea7e1babSStefano Zampini ins_coarse_mat_vals = &temp_coarse_mat_vals[offset2]; 2846ea7e1babSStefano Zampini ierr = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,ADD_VALUES);CHKERRQ(ierr); 2847ef028eecSStefano Zampini ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr); 2848ea7e1babSStefano Zampini } 2849ea7e1babSStefano Zampini ins_local_primal_indices = 0; 2850ea7e1babSStefano Zampini ins_coarse_mat_vals = 0; 2851ea7e1babSStefano Zampini } 28520c7d97c5SJed Brown ierr = MatAssemblyBegin(pcbddc->coarse_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 28530c7d97c5SJed Brown ierr = MatAssemblyEnd(pcbddc->coarse_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2854142dfd88SStefano Zampini /* symmetry of coarse matrix */ 2855142dfd88SStefano Zampini if (issym) { 2856142dfd88SStefano Zampini ierr = MatSetOption(pcbddc->coarse_mat,MAT_SYMMETRIC,PETSC_TRUE);CHKERRQ(ierr); 2857142dfd88SStefano Zampini } 28580c7d97c5SJed Brown ierr = MatGetVecs(pcbddc->coarse_mat,&pcbddc->coarse_vec,&pcbddc->coarse_rhs);CHKERRQ(ierr); 28590bdf917eSStefano Zampini } 28600bdf917eSStefano Zampini 28610bdf917eSStefano Zampini /* create loc to glob scatters if needed */ 28620bdf917eSStefano Zampini if (pcbddc->coarse_communications_type == SCATTERS_BDDC) { 28630bdf917eSStefano Zampini IS local_IS,global_IS; 28640bdf917eSStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,pcbddc->local_primal_size,0,1,&local_IS);CHKERRQ(ierr); 28650bdf917eSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_indices,PETSC_COPY_VALUES,&global_IS);CHKERRQ(ierr); 28660bdf917eSStefano Zampini ierr = VecScatterCreate(pcbddc->vec1_P,local_IS,pcbddc->coarse_vec,global_IS,&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr); 28670bdf917eSStefano Zampini ierr = ISDestroy(&local_IS);CHKERRQ(ierr); 28680bdf917eSStefano Zampini ierr = ISDestroy(&global_IS);CHKERRQ(ierr); 28690bdf917eSStefano Zampini } 28700bdf917eSStefano Zampini 2871a929c220SStefano Zampini /* free memory no longer needed */ 2872a929c220SStefano Zampini if (coarse_ISLG) { ierr = ISLocalToGlobalMappingDestroy(&coarse_ISLG);CHKERRQ(ierr); } 2873a929c220SStefano Zampini if (ins_local_primal_indices) { ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr); } 2874a929c220SStefano Zampini if (ins_coarse_mat_vals) { ierr = PetscFree(ins_coarse_mat_vals);CHKERRQ(ierr); } 2875a929c220SStefano Zampini if (localsizes2) { ierr = PetscFree(localsizes2);CHKERRQ(ierr); } 2876a929c220SStefano Zampini if (localdispl2) { ierr = PetscFree(localdispl2);CHKERRQ(ierr); } 2877a929c220SStefano Zampini if (temp_coarse_mat_vals) { ierr = PetscFree(temp_coarse_mat_vals);CHKERRQ(ierr); } 2878a929c220SStefano Zampini 2879674ae819SStefano Zampini /* Compute coarse null space */ 2880674ae819SStefano Zampini CoarseNullSpace = 0; 28810bdf917eSStefano Zampini if (pcbddc->NullSpace) { 2882674ae819SStefano Zampini ierr = PCBDDCNullSpaceAssembleCoarse(pc,&CoarseNullSpace);CHKERRQ(ierr); 28830bdf917eSStefano Zampini } 28840bdf917eSStefano Zampini 28850bdf917eSStefano Zampini /* KSP for coarse problem */ 28860bdf917eSStefano Zampini if (rank_prec_comm == active_rank) { 28872e8d2280SStefano Zampini PetscBool isbddc=PETSC_FALSE; 28880bdf917eSStefano Zampini 288953cdbc3dSStefano Zampini ierr = KSPCreate(coarse_comm,&pcbddc->coarse_ksp);CHKERRQ(ierr); 289053cdbc3dSStefano Zampini ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->coarse_ksp,(PetscObject)pc,1);CHKERRQ(ierr); 289153cdbc3dSStefano Zampini ierr = KSPSetOperators(pcbddc->coarse_ksp,pcbddc->coarse_mat,pcbddc->coarse_mat,SAME_PRECONDITIONER);CHKERRQ(ierr); 28923b03a366Sstefano_zampini ierr = KSPSetTolerances(pcbddc->coarse_ksp,PETSC_DEFAULT,PETSC_DEFAULT,PETSC_DEFAULT,max_it_coarse_ksp);CHKERRQ(ierr); 289353cdbc3dSStefano Zampini ierr = KSPSetType(pcbddc->coarse_ksp,coarse_ksp_type);CHKERRQ(ierr); 289453cdbc3dSStefano Zampini ierr = KSPGetPC(pcbddc->coarse_ksp,&pc_temp);CHKERRQ(ierr); 289553cdbc3dSStefano Zampini ierr = PCSetType(pc_temp,coarse_pc_type);CHKERRQ(ierr); 28960c7d97c5SJed Brown /* Allow user's customization */ 2897da1bb401SStefano Zampini ierr = KSPSetOptionsPrefix(pcbddc->coarse_ksp,"coarse_");CHKERRQ(ierr); 28980c7d97c5SJed Brown /* Set Up PC for coarse problem BDDC */ 289953cdbc3dSStefano Zampini if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) { 29004fad6a16SStefano Zampini i = pcbddc->current_level+1; 29014fad6a16SStefano Zampini ierr = PCBDDCSetLevel(pc_temp,i);CHKERRQ(ierr); 29024fad6a16SStefano Zampini ierr = PCBDDCSetCoarseningRatio(pc_temp,pcbddc->coarsening_ratio);CHKERRQ(ierr); 29034fad6a16SStefano Zampini ierr = PCBDDCSetMaxLevels(pc_temp,pcbddc->max_levels);CHKERRQ(ierr); 290453cdbc3dSStefano Zampini ierr = PCBDDCSetCoarseProblemType(pc_temp,MULTILEVEL_BDDC);CHKERRQ(ierr); 2905674ae819SStefano Zampini if (CoarseNullSpace) { 2906674ae819SStefano Zampini ierr = PCBDDCSetNullSpace(pc_temp,CoarseNullSpace);CHKERRQ(ierr); 2907674ae819SStefano Zampini } 29084fad6a16SStefano Zampini if (dbg_flag) { 29094fad6a16SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"----------------Level %d: Setting up level %d---------------\n",pcbddc->current_level,i);CHKERRQ(ierr); 29104fad6a16SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 291153cdbc3dSStefano Zampini } 2912674ae819SStefano Zampini } else { 2913674ae819SStefano Zampini if (CoarseNullSpace) { 2914674ae819SStefano Zampini ierr = KSPSetNullSpace(pcbddc->coarse_ksp,CoarseNullSpace);CHKERRQ(ierr); 2915674ae819SStefano Zampini } 29164fad6a16SStefano Zampini } 29174fad6a16SStefano Zampini ierr = KSPSetFromOptions(pcbddc->coarse_ksp);CHKERRQ(ierr); 291853cdbc3dSStefano Zampini ierr = KSPSetUp(pcbddc->coarse_ksp);CHKERRQ(ierr); 2919142dfd88SStefano Zampini 29200298fd71SBarry Smith ierr = KSPGetTolerances(pcbddc->coarse_ksp,NULL,NULL,NULL,&j);CHKERRQ(ierr); 29212e8d2280SStefano Zampini ierr = KSPGetPC(pcbddc->coarse_ksp,&pc_temp);CHKERRQ(ierr); 29222e8d2280SStefano Zampini ierr = PetscObjectTypeCompare((PetscObject)pc_temp,PCBDDC,&isbddc);CHKERRQ(ierr); 29232e8d2280SStefano Zampini if (j == 1) { 29242e8d2280SStefano Zampini ierr = KSPSetNormType(pcbddc->coarse_ksp,KSP_NORM_NONE);CHKERRQ(ierr); 29252e8d2280SStefano Zampini if (isbddc) { 29262e8d2280SStefano Zampini ierr = PCBDDCSetUseExactDirichlet(pc_temp,PETSC_FALSE);CHKERRQ(ierr); 29275619798eSStefano Zampini } 29285619798eSStefano Zampini } 29290c7d97c5SJed Brown } 2930a929c220SStefano Zampini /* Check coarse problem if requested */ 2931142dfd88SStefano Zampini if ( dbg_flag && rank_prec_comm == active_rank ) { 2932142dfd88SStefano Zampini KSP check_ksp; 2933142dfd88SStefano Zampini PC check_pc; 2934142dfd88SStefano Zampini Vec check_vec; 2935142dfd88SStefano Zampini PetscReal abs_infty_error,infty_error,lambda_min,lambda_max; 293619fd82e9SBarry Smith KSPType check_ksp_type; 29370c7d97c5SJed Brown 2938142dfd88SStefano Zampini /* Create ksp object suitable for extreme eigenvalues' estimation */ 2939142dfd88SStefano Zampini ierr = KSPCreate(coarse_comm,&check_ksp);CHKERRQ(ierr); 2940142dfd88SStefano Zampini ierr = KSPSetOperators(check_ksp,pcbddc->coarse_mat,pcbddc->coarse_mat,SAME_PRECONDITIONER);CHKERRQ(ierr); 29410bdf917eSStefano Zampini ierr = KSPSetTolerances(check_ksp,1.e-12,1.e-12,PETSC_DEFAULT,pcbddc->coarse_size);CHKERRQ(ierr); 2942142dfd88SStefano Zampini if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) { 29432fa5cd67SKarl Rupp if (issym) check_ksp_type = KSPCG; 29442fa5cd67SKarl Rupp else check_ksp_type = KSPGMRES; 2945142dfd88SStefano Zampini ierr = KSPSetComputeSingularValues(check_ksp,PETSC_TRUE);CHKERRQ(ierr); 2946142dfd88SStefano Zampini } else { 2947142dfd88SStefano Zampini check_ksp_type = KSPPREONLY; 2948142dfd88SStefano Zampini } 2949142dfd88SStefano Zampini ierr = KSPSetType(check_ksp,check_ksp_type);CHKERRQ(ierr); 2950142dfd88SStefano Zampini ierr = KSPGetPC(pcbddc->coarse_ksp,&check_pc);CHKERRQ(ierr); 2951142dfd88SStefano Zampini ierr = KSPSetPC(check_ksp,check_pc);CHKERRQ(ierr); 2952142dfd88SStefano Zampini ierr = KSPSetUp(check_ksp);CHKERRQ(ierr); 2953142dfd88SStefano Zampini /* create random vec */ 2954142dfd88SStefano Zampini ierr = VecDuplicate(pcbddc->coarse_vec,&check_vec);CHKERRQ(ierr); 29550298fd71SBarry Smith ierr = VecSetRandom(check_vec,NULL);CHKERRQ(ierr); 2956674ae819SStefano Zampini if (CoarseNullSpace) { 29571cb54aadSJed Brown ierr = MatNullSpaceRemove(CoarseNullSpace,check_vec);CHKERRQ(ierr); 2958674ae819SStefano Zampini } 2959142dfd88SStefano Zampini ierr = MatMult(pcbddc->coarse_mat,check_vec,pcbddc->coarse_rhs);CHKERRQ(ierr); 2960142dfd88SStefano Zampini /* solve coarse problem */ 2961142dfd88SStefano Zampini ierr = KSPSolve(check_ksp,pcbddc->coarse_rhs,pcbddc->coarse_vec);CHKERRQ(ierr); 2962674ae819SStefano Zampini if (CoarseNullSpace) { 29631cb54aadSJed Brown ierr = MatNullSpaceRemove(CoarseNullSpace,pcbddc->coarse_vec);CHKERRQ(ierr); 2964674ae819SStefano Zampini } 2965142dfd88SStefano Zampini /* check coarse problem residual error */ 2966142dfd88SStefano Zampini ierr = VecAXPY(check_vec,-1.0,pcbddc->coarse_vec);CHKERRQ(ierr); 2967142dfd88SStefano Zampini ierr = VecNorm(check_vec,NORM_INFINITY,&infty_error);CHKERRQ(ierr); 2968142dfd88SStefano Zampini ierr = MatMult(pcbddc->coarse_mat,check_vec,pcbddc->coarse_rhs);CHKERRQ(ierr); 2969142dfd88SStefano Zampini ierr = VecNorm(pcbddc->coarse_rhs,NORM_INFINITY,&abs_infty_error);CHKERRQ(ierr); 2970142dfd88SStefano Zampini ierr = VecDestroy(&check_vec);CHKERRQ(ierr); 2971142dfd88SStefano Zampini /* get eigenvalue estimation if inexact */ 2972142dfd88SStefano Zampini if (pcbddc->coarse_problem_type == MULTILEVEL_BDDC) { 2973142dfd88SStefano Zampini ierr = KSPComputeExtremeSingularValues(check_ksp,&lambda_max,&lambda_min);CHKERRQ(ierr); 2974142dfd88SStefano Zampini ierr = KSPGetIterationNumber(check_ksp,&k);CHKERRQ(ierr); 2975142dfd88SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem eigenvalues estimated with %d iterations of %s.\n",k,check_ksp_type);CHKERRQ(ierr); 2976e269702eSStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem eigenvalues: % 1.14e %1.14e\n",lambda_min,lambda_max);CHKERRQ(ierr); 29773b03a366Sstefano_zampini } 2978142dfd88SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem exact infty_error : %1.14e\n",infty_error);CHKERRQ(ierr); 2979142dfd88SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem residual infty_error: %1.14e\n",abs_infty_error);CHKERRQ(ierr); 2980142dfd88SStefano Zampini ierr = KSPDestroy(&check_ksp);CHKERRQ(ierr); 298153cdbc3dSStefano Zampini } 2982674ae819SStefano Zampini if (dbg_flag) { 2983da1bb401SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 2984da1bb401SStefano Zampini } 2985674ae819SStefano Zampini ierr = MatNullSpaceDestroy(&CoarseNullSpace);CHKERRQ(ierr); 2986a0ba757dSStefano Zampini 29870c7d97c5SJed Brown PetscFunctionReturn(0); 29880c7d97c5SJed Brown } 29890c7d97c5SJed Brown 2990