153cdbc3dSStefano Zampini /* TODOLIST 2da1bb401SStefano Zampini DofSplitting and DM attached to pc? 3da1bb401SStefano Zampini Change SetNeumannBoundaries to SetNeumannBoundariesLocal and provide new SetNeumannBoundaries (same Dirichlet) 4da1bb401SStefano Zampini Exact solvers: Solve local saddle point directly 5831a100dSStefano Zampini - change prec_type to switch_inexact_prec_type 6831a100dSStefano Zampini - add bool solve_exact_saddle_point slot to pdbddc data 73b03a366Sstefano_zampini Inexact solvers: global preconditioner application is ready, ask to developers (Jed?) on how to best implement Dohrmann's approach (PCSHELL?) 8a0ba757dSStefano Zampini change how to deal with the coarse problem (PCBDDCSetCoarseEnvironment): 9a0ba757dSStefano Zampini - mind the problem with coarsening_factor 10a0ba757dSStefano Zampini - simplify coarse problem structure -> PCBDDC or PCREDUDANT, nothing else -> same comm for all levels? 11a0ba757dSStefano Zampini - remove coarse enums and allow use of PCBDDCGetCoarseKSP 12a0ba757dSStefano Zampini - remove metis dependency -> use MatPartitioning for multilevel -> Assemble serial adjacency in ManageLocalBoundaries? 133b03a366Sstefano_zampini - Add levels' slot to bddc data structure and associated Set/Get functions 14a0ba757dSStefano Zampini code refactoring: 15a0ba757dSStefano Zampini - pick up better names for static functions 16a0ba757dSStefano Zampini change options structure: 17a0ba757dSStefano Zampini - insert BDDC into MG framework? 18a0ba757dSStefano Zampini provide other ops? Ask to developers 19a0ba757dSStefano Zampini remove all unused printf 20a0ba757dSStefano Zampini man pages 2153cdbc3dSStefano Zampini */ 220c7d97c5SJed Brown 2353cdbc3dSStefano Zampini /* ---------------------------------------------------------------------------------------------------------------------------------------------- 240c7d97c5SJed Brown Implementation of BDDC preconditioner based on: 250c7d97c5SJed Brown C. Dohrmann "An approximate BDDC preconditioner", Numerical Linear Algebra with Applications Volume 14, Issue 2, pages 149-168, March 2007 2653cdbc3dSStefano Zampini ---------------------------------------------------------------------------------------------------------------------------------------------- */ 2753cdbc3dSStefano Zampini 2853cdbc3dSStefano Zampini #include "bddc.h" /*I "petscpc.h" I*/ /* includes for fortran wrappers */ 293b03a366Sstefano_zampini #include <petscblaslapack.h> 300c7d97c5SJed Brown 310c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 320c7d97c5SJed Brown #undef __FUNCT__ 330c7d97c5SJed Brown #define __FUNCT__ "PCSetFromOptions_BDDC" 340c7d97c5SJed Brown PetscErrorCode PCSetFromOptions_BDDC(PC pc) 350c7d97c5SJed Brown { 360c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 370c7d97c5SJed Brown PetscErrorCode ierr; 380c7d97c5SJed Brown 390c7d97c5SJed Brown PetscFunctionBegin; 400c7d97c5SJed Brown ierr = PetscOptionsHead("BDDC options");CHKERRQ(ierr); 410c7d97c5SJed Brown /* Verbose debugging of main data structures */ 42e269702eSStefano Zampini ierr = PetscOptionsBool("-pc_bddc_check_all" ,"Verbose (debugging) output for PCBDDC" ,"none",pcbddc->dbg_flag ,&pcbddc->dbg_flag ,PETSC_NULL);CHKERRQ(ierr); 430c7d97c5SJed Brown /* Some customization for default primal space */ 44da1bb401SStefano Zampini ierr = PetscOptionsBool("-pc_bddc_vertices_only" ,"Use only vertices in coarse space (i.e. discard constraints)","none",pcbddc->vertices_flag ,&pcbddc->vertices_flag ,PETSC_NULL);CHKERRQ(ierr); 45da1bb401SStefano Zampini ierr = PetscOptionsBool("-pc_bddc_constraints_only","Use only constraints in coarse space (i.e. discard vertices)","none",pcbddc->constraints_flag,&pcbddc->constraints_flag,PETSC_NULL);CHKERRQ(ierr); 46da1bb401SStefano Zampini ierr = PetscOptionsBool("-pc_bddc_faces_only" ,"Use only faces among constraints of coarse space (i.e. discard edges)" ,"none",pcbddc->faces_flag ,&pcbddc->faces_flag ,PETSC_NULL);CHKERRQ(ierr); 47da1bb401SStefano Zampini ierr = PetscOptionsBool("-pc_bddc_edges_only" ,"Use only edges among constraints of coarse space (i.e. discard faces)" ,"none",pcbddc->edges_flag ,&pcbddc->edges_flag ,PETSC_NULL);CHKERRQ(ierr); 480c7d97c5SJed Brown /* Coarse solver context */ 49da1bb401SStefano Zampini static const char *avail_coarse_problems[] = {"sequential","replicated","parallel","multilevel",""}; /*order of choiches depends on ENUM defined in bddc.h */ 500c7d97c5SJed Brown ierr = PetscOptionsEnum("-pc_bddc_coarse_problem_type","Set coarse problem type","none",avail_coarse_problems,(PetscEnum)pcbddc->coarse_problem_type,(PetscEnum*)&pcbddc->coarse_problem_type,PETSC_NULL);CHKERRQ(ierr); 510c7d97c5SJed Brown /* Two different application of BDDC to the whole set of dofs, internal and interface */ 520c7d97c5SJed Brown ierr = PetscOptionsBool("-pc_bddc_switch_preconditioning_type","Switch between M_2 (default) and M_3 preconditioners (as defined by Dohrmann)","none",pcbddc->prec_type,&pcbddc->prec_type,PETSC_NULL);CHKERRQ(ierr); 53534831adSStefano Zampini ierr = PetscOptionsBool("-pc_bddc_use_change_of_basis","Use change of basis approach for primal space","none",pcbddc->usechangeofbasis,&pcbddc->usechangeofbasis,PETSC_NULL);CHKERRQ(ierr); 54534831adSStefano Zampini ierr = PetscOptionsBool("-pc_bddc_use_change_on_faces","Use change of basis approach for face constraints","none",pcbddc->usechangeonfaces,&pcbddc->usechangeonfaces,PETSC_NULL);CHKERRQ(ierr); 55534831adSStefano Zampini pcbddc->usechangeonfaces = pcbddc->usechangeonfaces && pcbddc->usechangeofbasis; 560c7d97c5SJed Brown ierr = PetscOptionsInt("-pc_bddc_coarsening_ratio","Set coarsening ratio used in multilevel coarsening","none",pcbddc->coarsening_ratio,&pcbddc->coarsening_ratio,PETSC_NULL);CHKERRQ(ierr); 570c7d97c5SJed Brown ierr = PetscOptionsTail();CHKERRQ(ierr); 580c7d97c5SJed Brown PetscFunctionReturn(0); 590c7d97c5SJed Brown } 600c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 610c7d97c5SJed Brown EXTERN_C_BEGIN 620c7d97c5SJed Brown #undef __FUNCT__ 630c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetCoarseProblemType_BDDC" 6453cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetCoarseProblemType_BDDC(PC pc, CoarseProblemType CPT) 650c7d97c5SJed Brown { 660c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 670c7d97c5SJed Brown 680c7d97c5SJed Brown PetscFunctionBegin; 690c7d97c5SJed Brown pcbddc->coarse_problem_type = CPT; 700c7d97c5SJed Brown PetscFunctionReturn(0); 710c7d97c5SJed Brown } 720c7d97c5SJed Brown EXTERN_C_END 730c7d97c5SJed Brown #undef __FUNCT__ 740c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetCoarseProblemType" 7553cdbc3dSStefano Zampini /*@ 769c0446d6SStefano Zampini PCBDDCSetCoarseProblemType - Set coarse problem type in PCBDDC. 7753cdbc3dSStefano Zampini 789c0446d6SStefano Zampini Not collective 7953cdbc3dSStefano Zampini 8053cdbc3dSStefano Zampini Input Parameters: 8153cdbc3dSStefano Zampini + pc - the preconditioning context 8253cdbc3dSStefano Zampini - CoarseProblemType - pick a better name and explain what this is 8353cdbc3dSStefano Zampini 8453cdbc3dSStefano Zampini Level: intermediate 8553cdbc3dSStefano Zampini 8653cdbc3dSStefano Zampini Notes: 87da1bb401SStefano Zampini Not collective but all procs must call with same arguments. 8853cdbc3dSStefano Zampini 8953cdbc3dSStefano Zampini .seealso: PCBDDC 9053cdbc3dSStefano Zampini @*/ 910c7d97c5SJed Brown PetscErrorCode PCBDDCSetCoarseProblemType(PC pc, CoarseProblemType CPT) 920c7d97c5SJed Brown { 930c7d97c5SJed Brown PetscErrorCode ierr; 940c7d97c5SJed Brown 950c7d97c5SJed Brown PetscFunctionBegin; 960c7d97c5SJed Brown PetscValidHeaderSpecific(pc,PC_CLASSID,1); 970c7d97c5SJed Brown ierr = PetscTryMethod(pc,"PCBDDCSetCoarseProblemType_C",(PC,CoarseProblemType),(pc,CPT));CHKERRQ(ierr); 980c7d97c5SJed Brown PetscFunctionReturn(0); 990c7d97c5SJed Brown } 1000c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 1010c7d97c5SJed Brown EXTERN_C_BEGIN 1020c7d97c5SJed Brown #undef __FUNCT__ 1033b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCSetDirichletBoundaries_BDDC" 1043b03a366Sstefano_zampini static PetscErrorCode PCBDDCSetDirichletBoundaries_BDDC(PC pc,IS DirichletBoundaries) 1053b03a366Sstefano_zampini { 1063b03a366Sstefano_zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 1073b03a366Sstefano_zampini PetscErrorCode ierr; 1083b03a366Sstefano_zampini 1093b03a366Sstefano_zampini PetscFunctionBegin; 1103b03a366Sstefano_zampini ierr = ISDestroy(&pcbddc->DirichletBoundaries);CHKERRQ(ierr); 11136e030ebSStefano Zampini ierr = PetscObjectReference((PetscObject)DirichletBoundaries);CHKERRQ(ierr); 11236e030ebSStefano Zampini pcbddc->DirichletBoundaries=DirichletBoundaries; 1133b03a366Sstefano_zampini PetscFunctionReturn(0); 1143b03a366Sstefano_zampini } 1153b03a366Sstefano_zampini EXTERN_C_END 1163b03a366Sstefano_zampini #undef __FUNCT__ 1173b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCSetDirichletBoundaries" 1183b03a366Sstefano_zampini /*@ 119da1bb401SStefano Zampini PCBDDCSetDirichletBoundaries - Set index set defining subdomain part (in local ordering) 120da1bb401SStefano Zampini of Dirichlet boundaries for the global problem. 1213b03a366Sstefano_zampini 1223b03a366Sstefano_zampini Not collective 1233b03a366Sstefano_zampini 1243b03a366Sstefano_zampini Input Parameters: 1253b03a366Sstefano_zampini + pc - the preconditioning context 1263b03a366Sstefano_zampini - DirichletBoundaries - sequential index set defining the subdomain part of Dirichlet boundaries (can be PETSC_NULL) 1273b03a366Sstefano_zampini 1283b03a366Sstefano_zampini Level: intermediate 1293b03a366Sstefano_zampini 1303b03a366Sstefano_zampini Notes: 1313b03a366Sstefano_zampini 1323b03a366Sstefano_zampini .seealso: PCBDDC 1333b03a366Sstefano_zampini @*/ 1343b03a366Sstefano_zampini PetscErrorCode PCBDDCSetDirichletBoundaries(PC pc,IS DirichletBoundaries) 1353b03a366Sstefano_zampini { 1363b03a366Sstefano_zampini PetscErrorCode ierr; 1373b03a366Sstefano_zampini 1383b03a366Sstefano_zampini PetscFunctionBegin; 1393b03a366Sstefano_zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 1403b03a366Sstefano_zampini ierr = PetscTryMethod(pc,"PCBDDCSetDirichletBoundaries_C",(PC,IS),(pc,DirichletBoundaries));CHKERRQ(ierr); 1413b03a366Sstefano_zampini PetscFunctionReturn(0); 1423b03a366Sstefano_zampini } 1433b03a366Sstefano_zampini /* -------------------------------------------------------------------------- */ 1443b03a366Sstefano_zampini EXTERN_C_BEGIN 1453b03a366Sstefano_zampini #undef __FUNCT__ 1460c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetNeumannBoundaries_BDDC" 14753cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetNeumannBoundaries_BDDC(PC pc,IS NeumannBoundaries) 1480c7d97c5SJed Brown { 1490c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 15053cdbc3dSStefano Zampini PetscErrorCode ierr; 1510c7d97c5SJed Brown 1520c7d97c5SJed Brown PetscFunctionBegin; 15353cdbc3dSStefano Zampini ierr = ISDestroy(&pcbddc->NeumannBoundaries);CHKERRQ(ierr); 15436e030ebSStefano Zampini ierr = PetscObjectReference((PetscObject)NeumannBoundaries);CHKERRQ(ierr); 15536e030ebSStefano Zampini pcbddc->NeumannBoundaries=NeumannBoundaries; 1560c7d97c5SJed Brown PetscFunctionReturn(0); 1570c7d97c5SJed Brown } 1580c7d97c5SJed Brown EXTERN_C_END 1590c7d97c5SJed Brown #undef __FUNCT__ 1600c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetNeumannBoundaries" 16157527edcSJed Brown /*@ 162da1bb401SStefano Zampini PCBDDCSetNeumannBoundaries - Set index set defining subdomain part (in local ordering) 163da1bb401SStefano Zampini of Neumann boundaries for the global problem. 16457527edcSJed Brown 1659c0446d6SStefano Zampini Not collective 16657527edcSJed Brown 16757527edcSJed Brown Input Parameters: 16857527edcSJed Brown + pc - the preconditioning context 1699c0446d6SStefano Zampini - NeumannBoundaries - sequential index set defining the subdomain part of Neumann boundaries (can be PETSC_NULL) 17057527edcSJed Brown 17157527edcSJed Brown Level: intermediate 17257527edcSJed Brown 17357527edcSJed Brown Notes: 17457527edcSJed Brown 17557527edcSJed Brown .seealso: PCBDDC 17657527edcSJed Brown @*/ 17753cdbc3dSStefano Zampini PetscErrorCode PCBDDCSetNeumannBoundaries(PC pc,IS NeumannBoundaries) 1780c7d97c5SJed Brown { 1790c7d97c5SJed Brown PetscErrorCode ierr; 1800c7d97c5SJed Brown 1810c7d97c5SJed Brown PetscFunctionBegin; 1820c7d97c5SJed Brown PetscValidHeaderSpecific(pc,PC_CLASSID,1); 18353cdbc3dSStefano Zampini ierr = PetscTryMethod(pc,"PCBDDCSetNeumannBoundaries_C",(PC,IS),(pc,NeumannBoundaries));CHKERRQ(ierr); 18453cdbc3dSStefano Zampini PetscFunctionReturn(0); 18553cdbc3dSStefano Zampini } 18653cdbc3dSStefano Zampini /* -------------------------------------------------------------------------- */ 18753cdbc3dSStefano Zampini EXTERN_C_BEGIN 18853cdbc3dSStefano Zampini #undef __FUNCT__ 189da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCGetDirichletBoundaries_BDDC" 190da1bb401SStefano Zampini static PetscErrorCode PCBDDCGetDirichletBoundaries_BDDC(PC pc,IS *DirichletBoundaries) 191da1bb401SStefano Zampini { 192da1bb401SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 193da1bb401SStefano Zampini 194da1bb401SStefano Zampini PetscFunctionBegin; 195da1bb401SStefano Zampini *DirichletBoundaries = pcbddc->DirichletBoundaries; 196da1bb401SStefano Zampini PetscFunctionReturn(0); 197da1bb401SStefano Zampini } 198da1bb401SStefano Zampini EXTERN_C_END 199da1bb401SStefano Zampini #undef __FUNCT__ 200da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCGetDirichletBoundaries" 201da1bb401SStefano Zampini /*@ 202da1bb401SStefano Zampini PCBDDCGetDirichletBoundaries - Get index set defining subdomain part (in local ordering) 203da1bb401SStefano Zampini of Dirichlet boundaries for the global problem. 204da1bb401SStefano Zampini 205da1bb401SStefano Zampini Not collective 206da1bb401SStefano Zampini 207da1bb401SStefano Zampini Input Parameters: 208da1bb401SStefano Zampini + pc - the preconditioning context 209da1bb401SStefano Zampini 210da1bb401SStefano Zampini Output Parameters: 211da1bb401SStefano Zampini + DirichletBoundaries - index set defining the subdomain part of Dirichlet boundaries 212da1bb401SStefano Zampini 213da1bb401SStefano Zampini Level: intermediate 214da1bb401SStefano Zampini 215da1bb401SStefano Zampini Notes: 216da1bb401SStefano Zampini 217da1bb401SStefano Zampini .seealso: PCBDDC 218da1bb401SStefano Zampini @*/ 219da1bb401SStefano Zampini PetscErrorCode PCBDDCGetDirichletBoundaries(PC pc,IS *DirichletBoundaries) 220da1bb401SStefano Zampini { 221da1bb401SStefano Zampini PetscErrorCode ierr; 222da1bb401SStefano Zampini 223da1bb401SStefano Zampini PetscFunctionBegin; 224da1bb401SStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 225da1bb401SStefano Zampini ierr = PetscUseMethod(pc,"PCBDDCGetDirichletBoundaries_C",(PC,IS*),(pc,DirichletBoundaries));CHKERRQ(ierr); 226da1bb401SStefano Zampini PetscFunctionReturn(0); 227da1bb401SStefano Zampini } 228da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */ 229da1bb401SStefano Zampini EXTERN_C_BEGIN 230da1bb401SStefano Zampini #undef __FUNCT__ 23153cdbc3dSStefano Zampini #define __FUNCT__ "PCBDDCGetNeumannBoundaries_BDDC" 23253cdbc3dSStefano Zampini static PetscErrorCode PCBDDCGetNeumannBoundaries_BDDC(PC pc,IS *NeumannBoundaries) 23353cdbc3dSStefano Zampini { 23453cdbc3dSStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 23553cdbc3dSStefano Zampini 23653cdbc3dSStefano Zampini PetscFunctionBegin; 23753cdbc3dSStefano Zampini *NeumannBoundaries = pcbddc->NeumannBoundaries; 23853cdbc3dSStefano Zampini PetscFunctionReturn(0); 23953cdbc3dSStefano Zampini } 24053cdbc3dSStefano Zampini EXTERN_C_END 24153cdbc3dSStefano Zampini #undef __FUNCT__ 24253cdbc3dSStefano Zampini #define __FUNCT__ "PCBDDCGetNeumannBoundaries" 24353cdbc3dSStefano Zampini /*@ 244da1bb401SStefano Zampini PCBDDCGetNeumannBoundaries - Get index set defining subdomain part (in local ordering) 245da1bb401SStefano Zampini of Neumann boundaries for the global problem. 24653cdbc3dSStefano Zampini 2479c0446d6SStefano Zampini Not collective 24853cdbc3dSStefano Zampini 24953cdbc3dSStefano Zampini Input Parameters: 25053cdbc3dSStefano Zampini + pc - the preconditioning context 25153cdbc3dSStefano Zampini 25253cdbc3dSStefano Zampini Output Parameters: 25353cdbc3dSStefano Zampini + NeumannBoundaries - index set defining the subdomain part of Neumann boundaries 25453cdbc3dSStefano Zampini 25553cdbc3dSStefano Zampini Level: intermediate 25653cdbc3dSStefano Zampini 25753cdbc3dSStefano Zampini Notes: 25853cdbc3dSStefano Zampini 25953cdbc3dSStefano Zampini .seealso: PCBDDC 26053cdbc3dSStefano Zampini @*/ 26153cdbc3dSStefano Zampini PetscErrorCode PCBDDCGetNeumannBoundaries(PC pc,IS *NeumannBoundaries) 26253cdbc3dSStefano Zampini { 26353cdbc3dSStefano Zampini PetscErrorCode ierr; 26453cdbc3dSStefano Zampini 26553cdbc3dSStefano Zampini PetscFunctionBegin; 26653cdbc3dSStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 26753cdbc3dSStefano Zampini ierr = PetscUseMethod(pc,"PCBDDCGetNeumannBoundaries_C",(PC,IS*),(pc,NeumannBoundaries));CHKERRQ(ierr); 2680c7d97c5SJed Brown PetscFunctionReturn(0); 2690c7d97c5SJed Brown } 27036e030ebSStefano Zampini /* -------------------------------------------------------------------------- */ 27136e030ebSStefano Zampini EXTERN_C_BEGIN 27236e030ebSStefano Zampini #undef __FUNCT__ 273da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetLocalAdjacencyGraph_BDDC" 274da1bb401SStefano Zampini static PetscErrorCode PCBDDCSetLocalAdjacencyGraph_BDDC(PC pc, PetscInt nvtxs, PetscInt xadj[], PetscInt adjncy[], PetscCopyMode copymode) 27536e030ebSStefano Zampini { 27636e030ebSStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 277da1bb401SStefano Zampini PCBDDCGraph mat_graph=pcbddc->mat_graph; 278da1bb401SStefano Zampini PetscErrorCode ierr; 27936e030ebSStefano Zampini 28036e030ebSStefano Zampini PetscFunctionBegin; 281da1bb401SStefano Zampini mat_graph->nvtxs=nvtxs; 282da1bb401SStefano Zampini ierr = PetscFree(mat_graph->xadj);CHKERRQ(ierr); 283da1bb401SStefano Zampini ierr = PetscFree(mat_graph->adjncy);CHKERRQ(ierr); 284da1bb401SStefano Zampini if(copymode == PETSC_COPY_VALUES) { 285da1bb401SStefano Zampini ierr = PetscMalloc((mat_graph->nvtxs+1)*sizeof(PetscInt),&mat_graph->xadj);CHKERRQ(ierr); 286da1bb401SStefano Zampini ierr = PetscMalloc(xadj[mat_graph->nvtxs]*sizeof(PetscInt),&mat_graph->adjncy);CHKERRQ(ierr); 287da1bb401SStefano Zampini ierr = PetscMemcpy(mat_graph->xadj,xadj,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr); 288da1bb401SStefano Zampini ierr = PetscMemcpy(mat_graph->adjncy,adjncy,xadj[mat_graph->nvtxs]*sizeof(PetscInt));CHKERRQ(ierr); 289da1bb401SStefano Zampini } else if(copymode == PETSC_OWN_POINTER) { 290da1bb401SStefano Zampini mat_graph->xadj=xadj; 291da1bb401SStefano Zampini mat_graph->adjncy=adjncy; 292da1bb401SStefano Zampini } else { 293da1bb401SStefano Zampini SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_SUP,"Unsupported copy mode %d in %s\n",copymode,__FUNCT__); 294da1bb401SStefano Zampini } 29536e030ebSStefano Zampini PetscFunctionReturn(0); 29636e030ebSStefano Zampini } 29736e030ebSStefano Zampini EXTERN_C_END 29836e030ebSStefano Zampini #undef __FUNCT__ 299da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetLocalAdjacencyGraph" 30036e030ebSStefano Zampini /*@ 301da1bb401SStefano Zampini PCBDDCSetLocalAdjacencyGraph - Set CSR graph of local matrix for use of PCBDDC. 30236e030ebSStefano Zampini 30336e030ebSStefano Zampini Not collective 30436e030ebSStefano Zampini 30536e030ebSStefano Zampini Input Parameters: 30636e030ebSStefano Zampini + pc - the preconditioning context 307da1bb401SStefano Zampini - nvtxs - number of local vertices of the graph 308da1bb401SStefano Zampini - xadj, adjncy - the CSR graph 309da1bb401SStefano Zampini - copymode - either PETSC_COPY_VALUES or PETSC_OWN_POINTER. In the former case the user must free the array passed in; 310da1bb401SStefano Zampini in the latter case, memory must be obtained with PetscMalloc. 31136e030ebSStefano Zampini 31236e030ebSStefano Zampini Level: intermediate 31336e030ebSStefano Zampini 31436e030ebSStefano Zampini Notes: 31536e030ebSStefano Zampini 31636e030ebSStefano Zampini .seealso: PCBDDC 31736e030ebSStefano Zampini @*/ 318da1bb401SStefano Zampini PetscErrorCode PCBDDCSetLocalAdjacencyGraph(PC pc,PetscInt nvtxs,PetscInt xadj[],PetscInt adjncy[], PetscCopyMode copymode) 31936e030ebSStefano Zampini { 320da1bb401SStefano Zampini PetscInt nrows,ncols; 321da1bb401SStefano Zampini Mat_IS *matis = (Mat_IS*)pc->pmat->data; 32236e030ebSStefano Zampini PetscErrorCode ierr; 32336e030ebSStefano Zampini 32436e030ebSStefano Zampini PetscFunctionBegin; 32536e030ebSStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 326da1bb401SStefano Zampini ierr = MatGetSize(matis->A,&nrows,&ncols);CHKERRQ(ierr); 327da1bb401SStefano Zampini if(nvtxs != nrows) { 328da1bb401SStefano Zampini SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Local adjacency size %d passed in %s differs from local problem size %d!\n",nvtxs,__FUNCT__,nrows); 329da1bb401SStefano Zampini } else { 330da1bb401SStefano Zampini ierr = PetscTryMethod(pc,"PCBDDCSetLocalAdjacencyGraph_C",(PC,PetscInt,PetscInt[],PetscInt[],PetscCopyMode),(pc,nvtxs,xadj,adjncy,copymode));CHKERRQ(ierr); 331da1bb401SStefano Zampini } 33236e030ebSStefano Zampini PetscFunctionReturn(0); 33336e030ebSStefano Zampini } 3349c0446d6SStefano Zampini /* -------------------------------------------------------------------------- */ 3359c0446d6SStefano Zampini EXTERN_C_BEGIN 3369c0446d6SStefano Zampini #undef __FUNCT__ 3379c0446d6SStefano Zampini #define __FUNCT__ "PCBDDCSetDofsSplitting_BDDC" 3389c0446d6SStefano Zampini static PetscErrorCode PCBDDCSetDofsSplitting_BDDC(PC pc,PetscInt n_is, IS ISForDofs[]) 3399c0446d6SStefano Zampini { 3409c0446d6SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 3419c0446d6SStefano Zampini PetscInt i; 3429c0446d6SStefano Zampini PetscErrorCode ierr; 3439c0446d6SStefano Zampini 3449c0446d6SStefano Zampini PetscFunctionBegin; 345da1bb401SStefano Zampini /* Destroy ISes if they were already set */ 3469c0446d6SStefano Zampini for(i=0;i<pcbddc->n_ISForDofs;i++) { 3479c0446d6SStefano Zampini ierr = ISDestroy(&pcbddc->ISForDofs[i]);CHKERRQ(ierr); 3489c0446d6SStefano Zampini } 349d11ae9bbSstefano_zampini ierr = PetscFree(pcbddc->ISForDofs);CHKERRQ(ierr); 350da1bb401SStefano Zampini /* allocate space then set */ 3519c0446d6SStefano Zampini ierr = PetscMalloc(n_is*sizeof(IS),&pcbddc->ISForDofs);CHKERRQ(ierr); 3529c0446d6SStefano Zampini for(i=0;i<n_is;i++) { 353da1bb401SStefano Zampini ierr = PetscObjectReference((PetscObject)ISForDofs[i]);CHKERRQ(ierr); 354da1bb401SStefano Zampini pcbddc->ISForDofs[i]=ISForDofs[i]; 3559c0446d6SStefano Zampini } 3569c0446d6SStefano Zampini pcbddc->n_ISForDofs=n_is; 3579c0446d6SStefano Zampini PetscFunctionReturn(0); 3589c0446d6SStefano Zampini } 3599c0446d6SStefano Zampini EXTERN_C_END 3609c0446d6SStefano Zampini #undef __FUNCT__ 3619c0446d6SStefano Zampini #define __FUNCT__ "PCBDDCSetDofsSplitting" 3629c0446d6SStefano Zampini /*@ 363da1bb401SStefano Zampini PCBDDCSetDofsSplitting - Set index sets defining fields of local mat. 3649c0446d6SStefano Zampini 3659c0446d6SStefano Zampini Not collective 3669c0446d6SStefano Zampini 3679c0446d6SStefano Zampini Input Parameters: 3689c0446d6SStefano Zampini + pc - the preconditioning context 369da1bb401SStefano Zampini - n - number of index sets defining the fields 370da1bb401SStefano Zampini - IS[] - array of IS describing the fields 3719c0446d6SStefano Zampini 3729c0446d6SStefano Zampini Level: intermediate 3739c0446d6SStefano Zampini 3749c0446d6SStefano Zampini Notes: 3759c0446d6SStefano Zampini 3769c0446d6SStefano Zampini .seealso: PCBDDC 3779c0446d6SStefano Zampini @*/ 3789c0446d6SStefano Zampini PetscErrorCode PCBDDCSetDofsSplitting(PC pc,PetscInt n_is, IS ISForDofs[]) 3799c0446d6SStefano Zampini { 3809c0446d6SStefano Zampini PetscErrorCode ierr; 3819c0446d6SStefano Zampini 3829c0446d6SStefano Zampini PetscFunctionBegin; 3839c0446d6SStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 3849c0446d6SStefano Zampini ierr = PetscTryMethod(pc,"PCBDDCSetDofsSplitting_C",(PC,PetscInt,IS[]),(pc,n_is,ISForDofs));CHKERRQ(ierr); 3859c0446d6SStefano Zampini PetscFunctionReturn(0); 3869c0446d6SStefano Zampini } 387da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */ 388534831adSStefano Zampini #undef __FUNCT__ 389534831adSStefano Zampini #define __FUNCT__ "PCPreSolve_BDDC" 390534831adSStefano Zampini /* -------------------------------------------------------------------------- */ 391534831adSStefano Zampini /* 392534831adSStefano Zampini PCPreSolve_BDDC - Changes the right hand side and (if necessary) the initial 393534831adSStefano Zampini guess if a transformation of basis approach has been selected. 3949c0446d6SStefano Zampini 395534831adSStefano Zampini Input Parameter: 396534831adSStefano Zampini + pc - the preconditioner contex 397534831adSStefano Zampini 398534831adSStefano Zampini Application Interface Routine: PCPreSolve() 399534831adSStefano Zampini 400534831adSStefano Zampini Notes: 401534831adSStefano Zampini The interface routine PCPreSolve() is not usually called directly by 402534831adSStefano Zampini the user, but instead is called by KSPSolve(). 403534831adSStefano Zampini */ 404534831adSStefano Zampini static PetscErrorCode PCPreSolve_BDDC(PC pc, KSP ksp, Vec rhs, Vec x) 405534831adSStefano Zampini { 406534831adSStefano Zampini PetscErrorCode ierr; 407534831adSStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 408534831adSStefano Zampini PC_IS *pcis = (PC_IS*)(pc->data); 409534831adSStefano Zampini Mat_IS *matis = (Mat_IS*)pc->pmat->data; 410534831adSStefano Zampini Mat temp_mat; 411534831adSStefano Zampini 412534831adSStefano Zampini PetscFunctionBegin; 413534831adSStefano Zampini if(pcbddc->usechangeofbasis) { 414534831adSStefano Zampini /* swap pointers for local matrices */ 415534831adSStefano Zampini temp_mat = matis->A; 416534831adSStefano Zampini matis->A = pcbddc->local_mat; 417534831adSStefano Zampini pcbddc->local_mat = temp_mat; 418534831adSStefano Zampini /* store the original rhs */ 419534831adSStefano Zampini ierr = VecCopy(rhs,pcbddc->original_rhs);CHKERRQ(ierr); 420534831adSStefano Zampini /* Get local rhs and apply transformation of basis */ 421534831adSStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,rhs,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 422534831adSStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,rhs,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 423534831adSStefano Zampini /* from original basis to modified basis */ 424534831adSStefano Zampini ierr = MatMultTranspose(pcbddc->ChangeOfBasisMatrix,pcis->vec1_B,pcis->vec2_B);CHKERRQ(ierr); 425534831adSStefano Zampini /* put back modified values into the global vec using INSERT_VALUES copy mode */ 426534831adSStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,pcis->vec2_B,rhs,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 427534831adSStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,pcis->vec2_B,rhs,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 428534831adSStefano Zampini } 429534831adSStefano Zampini PetscFunctionReturn(0); 430534831adSStefano Zampini } 431534831adSStefano Zampini /* -------------------------------------------------------------------------- */ 432534831adSStefano Zampini #undef __FUNCT__ 433534831adSStefano Zampini #define __FUNCT__ "PCPostSolve_BDDC" 434534831adSStefano Zampini /* -------------------------------------------------------------------------- */ 435534831adSStefano Zampini /* 436534831adSStefano Zampini PCPostSolve_BDDC - Changes the computed solution if a transformation of basis 437534831adSStefano Zampini approach has been selected. Also, restores rhs to its original state. 438534831adSStefano Zampini 439534831adSStefano Zampini Input Parameter: 440534831adSStefano Zampini + pc - the preconditioner contex 441534831adSStefano Zampini 442534831adSStefano Zampini Application Interface Routine: PCPostSolve() 443534831adSStefano Zampini 444534831adSStefano Zampini Notes: 445534831adSStefano Zampini The interface routine PCPostSolve() is not usually called directly by 446534831adSStefano Zampini the user, but instead is called by KSPSolve(). 447534831adSStefano Zampini */ 448534831adSStefano Zampini static PetscErrorCode PCPostSolve_BDDC(PC pc, KSP ksp, Vec rhs, Vec x) 449534831adSStefano Zampini { 450534831adSStefano Zampini PetscErrorCode ierr; 451534831adSStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 452534831adSStefano Zampini PC_IS *pcis = (PC_IS*)(pc->data); 453534831adSStefano Zampini Mat_IS *matis = (Mat_IS*)pc->pmat->data; 454534831adSStefano Zampini Mat temp_mat; 455534831adSStefano Zampini 456534831adSStefano Zampini PetscFunctionBegin; 457534831adSStefano Zampini if(pcbddc->usechangeofbasis) { 458534831adSStefano Zampini /* swap pointers for local matrices */ 459534831adSStefano Zampini temp_mat = matis->A; 460534831adSStefano Zampini matis->A = pcbddc->local_mat; 461534831adSStefano Zampini pcbddc->local_mat = temp_mat; 462534831adSStefano Zampini /* restore rhs to its original state */ 463534831adSStefano Zampini ierr = VecCopy(pcbddc->original_rhs,rhs);CHKERRQ(ierr); 464534831adSStefano Zampini /* Get Local boundary and apply transformation of basis to solution vector */ 465534831adSStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,x,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 466534831adSStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,x,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 467534831adSStefano Zampini /* from modified basis to original basis */ 468534831adSStefano Zampini ierr = MatMult(pcbddc->ChangeOfBasisMatrix,pcis->vec1_B,pcis->vec2_B);CHKERRQ(ierr); 469534831adSStefano Zampini /* put back modified values into the global vec using INSERT_VALUES copy mode */ 470534831adSStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,pcis->vec2_B,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 471534831adSStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,pcis->vec2_B,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 472534831adSStefano Zampini } 473534831adSStefano Zampini PetscFunctionReturn(0); 474534831adSStefano Zampini } 475534831adSStefano Zampini /* -------------------------------------------------------------------------- */ 47653cdbc3dSStefano Zampini #undef __FUNCT__ 47753cdbc3dSStefano Zampini #define __FUNCT__ "PCSetUp_BDDC" 4780c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 4790c7d97c5SJed Brown /* 4800c7d97c5SJed Brown PCSetUp_BDDC - Prepares for the use of the BDDC preconditioner 4810c7d97c5SJed Brown by setting data structures and options. 4820c7d97c5SJed Brown 4830c7d97c5SJed Brown Input Parameter: 48453cdbc3dSStefano Zampini + pc - the preconditioner context 4850c7d97c5SJed Brown 4860c7d97c5SJed Brown Application Interface Routine: PCSetUp() 4870c7d97c5SJed Brown 4880c7d97c5SJed Brown Notes: 4890c7d97c5SJed Brown The interface routine PCSetUp() is not usually called directly by 4900c7d97c5SJed Brown the user, but instead is called by PCApply() if necessary. 4910c7d97c5SJed Brown */ 49253cdbc3dSStefano Zampini PetscErrorCode PCSetUp_BDDC(PC pc) 4930c7d97c5SJed Brown { 4940c7d97c5SJed Brown PetscErrorCode ierr; 4950c7d97c5SJed Brown PC_BDDC* pcbddc = (PC_BDDC*)pc->data; 4960c7d97c5SJed Brown PC_IS *pcis = (PC_IS*)(pc->data); 4970c7d97c5SJed Brown 4980c7d97c5SJed Brown PetscFunctionBegin; 4990c7d97c5SJed Brown if (!pc->setupcalled) { 5003b03a366Sstefano_zampini /* For BDDC we need to define a local "Neumann" problem different to that defined in PCISSetup 5019c0446d6SStefano Zampini So, we set to pcnone the Neumann problem of pcis in order to avoid unneeded computation 5020c7d97c5SJed Brown Also, we decide to directly build the (same) Dirichlet problem */ 5030c7d97c5SJed Brown ierr = PetscOptionsSetValue("-is_localN_pc_type","none");CHKERRQ(ierr); 5040c7d97c5SJed Brown ierr = PetscOptionsSetValue("-is_localD_pc_type","none");CHKERRQ(ierr); 5050c7d97c5SJed Brown /* Set up all the "iterative substructuring" common block */ 5060c7d97c5SJed Brown ierr = PCISSetUp(pc);CHKERRQ(ierr); 5073b03a366Sstefano_zampini /* Get stdout for dbg */ 508e269702eSStefano Zampini if(pcbddc->dbg_flag) { 509e269702eSStefano Zampini ierr = PetscViewerASCIIGetStdout(((PetscObject)pc)->comm,&pcbddc->dbg_viewer);CHKERRQ(ierr); 510e269702eSStefano Zampini ierr = PetscViewerASCIISynchronizedAllow(pcbddc->dbg_viewer,PETSC_TRUE);CHKERRQ(ierr); 511e269702eSStefano Zampini } 5123b03a366Sstefano_zampini /* TODO MOVE CODE FRAGMENT */ 5130c7d97c5SJed Brown PetscInt im_active=0; 5140c7d97c5SJed Brown if(pcis->n) im_active = 1; 51553cdbc3dSStefano Zampini ierr = MPI_Allreduce(&im_active,&pcbddc->active_procs,1,MPIU_INT,MPI_SUM,((PetscObject)pc)->comm);CHKERRQ(ierr); 5163b03a366Sstefano_zampini /* Analyze local interface */ 5170c7d97c5SJed Brown ierr = PCBDDCManageLocalBoundaries(pc);CHKERRQ(ierr); 5183b03a366Sstefano_zampini /* Set up local constraint matrix */ 5193b03a366Sstefano_zampini ierr = PCBDDCCreateConstraintMatrix(pc);CHKERRQ(ierr); 5200c7d97c5SJed Brown /* Create coarse and local stuffs used for evaluating action of preconditioner */ 5210c7d97c5SJed Brown ierr = PCBDDCCoarseSetUp(pc);CHKERRQ(ierr); 5223b03a366Sstefano_zampini /* Processes fakely involved in multilevel should not call ISLocalToGlobalMappingRestoreInfo */ 5233b03a366Sstefano_zampini if ( !pcis->n_neigh ) pcis->ISLocalToGlobalMappingGetInfoWasCalled=PETSC_FALSE; 5240c7d97c5SJed Brown } 5250c7d97c5SJed Brown PetscFunctionReturn(0); 5260c7d97c5SJed Brown } 5270c7d97c5SJed Brown 5280c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 5290c7d97c5SJed Brown /* 5300c7d97c5SJed Brown PCApply_BDDC - Applies the BDDC preconditioner to a vector. 5310c7d97c5SJed Brown 5320c7d97c5SJed Brown Input Parameters: 5330c7d97c5SJed Brown . pc - the preconditioner context 5340c7d97c5SJed Brown . r - input vector (global) 5350c7d97c5SJed Brown 5360c7d97c5SJed Brown Output Parameter: 5370c7d97c5SJed Brown . z - output vector (global) 5380c7d97c5SJed Brown 5390c7d97c5SJed Brown Application Interface Routine: PCApply() 5400c7d97c5SJed Brown */ 5410c7d97c5SJed Brown #undef __FUNCT__ 5420c7d97c5SJed Brown #define __FUNCT__ "PCApply_BDDC" 54353cdbc3dSStefano Zampini PetscErrorCode PCApply_BDDC(PC pc,Vec r,Vec z) 5440c7d97c5SJed Brown { 5450c7d97c5SJed Brown PC_IS *pcis = (PC_IS*)(pc->data); 5460c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)(pc->data); 5470c7d97c5SJed Brown PetscErrorCode ierr; 5483b03a366Sstefano_zampini const PetscScalar one = 1.0; 5493b03a366Sstefano_zampini const PetscScalar m_one = -1.0; 5502617d88aSStefano Zampini const PetscScalar zero = 0.0; 5510c7d97c5SJed Brown 5520c7d97c5SJed Brown /* This code is similar to that provided in nn.c for PCNN 5530c7d97c5SJed Brown NN interface preconditioner changed to BDDC 5540c7d97c5SJed Brown Added support for M_3 preconditioenr in the reference article (code is active if pcbddc->prec_type = PETSC_TRUE) */ 5550c7d97c5SJed Brown 5560c7d97c5SJed Brown PetscFunctionBegin; 5570c7d97c5SJed Brown /* First Dirichlet solve */ 5580c7d97c5SJed Brown ierr = VecScatterBegin(pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 5590c7d97c5SJed Brown ierr = VecScatterEnd (pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 56053cdbc3dSStefano Zampini ierr = KSPSolve(pcbddc->ksp_D,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr); 5610c7d97c5SJed Brown /* 5620c7d97c5SJed Brown Assembling right hand side for BDDC operator 5630c7d97c5SJed Brown - vec1_D for the Dirichlet part (if needed, i.e. prec_flag=PETSC_TRUE) 5640c7d97c5SJed Brown - the interface part of the global vector z 5650c7d97c5SJed Brown */ 5660c7d97c5SJed Brown ierr = VecScale(pcis->vec2_D,m_one);CHKERRQ(ierr); 5670c7d97c5SJed Brown ierr = MatMult(pcis->A_BI,pcis->vec2_D,pcis->vec1_B);CHKERRQ(ierr); 5680c7d97c5SJed Brown if(pcbddc->prec_type) { ierr = MatMultAdd(pcis->A_II,pcis->vec2_D,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); } 5690c7d97c5SJed Brown ierr = VecScale(pcis->vec2_D,m_one);CHKERRQ(ierr); 5700c7d97c5SJed Brown ierr = VecCopy(r,z);CHKERRQ(ierr); 5710c7d97c5SJed Brown ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 5720c7d97c5SJed Brown ierr = VecScatterEnd (pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 5730c7d97c5SJed Brown 5742617d88aSStefano Zampini /* Get Local boundary and apply partition of unity */ 5752617d88aSStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 5762617d88aSStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 5772617d88aSStefano Zampini ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr); 5782617d88aSStefano Zampini 5792617d88aSStefano Zampini /* Apply interface preconditioner 5802617d88aSStefano Zampini input/output vecs: pcis->vec1_B and pcis->vec1_D */ 5812617d88aSStefano Zampini ierr = PCBDDCApplyInterfacePreconditioner(pc);CHKERRQ(ierr); 5822617d88aSStefano Zampini 5832617d88aSStefano Zampini /* Apply partition of unity and sum boundary values */ 5842617d88aSStefano Zampini ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr); 5852617d88aSStefano Zampini ierr = VecSet(z,zero);CHKERRQ(ierr); 5862617d88aSStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 5872617d88aSStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 5880c7d97c5SJed Brown 5893b03a366Sstefano_zampini /* Second Dirichlet solve and assembling of output */ 5900c7d97c5SJed Brown ierr = VecScatterBegin(pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 5910c7d97c5SJed Brown ierr = VecScatterEnd (pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 5920c7d97c5SJed Brown ierr = MatMult(pcis->A_IB,pcis->vec1_B,pcis->vec3_D);CHKERRQ(ierr); 5930c7d97c5SJed Brown if(pcbddc->prec_type) { ierr = MatMultAdd(pcis->A_II,pcis->vec1_D,pcis->vec3_D,pcis->vec3_D);CHKERRQ(ierr); } 59453cdbc3dSStefano Zampini ierr = KSPSolve(pcbddc->ksp_D,pcis->vec3_D,pcbddc->vec4_D);CHKERRQ(ierr); 5950c7d97c5SJed Brown ierr = VecScale(pcbddc->vec4_D,m_one);CHKERRQ(ierr); 5960c7d97c5SJed Brown if(pcbddc->prec_type) { ierr = VecAXPY (pcbddc->vec4_D,one,pcis->vec1_D);CHKERRQ(ierr); } 5970c7d97c5SJed Brown ierr = VecAXPY (pcis->vec2_D,one,pcbddc->vec4_D);CHKERRQ(ierr); 5980c7d97c5SJed Brown ierr = VecScatterBegin(pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 5990c7d97c5SJed Brown ierr = VecScatterEnd (pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 6000c7d97c5SJed Brown 6010c7d97c5SJed Brown PetscFunctionReturn(0); 6020c7d97c5SJed Brown 6030c7d97c5SJed Brown } 604da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */ 605da1bb401SStefano Zampini #undef __FUNCT__ 606da1bb401SStefano Zampini #define __FUNCT__ "PCDestroy_BDDC" 607da1bb401SStefano Zampini PetscErrorCode PCDestroy_BDDC(PC pc) 608da1bb401SStefano Zampini { 609da1bb401SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 610da1bb401SStefano Zampini PetscErrorCode ierr; 611da1bb401SStefano Zampini 612da1bb401SStefano Zampini PetscFunctionBegin; 613da1bb401SStefano Zampini /* free data created by PCIS */ 614da1bb401SStefano Zampini ierr = PCISDestroy(pc);CHKERRQ(ierr); 615da1bb401SStefano Zampini /* free BDDC data */ 616534831adSStefano Zampini ierr = VecDestroy(&pcbddc->original_rhs);CHKERRQ(ierr); 617534831adSStefano Zampini ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr); 618534831adSStefano Zampini ierr = MatDestroy(&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr); 619da1bb401SStefano Zampini ierr = VecDestroy(&pcbddc->coarse_vec);CHKERRQ(ierr); 620da1bb401SStefano Zampini ierr = VecDestroy(&pcbddc->coarse_rhs);CHKERRQ(ierr); 621da1bb401SStefano Zampini ierr = KSPDestroy(&pcbddc->coarse_ksp);CHKERRQ(ierr); 622da1bb401SStefano Zampini ierr = MatDestroy(&pcbddc->coarse_mat);CHKERRQ(ierr); 623da1bb401SStefano Zampini ierr = MatDestroy(&pcbddc->coarse_phi_B);CHKERRQ(ierr); 624da1bb401SStefano Zampini ierr = MatDestroy(&pcbddc->coarse_phi_D);CHKERRQ(ierr); 625da1bb401SStefano Zampini ierr = VecDestroy(&pcbddc->vec1_P);CHKERRQ(ierr); 626da1bb401SStefano Zampini ierr = VecDestroy(&pcbddc->vec1_C);CHKERRQ(ierr); 627da1bb401SStefano Zampini ierr = MatDestroy(&pcbddc->local_auxmat1);CHKERRQ(ierr); 628da1bb401SStefano Zampini ierr = MatDestroy(&pcbddc->local_auxmat2);CHKERRQ(ierr); 629da1bb401SStefano Zampini ierr = VecDestroy(&pcbddc->vec1_R);CHKERRQ(ierr); 630da1bb401SStefano Zampini ierr = VecDestroy(&pcbddc->vec2_R);CHKERRQ(ierr); 631da1bb401SStefano Zampini ierr = VecDestroy(&pcbddc->vec4_D);CHKERRQ(ierr); 632da1bb401SStefano Zampini ierr = VecScatterDestroy(&pcbddc->R_to_B);CHKERRQ(ierr); 633da1bb401SStefano Zampini ierr = VecScatterDestroy(&pcbddc->R_to_D);CHKERRQ(ierr); 634da1bb401SStefano Zampini ierr = VecScatterDestroy(&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr); 635da1bb401SStefano Zampini ierr = KSPDestroy(&pcbddc->ksp_D);CHKERRQ(ierr); 636da1bb401SStefano Zampini ierr = KSPDestroy(&pcbddc->ksp_R);CHKERRQ(ierr); 637da1bb401SStefano Zampini ierr = ISDestroy(&pcbddc->NeumannBoundaries);CHKERRQ(ierr); 638da1bb401SStefano Zampini ierr = ISDestroy(&pcbddc->DirichletBoundaries);CHKERRQ(ierr); 639da1bb401SStefano Zampini ierr = MatDestroy(&pcbddc->ConstraintMatrix);CHKERRQ(ierr); 640da1bb401SStefano Zampini ierr = PetscFree(pcbddc->local_primal_indices);CHKERRQ(ierr); 641da1bb401SStefano Zampini ierr = PetscFree(pcbddc->replicated_local_primal_indices);CHKERRQ(ierr); 642da1bb401SStefano Zampini if (pcbddc->replicated_local_primal_values) { free(pcbddc->replicated_local_primal_values); } 643da1bb401SStefano Zampini ierr = PetscFree(pcbddc->local_primal_displacements);CHKERRQ(ierr); 644da1bb401SStefano Zampini ierr = PetscFree(pcbddc->local_primal_sizes);CHKERRQ(ierr); 645da1bb401SStefano Zampini PetscInt i; 646da1bb401SStefano Zampini for(i=0;i<pcbddc->n_ISForDofs;i++) { ierr = ISDestroy(&pcbddc->ISForDofs[i]);CHKERRQ(ierr); } 647da1bb401SStefano Zampini ierr = PetscFree(pcbddc->ISForDofs);CHKERRQ(ierr); 648da1bb401SStefano Zampini for(i=0;i<pcbddc->n_ISForFaces;i++) { ierr = ISDestroy(&pcbddc->ISForFaces[i]);CHKERRQ(ierr); } 649da1bb401SStefano Zampini ierr = PetscFree(pcbddc->ISForFaces);CHKERRQ(ierr); 650da1bb401SStefano Zampini for(i=0;i<pcbddc->n_ISForEdges;i++) { ierr = ISDestroy(&pcbddc->ISForEdges[i]);CHKERRQ(ierr); } 651da1bb401SStefano Zampini ierr = PetscFree(pcbddc->ISForEdges);CHKERRQ(ierr); 652da1bb401SStefano Zampini ierr = ISDestroy(&pcbddc->ISForVertices);CHKERRQ(ierr); 653da1bb401SStefano Zampini ierr = PetscFree(pcbddc->mat_graph->xadj);CHKERRQ(ierr); 654da1bb401SStefano Zampini ierr = PetscFree(pcbddc->mat_graph->adjncy);CHKERRQ(ierr); 655da1bb401SStefano Zampini ierr = PetscFree(pcbddc->mat_graph->neighbours_set[0]);CHKERRQ(ierr); 656da1bb401SStefano Zampini ierr = PetscFree(pcbddc->mat_graph->neighbours_set);CHKERRQ(ierr); 657da1bb401SStefano Zampini ierr = PetscFree(pcbddc->mat_graph);CHKERRQ(ierr); 658da1bb401SStefano Zampini /* Free the private data structure that was hanging off the PC */ 659da1bb401SStefano Zampini ierr = PetscFree(pcbddc);CHKERRQ(ierr); 660da1bb401SStefano Zampini PetscFunctionReturn(0); 661da1bb401SStefano Zampini } 6620c7d97c5SJed Brown 6630c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 664da1bb401SStefano Zampini /*MC 665da1bb401SStefano Zampini PCBDDC - Balancing Domain Decomposition by Constraints. 6660c7d97c5SJed Brown 667da1bb401SStefano Zampini Options Database Keys: 668da1bb401SStefano Zampini . -pcbddc ??? - 669da1bb401SStefano Zampini 670da1bb401SStefano Zampini Level: intermediate 671da1bb401SStefano Zampini 672da1bb401SStefano Zampini Notes: The matrix used with this preconditioner must be of type MATIS 673da1bb401SStefano Zampini 674da1bb401SStefano Zampini Unlike more 'conventional' interface preconditioners, this iterates over ALL the 675da1bb401SStefano Zampini degrees of freedom, NOT just those on the interface (this allows the use of approximate solvers 676da1bb401SStefano Zampini on the subdomains). 677da1bb401SStefano Zampini 678da1bb401SStefano Zampini Options for the coarse grid preconditioner can be set with - 679da1bb401SStefano Zampini Options for the Dirichlet subproblem can be set with - 680da1bb401SStefano Zampini Options for the Neumann subproblem can be set with - 681da1bb401SStefano Zampini 682da1bb401SStefano Zampini Contributed by Stefano Zampini 683da1bb401SStefano Zampini 684da1bb401SStefano Zampini .seealso: PCCreate(), PCSetType(), PCType (for list of available types), PC, MATIS 685da1bb401SStefano Zampini M*/ 686da1bb401SStefano Zampini EXTERN_C_BEGIN 687da1bb401SStefano Zampini #undef __FUNCT__ 688da1bb401SStefano Zampini #define __FUNCT__ "PCCreate_BDDC" 689da1bb401SStefano Zampini PetscErrorCode PCCreate_BDDC(PC pc) 690da1bb401SStefano Zampini { 691da1bb401SStefano Zampini PetscErrorCode ierr; 692da1bb401SStefano Zampini PC_BDDC *pcbddc; 693da1bb401SStefano Zampini PCBDDCGraph mat_graph; 694da1bb401SStefano Zampini 695da1bb401SStefano Zampini PetscFunctionBegin; 696da1bb401SStefano Zampini /* Creates the private data structure for this preconditioner and attach it to the PC object. */ 697da1bb401SStefano Zampini ierr = PetscNewLog(pc,PC_BDDC,&pcbddc);CHKERRQ(ierr); 698da1bb401SStefano Zampini pc->data = (void*)pcbddc; 699da1bb401SStefano Zampini 700da1bb401SStefano Zampini /* create PCIS data structure */ 701da1bb401SStefano Zampini ierr = PCISCreate(pc);CHKERRQ(ierr); 702da1bb401SStefano Zampini 703da1bb401SStefano Zampini /* BDDC specific */ 704534831adSStefano Zampini pcbddc->original_rhs = 0; 705534831adSStefano Zampini pcbddc->local_mat = 0; 706534831adSStefano Zampini pcbddc->ChangeOfBasisMatrix = 0; 707534831adSStefano Zampini pcbddc->usechangeofbasis = PETSC_TRUE; 708534831adSStefano Zampini pcbddc->usechangeonfaces = PETSC_FALSE; 709da1bb401SStefano Zampini pcbddc->coarse_vec = 0; 710da1bb401SStefano Zampini pcbddc->coarse_rhs = 0; 711da1bb401SStefano Zampini pcbddc->coarse_ksp = 0; 712da1bb401SStefano Zampini pcbddc->coarse_phi_B = 0; 713da1bb401SStefano Zampini pcbddc->coarse_phi_D = 0; 714da1bb401SStefano Zampini pcbddc->vec1_P = 0; 715da1bb401SStefano Zampini pcbddc->vec1_R = 0; 716da1bb401SStefano Zampini pcbddc->vec2_R = 0; 717da1bb401SStefano Zampini pcbddc->local_auxmat1 = 0; 718da1bb401SStefano Zampini pcbddc->local_auxmat2 = 0; 719da1bb401SStefano Zampini pcbddc->R_to_B = 0; 720da1bb401SStefano Zampini pcbddc->R_to_D = 0; 721da1bb401SStefano Zampini pcbddc->ksp_D = 0; 722da1bb401SStefano Zampini pcbddc->ksp_R = 0; 723da1bb401SStefano Zampini pcbddc->local_primal_indices = 0; 724da1bb401SStefano Zampini pcbddc->prec_type = PETSC_FALSE; 725da1bb401SStefano Zampini pcbddc->NeumannBoundaries = 0; 726da1bb401SStefano Zampini pcbddc->ISForDofs = 0; 727da1bb401SStefano Zampini pcbddc->ISForVertices = 0; 728da1bb401SStefano Zampini pcbddc->n_ISForFaces = 0; 729da1bb401SStefano Zampini pcbddc->n_ISForEdges = 0; 730da1bb401SStefano Zampini pcbddc->ConstraintMatrix = 0; 731da1bb401SStefano Zampini pcbddc->use_nnsp_true = PETSC_FALSE; 732da1bb401SStefano Zampini pcbddc->local_primal_sizes = 0; 733da1bb401SStefano Zampini pcbddc->local_primal_displacements = 0; 734da1bb401SStefano Zampini pcbddc->replicated_local_primal_indices = 0; 735da1bb401SStefano Zampini pcbddc->replicated_local_primal_values = 0; 736da1bb401SStefano Zampini pcbddc->coarse_loc_to_glob = 0; 737da1bb401SStefano Zampini pcbddc->dbg_flag = PETSC_FALSE; 738da1bb401SStefano Zampini pcbddc->coarsening_ratio = 8; 739da1bb401SStefano Zampini 740da1bb401SStefano Zampini /* allocate and initialize needed graph structure */ 741da1bb401SStefano Zampini ierr = PetscMalloc(sizeof(*mat_graph),&pcbddc->mat_graph);CHKERRQ(ierr); 742da1bb401SStefano Zampini pcbddc->mat_graph->xadj = 0; 743da1bb401SStefano Zampini pcbddc->mat_graph->adjncy = 0; 744da1bb401SStefano Zampini 745da1bb401SStefano Zampini /* function pointers */ 746da1bb401SStefano Zampini pc->ops->apply = PCApply_BDDC; 747da1bb401SStefano Zampini pc->ops->applytranspose = 0; 748da1bb401SStefano Zampini pc->ops->setup = PCSetUp_BDDC; 749da1bb401SStefano Zampini pc->ops->destroy = PCDestroy_BDDC; 750da1bb401SStefano Zampini pc->ops->setfromoptions = PCSetFromOptions_BDDC; 751da1bb401SStefano Zampini pc->ops->view = 0; 752da1bb401SStefano Zampini pc->ops->applyrichardson = 0; 753da1bb401SStefano Zampini pc->ops->applysymmetricleft = 0; 754da1bb401SStefano Zampini pc->ops->applysymmetricright = 0; 755534831adSStefano Zampini pc->ops->presolve = PCPreSolve_BDDC; 756534831adSStefano Zampini pc->ops->postsolve = PCPostSolve_BDDC; 757da1bb401SStefano Zampini 758da1bb401SStefano Zampini /* composing function */ 759da1bb401SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDirichletBoundaries_C","PCBDDCSetDirichletBoundaries_BDDC", 760da1bb401SStefano Zampini PCBDDCSetDirichletBoundaries_BDDC);CHKERRQ(ierr); 761da1bb401SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNeumannBoundaries_C","PCBDDCSetNeumannBoundaries_BDDC", 762da1bb401SStefano Zampini PCBDDCSetNeumannBoundaries_BDDC);CHKERRQ(ierr); 763da1bb401SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetDirichletBoundaries_C","PCBDDCGetDirichletBoundaries_BDDC", 764da1bb401SStefano Zampini PCBDDCGetDirichletBoundaries_BDDC);CHKERRQ(ierr); 765da1bb401SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetNeumannBoundaries_C","PCBDDCGetNeumannBoundaries_BDDC", 766da1bb401SStefano Zampini PCBDDCGetNeumannBoundaries_BDDC);CHKERRQ(ierr); 767da1bb401SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseProblemType_C","PCBDDCSetCoarseProblemType_BDDC", 768da1bb401SStefano Zampini PCBDDCSetCoarseProblemType_BDDC);CHKERRQ(ierr); 769da1bb401SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDofsSplitting_C","PCBDDCSetDofsSplitting_BDDC", 770da1bb401SStefano Zampini PCBDDCSetDofsSplitting_BDDC);CHKERRQ(ierr); 771da1bb401SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetLocalAdjacencyGraph_C","PCBDDCSetLocalAdjacencyGraph_BDDC", 772da1bb401SStefano Zampini PCBDDCSetLocalAdjacencyGraph_BDDC);CHKERRQ(ierr); 773534831adSStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPreSolve_C","PCPreSolve_BDDC", 774534831adSStefano Zampini PCPreSolve_BDDC);CHKERRQ(ierr); 775534831adSStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPostSolve_C","PCPostSolve_BDDC", 776534831adSStefano Zampini PCPostSolve_BDDC);CHKERRQ(ierr); 777da1bb401SStefano Zampini PetscFunctionReturn(0); 778da1bb401SStefano Zampini } 779da1bb401SStefano Zampini EXTERN_C_END 780da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */ 781da1bb401SStefano Zampini /* All static functions from now on */ 782da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */ 783da1bb401SStefano Zampini #undef __FUNCT__ 784da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetupLocalAdjacencyGraph" 785da1bb401SStefano Zampini static PetscErrorCode PCBDDCSetupLocalAdjacencyGraph(PC pc) 786da1bb401SStefano Zampini { 787da1bb401SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 788da1bb401SStefano Zampini Mat_IS *matis = (Mat_IS*)pc->pmat->data; 789da1bb401SStefano Zampini PetscInt nvtxs,*xadj,*adjncy; 790da1bb401SStefano Zampini Mat mat_adj; 791da1bb401SStefano Zampini PetscBool symmetrize_rowij=PETSC_TRUE,compressed_rowij=PETSC_FALSE,flg_row=PETSC_TRUE; 792da1bb401SStefano Zampini PCBDDCGraph mat_graph=pcbddc->mat_graph; 793da1bb401SStefano Zampini PetscErrorCode ierr; 794da1bb401SStefano Zampini 795da1bb401SStefano Zampini PetscFunctionBegin; 796da1bb401SStefano Zampini /* get CSR adjacency from local matrix if user has not yet provided local graph using PCBDDCSetLocalAdjacencyGraph function */ 797da1bb401SStefano Zampini if(!mat_graph->xadj) { 798da1bb401SStefano Zampini ierr = MatConvert(matis->A,MATMPIADJ,MAT_INITIAL_MATRIX,&mat_adj);CHKERRQ(ierr); 799da1bb401SStefano Zampini ierr = MatGetRowIJ(mat_adj,0,symmetrize_rowij,compressed_rowij,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr); 800da1bb401SStefano Zampini if(!flg_row) { 801da1bb401SStefano Zampini SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in MatGetRowIJ called in %s\n",__FUNCT__); 802da1bb401SStefano Zampini } 803da1bb401SStefano Zampini /* Get adjacency into BDDC workspace */ 804da1bb401SStefano Zampini ierr = PCBDDCSetLocalAdjacencyGraph(pc,nvtxs,xadj,adjncy,PETSC_COPY_VALUES);CHKERRQ(ierr); 805da1bb401SStefano Zampini ierr = MatRestoreRowIJ(mat_adj,0,symmetrize_rowij,compressed_rowij,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr); 806da1bb401SStefano Zampini if(!flg_row) { 807da1bb401SStefano Zampini SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in MatRestoreRowIJ called in %s\n",__FUNCT__); 808da1bb401SStefano Zampini } 809da1bb401SStefano Zampini ierr = MatDestroy(&mat_adj);CHKERRQ(ierr); 810da1bb401SStefano Zampini } 811da1bb401SStefano Zampini PetscFunctionReturn(0); 812da1bb401SStefano Zampini } 813da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */ 8140c7d97c5SJed Brown #undef __FUNCT__ 8150c7d97c5SJed Brown #define __FUNCT__ "PCBDDCApplyInterfacePreconditioner" 8162617d88aSStefano Zampini static PetscErrorCode PCBDDCApplyInterfacePreconditioner(PC pc) 8170c7d97c5SJed Brown { 8180c7d97c5SJed Brown PetscErrorCode ierr; 8190c7d97c5SJed Brown PC_BDDC* pcbddc = (PC_BDDC*)(pc->data); 8200c7d97c5SJed Brown PC_IS* pcis = (PC_IS*) (pc->data); 8213b03a366Sstefano_zampini const PetscScalar zero = 0.0; 8220c7d97c5SJed Brown 8230c7d97c5SJed Brown PetscFunctionBegin; 8240c7d97c5SJed Brown /* Application of PHI^T */ 8250c7d97c5SJed Brown ierr = MatMultTranspose(pcbddc->coarse_phi_B,pcis->vec1_B,pcbddc->vec1_P);CHKERRQ(ierr); 8260c7d97c5SJed Brown if(pcbddc->prec_type) { ierr = MatMultTransposeAdd(pcbddc->coarse_phi_D,pcis->vec1_D,pcbddc->vec1_P,pcbddc->vec1_P);CHKERRQ(ierr); } 8270c7d97c5SJed Brown 8280c7d97c5SJed Brown /* Scatter data of coarse_rhs */ 8290c7d97c5SJed Brown if(pcbddc->coarse_rhs) ierr = VecSet(pcbddc->coarse_rhs,zero);CHKERRQ(ierr); 8300c7d97c5SJed Brown ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->vec1_P,pcbddc->coarse_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8310c7d97c5SJed Brown 8320c7d97c5SJed Brown /* Local solution on R nodes */ 8330c7d97c5SJed Brown ierr = VecSet(pcbddc->vec1_R,zero);CHKERRQ(ierr); 8340c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_B,pcis->vec1_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8350c7d97c5SJed Brown ierr = VecScatterEnd (pcbddc->R_to_B,pcis->vec1_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8360c7d97c5SJed Brown if(pcbddc->prec_type) { 8370c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_D,pcis->vec1_D,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8380c7d97c5SJed Brown ierr = VecScatterEnd (pcbddc->R_to_D,pcis->vec1_D,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8390c7d97c5SJed Brown } 8400c7d97c5SJed Brown ierr = PCBDDCSolveSaddlePoint(pc);CHKERRQ(ierr); 8410c7d97c5SJed Brown ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr); 8420c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec2_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8430c7d97c5SJed Brown ierr = VecScatterEnd (pcbddc->R_to_B,pcbddc->vec2_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8440c7d97c5SJed Brown if(pcbddc->prec_type) { 8450c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec2_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8460c7d97c5SJed Brown ierr = VecScatterEnd (pcbddc->R_to_D,pcbddc->vec2_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8470c7d97c5SJed Brown } 8480c7d97c5SJed Brown 8490c7d97c5SJed Brown /* Coarse solution */ 8500c7d97c5SJed Brown ierr = PCBDDCScatterCoarseDataEnd(pc,pcbddc->vec1_P,pcbddc->coarse_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 85153cdbc3dSStefano Zampini if(pcbddc->coarse_rhs) ierr = KSPSolve(pcbddc->coarse_ksp,pcbddc->coarse_rhs,pcbddc->coarse_vec);CHKERRQ(ierr); 8520c7d97c5SJed Brown ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8530c7d97c5SJed Brown ierr = PCBDDCScatterCoarseDataEnd (pc,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8540c7d97c5SJed Brown 8550c7d97c5SJed Brown /* Sum contributions from two levels */ 8560c7d97c5SJed Brown ierr = MatMultAdd(pcbddc->coarse_phi_B,pcbddc->vec1_P,pcis->vec1_B,pcis->vec1_B);CHKERRQ(ierr); 8570c7d97c5SJed Brown if(pcbddc->prec_type) { ierr = MatMultAdd(pcbddc->coarse_phi_D,pcbddc->vec1_P,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); } 8580c7d97c5SJed Brown PetscFunctionReturn(0); 8590c7d97c5SJed Brown } 8600c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 8610c7d97c5SJed Brown #undef __FUNCT__ 8620c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSolveSaddlePoint" 86353cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSolveSaddlePoint(PC pc) 8640c7d97c5SJed Brown { 8650c7d97c5SJed Brown PetscErrorCode ierr; 8660c7d97c5SJed Brown PC_BDDC* pcbddc = (PC_BDDC*)(pc->data); 8670c7d97c5SJed Brown 8680c7d97c5SJed Brown PetscFunctionBegin; 86953cdbc3dSStefano Zampini ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr); 870534831adSStefano Zampini if(pcbddc->local_auxmat1) { 8710c7d97c5SJed Brown ierr = MatMult(pcbddc->local_auxmat1,pcbddc->vec2_R,pcbddc->vec1_C);CHKERRQ(ierr); 8720c7d97c5SJed Brown ierr = MatMultAdd(pcbddc->local_auxmat2,pcbddc->vec1_C,pcbddc->vec2_R,pcbddc->vec2_R);CHKERRQ(ierr); 8730c7d97c5SJed Brown } 8740c7d97c5SJed Brown PetscFunctionReturn(0); 8750c7d97c5SJed Brown } 8760c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 8770c7d97c5SJed Brown #undef __FUNCT__ 8780c7d97c5SJed Brown #define __FUNCT__ "PCBDDCScatterCoarseDataBegin" 87953cdbc3dSStefano Zampini static PetscErrorCode PCBDDCScatterCoarseDataBegin(PC pc,Vec vec_from, Vec vec_to, InsertMode imode, ScatterMode smode) 8800c7d97c5SJed Brown { 8810c7d97c5SJed Brown PetscErrorCode ierr; 8820c7d97c5SJed Brown PC_BDDC* pcbddc = (PC_BDDC*)(pc->data); 8830c7d97c5SJed Brown 8840c7d97c5SJed Brown PetscFunctionBegin; 8850c7d97c5SJed Brown switch(pcbddc->coarse_communications_type){ 8860c7d97c5SJed Brown case SCATTERS_BDDC: 8870c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->coarse_loc_to_glob,vec_from,vec_to,imode,smode);CHKERRQ(ierr); 8880c7d97c5SJed Brown break; 8890c7d97c5SJed Brown case GATHERS_BDDC: 8900c7d97c5SJed Brown break; 8910c7d97c5SJed Brown } 8920c7d97c5SJed Brown PetscFunctionReturn(0); 8930c7d97c5SJed Brown } 8940c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 8950c7d97c5SJed Brown #undef __FUNCT__ 8960c7d97c5SJed Brown #define __FUNCT__ "PCBDDCScatterCoarseDataEnd" 89753cdbc3dSStefano Zampini static PetscErrorCode PCBDDCScatterCoarseDataEnd(PC pc,Vec vec_from, Vec vec_to, InsertMode imode, ScatterMode smode) 8980c7d97c5SJed Brown { 8990c7d97c5SJed Brown PetscErrorCode ierr; 9000c7d97c5SJed Brown PC_BDDC* pcbddc = (PC_BDDC*)(pc->data); 9010c7d97c5SJed Brown PetscScalar* array_to; 9020c7d97c5SJed Brown PetscScalar* array_from; 9030c7d97c5SJed Brown MPI_Comm comm=((PetscObject)pc)->comm; 9040c7d97c5SJed Brown PetscInt i; 9050c7d97c5SJed Brown 9060c7d97c5SJed Brown PetscFunctionBegin; 9070c7d97c5SJed Brown 9080c7d97c5SJed Brown switch(pcbddc->coarse_communications_type){ 9090c7d97c5SJed Brown case SCATTERS_BDDC: 9100c7d97c5SJed Brown ierr = VecScatterEnd(pcbddc->coarse_loc_to_glob,vec_from,vec_to,imode,smode);CHKERRQ(ierr); 9110c7d97c5SJed Brown break; 9120c7d97c5SJed Brown case GATHERS_BDDC: 9130c7d97c5SJed Brown if(vec_from) VecGetArray(vec_from,&array_from); 9140c7d97c5SJed Brown if(vec_to) VecGetArray(vec_to,&array_to); 9150c7d97c5SJed Brown switch(pcbddc->coarse_problem_type){ 9160c7d97c5SJed Brown case SEQUENTIAL_BDDC: 9170c7d97c5SJed Brown if(smode == SCATTER_FORWARD) { 91853cdbc3dSStefano Zampini ierr = MPI_Gatherv(&array_from[0],pcbddc->local_primal_size,MPIU_SCALAR,&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,0,comm);CHKERRQ(ierr); 9190c7d97c5SJed Brown if(vec_to) { 9200c7d97c5SJed Brown for(i=0;i<pcbddc->replicated_primal_size;i++) 9210c7d97c5SJed Brown array_to[pcbddc->replicated_local_primal_indices[i]]+=pcbddc->replicated_local_primal_values[i]; 9220c7d97c5SJed Brown } 9230c7d97c5SJed Brown } else { 9240c7d97c5SJed Brown if(vec_from) 9250c7d97c5SJed Brown for(i=0;i<pcbddc->replicated_primal_size;i++) 9260c7d97c5SJed Brown pcbddc->replicated_local_primal_values[i]=array_from[pcbddc->replicated_local_primal_indices[i]]; 92753cdbc3dSStefano Zampini ierr = MPI_Scatterv(&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,&array_to[0],pcbddc->local_primal_size,MPIU_SCALAR,0,comm);CHKERRQ(ierr); 9280c7d97c5SJed Brown } 9290c7d97c5SJed Brown break; 9300c7d97c5SJed Brown case REPLICATED_BDDC: 9310c7d97c5SJed Brown if(smode == SCATTER_FORWARD) { 93253cdbc3dSStefano Zampini ierr = MPI_Allgatherv(&array_from[0],pcbddc->local_primal_size,MPIU_SCALAR,&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,comm);CHKERRQ(ierr); 9330c7d97c5SJed Brown for(i=0;i<pcbddc->replicated_primal_size;i++) 9340c7d97c5SJed Brown array_to[pcbddc->replicated_local_primal_indices[i]]+=pcbddc->replicated_local_primal_values[i]; 9350c7d97c5SJed Brown } else { /* no communications needed for SCATTER_REVERSE since needed data is already present */ 9360c7d97c5SJed Brown for(i=0;i<pcbddc->local_primal_size;i++) 9370c7d97c5SJed Brown array_to[i]=array_from[pcbddc->local_primal_indices[i]]; 9380c7d97c5SJed Brown } 9390c7d97c5SJed Brown break; 94053cdbc3dSStefano Zampini case MULTILEVEL_BDDC: 94153cdbc3dSStefano Zampini break; 94253cdbc3dSStefano Zampini case PARALLEL_BDDC: 94353cdbc3dSStefano Zampini break; 9440c7d97c5SJed Brown } 9450c7d97c5SJed Brown if(vec_from) VecRestoreArray(vec_from,&array_from); 9460c7d97c5SJed Brown if(vec_to) VecRestoreArray(vec_to,&array_to); 9470c7d97c5SJed Brown break; 9480c7d97c5SJed Brown } 9490c7d97c5SJed Brown PetscFunctionReturn(0); 9500c7d97c5SJed Brown } 9510c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 952de534f79Sstefano_zampini #ifdef BDDC_USE_POD 953de534f79Sstefano_zampini #if !defined(PETSC_MISSING_LAPACK_GESVD) 9543b03a366Sstefano_zampini #define PETSC_MISSING_LAPACK_GESVD 1 955de534f79Sstefano_zampini #define UNDEF_PETSC_MISSING_LAPACK_GESVD 1 956de534f79Sstefano_zampini #endif 9573b03a366Sstefano_zampini #endif 9583b03a366Sstefano_zampini 9593b03a366Sstefano_zampini #undef __FUNCT__ 9603b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCCreateConstraintMatrix" 9613b03a366Sstefano_zampini static PetscErrorCode PCBDDCCreateConstraintMatrix(PC pc) 9623b03a366Sstefano_zampini { 9633b03a366Sstefano_zampini PetscErrorCode ierr; 9643b03a366Sstefano_zampini PC_IS* pcis = (PC_IS*)(pc->data); 9653b03a366Sstefano_zampini PC_BDDC* pcbddc = (PC_BDDC*)pc->data; 9663b03a366Sstefano_zampini Mat_IS *matis = (Mat_IS*)pc->pmat->data; 967*23d4d1a5SStefano Zampini PetscInt *nnz,*is_indices; 9683b03a366Sstefano_zampini PetscScalar *temp_quadrature_constraint; 969534831adSStefano Zampini PetscInt *temp_indices,*temp_indices_to_constraint,*temp_indices_to_constraint_B,*local_to_B; 9703b03a366Sstefano_zampini PetscInt local_primal_size,i,j,k,total_counts,max_size_of_constraint; 9713b03a366Sstefano_zampini PetscInt n_constraints,n_vertices,size_of_constraint; 972534831adSStefano Zampini PetscScalar quad_value; 9733b03a366Sstefano_zampini PetscBool nnsp_has_cnst=PETSC_FALSE,use_nnsp_true=pcbddc->use_nnsp_true; 9743b03a366Sstefano_zampini PetscInt nnsp_size=0,nnsp_addone=0,temp_constraints,temp_start_ptr; 9753b03a366Sstefano_zampini IS *used_IS; 9763b03a366Sstefano_zampini const MatType impMatType=MATSEQAIJ; 9773b03a366Sstefano_zampini PetscBLASInt Bs,Bt,lwork,lierr; 9783b03a366Sstefano_zampini PetscReal tol=1.0e-8; 979fcda91b4SJed Brown MatNullSpace nearnullsp; 980fcda91b4SJed Brown const Vec *nearnullvecs; 9813b03a366Sstefano_zampini Vec *localnearnullsp; 9823b03a366Sstefano_zampini PetscScalar *work,*temp_basis,*array_vector,*correlation_mat; 9833b03a366Sstefano_zampini PetscReal *rwork,*singular_vals; 984534831adSStefano Zampini PetscBLASInt Bone=1,*ipiv; 985534831adSStefano Zampini Vec temp_vec; 986534831adSStefano Zampini Mat temp_mat; 987534831adSStefano Zampini KSP temp_ksp; 988534831adSStefano Zampini PetscInt s,start_constraint,dual_dofs; 989534831adSStefano Zampini PetscBool compute_submatrix,useksp=PETSC_FALSE; 990534831adSStefano Zampini PetscInt *aux_primal_permutation,*aux_primal_numbering; 991534831adSStefano Zampini PetscBool boolforface,*change_basis; 992de534f79Sstefano_zampini /* some ugly conditional declarations */ 9933b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD) 9943b03a366Sstefano_zampini PetscScalar dot_result; 9953b03a366Sstefano_zampini PetscScalar one=1.0,zero=0.0; 9963b03a366Sstefano_zampini PetscInt ii; 9973b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX) 9983b03a366Sstefano_zampini PetscScalar val1,val2; 9993b03a366Sstefano_zampini #endif 10003b03a366Sstefano_zampini #else 10013b03a366Sstefano_zampini PetscBLASInt dummy_int; 10023b03a366Sstefano_zampini PetscScalar dummy_scalar; 10033b03a366Sstefano_zampini #endif 10043b03a366Sstefano_zampini 10053b03a366Sstefano_zampini PetscFunctionBegin; 10063b03a366Sstefano_zampini /* check if near null space is attached to global mat */ 1007fcda91b4SJed Brown ierr = MatGetNearNullSpace(pc->pmat,&nearnullsp);CHKERRQ(ierr); 1008fcda91b4SJed Brown if (nearnullsp) { 1009fcda91b4SJed Brown ierr = MatNullSpaceGetVecs(nearnullsp,&nnsp_has_cnst,&nnsp_size,&nearnullvecs);CHKERRQ(ierr); 10103b03a366Sstefano_zampini } else { /* if near null space is not provided it uses constants */ 10113b03a366Sstefano_zampini nnsp_has_cnst = PETSC_TRUE; 10123b03a366Sstefano_zampini use_nnsp_true = PETSC_TRUE; 10133b03a366Sstefano_zampini } 10143b03a366Sstefano_zampini if(nnsp_has_cnst) { 10153b03a366Sstefano_zampini nnsp_addone = 1; 10163b03a366Sstefano_zampini } 10173b03a366Sstefano_zampini /* 10183b03a366Sstefano_zampini Evaluate maximum storage size needed by the procedure 10193b03a366Sstefano_zampini - temp_indices will contain start index of each constraint stored as follows 10203b03a366Sstefano_zampini - temp_indices_to_constraint [temp_indices[i],...,temp[indices[i+1]-1] will contain the indices (in local numbering) on which the constraint acts 1021534831adSStefano Zampini - temp_indices_to_constraint_B[temp_indices[i],...,temp[indices[i+1]-1] will contain the indices (in boundary numbering) on which the constraint acts 10223b03a366Sstefano_zampini - temp_quadrature_constraint [temp_indices[i],...,temp[indices[i+1]-1] will contain the scalars representing the constraint itself 10233b03a366Sstefano_zampini */ 1024da1bb401SStefano Zampini 10253b03a366Sstefano_zampini total_counts = pcbddc->n_ISForFaces+pcbddc->n_ISForEdges; 10263b03a366Sstefano_zampini total_counts *= (nnsp_addone+nnsp_size); 1027da1bb401SStefano Zampini ierr = ISGetSize(pcbddc->ISForVertices,&n_vertices);CHKERRQ(ierr); 1028da1bb401SStefano Zampini total_counts += n_vertices; 10293b03a366Sstefano_zampini ierr = PetscMalloc((total_counts+1)*sizeof(PetscInt),&temp_indices);CHKERRQ(ierr); 1030534831adSStefano Zampini ierr = PetscMalloc((total_counts+1)*sizeof(PetscBool),&change_basis);CHKERRQ(ierr); 10313b03a366Sstefano_zampini total_counts = 0; 10323b03a366Sstefano_zampini max_size_of_constraint = 0; 10333b03a366Sstefano_zampini for(i=0;i<pcbddc->n_ISForEdges+pcbddc->n_ISForFaces;i++){ 10343b03a366Sstefano_zampini if(i<pcbddc->n_ISForEdges){ 10353b03a366Sstefano_zampini used_IS = &pcbddc->ISForEdges[i]; 10363b03a366Sstefano_zampini } else { 10373b03a366Sstefano_zampini used_IS = &pcbddc->ISForFaces[i-pcbddc->n_ISForEdges]; 10383b03a366Sstefano_zampini } 10393b03a366Sstefano_zampini ierr = ISGetSize(*used_IS,&j);CHKERRQ(ierr); 10403b03a366Sstefano_zampini total_counts += j; 10413b03a366Sstefano_zampini if(j>max_size_of_constraint) max_size_of_constraint=j; 10423b03a366Sstefano_zampini } 10433b03a366Sstefano_zampini total_counts *= (nnsp_addone+nnsp_size); 1044da1bb401SStefano Zampini total_counts += n_vertices; 10453b03a366Sstefano_zampini ierr = PetscMalloc(total_counts*sizeof(PetscScalar),&temp_quadrature_constraint);CHKERRQ(ierr); 10463b03a366Sstefano_zampini ierr = PetscMalloc(total_counts*sizeof(PetscInt),&temp_indices_to_constraint);CHKERRQ(ierr); 1047534831adSStefano Zampini ierr = PetscMalloc(total_counts*sizeof(PetscInt),&temp_indices_to_constraint_B);CHKERRQ(ierr); 1048534831adSStefano Zampini ierr = PetscMalloc(pcis->n*sizeof(PetscInt),&local_to_B);CHKERRQ(ierr); 1049534831adSStefano Zampini ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 1050534831adSStefano Zampini for(i=0;i<pcis->n;i++) { 1051534831adSStefano Zampini local_to_B[i]=-1; 1052534831adSStefano Zampini } 1053534831adSStefano Zampini for(i=0;i<pcis->n_B;i++) { 1054534831adSStefano Zampini local_to_B[is_indices[i]]=i; 1055534831adSStefano Zampini } 1056534831adSStefano Zampini ierr = ISRestoreIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 1057534831adSStefano Zampini 10583b03a366Sstefano_zampini /* First we issue queries to allocate optimal workspace for LAPACKgesvd or LAPACKsyev/LAPACKheev */ 10593b03a366Sstefano_zampini rwork = 0; 10603b03a366Sstefano_zampini work = 0; 10613b03a366Sstefano_zampini singular_vals = 0; 10623b03a366Sstefano_zampini temp_basis = 0; 10633b03a366Sstefano_zampini correlation_mat = 0; 10643b03a366Sstefano_zampini if(!pcbddc->use_nnsp_true) { 10653b03a366Sstefano_zampini PetscScalar temp_work; 10663b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD) 10673b03a366Sstefano_zampini /* POD */ 10683b03a366Sstefano_zampini PetscInt max_n; 10693b03a366Sstefano_zampini max_n = nnsp_addone+nnsp_size; 10703b03a366Sstefano_zampini /* using some techniques borrowed from Proper Orthogonal Decomposition */ 10713b03a366Sstefano_zampini ierr = PetscMalloc(max_n*max_n*sizeof(PetscScalar),&correlation_mat);CHKERRQ(ierr); 10723b03a366Sstefano_zampini ierr = PetscMalloc(max_n*sizeof(PetscReal),&singular_vals);CHKERRQ(ierr); 10733b03a366Sstefano_zampini ierr = PetscMalloc(max_size_of_constraint*(nnsp_addone+nnsp_size)*sizeof(PetscScalar),&temp_basis);CHKERRQ(ierr); 10743b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX) 10753b03a366Sstefano_zampini ierr = PetscMalloc(3*max_n*sizeof(PetscReal),&rwork);CHKERRQ(ierr); 10763b03a366Sstefano_zampini #endif 10773b03a366Sstefano_zampini /* now we evaluate the optimal workspace using query with lwork=-1 */ 10783b03a366Sstefano_zampini Bt = PetscBLASIntCast(max_n); 10793b03a366Sstefano_zampini lwork=-1; 10803b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX) 10813b03a366Sstefano_zampini LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,&temp_work,&lwork,&lierr); 10823b03a366Sstefano_zampini #else 10833b03a366Sstefano_zampini LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,&temp_work,&lwork,rwork,&lierr); 10843b03a366Sstefano_zampini #endif 10853b03a366Sstefano_zampini #else /* on missing GESVD */ 10863b03a366Sstefano_zampini /* SVD */ 10873b03a366Sstefano_zampini PetscInt max_n,min_n; 10883b03a366Sstefano_zampini max_n = max_size_of_constraint; 10893b03a366Sstefano_zampini min_n = nnsp_addone+nnsp_size; 10903b03a366Sstefano_zampini if(max_size_of_constraint < ( nnsp_addone+nnsp_size ) ) { 10913b03a366Sstefano_zampini min_n = max_size_of_constraint; 10923b03a366Sstefano_zampini max_n = nnsp_addone+nnsp_size; 10933b03a366Sstefano_zampini } 10943b03a366Sstefano_zampini ierr = PetscMalloc(min_n*sizeof(PetscReal),&singular_vals);CHKERRQ(ierr); 10953b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX) 10963b03a366Sstefano_zampini ierr = PetscMalloc(5*min_n*sizeof(PetscReal),&rwork);CHKERRQ(ierr); 10973b03a366Sstefano_zampini #endif 10983b03a366Sstefano_zampini /* now we evaluate the optimal workspace using query with lwork=-1 */ 10993b03a366Sstefano_zampini lwork=-1; 11003b03a366Sstefano_zampini Bs = PetscBLASIntCast(max_n); 11013b03a366Sstefano_zampini Bt = PetscBLASIntCast(min_n); 11023b03a366Sstefano_zampini dummy_int = Bs; 1103670f3ff9SJed Brown ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 11043b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX) 11053b03a366Sstefano_zampini LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[0],&Bs,singular_vals, 11063b03a366Sstefano_zampini &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,&temp_work,&lwork,&lierr); 11073b03a366Sstefano_zampini #else 11083b03a366Sstefano_zampini LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[0],&Bs,singular_vals, 11093b03a366Sstefano_zampini &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,&temp_work,&lwork,rwork,&lierr); 11103b03a366Sstefano_zampini #endif 11113b03a366Sstefano_zampini if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SVD Lapack routine %d",(int)lierr); 1112670f3ff9SJed Brown ierr = PetscFPTrapPop();CHKERRQ(ierr); 11133b03a366Sstefano_zampini #endif 11143b03a366Sstefano_zampini /* Allocate optimal workspace */ 11153b03a366Sstefano_zampini lwork = PetscBLASIntCast((PetscInt)PetscRealPart(temp_work)); 11163b03a366Sstefano_zampini total_counts = (PetscInt)lwork; 11173b03a366Sstefano_zampini ierr = PetscMalloc(total_counts*sizeof(PetscScalar),&work);CHKERRQ(ierr); 11183b03a366Sstefano_zampini } 11193b03a366Sstefano_zampini /* get local part of global near null space vectors */ 11203b03a366Sstefano_zampini ierr = PetscMalloc(nnsp_size*sizeof(Vec),&localnearnullsp);CHKERRQ(ierr); 11213b03a366Sstefano_zampini for(k=0;k<nnsp_size;k++) { 11223b03a366Sstefano_zampini ierr = VecDuplicate(pcis->vec1_N,&localnearnullsp[k]);CHKERRQ(ierr); 1123fcda91b4SJed Brown ierr = VecScatterBegin(matis->ctx,nearnullvecs[k],localnearnullsp[k],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1124fcda91b4SJed Brown ierr = VecScatterEnd (matis->ctx,nearnullvecs[k],localnearnullsp[k],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 11253b03a366Sstefano_zampini } 11263b03a366Sstefano_zampini /* Now we can loop on constraining sets */ 11273b03a366Sstefano_zampini total_counts=0; 11283b03a366Sstefano_zampini temp_indices[0]=0; 1129da1bb401SStefano Zampini /* vertices */ 1130da1bb401SStefano Zampini PetscBool used_vertex; 1131da1bb401SStefano Zampini ierr = ISGetIndices(pcbddc->ISForVertices,(const PetscInt**)&is_indices);CHKERRQ(ierr); 1132da1bb401SStefano Zampini if(nnsp_has_cnst) { /* consider all vertices */ 1133da1bb401SStefano Zampini for(i=0;i<n_vertices;i++) { 1134da1bb401SStefano Zampini temp_indices_to_constraint[temp_indices[total_counts]]=is_indices[i]; 1135534831adSStefano Zampini temp_indices_to_constraint_B[temp_indices[total_counts]]=local_to_B[is_indices[i]]; 1136da1bb401SStefano Zampini temp_quadrature_constraint[temp_indices[total_counts]]=1.0; 1137da1bb401SStefano Zampini temp_indices[total_counts+1]=temp_indices[total_counts]+1; 1138534831adSStefano Zampini change_basis[total_counts]=PETSC_FALSE; 1139da1bb401SStefano Zampini total_counts++; 1140da1bb401SStefano Zampini } 1141da1bb401SStefano Zampini } else { /* consider vertices for which exist at least a localnearnullsp which is not null there */ 1142da1bb401SStefano Zampini for(i=0;i<n_vertices;i++) { 1143da1bb401SStefano Zampini used_vertex=PETSC_FALSE; 1144da1bb401SStefano Zampini k=0; 1145da1bb401SStefano Zampini while(!used_vertex && k<nnsp_size) { 1146da1bb401SStefano Zampini ierr = VecGetArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr); 1147da1bb401SStefano Zampini if(PetscAbsScalar(array_vector[is_indices[i]])>0.0) { 1148da1bb401SStefano Zampini temp_indices_to_constraint[temp_indices[total_counts]]=is_indices[i]; 1149534831adSStefano Zampini temp_indices_to_constraint_B[temp_indices[total_counts]]=local_to_B[is_indices[i]]; 1150da1bb401SStefano Zampini temp_quadrature_constraint[temp_indices[total_counts]]=1.0; 1151da1bb401SStefano Zampini temp_indices[total_counts+1]=temp_indices[total_counts]+1; 1152534831adSStefano Zampini change_basis[total_counts]=PETSC_FALSE; 1153da1bb401SStefano Zampini total_counts++; 1154da1bb401SStefano Zampini used_vertex=PETSC_TRUE; 1155da1bb401SStefano Zampini } 1156da1bb401SStefano Zampini ierr = VecRestoreArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr); 1157da1bb401SStefano Zampini k++; 1158da1bb401SStefano Zampini } 1159da1bb401SStefano Zampini } 1160da1bb401SStefano Zampini } 1161da1bb401SStefano Zampini ierr = ISRestoreIndices(pcbddc->ISForVertices,(const PetscInt**)&is_indices);CHKERRQ(ierr); 1162da1bb401SStefano Zampini n_vertices=total_counts; 1163da1bb401SStefano Zampini /* edges and faces */ 11643b03a366Sstefano_zampini for(i=0;i<pcbddc->n_ISForEdges+pcbddc->n_ISForFaces;i++){ 11653b03a366Sstefano_zampini if(i<pcbddc->n_ISForEdges){ 11663b03a366Sstefano_zampini used_IS = &pcbddc->ISForEdges[i]; 1167534831adSStefano Zampini boolforface = pcbddc->usechangeofbasis; 11683b03a366Sstefano_zampini } else { 11693b03a366Sstefano_zampini used_IS = &pcbddc->ISForFaces[i-pcbddc->n_ISForEdges]; 1170534831adSStefano Zampini boolforface = pcbddc->usechangeonfaces; 11713b03a366Sstefano_zampini } 11723b03a366Sstefano_zampini temp_constraints = 0; /* zero the number of constraints I have on this conn comp */ 11733b03a366Sstefano_zampini temp_start_ptr = total_counts; /* need to know the starting index of constraints stored */ 11743b03a366Sstefano_zampini ierr = ISGetSize(*used_IS,&size_of_constraint);CHKERRQ(ierr); 11753b03a366Sstefano_zampini ierr = ISGetIndices(*used_IS,(const PetscInt**)&is_indices);CHKERRQ(ierr); 11763b03a366Sstefano_zampini if(nnsp_has_cnst) { 11773b03a366Sstefano_zampini temp_constraints++; 1178534831adSStefano Zampini quad_value = (PetscScalar) (1.0/PetscSqrtReal((PetscReal)size_of_constraint)); 11793b03a366Sstefano_zampini for(j=0;j<size_of_constraint;j++) { 11803b03a366Sstefano_zampini temp_indices_to_constraint[temp_indices[total_counts]+j]=is_indices[j]; 1181534831adSStefano Zampini temp_indices_to_constraint_B[temp_indices[total_counts]+j]=local_to_B[is_indices[j]]; 11823b03a366Sstefano_zampini temp_quadrature_constraint[temp_indices[total_counts]+j]=quad_value; 11833b03a366Sstefano_zampini } 11843b03a366Sstefano_zampini temp_indices[total_counts+1]=temp_indices[total_counts]+size_of_constraint; /* store new starting point */ 1185534831adSStefano Zampini change_basis[total_counts]=boolforface; 11863b03a366Sstefano_zampini total_counts++; 11873b03a366Sstefano_zampini } 11883b03a366Sstefano_zampini for(k=0;k<nnsp_size;k++) { 11893b03a366Sstefano_zampini ierr = VecGetArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr); 11903b03a366Sstefano_zampini for(j=0;j<size_of_constraint;j++) { 11913b03a366Sstefano_zampini temp_indices_to_constraint[temp_indices[total_counts]+j]=is_indices[j]; 1192534831adSStefano Zampini temp_indices_to_constraint_B[temp_indices[total_counts]+j]=local_to_B[is_indices[j]]; 11933b03a366Sstefano_zampini temp_quadrature_constraint[temp_indices[total_counts]+j]=array_vector[is_indices[j]]; 11943b03a366Sstefano_zampini } 11953b03a366Sstefano_zampini ierr = VecRestoreArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr); 1196de534f79Sstefano_zampini quad_value = 1.0; 1197de534f79Sstefano_zampini if( use_nnsp_true ) { /* check if array is null on the connected component in case use_nnsp_true has been requested */ 1198de534f79Sstefano_zampini Bs = PetscBLASIntCast(size_of_constraint); 1199de534f79Sstefano_zampini quad_value = BLASasum_(&Bs,&temp_quadrature_constraint[temp_indices[total_counts]],&Bone); 1200de534f79Sstefano_zampini } 1201de534f79Sstefano_zampini if ( quad_value > 0.0 ) { /* keep indices and values */ 1202de534f79Sstefano_zampini temp_constraints++; 12033b03a366Sstefano_zampini temp_indices[total_counts+1]=temp_indices[total_counts]+size_of_constraint; /* store new starting point */ 1204534831adSStefano Zampini change_basis[total_counts]=boolforface; 12053b03a366Sstefano_zampini total_counts++; 12063b03a366Sstefano_zampini } 1207de534f79Sstefano_zampini } 12083b03a366Sstefano_zampini ierr = ISRestoreIndices(*used_IS,(const PetscInt**)&is_indices);CHKERRQ(ierr); 1209de534f79Sstefano_zampini /* perform SVD on the constraint if use_nnsp_true has not be requested by the user */ 12103b03a366Sstefano_zampini if(!use_nnsp_true) { 1211de534f79Sstefano_zampini 12123b03a366Sstefano_zampini Bs = PetscBLASIntCast(size_of_constraint); 12133b03a366Sstefano_zampini Bt = PetscBLASIntCast(temp_constraints); 1214de534f79Sstefano_zampini 12153b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD) 12163b03a366Sstefano_zampini ierr = PetscMemzero(correlation_mat,Bt*Bt*sizeof(PetscScalar));CHKERRQ(ierr); 12173b03a366Sstefano_zampini /* Store upper triangular part of correlation matrix */ 12183b03a366Sstefano_zampini for(j=0;j<temp_constraints;j++) { 12193b03a366Sstefano_zampini for(k=0;k<j+1;k++) { 12203b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX) 12213b03a366Sstefano_zampini /* hand made complex dot product */ 12223b03a366Sstefano_zampini dot_result = 0.0; 12233b03a366Sstefano_zampini for (ii=0; ii<size_of_constraint; ii++) { 12243b03a366Sstefano_zampini val1 = temp_quadrature_constraint[temp_indices[temp_start_ptr+j]+ii]; 12253b03a366Sstefano_zampini val2 = temp_quadrature_constraint[temp_indices[temp_start_ptr+k]+ii]; 12263b03a366Sstefano_zampini dot_result += val1*PetscConj(val2); 12273b03a366Sstefano_zampini } 12283b03a366Sstefano_zampini #else 12293b03a366Sstefano_zampini dot_result = BLASdot_(&Bs,&temp_quadrature_constraint[temp_indices[temp_start_ptr+j]],&Bone, 12303b03a366Sstefano_zampini &temp_quadrature_constraint[temp_indices[temp_start_ptr+k]],&Bone); 12313b03a366Sstefano_zampini #endif 12323b03a366Sstefano_zampini correlation_mat[j*temp_constraints+k]=dot_result; 12333b03a366Sstefano_zampini } 12343b03a366Sstefano_zampini } 12353b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX) 12363b03a366Sstefano_zampini LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,work,&lwork,&lierr); 12373b03a366Sstefano_zampini #else 12383b03a366Sstefano_zampini LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,work,&lwork,rwork,&lierr); 12393b03a366Sstefano_zampini #endif 12403b03a366Sstefano_zampini if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in EV Lapack routine %d",(int)lierr); 12413b03a366Sstefano_zampini /* retain eigenvalues greater than tol: note that lapack SYEV gives eigs in ascending order */ 12423b03a366Sstefano_zampini j=0; 12433b03a366Sstefano_zampini while( j < Bt && singular_vals[j] < tol) j++; 12443b03a366Sstefano_zampini total_counts=total_counts-j; 12453b03a366Sstefano_zampini if(j<temp_constraints) { 12463b03a366Sstefano_zampini for(k=j;k<Bt;k++) { singular_vals[k]=1.0/PetscSqrtReal(singular_vals[k]); } 12473b03a366Sstefano_zampini BLASgemm_("N","N",&Bs,&Bt,&Bt,&one,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,correlation_mat,&Bt,&zero,temp_basis,&Bs); 12483b03a366Sstefano_zampini /* copy POD basis into used quadrature memory */ 12493b03a366Sstefano_zampini for(k=0;k<Bt-j;k++) { 12503b03a366Sstefano_zampini for(ii=0;ii<size_of_constraint;ii++) { 12513b03a366Sstefano_zampini temp_quadrature_constraint[temp_indices[temp_start_ptr+k]+ii]=singular_vals[Bt-1-k]*temp_basis[(Bt-1-k)*size_of_constraint+ii]; 12523b03a366Sstefano_zampini } 12533b03a366Sstefano_zampini } 12543b03a366Sstefano_zampini } 1255de534f79Sstefano_zampini 12563b03a366Sstefano_zampini #else /* on missing GESVD */ 1257de534f79Sstefano_zampini 12583b03a366Sstefano_zampini PetscInt min_n = temp_constraints; 12593b03a366Sstefano_zampini if(min_n > size_of_constraint) min_n = size_of_constraint; 12603b03a366Sstefano_zampini dummy_int = Bs; 1261670f3ff9SJed Brown ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 12623b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX) 12633b03a366Sstefano_zampini LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,singular_vals, 12643b03a366Sstefano_zampini &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,work,&lwork,&lierr); 12653b03a366Sstefano_zampini #else 12663b03a366Sstefano_zampini LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,singular_vals, 12673b03a366Sstefano_zampini &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,work,&lwork,rwork,&lierr); 12683b03a366Sstefano_zampini #endif 12693b03a366Sstefano_zampini if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SVD Lapack routine %d",(int)lierr); 1270670f3ff9SJed Brown ierr = PetscFPTrapPop();CHKERRQ(ierr); 12713b03a366Sstefano_zampini /* retain eigenvalues greater than tol: note that lapack SVD gives eigs in descending order */ 12723b03a366Sstefano_zampini j=0; 12733b03a366Sstefano_zampini while( j < min_n && singular_vals[min_n-j-1] < tol) j++; 12743b03a366Sstefano_zampini total_counts = total_counts-(PetscInt)Bt+(min_n-j); 12753b03a366Sstefano_zampini #endif 12763b03a366Sstefano_zampini } 12773b03a366Sstefano_zampini } 1278534831adSStefano Zampini 1279da1bb401SStefano Zampini n_constraints=total_counts-n_vertices; 1280da1bb401SStefano Zampini local_primal_size = total_counts; 12813b03a366Sstefano_zampini /* set quantities in pcbddc data structure */ 12823b03a366Sstefano_zampini pcbddc->n_vertices = n_vertices; 12833b03a366Sstefano_zampini pcbddc->n_constraints = n_constraints; 1284da1bb401SStefano Zampini pcbddc->local_primal_size = local_primal_size; 1285534831adSStefano Zampini 1286534831adSStefano Zampini /* Create constraint matrix */ 1287534831adSStefano Zampini /* The constraint matrix is used to compute the l2g map of primal dofs */ 1288534831adSStefano Zampini /* so we need to set it up properly either with or without change of basis */ 1289534831adSStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->ConstraintMatrix);CHKERRQ(ierr); 1290534831adSStefano Zampini ierr = MatSetType(pcbddc->ConstraintMatrix,impMatType);CHKERRQ(ierr); 1291534831adSStefano Zampini ierr = MatSetSizes(pcbddc->ConstraintMatrix,local_primal_size,pcis->n,local_primal_size,pcis->n);CHKERRQ(ierr); 1292534831adSStefano Zampini /* compute a local numbering of constraints : vertices first then constraints */ 1293534831adSStefano Zampini ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr); 1294534831adSStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array_vector);CHKERRQ(ierr); 1295534831adSStefano Zampini ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&aux_primal_numbering);CHKERRQ(ierr); 1296534831adSStefano Zampini ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&aux_primal_permutation);CHKERRQ(ierr); 1297534831adSStefano Zampini total_counts=0; 1298534831adSStefano Zampini /* find vertices: subdomain corners plus dofs with basis changed */ 1299534831adSStefano Zampini for(i=0;i<local_primal_size;i++) { 1300534831adSStefano Zampini size_of_constraint=temp_indices[i+1]-temp_indices[i]; 1301534831adSStefano Zampini if(change_basis[i] || size_of_constraint == 1) { 1302534831adSStefano Zampini k=0; 1303534831adSStefano Zampini while(k < size_of_constraint && array_vector[temp_indices_to_constraint[temp_indices[i]+size_of_constraint-k-1]] != 0.0) { 1304534831adSStefano Zampini k=k+1; 1305534831adSStefano Zampini } 1306534831adSStefano Zampini j=temp_indices_to_constraint[temp_indices[i]+size_of_constraint-k-1]; 1307534831adSStefano Zampini array_vector[j] = 1.0; 1308534831adSStefano Zampini aux_primal_numbering[total_counts]=j; 1309534831adSStefano Zampini aux_primal_permutation[total_counts]=total_counts; 1310534831adSStefano Zampini total_counts++; 1311534831adSStefano Zampini } 1312534831adSStefano Zampini } 1313534831adSStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array_vector);CHKERRQ(ierr); 1314534831adSStefano Zampini /* permute indices in order to have a sorted set of vertices */ 1315534831adSStefano Zampini ierr = PetscSortIntWithPermutation(total_counts,aux_primal_numbering,aux_primal_permutation); 1316534831adSStefano Zampini /* nonzero structure */ 1317534831adSStefano Zampini ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&nnz);CHKERRQ(ierr); 1318534831adSStefano Zampini for(i=0;i<total_counts;i++) { 1319534831adSStefano Zampini nnz[i]=1; 1320534831adSStefano Zampini } 1321534831adSStefano Zampini j=total_counts; 1322534831adSStefano Zampini for(i=n_vertices;i<local_primal_size;i++) { 1323534831adSStefano Zampini if(!change_basis[i]) { 1324534831adSStefano Zampini nnz[j]=temp_indices[i+1]-temp_indices[i]; 1325534831adSStefano Zampini j++; 1326534831adSStefano Zampini } 1327534831adSStefano Zampini } 1328534831adSStefano Zampini ierr = MatSeqAIJSetPreallocation(pcbddc->ConstraintMatrix,0,nnz);CHKERRQ(ierr); 1329534831adSStefano Zampini ierr = PetscFree(nnz);CHKERRQ(ierr); 1330534831adSStefano Zampini /* set values in constraint matrix */ 1331534831adSStefano Zampini for(i=0;i<total_counts;i++) { 1332534831adSStefano Zampini j = aux_primal_permutation[i]; 1333534831adSStefano Zampini k = aux_primal_numbering[j]; 1334534831adSStefano Zampini ierr = MatSetValue(pcbddc->ConstraintMatrix,i,k,1.0,INSERT_VALUES);CHKERRQ(ierr); 1335534831adSStefano Zampini } 1336534831adSStefano Zampini for(i=n_vertices;i<local_primal_size;i++) { 1337534831adSStefano Zampini if(!change_basis[i]) { 1338534831adSStefano Zampini size_of_constraint=temp_indices[i+1]-temp_indices[i]; 1339534831adSStefano Zampini ierr = MatSetValues(pcbddc->ConstraintMatrix,1,&total_counts,size_of_constraint,&temp_indices_to_constraint[temp_indices[i]],&temp_quadrature_constraint[temp_indices[i]],INSERT_VALUES);CHKERRQ(ierr); 1340534831adSStefano Zampini total_counts++; 1341534831adSStefano Zampini } 1342534831adSStefano Zampini } 1343534831adSStefano Zampini ierr = PetscFree(aux_primal_numbering);CHKERRQ(ierr); 1344534831adSStefano Zampini ierr = PetscFree(aux_primal_permutation);CHKERRQ(ierr); 1345534831adSStefano Zampini /* assembling */ 1346534831adSStefano Zampini ierr = MatAssemblyBegin(pcbddc->ConstraintMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1347534831adSStefano Zampini ierr = MatAssemblyEnd(pcbddc->ConstraintMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1348534831adSStefano Zampini 1349534831adSStefano Zampini /* Create matrix for change of basis. We don't need it in case pcbddc->usechangeofbasis is FALSE */ 1350534831adSStefano Zampini if(pcbddc->usechangeofbasis) { 1351534831adSStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr); 1352534831adSStefano Zampini ierr = MatSetType(pcbddc->ChangeOfBasisMatrix,impMatType);CHKERRQ(ierr); 1353534831adSStefano Zampini ierr = MatSetSizes(pcbddc->ChangeOfBasisMatrix,pcis->n_B,pcis->n_B,pcis->n_B,pcis->n_B);CHKERRQ(ierr); 1354534831adSStefano Zampini /* work arrays */ 1355534831adSStefano Zampini /* we need to reuse these arrays, so we free them */ 1356534831adSStefano Zampini ierr = PetscFree(temp_basis);CHKERRQ(ierr); 1357534831adSStefano Zampini ierr = PetscFree(work);CHKERRQ(ierr); 1358534831adSStefano Zampini ierr = PetscMalloc(pcis->n_B*sizeof(PetscInt),&nnz);CHKERRQ(ierr); 1359534831adSStefano Zampini ierr = PetscMalloc((nnsp_addone+nnsp_size)*(nnsp_addone+nnsp_size)*sizeof(PetscScalar),&temp_basis);CHKERRQ(ierr); 1360534831adSStefano Zampini ierr = PetscMalloc((nnsp_addone+nnsp_size)*sizeof(PetscScalar),&work);CHKERRQ(ierr); 1361534831adSStefano Zampini ierr = PetscMalloc((nnsp_addone+nnsp_size)*sizeof(PetscBLASInt),&ipiv);CHKERRQ(ierr); 1362534831adSStefano Zampini for(i=0;i<pcis->n_B;i++) { 1363534831adSStefano Zampini nnz[i]=1; 1364534831adSStefano Zampini } 1365534831adSStefano Zampini /* Overestimated nonzeros per row */ 1366534831adSStefano Zampini k=1; 1367534831adSStefano Zampini for(i=pcbddc->n_vertices;i<local_primal_size;i++) { 1368534831adSStefano Zampini if(change_basis[i]) { 1369534831adSStefano Zampini size_of_constraint = temp_indices[i+1]-temp_indices[i]; 1370534831adSStefano Zampini if(k < size_of_constraint) { 1371534831adSStefano Zampini k = size_of_constraint; 1372534831adSStefano Zampini } 1373534831adSStefano Zampini for(j=0;j<size_of_constraint;j++) { 1374534831adSStefano Zampini nnz[temp_indices_to_constraint_B[temp_indices[i]+j]] = size_of_constraint; 1375534831adSStefano Zampini } 1376534831adSStefano Zampini } 1377534831adSStefano Zampini } 1378534831adSStefano Zampini ierr = MatSeqAIJSetPreallocation(pcbddc->ChangeOfBasisMatrix,0,nnz);CHKERRQ(ierr); 1379534831adSStefano Zampini ierr = PetscFree(nnz);CHKERRQ(ierr); 1380534831adSStefano Zampini /* Temporary array to store indices */ 1381534831adSStefano Zampini ierr = PetscMalloc(k*sizeof(PetscInt),&is_indices);CHKERRQ(ierr); 1382534831adSStefano Zampini /* Set initial identity in the matrix */ 1383534831adSStefano Zampini for(i=0;i<pcis->n_B;i++) { 1384534831adSStefano Zampini ierr = MatSetValue(pcbddc->ChangeOfBasisMatrix,i,i,1.0,INSERT_VALUES);CHKERRQ(ierr); 1385534831adSStefano Zampini } 1386534831adSStefano Zampini /* Now we loop on the constraints which need a change of basis */ 1387534831adSStefano Zampini /* Change of basis matrix is evaluated as the FIRST APPROACH in */ 1388534831adSStefano Zampini /* Klawonn and Widlund, Dual-primal FETI-DP methods for linear elasticity, (6.2.1) */ 1389534831adSStefano Zampini temp_constraints = 0; 1390534831adSStefano Zampini temp_start_ptr = temp_indices_to_constraint_B[temp_indices[pcbddc->n_vertices]]; 1391534831adSStefano Zampini for(i=pcbddc->n_vertices;i<local_primal_size;i++) { 1392534831adSStefano Zampini if(change_basis[i]) { 1393534831adSStefano Zampini compute_submatrix = PETSC_FALSE; 1394534831adSStefano Zampini useksp = PETSC_FALSE; 1395534831adSStefano Zampini if(temp_start_ptr == temp_indices_to_constraint_B[temp_indices[i]]) { 1396534831adSStefano Zampini temp_constraints++; 1397534831adSStefano Zampini if(temp_start_ptr != temp_indices_to_constraint_B[temp_indices[i+1]]) { 1398534831adSStefano Zampini compute_submatrix = PETSC_TRUE; 1399534831adSStefano Zampini } 1400534831adSStefano Zampini } 1401534831adSStefano Zampini if(compute_submatrix) { 1402534831adSStefano Zampini if(temp_constraints > 1 || pcbddc->use_nnsp_true) { 1403534831adSStefano Zampini useksp = PETSC_TRUE; 1404534831adSStefano Zampini } 1405534831adSStefano Zampini size_of_constraint = temp_indices[i+1]-temp_indices[i]; 1406534831adSStefano Zampini if(useksp) { /* experimental */ 1407534831adSStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&temp_mat);CHKERRQ(ierr); 1408534831adSStefano Zampini ierr = MatSetType(temp_mat,impMatType);CHKERRQ(ierr); 1409534831adSStefano Zampini ierr = MatSetSizes(temp_mat,size_of_constraint,size_of_constraint,size_of_constraint,size_of_constraint);CHKERRQ(ierr); 1410534831adSStefano Zampini ierr = MatSeqAIJSetPreallocation(temp_mat,size_of_constraint,PETSC_NULL);CHKERRQ(ierr); 1411534831adSStefano Zampini } 1412534831adSStefano Zampini /* First _size_of_constraint-temp_constraints_ columns */ 1413534831adSStefano Zampini dual_dofs = size_of_constraint-temp_constraints; 1414534831adSStefano Zampini start_constraint = i+1-temp_constraints; 1415534831adSStefano Zampini for(s=0;s<dual_dofs;s++) { 1416534831adSStefano Zampini is_indices[0] = s; 1417534831adSStefano Zampini for(j=0;j<temp_constraints;j++) { 1418534831adSStefano Zampini for(k=0;k<temp_constraints;k++) { 1419534831adSStefano Zampini temp_basis[j*temp_constraints+k]=temp_quadrature_constraint[temp_indices[start_constraint+k]+s+j+1]; 1420534831adSStefano Zampini } 1421534831adSStefano Zampini work[j]=-temp_quadrature_constraint[temp_indices[start_constraint+j]+s]; 1422534831adSStefano Zampini is_indices[j+1]=s+j+1; 1423534831adSStefano Zampini } 1424534831adSStefano Zampini Bt = temp_constraints; 1425534831adSStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 1426534831adSStefano Zampini LAPACKgesv_(&Bt,&Bone,temp_basis,&Bt,ipiv,work,&Bt,&lierr); 1427534831adSStefano Zampini if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GESV Lapack routine %d",(int)lierr); 1428534831adSStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 1429534831adSStefano Zampini j = temp_indices_to_constraint_B[temp_indices[start_constraint]+s]; 1430534831adSStefano Zampini ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,temp_constraints,&temp_indices_to_constraint_B[temp_indices[start_constraint]+s+1],1,&j,work,INSERT_VALUES);CHKERRQ(ierr); 1431534831adSStefano Zampini if(useksp) { 1432534831adSStefano Zampini /* temp mat with transposed rows and columns */ 1433534831adSStefano Zampini ierr = MatSetValues(temp_mat,1,&s,temp_constraints,&is_indices[1],work,INSERT_VALUES);CHKERRQ(ierr); 1434534831adSStefano Zampini ierr = MatSetValue(temp_mat,is_indices[0],is_indices[0],1.0,INSERT_VALUES);CHKERRQ(ierr); 1435534831adSStefano Zampini } 1436534831adSStefano Zampini } 1437534831adSStefano Zampini if(useksp) { 1438534831adSStefano Zampini /* last rows of temp_mat */ 1439534831adSStefano Zampini for(j=0;j<size_of_constraint;j++) { 1440534831adSStefano Zampini is_indices[j] = j; 1441534831adSStefano Zampini } 1442534831adSStefano Zampini for(s=0;s<temp_constraints;s++) { 1443534831adSStefano Zampini k = s + dual_dofs; 1444534831adSStefano Zampini ierr = MatSetValues(temp_mat,1,&k,size_of_constraint,is_indices,&temp_quadrature_constraint[temp_indices[start_constraint+s]],INSERT_VALUES);CHKERRQ(ierr); 1445534831adSStefano Zampini } 1446534831adSStefano Zampini ierr = MatAssemblyBegin(temp_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1447534831adSStefano Zampini ierr = MatAssemblyEnd(temp_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1448534831adSStefano Zampini ierr = MatGetVecs(temp_mat,&temp_vec,PETSC_NULL);CHKERRQ(ierr); 1449534831adSStefano Zampini ierr = KSPCreate(PETSC_COMM_SELF,&temp_ksp);CHKERRQ(ierr); 1450534831adSStefano Zampini ierr = KSPSetOperators(temp_ksp,temp_mat,temp_mat,SAME_PRECONDITIONER);CHKERRQ(ierr); 1451534831adSStefano Zampini ierr = KSPSetType(temp_ksp,KSPPREONLY);CHKERRQ(ierr); 1452534831adSStefano Zampini ierr = KSPSetUp(temp_ksp);CHKERRQ(ierr); 1453534831adSStefano Zampini for(s=0;s<temp_constraints;s++) { 1454534831adSStefano Zampini ierr = VecSet(temp_vec,0.0);CHKERRQ(ierr); 1455534831adSStefano Zampini ierr = VecSetValue(temp_vec,s+dual_dofs,1.0,INSERT_VALUES);CHKERRQ(ierr); 1456534831adSStefano Zampini ierr = VecAssemblyBegin(temp_vec);CHKERRQ(ierr); 1457534831adSStefano Zampini ierr = VecAssemblyEnd(temp_vec);CHKERRQ(ierr); 1458534831adSStefano Zampini ierr = KSPSolve(temp_ksp,temp_vec,temp_vec);CHKERRQ(ierr); 1459534831adSStefano Zampini ierr = VecGetArray(temp_vec,&array_vector);CHKERRQ(ierr); 1460534831adSStefano Zampini j = temp_indices_to_constraint_B[temp_indices[start_constraint+s]+size_of_constraint-s-1]; 1461534831adSStefano Zampini /* last columns of change of basis matrix associated to new primal dofs */ 1462534831adSStefano Zampini ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,size_of_constraint,&temp_indices_to_constraint_B[temp_indices[start_constraint+s]],1,&j,array_vector,INSERT_VALUES);CHKERRQ(ierr); 1463534831adSStefano Zampini ierr = VecRestoreArray(temp_vec,&array_vector);CHKERRQ(ierr); 1464534831adSStefano Zampini } 1465534831adSStefano Zampini ierr = MatDestroy(&temp_mat);CHKERRQ(ierr); 1466534831adSStefano Zampini ierr = KSPDestroy(&temp_ksp);CHKERRQ(ierr); 1467534831adSStefano Zampini ierr = VecDestroy(&temp_vec);CHKERRQ(ierr); 1468534831adSStefano Zampini } else { 1469534831adSStefano Zampini /* last columns of change of basis matrix associated to new primal dofs */ 1470534831adSStefano Zampini for(s=0;s<temp_constraints;s++) { 1471534831adSStefano Zampini j = temp_indices_to_constraint_B[temp_indices[start_constraint+s]+size_of_constraint-s-1]; 1472534831adSStefano Zampini ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,size_of_constraint,&temp_indices_to_constraint_B[temp_indices[start_constraint+s]],1,&j,&temp_quadrature_constraint[temp_indices[start_constraint+s]],INSERT_VALUES);CHKERRQ(ierr); 1473534831adSStefano Zampini } 1474534831adSStefano Zampini } 1475534831adSStefano Zampini /* prepare for the next cycle */ 1476534831adSStefano Zampini temp_constraints = 0; 1477534831adSStefano Zampini temp_start_ptr = temp_indices_to_constraint_B[temp_indices[i+1]]; 1478534831adSStefano Zampini } 1479534831adSStefano Zampini } 1480534831adSStefano Zampini } 1481534831adSStefano Zampini /* assembling */ 1482534831adSStefano Zampini ierr = MatAssemblyBegin(pcbddc->ChangeOfBasisMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1483534831adSStefano Zampini ierr = MatAssemblyEnd(pcbddc->ChangeOfBasisMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1484534831adSStefano Zampini ierr = PetscFree(ipiv);CHKERRQ(ierr); 1485534831adSStefano Zampini ierr = PetscFree(is_indices);CHKERRQ(ierr); 1486534831adSStefano Zampini } 14873b03a366Sstefano_zampini /* free workspace no longer needed */ 14883b03a366Sstefano_zampini ierr = PetscFree(rwork);CHKERRQ(ierr); 14893b03a366Sstefano_zampini ierr = PetscFree(work);CHKERRQ(ierr); 14903b03a366Sstefano_zampini ierr = PetscFree(temp_basis);CHKERRQ(ierr); 14913b03a366Sstefano_zampini ierr = PetscFree(singular_vals);CHKERRQ(ierr); 14923b03a366Sstefano_zampini ierr = PetscFree(correlation_mat);CHKERRQ(ierr); 14933b03a366Sstefano_zampini ierr = PetscFree(temp_indices);CHKERRQ(ierr); 1494534831adSStefano Zampini ierr = PetscFree(change_basis);CHKERRQ(ierr); 14953b03a366Sstefano_zampini ierr = PetscFree(temp_indices_to_constraint);CHKERRQ(ierr); 1496534831adSStefano Zampini ierr = PetscFree(temp_indices_to_constraint_B);CHKERRQ(ierr); 1497534831adSStefano Zampini ierr = PetscFree(local_to_B);CHKERRQ(ierr); 14983b03a366Sstefano_zampini ierr = PetscFree(temp_quadrature_constraint);CHKERRQ(ierr); 1499da1bb401SStefano Zampini for(k=0;k<nnsp_size;k++) { 1500da1bb401SStefano Zampini ierr = VecDestroy(&localnearnullsp[k]);CHKERRQ(ierr); 1501da1bb401SStefano Zampini } 15023b03a366Sstefano_zampini ierr = PetscFree(localnearnullsp);CHKERRQ(ierr); 15033b03a366Sstefano_zampini PetscFunctionReturn(0); 15043b03a366Sstefano_zampini } 1505de534f79Sstefano_zampini #ifdef UNDEF_PETSC_MISSING_LAPACK_GESVD 15063b03a366Sstefano_zampini #undef PETSC_MISSING_LAPACK_GESVD 15073b03a366Sstefano_zampini #endif 15083b03a366Sstefano_zampini /* -------------------------------------------------------------------------- */ 15090c7d97c5SJed Brown #undef __FUNCT__ 15100c7d97c5SJed Brown #define __FUNCT__ "PCBDDCCoarseSetUp" 151153cdbc3dSStefano Zampini static PetscErrorCode PCBDDCCoarseSetUp(PC pc) 15120c7d97c5SJed Brown { 15130c7d97c5SJed Brown PetscErrorCode ierr; 15140c7d97c5SJed Brown 15150c7d97c5SJed Brown PC_IS* pcis = (PC_IS*)(pc->data); 15160c7d97c5SJed Brown PC_BDDC* pcbddc = (PC_BDDC*)pc->data; 15170c7d97c5SJed Brown Mat_IS *matis = (Mat_IS*)pc->pmat->data; 1518534831adSStefano Zampini Mat change_mat_all; 15190c7d97c5SJed Brown IS is_R_local; 15200c7d97c5SJed Brown IS is_V_local; 15210c7d97c5SJed Brown IS is_C_local; 15220c7d97c5SJed Brown IS is_aux1; 15230c7d97c5SJed Brown IS is_aux2; 15240c7d97c5SJed Brown const VecType impVecType; 15250c7d97c5SJed Brown const MatType impMatType; 15260c7d97c5SJed Brown PetscInt n_R=0; 15270c7d97c5SJed Brown PetscInt n_D=0; 15280c7d97c5SJed Brown PetscInt n_B=0; 15290c7d97c5SJed Brown PetscScalar zero=0.0; 15300c7d97c5SJed Brown PetscScalar one=1.0; 15310c7d97c5SJed Brown PetscScalar m_one=-1.0; 15320c7d97c5SJed Brown PetscScalar* array; 15330c7d97c5SJed Brown PetscScalar *coarse_submat_vals; 15340c7d97c5SJed Brown PetscInt *idx_R_local; 15350c7d97c5SJed Brown PetscInt *idx_V_B; 15360c7d97c5SJed Brown PetscScalar *coarsefunctions_errors; 15370c7d97c5SJed Brown PetscScalar *constraints_errors; 15380c7d97c5SJed Brown /* auxiliary indices */ 1539534831adSStefano Zampini PetscInt i,j,k; 1540e269702eSStefano Zampini /* for verbose output of bddc */ 1541e269702eSStefano Zampini PetscViewer viewer=pcbddc->dbg_viewer; 1542e269702eSStefano Zampini PetscBool dbg_flag=pcbddc->dbg_flag; 1543a0ba757dSStefano Zampini /* for counting coarse dofs */ 1544534831adSStefano Zampini PetscInt n_vertices,n_constraints; 15453b03a366Sstefano_zampini PetscInt size_of_constraint; 15463b03a366Sstefano_zampini PetscInt *row_cmat_indices; 15473b03a366Sstefano_zampini PetscScalar *row_cmat_values; 1548534831adSStefano Zampini PetscInt *vertices,*nnz,*is_indices,*temp_indices; 15490c7d97c5SJed Brown 15500c7d97c5SJed Brown PetscFunctionBegin; 15510c7d97c5SJed Brown /* Set Non-overlapping dimensions */ 15520c7d97c5SJed Brown n_B = pcis->n_B; n_D = pcis->n - n_B; 1553534831adSStefano Zampini /* Set types for local objects needed by BDDC precondtioner */ 1554534831adSStefano Zampini impMatType = MATSEQDENSE; 1555534831adSStefano Zampini impVecType = VECSEQ; 1556da1bb401SStefano Zampini /* get vertex indices from constraint matrix */ 1557534831adSStefano Zampini ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscInt),&vertices);CHKERRQ(ierr); 1558534831adSStefano Zampini n_vertices=0; 1559da1bb401SStefano Zampini for(i=0;i<pcbddc->local_primal_size;i++) { 1560da1bb401SStefano Zampini ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr); 1561da1bb401SStefano Zampini if(size_of_constraint == 1) { 1562534831adSStefano Zampini vertices[n_vertices]=row_cmat_indices[0]; 1563534831adSStefano Zampini n_vertices++; 1564a0ba757dSStefano Zampini } 1565da1bb401SStefano Zampini ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr); 1566a0ba757dSStefano Zampini } 1567534831adSStefano Zampini /* Set number of constraints */ 1568534831adSStefano Zampini n_constraints = pcbddc->local_primal_size-n_vertices; 1569534831adSStefano Zampini 1570534831adSStefano Zampini /* vertices in boundary numbering */ 1571534831adSStefano Zampini if(n_vertices) { 1572534831adSStefano Zampini ierr = VecSet(pcis->vec1_N,m_one);CHKERRQ(ierr); 1573534831adSStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 1574534831adSStefano Zampini for (i=0; i<n_vertices; i++) { array[ vertices[i] ] = i; } 1575534831adSStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 1576534831adSStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1577534831adSStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 1578534831adSStefano Zampini ierr = PetscMalloc(n_vertices*sizeof(PetscInt),&idx_V_B);CHKERRQ(ierr); 1579534831adSStefano Zampini ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr); 1580534831adSStefano Zampini for (i=0; i<n_vertices; i++) { 1581534831adSStefano Zampini j=0; 1582534831adSStefano Zampini while (array[j] != i ) {j++;} 1583534831adSStefano Zampini idx_V_B[i]=j; 1584534831adSStefano Zampini } 1585534831adSStefano Zampini ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr); 1586534831adSStefano Zampini } 1587534831adSStefano Zampini 1588534831adSStefano Zampini /* transform local matrices if needed */ 1589534831adSStefano Zampini if(pcbddc->usechangeofbasis) { 1590534831adSStefano Zampini ierr = PetscMalloc(pcis->n*sizeof(PetscInt),&nnz);CHKERRQ(ierr); 1591534831adSStefano Zampini ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 1592534831adSStefano Zampini for(i=0;i<n_D;i++) { 1593534831adSStefano Zampini nnz[is_indices[i]]=1; 1594534831adSStefano Zampini } 1595534831adSStefano Zampini ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 1596534831adSStefano Zampini ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 1597534831adSStefano Zampini k=1; 1598534831adSStefano Zampini for(i=0;i<n_B;i++) { 1599534831adSStefano Zampini ierr = MatGetRow(pcbddc->ChangeOfBasisMatrix,i,&j,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr); 1600534831adSStefano Zampini nnz[is_indices[i]]=j; 1601534831adSStefano Zampini if( k < j) { 1602534831adSStefano Zampini k = j; 1603534831adSStefano Zampini } 1604534831adSStefano Zampini ierr = MatRestoreRow(pcbddc->ChangeOfBasisMatrix,i,&j,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr); 1605534831adSStefano Zampini } 1606534831adSStefano Zampini ierr = ISRestoreIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 1607534831adSStefano Zampini /* assemble change of basis matrix on the whole set of local dofs */ 1608534831adSStefano Zampini ierr = PetscMalloc(k*sizeof(PetscInt),&temp_indices);CHKERRQ(ierr); 1609534831adSStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&change_mat_all);CHKERRQ(ierr); 1610534831adSStefano Zampini ierr = MatSetSizes(change_mat_all,pcis->n,pcis->n,pcis->n,pcis->n);CHKERRQ(ierr); 1611534831adSStefano Zampini ierr = MatSetType(change_mat_all,MATSEQAIJ);CHKERRQ(ierr); 1612534831adSStefano Zampini ierr = MatSeqAIJSetPreallocation(change_mat_all,0,nnz);CHKERRQ(ierr); 1613534831adSStefano Zampini ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 1614534831adSStefano Zampini for(i=0;i<n_D;i++) { 1615534831adSStefano Zampini ierr = MatSetValue(change_mat_all,is_indices[i],is_indices[i],1.0,INSERT_VALUES);CHKERRQ(ierr); 1616534831adSStefano Zampini } 1617534831adSStefano Zampini ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 1618534831adSStefano Zampini ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 1619534831adSStefano Zampini for(i=0;i<n_B;i++) { 1620534831adSStefano Zampini ierr = MatGetRow(pcbddc->ChangeOfBasisMatrix,i,&j,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr); 1621534831adSStefano Zampini for(k=0;k<j;k++) { 1622534831adSStefano Zampini temp_indices[k]=is_indices[row_cmat_indices[k]]; 1623534831adSStefano Zampini } 1624534831adSStefano Zampini ierr = MatSetValues(change_mat_all,1,&is_indices[i],j,temp_indices,row_cmat_values,INSERT_VALUES);CHKERRQ(ierr); 1625534831adSStefano Zampini ierr = MatRestoreRow(pcbddc->ChangeOfBasisMatrix,i,&j,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr); 1626534831adSStefano Zampini } 1627534831adSStefano Zampini ierr = MatAssemblyBegin(change_mat_all,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1628534831adSStefano Zampini ierr = MatAssemblyEnd(change_mat_all,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 1629534831adSStefano Zampini ierr = MatPtAP(matis->A,change_mat_all,MAT_INITIAL_MATRIX,1.0,&pcbddc->local_mat);CHKERRQ(ierr); 1630534831adSStefano Zampini ierr = MatDestroy(&pcis->A_IB);CHKERRQ(ierr); 1631534831adSStefano Zampini ierr = MatDestroy(&pcis->A_BI);CHKERRQ(ierr); 1632534831adSStefano Zampini ierr = MatDestroy(&pcis->A_BB);CHKERRQ(ierr); 1633534831adSStefano Zampini ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_I_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&pcis->A_IB);CHKERRQ(ierr); 1634534831adSStefano Zampini ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_B_local,pcis->is_I_local,MAT_INITIAL_MATRIX,&pcis->A_BI);CHKERRQ(ierr); 1635534831adSStefano Zampini ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_B_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&pcis->A_BB);CHKERRQ(ierr); 1636534831adSStefano Zampini ierr = MatDestroy(&change_mat_all);CHKERRQ(ierr); 1637534831adSStefano Zampini ierr = PetscFree(nnz);CHKERRQ(ierr); 1638534831adSStefano Zampini ierr = PetscFree(temp_indices);CHKERRQ(ierr); 1639534831adSStefano Zampini } else { 1640534831adSStefano Zampini /* without change of basis, the local matrix is unchanged */ 1641534831adSStefano Zampini ierr = PetscObjectReference((PetscObject)matis->A);CHKERRQ(ierr); 1642534831adSStefano Zampini pcbddc->local_mat = matis->A; 1643534831adSStefano Zampini } 1644a0ba757dSStefano Zampini 16450c7d97c5SJed Brown /* Dohrmann's notation: dofs splitted in R (Remaining: all dofs but the vertices) and V (Vertices) */ 16460c7d97c5SJed Brown ierr = VecSet(pcis->vec1_N,one);CHKERRQ(ierr); 16470c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 16483b03a366Sstefano_zampini for (i=0;i<n_vertices;i++) { array[ vertices[i] ] = zero; } 16493b03a366Sstefano_zampini ierr = PetscMalloc(( pcis->n - n_vertices )*sizeof(PetscInt),&idx_R_local);CHKERRQ(ierr); 16500c7d97c5SJed Brown for (i=0, n_R=0; i<pcis->n; i++) { if (array[i] == one) { idx_R_local[n_R] = i; n_R++; } } 16510c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 1652e269702eSStefano Zampini if(dbg_flag) { 16530c7d97c5SJed Brown ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr); 16540c7d97c5SJed Brown ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 16550c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d local dimensions\n",PetscGlobalRank);CHKERRQ(ierr); 16560c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local_size = %d, dirichlet_size = %d, boundary_size = %d\n",pcis->n,n_D,n_B);CHKERRQ(ierr); 16573b03a366Sstefano_zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"r_size = %d, v_size = %d, constraints = %d, local_primal_size = %d\n",n_R,n_vertices,n_constraints,pcbddc->local_primal_size);CHKERRQ(ierr); 1658534831adSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"pcbddc->n_vertices = %d, pcbddc->n_constraints = %d\n",pcbddc->n_vertices,pcbddc->n_constraints);CHKERRQ(ierr); 16590c7d97c5SJed Brown ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 16600c7d97c5SJed Brown } 1661534831adSStefano Zampini 16620c7d97c5SJed Brown /* Allocate needed vectors */ 1663534831adSStefano Zampini ierr = VecDuplicate(pcis->vec1_global,&pcbddc->original_rhs);CHKERRQ(ierr); 16640c7d97c5SJed Brown ierr = VecDuplicate(pcis->vec1_D,&pcbddc->vec4_D);CHKERRQ(ierr); 16650c7d97c5SJed Brown ierr = VecCreate(PETSC_COMM_SELF,&pcbddc->vec1_R);CHKERRQ(ierr); 16660c7d97c5SJed Brown ierr = VecSetSizes(pcbddc->vec1_R,n_R,n_R);CHKERRQ(ierr); 16670c7d97c5SJed Brown ierr = VecSetType(pcbddc->vec1_R,impVecType);CHKERRQ(ierr); 1668d49ef151SStefano Zampini ierr = VecDuplicate(pcbddc->vec1_R,&pcbddc->vec2_R);CHKERRQ(ierr); 16690c7d97c5SJed Brown ierr = VecCreate(PETSC_COMM_SELF,&pcbddc->vec1_P);CHKERRQ(ierr); 16700c7d97c5SJed Brown ierr = VecSetSizes(pcbddc->vec1_P,pcbddc->local_primal_size,pcbddc->local_primal_size);CHKERRQ(ierr); 16710c7d97c5SJed Brown ierr = VecSetType(pcbddc->vec1_P,impVecType);CHKERRQ(ierr); 16720c7d97c5SJed Brown 16730c7d97c5SJed Brown /* Creating some index sets needed */ 16740c7d97c5SJed Brown /* For submatrices */ 1675da1bb401SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,n_R,idx_R_local,PETSC_OWN_POINTER,&is_R_local);CHKERRQ(ierr); 16763b03a366Sstefano_zampini if(n_vertices) { 1677da1bb401SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,n_vertices,vertices,PETSC_OWN_POINTER,&is_V_local);CHKERRQ(ierr); 16783b03a366Sstefano_zampini } 1679da1bb401SStefano Zampini if(n_constraints) { 1680da1bb401SStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,n_constraints,n_vertices,1,&is_C_local);CHKERRQ(ierr); 1681da1bb401SStefano Zampini } 1682da1bb401SStefano Zampini 16830c7d97c5SJed Brown /* For VecScatters pcbddc->R_to_B and (optionally) pcbddc->R_to_D */ 16840c7d97c5SJed Brown { 16850c7d97c5SJed Brown PetscInt *aux_array1; 16860c7d97c5SJed Brown PetscInt *aux_array2; 16870c7d97c5SJed Brown 16883b03a366Sstefano_zampini ierr = PetscMalloc( (pcis->n_B-n_vertices)*sizeof(PetscInt),&aux_array1);CHKERRQ(ierr); 16893b03a366Sstefano_zampini ierr = PetscMalloc( (pcis->n_B-n_vertices)*sizeof(PetscInt),&aux_array2);CHKERRQ(ierr); 16900c7d97c5SJed Brown 1691d49ef151SStefano Zampini ierr = VecSet(pcis->vec1_global,zero);CHKERRQ(ierr); 16920c7d97c5SJed Brown ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 16930c7d97c5SJed Brown ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 16940c7d97c5SJed Brown ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 16950c7d97c5SJed Brown ierr = VecScatterEnd (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 16960c7d97c5SJed Brown ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 16970c7d97c5SJed Brown ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 16980c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 1699da1bb401SStefano Zampini for (i=0, j=0; i<n_R; i++) { if (array[idx_R_local[i]] > one) { aux_array1[j] = i; j++; } } 17000c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 1701da1bb401SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_COPY_VALUES,&is_aux1);CHKERRQ(ierr); 17020c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr); 1703da1bb401SStefano Zampini for (i=0, j=0; i<n_B; i++) { if (array[i] > one) { aux_array2[j] = i; j++; } } 17043828260eSStefano Zampini ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr); 1705da1bb401SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array2,PETSC_COPY_VALUES,&is_aux2);CHKERRQ(ierr); 17060c7d97c5SJed Brown ierr = VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_B,is_aux2,&pcbddc->R_to_B);CHKERRQ(ierr); 17070c7d97c5SJed Brown ierr = PetscFree(aux_array1);CHKERRQ(ierr); 17080c7d97c5SJed Brown ierr = PetscFree(aux_array2);CHKERRQ(ierr); 17090c7d97c5SJed Brown ierr = ISDestroy(&is_aux1);CHKERRQ(ierr); 17100c7d97c5SJed Brown ierr = ISDestroy(&is_aux2);CHKERRQ(ierr); 17110c7d97c5SJed Brown 1712e269702eSStefano Zampini if(pcbddc->prec_type || dbg_flag ) { 17130c7d97c5SJed Brown ierr = PetscMalloc(n_D*sizeof(PetscInt),&aux_array1);CHKERRQ(ierr); 17140c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 1715da1bb401SStefano Zampini for (i=0, j=0; i<n_R; i++) { if (array[idx_R_local[i]] == one) { aux_array1[j] = i; j++; } } 17160c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 1717da1bb401SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_COPY_VALUES,&is_aux1);CHKERRQ(ierr); 17180c7d97c5SJed Brown ierr = VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_D,(IS)0,&pcbddc->R_to_D);CHKERRQ(ierr); 17190c7d97c5SJed Brown ierr = PetscFree(aux_array1);CHKERRQ(ierr); 17200c7d97c5SJed Brown ierr = ISDestroy(&is_aux1);CHKERRQ(ierr); 17210c7d97c5SJed Brown } 17220c7d97c5SJed Brown } 17230c7d97c5SJed Brown 17240c7d97c5SJed Brown /* Creating PC contexts for local Dirichlet and Neumann problems */ 17250c7d97c5SJed Brown { 17260c7d97c5SJed Brown Mat A_RR; 172753cdbc3dSStefano Zampini PC pc_temp; 17280c7d97c5SJed Brown /* Matrix for Dirichlet problem is A_II -> we already have it from pcis.c code */ 172953cdbc3dSStefano Zampini ierr = KSPCreate(PETSC_COMM_SELF,&pcbddc->ksp_D);CHKERRQ(ierr); 173053cdbc3dSStefano Zampini ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->ksp_D,(PetscObject)pc,1);CHKERRQ(ierr); 173153cdbc3dSStefano Zampini ierr = KSPSetOperators(pcbddc->ksp_D,pcis->A_II,pcis->A_II,SAME_PRECONDITIONER);CHKERRQ(ierr); 173253cdbc3dSStefano Zampini ierr = KSPSetType(pcbddc->ksp_D,KSPPREONLY);CHKERRQ(ierr); 1733da1bb401SStefano Zampini ierr = KSPSetOptionsPrefix(pcbddc->ksp_D,"dirichlet_");CHKERRQ(ierr); 17340c7d97c5SJed Brown /* default */ 173553cdbc3dSStefano Zampini ierr = KSPGetPC(pcbddc->ksp_D,&pc_temp);CHKERRQ(ierr); 173653cdbc3dSStefano Zampini ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr); 17370c7d97c5SJed Brown /* Allow user's customization */ 173853cdbc3dSStefano Zampini ierr = KSPSetFromOptions(pcbddc->ksp_D);CHKERRQ(ierr); 173953cdbc3dSStefano Zampini /* Set Up KSP for Dirichlet problem of BDDC */ 174053cdbc3dSStefano Zampini ierr = KSPSetUp(pcbddc->ksp_D);CHKERRQ(ierr); 1741da1bb401SStefano Zampini if(pcbddc->dbg_flag) ierr = KSPView(pcbddc->ksp_D,PETSC_VIEWER_STDOUT_SELF); 17420c7d97c5SJed Brown /* Matrix for Neumann problem is A_RR -> we need to create it */ 1743534831adSStefano Zampini ierr = MatGetSubMatrix(pcbddc->local_mat,is_R_local,is_R_local,MAT_INITIAL_MATRIX,&A_RR);CHKERRQ(ierr); 174453cdbc3dSStefano Zampini ierr = KSPCreate(PETSC_COMM_SELF,&pcbddc->ksp_R);CHKERRQ(ierr); 174553cdbc3dSStefano Zampini ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->ksp_R,(PetscObject)pc,1);CHKERRQ(ierr); 174653cdbc3dSStefano Zampini ierr = KSPSetOperators(pcbddc->ksp_R,A_RR,A_RR,SAME_PRECONDITIONER);CHKERRQ(ierr); 174753cdbc3dSStefano Zampini ierr = KSPSetType(pcbddc->ksp_R,KSPPREONLY);CHKERRQ(ierr); 1748da1bb401SStefano Zampini ierr = KSPSetOptionsPrefix(pcbddc->ksp_R,"neumann_");CHKERRQ(ierr); 17490c7d97c5SJed Brown /* default */ 175053cdbc3dSStefano Zampini ierr = KSPGetPC(pcbddc->ksp_R,&pc_temp);CHKERRQ(ierr); 175153cdbc3dSStefano Zampini ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr); 17520c7d97c5SJed Brown /* Allow user's customization */ 175353cdbc3dSStefano Zampini ierr = KSPSetFromOptions(pcbddc->ksp_R);CHKERRQ(ierr); 175453cdbc3dSStefano Zampini /* Set Up KSP for Neumann problem of BDDC */ 175553cdbc3dSStefano Zampini ierr = KSPSetUp(pcbddc->ksp_R);CHKERRQ(ierr); 1756da1bb401SStefano Zampini if(pcbddc->dbg_flag) ierr = KSPView(pcbddc->ksp_R,PETSC_VIEWER_STDOUT_SELF); 1757a0ba757dSStefano Zampini /* check Dirichlet and Neumann solvers */ 1758e269702eSStefano Zampini if(pcbddc->dbg_flag) { 17590c7d97c5SJed Brown Vec temp_vec; 17600c7d97c5SJed Brown PetscScalar value; 17610c7d97c5SJed Brown 1762a0ba757dSStefano Zampini ierr = VecDuplicate(pcis->vec1_D,&temp_vec);CHKERRQ(ierr); 1763a0ba757dSStefano Zampini ierr = VecSetRandom(pcis->vec1_D,PETSC_NULL);CHKERRQ(ierr); 1764a0ba757dSStefano Zampini ierr = MatMult(pcis->A_II,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr); 1765a0ba757dSStefano Zampini ierr = KSPSolve(pcbddc->ksp_D,pcis->vec2_D,temp_vec);CHKERRQ(ierr); 1766a0ba757dSStefano Zampini ierr = VecAXPY(temp_vec,m_one,pcis->vec1_D);CHKERRQ(ierr); 1767a0ba757dSStefano Zampini ierr = VecNorm(temp_vec,NORM_INFINITY,&value);CHKERRQ(ierr); 1768a0ba757dSStefano Zampini ierr = VecDestroy(&temp_vec);CHKERRQ(ierr); 1769a0ba757dSStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 1770a0ba757dSStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr); 1771a0ba757dSStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Checking solution of Dirichlet and Neumann problems\n");CHKERRQ(ierr); 1772a0ba757dSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d infinity error for Dirichlet solve = % 1.14e \n",PetscGlobalRank,value);CHKERRQ(ierr); 1773d49ef151SStefano Zampini ierr = VecDuplicate(pcbddc->vec1_R,&temp_vec);CHKERRQ(ierr); 1774d49ef151SStefano Zampini ierr = VecSetRandom(pcbddc->vec1_R,PETSC_NULL);CHKERRQ(ierr); 1775d49ef151SStefano Zampini ierr = MatMult(A_RR,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr); 1776d49ef151SStefano Zampini ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec2_R,temp_vec);CHKERRQ(ierr); 1777d49ef151SStefano Zampini ierr = VecAXPY(temp_vec,m_one,pcbddc->vec1_R);CHKERRQ(ierr); 1778d49ef151SStefano Zampini ierr = VecNorm(temp_vec,NORM_INFINITY,&value);CHKERRQ(ierr); 1779e269702eSStefano Zampini ierr = VecDestroy(&temp_vec);CHKERRQ(ierr); 17800c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d infinity error for Neumann solve = % 1.14e \n",PetscGlobalRank,value);CHKERRQ(ierr); 1781d49ef151SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 17820c7d97c5SJed Brown } 17830c7d97c5SJed Brown /* free Neumann problem's matrix */ 17840c7d97c5SJed Brown ierr = MatDestroy(&A_RR);CHKERRQ(ierr); 17850c7d97c5SJed Brown } 17860c7d97c5SJed Brown 17870c7d97c5SJed Brown /* Assemble all remaining stuff needed to apply BDDC */ 17880c7d97c5SJed Brown { 17890c7d97c5SJed Brown Mat A_RV,A_VR,A_VV; 17900c7d97c5SJed Brown Mat M1,M2; 17910c7d97c5SJed Brown Mat C_CR; 17923b03a366Sstefano_zampini Mat AUXMAT; 17930c7d97c5SJed Brown Vec vec1_C; 17940c7d97c5SJed Brown Vec vec2_C; 17950c7d97c5SJed Brown Vec vec1_V; 17960c7d97c5SJed Brown Vec vec2_V; 17970c7d97c5SJed Brown PetscInt *nnz; 17980c7d97c5SJed Brown PetscInt *auxindices; 179953cdbc3dSStefano Zampini PetscInt index; 18000c7d97c5SJed Brown PetscScalar* array2; 18010c7d97c5SJed Brown MatFactorInfo matinfo; 18020c7d97c5SJed Brown 18030c7d97c5SJed Brown /* Allocating some extra storage just to be safe */ 18040c7d97c5SJed Brown ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&nnz);CHKERRQ(ierr); 18050c7d97c5SJed Brown ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&auxindices);CHKERRQ(ierr); 18060c7d97c5SJed Brown for(i=0;i<pcis->n;i++) {auxindices[i]=i;} 18070c7d97c5SJed Brown 18080c7d97c5SJed Brown /* some work vectors on vertices and/or constraints */ 18093b03a366Sstefano_zampini if(n_vertices) { 18100c7d97c5SJed Brown ierr = VecCreate(PETSC_COMM_SELF,&vec1_V);CHKERRQ(ierr); 18113b03a366Sstefano_zampini ierr = VecSetSizes(vec1_V,n_vertices,n_vertices);CHKERRQ(ierr); 18120c7d97c5SJed Brown ierr = VecSetType(vec1_V,impVecType);CHKERRQ(ierr); 18130c7d97c5SJed Brown ierr = VecDuplicate(vec1_V,&vec2_V);CHKERRQ(ierr); 18140c7d97c5SJed Brown } 1815534831adSStefano Zampini if(n_constraints) { 18160c7d97c5SJed Brown ierr = VecCreate(PETSC_COMM_SELF,&vec1_C);CHKERRQ(ierr); 1817534831adSStefano Zampini ierr = VecSetSizes(vec1_C,n_constraints,n_constraints);CHKERRQ(ierr); 18180c7d97c5SJed Brown ierr = VecSetType(vec1_C,impVecType);CHKERRQ(ierr); 18190c7d97c5SJed Brown ierr = VecDuplicate(vec1_C,&vec2_C);CHKERRQ(ierr); 18200c7d97c5SJed Brown ierr = VecDuplicate(vec1_C,&pcbddc->vec1_C);CHKERRQ(ierr); 18210c7d97c5SJed Brown } 18220c7d97c5SJed Brown /* Precompute stuffs needed for preprocessing and application of BDDC*/ 18233b03a366Sstefano_zampini if(n_constraints) { 18240c7d97c5SJed Brown /* some work vectors */ 18250c7d97c5SJed Brown ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->local_auxmat2);CHKERRQ(ierr); 18263b03a366Sstefano_zampini ierr = MatSetSizes(pcbddc->local_auxmat2,n_R,n_constraints,n_R,n_constraints);CHKERRQ(ierr); 18270c7d97c5SJed Brown ierr = MatSetType(pcbddc->local_auxmat2,impMatType);CHKERRQ(ierr); 18283b03a366Sstefano_zampini ierr = MatSeqDenseSetPreallocation(pcbddc->local_auxmat2,PETSC_NULL);CHKERRQ(ierr); 18290c7d97c5SJed Brown 18300c7d97c5SJed Brown /* Assemble local_auxmat2 = - A_{RR}^{-1} C^T_{CR} needed by BDDC application */ 18313b03a366Sstefano_zampini for(i=0;i<n_constraints;i++) { 1832d49ef151SStefano Zampini ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr); 18333b03a366Sstefano_zampini ierr = VecSet(pcbddc->vec1_R,zero);CHKERRQ(ierr); 18343b03a366Sstefano_zampini /* Get row of constraint matrix in R numbering */ 18350c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 18363b03a366Sstefano_zampini ierr = MatGetRow(pcbddc->ConstraintMatrix,n_vertices+i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr); 18373b03a366Sstefano_zampini for(j=0;j<size_of_constraint;j++) { array[ row_cmat_indices[j] ] = - row_cmat_values[j]; } 18383b03a366Sstefano_zampini ierr = MatRestoreRow(pcbddc->ConstraintMatrix,n_vertices+i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr); 18390c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr); 18400c7d97c5SJed Brown for(j=0;j<n_R;j++) { array2[j] = array[ idx_R_local[j] ]; } 18410c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 18420c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr); 18433b03a366Sstefano_zampini /* Solve for row of constraint matrix in R numbering */ 184453cdbc3dSStefano Zampini ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr); 18453b03a366Sstefano_zampini /* Set values */ 18460c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec2_R,&array);CHKERRQ(ierr); 18473b03a366Sstefano_zampini ierr = MatSetValues(pcbddc->local_auxmat2,n_R,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr); 18480c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec2_R,&array);CHKERRQ(ierr); 18490c7d97c5SJed Brown } 18500c7d97c5SJed Brown ierr = MatAssemblyBegin(pcbddc->local_auxmat2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 18510c7d97c5SJed Brown ierr = MatAssemblyEnd(pcbddc->local_auxmat2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 18520c7d97c5SJed Brown 18530c7d97c5SJed Brown /* Create Constraint matrix on R nodes: C_{CR} */ 18543b03a366Sstefano_zampini ierr = MatGetSubMatrix(pcbddc->ConstraintMatrix,is_C_local,is_R_local,MAT_INITIAL_MATRIX,&C_CR);CHKERRQ(ierr); 18550c7d97c5SJed Brown ierr = ISDestroy(&is_C_local);CHKERRQ(ierr); 18560c7d97c5SJed Brown 18570c7d97c5SJed Brown /* Assemble AUXMAT = ( LUFactor )( -C_{CR} A_{RR}^{-1} C^T_{CR} )^{-1} */ 18580c7d97c5SJed Brown ierr = MatMatMult(C_CR,pcbddc->local_auxmat2,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&AUXMAT);CHKERRQ(ierr); 1859d49ef151SStefano Zampini ierr = MatFactorInfoInitialize(&matinfo);CHKERRQ(ierr); 18603b03a366Sstefano_zampini ierr = ISCreateStride(PETSC_COMM_SELF,n_constraints,0,1,&is_aux1);CHKERRQ(ierr); 18610c7d97c5SJed Brown ierr = MatLUFactor(AUXMAT,is_aux1,is_aux1,&matinfo);CHKERRQ(ierr); 18620c7d97c5SJed Brown ierr = ISDestroy(&is_aux1);CHKERRQ(ierr); 18630c7d97c5SJed Brown 18643b03a366Sstefano_zampini /* Assemble explicitly M1 = ( C_{CR} A_{RR}^{-1} C^T_{CR} )^{-1} needed in preproc */ 1865d49ef151SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&M1);CHKERRQ(ierr); 18663b03a366Sstefano_zampini ierr = MatSetSizes(M1,n_constraints,n_constraints,n_constraints,n_constraints);CHKERRQ(ierr); 18670c7d97c5SJed Brown ierr = MatSetType(M1,impMatType);CHKERRQ(ierr); 18683b03a366Sstefano_zampini ierr = MatSeqDenseSetPreallocation(M1,PETSC_NULL);CHKERRQ(ierr); 18693b03a366Sstefano_zampini for(i=0;i<n_constraints;i++) { 18700c7d97c5SJed Brown ierr = VecSet(vec1_C,zero);CHKERRQ(ierr); 18710c7d97c5SJed Brown ierr = VecSetValue(vec1_C,i,one,INSERT_VALUES);CHKERRQ(ierr); 18720c7d97c5SJed Brown ierr = VecAssemblyBegin(vec1_C);CHKERRQ(ierr); 18730c7d97c5SJed Brown ierr = VecAssemblyEnd(vec1_C);CHKERRQ(ierr); 18740c7d97c5SJed Brown ierr = MatSolve(AUXMAT,vec1_C,vec2_C);CHKERRQ(ierr); 18750c7d97c5SJed Brown ierr = VecScale(vec2_C,m_one);CHKERRQ(ierr); 18760c7d97c5SJed Brown ierr = VecGetArray(vec2_C,&array);CHKERRQ(ierr); 18773b03a366Sstefano_zampini ierr = MatSetValues(M1,n_constraints,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr); 18780c7d97c5SJed Brown ierr = VecRestoreArray(vec2_C,&array);CHKERRQ(ierr); 18790c7d97c5SJed Brown } 18800c7d97c5SJed Brown ierr = MatAssemblyBegin(M1,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 18810c7d97c5SJed Brown ierr = MatAssemblyEnd(M1,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 18820c7d97c5SJed Brown ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr); 18830c7d97c5SJed Brown /* Assemble local_auxmat1 = M1*C_{CR} needed by BDDC application in KSP and in preproc */ 18840c7d97c5SJed Brown ierr = MatMatMult(M1,C_CR,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&pcbddc->local_auxmat1);CHKERRQ(ierr); 18850c7d97c5SJed Brown 18860c7d97c5SJed Brown } 18870c7d97c5SJed Brown 18880c7d97c5SJed Brown /* Get submatrices from subdomain matrix */ 18893b03a366Sstefano_zampini if(n_vertices){ 1890534831adSStefano Zampini ierr = MatGetSubMatrix(pcbddc->local_mat,is_R_local,is_V_local,MAT_INITIAL_MATRIX,&A_RV);CHKERRQ(ierr); 1891534831adSStefano Zampini ierr = MatGetSubMatrix(pcbddc->local_mat,is_V_local,is_R_local,MAT_INITIAL_MATRIX,&A_VR);CHKERRQ(ierr); 1892534831adSStefano Zampini ierr = MatGetSubMatrix(pcbddc->local_mat,is_V_local,is_V_local,MAT_INITIAL_MATRIX,&A_VV);CHKERRQ(ierr); 18930c7d97c5SJed Brown /* Assemble M2 = A_RR^{-1}A_RV */ 1894d49ef151SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&M2);CHKERRQ(ierr); 18953b03a366Sstefano_zampini ierr = MatSetSizes(M2,n_R,n_vertices,n_R,n_vertices);CHKERRQ(ierr); 18960c7d97c5SJed Brown ierr = MatSetType(M2,impMatType);CHKERRQ(ierr); 18973b03a366Sstefano_zampini ierr = MatSeqDenseSetPreallocation(M2,PETSC_NULL);CHKERRQ(ierr); 18983b03a366Sstefano_zampini for(i=0;i<n_vertices;i++) { 18990c7d97c5SJed Brown ierr = VecSet(vec1_V,zero);CHKERRQ(ierr); 19000c7d97c5SJed Brown ierr = VecSetValue(vec1_V,i,one,INSERT_VALUES);CHKERRQ(ierr); 19010c7d97c5SJed Brown ierr = VecAssemblyBegin(vec1_V);CHKERRQ(ierr); 19020c7d97c5SJed Brown ierr = VecAssemblyEnd(vec1_V);CHKERRQ(ierr); 19030c7d97c5SJed Brown ierr = MatMult(A_RV,vec1_V,pcbddc->vec1_R);CHKERRQ(ierr); 190453cdbc3dSStefano Zampini ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr); 19050c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec2_R,&array);CHKERRQ(ierr); 19063b03a366Sstefano_zampini ierr = MatSetValues(M2,n_R,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr); 19070c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec2_R,&array);CHKERRQ(ierr); 19080c7d97c5SJed Brown } 19090c7d97c5SJed Brown ierr = MatAssemblyBegin(M2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 19100c7d97c5SJed Brown ierr = MatAssemblyEnd(M2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 19110c7d97c5SJed Brown } 19120c7d97c5SJed Brown 19130c7d97c5SJed Brown /* Matrix of coarse basis functions (local) */ 1914d49ef151SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->coarse_phi_B);CHKERRQ(ierr); 19150c7d97c5SJed Brown ierr = MatSetSizes(pcbddc->coarse_phi_B,n_B,pcbddc->local_primal_size,n_B,pcbddc->local_primal_size);CHKERRQ(ierr); 19160c7d97c5SJed Brown ierr = MatSetType(pcbddc->coarse_phi_B,impMatType);CHKERRQ(ierr); 19173b03a366Sstefano_zampini ierr = MatSeqDenseSetPreallocation(pcbddc->coarse_phi_B,PETSC_NULL);CHKERRQ(ierr); 1918e269702eSStefano Zampini if(pcbddc->prec_type || dbg_flag ) { 1919d49ef151SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->coarse_phi_D);CHKERRQ(ierr); 19200c7d97c5SJed Brown ierr = MatSetSizes(pcbddc->coarse_phi_D,n_D,pcbddc->local_primal_size,n_D,pcbddc->local_primal_size);CHKERRQ(ierr); 19210c7d97c5SJed Brown ierr = MatSetType(pcbddc->coarse_phi_D,impMatType);CHKERRQ(ierr); 19223b03a366Sstefano_zampini ierr = MatSeqDenseSetPreallocation(pcbddc->coarse_phi_D,PETSC_NULL);CHKERRQ(ierr); 19230c7d97c5SJed Brown } 19240c7d97c5SJed Brown 1925e269702eSStefano Zampini if(dbg_flag) { 19260c7d97c5SJed Brown ierr = PetscMalloc( pcbddc->local_primal_size*sizeof(PetscScalar),&coarsefunctions_errors);CHKERRQ(ierr); 19270c7d97c5SJed Brown ierr = PetscMalloc( pcbddc->local_primal_size*sizeof(PetscScalar),&constraints_errors);CHKERRQ(ierr); 19280c7d97c5SJed Brown } 19293b03a366Sstefano_zampini /* Subdomain contribution (Non-overlapping) to coarse matrix */ 19300c7d97c5SJed Brown ierr = PetscMalloc ((pcbddc->local_primal_size)*(pcbddc->local_primal_size)*sizeof(PetscScalar),&coarse_submat_vals);CHKERRQ(ierr); 19310c7d97c5SJed Brown 19320c7d97c5SJed Brown /* We are now ready to evaluate coarse basis functions and subdomain contribution to coarse problem */ 19333b03a366Sstefano_zampini for(i=0;i<n_vertices;i++){ 19340c7d97c5SJed Brown ierr = VecSet(vec1_V,zero);CHKERRQ(ierr); 19350c7d97c5SJed Brown ierr = VecSetValue(vec1_V,i,one,INSERT_VALUES);CHKERRQ(ierr); 19360c7d97c5SJed Brown ierr = VecAssemblyBegin(vec1_V);CHKERRQ(ierr); 19370c7d97c5SJed Brown ierr = VecAssemblyEnd(vec1_V);CHKERRQ(ierr); 19380c7d97c5SJed Brown /* solution of saddle point problem */ 19390c7d97c5SJed Brown ierr = MatMult(M2,vec1_V,pcbddc->vec1_R);CHKERRQ(ierr); 19400c7d97c5SJed Brown ierr = VecScale(pcbddc->vec1_R,m_one);CHKERRQ(ierr); 19413b03a366Sstefano_zampini if(n_constraints) { 19420c7d97c5SJed Brown ierr = MatMult(pcbddc->local_auxmat1,pcbddc->vec1_R,vec1_C);CHKERRQ(ierr); 19430c7d97c5SJed Brown ierr = MatMultAdd(pcbddc->local_auxmat2,vec1_C,pcbddc->vec1_R,pcbddc->vec1_R);CHKERRQ(ierr); 19440c7d97c5SJed Brown ierr = VecScale(vec1_C,m_one);CHKERRQ(ierr); 19450c7d97c5SJed Brown } 19460c7d97c5SJed Brown ierr = MatMult(A_VR,pcbddc->vec1_R,vec2_V);CHKERRQ(ierr); 19470c7d97c5SJed Brown ierr = MatMultAdd(A_VV,vec1_V,vec2_V,vec2_V);CHKERRQ(ierr); 19480c7d97c5SJed Brown 19490c7d97c5SJed Brown /* Set values in coarse basis function and subdomain part of coarse_mat */ 19500c7d97c5SJed Brown /* coarse basis functions */ 19510c7d97c5SJed Brown ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr); 19520c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 19530c7d97c5SJed Brown ierr = VecScatterEnd (pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 19540c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr); 19553b03a366Sstefano_zampini ierr = MatSetValues(pcbddc->coarse_phi_B,n_B,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr); 19560c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr); 19570c7d97c5SJed Brown ierr = MatSetValue(pcbddc->coarse_phi_B,idx_V_B[i],i,one,INSERT_VALUES);CHKERRQ(ierr); 1958e269702eSStefano Zampini if( pcbddc->prec_type || dbg_flag ) { 19590c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 19600c7d97c5SJed Brown ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 19610c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_D,&array);CHKERRQ(ierr); 19623b03a366Sstefano_zampini ierr = MatSetValues(pcbddc->coarse_phi_D,n_D,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr); 19630c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_D,&array);CHKERRQ(ierr); 19640c7d97c5SJed Brown } 19650c7d97c5SJed Brown /* subdomain contribution to coarse matrix */ 19660c7d97c5SJed Brown ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr); 1967da1bb401SStefano Zampini for(j=0;j<n_vertices;j++) { coarse_submat_vals[i*pcbddc->local_primal_size+j] = array[j]; } /* WARNING -> column major ordering */ 19680c7d97c5SJed Brown ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr); 19693b03a366Sstefano_zampini if(n_constraints) { 19700c7d97c5SJed Brown ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr); 1971da1bb401SStefano Zampini for(j=0;j<n_constraints;j++) { coarse_submat_vals[i*pcbddc->local_primal_size+j+n_vertices] = array[j]; } /* WARNING -> column major ordering */ 19720c7d97c5SJed Brown ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr); 19730c7d97c5SJed Brown } 19740c7d97c5SJed Brown 1975e269702eSStefano Zampini if( dbg_flag ) { 19760c7d97c5SJed Brown /* assemble subdomain vector on nodes */ 1977d49ef151SStefano Zampini ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr); 19780c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 19790c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr); 19800c7d97c5SJed Brown for(j=0;j<n_R;j++) { array[idx_R_local[j]] = array2[j]; } 19813b03a366Sstefano_zampini array[ vertices[i] ] = one; 19820c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr); 19830c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 19840c7d97c5SJed Brown /* assemble subdomain vector of lagrange multipliers (i.e. primal nodes) */ 1985d49ef151SStefano Zampini ierr = VecSet(pcbddc->vec1_P,zero);CHKERRQ(ierr); 19860c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr); 19870c7d97c5SJed Brown ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr); 19883b03a366Sstefano_zampini for(j=0;j<n_vertices;j++) { array2[j]=array[j]; } 19890c7d97c5SJed Brown ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr); 19903b03a366Sstefano_zampini if(n_constraints) { 19910c7d97c5SJed Brown ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr); 19923b03a366Sstefano_zampini for(j=0;j<n_constraints;j++) { array2[j+n_vertices]=array[j]; } 19930c7d97c5SJed Brown ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr); 19940c7d97c5SJed Brown } 19950c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr); 19960c7d97c5SJed Brown ierr = VecScale(pcbddc->vec1_P,m_one);CHKERRQ(ierr); 19970c7d97c5SJed Brown /* check saddle point solution */ 1998534831adSStefano Zampini ierr = MatMult(pcbddc->local_mat,pcis->vec1_N,pcis->vec2_N);CHKERRQ(ierr); 19993b03a366Sstefano_zampini ierr = MatMultTransposeAdd(pcbddc->ConstraintMatrix,pcbddc->vec1_P,pcis->vec2_N,pcis->vec2_N);CHKERRQ(ierr); 20003b03a366Sstefano_zampini ierr = VecNorm(pcis->vec2_N,NORM_INFINITY,&coarsefunctions_errors[i]);CHKERRQ(ierr); 20013b03a366Sstefano_zampini ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr); 20020c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 20033b03a366Sstefano_zampini array[i]=array[i]+m_one; /* shift by the identity matrix */ 20040c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 20053b03a366Sstefano_zampini ierr = VecNorm(pcbddc->vec1_P,NORM_INFINITY,&constraints_errors[i]);CHKERRQ(ierr); 20060c7d97c5SJed Brown } 20070c7d97c5SJed Brown } 20080c7d97c5SJed Brown 20093b03a366Sstefano_zampini for(i=0;i<n_constraints;i++){ 2010d49ef151SStefano Zampini ierr = VecSet(vec2_C,zero);CHKERRQ(ierr); 20110c7d97c5SJed Brown ierr = VecSetValue(vec2_C,i,m_one,INSERT_VALUES);CHKERRQ(ierr); 20120c7d97c5SJed Brown ierr = VecAssemblyBegin(vec2_C);CHKERRQ(ierr); 20130c7d97c5SJed Brown ierr = VecAssemblyEnd(vec2_C);CHKERRQ(ierr); 20140c7d97c5SJed Brown /* solution of saddle point problem */ 20150c7d97c5SJed Brown ierr = MatMult(M1,vec2_C,vec1_C);CHKERRQ(ierr); 20160c7d97c5SJed Brown ierr = MatMult(pcbddc->local_auxmat2,vec1_C,pcbddc->vec1_R);CHKERRQ(ierr); 20170c7d97c5SJed Brown ierr = VecScale(vec1_C,m_one);CHKERRQ(ierr); 20183b03a366Sstefano_zampini if(n_vertices) { ierr = MatMult(A_VR,pcbddc->vec1_R,vec2_V);CHKERRQ(ierr); } 20190c7d97c5SJed Brown /* Set values in coarse basis function and subdomain part of coarse_mat */ 20200c7d97c5SJed Brown /* coarse basis functions */ 20213b03a366Sstefano_zampini index=i+n_vertices; 20220c7d97c5SJed Brown ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr); 20230c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 20240c7d97c5SJed Brown ierr = VecScatterEnd (pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 20250c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr); 202653cdbc3dSStefano Zampini ierr = MatSetValues(pcbddc->coarse_phi_B,n_B,auxindices,1,&index,array,INSERT_VALUES);CHKERRQ(ierr); 20270c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr); 2028e269702eSStefano Zampini if( pcbddc->prec_type || dbg_flag ) { 20290c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 20300c7d97c5SJed Brown ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 20310c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_D,&array);CHKERRQ(ierr); 203253cdbc3dSStefano Zampini ierr = MatSetValues(pcbddc->coarse_phi_D,n_D,auxindices,1,&index,array,INSERT_VALUES);CHKERRQ(ierr); 20330c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_D,&array);CHKERRQ(ierr); 20340c7d97c5SJed Brown } 20350c7d97c5SJed Brown /* subdomain contribution to coarse matrix */ 20363b03a366Sstefano_zampini if(n_vertices) { 20370c7d97c5SJed Brown ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr); 2038da1bb401SStefano Zampini for(j=0;j<n_vertices;j++) {coarse_submat_vals[index*pcbddc->local_primal_size+j]=array[j];} /* WARNING -> column major ordering */ 20390c7d97c5SJed Brown ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr); 20400c7d97c5SJed Brown } 20410c7d97c5SJed Brown ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr); 2042da1bb401SStefano Zampini for(j=0;j<n_constraints;j++) {coarse_submat_vals[index*pcbddc->local_primal_size+j+n_vertices]=array[j];} /* WARNING -> column major ordering */ 20430c7d97c5SJed Brown ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr); 20440c7d97c5SJed Brown 2045e269702eSStefano Zampini if( dbg_flag ) { 20460c7d97c5SJed Brown /* assemble subdomain vector on nodes */ 204753cdbc3dSStefano Zampini ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr); 20480c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 20490c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr); 20500c7d97c5SJed Brown for(j=0;j<n_R;j++){ array[ idx_R_local[j] ] = array2[j]; } 20510c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr); 20520c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 20530c7d97c5SJed Brown /* assemble subdomain vector of lagrange multipliers */ 205453cdbc3dSStefano Zampini ierr = VecSet(pcbddc->vec1_P,zero);CHKERRQ(ierr); 20550c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr); 20563b03a366Sstefano_zampini if( n_vertices) { 20570c7d97c5SJed Brown ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr); 20583b03a366Sstefano_zampini for(j=0;j<n_vertices;j++) {array2[j]=-array[j];} 20590c7d97c5SJed Brown ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr); 20600c7d97c5SJed Brown } 20610c7d97c5SJed Brown ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr); 20623b03a366Sstefano_zampini for(j=0;j<n_constraints;j++) {array2[j+n_vertices]=-array[j];} 20630c7d97c5SJed Brown ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr); 20640c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr); 2065534831adSStefano Zampini /* check saddle point solution CACCA*/ 2066534831adSStefano Zampini ierr = MatMult(pcbddc->local_mat,pcis->vec1_N,pcis->vec2_N);CHKERRQ(ierr); 20673b03a366Sstefano_zampini ierr = MatMultTransposeAdd(pcbddc->ConstraintMatrix,pcbddc->vec1_P,pcis->vec2_N,pcis->vec2_N);CHKERRQ(ierr); 206853cdbc3dSStefano Zampini ierr = VecNorm(pcis->vec2_N,NORM_INFINITY,&coarsefunctions_errors[index]);CHKERRQ(ierr); 20693b03a366Sstefano_zampini ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr); 20700c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 207153cdbc3dSStefano Zampini array[index]=array[index]+m_one; /* shift by the identity matrix */ 20720c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 207353cdbc3dSStefano Zampini ierr = VecNorm(pcbddc->vec1_P,NORM_INFINITY,&constraints_errors[index]);CHKERRQ(ierr); 20740c7d97c5SJed Brown } 20750c7d97c5SJed Brown } 20760c7d97c5SJed Brown ierr = MatAssemblyBegin(pcbddc->coarse_phi_B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 20770c7d97c5SJed Brown ierr = MatAssemblyEnd (pcbddc->coarse_phi_B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2078e269702eSStefano Zampini if( pcbddc->prec_type || dbg_flag ) { 20790c7d97c5SJed Brown ierr = MatAssemblyBegin(pcbddc->coarse_phi_D,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 20800c7d97c5SJed Brown ierr = MatAssemblyEnd (pcbddc->coarse_phi_D,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 20810c7d97c5SJed Brown } 20820c7d97c5SJed Brown /* Checking coarse_sub_mat and coarse basis functios */ 20830c7d97c5SJed Brown /* It shuld be \Phi^{(j)^T} A^{(j)} \Phi^{(j)}=coarse_sub_mat */ 20849d2fce94SStefano Zampini if(dbg_flag) { 20850c7d97c5SJed Brown 20860c7d97c5SJed Brown Mat coarse_sub_mat; 20870c7d97c5SJed Brown Mat TM1,TM2,TM3,TM4; 20880c7d97c5SJed Brown Mat coarse_phi_D,coarse_phi_B,A_II,A_BB,A_IB,A_BI; 2089a0ba757dSStefano Zampini const MatType checkmattype=MATSEQAIJ; 20900c7d97c5SJed Brown PetscScalar value; 20910c7d97c5SJed Brown 2092c042a7c3SStefano Zampini ierr = MatConvert(pcis->A_II,checkmattype,MAT_INITIAL_MATRIX,&A_II);CHKERRQ(ierr); 2093c042a7c3SStefano Zampini ierr = MatConvert(pcis->A_IB,checkmattype,MAT_INITIAL_MATRIX,&A_IB);CHKERRQ(ierr); 2094c042a7c3SStefano Zampini ierr = MatConvert(pcis->A_BI,checkmattype,MAT_INITIAL_MATRIX,&A_BI);CHKERRQ(ierr); 2095c042a7c3SStefano Zampini ierr = MatConvert(pcis->A_BB,checkmattype,MAT_INITIAL_MATRIX,&A_BB);CHKERRQ(ierr); 2096c042a7c3SStefano Zampini ierr = MatConvert(pcbddc->coarse_phi_D,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_D);CHKERRQ(ierr); 2097c042a7c3SStefano Zampini ierr = MatConvert(pcbddc->coarse_phi_B,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_B);CHKERRQ(ierr); 2098c042a7c3SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_size,coarse_submat_vals,&coarse_sub_mat);CHKERRQ(ierr); 2099c042a7c3SStefano Zampini ierr = MatConvert(coarse_sub_mat,checkmattype,MAT_REUSE_MATRIX,&coarse_sub_mat);CHKERRQ(ierr); 21000c7d97c5SJed Brown 2101da1bb401SStefano Zampini /*PetscViewer view_out; 2102da1bb401SStefano Zampini PetscMPIInt myrank; 2103da1bb401SStefano Zampini char filename[256]; 2104da1bb401SStefano Zampini MPI_Comm_rank(((PetscObject)pc)->comm,&myrank); 2105da1bb401SStefano Zampini sprintf(filename,"coarsesubmat_%04d.m",myrank); 2106da1bb401SStefano Zampini ierr = PetscViewerASCIIOpen(PETSC_COMM_SELF,filename,&view_out);CHKERRQ(ierr); 2107da1bb401SStefano Zampini ierr = PetscViewerSetFormat(view_out,PETSC_VIEWER_ASCII_MATLAB);CHKERRQ(ierr); 2108da1bb401SStefano Zampini ierr = MatView(coarse_sub_mat,view_out);CHKERRQ(ierr); 2109da1bb401SStefano Zampini ierr = PetscViewerDestroy(&view_out);CHKERRQ(ierr);*/ 2110da1bb401SStefano Zampini 21110c7d97c5SJed Brown ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr); 21120c7d97c5SJed Brown ierr = PetscViewerASCIIPrintf(viewer,"Check coarse sub mat and local basis functions\n");CHKERRQ(ierr); 21130c7d97c5SJed Brown ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 211453cdbc3dSStefano Zampini ierr = MatPtAP(A_II,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&TM1);CHKERRQ(ierr); 211553cdbc3dSStefano Zampini ierr = MatPtAP(A_BB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&TM2);CHKERRQ(ierr); 211653cdbc3dSStefano Zampini ierr = MatMatMult(A_IB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr); 2117c042a7c3SStefano Zampini ierr = MatTransposeMatMult(coarse_phi_D,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM3);CHKERRQ(ierr); 211853cdbc3dSStefano Zampini ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr); 211953cdbc3dSStefano Zampini ierr = MatMatMult(A_BI,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr); 2120c042a7c3SStefano Zampini ierr = MatTransposeMatMult(coarse_phi_B,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM4);CHKERRQ(ierr); 212153cdbc3dSStefano Zampini ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr); 212253cdbc3dSStefano Zampini ierr = MatAXPY(TM1,one,TM2,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr); 212353cdbc3dSStefano Zampini ierr = MatAXPY(TM1,one,TM3,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr); 212453cdbc3dSStefano Zampini ierr = MatAXPY(TM1,one,TM4,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr); 212553cdbc3dSStefano Zampini ierr = MatAXPY(TM1,m_one,coarse_sub_mat,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr); 212653cdbc3dSStefano Zampini ierr = MatNorm(TM1,NORM_INFINITY,&value);CHKERRQ(ierr); 21270c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"----------------------------------\n");CHKERRQ(ierr); 21280c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d \n",PetscGlobalRank);CHKERRQ(ierr); 21290c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"matrix error = % 1.14e\n",value);CHKERRQ(ierr); 21300c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"coarse functions errors\n");CHKERRQ(ierr); 213153cdbc3dSStefano Zampini for(i=0;i<pcbddc->local_primal_size;i++) { ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local %02d-th function error = % 1.14e\n",i,coarsefunctions_errors[i]);CHKERRQ(ierr); } 21320c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"constraints errors\n");CHKERRQ(ierr); 213353cdbc3dSStefano Zampini for(i=0;i<pcbddc->local_primal_size;i++) { ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local %02d-th function error = % 1.14e\n",i,constraints_errors[i]);CHKERRQ(ierr); } 21340c7d97c5SJed Brown ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 213553cdbc3dSStefano Zampini ierr = MatDestroy(&A_II);CHKERRQ(ierr); 213653cdbc3dSStefano Zampini ierr = MatDestroy(&A_BB);CHKERRQ(ierr); 213753cdbc3dSStefano Zampini ierr = MatDestroy(&A_IB);CHKERRQ(ierr); 213853cdbc3dSStefano Zampini ierr = MatDestroy(&A_BI);CHKERRQ(ierr); 213953cdbc3dSStefano Zampini ierr = MatDestroy(&TM1);CHKERRQ(ierr); 214053cdbc3dSStefano Zampini ierr = MatDestroy(&TM2);CHKERRQ(ierr); 214153cdbc3dSStefano Zampini ierr = MatDestroy(&TM3);CHKERRQ(ierr); 214253cdbc3dSStefano Zampini ierr = MatDestroy(&TM4);CHKERRQ(ierr); 214353cdbc3dSStefano Zampini ierr = MatDestroy(&coarse_phi_D);CHKERRQ(ierr); 214453cdbc3dSStefano Zampini ierr = MatDestroy(&coarse_sub_mat);CHKERRQ(ierr); 214553cdbc3dSStefano Zampini ierr = MatDestroy(&coarse_phi_B);CHKERRQ(ierr); 21460c7d97c5SJed Brown ierr = PetscFree(coarsefunctions_errors);CHKERRQ(ierr); 21470c7d97c5SJed Brown ierr = PetscFree(constraints_errors);CHKERRQ(ierr); 21480c7d97c5SJed Brown } 21490c7d97c5SJed Brown 21500c7d97c5SJed Brown /* create coarse matrix and data structures for message passing associated actual choice of coarse problem type */ 21510c7d97c5SJed Brown ierr = PCBDDCSetupCoarseEnvironment(pc,coarse_submat_vals);CHKERRQ(ierr); 21520c7d97c5SJed Brown /* free memory */ 21530c7d97c5SJed Brown ierr = PetscFree(coarse_submat_vals);CHKERRQ(ierr); 21540c7d97c5SJed Brown ierr = PetscFree(auxindices);CHKERRQ(ierr); 21550c7d97c5SJed Brown ierr = PetscFree(nnz);CHKERRQ(ierr); 21563b03a366Sstefano_zampini if(n_vertices) { 21570c7d97c5SJed Brown ierr = VecDestroy(&vec1_V);CHKERRQ(ierr); 21580c7d97c5SJed Brown ierr = VecDestroy(&vec2_V);CHKERRQ(ierr); 21590c7d97c5SJed Brown ierr = MatDestroy(&M2);CHKERRQ(ierr); 21600c7d97c5SJed Brown ierr = MatDestroy(&A_RV);CHKERRQ(ierr); 21610c7d97c5SJed Brown ierr = MatDestroy(&A_VR);CHKERRQ(ierr); 21620c7d97c5SJed Brown ierr = MatDestroy(&A_VV);CHKERRQ(ierr); 21630c7d97c5SJed Brown } 2164534831adSStefano Zampini if(n_constraints) { 21650c7d97c5SJed Brown ierr = VecDestroy(&vec1_C);CHKERRQ(ierr); 21660c7d97c5SJed Brown ierr = VecDestroy(&vec2_C);CHKERRQ(ierr); 21670c7d97c5SJed Brown ierr = MatDestroy(&M1);CHKERRQ(ierr); 21680c7d97c5SJed Brown ierr = MatDestroy(&C_CR);CHKERRQ(ierr); 21690c7d97c5SJed Brown } 21700c7d97c5SJed Brown } 21710c7d97c5SJed Brown /* free memory */ 21723b03a366Sstefano_zampini if(n_vertices) { 21730c7d97c5SJed Brown ierr = PetscFree(idx_V_B);CHKERRQ(ierr); 21740c7d97c5SJed Brown ierr = ISDestroy(&is_V_local);CHKERRQ(ierr); 21750c7d97c5SJed Brown } 21760c7d97c5SJed Brown ierr = ISDestroy(&is_R_local);CHKERRQ(ierr); 21770c7d97c5SJed Brown 21780c7d97c5SJed Brown PetscFunctionReturn(0); 21790c7d97c5SJed Brown } 21800c7d97c5SJed Brown 21810c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 21820c7d97c5SJed Brown 21830c7d97c5SJed Brown #undef __FUNCT__ 21840c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetupCoarseEnvironment" 218553cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetupCoarseEnvironment(PC pc,PetscScalar* coarse_submat_vals) 21860c7d97c5SJed Brown { 21870c7d97c5SJed Brown 21880c7d97c5SJed Brown 21890c7d97c5SJed Brown Mat_IS *matis = (Mat_IS*)pc->pmat->data; 21900c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 21910c7d97c5SJed Brown PC_IS *pcis = (PC_IS*)pc->data; 21920c7d97c5SJed Brown MPI_Comm prec_comm = ((PetscObject)pc)->comm; 21930c7d97c5SJed Brown MPI_Comm coarse_comm; 21940c7d97c5SJed Brown 21950c7d97c5SJed Brown /* common to all choiches */ 21960c7d97c5SJed Brown PetscScalar *temp_coarse_mat_vals; 21970c7d97c5SJed Brown PetscScalar *ins_coarse_mat_vals; 21980c7d97c5SJed Brown PetscInt *ins_local_primal_indices; 21990c7d97c5SJed Brown PetscMPIInt *localsizes2,*localdispl2; 22000c7d97c5SJed Brown PetscMPIInt size_prec_comm; 22010c7d97c5SJed Brown PetscMPIInt rank_prec_comm; 22020c7d97c5SJed Brown PetscMPIInt active_rank=MPI_PROC_NULL; 22030c7d97c5SJed Brown PetscMPIInt master_proc=0; 22040c7d97c5SJed Brown PetscInt ins_local_primal_size; 22050c7d97c5SJed Brown /* specific to MULTILEVEL_BDDC */ 22060c7d97c5SJed Brown PetscMPIInt *ranks_recv; 22070c7d97c5SJed Brown PetscMPIInt count_recv=0; 22080c7d97c5SJed Brown PetscMPIInt rank_coarse_proc_send_to; 22090c7d97c5SJed Brown PetscMPIInt coarse_color = MPI_UNDEFINED; 22100c7d97c5SJed Brown ISLocalToGlobalMapping coarse_ISLG; 22110c7d97c5SJed Brown /* some other variables */ 22120c7d97c5SJed Brown PetscErrorCode ierr; 22130c7d97c5SJed Brown const MatType coarse_mat_type; 22140c7d97c5SJed Brown const PCType coarse_pc_type; 221553cdbc3dSStefano Zampini const KSPType coarse_ksp_type; 221653cdbc3dSStefano Zampini PC pc_temp; 22170c7d97c5SJed Brown PetscInt i,j,k,bs; 22183b03a366Sstefano_zampini PetscInt max_it_coarse_ksp=1; /* don't increase this value */ 2219e269702eSStefano Zampini /* verbose output viewer */ 2220e269702eSStefano Zampini PetscViewer viewer=pcbddc->dbg_viewer; 2221e269702eSStefano Zampini PetscBool dbg_flag=pcbddc->dbg_flag; 22220c7d97c5SJed Brown 22230c7d97c5SJed Brown PetscFunctionBegin; 22240c7d97c5SJed Brown 22250c7d97c5SJed Brown ins_local_primal_indices = 0; 22260c7d97c5SJed Brown ins_coarse_mat_vals = 0; 22270c7d97c5SJed Brown localsizes2 = 0; 22280c7d97c5SJed Brown localdispl2 = 0; 22290c7d97c5SJed Brown temp_coarse_mat_vals = 0; 22300c7d97c5SJed Brown coarse_ISLG = 0; 22310c7d97c5SJed Brown 223253cdbc3dSStefano Zampini ierr = MPI_Comm_size(prec_comm,&size_prec_comm);CHKERRQ(ierr); 223353cdbc3dSStefano Zampini ierr = MPI_Comm_rank(prec_comm,&rank_prec_comm);CHKERRQ(ierr); 22340c7d97c5SJed Brown ierr = MatGetBlockSize(matis->A,&bs);CHKERRQ(ierr); 22350c7d97c5SJed Brown 2236beed3852SStefano Zampini /* Assign global numbering to coarse dofs */ 2237beed3852SStefano Zampini { 2238a0ba757dSStefano Zampini PetscScalar one=1.,zero=0.; 2239beed3852SStefano Zampini PetscScalar *array; 2240beed3852SStefano Zampini PetscMPIInt *auxlocal_primal; 2241beed3852SStefano Zampini PetscMPIInt *auxglobal_primal; 2242beed3852SStefano Zampini PetscMPIInt *all_auxglobal_primal; 2243beed3852SStefano Zampini PetscMPIInt *all_auxglobal_primal_dummy; 2244beed3852SStefano Zampini PetscMPIInt mpi_local_primal_size = (PetscMPIInt)pcbddc->local_primal_size; 2245da1bb401SStefano Zampini PetscInt *row_cmat_indices; 22463b03a366Sstefano_zampini PetscInt size_of_constraint; 2247da1bb401SStefano Zampini PetscScalar coarsesum; 2248beed3852SStefano Zampini 2249beed3852SStefano Zampini /* Construct needed data structures for message passing */ 2250beed3852SStefano Zampini ierr = PetscMalloc(mpi_local_primal_size*sizeof(PetscMPIInt),&pcbddc->local_primal_indices);CHKERRQ(ierr); 2251beed3852SStefano Zampini ierr = PetscMalloc(size_prec_comm*sizeof(PetscMPIInt),&pcbddc->local_primal_sizes);CHKERRQ(ierr); 2252beed3852SStefano Zampini ierr = PetscMalloc(size_prec_comm*sizeof(PetscMPIInt),&pcbddc->local_primal_displacements);CHKERRQ(ierr); 2253beed3852SStefano Zampini /* Gather local_primal_size information for all processes */ 22545619798eSStefano Zampini ierr = MPI_Allgather(&mpi_local_primal_size,1,MPIU_INT,&pcbddc->local_primal_sizes[0],1,MPIU_INT,prec_comm);CHKERRQ(ierr); 2255beed3852SStefano Zampini pcbddc->replicated_primal_size = 0; 2256beed3852SStefano Zampini for (i=0; i<size_prec_comm; i++) { 2257beed3852SStefano Zampini pcbddc->local_primal_displacements[i] = pcbddc->replicated_primal_size ; 2258beed3852SStefano Zampini pcbddc->replicated_primal_size += pcbddc->local_primal_sizes[i]; 2259beed3852SStefano Zampini } 22605619798eSStefano Zampini if(rank_prec_comm == 0) { 2261beed3852SStefano Zampini /* allocate some auxiliary space */ 2262beed3852SStefano Zampini ierr = PetscMalloc(pcbddc->replicated_primal_size*sizeof(*all_auxglobal_primal),&all_auxglobal_primal);CHKERRQ(ierr); 2263beed3852SStefano Zampini ierr = PetscMalloc(pcbddc->replicated_primal_size*sizeof(*all_auxglobal_primal_dummy),&all_auxglobal_primal_dummy);CHKERRQ(ierr); 2264beed3852SStefano Zampini } 2265beed3852SStefano Zampini ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscMPIInt),&auxlocal_primal);CHKERRQ(ierr); 2266beed3852SStefano Zampini ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscMPIInt),&auxglobal_primal);CHKERRQ(ierr); 2267beed3852SStefano Zampini 2268da1bb401SStefano Zampini /* First let's count coarse dofs. 2269beed3852SStefano Zampini This code fragment assumes that the number of local constraints per connected component 2270beed3852SStefano Zampini is not greater than the number of nodes defined for the connected component 2271beed3852SStefano Zampini (otherwise we will surely have linear dependence between constraints and thus a singular coarse problem) */ 22723b03a366Sstefano_zampini /* auxlocal_primal : primal indices in local nodes numbering (internal and interface) with complete queue sorted by global ordering */ 2273beed3852SStefano Zampini ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr); 2274beed3852SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 2275da1bb401SStefano Zampini for(i=0;i<pcbddc->local_primal_size;i++) { 2276da1bb401SStefano Zampini ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr); 22773b03a366Sstefano_zampini for (j=0; j<size_of_constraint; j++) { 22783b03a366Sstefano_zampini k = row_cmat_indices[j]; 2279beed3852SStefano Zampini if( array[k] == zero ) { 2280beed3852SStefano Zampini array[k] = one; 2281da1bb401SStefano Zampini auxlocal_primal[i] = k; 2282beed3852SStefano Zampini break; 2283beed3852SStefano Zampini } 2284beed3852SStefano Zampini } 2285da1bb401SStefano Zampini ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr); 2286beed3852SStefano Zampini } 2287beed3852SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 2288da1bb401SStefano Zampini ierr = VecSet(pcis->vec1_global,zero);CHKERRQ(ierr); 2289da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 2290da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 2291da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 2292da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 2293da1bb401SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 2294da1bb401SStefano Zampini for(i=0;i<pcis->n;i++) { if( array[i] > zero) array[i] = one/array[i]; } 2295da1bb401SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 2296da1bb401SStefano Zampini ierr = VecSet(pcis->vec1_global,zero);CHKERRQ(ierr); 2297da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 2298da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 2299da1bb401SStefano Zampini ierr = VecSum(pcis->vec1_global,&coarsesum);CHKERRQ(ierr); 2300da1bb401SStefano Zampini pcbddc->coarse_size = (PetscInt) coarsesum; 2301a0ba757dSStefano Zampini 2302beed3852SStefano Zampini /* Now assign them a global numbering */ 2303beed3852SStefano Zampini /* auxglobal_primal contains indices in global nodes numbering (internal and interface) */ 2304beed3852SStefano Zampini ierr = ISLocalToGlobalMappingApply(matis->mapping,pcbddc->local_primal_size,auxlocal_primal,auxglobal_primal);CHKERRQ(ierr); 2305beed3852SStefano Zampini /* all_auxglobal_primal contains all primal nodes indices in global nodes numbering (internal and interface) */ 2306beed3852SStefano Zampini ierr = MPI_Gatherv(&auxglobal_primal[0],pcbddc->local_primal_size,MPIU_INT,&all_auxglobal_primal[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,0,prec_comm);CHKERRQ(ierr); 2307beed3852SStefano Zampini 2308beed3852SStefano Zampini /* After this block all_auxglobal_primal should contains one copy of each primal node's indices in global nodes numbering */ 2309beed3852SStefano Zampini /* It implements a function similar to PetscSortRemoveDupsInt */ 2310beed3852SStefano Zampini if(rank_prec_comm==0) { 2311beed3852SStefano Zampini /* dummy argument since PetscSortMPIInt doesn't exist! */ 2312beed3852SStefano Zampini ierr = PetscSortMPIIntWithArray(pcbddc->replicated_primal_size,all_auxglobal_primal,all_auxglobal_primal_dummy);CHKERRQ(ierr); 2313beed3852SStefano Zampini k=1; 2314beed3852SStefano Zampini j=all_auxglobal_primal[0]; /* first dof in global numbering */ 2315beed3852SStefano Zampini for(i=1;i< pcbddc->replicated_primal_size ;i++) { 2316beed3852SStefano Zampini if(j != all_auxglobal_primal[i] ) { 2317beed3852SStefano Zampini all_auxglobal_primal[k]=all_auxglobal_primal[i]; 2318beed3852SStefano Zampini k++; 2319beed3852SStefano Zampini j=all_auxglobal_primal[i]; 2320beed3852SStefano Zampini } 2321beed3852SStefano Zampini } 2322beed3852SStefano Zampini } else { 2323beed3852SStefano Zampini ierr = PetscMalloc(pcbddc->coarse_size*sizeof(PetscMPIInt),&all_auxglobal_primal);CHKERRQ(ierr); 2324beed3852SStefano Zampini } 23255619798eSStefano Zampini /* We only need to broadcast the indices from 0 to pcbddc->coarse_size. Remaning elements of array all_aux_global_primal are garbage. */ 2326beed3852SStefano Zampini ierr = MPI_Bcast(all_auxglobal_primal,pcbddc->coarse_size,MPIU_INT,0,prec_comm);CHKERRQ(ierr); 2327beed3852SStefano Zampini 2328beed3852SStefano Zampini /* Now get global coarse numbering of local primal nodes */ 2329beed3852SStefano Zampini for(i=0;i<pcbddc->local_primal_size;i++) { 2330beed3852SStefano Zampini k=0; 2331beed3852SStefano Zampini while( all_auxglobal_primal[k] != auxglobal_primal[i] ) { k++;} 2332beed3852SStefano Zampini pcbddc->local_primal_indices[i]=k; 2333beed3852SStefano Zampini } 2334e269702eSStefano Zampini if(dbg_flag) { 2335e269702eSStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr); 2336da1bb401SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Size of coarse problem %d\n",pcbddc->coarse_size);CHKERRQ(ierr); 2337e269702eSStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 2338e269702eSStefano Zampini } 2339beed3852SStefano Zampini /* free allocated memory */ 2340beed3852SStefano Zampini ierr = PetscFree(auxlocal_primal);CHKERRQ(ierr); 2341beed3852SStefano Zampini ierr = PetscFree(auxglobal_primal);CHKERRQ(ierr); 2342beed3852SStefano Zampini ierr = PetscFree(all_auxglobal_primal);CHKERRQ(ierr); 2343e269702eSStefano Zampini if(rank_prec_comm == 0) { 2344beed3852SStefano Zampini ierr = PetscFree(all_auxglobal_primal_dummy);CHKERRQ(ierr); 2345beed3852SStefano Zampini } 2346e269702eSStefano Zampini } 2347beed3852SStefano Zampini 23480c7d97c5SJed Brown /* adapt coarse problem type */ 23490c7d97c5SJed Brown if(pcbddc->coarse_problem_type == MULTILEVEL_BDDC && pcbddc->active_procs < MIN_PROCS_FOR_BDDC ) 23500c7d97c5SJed Brown pcbddc->coarse_problem_type = PARALLEL_BDDC; 23510c7d97c5SJed Brown 23520c7d97c5SJed Brown switch(pcbddc->coarse_problem_type){ 23530c7d97c5SJed Brown 2354da1bb401SStefano Zampini case(MULTILEVEL_BDDC): /* we define a coarse mesh where subdomains are elements */ 23550c7d97c5SJed Brown { 23560c7d97c5SJed Brown /* we need additional variables */ 23570c7d97c5SJed Brown MetisInt n_subdomains,n_parts,objval,ncon,faces_nvtxs; 23580c7d97c5SJed Brown MetisInt *metis_coarse_subdivision; 23590c7d97c5SJed Brown MetisInt options[METIS_NOPTIONS]; 23600c7d97c5SJed Brown PetscMPIInt size_coarse_comm,rank_coarse_comm; 23610c7d97c5SJed Brown PetscMPIInt procs_jumps_coarse_comm; 23620c7d97c5SJed Brown PetscMPIInt *coarse_subdivision; 23630c7d97c5SJed Brown PetscMPIInt *total_count_recv; 23640c7d97c5SJed Brown PetscMPIInt *total_ranks_recv; 23650c7d97c5SJed Brown PetscMPIInt *displacements_recv; 23660c7d97c5SJed Brown PetscMPIInt *my_faces_connectivity; 23670c7d97c5SJed Brown PetscMPIInt *petsc_faces_adjncy; 23680c7d97c5SJed Brown MetisInt *faces_adjncy; 23690c7d97c5SJed Brown MetisInt *faces_xadj; 23700c7d97c5SJed Brown PetscMPIInt *number_of_faces; 23710c7d97c5SJed Brown PetscMPIInt *faces_displacements; 23720c7d97c5SJed Brown PetscInt *array_int; 23730c7d97c5SJed Brown PetscMPIInt my_faces=0; 23740c7d97c5SJed Brown PetscMPIInt total_faces=0; 23753828260eSStefano Zampini PetscInt ranks_stretching_ratio; 23760c7d97c5SJed Brown 23770c7d97c5SJed Brown /* define some quantities */ 23780c7d97c5SJed Brown pcbddc->coarse_communications_type = SCATTERS_BDDC; 23790c7d97c5SJed Brown coarse_mat_type = MATIS; 23800c7d97c5SJed Brown coarse_pc_type = PCBDDC; 23816c9de887SHong Zhang coarse_ksp_type = KSPCHEBYSHEV; 23820c7d97c5SJed Brown 23830c7d97c5SJed Brown /* details of coarse decomposition */ 23840c7d97c5SJed Brown n_subdomains = pcbddc->active_procs; 23850c7d97c5SJed Brown n_parts = n_subdomains/pcbddc->coarsening_ratio; 23863828260eSStefano Zampini ranks_stretching_ratio = size_prec_comm/pcbddc->active_procs; 23873828260eSStefano Zampini procs_jumps_coarse_comm = pcbddc->coarsening_ratio*ranks_stretching_ratio; 23883828260eSStefano Zampini 2389da1bb401SStefano Zampini /*printf("Coarse algorithm details: \n"); 2390da1bb401SStefano Zampini printf("n_subdomains %d, n_parts %d\nstretch %d,jumps %d,coarse_ratio %d\nlevel should be log_%d(%d)\n",n_subdomains,n_parts,ranks_stretching_ratio,procs_jumps_coarse_comm,pcbddc->coarsening_ratio,pcbddc->coarsening_ratio,(ranks_stretching_ratio/pcbddc->coarsening_ratio+1));*/ 23910c7d97c5SJed Brown 23920c7d97c5SJed Brown /* build CSR graph of subdomains' connectivity through faces */ 23930c7d97c5SJed Brown ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&array_int);CHKERRQ(ierr); 23943828260eSStefano Zampini ierr = PetscMemzero(array_int,pcis->n*sizeof(PetscInt));CHKERRQ(ierr); 23950c7d97c5SJed Brown for(i=1;i<pcis->n_neigh;i++){/* i=1 so I don't count myself -> faces nodes counts to 1 */ 23960c7d97c5SJed Brown for(j=0;j<pcis->n_shared[i];j++){ 23970c7d97c5SJed Brown array_int[ pcis->shared[i][j] ]+=1; 23980c7d97c5SJed Brown } 23990c7d97c5SJed Brown } 24000c7d97c5SJed Brown for(i=1;i<pcis->n_neigh;i++){ 24010c7d97c5SJed Brown for(j=0;j<pcis->n_shared[i];j++){ 24020c7d97c5SJed Brown if(array_int[ pcis->shared[i][j] ] == 1 ){ 24030c7d97c5SJed Brown my_faces++; 24040c7d97c5SJed Brown break; 24050c7d97c5SJed Brown } 24060c7d97c5SJed Brown } 24070c7d97c5SJed Brown } 24080c7d97c5SJed Brown 240953cdbc3dSStefano Zampini ierr = MPI_Reduce(&my_faces,&total_faces,1,MPIU_INT,MPI_SUM,master_proc,prec_comm);CHKERRQ(ierr); 24100c7d97c5SJed Brown ierr = PetscMalloc (my_faces*sizeof(PetscInt),&my_faces_connectivity);CHKERRQ(ierr); 24110c7d97c5SJed Brown my_faces=0; 24120c7d97c5SJed Brown for(i=1;i<pcis->n_neigh;i++){ 24130c7d97c5SJed Brown for(j=0;j<pcis->n_shared[i];j++){ 24140c7d97c5SJed Brown if(array_int[ pcis->shared[i][j] ] == 1 ){ 24150c7d97c5SJed Brown my_faces_connectivity[my_faces]=pcis->neigh[i]; 24160c7d97c5SJed Brown my_faces++; 24170c7d97c5SJed Brown break; 24180c7d97c5SJed Brown } 24190c7d97c5SJed Brown } 24200c7d97c5SJed Brown } 24210c7d97c5SJed Brown if(rank_prec_comm == master_proc) { 24220c7d97c5SJed Brown ierr = PetscMalloc (total_faces*sizeof(PetscMPIInt),&petsc_faces_adjncy);CHKERRQ(ierr); 24230c7d97c5SJed Brown ierr = PetscMalloc (size_prec_comm*sizeof(PetscMPIInt),&number_of_faces);CHKERRQ(ierr); 24240c7d97c5SJed Brown ierr = PetscMalloc (total_faces*sizeof(MetisInt),&faces_adjncy);CHKERRQ(ierr); 24250c7d97c5SJed Brown ierr = PetscMalloc ((n_subdomains+1)*sizeof(MetisInt),&faces_xadj);CHKERRQ(ierr); 24260c7d97c5SJed Brown ierr = PetscMalloc ((size_prec_comm+1)*sizeof(PetscMPIInt),&faces_displacements);CHKERRQ(ierr); 24270c7d97c5SJed Brown } 242853cdbc3dSStefano Zampini ierr = MPI_Gather(&my_faces,1,MPIU_INT,&number_of_faces[0],1,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr); 24290c7d97c5SJed Brown if(rank_prec_comm == master_proc) { 24300c7d97c5SJed Brown faces_xadj[0]=0; 24310c7d97c5SJed Brown faces_displacements[0]=0; 24320c7d97c5SJed Brown j=0; 24330c7d97c5SJed Brown for(i=1;i<size_prec_comm+1;i++) { 24340c7d97c5SJed Brown faces_displacements[i]=faces_displacements[i-1]+number_of_faces[i-1]; 24350c7d97c5SJed Brown if(number_of_faces[i-1]) { 24360c7d97c5SJed Brown j++; 24370c7d97c5SJed Brown faces_xadj[j]=faces_xadj[j-1]+number_of_faces[i-1]; 24380c7d97c5SJed Brown } 24390c7d97c5SJed Brown } 2440da1bb401SStefano Zampini /*printf("The J I count is %d and should be %d\n",j,n_subdomains); 2441da1bb401SStefano Zampini printf("Total faces seem %d and should be %d\n",faces_xadj[j],total_faces);*/ 24420c7d97c5SJed Brown } 244353cdbc3dSStefano Zampini ierr = MPI_Gatherv(&my_faces_connectivity[0],my_faces,MPIU_INT,&petsc_faces_adjncy[0],number_of_faces,faces_displacements,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr); 24440c7d97c5SJed Brown ierr = PetscFree(my_faces_connectivity);CHKERRQ(ierr); 24450c7d97c5SJed Brown ierr = PetscFree(array_int);CHKERRQ(ierr); 24460c7d97c5SJed Brown if(rank_prec_comm == master_proc) { 24473828260eSStefano Zampini for(i=0;i<total_faces;i++) faces_adjncy[i]=(MetisInt)(petsc_faces_adjncy[i]/ranks_stretching_ratio); /* cast to MetisInt */ 2448da1bb401SStefano Zampini /*printf("This is the face connectivity (actual ranks)\n"); 24490c7d97c5SJed Brown for(i=0;i<n_subdomains;i++){ 24500c7d97c5SJed Brown printf("proc %d is connected with \n",i); 24510c7d97c5SJed Brown for(j=faces_xadj[i];j<faces_xadj[i+1];j++) 24520c7d97c5SJed Brown printf("%d ",faces_adjncy[j]); 24530c7d97c5SJed Brown printf("\n"); 2454da1bb401SStefano Zampini }*/ 24550c7d97c5SJed Brown ierr = PetscFree(faces_displacements);CHKERRQ(ierr); 24560c7d97c5SJed Brown ierr = PetscFree(number_of_faces);CHKERRQ(ierr); 24570c7d97c5SJed Brown ierr = PetscFree(petsc_faces_adjncy);CHKERRQ(ierr); 24580c7d97c5SJed Brown } 24590c7d97c5SJed Brown 24600c7d97c5SJed Brown if( rank_prec_comm == master_proc ) { 24610c7d97c5SJed Brown 24623828260eSStefano Zampini PetscInt heuristic_for_metis=3; 24633828260eSStefano Zampini 24640c7d97c5SJed Brown ncon=1; 24650c7d97c5SJed Brown faces_nvtxs=n_subdomains; 24660c7d97c5SJed Brown /* partition graoh induced by face connectivity */ 24670c7d97c5SJed Brown ierr = PetscMalloc (n_subdomains*sizeof(MetisInt),&metis_coarse_subdivision);CHKERRQ(ierr); 24680c7d97c5SJed Brown ierr = METIS_SetDefaultOptions(options); 24690c7d97c5SJed Brown /* we need a contiguous partition of the coarse mesh */ 24700c7d97c5SJed Brown options[METIS_OPTION_CONTIG]=1; 24710c7d97c5SJed Brown options[METIS_OPTION_DBGLVL]=1; 24720c7d97c5SJed Brown options[METIS_OPTION_NITER]=30; 24733828260eSStefano Zampini if(n_subdomains>n_parts*heuristic_for_metis) { 24743828260eSStefano Zampini options[METIS_OPTION_IPTYPE]=METIS_IPTYPE_EDGE; 24753828260eSStefano Zampini options[METIS_OPTION_OBJTYPE]=METIS_OBJTYPE_CUT; 24760c7d97c5SJed Brown ierr = METIS_PartGraphKway(&faces_nvtxs,&ncon,faces_xadj,faces_adjncy,NULL,NULL,NULL,&n_parts,NULL,NULL,options,&objval,metis_coarse_subdivision); 24773828260eSStefano Zampini } else { 24783828260eSStefano Zampini ierr = METIS_PartGraphRecursive(&faces_nvtxs,&ncon,faces_xadj,faces_adjncy,NULL,NULL,NULL,&n_parts,NULL,NULL,options,&objval,metis_coarse_subdivision); 24793828260eSStefano Zampini } 24800c7d97c5SJed Brown if(ierr != METIS_OK) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in METIS_PartGraphKway (metis error code %D) called from PCBDDCSetupCoarseEnvironment\n",ierr); 24810c7d97c5SJed Brown ierr = PetscFree(faces_xadj);CHKERRQ(ierr); 24820c7d97c5SJed Brown ierr = PetscFree(faces_adjncy);CHKERRQ(ierr); 24830c7d97c5SJed Brown coarse_subdivision = (PetscMPIInt*)calloc(size_prec_comm,sizeof(PetscMPIInt)); /* calloc for contiguous memory since we need to scatter these values later */ 24840c7d97c5SJed Brown /* copy/cast values avoiding possible type conflicts between PETSc, MPI and METIS */ 24853828260eSStefano Zampini for(i=0;i<size_prec_comm;i++) coarse_subdivision[i]=MPI_PROC_NULL; 24863828260eSStefano Zampini for(i=0;i<n_subdomains;i++) coarse_subdivision[ranks_stretching_ratio*i]=(PetscInt)(metis_coarse_subdivision[i]); 24870c7d97c5SJed Brown ierr = PetscFree(metis_coarse_subdivision);CHKERRQ(ierr); 24880c7d97c5SJed Brown } 24890c7d97c5SJed Brown 24900c7d97c5SJed Brown /* Create new communicator for coarse problem splitting the old one */ 24910c7d97c5SJed Brown if( !(rank_prec_comm%procs_jumps_coarse_comm) && rank_prec_comm < procs_jumps_coarse_comm*n_parts ){ 2492da1bb401SStefano Zampini coarse_color=0; /* for communicator splitting */ 2493da1bb401SStefano Zampini active_rank=rank_prec_comm; /* for insertion of matrix values */ 24940c7d97c5SJed Brown } 2495da1bb401SStefano Zampini /* procs with coarse_color = MPI_UNDEFINED will have coarse_comm = MPI_COMM_NULL (from mpi standards) 2496da1bb401SStefano Zampini key = rank_prec_comm -> keep same ordering of ranks from the old to the new communicator */ 249753cdbc3dSStefano Zampini ierr = MPI_Comm_split(prec_comm,coarse_color,rank_prec_comm,&coarse_comm);CHKERRQ(ierr); 24980c7d97c5SJed Brown 24990c7d97c5SJed Brown if( coarse_color == 0 ) { 250053cdbc3dSStefano Zampini ierr = MPI_Comm_size(coarse_comm,&size_coarse_comm);CHKERRQ(ierr); 250153cdbc3dSStefano Zampini ierr = MPI_Comm_rank(coarse_comm,&rank_coarse_comm);CHKERRQ(ierr); 2502da1bb401SStefano Zampini /*printf("Details of coarse comm\n"); 25033828260eSStefano Zampini printf("size = %d, myrank = %d\n",size_coarse_comm,rank_coarse_comm); 2504da1bb401SStefano Zampini printf("jumps = %d, coarse_color = %d, n_parts = %d\n",procs_jumps_coarse_comm,coarse_color,n_parts);*/ 25050c7d97c5SJed Brown } else { 25060c7d97c5SJed Brown rank_coarse_comm = MPI_PROC_NULL; 25070c7d97c5SJed Brown } 25080c7d97c5SJed Brown 25090c7d97c5SJed Brown /* master proc take care of arranging and distributing coarse informations */ 25100c7d97c5SJed Brown if(rank_coarse_comm == master_proc) { 25110c7d97c5SJed Brown ierr = PetscMalloc (size_coarse_comm*sizeof(PetscMPIInt),&displacements_recv);CHKERRQ(ierr); 2512da1bb401SStefano Zampini /*ierr = PetscMalloc (size_coarse_comm*sizeof(PetscMPIInt),&total_count_recv);CHKERRQ(ierr); 2513da1bb401SStefano Zampini ierr = PetscMalloc (n_subdomains*sizeof(PetscMPIInt),&total_ranks_recv);CHKERRQ(ierr);*/ 25140c7d97c5SJed Brown total_count_recv = (PetscMPIInt*)calloc(size_prec_comm,sizeof(PetscMPIInt)); 25150c7d97c5SJed Brown total_ranks_recv = (PetscMPIInt*)calloc(n_subdomains,sizeof(PetscMPIInt)); 25160c7d97c5SJed Brown /* some initializations */ 25170c7d97c5SJed Brown displacements_recv[0]=0; 2518da1bb401SStefano Zampini /* PetscMemzero(total_count_recv,size_coarse_comm*sizeof(PetscMPIInt)); not needed -> calloc initializes to zero */ 25190c7d97c5SJed Brown /* count from how many processes the j-th process of the coarse decomposition will receive data */ 25200c7d97c5SJed Brown for(j=0;j<size_coarse_comm;j++) 25213828260eSStefano Zampini for(i=0;i<size_prec_comm;i++) 25220c7d97c5SJed Brown if(coarse_subdivision[i]==j) 25230c7d97c5SJed Brown total_count_recv[j]++; 25240c7d97c5SJed Brown /* displacements needed for scatterv of total_ranks_recv */ 25250c7d97c5SJed Brown for(i=1;i<size_coarse_comm;i++) displacements_recv[i]=displacements_recv[i-1]+total_count_recv[i-1]; 25260c7d97c5SJed Brown /* Now fill properly total_ranks_recv -> each coarse process will receive the ranks (in prec_comm communicator) of its friend (sending) processes */ 25270c7d97c5SJed Brown ierr = PetscMemzero(total_count_recv,size_coarse_comm*sizeof(PetscMPIInt));CHKERRQ(ierr); 25280c7d97c5SJed Brown for(j=0;j<size_coarse_comm;j++) { 25293828260eSStefano Zampini for(i=0;i<size_prec_comm;i++) { 25300c7d97c5SJed Brown if(coarse_subdivision[i]==j) { 25310c7d97c5SJed Brown total_ranks_recv[displacements_recv[j]+total_count_recv[j]]=i; 25323828260eSStefano Zampini total_count_recv[j]+=1; 25330c7d97c5SJed Brown } 25340c7d97c5SJed Brown } 25350c7d97c5SJed Brown } 2536da1bb401SStefano Zampini /*for(j=0;j<size_coarse_comm;j++) { 25373828260eSStefano Zampini printf("process %d in new rank will receive from %d processes (original ranks follows)\n",j,total_count_recv[j]); 25383828260eSStefano Zampini for(i=0;i<total_count_recv[j];i++) { 25393828260eSStefano Zampini printf("%d ",total_ranks_recv[displacements_recv[j]+i]); 25403828260eSStefano Zampini } 25413828260eSStefano Zampini printf("\n"); 2542da1bb401SStefano Zampini }*/ 25430c7d97c5SJed Brown 25440c7d97c5SJed Brown /* identify new decomposition in terms of ranks in the old communicator */ 25453828260eSStefano Zampini for(i=0;i<n_subdomains;i++) coarse_subdivision[ranks_stretching_ratio*i]=coarse_subdivision[ranks_stretching_ratio*i]*procs_jumps_coarse_comm; 2546da1bb401SStefano Zampini /*printf("coarse_subdivision in old end new ranks\n"); 25470c7d97c5SJed Brown for(i=0;i<size_prec_comm;i++) 25483828260eSStefano Zampini if(coarse_subdivision[i]!=MPI_PROC_NULL) { 25493828260eSStefano Zampini printf("%d=(%d %d), ",i,coarse_subdivision[i],coarse_subdivision[i]/procs_jumps_coarse_comm); 25503828260eSStefano Zampini } else { 25513828260eSStefano Zampini printf("%d=(%d %d), ",i,coarse_subdivision[i],coarse_subdivision[i]); 25523828260eSStefano Zampini } 2553da1bb401SStefano Zampini printf("\n");*/ 25540c7d97c5SJed Brown } 25550c7d97c5SJed Brown 25560c7d97c5SJed Brown /* Scatter new decomposition for send details */ 255753cdbc3dSStefano Zampini ierr = MPI_Scatter(&coarse_subdivision[0],1,MPIU_INT,&rank_coarse_proc_send_to,1,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr); 25580c7d97c5SJed Brown /* Scatter receiving details to members of coarse decomposition */ 25590c7d97c5SJed Brown if( coarse_color == 0) { 256053cdbc3dSStefano Zampini ierr = MPI_Scatter(&total_count_recv[0],1,MPIU_INT,&count_recv,1,MPIU_INT,master_proc,coarse_comm);CHKERRQ(ierr); 25610c7d97c5SJed Brown ierr = PetscMalloc (count_recv*sizeof(PetscMPIInt),&ranks_recv);CHKERRQ(ierr); 256253cdbc3dSStefano Zampini ierr = MPI_Scatterv(&total_ranks_recv[0],total_count_recv,displacements_recv,MPIU_INT,&ranks_recv[0],count_recv,MPIU_INT,master_proc,coarse_comm);CHKERRQ(ierr); 25630c7d97c5SJed Brown } 25640c7d97c5SJed Brown 2565da1bb401SStefano Zampini /*printf("I will send my matrix data to proc %d\n",rank_coarse_proc_send_to); 2566da1bb401SStefano Zampini if(coarse_color == 0) { 2567da1bb401SStefano Zampini printf("I will receive some matrix data from %d processes (ranks follows)\n",count_recv); 2568da1bb401SStefano Zampini for(i=0;i<count_recv;i++) 2569da1bb401SStefano Zampini printf("%d ",ranks_recv[i]); 2570da1bb401SStefano Zampini printf("\n"); 2571da1bb401SStefano Zampini }*/ 25720c7d97c5SJed Brown 25730c7d97c5SJed Brown if(rank_prec_comm == master_proc) { 2574da1bb401SStefano Zampini /*ierr = PetscFree(coarse_subdivision);CHKERRQ(ierr); 2575da1bb401SStefano Zampini ierr = PetscFree(total_count_recv);CHKERRQ(ierr); 2576da1bb401SStefano Zampini ierr = PetscFree(total_ranks_recv);CHKERRQ(ierr);*/ 25770c7d97c5SJed Brown free(coarse_subdivision); 25780c7d97c5SJed Brown free(total_count_recv); 25790c7d97c5SJed Brown free(total_ranks_recv); 25800c7d97c5SJed Brown ierr = PetscFree(displacements_recv);CHKERRQ(ierr); 25810c7d97c5SJed Brown } 25820c7d97c5SJed Brown break; 25830c7d97c5SJed Brown } 25840c7d97c5SJed Brown 25850c7d97c5SJed Brown case(REPLICATED_BDDC): 25860c7d97c5SJed Brown 25870c7d97c5SJed Brown pcbddc->coarse_communications_type = GATHERS_BDDC; 25880c7d97c5SJed Brown coarse_mat_type = MATSEQAIJ; 25890c7d97c5SJed Brown coarse_pc_type = PCLU; 259053cdbc3dSStefano Zampini coarse_ksp_type = KSPPREONLY; 25910c7d97c5SJed Brown coarse_comm = PETSC_COMM_SELF; 25920c7d97c5SJed Brown active_rank = rank_prec_comm; 25930c7d97c5SJed Brown break; 25940c7d97c5SJed Brown 25950c7d97c5SJed Brown case(PARALLEL_BDDC): 25960c7d97c5SJed Brown 25970c7d97c5SJed Brown pcbddc->coarse_communications_type = SCATTERS_BDDC; 25980c7d97c5SJed Brown coarse_mat_type = MATMPIAIJ; 25990c7d97c5SJed Brown coarse_pc_type = PCREDUNDANT; 260053cdbc3dSStefano Zampini coarse_ksp_type = KSPPREONLY; 26010c7d97c5SJed Brown coarse_comm = prec_comm; 26020c7d97c5SJed Brown active_rank = rank_prec_comm; 26030c7d97c5SJed Brown break; 26040c7d97c5SJed Brown 26050c7d97c5SJed Brown case(SEQUENTIAL_BDDC): 26060c7d97c5SJed Brown pcbddc->coarse_communications_type = GATHERS_BDDC; 26070c7d97c5SJed Brown coarse_mat_type = MATSEQAIJ; 26080c7d97c5SJed Brown coarse_pc_type = PCLU; 260953cdbc3dSStefano Zampini coarse_ksp_type = KSPPREONLY; 26100c7d97c5SJed Brown coarse_comm = PETSC_COMM_SELF; 26110c7d97c5SJed Brown active_rank = master_proc; 26120c7d97c5SJed Brown break; 26130c7d97c5SJed Brown } 26140c7d97c5SJed Brown 26150c7d97c5SJed Brown switch(pcbddc->coarse_communications_type){ 26160c7d97c5SJed Brown 26170c7d97c5SJed Brown case(SCATTERS_BDDC): 26180c7d97c5SJed Brown { 26190c7d97c5SJed Brown if(pcbddc->coarse_problem_type==MULTILEVEL_BDDC) { 26200c7d97c5SJed Brown 26210c7d97c5SJed Brown PetscMPIInt send_size; 26220c7d97c5SJed Brown PetscInt *aux_ins_indices; 26230c7d97c5SJed Brown PetscInt ii,jj; 26240c7d97c5SJed Brown MPI_Request *requests; 26250c7d97c5SJed Brown 26260c7d97c5SJed Brown /* allocate auxiliary space */ 26275619798eSStefano Zampini ierr = PetscMalloc (pcbddc->replicated_primal_size*sizeof(PetscMPIInt),&pcbddc->replicated_local_primal_indices);CHKERRQ(ierr); 26285619798eSStefano Zampini ierr = MPI_Allgatherv(&pcbddc->local_primal_indices[0],pcbddc->local_primal_size,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,prec_comm);CHKERRQ(ierr); 26290c7d97c5SJed Brown ierr = PetscMalloc ( pcbddc->coarse_size*sizeof(PetscInt),&aux_ins_indices);CHKERRQ(ierr); 26300c7d97c5SJed Brown ierr = PetscMemzero(aux_ins_indices,pcbddc->coarse_size*sizeof(PetscInt));CHKERRQ(ierr); 26310c7d97c5SJed Brown /* allocate stuffs for message massing */ 26320c7d97c5SJed Brown ierr = PetscMalloc ( (count_recv+1)*sizeof(MPI_Request),&requests);CHKERRQ(ierr); 26330c7d97c5SJed Brown for(i=0;i<count_recv+1;i++) requests[i]=MPI_REQUEST_NULL; 26340c7d97c5SJed Brown ierr = PetscMalloc ( count_recv*sizeof(PetscMPIInt),&localsizes2);CHKERRQ(ierr); 26350c7d97c5SJed Brown ierr = PetscMalloc ( count_recv*sizeof(PetscMPIInt),&localdispl2);CHKERRQ(ierr); 26360c7d97c5SJed Brown /* fill up quantities */ 26370c7d97c5SJed Brown j=0; 26380c7d97c5SJed Brown for(i=0;i<count_recv;i++){ 26390c7d97c5SJed Brown ii = ranks_recv[i]; 26400c7d97c5SJed Brown localsizes2[i]=pcbddc->local_primal_sizes[ii]*pcbddc->local_primal_sizes[ii]; 26410c7d97c5SJed Brown localdispl2[i]=j; 26420c7d97c5SJed Brown j+=localsizes2[i]; 26430c7d97c5SJed Brown jj = pcbddc->local_primal_displacements[ii]; 2644da1bb401SStefano Zampini for(k=0;k<pcbddc->local_primal_sizes[ii];k++) aux_ins_indices[pcbddc->replicated_local_primal_indices[jj+k]]+=1; /* it counts the coarse subdomains sharing the coarse node */ 26450c7d97c5SJed Brown } 2646da1bb401SStefano Zampini /*printf("aux_ins_indices 1\n"); 2647da1bb401SStefano Zampini for(i=0;i<pcbddc->coarse_size;i++) 2648da1bb401SStefano Zampini printf("%d ",aux_ins_indices[i]); 2649da1bb401SStefano Zampini printf("\n");*/ 26500c7d97c5SJed Brown /* temp_coarse_mat_vals used to store temporarly received matrix values */ 26510c7d97c5SJed Brown ierr = PetscMalloc ( j*sizeof(PetscScalar),&temp_coarse_mat_vals);CHKERRQ(ierr); 26520c7d97c5SJed Brown /* evaluate how many values I will insert in coarse mat */ 26530c7d97c5SJed Brown ins_local_primal_size=0; 26540c7d97c5SJed Brown for(i=0;i<pcbddc->coarse_size;i++) 26550c7d97c5SJed Brown if(aux_ins_indices[i]) 26560c7d97c5SJed Brown ins_local_primal_size++; 26570c7d97c5SJed Brown /* evaluate indices I will insert in coarse mat */ 26580c7d97c5SJed Brown ierr = PetscMalloc ( ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr); 26590c7d97c5SJed Brown j=0; 26600c7d97c5SJed Brown for(i=0;i<pcbddc->coarse_size;i++) 26610c7d97c5SJed Brown if(aux_ins_indices[i]) 26620c7d97c5SJed Brown ins_local_primal_indices[j++]=i; 26630c7d97c5SJed Brown /* use aux_ins_indices to realize a global to local mapping */ 26640c7d97c5SJed Brown j=0; 26650c7d97c5SJed Brown for(i=0;i<pcbddc->coarse_size;i++){ 26660c7d97c5SJed Brown if(aux_ins_indices[i]==0){ 26670c7d97c5SJed Brown aux_ins_indices[i]=-1; 26680c7d97c5SJed Brown } else { 26690c7d97c5SJed Brown aux_ins_indices[i]=j; 26700c7d97c5SJed Brown j++; 26710c7d97c5SJed Brown } 26720c7d97c5SJed Brown } 26730c7d97c5SJed Brown 2674da1bb401SStefano Zampini /*printf("New details localsizes2 localdispl2\n"); 2675da1bb401SStefano Zampini for(i=0;i<count_recv;i++) 2676da1bb401SStefano Zampini printf("(%d %d) ",localsizes2[i],localdispl2[i]); 2677da1bb401SStefano Zampini printf("\n"); 2678da1bb401SStefano Zampini printf("aux_ins_indices 2\n"); 2679da1bb401SStefano Zampini for(i=0;i<pcbddc->coarse_size;i++) 2680da1bb401SStefano Zampini printf("%d ",aux_ins_indices[i]); 2681da1bb401SStefano Zampini printf("\n"); 2682da1bb401SStefano Zampini printf("ins_local_primal_indices\n"); 2683da1bb401SStefano Zampini for(i=0;i<ins_local_primal_size;i++) 2684da1bb401SStefano Zampini printf("%d ",ins_local_primal_indices[i]); 2685da1bb401SStefano Zampini printf("\n"); 2686da1bb401SStefano Zampini printf("coarse_submat_vals\n"); 2687da1bb401SStefano Zampini for(i=0;i<pcbddc->local_primal_size;i++) 2688da1bb401SStefano Zampini for(j=0;j<pcbddc->local_primal_size;j++) 2689da1bb401SStefano Zampini printf("(%lf %d %d)\n",coarse_submat_vals[j*pcbddc->local_primal_size+i],pcbddc->local_primal_indices[i],pcbddc->local_primal_indices[j]); 2690da1bb401SStefano Zampini printf("\n");*/ 26910c7d97c5SJed Brown 26920c7d97c5SJed Brown /* processes partecipating in coarse problem receive matrix data from their friends */ 269353cdbc3dSStefano Zampini for(i=0;i<count_recv;i++) ierr = MPI_Irecv(&temp_coarse_mat_vals[localdispl2[i]],localsizes2[i],MPIU_SCALAR,ranks_recv[i],666,prec_comm,&requests[i]);CHKERRQ(ierr); 26940c7d97c5SJed Brown if(rank_coarse_proc_send_to != MPI_PROC_NULL ) { 26950c7d97c5SJed Brown send_size=pcbddc->local_primal_size*pcbddc->local_primal_size; 269653cdbc3dSStefano Zampini ierr = MPI_Isend(&coarse_submat_vals[0],send_size,MPIU_SCALAR,rank_coarse_proc_send_to,666,prec_comm,&requests[count_recv]);CHKERRQ(ierr); 26970c7d97c5SJed Brown } 269853cdbc3dSStefano Zampini ierr = MPI_Waitall(count_recv+1,requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 26990c7d97c5SJed Brown 2700da1bb401SStefano Zampini /*if(coarse_color == 0) { 2701da1bb401SStefano Zampini printf("temp_coarse_mat_vals\n"); 2702da1bb401SStefano Zampini for(k=0;k<count_recv;k++){ 2703da1bb401SStefano Zampini printf("---- %d ----\n",ranks_recv[k]); 2704da1bb401SStefano Zampini for(i=0;i<pcbddc->local_primal_sizes[ranks_recv[k]];i++) 2705da1bb401SStefano Zampini for(j=0;j<pcbddc->local_primal_sizes[ranks_recv[k]];j++) 2706da1bb401SStefano Zampini printf("(%lf %d %d)\n",temp_coarse_mat_vals[localdispl2[k]+j*pcbddc->local_primal_sizes[ranks_recv[k]]+i],pcbddc->replicated_local_primal_indices[pcbddc->local_primal_displacements[ranks_recv[k]]+i],pcbddc->replicated_local_primal_indices[pcbddc->local_primal_displacements[ranks_recv[k]]+j]); 2707da1bb401SStefano Zampini printf("\n"); 2708da1bb401SStefano Zampini } 2709da1bb401SStefano Zampini }*/ 27100c7d97c5SJed Brown /* calculate data to insert in coarse mat */ 27110c7d97c5SJed Brown ierr = PetscMalloc ( ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar),&ins_coarse_mat_vals);CHKERRQ(ierr); 27120c7d97c5SJed Brown PetscMemzero(ins_coarse_mat_vals,ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar)); 27130c7d97c5SJed Brown 27140c7d97c5SJed Brown PetscMPIInt rr,kk,lps,lpd; 27150c7d97c5SJed Brown PetscInt row_ind,col_ind; 27160c7d97c5SJed Brown for(k=0;k<count_recv;k++){ 27170c7d97c5SJed Brown rr = ranks_recv[k]; 27180c7d97c5SJed Brown kk = localdispl2[k]; 27190c7d97c5SJed Brown lps = pcbddc->local_primal_sizes[rr]; 27200c7d97c5SJed Brown lpd = pcbddc->local_primal_displacements[rr]; 2721da1bb401SStefano Zampini /*printf("Inserting the following indices (received from %d)\n",rr);*/ 27220c7d97c5SJed Brown for(j=0;j<lps;j++){ 27230c7d97c5SJed Brown col_ind=aux_ins_indices[pcbddc->replicated_local_primal_indices[lpd+j]]; 27240c7d97c5SJed Brown for(i=0;i<lps;i++){ 27250c7d97c5SJed Brown row_ind=aux_ins_indices[pcbddc->replicated_local_primal_indices[lpd+i]]; 2726da1bb401SStefano Zampini /*printf("%d %d\n",row_ind,col_ind);*/ 27270c7d97c5SJed Brown ins_coarse_mat_vals[col_ind*ins_local_primal_size+row_ind]+=temp_coarse_mat_vals[kk+j*lps+i]; 27280c7d97c5SJed Brown } 27290c7d97c5SJed Brown } 27300c7d97c5SJed Brown } 27310c7d97c5SJed Brown ierr = PetscFree(requests);CHKERRQ(ierr); 27320c7d97c5SJed Brown ierr = PetscFree(aux_ins_indices);CHKERRQ(ierr); 27330c7d97c5SJed Brown ierr = PetscFree(temp_coarse_mat_vals);CHKERRQ(ierr); 27340c7d97c5SJed Brown if(coarse_color == 0) { ierr = PetscFree(ranks_recv);CHKERRQ(ierr); } 27350c7d97c5SJed Brown 27360c7d97c5SJed Brown /* create local to global mapping needed by coarse MATIS */ 27370c7d97c5SJed Brown { 27380c7d97c5SJed Brown IS coarse_IS; 273953cdbc3dSStefano Zampini if(coarse_comm != MPI_COMM_NULL ) ierr = MPI_Comm_free(&coarse_comm);CHKERRQ(ierr); 27400c7d97c5SJed Brown coarse_comm = prec_comm; 27410c7d97c5SJed Brown active_rank=rank_prec_comm; 27420c7d97c5SJed Brown ierr = ISCreateGeneral(coarse_comm,ins_local_primal_size,ins_local_primal_indices,PETSC_COPY_VALUES,&coarse_IS);CHKERRQ(ierr); 27430c7d97c5SJed Brown ierr = ISLocalToGlobalMappingCreateIS(coarse_IS,&coarse_ISLG);CHKERRQ(ierr); 27440c7d97c5SJed Brown ierr = ISDestroy(&coarse_IS);CHKERRQ(ierr); 27450c7d97c5SJed Brown } 27460c7d97c5SJed Brown } 27470c7d97c5SJed Brown if(pcbddc->coarse_problem_type==PARALLEL_BDDC) { 27480c7d97c5SJed Brown /* arrays for values insertion */ 27490c7d97c5SJed Brown ins_local_primal_size = pcbddc->local_primal_size; 27500c7d97c5SJed Brown ierr = PetscMalloc ( ins_local_primal_size*sizeof(PetscMPIInt),&ins_local_primal_indices);CHKERRQ(ierr); 27510c7d97c5SJed Brown ierr = PetscMalloc ( ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar),&ins_coarse_mat_vals);CHKERRQ(ierr); 27520c7d97c5SJed Brown for(j=0;j<ins_local_primal_size;j++){ 27530c7d97c5SJed Brown ins_local_primal_indices[j]=pcbddc->local_primal_indices[j]; 27540c7d97c5SJed Brown for(i=0;i<ins_local_primal_size;i++) ins_coarse_mat_vals[j*ins_local_primal_size+i]=coarse_submat_vals[j*ins_local_primal_size+i]; 27550c7d97c5SJed Brown } 27560c7d97c5SJed Brown } 27570c7d97c5SJed Brown break; 27580c7d97c5SJed Brown 27590c7d97c5SJed Brown } 27600c7d97c5SJed Brown 27610c7d97c5SJed Brown case(GATHERS_BDDC): 27620c7d97c5SJed Brown { 27630c7d97c5SJed Brown 27640c7d97c5SJed Brown PetscMPIInt mysize,mysize2; 27650c7d97c5SJed Brown 27660c7d97c5SJed Brown if(rank_prec_comm==active_rank) { 27670c7d97c5SJed Brown ierr = PetscMalloc ( pcbddc->replicated_primal_size*sizeof(PetscMPIInt),&pcbddc->replicated_local_primal_indices);CHKERRQ(ierr); 27680c7d97c5SJed Brown pcbddc->replicated_local_primal_values = (PetscScalar*)calloc(pcbddc->replicated_primal_size,sizeof(PetscScalar)); 27690c7d97c5SJed Brown ierr = PetscMalloc ( size_prec_comm*sizeof(PetscMPIInt),&localsizes2);CHKERRQ(ierr); 27700c7d97c5SJed Brown ierr = PetscMalloc ( size_prec_comm*sizeof(PetscMPIInt),&localdispl2);CHKERRQ(ierr); 27710c7d97c5SJed Brown /* arrays for values insertion */ 27720c7d97c5SJed Brown ins_local_primal_size = pcbddc->coarse_size; 27730c7d97c5SJed Brown ierr = PetscMalloc ( ins_local_primal_size*sizeof(PetscMPIInt),&ins_local_primal_indices);CHKERRQ(ierr); 27740c7d97c5SJed Brown ierr = PetscMalloc ( ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar),&ins_coarse_mat_vals);CHKERRQ(ierr); 27750c7d97c5SJed Brown for(i=0;i<size_prec_comm;i++) localsizes2[i]=pcbddc->local_primal_sizes[i]*pcbddc->local_primal_sizes[i]; 27760c7d97c5SJed Brown localdispl2[0]=0; 27770c7d97c5SJed Brown for(i=1;i<size_prec_comm;i++) localdispl2[i]=localsizes2[i-1]+localdispl2[i-1]; 27780c7d97c5SJed Brown j=0; 27790c7d97c5SJed Brown for(i=0;i<size_prec_comm;i++) j+=localsizes2[i]; 27800c7d97c5SJed Brown ierr = PetscMalloc ( j*sizeof(PetscScalar),&temp_coarse_mat_vals);CHKERRQ(ierr); 27810c7d97c5SJed Brown } 27820c7d97c5SJed Brown 27830c7d97c5SJed Brown mysize=pcbddc->local_primal_size; 27840c7d97c5SJed Brown mysize2=pcbddc->local_primal_size*pcbddc->local_primal_size; 27850c7d97c5SJed Brown if(pcbddc->coarse_problem_type == SEQUENTIAL_BDDC){ 278653cdbc3dSStefano Zampini ierr = MPI_Gatherv(&pcbddc->local_primal_indices[0],mysize,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr); 278753cdbc3dSStefano Zampini ierr = MPI_Gatherv(&coarse_submat_vals[0],mysize2,MPIU_SCALAR,&temp_coarse_mat_vals[0],localsizes2,localdispl2,MPIU_SCALAR,master_proc,prec_comm);CHKERRQ(ierr); 27880c7d97c5SJed Brown } else { 278953cdbc3dSStefano Zampini ierr = MPI_Allgatherv(&pcbddc->local_primal_indices[0],mysize,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,prec_comm);CHKERRQ(ierr); 279053cdbc3dSStefano Zampini ierr = MPI_Allgatherv(&coarse_submat_vals[0],mysize2,MPIU_SCALAR,&temp_coarse_mat_vals[0],localsizes2,localdispl2,MPIU_SCALAR,prec_comm);CHKERRQ(ierr); 27910c7d97c5SJed Brown } 27920c7d97c5SJed Brown 27930c7d97c5SJed Brown /* free data structures no longer needed and allocate some space which will be needed in BDDC application */ 27940c7d97c5SJed Brown if(rank_prec_comm==active_rank) { 27950c7d97c5SJed Brown PetscInt offset,offset2,row_ind,col_ind; 27960c7d97c5SJed Brown for(j=0;j<ins_local_primal_size;j++){ 27970c7d97c5SJed Brown ins_local_primal_indices[j]=j; 27980c7d97c5SJed Brown for(i=0;i<ins_local_primal_size;i++) ins_coarse_mat_vals[j*ins_local_primal_size+i]=0.0; 27990c7d97c5SJed Brown } 28000c7d97c5SJed Brown for(k=0;k<size_prec_comm;k++){ 28010c7d97c5SJed Brown offset=pcbddc->local_primal_displacements[k]; 28020c7d97c5SJed Brown offset2=localdispl2[k]; 28030c7d97c5SJed Brown for(j=0;j<pcbddc->local_primal_sizes[k];j++){ 28040c7d97c5SJed Brown col_ind=pcbddc->replicated_local_primal_indices[offset+j]; 28050c7d97c5SJed Brown for(i=0;i<pcbddc->local_primal_sizes[k];i++){ 28060c7d97c5SJed Brown row_ind=pcbddc->replicated_local_primal_indices[offset+i]; 28070c7d97c5SJed Brown ins_coarse_mat_vals[col_ind*pcbddc->coarse_size+row_ind]+=temp_coarse_mat_vals[offset2+j*pcbddc->local_primal_sizes[k]+i]; 28080c7d97c5SJed Brown } 28090c7d97c5SJed Brown } 28100c7d97c5SJed Brown } 28110c7d97c5SJed Brown } 28120c7d97c5SJed Brown break; 2813da1bb401SStefano Zampini }/* switch on coarse problem and communications associated with finished */ 28140c7d97c5SJed Brown } 28150c7d97c5SJed Brown 28160c7d97c5SJed Brown /* Now create and fill up coarse matrix */ 28170c7d97c5SJed Brown if( rank_prec_comm == active_rank ) { 28180c7d97c5SJed Brown if(pcbddc->coarse_problem_type != MULTILEVEL_BDDC) { 28190c7d97c5SJed Brown ierr = MatCreate(coarse_comm,&pcbddc->coarse_mat);CHKERRQ(ierr); 28200c7d97c5SJed Brown ierr = MatSetSizes(pcbddc->coarse_mat,PETSC_DECIDE,PETSC_DECIDE,pcbddc->coarse_size,pcbddc->coarse_size);CHKERRQ(ierr); 28210c7d97c5SJed Brown ierr = MatSetType(pcbddc->coarse_mat,coarse_mat_type);CHKERRQ(ierr); 28223b03a366Sstefano_zampini ierr = MatSetUp(pcbddc->coarse_mat);CHKERRQ(ierr); 2823da1bb401SStefano Zampini ierr = MatSetOption(pcbddc->coarse_mat,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr); /* local values stored in column major */ 28243b03a366Sstefano_zampini ierr = MatSetOption(pcbddc->coarse_mat,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr); 28250c7d97c5SJed Brown } else { 28260c7d97c5SJed Brown Mat matis_coarse_local_mat; 2827d3ee2243SStefano Zampini /* remind bs */ 2828d3ee2243SStefano Zampini ierr = MatCreateIS(coarse_comm,bs,PETSC_DECIDE,PETSC_DECIDE,pcbddc->coarse_size,pcbddc->coarse_size,coarse_ISLG,&pcbddc->coarse_mat);CHKERRQ(ierr); 28293b03a366Sstefano_zampini ierr = MatSetUp(pcbddc->coarse_mat);CHKERRQ(ierr); 28300c7d97c5SJed Brown ierr = MatISGetLocalMat(pcbddc->coarse_mat,&matis_coarse_local_mat);CHKERRQ(ierr); 28313b03a366Sstefano_zampini ierr = MatSetUp(matis_coarse_local_mat);CHKERRQ(ierr); 2832da1bb401SStefano Zampini ierr = MatSetOption(matis_coarse_local_mat,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr); /* local values stored in column major */ 2833a0ba757dSStefano Zampini ierr = MatSetOption(matis_coarse_local_mat,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr); 28340c7d97c5SJed Brown } 2835a0ba757dSStefano Zampini ierr = MatSetOption(pcbddc->coarse_mat,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_FALSE);CHKERRQ(ierr); 28360c7d97c5SJed Brown ierr = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,ADD_VALUES);CHKERRQ(ierr); 28370c7d97c5SJed Brown ierr = MatAssemblyBegin(pcbddc->coarse_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 28380c7d97c5SJed Brown ierr = MatAssemblyEnd(pcbddc->coarse_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 28390c7d97c5SJed Brown 2840da1bb401SStefano Zampini /* PetscViewer view_out; 2841da1bb401SStefano Zampini ierr = PetscViewerASCIIOpen(PETSC_COMM_SELF,"coarsematfull.m",&view_out);CHKERRQ(ierr); 2842da1bb401SStefano Zampini ierr = PetscViewerSetFormat(view_out,PETSC_VIEWER_ASCII_MATLAB);CHKERRQ(ierr); 2843da1bb401SStefano Zampini ierr = MatView(pcbddc->coarse_mat,view_out);CHKERRQ(ierr); 2844da1bb401SStefano Zampini ierr = PetscViewerDestroy(&view_out);CHKERRQ(ierr);*/ 2845da1bb401SStefano Zampini 28460c7d97c5SJed Brown ierr = MatGetVecs(pcbddc->coarse_mat,&pcbddc->coarse_vec,&pcbddc->coarse_rhs);CHKERRQ(ierr); 28470c7d97c5SJed Brown /* Preconditioner for coarse problem */ 284853cdbc3dSStefano Zampini ierr = KSPCreate(coarse_comm,&pcbddc->coarse_ksp);CHKERRQ(ierr); 284953cdbc3dSStefano Zampini ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->coarse_ksp,(PetscObject)pc,1);CHKERRQ(ierr); 285053cdbc3dSStefano Zampini ierr = KSPSetOperators(pcbddc->coarse_ksp,pcbddc->coarse_mat,pcbddc->coarse_mat,SAME_PRECONDITIONER);CHKERRQ(ierr); 28513b03a366Sstefano_zampini ierr = KSPSetTolerances(pcbddc->coarse_ksp,PETSC_DEFAULT,PETSC_DEFAULT,PETSC_DEFAULT,max_it_coarse_ksp);CHKERRQ(ierr); 285253cdbc3dSStefano Zampini ierr = KSPSetType(pcbddc->coarse_ksp,coarse_ksp_type);CHKERRQ(ierr); 285353cdbc3dSStefano Zampini ierr = KSPGetPC(pcbddc->coarse_ksp,&pc_temp);CHKERRQ(ierr); 285453cdbc3dSStefano Zampini ierr = PCSetType(pc_temp,coarse_pc_type);CHKERRQ(ierr); 28550c7d97c5SJed Brown /* Allow user's customization */ 2856da1bb401SStefano Zampini ierr = KSPSetOptionsPrefix(pcbddc->coarse_ksp,"coarse_");CHKERRQ(ierr); 285753cdbc3dSStefano Zampini ierr = KSPSetFromOptions(pcbddc->coarse_ksp);CHKERRQ(ierr); 28580c7d97c5SJed Brown /* Set Up PC for coarse problem BDDC */ 285953cdbc3dSStefano Zampini if(pcbddc->coarse_problem_type == MULTILEVEL_BDDC) { 2860e269702eSStefano Zampini if(dbg_flag) { 2861e269702eSStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"----------------Setting up a new level---------------\n");CHKERRQ(ierr); 2862e269702eSStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 2863e269702eSStefano Zampini } 286453cdbc3dSStefano Zampini ierr = PCBDDCSetCoarseProblemType(pc_temp,MULTILEVEL_BDDC);CHKERRQ(ierr); 286553cdbc3dSStefano Zampini } 286653cdbc3dSStefano Zampini ierr = KSPSetUp(pcbddc->coarse_ksp);CHKERRQ(ierr); 28675619798eSStefano Zampini if(pcbddc->coarse_problem_type == MULTILEVEL_BDDC) { 28685619798eSStefano Zampini if(dbg_flag) { 28695619798eSStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"----------------New level set------------------------\n");CHKERRQ(ierr); 28705619798eSStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 28715619798eSStefano Zampini } 28725619798eSStefano Zampini } 28730c7d97c5SJed Brown } 28740c7d97c5SJed Brown if(pcbddc->coarse_communications_type == SCATTERS_BDDC) { 28750c7d97c5SJed Brown IS local_IS,global_IS; 28760c7d97c5SJed Brown ierr = ISCreateStride(PETSC_COMM_SELF,pcbddc->local_primal_size,0,1,&local_IS);CHKERRQ(ierr); 28770c7d97c5SJed Brown ierr = ISCreateGeneral(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_indices,PETSC_COPY_VALUES,&global_IS);CHKERRQ(ierr); 28780c7d97c5SJed Brown ierr = VecScatterCreate(pcbddc->vec1_P,local_IS,pcbddc->coarse_vec,global_IS,&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr); 28790c7d97c5SJed Brown ierr = ISDestroy(&local_IS);CHKERRQ(ierr); 28800c7d97c5SJed Brown ierr = ISDestroy(&global_IS);CHKERRQ(ierr); 28810c7d97c5SJed Brown } 28820c7d97c5SJed Brown 28830c7d97c5SJed Brown 28843b03a366Sstefano_zampini /* Evaluate condition number of coarse problem for cheby (and verbose output if requested) */ 28853b03a366Sstefano_zampini if( pcbddc->coarse_problem_type == MULTILEVEL_BDDC && rank_prec_comm == active_rank ) { 28860c7d97c5SJed Brown PetscScalar m_one=-1.0; 28875619798eSStefano Zampini PetscReal infty_error,lambda_min,lambda_max,kappa_2; 28883b03a366Sstefano_zampini const KSPType check_ksp_type=KSPGMRES; 28890c7d97c5SJed Brown 28905619798eSStefano Zampini /* change coarse ksp object to an iterative method suitable for extreme eigenvalues' estimation */ 28913b03a366Sstefano_zampini ierr = KSPSetType(pcbddc->coarse_ksp,check_ksp_type);CHKERRQ(ierr); 2892d49ef151SStefano Zampini ierr = KSPSetComputeSingularValues(pcbddc->coarse_ksp,PETSC_TRUE);CHKERRQ(ierr); 28935619798eSStefano Zampini ierr = KSPSetTolerances(pcbddc->coarse_ksp,1.e-8,1.e-8,PETSC_DEFAULT,pcbddc->coarse_size);CHKERRQ(ierr); 28945619798eSStefano Zampini ierr = KSPSetUp(pcbddc->coarse_ksp);CHKERRQ(ierr); 2895d49ef151SStefano Zampini ierr = VecSetRandom(pcbddc->coarse_rhs,PETSC_NULL);CHKERRQ(ierr); 2896d49ef151SStefano Zampini ierr = MatMult(pcbddc->coarse_mat,pcbddc->coarse_rhs,pcbddc->coarse_vec);CHKERRQ(ierr); 2897d49ef151SStefano Zampini ierr = MatMult(pcbddc->coarse_mat,pcbddc->coarse_vec,pcbddc->coarse_rhs);CHKERRQ(ierr); 2898d49ef151SStefano Zampini ierr = KSPSolve(pcbddc->coarse_ksp,pcbddc->coarse_rhs,pcbddc->coarse_rhs);CHKERRQ(ierr); 2899d49ef151SStefano Zampini ierr = KSPComputeExtremeSingularValues(pcbddc->coarse_ksp,&lambda_max,&lambda_min);CHKERRQ(ierr); 29003b03a366Sstefano_zampini if(dbg_flag) { 29015619798eSStefano Zampini kappa_2=lambda_max/lambda_min; 29025619798eSStefano Zampini ierr = KSPGetIterationNumber(pcbddc->coarse_ksp,&k);CHKERRQ(ierr); 2903d49ef151SStefano Zampini ierr = VecAXPY(pcbddc->coarse_rhs,m_one,pcbddc->coarse_vec);CHKERRQ(ierr); 2904d49ef151SStefano Zampini ierr = VecNorm(pcbddc->coarse_rhs,NORM_INFINITY,&infty_error);CHKERRQ(ierr); 29053b03a366Sstefano_zampini ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem condition number estimated with %d iterations of %s is: % 1.14e\n",k,check_ksp_type,kappa_2);CHKERRQ(ierr); 2906e269702eSStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem eigenvalues: % 1.14e %1.14e\n",lambda_min,lambda_max);CHKERRQ(ierr); 2907e269702eSStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem infty_error: %1.14e\n",infty_error);CHKERRQ(ierr); 29083b03a366Sstefano_zampini } 29095619798eSStefano Zampini /* restore coarse ksp to default values */ 2910d49ef151SStefano Zampini ierr = KSPSetComputeSingularValues(pcbddc->coarse_ksp,PETSC_FALSE);CHKERRQ(ierr); 29115619798eSStefano Zampini ierr = KSPSetType(pcbddc->coarse_ksp,coarse_ksp_type);CHKERRQ(ierr); 29126c9de887SHong Zhang ierr = KSPChebyshevSetEigenvalues(pcbddc->coarse_ksp,lambda_max,lambda_min);CHKERRQ(ierr); 29133b03a366Sstefano_zampini ierr = KSPSetTolerances(pcbddc->coarse_ksp,PETSC_DEFAULT,PETSC_DEFAULT,PETSC_DEFAULT,max_it_coarse_ksp);CHKERRQ(ierr); 29145619798eSStefano Zampini ierr = KSPSetFromOptions(pcbddc->coarse_ksp);CHKERRQ(ierr); 29155619798eSStefano Zampini ierr = KSPSetUp(pcbddc->coarse_ksp);CHKERRQ(ierr); 291653cdbc3dSStefano Zampini } 29170c7d97c5SJed Brown 29180c7d97c5SJed Brown /* free data structures no longer needed */ 29190c7d97c5SJed Brown if(coarse_ISLG) { ierr = ISLocalToGlobalMappingDestroy(&coarse_ISLG);CHKERRQ(ierr); } 29200c7d97c5SJed Brown if(ins_local_primal_indices) { ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr); } 29210c7d97c5SJed Brown if(ins_coarse_mat_vals) { ierr = PetscFree(ins_coarse_mat_vals);CHKERRQ(ierr);} 29220c7d97c5SJed Brown if(localsizes2) { ierr = PetscFree(localsizes2);CHKERRQ(ierr);} 29230c7d97c5SJed Brown if(localdispl2) { ierr = PetscFree(localdispl2);CHKERRQ(ierr);} 29240c7d97c5SJed Brown if(temp_coarse_mat_vals) { ierr = PetscFree(temp_coarse_mat_vals);CHKERRQ(ierr);} 29250c7d97c5SJed Brown 29260c7d97c5SJed Brown PetscFunctionReturn(0); 29270c7d97c5SJed Brown } 29280c7d97c5SJed Brown 29290c7d97c5SJed Brown #undef __FUNCT__ 29300c7d97c5SJed Brown #define __FUNCT__ "PCBDDCManageLocalBoundaries" 293153cdbc3dSStefano Zampini static PetscErrorCode PCBDDCManageLocalBoundaries(PC pc) 29320c7d97c5SJed Brown { 29330c7d97c5SJed Brown 29340c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 29350c7d97c5SJed Brown PC_IS *pcis = (PC_IS*)pc->data; 29360c7d97c5SJed Brown Mat_IS *matis = (Mat_IS*)pc->pmat->data; 2937da1bb401SStefano Zampini PCBDDCGraph mat_graph=pcbddc->mat_graph; 2938a81d60d8SStefano Zampini PetscInt *queue_in_global_numbering,*is_indices; 29393b03a366Sstefano_zampini PetscInt bs,ierr,i,j,s,k,iindex,neumann_bsize,dirichlet_bsize; 2940da1bb401SStefano Zampini PetscInt total_counts,nodes_touched,where_values=1,vertex_size; 2941534831adSStefano Zampini PetscMPIInt adapt_interface=0,adapt_interface_reduced=0,NEUMANNCNT=0; 2942da1bb401SStefano Zampini PetscBool same_set; 2943a0ba757dSStefano Zampini MPI_Comm interface_comm=((PetscObject)pc)->comm; 29443b03a366Sstefano_zampini PetscBool use_faces=PETSC_FALSE,use_edges=PETSC_FALSE; 29453b03a366Sstefano_zampini const PetscInt *neumann_nodes; 29463b03a366Sstefano_zampini const PetscInt *dirichlet_nodes; 2947a81d60d8SStefano Zampini IS used_IS,*custom_ISForDofs; 2948da1bb401SStefano Zampini PetscScalar *array; 2949da1bb401SStefano Zampini PetscScalar *array2; 2950da1bb401SStefano Zampini PetscViewer viewer=pcbddc->dbg_viewer; 29510c7d97c5SJed Brown 29520c7d97c5SJed Brown PetscFunctionBegin; 2953da1bb401SStefano Zampini /* Setup local adjacency graph */ 2954da1bb401SStefano Zampini mat_graph->nvtxs=pcis->n; 2955534831adSStefano Zampini if(!mat_graph->xadj) { NEUMANNCNT = 1; } 2956da1bb401SStefano Zampini ierr = PCBDDCSetupLocalAdjacencyGraph(pc);CHKERRQ(ierr); 2957a0ba757dSStefano Zampini i = mat_graph->nvtxs; 2958a0ba757dSStefano Zampini ierr = PetscMalloc4(i,PetscInt,&mat_graph->where,i,PetscInt,&mat_graph->count,i+1,PetscInt,&mat_graph->cptr,i,PetscInt,&mat_graph->queue);CHKERRQ(ierr); 2959a0ba757dSStefano Zampini ierr = PetscMalloc3(i,PetscInt,&mat_graph->which_dof,i,PetscBool,&mat_graph->touched,i,PetscInt,&queue_in_global_numbering);CHKERRQ(ierr); 2960a0ba757dSStefano Zampini ierr = PetscMemzero(mat_graph->where,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr); 2961a0ba757dSStefano Zampini ierr = PetscMemzero(mat_graph->count,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr); 2962a0ba757dSStefano Zampini ierr = PetscMemzero(mat_graph->which_dof,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr); 2963a0ba757dSStefano Zampini ierr = PetscMemzero(mat_graph->queue,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr); 29643828260eSStefano Zampini ierr = PetscMemzero(mat_graph->cptr,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr); 2965a0ba757dSStefano Zampini 2966a81d60d8SStefano Zampini /* Setting dofs splitting in mat_graph->which_dof 2967a81d60d8SStefano Zampini Get information about dofs' splitting if provided by the user 2968a81d60d8SStefano Zampini Otherwise it assumes a constant block size */ 2969a81d60d8SStefano Zampini vertex_size=0; 2970a81d60d8SStefano Zampini if(!pcbddc->n_ISForDofs) { 2971a81d60d8SStefano Zampini ierr = MatGetBlockSize(matis->A,&bs);CHKERRQ(ierr); 2972a81d60d8SStefano Zampini ierr = PetscMalloc(bs*sizeof(IS),&custom_ISForDofs);CHKERRQ(ierr); 2973a81d60d8SStefano Zampini for(i=0;i<bs;i++) { 2974a81d60d8SStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,pcis->n/bs,i,bs,&custom_ISForDofs[i]);CHKERRQ(ierr); 2975a81d60d8SStefano Zampini } 2976a81d60d8SStefano Zampini ierr = PCBDDCSetDofsSplitting(pc,bs,custom_ISForDofs);CHKERRQ(ierr); 2977a81d60d8SStefano Zampini vertex_size=1; 2978a81d60d8SStefano Zampini /* remove my references to IS objects */ 2979a81d60d8SStefano Zampini for(i=0;i<bs;i++) { 2980a81d60d8SStefano Zampini ierr = ISDestroy(&custom_ISForDofs[i]);CHKERRQ(ierr); 2981a81d60d8SStefano Zampini } 2982a81d60d8SStefano Zampini ierr = PetscFree(custom_ISForDofs);CHKERRQ(ierr); 2983a81d60d8SStefano Zampini } 29849c0446d6SStefano Zampini for(i=0;i<pcbddc->n_ISForDofs;i++) { 2985a81d60d8SStefano Zampini ierr = ISGetSize(pcbddc->ISForDofs[i],&k);CHKERRQ(ierr); 29869c0446d6SStefano Zampini ierr = ISGetIndices(pcbddc->ISForDofs[i],(const PetscInt**)&is_indices);CHKERRQ(ierr); 2987a81d60d8SStefano Zampini for(j=0;j<k;j++) { 29889c0446d6SStefano Zampini mat_graph->which_dof[is_indices[j]]=i; 29899c0446d6SStefano Zampini } 29909c0446d6SStefano Zampini ierr = ISRestoreIndices(pcbddc->ISForDofs[i],(const PetscInt**)&is_indices);CHKERRQ(ierr); 29919c0446d6SStefano Zampini } 2992a81d60d8SStefano Zampini /* use mat block size as vertex size if it has not yet set */ 2993a81d60d8SStefano Zampini if(!vertex_size) { 29943b03a366Sstefano_zampini ierr = MatGetBlockSize(matis->A,&vertex_size);CHKERRQ(ierr); 29950c7d97c5SJed Brown } 2996a81d60d8SStefano Zampini 29973b03a366Sstefano_zampini /* count number of neigh per node */ 29980c7d97c5SJed Brown total_counts=0; 29993b03a366Sstefano_zampini for(i=1;i<pcis->n_neigh;i++){ 30000c7d97c5SJed Brown s=pcis->n_shared[i]; 30010c7d97c5SJed Brown total_counts+=s; 300253cdbc3dSStefano Zampini for(j=0;j<s;j++){ 30030c7d97c5SJed Brown mat_graph->count[pcis->shared[i][j]] += 1; 30040c7d97c5SJed Brown } 30050c7d97c5SJed Brown } 3006534831adSStefano Zampini /* Take into account Neumann data -> it increments number of sharing subdomains for nodes lying on the interface */ 300736e030ebSStefano Zampini ierr = PCBDDCGetNeumannBoundaries(pc,&used_IS);CHKERRQ(ierr); 3008da1bb401SStefano Zampini ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr); 3009da1bb401SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 301036e030ebSStefano Zampini if(used_IS) { 301136e030ebSStefano Zampini ierr = ISGetSize(used_IS,&neumann_bsize);CHKERRQ(ierr); 301236e030ebSStefano Zampini ierr = ISGetIndices(used_IS,&neumann_nodes);CHKERRQ(ierr); 301353cdbc3dSStefano Zampini for(i=0;i<neumann_bsize;i++){ 301453cdbc3dSStefano Zampini iindex = neumann_nodes[i]; 3015534831adSStefano Zampini if(mat_graph->count[iindex] > NEUMANNCNT && array[iindex]==0.0){ 301653cdbc3dSStefano Zampini mat_graph->count[iindex]+=1; 30170c7d97c5SJed Brown total_counts++; 3018da1bb401SStefano Zampini array[iindex]=array[iindex]+1.0; 3019da1bb401SStefano Zampini } else if(array[iindex]>0.0) { 3020da1bb401SStefano Zampini SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"Error for neumann nodes provided to BDDC! They must be uniquely listed! Found duplicate node %d\n",iindex); 30210c7d97c5SJed Brown } 30220c7d97c5SJed Brown } 30230c7d97c5SJed Brown } 3024da1bb401SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 3025da1bb401SStefano Zampini /* allocate space for storing the set of neighbours for each node */ 3026da1bb401SStefano Zampini ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt*),&mat_graph->neighbours_set);CHKERRQ(ierr); 3027da1bb401SStefano Zampini if(mat_graph->nvtxs) { ierr = PetscMalloc(total_counts*sizeof(PetscInt),&mat_graph->neighbours_set[0]);CHKERRQ(ierr); } 3028da1bb401SStefano Zampini for(i=1;i<mat_graph->nvtxs;i++) mat_graph->neighbours_set[i]=mat_graph->neighbours_set[i-1]+mat_graph->count[i-1]; 3029a0ba757dSStefano Zampini ierr = PetscMemzero(mat_graph->count,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr); 30303b03a366Sstefano_zampini for(i=1;i<pcis->n_neigh;i++){ 30310c7d97c5SJed Brown s=pcis->n_shared[i]; 30320c7d97c5SJed Brown for(j=0;j<s;j++) { 30330c7d97c5SJed Brown k=pcis->shared[i][j]; 3034da1bb401SStefano Zampini mat_graph->neighbours_set[k][mat_graph->count[k]] = pcis->neigh[i]; 30350c7d97c5SJed Brown mat_graph->count[k]+=1; 30360c7d97c5SJed Brown } 30370c7d97c5SJed Brown } 3038da1bb401SStefano Zampini /* Check consistency of Neumann nodes */ 3039da1bb401SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 3040da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 3041da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 3042da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 3043da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 3044da1bb401SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 30453b03a366Sstefano_zampini /* set -1 fake neighbour to mimic Neumann boundary */ 304636e030ebSStefano Zampini if(used_IS) { 304753cdbc3dSStefano Zampini for(i=0;i<neumann_bsize;i++){ 304853cdbc3dSStefano Zampini iindex = neumann_nodes[i]; 3049534831adSStefano Zampini if(mat_graph->count[iindex] > NEUMANNCNT){ 3050da1bb401SStefano Zampini if(mat_graph->count[iindex]+1 != (PetscInt)array[iindex]) { 3051da1bb401SStefano Zampini SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_USER,"Neumann nodes provided to BDDC must be consistent among neighbours!\nNode %d: number of sharing subdomains %d != number of subdomains for which it is a neumann node %d\n",iindex,mat_graph->count[iindex]+1,(PetscInt)array[iindex]); 3052da1bb401SStefano Zampini } 3053da1bb401SStefano Zampini mat_graph->neighbours_set[iindex][mat_graph->count[iindex]] = -1; 305453cdbc3dSStefano Zampini mat_graph->count[iindex]+=1; 30550c7d97c5SJed Brown } 30560c7d97c5SJed Brown } 305736e030ebSStefano Zampini ierr = ISRestoreIndices(used_IS,&neumann_nodes);CHKERRQ(ierr); 30580c7d97c5SJed Brown } 3059da1bb401SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 3060da1bb401SStefano Zampini /* sort set of sharing subdomains */ 3061da1bb401SStefano Zampini for(i=0;i<mat_graph->nvtxs;i++) { ierr = PetscSortInt(mat_graph->count[i],mat_graph->neighbours_set[i]);CHKERRQ(ierr); } 30623b03a366Sstefano_zampini /* remove interior nodes and dirichlet boundary nodes from the next search into the graph */ 3063da1bb401SStefano Zampini for(i=0;i<mat_graph->nvtxs;i++){mat_graph->touched[i]=PETSC_FALSE;} 3064da1bb401SStefano Zampini nodes_touched=0; 306536e030ebSStefano Zampini ierr = PCBDDCGetDirichletBoundaries(pc,&used_IS);CHKERRQ(ierr); 3066da1bb401SStefano Zampini ierr = VecSet(pcis->vec2_N,0.0);CHKERRQ(ierr); 3067da1bb401SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 3068da1bb401SStefano Zampini ierr = VecGetArray(pcis->vec2_N,&array2);CHKERRQ(ierr); 3069da1bb401SStefano Zampini if(used_IS) { 3070da1bb401SStefano Zampini ierr = ISGetSize(used_IS,&dirichlet_bsize);CHKERRQ(ierr); 3071da1bb401SStefano Zampini if(dirichlet_bsize && matis->pure_neumann) { 3072da1bb401SStefano Zampini SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"Dirichlet boundaries are intended to be used with matrices with zeroed rows!\n"); 3073da1bb401SStefano Zampini } 3074da1bb401SStefano Zampini ierr = ISGetIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr); 3075da1bb401SStefano Zampini for(i=0;i<dirichlet_bsize;i++){ 3076da1bb401SStefano Zampini iindex=dirichlet_nodes[i]; 3077da1bb401SStefano Zampini if(mat_graph->count[iindex] && !mat_graph->touched[iindex]) { 3078da1bb401SStefano Zampini if(array[iindex]>0.0) { 3079da1bb401SStefano Zampini SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"BDDC cannot have nodes which are marked as Neumann and Dirichlet at the same time! Wrong node %d\n",iindex); 3080da1bb401SStefano Zampini } 3081da1bb401SStefano Zampini mat_graph->touched[iindex]=PETSC_TRUE; 3082da1bb401SStefano Zampini mat_graph->where[iindex]=0; 3083da1bb401SStefano Zampini nodes_touched++; 3084da1bb401SStefano Zampini array2[iindex]=array2[iindex]+1.0; 3085da1bb401SStefano Zampini } 3086da1bb401SStefano Zampini } 3087da1bb401SStefano Zampini ierr = ISRestoreIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr); 3088da1bb401SStefano Zampini } 3089da1bb401SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 3090da1bb401SStefano Zampini ierr = VecRestoreArray(pcis->vec2_N,&array2);CHKERRQ(ierr); 3091da1bb401SStefano Zampini /* Check consistency of Dirichlet nodes */ 3092da1bb401SStefano Zampini ierr = VecSet(pcis->vec1_N,1.0);CHKERRQ(ierr); 3093da1bb401SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 3094da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 3095da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 3096da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 3097da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 3098da1bb401SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 3099da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec2_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 3100da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec2_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 3101da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 3102da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 3103da1bb401SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 3104da1bb401SStefano Zampini ierr = VecGetArray(pcis->vec2_N,&array2);CHKERRQ(ierr); 310536e030ebSStefano Zampini if(used_IS) { 310636e030ebSStefano Zampini ierr = ISGetSize(used_IS,&dirichlet_bsize);CHKERRQ(ierr); 310736e030ebSStefano Zampini ierr = ISGetIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr); 31083b03a366Sstefano_zampini for(i=0;i<dirichlet_bsize;i++){ 3109da1bb401SStefano Zampini iindex=dirichlet_nodes[i]; 3110da1bb401SStefano Zampini if(array[iindex]>1.0 && array[iindex]!=array2[iindex] ) { 3111da1bb401SStefano Zampini SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_USER,"Dirichlet nodes provided to BDDC must be consistent among neighbours!\nNode %d: number of sharing subdomains %d != number of subdomains for which it is a neumann node %d\n",iindex,(PetscInt)array[iindex],(PetscInt)array2[iindex]); 3112da1bb401SStefano Zampini } 31133b03a366Sstefano_zampini } 311436e030ebSStefano Zampini ierr = ISRestoreIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr); 31153b03a366Sstefano_zampini } 3116da1bb401SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 3117da1bb401SStefano Zampini ierr = VecRestoreArray(pcis->vec2_N,&array2);CHKERRQ(ierr); 3118da1bb401SStefano Zampini 31190c7d97c5SJed Brown for(i=0;i<mat_graph->nvtxs;i++){ 31203b03a366Sstefano_zampini if(!mat_graph->count[i]){ /* interior nodes */ 31210c7d97c5SJed Brown mat_graph->touched[i]=PETSC_TRUE; 31220c7d97c5SJed Brown mat_graph->where[i]=0; 31230c7d97c5SJed Brown nodes_touched++; 31240c7d97c5SJed Brown } 31250c7d97c5SJed Brown } 31260c7d97c5SJed Brown mat_graph->ncmps = 0; 3127da1bb401SStefano Zampini i=0; 31280c7d97c5SJed Brown while(nodes_touched<mat_graph->nvtxs) { 3129a0ba757dSStefano Zampini /* find first untouched node in local ordering */ 31300c7d97c5SJed Brown while(mat_graph->touched[i]) i++; 31310c7d97c5SJed Brown mat_graph->touched[i]=PETSC_TRUE; 3132a0ba757dSStefano Zampini mat_graph->where[i]=where_values; 31330c7d97c5SJed Brown nodes_touched++; 3134a0ba757dSStefano Zampini /* now find all other nodes having the same set of sharing subdomains */ 31350c7d97c5SJed Brown for(j=i+1;j<mat_graph->nvtxs;j++){ 3136a0ba757dSStefano Zampini /* check for same number of sharing subdomains and dof number */ 3137da1bb401SStefano Zampini if(!mat_graph->touched[j] && mat_graph->count[i]==mat_graph->count[j] && mat_graph->which_dof[i] == mat_graph->which_dof[j] ){ 3138a0ba757dSStefano Zampini /* check for same set of sharing subdomains */ 31390c7d97c5SJed Brown same_set=PETSC_TRUE; 31400c7d97c5SJed Brown for(k=0;k<mat_graph->count[j];k++){ 3141da1bb401SStefano Zampini if(mat_graph->neighbours_set[i][k]!=mat_graph->neighbours_set[j][k]) { 31420c7d97c5SJed Brown same_set=PETSC_FALSE; 31430c7d97c5SJed Brown } 31440c7d97c5SJed Brown } 3145a0ba757dSStefano Zampini /* I found a friend of mine */ 31460c7d97c5SJed Brown if(same_set) { 3147a0ba757dSStefano Zampini mat_graph->where[j]=where_values; 31480c7d97c5SJed Brown mat_graph->touched[j]=PETSC_TRUE; 31490c7d97c5SJed Brown nodes_touched++; 31500c7d97c5SJed Brown } 31510c7d97c5SJed Brown } 31520c7d97c5SJed Brown } 3153a0ba757dSStefano Zampini where_values++; 31540c7d97c5SJed Brown } 3155a0ba757dSStefano Zampini where_values--; if(where_values<0) where_values=0; 3156a0ba757dSStefano Zampini ierr = PetscMalloc(where_values*sizeof(PetscMPIInt),&mat_graph->where_ncmps);CHKERRQ(ierr); 3157a0ba757dSStefano Zampini /* Find connected components defined on the shared interface */ 3158a0ba757dSStefano Zampini if(where_values) { 3159a0ba757dSStefano Zampini ierr = PCBDDCFindConnectedComponents(mat_graph, where_values); 31603b03a366Sstefano_zampini /* For consistency among neughbouring procs, I need to sort (by global ordering) each connected component */ 3161a0ba757dSStefano Zampini for(i=0;i<mat_graph->ncmps;i++) { 3162a0ba757dSStefano Zampini ierr = ISLocalToGlobalMappingApply(matis->mapping,mat_graph->cptr[i+1]-mat_graph->cptr[i],&mat_graph->queue[mat_graph->cptr[i]],&queue_in_global_numbering[mat_graph->cptr[i]]);CHKERRQ(ierr); 3163a0ba757dSStefano Zampini ierr = PetscSortIntWithArray(mat_graph->cptr[i+1]-mat_graph->cptr[i],&queue_in_global_numbering[mat_graph->cptr[i]],&mat_graph->queue[mat_graph->cptr[i]]);CHKERRQ(ierr); 3164a0ba757dSStefano Zampini } 3165a0ba757dSStefano Zampini } 3166a0ba757dSStefano Zampini /* check consistency of connected components among neighbouring subdomains -> it adapt them in case it is needed */ 3167a0ba757dSStefano Zampini for(i=0;i<where_values;i++) { 31683b03a366Sstefano_zampini /* We are not sure that two connected components will be the same among subdomains sharing a subset of local interface */ 31693b03a366Sstefano_zampini if(mat_graph->where_ncmps[i]>1) { 3170a0ba757dSStefano Zampini adapt_interface=1; 3171a0ba757dSStefano Zampini break; 3172a0ba757dSStefano Zampini } 3173a0ba757dSStefano Zampini } 3174a0ba757dSStefano Zampini ierr = MPI_Allreduce(&adapt_interface,&adapt_interface_reduced,1,MPIU_INT,MPI_LOR,interface_comm);CHKERRQ(ierr); 3175da1bb401SStefano Zampini if(pcbddc->dbg_flag && adapt_interface_reduced) { 3176da1bb401SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Interface adapted\n");CHKERRQ(ierr); 3177da1bb401SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 3178da1bb401SStefano Zampini } 3179a0ba757dSStefano Zampini if(where_values && adapt_interface_reduced) { 31800c7d97c5SJed Brown 3181a0ba757dSStefano Zampini PetscInt sum_requests=0,my_rank; 3182a0ba757dSStefano Zampini PetscInt buffer_size,start_of_recv,size_of_recv,start_of_send; 3183a0ba757dSStefano Zampini PetscInt temp_buffer_size,ins_val,global_where_counter; 3184a0ba757dSStefano Zampini PetscInt *cum_recv_counts; 3185a0ba757dSStefano Zampini PetscInt *where_to_nodes_indices; 3186a0ba757dSStefano Zampini PetscInt *petsc_buffer; 3187a0ba757dSStefano Zampini PetscMPIInt *recv_buffer; 3188a0ba757dSStefano Zampini PetscMPIInt *recv_buffer_where; 3189a0ba757dSStefano Zampini PetscMPIInt *send_buffer; 3190a0ba757dSStefano Zampini PetscMPIInt size_of_send; 3191a0ba757dSStefano Zampini PetscInt *sizes_of_sends; 3192a0ba757dSStefano Zampini MPI_Request *send_requests; 3193a0ba757dSStefano Zampini MPI_Request *recv_requests; 3194a0ba757dSStefano Zampini PetscInt *where_cc_adapt; 3195a0ba757dSStefano Zampini PetscInt **temp_buffer; 3196a0ba757dSStefano Zampini PetscInt *nodes_to_temp_buffer_indices; 3197a0ba757dSStefano Zampini PetscInt *add_to_where; 3198a0ba757dSStefano Zampini 3199a0ba757dSStefano Zampini ierr = MPI_Comm_rank(interface_comm,&my_rank);CHKERRQ(ierr); 3200a0ba757dSStefano Zampini ierr = PetscMalloc((where_values+1)*sizeof(PetscInt),&cum_recv_counts);CHKERRQ(ierr); 3201a0ba757dSStefano Zampini ierr = PetscMemzero(cum_recv_counts,(where_values+1)*sizeof(PetscInt));CHKERRQ(ierr); 3202a0ba757dSStefano Zampini ierr = PetscMalloc(where_values*sizeof(PetscInt),&where_to_nodes_indices);CHKERRQ(ierr); 3203a0ba757dSStefano Zampini /* first count how many neighbours per connected component I will receive from */ 3204a0ba757dSStefano Zampini cum_recv_counts[0]=0; 3205a0ba757dSStefano Zampini for(i=1;i<where_values+1;i++){ 3206a0ba757dSStefano Zampini j=0; 3207a0ba757dSStefano Zampini while(mat_graph->where[j] != i) j++; 3208a0ba757dSStefano Zampini where_to_nodes_indices[i-1]=j; 3209da1bb401SStefano Zampini if(mat_graph->neighbours_set[j][0]!=-1) { cum_recv_counts[i]=cum_recv_counts[i-1]+mat_graph->count[j]; } /* We don't want sends/recvs_to/from_self -> here I don't count myself */ 32103b03a366Sstefano_zampini else { cum_recv_counts[i]=cum_recv_counts[i-1]+mat_graph->count[j]-1; } 3211a0ba757dSStefano Zampini } 3212a0ba757dSStefano Zampini buffer_size=2*cum_recv_counts[where_values]+mat_graph->nvtxs; 3213a0ba757dSStefano Zampini ierr = PetscMalloc(2*cum_recv_counts[where_values]*sizeof(PetscMPIInt),&recv_buffer_where);CHKERRQ(ierr); 3214a0ba757dSStefano Zampini ierr = PetscMalloc(buffer_size*sizeof(PetscMPIInt),&send_buffer);CHKERRQ(ierr); 3215a0ba757dSStefano Zampini ierr = PetscMalloc(cum_recv_counts[where_values]*sizeof(MPI_Request),&send_requests);CHKERRQ(ierr); 3216a0ba757dSStefano Zampini ierr = PetscMalloc(cum_recv_counts[where_values]*sizeof(MPI_Request),&recv_requests);CHKERRQ(ierr); 3217a0ba757dSStefano Zampini for(i=0;i<cum_recv_counts[where_values];i++) { 3218a0ba757dSStefano Zampini send_requests[i]=MPI_REQUEST_NULL; 3219a0ba757dSStefano Zampini recv_requests[i]=MPI_REQUEST_NULL; 3220a0ba757dSStefano Zampini } 3221a0ba757dSStefano Zampini /* exchange with my neighbours the number of my connected components on the shared interface */ 3222a0ba757dSStefano Zampini for(i=0;i<where_values;i++){ 3223a0ba757dSStefano Zampini j=where_to_nodes_indices[i]; 3224da1bb401SStefano Zampini k = (mat_graph->neighbours_set[j][0] == -1 ? 1 : 0); 3225a0ba757dSStefano Zampini for(;k<mat_graph->count[j];k++){ 3226da1bb401SStefano Zampini ierr = MPI_Isend(&mat_graph->where_ncmps[i],1,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr); 3227da1bb401SStefano Zampini ierr = MPI_Irecv(&recv_buffer_where[sum_requests],1,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr); 3228a0ba757dSStefano Zampini sum_requests++; 3229a0ba757dSStefano Zampini } 3230a0ba757dSStefano Zampini } 3231a0ba757dSStefano Zampini ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 3232a0ba757dSStefano Zampini ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 3233a0ba757dSStefano Zampini /* determine the connected component I need to adapt */ 3234a0ba757dSStefano Zampini ierr = PetscMalloc(where_values*sizeof(PetscInt),&where_cc_adapt);CHKERRQ(ierr); 3235a0ba757dSStefano Zampini ierr = PetscMemzero(where_cc_adapt,where_values*sizeof(PetscInt));CHKERRQ(ierr); 3236a0ba757dSStefano Zampini for(i=0;i<where_values;i++){ 3237a0ba757dSStefano Zampini for(j=cum_recv_counts[i];j<cum_recv_counts[i+1];j++){ 32383b03a366Sstefano_zampini /* The first condition is natural (i.e someone has a different number of cc than me), the second one is just to be safe */ 32393b03a366Sstefano_zampini if( mat_graph->where_ncmps[i]!=recv_buffer_where[j] || mat_graph->where_ncmps[i] > 1 ) { 3240a0ba757dSStefano Zampini where_cc_adapt[i]=PETSC_TRUE; 3241a0ba757dSStefano Zampini break; 3242a0ba757dSStefano Zampini } 3243a0ba757dSStefano Zampini } 3244a0ba757dSStefano Zampini } 3245a0ba757dSStefano Zampini /* now get from neighbours their ccs (in global numbering) and adapt them (in case it is needed) */ 3246a0ba757dSStefano Zampini /* first determine how much data to send (size of each queue plus the global indices) and communicate it to neighbours */ 3247a0ba757dSStefano Zampini ierr = PetscMalloc(where_values*sizeof(PetscInt),&sizes_of_sends);CHKERRQ(ierr); 3248a0ba757dSStefano Zampini ierr = PetscMemzero(sizes_of_sends,where_values*sizeof(PetscInt));CHKERRQ(ierr); 3249a0ba757dSStefano Zampini sum_requests=0; 3250a0ba757dSStefano Zampini start_of_send=0; 3251a0ba757dSStefano Zampini start_of_recv=cum_recv_counts[where_values]; 3252a0ba757dSStefano Zampini for(i=0;i<where_values;i++) { 3253a0ba757dSStefano Zampini if(where_cc_adapt[i]) { 3254a0ba757dSStefano Zampini size_of_send=0; 3255a0ba757dSStefano Zampini for(j=i;j<mat_graph->ncmps;j++) { 3256a0ba757dSStefano Zampini if(mat_graph->where[mat_graph->queue[mat_graph->cptr[j]]] == i+1) { /* WARNING -> where values goes from 1 to where_values included */ 3257a0ba757dSStefano Zampini send_buffer[start_of_send+size_of_send]=mat_graph->cptr[j+1]-mat_graph->cptr[j]; 3258a0ba757dSStefano Zampini size_of_send+=1; 3259a0ba757dSStefano Zampini for(k=0;k<mat_graph->cptr[j+1]-mat_graph->cptr[j];k++) { 3260a0ba757dSStefano Zampini send_buffer[start_of_send+size_of_send+k]=queue_in_global_numbering[mat_graph->cptr[j]+k]; 3261a0ba757dSStefano Zampini } 3262a0ba757dSStefano Zampini size_of_send=size_of_send+mat_graph->cptr[j+1]-mat_graph->cptr[j]; 3263a0ba757dSStefano Zampini } 3264a0ba757dSStefano Zampini } 3265a0ba757dSStefano Zampini j = where_to_nodes_indices[i]; 3266da1bb401SStefano Zampini k = (mat_graph->neighbours_set[j][0] == -1 ? 1 : 0); 326711d8f4c2SStefano Zampini sizes_of_sends[i]=size_of_send; 3268a0ba757dSStefano Zampini for(;k<mat_graph->count[j];k++){ 326911d8f4c2SStefano Zampini ierr = MPI_Isend(&sizes_of_sends[i],1,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr); 3270da1bb401SStefano Zampini ierr = MPI_Irecv(&recv_buffer_where[sum_requests+start_of_recv],1,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr); 3271a0ba757dSStefano Zampini sum_requests++; 3272a0ba757dSStefano Zampini } 3273a0ba757dSStefano Zampini start_of_send+=size_of_send; 3274a0ba757dSStefano Zampini } 3275a0ba757dSStefano Zampini } 3276a0ba757dSStefano Zampini ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 3277a0ba757dSStefano Zampini ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 3278a0ba757dSStefano Zampini buffer_size=0; 3279a0ba757dSStefano Zampini for(k=0;k<sum_requests;k++) { buffer_size+=recv_buffer_where[start_of_recv+k]; } 3280a0ba757dSStefano Zampini ierr = PetscMalloc(buffer_size*sizeof(PetscMPIInt),&recv_buffer);CHKERRQ(ierr); 3281a0ba757dSStefano Zampini /* now exchange the data */ 3282a0ba757dSStefano Zampini start_of_recv=0; 3283a0ba757dSStefano Zampini start_of_send=0; 3284a0ba757dSStefano Zampini sum_requests=0; 3285a0ba757dSStefano Zampini for(i=0;i<where_values;i++) { 3286a0ba757dSStefano Zampini if(where_cc_adapt[i]) { 3287a0ba757dSStefano Zampini size_of_send = sizes_of_sends[i]; 3288a0ba757dSStefano Zampini j = where_to_nodes_indices[i]; 3289da1bb401SStefano Zampini k = (mat_graph->neighbours_set[j][0] == -1 ? 1 : 0); 3290a0ba757dSStefano Zampini for(;k<mat_graph->count[j];k++){ 3291da1bb401SStefano Zampini ierr = MPI_Isend(&send_buffer[start_of_send],size_of_send,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr); 3292a0ba757dSStefano Zampini size_of_recv=recv_buffer_where[cum_recv_counts[where_values]+sum_requests]; 3293da1bb401SStefano Zampini ierr = MPI_Irecv(&recv_buffer[start_of_recv],size_of_recv,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr); 3294a0ba757dSStefano Zampini start_of_recv+=size_of_recv; 3295a0ba757dSStefano Zampini sum_requests++; 3296a0ba757dSStefano Zampini } 3297a0ba757dSStefano Zampini start_of_send+=size_of_send; 3298a0ba757dSStefano Zampini } 3299a0ba757dSStefano Zampini } 3300a0ba757dSStefano Zampini ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 3301a0ba757dSStefano Zampini ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 3302a0ba757dSStefano Zampini ierr = PetscMalloc(buffer_size*sizeof(PetscInt),&petsc_buffer);CHKERRQ(ierr); 3303a0ba757dSStefano Zampini for(k=0;k<start_of_recv;k++) { petsc_buffer[k]=(PetscInt)recv_buffer[k]; } 3304a0ba757dSStefano Zampini for(j=0;j<buffer_size;) { 3305a0ba757dSStefano Zampini ierr = ISGlobalToLocalMappingApply(matis->mapping,IS_GTOLM_MASK,petsc_buffer[j],&petsc_buffer[j+1],&petsc_buffer[j],&petsc_buffer[j+1]);CHKERRQ(ierr); 3306a0ba757dSStefano Zampini k=petsc_buffer[j]+1; 3307a0ba757dSStefano Zampini j+=k; 3308a0ba757dSStefano Zampini } 3309a0ba757dSStefano Zampini sum_requests=cum_recv_counts[where_values]; 3310a0ba757dSStefano Zampini start_of_recv=0; 3311a0ba757dSStefano Zampini ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt),&nodes_to_temp_buffer_indices);CHKERRQ(ierr); 3312a0ba757dSStefano Zampini global_where_counter=0; 3313a0ba757dSStefano Zampini for(i=0;i<where_values;i++){ 3314a0ba757dSStefano Zampini if(where_cc_adapt[i]){ 3315a0ba757dSStefano Zampini temp_buffer_size=0; 3316a0ba757dSStefano Zampini /* find nodes on the shared interface we need to adapt */ 3317a0ba757dSStefano Zampini for(j=0;j<mat_graph->nvtxs;j++){ 3318a0ba757dSStefano Zampini if(mat_graph->where[j]==i+1) { 3319a0ba757dSStefano Zampini nodes_to_temp_buffer_indices[j]=temp_buffer_size; 3320a0ba757dSStefano Zampini temp_buffer_size++; 3321a0ba757dSStefano Zampini } else { 3322a0ba757dSStefano Zampini nodes_to_temp_buffer_indices[j]=-1; 3323a0ba757dSStefano Zampini } 3324a0ba757dSStefano Zampini } 3325a0ba757dSStefano Zampini /* allocate some temporary space */ 3326a0ba757dSStefano Zampini ierr = PetscMalloc(temp_buffer_size*sizeof(PetscInt*),&temp_buffer);CHKERRQ(ierr); 3327a0ba757dSStefano Zampini ierr = PetscMalloc(temp_buffer_size*(cum_recv_counts[i+1]-cum_recv_counts[i])*sizeof(PetscInt),&temp_buffer[0]);CHKERRQ(ierr); 3328a0ba757dSStefano Zampini ierr = PetscMemzero(temp_buffer[0],temp_buffer_size*(cum_recv_counts[i+1]-cum_recv_counts[i])*sizeof(PetscInt));CHKERRQ(ierr); 3329a0ba757dSStefano Zampini for(j=1;j<temp_buffer_size;j++){ 3330a0ba757dSStefano Zampini temp_buffer[j]=temp_buffer[j-1]+cum_recv_counts[i+1]-cum_recv_counts[i]; 3331a0ba757dSStefano Zampini } 3332a0ba757dSStefano Zampini /* analyze contributions from neighbouring subdomains for i-th conn comp 3333a0ba757dSStefano Zampini temp buffer structure: 3334a0ba757dSStefano Zampini supposing part of the interface has dimension 5 (global nodes 0,1,2,3,4) 3335a0ba757dSStefano Zampini 3 neighs procs with structured connected components: 3336a0ba757dSStefano Zampini neigh 0: [0 1 4], [2 3]; (2 connected components) 3337a0ba757dSStefano Zampini neigh 1: [0 1], [2 3 4]; (2 connected components) 3338a0ba757dSStefano Zampini neigh 2: [0 4], [1], [2 3]; (3 connected components) 3339a0ba757dSStefano Zampini tempbuffer (row-oriented) should be filled as: 3340a0ba757dSStefano Zampini [ 0, 0, 0; 3341a0ba757dSStefano Zampini 0, 0, 1; 3342a0ba757dSStefano Zampini 1, 1, 2; 3343a0ba757dSStefano Zampini 1, 1, 2; 3344a0ba757dSStefano Zampini 0, 1, 0; ]; 3345a0ba757dSStefano Zampini This way we can simply recover the resulting structure account for possible intersections of ccs among neighs. 3346a0ba757dSStefano Zampini The mat_graph->where array will be modified to reproduce the following 4 connected components [0], [1], [2 3], [4]; 3347a0ba757dSStefano Zampini */ 3348a0ba757dSStefano Zampini for(j=0;j<cum_recv_counts[i+1]-cum_recv_counts[i];j++) { 3349a0ba757dSStefano Zampini ins_val=0; 3350a0ba757dSStefano Zampini size_of_recv=recv_buffer_where[sum_requests]; /* total size of recv from neighs */ 3351a0ba757dSStefano Zampini for(buffer_size=0;buffer_size<size_of_recv;) { /* loop until all data from neighs has been taken into account */ 3352a0ba757dSStefano Zampini for(k=1;k<petsc_buffer[buffer_size+start_of_recv]+1;k++) { /* filling properly temp_buffer using data from a single recv */ 3353a0ba757dSStefano Zampini temp_buffer[ nodes_to_temp_buffer_indices[ petsc_buffer[ start_of_recv+buffer_size+k ] ] ][j]=ins_val; 3354a0ba757dSStefano Zampini } 3355a0ba757dSStefano Zampini buffer_size+=k; 3356a0ba757dSStefano Zampini ins_val++; 3357a0ba757dSStefano Zampini } 3358a0ba757dSStefano Zampini start_of_recv+=size_of_recv; 3359a0ba757dSStefano Zampini sum_requests++; 3360a0ba757dSStefano Zampini } 3361a0ba757dSStefano Zampini ierr = PetscMalloc(temp_buffer_size*sizeof(PetscInt),&add_to_where);CHKERRQ(ierr); 3362a0ba757dSStefano Zampini ierr = PetscMemzero(add_to_where,temp_buffer_size*sizeof(PetscInt));CHKERRQ(ierr); 3363a0ba757dSStefano Zampini for(j=0;j<temp_buffer_size;j++){ 3364a0ba757dSStefano Zampini if(!add_to_where[j]){ /* found a new cc */ 3365a0ba757dSStefano Zampini global_where_counter++; 3366a0ba757dSStefano Zampini add_to_where[j]=global_where_counter; 3367a0ba757dSStefano Zampini for(k=j+1;k<temp_buffer_size;k++){ /* check for other nodes in new cc */ 3368a0ba757dSStefano Zampini same_set=PETSC_TRUE; 3369a0ba757dSStefano Zampini for(s=0;s<cum_recv_counts[i+1]-cum_recv_counts[i];s++){ 3370a0ba757dSStefano Zampini if(temp_buffer[j][s]!=temp_buffer[k][s]) { 3371a0ba757dSStefano Zampini same_set=PETSC_FALSE; 3372a0ba757dSStefano Zampini break; 3373a0ba757dSStefano Zampini } 3374a0ba757dSStefano Zampini } 3375a0ba757dSStefano Zampini if(same_set) add_to_where[k]=global_where_counter; 3376a0ba757dSStefano Zampini } 3377a0ba757dSStefano Zampini } 3378a0ba757dSStefano Zampini } 3379a0ba757dSStefano Zampini /* insert new data in where array */ 3380a0ba757dSStefano Zampini temp_buffer_size=0; 3381a0ba757dSStefano Zampini for(j=0;j<mat_graph->nvtxs;j++){ 3382a0ba757dSStefano Zampini if(mat_graph->where[j]==i+1) { 3383a0ba757dSStefano Zampini mat_graph->where[j]=where_values+add_to_where[temp_buffer_size]; 3384a0ba757dSStefano Zampini temp_buffer_size++; 3385a0ba757dSStefano Zampini } 3386a0ba757dSStefano Zampini } 3387a0ba757dSStefano Zampini ierr = PetscFree(temp_buffer[0]);CHKERRQ(ierr); 3388a0ba757dSStefano Zampini ierr = PetscFree(temp_buffer);CHKERRQ(ierr); 3389a0ba757dSStefano Zampini ierr = PetscFree(add_to_where);CHKERRQ(ierr); 3390a0ba757dSStefano Zampini } 3391a0ba757dSStefano Zampini } 3392a0ba757dSStefano Zampini ierr = PetscFree(nodes_to_temp_buffer_indices);CHKERRQ(ierr); 3393a0ba757dSStefano Zampini ierr = PetscFree(sizes_of_sends);CHKERRQ(ierr); 3394a0ba757dSStefano Zampini ierr = PetscFree(send_requests);CHKERRQ(ierr); 3395a0ba757dSStefano Zampini ierr = PetscFree(recv_requests);CHKERRQ(ierr); 3396a0ba757dSStefano Zampini ierr = PetscFree(petsc_buffer);CHKERRQ(ierr); 3397a0ba757dSStefano Zampini ierr = PetscFree(recv_buffer);CHKERRQ(ierr); 3398a0ba757dSStefano Zampini ierr = PetscFree(recv_buffer_where);CHKERRQ(ierr); 3399a0ba757dSStefano Zampini ierr = PetscFree(send_buffer);CHKERRQ(ierr); 3400a0ba757dSStefano Zampini ierr = PetscFree(cum_recv_counts);CHKERRQ(ierr); 3401a0ba757dSStefano Zampini ierr = PetscFree(where_to_nodes_indices);CHKERRQ(ierr); 3402*23d4d1a5SStefano Zampini ierr = PetscFree(where_cc_adapt);CHKERRQ(ierr); 3403a0ba757dSStefano Zampini /* We are ready to evaluate consistent connected components on each part of the shared interface */ 3404a0ba757dSStefano Zampini if(global_where_counter) { 3405a0ba757dSStefano Zampini for(i=0;i<mat_graph->nvtxs;i++){ mat_graph->touched[i]=PETSC_FALSE; } 3406a0ba757dSStefano Zampini global_where_counter=0; 3407a0ba757dSStefano Zampini for(i=0;i<mat_graph->nvtxs;i++){ 3408a0ba757dSStefano Zampini if(mat_graph->where[i] && !mat_graph->touched[i]) { 3409a0ba757dSStefano Zampini global_where_counter++; 3410a0ba757dSStefano Zampini for(j=i+1;j<mat_graph->nvtxs;j++){ 3411a0ba757dSStefano Zampini if(!mat_graph->touched[j] && mat_graph->where[j]==mat_graph->where[i]) { 3412a0ba757dSStefano Zampini mat_graph->where[j]=global_where_counter; 3413a0ba757dSStefano Zampini mat_graph->touched[j]=PETSC_TRUE; 3414a0ba757dSStefano Zampini } 3415a0ba757dSStefano Zampini } 3416a0ba757dSStefano Zampini mat_graph->where[i]=global_where_counter; 3417a0ba757dSStefano Zampini mat_graph->touched[i]=PETSC_TRUE; 3418a0ba757dSStefano Zampini } 3419a0ba757dSStefano Zampini } 3420a0ba757dSStefano Zampini where_values=global_where_counter; 3421a0ba757dSStefano Zampini } 3422a0ba757dSStefano Zampini if(global_where_counter) { 3423a0ba757dSStefano Zampini ierr = PetscMemzero(mat_graph->cptr,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr); 3424a0ba757dSStefano Zampini ierr = PetscMemzero(mat_graph->queue,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr); 3425a0ba757dSStefano Zampini ierr = PetscFree(mat_graph->where_ncmps);CHKERRQ(ierr); 3426a0ba757dSStefano Zampini ierr = PetscMalloc(where_values*sizeof(PetscMPIInt),&mat_graph->where_ncmps);CHKERRQ(ierr); 3427a0ba757dSStefano Zampini ierr = PCBDDCFindConnectedComponents(mat_graph, where_values); 3428a0ba757dSStefano Zampini for(i=0;i<mat_graph->ncmps;i++) { 3429a0ba757dSStefano Zampini ierr = ISLocalToGlobalMappingApply(matis->mapping,mat_graph->cptr[i+1]-mat_graph->cptr[i],&mat_graph->queue[mat_graph->cptr[i]],&queue_in_global_numbering[mat_graph->cptr[i]]);CHKERRQ(ierr); 3430a0ba757dSStefano Zampini ierr = PetscSortIntWithArray(mat_graph->cptr[i+1]-mat_graph->cptr[i],&queue_in_global_numbering[mat_graph->cptr[i]],&mat_graph->queue[mat_graph->cptr[i]]);CHKERRQ(ierr); 3431a0ba757dSStefano Zampini } 3432a0ba757dSStefano Zampini } 34333b03a366Sstefano_zampini } /* Finished adapting interface */ 34340c7d97c5SJed Brown PetscInt nfc=0; 34350c7d97c5SJed Brown PetscInt nec=0; 34360c7d97c5SJed Brown PetscInt nvc=0; 34373b03a366Sstefano_zampini PetscBool twodim_flag=PETSC_FALSE; 34380c7d97c5SJed Brown for (i=0; i<mat_graph->ncmps; i++) { 34393b03a366Sstefano_zampini if( mat_graph->cptr[i+1]-mat_graph->cptr[i] > vertex_size ){ 3440534831adSStefano Zampini if(mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]==1){ /* 1 neigh Neumann fake included */ 34410c7d97c5SJed Brown nfc++; 34423b03a366Sstefano_zampini } else { /* note that nec will be zero in 2d */ 34433b03a366Sstefano_zampini nec++; 34443b03a366Sstefano_zampini } 34450c7d97c5SJed Brown } else { 34463b03a366Sstefano_zampini nvc+=mat_graph->cptr[i+1]-mat_graph->cptr[i]; 34473b03a366Sstefano_zampini } 34483b03a366Sstefano_zampini } 34493b03a366Sstefano_zampini 34503b03a366Sstefano_zampini if(!nec) { /* we are in a 2d case -> no faces, only edges */ 34513b03a366Sstefano_zampini nec = nfc; 34523b03a366Sstefano_zampini nfc = 0; 34533b03a366Sstefano_zampini twodim_flag = PETSC_TRUE; 34543b03a366Sstefano_zampini } 34553b03a366Sstefano_zampini /* allocate IS arrays for faces, edges. Vertices need a single index set. 34563b03a366Sstefano_zampini Reusing space allocated in mat_graph->where for creating IS objects */ 34573b03a366Sstefano_zampini if(!pcbddc->vertices_flag && !pcbddc->edges_flag) { 34583b03a366Sstefano_zampini ierr = PetscMalloc(nfc*sizeof(IS),&pcbddc->ISForFaces);CHKERRQ(ierr); 34593b03a366Sstefano_zampini use_faces=PETSC_TRUE; 34603b03a366Sstefano_zampini } 34613b03a366Sstefano_zampini if(!pcbddc->vertices_flag && !pcbddc->faces_flag) { 34623b03a366Sstefano_zampini ierr = PetscMalloc(nec*sizeof(IS),&pcbddc->ISForEdges);CHKERRQ(ierr); 34633b03a366Sstefano_zampini use_edges=PETSC_TRUE; 34643b03a366Sstefano_zampini } 34653b03a366Sstefano_zampini nfc=0; 34663b03a366Sstefano_zampini nec=0; 34673b03a366Sstefano_zampini for (i=0; i<mat_graph->ncmps; i++) { 34683b03a366Sstefano_zampini if( mat_graph->cptr[i+1]-mat_graph->cptr[i] > vertex_size ){ 34693b03a366Sstefano_zampini for(j=0;j<mat_graph->cptr[i+1]-mat_graph->cptr[i];j++) { 34703b03a366Sstefano_zampini mat_graph->where[j]=mat_graph->queue[mat_graph->cptr[i]+j]; 34713b03a366Sstefano_zampini } 34723b03a366Sstefano_zampini if(mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]==1){ 34733b03a366Sstefano_zampini if(twodim_flag) { 34743b03a366Sstefano_zampini if(use_edges) { 34753b03a366Sstefano_zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,j,mat_graph->where,PETSC_COPY_VALUES,&pcbddc->ISForEdges[nec]);CHKERRQ(ierr); 34763b03a366Sstefano_zampini nec++; 34773b03a366Sstefano_zampini } 34783b03a366Sstefano_zampini } else { 34793b03a366Sstefano_zampini if(use_faces) { 34803b03a366Sstefano_zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,j,mat_graph->where,PETSC_COPY_VALUES,&pcbddc->ISForFaces[nfc]);CHKERRQ(ierr); 34813b03a366Sstefano_zampini nfc++; 34823b03a366Sstefano_zampini } 34833b03a366Sstefano_zampini } 34843b03a366Sstefano_zampini } else { 34853b03a366Sstefano_zampini if(use_edges) { 34863b03a366Sstefano_zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,j,mat_graph->where,PETSC_COPY_VALUES,&pcbddc->ISForEdges[nec]);CHKERRQ(ierr); 34870c7d97c5SJed Brown nec++; 34880c7d97c5SJed Brown } 34890c7d97c5SJed Brown } 34900c7d97c5SJed Brown } 34913b03a366Sstefano_zampini } 34923b03a366Sstefano_zampini pcbddc->n_ISForFaces=nfc; 34933b03a366Sstefano_zampini pcbddc->n_ISForEdges=nec; 34943b03a366Sstefano_zampini nvc=0; 34950c7d97c5SJed Brown if( !pcbddc->constraints_flag ) { 34963b03a366Sstefano_zampini for (i=0; i<mat_graph->ncmps; i++) { 34973b03a366Sstefano_zampini if( mat_graph->cptr[i+1]-mat_graph->cptr[i] <= vertex_size ){ 34983b03a366Sstefano_zampini for( j=mat_graph->cptr[i];j<mat_graph->cptr[i+1];j++) { 34993b03a366Sstefano_zampini mat_graph->where[nvc]=mat_graph->queue[j]; 35000c7d97c5SJed Brown nvc++; 35010c7d97c5SJed Brown } 35020c7d97c5SJed Brown } 35030c7d97c5SJed Brown } 35040c7d97c5SJed Brown } 3505a0ba757dSStefano Zampini /* sort vertex set (by local ordering) */ 35063b03a366Sstefano_zampini ierr = PetscSortInt(nvc,mat_graph->where);CHKERRQ(ierr); 35073b03a366Sstefano_zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,nvc,mat_graph->where,PETSC_COPY_VALUES,&pcbddc->ISForVertices);CHKERRQ(ierr); 35080c7d97c5SJed Brown 3509e269702eSStefano Zampini if(pcbddc->dbg_flag) { 3510e269702eSStefano Zampini 3511d49ef151SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr); 3512d49ef151SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Details from PCBDDCManageLocalBoundaries for subdomain %04d\n",PetscGlobalRank);CHKERRQ(ierr); 3513d49ef151SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr); 3514a0ba757dSStefano Zampini /* ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Graph (adjacency structure) of local Neumann mat\n");CHKERRQ(ierr); 3515a0ba757dSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr); 3516e269702eSStefano Zampini for(i=0;i<mat_graph->nvtxs;i++) { 3517a0ba757dSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Nodes connected to node number %d are %d\n",i,mat_graph->xadj[i+1]-mat_graph->xadj[i]);CHKERRQ(ierr); 3518e269702eSStefano Zampini for(j=mat_graph->xadj[i];j<mat_graph->xadj[i+1];j++){ 3519a0ba757dSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d ",mat_graph->adjncy[j]);CHKERRQ(ierr); 3520e269702eSStefano Zampini } 3521a0ba757dSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n--------------------------------------------------------------\n");CHKERRQ(ierr); 3522da1bb401SStefano Zampini }*/ 3523d49ef151SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Matrix graph has %d connected components", mat_graph->ncmps);CHKERRQ(ierr); 35240c7d97c5SJed Brown for(i=0;i<mat_graph->ncmps;i++) { 35253b03a366Sstefano_zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\nDetails for connected component number %02d: size %04d, count %01d. Nodes follow.\n", 35263b03a366Sstefano_zampini i,mat_graph->cptr[i+1]-mat_graph->cptr[i],mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]);CHKERRQ(ierr); 3527da1bb401SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"subdomains: "); 3528da1bb401SStefano Zampini for (j=0;j<mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]; j++) { 3529da1bb401SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d ",mat_graph->neighbours_set[mat_graph->queue[mat_graph->cptr[i]]][j]); 3530da1bb401SStefano Zampini } 3531da1bb401SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n"); 35320c7d97c5SJed Brown for (j=mat_graph->cptr[i]; j<mat_graph->cptr[i+1]; j++){ 3533da1bb401SStefano Zampini /* ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d (%d), ",queue_in_global_numbering[j],mat_graph->queue[j]);CHKERRQ(ierr); */ 3534da1bb401SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d, ",mat_graph->queue[j]);CHKERRQ(ierr); 35350c7d97c5SJed Brown } 35360c7d97c5SJed Brown } 3537da1bb401SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n--------------------------------------------------------------\n");CHKERRQ(ierr); 35383b03a366Sstefano_zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local vertices\n",PetscGlobalRank,nvc);CHKERRQ(ierr); 35393b03a366Sstefano_zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local faces\n",PetscGlobalRank,nfc);CHKERRQ(ierr); 35403b03a366Sstefano_zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local edges\n",PetscGlobalRank,nec);CHKERRQ(ierr); 3541d49ef151SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 35420c7d97c5SJed Brown } 35430c7d97c5SJed Brown 3544a0ba757dSStefano Zampini /* Free graph structure */ 35450c7d97c5SJed Brown if(mat_graph->nvtxs){ 3546a0ba757dSStefano Zampini ierr = PetscFree4(mat_graph->where,mat_graph->count,mat_graph->cptr,mat_graph->queue);CHKERRQ(ierr); 3547a0ba757dSStefano Zampini ierr = PetscFree3(mat_graph->which_dof,mat_graph->touched,queue_in_global_numbering);CHKERRQ(ierr); 3548a0ba757dSStefano Zampini ierr = PetscFree(mat_graph->where_ncmps);CHKERRQ(ierr); 35490c7d97c5SJed Brown } 35500c7d97c5SJed Brown 35510c7d97c5SJed Brown PetscFunctionReturn(0); 35520c7d97c5SJed Brown 35530c7d97c5SJed Brown } 35540c7d97c5SJed Brown 35550c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 35560c7d97c5SJed Brown 35570c7d97c5SJed Brown /* The following code has been adapted from function IsConnectedSubdomain contained 3558da1bb401SStefano Zampini in source file contig.c of METIS library (version 5.0.1) 3559da1bb401SStefano Zampini It finds connected components of each partition labeled from 1 to n_dist */ 35600c7d97c5SJed Brown 35610c7d97c5SJed Brown #undef __FUNCT__ 35620c7d97c5SJed Brown #define __FUNCT__ "PCBDDCFindConnectedComponents" 35639c0446d6SStefano Zampini static PetscErrorCode PCBDDCFindConnectedComponents(PCBDDCGraph graph, PetscInt n_dist ) 35640c7d97c5SJed Brown { 35650c7d97c5SJed Brown PetscInt i, j, k, nvtxs, first, last, nleft, ncmps,pid,cum_queue,n,ncmps_pid; 35660c7d97c5SJed Brown PetscInt *xadj, *adjncy, *where, *queue; 35670c7d97c5SJed Brown PetscInt *cptr; 35680c7d97c5SJed Brown PetscBool *touched; 35690c7d97c5SJed Brown 35700c7d97c5SJed Brown PetscFunctionBegin; 35710c7d97c5SJed Brown 35720c7d97c5SJed Brown nvtxs = graph->nvtxs; 35730c7d97c5SJed Brown xadj = graph->xadj; 35740c7d97c5SJed Brown adjncy = graph->adjncy; 35750c7d97c5SJed Brown where = graph->where; 35760c7d97c5SJed Brown touched = graph->touched; 35770c7d97c5SJed Brown queue = graph->queue; 35780c7d97c5SJed Brown cptr = graph->cptr; 35790c7d97c5SJed Brown 35800c7d97c5SJed Brown for (i=0; i<nvtxs; i++) 35810c7d97c5SJed Brown touched[i] = PETSC_FALSE; 35820c7d97c5SJed Brown 35830c7d97c5SJed Brown cum_queue=0; 35840c7d97c5SJed Brown ncmps=0; 35850c7d97c5SJed Brown 35860c7d97c5SJed Brown for(n=0; n<n_dist; n++) { 3587da1bb401SStefano Zampini pid = n+1; /* partition labeled by 0 is discarded */ 35880c7d97c5SJed Brown nleft = 0; 35890c7d97c5SJed Brown for (i=0; i<nvtxs; i++) { 35900c7d97c5SJed Brown if (where[i] == pid) 35910c7d97c5SJed Brown nleft++; 35920c7d97c5SJed Brown } 35930c7d97c5SJed Brown for (i=0; i<nvtxs; i++) { 35940c7d97c5SJed Brown if (where[i] == pid) 35950c7d97c5SJed Brown break; 35960c7d97c5SJed Brown } 35970c7d97c5SJed Brown touched[i] = PETSC_TRUE; 35980c7d97c5SJed Brown queue[cum_queue] = i; 35990c7d97c5SJed Brown first = 0; last = 1; 36000c7d97c5SJed Brown cptr[ncmps] = cum_queue; /* This actually points to queue */ 36010c7d97c5SJed Brown ncmps_pid = 0; 36020c7d97c5SJed Brown while (first != nleft) { 36030c7d97c5SJed Brown if (first == last) { /* Find another starting vertex */ 36040c7d97c5SJed Brown cptr[++ncmps] = first+cum_queue; 36050c7d97c5SJed Brown ncmps_pid++; 36060c7d97c5SJed Brown for (i=0; i<nvtxs; i++) { 36070c7d97c5SJed Brown if (where[i] == pid && !touched[i]) 36080c7d97c5SJed Brown break; 36090c7d97c5SJed Brown } 36100c7d97c5SJed Brown queue[cum_queue+last] = i; 36110c7d97c5SJed Brown last++; 36120c7d97c5SJed Brown touched[i] = PETSC_TRUE; 36130c7d97c5SJed Brown } 36140c7d97c5SJed Brown i = queue[cum_queue+first]; 36150c7d97c5SJed Brown first++; 36160c7d97c5SJed Brown for (j=xadj[i]; j<xadj[i+1]; j++) { 36170c7d97c5SJed Brown k = adjncy[j]; 36180c7d97c5SJed Brown if (where[k] == pid && !touched[k]) { 36190c7d97c5SJed Brown queue[cum_queue+last] = k; 36200c7d97c5SJed Brown last++; 36210c7d97c5SJed Brown touched[k] = PETSC_TRUE; 36220c7d97c5SJed Brown } 36230c7d97c5SJed Brown } 36240c7d97c5SJed Brown } 36250c7d97c5SJed Brown cptr[++ncmps] = first+cum_queue; 36260c7d97c5SJed Brown ncmps_pid++; 36270c7d97c5SJed Brown cum_queue=cptr[ncmps]; 3628a0ba757dSStefano Zampini graph->where_ncmps[n] = ncmps_pid; 36290c7d97c5SJed Brown } 36300c7d97c5SJed Brown graph->ncmps = ncmps; 36310c7d97c5SJed Brown 36320c7d97c5SJed Brown PetscFunctionReturn(0); 36330c7d97c5SJed Brown } 36340c7d97c5SJed Brown 3635