/* TODOLIST
   DofSplitting and DM attached to pc?
   Change SetNeumannBoundaries to SetNeumannBoundariesLocal and provide new SetNeumannBoundaries (same for Dirichlet)
   Exact solvers: Solve local saddle point directly
     - change prec_type to switch_inexact_prec_type
     - add bool solve_exact_saddle_point slot to pcbddc data
   Inexact solvers: global preconditioner application is ready, ask the developers (Jed?) how to best implement Dohrmann's approach (PCSHELL?)
   change how to deal with the coarse problem (PCBDDCSetCoarseEnvironment):
     - mind the problem with coarsening_factor
     - simplify coarse problem structure -> PCBDDC or PCREDUNDANT, nothing else -> same comm for all levels?
     - remove coarse enums and allow use of PCBDDCGetCoarseKSP
     - remove metis dependency -> use MatPartitioning for multilevel -> Assemble serial adjacency in ManageLocalBoundaries?
     - Add levels' slot to bddc data structure and associated Set/Get functions
   code refactoring:
     - pick better names for static functions
   change options structure:
     - insert BDDC into MG framework?
   provide other ops? Ask the developers
   remove all unused printf
   man pages
*/

/* ----------------------------------------------------------------------------------------------------------------------------------------------
   Implementation of BDDC preconditioner based on:
   C.
Dohrmann "An approximate BDDC preconditioner", Numerical Linear Algebra with Applications Volume 14, Issue 2, pages 149-168, March 2007 2653cdbc3dSStefano Zampini ---------------------------------------------------------------------------------------------------------------------------------------------- */ 2753cdbc3dSStefano Zampini 2853cdbc3dSStefano Zampini #include "bddc.h" /*I "petscpc.h" I*/ /* includes for fortran wrappers */ 293b03a366Sstefano_zampini #include <petscblaslapack.h> 300c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 310c7d97c5SJed Brown #undef __FUNCT__ 320c7d97c5SJed Brown #define __FUNCT__ "PCSetFromOptions_BDDC" 330c7d97c5SJed Brown PetscErrorCode PCSetFromOptions_BDDC(PC pc) 340c7d97c5SJed Brown { 350c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 360c7d97c5SJed Brown PetscErrorCode ierr; 370c7d97c5SJed Brown 380c7d97c5SJed Brown PetscFunctionBegin; 390c7d97c5SJed Brown ierr = PetscOptionsHead("BDDC options");CHKERRQ(ierr); 400c7d97c5SJed Brown /* Verbose debugging of main data structures */ 41e269702eSStefano Zampini ierr = PetscOptionsBool("-pc_bddc_check_all" ,"Verbose (debugging) output for PCBDDC" ,"none",pcbddc->dbg_flag ,&pcbddc->dbg_flag ,PETSC_NULL);CHKERRQ(ierr); 420c7d97c5SJed Brown /* Some customization for default primal space */ 43da1bb401SStefano Zampini ierr = PetscOptionsBool("-pc_bddc_vertices_only" ,"Use only vertices in coarse space (i.e. discard constraints)","none",pcbddc->vertices_flag ,&pcbddc->vertices_flag ,PETSC_NULL);CHKERRQ(ierr); 44da1bb401SStefano Zampini ierr = PetscOptionsBool("-pc_bddc_constraints_only","Use only constraints in coarse space (i.e. discard vertices)","none",pcbddc->constraints_flag,&pcbddc->constraints_flag,PETSC_NULL);CHKERRQ(ierr); 45da1bb401SStefano Zampini ierr = PetscOptionsBool("-pc_bddc_faces_only" ,"Use only faces among constraints of coarse space (i.e. 
discard edges)" ,"none",pcbddc->faces_flag ,&pcbddc->faces_flag ,PETSC_NULL);CHKERRQ(ierr); 46da1bb401SStefano Zampini ierr = PetscOptionsBool("-pc_bddc_edges_only" ,"Use only edges among constraints of coarse space (i.e. discard faces)" ,"none",pcbddc->edges_flag ,&pcbddc->edges_flag ,PETSC_NULL);CHKERRQ(ierr); 470c7d97c5SJed Brown /* Coarse solver context */ 48da1bb401SStefano Zampini static const char *avail_coarse_problems[] = {"sequential","replicated","parallel","multilevel",""}; /*order of choiches depends on ENUM defined in bddc.h */ 490c7d97c5SJed Brown ierr = PetscOptionsEnum("-pc_bddc_coarse_problem_type","Set coarse problem type","none",avail_coarse_problems,(PetscEnum)pcbddc->coarse_problem_type,(PetscEnum*)&pcbddc->coarse_problem_type,PETSC_NULL);CHKERRQ(ierr); 500c7d97c5SJed Brown /* Two different application of BDDC to the whole set of dofs, internal and interface */ 510c7d97c5SJed Brown ierr = PetscOptionsBool("-pc_bddc_switch_preconditioning_type","Switch between M_2 (default) and M_3 preconditioners (as defined by Dohrmann)","none",pcbddc->prec_type,&pcbddc->prec_type,PETSC_NULL);CHKERRQ(ierr); 52534831adSStefano Zampini ierr = PetscOptionsBool("-pc_bddc_use_change_of_basis","Use change of basis approach for primal space","none",pcbddc->usechangeofbasis,&pcbddc->usechangeofbasis,PETSC_NULL);CHKERRQ(ierr); 53534831adSStefano Zampini ierr = PetscOptionsBool("-pc_bddc_use_change_on_faces","Use change of basis approach for face constraints","none",pcbddc->usechangeonfaces,&pcbddc->usechangeonfaces,PETSC_NULL);CHKERRQ(ierr); 54534831adSStefano Zampini pcbddc->usechangeonfaces = pcbddc->usechangeonfaces && pcbddc->usechangeofbasis; 550c7d97c5SJed Brown ierr = PetscOptionsInt("-pc_bddc_coarsening_ratio","Set coarsening ratio used in multilevel coarsening","none",pcbddc->coarsening_ratio,&pcbddc->coarsening_ratio,PETSC_NULL);CHKERRQ(ierr); 560c7d97c5SJed Brown ierr = PetscOptionsTail();CHKERRQ(ierr); 570c7d97c5SJed Brown PetscFunctionReturn(0); 
580c7d97c5SJed Brown } 590c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 600c7d97c5SJed Brown EXTERN_C_BEGIN 610c7d97c5SJed Brown #undef __FUNCT__ 620c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetCoarseProblemType_BDDC" 6353cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetCoarseProblemType_BDDC(PC pc, CoarseProblemType CPT) 640c7d97c5SJed Brown { 650c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 660c7d97c5SJed Brown 670c7d97c5SJed Brown PetscFunctionBegin; 680c7d97c5SJed Brown pcbddc->coarse_problem_type = CPT; 690c7d97c5SJed Brown PetscFunctionReturn(0); 700c7d97c5SJed Brown } 710c7d97c5SJed Brown EXTERN_C_END 720c7d97c5SJed Brown #undef __FUNCT__ 730c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetCoarseProblemType" 7453cdbc3dSStefano Zampini /*@ 759c0446d6SStefano Zampini PCBDDCSetCoarseProblemType - Set coarse problem type in PCBDDC. 7653cdbc3dSStefano Zampini 779c0446d6SStefano Zampini Not collective 7853cdbc3dSStefano Zampini 7953cdbc3dSStefano Zampini Input Parameters: 8053cdbc3dSStefano Zampini + pc - the preconditioning context 8153cdbc3dSStefano Zampini - CoarseProblemType - pick a better name and explain what this is 8253cdbc3dSStefano Zampini 8353cdbc3dSStefano Zampini Level: intermediate 8453cdbc3dSStefano Zampini 8553cdbc3dSStefano Zampini Notes: 86da1bb401SStefano Zampini Not collective but all procs must call with same arguments. 
8753cdbc3dSStefano Zampini 8853cdbc3dSStefano Zampini .seealso: PCBDDC 8953cdbc3dSStefano Zampini @*/ 900c7d97c5SJed Brown PetscErrorCode PCBDDCSetCoarseProblemType(PC pc, CoarseProblemType CPT) 910c7d97c5SJed Brown { 920c7d97c5SJed Brown PetscErrorCode ierr; 930c7d97c5SJed Brown 940c7d97c5SJed Brown PetscFunctionBegin; 950c7d97c5SJed Brown PetscValidHeaderSpecific(pc,PC_CLASSID,1); 960c7d97c5SJed Brown ierr = PetscTryMethod(pc,"PCBDDCSetCoarseProblemType_C",(PC,CoarseProblemType),(pc,CPT));CHKERRQ(ierr); 970c7d97c5SJed Brown PetscFunctionReturn(0); 980c7d97c5SJed Brown } 990c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 1000c7d97c5SJed Brown EXTERN_C_BEGIN 1010c7d97c5SJed Brown #undef __FUNCT__ 1023b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCSetDirichletBoundaries_BDDC" 1033b03a366Sstefano_zampini static PetscErrorCode PCBDDCSetDirichletBoundaries_BDDC(PC pc,IS DirichletBoundaries) 1043b03a366Sstefano_zampini { 1053b03a366Sstefano_zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 1063b03a366Sstefano_zampini PetscErrorCode ierr; 1073b03a366Sstefano_zampini 1083b03a366Sstefano_zampini PetscFunctionBegin; 1093b03a366Sstefano_zampini ierr = ISDestroy(&pcbddc->DirichletBoundaries);CHKERRQ(ierr); 11036e030ebSStefano Zampini ierr = PetscObjectReference((PetscObject)DirichletBoundaries);CHKERRQ(ierr); 11136e030ebSStefano Zampini pcbddc->DirichletBoundaries=DirichletBoundaries; 1123b03a366Sstefano_zampini PetscFunctionReturn(0); 1133b03a366Sstefano_zampini } 1143b03a366Sstefano_zampini EXTERN_C_END 1153b03a366Sstefano_zampini #undef __FUNCT__ 1163b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCSetDirichletBoundaries" 1173b03a366Sstefano_zampini /*@ 118da1bb401SStefano Zampini PCBDDCSetDirichletBoundaries - Set index set defining subdomain part (in local ordering) 119da1bb401SStefano Zampini of Dirichlet boundaries for the global problem. 
1203b03a366Sstefano_zampini 1213b03a366Sstefano_zampini Not collective 1223b03a366Sstefano_zampini 1233b03a366Sstefano_zampini Input Parameters: 1243b03a366Sstefano_zampini + pc - the preconditioning context 1253b03a366Sstefano_zampini - DirichletBoundaries - sequential index set defining the subdomain part of Dirichlet boundaries (can be PETSC_NULL) 1263b03a366Sstefano_zampini 1273b03a366Sstefano_zampini Level: intermediate 1283b03a366Sstefano_zampini 1293b03a366Sstefano_zampini Notes: 1303b03a366Sstefano_zampini 1313b03a366Sstefano_zampini .seealso: PCBDDC 1323b03a366Sstefano_zampini @*/ 1333b03a366Sstefano_zampini PetscErrorCode PCBDDCSetDirichletBoundaries(PC pc,IS DirichletBoundaries) 1343b03a366Sstefano_zampini { 1353b03a366Sstefano_zampini PetscErrorCode ierr; 1363b03a366Sstefano_zampini 1373b03a366Sstefano_zampini PetscFunctionBegin; 1383b03a366Sstefano_zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 1393b03a366Sstefano_zampini ierr = PetscTryMethod(pc,"PCBDDCSetDirichletBoundaries_C",(PC,IS),(pc,DirichletBoundaries));CHKERRQ(ierr); 1403b03a366Sstefano_zampini PetscFunctionReturn(0); 1413b03a366Sstefano_zampini } 1423b03a366Sstefano_zampini /* -------------------------------------------------------------------------- */ 1433b03a366Sstefano_zampini EXTERN_C_BEGIN 1443b03a366Sstefano_zampini #undef __FUNCT__ 1450c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetNeumannBoundaries_BDDC" 14653cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetNeumannBoundaries_BDDC(PC pc,IS NeumannBoundaries) 1470c7d97c5SJed Brown { 1480c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 14953cdbc3dSStefano Zampini PetscErrorCode ierr; 1500c7d97c5SJed Brown 1510c7d97c5SJed Brown PetscFunctionBegin; 15253cdbc3dSStefano Zampini ierr = ISDestroy(&pcbddc->NeumannBoundaries);CHKERRQ(ierr); 15336e030ebSStefano Zampini ierr = PetscObjectReference((PetscObject)NeumannBoundaries);CHKERRQ(ierr); 15436e030ebSStefano Zampini pcbddc->NeumannBoundaries=NeumannBoundaries; 1550c7d97c5SJed 
Brown PetscFunctionReturn(0); 1560c7d97c5SJed Brown } 1570c7d97c5SJed Brown EXTERN_C_END 1580c7d97c5SJed Brown #undef __FUNCT__ 1590c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetNeumannBoundaries" 16057527edcSJed Brown /*@ 161da1bb401SStefano Zampini PCBDDCSetNeumannBoundaries - Set index set defining subdomain part (in local ordering) 162da1bb401SStefano Zampini of Neumann boundaries for the global problem. 16357527edcSJed Brown 1649c0446d6SStefano Zampini Not collective 16557527edcSJed Brown 16657527edcSJed Brown Input Parameters: 16757527edcSJed Brown + pc - the preconditioning context 1689c0446d6SStefano Zampini - NeumannBoundaries - sequential index set defining the subdomain part of Neumann boundaries (can be PETSC_NULL) 16957527edcSJed Brown 17057527edcSJed Brown Level: intermediate 17157527edcSJed Brown 17257527edcSJed Brown Notes: 17357527edcSJed Brown 17457527edcSJed Brown .seealso: PCBDDC 17557527edcSJed Brown @*/ 17653cdbc3dSStefano Zampini PetscErrorCode PCBDDCSetNeumannBoundaries(PC pc,IS NeumannBoundaries) 1770c7d97c5SJed Brown { 1780c7d97c5SJed Brown PetscErrorCode ierr; 1790c7d97c5SJed Brown 1800c7d97c5SJed Brown PetscFunctionBegin; 1810c7d97c5SJed Brown PetscValidHeaderSpecific(pc,PC_CLASSID,1); 18253cdbc3dSStefano Zampini ierr = PetscTryMethod(pc,"PCBDDCSetNeumannBoundaries_C",(PC,IS),(pc,NeumannBoundaries));CHKERRQ(ierr); 18353cdbc3dSStefano Zampini PetscFunctionReturn(0); 18453cdbc3dSStefano Zampini } 18553cdbc3dSStefano Zampini /* -------------------------------------------------------------------------- */ 18653cdbc3dSStefano Zampini EXTERN_C_BEGIN 18753cdbc3dSStefano Zampini #undef __FUNCT__ 188da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCGetDirichletBoundaries_BDDC" 189da1bb401SStefano Zampini static PetscErrorCode PCBDDCGetDirichletBoundaries_BDDC(PC pc,IS *DirichletBoundaries) 190da1bb401SStefano Zampini { 191da1bb401SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 192da1bb401SStefano Zampini 193da1bb401SStefano Zampini 
PetscFunctionBegin; 194da1bb401SStefano Zampini *DirichletBoundaries = pcbddc->DirichletBoundaries; 195da1bb401SStefano Zampini PetscFunctionReturn(0); 196da1bb401SStefano Zampini } 197da1bb401SStefano Zampini EXTERN_C_END 198da1bb401SStefano Zampini #undef __FUNCT__ 199da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCGetDirichletBoundaries" 200da1bb401SStefano Zampini /*@ 201da1bb401SStefano Zampini PCBDDCGetDirichletBoundaries - Get index set defining subdomain part (in local ordering) 202da1bb401SStefano Zampini of Dirichlet boundaries for the global problem. 203da1bb401SStefano Zampini 204da1bb401SStefano Zampini Not collective 205da1bb401SStefano Zampini 206da1bb401SStefano Zampini Input Parameters: 207da1bb401SStefano Zampini + pc - the preconditioning context 208da1bb401SStefano Zampini 209da1bb401SStefano Zampini Output Parameters: 210da1bb401SStefano Zampini + DirichletBoundaries - index set defining the subdomain part of Dirichlet boundaries 211da1bb401SStefano Zampini 212da1bb401SStefano Zampini Level: intermediate 213da1bb401SStefano Zampini 214da1bb401SStefano Zampini Notes: 215da1bb401SStefano Zampini 216da1bb401SStefano Zampini .seealso: PCBDDC 217da1bb401SStefano Zampini @*/ 218da1bb401SStefano Zampini PetscErrorCode PCBDDCGetDirichletBoundaries(PC pc,IS *DirichletBoundaries) 219da1bb401SStefano Zampini { 220da1bb401SStefano Zampini PetscErrorCode ierr; 221da1bb401SStefano Zampini 222da1bb401SStefano Zampini PetscFunctionBegin; 223da1bb401SStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 224da1bb401SStefano Zampini ierr = PetscUseMethod(pc,"PCBDDCGetDirichletBoundaries_C",(PC,IS*),(pc,DirichletBoundaries));CHKERRQ(ierr); 225da1bb401SStefano Zampini PetscFunctionReturn(0); 226da1bb401SStefano Zampini } 227da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */ 228da1bb401SStefano Zampini EXTERN_C_BEGIN 229da1bb401SStefano Zampini #undef __FUNCT__ 23053cdbc3dSStefano Zampini #define 
__FUNCT__ "PCBDDCGetNeumannBoundaries_BDDC" 23153cdbc3dSStefano Zampini static PetscErrorCode PCBDDCGetNeumannBoundaries_BDDC(PC pc,IS *NeumannBoundaries) 23253cdbc3dSStefano Zampini { 23353cdbc3dSStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 23453cdbc3dSStefano Zampini 23553cdbc3dSStefano Zampini PetscFunctionBegin; 23653cdbc3dSStefano Zampini *NeumannBoundaries = pcbddc->NeumannBoundaries; 23753cdbc3dSStefano Zampini PetscFunctionReturn(0); 23853cdbc3dSStefano Zampini } 23953cdbc3dSStefano Zampini EXTERN_C_END 24053cdbc3dSStefano Zampini #undef __FUNCT__ 24153cdbc3dSStefano Zampini #define __FUNCT__ "PCBDDCGetNeumannBoundaries" 24253cdbc3dSStefano Zampini /*@ 243da1bb401SStefano Zampini PCBDDCGetNeumannBoundaries - Get index set defining subdomain part (in local ordering) 244da1bb401SStefano Zampini of Neumann boundaries for the global problem. 24553cdbc3dSStefano Zampini 2469c0446d6SStefano Zampini Not collective 24753cdbc3dSStefano Zampini 24853cdbc3dSStefano Zampini Input Parameters: 24953cdbc3dSStefano Zampini + pc - the preconditioning context 25053cdbc3dSStefano Zampini 25153cdbc3dSStefano Zampini Output Parameters: 25253cdbc3dSStefano Zampini + NeumannBoundaries - index set defining the subdomain part of Neumann boundaries 25353cdbc3dSStefano Zampini 25453cdbc3dSStefano Zampini Level: intermediate 25553cdbc3dSStefano Zampini 25653cdbc3dSStefano Zampini Notes: 25753cdbc3dSStefano Zampini 25853cdbc3dSStefano Zampini .seealso: PCBDDC 25953cdbc3dSStefano Zampini @*/ 26053cdbc3dSStefano Zampini PetscErrorCode PCBDDCGetNeumannBoundaries(PC pc,IS *NeumannBoundaries) 26153cdbc3dSStefano Zampini { 26253cdbc3dSStefano Zampini PetscErrorCode ierr; 26353cdbc3dSStefano Zampini 26453cdbc3dSStefano Zampini PetscFunctionBegin; 26553cdbc3dSStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 26653cdbc3dSStefano Zampini ierr = PetscUseMethod(pc,"PCBDDCGetNeumannBoundaries_C",(PC,IS*),(pc,NeumannBoundaries));CHKERRQ(ierr); 2670c7d97c5SJed Brown 
PetscFunctionReturn(0); 2680c7d97c5SJed Brown } 26936e030ebSStefano Zampini /* -------------------------------------------------------------------------- */ 27036e030ebSStefano Zampini EXTERN_C_BEGIN 27136e030ebSStefano Zampini #undef __FUNCT__ 272da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetLocalAdjacencyGraph_BDDC" 273da1bb401SStefano Zampini static PetscErrorCode PCBDDCSetLocalAdjacencyGraph_BDDC(PC pc, PetscInt nvtxs, PetscInt xadj[], PetscInt adjncy[], PetscCopyMode copymode) 27436e030ebSStefano Zampini { 27536e030ebSStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 276da1bb401SStefano Zampini PCBDDCGraph mat_graph=pcbddc->mat_graph; 277da1bb401SStefano Zampini PetscErrorCode ierr; 27836e030ebSStefano Zampini 27936e030ebSStefano Zampini PetscFunctionBegin; 280da1bb401SStefano Zampini mat_graph->nvtxs=nvtxs; 281da1bb401SStefano Zampini ierr = PetscFree(mat_graph->xadj);CHKERRQ(ierr); 282da1bb401SStefano Zampini ierr = PetscFree(mat_graph->adjncy);CHKERRQ(ierr); 283da1bb401SStefano Zampini if(copymode == PETSC_COPY_VALUES) { 284da1bb401SStefano Zampini ierr = PetscMalloc((mat_graph->nvtxs+1)*sizeof(PetscInt),&mat_graph->xadj);CHKERRQ(ierr); 285da1bb401SStefano Zampini ierr = PetscMalloc(xadj[mat_graph->nvtxs]*sizeof(PetscInt),&mat_graph->adjncy);CHKERRQ(ierr); 286da1bb401SStefano Zampini ierr = PetscMemcpy(mat_graph->xadj,xadj,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr); 287da1bb401SStefano Zampini ierr = PetscMemcpy(mat_graph->adjncy,adjncy,xadj[mat_graph->nvtxs]*sizeof(PetscInt));CHKERRQ(ierr); 288da1bb401SStefano Zampini } else if(copymode == PETSC_OWN_POINTER) { 289da1bb401SStefano Zampini mat_graph->xadj=xadj; 290da1bb401SStefano Zampini mat_graph->adjncy=adjncy; 291da1bb401SStefano Zampini } else { 292da1bb401SStefano Zampini SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_SUP,"Unsupported copy mode %d in %s\n",copymode,__FUNCT__); 293da1bb401SStefano Zampini } 29436e030ebSStefano Zampini PetscFunctionReturn(0); 29536e030ebSStefano Zampini } 
29636e030ebSStefano Zampini EXTERN_C_END 29736e030ebSStefano Zampini #undef __FUNCT__ 298da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetLocalAdjacencyGraph" 29936e030ebSStefano Zampini /*@ 300da1bb401SStefano Zampini PCBDDCSetLocalAdjacencyGraph - Set CSR graph of local matrix for use of PCBDDC. 30136e030ebSStefano Zampini 30236e030ebSStefano Zampini Not collective 30336e030ebSStefano Zampini 30436e030ebSStefano Zampini Input Parameters: 30536e030ebSStefano Zampini + pc - the preconditioning context 306da1bb401SStefano Zampini - nvtxs - number of local vertices of the graph 307da1bb401SStefano Zampini - xadj, adjncy - the CSR graph 308da1bb401SStefano Zampini - copymode - either PETSC_COPY_VALUES or PETSC_OWN_POINTER. In the former case the user must free the array passed in; 309da1bb401SStefano Zampini in the latter case, memory must be obtained with PetscMalloc. 31036e030ebSStefano Zampini 31136e030ebSStefano Zampini Level: intermediate 31236e030ebSStefano Zampini 31336e030ebSStefano Zampini Notes: 31436e030ebSStefano Zampini 31536e030ebSStefano Zampini .seealso: PCBDDC 31636e030ebSStefano Zampini @*/ 317da1bb401SStefano Zampini PetscErrorCode PCBDDCSetLocalAdjacencyGraph(PC pc,PetscInt nvtxs,PetscInt xadj[],PetscInt adjncy[], PetscCopyMode copymode) 31836e030ebSStefano Zampini { 319da1bb401SStefano Zampini PetscInt nrows,ncols; 320da1bb401SStefano Zampini Mat_IS *matis = (Mat_IS*)pc->pmat->data; 32136e030ebSStefano Zampini PetscErrorCode ierr; 32236e030ebSStefano Zampini 32336e030ebSStefano Zampini PetscFunctionBegin; 32436e030ebSStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 325da1bb401SStefano Zampini ierr = MatGetSize(matis->A,&nrows,&ncols);CHKERRQ(ierr); 326da1bb401SStefano Zampini if(nvtxs != nrows) { 327da1bb401SStefano Zampini SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Local adjacency size %d passed in %s differs from local problem size %d!\n",nvtxs,__FUNCT__,nrows); 328da1bb401SStefano Zampini } else { 329da1bb401SStefano Zampini ierr 
= PetscTryMethod(pc,"PCBDDCSetLocalAdjacencyGraph_C",(PC,PetscInt,PetscInt[],PetscInt[],PetscCopyMode),(pc,nvtxs,xadj,adjncy,copymode));CHKERRQ(ierr); 330da1bb401SStefano Zampini } 33136e030ebSStefano Zampini PetscFunctionReturn(0); 33236e030ebSStefano Zampini } 3339c0446d6SStefano Zampini /* -------------------------------------------------------------------------- */ 3349c0446d6SStefano Zampini EXTERN_C_BEGIN 3359c0446d6SStefano Zampini #undef __FUNCT__ 3369c0446d6SStefano Zampini #define __FUNCT__ "PCBDDCSetDofsSplitting_BDDC" 3379c0446d6SStefano Zampini static PetscErrorCode PCBDDCSetDofsSplitting_BDDC(PC pc,PetscInt n_is, IS ISForDofs[]) 3389c0446d6SStefano Zampini { 3399c0446d6SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 3409c0446d6SStefano Zampini PetscInt i; 3419c0446d6SStefano Zampini PetscErrorCode ierr; 3429c0446d6SStefano Zampini 3439c0446d6SStefano Zampini PetscFunctionBegin; 344da1bb401SStefano Zampini /* Destroy ISes if they were already set */ 3459c0446d6SStefano Zampini for(i=0;i<pcbddc->n_ISForDofs;i++) { 3469c0446d6SStefano Zampini ierr = ISDestroy(&pcbddc->ISForDofs[i]);CHKERRQ(ierr); 3479c0446d6SStefano Zampini } 348d11ae9bbSstefano_zampini ierr = PetscFree(pcbddc->ISForDofs);CHKERRQ(ierr); 349da1bb401SStefano Zampini /* allocate space then set */ 3509c0446d6SStefano Zampini ierr = PetscMalloc(n_is*sizeof(IS),&pcbddc->ISForDofs);CHKERRQ(ierr); 3519c0446d6SStefano Zampini for(i=0;i<n_is;i++) { 352da1bb401SStefano Zampini ierr = PetscObjectReference((PetscObject)ISForDofs[i]);CHKERRQ(ierr); 353da1bb401SStefano Zampini pcbddc->ISForDofs[i]=ISForDofs[i]; 3549c0446d6SStefano Zampini } 3559c0446d6SStefano Zampini pcbddc->n_ISForDofs=n_is; 3569c0446d6SStefano Zampini PetscFunctionReturn(0); 3579c0446d6SStefano Zampini } 3589c0446d6SStefano Zampini EXTERN_C_END 3599c0446d6SStefano Zampini #undef __FUNCT__ 3609c0446d6SStefano Zampini #define __FUNCT__ "PCBDDCSetDofsSplitting" 3619c0446d6SStefano Zampini /*@ 362da1bb401SStefano Zampini 
PCBDDCSetDofsSplitting - Set index sets defining fields of local mat. 3639c0446d6SStefano Zampini 3649c0446d6SStefano Zampini Not collective 3659c0446d6SStefano Zampini 3669c0446d6SStefano Zampini Input Parameters: 3679c0446d6SStefano Zampini + pc - the preconditioning context 368da1bb401SStefano Zampini - n - number of index sets defining the fields 369da1bb401SStefano Zampini - IS[] - array of IS describing the fields 3709c0446d6SStefano Zampini 3719c0446d6SStefano Zampini Level: intermediate 3729c0446d6SStefano Zampini 3739c0446d6SStefano Zampini Notes: 3749c0446d6SStefano Zampini 3759c0446d6SStefano Zampini .seealso: PCBDDC 3769c0446d6SStefano Zampini @*/ 3779c0446d6SStefano Zampini PetscErrorCode PCBDDCSetDofsSplitting(PC pc,PetscInt n_is, IS ISForDofs[]) 3789c0446d6SStefano Zampini { 3799c0446d6SStefano Zampini PetscErrorCode ierr; 3809c0446d6SStefano Zampini 3819c0446d6SStefano Zampini PetscFunctionBegin; 3829c0446d6SStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 3839c0446d6SStefano Zampini ierr = PetscTryMethod(pc,"PCBDDCSetDofsSplitting_C",(PC,PetscInt,IS[]),(pc,n_is,ISForDofs));CHKERRQ(ierr); 3849c0446d6SStefano Zampini PetscFunctionReturn(0); 3859c0446d6SStefano Zampini } 386da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */ 387534831adSStefano Zampini #undef __FUNCT__ 388534831adSStefano Zampini #define __FUNCT__ "PCPreSolve_BDDC" 389534831adSStefano Zampini /* -------------------------------------------------------------------------- */ 390534831adSStefano Zampini /* 391534831adSStefano Zampini PCPreSolve_BDDC - Changes the right hand side and (if necessary) the initial 392534831adSStefano Zampini guess if a transformation of basis approach has been selected. 
3939c0446d6SStefano Zampini 394534831adSStefano Zampini Input Parameter: 395534831adSStefano Zampini + pc - the preconditioner contex 396534831adSStefano Zampini 397534831adSStefano Zampini Application Interface Routine: PCPreSolve() 398534831adSStefano Zampini 399534831adSStefano Zampini Notes: 400534831adSStefano Zampini The interface routine PCPreSolve() is not usually called directly by 401534831adSStefano Zampini the user, but instead is called by KSPSolve(). 402534831adSStefano Zampini */ 403534831adSStefano Zampini static PetscErrorCode PCPreSolve_BDDC(PC pc, KSP ksp, Vec rhs, Vec x) 404534831adSStefano Zampini { 405534831adSStefano Zampini PetscErrorCode ierr; 406534831adSStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 407534831adSStefano Zampini PC_IS *pcis = (PC_IS*)(pc->data); 408534831adSStefano Zampini Mat_IS *matis = (Mat_IS*)pc->pmat->data; 409534831adSStefano Zampini Mat temp_mat; 4103972b0daSStefano Zampini IS dirIS; 4113972b0daSStefano Zampini PetscInt dirsize,i,*is_indices; 4123972b0daSStefano Zampini PetscScalar *array_x,*array_diagonal; 4133972b0daSStefano Zampini Vec used_vec; 4143972b0daSStefano Zampini PetscBool guess_nonzero; 415534831adSStefano Zampini 416534831adSStefano Zampini PetscFunctionBegin; 4173972b0daSStefano Zampini if(x) { 4183972b0daSStefano Zampini ierr = PetscObjectReference((PetscObject)x);CHKERRQ(ierr); 4193972b0daSStefano Zampini used_vec = x; 4203972b0daSStefano Zampini } else { 4213972b0daSStefano Zampini ierr = PetscObjectReference((PetscObject)pcbddc->temp_solution);CHKERRQ(ierr); 4223972b0daSStefano Zampini used_vec = pcbddc->temp_solution; 4233972b0daSStefano Zampini ierr = VecSet(used_vec,0.0);CHKERRQ(ierr); 4243972b0daSStefano Zampini } 4253972b0daSStefano Zampini /* hack into ksp data structure PCPreSolve comes earlier in src/ksp/ksp/interface/itfunc.c */ 4263972b0daSStefano Zampini if (ksp) { 4273972b0daSStefano Zampini ierr = KSPGetInitialGuessNonzero(ksp,&guess_nonzero);CHKERRQ(ierr); 4283972b0daSStefano 
Zampini if( !guess_nonzero ) { 4293972b0daSStefano Zampini ierr = VecSet(used_vec,0.0);CHKERRQ(ierr); 4303972b0daSStefano Zampini } 4313972b0daSStefano Zampini } 4323972b0daSStefano Zampini /* store the original rhs */ 4333972b0daSStefano Zampini ierr = VecCopy(rhs,pcbddc->original_rhs);CHKERRQ(ierr); 434534831adSStefano Zampini if(pcbddc->usechangeofbasis) { 435534831adSStefano Zampini /* swap pointers for local matrices */ 436534831adSStefano Zampini temp_mat = matis->A; 437534831adSStefano Zampini matis->A = pcbddc->local_mat; 438534831adSStefano Zampini pcbddc->local_mat = temp_mat; 439534831adSStefano Zampini /* Get local rhs and apply transformation of basis */ 440534831adSStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,rhs,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 441534831adSStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,rhs,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 442534831adSStefano Zampini /* from original basis to modified basis */ 443534831adSStefano Zampini ierr = MatMultTranspose(pcbddc->ChangeOfBasisMatrix,pcis->vec1_B,pcis->vec2_B);CHKERRQ(ierr); 444534831adSStefano Zampini /* put back modified values into the global vec using INSERT_VALUES copy mode */ 445534831adSStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,pcis->vec2_B,rhs,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 446534831adSStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,pcis->vec2_B,rhs,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 447534831adSStefano Zampini } 4483972b0daSStefano Zampini 4493972b0daSStefano Zampini /* Take into account zeroed rows -> change rhs and store solution removed */ 4503972b0daSStefano Zampini ierr = MatGetDiagonal(pc->pmat,pcis->vec1_global);CHKERRQ(ierr); 4513972b0daSStefano Zampini ierr = VecPointwiseDivide(pcis->vec1_global,rhs,pcis->vec1_global);CHKERRQ(ierr); 4523972b0daSStefano Zampini ierr = 
VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 4533972b0daSStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 4543972b0daSStefano Zampini ierr = VecScatterBegin(matis->ctx,used_vec,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 4553972b0daSStefano Zampini ierr = VecScatterEnd (matis->ctx,used_vec,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 4563972b0daSStefano Zampini ierr = PCBDDCGetDirichletBoundaries(pc,&dirIS);CHKERRQ(ierr); 4573972b0daSStefano Zampini if(dirIS) { 4583972b0daSStefano Zampini ierr = ISGetSize(dirIS,&dirsize);CHKERRQ(ierr); 4593972b0daSStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array_x);CHKERRQ(ierr); 4603972b0daSStefano Zampini ierr = VecGetArray(pcis->vec2_N,&array_diagonal);CHKERRQ(ierr); 4613972b0daSStefano Zampini ierr = ISGetIndices(dirIS,(const PetscInt**)&is_indices);CHKERRQ(ierr); 4623972b0daSStefano Zampini for(i=0;i<dirsize;i++) { 4633972b0daSStefano Zampini array_x[is_indices[i]]=array_diagonal[is_indices[i]]; 4643972b0daSStefano Zampini } 4653972b0daSStefano Zampini ierr = ISRestoreIndices(dirIS,(const PetscInt**)&is_indices);CHKERRQ(ierr); 4663972b0daSStefano Zampini ierr = VecRestoreArray(pcis->vec2_N,&array_diagonal);CHKERRQ(ierr); 4673972b0daSStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array_x);CHKERRQ(ierr); 4683972b0daSStefano Zampini } 4693972b0daSStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 4703972b0daSStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 4713972b0daSStefano Zampini /* remove the computed solution from the rhs */ 4723972b0daSStefano Zampini ierr = VecScale(used_vec,-1.0);CHKERRQ(ierr); 4733972b0daSStefano Zampini ierr = MatMultAdd(pc->pmat,used_vec,rhs,rhs);CHKERRQ(ierr); 4743972b0daSStefano Zampini ierr = 
VecScale(used_vec,-1.0);CHKERRQ(ierr); 4753972b0daSStefano Zampini if(x) { 4763972b0daSStefano Zampini /* store partially computed solution and set initial guess to 0 */ 4773972b0daSStefano Zampini ierr = VecCopy(used_vec,pcbddc->temp_solution);CHKERRQ(ierr); 4783972b0daSStefano Zampini ierr = VecSet(used_vec,0.0);CHKERRQ(ierr); 4793972b0daSStefano Zampini } 4803972b0daSStefano Zampini ierr = VecDestroy(&used_vec);CHKERRQ(ierr); 481534831adSStefano Zampini PetscFunctionReturn(0); 482534831adSStefano Zampini } 483534831adSStefano Zampini /* -------------------------------------------------------------------------- */ 484534831adSStefano Zampini #undef __FUNCT__ 485534831adSStefano Zampini #define __FUNCT__ "PCPostSolve_BDDC" 486534831adSStefano Zampini /* -------------------------------------------------------------------------- */ 487534831adSStefano Zampini /* 488534831adSStefano Zampini PCPostSolve_BDDC - Changes the computed solution if a transformation of basis 489534831adSStefano Zampini approach has been selected. Also, restores rhs to its original state. 490534831adSStefano Zampini 491534831adSStefano Zampini Input Parameter: 492534831adSStefano Zampini + pc - the preconditioner contex 493534831adSStefano Zampini 494534831adSStefano Zampini Application Interface Routine: PCPostSolve() 495534831adSStefano Zampini 496534831adSStefano Zampini Notes: 497534831adSStefano Zampini The interface routine PCPostSolve() is not usually called directly by 498534831adSStefano Zampini the user, but instead is called by KSPSolve(). 
499534831adSStefano Zampini */ 500534831adSStefano Zampini static PetscErrorCode PCPostSolve_BDDC(PC pc, KSP ksp, Vec rhs, Vec x) 501534831adSStefano Zampini { 502534831adSStefano Zampini PetscErrorCode ierr; 503534831adSStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 504534831adSStefano Zampini PC_IS *pcis = (PC_IS*)(pc->data); 505534831adSStefano Zampini Mat_IS *matis = (Mat_IS*)pc->pmat->data; 506534831adSStefano Zampini Mat temp_mat; 507534831adSStefano Zampini 508534831adSStefano Zampini PetscFunctionBegin; 509534831adSStefano Zampini if(pcbddc->usechangeofbasis) { 510534831adSStefano Zampini /* swap pointers for local matrices */ 511534831adSStefano Zampini temp_mat = matis->A; 512534831adSStefano Zampini matis->A = pcbddc->local_mat; 513534831adSStefano Zampini pcbddc->local_mat = temp_mat; 514534831adSStefano Zampini /* restore rhs to its original state */ 5153425bc38SStefano Zampini if(rhs) { 5163425bc38SStefano Zampini ierr = VecCopy(pcbddc->original_rhs,rhs);CHKERRQ(ierr); 5173425bc38SStefano Zampini } 518534831adSStefano Zampini /* Get Local boundary and apply transformation of basis to solution vector */ 519534831adSStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,x,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 520534831adSStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,x,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 521534831adSStefano Zampini /* from modified basis to original basis */ 522534831adSStefano Zampini ierr = MatMult(pcbddc->ChangeOfBasisMatrix,pcis->vec1_B,pcis->vec2_B);CHKERRQ(ierr); 523534831adSStefano Zampini /* put back modified values into the global vec using INSERT_VALUES copy mode */ 524534831adSStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,pcis->vec2_B,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 525534831adSStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,pcis->vec2_B,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 526534831adSStefano Zampini } 
5273972b0daSStefano Zampini /* add solution removed in presolve */ 5283425bc38SStefano Zampini if(x) { 5293425bc38SStefano Zampini ierr = VecAXPY(x,1.0,pcbddc->temp_solution);CHKERRQ(ierr); 5303425bc38SStefano Zampini } 531534831adSStefano Zampini PetscFunctionReturn(0); 532534831adSStefano Zampini } 533534831adSStefano Zampini /* -------------------------------------------------------------------------- */ 53453cdbc3dSStefano Zampini #undef __FUNCT__ 53553cdbc3dSStefano Zampini #define __FUNCT__ "PCSetUp_BDDC" 5360c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 5370c7d97c5SJed Brown /* 5380c7d97c5SJed Brown PCSetUp_BDDC - Prepares for the use of the BDDC preconditioner 5390c7d97c5SJed Brown by setting data structures and options. 5400c7d97c5SJed Brown 5410c7d97c5SJed Brown Input Parameter: 54253cdbc3dSStefano Zampini + pc - the preconditioner context 5430c7d97c5SJed Brown 5440c7d97c5SJed Brown Application Interface Routine: PCSetUp() 5450c7d97c5SJed Brown 5460c7d97c5SJed Brown Notes: 5470c7d97c5SJed Brown The interface routine PCSetUp() is not usually called directly by 5480c7d97c5SJed Brown the user, but instead is called by PCApply() if necessary. 
5490c7d97c5SJed Brown */ 55053cdbc3dSStefano Zampini PetscErrorCode PCSetUp_BDDC(PC pc) 5510c7d97c5SJed Brown { 5520c7d97c5SJed Brown PetscErrorCode ierr; 5530c7d97c5SJed Brown PC_BDDC* pcbddc = (PC_BDDC*)pc->data; 5540c7d97c5SJed Brown PC_IS *pcis = (PC_IS*)(pc->data); 5550c7d97c5SJed Brown 5560c7d97c5SJed Brown PetscFunctionBegin; 5570c7d97c5SJed Brown if (!pc->setupcalled) { 5583b03a366Sstefano_zampini /* For BDDC we need to define a local "Neumann" problem different to that defined in PCISSetup 5599c0446d6SStefano Zampini So, we set to pcnone the Neumann problem of pcis in order to avoid unneeded computation 5600c7d97c5SJed Brown Also, we decide to directly build the (same) Dirichlet problem */ 5610c7d97c5SJed Brown ierr = PetscOptionsSetValue("-is_localN_pc_type","none");CHKERRQ(ierr); 5620c7d97c5SJed Brown ierr = PetscOptionsSetValue("-is_localD_pc_type","none");CHKERRQ(ierr); 5630c7d97c5SJed Brown /* Set up all the "iterative substructuring" common block */ 5640c7d97c5SJed Brown ierr = PCISSetUp(pc);CHKERRQ(ierr); 5653b03a366Sstefano_zampini /* Get stdout for dbg */ 566e269702eSStefano Zampini if(pcbddc->dbg_flag) { 567e269702eSStefano Zampini ierr = PetscViewerASCIIGetStdout(((PetscObject)pc)->comm,&pcbddc->dbg_viewer);CHKERRQ(ierr); 568e269702eSStefano Zampini ierr = PetscViewerASCIISynchronizedAllow(pcbddc->dbg_viewer,PETSC_TRUE);CHKERRQ(ierr); 569e269702eSStefano Zampini } 5703b03a366Sstefano_zampini /* TODO MOVE CODE FRAGMENT */ 5710c7d97c5SJed Brown PetscInt im_active=0; 5720c7d97c5SJed Brown if(pcis->n) im_active = 1; 57353cdbc3dSStefano Zampini ierr = MPI_Allreduce(&im_active,&pcbddc->active_procs,1,MPIU_INT,MPI_SUM,((PetscObject)pc)->comm);CHKERRQ(ierr); 5743b03a366Sstefano_zampini /* Analyze local interface */ 5750c7d97c5SJed Brown ierr = PCBDDCManageLocalBoundaries(pc);CHKERRQ(ierr); 5763b03a366Sstefano_zampini /* Set up local constraint matrix */ 5773b03a366Sstefano_zampini ierr = PCBDDCCreateConstraintMatrix(pc);CHKERRQ(ierr); 5780c7d97c5SJed 
Brown /* Create coarse and local stuffs used for evaluating action of preconditioner */ 5790c7d97c5SJed Brown ierr = PCBDDCCoarseSetUp(pc);CHKERRQ(ierr); 5803b03a366Sstefano_zampini /* Processes fakely involved in multilevel should not call ISLocalToGlobalMappingRestoreInfo */ 5813b03a366Sstefano_zampini if ( !pcis->n_neigh ) pcis->ISLocalToGlobalMappingGetInfoWasCalled=PETSC_FALSE; 5820c7d97c5SJed Brown } 5830c7d97c5SJed Brown PetscFunctionReturn(0); 5840c7d97c5SJed Brown } 5850c7d97c5SJed Brown 5860c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 5870c7d97c5SJed Brown /* 5880c7d97c5SJed Brown PCApply_BDDC - Applies the BDDC preconditioner to a vector. 5890c7d97c5SJed Brown 5900c7d97c5SJed Brown Input Parameters: 5910c7d97c5SJed Brown . pc - the preconditioner context 5920c7d97c5SJed Brown . r - input vector (global) 5930c7d97c5SJed Brown 5940c7d97c5SJed Brown Output Parameter: 5950c7d97c5SJed Brown . z - output vector (global) 5960c7d97c5SJed Brown 5970c7d97c5SJed Brown Application Interface Routine: PCApply() 5980c7d97c5SJed Brown */ 5990c7d97c5SJed Brown #undef __FUNCT__ 6000c7d97c5SJed Brown #define __FUNCT__ "PCApply_BDDC" 60153cdbc3dSStefano Zampini PetscErrorCode PCApply_BDDC(PC pc,Vec r,Vec z) 6020c7d97c5SJed Brown { 6030c7d97c5SJed Brown PC_IS *pcis = (PC_IS*)(pc->data); 6040c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)(pc->data); 6050c7d97c5SJed Brown PetscErrorCode ierr; 6063b03a366Sstefano_zampini const PetscScalar one = 1.0; 6073b03a366Sstefano_zampini const PetscScalar m_one = -1.0; 6082617d88aSStefano Zampini const PetscScalar zero = 0.0; 6090c7d97c5SJed Brown 6100c7d97c5SJed Brown /* This code is similar to that provided in nn.c for PCNN 6110c7d97c5SJed Brown NN interface preconditioner changed to BDDC 6120c7d97c5SJed Brown Added support for M_3 preconditioenr in the reference article (code is active if pcbddc->prec_type = PETSC_TRUE) */ 6130c7d97c5SJed Brown 6140c7d97c5SJed Brown 
PetscFunctionBegin; 6150c7d97c5SJed Brown /* First Dirichlet solve */ 6160c7d97c5SJed Brown ierr = VecScatterBegin(pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 6170c7d97c5SJed Brown ierr = VecScatterEnd (pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 61853cdbc3dSStefano Zampini ierr = KSPSolve(pcbddc->ksp_D,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr); 6190c7d97c5SJed Brown /* 6200c7d97c5SJed Brown Assembling right hand side for BDDC operator 6210c7d97c5SJed Brown - vec1_D for the Dirichlet part (if needed, i.e. prec_flag=PETSC_TRUE) 6220c7d97c5SJed Brown - the interface part of the global vector z 6230c7d97c5SJed Brown */ 6240c7d97c5SJed Brown ierr = VecScale(pcis->vec2_D,m_one);CHKERRQ(ierr); 6250c7d97c5SJed Brown ierr = MatMult(pcis->A_BI,pcis->vec2_D,pcis->vec1_B);CHKERRQ(ierr); 6260c7d97c5SJed Brown if(pcbddc->prec_type) { ierr = MatMultAdd(pcis->A_II,pcis->vec2_D,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); } 6270c7d97c5SJed Brown ierr = VecScale(pcis->vec2_D,m_one);CHKERRQ(ierr); 6280c7d97c5SJed Brown ierr = VecCopy(r,z);CHKERRQ(ierr); 6290c7d97c5SJed Brown ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 6300c7d97c5SJed Brown ierr = VecScatterEnd (pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 6310c7d97c5SJed Brown 6322617d88aSStefano Zampini /* Get Local boundary and apply partition of unity */ 6332617d88aSStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 6342617d88aSStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 6352617d88aSStefano Zampini ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr); 6362617d88aSStefano Zampini 6372617d88aSStefano Zampini /* Apply interface preconditioner 6382617d88aSStefano Zampini input/output vecs: pcis->vec1_B and pcis->vec1_D */ 
6392617d88aSStefano Zampini ierr = PCBDDCApplyInterfacePreconditioner(pc);CHKERRQ(ierr); 6402617d88aSStefano Zampini 6412617d88aSStefano Zampini /* Apply partition of unity and sum boundary values */ 6422617d88aSStefano Zampini ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr); 6432617d88aSStefano Zampini ierr = VecSet(z,zero);CHKERRQ(ierr); 6442617d88aSStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 6452617d88aSStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 6460c7d97c5SJed Brown 6473b03a366Sstefano_zampini /* Second Dirichlet solve and assembling of output */ 6480c7d97c5SJed Brown ierr = VecScatterBegin(pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 6490c7d97c5SJed Brown ierr = VecScatterEnd (pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 6500c7d97c5SJed Brown ierr = MatMult(pcis->A_IB,pcis->vec1_B,pcis->vec3_D);CHKERRQ(ierr); 6510c7d97c5SJed Brown if(pcbddc->prec_type) { ierr = MatMultAdd(pcis->A_II,pcis->vec1_D,pcis->vec3_D,pcis->vec3_D);CHKERRQ(ierr); } 65253cdbc3dSStefano Zampini ierr = KSPSolve(pcbddc->ksp_D,pcis->vec3_D,pcbddc->vec4_D);CHKERRQ(ierr); 6530c7d97c5SJed Brown ierr = VecScale(pcbddc->vec4_D,m_one);CHKERRQ(ierr); 6540c7d97c5SJed Brown if(pcbddc->prec_type) { ierr = VecAXPY (pcbddc->vec4_D,one,pcis->vec1_D);CHKERRQ(ierr); } 6550c7d97c5SJed Brown ierr = VecAXPY (pcis->vec2_D,one,pcbddc->vec4_D);CHKERRQ(ierr); 6560c7d97c5SJed Brown ierr = VecScatterBegin(pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 6570c7d97c5SJed Brown ierr = VecScatterEnd (pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 6580c7d97c5SJed Brown PetscFunctionReturn(0); 6590c7d97c5SJed Brown 6600c7d97c5SJed Brown } 661da1bb401SStefano Zampini /* 
-------------------------------------------------------------------------- */ 662da1bb401SStefano Zampini #undef __FUNCT__ 663da1bb401SStefano Zampini #define __FUNCT__ "PCDestroy_BDDC" 664da1bb401SStefano Zampini PetscErrorCode PCDestroy_BDDC(PC pc) 665da1bb401SStefano Zampini { 666da1bb401SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 667da1bb401SStefano Zampini PetscErrorCode ierr; 668da1bb401SStefano Zampini 669da1bb401SStefano Zampini PetscFunctionBegin; 670da1bb401SStefano Zampini /* free data created by PCIS */ 671da1bb401SStefano Zampini ierr = PCISDestroy(pc);CHKERRQ(ierr); 672da1bb401SStefano Zampini /* free BDDC data */ 6733972b0daSStefano Zampini ierr = VecDestroy(&pcbddc->temp_solution);CHKERRQ(ierr); 674534831adSStefano Zampini ierr = VecDestroy(&pcbddc->original_rhs);CHKERRQ(ierr); 675534831adSStefano Zampini ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr); 676534831adSStefano Zampini ierr = MatDestroy(&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr); 677da1bb401SStefano Zampini ierr = VecDestroy(&pcbddc->coarse_vec);CHKERRQ(ierr); 678da1bb401SStefano Zampini ierr = VecDestroy(&pcbddc->coarse_rhs);CHKERRQ(ierr); 679da1bb401SStefano Zampini ierr = KSPDestroy(&pcbddc->coarse_ksp);CHKERRQ(ierr); 680da1bb401SStefano Zampini ierr = MatDestroy(&pcbddc->coarse_mat);CHKERRQ(ierr); 681da1bb401SStefano Zampini ierr = MatDestroy(&pcbddc->coarse_phi_B);CHKERRQ(ierr); 682da1bb401SStefano Zampini ierr = MatDestroy(&pcbddc->coarse_phi_D);CHKERRQ(ierr); 683da1bb401SStefano Zampini ierr = VecDestroy(&pcbddc->vec1_P);CHKERRQ(ierr); 684da1bb401SStefano Zampini ierr = VecDestroy(&pcbddc->vec1_C);CHKERRQ(ierr); 685da1bb401SStefano Zampini ierr = MatDestroy(&pcbddc->local_auxmat1);CHKERRQ(ierr); 686da1bb401SStefano Zampini ierr = MatDestroy(&pcbddc->local_auxmat2);CHKERRQ(ierr); 687da1bb401SStefano Zampini ierr = VecDestroy(&pcbddc->vec1_R);CHKERRQ(ierr); 688da1bb401SStefano Zampini ierr = VecDestroy(&pcbddc->vec2_R);CHKERRQ(ierr); 689da1bb401SStefano Zampini ierr 
= VecDestroy(&pcbddc->vec4_D);CHKERRQ(ierr); 690da1bb401SStefano Zampini ierr = VecScatterDestroy(&pcbddc->R_to_B);CHKERRQ(ierr); 691da1bb401SStefano Zampini ierr = VecScatterDestroy(&pcbddc->R_to_D);CHKERRQ(ierr); 692da1bb401SStefano Zampini ierr = VecScatterDestroy(&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr); 693da1bb401SStefano Zampini ierr = KSPDestroy(&pcbddc->ksp_D);CHKERRQ(ierr); 694da1bb401SStefano Zampini ierr = KSPDestroy(&pcbddc->ksp_R);CHKERRQ(ierr); 695da1bb401SStefano Zampini ierr = ISDestroy(&pcbddc->NeumannBoundaries);CHKERRQ(ierr); 696da1bb401SStefano Zampini ierr = ISDestroy(&pcbddc->DirichletBoundaries);CHKERRQ(ierr); 697da1bb401SStefano Zampini ierr = MatDestroy(&pcbddc->ConstraintMatrix);CHKERRQ(ierr); 698da1bb401SStefano Zampini ierr = PetscFree(pcbddc->local_primal_indices);CHKERRQ(ierr); 699da1bb401SStefano Zampini ierr = PetscFree(pcbddc->replicated_local_primal_indices);CHKERRQ(ierr); 700da1bb401SStefano Zampini if (pcbddc->replicated_local_primal_values) { free(pcbddc->replicated_local_primal_values); } 701da1bb401SStefano Zampini ierr = PetscFree(pcbddc->local_primal_displacements);CHKERRQ(ierr); 702da1bb401SStefano Zampini ierr = PetscFree(pcbddc->local_primal_sizes);CHKERRQ(ierr); 703da1bb401SStefano Zampini PetscInt i; 704da1bb401SStefano Zampini for(i=0;i<pcbddc->n_ISForDofs;i++) { ierr = ISDestroy(&pcbddc->ISForDofs[i]);CHKERRQ(ierr); } 705da1bb401SStefano Zampini ierr = PetscFree(pcbddc->ISForDofs);CHKERRQ(ierr); 706da1bb401SStefano Zampini for(i=0;i<pcbddc->n_ISForFaces;i++) { ierr = ISDestroy(&pcbddc->ISForFaces[i]);CHKERRQ(ierr); } 707da1bb401SStefano Zampini ierr = PetscFree(pcbddc->ISForFaces);CHKERRQ(ierr); 708da1bb401SStefano Zampini for(i=0;i<pcbddc->n_ISForEdges;i++) { ierr = ISDestroy(&pcbddc->ISForEdges[i]);CHKERRQ(ierr); } 709da1bb401SStefano Zampini ierr = PetscFree(pcbddc->ISForEdges);CHKERRQ(ierr); 710da1bb401SStefano Zampini ierr = ISDestroy(&pcbddc->ISForVertices);CHKERRQ(ierr); 7113972b0daSStefano Zampini /* Free 
graph structure */ 712da1bb401SStefano Zampini ierr = PetscFree(pcbddc->mat_graph->xadj);CHKERRQ(ierr); 713da1bb401SStefano Zampini ierr = PetscFree(pcbddc->mat_graph->adjncy);CHKERRQ(ierr); 714da1bb401SStefano Zampini ierr = PetscFree(pcbddc->mat_graph->neighbours_set[0]);CHKERRQ(ierr); 715da1bb401SStefano Zampini ierr = PetscFree(pcbddc->mat_graph->neighbours_set);CHKERRQ(ierr); 7163972b0daSStefano Zampini ierr = PetscFree4(pcbddc->mat_graph->where,pcbddc->mat_graph->count,pcbddc->mat_graph->cptr,pcbddc->mat_graph->queue);CHKERRQ(ierr); 7173972b0daSStefano Zampini ierr = PetscFree2(pcbddc->mat_graph->which_dof,pcbddc->mat_graph->touched);CHKERRQ(ierr); 7183972b0daSStefano Zampini ierr = PetscFree(pcbddc->mat_graph->where_ncmps);CHKERRQ(ierr); 719da1bb401SStefano Zampini ierr = PetscFree(pcbddc->mat_graph);CHKERRQ(ierr); 7203425bc38SStefano Zampini /* remove functions */ 7213425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDirichletBoundaries_C","",PETSC_NULL);CHKERRQ(ierr); 7223425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNeumannBoundaries_C","",PETSC_NULL);CHKERRQ(ierr); 7233425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetDirichletBoundaries_C","",PETSC_NULL);CHKERRQ(ierr); 7243425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetNeumannBoundaries_C","",PETSC_NULL);CHKERRQ(ierr); 7253425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseProblemType_C","",PETSC_NULL);CHKERRQ(ierr); 7263425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDofsSplitting_C","",PETSC_NULL);CHKERRQ(ierr); 7273425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetLocalAdjacencyGraph_C","",PETSC_NULL);CHKERRQ(ierr); 7283425bc38SStefano Zampini ierr = 
PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPreSolve_C","",PETSC_NULL);CHKERRQ(ierr); 7293425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPostSolve_C","",PETSC_NULL);CHKERRQ(ierr); 7303425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCCreateFETIDPOperators_C","",PETSC_NULL);CHKERRQ(ierr); 7313425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetRHS_C","",PETSC_NULL);CHKERRQ(ierr); 7323425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetSolution_C","",PETSC_NULL);CHKERRQ(ierr); 733da1bb401SStefano Zampini /* Free the private data structure that was hanging off the PC */ 734da1bb401SStefano Zampini ierr = PetscFree(pcbddc);CHKERRQ(ierr); 735da1bb401SStefano Zampini PetscFunctionReturn(0); 736da1bb401SStefano Zampini } 7373425bc38SStefano Zampini /* -------------------------------------------------------------------------- */ 7383425bc38SStefano Zampini EXTERN_C_BEGIN 7393425bc38SStefano Zampini #undef __FUNCT__ 7403425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetRHS_BDDC" 7413425bc38SStefano Zampini static PetscErrorCode PCBDDCMatFETIDPGetRHS_BDDC(Mat fetidp_mat, Vec standard_rhs, Vec fetidp_flux_rhs) 7423425bc38SStefano Zampini { 7433425bc38SStefano Zampini FETIDPMat_ctx *mat_ctx; 7443425bc38SStefano Zampini PC_IS* pcis; 7453425bc38SStefano Zampini PC_BDDC* pcbddc; 7463425bc38SStefano Zampini Mat_IS* matis; 7473425bc38SStefano Zampini PetscErrorCode ierr; 7480c7d97c5SJed Brown 7493425bc38SStefano Zampini PetscFunctionBegin; 7503425bc38SStefano Zampini ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr); 7513425bc38SStefano Zampini pcis = (PC_IS*)mat_ctx->pc->data; 7523425bc38SStefano Zampini pcbddc = (PC_BDDC*)mat_ctx->pc->data; 7533425bc38SStefano Zampini matis = (Mat_IS*)mat_ctx->pc->pmat->data; 7543425bc38SStefano Zampini 7553425bc38SStefano Zampini /* change of 
basis for physical rhs if needed 7563425bc38SStefano Zampini It also changes the rhs in case of dirichlet boundaries */ 7573425bc38SStefano Zampini (*mat_ctx->pc->ops->presolve)(mat_ctx->pc,PETSC_NULL,standard_rhs,PETSC_NULL); 7583425bc38SStefano Zampini /* store vectors for computation of fetidp final solution */ 7593425bc38SStefano Zampini ierr = VecScatterBegin(pcis->global_to_D,standard_rhs,mat_ctx->temp_solution_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 7603425bc38SStefano Zampini ierr = VecScatterEnd (pcis->global_to_D,standard_rhs,mat_ctx->temp_solution_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 7613425bc38SStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 7623425bc38SStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 7633425bc38SStefano Zampini /* scale rhs since it should be unassembled */ 7643425bc38SStefano Zampini ierr = VecPointwiseMult(mat_ctx->temp_solution_B,pcis->D,mat_ctx->temp_solution_B);CHKERRQ(ierr); 7653425bc38SStefano Zampini if(!pcbddc->prec_type) { 7663425bc38SStefano Zampini /* compute partially subassembled Schur complement right-hand side */ 7673425bc38SStefano Zampini ierr = KSPSolve(pcbddc->ksp_D,mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr); 7683425bc38SStefano Zampini ierr = MatMult(pcis->A_BI,pcis->vec1_D,pcis->vec1_B);CHKERRQ(ierr); 7693425bc38SStefano Zampini ierr = VecAXPY(mat_ctx->temp_solution_B,-1.0,pcis->vec1_B);CHKERRQ(ierr); 7703425bc38SStefano Zampini ierr = VecSet(standard_rhs,0.0);CHKERRQ(ierr); 7713425bc38SStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,mat_ctx->temp_solution_B,standard_rhs,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 7723425bc38SStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,mat_ctx->temp_solution_B,standard_rhs,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 7733425bc38SStefano Zampini ierr = 
VecScatterBegin(pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 7743425bc38SStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 7753425bc38SStefano Zampini ierr = VecPointwiseMult(mat_ctx->temp_solution_B,pcis->D,mat_ctx->temp_solution_B);CHKERRQ(ierr); 7763425bc38SStefano Zampini } 7773425bc38SStefano Zampini /* BDDC rhs */ 7783425bc38SStefano Zampini ierr = VecCopy(mat_ctx->temp_solution_B,pcis->vec1_B);CHKERRQ(ierr); 7793425bc38SStefano Zampini if(pcbddc->prec_type) { 7803425bc38SStefano Zampini ierr = VecCopy(mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr); 7813425bc38SStefano Zampini } 7823425bc38SStefano Zampini /* apply BDDC */ 7833425bc38SStefano Zampini ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr); 7843425bc38SStefano Zampini /* Application of B_delta and assembling of rhs for fetidp fluxes */ 7853425bc38SStefano Zampini ierr = VecSet(fetidp_flux_rhs,0.0);CHKERRQ(ierr); 7863425bc38SStefano Zampini ierr = MatMult(mat_ctx->B_delta,pcis->vec1_B,mat_ctx->lambda_local);CHKERRQ(ierr); 7873425bc38SStefano Zampini ierr = VecScatterBegin(mat_ctx->l2g_lambda,mat_ctx->lambda_local,fetidp_flux_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 7883425bc38SStefano Zampini ierr = VecScatterEnd (mat_ctx->l2g_lambda,mat_ctx->lambda_local,fetidp_flux_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 7893425bc38SStefano Zampini /* restore original rhs */ 7903425bc38SStefano Zampini ierr = VecCopy(pcbddc->original_rhs,standard_rhs);CHKERRQ(ierr); 7913425bc38SStefano Zampini PetscFunctionReturn(0); 7923425bc38SStefano Zampini } 7933425bc38SStefano Zampini EXTERN_C_END 7943425bc38SStefano Zampini #undef __FUNCT__ 7953425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetRHS" 7963425bc38SStefano Zampini /*@ 7973425bc38SStefano Zampini PCBDDCMatFETIDPGetRHS - Get rhs for FETIDP linear system. 
7983425bc38SStefano Zampini 7993425bc38SStefano Zampini Collective 8003425bc38SStefano Zampini 8013425bc38SStefano Zampini Input Parameters: 8023425bc38SStefano Zampini + fetidp_mat - the FETIDP mat obtained by a call to PCBDDCCreateFETIDPOperators 8033425bc38SStefano Zampini + standard_rhs - the rhs of your linear system 8043425bc38SStefano Zampini 8053425bc38SStefano Zampini Output Parameters: 8063425bc38SStefano Zampini + fetidp_flux_rhs - the rhs of the FETIDP linear system 8073425bc38SStefano Zampini 8083425bc38SStefano Zampini Level: developer 8093425bc38SStefano Zampini 8103425bc38SStefano Zampini Notes: 8113425bc38SStefano Zampini 8123425bc38SStefano Zampini .seealso: PCBDDC 8133425bc38SStefano Zampini @*/ 8143425bc38SStefano Zampini PetscErrorCode PCBDDCMatFETIDPGetRHS(Mat fetidp_mat, Vec standard_rhs, Vec fetidp_flux_rhs) 8153425bc38SStefano Zampini { 8163425bc38SStefano Zampini FETIDPMat_ctx *mat_ctx; 8173425bc38SStefano Zampini PetscErrorCode ierr; 8183425bc38SStefano Zampini 8193425bc38SStefano Zampini PetscFunctionBegin; 8203425bc38SStefano Zampini ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr); 8213425bc38SStefano Zampini ierr = PetscTryMethod(mat_ctx->pc,"PCBDDCMatFETIDPGetRHS_C",(Mat,Vec,Vec),(fetidp_mat,standard_rhs,fetidp_flux_rhs));CHKERRQ(ierr); 8223425bc38SStefano Zampini PetscFunctionReturn(0); 8233425bc38SStefano Zampini } 8243425bc38SStefano Zampini /* -------------------------------------------------------------------------- */ 8253425bc38SStefano Zampini EXTERN_C_BEGIN 8263425bc38SStefano Zampini #undef __FUNCT__ 8273425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetSolution_BDDC" 8283425bc38SStefano Zampini static PetscErrorCode PCBDDCMatFETIDPGetSolution_BDDC(Mat fetidp_mat, Vec fetidp_flux_sol, Vec standard_sol) 8293425bc38SStefano Zampini { 8303425bc38SStefano Zampini FETIDPMat_ctx *mat_ctx; 8313425bc38SStefano Zampini PC_IS* pcis; 8323425bc38SStefano Zampini PC_BDDC* pcbddc; 8333425bc38SStefano Zampini 
Mat_IS* matis; 8343425bc38SStefano Zampini PetscErrorCode ierr; 8353425bc38SStefano Zampini 8363425bc38SStefano Zampini PetscFunctionBegin; 8373425bc38SStefano Zampini ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr); 8383425bc38SStefano Zampini pcis = (PC_IS*)mat_ctx->pc->data; 8393425bc38SStefano Zampini pcbddc = (PC_BDDC*)mat_ctx->pc->data; 8403425bc38SStefano Zampini matis = (Mat_IS*)mat_ctx->pc->pmat->data; 8413425bc38SStefano Zampini 8423425bc38SStefano Zampini /* apply B_delta^T */ 8433425bc38SStefano Zampini ierr = VecScatterBegin(mat_ctx->l2g_lambda,fetidp_flux_sol,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8443425bc38SStefano Zampini ierr = VecScatterEnd (mat_ctx->l2g_lambda,fetidp_flux_sol,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8453425bc38SStefano Zampini ierr = MatMultTranspose(mat_ctx->B_delta,mat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr); 8463425bc38SStefano Zampini /* compute rhs for BDDC application */ 8473425bc38SStefano Zampini ierr = VecAYPX(pcis->vec1_B,-1.0,mat_ctx->temp_solution_B);CHKERRQ(ierr); 8483425bc38SStefano Zampini if(pcbddc->prec_type) { 8493425bc38SStefano Zampini ierr = VecCopy(mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr); 8503425bc38SStefano Zampini } 8513425bc38SStefano Zampini /* apply BDDC */ 8523425bc38SStefano Zampini ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr); 8533425bc38SStefano Zampini /* put values into standard global vector */ 8543425bc38SStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8553425bc38SStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,pcis->vec1_B,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8563425bc38SStefano Zampini if(!pcbddc->prec_type) { 8573425bc38SStefano Zampini /* compute values into the interior if solved for the partially subassembled Schur complement */ 8583425bc38SStefano Zampini ierr = 
MatMult(pcis->A_IB,pcis->vec1_B,pcis->vec1_D);CHKERRQ(ierr); 8593425bc38SStefano Zampini ierr = VecAXPY(mat_ctx->temp_solution_D,-1.0,pcis->vec1_D);CHKERRQ(ierr); 8603425bc38SStefano Zampini ierr = KSPSolve(pcbddc->ksp_D,mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr); 8613425bc38SStefano Zampini } 8623425bc38SStefano Zampini ierr = VecScatterBegin(pcis->global_to_D,pcis->vec1_D,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8633425bc38SStefano Zampini ierr = VecScatterEnd (pcis->global_to_D,pcis->vec1_D,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8643425bc38SStefano Zampini /* final change of basis if needed 8653425bc38SStefano Zampini Is also sums the dirichlet part removed during RHS assembling */ 8663425bc38SStefano Zampini (*mat_ctx->pc->ops->postsolve)(mat_ctx->pc,PETSC_NULL,PETSC_NULL,standard_sol); 8673425bc38SStefano Zampini PetscFunctionReturn(0); 8683425bc38SStefano Zampini 8693425bc38SStefano Zampini } 8703425bc38SStefano Zampini EXTERN_C_END 8713425bc38SStefano Zampini #undef __FUNCT__ 8723425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetSolution" 8733425bc38SStefano Zampini /*@ 8743425bc38SStefano Zampini PCBDDCMatFETIDPGetSolution - Get Solution for FETIDP linear system. 
8753425bc38SStefano Zampini 8763425bc38SStefano Zampini Collective 8773425bc38SStefano Zampini 8783425bc38SStefano Zampini Input Parameters: 8793425bc38SStefano Zampini + fetidp_mat - the FETIDP mat obtained by a call to PCBDDCCreateFETIDPOperators 8803425bc38SStefano Zampini + fetidp_flux_sol - the solution of the FETIDP linear system 8813425bc38SStefano Zampini 8823425bc38SStefano Zampini Output Parameters: 8833425bc38SStefano Zampini + standard_sol - the solution on the global domain 8843425bc38SStefano Zampini 8853425bc38SStefano Zampini Level: developer 8863425bc38SStefano Zampini 8873425bc38SStefano Zampini Notes: 8883425bc38SStefano Zampini 8893425bc38SStefano Zampini .seealso: PCBDDC 8903425bc38SStefano Zampini @*/ 8913425bc38SStefano Zampini PetscErrorCode PCBDDCMatFETIDPGetSolution(Mat fetidp_mat, Vec fetidp_flux_sol, Vec standard_sol) 8923425bc38SStefano Zampini { 8933425bc38SStefano Zampini FETIDPMat_ctx *mat_ctx; 8943425bc38SStefano Zampini PetscErrorCode ierr; 8953425bc38SStefano Zampini 8963425bc38SStefano Zampini PetscFunctionBegin; 8973425bc38SStefano Zampini ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr); 8983425bc38SStefano Zampini ierr = PetscTryMethod(mat_ctx->pc,"PCBDDCMatFETIDPGetSolution_C",(Mat,Vec,Vec),(fetidp_mat,fetidp_flux_sol,standard_sol));CHKERRQ(ierr); 8993425bc38SStefano Zampini PetscFunctionReturn(0); 9003425bc38SStefano Zampini } 9013425bc38SStefano Zampini /* -------------------------------------------------------------------------- */ 9023425bc38SStefano Zampini EXTERN_C_BEGIN 9033425bc38SStefano Zampini #undef __FUNCT__ 9043425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPOperators_BDDC" 9053425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPOperators_BDDC(PC pc, Mat *fetidp_mat, PC *fetidp_pc) 9063425bc38SStefano Zampini { 9073425bc38SStefano Zampini PETSC_EXTERN PetscErrorCode FETIDPMatMult(Mat,Vec,Vec); 9083425bc38SStefano Zampini PETSC_EXTERN PetscErrorCode 
PCBDDCDestroyFETIDPMat(Mat); 9093425bc38SStefano Zampini PETSC_EXTERN PetscErrorCode FETIDPPCApply(PC,Vec,Vec); 9103425bc38SStefano Zampini PETSC_EXTERN PetscErrorCode PCBDDCDestroyFETIDPPC(PC); 9113425bc38SStefano Zampini 9123425bc38SStefano Zampini FETIDPMat_ctx *fetidpmat_ctx; 9133425bc38SStefano Zampini Mat newmat; 9143425bc38SStefano Zampini FETIDPPC_ctx *fetidppc_ctx; 9153425bc38SStefano Zampini PC newpc; 9163425bc38SStefano Zampini MPI_Comm comm = ((PetscObject)pc)->comm; 9173425bc38SStefano Zampini PetscErrorCode ierr; 9183425bc38SStefano Zampini 9193425bc38SStefano Zampini PetscFunctionBegin; 9203425bc38SStefano Zampini /* FETIDP linear matrix */ 9213425bc38SStefano Zampini ierr = PCBDDCCreateFETIDPMatContext(pc, &fetidpmat_ctx);CHKERRQ(ierr); 9223425bc38SStefano Zampini ierr = PCBDDCSetupFETIDPMatContext(fetidpmat_ctx);CHKERRQ(ierr); 9233425bc38SStefano Zampini ierr = MatCreateShell(comm,PETSC_DECIDE,PETSC_DECIDE,fetidpmat_ctx->n_lambda,fetidpmat_ctx->n_lambda,fetidpmat_ctx,&newmat);CHKERRQ(ierr); 9243425bc38SStefano Zampini ierr = MatShellSetOperation(newmat,MATOP_MULT,(void (*)(void))FETIDPMatMult);CHKERRQ(ierr); 9253425bc38SStefano Zampini ierr = MatShellSetOperation(newmat,MATOP_DESTROY,(void (*)(void))PCBDDCDestroyFETIDPMat);CHKERRQ(ierr); 9263425bc38SStefano Zampini ierr = MatSetUp(newmat);CHKERRQ(ierr); 9273425bc38SStefano Zampini /* FETIDP preconditioner */ 9283425bc38SStefano Zampini ierr = PCBDDCCreateFETIDPPCContext(pc, &fetidppc_ctx);CHKERRQ(ierr); 9293425bc38SStefano Zampini ierr = PCBDDCSetupFETIDPPCContext(newmat,fetidppc_ctx);CHKERRQ(ierr); 9303425bc38SStefano Zampini ierr = PCCreate(comm,&newpc);CHKERRQ(ierr); 9313425bc38SStefano Zampini ierr = PCSetType(newpc,PCSHELL);CHKERRQ(ierr); 9323425bc38SStefano Zampini ierr = PCShellSetContext(newpc,fetidppc_ctx);CHKERRQ(ierr); 9333425bc38SStefano Zampini ierr = PCShellSetApply(newpc,FETIDPPCApply);CHKERRQ(ierr); 9343425bc38SStefano Zampini ierr = 
PCShellSetDestroy(newpc,PCBDDCDestroyFETIDPPC);CHKERRQ(ierr); 9353425bc38SStefano Zampini ierr = PCSetOperators(newpc,newmat,newmat,SAME_PRECONDITIONER);CHKERRQ(ierr); 9363425bc38SStefano Zampini ierr = PCSetUp(newpc);CHKERRQ(ierr); 9373425bc38SStefano Zampini /* return pointers for objects created */ 9383425bc38SStefano Zampini *fetidp_mat=newmat; 9393425bc38SStefano Zampini *fetidp_pc=newpc; 9403425bc38SStefano Zampini 9413425bc38SStefano Zampini PetscFunctionReturn(0); 9423425bc38SStefano Zampini } 9433425bc38SStefano Zampini EXTERN_C_END 9443425bc38SStefano Zampini #undef __FUNCT__ 9453425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPOperators" 9463425bc38SStefano Zampini /*@ 9473425bc38SStefano Zampini PCBDDCCreateFETIDPOperators - Create operators for FETIDP. 9483425bc38SStefano Zampini 9493425bc38SStefano Zampini Collective 9503425bc38SStefano Zampini 9513425bc38SStefano Zampini Input Parameters: 9523425bc38SStefano Zampini + pc - the BDDC preconditioning context (setup must be already called) 9533425bc38SStefano Zampini 9543425bc38SStefano Zampini Level: developer 9553425bc38SStefano Zampini 9563425bc38SStefano Zampini Notes: 9573425bc38SStefano Zampini 9583425bc38SStefano Zampini .seealso: PCBDDC 9593425bc38SStefano Zampini @*/ 9603425bc38SStefano Zampini PetscErrorCode PCBDDCCreateFETIDPOperators(PC pc, Mat *fetidp_mat, PC *fetidp_pc) 9613425bc38SStefano Zampini { 9623425bc38SStefano Zampini PetscErrorCode ierr; 9633425bc38SStefano Zampini 9643425bc38SStefano Zampini PetscFunctionBegin; 9653425bc38SStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 9663425bc38SStefano Zampini if (pc->setupcalled) { 9673425bc38SStefano Zampini ierr = PetscTryMethod(pc,"PCBDDCCreateFETIDPOperators_C",(PC,Mat*,PC*),(pc,fetidp_mat,fetidp_pc));CHKERRQ(ierr); 9683425bc38SStefano Zampini } else { 9693425bc38SStefano Zampini SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"You must call PCSetup_BDDC before calling %s\n",__FUNCT__); 9703425bc38SStefano Zampini } 
9713425bc38SStefano Zampini PetscFunctionReturn(0); 9723425bc38SStefano Zampini } 9730c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 974da1bb401SStefano Zampini /*MC 975da1bb401SStefano Zampini PCBDDC - Balancing Domain Decomposition by Constraints. 9760c7d97c5SJed Brown 977da1bb401SStefano Zampini Options Database Keys: 978da1bb401SStefano Zampini . -pcbddc ??? - 979da1bb401SStefano Zampini 980da1bb401SStefano Zampini Level: intermediate 981da1bb401SStefano Zampini 982da1bb401SStefano Zampini Notes: The matrix used with this preconditioner must be of type MATIS 983da1bb401SStefano Zampini 984da1bb401SStefano Zampini Unlike more 'conventional' interface preconditioners, this iterates over ALL the 985da1bb401SStefano Zampini degrees of freedom, NOT just those on the interface (this allows the use of approximate solvers 986da1bb401SStefano Zampini on the subdomains). 987da1bb401SStefano Zampini 988da1bb401SStefano Zampini Options for the coarse grid preconditioner can be set with - 989da1bb401SStefano Zampini Options for the Dirichlet subproblem can be set with - 990da1bb401SStefano Zampini Options for the Neumann subproblem can be set with - 991da1bb401SStefano Zampini 992da1bb401SStefano Zampini Contributed by Stefano Zampini 993da1bb401SStefano Zampini 994da1bb401SStefano Zampini .seealso: PCCreate(), PCSetType(), PCType (for list of available types), PC, MATIS 995da1bb401SStefano Zampini M*/ 996da1bb401SStefano Zampini EXTERN_C_BEGIN 997da1bb401SStefano Zampini #undef __FUNCT__ 998da1bb401SStefano Zampini #define __FUNCT__ "PCCreate_BDDC" 999da1bb401SStefano Zampini PetscErrorCode PCCreate_BDDC(PC pc) 1000da1bb401SStefano Zampini { 1001da1bb401SStefano Zampini PetscErrorCode ierr; 1002da1bb401SStefano Zampini PC_BDDC *pcbddc; 1003da1bb401SStefano Zampini PCBDDCGraph mat_graph; 1004da1bb401SStefano Zampini 1005da1bb401SStefano Zampini PetscFunctionBegin; 1006da1bb401SStefano Zampini /* Creates the private data 
structure for this preconditioner and attach it to the PC object. */ 1007da1bb401SStefano Zampini ierr = PetscNewLog(pc,PC_BDDC,&pcbddc);CHKERRQ(ierr); 1008da1bb401SStefano Zampini pc->data = (void*)pcbddc; 1009da1bb401SStefano Zampini 1010da1bb401SStefano Zampini /* create PCIS data structure */ 1011da1bb401SStefano Zampini ierr = PCISCreate(pc);CHKERRQ(ierr); 1012da1bb401SStefano Zampini 1013da1bb401SStefano Zampini /* BDDC specific */ 10143972b0daSStefano Zampini pcbddc->temp_solution = 0; 1015534831adSStefano Zampini pcbddc->original_rhs = 0; 1016534831adSStefano Zampini pcbddc->local_mat = 0; 1017534831adSStefano Zampini pcbddc->ChangeOfBasisMatrix = 0; 1018534831adSStefano Zampini pcbddc->usechangeofbasis = PETSC_TRUE; 1019534831adSStefano Zampini pcbddc->usechangeonfaces = PETSC_FALSE; 1020da1bb401SStefano Zampini pcbddc->coarse_vec = 0; 1021da1bb401SStefano Zampini pcbddc->coarse_rhs = 0; 1022da1bb401SStefano Zampini pcbddc->coarse_ksp = 0; 1023da1bb401SStefano Zampini pcbddc->coarse_phi_B = 0; 1024da1bb401SStefano Zampini pcbddc->coarse_phi_D = 0; 1025da1bb401SStefano Zampini pcbddc->vec1_P = 0; 1026da1bb401SStefano Zampini pcbddc->vec1_R = 0; 1027da1bb401SStefano Zampini pcbddc->vec2_R = 0; 1028da1bb401SStefano Zampini pcbddc->local_auxmat1 = 0; 1029da1bb401SStefano Zampini pcbddc->local_auxmat2 = 0; 1030da1bb401SStefano Zampini pcbddc->R_to_B = 0; 1031da1bb401SStefano Zampini pcbddc->R_to_D = 0; 1032da1bb401SStefano Zampini pcbddc->ksp_D = 0; 1033da1bb401SStefano Zampini pcbddc->ksp_R = 0; 1034da1bb401SStefano Zampini pcbddc->local_primal_indices = 0; 1035da1bb401SStefano Zampini pcbddc->prec_type = PETSC_FALSE; 1036da1bb401SStefano Zampini pcbddc->NeumannBoundaries = 0; 1037da1bb401SStefano Zampini pcbddc->ISForDofs = 0; 1038da1bb401SStefano Zampini pcbddc->ISForVertices = 0; 1039da1bb401SStefano Zampini pcbddc->n_ISForFaces = 0; 1040da1bb401SStefano Zampini pcbddc->n_ISForEdges = 0; 1041da1bb401SStefano Zampini pcbddc->ConstraintMatrix = 0; 
1042da1bb401SStefano Zampini pcbddc->use_nnsp_true = PETSC_FALSE; 1043da1bb401SStefano Zampini pcbddc->local_primal_sizes = 0; 1044da1bb401SStefano Zampini pcbddc->local_primal_displacements = 0; 1045da1bb401SStefano Zampini pcbddc->replicated_local_primal_indices = 0; 1046da1bb401SStefano Zampini pcbddc->replicated_local_primal_values = 0; 1047da1bb401SStefano Zampini pcbddc->coarse_loc_to_glob = 0; 1048da1bb401SStefano Zampini pcbddc->dbg_flag = PETSC_FALSE; 1049da1bb401SStefano Zampini pcbddc->coarsening_ratio = 8; 1050da1bb401SStefano Zampini 1051da1bb401SStefano Zampini /* allocate and initialize needed graph structure */ 1052da1bb401SStefano Zampini ierr = PetscMalloc(sizeof(*mat_graph),&pcbddc->mat_graph);CHKERRQ(ierr); 1053da1bb401SStefano Zampini pcbddc->mat_graph->xadj = 0; 1054da1bb401SStefano Zampini pcbddc->mat_graph->adjncy = 0; 1055da1bb401SStefano Zampini 1056da1bb401SStefano Zampini /* function pointers */ 1057da1bb401SStefano Zampini pc->ops->apply = PCApply_BDDC; 1058da1bb401SStefano Zampini pc->ops->applytranspose = 0; 1059da1bb401SStefano Zampini pc->ops->setup = PCSetUp_BDDC; 1060da1bb401SStefano Zampini pc->ops->destroy = PCDestroy_BDDC; 1061da1bb401SStefano Zampini pc->ops->setfromoptions = PCSetFromOptions_BDDC; 1062da1bb401SStefano Zampini pc->ops->view = 0; 1063da1bb401SStefano Zampini pc->ops->applyrichardson = 0; 1064da1bb401SStefano Zampini pc->ops->applysymmetricleft = 0; 1065da1bb401SStefano Zampini pc->ops->applysymmetricright = 0; 1066534831adSStefano Zampini pc->ops->presolve = PCPreSolve_BDDC; 1067534831adSStefano Zampini pc->ops->postsolve = PCPostSolve_BDDC; 1068da1bb401SStefano Zampini 1069da1bb401SStefano Zampini /* composing function */ 1070da1bb401SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDirichletBoundaries_C","PCBDDCSetDirichletBoundaries_BDDC", 1071da1bb401SStefano Zampini PCBDDCSetDirichletBoundaries_BDDC);CHKERRQ(ierr); 1072da1bb401SStefano Zampini ierr = 
PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNeumannBoundaries_C","PCBDDCSetNeumannBoundaries_BDDC", 1073da1bb401SStefano Zampini PCBDDCSetNeumannBoundaries_BDDC);CHKERRQ(ierr); 1074da1bb401SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetDirichletBoundaries_C","PCBDDCGetDirichletBoundaries_BDDC", 1075da1bb401SStefano Zampini PCBDDCGetDirichletBoundaries_BDDC);CHKERRQ(ierr); 1076da1bb401SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetNeumannBoundaries_C","PCBDDCGetNeumannBoundaries_BDDC", 1077da1bb401SStefano Zampini PCBDDCGetNeumannBoundaries_BDDC);CHKERRQ(ierr); 1078da1bb401SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseProblemType_C","PCBDDCSetCoarseProblemType_BDDC", 1079da1bb401SStefano Zampini PCBDDCSetCoarseProblemType_BDDC);CHKERRQ(ierr); 1080da1bb401SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDofsSplitting_C","PCBDDCSetDofsSplitting_BDDC", 1081da1bb401SStefano Zampini PCBDDCSetDofsSplitting_BDDC);CHKERRQ(ierr); 1082da1bb401SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetLocalAdjacencyGraph_C","PCBDDCSetLocalAdjacencyGraph_BDDC", 1083da1bb401SStefano Zampini PCBDDCSetLocalAdjacencyGraph_BDDC);CHKERRQ(ierr); 1084534831adSStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPreSolve_C","PCPreSolve_BDDC", 1085534831adSStefano Zampini PCPreSolve_BDDC);CHKERRQ(ierr); 1086534831adSStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPostSolve_C","PCPostSolve_BDDC", 1087534831adSStefano Zampini PCPostSolve_BDDC);CHKERRQ(ierr); 10883425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCCreateFETIDPOperators_C","PCBDDCCreateFETIDPOperators_BDDC", 10893425bc38SStefano Zampini PCBDDCCreateFETIDPOperators_BDDC);CHKERRQ(ierr); 10903425bc38SStefano Zampini ierr = 
PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetRHS_C","PCBDDCMatFETIDPGetRHS_BDDC", 10913425bc38SStefano Zampini PCBDDCMatFETIDPGetRHS_BDDC);CHKERRQ(ierr); 10923425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetSolution_C","PCBDDCMatFETIDPGetSolution_BDDC", 10933425bc38SStefano Zampini PCBDDCMatFETIDPGetSolution_BDDC);CHKERRQ(ierr); 1094da1bb401SStefano Zampini PetscFunctionReturn(0); 1095da1bb401SStefano Zampini } 1096da1bb401SStefano Zampini EXTERN_C_END 10973425bc38SStefano Zampini 1098da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */ 1099da1bb401SStefano Zampini /* All static functions from now on */ 1100da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */ 11013425bc38SStefano Zampini 11023425bc38SStefano Zampini #undef __FUNCT__ 11033425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPMatContext" 11043425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPMatContext(PC pc, FETIDPMat_ctx **fetidpmat_ctx) 11053425bc38SStefano Zampini { 11063425bc38SStefano Zampini FETIDPMat_ctx *newctx; 11073425bc38SStefano Zampini PetscErrorCode ierr; 11083425bc38SStefano Zampini 11093425bc38SStefano Zampini PetscFunctionBegin; 11103425bc38SStefano Zampini ierr = PetscMalloc(sizeof(*newctx),&newctx);CHKERRQ(ierr); 11113425bc38SStefano Zampini newctx->lambda_local = 0; 11123425bc38SStefano Zampini newctx->temp_solution_B = 0; 11133425bc38SStefano Zampini newctx->temp_solution_D = 0; 11143425bc38SStefano Zampini newctx->B_delta = 0; 11153425bc38SStefano Zampini newctx->B_Ddelta = 0; /* theoretically belongs to the FETIDP preconditioner */ 11163425bc38SStefano Zampini newctx->l2g_lambda = 0; 11173425bc38SStefano Zampini /* increase the reference count for BDDC preconditioner */ 11183425bc38SStefano Zampini ierr = PetscObjectReference((PetscObject)pc);CHKERRQ(ierr); 11193425bc38SStefano 
Zampini newctx->pc = pc; 11203425bc38SStefano Zampini *fetidpmat_ctx = newctx; 11213425bc38SStefano Zampini PetscFunctionReturn(0); 11223425bc38SStefano Zampini } 11233425bc38SStefano Zampini 11243425bc38SStefano Zampini #undef __FUNCT__ 11253425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPPCContext" 11263425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPPCContext(PC pc, FETIDPPC_ctx **fetidppc_ctx) 11273425bc38SStefano Zampini { 11283425bc38SStefano Zampini FETIDPPC_ctx *newctx; 11293425bc38SStefano Zampini PetscErrorCode ierr; 11303425bc38SStefano Zampini 11313425bc38SStefano Zampini PetscFunctionBegin; 11323425bc38SStefano Zampini ierr = PetscMalloc(sizeof(*newctx),&newctx);CHKERRQ(ierr); 11333425bc38SStefano Zampini newctx->lambda_local = 0; 11343425bc38SStefano Zampini newctx->B_Ddelta = 0; 11353425bc38SStefano Zampini newctx->l2g_lambda = 0; 11363425bc38SStefano Zampini /* increase the reference count for BDDC preconditioner */ 11373425bc38SStefano Zampini ierr = PetscObjectReference((PetscObject)pc);CHKERRQ(ierr); 11383425bc38SStefano Zampini newctx->pc = pc; 11393425bc38SStefano Zampini *fetidppc_ctx = newctx; 11403425bc38SStefano Zampini PetscFunctionReturn(0); 11413425bc38SStefano Zampini } 11423425bc38SStefano Zampini 11433425bc38SStefano Zampini #undef __FUNCT__ 11443425bc38SStefano Zampini #define __FUNCT__ "PCBDDCDestroyFETIDPMat" 11453425bc38SStefano Zampini static PetscErrorCode PCBDDCDestroyFETIDPMat(Mat A) 11463425bc38SStefano Zampini { 11473425bc38SStefano Zampini FETIDPMat_ctx *mat_ctx; 11483425bc38SStefano Zampini PetscErrorCode ierr; 11493425bc38SStefano Zampini 11503425bc38SStefano Zampini PetscFunctionBegin; 11513425bc38SStefano Zampini ierr = MatShellGetContext(A,(void**)&mat_ctx);CHKERRQ(ierr); 11523425bc38SStefano Zampini ierr = VecDestroy(&mat_ctx->lambda_local);CHKERRQ(ierr); 11533425bc38SStefano Zampini ierr = VecDestroy(&mat_ctx->temp_solution_D);CHKERRQ(ierr); 11543425bc38SStefano Zampini ierr = 
VecDestroy(&mat_ctx->temp_solution_B);CHKERRQ(ierr); 11553425bc38SStefano Zampini ierr = MatDestroy(&mat_ctx->B_delta);CHKERRQ(ierr); 11563425bc38SStefano Zampini ierr = MatDestroy(&mat_ctx->B_Ddelta);CHKERRQ(ierr); 11573425bc38SStefano Zampini ierr = VecScatterDestroy(&mat_ctx->l2g_lambda);CHKERRQ(ierr); 11583425bc38SStefano Zampini ierr = PCDestroy(&mat_ctx->pc);CHKERRQ(ierr); /* actually it does not destroy BDDC, only decrease its reference count */ 11593425bc38SStefano Zampini ierr = PetscFree(mat_ctx);CHKERRQ(ierr); 11603425bc38SStefano Zampini PetscFunctionReturn(0); 11613425bc38SStefano Zampini } 11623425bc38SStefano Zampini 11633425bc38SStefano Zampini #undef __FUNCT__ 11643425bc38SStefano Zampini #define __FUNCT__ "PCBDDCDestroyFETIDPPC" 11653425bc38SStefano Zampini static PetscErrorCode PCBDDCDestroyFETIDPPC(PC pc) 11663425bc38SStefano Zampini { 11673425bc38SStefano Zampini FETIDPPC_ctx *pc_ctx; 11683425bc38SStefano Zampini PetscErrorCode ierr; 11693425bc38SStefano Zampini 11703425bc38SStefano Zampini PetscFunctionBegin; 11713425bc38SStefano Zampini ierr = PCShellGetContext(pc,(void**)&pc_ctx);CHKERRQ(ierr); 11723425bc38SStefano Zampini ierr = VecDestroy(&pc_ctx->lambda_local);CHKERRQ(ierr); 11733425bc38SStefano Zampini ierr = MatDestroy(&pc_ctx->B_Ddelta);CHKERRQ(ierr); 11743425bc38SStefano Zampini ierr = VecScatterDestroy(&pc_ctx->l2g_lambda);CHKERRQ(ierr); 11753425bc38SStefano Zampini ierr = PCDestroy(&pc_ctx->pc);CHKERRQ(ierr); /* actually it does not destroy BDDC, only decrease its reference count */ 11763425bc38SStefano Zampini ierr = PetscFree(pc_ctx);CHKERRQ(ierr); 11773425bc38SStefano Zampini PetscFunctionReturn(0); 11783425bc38SStefano Zampini } 11793425bc38SStefano Zampini 11803425bc38SStefano Zampini #undef __FUNCT__ 11813425bc38SStefano Zampini #define __FUNCT__ "PCBDDCSetupFETIDPMatContext" 11823425bc38SStefano Zampini static PetscErrorCode PCBDDCSetupFETIDPMatContext(FETIDPMat_ctx *fetidpmat_ctx ) 11833425bc38SStefano Zampini { 
11843425bc38SStefano Zampini PetscErrorCode ierr; 11853425bc38SStefano Zampini PC_IS *pcis=(PC_IS*)fetidpmat_ctx->pc->data; 11863425bc38SStefano Zampini PC_BDDC *pcbddc=(PC_BDDC*)fetidpmat_ctx->pc->data; 11873425bc38SStefano Zampini PCBDDCGraph mat_graph=pcbddc->mat_graph; 11883425bc38SStefano Zampini Mat_IS *matis = (Mat_IS*)fetidpmat_ctx->pc->pmat->data; 11893425bc38SStefano Zampini MPI_Comm comm = ((PetscObject)(fetidpmat_ctx->pc))->comm; 11903425bc38SStefano Zampini 11913425bc38SStefano Zampini Mat ScalingMat; 11923425bc38SStefano Zampini Vec lambda_global; 11933425bc38SStefano Zampini IS IS_l2g_lambda; 11943425bc38SStefano Zampini 11953425bc38SStefano Zampini PetscBool skip_node,fully_redundant; 11963425bc38SStefano Zampini PetscInt i,j,k,s,n_boundary_dofs,sum_dof_sizes,n_global_lambda,n_vertices; 11973425bc38SStefano Zampini PetscInt n_local_lambda,n_lambda_for_dof,dual_size,n_neg_values,n_pos_values; 11983425bc38SStefano Zampini PetscMPIInt rank,nprocs,partial_sum; 11993425bc38SStefano Zampini PetscScalar scalar_value; 12003425bc38SStefano Zampini 12013425bc38SStefano Zampini PetscInt *vertex_indices,*temp_indices; 12023425bc38SStefano Zampini PetscInt *dual_dofs_boundary_indices,*aux_local_numbering_1,*aux_global_numbering; 12033425bc38SStefano Zampini PetscInt *aux_sums,*cols_B_delta,*l2g_indices; 12043425bc38SStefano Zampini PetscMPIInt *aux_local_numbering_2,*aux_global_numbering_mpi,*dof_sizes,*dof_displs; 12053425bc38SStefano Zampini PetscMPIInt *all_aux_global_numbering_mpi_1,*all_aux_global_numbering_mpi_2,*global_dofs_numbering; 12063425bc38SStefano Zampini PetscScalar *array,*scaling_factors,*vals_B_delta; 12073425bc38SStefano Zampini 12083425bc38SStefano Zampini /* For communication of scaling factors */ 12093425bc38SStefano Zampini PetscInt *ptrs_buffer,neigh_position; 12103425bc38SStefano Zampini PetscScalar **all_factors,*send_buffer,*recv_buffer; 12113425bc38SStefano Zampini MPI_Request *send_reqs,*recv_reqs; 12123425bc38SStefano Zampini 
12133425bc38SStefano Zampini /* tests */ 12143425bc38SStefano Zampini Vec test_vec; 12153425bc38SStefano Zampini PetscBool test_fetidp; 12163425bc38SStefano Zampini PetscViewer viewer; 12173425bc38SStefano Zampini 12183425bc38SStefano Zampini PetscFunctionBegin; 12193425bc38SStefano Zampini ierr = MPI_Comm_rank(comm,&rank);CHKERRQ(ierr); 12203425bc38SStefano Zampini ierr = MPI_Comm_size(comm,&nprocs);CHKERRQ(ierr); 12213425bc38SStefano Zampini 12223425bc38SStefano Zampini /* Default type of lagrange multipliers is non-redundant */ 12233425bc38SStefano Zampini fully_redundant = PETSC_FALSE; 12243425bc38SStefano Zampini ierr = PetscOptionsGetBool(PETSC_NULL,"-fetidp_fullyredundant",&fully_redundant,PETSC_NULL);CHKERRQ(ierr); 12253425bc38SStefano Zampini 12263425bc38SStefano Zampini /* Evaluate local and global number of lagrange multipliers */ 12273425bc38SStefano Zampini ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr); 12283425bc38SStefano Zampini n_local_lambda = 0; 12293425bc38SStefano Zampini partial_sum = 0; 12303425bc38SStefano Zampini n_boundary_dofs = 0; 12313425bc38SStefano Zampini s = 0; 12323425bc38SStefano Zampini n_vertices = 0; 12333425bc38SStefano Zampini /* Get Vertices used to define the BDDC */ 12343425bc38SStefano Zampini ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(*vertex_indices),&vertex_indices);CHKERRQ(ierr); 12353425bc38SStefano Zampini for(i=0;i<pcbddc->local_primal_size;i++) { 12363425bc38SStefano Zampini ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&j,(const PetscInt**)&temp_indices,PETSC_NULL);CHKERRQ(ierr); 12373425bc38SStefano Zampini if(j == 1) { 12383425bc38SStefano Zampini vertex_indices[n_vertices]=temp_indices[0]; 12393425bc38SStefano Zampini n_vertices++; 12403425bc38SStefano Zampini } 12413425bc38SStefano Zampini ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&j,(const PetscInt**)&temp_indices,PETSC_NULL);CHKERRQ(ierr); 12423425bc38SStefano Zampini } 12433425bc38SStefano Zampini dual_size = pcis->n_B-n_vertices; 
12443425bc38SStefano Zampini ierr = PetscMalloc(dual_size*sizeof(*dual_dofs_boundary_indices),&dual_dofs_boundary_indices);CHKERRQ(ierr); 12453425bc38SStefano Zampini ierr = PetscMalloc(dual_size*sizeof(*aux_local_numbering_1),&aux_local_numbering_1);CHKERRQ(ierr); 12463425bc38SStefano Zampini ierr = PetscMalloc(dual_size*sizeof(*aux_local_numbering_2),&aux_local_numbering_2);CHKERRQ(ierr); 12473425bc38SStefano Zampini 12483425bc38SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 12493425bc38SStefano Zampini for(i=0;i<pcis->n;i++){ 12503425bc38SStefano Zampini j = mat_graph->count[i]; /* RECALL: mat_graph->count[i] does not count myself */ 12513425bc38SStefano Zampini k = (mat_graph->neighbours_set[i][0] == -1 ? 1 : 0); 12523425bc38SStefano Zampini j = j - k ; 12533425bc38SStefano Zampini if( j > 0 ) { n_boundary_dofs++; } 12543425bc38SStefano Zampini 12553425bc38SStefano Zampini skip_node = PETSC_FALSE; 12563425bc38SStefano Zampini if(vertex_indices[s]==i) { /* it works for a sorted set of vertices */ 12573425bc38SStefano Zampini skip_node = PETSC_TRUE; 12583425bc38SStefano Zampini s++; 12593425bc38SStefano Zampini } 12603425bc38SStefano Zampini if(j < 1) {skip_node = PETSC_TRUE;} 12613425bc38SStefano Zampini if( !skip_node ) { 12623425bc38SStefano Zampini if(fully_redundant) { 12633425bc38SStefano Zampini /* fully redundant set of lagrange multipliers */ 12643425bc38SStefano Zampini n_lambda_for_dof = (j*(j+1))/2; 12653425bc38SStefano Zampini } else { 12663425bc38SStefano Zampini n_lambda_for_dof = j; 12673425bc38SStefano Zampini } 12683425bc38SStefano Zampini n_local_lambda += j; 12693425bc38SStefano Zampini /* needed to evaluate global number of lagrange multipliers */ 12703425bc38SStefano Zampini array[i]=(1.0*n_lambda_for_dof)/(j+1.0); /* already scaled for the next global sum */ 12713425bc38SStefano Zampini /* store some data needed */ 12723425bc38SStefano Zampini dual_dofs_boundary_indices[partial_sum] = n_boundary_dofs-1; 
12733425bc38SStefano Zampini aux_local_numbering_1[partial_sum] = i; 12743425bc38SStefano Zampini aux_local_numbering_2[partial_sum] = (PetscMPIInt)n_lambda_for_dof; 12753425bc38SStefano Zampini partial_sum++; 12763425bc38SStefano Zampini } 12773425bc38SStefano Zampini } 12783425bc38SStefano Zampini /*printf("I found %d local lambda dofs\n",n_local_lambda); 12793425bc38SStefano Zampini printf("I found %d boundary dofs (should be %d)\n",n_boundary_dofs,pcis->n_B); 12803425bc38SStefano Zampini printf("Partial sum %d should be %d\n",partial_sum,dual_size);*/ 12813425bc38SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 12823425bc38SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 12833425bc38SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 12843425bc38SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 12853425bc38SStefano Zampini ierr = VecSum(pcis->vec1_global,&scalar_value);CHKERRQ(ierr); 12863425bc38SStefano Zampini fetidpmat_ctx->n_lambda = (PetscInt) scalar_value; 12873425bc38SStefano Zampini /* printf("I found %d global multipliers (%f)\n",fetidpmat_ctx->n_lambda,scalar_value); */ 12883425bc38SStefano Zampini ierr = VecCreate(PETSC_COMM_SELF,&fetidpmat_ctx->lambda_local);CHKERRQ(ierr); 12893425bc38SStefano Zampini ierr = VecSetSizes(fetidpmat_ctx->lambda_local,n_local_lambda,n_local_lambda);CHKERRQ(ierr); 12903425bc38SStefano Zampini ierr = VecSetType(fetidpmat_ctx->lambda_local,VECSEQ);CHKERRQ(ierr); 12913425bc38SStefano Zampini ierr = VecCreate(comm,&lambda_global);CHKERRQ(ierr); 12923425bc38SStefano Zampini ierr = VecSetSizes(lambda_global,PETSC_DECIDE,fetidpmat_ctx->n_lambda);CHKERRQ(ierr); 12933425bc38SStefano Zampini ierr = VecSetType(lambda_global,VECMPI);CHKERRQ(ierr); 12943425bc38SStefano Zampini 12953425bc38SStefano Zampini /* compute global ordering of lagrange 
multipliers and associate l2g map */ 12963425bc38SStefano Zampini 12973425bc38SStefano Zampini ierr = PetscMalloc(dual_size*sizeof(*aux_global_numbering),&aux_global_numbering);CHKERRQ(ierr); 12983425bc38SStefano Zampini ierr = PetscMalloc(dual_size*sizeof(*aux_global_numbering_mpi),&aux_global_numbering_mpi);CHKERRQ(ierr); 12993425bc38SStefano Zampini j = (rank == 0 ? nprocs : 0); 13003425bc38SStefano Zampini ierr = PetscMalloc(j*sizeof(*dof_sizes),&dof_sizes);CHKERRQ(ierr); 13013425bc38SStefano Zampini ierr = PetscMalloc(j*sizeof(*dof_displs),&dof_displs);CHKERRQ(ierr); 13023425bc38SStefano Zampini ierr = ISLocalToGlobalMappingApply(matis->mapping,dual_size,aux_local_numbering_1,aux_global_numbering);CHKERRQ(ierr); 13033425bc38SStefano Zampini ierr = MPI_Gather(&dual_size,1,MPIU_INT,dof_sizes,1,MPIU_INT,0,comm);CHKERRQ(ierr); 13043425bc38SStefano Zampini sum_dof_sizes=0; 13053425bc38SStefano Zampini if ( rank == 0 ) { 13063425bc38SStefano Zampini dof_displs[0]=0; 13073425bc38SStefano Zampini sum_dof_sizes=dual_size; 13083425bc38SStefano Zampini for(i=1;i<nprocs;i++) { 13093425bc38SStefano Zampini dof_displs[i] = dof_displs[i-1]+dof_sizes[i-1]; 13103425bc38SStefano Zampini sum_dof_sizes += dof_sizes[i]; 13113425bc38SStefano Zampini } 13123425bc38SStefano Zampini } 13133425bc38SStefano Zampini for(i=0;i<dual_size;i++) { 13143425bc38SStefano Zampini aux_global_numbering_mpi[i]=(PetscMPIInt)aux_global_numbering[i]; 13153425bc38SStefano Zampini } 13163425bc38SStefano Zampini ierr = PetscMalloc(sum_dof_sizes*sizeof(*all_aux_global_numbering_mpi_1),&all_aux_global_numbering_mpi_1);CHKERRQ(ierr); 13173425bc38SStefano Zampini ierr = PetscMalloc(sum_dof_sizes*sizeof(*all_aux_global_numbering_mpi_2),&all_aux_global_numbering_mpi_2);CHKERRQ(ierr); 13183425bc38SStefano Zampini ierr = MPI_Gatherv(aux_global_numbering_mpi,dual_size,MPIU_INT,all_aux_global_numbering_mpi_1,dof_sizes,dof_displs,MPIU_INT,0,comm);CHKERRQ(ierr); 13193425bc38SStefano Zampini ierr = 
MPI_Gatherv(aux_local_numbering_2,dual_size,MPIU_INT,all_aux_global_numbering_mpi_2,dof_sizes,dof_displs,MPIU_INT,0,comm);CHKERRQ(ierr); 13203425bc38SStefano Zampini 13213425bc38SStefano Zampini ierr = PetscMalloc(fetidpmat_ctx->n_lambda*sizeof(*global_dofs_numbering),&global_dofs_numbering);CHKERRQ(ierr); 13223425bc38SStefano Zampini if( rank == 0 ) { 13233425bc38SStefano Zampini ierr = PetscSortMPIIntWithArray(sum_dof_sizes,all_aux_global_numbering_mpi_1,all_aux_global_numbering_mpi_2);CHKERRQ(ierr); 13243425bc38SStefano Zampini j=-1; 13253425bc38SStefano Zampini partial_sum = 0; 13263425bc38SStefano Zampini for(i=0;i<sum_dof_sizes;i++) { 13273425bc38SStefano Zampini if(j != all_aux_global_numbering_mpi_1[i] ) { 13283425bc38SStefano Zampini j=all_aux_global_numbering_mpi_1[i]; 13293425bc38SStefano Zampini for(k=0;k<all_aux_global_numbering_mpi_2[i];k++) { 13303425bc38SStefano Zampini global_dofs_numbering[partial_sum+k]=all_aux_global_numbering_mpi_1[i]; 13313425bc38SStefano Zampini } 13323425bc38SStefano Zampini partial_sum += all_aux_global_numbering_mpi_2[i]; 13333425bc38SStefano Zampini } 13343425bc38SStefano Zampini } 13353425bc38SStefano Zampini /* printf("Partial sum for global dofs %d should be %d\n",partial_sum,fetidpmat_ctx->n_lambda); */ 13363425bc38SStefano Zampini } 13373425bc38SStefano Zampini ierr = MPI_Bcast(global_dofs_numbering,fetidpmat_ctx->n_lambda,MPIU_INT,0,comm);CHKERRQ(ierr); 13383425bc38SStefano Zampini 13393425bc38SStefano Zampini /* init data for scaling factors exchange */ 13403425bc38SStefano Zampini partial_sum = 0; 13413425bc38SStefano Zampini j = 0; 13423425bc38SStefano Zampini ierr = PetscMalloc( pcis->n_neigh*sizeof(PetscInt),&ptrs_buffer);CHKERRQ(ierr); 13433425bc38SStefano Zampini ierr = PetscMalloc( (pcis->n_neigh-1)*sizeof(MPI_Request),&send_reqs);CHKERRQ(ierr); 13443425bc38SStefano Zampini ierr = PetscMalloc( (pcis->n_neigh-1)*sizeof(MPI_Request),&recv_reqs);CHKERRQ(ierr); 13453425bc38SStefano Zampini ierr = PetscMalloc( 
pcis->n*sizeof(PetscScalar*),&all_factors);CHKERRQ(ierr); 13463425bc38SStefano Zampini ptrs_buffer[0]=0; 13473425bc38SStefano Zampini for(i=1;i<pcis->n_neigh;i++) { 13483425bc38SStefano Zampini partial_sum += pcis->n_shared[i]; 13493425bc38SStefano Zampini ptrs_buffer[i] = ptrs_buffer[i-1]+pcis->n_shared[i]; 13503425bc38SStefano Zampini } 13513425bc38SStefano Zampini ierr = PetscMalloc( partial_sum*sizeof(PetscScalar),&send_buffer);CHKERRQ(ierr); 13523425bc38SStefano Zampini ierr = PetscMalloc( partial_sum*sizeof(PetscScalar),&recv_buffer);CHKERRQ(ierr); 13533425bc38SStefano Zampini ierr = PetscMalloc( partial_sum*sizeof(PetscScalar),&all_factors[0]);CHKERRQ(ierr); 13543425bc38SStefano Zampini for(i=0;i<pcis->n-1;i++) { 13553425bc38SStefano Zampini j = mat_graph->count[i]; 13563425bc38SStefano Zampini if(j>0) { 13573425bc38SStefano Zampini k = (mat_graph->neighbours_set[i][0] == -1 ? 1 : 0); 13583425bc38SStefano Zampini j = j - k; 13593425bc38SStefano Zampini } 13603425bc38SStefano Zampini all_factors[i+1]=all_factors[i]+j; 13613425bc38SStefano Zampini } 13623425bc38SStefano Zampini /* scatter B scaling to N vec */ 13633425bc38SStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->D,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 13643425bc38SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->D,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 13653425bc38SStefano Zampini /* communications */ 13663425bc38SStefano Zampini k = 0; 13673425bc38SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 13683425bc38SStefano Zampini for(i=1;i<pcis->n_neigh;i++) { 13693425bc38SStefano Zampini for(j=0;j<pcis->n_shared[i];j++) { 13703425bc38SStefano Zampini send_buffer[ptrs_buffer[i-1]+j]=array[pcis->shared[i][j]]; 13713425bc38SStefano Zampini } 13723425bc38SStefano Zampini j = ptrs_buffer[i]-ptrs_buffer[i-1]; 13733425bc38SStefano Zampini ierr = 
MPI_Isend(&send_buffer[ptrs_buffer[i-1]],j,MPIU_SCALAR,pcis->neigh[i],0,comm,&send_reqs[k]);CHKERRQ(ierr); 13743425bc38SStefano Zampini ierr = MPI_Irecv(&recv_buffer[ptrs_buffer[i-1]],j,MPIU_SCALAR,pcis->neigh[i],0,comm,&recv_reqs[k]);CHKERRQ(ierr); 13753425bc38SStefano Zampini k++; 13763425bc38SStefano Zampini } 13773425bc38SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 13783425bc38SStefano Zampini ierr = MPI_Waitall(k,recv_reqs,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 13793425bc38SStefano Zampini ierr = MPI_Waitall(k,send_reqs,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 13803425bc38SStefano Zampini /* put values in correct places */ 13813425bc38SStefano Zampini for(i=1;i<pcis->n_neigh;i++) { 13823425bc38SStefano Zampini for(j=0;j<pcis->n_shared[i];j++) { 13833425bc38SStefano Zampini k = pcis->shared[i][j]; 13843425bc38SStefano Zampini neigh_position = 0; 13853425bc38SStefano Zampini while(mat_graph->neighbours_set[k][neigh_position] != pcis->neigh[i]) {neigh_position++;} 13863425bc38SStefano Zampini s = (mat_graph->neighbours_set[k][0] == -1 ? 
1 : 0); 13873425bc38SStefano Zampini neigh_position = neigh_position - s; 13883425bc38SStefano Zampini all_factors[k][neigh_position]=recv_buffer[ptrs_buffer[i-1]+j]; 13893425bc38SStefano Zampini } 13903425bc38SStefano Zampini } 13913425bc38SStefano Zampini ierr = PetscFree(send_reqs);CHKERRQ(ierr); 13923425bc38SStefano Zampini ierr = PetscFree(recv_reqs);CHKERRQ(ierr); 13933425bc38SStefano Zampini ierr = PetscFree(send_buffer);CHKERRQ(ierr); 13943425bc38SStefano Zampini ierr = PetscFree(recv_buffer);CHKERRQ(ierr); 13953425bc38SStefano Zampini ierr = PetscFree(ptrs_buffer);CHKERRQ(ierr); 13963425bc38SStefano Zampini 13973425bc38SStefano Zampini /* Compute B and B_delta (local actions) */ 13983425bc38SStefano Zampini ierr = PetscMalloc(pcis->n_neigh*sizeof(*aux_sums),&aux_sums);CHKERRQ(ierr); 13993425bc38SStefano Zampini ierr = PetscMalloc(n_local_lambda*sizeof(*l2g_indices),&l2g_indices);CHKERRQ(ierr); 14003425bc38SStefano Zampini ierr = PetscMalloc(n_local_lambda*sizeof(*vals_B_delta),&vals_B_delta);CHKERRQ(ierr); 14013425bc38SStefano Zampini ierr = PetscMalloc(n_local_lambda*sizeof(*cols_B_delta),&cols_B_delta);CHKERRQ(ierr); 14023425bc38SStefano Zampini ierr = PetscMalloc(n_local_lambda*sizeof(*scaling_factors),&scaling_factors);CHKERRQ(ierr); 14033425bc38SStefano Zampini n_global_lambda=0; 14043425bc38SStefano Zampini partial_sum=0; 14053425bc38SStefano Zampini for(i=0;i<dual_size;i++) { 14063425bc38SStefano Zampini while( global_dofs_numbering[n_global_lambda] != aux_global_numbering_mpi[i] ) { n_global_lambda++; } 14073425bc38SStefano Zampini j = mat_graph->count[aux_local_numbering_1[i]]; 14083425bc38SStefano Zampini k = (mat_graph->neighbours_set[aux_local_numbering_1[i]][0] == -1 ? 
1 : 0); 14093425bc38SStefano Zampini j = j - k; 14103425bc38SStefano Zampini aux_sums[0]=0; 14113425bc38SStefano Zampini for(s=1;s<j;s++) { 14123425bc38SStefano Zampini aux_sums[s]=aux_sums[s-1]+j-s+1; 14133425bc38SStefano Zampini } 14143425bc38SStefano Zampini array = all_factors[aux_local_numbering_1[i]]; 14153425bc38SStefano Zampini n_neg_values = 0; 14163425bc38SStefano Zampini while(n_neg_values < j && mat_graph->neighbours_set[aux_local_numbering_1[i]][n_neg_values+k] < rank) {n_neg_values++;} 14173425bc38SStefano Zampini n_pos_values = j - n_neg_values; 14183425bc38SStefano Zampini if(fully_redundant) { 14193425bc38SStefano Zampini for(s=0;s<n_neg_values;s++) { 14203425bc38SStefano Zampini l2g_indices [partial_sum+s]=aux_sums[s]+n_neg_values-s-1+n_global_lambda; 14213425bc38SStefano Zampini cols_B_delta [partial_sum+s]=dual_dofs_boundary_indices[i]; 14223425bc38SStefano Zampini vals_B_delta [partial_sum+s]=-1.0; 14233425bc38SStefano Zampini scaling_factors[partial_sum+s]=array[s]; 14243425bc38SStefano Zampini } 14253425bc38SStefano Zampini for(s=0;s<n_pos_values;s++) { 14263425bc38SStefano Zampini l2g_indices [partial_sum+s+n_neg_values]=aux_sums[n_neg_values]+s+n_global_lambda; 14273425bc38SStefano Zampini cols_B_delta [partial_sum+s+n_neg_values]=dual_dofs_boundary_indices[i]; 14283425bc38SStefano Zampini vals_B_delta [partial_sum+s+n_neg_values]=1.0; 14293425bc38SStefano Zampini scaling_factors[partial_sum+s+n_neg_values]=array[s+n_neg_values]; 14303425bc38SStefano Zampini } 14313425bc38SStefano Zampini partial_sum += j; 14323425bc38SStefano Zampini } else { 14333425bc38SStefano Zampini /* l2g_indices and default cols and vals of B_delta */ 14343425bc38SStefano Zampini for(s=0;s<j;s++) { 14353425bc38SStefano Zampini l2g_indices [partial_sum+s]=n_global_lambda+s; 14363425bc38SStefano Zampini cols_B_delta [partial_sum+s]=dual_dofs_boundary_indices[i]; 14373425bc38SStefano Zampini vals_B_delta [partial_sum+s]=0.0; 14383425bc38SStefano Zampini } 
14393425bc38SStefano Zampini /* B_delta */ 14403425bc38SStefano Zampini if( n_neg_values > 0 ) { /* there's a rank next to me to the left */ 14413425bc38SStefano Zampini vals_B_delta [partial_sum+n_neg_values-1]=-1.0; 14423425bc38SStefano Zampini } 14433425bc38SStefano Zampini if ( n_neg_values < j ) { /* there's a rank next to me to the right */ 14443425bc38SStefano Zampini vals_B_delta [partial_sum+n_neg_values]=1.0; 14453425bc38SStefano Zampini } 14463425bc38SStefano Zampini /* scaling as in Klawonn-Widlund 1999*/ 14473425bc38SStefano Zampini for(s=0;s<n_neg_values;s++) { 14483425bc38SStefano Zampini scalar_value = 0.0; 14493425bc38SStefano Zampini for(k=0;k<s+1;k++) { 14503425bc38SStefano Zampini scalar_value += array[k]; 14513425bc38SStefano Zampini } 14523425bc38SStefano Zampini scalar_value = -scalar_value; 14533425bc38SStefano Zampini scaling_factors[partial_sum+s] = scalar_value; 14543425bc38SStefano Zampini } 14553425bc38SStefano Zampini for(s=0;s<n_pos_values;s++) { 14563425bc38SStefano Zampini scalar_value = 0.0; 14573425bc38SStefano Zampini for(k=s+n_neg_values;k<j;k++) { 14583425bc38SStefano Zampini scalar_value += array[k]; 14593425bc38SStefano Zampini } 14603425bc38SStefano Zampini scaling_factors[partial_sum+s+n_neg_values] = scalar_value; 14613425bc38SStefano Zampini } 14623425bc38SStefano Zampini partial_sum += j; 14633425bc38SStefano Zampini } 14643425bc38SStefano Zampini } 14653425bc38SStefano Zampini ierr = PetscFree(all_factors[0]);CHKERRQ(ierr); 14663425bc38SStefano Zampini ierr = PetscFree(all_factors);CHKERRQ(ierr); 14673425bc38SStefano Zampini /* printf("I found %d local lambda dofs when numbering them (should be %d)\n",partial_sum,n_local_lambda); */ 14683425bc38SStefano Zampini ierr = ISCreateGeneral(comm,n_local_lambda,l2g_indices,PETSC_OWN_POINTER,&IS_l2g_lambda);CHKERRQ(ierr); 14693425bc38SStefano Zampini ierr = VecScatterCreate(fetidpmat_ctx->lambda_local,(IS)0,lambda_global,IS_l2g_lambda,&fetidpmat_ctx->l2g_lambda);CHKERRQ(ierr); 
14703425bc38SStefano Zampini 14713425bc38SStefano Zampini /* Create local part of B_delta */ 14723425bc38SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&fetidpmat_ctx->B_delta); 14733425bc38SStefano Zampini ierr = MatSetSizes(fetidpmat_ctx->B_delta,n_local_lambda,pcis->n_B,n_local_lambda,pcis->n_B);CHKERRQ(ierr); 14743425bc38SStefano Zampini ierr = MatSetType(fetidpmat_ctx->B_delta,MATSEQAIJ);CHKERRQ(ierr); 14753425bc38SStefano Zampini ierr = MatSeqAIJSetPreallocation(fetidpmat_ctx->B_delta,1,PETSC_NULL);CHKERRQ(ierr); 14763425bc38SStefano Zampini ierr = MatSetOption(fetidpmat_ctx->B_delta,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr); 14773425bc38SStefano Zampini for(i=0;i<n_local_lambda;i++) { 14783425bc38SStefano Zampini ierr = MatSetValue(fetidpmat_ctx->B_delta,i,cols_B_delta[i],vals_B_delta[i],INSERT_VALUES);CHKERRQ(ierr); 14793425bc38SStefano Zampini } 14803425bc38SStefano Zampini ierr = MatAssemblyBegin(fetidpmat_ctx->B_delta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 14813425bc38SStefano Zampini ierr = MatAssemblyEnd (fetidpmat_ctx->B_delta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 14823425bc38SStefano Zampini 14833425bc38SStefano Zampini if(fully_redundant) { 14843425bc38SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&ScalingMat); 14853425bc38SStefano Zampini ierr = MatSetSizes(ScalingMat,n_local_lambda,n_local_lambda,n_local_lambda,n_local_lambda);CHKERRQ(ierr); 14863425bc38SStefano Zampini ierr = MatSetType(ScalingMat,MATSEQAIJ);CHKERRQ(ierr); 14873425bc38SStefano Zampini ierr = MatSeqAIJSetPreallocation(ScalingMat,1,PETSC_NULL);CHKERRQ(ierr); 14883425bc38SStefano Zampini for(i=0;i<n_local_lambda;i++) { 14893425bc38SStefano Zampini ierr = MatSetValue(ScalingMat,i,i,scaling_factors[i],INSERT_VALUES);CHKERRQ(ierr); 14903425bc38SStefano Zampini } 14913425bc38SStefano Zampini ierr = MatAssemblyBegin(ScalingMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 14923425bc38SStefano Zampini ierr = MatAssemblyEnd (ScalingMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 14933425bc38SStefano 
Zampini ierr = MatMatMult(ScalingMat,fetidpmat_ctx->B_delta,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&fetidpmat_ctx->B_Ddelta);CHKERRQ(ierr); 14943425bc38SStefano Zampini ierr = MatDestroy(&ScalingMat);CHKERRQ(ierr); 14953425bc38SStefano Zampini } else { 14963425bc38SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&fetidpmat_ctx->B_Ddelta); 14973425bc38SStefano Zampini ierr = MatSetSizes(fetidpmat_ctx->B_Ddelta,n_local_lambda,pcis->n_B,n_local_lambda,pcis->n_B);CHKERRQ(ierr); 14983425bc38SStefano Zampini ierr = MatSetType(fetidpmat_ctx->B_Ddelta,MATSEQAIJ);CHKERRQ(ierr); 14993425bc38SStefano Zampini ierr = MatSeqAIJSetPreallocation(fetidpmat_ctx->B_Ddelta,1,PETSC_NULL);CHKERRQ(ierr); 15003425bc38SStefano Zampini for(i=0;i<n_local_lambda;i++) { 15013425bc38SStefano Zampini ierr = MatSetValue(fetidpmat_ctx->B_Ddelta,i,cols_B_delta[i],scaling_factors[i],INSERT_VALUES);CHKERRQ(ierr); 15023425bc38SStefano Zampini } 15033425bc38SStefano Zampini ierr = MatAssemblyBegin(fetidpmat_ctx->B_Ddelta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 15043425bc38SStefano Zampini ierr = MatAssemblyEnd (fetidpmat_ctx->B_Ddelta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 15053425bc38SStefano Zampini } 15063425bc38SStefano Zampini 15073425bc38SStefano Zampini /* Create some vectors needed by fetidp */ 15083425bc38SStefano Zampini ierr = VecDuplicate(pcis->vec1_B,&fetidpmat_ctx->temp_solution_B);CHKERRQ(ierr); 15093425bc38SStefano Zampini ierr = VecDuplicate(pcis->vec1_D,&fetidpmat_ctx->temp_solution_D);CHKERRQ(ierr); 15103425bc38SStefano Zampini 15113425bc38SStefano Zampini test_fetidp = PETSC_FALSE; 15123425bc38SStefano Zampini ierr = PetscOptionsGetBool(PETSC_NULL,"-fetidp_check",&test_fetidp,PETSC_NULL);CHKERRQ(ierr); 15133425bc38SStefano Zampini 15143425bc38SStefano Zampini if(test_fetidp) { 15153425bc38SStefano Zampini 15163425bc38SStefano Zampini ierr = PetscViewerASCIIGetStdout(((PetscObject)(fetidpmat_ctx->pc))->comm,&viewer);CHKERRQ(ierr); 15173425bc38SStefano Zampini ierr = 
PetscViewerASCIISynchronizedAllow(viewer,PETSC_TRUE);CHKERRQ(ierr); 15183425bc38SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"----------FETI_DP TESTS--------------\n");CHKERRQ(ierr); 15193425bc38SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"All tests should return zero!\n");CHKERRQ(ierr); 15203425bc38SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"FETIDP MAT context in the ");CHKERRQ(ierr); 15213425bc38SStefano Zampini if(fully_redundant) { 15223425bc38SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"fully redundant case for lagrange multipliers.\n");CHKERRQ(ierr); 15233425bc38SStefano Zampini } else { 15243425bc38SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Non-fully redundant case for lagrange multiplier.\n");CHKERRQ(ierr); 15253425bc38SStefano Zampini } 15263425bc38SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 15273425bc38SStefano Zampini 15283425bc38SStefano Zampini /******************************************************************/ 15293425bc38SStefano Zampini /* TEST A/B: Test numbering of global lambda dofs */ 15303425bc38SStefano Zampini /******************************************************************/ 15313425bc38SStefano Zampini 15323425bc38SStefano Zampini ierr = VecDuplicate(fetidpmat_ctx->lambda_local,&test_vec);CHKERRQ(ierr); 15333425bc38SStefano Zampini ierr = VecSet(lambda_global,1.0);CHKERRQ(ierr); 15343425bc38SStefano Zampini ierr = VecSet(test_vec,1.0);CHKERRQ(ierr); 15353425bc38SStefano Zampini ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 15363425bc38SStefano Zampini ierr = VecScatterEnd (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 15373425bc38SStefano Zampini scalar_value = -1.0; 15383425bc38SStefano Zampini ierr = VecAXPY(test_vec,scalar_value,fetidpmat_ctx->lambda_local);CHKERRQ(ierr); 15393425bc38SStefano Zampini ierr = 
VecNorm(test_vec,NORM_INFINITY,&scalar_value);CHKERRQ(ierr); 15403425bc38SStefano Zampini ierr = VecDestroy(&test_vec);CHKERRQ(ierr); 15413425bc38SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"A[%04d]: CHECK glob to loc: % 1.14e\n",rank,scalar_value);CHKERRQ(ierr); 15423425bc38SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 15433425bc38SStefano Zampini if(fully_redundant) { 15443425bc38SStefano Zampini ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr); 15453425bc38SStefano Zampini ierr = VecSet(fetidpmat_ctx->lambda_local,0.5);CHKERRQ(ierr); 15463425bc38SStefano Zampini ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 15473425bc38SStefano Zampini ierr = VecScatterEnd (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 15483425bc38SStefano Zampini ierr = VecSum(lambda_global,&scalar_value);CHKERRQ(ierr); 15493425bc38SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"B[%04d]: CHECK loc to glob: % 1.14e\n",rank,scalar_value-fetidpmat_ctx->n_lambda);CHKERRQ(ierr); 15503425bc38SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 15513425bc38SStefano Zampini } 15523425bc38SStefano Zampini 15533425bc38SStefano Zampini /******************************************************************/ 15543425bc38SStefano Zampini /* TEST C: It should holds B_delta*w=0, w\in\widehat{W} */ 15553425bc38SStefano Zampini /* This is the meaning of the B matrix */ 15563425bc38SStefano Zampini /******************************************************************/ 15573425bc38SStefano Zampini 15583425bc38SStefano Zampini ierr = VecSetRandom(pcis->vec1_N,PETSC_NULL);CHKERRQ(ierr); 15593425bc38SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 15603425bc38SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 
15613425bc38SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 15623425bc38SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 15633425bc38SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 15643425bc38SStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 15653425bc38SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 15663425bc38SStefano Zampini /* Action of B_delta */ 15673425bc38SStefano Zampini ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr); 15683425bc38SStefano Zampini ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr); 15693425bc38SStefano Zampini ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 15703425bc38SStefano Zampini ierr = VecScatterEnd (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 15713425bc38SStefano Zampini ierr = VecNorm(lambda_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr); 15723425bc38SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"C[coll]: CHECK infty norm of B_delta*w (w continuous): % 1.14e\n",scalar_value);CHKERRQ(ierr); 15733425bc38SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 15743425bc38SStefano Zampini 15753425bc38SStefano Zampini /******************************************************************/ 15763425bc38SStefano Zampini /* TEST D: It should holds E_Dw = w - P_Dw w\in\widetilde{W} */ 15773425bc38SStefano Zampini /* E_D = R_D^TR */ 15783425bc38SStefano Zampini /* P_D = B_{D,delta}^T B_{delta} */ 15793425bc38SStefano Zampini /* eq.44 Mandel Tezaur and 
Dohrmann 2005 */ 15803425bc38SStefano Zampini /******************************************************************/ 15813425bc38SStefano Zampini 15823425bc38SStefano Zampini /* compute a random vector in \widetilde{W} */ 15833425bc38SStefano Zampini ierr = VecSetRandom(pcis->vec1_N,PETSC_NULL);CHKERRQ(ierr); 15843425bc38SStefano Zampini scalar_value = 0.0; /* set zero at vertices */ 15853425bc38SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 15863425bc38SStefano Zampini for(i=0;i<n_vertices;i++) { array[vertex_indices[i]]=scalar_value; } 15873425bc38SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 15883425bc38SStefano Zampini /* store w for final comparison */ 15893425bc38SStefano Zampini ierr = VecDuplicate(pcis->vec1_B,&test_vec);CHKERRQ(ierr); 15903425bc38SStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,test_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 15913425bc38SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_N,test_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 15923425bc38SStefano Zampini 15933425bc38SStefano Zampini /* Jump operator P_D : results stored in pcis->vec1_B */ 15943425bc38SStefano Zampini 15953425bc38SStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 15963425bc38SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 15973425bc38SStefano Zampini /* Action of B_delta */ 15983425bc38SStefano Zampini ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr); 15993425bc38SStefano Zampini ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr); 16003425bc38SStefano Zampini ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 16013425bc38SStefano Zampini ierr = VecScatterEnd 
(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 16023425bc38SStefano Zampini /* Action of B_Ddelta^T */ 16033425bc38SStefano Zampini ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 16043425bc38SStefano Zampini ierr = VecScatterEnd (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 16053425bc38SStefano Zampini ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr); 16063425bc38SStefano Zampini 16073425bc38SStefano Zampini /* Average operator E_D : results stored in pcis->vec2_B */ 16083425bc38SStefano Zampini 16093425bc38SStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 16103425bc38SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 16113425bc38SStefano Zampini ierr = VecPointwiseMult(pcis->vec2_B,pcis->D,pcis->vec2_B);CHKERRQ(ierr); 16123425bc38SStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec2_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 16133425bc38SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec2_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 16143425bc38SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 16153425bc38SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 16163425bc38SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 16173425bc38SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 16183425bc38SStefano Zampini ierr = VecScatterEnd 
(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 16193425bc38SStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 16203425bc38SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 16213425bc38SStefano Zampini 16223425bc38SStefano Zampini /* test E_D=I-P_D */ 16233425bc38SStefano Zampini scalar_value = 1.0; 16243425bc38SStefano Zampini ierr = VecAXPY(pcis->vec1_B,scalar_value,pcis->vec2_B);CHKERRQ(ierr); 16253425bc38SStefano Zampini scalar_value = -1.0; 16263425bc38SStefano Zampini ierr = VecAXPY(pcis->vec1_B,scalar_value,test_vec);CHKERRQ(ierr); 16273425bc38SStefano Zampini ierr = VecNorm(pcis->vec1_B,NORM_INFINITY,&scalar_value);CHKERRQ(ierr); 16283425bc38SStefano Zampini ierr = VecDestroy(&test_vec);CHKERRQ(ierr); 16293425bc38SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"D[%04d] CHECK infty norm of E_D + P_D - I: % 1.14e\n",rank,scalar_value);CHKERRQ(ierr); 16303425bc38SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 16313425bc38SStefano Zampini 16323425bc38SStefano Zampini /******************************************************************/ 16333425bc38SStefano Zampini /* TEST E: It should holds R_D^TP_Dw=0 w\in\widetilde{W} */ 16343425bc38SStefano Zampini /* eq.48 Mandel Tezaur and Dohrmann 2005 */ 16353425bc38SStefano Zampini /******************************************************************/ 16363425bc38SStefano Zampini 16373425bc38SStefano Zampini ierr = VecSetRandom(pcis->vec1_N,PETSC_NULL);CHKERRQ(ierr); 16383425bc38SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 16393425bc38SStefano Zampini scalar_value = 0.0; /* set zero at vertices */ 16403425bc38SStefano Zampini for(i=0;i<n_vertices;i++) { array[vertex_indices[i]]=scalar_value; } 16413425bc38SStefano Zampini ierr = 
VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 16423425bc38SStefano Zampini 16433425bc38SStefano Zampini /* Jump operator P_D : results stored in pcis->vec1_B */ 16443425bc38SStefano Zampini 16453425bc38SStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 16463425bc38SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 16473425bc38SStefano Zampini /* Action of B_delta */ 16483425bc38SStefano Zampini ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr); 16493425bc38SStefano Zampini ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr); 16503425bc38SStefano Zampini ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 16513425bc38SStefano Zampini ierr = VecScatterEnd (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 16523425bc38SStefano Zampini /* Action of B_Ddelta^T */ 16533425bc38SStefano Zampini ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 16543425bc38SStefano Zampini ierr = VecScatterEnd (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 16553425bc38SStefano Zampini ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr); 16563425bc38SStefano Zampini /* diagonal scaling */ 16573425bc38SStefano Zampini ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr); 16583425bc38SStefano Zampini /* sum on the interface */ 16593425bc38SStefano Zampini ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr); 16603425bc38SStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 
16613425bc38SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 16623425bc38SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 16633425bc38SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 16643425bc38SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 16653425bc38SStefano Zampini ierr = VecNorm(pcis->vec1_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr); 16663425bc38SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"E[coll]: CHECK infty norm of R^T_D P_D: % 1.14e\n",scalar_value);CHKERRQ(ierr); 16673425bc38SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 16683425bc38SStefano Zampini 16693425bc38SStefano Zampini if(!fully_redundant) { 16703425bc38SStefano Zampini /******************************************************************/ 16713425bc38SStefano Zampini /* TEST F: It should holds B_{delta}B^T_{D,delta}=I */ 16723425bc38SStefano Zampini /* Corollary thm 14 Mandel Tezaur and Dohrmann 2005 */ 16733425bc38SStefano Zampini /******************************************************************/ 16743425bc38SStefano Zampini ierr = VecDuplicate(lambda_global,&test_vec);CHKERRQ(ierr); 16753425bc38SStefano Zampini ierr = VecSetRandom(lambda_global,PETSC_NULL);CHKERRQ(ierr); 16763425bc38SStefano Zampini /* Action of B_Ddelta^T */ 16773425bc38SStefano Zampini ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 16783425bc38SStefano Zampini ierr = VecScatterEnd (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 16793425bc38SStefano Zampini ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr); 16803425bc38SStefano Zampini /* 
Action of B_delta */ 16813425bc38SStefano Zampini ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr); 16823425bc38SStefano Zampini ierr = VecSet(test_vec,0.0);CHKERRQ(ierr); 16833425bc38SStefano Zampini ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,test_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 16843425bc38SStefano Zampini ierr = VecScatterEnd (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,test_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 16853425bc38SStefano Zampini scalar_value = -1.0; 16863425bc38SStefano Zampini ierr = VecAXPY(lambda_global,scalar_value,test_vec);CHKERRQ(ierr); 16873425bc38SStefano Zampini ierr = VecNorm(lambda_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr); 16883425bc38SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"E[coll]: CHECK infty norm of P^T_D - I: % 1.14e\n",scalar_value);CHKERRQ(ierr); 16893425bc38SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 16903425bc38SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 16913425bc38SStefano Zampini ierr = VecDestroy(&test_vec);CHKERRQ(ierr); 16923425bc38SStefano Zampini } 16933425bc38SStefano Zampini } 16943425bc38SStefano Zampini /* final cleanup */ 16953425bc38SStefano Zampini ierr = PetscFree(dual_dofs_boundary_indices);CHKERRQ(ierr); 16963425bc38SStefano Zampini ierr = PetscFree(vertex_indices);CHKERRQ(ierr); 16973425bc38SStefano Zampini ierr = PetscFree(aux_local_numbering_1);CHKERRQ(ierr); 16983425bc38SStefano Zampini ierr = PetscFree(aux_local_numbering_2);CHKERRQ(ierr); 16993425bc38SStefano Zampini ierr = PetscFree(aux_global_numbering);CHKERRQ(ierr); 17003425bc38SStefano Zampini ierr = PetscFree(aux_global_numbering_mpi);CHKERRQ(ierr); 17013425bc38SStefano Zampini ierr = PetscFree(dof_sizes);CHKERRQ(ierr); 17023425bc38SStefano Zampini ierr = PetscFree(dof_displs);CHKERRQ(ierr); 17033425bc38SStefano Zampini ierr = 
PetscFree(all_aux_global_numbering_mpi_1);CHKERRQ(ierr); 17043425bc38SStefano Zampini ierr = PetscFree(all_aux_global_numbering_mpi_2);CHKERRQ(ierr); 17053425bc38SStefano Zampini ierr = PetscFree(global_dofs_numbering);CHKERRQ(ierr); 17063425bc38SStefano Zampini ierr = PetscFree(aux_sums);CHKERRQ(ierr); 17073425bc38SStefano Zampini ierr = PetscFree(cols_B_delta);CHKERRQ(ierr); 17083425bc38SStefano Zampini ierr = PetscFree(vals_B_delta);CHKERRQ(ierr); 17093425bc38SStefano Zampini ierr = PetscFree(scaling_factors);CHKERRQ(ierr); 17103425bc38SStefano Zampini ierr = VecDestroy(&lambda_global);CHKERRQ(ierr); 17113425bc38SStefano Zampini ierr = ISDestroy(&IS_l2g_lambda);CHKERRQ(ierr); 17123425bc38SStefano Zampini 17133425bc38SStefano Zampini PetscFunctionReturn(0); 17143425bc38SStefano Zampini } 17153425bc38SStefano Zampini 17163425bc38SStefano Zampini #undef __FUNCT__ 17173425bc38SStefano Zampini #define __FUNCT__ "PCBDDCSetupFETIDPPCContext" 17183425bc38SStefano Zampini static PetscErrorCode PCBDDCSetupFETIDPPCContext(Mat fetimat, FETIDPPC_ctx *fetidppc_ctx) 17193425bc38SStefano Zampini { 17203425bc38SStefano Zampini FETIDPMat_ctx *mat_ctx; 17213425bc38SStefano Zampini PetscErrorCode ierr; 17223425bc38SStefano Zampini 17233425bc38SStefano Zampini PetscFunctionBegin; 17243425bc38SStefano Zampini ierr = MatShellGetContext(fetimat,&mat_ctx);CHKERRQ(ierr); 17253425bc38SStefano Zampini /* get references from objects created when setting up feti mat context */ 17263425bc38SStefano Zampini ierr = PetscObjectReference((PetscObject)mat_ctx->lambda_local);CHKERRQ(ierr); 17273425bc38SStefano Zampini fetidppc_ctx->lambda_local = mat_ctx->lambda_local; 17283425bc38SStefano Zampini ierr = PetscObjectReference((PetscObject)mat_ctx->B_Ddelta);CHKERRQ(ierr); 17293425bc38SStefano Zampini fetidppc_ctx->B_Ddelta = mat_ctx->B_Ddelta; 17303425bc38SStefano Zampini ierr = PetscObjectReference((PetscObject)mat_ctx->l2g_lambda);CHKERRQ(ierr); 17313425bc38SStefano Zampini 
fetidppc_ctx->l2g_lambda = mat_ctx->l2g_lambda; 17323425bc38SStefano Zampini PetscFunctionReturn(0); 17333425bc38SStefano Zampini } 17343425bc38SStefano Zampini 17353425bc38SStefano Zampini #undef __FUNCT__ 17363425bc38SStefano Zampini #define __FUNCT__ "FETIDPMatMult" 17373425bc38SStefano Zampini static PetscErrorCode FETIDPMatMult(Mat fetimat, Vec x, Vec y) 17383425bc38SStefano Zampini { 17393425bc38SStefano Zampini FETIDPMat_ctx *mat_ctx; 17403425bc38SStefano Zampini PC_IS *pcis; 17413425bc38SStefano Zampini PetscErrorCode ierr; 17423425bc38SStefano Zampini 17433425bc38SStefano Zampini PetscFunctionBegin; 17443425bc38SStefano Zampini ierr = MatShellGetContext(fetimat,&mat_ctx);CHKERRQ(ierr); 17453425bc38SStefano Zampini pcis = (PC_IS*)mat_ctx->pc->data; 17463425bc38SStefano Zampini /* Application of B_delta^T */ 17473425bc38SStefano Zampini ierr = VecScatterBegin(mat_ctx->l2g_lambda,x,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 17483425bc38SStefano Zampini ierr = VecScatterEnd(mat_ctx->l2g_lambda,x,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 17493425bc38SStefano Zampini ierr = MatMultTranspose(mat_ctx->B_delta,mat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr); 17503425bc38SStefano Zampini /* Application of \widetilde{S}^-1 */ 17513425bc38SStefano Zampini ierr = VecSet(pcis->vec1_D,0.0);CHKERRQ(ierr); 17523425bc38SStefano Zampini ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr); 17533425bc38SStefano Zampini /* Application of B_delta */ 17543425bc38SStefano Zampini ierr = MatMult(mat_ctx->B_delta,pcis->vec1_B,mat_ctx->lambda_local);CHKERRQ(ierr); 17553425bc38SStefano Zampini ierr = VecSet(y,0.0);CHKERRQ(ierr); 17563425bc38SStefano Zampini ierr = VecScatterBegin(mat_ctx->l2g_lambda,mat_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 17573425bc38SStefano Zampini ierr = VecScatterEnd(mat_ctx->l2g_lambda,mat_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 
17583425bc38SStefano Zampini PetscFunctionReturn(0); 17593425bc38SStefano Zampini } 17603425bc38SStefano Zampini 17613425bc38SStefano Zampini #undef __FUNCT__ 17623425bc38SStefano Zampini #define __FUNCT__ "FETIDPPCApply" 17633425bc38SStefano Zampini static PetscErrorCode FETIDPPCApply(PC fetipc, Vec x, Vec y) 17643425bc38SStefano Zampini { 17653425bc38SStefano Zampini FETIDPPC_ctx *pc_ctx; 17663425bc38SStefano Zampini PC_IS *pcis; 17673425bc38SStefano Zampini PetscErrorCode ierr; 17683425bc38SStefano Zampini 17693425bc38SStefano Zampini PetscFunctionBegin; 17703425bc38SStefano Zampini ierr = PCShellGetContext(fetipc,(void**)&pc_ctx); 17713425bc38SStefano Zampini pcis = (PC_IS*)pc_ctx->pc->data; 17723425bc38SStefano Zampini /* Application of B_Ddelta^T */ 17733425bc38SStefano Zampini ierr = VecScatterBegin(pc_ctx->l2g_lambda,x,pc_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 17743425bc38SStefano Zampini ierr = VecScatterEnd(pc_ctx->l2g_lambda,x,pc_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 17753425bc38SStefano Zampini ierr = VecSet(pcis->vec2_B,0.0);CHKERRQ(ierr); 17763425bc38SStefano Zampini ierr = MatMultTranspose(pc_ctx->B_Ddelta,pc_ctx->lambda_local,pcis->vec2_B);CHKERRQ(ierr); 17773425bc38SStefano Zampini /* Application of S */ 17783425bc38SStefano Zampini ierr = PCISApplySchur(pc_ctx->pc,pcis->vec2_B,pcis->vec1_B,(Vec)0,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr); 17793425bc38SStefano Zampini /* Application of B_Ddelta */ 17803425bc38SStefano Zampini ierr = MatMult(pc_ctx->B_Ddelta,pcis->vec1_B,pc_ctx->lambda_local);CHKERRQ(ierr); 17813425bc38SStefano Zampini ierr = VecSet(y,0.0);CHKERRQ(ierr); 17823425bc38SStefano Zampini ierr = VecScatterBegin(pc_ctx->l2g_lambda,pc_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 17833425bc38SStefano Zampini ierr = VecScatterEnd(pc_ctx->l2g_lambda,pc_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 17843425bc38SStefano Zampini PetscFunctionReturn(0); 
17853425bc38SStefano Zampini } 17863425bc38SStefano Zampini 1787da1bb401SStefano Zampini #undef __FUNCT__ 1788da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetupLocalAdjacencyGraph" 1789da1bb401SStefano Zampini static PetscErrorCode PCBDDCSetupLocalAdjacencyGraph(PC pc) 1790da1bb401SStefano Zampini { 1791da1bb401SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 1792da1bb401SStefano Zampini Mat_IS *matis = (Mat_IS*)pc->pmat->data; 1793da1bb401SStefano Zampini PetscInt nvtxs,*xadj,*adjncy; 1794da1bb401SStefano Zampini Mat mat_adj; 1795da1bb401SStefano Zampini PetscBool symmetrize_rowij=PETSC_TRUE,compressed_rowij=PETSC_FALSE,flg_row=PETSC_TRUE; 1796da1bb401SStefano Zampini PCBDDCGraph mat_graph=pcbddc->mat_graph; 1797da1bb401SStefano Zampini PetscErrorCode ierr; 1798da1bb401SStefano Zampini 1799da1bb401SStefano Zampini PetscFunctionBegin; 1800da1bb401SStefano Zampini /* get CSR adjacency from local matrix if user has not yet provided local graph using PCBDDCSetLocalAdjacencyGraph function */ 1801da1bb401SStefano Zampini if(!mat_graph->xadj) { 1802da1bb401SStefano Zampini ierr = MatConvert(matis->A,MATMPIADJ,MAT_INITIAL_MATRIX,&mat_adj);CHKERRQ(ierr); 1803da1bb401SStefano Zampini ierr = MatGetRowIJ(mat_adj,0,symmetrize_rowij,compressed_rowij,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr); 1804da1bb401SStefano Zampini if(!flg_row) { 1805da1bb401SStefano Zampini SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in MatGetRowIJ called in %s\n",__FUNCT__); 1806da1bb401SStefano Zampini } 1807da1bb401SStefano Zampini /* Get adjacency into BDDC workspace */ 1808da1bb401SStefano Zampini ierr = PCBDDCSetLocalAdjacencyGraph(pc,nvtxs,xadj,adjncy,PETSC_COPY_VALUES);CHKERRQ(ierr); 1809da1bb401SStefano Zampini ierr = MatRestoreRowIJ(mat_adj,0,symmetrize_rowij,compressed_rowij,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr); 1810da1bb401SStefano Zampini if(!flg_row) { 1811da1bb401SStefano Zampini SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in MatRestoreRowIJ called in 
%s\n",__FUNCT__); 1812da1bb401SStefano Zampini } 1813da1bb401SStefano Zampini ierr = MatDestroy(&mat_adj);CHKERRQ(ierr); 1814da1bb401SStefano Zampini } 1815da1bb401SStefano Zampini PetscFunctionReturn(0); 1816da1bb401SStefano Zampini } 1817da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */ 18180c7d97c5SJed Brown #undef __FUNCT__ 18190c7d97c5SJed Brown #define __FUNCT__ "PCBDDCApplyInterfacePreconditioner" 18202617d88aSStefano Zampini static PetscErrorCode PCBDDCApplyInterfacePreconditioner(PC pc) 18210c7d97c5SJed Brown { 18220c7d97c5SJed Brown PetscErrorCode ierr; 18230c7d97c5SJed Brown PC_BDDC* pcbddc = (PC_BDDC*)(pc->data); 18240c7d97c5SJed Brown PC_IS* pcis = (PC_IS*) (pc->data); 18253b03a366Sstefano_zampini const PetscScalar zero = 0.0; 18260c7d97c5SJed Brown 18270c7d97c5SJed Brown PetscFunctionBegin; 18280c7d97c5SJed Brown /* Application of PHI^T */ 18290c7d97c5SJed Brown ierr = MatMultTranspose(pcbddc->coarse_phi_B,pcis->vec1_B,pcbddc->vec1_P);CHKERRQ(ierr); 18300c7d97c5SJed Brown if(pcbddc->prec_type) { ierr = MatMultTransposeAdd(pcbddc->coarse_phi_D,pcis->vec1_D,pcbddc->vec1_P,pcbddc->vec1_P);CHKERRQ(ierr); } 18310c7d97c5SJed Brown 18320c7d97c5SJed Brown /* Scatter data of coarse_rhs */ 18330c7d97c5SJed Brown if(pcbddc->coarse_rhs) ierr = VecSet(pcbddc->coarse_rhs,zero);CHKERRQ(ierr); 18340c7d97c5SJed Brown ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->vec1_P,pcbddc->coarse_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 18350c7d97c5SJed Brown 18360c7d97c5SJed Brown /* Local solution on R nodes */ 18370c7d97c5SJed Brown ierr = VecSet(pcbddc->vec1_R,zero);CHKERRQ(ierr); 18380c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_B,pcis->vec1_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 18390c7d97c5SJed Brown ierr = VecScatterEnd (pcbddc->R_to_B,pcis->vec1_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 18400c7d97c5SJed Brown if(pcbddc->prec_type) { 18410c7d97c5SJed Brown 
ierr = VecScatterBegin(pcbddc->R_to_D,pcis->vec1_D,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 18420c7d97c5SJed Brown ierr = VecScatterEnd (pcbddc->R_to_D,pcis->vec1_D,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 18430c7d97c5SJed Brown } 18440c7d97c5SJed Brown ierr = PCBDDCSolveSaddlePoint(pc);CHKERRQ(ierr); 18450c7d97c5SJed Brown ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr); 18460c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec2_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 18470c7d97c5SJed Brown ierr = VecScatterEnd (pcbddc->R_to_B,pcbddc->vec2_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 18480c7d97c5SJed Brown if(pcbddc->prec_type) { 18490c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec2_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 18500c7d97c5SJed Brown ierr = VecScatterEnd (pcbddc->R_to_D,pcbddc->vec2_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 18510c7d97c5SJed Brown } 18520c7d97c5SJed Brown 18530c7d97c5SJed Brown /* Coarse solution */ 18540c7d97c5SJed Brown ierr = PCBDDCScatterCoarseDataEnd(pc,pcbddc->vec1_P,pcbddc->coarse_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 185553cdbc3dSStefano Zampini if(pcbddc->coarse_rhs) ierr = KSPSolve(pcbddc->coarse_ksp,pcbddc->coarse_rhs,pcbddc->coarse_vec);CHKERRQ(ierr); 18560c7d97c5SJed Brown ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 18570c7d97c5SJed Brown ierr = PCBDDCScatterCoarseDataEnd (pc,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 18580c7d97c5SJed Brown 18590c7d97c5SJed Brown /* Sum contributions from two levels */ 18600c7d97c5SJed Brown ierr = MatMultAdd(pcbddc->coarse_phi_B,pcbddc->vec1_P,pcis->vec1_B,pcis->vec1_B);CHKERRQ(ierr); 18610c7d97c5SJed Brown if(pcbddc->prec_type) { ierr = 
MatMultAdd(pcbddc->coarse_phi_D,pcbddc->vec1_P,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); } 18620c7d97c5SJed Brown PetscFunctionReturn(0); 18630c7d97c5SJed Brown } 18640c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 18650c7d97c5SJed Brown #undef __FUNCT__ 18660c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSolveSaddlePoint" 186753cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSolveSaddlePoint(PC pc) 18680c7d97c5SJed Brown { 18690c7d97c5SJed Brown PetscErrorCode ierr; 18700c7d97c5SJed Brown PC_BDDC* pcbddc = (PC_BDDC*)(pc->data); 18710c7d97c5SJed Brown 18720c7d97c5SJed Brown PetscFunctionBegin; 187353cdbc3dSStefano Zampini ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr); 1874534831adSStefano Zampini if(pcbddc->local_auxmat1) { 18750c7d97c5SJed Brown ierr = MatMult(pcbddc->local_auxmat1,pcbddc->vec2_R,pcbddc->vec1_C);CHKERRQ(ierr); 18760c7d97c5SJed Brown ierr = MatMultAdd(pcbddc->local_auxmat2,pcbddc->vec1_C,pcbddc->vec2_R,pcbddc->vec2_R);CHKERRQ(ierr); 18770c7d97c5SJed Brown } 18780c7d97c5SJed Brown PetscFunctionReturn(0); 18790c7d97c5SJed Brown } 18800c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 18810c7d97c5SJed Brown #undef __FUNCT__ 18820c7d97c5SJed Brown #define __FUNCT__ "PCBDDCScatterCoarseDataBegin" 188353cdbc3dSStefano Zampini static PetscErrorCode PCBDDCScatterCoarseDataBegin(PC pc,Vec vec_from, Vec vec_to, InsertMode imode, ScatterMode smode) 18840c7d97c5SJed Brown { 18850c7d97c5SJed Brown PetscErrorCode ierr; 18860c7d97c5SJed Brown PC_BDDC* pcbddc = (PC_BDDC*)(pc->data); 18870c7d97c5SJed Brown 18880c7d97c5SJed Brown PetscFunctionBegin; 18890c7d97c5SJed Brown switch(pcbddc->coarse_communications_type){ 18900c7d97c5SJed Brown case SCATTERS_BDDC: 18910c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->coarse_loc_to_glob,vec_from,vec_to,imode,smode);CHKERRQ(ierr); 18920c7d97c5SJed Brown break; 18930c7d97c5SJed Brown case 
GATHERS_BDDC: 18940c7d97c5SJed Brown break; 18950c7d97c5SJed Brown } 18960c7d97c5SJed Brown PetscFunctionReturn(0); 18970c7d97c5SJed Brown } 18980c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 18990c7d97c5SJed Brown #undef __FUNCT__ 19000c7d97c5SJed Brown #define __FUNCT__ "PCBDDCScatterCoarseDataEnd" 190153cdbc3dSStefano Zampini static PetscErrorCode PCBDDCScatterCoarseDataEnd(PC pc,Vec vec_from, Vec vec_to, InsertMode imode, ScatterMode smode) 19020c7d97c5SJed Brown { 19030c7d97c5SJed Brown PetscErrorCode ierr; 19040c7d97c5SJed Brown PC_BDDC* pcbddc = (PC_BDDC*)(pc->data); 19050c7d97c5SJed Brown PetscScalar* array_to; 19060c7d97c5SJed Brown PetscScalar* array_from; 19070c7d97c5SJed Brown MPI_Comm comm=((PetscObject)pc)->comm; 19080c7d97c5SJed Brown PetscInt i; 19090c7d97c5SJed Brown 19100c7d97c5SJed Brown PetscFunctionBegin; 19110c7d97c5SJed Brown 19120c7d97c5SJed Brown switch(pcbddc->coarse_communications_type){ 19130c7d97c5SJed Brown case SCATTERS_BDDC: 19140c7d97c5SJed Brown ierr = VecScatterEnd(pcbddc->coarse_loc_to_glob,vec_from,vec_to,imode,smode);CHKERRQ(ierr); 19150c7d97c5SJed Brown break; 19160c7d97c5SJed Brown case GATHERS_BDDC: 19170c7d97c5SJed Brown if(vec_from) VecGetArray(vec_from,&array_from); 19180c7d97c5SJed Brown if(vec_to) VecGetArray(vec_to,&array_to); 19190c7d97c5SJed Brown switch(pcbddc->coarse_problem_type){ 19200c7d97c5SJed Brown case SEQUENTIAL_BDDC: 19210c7d97c5SJed Brown if(smode == SCATTER_FORWARD) { 192253cdbc3dSStefano Zampini ierr = MPI_Gatherv(&array_from[0],pcbddc->local_primal_size,MPIU_SCALAR,&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,0,comm);CHKERRQ(ierr); 19230c7d97c5SJed Brown if(vec_to) { 19240c7d97c5SJed Brown for(i=0;i<pcbddc->replicated_primal_size;i++) 19250c7d97c5SJed Brown array_to[pcbddc->replicated_local_primal_indices[i]]+=pcbddc->replicated_local_primal_values[i]; 19260c7d97c5SJed Brown } 
19270c7d97c5SJed Brown } else { 19280c7d97c5SJed Brown if(vec_from) 19290c7d97c5SJed Brown for(i=0;i<pcbddc->replicated_primal_size;i++) 19300c7d97c5SJed Brown pcbddc->replicated_local_primal_values[i]=array_from[pcbddc->replicated_local_primal_indices[i]]; 193153cdbc3dSStefano Zampini ierr = MPI_Scatterv(&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,&array_to[0],pcbddc->local_primal_size,MPIU_SCALAR,0,comm);CHKERRQ(ierr); 19320c7d97c5SJed Brown } 19330c7d97c5SJed Brown break; 19340c7d97c5SJed Brown case REPLICATED_BDDC: 19350c7d97c5SJed Brown if(smode == SCATTER_FORWARD) { 193653cdbc3dSStefano Zampini ierr = MPI_Allgatherv(&array_from[0],pcbddc->local_primal_size,MPIU_SCALAR,&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,comm);CHKERRQ(ierr); 19370c7d97c5SJed Brown for(i=0;i<pcbddc->replicated_primal_size;i++) 19380c7d97c5SJed Brown array_to[pcbddc->replicated_local_primal_indices[i]]+=pcbddc->replicated_local_primal_values[i]; 19390c7d97c5SJed Brown } else { /* no communications needed for SCATTER_REVERSE since needed data is already present */ 19400c7d97c5SJed Brown for(i=0;i<pcbddc->local_primal_size;i++) 19410c7d97c5SJed Brown array_to[i]=array_from[pcbddc->local_primal_indices[i]]; 19420c7d97c5SJed Brown } 19430c7d97c5SJed Brown break; 194453cdbc3dSStefano Zampini case MULTILEVEL_BDDC: 194553cdbc3dSStefano Zampini break; 194653cdbc3dSStefano Zampini case PARALLEL_BDDC: 194753cdbc3dSStefano Zampini break; 19480c7d97c5SJed Brown } 19490c7d97c5SJed Brown if(vec_from) VecRestoreArray(vec_from,&array_from); 19500c7d97c5SJed Brown if(vec_to) VecRestoreArray(vec_to,&array_to); 19510c7d97c5SJed Brown break; 19520c7d97c5SJed Brown } 19530c7d97c5SJed Brown PetscFunctionReturn(0); 19540c7d97c5SJed Brown } 19550c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 
19563b03a366Sstefano_zampini #undef __FUNCT__ 19573b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCCreateConstraintMatrix" 19583b03a366Sstefano_zampini static PetscErrorCode PCBDDCCreateConstraintMatrix(PC pc) 19593b03a366Sstefano_zampini { 19603b03a366Sstefano_zampini PetscErrorCode ierr; 19613b03a366Sstefano_zampini PC_IS* pcis = (PC_IS*)(pc->data); 19623b03a366Sstefano_zampini PC_BDDC* pcbddc = (PC_BDDC*)pc->data; 19633b03a366Sstefano_zampini Mat_IS *matis = (Mat_IS*)pc->pmat->data; 196423d4d1a5SStefano Zampini PetscInt *nnz,*is_indices; 19653b03a366Sstefano_zampini PetscScalar *temp_quadrature_constraint; 1966534831adSStefano Zampini PetscInt *temp_indices,*temp_indices_to_constraint,*temp_indices_to_constraint_B,*local_to_B; 19673b03a366Sstefano_zampini PetscInt local_primal_size,i,j,k,total_counts,max_size_of_constraint; 19683b03a366Sstefano_zampini PetscInt n_constraints,n_vertices,size_of_constraint; 1969534831adSStefano Zampini PetscScalar quad_value; 19703b03a366Sstefano_zampini PetscBool nnsp_has_cnst=PETSC_FALSE,use_nnsp_true=pcbddc->use_nnsp_true; 19713b03a366Sstefano_zampini PetscInt nnsp_size=0,nnsp_addone=0,temp_constraints,temp_start_ptr; 19723b03a366Sstefano_zampini IS *used_IS; 19733b03a366Sstefano_zampini const MatType impMatType=MATSEQAIJ; 19743b03a366Sstefano_zampini PetscBLASInt Bs,Bt,lwork,lierr; 19753b03a366Sstefano_zampini PetscReal tol=1.0e-8; 1976fcda91b4SJed Brown MatNullSpace nearnullsp; 1977fcda91b4SJed Brown const Vec *nearnullvecs; 19783b03a366Sstefano_zampini Vec *localnearnullsp; 19793b03a366Sstefano_zampini PetscScalar *work,*temp_basis,*array_vector,*correlation_mat; 19803b03a366Sstefano_zampini PetscReal *rwork,*singular_vals; 1981534831adSStefano Zampini PetscBLASInt Bone=1,*ipiv; 1982534831adSStefano Zampini Vec temp_vec; 1983534831adSStefano Zampini Mat temp_mat; 1984534831adSStefano Zampini KSP temp_ksp; 1985534831adSStefano Zampini PetscInt s,start_constraint,dual_dofs; 1986534831adSStefano Zampini PetscBool 
compute_submatrix,useksp=PETSC_FALSE; 1987534831adSStefano Zampini PetscInt *aux_primal_permutation,*aux_primal_numbering; 1988534831adSStefano Zampini PetscBool boolforface,*change_basis; 1989de534f79Sstefano_zampini /* some ugly conditional declarations */ 19903b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD) 19913b03a366Sstefano_zampini PetscScalar dot_result; 19923b03a366Sstefano_zampini PetscScalar one=1.0,zero=0.0; 19933b03a366Sstefano_zampini PetscInt ii; 19943425bc38SStefano Zampini PetscScalar *singular_vectors; 19953425bc38SStefano Zampini PetscBLASInt *iwork,*ifail; 19963425bc38SStefano Zampini PetscReal dummy_real,abs_tol; 19973425bc38SStefano Zampini PetscBLASInt eigs_found; 19983b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX) 19993b03a366Sstefano_zampini PetscScalar val1,val2; 20003b03a366Sstefano_zampini #endif 20013425bc38SStefano Zampini #endif 20023b03a366Sstefano_zampini PetscBLASInt dummy_int; 20033b03a366Sstefano_zampini PetscScalar dummy_scalar; 20043b03a366Sstefano_zampini 20053b03a366Sstefano_zampini PetscFunctionBegin; 20063b03a366Sstefano_zampini /* check if near null space is attached to global mat */ 2007fcda91b4SJed Brown ierr = MatGetNearNullSpace(pc->pmat,&nearnullsp);CHKERRQ(ierr); 2008fcda91b4SJed Brown if (nearnullsp) { 2009fcda91b4SJed Brown ierr = MatNullSpaceGetVecs(nearnullsp,&nnsp_has_cnst,&nnsp_size,&nearnullvecs);CHKERRQ(ierr); 20103b03a366Sstefano_zampini } else { /* if near null space is not provided it uses constants */ 20113b03a366Sstefano_zampini nnsp_has_cnst = PETSC_TRUE; 20123b03a366Sstefano_zampini use_nnsp_true = PETSC_TRUE; 20133b03a366Sstefano_zampini } 20143b03a366Sstefano_zampini if(nnsp_has_cnst) { 20153b03a366Sstefano_zampini nnsp_addone = 1; 20163b03a366Sstefano_zampini } 20173b03a366Sstefano_zampini /* 20183b03a366Sstefano_zampini Evaluate maximum storage size needed by the procedure 20193b03a366Sstefano_zampini - temp_indices will contain start index of each constraint stored as 
follows 20203b03a366Sstefano_zampini - temp_indices_to_constraint [temp_indices[i],...,temp[indices[i+1]-1] will contain the indices (in local numbering) on which the constraint acts 2021534831adSStefano Zampini - temp_indices_to_constraint_B[temp_indices[i],...,temp[indices[i+1]-1] will contain the indices (in boundary numbering) on which the constraint acts 20223b03a366Sstefano_zampini - temp_quadrature_constraint [temp_indices[i],...,temp[indices[i+1]-1] will contain the scalars representing the constraint itself 20233b03a366Sstefano_zampini */ 2024da1bb401SStefano Zampini 20253b03a366Sstefano_zampini total_counts = pcbddc->n_ISForFaces+pcbddc->n_ISForEdges; 20263b03a366Sstefano_zampini total_counts *= (nnsp_addone+nnsp_size); 2027da1bb401SStefano Zampini ierr = ISGetSize(pcbddc->ISForVertices,&n_vertices);CHKERRQ(ierr); 2028da1bb401SStefano Zampini total_counts += n_vertices; 20293b03a366Sstefano_zampini ierr = PetscMalloc((total_counts+1)*sizeof(PetscInt),&temp_indices);CHKERRQ(ierr); 2030534831adSStefano Zampini ierr = PetscMalloc((total_counts+1)*sizeof(PetscBool),&change_basis);CHKERRQ(ierr); 20313b03a366Sstefano_zampini total_counts = 0; 20323b03a366Sstefano_zampini max_size_of_constraint = 0; 20333b03a366Sstefano_zampini for(i=0;i<pcbddc->n_ISForEdges+pcbddc->n_ISForFaces;i++){ 20343b03a366Sstefano_zampini if(i<pcbddc->n_ISForEdges){ 20353b03a366Sstefano_zampini used_IS = &pcbddc->ISForEdges[i]; 20363b03a366Sstefano_zampini } else { 20373b03a366Sstefano_zampini used_IS = &pcbddc->ISForFaces[i-pcbddc->n_ISForEdges]; 20383b03a366Sstefano_zampini } 20393b03a366Sstefano_zampini ierr = ISGetSize(*used_IS,&j);CHKERRQ(ierr); 20403b03a366Sstefano_zampini total_counts += j; 20413b03a366Sstefano_zampini if(j>max_size_of_constraint) max_size_of_constraint=j; 20423b03a366Sstefano_zampini } 20433b03a366Sstefano_zampini total_counts *= (nnsp_addone+nnsp_size); 2044da1bb401SStefano Zampini total_counts += n_vertices; 20453b03a366Sstefano_zampini ierr = 
PetscMalloc(total_counts*sizeof(PetscScalar),&temp_quadrature_constraint);CHKERRQ(ierr); 20463b03a366Sstefano_zampini ierr = PetscMalloc(total_counts*sizeof(PetscInt),&temp_indices_to_constraint);CHKERRQ(ierr); 2047534831adSStefano Zampini ierr = PetscMalloc(total_counts*sizeof(PetscInt),&temp_indices_to_constraint_B);CHKERRQ(ierr); 2048534831adSStefano Zampini ierr = PetscMalloc(pcis->n*sizeof(PetscInt),&local_to_B);CHKERRQ(ierr); 2049534831adSStefano Zampini ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 2050534831adSStefano Zampini for(i=0;i<pcis->n;i++) { 2051534831adSStefano Zampini local_to_B[i]=-1; 2052534831adSStefano Zampini } 2053534831adSStefano Zampini for(i=0;i<pcis->n_B;i++) { 2054534831adSStefano Zampini local_to_B[is_indices[i]]=i; 2055534831adSStefano Zampini } 2056534831adSStefano Zampini ierr = ISRestoreIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 2057534831adSStefano Zampini 20583b03a366Sstefano_zampini /* First we issue queries to allocate optimal workspace for LAPACKgesvd or LAPACKsyev/LAPACKheev */ 20593b03a366Sstefano_zampini rwork = 0; 20603b03a366Sstefano_zampini work = 0; 20613b03a366Sstefano_zampini singular_vals = 0; 20623b03a366Sstefano_zampini temp_basis = 0; 20633b03a366Sstefano_zampini correlation_mat = 0; 20643b03a366Sstefano_zampini if(!pcbddc->use_nnsp_true) { 20653b03a366Sstefano_zampini PetscScalar temp_work; 20663b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD) 20673b03a366Sstefano_zampini /* POD */ 20683b03a366Sstefano_zampini PetscInt max_n; 20693b03a366Sstefano_zampini max_n = nnsp_addone+nnsp_size; 20703b03a366Sstefano_zampini /* using some techniques borrowed from Proper Orthogonal Decomposition */ 20713b03a366Sstefano_zampini ierr = PetscMalloc(max_n*max_n*sizeof(PetscScalar),&correlation_mat);CHKERRQ(ierr); 20723425bc38SStefano Zampini ierr = PetscMalloc(max_n*max_n*sizeof(PetscScalar),&singular_vectors);CHKERRQ(ierr); 
20733b03a366Sstefano_zampini ierr = PetscMalloc(max_n*sizeof(PetscReal),&singular_vals);CHKERRQ(ierr); 20743b03a366Sstefano_zampini ierr = PetscMalloc(max_size_of_constraint*(nnsp_addone+nnsp_size)*sizeof(PetscScalar),&temp_basis);CHKERRQ(ierr); 20753b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX) 20763b03a366Sstefano_zampini ierr = PetscMalloc(3*max_n*sizeof(PetscReal),&rwork);CHKERRQ(ierr); 20773b03a366Sstefano_zampini #endif 20783425bc38SStefano Zampini ierr = PetscMalloc(5*max_n*sizeof(PetscBLASInt),&iwork);CHKERRQ(ierr); 20793425bc38SStefano Zampini ierr = PetscMalloc(max_n*sizeof(PetscBLASInt),&ifail);CHKERRQ(ierr); 20803b03a366Sstefano_zampini /* now we evaluate the optimal workspace using query with lwork=-1 */ 20813b03a366Sstefano_zampini Bt = PetscBLASIntCast(max_n); 20823b03a366Sstefano_zampini lwork=-1; 20833425bc38SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 20843b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX) 20853425bc38SStefano Zampini abs_tol=1.e-8; 20863425bc38SStefano Zampini /* LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,&temp_work,&lwork,&lierr); */ 20873425bc38SStefano Zampini LAPACKsyevx_("V","A","U",&Bt,correlation_mat,&Bt,&dummy_real,&dummy_real,&dummy_int,&dummy_int, 20883425bc38SStefano Zampini &abs_tol,&eigs_found,singular_vals,singular_vectors,&Bt,&temp_work,&lwork,iwork,ifail,&lierr); 20893b03a366Sstefano_zampini #else 20903425bc38SStefano Zampini /* LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,&temp_work,&lwork,rwork,&lierr); */ 20913425bc38SStefano Zampini /* LAPACK call is missing here! 
TODO */ 20923425bc38SStefano Zampini SETERRQ(((PetscObject) pc)->comm, PETSC_ERR_SUP, "Not yet implemented for complexes when PETSC_MISSING_GESVD = 1"); 20933b03a366Sstefano_zampini #endif 20943425bc38SStefano Zampini if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SYEVX Lapack routine %d",(int)lierr); 20953425bc38SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 20963b03a366Sstefano_zampini #else /* on missing GESVD */ 20973b03a366Sstefano_zampini /* SVD */ 20983b03a366Sstefano_zampini PetscInt max_n,min_n; 20993b03a366Sstefano_zampini max_n = max_size_of_constraint; 21003b03a366Sstefano_zampini min_n = nnsp_addone+nnsp_size; 21013b03a366Sstefano_zampini if(max_size_of_constraint < ( nnsp_addone+nnsp_size ) ) { 21023b03a366Sstefano_zampini min_n = max_size_of_constraint; 21033b03a366Sstefano_zampini max_n = nnsp_addone+nnsp_size; 21043b03a366Sstefano_zampini } 21053b03a366Sstefano_zampini ierr = PetscMalloc(min_n*sizeof(PetscReal),&singular_vals);CHKERRQ(ierr); 21063b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX) 21073b03a366Sstefano_zampini ierr = PetscMalloc(5*min_n*sizeof(PetscReal),&rwork);CHKERRQ(ierr); 21083b03a366Sstefano_zampini #endif 21093b03a366Sstefano_zampini /* now we evaluate the optimal workspace using query with lwork=-1 */ 21103b03a366Sstefano_zampini lwork=-1; 21113b03a366Sstefano_zampini Bs = PetscBLASIntCast(max_n); 21123b03a366Sstefano_zampini Bt = PetscBLASIntCast(min_n); 21133b03a366Sstefano_zampini dummy_int = Bs; 2114670f3ff9SJed Brown ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 21153b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX) 21163b03a366Sstefano_zampini LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[0],&Bs,singular_vals, 21173b03a366Sstefano_zampini &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,&temp_work,&lwork,&lierr); 21183b03a366Sstefano_zampini #else 21193b03a366Sstefano_zampini LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[0],&Bs,singular_vals, 
21203b03a366Sstefano_zampini &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,&temp_work,&lwork,rwork,&lierr); 21213b03a366Sstefano_zampini #endif 21223b03a366Sstefano_zampini if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SVD Lapack routine %d",(int)lierr); 2123670f3ff9SJed Brown ierr = PetscFPTrapPop();CHKERRQ(ierr); 21243b03a366Sstefano_zampini #endif 21253b03a366Sstefano_zampini /* Allocate optimal workspace */ 21263b03a366Sstefano_zampini lwork = PetscBLASIntCast((PetscInt)PetscRealPart(temp_work)); 21273b03a366Sstefano_zampini total_counts = (PetscInt)lwork; 21283b03a366Sstefano_zampini ierr = PetscMalloc(total_counts*sizeof(PetscScalar),&work);CHKERRQ(ierr); 21293b03a366Sstefano_zampini } 21303b03a366Sstefano_zampini /* get local part of global near null space vectors */ 21313b03a366Sstefano_zampini ierr = PetscMalloc(nnsp_size*sizeof(Vec),&localnearnullsp);CHKERRQ(ierr); 21323b03a366Sstefano_zampini for(k=0;k<nnsp_size;k++) { 21333b03a366Sstefano_zampini ierr = VecDuplicate(pcis->vec1_N,&localnearnullsp[k]);CHKERRQ(ierr); 2134fcda91b4SJed Brown ierr = VecScatterBegin(matis->ctx,nearnullvecs[k],localnearnullsp[k],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 2135fcda91b4SJed Brown ierr = VecScatterEnd (matis->ctx,nearnullvecs[k],localnearnullsp[k],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 21363b03a366Sstefano_zampini } 21373b03a366Sstefano_zampini /* Now we can loop on constraining sets */ 21383b03a366Sstefano_zampini total_counts=0; 21393b03a366Sstefano_zampini temp_indices[0]=0; 2140da1bb401SStefano Zampini /* vertices */ 2141da1bb401SStefano Zampini PetscBool used_vertex; 2142da1bb401SStefano Zampini ierr = ISGetIndices(pcbddc->ISForVertices,(const PetscInt**)&is_indices);CHKERRQ(ierr); 2143da1bb401SStefano Zampini if(nnsp_has_cnst) { /* consider all vertices */ 2144da1bb401SStefano Zampini for(i=0;i<n_vertices;i++) { 2145da1bb401SStefano Zampini temp_indices_to_constraint[temp_indices[total_counts]]=is_indices[i]; 
2146534831adSStefano Zampini temp_indices_to_constraint_B[temp_indices[total_counts]]=local_to_B[is_indices[i]]; 2147da1bb401SStefano Zampini temp_quadrature_constraint[temp_indices[total_counts]]=1.0; 2148da1bb401SStefano Zampini temp_indices[total_counts+1]=temp_indices[total_counts]+1; 2149534831adSStefano Zampini change_basis[total_counts]=PETSC_FALSE; 2150da1bb401SStefano Zampini total_counts++; 2151da1bb401SStefano Zampini } 2152da1bb401SStefano Zampini } else { /* consider vertices for which exist at least a localnearnullsp which is not null there */ 2153da1bb401SStefano Zampini for(i=0;i<n_vertices;i++) { 2154da1bb401SStefano Zampini used_vertex=PETSC_FALSE; 2155da1bb401SStefano Zampini k=0; 2156da1bb401SStefano Zampini while(!used_vertex && k<nnsp_size) { 2157da1bb401SStefano Zampini ierr = VecGetArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr); 2158da1bb401SStefano Zampini if(PetscAbsScalar(array_vector[is_indices[i]])>0.0) { 2159da1bb401SStefano Zampini temp_indices_to_constraint[temp_indices[total_counts]]=is_indices[i]; 2160534831adSStefano Zampini temp_indices_to_constraint_B[temp_indices[total_counts]]=local_to_B[is_indices[i]]; 2161da1bb401SStefano Zampini temp_quadrature_constraint[temp_indices[total_counts]]=1.0; 2162da1bb401SStefano Zampini temp_indices[total_counts+1]=temp_indices[total_counts]+1; 2163534831adSStefano Zampini change_basis[total_counts]=PETSC_FALSE; 2164da1bb401SStefano Zampini total_counts++; 2165da1bb401SStefano Zampini used_vertex=PETSC_TRUE; 2166da1bb401SStefano Zampini } 2167da1bb401SStefano Zampini ierr = VecRestoreArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr); 2168da1bb401SStefano Zampini k++; 2169da1bb401SStefano Zampini } 2170da1bb401SStefano Zampini } 2171da1bb401SStefano Zampini } 2172da1bb401SStefano Zampini ierr = ISRestoreIndices(pcbddc->ISForVertices,(const PetscInt**)&is_indices);CHKERRQ(ierr); 2173da1bb401SStefano Zampini n_vertices=total_counts; 
2174da1bb401SStefano Zampini /* edges and faces */ 21753b03a366Sstefano_zampini for(i=0;i<pcbddc->n_ISForEdges+pcbddc->n_ISForFaces;i++){ 21763b03a366Sstefano_zampini if(i<pcbddc->n_ISForEdges){ 21773b03a366Sstefano_zampini used_IS = &pcbddc->ISForEdges[i]; 2178534831adSStefano Zampini boolforface = pcbddc->usechangeofbasis; 21793b03a366Sstefano_zampini } else { 21803b03a366Sstefano_zampini used_IS = &pcbddc->ISForFaces[i-pcbddc->n_ISForEdges]; 2181534831adSStefano Zampini boolforface = pcbddc->usechangeonfaces; 21823b03a366Sstefano_zampini } 21833b03a366Sstefano_zampini temp_constraints = 0; /* zero the number of constraints I have on this conn comp */ 21843b03a366Sstefano_zampini temp_start_ptr = total_counts; /* need to know the starting index of constraints stored */ 21853b03a366Sstefano_zampini ierr = ISGetSize(*used_IS,&size_of_constraint);CHKERRQ(ierr); 21863b03a366Sstefano_zampini ierr = ISGetIndices(*used_IS,(const PetscInt**)&is_indices);CHKERRQ(ierr); 21873b03a366Sstefano_zampini if(nnsp_has_cnst) { 21883b03a366Sstefano_zampini temp_constraints++; 2189534831adSStefano Zampini quad_value = (PetscScalar) (1.0/PetscSqrtReal((PetscReal)size_of_constraint)); 21903b03a366Sstefano_zampini for(j=0;j<size_of_constraint;j++) { 21913b03a366Sstefano_zampini temp_indices_to_constraint[temp_indices[total_counts]+j]=is_indices[j]; 2192534831adSStefano Zampini temp_indices_to_constraint_B[temp_indices[total_counts]+j]=local_to_B[is_indices[j]]; 21933b03a366Sstefano_zampini temp_quadrature_constraint[temp_indices[total_counts]+j]=quad_value; 21943b03a366Sstefano_zampini } 21953b03a366Sstefano_zampini temp_indices[total_counts+1]=temp_indices[total_counts]+size_of_constraint; /* store new starting point */ 2196534831adSStefano Zampini change_basis[total_counts]=boolforface; 21973b03a366Sstefano_zampini total_counts++; 21983b03a366Sstefano_zampini } 21993b03a366Sstefano_zampini for(k=0;k<nnsp_size;k++) { 22003b03a366Sstefano_zampini ierr = 
VecGetArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr); 22013b03a366Sstefano_zampini for(j=0;j<size_of_constraint;j++) { 22023b03a366Sstefano_zampini temp_indices_to_constraint[temp_indices[total_counts]+j]=is_indices[j]; 2203534831adSStefano Zampini temp_indices_to_constraint_B[temp_indices[total_counts]+j]=local_to_B[is_indices[j]]; 22043b03a366Sstefano_zampini temp_quadrature_constraint[temp_indices[total_counts]+j]=array_vector[is_indices[j]]; 22053b03a366Sstefano_zampini } 22063b03a366Sstefano_zampini ierr = VecRestoreArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr); 2207de534f79Sstefano_zampini quad_value = 1.0; 2208de534f79Sstefano_zampini if( use_nnsp_true ) { /* check if array is null on the connected component in case use_nnsp_true has been requested */ 2209de534f79Sstefano_zampini Bs = PetscBLASIntCast(size_of_constraint); 2210de534f79Sstefano_zampini quad_value = BLASasum_(&Bs,&temp_quadrature_constraint[temp_indices[total_counts]],&Bone); 2211de534f79Sstefano_zampini } 2212de534f79Sstefano_zampini if ( quad_value > 0.0 ) { /* keep indices and values */ 2213de534f79Sstefano_zampini temp_constraints++; 22143b03a366Sstefano_zampini temp_indices[total_counts+1]=temp_indices[total_counts]+size_of_constraint; /* store new starting point */ 2215534831adSStefano Zampini change_basis[total_counts]=boolforface; 22163b03a366Sstefano_zampini total_counts++; 22173b03a366Sstefano_zampini } 2218de534f79Sstefano_zampini } 22193b03a366Sstefano_zampini ierr = ISRestoreIndices(*used_IS,(const PetscInt**)&is_indices);CHKERRQ(ierr); 2220de534f79Sstefano_zampini /* perform SVD on the constraint if use_nnsp_true has not be requested by the user */ 22213b03a366Sstefano_zampini if(!use_nnsp_true) { 2222de534f79Sstefano_zampini 22233b03a366Sstefano_zampini Bs = PetscBLASIntCast(size_of_constraint); 22243b03a366Sstefano_zampini Bt = PetscBLASIntCast(temp_constraints); 2225de534f79Sstefano_zampini 
22263b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD) 22273b03a366Sstefano_zampini ierr = PetscMemzero(correlation_mat,Bt*Bt*sizeof(PetscScalar));CHKERRQ(ierr); 22283b03a366Sstefano_zampini /* Store upper triangular part of correlation matrix */ 22293b03a366Sstefano_zampini for(j=0;j<temp_constraints;j++) { 22303b03a366Sstefano_zampini for(k=0;k<j+1;k++) { 22313b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX) 22323425bc38SStefano Zampini /* hand made complex dot product -> replace */ 22333b03a366Sstefano_zampini dot_result = 0.0; 22343b03a366Sstefano_zampini for (ii=0; ii<size_of_constraint; ii++) { 22353b03a366Sstefano_zampini val1 = temp_quadrature_constraint[temp_indices[temp_start_ptr+j]+ii]; 22363b03a366Sstefano_zampini val2 = temp_quadrature_constraint[temp_indices[temp_start_ptr+k]+ii]; 22373b03a366Sstefano_zampini dot_result += val1*PetscConj(val2); 22383b03a366Sstefano_zampini } 22393b03a366Sstefano_zampini #else 22403b03a366Sstefano_zampini dot_result = BLASdot_(&Bs,&temp_quadrature_constraint[temp_indices[temp_start_ptr+j]],&Bone, 22413b03a366Sstefano_zampini &temp_quadrature_constraint[temp_indices[temp_start_ptr+k]],&Bone); 22423b03a366Sstefano_zampini #endif 22433b03a366Sstefano_zampini correlation_mat[j*temp_constraints+k]=dot_result; 22443b03a366Sstefano_zampini } 22453b03a366Sstefano_zampini } 22463425bc38SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 22473b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX) 22483425bc38SStefano Zampini /* LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,work,&lwork,&lierr); */ 22493425bc38SStefano Zampini LAPACKsyevx_("V","A","U",&Bt,correlation_mat,&Bt,&dummy_real,&dummy_real,&dummy_int,&dummy_int, 22503425bc38SStefano Zampini &abs_tol,&eigs_found,singular_vals,singular_vectors,&Bt,work,&lwork,iwork,ifail,&lierr); 22513b03a366Sstefano_zampini #else 22523425bc38SStefano Zampini /* LAPACK call is missing here! 
TODO */ 22533425bc38SStefano Zampini SETERRQ(((PetscObject) pc)->comm, PETSC_ERR_SUP, "Not yet implemented for complexes when PETSC_MISSING_GESVD = 1"); 22543b03a366Sstefano_zampini #endif 22553425bc38SStefano Zampini if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYEVX Lapack routine %d",(int)lierr); 22563425bc38SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 22573b03a366Sstefano_zampini /* retain eigenvalues greater than tol: note that lapack SYEV gives eigs in ascending order */ 22583b03a366Sstefano_zampini j=0; 22593b03a366Sstefano_zampini while( j < Bt && singular_vals[j] < tol) j++; 22603b03a366Sstefano_zampini total_counts=total_counts-j; 22613b03a366Sstefano_zampini if(j<temp_constraints) { 22623b03a366Sstefano_zampini for(k=j;k<Bt;k++) { singular_vals[k]=1.0/PetscSqrtReal(singular_vals[k]); } 22633425bc38SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 22643b03a366Sstefano_zampini BLASgemm_("N","N",&Bs,&Bt,&Bt,&one,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,correlation_mat,&Bt,&zero,temp_basis,&Bs); 22653425bc38SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 22663b03a366Sstefano_zampini /* copy POD basis into used quadrature memory */ 22673b03a366Sstefano_zampini for(k=0;k<Bt-j;k++) { 22683b03a366Sstefano_zampini for(ii=0;ii<size_of_constraint;ii++) { 22693b03a366Sstefano_zampini temp_quadrature_constraint[temp_indices[temp_start_ptr+k]+ii]=singular_vals[Bt-1-k]*temp_basis[(Bt-1-k)*size_of_constraint+ii]; 22703b03a366Sstefano_zampini } 22713b03a366Sstefano_zampini } 22723b03a366Sstefano_zampini } 2273de534f79Sstefano_zampini 22743b03a366Sstefano_zampini #else /* on missing GESVD */ 22753b03a366Sstefano_zampini PetscInt min_n = temp_constraints; 22763b03a366Sstefano_zampini if(min_n > size_of_constraint) min_n = size_of_constraint; 22773b03a366Sstefano_zampini dummy_int = Bs; 2278670f3ff9SJed Brown ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 22793b03a366Sstefano_zampini 
#if !defined(PETSC_USE_COMPLEX) 22803b03a366Sstefano_zampini LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,singular_vals, 22813b03a366Sstefano_zampini &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,work,&lwork,&lierr); 22823b03a366Sstefano_zampini #else 22833b03a366Sstefano_zampini LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,singular_vals, 22843b03a366Sstefano_zampini &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,work,&lwork,rwork,&lierr); 22853b03a366Sstefano_zampini #endif 22863b03a366Sstefano_zampini if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SVD Lapack routine %d",(int)lierr); 2287670f3ff9SJed Brown ierr = PetscFPTrapPop();CHKERRQ(ierr); 22883b03a366Sstefano_zampini /* retain eigenvalues greater than tol: note that lapack SVD gives eigs in descending order */ 22893b03a366Sstefano_zampini j=0; 22903b03a366Sstefano_zampini while( j < min_n && singular_vals[min_n-j-1] < tol) j++; 22913b03a366Sstefano_zampini total_counts = total_counts-(PetscInt)Bt+(min_n-j); 22923b03a366Sstefano_zampini #endif 22933b03a366Sstefano_zampini } 22943b03a366Sstefano_zampini } 2295534831adSStefano Zampini 2296da1bb401SStefano Zampini n_constraints=total_counts-n_vertices; 2297da1bb401SStefano Zampini local_primal_size = total_counts; 22983b03a366Sstefano_zampini /* set quantities in pcbddc data structure */ 22993b03a366Sstefano_zampini pcbddc->n_vertices = n_vertices; 23003b03a366Sstefano_zampini pcbddc->n_constraints = n_constraints; 2301da1bb401SStefano Zampini pcbddc->local_primal_size = local_primal_size; 2302534831adSStefano Zampini 2303534831adSStefano Zampini /* Create constraint matrix */ 2304534831adSStefano Zampini /* The constraint matrix is used to compute the l2g map of primal dofs */ 2305534831adSStefano Zampini /* so we need to set it up properly either with or without change of basis */ 2306534831adSStefano Zampini ierr = 
MatCreate(PETSC_COMM_SELF,&pcbddc->ConstraintMatrix);CHKERRQ(ierr); 2307534831adSStefano Zampini ierr = MatSetType(pcbddc->ConstraintMatrix,impMatType);CHKERRQ(ierr); 2308534831adSStefano Zampini ierr = MatSetSizes(pcbddc->ConstraintMatrix,local_primal_size,pcis->n,local_primal_size,pcis->n);CHKERRQ(ierr); 2309534831adSStefano Zampini /* compute a local numbering of constraints : vertices first then constraints */ 2310534831adSStefano Zampini ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr); 2311534831adSStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array_vector);CHKERRQ(ierr); 2312534831adSStefano Zampini ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&aux_primal_numbering);CHKERRQ(ierr); 2313534831adSStefano Zampini ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&aux_primal_permutation);CHKERRQ(ierr); 2314534831adSStefano Zampini total_counts=0; 2315534831adSStefano Zampini /* find vertices: subdomain corners plus dofs with basis changed */ 2316534831adSStefano Zampini for(i=0;i<local_primal_size;i++) { 2317534831adSStefano Zampini size_of_constraint=temp_indices[i+1]-temp_indices[i]; 2318534831adSStefano Zampini if(change_basis[i] || size_of_constraint == 1) { 2319534831adSStefano Zampini k=0; 2320534831adSStefano Zampini while(k < size_of_constraint && array_vector[temp_indices_to_constraint[temp_indices[i]+size_of_constraint-k-1]] != 0.0) { 2321534831adSStefano Zampini k=k+1; 2322534831adSStefano Zampini } 2323534831adSStefano Zampini j=temp_indices_to_constraint[temp_indices[i]+size_of_constraint-k-1]; 2324534831adSStefano Zampini array_vector[j] = 1.0; 2325534831adSStefano Zampini aux_primal_numbering[total_counts]=j; 2326534831adSStefano Zampini aux_primal_permutation[total_counts]=total_counts; 2327534831adSStefano Zampini total_counts++; 2328534831adSStefano Zampini } 2329534831adSStefano Zampini } 2330534831adSStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array_vector);CHKERRQ(ierr); 2331534831adSStefano Zampini /* permute indices in 
order to have a sorted set of vertices */ 2332534831adSStefano Zampini ierr = PetscSortIntWithPermutation(total_counts,aux_primal_numbering,aux_primal_permutation); 2333534831adSStefano Zampini /* nonzero structure */ 2334534831adSStefano Zampini ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&nnz);CHKERRQ(ierr); 2335534831adSStefano Zampini for(i=0;i<total_counts;i++) { 2336534831adSStefano Zampini nnz[i]=1; 2337534831adSStefano Zampini } 2338534831adSStefano Zampini j=total_counts; 2339534831adSStefano Zampini for(i=n_vertices;i<local_primal_size;i++) { 2340534831adSStefano Zampini if(!change_basis[i]) { 2341534831adSStefano Zampini nnz[j]=temp_indices[i+1]-temp_indices[i]; 2342534831adSStefano Zampini j++; 2343534831adSStefano Zampini } 2344534831adSStefano Zampini } 2345534831adSStefano Zampini ierr = MatSeqAIJSetPreallocation(pcbddc->ConstraintMatrix,0,nnz);CHKERRQ(ierr); 2346534831adSStefano Zampini ierr = PetscFree(nnz);CHKERRQ(ierr); 2347534831adSStefano Zampini /* set values in constraint matrix */ 2348534831adSStefano Zampini for(i=0;i<total_counts;i++) { 2349534831adSStefano Zampini j = aux_primal_permutation[i]; 2350534831adSStefano Zampini k = aux_primal_numbering[j]; 2351534831adSStefano Zampini ierr = MatSetValue(pcbddc->ConstraintMatrix,i,k,1.0,INSERT_VALUES);CHKERRQ(ierr); 2352534831adSStefano Zampini } 2353534831adSStefano Zampini for(i=n_vertices;i<local_primal_size;i++) { 2354534831adSStefano Zampini if(!change_basis[i]) { 2355534831adSStefano Zampini size_of_constraint=temp_indices[i+1]-temp_indices[i]; 2356534831adSStefano Zampini ierr = MatSetValues(pcbddc->ConstraintMatrix,1,&total_counts,size_of_constraint,&temp_indices_to_constraint[temp_indices[i]],&temp_quadrature_constraint[temp_indices[i]],INSERT_VALUES);CHKERRQ(ierr); 2357534831adSStefano Zampini total_counts++; 2358534831adSStefano Zampini } 2359534831adSStefano Zampini } 2360534831adSStefano Zampini ierr = PetscFree(aux_primal_numbering);CHKERRQ(ierr); 2361534831adSStefano 
Zampini ierr = PetscFree(aux_primal_permutation);CHKERRQ(ierr); 2362534831adSStefano Zampini /* assembling */ 2363534831adSStefano Zampini ierr = MatAssemblyBegin(pcbddc->ConstraintMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2364534831adSStefano Zampini ierr = MatAssemblyEnd(pcbddc->ConstraintMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2365534831adSStefano Zampini 2366534831adSStefano Zampini /* Create matrix for change of basis. We don't need it in case pcbddc->usechangeofbasis is FALSE */ 2367534831adSStefano Zampini if(pcbddc->usechangeofbasis) { 2368534831adSStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr); 2369534831adSStefano Zampini ierr = MatSetType(pcbddc->ChangeOfBasisMatrix,impMatType);CHKERRQ(ierr); 2370534831adSStefano Zampini ierr = MatSetSizes(pcbddc->ChangeOfBasisMatrix,pcis->n_B,pcis->n_B,pcis->n_B,pcis->n_B);CHKERRQ(ierr); 2371534831adSStefano Zampini /* work arrays */ 2372534831adSStefano Zampini /* we need to reuse these arrays, so we free them */ 2373534831adSStefano Zampini ierr = PetscFree(temp_basis);CHKERRQ(ierr); 2374534831adSStefano Zampini ierr = PetscFree(work);CHKERRQ(ierr); 2375534831adSStefano Zampini ierr = PetscMalloc(pcis->n_B*sizeof(PetscInt),&nnz);CHKERRQ(ierr); 2376534831adSStefano Zampini ierr = PetscMalloc((nnsp_addone+nnsp_size)*(nnsp_addone+nnsp_size)*sizeof(PetscScalar),&temp_basis);CHKERRQ(ierr); 2377534831adSStefano Zampini ierr = PetscMalloc((nnsp_addone+nnsp_size)*sizeof(PetscScalar),&work);CHKERRQ(ierr); 2378534831adSStefano Zampini ierr = PetscMalloc((nnsp_addone+nnsp_size)*sizeof(PetscBLASInt),&ipiv);CHKERRQ(ierr); 2379534831adSStefano Zampini for(i=0;i<pcis->n_B;i++) { 2380534831adSStefano Zampini nnz[i]=1; 2381534831adSStefano Zampini } 2382534831adSStefano Zampini /* Overestimated nonzeros per row */ 2383534831adSStefano Zampini k=1; 2384534831adSStefano Zampini for(i=pcbddc->n_vertices;i<local_primal_size;i++) { 2385534831adSStefano Zampini if(change_basis[i]) { 
2386534831adSStefano Zampini size_of_constraint = temp_indices[i+1]-temp_indices[i]; 2387534831adSStefano Zampini if(k < size_of_constraint) { 2388534831adSStefano Zampini k = size_of_constraint; 2389534831adSStefano Zampini } 2390534831adSStefano Zampini for(j=0;j<size_of_constraint;j++) { 2391534831adSStefano Zampini nnz[temp_indices_to_constraint_B[temp_indices[i]+j]] = size_of_constraint; 2392534831adSStefano Zampini } 2393534831adSStefano Zampini } 2394534831adSStefano Zampini } 2395534831adSStefano Zampini ierr = MatSeqAIJSetPreallocation(pcbddc->ChangeOfBasisMatrix,0,nnz);CHKERRQ(ierr); 2396534831adSStefano Zampini ierr = PetscFree(nnz);CHKERRQ(ierr); 2397534831adSStefano Zampini /* Temporary array to store indices */ 2398534831adSStefano Zampini ierr = PetscMalloc(k*sizeof(PetscInt),&is_indices);CHKERRQ(ierr); 2399534831adSStefano Zampini /* Set initial identity in the matrix */ 2400534831adSStefano Zampini for(i=0;i<pcis->n_B;i++) { 2401534831adSStefano Zampini ierr = MatSetValue(pcbddc->ChangeOfBasisMatrix,i,i,1.0,INSERT_VALUES);CHKERRQ(ierr); 2402534831adSStefano Zampini } 2403534831adSStefano Zampini /* Now we loop on the constraints which need a change of basis */ 2404534831adSStefano Zampini /* Change of basis matrix is evaluated as the FIRST APPROACH in */ 2405534831adSStefano Zampini /* Klawonn and Widlund, Dual-primal FETI-DP methods for linear elasticity, (6.2.1) */ 2406534831adSStefano Zampini temp_constraints = 0; 2407534831adSStefano Zampini temp_start_ptr = temp_indices_to_constraint_B[temp_indices[pcbddc->n_vertices]]; 2408534831adSStefano Zampini for(i=pcbddc->n_vertices;i<local_primal_size;i++) { 2409534831adSStefano Zampini if(change_basis[i]) { 2410534831adSStefano Zampini compute_submatrix = PETSC_FALSE; 2411534831adSStefano Zampini useksp = PETSC_FALSE; 2412534831adSStefano Zampini if(temp_start_ptr == temp_indices_to_constraint_B[temp_indices[i]]) { 2413534831adSStefano Zampini temp_constraints++; 2414*04eaf177SStefano Zampini if(i == 
local_primal_size -1 || temp_start_ptr != temp_indices_to_constraint_B[temp_indices[i+1]]) { 2415534831adSStefano Zampini compute_submatrix = PETSC_TRUE; 2416534831adSStefano Zampini } 2417534831adSStefano Zampini } 2418534831adSStefano Zampini if(compute_submatrix) { 2419534831adSStefano Zampini if(temp_constraints > 1 || pcbddc->use_nnsp_true) { 2420534831adSStefano Zampini useksp = PETSC_TRUE; 2421534831adSStefano Zampini } 2422534831adSStefano Zampini size_of_constraint = temp_indices[i+1]-temp_indices[i]; 2423534831adSStefano Zampini if(useksp) { /* experimental */ 2424534831adSStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&temp_mat);CHKERRQ(ierr); 2425534831adSStefano Zampini ierr = MatSetType(temp_mat,impMatType);CHKERRQ(ierr); 2426534831adSStefano Zampini ierr = MatSetSizes(temp_mat,size_of_constraint,size_of_constraint,size_of_constraint,size_of_constraint);CHKERRQ(ierr); 2427534831adSStefano Zampini ierr = MatSeqAIJSetPreallocation(temp_mat,size_of_constraint,PETSC_NULL);CHKERRQ(ierr); 2428534831adSStefano Zampini } 2429534831adSStefano Zampini /* First _size_of_constraint-temp_constraints_ columns */ 2430534831adSStefano Zampini dual_dofs = size_of_constraint-temp_constraints; 2431534831adSStefano Zampini start_constraint = i+1-temp_constraints; 2432534831adSStefano Zampini for(s=0;s<dual_dofs;s++) { 2433534831adSStefano Zampini is_indices[0] = s; 2434534831adSStefano Zampini for(j=0;j<temp_constraints;j++) { 2435534831adSStefano Zampini for(k=0;k<temp_constraints;k++) { 2436534831adSStefano Zampini temp_basis[j*temp_constraints+k]=temp_quadrature_constraint[temp_indices[start_constraint+k]+s+j+1]; 2437534831adSStefano Zampini } 2438534831adSStefano Zampini work[j]=-temp_quadrature_constraint[temp_indices[start_constraint+j]+s]; 2439534831adSStefano Zampini is_indices[j+1]=s+j+1; 2440534831adSStefano Zampini } 2441534831adSStefano Zampini Bt = temp_constraints; 2442534831adSStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 
2443534831adSStefano Zampini LAPACKgesv_(&Bt,&Bone,temp_basis,&Bt,ipiv,work,&Bt,&lierr); 2444534831adSStefano Zampini if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GESV Lapack routine %d",(int)lierr); 2445534831adSStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 2446534831adSStefano Zampini j = temp_indices_to_constraint_B[temp_indices[start_constraint]+s]; 2447534831adSStefano Zampini ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,temp_constraints,&temp_indices_to_constraint_B[temp_indices[start_constraint]+s+1],1,&j,work,INSERT_VALUES);CHKERRQ(ierr); 2448534831adSStefano Zampini if(useksp) { 2449534831adSStefano Zampini /* temp mat with transposed rows and columns */ 2450534831adSStefano Zampini ierr = MatSetValues(temp_mat,1,&s,temp_constraints,&is_indices[1],work,INSERT_VALUES);CHKERRQ(ierr); 2451534831adSStefano Zampini ierr = MatSetValue(temp_mat,is_indices[0],is_indices[0],1.0,INSERT_VALUES);CHKERRQ(ierr); 2452534831adSStefano Zampini } 2453534831adSStefano Zampini } 2454534831adSStefano Zampini if(useksp) { 2455534831adSStefano Zampini /* last rows of temp_mat */ 2456534831adSStefano Zampini for(j=0;j<size_of_constraint;j++) { 2457534831adSStefano Zampini is_indices[j] = j; 2458534831adSStefano Zampini } 2459534831adSStefano Zampini for(s=0;s<temp_constraints;s++) { 2460534831adSStefano Zampini k = s + dual_dofs; 2461534831adSStefano Zampini ierr = MatSetValues(temp_mat,1,&k,size_of_constraint,is_indices,&temp_quadrature_constraint[temp_indices[start_constraint+s]],INSERT_VALUES);CHKERRQ(ierr); 2462534831adSStefano Zampini } 2463534831adSStefano Zampini ierr = MatAssemblyBegin(temp_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2464534831adSStefano Zampini ierr = MatAssemblyEnd(temp_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2465534831adSStefano Zampini ierr = MatGetVecs(temp_mat,&temp_vec,PETSC_NULL);CHKERRQ(ierr); 2466534831adSStefano Zampini ierr = KSPCreate(PETSC_COMM_SELF,&temp_ksp);CHKERRQ(ierr); 2467534831adSStefano Zampini ierr = 
KSPSetOperators(temp_ksp,temp_mat,temp_mat,SAME_PRECONDITIONER);CHKERRQ(ierr); 2468534831adSStefano Zampini ierr = KSPSetType(temp_ksp,KSPPREONLY);CHKERRQ(ierr); 2469534831adSStefano Zampini ierr = KSPSetUp(temp_ksp);CHKERRQ(ierr); 2470534831adSStefano Zampini for(s=0;s<temp_constraints;s++) { 2471534831adSStefano Zampini ierr = VecSet(temp_vec,0.0);CHKERRQ(ierr); 2472534831adSStefano Zampini ierr = VecSetValue(temp_vec,s+dual_dofs,1.0,INSERT_VALUES);CHKERRQ(ierr); 2473534831adSStefano Zampini ierr = VecAssemblyBegin(temp_vec);CHKERRQ(ierr); 2474534831adSStefano Zampini ierr = VecAssemblyEnd(temp_vec);CHKERRQ(ierr); 2475534831adSStefano Zampini ierr = KSPSolve(temp_ksp,temp_vec,temp_vec);CHKERRQ(ierr); 2476534831adSStefano Zampini ierr = VecGetArray(temp_vec,&array_vector);CHKERRQ(ierr); 2477534831adSStefano Zampini j = temp_indices_to_constraint_B[temp_indices[start_constraint+s]+size_of_constraint-s-1]; 2478534831adSStefano Zampini /* last columns of change of basis matrix associated to new primal dofs */ 2479534831adSStefano Zampini ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,size_of_constraint,&temp_indices_to_constraint_B[temp_indices[start_constraint+s]],1,&j,array_vector,INSERT_VALUES);CHKERRQ(ierr); 2480534831adSStefano Zampini ierr = VecRestoreArray(temp_vec,&array_vector);CHKERRQ(ierr); 2481534831adSStefano Zampini } 2482534831adSStefano Zampini ierr = MatDestroy(&temp_mat);CHKERRQ(ierr); 2483534831adSStefano Zampini ierr = KSPDestroy(&temp_ksp);CHKERRQ(ierr); 2484534831adSStefano Zampini ierr = VecDestroy(&temp_vec);CHKERRQ(ierr); 2485534831adSStefano Zampini } else { 2486534831adSStefano Zampini /* last columns of change of basis matrix associated to new primal dofs */ 2487534831adSStefano Zampini for(s=0;s<temp_constraints;s++) { 2488534831adSStefano Zampini j = temp_indices_to_constraint_B[temp_indices[start_constraint+s]+size_of_constraint-s-1]; 2489534831adSStefano Zampini ierr = 
MatSetValues(pcbddc->ChangeOfBasisMatrix,size_of_constraint,&temp_indices_to_constraint_B[temp_indices[start_constraint+s]],1,&j,&temp_quadrature_constraint[temp_indices[start_constraint+s]],INSERT_VALUES);CHKERRQ(ierr); 2490534831adSStefano Zampini } 2491534831adSStefano Zampini } 2492534831adSStefano Zampini /* prepare for the next cycle */ 2493534831adSStefano Zampini temp_constraints = 0; 2494*04eaf177SStefano Zampini if(i != local_primal_size -1 ) { 2495534831adSStefano Zampini temp_start_ptr = temp_indices_to_constraint_B[temp_indices[i+1]]; 2496534831adSStefano Zampini } 2497534831adSStefano Zampini } 2498534831adSStefano Zampini } 2499*04eaf177SStefano Zampini } 2500534831adSStefano Zampini /* assembling */ 2501534831adSStefano Zampini ierr = MatAssemblyBegin(pcbddc->ChangeOfBasisMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2502534831adSStefano Zampini ierr = MatAssemblyEnd(pcbddc->ChangeOfBasisMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2503534831adSStefano Zampini ierr = PetscFree(ipiv);CHKERRQ(ierr); 2504534831adSStefano Zampini ierr = PetscFree(is_indices);CHKERRQ(ierr); 2505534831adSStefano Zampini } 25063b03a366Sstefano_zampini /* free workspace no longer needed */ 25073b03a366Sstefano_zampini ierr = PetscFree(rwork);CHKERRQ(ierr); 25083b03a366Sstefano_zampini ierr = PetscFree(work);CHKERRQ(ierr); 25093b03a366Sstefano_zampini ierr = PetscFree(temp_basis);CHKERRQ(ierr); 25103b03a366Sstefano_zampini ierr = PetscFree(singular_vals);CHKERRQ(ierr); 25113b03a366Sstefano_zampini ierr = PetscFree(correlation_mat);CHKERRQ(ierr); 25123b03a366Sstefano_zampini ierr = PetscFree(temp_indices);CHKERRQ(ierr); 2513534831adSStefano Zampini ierr = PetscFree(change_basis);CHKERRQ(ierr); 25143b03a366Sstefano_zampini ierr = PetscFree(temp_indices_to_constraint);CHKERRQ(ierr); 2515534831adSStefano Zampini ierr = PetscFree(temp_indices_to_constraint_B);CHKERRQ(ierr); 2516534831adSStefano Zampini ierr = PetscFree(local_to_B);CHKERRQ(ierr); 25173b03a366Sstefano_zampini ierr = 
PetscFree(temp_quadrature_constraint);CHKERRQ(ierr); 25183425bc38SStefano Zampini #if defined(PETSC_MISSING_LAPACK_GESVD) 25193425bc38SStefano Zampini ierr = PetscFree(iwork);CHKERRQ(ierr); 25203425bc38SStefano Zampini ierr = PetscFree(ifail);CHKERRQ(ierr); 25213425bc38SStefano Zampini ierr = PetscFree(singular_vectors);CHKERRQ(ierr); 25223425bc38SStefano Zampini #endif 2523da1bb401SStefano Zampini for(k=0;k<nnsp_size;k++) { 2524da1bb401SStefano Zampini ierr = VecDestroy(&localnearnullsp[k]);CHKERRQ(ierr); 2525da1bb401SStefano Zampini } 25263b03a366Sstefano_zampini ierr = PetscFree(localnearnullsp);CHKERRQ(ierr); 25273b03a366Sstefano_zampini PetscFunctionReturn(0); 25283b03a366Sstefano_zampini } 25293b03a366Sstefano_zampini /* -------------------------------------------------------------------------- */ 25300c7d97c5SJed Brown #undef __FUNCT__ 25310c7d97c5SJed Brown #define __FUNCT__ "PCBDDCCoarseSetUp" 253253cdbc3dSStefano Zampini static PetscErrorCode PCBDDCCoarseSetUp(PC pc) 25330c7d97c5SJed Brown { 25340c7d97c5SJed Brown PetscErrorCode ierr; 25350c7d97c5SJed Brown 25360c7d97c5SJed Brown PC_IS* pcis = (PC_IS*)(pc->data); 25370c7d97c5SJed Brown PC_BDDC* pcbddc = (PC_BDDC*)pc->data; 25380c7d97c5SJed Brown Mat_IS *matis = (Mat_IS*)pc->pmat->data; 2539534831adSStefano Zampini Mat change_mat_all; 25400c7d97c5SJed Brown IS is_R_local; 25410c7d97c5SJed Brown IS is_V_local; 25420c7d97c5SJed Brown IS is_C_local; 25430c7d97c5SJed Brown IS is_aux1; 25440c7d97c5SJed Brown IS is_aux2; 25450c7d97c5SJed Brown const VecType impVecType; 25460c7d97c5SJed Brown const MatType impMatType; 25470c7d97c5SJed Brown PetscInt n_R=0; 25480c7d97c5SJed Brown PetscInt n_D=0; 25490c7d97c5SJed Brown PetscInt n_B=0; 25500c7d97c5SJed Brown PetscScalar zero=0.0; 25510c7d97c5SJed Brown PetscScalar one=1.0; 25520c7d97c5SJed Brown PetscScalar m_one=-1.0; 25530c7d97c5SJed Brown PetscScalar* array; 25540c7d97c5SJed Brown PetscScalar *coarse_submat_vals; 25550c7d97c5SJed Brown PetscInt *idx_R_local; 
25560c7d97c5SJed Brown PetscInt *idx_V_B; 25570c7d97c5SJed Brown PetscScalar *coarsefunctions_errors; 25580c7d97c5SJed Brown PetscScalar *constraints_errors; 25590c7d97c5SJed Brown /* auxiliary indices */ 2560534831adSStefano Zampini PetscInt i,j,k; 2561e269702eSStefano Zampini /* for verbose output of bddc */ 2562e269702eSStefano Zampini PetscViewer viewer=pcbddc->dbg_viewer; 2563e269702eSStefano Zampini PetscBool dbg_flag=pcbddc->dbg_flag; 2564a0ba757dSStefano Zampini /* for counting coarse dofs */ 2565534831adSStefano Zampini PetscInt n_vertices,n_constraints; 25663b03a366Sstefano_zampini PetscInt size_of_constraint; 25673b03a366Sstefano_zampini PetscInt *row_cmat_indices; 25683b03a366Sstefano_zampini PetscScalar *row_cmat_values; 2569534831adSStefano Zampini PetscInt *vertices,*nnz,*is_indices,*temp_indices; 25700c7d97c5SJed Brown 25710c7d97c5SJed Brown PetscFunctionBegin; 25720c7d97c5SJed Brown /* Set Non-overlapping dimensions */ 25730c7d97c5SJed Brown n_B = pcis->n_B; n_D = pcis->n - n_B; 2574534831adSStefano Zampini /* Set types for local objects needed by BDDC precondtioner */ 2575534831adSStefano Zampini impMatType = MATSEQDENSE; 2576534831adSStefano Zampini impVecType = VECSEQ; 2577da1bb401SStefano Zampini /* get vertex indices from constraint matrix */ 2578534831adSStefano Zampini ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscInt),&vertices);CHKERRQ(ierr); 2579534831adSStefano Zampini n_vertices=0; 2580da1bb401SStefano Zampini for(i=0;i<pcbddc->local_primal_size;i++) { 2581da1bb401SStefano Zampini ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr); 2582da1bb401SStefano Zampini if(size_of_constraint == 1) { 2583534831adSStefano Zampini vertices[n_vertices]=row_cmat_indices[0]; 2584534831adSStefano Zampini n_vertices++; 2585a0ba757dSStefano Zampini } 2586da1bb401SStefano Zampini ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const 
PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr); 2587a0ba757dSStefano Zampini } 2588534831adSStefano Zampini /* Set number of constraints */ 2589534831adSStefano Zampini n_constraints = pcbddc->local_primal_size-n_vertices; 2590534831adSStefano Zampini 2591534831adSStefano Zampini /* vertices in boundary numbering */ 2592534831adSStefano Zampini if(n_vertices) { 2593534831adSStefano Zampini ierr = VecSet(pcis->vec1_N,m_one);CHKERRQ(ierr); 2594534831adSStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 2595534831adSStefano Zampini for (i=0; i<n_vertices; i++) { array[ vertices[i] ] = i; } 2596534831adSStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 2597534831adSStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 2598534831adSStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 2599534831adSStefano Zampini ierr = PetscMalloc(n_vertices*sizeof(PetscInt),&idx_V_B);CHKERRQ(ierr); 2600534831adSStefano Zampini ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr); 2601534831adSStefano Zampini for (i=0; i<n_vertices; i++) { 2602534831adSStefano Zampini j=0; 2603534831adSStefano Zampini while (array[j] != i ) {j++;} 2604534831adSStefano Zampini idx_V_B[i]=j; 2605534831adSStefano Zampini } 2606534831adSStefano Zampini ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr); 2607534831adSStefano Zampini } 2608534831adSStefano Zampini 2609534831adSStefano Zampini /* transform local matrices if needed */ 2610534831adSStefano Zampini if(pcbddc->usechangeofbasis) { 2611534831adSStefano Zampini ierr = PetscMalloc(pcis->n*sizeof(PetscInt),&nnz);CHKERRQ(ierr); 2612534831adSStefano Zampini ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 2613534831adSStefano Zampini for(i=0;i<n_D;i++) { 2614534831adSStefano Zampini nnz[is_indices[i]]=1; 
2615534831adSStefano Zampini } 2616534831adSStefano Zampini ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 2617534831adSStefano Zampini ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 2618534831adSStefano Zampini k=1; 2619534831adSStefano Zampini for(i=0;i<n_B;i++) { 2620534831adSStefano Zampini ierr = MatGetRow(pcbddc->ChangeOfBasisMatrix,i,&j,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr); 2621534831adSStefano Zampini nnz[is_indices[i]]=j; 2622534831adSStefano Zampini if( k < j) { 2623534831adSStefano Zampini k = j; 2624534831adSStefano Zampini } 2625534831adSStefano Zampini ierr = MatRestoreRow(pcbddc->ChangeOfBasisMatrix,i,&j,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr); 2626534831adSStefano Zampini } 2627534831adSStefano Zampini ierr = ISRestoreIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 2628534831adSStefano Zampini /* assemble change of basis matrix on the whole set of local dofs */ 2629534831adSStefano Zampini ierr = PetscMalloc(k*sizeof(PetscInt),&temp_indices);CHKERRQ(ierr); 2630534831adSStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&change_mat_all);CHKERRQ(ierr); 2631534831adSStefano Zampini ierr = MatSetSizes(change_mat_all,pcis->n,pcis->n,pcis->n,pcis->n);CHKERRQ(ierr); 2632534831adSStefano Zampini ierr = MatSetType(change_mat_all,MATSEQAIJ);CHKERRQ(ierr); 2633534831adSStefano Zampini ierr = MatSeqAIJSetPreallocation(change_mat_all,0,nnz);CHKERRQ(ierr); 2634534831adSStefano Zampini ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 2635534831adSStefano Zampini for(i=0;i<n_D;i++) { 2636534831adSStefano Zampini ierr = MatSetValue(change_mat_all,is_indices[i],is_indices[i],1.0,INSERT_VALUES);CHKERRQ(ierr); 2637534831adSStefano Zampini } 2638534831adSStefano Zampini ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 2639534831adSStefano Zampini ierr = ISGetIndices(pcis->is_B_local,(const 
PetscInt**)&is_indices);CHKERRQ(ierr); 2640534831adSStefano Zampini for(i=0;i<n_B;i++) { 2641534831adSStefano Zampini ierr = MatGetRow(pcbddc->ChangeOfBasisMatrix,i,&j,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr); 2642534831adSStefano Zampini for(k=0;k<j;k++) { 2643534831adSStefano Zampini temp_indices[k]=is_indices[row_cmat_indices[k]]; 2644534831adSStefano Zampini } 2645534831adSStefano Zampini ierr = MatSetValues(change_mat_all,1,&is_indices[i],j,temp_indices,row_cmat_values,INSERT_VALUES);CHKERRQ(ierr); 2646534831adSStefano Zampini ierr = MatRestoreRow(pcbddc->ChangeOfBasisMatrix,i,&j,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr); 2647534831adSStefano Zampini } 2648534831adSStefano Zampini ierr = MatAssemblyBegin(change_mat_all,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2649534831adSStefano Zampini ierr = MatAssemblyEnd(change_mat_all,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2650534831adSStefano Zampini ierr = MatPtAP(matis->A,change_mat_all,MAT_INITIAL_MATRIX,1.0,&pcbddc->local_mat);CHKERRQ(ierr); 2651534831adSStefano Zampini ierr = MatDestroy(&pcis->A_IB);CHKERRQ(ierr); 2652534831adSStefano Zampini ierr = MatDestroy(&pcis->A_BI);CHKERRQ(ierr); 2653534831adSStefano Zampini ierr = MatDestroy(&pcis->A_BB);CHKERRQ(ierr); 2654534831adSStefano Zampini ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_I_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&pcis->A_IB);CHKERRQ(ierr); 2655534831adSStefano Zampini ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_B_local,pcis->is_I_local,MAT_INITIAL_MATRIX,&pcis->A_BI);CHKERRQ(ierr); 2656534831adSStefano Zampini ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_B_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&pcis->A_BB);CHKERRQ(ierr); 2657534831adSStefano Zampini ierr = MatDestroy(&change_mat_all);CHKERRQ(ierr); 2658534831adSStefano Zampini ierr = PetscFree(nnz);CHKERRQ(ierr); 2659534831adSStefano Zampini ierr = PetscFree(temp_indices);CHKERRQ(ierr); 
2660534831adSStefano Zampini } else { 2661534831adSStefano Zampini /* without change of basis, the local matrix is unchanged */ 2662534831adSStefano Zampini ierr = PetscObjectReference((PetscObject)matis->A);CHKERRQ(ierr); 2663534831adSStefano Zampini pcbddc->local_mat = matis->A; 2664534831adSStefano Zampini } 2665a0ba757dSStefano Zampini 26660c7d97c5SJed Brown /* Dohrmann's notation: dofs splitted in R (Remaining: all dofs but the vertices) and V (Vertices) */ 26670c7d97c5SJed Brown ierr = VecSet(pcis->vec1_N,one);CHKERRQ(ierr); 26680c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 26693b03a366Sstefano_zampini for (i=0;i<n_vertices;i++) { array[ vertices[i] ] = zero; } 26703b03a366Sstefano_zampini ierr = PetscMalloc(( pcis->n - n_vertices )*sizeof(PetscInt),&idx_R_local);CHKERRQ(ierr); 26710c7d97c5SJed Brown for (i=0, n_R=0; i<pcis->n; i++) { if (array[i] == one) { idx_R_local[n_R] = i; n_R++; } } 26720c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 2673e269702eSStefano Zampini if(dbg_flag) { 26740c7d97c5SJed Brown ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr); 26750c7d97c5SJed Brown ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 26760c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d local dimensions\n",PetscGlobalRank);CHKERRQ(ierr); 26770c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local_size = %d, dirichlet_size = %d, boundary_size = %d\n",pcis->n,n_D,n_B);CHKERRQ(ierr); 26783b03a366Sstefano_zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"r_size = %d, v_size = %d, constraints = %d, local_primal_size = %d\n",n_R,n_vertices,n_constraints,pcbddc->local_primal_size);CHKERRQ(ierr); 2679534831adSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"pcbddc->n_vertices = %d, pcbddc->n_constraints = %d\n",pcbddc->n_vertices,pcbddc->n_constraints);CHKERRQ(ierr); 26800c7d97c5SJed 
Brown ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 26810c7d97c5SJed Brown } 2682534831adSStefano Zampini 26830c7d97c5SJed Brown /* Allocate needed vectors */ 2684534831adSStefano Zampini ierr = VecDuplicate(pcis->vec1_global,&pcbddc->original_rhs);CHKERRQ(ierr); 26853972b0daSStefano Zampini ierr = VecDuplicate(pcis->vec1_global,&pcbddc->temp_solution);CHKERRQ(ierr); 26860c7d97c5SJed Brown ierr = VecDuplicate(pcis->vec1_D,&pcbddc->vec4_D);CHKERRQ(ierr); 26870c7d97c5SJed Brown ierr = VecCreate(PETSC_COMM_SELF,&pcbddc->vec1_R);CHKERRQ(ierr); 26880c7d97c5SJed Brown ierr = VecSetSizes(pcbddc->vec1_R,n_R,n_R);CHKERRQ(ierr); 26890c7d97c5SJed Brown ierr = VecSetType(pcbddc->vec1_R,impVecType);CHKERRQ(ierr); 2690d49ef151SStefano Zampini ierr = VecDuplicate(pcbddc->vec1_R,&pcbddc->vec2_R);CHKERRQ(ierr); 26910c7d97c5SJed Brown ierr = VecCreate(PETSC_COMM_SELF,&pcbddc->vec1_P);CHKERRQ(ierr); 26920c7d97c5SJed Brown ierr = VecSetSizes(pcbddc->vec1_P,pcbddc->local_primal_size,pcbddc->local_primal_size);CHKERRQ(ierr); 26930c7d97c5SJed Brown ierr = VecSetType(pcbddc->vec1_P,impVecType);CHKERRQ(ierr); 26940c7d97c5SJed Brown 26950c7d97c5SJed Brown /* Creating some index sets needed */ 26960c7d97c5SJed Brown /* For submatrices */ 2697da1bb401SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,n_R,idx_R_local,PETSC_OWN_POINTER,&is_R_local);CHKERRQ(ierr); 26983b03a366Sstefano_zampini if(n_vertices) { 2699da1bb401SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,n_vertices,vertices,PETSC_OWN_POINTER,&is_V_local);CHKERRQ(ierr); 27003b03a366Sstefano_zampini } 2701da1bb401SStefano Zampini if(n_constraints) { 2702da1bb401SStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,n_constraints,n_vertices,1,&is_C_local);CHKERRQ(ierr); 2703da1bb401SStefano Zampini } 2704da1bb401SStefano Zampini 27050c7d97c5SJed Brown /* For VecScatters pcbddc->R_to_B and (optionally) pcbddc->R_to_D */ 27060c7d97c5SJed Brown { 27070c7d97c5SJed Brown PetscInt *aux_array1; 27080c7d97c5SJed Brown PetscInt 
*aux_array2; 27090c7d97c5SJed Brown 27103b03a366Sstefano_zampini ierr = PetscMalloc( (pcis->n_B-n_vertices)*sizeof(PetscInt),&aux_array1);CHKERRQ(ierr); 27113b03a366Sstefano_zampini ierr = PetscMalloc( (pcis->n_B-n_vertices)*sizeof(PetscInt),&aux_array2);CHKERRQ(ierr); 27120c7d97c5SJed Brown 2713d49ef151SStefano Zampini ierr = VecSet(pcis->vec1_global,zero);CHKERRQ(ierr); 27140c7d97c5SJed Brown ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 27150c7d97c5SJed Brown ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 27160c7d97c5SJed Brown ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 27170c7d97c5SJed Brown ierr = VecScatterEnd (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 27180c7d97c5SJed Brown ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 27190c7d97c5SJed Brown ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 27200c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 2721da1bb401SStefano Zampini for (i=0, j=0; i<n_R; i++) { if (array[idx_R_local[i]] > one) { aux_array1[j] = i; j++; } } 27220c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 2723da1bb401SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_COPY_VALUES,&is_aux1);CHKERRQ(ierr); 27240c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr); 2725da1bb401SStefano Zampini for (i=0, j=0; i<n_B; i++) { if (array[i] > one) { aux_array2[j] = i; j++; } } 27263828260eSStefano Zampini ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr); 2727da1bb401SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array2,PETSC_COPY_VALUES,&is_aux2);CHKERRQ(ierr); 27280c7d97c5SJed Brown ierr = 
VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_B,is_aux2,&pcbddc->R_to_B);CHKERRQ(ierr); 27290c7d97c5SJed Brown ierr = PetscFree(aux_array1);CHKERRQ(ierr); 27300c7d97c5SJed Brown ierr = PetscFree(aux_array2);CHKERRQ(ierr); 27310c7d97c5SJed Brown ierr = ISDestroy(&is_aux1);CHKERRQ(ierr); 27320c7d97c5SJed Brown ierr = ISDestroy(&is_aux2);CHKERRQ(ierr); 27330c7d97c5SJed Brown 2734e269702eSStefano Zampini if(pcbddc->prec_type || dbg_flag ) { 27350c7d97c5SJed Brown ierr = PetscMalloc(n_D*sizeof(PetscInt),&aux_array1);CHKERRQ(ierr); 27360c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 2737da1bb401SStefano Zampini for (i=0, j=0; i<n_R; i++) { if (array[idx_R_local[i]] == one) { aux_array1[j] = i; j++; } } 27380c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 2739da1bb401SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_COPY_VALUES,&is_aux1);CHKERRQ(ierr); 27400c7d97c5SJed Brown ierr = VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_D,(IS)0,&pcbddc->R_to_D);CHKERRQ(ierr); 27410c7d97c5SJed Brown ierr = PetscFree(aux_array1);CHKERRQ(ierr); 27420c7d97c5SJed Brown ierr = ISDestroy(&is_aux1);CHKERRQ(ierr); 27430c7d97c5SJed Brown } 27440c7d97c5SJed Brown } 27450c7d97c5SJed Brown 27460c7d97c5SJed Brown /* Creating PC contexts for local Dirichlet and Neumann problems */ 27470c7d97c5SJed Brown { 27480c7d97c5SJed Brown Mat A_RR; 274953cdbc3dSStefano Zampini PC pc_temp; 27500c7d97c5SJed Brown /* Matrix for Dirichlet problem is A_II -> we already have it from pcis.c code */ 275153cdbc3dSStefano Zampini ierr = KSPCreate(PETSC_COMM_SELF,&pcbddc->ksp_D);CHKERRQ(ierr); 275253cdbc3dSStefano Zampini ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->ksp_D,(PetscObject)pc,1);CHKERRQ(ierr); 275353cdbc3dSStefano Zampini ierr = KSPSetOperators(pcbddc->ksp_D,pcis->A_II,pcis->A_II,SAME_PRECONDITIONER);CHKERRQ(ierr); 275453cdbc3dSStefano Zampini ierr = KSPSetType(pcbddc->ksp_D,KSPPREONLY);CHKERRQ(ierr); 
2755da1bb401SStefano Zampini ierr = KSPSetOptionsPrefix(pcbddc->ksp_D,"dirichlet_");CHKERRQ(ierr); 27560c7d97c5SJed Brown /* default */ 275753cdbc3dSStefano Zampini ierr = KSPGetPC(pcbddc->ksp_D,&pc_temp);CHKERRQ(ierr); 275853cdbc3dSStefano Zampini ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr); 27590c7d97c5SJed Brown /* Allow user's customization */ 276053cdbc3dSStefano Zampini ierr = KSPSetFromOptions(pcbddc->ksp_D);CHKERRQ(ierr); 276153cdbc3dSStefano Zampini /* Set Up KSP for Dirichlet problem of BDDC */ 276253cdbc3dSStefano Zampini ierr = KSPSetUp(pcbddc->ksp_D);CHKERRQ(ierr); 27633972b0daSStefano Zampini /* set ksp_D into pcis data */ 27643972b0daSStefano Zampini ierr = KSPDestroy(&pcis->ksp_D);CHKERRQ(ierr); 27653972b0daSStefano Zampini ierr = PetscObjectReference((PetscObject)pcbddc->ksp_D);CHKERRQ(ierr); 27663972b0daSStefano Zampini pcis->ksp_D = pcbddc->ksp_D; 2767da1bb401SStefano Zampini if(pcbddc->dbg_flag) ierr = KSPView(pcbddc->ksp_D,PETSC_VIEWER_STDOUT_SELF); 27680c7d97c5SJed Brown /* Matrix for Neumann problem is A_RR -> we need to create it */ 2769534831adSStefano Zampini ierr = MatGetSubMatrix(pcbddc->local_mat,is_R_local,is_R_local,MAT_INITIAL_MATRIX,&A_RR);CHKERRQ(ierr); 277053cdbc3dSStefano Zampini ierr = KSPCreate(PETSC_COMM_SELF,&pcbddc->ksp_R);CHKERRQ(ierr); 277153cdbc3dSStefano Zampini ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->ksp_R,(PetscObject)pc,1);CHKERRQ(ierr); 277253cdbc3dSStefano Zampini ierr = KSPSetOperators(pcbddc->ksp_R,A_RR,A_RR,SAME_PRECONDITIONER);CHKERRQ(ierr); 277353cdbc3dSStefano Zampini ierr = KSPSetType(pcbddc->ksp_R,KSPPREONLY);CHKERRQ(ierr); 2774da1bb401SStefano Zampini ierr = KSPSetOptionsPrefix(pcbddc->ksp_R,"neumann_");CHKERRQ(ierr); 27750c7d97c5SJed Brown /* default */ 277653cdbc3dSStefano Zampini ierr = KSPGetPC(pcbddc->ksp_R,&pc_temp);CHKERRQ(ierr); 277753cdbc3dSStefano Zampini ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr); 27780c7d97c5SJed Brown /* Allow user's customization */ 277953cdbc3dSStefano 
Zampini ierr = KSPSetFromOptions(pcbddc->ksp_R);CHKERRQ(ierr); 278053cdbc3dSStefano Zampini /* Set Up KSP for Neumann problem of BDDC */ 278153cdbc3dSStefano Zampini ierr = KSPSetUp(pcbddc->ksp_R);CHKERRQ(ierr); 2782da1bb401SStefano Zampini if(pcbddc->dbg_flag) ierr = KSPView(pcbddc->ksp_R,PETSC_VIEWER_STDOUT_SELF); 2783a0ba757dSStefano Zampini /* check Dirichlet and Neumann solvers */ 2784ba1573a8SStefano Zampini if(dbg_flag) { 27850c7d97c5SJed Brown Vec temp_vec; 27860c7d97c5SJed Brown PetscScalar value; 27870c7d97c5SJed Brown 2788a0ba757dSStefano Zampini ierr = VecDuplicate(pcis->vec1_D,&temp_vec);CHKERRQ(ierr); 2789a0ba757dSStefano Zampini ierr = VecSetRandom(pcis->vec1_D,PETSC_NULL);CHKERRQ(ierr); 2790a0ba757dSStefano Zampini ierr = MatMult(pcis->A_II,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr); 2791a0ba757dSStefano Zampini ierr = KSPSolve(pcbddc->ksp_D,pcis->vec2_D,temp_vec);CHKERRQ(ierr); 2792a0ba757dSStefano Zampini ierr = VecAXPY(temp_vec,m_one,pcis->vec1_D);CHKERRQ(ierr); 2793a0ba757dSStefano Zampini ierr = VecNorm(temp_vec,NORM_INFINITY,&value);CHKERRQ(ierr); 2794a0ba757dSStefano Zampini ierr = VecDestroy(&temp_vec);CHKERRQ(ierr); 2795a0ba757dSStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 2796a0ba757dSStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr); 2797a0ba757dSStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Checking solution of Dirichlet and Neumann problems\n");CHKERRQ(ierr); 2798a0ba757dSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d infinity error for Dirichlet solve = % 1.14e \n",PetscGlobalRank,value);CHKERRQ(ierr); 2799d49ef151SStefano Zampini ierr = VecDuplicate(pcbddc->vec1_R,&temp_vec);CHKERRQ(ierr); 2800d49ef151SStefano Zampini ierr = VecSetRandom(pcbddc->vec1_R,PETSC_NULL);CHKERRQ(ierr); 2801d49ef151SStefano Zampini ierr = MatMult(A_RR,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr); 2802d49ef151SStefano Zampini ierr 
= KSPSolve(pcbddc->ksp_R,pcbddc->vec2_R,temp_vec);CHKERRQ(ierr); 2803d49ef151SStefano Zampini ierr = VecAXPY(temp_vec,m_one,pcbddc->vec1_R);CHKERRQ(ierr); 2804d49ef151SStefano Zampini ierr = VecNorm(temp_vec,NORM_INFINITY,&value);CHKERRQ(ierr); 2805e269702eSStefano Zampini ierr = VecDestroy(&temp_vec);CHKERRQ(ierr); 28060c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d infinity error for Neumann solve = % 1.14e \n",PetscGlobalRank,value);CHKERRQ(ierr); 2807d49ef151SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 28080c7d97c5SJed Brown } 28090c7d97c5SJed Brown /* free Neumann problem's matrix */ 28100c7d97c5SJed Brown ierr = MatDestroy(&A_RR);CHKERRQ(ierr); 28110c7d97c5SJed Brown } 28120c7d97c5SJed Brown 28130c7d97c5SJed Brown /* Assemble all remaining stuff needed to apply BDDC */ 28140c7d97c5SJed Brown { 28150c7d97c5SJed Brown Mat A_RV,A_VR,A_VV; 28160c7d97c5SJed Brown Mat M1,M2; 28170c7d97c5SJed Brown Mat C_CR; 28183b03a366Sstefano_zampini Mat AUXMAT; 28190c7d97c5SJed Brown Vec vec1_C; 28200c7d97c5SJed Brown Vec vec2_C; 28210c7d97c5SJed Brown Vec vec1_V; 28220c7d97c5SJed Brown Vec vec2_V; 28230c7d97c5SJed Brown PetscInt *nnz; 28240c7d97c5SJed Brown PetscInt *auxindices; 282553cdbc3dSStefano Zampini PetscInt index; 28260c7d97c5SJed Brown PetscScalar* array2; 28270c7d97c5SJed Brown MatFactorInfo matinfo; 28280c7d97c5SJed Brown 28290c7d97c5SJed Brown /* Allocating some extra storage just to be safe */ 28300c7d97c5SJed Brown ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&nnz);CHKERRQ(ierr); 28310c7d97c5SJed Brown ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&auxindices);CHKERRQ(ierr); 28320c7d97c5SJed Brown for(i=0;i<pcis->n;i++) {auxindices[i]=i;} 28330c7d97c5SJed Brown 28340c7d97c5SJed Brown /* some work vectors on vertices and/or constraints */ 28353b03a366Sstefano_zampini if(n_vertices) { 28360c7d97c5SJed Brown ierr = VecCreate(PETSC_COMM_SELF,&vec1_V);CHKERRQ(ierr); 28373b03a366Sstefano_zampini ierr = 
VecSetSizes(vec1_V,n_vertices,n_vertices);CHKERRQ(ierr); 28380c7d97c5SJed Brown ierr = VecSetType(vec1_V,impVecType);CHKERRQ(ierr); 28390c7d97c5SJed Brown ierr = VecDuplicate(vec1_V,&vec2_V);CHKERRQ(ierr); 28400c7d97c5SJed Brown } 2841534831adSStefano Zampini if(n_constraints) { 28420c7d97c5SJed Brown ierr = VecCreate(PETSC_COMM_SELF,&vec1_C);CHKERRQ(ierr); 2843534831adSStefano Zampini ierr = VecSetSizes(vec1_C,n_constraints,n_constraints);CHKERRQ(ierr); 28440c7d97c5SJed Brown ierr = VecSetType(vec1_C,impVecType);CHKERRQ(ierr); 28450c7d97c5SJed Brown ierr = VecDuplicate(vec1_C,&vec2_C);CHKERRQ(ierr); 28460c7d97c5SJed Brown ierr = VecDuplicate(vec1_C,&pcbddc->vec1_C);CHKERRQ(ierr); 28470c7d97c5SJed Brown } 28480c7d97c5SJed Brown /* Precompute stuffs needed for preprocessing and application of BDDC*/ 28493b03a366Sstefano_zampini if(n_constraints) { 28500c7d97c5SJed Brown ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->local_auxmat2);CHKERRQ(ierr); 28513b03a366Sstefano_zampini ierr = MatSetSizes(pcbddc->local_auxmat2,n_R,n_constraints,n_R,n_constraints);CHKERRQ(ierr); 28520c7d97c5SJed Brown ierr = MatSetType(pcbddc->local_auxmat2,impMatType);CHKERRQ(ierr); 28533b03a366Sstefano_zampini ierr = MatSeqDenseSetPreallocation(pcbddc->local_auxmat2,PETSC_NULL);CHKERRQ(ierr); 28540c7d97c5SJed Brown 285557a90decSStefano Zampini /* Create Constraint matrix on R nodes: C_{CR} */ 285657a90decSStefano Zampini ierr = MatGetSubMatrix(pcbddc->ConstraintMatrix,is_C_local,is_R_local,MAT_INITIAL_MATRIX,&C_CR);CHKERRQ(ierr); 285757a90decSStefano Zampini ierr = ISDestroy(&is_C_local);CHKERRQ(ierr); 285857a90decSStefano Zampini 28590c7d97c5SJed Brown /* Assemble local_auxmat2 = - A_{RR}^{-1} C^T_{CR} needed by BDDC application */ 28603b03a366Sstefano_zampini for(i=0;i<n_constraints;i++) { 28613b03a366Sstefano_zampini ierr = VecSet(pcbddc->vec1_R,zero);CHKERRQ(ierr); 28623b03a366Sstefano_zampini /* Get row of constraint matrix in R numbering */ 286357a90decSStefano Zampini ierr = 
VecGetArray(pcbddc->vec1_R,&array);CHKERRQ(ierr); 286457a90decSStefano Zampini ierr = MatGetRow(C_CR,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr); 28653b03a366Sstefano_zampini for(j=0;j<size_of_constraint;j++) { array[ row_cmat_indices[j] ] = - row_cmat_values[j]; } 286657a90decSStefano Zampini ierr = MatRestoreRow(C_CR,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr); 286757a90decSStefano Zampini ierr = VecRestoreArray(pcbddc->vec1_R,&array);CHKERRQ(ierr); 28683b03a366Sstefano_zampini /* Solve for row of constraint matrix in R numbering */ 286953cdbc3dSStefano Zampini ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr); 28703b03a366Sstefano_zampini /* Set values */ 28710c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec2_R,&array);CHKERRQ(ierr); 28723b03a366Sstefano_zampini ierr = MatSetValues(pcbddc->local_auxmat2,n_R,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr); 28730c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec2_R,&array);CHKERRQ(ierr); 28740c7d97c5SJed Brown } 28750c7d97c5SJed Brown ierr = MatAssemblyBegin(pcbddc->local_auxmat2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 28760c7d97c5SJed Brown ierr = MatAssemblyEnd(pcbddc->local_auxmat2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 28770c7d97c5SJed Brown 28780c7d97c5SJed Brown /* Assemble AUXMAT = ( LUFactor )( -C_{CR} A_{RR}^{-1} C^T_{CR} )^{-1} */ 28790c7d97c5SJed Brown ierr = MatMatMult(C_CR,pcbddc->local_auxmat2,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&AUXMAT);CHKERRQ(ierr); 2880d49ef151SStefano Zampini ierr = MatFactorInfoInitialize(&matinfo);CHKERRQ(ierr); 28813b03a366Sstefano_zampini ierr = ISCreateStride(PETSC_COMM_SELF,n_constraints,0,1,&is_aux1);CHKERRQ(ierr); 28820c7d97c5SJed Brown ierr = MatLUFactor(AUXMAT,is_aux1,is_aux1,&matinfo);CHKERRQ(ierr); 28830c7d97c5SJed Brown ierr = ISDestroy(&is_aux1);CHKERRQ(ierr); 28840c7d97c5SJed Brown 28853b03a366Sstefano_zampini /* 
Assemble explicitly M1 = ( C_{CR} A_{RR}^{-1} C^T_{CR} )^{-1} needed in preproc */ 2886d49ef151SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&M1);CHKERRQ(ierr); 28873b03a366Sstefano_zampini ierr = MatSetSizes(M1,n_constraints,n_constraints,n_constraints,n_constraints);CHKERRQ(ierr); 28880c7d97c5SJed Brown ierr = MatSetType(M1,impMatType);CHKERRQ(ierr); 28893b03a366Sstefano_zampini ierr = MatSeqDenseSetPreallocation(M1,PETSC_NULL);CHKERRQ(ierr); 28903b03a366Sstefano_zampini for(i=0;i<n_constraints;i++) { 28910c7d97c5SJed Brown ierr = VecSet(vec1_C,zero);CHKERRQ(ierr); 28920c7d97c5SJed Brown ierr = VecSetValue(vec1_C,i,one,INSERT_VALUES);CHKERRQ(ierr); 28930c7d97c5SJed Brown ierr = VecAssemblyBegin(vec1_C);CHKERRQ(ierr); 28940c7d97c5SJed Brown ierr = VecAssemblyEnd(vec1_C);CHKERRQ(ierr); 28950c7d97c5SJed Brown ierr = MatSolve(AUXMAT,vec1_C,vec2_C);CHKERRQ(ierr); 28960c7d97c5SJed Brown ierr = VecScale(vec2_C,m_one);CHKERRQ(ierr); 28970c7d97c5SJed Brown ierr = VecGetArray(vec2_C,&array);CHKERRQ(ierr); 28983b03a366Sstefano_zampini ierr = MatSetValues(M1,n_constraints,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr); 28990c7d97c5SJed Brown ierr = VecRestoreArray(vec2_C,&array);CHKERRQ(ierr); 29000c7d97c5SJed Brown } 29010c7d97c5SJed Brown ierr = MatAssemblyBegin(M1,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 29020c7d97c5SJed Brown ierr = MatAssemblyEnd(M1,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 29030c7d97c5SJed Brown ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr); 29040c7d97c5SJed Brown /* Assemble local_auxmat1 = M1*C_{CR} needed by BDDC application in KSP and in preproc */ 29050c7d97c5SJed Brown ierr = MatMatMult(M1,C_CR,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&pcbddc->local_auxmat1);CHKERRQ(ierr); 29060c7d97c5SJed Brown 29070c7d97c5SJed Brown } 29080c7d97c5SJed Brown 29090c7d97c5SJed Brown /* Get submatrices from subdomain matrix */ 29103b03a366Sstefano_zampini if(n_vertices){ 2911534831adSStefano Zampini ierr = 
MatGetSubMatrix(pcbddc->local_mat,is_R_local,is_V_local,MAT_INITIAL_MATRIX,&A_RV);CHKERRQ(ierr); 2912534831adSStefano Zampini ierr = MatGetSubMatrix(pcbddc->local_mat,is_V_local,is_R_local,MAT_INITIAL_MATRIX,&A_VR);CHKERRQ(ierr); 2913534831adSStefano Zampini ierr = MatGetSubMatrix(pcbddc->local_mat,is_V_local,is_V_local,MAT_INITIAL_MATRIX,&A_VV);CHKERRQ(ierr); 29140c7d97c5SJed Brown /* Assemble M2 = A_RR^{-1}A_RV */ 2915d49ef151SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&M2);CHKERRQ(ierr); 29163b03a366Sstefano_zampini ierr = MatSetSizes(M2,n_R,n_vertices,n_R,n_vertices);CHKERRQ(ierr); 29170c7d97c5SJed Brown ierr = MatSetType(M2,impMatType);CHKERRQ(ierr); 29183b03a366Sstefano_zampini ierr = MatSeqDenseSetPreallocation(M2,PETSC_NULL);CHKERRQ(ierr); 29193b03a366Sstefano_zampini for(i=0;i<n_vertices;i++) { 29200c7d97c5SJed Brown ierr = VecSet(vec1_V,zero);CHKERRQ(ierr); 29210c7d97c5SJed Brown ierr = VecSetValue(vec1_V,i,one,INSERT_VALUES);CHKERRQ(ierr); 29220c7d97c5SJed Brown ierr = VecAssemblyBegin(vec1_V);CHKERRQ(ierr); 29230c7d97c5SJed Brown ierr = VecAssemblyEnd(vec1_V);CHKERRQ(ierr); 29240c7d97c5SJed Brown ierr = MatMult(A_RV,vec1_V,pcbddc->vec1_R);CHKERRQ(ierr); 292553cdbc3dSStefano Zampini ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr); 29260c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec2_R,&array);CHKERRQ(ierr); 29273b03a366Sstefano_zampini ierr = MatSetValues(M2,n_R,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr); 29280c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec2_R,&array);CHKERRQ(ierr); 29290c7d97c5SJed Brown } 29300c7d97c5SJed Brown ierr = MatAssemblyBegin(M2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 29310c7d97c5SJed Brown ierr = MatAssemblyEnd(M2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 29320c7d97c5SJed Brown } 29330c7d97c5SJed Brown 29340c7d97c5SJed Brown /* Matrix of coarse basis functions (local) */ 2935d49ef151SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->coarse_phi_B);CHKERRQ(ierr); 29360c7d97c5SJed 
Brown ierr = MatSetSizes(pcbddc->coarse_phi_B,n_B,pcbddc->local_primal_size,n_B,pcbddc->local_primal_size);CHKERRQ(ierr); 29370c7d97c5SJed Brown ierr = MatSetType(pcbddc->coarse_phi_B,impMatType);CHKERRQ(ierr); 29383b03a366Sstefano_zampini ierr = MatSeqDenseSetPreallocation(pcbddc->coarse_phi_B,PETSC_NULL);CHKERRQ(ierr); 2939e269702eSStefano Zampini if(pcbddc->prec_type || dbg_flag ) { 2940d49ef151SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->coarse_phi_D);CHKERRQ(ierr); 29410c7d97c5SJed Brown ierr = MatSetSizes(pcbddc->coarse_phi_D,n_D,pcbddc->local_primal_size,n_D,pcbddc->local_primal_size);CHKERRQ(ierr); 29420c7d97c5SJed Brown ierr = MatSetType(pcbddc->coarse_phi_D,impMatType);CHKERRQ(ierr); 29433b03a366Sstefano_zampini ierr = MatSeqDenseSetPreallocation(pcbddc->coarse_phi_D,PETSC_NULL);CHKERRQ(ierr); 29440c7d97c5SJed Brown } 29450c7d97c5SJed Brown 2946e269702eSStefano Zampini if(dbg_flag) { 29470c7d97c5SJed Brown ierr = PetscMalloc( pcbddc->local_primal_size*sizeof(PetscScalar),&coarsefunctions_errors);CHKERRQ(ierr); 29480c7d97c5SJed Brown ierr = PetscMalloc( pcbddc->local_primal_size*sizeof(PetscScalar),&constraints_errors);CHKERRQ(ierr); 29490c7d97c5SJed Brown } 29503b03a366Sstefano_zampini /* Subdomain contribution (Non-overlapping) to coarse matrix */ 29510c7d97c5SJed Brown ierr = PetscMalloc ((pcbddc->local_primal_size)*(pcbddc->local_primal_size)*sizeof(PetscScalar),&coarse_submat_vals);CHKERRQ(ierr); 29520c7d97c5SJed Brown 29530c7d97c5SJed Brown /* We are now ready to evaluate coarse basis functions and subdomain contribution to coarse problem */ 29543b03a366Sstefano_zampini for(i=0;i<n_vertices;i++){ 29550c7d97c5SJed Brown ierr = VecSet(vec1_V,zero);CHKERRQ(ierr); 29560c7d97c5SJed Brown ierr = VecSetValue(vec1_V,i,one,INSERT_VALUES);CHKERRQ(ierr); 29570c7d97c5SJed Brown ierr = VecAssemblyBegin(vec1_V);CHKERRQ(ierr); 29580c7d97c5SJed Brown ierr = VecAssemblyEnd(vec1_V);CHKERRQ(ierr); 29590c7d97c5SJed Brown /* solution of saddle point problem 
*/ 29600c7d97c5SJed Brown ierr = MatMult(M2,vec1_V,pcbddc->vec1_R);CHKERRQ(ierr); 29610c7d97c5SJed Brown ierr = VecScale(pcbddc->vec1_R,m_one);CHKERRQ(ierr); 29623b03a366Sstefano_zampini if(n_constraints) { 29630c7d97c5SJed Brown ierr = MatMult(pcbddc->local_auxmat1,pcbddc->vec1_R,vec1_C);CHKERRQ(ierr); 29640c7d97c5SJed Brown ierr = MatMultAdd(pcbddc->local_auxmat2,vec1_C,pcbddc->vec1_R,pcbddc->vec1_R);CHKERRQ(ierr); 29650c7d97c5SJed Brown ierr = VecScale(vec1_C,m_one);CHKERRQ(ierr); 29660c7d97c5SJed Brown } 29670c7d97c5SJed Brown ierr = MatMult(A_VR,pcbddc->vec1_R,vec2_V);CHKERRQ(ierr); 29680c7d97c5SJed Brown ierr = MatMultAdd(A_VV,vec1_V,vec2_V,vec2_V);CHKERRQ(ierr); 29690c7d97c5SJed Brown 29700c7d97c5SJed Brown /* Set values in coarse basis function and subdomain part of coarse_mat */ 29710c7d97c5SJed Brown /* coarse basis functions */ 29720c7d97c5SJed Brown ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr); 29730c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 29740c7d97c5SJed Brown ierr = VecScatterEnd (pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 29750c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr); 29763b03a366Sstefano_zampini ierr = MatSetValues(pcbddc->coarse_phi_B,n_B,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr); 29770c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr); 29780c7d97c5SJed Brown ierr = MatSetValue(pcbddc->coarse_phi_B,idx_V_B[i],i,one,INSERT_VALUES);CHKERRQ(ierr); 2979e269702eSStefano Zampini if( pcbddc->prec_type || dbg_flag ) { 29800c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 29810c7d97c5SJed Brown ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 29820c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_D,&array);CHKERRQ(ierr); 
29833b03a366Sstefano_zampini ierr = MatSetValues(pcbddc->coarse_phi_D,n_D,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr); 29840c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_D,&array);CHKERRQ(ierr); 29850c7d97c5SJed Brown } 29860c7d97c5SJed Brown /* subdomain contribution to coarse matrix */ 29870c7d97c5SJed Brown ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr); 2988da1bb401SStefano Zampini for(j=0;j<n_vertices;j++) { coarse_submat_vals[i*pcbddc->local_primal_size+j] = array[j]; } /* WARNING -> column major ordering */ 29890c7d97c5SJed Brown ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr); 29903b03a366Sstefano_zampini if(n_constraints) { 29910c7d97c5SJed Brown ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr); 2992da1bb401SStefano Zampini for(j=0;j<n_constraints;j++) { coarse_submat_vals[i*pcbddc->local_primal_size+j+n_vertices] = array[j]; } /* WARNING -> column major ordering */ 29930c7d97c5SJed Brown ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr); 29940c7d97c5SJed Brown } 29950c7d97c5SJed Brown 2996e269702eSStefano Zampini if( dbg_flag ) { 29970c7d97c5SJed Brown /* assemble subdomain vector on nodes */ 2998d49ef151SStefano Zampini ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr); 29990c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 30000c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr); 30010c7d97c5SJed Brown for(j=0;j<n_R;j++) { array[idx_R_local[j]] = array2[j]; } 30023b03a366Sstefano_zampini array[ vertices[i] ] = one; 30030c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr); 30040c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 30050c7d97c5SJed Brown /* assemble subdomain vector of lagrange multipliers (i.e. 
primal nodes) */ 3006d49ef151SStefano Zampini ierr = VecSet(pcbddc->vec1_P,zero);CHKERRQ(ierr); 30070c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr); 30080c7d97c5SJed Brown ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr); 30093b03a366Sstefano_zampini for(j=0;j<n_vertices;j++) { array2[j]=array[j]; } 30100c7d97c5SJed Brown ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr); 30113b03a366Sstefano_zampini if(n_constraints) { 30120c7d97c5SJed Brown ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr); 30133b03a366Sstefano_zampini for(j=0;j<n_constraints;j++) { array2[j+n_vertices]=array[j]; } 30140c7d97c5SJed Brown ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr); 30150c7d97c5SJed Brown } 30160c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr); 30170c7d97c5SJed Brown ierr = VecScale(pcbddc->vec1_P,m_one);CHKERRQ(ierr); 30180c7d97c5SJed Brown /* check saddle point solution */ 3019534831adSStefano Zampini ierr = MatMult(pcbddc->local_mat,pcis->vec1_N,pcis->vec2_N);CHKERRQ(ierr); 30203b03a366Sstefano_zampini ierr = MatMultTransposeAdd(pcbddc->ConstraintMatrix,pcbddc->vec1_P,pcis->vec2_N,pcis->vec2_N);CHKERRQ(ierr); 30213b03a366Sstefano_zampini ierr = VecNorm(pcis->vec2_N,NORM_INFINITY,&coarsefunctions_errors[i]);CHKERRQ(ierr); 30223b03a366Sstefano_zampini ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr); 30230c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 30243b03a366Sstefano_zampini array[i]=array[i]+m_one; /* shift by the identity matrix */ 30250c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 30263b03a366Sstefano_zampini ierr = VecNorm(pcbddc->vec1_P,NORM_INFINITY,&constraints_errors[i]);CHKERRQ(ierr); 30270c7d97c5SJed Brown } 30280c7d97c5SJed Brown } 30290c7d97c5SJed Brown 30303b03a366Sstefano_zampini for(i=0;i<n_constraints;i++){ 3031d49ef151SStefano Zampini ierr = VecSet(vec2_C,zero);CHKERRQ(ierr); 30320c7d97c5SJed Brown 
ierr = VecSetValue(vec2_C,i,m_one,INSERT_VALUES);CHKERRQ(ierr); 30330c7d97c5SJed Brown ierr = VecAssemblyBegin(vec2_C);CHKERRQ(ierr); 30340c7d97c5SJed Brown ierr = VecAssemblyEnd(vec2_C);CHKERRQ(ierr); 30350c7d97c5SJed Brown /* solution of saddle point problem */ 30360c7d97c5SJed Brown ierr = MatMult(M1,vec2_C,vec1_C);CHKERRQ(ierr); 30370c7d97c5SJed Brown ierr = MatMult(pcbddc->local_auxmat2,vec1_C,pcbddc->vec1_R);CHKERRQ(ierr); 30380c7d97c5SJed Brown ierr = VecScale(vec1_C,m_one);CHKERRQ(ierr); 30393b03a366Sstefano_zampini if(n_vertices) { ierr = MatMult(A_VR,pcbddc->vec1_R,vec2_V);CHKERRQ(ierr); } 30400c7d97c5SJed Brown /* Set values in coarse basis function and subdomain part of coarse_mat */ 30410c7d97c5SJed Brown /* coarse basis functions */ 30423b03a366Sstefano_zampini index=i+n_vertices; 30430c7d97c5SJed Brown ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr); 30440c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 30450c7d97c5SJed Brown ierr = VecScatterEnd (pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 30460c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr); 304753cdbc3dSStefano Zampini ierr = MatSetValues(pcbddc->coarse_phi_B,n_B,auxindices,1,&index,array,INSERT_VALUES);CHKERRQ(ierr); 30480c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr); 3049e269702eSStefano Zampini if( pcbddc->prec_type || dbg_flag ) { 30500c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 30510c7d97c5SJed Brown ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 30520c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_D,&array);CHKERRQ(ierr); 305353cdbc3dSStefano Zampini ierr = MatSetValues(pcbddc->coarse_phi_D,n_D,auxindices,1,&index,array,INSERT_VALUES);CHKERRQ(ierr); 30540c7d97c5SJed 
Brown ierr = VecRestoreArray(pcis->vec1_D,&array);CHKERRQ(ierr); 30550c7d97c5SJed Brown } 30560c7d97c5SJed Brown /* subdomain contribution to coarse matrix */ 30573b03a366Sstefano_zampini if(n_vertices) { 30580c7d97c5SJed Brown ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr); 3059da1bb401SStefano Zampini for(j=0;j<n_vertices;j++) {coarse_submat_vals[index*pcbddc->local_primal_size+j]=array[j];} /* WARNING -> column major ordering */ 30600c7d97c5SJed Brown ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr); 30610c7d97c5SJed Brown } 30620c7d97c5SJed Brown ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr); 3063da1bb401SStefano Zampini for(j=0;j<n_constraints;j++) {coarse_submat_vals[index*pcbddc->local_primal_size+j+n_vertices]=array[j];} /* WARNING -> column major ordering */ 30640c7d97c5SJed Brown ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr); 30650c7d97c5SJed Brown 3066e269702eSStefano Zampini if( dbg_flag ) { 30670c7d97c5SJed Brown /* assemble subdomain vector on nodes */ 306853cdbc3dSStefano Zampini ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr); 30690c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 30700c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr); 30710c7d97c5SJed Brown for(j=0;j<n_R;j++){ array[ idx_R_local[j] ] = array2[j]; } 30720c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr); 30730c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 30740c7d97c5SJed Brown /* assemble subdomain vector of lagrange multipliers */ 307553cdbc3dSStefano Zampini ierr = VecSet(pcbddc->vec1_P,zero);CHKERRQ(ierr); 30760c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr); 30773b03a366Sstefano_zampini if( n_vertices) { 30780c7d97c5SJed Brown ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr); 30793b03a366Sstefano_zampini for(j=0;j<n_vertices;j++) {array2[j]=-array[j];} 30800c7d97c5SJed Brown ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr); 
30810c7d97c5SJed Brown } 30820c7d97c5SJed Brown ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr); 30833b03a366Sstefano_zampini for(j=0;j<n_constraints;j++) {array2[j+n_vertices]=-array[j];} 30840c7d97c5SJed Brown ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr); 30850c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr); 30863972b0daSStefano Zampini /* check saddle point solution */ 3087534831adSStefano Zampini ierr = MatMult(pcbddc->local_mat,pcis->vec1_N,pcis->vec2_N);CHKERRQ(ierr); 30883b03a366Sstefano_zampini ierr = MatMultTransposeAdd(pcbddc->ConstraintMatrix,pcbddc->vec1_P,pcis->vec2_N,pcis->vec2_N);CHKERRQ(ierr); 308953cdbc3dSStefano Zampini ierr = VecNorm(pcis->vec2_N,NORM_INFINITY,&coarsefunctions_errors[index]);CHKERRQ(ierr); 30903b03a366Sstefano_zampini ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr); 30910c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 309253cdbc3dSStefano Zampini array[index]=array[index]+m_one; /* shift by the identity matrix */ 30930c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 309453cdbc3dSStefano Zampini ierr = VecNorm(pcbddc->vec1_P,NORM_INFINITY,&constraints_errors[index]);CHKERRQ(ierr); 30950c7d97c5SJed Brown } 30960c7d97c5SJed Brown } 30970c7d97c5SJed Brown ierr = MatAssemblyBegin(pcbddc->coarse_phi_B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 30980c7d97c5SJed Brown ierr = MatAssemblyEnd (pcbddc->coarse_phi_B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 3099e269702eSStefano Zampini if( pcbddc->prec_type || dbg_flag ) { 31000c7d97c5SJed Brown ierr = MatAssemblyBegin(pcbddc->coarse_phi_D,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 31010c7d97c5SJed Brown ierr = MatAssemblyEnd (pcbddc->coarse_phi_D,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 31020c7d97c5SJed Brown } 31030c7d97c5SJed Brown /* Checking coarse_sub_mat and coarse basis functios */ 31040c7d97c5SJed Brown /* It shuld be \Phi^{(j)^T} A^{(j)} \Phi^{(j)}=coarse_sub_mat */ 
31059d2fce94SStefano Zampini if(dbg_flag) { 31060c7d97c5SJed Brown 31070c7d97c5SJed Brown Mat coarse_sub_mat; 31080c7d97c5SJed Brown Mat TM1,TM2,TM3,TM4; 31090c7d97c5SJed Brown Mat coarse_phi_D,coarse_phi_B,A_II,A_BB,A_IB,A_BI; 3110a0ba757dSStefano Zampini const MatType checkmattype=MATSEQAIJ; 31110c7d97c5SJed Brown PetscScalar value; 31120c7d97c5SJed Brown 3113c042a7c3SStefano Zampini ierr = MatConvert(pcis->A_II,checkmattype,MAT_INITIAL_MATRIX,&A_II);CHKERRQ(ierr); 3114c042a7c3SStefano Zampini ierr = MatConvert(pcis->A_IB,checkmattype,MAT_INITIAL_MATRIX,&A_IB);CHKERRQ(ierr); 3115c042a7c3SStefano Zampini ierr = MatConvert(pcis->A_BI,checkmattype,MAT_INITIAL_MATRIX,&A_BI);CHKERRQ(ierr); 3116c042a7c3SStefano Zampini ierr = MatConvert(pcis->A_BB,checkmattype,MAT_INITIAL_MATRIX,&A_BB);CHKERRQ(ierr); 3117c042a7c3SStefano Zampini ierr = MatConvert(pcbddc->coarse_phi_D,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_D);CHKERRQ(ierr); 3118c042a7c3SStefano Zampini ierr = MatConvert(pcbddc->coarse_phi_B,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_B);CHKERRQ(ierr); 3119c042a7c3SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_size,coarse_submat_vals,&coarse_sub_mat);CHKERRQ(ierr); 3120c042a7c3SStefano Zampini ierr = MatConvert(coarse_sub_mat,checkmattype,MAT_REUSE_MATRIX,&coarse_sub_mat);CHKERRQ(ierr); 31210c7d97c5SJed Brown 3122da1bb401SStefano Zampini /*PetscViewer view_out; 3123da1bb401SStefano Zampini PetscMPIInt myrank; 3124da1bb401SStefano Zampini char filename[256]; 3125da1bb401SStefano Zampini MPI_Comm_rank(((PetscObject)pc)->comm,&myrank); 3126da1bb401SStefano Zampini sprintf(filename,"coarsesubmat_%04d.m",myrank); 3127da1bb401SStefano Zampini ierr = PetscViewerASCIIOpen(PETSC_COMM_SELF,filename,&view_out);CHKERRQ(ierr); 3128da1bb401SStefano Zampini ierr = PetscViewerSetFormat(view_out,PETSC_VIEWER_ASCII_MATLAB);CHKERRQ(ierr); 3129da1bb401SStefano Zampini ierr = MatView(coarse_sub_mat,view_out);CHKERRQ(ierr); 
3130da1bb401SStefano Zampini ierr = PetscViewerDestroy(&view_out);CHKERRQ(ierr);*/ 3131da1bb401SStefano Zampini 31320c7d97c5SJed Brown ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr); 31330c7d97c5SJed Brown ierr = PetscViewerASCIIPrintf(viewer,"Check coarse sub mat and local basis functions\n");CHKERRQ(ierr); 31340c7d97c5SJed Brown ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 313553cdbc3dSStefano Zampini ierr = MatPtAP(A_II,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&TM1);CHKERRQ(ierr); 313653cdbc3dSStefano Zampini ierr = MatPtAP(A_BB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&TM2);CHKERRQ(ierr); 313753cdbc3dSStefano Zampini ierr = MatMatMult(A_IB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr); 3138c042a7c3SStefano Zampini ierr = MatTransposeMatMult(coarse_phi_D,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM3);CHKERRQ(ierr); 313953cdbc3dSStefano Zampini ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr); 314053cdbc3dSStefano Zampini ierr = MatMatMult(A_BI,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr); 3141c042a7c3SStefano Zampini ierr = MatTransposeMatMult(coarse_phi_B,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM4);CHKERRQ(ierr); 314253cdbc3dSStefano Zampini ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr); 314353cdbc3dSStefano Zampini ierr = MatAXPY(TM1,one,TM2,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr); 314453cdbc3dSStefano Zampini ierr = MatAXPY(TM1,one,TM3,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr); 314553cdbc3dSStefano Zampini ierr = MatAXPY(TM1,one,TM4,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr); 314653cdbc3dSStefano Zampini ierr = MatAXPY(TM1,m_one,coarse_sub_mat,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr); 314753cdbc3dSStefano Zampini ierr = MatNorm(TM1,NORM_INFINITY,&value);CHKERRQ(ierr); 31480c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"----------------------------------\n");CHKERRQ(ierr); 31490c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d \n",PetscGlobalRank);CHKERRQ(ierr); 
31500c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"matrix error = % 1.14e\n",value);CHKERRQ(ierr); 31510c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"coarse functions errors\n");CHKERRQ(ierr); 315253cdbc3dSStefano Zampini for(i=0;i<pcbddc->local_primal_size;i++) { ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local %02d-th function error = % 1.14e\n",i,coarsefunctions_errors[i]);CHKERRQ(ierr); } 31530c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"constraints errors\n");CHKERRQ(ierr); 315453cdbc3dSStefano Zampini for(i=0;i<pcbddc->local_primal_size;i++) { ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local %02d-th function error = % 1.14e\n",i,constraints_errors[i]);CHKERRQ(ierr); } 31550c7d97c5SJed Brown ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 315653cdbc3dSStefano Zampini ierr = MatDestroy(&A_II);CHKERRQ(ierr); 315753cdbc3dSStefano Zampini ierr = MatDestroy(&A_BB);CHKERRQ(ierr); 315853cdbc3dSStefano Zampini ierr = MatDestroy(&A_IB);CHKERRQ(ierr); 315953cdbc3dSStefano Zampini ierr = MatDestroy(&A_BI);CHKERRQ(ierr); 316053cdbc3dSStefano Zampini ierr = MatDestroy(&TM1);CHKERRQ(ierr); 316153cdbc3dSStefano Zampini ierr = MatDestroy(&TM2);CHKERRQ(ierr); 316253cdbc3dSStefano Zampini ierr = MatDestroy(&TM3);CHKERRQ(ierr); 316353cdbc3dSStefano Zampini ierr = MatDestroy(&TM4);CHKERRQ(ierr); 316453cdbc3dSStefano Zampini ierr = MatDestroy(&coarse_phi_D);CHKERRQ(ierr); 316553cdbc3dSStefano Zampini ierr = MatDestroy(&coarse_sub_mat);CHKERRQ(ierr); 316653cdbc3dSStefano Zampini ierr = MatDestroy(&coarse_phi_B);CHKERRQ(ierr); 31670c7d97c5SJed Brown ierr = PetscFree(coarsefunctions_errors);CHKERRQ(ierr); 31680c7d97c5SJed Brown ierr = PetscFree(constraints_errors);CHKERRQ(ierr); 31690c7d97c5SJed Brown } 31700c7d97c5SJed Brown 31710c7d97c5SJed Brown /* create coarse matrix and data structures for message passing associated actual choice of coarse problem type */ 31720c7d97c5SJed Brown ierr = 
PCBDDCSetupCoarseEnvironment(pc,coarse_submat_vals);CHKERRQ(ierr); 31730c7d97c5SJed Brown /* free memory */ 31740c7d97c5SJed Brown ierr = PetscFree(coarse_submat_vals);CHKERRQ(ierr); 31750c7d97c5SJed Brown ierr = PetscFree(auxindices);CHKERRQ(ierr); 31760c7d97c5SJed Brown ierr = PetscFree(nnz);CHKERRQ(ierr); 31773b03a366Sstefano_zampini if(n_vertices) { 31780c7d97c5SJed Brown ierr = VecDestroy(&vec1_V);CHKERRQ(ierr); 31790c7d97c5SJed Brown ierr = VecDestroy(&vec2_V);CHKERRQ(ierr); 31800c7d97c5SJed Brown ierr = MatDestroy(&M2);CHKERRQ(ierr); 31810c7d97c5SJed Brown ierr = MatDestroy(&A_RV);CHKERRQ(ierr); 31820c7d97c5SJed Brown ierr = MatDestroy(&A_VR);CHKERRQ(ierr); 31830c7d97c5SJed Brown ierr = MatDestroy(&A_VV);CHKERRQ(ierr); 31840c7d97c5SJed Brown } 3185534831adSStefano Zampini if(n_constraints) { 31860c7d97c5SJed Brown ierr = VecDestroy(&vec1_C);CHKERRQ(ierr); 31870c7d97c5SJed Brown ierr = VecDestroy(&vec2_C);CHKERRQ(ierr); 31880c7d97c5SJed Brown ierr = MatDestroy(&M1);CHKERRQ(ierr); 31890c7d97c5SJed Brown ierr = MatDestroy(&C_CR);CHKERRQ(ierr); 31900c7d97c5SJed Brown } 31910c7d97c5SJed Brown } 31920c7d97c5SJed Brown /* free memory */ 31933b03a366Sstefano_zampini if(n_vertices) { 31940c7d97c5SJed Brown ierr = PetscFree(idx_V_B);CHKERRQ(ierr); 31950c7d97c5SJed Brown ierr = ISDestroy(&is_V_local);CHKERRQ(ierr); 31960c7d97c5SJed Brown } 31970c7d97c5SJed Brown ierr = ISDestroy(&is_R_local);CHKERRQ(ierr); 31980c7d97c5SJed Brown 31990c7d97c5SJed Brown PetscFunctionReturn(0); 32000c7d97c5SJed Brown } 32010c7d97c5SJed Brown 32020c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 32030c7d97c5SJed Brown 32040c7d97c5SJed Brown #undef __FUNCT__ 32050c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetupCoarseEnvironment" 320653cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetupCoarseEnvironment(PC pc,PetscScalar* coarse_submat_vals) 32070c7d97c5SJed Brown { 32080c7d97c5SJed Brown 32090c7d97c5SJed Brown 32100c7d97c5SJed Brown 
Mat_IS *matis = (Mat_IS*)pc->pmat->data; 32110c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 32120c7d97c5SJed Brown PC_IS *pcis = (PC_IS*)pc->data; 32130c7d97c5SJed Brown MPI_Comm prec_comm = ((PetscObject)pc)->comm; 32140c7d97c5SJed Brown MPI_Comm coarse_comm; 32150c7d97c5SJed Brown 32160c7d97c5SJed Brown /* common to all choiches */ 32170c7d97c5SJed Brown PetscScalar *temp_coarse_mat_vals; 32180c7d97c5SJed Brown PetscScalar *ins_coarse_mat_vals; 32190c7d97c5SJed Brown PetscInt *ins_local_primal_indices; 32200c7d97c5SJed Brown PetscMPIInt *localsizes2,*localdispl2; 32210c7d97c5SJed Brown PetscMPIInt size_prec_comm; 32220c7d97c5SJed Brown PetscMPIInt rank_prec_comm; 32230c7d97c5SJed Brown PetscMPIInt active_rank=MPI_PROC_NULL; 32240c7d97c5SJed Brown PetscMPIInt master_proc=0; 32250c7d97c5SJed Brown PetscInt ins_local_primal_size; 32260c7d97c5SJed Brown /* specific to MULTILEVEL_BDDC */ 32270c7d97c5SJed Brown PetscMPIInt *ranks_recv; 32280c7d97c5SJed Brown PetscMPIInt count_recv=0; 32290c7d97c5SJed Brown PetscMPIInt rank_coarse_proc_send_to; 32300c7d97c5SJed Brown PetscMPIInt coarse_color = MPI_UNDEFINED; 32310c7d97c5SJed Brown ISLocalToGlobalMapping coarse_ISLG; 32320c7d97c5SJed Brown /* some other variables */ 32330c7d97c5SJed Brown PetscErrorCode ierr; 32340c7d97c5SJed Brown const MatType coarse_mat_type; 32350c7d97c5SJed Brown const PCType coarse_pc_type; 323653cdbc3dSStefano Zampini const KSPType coarse_ksp_type; 323753cdbc3dSStefano Zampini PC pc_temp; 32380c7d97c5SJed Brown PetscInt i,j,k,bs; 32393b03a366Sstefano_zampini PetscInt max_it_coarse_ksp=1; /* don't increase this value */ 3240e269702eSStefano Zampini /* verbose output viewer */ 3241e269702eSStefano Zampini PetscViewer viewer=pcbddc->dbg_viewer; 3242e269702eSStefano Zampini PetscBool dbg_flag=pcbddc->dbg_flag; 32430c7d97c5SJed Brown 32440c7d97c5SJed Brown PetscFunctionBegin; 32450c7d97c5SJed Brown 32460c7d97c5SJed Brown ins_local_primal_indices = 0; 32470c7d97c5SJed Brown ins_coarse_mat_vals 
= 0; 32480c7d97c5SJed Brown localsizes2 = 0; 32490c7d97c5SJed Brown localdispl2 = 0; 32500c7d97c5SJed Brown temp_coarse_mat_vals = 0; 32510c7d97c5SJed Brown coarse_ISLG = 0; 32520c7d97c5SJed Brown 325353cdbc3dSStefano Zampini ierr = MPI_Comm_size(prec_comm,&size_prec_comm);CHKERRQ(ierr); 325453cdbc3dSStefano Zampini ierr = MPI_Comm_rank(prec_comm,&rank_prec_comm);CHKERRQ(ierr); 32550c7d97c5SJed Brown ierr = MatGetBlockSize(matis->A,&bs);CHKERRQ(ierr); 32560c7d97c5SJed Brown 3257beed3852SStefano Zampini /* Assign global numbering to coarse dofs */ 3258beed3852SStefano Zampini { 3259a0ba757dSStefano Zampini PetscScalar one=1.,zero=0.; 3260beed3852SStefano Zampini PetscScalar *array; 3261beed3852SStefano Zampini PetscMPIInt *auxlocal_primal; 3262beed3852SStefano Zampini PetscMPIInt *auxglobal_primal; 3263beed3852SStefano Zampini PetscMPIInt *all_auxglobal_primal; 3264beed3852SStefano Zampini PetscMPIInt *all_auxglobal_primal_dummy; 3265beed3852SStefano Zampini PetscMPIInt mpi_local_primal_size = (PetscMPIInt)pcbddc->local_primal_size; 3266da1bb401SStefano Zampini PetscInt *row_cmat_indices; 32673b03a366Sstefano_zampini PetscInt size_of_constraint; 3268da1bb401SStefano Zampini PetscScalar coarsesum; 3269beed3852SStefano Zampini 3270beed3852SStefano Zampini /* Construct needed data structures for message passing */ 3271beed3852SStefano Zampini ierr = PetscMalloc(mpi_local_primal_size*sizeof(PetscMPIInt),&pcbddc->local_primal_indices);CHKERRQ(ierr); 3272beed3852SStefano Zampini ierr = PetscMalloc(size_prec_comm*sizeof(PetscMPIInt),&pcbddc->local_primal_sizes);CHKERRQ(ierr); 3273beed3852SStefano Zampini ierr = PetscMalloc(size_prec_comm*sizeof(PetscMPIInt),&pcbddc->local_primal_displacements);CHKERRQ(ierr); 3274beed3852SStefano Zampini /* Gather local_primal_size information for all processes */ 32755619798eSStefano Zampini ierr = MPI_Allgather(&mpi_local_primal_size,1,MPIU_INT,&pcbddc->local_primal_sizes[0],1,MPIU_INT,prec_comm);CHKERRQ(ierr); 3276beed3852SStefano 
Zampini pcbddc->replicated_primal_size = 0; 3277beed3852SStefano Zampini for (i=0; i<size_prec_comm; i++) { 3278beed3852SStefano Zampini pcbddc->local_primal_displacements[i] = pcbddc->replicated_primal_size ; 3279beed3852SStefano Zampini pcbddc->replicated_primal_size += pcbddc->local_primal_sizes[i]; 3280beed3852SStefano Zampini } 32815619798eSStefano Zampini if(rank_prec_comm == 0) { 3282beed3852SStefano Zampini /* allocate some auxiliary space */ 3283beed3852SStefano Zampini ierr = PetscMalloc(pcbddc->replicated_primal_size*sizeof(*all_auxglobal_primal),&all_auxglobal_primal);CHKERRQ(ierr); 3284beed3852SStefano Zampini ierr = PetscMalloc(pcbddc->replicated_primal_size*sizeof(*all_auxglobal_primal_dummy),&all_auxglobal_primal_dummy);CHKERRQ(ierr); 3285beed3852SStefano Zampini } 3286beed3852SStefano Zampini ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscMPIInt),&auxlocal_primal);CHKERRQ(ierr); 3287beed3852SStefano Zampini ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscMPIInt),&auxglobal_primal);CHKERRQ(ierr); 3288beed3852SStefano Zampini 3289da1bb401SStefano Zampini /* First let's count coarse dofs. 
3290beed3852SStefano Zampini This code fragment assumes that the number of local constraints per connected component 3291beed3852SStefano Zampini is not greater than the number of nodes defined for the connected component 3292beed3852SStefano Zampini (otherwise we will surely have linear dependence between constraints and thus a singular coarse problem) */ 32933b03a366Sstefano_zampini /* auxlocal_primal : primal indices in local nodes numbering (internal and interface) with complete queue sorted by global ordering */ 3294beed3852SStefano Zampini ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr); 3295beed3852SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 3296da1bb401SStefano Zampini for(i=0;i<pcbddc->local_primal_size;i++) { 3297da1bb401SStefano Zampini ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr); 32983b03a366Sstefano_zampini for (j=0; j<size_of_constraint; j++) { 32993b03a366Sstefano_zampini k = row_cmat_indices[j]; 3300beed3852SStefano Zampini if( array[k] == zero ) { 3301beed3852SStefano Zampini array[k] = one; 3302da1bb401SStefano Zampini auxlocal_primal[i] = k; 3303beed3852SStefano Zampini break; 3304beed3852SStefano Zampini } 3305beed3852SStefano Zampini } 3306da1bb401SStefano Zampini ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr); 3307beed3852SStefano Zampini } 3308beed3852SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 3309da1bb401SStefano Zampini ierr = VecSet(pcis->vec1_global,zero);CHKERRQ(ierr); 3310da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 3311da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 3312da1bb401SStefano Zampini ierr = 
VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 3313da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 3314da1bb401SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 3315da1bb401SStefano Zampini for(i=0;i<pcis->n;i++) { if( array[i] > zero) array[i] = one/array[i]; } 3316da1bb401SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 3317da1bb401SStefano Zampini ierr = VecSet(pcis->vec1_global,zero);CHKERRQ(ierr); 3318da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 3319da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 3320da1bb401SStefano Zampini ierr = VecSum(pcis->vec1_global,&coarsesum);CHKERRQ(ierr); 3321da1bb401SStefano Zampini pcbddc->coarse_size = (PetscInt) coarsesum; 3322a0ba757dSStefano Zampini 3323beed3852SStefano Zampini /* Now assign them a global numbering */ 3324beed3852SStefano Zampini /* auxglobal_primal contains indices in global nodes numbering (internal and interface) */ 3325beed3852SStefano Zampini ierr = ISLocalToGlobalMappingApply(matis->mapping,pcbddc->local_primal_size,auxlocal_primal,auxglobal_primal);CHKERRQ(ierr); 3326beed3852SStefano Zampini /* all_auxglobal_primal contains all primal nodes indices in global nodes numbering (internal and interface) */ 3327beed3852SStefano Zampini ierr = MPI_Gatherv(&auxglobal_primal[0],pcbddc->local_primal_size,MPIU_INT,&all_auxglobal_primal[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,0,prec_comm);CHKERRQ(ierr); 3328beed3852SStefano Zampini 3329beed3852SStefano Zampini /* After this block all_auxglobal_primal should contains one copy of each primal node's indices in global nodes numbering */ 3330beed3852SStefano Zampini /* It 
implements a function similar to PetscSortRemoveDupsInt */ 3331beed3852SStefano Zampini if(rank_prec_comm==0) { 3332beed3852SStefano Zampini /* dummy argument since PetscSortMPIInt doesn't exist! */ 3333beed3852SStefano Zampini ierr = PetscSortMPIIntWithArray(pcbddc->replicated_primal_size,all_auxglobal_primal,all_auxglobal_primal_dummy);CHKERRQ(ierr); 3334beed3852SStefano Zampini k=1; 3335beed3852SStefano Zampini j=all_auxglobal_primal[0]; /* first dof in global numbering */ 3336beed3852SStefano Zampini for(i=1;i< pcbddc->replicated_primal_size ;i++) { 3337beed3852SStefano Zampini if(j != all_auxglobal_primal[i] ) { 3338beed3852SStefano Zampini all_auxglobal_primal[k]=all_auxglobal_primal[i]; 3339beed3852SStefano Zampini k++; 3340beed3852SStefano Zampini j=all_auxglobal_primal[i]; 3341beed3852SStefano Zampini } 3342beed3852SStefano Zampini } 3343beed3852SStefano Zampini } else { 3344beed3852SStefano Zampini ierr = PetscMalloc(pcbddc->coarse_size*sizeof(PetscMPIInt),&all_auxglobal_primal);CHKERRQ(ierr); 3345beed3852SStefano Zampini } 33465619798eSStefano Zampini /* We only need to broadcast the indices from 0 to pcbddc->coarse_size. Remaning elements of array all_aux_global_primal are garbage. 
*/ 3347beed3852SStefano Zampini ierr = MPI_Bcast(all_auxglobal_primal,pcbddc->coarse_size,MPIU_INT,0,prec_comm);CHKERRQ(ierr); 3348beed3852SStefano Zampini 3349beed3852SStefano Zampini /* Now get global coarse numbering of local primal nodes */ 3350beed3852SStefano Zampini for(i=0;i<pcbddc->local_primal_size;i++) { 3351beed3852SStefano Zampini k=0; 3352beed3852SStefano Zampini while( all_auxglobal_primal[k] != auxglobal_primal[i] ) { k++;} 3353beed3852SStefano Zampini pcbddc->local_primal_indices[i]=k; 3354beed3852SStefano Zampini } 3355e269702eSStefano Zampini if(dbg_flag) { 3356e269702eSStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr); 3357da1bb401SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Size of coarse problem %d\n",pcbddc->coarse_size);CHKERRQ(ierr); 3358e269702eSStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 3359e269702eSStefano Zampini } 3360beed3852SStefano Zampini /* free allocated memory */ 3361beed3852SStefano Zampini ierr = PetscFree(auxlocal_primal);CHKERRQ(ierr); 3362beed3852SStefano Zampini ierr = PetscFree(auxglobal_primal);CHKERRQ(ierr); 3363beed3852SStefano Zampini ierr = PetscFree(all_auxglobal_primal);CHKERRQ(ierr); 3364e269702eSStefano Zampini if(rank_prec_comm == 0) { 3365beed3852SStefano Zampini ierr = PetscFree(all_auxglobal_primal_dummy);CHKERRQ(ierr); 3366beed3852SStefano Zampini } 3367e269702eSStefano Zampini } 3368beed3852SStefano Zampini 33690c7d97c5SJed Brown /* adapt coarse problem type */ 33700c7d97c5SJed Brown if(pcbddc->coarse_problem_type == MULTILEVEL_BDDC && pcbddc->active_procs < MIN_PROCS_FOR_BDDC ) 33710c7d97c5SJed Brown pcbddc->coarse_problem_type = PARALLEL_BDDC; 33720c7d97c5SJed Brown 33730c7d97c5SJed Brown switch(pcbddc->coarse_problem_type){ 33740c7d97c5SJed Brown 3375da1bb401SStefano Zampini case(MULTILEVEL_BDDC): /* we define a coarse mesh where subdomains are elements */ 33760c7d97c5SJed Brown { 33770c7d97c5SJed Brown 
/* we need additional variables */ 33780c7d97c5SJed Brown MetisInt n_subdomains,n_parts,objval,ncon,faces_nvtxs; 33790c7d97c5SJed Brown MetisInt *metis_coarse_subdivision; 33800c7d97c5SJed Brown MetisInt options[METIS_NOPTIONS]; 33810c7d97c5SJed Brown PetscMPIInt size_coarse_comm,rank_coarse_comm; 33820c7d97c5SJed Brown PetscMPIInt procs_jumps_coarse_comm; 33830c7d97c5SJed Brown PetscMPIInt *coarse_subdivision; 33840c7d97c5SJed Brown PetscMPIInt *total_count_recv; 33850c7d97c5SJed Brown PetscMPIInt *total_ranks_recv; 33860c7d97c5SJed Brown PetscMPIInt *displacements_recv; 33870c7d97c5SJed Brown PetscMPIInt *my_faces_connectivity; 33880c7d97c5SJed Brown PetscMPIInt *petsc_faces_adjncy; 33890c7d97c5SJed Brown MetisInt *faces_adjncy; 33900c7d97c5SJed Brown MetisInt *faces_xadj; 33910c7d97c5SJed Brown PetscMPIInt *number_of_faces; 33920c7d97c5SJed Brown PetscMPIInt *faces_displacements; 33930c7d97c5SJed Brown PetscInt *array_int; 33940c7d97c5SJed Brown PetscMPIInt my_faces=0; 33950c7d97c5SJed Brown PetscMPIInt total_faces=0; 33963828260eSStefano Zampini PetscInt ranks_stretching_ratio; 33970c7d97c5SJed Brown 33980c7d97c5SJed Brown /* define some quantities */ 33990c7d97c5SJed Brown pcbddc->coarse_communications_type = SCATTERS_BDDC; 34000c7d97c5SJed Brown coarse_mat_type = MATIS; 34010c7d97c5SJed Brown coarse_pc_type = PCBDDC; 34026c9de887SHong Zhang coarse_ksp_type = KSPCHEBYSHEV; 34030c7d97c5SJed Brown 34040c7d97c5SJed Brown /* details of coarse decomposition */ 34050c7d97c5SJed Brown n_subdomains = pcbddc->active_procs; 34060c7d97c5SJed Brown n_parts = n_subdomains/pcbddc->coarsening_ratio; 34073828260eSStefano Zampini ranks_stretching_ratio = size_prec_comm/pcbddc->active_procs; 34083828260eSStefano Zampini procs_jumps_coarse_comm = pcbddc->coarsening_ratio*ranks_stretching_ratio; 34093828260eSStefano Zampini 3410da1bb401SStefano Zampini /*printf("Coarse algorithm details: \n"); 3411da1bb401SStefano Zampini printf("n_subdomains %d, n_parts %d\nstretch %d,jumps 
%d,coarse_ratio %d\nlevel should be log_%d(%d)\n",n_subdomains,n_parts,ranks_stretching_ratio,procs_jumps_coarse_comm,pcbddc->coarsening_ratio,pcbddc->coarsening_ratio,(ranks_stretching_ratio/pcbddc->coarsening_ratio+1));*/ 34120c7d97c5SJed Brown 34130c7d97c5SJed Brown /* build CSR graph of subdomains' connectivity through faces */ 34140c7d97c5SJed Brown ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&array_int);CHKERRQ(ierr); 34153828260eSStefano Zampini ierr = PetscMemzero(array_int,pcis->n*sizeof(PetscInt));CHKERRQ(ierr); 34160c7d97c5SJed Brown for(i=1;i<pcis->n_neigh;i++){/* i=1 so I don't count myself -> faces nodes counts to 1 */ 34170c7d97c5SJed Brown for(j=0;j<pcis->n_shared[i];j++){ 34180c7d97c5SJed Brown array_int[ pcis->shared[i][j] ]+=1; 34190c7d97c5SJed Brown } 34200c7d97c5SJed Brown } 34210c7d97c5SJed Brown for(i=1;i<pcis->n_neigh;i++){ 34220c7d97c5SJed Brown for(j=0;j<pcis->n_shared[i];j++){ 34230c7d97c5SJed Brown if(array_int[ pcis->shared[i][j] ] == 1 ){ 34240c7d97c5SJed Brown my_faces++; 34250c7d97c5SJed Brown break; 34260c7d97c5SJed Brown } 34270c7d97c5SJed Brown } 34280c7d97c5SJed Brown } 34290c7d97c5SJed Brown 343053cdbc3dSStefano Zampini ierr = MPI_Reduce(&my_faces,&total_faces,1,MPIU_INT,MPI_SUM,master_proc,prec_comm);CHKERRQ(ierr); 34310c7d97c5SJed Brown ierr = PetscMalloc (my_faces*sizeof(PetscInt),&my_faces_connectivity);CHKERRQ(ierr); 34320c7d97c5SJed Brown my_faces=0; 34330c7d97c5SJed Brown for(i=1;i<pcis->n_neigh;i++){ 34340c7d97c5SJed Brown for(j=0;j<pcis->n_shared[i];j++){ 34350c7d97c5SJed Brown if(array_int[ pcis->shared[i][j] ] == 1 ){ 34360c7d97c5SJed Brown my_faces_connectivity[my_faces]=pcis->neigh[i]; 34370c7d97c5SJed Brown my_faces++; 34380c7d97c5SJed Brown break; 34390c7d97c5SJed Brown } 34400c7d97c5SJed Brown } 34410c7d97c5SJed Brown } 34420c7d97c5SJed Brown if(rank_prec_comm == master_proc) { 34430c7d97c5SJed Brown ierr = PetscMalloc (total_faces*sizeof(PetscMPIInt),&petsc_faces_adjncy);CHKERRQ(ierr); 34440c7d97c5SJed Brown 
ierr = PetscMalloc (size_prec_comm*sizeof(PetscMPIInt),&number_of_faces);CHKERRQ(ierr); 34450c7d97c5SJed Brown ierr = PetscMalloc (total_faces*sizeof(MetisInt),&faces_adjncy);CHKERRQ(ierr); 34460c7d97c5SJed Brown ierr = PetscMalloc ((n_subdomains+1)*sizeof(MetisInt),&faces_xadj);CHKERRQ(ierr); 34470c7d97c5SJed Brown ierr = PetscMalloc ((size_prec_comm+1)*sizeof(PetscMPIInt),&faces_displacements);CHKERRQ(ierr); 34480c7d97c5SJed Brown } 344953cdbc3dSStefano Zampini ierr = MPI_Gather(&my_faces,1,MPIU_INT,&number_of_faces[0],1,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr); 34500c7d97c5SJed Brown if(rank_prec_comm == master_proc) { 34510c7d97c5SJed Brown faces_xadj[0]=0; 34520c7d97c5SJed Brown faces_displacements[0]=0; 34530c7d97c5SJed Brown j=0; 34540c7d97c5SJed Brown for(i=1;i<size_prec_comm+1;i++) { 34550c7d97c5SJed Brown faces_displacements[i]=faces_displacements[i-1]+number_of_faces[i-1]; 34560c7d97c5SJed Brown if(number_of_faces[i-1]) { 34570c7d97c5SJed Brown j++; 34580c7d97c5SJed Brown faces_xadj[j]=faces_xadj[j-1]+number_of_faces[i-1]; 34590c7d97c5SJed Brown } 34600c7d97c5SJed Brown } 3461da1bb401SStefano Zampini /*printf("The J I count is %d and should be %d\n",j,n_subdomains); 3462da1bb401SStefano Zampini printf("Total faces seem %d and should be %d\n",faces_xadj[j],total_faces);*/ 34630c7d97c5SJed Brown } 346453cdbc3dSStefano Zampini ierr = MPI_Gatherv(&my_faces_connectivity[0],my_faces,MPIU_INT,&petsc_faces_adjncy[0],number_of_faces,faces_displacements,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr); 34650c7d97c5SJed Brown ierr = PetscFree(my_faces_connectivity);CHKERRQ(ierr); 34660c7d97c5SJed Brown ierr = PetscFree(array_int);CHKERRQ(ierr); 34670c7d97c5SJed Brown if(rank_prec_comm == master_proc) { 34683828260eSStefano Zampini for(i=0;i<total_faces;i++) faces_adjncy[i]=(MetisInt)(petsc_faces_adjncy[i]/ranks_stretching_ratio); /* cast to MetisInt */ 3469da1bb401SStefano Zampini /*printf("This is the face connectivity (actual ranks)\n"); 34700c7d97c5SJed Brown 
for(i=0;i<n_subdomains;i++){ 34710c7d97c5SJed Brown printf("proc %d is connected with \n",i); 34720c7d97c5SJed Brown for(j=faces_xadj[i];j<faces_xadj[i+1];j++) 34730c7d97c5SJed Brown printf("%d ",faces_adjncy[j]); 34740c7d97c5SJed Brown printf("\n"); 3475da1bb401SStefano Zampini }*/ 34760c7d97c5SJed Brown ierr = PetscFree(faces_displacements);CHKERRQ(ierr); 34770c7d97c5SJed Brown ierr = PetscFree(number_of_faces);CHKERRQ(ierr); 34780c7d97c5SJed Brown ierr = PetscFree(petsc_faces_adjncy);CHKERRQ(ierr); 34790c7d97c5SJed Brown } 34800c7d97c5SJed Brown 34810c7d97c5SJed Brown if( rank_prec_comm == master_proc ) { 34820c7d97c5SJed Brown 34833828260eSStefano Zampini PetscInt heuristic_for_metis=3; 34843828260eSStefano Zampini 34850c7d97c5SJed Brown ncon=1; 34860c7d97c5SJed Brown faces_nvtxs=n_subdomains; 34870c7d97c5SJed Brown /* partition graoh induced by face connectivity */ 34880c7d97c5SJed Brown ierr = PetscMalloc (n_subdomains*sizeof(MetisInt),&metis_coarse_subdivision);CHKERRQ(ierr); 34890c7d97c5SJed Brown ierr = METIS_SetDefaultOptions(options); 34900c7d97c5SJed Brown /* we need a contiguous partition of the coarse mesh */ 34910c7d97c5SJed Brown options[METIS_OPTION_CONTIG]=1; 34920c7d97c5SJed Brown options[METIS_OPTION_DBGLVL]=1; 34930c7d97c5SJed Brown options[METIS_OPTION_NITER]=30; 34943828260eSStefano Zampini if(n_subdomains>n_parts*heuristic_for_metis) { 34953828260eSStefano Zampini options[METIS_OPTION_IPTYPE]=METIS_IPTYPE_EDGE; 34963828260eSStefano Zampini options[METIS_OPTION_OBJTYPE]=METIS_OBJTYPE_CUT; 34970c7d97c5SJed Brown ierr = METIS_PartGraphKway(&faces_nvtxs,&ncon,faces_xadj,faces_adjncy,NULL,NULL,NULL,&n_parts,NULL,NULL,options,&objval,metis_coarse_subdivision); 34983828260eSStefano Zampini } else { 34993828260eSStefano Zampini ierr = METIS_PartGraphRecursive(&faces_nvtxs,&ncon,faces_xadj,faces_adjncy,NULL,NULL,NULL,&n_parts,NULL,NULL,options,&objval,metis_coarse_subdivision); 35003828260eSStefano Zampini } 35010c7d97c5SJed Brown if(ierr != 
METIS_OK) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in METIS_PartGraphKway (metis error code %D) called from PCBDDCSetupCoarseEnvironment\n",ierr); 35020c7d97c5SJed Brown ierr = PetscFree(faces_xadj);CHKERRQ(ierr); 35030c7d97c5SJed Brown ierr = PetscFree(faces_adjncy);CHKERRQ(ierr); 35040c7d97c5SJed Brown coarse_subdivision = (PetscMPIInt*)calloc(size_prec_comm,sizeof(PetscMPIInt)); /* calloc for contiguous memory since we need to scatter these values later */ 35050c7d97c5SJed Brown /* copy/cast values avoiding possible type conflicts between PETSc, MPI and METIS */ 35063828260eSStefano Zampini for(i=0;i<size_prec_comm;i++) coarse_subdivision[i]=MPI_PROC_NULL; 35073828260eSStefano Zampini for(i=0;i<n_subdomains;i++) coarse_subdivision[ranks_stretching_ratio*i]=(PetscInt)(metis_coarse_subdivision[i]); 35080c7d97c5SJed Brown ierr = PetscFree(metis_coarse_subdivision);CHKERRQ(ierr); 35090c7d97c5SJed Brown } 35100c7d97c5SJed Brown 35110c7d97c5SJed Brown /* Create new communicator for coarse problem splitting the old one */ 35120c7d97c5SJed Brown if( !(rank_prec_comm%procs_jumps_coarse_comm) && rank_prec_comm < procs_jumps_coarse_comm*n_parts ){ 3513da1bb401SStefano Zampini coarse_color=0; /* for communicator splitting */ 3514da1bb401SStefano Zampini active_rank=rank_prec_comm; /* for insertion of matrix values */ 35150c7d97c5SJed Brown } 3516da1bb401SStefano Zampini /* procs with coarse_color = MPI_UNDEFINED will have coarse_comm = MPI_COMM_NULL (from mpi standards) 3517da1bb401SStefano Zampini key = rank_prec_comm -> keep same ordering of ranks from the old to the new communicator */ 351853cdbc3dSStefano Zampini ierr = MPI_Comm_split(prec_comm,coarse_color,rank_prec_comm,&coarse_comm);CHKERRQ(ierr); 35190c7d97c5SJed Brown 35200c7d97c5SJed Brown if( coarse_color == 0 ) { 352153cdbc3dSStefano Zampini ierr = MPI_Comm_size(coarse_comm,&size_coarse_comm);CHKERRQ(ierr); 352253cdbc3dSStefano Zampini ierr = MPI_Comm_rank(coarse_comm,&rank_coarse_comm);CHKERRQ(ierr); 
3523da1bb401SStefano Zampini /*printf("Details of coarse comm\n"); 35243828260eSStefano Zampini printf("size = %d, myrank = %d\n",size_coarse_comm,rank_coarse_comm); 3525da1bb401SStefano Zampini printf("jumps = %d, coarse_color = %d, n_parts = %d\n",procs_jumps_coarse_comm,coarse_color,n_parts);*/ 35260c7d97c5SJed Brown } else { 35270c7d97c5SJed Brown rank_coarse_comm = MPI_PROC_NULL; 35280c7d97c5SJed Brown } 35290c7d97c5SJed Brown 35300c7d97c5SJed Brown /* master proc take care of arranging and distributing coarse informations */ 35310c7d97c5SJed Brown if(rank_coarse_comm == master_proc) { 35320c7d97c5SJed Brown ierr = PetscMalloc (size_coarse_comm*sizeof(PetscMPIInt),&displacements_recv);CHKERRQ(ierr); 3533da1bb401SStefano Zampini /*ierr = PetscMalloc (size_coarse_comm*sizeof(PetscMPIInt),&total_count_recv);CHKERRQ(ierr); 3534da1bb401SStefano Zampini ierr = PetscMalloc (n_subdomains*sizeof(PetscMPIInt),&total_ranks_recv);CHKERRQ(ierr);*/ 35350c7d97c5SJed Brown total_count_recv = (PetscMPIInt*)calloc(size_prec_comm,sizeof(PetscMPIInt)); 35360c7d97c5SJed Brown total_ranks_recv = (PetscMPIInt*)calloc(n_subdomains,sizeof(PetscMPIInt)); 35370c7d97c5SJed Brown /* some initializations */ 35380c7d97c5SJed Brown displacements_recv[0]=0; 3539da1bb401SStefano Zampini /* PetscMemzero(total_count_recv,size_coarse_comm*sizeof(PetscMPIInt)); not needed -> calloc initializes to zero */ 35400c7d97c5SJed Brown /* count from how many processes the j-th process of the coarse decomposition will receive data */ 35410c7d97c5SJed Brown for(j=0;j<size_coarse_comm;j++) 35423828260eSStefano Zampini for(i=0;i<size_prec_comm;i++) 35430c7d97c5SJed Brown if(coarse_subdivision[i]==j) 35440c7d97c5SJed Brown total_count_recv[j]++; 35450c7d97c5SJed Brown /* displacements needed for scatterv of total_ranks_recv */ 35460c7d97c5SJed Brown for(i=1;i<size_coarse_comm;i++) displacements_recv[i]=displacements_recv[i-1]+total_count_recv[i-1]; 35470c7d97c5SJed Brown /* Now fill properly total_ranks_recv -> 
each coarse process will receive the ranks (in prec_comm communicator) of its friend (sending) processes */ 35480c7d97c5SJed Brown ierr = PetscMemzero(total_count_recv,size_coarse_comm*sizeof(PetscMPIInt));CHKERRQ(ierr); 35490c7d97c5SJed Brown for(j=0;j<size_coarse_comm;j++) { 35503828260eSStefano Zampini for(i=0;i<size_prec_comm;i++) { 35510c7d97c5SJed Brown if(coarse_subdivision[i]==j) { 35520c7d97c5SJed Brown total_ranks_recv[displacements_recv[j]+total_count_recv[j]]=i; 35533828260eSStefano Zampini total_count_recv[j]+=1; 35540c7d97c5SJed Brown } 35550c7d97c5SJed Brown } 35560c7d97c5SJed Brown } 3557da1bb401SStefano Zampini /*for(j=0;j<size_coarse_comm;j++) { 35583828260eSStefano Zampini printf("process %d in new rank will receive from %d processes (original ranks follows)\n",j,total_count_recv[j]); 35593828260eSStefano Zampini for(i=0;i<total_count_recv[j];i++) { 35603828260eSStefano Zampini printf("%d ",total_ranks_recv[displacements_recv[j]+i]); 35613828260eSStefano Zampini } 35623828260eSStefano Zampini printf("\n"); 3563da1bb401SStefano Zampini }*/ 35640c7d97c5SJed Brown 35650c7d97c5SJed Brown /* identify new decomposition in terms of ranks in the old communicator */ 35663828260eSStefano Zampini for(i=0;i<n_subdomains;i++) coarse_subdivision[ranks_stretching_ratio*i]=coarse_subdivision[ranks_stretching_ratio*i]*procs_jumps_coarse_comm; 3567da1bb401SStefano Zampini /*printf("coarse_subdivision in old end new ranks\n"); 35680c7d97c5SJed Brown for(i=0;i<size_prec_comm;i++) 35693828260eSStefano Zampini if(coarse_subdivision[i]!=MPI_PROC_NULL) { 35703828260eSStefano Zampini printf("%d=(%d %d), ",i,coarse_subdivision[i],coarse_subdivision[i]/procs_jumps_coarse_comm); 35713828260eSStefano Zampini } else { 35723828260eSStefano Zampini printf("%d=(%d %d), ",i,coarse_subdivision[i],coarse_subdivision[i]); 35733828260eSStefano Zampini } 3574da1bb401SStefano Zampini printf("\n");*/ 35750c7d97c5SJed Brown } 35760c7d97c5SJed Brown 35770c7d97c5SJed Brown /* Scatter new 
decomposition for send details */ 357853cdbc3dSStefano Zampini ierr = MPI_Scatter(&coarse_subdivision[0],1,MPIU_INT,&rank_coarse_proc_send_to,1,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr); 35790c7d97c5SJed Brown /* Scatter receiving details to members of coarse decomposition */ 35800c7d97c5SJed Brown if( coarse_color == 0) { 358153cdbc3dSStefano Zampini ierr = MPI_Scatter(&total_count_recv[0],1,MPIU_INT,&count_recv,1,MPIU_INT,master_proc,coarse_comm);CHKERRQ(ierr); 35820c7d97c5SJed Brown ierr = PetscMalloc (count_recv*sizeof(PetscMPIInt),&ranks_recv);CHKERRQ(ierr); 358353cdbc3dSStefano Zampini ierr = MPI_Scatterv(&total_ranks_recv[0],total_count_recv,displacements_recv,MPIU_INT,&ranks_recv[0],count_recv,MPIU_INT,master_proc,coarse_comm);CHKERRQ(ierr); 35840c7d97c5SJed Brown } 35850c7d97c5SJed Brown 3586da1bb401SStefano Zampini /*printf("I will send my matrix data to proc %d\n",rank_coarse_proc_send_to); 3587da1bb401SStefano Zampini if(coarse_color == 0) { 3588da1bb401SStefano Zampini printf("I will receive some matrix data from %d processes (ranks follows)\n",count_recv); 3589da1bb401SStefano Zampini for(i=0;i<count_recv;i++) 3590da1bb401SStefano Zampini printf("%d ",ranks_recv[i]); 3591da1bb401SStefano Zampini printf("\n"); 3592da1bb401SStefano Zampini }*/ 35930c7d97c5SJed Brown 35940c7d97c5SJed Brown if(rank_prec_comm == master_proc) { 3595da1bb401SStefano Zampini /*ierr = PetscFree(coarse_subdivision);CHKERRQ(ierr); 3596da1bb401SStefano Zampini ierr = PetscFree(total_count_recv);CHKERRQ(ierr); 3597da1bb401SStefano Zampini ierr = PetscFree(total_ranks_recv);CHKERRQ(ierr);*/ 35980c7d97c5SJed Brown free(coarse_subdivision); 35990c7d97c5SJed Brown free(total_count_recv); 36000c7d97c5SJed Brown free(total_ranks_recv); 36010c7d97c5SJed Brown ierr = PetscFree(displacements_recv);CHKERRQ(ierr); 36020c7d97c5SJed Brown } 36030c7d97c5SJed Brown break; 36040c7d97c5SJed Brown } 36050c7d97c5SJed Brown 36060c7d97c5SJed Brown case(REPLICATED_BDDC): 36070c7d97c5SJed Brown 
36080c7d97c5SJed Brown pcbddc->coarse_communications_type = GATHERS_BDDC; 36090c7d97c5SJed Brown coarse_mat_type = MATSEQAIJ; 36100c7d97c5SJed Brown coarse_pc_type = PCLU; 361153cdbc3dSStefano Zampini coarse_ksp_type = KSPPREONLY; 36120c7d97c5SJed Brown coarse_comm = PETSC_COMM_SELF; 36130c7d97c5SJed Brown active_rank = rank_prec_comm; 36140c7d97c5SJed Brown break; 36150c7d97c5SJed Brown 36160c7d97c5SJed Brown case(PARALLEL_BDDC): 36170c7d97c5SJed Brown 36180c7d97c5SJed Brown pcbddc->coarse_communications_type = SCATTERS_BDDC; 36190c7d97c5SJed Brown coarse_mat_type = MATMPIAIJ; 36200c7d97c5SJed Brown coarse_pc_type = PCREDUNDANT; 362153cdbc3dSStefano Zampini coarse_ksp_type = KSPPREONLY; 36220c7d97c5SJed Brown coarse_comm = prec_comm; 36230c7d97c5SJed Brown active_rank = rank_prec_comm; 36240c7d97c5SJed Brown break; 36250c7d97c5SJed Brown 36260c7d97c5SJed Brown case(SEQUENTIAL_BDDC): 36270c7d97c5SJed Brown pcbddc->coarse_communications_type = GATHERS_BDDC; 36280c7d97c5SJed Brown coarse_mat_type = MATSEQAIJ; 36290c7d97c5SJed Brown coarse_pc_type = PCLU; 363053cdbc3dSStefano Zampini coarse_ksp_type = KSPPREONLY; 36310c7d97c5SJed Brown coarse_comm = PETSC_COMM_SELF; 36320c7d97c5SJed Brown active_rank = master_proc; 36330c7d97c5SJed Brown break; 36340c7d97c5SJed Brown } 36350c7d97c5SJed Brown 36360c7d97c5SJed Brown switch(pcbddc->coarse_communications_type){ 36370c7d97c5SJed Brown 36380c7d97c5SJed Brown case(SCATTERS_BDDC): 36390c7d97c5SJed Brown { 36400c7d97c5SJed Brown if(pcbddc->coarse_problem_type==MULTILEVEL_BDDC) { 36410c7d97c5SJed Brown 36420c7d97c5SJed Brown PetscMPIInt send_size; 36430c7d97c5SJed Brown PetscInt *aux_ins_indices; 36440c7d97c5SJed Brown PetscInt ii,jj; 36450c7d97c5SJed Brown MPI_Request *requests; 36460c7d97c5SJed Brown 36470c7d97c5SJed Brown /* allocate auxiliary space */ 36485619798eSStefano Zampini ierr = PetscMalloc (pcbddc->replicated_primal_size*sizeof(PetscMPIInt),&pcbddc->replicated_local_primal_indices);CHKERRQ(ierr); 
36495619798eSStefano Zampini ierr = MPI_Allgatherv(&pcbddc->local_primal_indices[0],pcbddc->local_primal_size,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,prec_comm);CHKERRQ(ierr); 36500c7d97c5SJed Brown ierr = PetscMalloc ( pcbddc->coarse_size*sizeof(PetscInt),&aux_ins_indices);CHKERRQ(ierr); 36510c7d97c5SJed Brown ierr = PetscMemzero(aux_ins_indices,pcbddc->coarse_size*sizeof(PetscInt));CHKERRQ(ierr); 36520c7d97c5SJed Brown /* allocate stuffs for message massing */ 36530c7d97c5SJed Brown ierr = PetscMalloc ( (count_recv+1)*sizeof(MPI_Request),&requests);CHKERRQ(ierr); 36540c7d97c5SJed Brown for(i=0;i<count_recv+1;i++) requests[i]=MPI_REQUEST_NULL; 36550c7d97c5SJed Brown ierr = PetscMalloc ( count_recv*sizeof(PetscMPIInt),&localsizes2);CHKERRQ(ierr); 36560c7d97c5SJed Brown ierr = PetscMalloc ( count_recv*sizeof(PetscMPIInt),&localdispl2);CHKERRQ(ierr); 36570c7d97c5SJed Brown /* fill up quantities */ 36580c7d97c5SJed Brown j=0; 36590c7d97c5SJed Brown for(i=0;i<count_recv;i++){ 36600c7d97c5SJed Brown ii = ranks_recv[i]; 36610c7d97c5SJed Brown localsizes2[i]=pcbddc->local_primal_sizes[ii]*pcbddc->local_primal_sizes[ii]; 36620c7d97c5SJed Brown localdispl2[i]=j; 36630c7d97c5SJed Brown j+=localsizes2[i]; 36640c7d97c5SJed Brown jj = pcbddc->local_primal_displacements[ii]; 3665da1bb401SStefano Zampini for(k=0;k<pcbddc->local_primal_sizes[ii];k++) aux_ins_indices[pcbddc->replicated_local_primal_indices[jj+k]]+=1; /* it counts the coarse subdomains sharing the coarse node */ 36660c7d97c5SJed Brown } 3667da1bb401SStefano Zampini /*printf("aux_ins_indices 1\n"); 3668da1bb401SStefano Zampini for(i=0;i<pcbddc->coarse_size;i++) 3669da1bb401SStefano Zampini printf("%d ",aux_ins_indices[i]); 3670da1bb401SStefano Zampini printf("\n");*/ 36710c7d97c5SJed Brown /* temp_coarse_mat_vals used to store temporarly received matrix values */ 36720c7d97c5SJed Brown ierr = PetscMalloc ( 
j*sizeof(PetscScalar),&temp_coarse_mat_vals);CHKERRQ(ierr); 36730c7d97c5SJed Brown /* evaluate how many values I will insert in coarse mat */ 36740c7d97c5SJed Brown ins_local_primal_size=0; 36750c7d97c5SJed Brown for(i=0;i<pcbddc->coarse_size;i++) 36760c7d97c5SJed Brown if(aux_ins_indices[i]) 36770c7d97c5SJed Brown ins_local_primal_size++; 36780c7d97c5SJed Brown /* evaluate indices I will insert in coarse mat */ 36790c7d97c5SJed Brown ierr = PetscMalloc ( ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr); 36800c7d97c5SJed Brown j=0; 36810c7d97c5SJed Brown for(i=0;i<pcbddc->coarse_size;i++) 36820c7d97c5SJed Brown if(aux_ins_indices[i]) 36830c7d97c5SJed Brown ins_local_primal_indices[j++]=i; 36840c7d97c5SJed Brown /* use aux_ins_indices to realize a global to local mapping */ 36850c7d97c5SJed Brown j=0; 36860c7d97c5SJed Brown for(i=0;i<pcbddc->coarse_size;i++){ 36870c7d97c5SJed Brown if(aux_ins_indices[i]==0){ 36880c7d97c5SJed Brown aux_ins_indices[i]=-1; 36890c7d97c5SJed Brown } else { 36900c7d97c5SJed Brown aux_ins_indices[i]=j; 36910c7d97c5SJed Brown j++; 36920c7d97c5SJed Brown } 36930c7d97c5SJed Brown } 36940c7d97c5SJed Brown 3695da1bb401SStefano Zampini /*printf("New details localsizes2 localdispl2\n"); 3696da1bb401SStefano Zampini for(i=0;i<count_recv;i++) 3697da1bb401SStefano Zampini printf("(%d %d) ",localsizes2[i],localdispl2[i]); 3698da1bb401SStefano Zampini printf("\n"); 3699da1bb401SStefano Zampini printf("aux_ins_indices 2\n"); 3700da1bb401SStefano Zampini for(i=0;i<pcbddc->coarse_size;i++) 3701da1bb401SStefano Zampini printf("%d ",aux_ins_indices[i]); 3702da1bb401SStefano Zampini printf("\n"); 3703da1bb401SStefano Zampini printf("ins_local_primal_indices\n"); 3704da1bb401SStefano Zampini for(i=0;i<ins_local_primal_size;i++) 3705da1bb401SStefano Zampini printf("%d ",ins_local_primal_indices[i]); 3706da1bb401SStefano Zampini printf("\n"); 3707da1bb401SStefano Zampini printf("coarse_submat_vals\n"); 3708da1bb401SStefano 
Zampini for(i=0;i<pcbddc->local_primal_size;i++) 3709da1bb401SStefano Zampini for(j=0;j<pcbddc->local_primal_size;j++) 3710da1bb401SStefano Zampini printf("(%lf %d %d)\n",coarse_submat_vals[j*pcbddc->local_primal_size+i],pcbddc->local_primal_indices[i],pcbddc->local_primal_indices[j]); 3711da1bb401SStefano Zampini printf("\n");*/ 37120c7d97c5SJed Brown 37130c7d97c5SJed Brown /* processes partecipating in coarse problem receive matrix data from their friends */ 371453cdbc3dSStefano Zampini for(i=0;i<count_recv;i++) ierr = MPI_Irecv(&temp_coarse_mat_vals[localdispl2[i]],localsizes2[i],MPIU_SCALAR,ranks_recv[i],666,prec_comm,&requests[i]);CHKERRQ(ierr); 37150c7d97c5SJed Brown if(rank_coarse_proc_send_to != MPI_PROC_NULL ) { 37160c7d97c5SJed Brown send_size=pcbddc->local_primal_size*pcbddc->local_primal_size; 371753cdbc3dSStefano Zampini ierr = MPI_Isend(&coarse_submat_vals[0],send_size,MPIU_SCALAR,rank_coarse_proc_send_to,666,prec_comm,&requests[count_recv]);CHKERRQ(ierr); 37180c7d97c5SJed Brown } 371953cdbc3dSStefano Zampini ierr = MPI_Waitall(count_recv+1,requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 37200c7d97c5SJed Brown 3721da1bb401SStefano Zampini /*if(coarse_color == 0) { 3722da1bb401SStefano Zampini printf("temp_coarse_mat_vals\n"); 3723da1bb401SStefano Zampini for(k=0;k<count_recv;k++){ 3724da1bb401SStefano Zampini printf("---- %d ----\n",ranks_recv[k]); 3725da1bb401SStefano Zampini for(i=0;i<pcbddc->local_primal_sizes[ranks_recv[k]];i++) 3726da1bb401SStefano Zampini for(j=0;j<pcbddc->local_primal_sizes[ranks_recv[k]];j++) 3727da1bb401SStefano Zampini printf("(%lf %d %d)\n",temp_coarse_mat_vals[localdispl2[k]+j*pcbddc->local_primal_sizes[ranks_recv[k]]+i],pcbddc->replicated_local_primal_indices[pcbddc->local_primal_displacements[ranks_recv[k]]+i],pcbddc->replicated_local_primal_indices[pcbddc->local_primal_displacements[ranks_recv[k]]+j]); 3728da1bb401SStefano Zampini printf("\n"); 3729da1bb401SStefano Zampini } 3730da1bb401SStefano Zampini }*/ 
37310c7d97c5SJed Brown /* calculate data to insert in coarse mat */ 37320c7d97c5SJed Brown ierr = PetscMalloc ( ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar),&ins_coarse_mat_vals);CHKERRQ(ierr); 37330c7d97c5SJed Brown PetscMemzero(ins_coarse_mat_vals,ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar)); 37340c7d97c5SJed Brown 37350c7d97c5SJed Brown PetscMPIInt rr,kk,lps,lpd; 37360c7d97c5SJed Brown PetscInt row_ind,col_ind; 37370c7d97c5SJed Brown for(k=0;k<count_recv;k++){ 37380c7d97c5SJed Brown rr = ranks_recv[k]; 37390c7d97c5SJed Brown kk = localdispl2[k]; 37400c7d97c5SJed Brown lps = pcbddc->local_primal_sizes[rr]; 37410c7d97c5SJed Brown lpd = pcbddc->local_primal_displacements[rr]; 3742da1bb401SStefano Zampini /*printf("Inserting the following indices (received from %d)\n",rr);*/ 37430c7d97c5SJed Brown for(j=0;j<lps;j++){ 37440c7d97c5SJed Brown col_ind=aux_ins_indices[pcbddc->replicated_local_primal_indices[lpd+j]]; 37450c7d97c5SJed Brown for(i=0;i<lps;i++){ 37460c7d97c5SJed Brown row_ind=aux_ins_indices[pcbddc->replicated_local_primal_indices[lpd+i]]; 3747da1bb401SStefano Zampini /*printf("%d %d\n",row_ind,col_ind);*/ 37480c7d97c5SJed Brown ins_coarse_mat_vals[col_ind*ins_local_primal_size+row_ind]+=temp_coarse_mat_vals[kk+j*lps+i]; 37490c7d97c5SJed Brown } 37500c7d97c5SJed Brown } 37510c7d97c5SJed Brown } 37520c7d97c5SJed Brown ierr = PetscFree(requests);CHKERRQ(ierr); 37530c7d97c5SJed Brown ierr = PetscFree(aux_ins_indices);CHKERRQ(ierr); 37540c7d97c5SJed Brown ierr = PetscFree(temp_coarse_mat_vals);CHKERRQ(ierr); 37550c7d97c5SJed Brown if(coarse_color == 0) { ierr = PetscFree(ranks_recv);CHKERRQ(ierr); } 37560c7d97c5SJed Brown 37570c7d97c5SJed Brown /* create local to global mapping needed by coarse MATIS */ 37580c7d97c5SJed Brown { 37590c7d97c5SJed Brown IS coarse_IS; 376053cdbc3dSStefano Zampini if(coarse_comm != MPI_COMM_NULL ) ierr = MPI_Comm_free(&coarse_comm);CHKERRQ(ierr); 37610c7d97c5SJed Brown coarse_comm = prec_comm; 
37620c7d97c5SJed Brown active_rank=rank_prec_comm; 37630c7d97c5SJed Brown ierr = ISCreateGeneral(coarse_comm,ins_local_primal_size,ins_local_primal_indices,PETSC_COPY_VALUES,&coarse_IS);CHKERRQ(ierr); 37640c7d97c5SJed Brown ierr = ISLocalToGlobalMappingCreateIS(coarse_IS,&coarse_ISLG);CHKERRQ(ierr); 37650c7d97c5SJed Brown ierr = ISDestroy(&coarse_IS);CHKERRQ(ierr); 37660c7d97c5SJed Brown } 37670c7d97c5SJed Brown } 37680c7d97c5SJed Brown if(pcbddc->coarse_problem_type==PARALLEL_BDDC) { 37690c7d97c5SJed Brown /* arrays for values insertion */ 37700c7d97c5SJed Brown ins_local_primal_size = pcbddc->local_primal_size; 37710c7d97c5SJed Brown ierr = PetscMalloc ( ins_local_primal_size*sizeof(PetscMPIInt),&ins_local_primal_indices);CHKERRQ(ierr); 37720c7d97c5SJed Brown ierr = PetscMalloc ( ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar),&ins_coarse_mat_vals);CHKERRQ(ierr); 37730c7d97c5SJed Brown for(j=0;j<ins_local_primal_size;j++){ 37740c7d97c5SJed Brown ins_local_primal_indices[j]=pcbddc->local_primal_indices[j]; 37750c7d97c5SJed Brown for(i=0;i<ins_local_primal_size;i++) ins_coarse_mat_vals[j*ins_local_primal_size+i]=coarse_submat_vals[j*ins_local_primal_size+i]; 37760c7d97c5SJed Brown } 37770c7d97c5SJed Brown } 37780c7d97c5SJed Brown break; 37790c7d97c5SJed Brown 37800c7d97c5SJed Brown } 37810c7d97c5SJed Brown 37820c7d97c5SJed Brown case(GATHERS_BDDC): 37830c7d97c5SJed Brown { 37840c7d97c5SJed Brown 37850c7d97c5SJed Brown PetscMPIInt mysize,mysize2; 37860c7d97c5SJed Brown 37870c7d97c5SJed Brown if(rank_prec_comm==active_rank) { 37880c7d97c5SJed Brown ierr = PetscMalloc ( pcbddc->replicated_primal_size*sizeof(PetscMPIInt),&pcbddc->replicated_local_primal_indices);CHKERRQ(ierr); 37890c7d97c5SJed Brown pcbddc->replicated_local_primal_values = (PetscScalar*)calloc(pcbddc->replicated_primal_size,sizeof(PetscScalar)); 37900c7d97c5SJed Brown ierr = PetscMalloc ( size_prec_comm*sizeof(PetscMPIInt),&localsizes2);CHKERRQ(ierr); 37910c7d97c5SJed Brown ierr = 
PetscMalloc ( size_prec_comm*sizeof(PetscMPIInt),&localdispl2);CHKERRQ(ierr); 37920c7d97c5SJed Brown /* arrays for values insertion */ 37930c7d97c5SJed Brown ins_local_primal_size = pcbddc->coarse_size; 37940c7d97c5SJed Brown ierr = PetscMalloc ( ins_local_primal_size*sizeof(PetscMPIInt),&ins_local_primal_indices);CHKERRQ(ierr); 37950c7d97c5SJed Brown ierr = PetscMalloc ( ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar),&ins_coarse_mat_vals);CHKERRQ(ierr); 37960c7d97c5SJed Brown for(i=0;i<size_prec_comm;i++) localsizes2[i]=pcbddc->local_primal_sizes[i]*pcbddc->local_primal_sizes[i]; 37970c7d97c5SJed Brown localdispl2[0]=0; 37980c7d97c5SJed Brown for(i=1;i<size_prec_comm;i++) localdispl2[i]=localsizes2[i-1]+localdispl2[i-1]; 37990c7d97c5SJed Brown j=0; 38000c7d97c5SJed Brown for(i=0;i<size_prec_comm;i++) j+=localsizes2[i]; 38010c7d97c5SJed Brown ierr = PetscMalloc ( j*sizeof(PetscScalar),&temp_coarse_mat_vals);CHKERRQ(ierr); 38020c7d97c5SJed Brown } 38030c7d97c5SJed Brown 38040c7d97c5SJed Brown mysize=pcbddc->local_primal_size; 38050c7d97c5SJed Brown mysize2=pcbddc->local_primal_size*pcbddc->local_primal_size; 38060c7d97c5SJed Brown if(pcbddc->coarse_problem_type == SEQUENTIAL_BDDC){ 380753cdbc3dSStefano Zampini ierr = MPI_Gatherv(&pcbddc->local_primal_indices[0],mysize,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr); 380853cdbc3dSStefano Zampini ierr = MPI_Gatherv(&coarse_submat_vals[0],mysize2,MPIU_SCALAR,&temp_coarse_mat_vals[0],localsizes2,localdispl2,MPIU_SCALAR,master_proc,prec_comm);CHKERRQ(ierr); 38090c7d97c5SJed Brown } else { 381053cdbc3dSStefano Zampini ierr = MPI_Allgatherv(&pcbddc->local_primal_indices[0],mysize,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,prec_comm);CHKERRQ(ierr); 381153cdbc3dSStefano Zampini ierr = 
MPI_Allgatherv(&coarse_submat_vals[0],mysize2,MPIU_SCALAR,&temp_coarse_mat_vals[0],localsizes2,localdispl2,MPIU_SCALAR,prec_comm);CHKERRQ(ierr); 38120c7d97c5SJed Brown } 38130c7d97c5SJed Brown 38140c7d97c5SJed Brown /* free data structures no longer needed and allocate some space which will be needed in BDDC application */ 38150c7d97c5SJed Brown if(rank_prec_comm==active_rank) { 38160c7d97c5SJed Brown PetscInt offset,offset2,row_ind,col_ind; 38170c7d97c5SJed Brown for(j=0;j<ins_local_primal_size;j++){ 38180c7d97c5SJed Brown ins_local_primal_indices[j]=j; 38190c7d97c5SJed Brown for(i=0;i<ins_local_primal_size;i++) ins_coarse_mat_vals[j*ins_local_primal_size+i]=0.0; 38200c7d97c5SJed Brown } 38210c7d97c5SJed Brown for(k=0;k<size_prec_comm;k++){ 38220c7d97c5SJed Brown offset=pcbddc->local_primal_displacements[k]; 38230c7d97c5SJed Brown offset2=localdispl2[k]; 38240c7d97c5SJed Brown for(j=0;j<pcbddc->local_primal_sizes[k];j++){ 38250c7d97c5SJed Brown col_ind=pcbddc->replicated_local_primal_indices[offset+j]; 38260c7d97c5SJed Brown for(i=0;i<pcbddc->local_primal_sizes[k];i++){ 38270c7d97c5SJed Brown row_ind=pcbddc->replicated_local_primal_indices[offset+i]; 38280c7d97c5SJed Brown ins_coarse_mat_vals[col_ind*pcbddc->coarse_size+row_ind]+=temp_coarse_mat_vals[offset2+j*pcbddc->local_primal_sizes[k]+i]; 38290c7d97c5SJed Brown } 38300c7d97c5SJed Brown } 38310c7d97c5SJed Brown } 38320c7d97c5SJed Brown } 38330c7d97c5SJed Brown break; 3834da1bb401SStefano Zampini }/* switch on coarse problem and communications associated with finished */ 38350c7d97c5SJed Brown } 38360c7d97c5SJed Brown 38370c7d97c5SJed Brown /* Now create and fill up coarse matrix */ 38380c7d97c5SJed Brown if( rank_prec_comm == active_rank ) { 38390c7d97c5SJed Brown if(pcbddc->coarse_problem_type != MULTILEVEL_BDDC) { 38400c7d97c5SJed Brown ierr = MatCreate(coarse_comm,&pcbddc->coarse_mat);CHKERRQ(ierr); 38410c7d97c5SJed Brown ierr = 
MatSetSizes(pcbddc->coarse_mat,PETSC_DECIDE,PETSC_DECIDE,pcbddc->coarse_size,pcbddc->coarse_size);CHKERRQ(ierr); 38420c7d97c5SJed Brown ierr = MatSetType(pcbddc->coarse_mat,coarse_mat_type);CHKERRQ(ierr); 38433b03a366Sstefano_zampini ierr = MatSetUp(pcbddc->coarse_mat);CHKERRQ(ierr); 3844da1bb401SStefano Zampini ierr = MatSetOption(pcbddc->coarse_mat,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr); /* local values stored in column major */ 38453b03a366Sstefano_zampini ierr = MatSetOption(pcbddc->coarse_mat,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr); 38460c7d97c5SJed Brown } else { 38470c7d97c5SJed Brown Mat matis_coarse_local_mat; 3848d3ee2243SStefano Zampini /* remind bs */ 3849d3ee2243SStefano Zampini ierr = MatCreateIS(coarse_comm,bs,PETSC_DECIDE,PETSC_DECIDE,pcbddc->coarse_size,pcbddc->coarse_size,coarse_ISLG,&pcbddc->coarse_mat);CHKERRQ(ierr); 38503b03a366Sstefano_zampini ierr = MatSetUp(pcbddc->coarse_mat);CHKERRQ(ierr); 38510c7d97c5SJed Brown ierr = MatISGetLocalMat(pcbddc->coarse_mat,&matis_coarse_local_mat);CHKERRQ(ierr); 38523b03a366Sstefano_zampini ierr = MatSetUp(matis_coarse_local_mat);CHKERRQ(ierr); 3853da1bb401SStefano Zampini ierr = MatSetOption(matis_coarse_local_mat,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr); /* local values stored in column major */ 3854a0ba757dSStefano Zampini ierr = MatSetOption(matis_coarse_local_mat,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr); 38550c7d97c5SJed Brown } 3856a0ba757dSStefano Zampini ierr = MatSetOption(pcbddc->coarse_mat,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_FALSE);CHKERRQ(ierr); 38570c7d97c5SJed Brown ierr = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,ADD_VALUES);CHKERRQ(ierr); 38580c7d97c5SJed Brown ierr = MatAssemblyBegin(pcbddc->coarse_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 38590c7d97c5SJed Brown ierr = MatAssemblyEnd(pcbddc->coarse_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 38600c7d97c5SJed Brown 
3861da1bb401SStefano Zampini /* PetscViewer view_out; 3862da1bb401SStefano Zampini ierr = PetscViewerASCIIOpen(PETSC_COMM_SELF,"coarsematfull.m",&view_out);CHKERRQ(ierr); 3863da1bb401SStefano Zampini ierr = PetscViewerSetFormat(view_out,PETSC_VIEWER_ASCII_MATLAB);CHKERRQ(ierr); 3864da1bb401SStefano Zampini ierr = MatView(pcbddc->coarse_mat,view_out);CHKERRQ(ierr); 3865da1bb401SStefano Zampini ierr = PetscViewerDestroy(&view_out);CHKERRQ(ierr);*/ 3866da1bb401SStefano Zampini 38670c7d97c5SJed Brown ierr = MatGetVecs(pcbddc->coarse_mat,&pcbddc->coarse_vec,&pcbddc->coarse_rhs);CHKERRQ(ierr); 38680c7d97c5SJed Brown /* Preconditioner for coarse problem */ 386953cdbc3dSStefano Zampini ierr = KSPCreate(coarse_comm,&pcbddc->coarse_ksp);CHKERRQ(ierr); 387053cdbc3dSStefano Zampini ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->coarse_ksp,(PetscObject)pc,1);CHKERRQ(ierr); 387153cdbc3dSStefano Zampini ierr = KSPSetOperators(pcbddc->coarse_ksp,pcbddc->coarse_mat,pcbddc->coarse_mat,SAME_PRECONDITIONER);CHKERRQ(ierr); 38723b03a366Sstefano_zampini ierr = KSPSetTolerances(pcbddc->coarse_ksp,PETSC_DEFAULT,PETSC_DEFAULT,PETSC_DEFAULT,max_it_coarse_ksp);CHKERRQ(ierr); 387353cdbc3dSStefano Zampini ierr = KSPSetType(pcbddc->coarse_ksp,coarse_ksp_type);CHKERRQ(ierr); 387453cdbc3dSStefano Zampini ierr = KSPGetPC(pcbddc->coarse_ksp,&pc_temp);CHKERRQ(ierr); 387553cdbc3dSStefano Zampini ierr = PCSetType(pc_temp,coarse_pc_type);CHKERRQ(ierr); 38760c7d97c5SJed Brown /* Allow user's customization */ 3877da1bb401SStefano Zampini ierr = KSPSetOptionsPrefix(pcbddc->coarse_ksp,"coarse_");CHKERRQ(ierr); 387853cdbc3dSStefano Zampini ierr = KSPSetFromOptions(pcbddc->coarse_ksp);CHKERRQ(ierr); 38790c7d97c5SJed Brown /* Set Up PC for coarse problem BDDC */ 388053cdbc3dSStefano Zampini if(pcbddc->coarse_problem_type == MULTILEVEL_BDDC) { 3881e269702eSStefano Zampini if(dbg_flag) { 3882e269702eSStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"----------------Setting up a new 
level---------------\n");CHKERRQ(ierr); 3883e269702eSStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 3884e269702eSStefano Zampini } 388553cdbc3dSStefano Zampini ierr = PCBDDCSetCoarseProblemType(pc_temp,MULTILEVEL_BDDC);CHKERRQ(ierr); 388653cdbc3dSStefano Zampini } 388753cdbc3dSStefano Zampini ierr = KSPSetUp(pcbddc->coarse_ksp);CHKERRQ(ierr); 38885619798eSStefano Zampini if(pcbddc->coarse_problem_type == MULTILEVEL_BDDC) { 38895619798eSStefano Zampini if(dbg_flag) { 38905619798eSStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"----------------New level set------------------------\n");CHKERRQ(ierr); 38915619798eSStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 38925619798eSStefano Zampini } 38935619798eSStefano Zampini } 38940c7d97c5SJed Brown } 38950c7d97c5SJed Brown if(pcbddc->coarse_communications_type == SCATTERS_BDDC) { 38960c7d97c5SJed Brown IS local_IS,global_IS; 38970c7d97c5SJed Brown ierr = ISCreateStride(PETSC_COMM_SELF,pcbddc->local_primal_size,0,1,&local_IS);CHKERRQ(ierr); 38980c7d97c5SJed Brown ierr = ISCreateGeneral(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_indices,PETSC_COPY_VALUES,&global_IS);CHKERRQ(ierr); 38990c7d97c5SJed Brown ierr = VecScatterCreate(pcbddc->vec1_P,local_IS,pcbddc->coarse_vec,global_IS,&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr); 39000c7d97c5SJed Brown ierr = ISDestroy(&local_IS);CHKERRQ(ierr); 39010c7d97c5SJed Brown ierr = ISDestroy(&global_IS);CHKERRQ(ierr); 39020c7d97c5SJed Brown } 39030c7d97c5SJed Brown 39040c7d97c5SJed Brown 39053b03a366Sstefano_zampini /* Evaluate condition number of coarse problem for cheby (and verbose output if requested) */ 39063b03a366Sstefano_zampini if( pcbddc->coarse_problem_type == MULTILEVEL_BDDC && rank_prec_comm == active_rank ) { 39070c7d97c5SJed Brown PetscScalar m_one=-1.0; 39085619798eSStefano Zampini PetscReal infty_error,lambda_min,lambda_max,kappa_2; 39093b03a366Sstefano_zampini const KSPType check_ksp_type=KSPGMRES; 39100c7d97c5SJed 
Brown 39115619798eSStefano Zampini /* change coarse ksp object to an iterative method suitable for extreme eigenvalues' estimation */ 39123b03a366Sstefano_zampini ierr = KSPSetType(pcbddc->coarse_ksp,check_ksp_type);CHKERRQ(ierr); 3913d49ef151SStefano Zampini ierr = KSPSetComputeSingularValues(pcbddc->coarse_ksp,PETSC_TRUE);CHKERRQ(ierr); 39145619798eSStefano Zampini ierr = KSPSetTolerances(pcbddc->coarse_ksp,1.e-8,1.e-8,PETSC_DEFAULT,pcbddc->coarse_size);CHKERRQ(ierr); 39155619798eSStefano Zampini ierr = KSPSetUp(pcbddc->coarse_ksp);CHKERRQ(ierr); 3916d49ef151SStefano Zampini ierr = VecSetRandom(pcbddc->coarse_rhs,PETSC_NULL);CHKERRQ(ierr); 3917d49ef151SStefano Zampini ierr = MatMult(pcbddc->coarse_mat,pcbddc->coarse_rhs,pcbddc->coarse_vec);CHKERRQ(ierr); 3918d49ef151SStefano Zampini ierr = MatMult(pcbddc->coarse_mat,pcbddc->coarse_vec,pcbddc->coarse_rhs);CHKERRQ(ierr); 3919d49ef151SStefano Zampini ierr = KSPSolve(pcbddc->coarse_ksp,pcbddc->coarse_rhs,pcbddc->coarse_rhs);CHKERRQ(ierr); 3920d49ef151SStefano Zampini ierr = KSPComputeExtremeSingularValues(pcbddc->coarse_ksp,&lambda_max,&lambda_min);CHKERRQ(ierr); 39213b03a366Sstefano_zampini if(dbg_flag) { 39225619798eSStefano Zampini kappa_2=lambda_max/lambda_min; 39235619798eSStefano Zampini ierr = KSPGetIterationNumber(pcbddc->coarse_ksp,&k);CHKERRQ(ierr); 3924d49ef151SStefano Zampini ierr = VecAXPY(pcbddc->coarse_rhs,m_one,pcbddc->coarse_vec);CHKERRQ(ierr); 3925d49ef151SStefano Zampini ierr = VecNorm(pcbddc->coarse_rhs,NORM_INFINITY,&infty_error);CHKERRQ(ierr); 39263b03a366Sstefano_zampini ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem condition number estimated with %d iterations of %s is: % 1.14e\n",k,check_ksp_type,kappa_2);CHKERRQ(ierr); 3927e269702eSStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem eigenvalues: % 1.14e %1.14e\n",lambda_min,lambda_max);CHKERRQ(ierr); 3928e269702eSStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem infty_error: 
%1.14e\n",infty_error);CHKERRQ(ierr); 39293b03a366Sstefano_zampini } 39305619798eSStefano Zampini /* restore coarse ksp to default values */ 3931d49ef151SStefano Zampini ierr = KSPSetComputeSingularValues(pcbddc->coarse_ksp,PETSC_FALSE);CHKERRQ(ierr); 39325619798eSStefano Zampini ierr = KSPSetType(pcbddc->coarse_ksp,coarse_ksp_type);CHKERRQ(ierr); 39336c9de887SHong Zhang ierr = KSPChebyshevSetEigenvalues(pcbddc->coarse_ksp,lambda_max,lambda_min);CHKERRQ(ierr); 39343b03a366Sstefano_zampini ierr = KSPSetTolerances(pcbddc->coarse_ksp,PETSC_DEFAULT,PETSC_DEFAULT,PETSC_DEFAULT,max_it_coarse_ksp);CHKERRQ(ierr); 39355619798eSStefano Zampini ierr = KSPSetFromOptions(pcbddc->coarse_ksp);CHKERRQ(ierr); 39365619798eSStefano Zampini ierr = KSPSetUp(pcbddc->coarse_ksp);CHKERRQ(ierr); 393753cdbc3dSStefano Zampini } 39380c7d97c5SJed Brown 39390c7d97c5SJed Brown /* free data structures no longer needed */ 39400c7d97c5SJed Brown if(coarse_ISLG) { ierr = ISLocalToGlobalMappingDestroy(&coarse_ISLG);CHKERRQ(ierr); } 39410c7d97c5SJed Brown if(ins_local_primal_indices) { ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr); } 39420c7d97c5SJed Brown if(ins_coarse_mat_vals) { ierr = PetscFree(ins_coarse_mat_vals);CHKERRQ(ierr);} 39430c7d97c5SJed Brown if(localsizes2) { ierr = PetscFree(localsizes2);CHKERRQ(ierr);} 39440c7d97c5SJed Brown if(localdispl2) { ierr = PetscFree(localdispl2);CHKERRQ(ierr);} 39450c7d97c5SJed Brown if(temp_coarse_mat_vals) { ierr = PetscFree(temp_coarse_mat_vals);CHKERRQ(ierr);} 39460c7d97c5SJed Brown 39470c7d97c5SJed Brown PetscFunctionReturn(0); 39480c7d97c5SJed Brown } 39490c7d97c5SJed Brown 39500c7d97c5SJed Brown #undef __FUNCT__ 39510c7d97c5SJed Brown #define __FUNCT__ "PCBDDCManageLocalBoundaries" 395253cdbc3dSStefano Zampini static PetscErrorCode PCBDDCManageLocalBoundaries(PC pc) 39530c7d97c5SJed Brown { 39540c7d97c5SJed Brown 39550c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 39560c7d97c5SJed Brown PC_IS *pcis = (PC_IS*)pc->data; 
39570c7d97c5SJed Brown Mat_IS *matis = (Mat_IS*)pc->pmat->data; 3958da1bb401SStefano Zampini PCBDDCGraph mat_graph=pcbddc->mat_graph; 39593972b0daSStefano Zampini PetscInt *queue_in_global_numbering,*is_indices,*auxis; 39603b03a366Sstefano_zampini PetscInt bs,ierr,i,j,s,k,iindex,neumann_bsize,dirichlet_bsize; 3961da1bb401SStefano Zampini PetscInt total_counts,nodes_touched,where_values=1,vertex_size; 3962534831adSStefano Zampini PetscMPIInt adapt_interface=0,adapt_interface_reduced=0,NEUMANNCNT=0; 3963da1bb401SStefano Zampini PetscBool same_set; 3964a0ba757dSStefano Zampini MPI_Comm interface_comm=((PetscObject)pc)->comm; 39653b03a366Sstefano_zampini PetscBool use_faces=PETSC_FALSE,use_edges=PETSC_FALSE; 39663b03a366Sstefano_zampini const PetscInt *neumann_nodes; 39673b03a366Sstefano_zampini const PetscInt *dirichlet_nodes; 3968a81d60d8SStefano Zampini IS used_IS,*custom_ISForDofs; 3969da1bb401SStefano Zampini PetscScalar *array; 3970da1bb401SStefano Zampini PetscScalar *array2; 3971da1bb401SStefano Zampini PetscViewer viewer=pcbddc->dbg_viewer; 39720c7d97c5SJed Brown 39730c7d97c5SJed Brown PetscFunctionBegin; 3974da1bb401SStefano Zampini /* Setup local adjacency graph */ 3975da1bb401SStefano Zampini mat_graph->nvtxs=pcis->n; 3976534831adSStefano Zampini if(!mat_graph->xadj) { NEUMANNCNT = 1; } 3977da1bb401SStefano Zampini ierr = PCBDDCSetupLocalAdjacencyGraph(pc);CHKERRQ(ierr); 3978a0ba757dSStefano Zampini i = mat_graph->nvtxs; 3979a0ba757dSStefano Zampini ierr = PetscMalloc4(i,PetscInt,&mat_graph->where,i,PetscInt,&mat_graph->count,i+1,PetscInt,&mat_graph->cptr,i,PetscInt,&mat_graph->queue);CHKERRQ(ierr); 39803972b0daSStefano Zampini ierr = PetscMalloc2(i,PetscInt,&mat_graph->which_dof,i,PetscBool,&mat_graph->touched);CHKERRQ(ierr); 39813972b0daSStefano Zampini ierr = PetscMalloc(i*sizeof(PetscInt),&queue_in_global_numbering);CHKERRQ(ierr); 3982a0ba757dSStefano Zampini ierr = PetscMemzero(mat_graph->where,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr); 
3983a0ba757dSStefano Zampini ierr = PetscMemzero(mat_graph->count,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr); 3984a0ba757dSStefano Zampini ierr = PetscMemzero(mat_graph->which_dof,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr); 3985a0ba757dSStefano Zampini ierr = PetscMemzero(mat_graph->queue,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr); 39863828260eSStefano Zampini ierr = PetscMemzero(mat_graph->cptr,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr); 3987a0ba757dSStefano Zampini 3988a81d60d8SStefano Zampini /* Setting dofs splitting in mat_graph->which_dof 3989a81d60d8SStefano Zampini Get information about dofs' splitting if provided by the user 3990a81d60d8SStefano Zampini Otherwise it assumes a constant block size */ 3991a81d60d8SStefano Zampini vertex_size=0; 3992a81d60d8SStefano Zampini if(!pcbddc->n_ISForDofs) { 3993a81d60d8SStefano Zampini ierr = MatGetBlockSize(matis->A,&bs);CHKERRQ(ierr); 3994a81d60d8SStefano Zampini ierr = PetscMalloc(bs*sizeof(IS),&custom_ISForDofs);CHKERRQ(ierr); 3995a81d60d8SStefano Zampini for(i=0;i<bs;i++) { 3996a81d60d8SStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,pcis->n/bs,i,bs,&custom_ISForDofs[i]);CHKERRQ(ierr); 3997a81d60d8SStefano Zampini } 3998a81d60d8SStefano Zampini ierr = PCBDDCSetDofsSplitting(pc,bs,custom_ISForDofs);CHKERRQ(ierr); 3999a81d60d8SStefano Zampini vertex_size=1; 4000a81d60d8SStefano Zampini /* remove my references to IS objects */ 4001a81d60d8SStefano Zampini for(i=0;i<bs;i++) { 4002a81d60d8SStefano Zampini ierr = ISDestroy(&custom_ISForDofs[i]);CHKERRQ(ierr); 4003a81d60d8SStefano Zampini } 4004a81d60d8SStefano Zampini ierr = PetscFree(custom_ISForDofs);CHKERRQ(ierr); 4005a81d60d8SStefano Zampini } 40069c0446d6SStefano Zampini for(i=0;i<pcbddc->n_ISForDofs;i++) { 4007a81d60d8SStefano Zampini ierr = ISGetSize(pcbddc->ISForDofs[i],&k);CHKERRQ(ierr); 40089c0446d6SStefano Zampini ierr = ISGetIndices(pcbddc->ISForDofs[i],(const PetscInt**)&is_indices);CHKERRQ(ierr); 4009a81d60d8SStefano 
Zampini for(j=0;j<k;j++) { 40109c0446d6SStefano Zampini mat_graph->which_dof[is_indices[j]]=i; 40119c0446d6SStefano Zampini } 40129c0446d6SStefano Zampini ierr = ISRestoreIndices(pcbddc->ISForDofs[i],(const PetscInt**)&is_indices);CHKERRQ(ierr); 40139c0446d6SStefano Zampini } 4014a81d60d8SStefano Zampini /* use mat block size as vertex size if it has not yet set */ 4015a81d60d8SStefano Zampini if(!vertex_size) { 40163b03a366Sstefano_zampini ierr = MatGetBlockSize(matis->A,&vertex_size);CHKERRQ(ierr); 40170c7d97c5SJed Brown } 4018a81d60d8SStefano Zampini 40193b03a366Sstefano_zampini /* count number of neigh per node */ 40200c7d97c5SJed Brown total_counts=0; 40213b03a366Sstefano_zampini for(i=1;i<pcis->n_neigh;i++){ 40220c7d97c5SJed Brown s=pcis->n_shared[i]; 40230c7d97c5SJed Brown total_counts+=s; 402453cdbc3dSStefano Zampini for(j=0;j<s;j++){ 40250c7d97c5SJed Brown mat_graph->count[pcis->shared[i][j]] += 1; 40260c7d97c5SJed Brown } 40270c7d97c5SJed Brown } 4028534831adSStefano Zampini /* Take into account Neumann data -> it increments number of sharing subdomains for nodes lying on the interface */ 402936e030ebSStefano Zampini ierr = PCBDDCGetNeumannBoundaries(pc,&used_IS);CHKERRQ(ierr); 4030da1bb401SStefano Zampini ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr); 4031da1bb401SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 403236e030ebSStefano Zampini if(used_IS) { 403336e030ebSStefano Zampini ierr = ISGetSize(used_IS,&neumann_bsize);CHKERRQ(ierr); 403436e030ebSStefano Zampini ierr = ISGetIndices(used_IS,&neumann_nodes);CHKERRQ(ierr); 403553cdbc3dSStefano Zampini for(i=0;i<neumann_bsize;i++){ 403653cdbc3dSStefano Zampini iindex = neumann_nodes[i]; 4037534831adSStefano Zampini if(mat_graph->count[iindex] > NEUMANNCNT && array[iindex]==0.0){ 403853cdbc3dSStefano Zampini mat_graph->count[iindex]+=1; 40390c7d97c5SJed Brown total_counts++; 4040da1bb401SStefano Zampini array[iindex]=array[iindex]+1.0; 4041da1bb401SStefano Zampini } else 
if(array[iindex]>0.0) { 4042da1bb401SStefano Zampini SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"Error for neumann nodes provided to BDDC! They must be uniquely listed! Found duplicate node %d\n",iindex); 40430c7d97c5SJed Brown } 40440c7d97c5SJed Brown } 40450c7d97c5SJed Brown } 4046da1bb401SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 4047da1bb401SStefano Zampini /* allocate space for storing the set of neighbours for each node */ 4048da1bb401SStefano Zampini ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt*),&mat_graph->neighbours_set);CHKERRQ(ierr); 4049da1bb401SStefano Zampini if(mat_graph->nvtxs) { ierr = PetscMalloc(total_counts*sizeof(PetscInt),&mat_graph->neighbours_set[0]);CHKERRQ(ierr); } 4050da1bb401SStefano Zampini for(i=1;i<mat_graph->nvtxs;i++) mat_graph->neighbours_set[i]=mat_graph->neighbours_set[i-1]+mat_graph->count[i-1]; 4051a0ba757dSStefano Zampini ierr = PetscMemzero(mat_graph->count,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr); 40523b03a366Sstefano_zampini for(i=1;i<pcis->n_neigh;i++){ 40530c7d97c5SJed Brown s=pcis->n_shared[i]; 40540c7d97c5SJed Brown for(j=0;j<s;j++) { 40550c7d97c5SJed Brown k=pcis->shared[i][j]; 4056da1bb401SStefano Zampini mat_graph->neighbours_set[k][mat_graph->count[k]] = pcis->neigh[i]; 40570c7d97c5SJed Brown mat_graph->count[k]+=1; 40580c7d97c5SJed Brown } 40590c7d97c5SJed Brown } 4060da1bb401SStefano Zampini /* Check consistency of Neumann nodes */ 4061da1bb401SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 4062da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 4063da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 4064da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 4065da1bb401SStefano Zampini ierr = VecScatterEnd 
(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 4066da1bb401SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 40673b03a366Sstefano_zampini /* set -1 fake neighbour to mimic Neumann boundary */ 406836e030ebSStefano Zampini if(used_IS) { 406953cdbc3dSStefano Zampini for(i=0;i<neumann_bsize;i++){ 407053cdbc3dSStefano Zampini iindex = neumann_nodes[i]; 4071534831adSStefano Zampini if(mat_graph->count[iindex] > NEUMANNCNT){ 4072da1bb401SStefano Zampini if(mat_graph->count[iindex]+1 != (PetscInt)array[iindex]) { 4073da1bb401SStefano Zampini SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_USER,"Neumann nodes provided to BDDC must be consistent among neighbours!\nNode %d: number of sharing subdomains %d != number of subdomains for which it is a neumann node %d\n",iindex,mat_graph->count[iindex]+1,(PetscInt)array[iindex]); 4074da1bb401SStefano Zampini } 4075da1bb401SStefano Zampini mat_graph->neighbours_set[iindex][mat_graph->count[iindex]] = -1; 407653cdbc3dSStefano Zampini mat_graph->count[iindex]+=1; 40770c7d97c5SJed Brown } 40780c7d97c5SJed Brown } 407936e030ebSStefano Zampini ierr = ISRestoreIndices(used_IS,&neumann_nodes);CHKERRQ(ierr); 40800c7d97c5SJed Brown } 4081da1bb401SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 4082da1bb401SStefano Zampini /* sort set of sharing subdomains */ 4083da1bb401SStefano Zampini for(i=0;i<mat_graph->nvtxs;i++) { ierr = PetscSortInt(mat_graph->count[i],mat_graph->neighbours_set[i]);CHKERRQ(ierr); } 40843b03a366Sstefano_zampini /* remove interior nodes and dirichlet boundary nodes from the next search into the graph */ 4085da1bb401SStefano Zampini for(i=0;i<mat_graph->nvtxs;i++){mat_graph->touched[i]=PETSC_FALSE;} 4086da1bb401SStefano Zampini nodes_touched=0; 408736e030ebSStefano Zampini ierr = PCBDDCGetDirichletBoundaries(pc,&used_IS);CHKERRQ(ierr); 4088da1bb401SStefano Zampini ierr = VecSet(pcis->vec2_N,0.0);CHKERRQ(ierr); 4089da1bb401SStefano Zampini ierr 
= VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 4090da1bb401SStefano Zampini ierr = VecGetArray(pcis->vec2_N,&array2);CHKERRQ(ierr); 4091da1bb401SStefano Zampini if(used_IS) { 4092da1bb401SStefano Zampini ierr = ISGetSize(used_IS,&dirichlet_bsize);CHKERRQ(ierr); 4093da1bb401SStefano Zampini if(dirichlet_bsize && matis->pure_neumann) { 4094da1bb401SStefano Zampini SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"Dirichlet boundaries are intended to be used with matrices with zeroed rows!\n"); 4095da1bb401SStefano Zampini } 4096da1bb401SStefano Zampini ierr = ISGetIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr); 4097da1bb401SStefano Zampini for(i=0;i<dirichlet_bsize;i++){ 4098da1bb401SStefano Zampini iindex=dirichlet_nodes[i]; 4099da1bb401SStefano Zampini if(mat_graph->count[iindex] && !mat_graph->touched[iindex]) { 4100da1bb401SStefano Zampini if(array[iindex]>0.0) { 4101da1bb401SStefano Zampini SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"BDDC cannot have nodes which are marked as Neumann and Dirichlet at the same time! 
Wrong node %d\n",iindex); 4102da1bb401SStefano Zampini } 4103da1bb401SStefano Zampini mat_graph->touched[iindex]=PETSC_TRUE; 4104da1bb401SStefano Zampini mat_graph->where[iindex]=0; 4105da1bb401SStefano Zampini nodes_touched++; 4106da1bb401SStefano Zampini array2[iindex]=array2[iindex]+1.0; 4107da1bb401SStefano Zampini } 4108da1bb401SStefano Zampini } 4109da1bb401SStefano Zampini ierr = ISRestoreIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr); 4110da1bb401SStefano Zampini } 4111da1bb401SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 4112da1bb401SStefano Zampini ierr = VecRestoreArray(pcis->vec2_N,&array2);CHKERRQ(ierr); 4113da1bb401SStefano Zampini /* Check consistency of Dirichlet nodes */ 4114da1bb401SStefano Zampini ierr = VecSet(pcis->vec1_N,1.0);CHKERRQ(ierr); 4115da1bb401SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 4116da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 4117da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 4118da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 4119da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 4120da1bb401SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 4121da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec2_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 4122da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec2_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 4123da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 4124da1bb401SStefano Zampini ierr = VecScatterEnd 
(matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 4125da1bb401SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 4126da1bb401SStefano Zampini ierr = VecGetArray(pcis->vec2_N,&array2);CHKERRQ(ierr); 412736e030ebSStefano Zampini if(used_IS) { 412836e030ebSStefano Zampini ierr = ISGetSize(used_IS,&dirichlet_bsize);CHKERRQ(ierr); 412936e030ebSStefano Zampini ierr = ISGetIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr); 41303b03a366Sstefano_zampini for(i=0;i<dirichlet_bsize;i++){ 4131da1bb401SStefano Zampini iindex=dirichlet_nodes[i]; 4132da1bb401SStefano Zampini if(array[iindex]>1.0 && array[iindex]!=array2[iindex] ) { 4133da1bb401SStefano Zampini SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_USER,"Dirichlet nodes provided to BDDC must be consistent among neighbours!\nNode %d: number of sharing subdomains %d != number of subdomains for which it is a neumann node %d\n",iindex,(PetscInt)array[iindex],(PetscInt)array2[iindex]); 4134da1bb401SStefano Zampini } 41353b03a366Sstefano_zampini } 413636e030ebSStefano Zampini ierr = ISRestoreIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr); 41373b03a366Sstefano_zampini } 4138da1bb401SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 4139da1bb401SStefano Zampini ierr = VecRestoreArray(pcis->vec2_N,&array2);CHKERRQ(ierr); 4140da1bb401SStefano Zampini 41410c7d97c5SJed Brown for(i=0;i<mat_graph->nvtxs;i++){ 41423b03a366Sstefano_zampini if(!mat_graph->count[i]){ /* interior nodes */ 41430c7d97c5SJed Brown mat_graph->touched[i]=PETSC_TRUE; 41440c7d97c5SJed Brown mat_graph->where[i]=0; 41450c7d97c5SJed Brown nodes_touched++; 41460c7d97c5SJed Brown } 41470c7d97c5SJed Brown } 41480c7d97c5SJed Brown mat_graph->ncmps = 0; 4149da1bb401SStefano Zampini i=0; 41500c7d97c5SJed Brown while(nodes_touched<mat_graph->nvtxs) { 4151a0ba757dSStefano Zampini /* find first untouched node in local ordering */ 41520c7d97c5SJed Brown while(mat_graph->touched[i]) i++; 41530c7d97c5SJed 
Brown mat_graph->touched[i]=PETSC_TRUE; 4154a0ba757dSStefano Zampini mat_graph->where[i]=where_values; 41550c7d97c5SJed Brown nodes_touched++; 4156a0ba757dSStefano Zampini /* now find all other nodes having the same set of sharing subdomains */ 41570c7d97c5SJed Brown for(j=i+1;j<mat_graph->nvtxs;j++){ 4158a0ba757dSStefano Zampini /* check for same number of sharing subdomains and dof number */ 4159da1bb401SStefano Zampini if(!mat_graph->touched[j] && mat_graph->count[i]==mat_graph->count[j] && mat_graph->which_dof[i] == mat_graph->which_dof[j] ){ 4160a0ba757dSStefano Zampini /* check for same set of sharing subdomains */ 41610c7d97c5SJed Brown same_set=PETSC_TRUE; 41620c7d97c5SJed Brown for(k=0;k<mat_graph->count[j];k++){ 4163da1bb401SStefano Zampini if(mat_graph->neighbours_set[i][k]!=mat_graph->neighbours_set[j][k]) { 41640c7d97c5SJed Brown same_set=PETSC_FALSE; 41650c7d97c5SJed Brown } 41660c7d97c5SJed Brown } 4167a0ba757dSStefano Zampini /* I found a friend of mine */ 41680c7d97c5SJed Brown if(same_set) { 4169a0ba757dSStefano Zampini mat_graph->where[j]=where_values; 41700c7d97c5SJed Brown mat_graph->touched[j]=PETSC_TRUE; 41710c7d97c5SJed Brown nodes_touched++; 41720c7d97c5SJed Brown } 41730c7d97c5SJed Brown } 41740c7d97c5SJed Brown } 4175a0ba757dSStefano Zampini where_values++; 41760c7d97c5SJed Brown } 4177a0ba757dSStefano Zampini where_values--; if(where_values<0) where_values=0; 4178a0ba757dSStefano Zampini ierr = PetscMalloc(where_values*sizeof(PetscMPIInt),&mat_graph->where_ncmps);CHKERRQ(ierr); 4179a0ba757dSStefano Zampini /* Find connected components defined on the shared interface */ 4180a0ba757dSStefano Zampini if(where_values) { 4181a0ba757dSStefano Zampini ierr = PCBDDCFindConnectedComponents(mat_graph, where_values); 41823b03a366Sstefano_zampini /* For consistency among neughbouring procs, I need to sort (by global ordering) each connected component */ 4183a0ba757dSStefano Zampini for(i=0;i<mat_graph->ncmps;i++) { 4184a0ba757dSStefano Zampini ierr 
= ISLocalToGlobalMappingApply(matis->mapping,mat_graph->cptr[i+1]-mat_graph->cptr[i],&mat_graph->queue[mat_graph->cptr[i]],&queue_in_global_numbering[mat_graph->cptr[i]]);CHKERRQ(ierr); 4185a0ba757dSStefano Zampini ierr = PetscSortIntWithArray(mat_graph->cptr[i+1]-mat_graph->cptr[i],&queue_in_global_numbering[mat_graph->cptr[i]],&mat_graph->queue[mat_graph->cptr[i]]);CHKERRQ(ierr); 4186a0ba757dSStefano Zampini } 4187a0ba757dSStefano Zampini } 4188a0ba757dSStefano Zampini /* check consistency of connected components among neighbouring subdomains -> it adapt them in case it is needed */ 4189a0ba757dSStefano Zampini for(i=0;i<where_values;i++) { 41903b03a366Sstefano_zampini /* We are not sure that two connected components will be the same among subdomains sharing a subset of local interface */ 41913b03a366Sstefano_zampini if(mat_graph->where_ncmps[i]>1) { 4192a0ba757dSStefano Zampini adapt_interface=1; 4193a0ba757dSStefano Zampini break; 4194a0ba757dSStefano Zampini } 4195a0ba757dSStefano Zampini } 4196a0ba757dSStefano Zampini ierr = MPI_Allreduce(&adapt_interface,&adapt_interface_reduced,1,MPIU_INT,MPI_LOR,interface_comm);CHKERRQ(ierr); 4197da1bb401SStefano Zampini if(pcbddc->dbg_flag && adapt_interface_reduced) { 4198da1bb401SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Interface adapted\n");CHKERRQ(ierr); 4199da1bb401SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 4200da1bb401SStefano Zampini } 4201a0ba757dSStefano Zampini if(where_values && adapt_interface_reduced) { 42020c7d97c5SJed Brown 4203a0ba757dSStefano Zampini PetscInt sum_requests=0,my_rank; 4204a0ba757dSStefano Zampini PetscInt buffer_size,start_of_recv,size_of_recv,start_of_send; 4205a0ba757dSStefano Zampini PetscInt temp_buffer_size,ins_val,global_where_counter; 4206a0ba757dSStefano Zampini PetscInt *cum_recv_counts; 4207a0ba757dSStefano Zampini PetscInt *where_to_nodes_indices; 4208a0ba757dSStefano Zampini PetscInt *petsc_buffer; 4209a0ba757dSStefano Zampini PetscMPIInt 
*recv_buffer; 4210a0ba757dSStefano Zampini PetscMPIInt *recv_buffer_where; 4211a0ba757dSStefano Zampini PetscMPIInt *send_buffer; 4212a0ba757dSStefano Zampini PetscMPIInt size_of_send; 4213a0ba757dSStefano Zampini PetscInt *sizes_of_sends; 4214a0ba757dSStefano Zampini MPI_Request *send_requests; 4215a0ba757dSStefano Zampini MPI_Request *recv_requests; 4216a0ba757dSStefano Zampini PetscInt *where_cc_adapt; 4217a0ba757dSStefano Zampini PetscInt **temp_buffer; 4218a0ba757dSStefano Zampini PetscInt *nodes_to_temp_buffer_indices; 4219a0ba757dSStefano Zampini PetscInt *add_to_where; 4220a0ba757dSStefano Zampini 4221a0ba757dSStefano Zampini ierr = MPI_Comm_rank(interface_comm,&my_rank);CHKERRQ(ierr); 4222a0ba757dSStefano Zampini ierr = PetscMalloc((where_values+1)*sizeof(PetscInt),&cum_recv_counts);CHKERRQ(ierr); 4223a0ba757dSStefano Zampini ierr = PetscMemzero(cum_recv_counts,(where_values+1)*sizeof(PetscInt));CHKERRQ(ierr); 4224a0ba757dSStefano Zampini ierr = PetscMalloc(where_values*sizeof(PetscInt),&where_to_nodes_indices);CHKERRQ(ierr); 4225a0ba757dSStefano Zampini /* first count how many neighbours per connected component I will receive from */ 4226a0ba757dSStefano Zampini cum_recv_counts[0]=0; 4227a0ba757dSStefano Zampini for(i=1;i<where_values+1;i++){ 4228a0ba757dSStefano Zampini j=0; 4229a0ba757dSStefano Zampini while(mat_graph->where[j] != i) j++; 4230a0ba757dSStefano Zampini where_to_nodes_indices[i-1]=j; 4231da1bb401SStefano Zampini if(mat_graph->neighbours_set[j][0]!=-1) { cum_recv_counts[i]=cum_recv_counts[i-1]+mat_graph->count[j]; } /* We don't want sends/recvs_to/from_self -> here I don't count myself */ 42323b03a366Sstefano_zampini else { cum_recv_counts[i]=cum_recv_counts[i-1]+mat_graph->count[j]-1; } 4233a0ba757dSStefano Zampini } 4234a0ba757dSStefano Zampini buffer_size=2*cum_recv_counts[where_values]+mat_graph->nvtxs; 4235a0ba757dSStefano Zampini ierr = PetscMalloc(2*cum_recv_counts[where_values]*sizeof(PetscMPIInt),&recv_buffer_where);CHKERRQ(ierr); 
4236a0ba757dSStefano Zampini ierr = PetscMalloc(buffer_size*sizeof(PetscMPIInt),&send_buffer);CHKERRQ(ierr); 4237a0ba757dSStefano Zampini ierr = PetscMalloc(cum_recv_counts[where_values]*sizeof(MPI_Request),&send_requests);CHKERRQ(ierr); 4238a0ba757dSStefano Zampini ierr = PetscMalloc(cum_recv_counts[where_values]*sizeof(MPI_Request),&recv_requests);CHKERRQ(ierr); 4239a0ba757dSStefano Zampini for(i=0;i<cum_recv_counts[where_values];i++) { 4240a0ba757dSStefano Zampini send_requests[i]=MPI_REQUEST_NULL; 4241a0ba757dSStefano Zampini recv_requests[i]=MPI_REQUEST_NULL; 4242a0ba757dSStefano Zampini } 4243a0ba757dSStefano Zampini /* exchange with my neighbours the number of my connected components on the shared interface */ 4244a0ba757dSStefano Zampini for(i=0;i<where_values;i++){ 4245a0ba757dSStefano Zampini j=where_to_nodes_indices[i]; 4246da1bb401SStefano Zampini k = (mat_graph->neighbours_set[j][0] == -1 ? 1 : 0); 4247a0ba757dSStefano Zampini for(;k<mat_graph->count[j];k++){ 4248da1bb401SStefano Zampini ierr = MPI_Isend(&mat_graph->where_ncmps[i],1,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr); 4249da1bb401SStefano Zampini ierr = MPI_Irecv(&recv_buffer_where[sum_requests],1,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr); 4250a0ba757dSStefano Zampini sum_requests++; 4251a0ba757dSStefano Zampini } 4252a0ba757dSStefano Zampini } 4253a0ba757dSStefano Zampini ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 4254a0ba757dSStefano Zampini ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 4255a0ba757dSStefano Zampini /* determine the connected component I need to adapt */ 4256a0ba757dSStefano Zampini ierr = PetscMalloc(where_values*sizeof(PetscInt),&where_cc_adapt);CHKERRQ(ierr); 4257a0ba757dSStefano Zampini ierr = 
PetscMemzero(where_cc_adapt,where_values*sizeof(PetscInt));CHKERRQ(ierr); 4258a0ba757dSStefano Zampini for(i=0;i<where_values;i++){ 4259a0ba757dSStefano Zampini for(j=cum_recv_counts[i];j<cum_recv_counts[i+1];j++){ 42603b03a366Sstefano_zampini /* The first condition is natural (i.e someone has a different number of cc than me), the second one is just to be safe */ 42613b03a366Sstefano_zampini if( mat_graph->where_ncmps[i]!=recv_buffer_where[j] || mat_graph->where_ncmps[i] > 1 ) { 4262a0ba757dSStefano Zampini where_cc_adapt[i]=PETSC_TRUE; 4263a0ba757dSStefano Zampini break; 4264a0ba757dSStefano Zampini } 4265a0ba757dSStefano Zampini } 4266a0ba757dSStefano Zampini } 4267a0ba757dSStefano Zampini /* now get from neighbours their ccs (in global numbering) and adapt them (in case it is needed) */ 4268a0ba757dSStefano Zampini /* first determine how much data to send (size of each queue plus the global indices) and communicate it to neighbours */ 4269a0ba757dSStefano Zampini ierr = PetscMalloc(where_values*sizeof(PetscInt),&sizes_of_sends);CHKERRQ(ierr); 4270a0ba757dSStefano Zampini ierr = PetscMemzero(sizes_of_sends,where_values*sizeof(PetscInt));CHKERRQ(ierr); 4271a0ba757dSStefano Zampini sum_requests=0; 4272a0ba757dSStefano Zampini start_of_send=0; 4273a0ba757dSStefano Zampini start_of_recv=cum_recv_counts[where_values]; 4274a0ba757dSStefano Zampini for(i=0;i<where_values;i++) { 4275a0ba757dSStefano Zampini if(where_cc_adapt[i]) { 4276a0ba757dSStefano Zampini size_of_send=0; 4277a0ba757dSStefano Zampini for(j=i;j<mat_graph->ncmps;j++) { 4278a0ba757dSStefano Zampini if(mat_graph->where[mat_graph->queue[mat_graph->cptr[j]]] == i+1) { /* WARNING -> where values goes from 1 to where_values included */ 4279a0ba757dSStefano Zampini send_buffer[start_of_send+size_of_send]=mat_graph->cptr[j+1]-mat_graph->cptr[j]; 4280a0ba757dSStefano Zampini size_of_send+=1; 4281a0ba757dSStefano Zampini for(k=0;k<mat_graph->cptr[j+1]-mat_graph->cptr[j];k++) { 4282a0ba757dSStefano Zampini 
send_buffer[start_of_send+size_of_send+k]=queue_in_global_numbering[mat_graph->cptr[j]+k]; 4283a0ba757dSStefano Zampini } 4284a0ba757dSStefano Zampini size_of_send=size_of_send+mat_graph->cptr[j+1]-mat_graph->cptr[j]; 4285a0ba757dSStefano Zampini } 4286a0ba757dSStefano Zampini } 4287a0ba757dSStefano Zampini j = where_to_nodes_indices[i]; 4288da1bb401SStefano Zampini k = (mat_graph->neighbours_set[j][0] == -1 ? 1 : 0); 428911d8f4c2SStefano Zampini sizes_of_sends[i]=size_of_send; 4290a0ba757dSStefano Zampini for(;k<mat_graph->count[j];k++){ 429111d8f4c2SStefano Zampini ierr = MPI_Isend(&sizes_of_sends[i],1,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr); 4292da1bb401SStefano Zampini ierr = MPI_Irecv(&recv_buffer_where[sum_requests+start_of_recv],1,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr); 4293a0ba757dSStefano Zampini sum_requests++; 4294a0ba757dSStefano Zampini } 4295a0ba757dSStefano Zampini start_of_send+=size_of_send; 4296a0ba757dSStefano Zampini } 4297a0ba757dSStefano Zampini } 4298a0ba757dSStefano Zampini ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 4299a0ba757dSStefano Zampini ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 4300a0ba757dSStefano Zampini buffer_size=0; 4301a0ba757dSStefano Zampini for(k=0;k<sum_requests;k++) { buffer_size+=recv_buffer_where[start_of_recv+k]; } 4302a0ba757dSStefano Zampini ierr = PetscMalloc(buffer_size*sizeof(PetscMPIInt),&recv_buffer);CHKERRQ(ierr); 4303a0ba757dSStefano Zampini /* now exchange the data */ 4304a0ba757dSStefano Zampini start_of_recv=0; 4305a0ba757dSStefano Zampini start_of_send=0; 4306a0ba757dSStefano Zampini sum_requests=0; 4307a0ba757dSStefano Zampini for(i=0;i<where_values;i++) { 4308a0ba757dSStefano Zampini if(where_cc_adapt[i]) { 
4309a0ba757dSStefano Zampini size_of_send = sizes_of_sends[i]; 4310a0ba757dSStefano Zampini j = where_to_nodes_indices[i]; 4311da1bb401SStefano Zampini k = (mat_graph->neighbours_set[j][0] == -1 ? 1 : 0); 4312a0ba757dSStefano Zampini for(;k<mat_graph->count[j];k++){ 4313da1bb401SStefano Zampini ierr = MPI_Isend(&send_buffer[start_of_send],size_of_send,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr); 4314a0ba757dSStefano Zampini size_of_recv=recv_buffer_where[cum_recv_counts[where_values]+sum_requests]; 4315da1bb401SStefano Zampini ierr = MPI_Irecv(&recv_buffer[start_of_recv],size_of_recv,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr); 4316a0ba757dSStefano Zampini start_of_recv+=size_of_recv; 4317a0ba757dSStefano Zampini sum_requests++; 4318a0ba757dSStefano Zampini } 4319a0ba757dSStefano Zampini start_of_send+=size_of_send; 4320a0ba757dSStefano Zampini } 4321a0ba757dSStefano Zampini } 4322a0ba757dSStefano Zampini ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 4323a0ba757dSStefano Zampini ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 4324a0ba757dSStefano Zampini ierr = PetscMalloc(buffer_size*sizeof(PetscInt),&petsc_buffer);CHKERRQ(ierr); 4325a0ba757dSStefano Zampini for(k=0;k<start_of_recv;k++) { petsc_buffer[k]=(PetscInt)recv_buffer[k]; } 4326a0ba757dSStefano Zampini for(j=0;j<buffer_size;) { 4327a0ba757dSStefano Zampini ierr = ISGlobalToLocalMappingApply(matis->mapping,IS_GTOLM_MASK,petsc_buffer[j],&petsc_buffer[j+1],&petsc_buffer[j],&petsc_buffer[j+1]);CHKERRQ(ierr); 4328a0ba757dSStefano Zampini k=petsc_buffer[j]+1; 4329a0ba757dSStefano Zampini j+=k; 4330a0ba757dSStefano Zampini } 4331a0ba757dSStefano Zampini sum_requests=cum_recv_counts[where_values]; 4332a0ba757dSStefano Zampini start_of_recv=0; 
4333a0ba757dSStefano Zampini ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt),&nodes_to_temp_buffer_indices);CHKERRQ(ierr); 4334a0ba757dSStefano Zampini global_where_counter=0; 4335a0ba757dSStefano Zampini for(i=0;i<where_values;i++){ 4336a0ba757dSStefano Zampini if(where_cc_adapt[i]){ 4337a0ba757dSStefano Zampini temp_buffer_size=0; 4338a0ba757dSStefano Zampini /* find nodes on the shared interface we need to adapt */ 4339a0ba757dSStefano Zampini for(j=0;j<mat_graph->nvtxs;j++){ 4340a0ba757dSStefano Zampini if(mat_graph->where[j]==i+1) { 4341a0ba757dSStefano Zampini nodes_to_temp_buffer_indices[j]=temp_buffer_size; 4342a0ba757dSStefano Zampini temp_buffer_size++; 4343a0ba757dSStefano Zampini } else { 4344a0ba757dSStefano Zampini nodes_to_temp_buffer_indices[j]=-1; 4345a0ba757dSStefano Zampini } 4346a0ba757dSStefano Zampini } 4347a0ba757dSStefano Zampini /* allocate some temporary space */ 4348a0ba757dSStefano Zampini ierr = PetscMalloc(temp_buffer_size*sizeof(PetscInt*),&temp_buffer);CHKERRQ(ierr); 4349a0ba757dSStefano Zampini ierr = PetscMalloc(temp_buffer_size*(cum_recv_counts[i+1]-cum_recv_counts[i])*sizeof(PetscInt),&temp_buffer[0]);CHKERRQ(ierr); 4350a0ba757dSStefano Zampini ierr = PetscMemzero(temp_buffer[0],temp_buffer_size*(cum_recv_counts[i+1]-cum_recv_counts[i])*sizeof(PetscInt));CHKERRQ(ierr); 4351a0ba757dSStefano Zampini for(j=1;j<temp_buffer_size;j++){ 4352a0ba757dSStefano Zampini temp_buffer[j]=temp_buffer[j-1]+cum_recv_counts[i+1]-cum_recv_counts[i]; 4353a0ba757dSStefano Zampini } 4354a0ba757dSStefano Zampini /* analyze contributions from neighbouring subdomains for i-th conn comp 4355a0ba757dSStefano Zampini temp buffer structure: 4356a0ba757dSStefano Zampini supposing part of the interface has dimension 5 (global nodes 0,1,2,3,4) 4357a0ba757dSStefano Zampini 3 neighs procs with structured connected components: 4358a0ba757dSStefano Zampini neigh 0: [0 1 4], [2 3]; (2 connected components) 4359a0ba757dSStefano Zampini neigh 1: [0 1], [2 3 4]; (2 
connected components) 4360a0ba757dSStefano Zampini neigh 2: [0 4], [1], [2 3]; (3 connected components) 4361a0ba757dSStefano Zampini tempbuffer (row-oriented) should be filled as: 4362a0ba757dSStefano Zampini [ 0, 0, 0; 4363a0ba757dSStefano Zampini 0, 0, 1; 4364a0ba757dSStefano Zampini 1, 1, 2; 4365a0ba757dSStefano Zampini 1, 1, 2; 4366a0ba757dSStefano Zampini 0, 1, 0; ]; 4367a0ba757dSStefano Zampini This way we can simply recover the resulting structure account for possible intersections of ccs among neighs. 4368a0ba757dSStefano Zampini The mat_graph->where array will be modified to reproduce the following 4 connected components [0], [1], [2 3], [4]; 4369a0ba757dSStefano Zampini */ 4370a0ba757dSStefano Zampini for(j=0;j<cum_recv_counts[i+1]-cum_recv_counts[i];j++) { 4371a0ba757dSStefano Zampini ins_val=0; 4372a0ba757dSStefano Zampini size_of_recv=recv_buffer_where[sum_requests]; /* total size of recv from neighs */ 4373a0ba757dSStefano Zampini for(buffer_size=0;buffer_size<size_of_recv;) { /* loop until all data from neighs has been taken into account */ 4374a0ba757dSStefano Zampini for(k=1;k<petsc_buffer[buffer_size+start_of_recv]+1;k++) { /* filling properly temp_buffer using data from a single recv */ 4375a0ba757dSStefano Zampini temp_buffer[ nodes_to_temp_buffer_indices[ petsc_buffer[ start_of_recv+buffer_size+k ] ] ][j]=ins_val; 4376a0ba757dSStefano Zampini } 4377a0ba757dSStefano Zampini buffer_size+=k; 4378a0ba757dSStefano Zampini ins_val++; 4379a0ba757dSStefano Zampini } 4380a0ba757dSStefano Zampini start_of_recv+=size_of_recv; 4381a0ba757dSStefano Zampini sum_requests++; 4382a0ba757dSStefano Zampini } 4383a0ba757dSStefano Zampini ierr = PetscMalloc(temp_buffer_size*sizeof(PetscInt),&add_to_where);CHKERRQ(ierr); 4384a0ba757dSStefano Zampini ierr = PetscMemzero(add_to_where,temp_buffer_size*sizeof(PetscInt));CHKERRQ(ierr); 4385a0ba757dSStefano Zampini for(j=0;j<temp_buffer_size;j++){ 4386a0ba757dSStefano Zampini if(!add_to_where[j]){ /* found a new cc */ 
4387a0ba757dSStefano Zampini global_where_counter++; 4388a0ba757dSStefano Zampini add_to_where[j]=global_where_counter; 4389a0ba757dSStefano Zampini for(k=j+1;k<temp_buffer_size;k++){ /* check for other nodes in new cc */ 4390a0ba757dSStefano Zampini same_set=PETSC_TRUE; 4391a0ba757dSStefano Zampini for(s=0;s<cum_recv_counts[i+1]-cum_recv_counts[i];s++){ 4392a0ba757dSStefano Zampini if(temp_buffer[j][s]!=temp_buffer[k][s]) { 4393a0ba757dSStefano Zampini same_set=PETSC_FALSE; 4394a0ba757dSStefano Zampini break; 4395a0ba757dSStefano Zampini } 4396a0ba757dSStefano Zampini } 4397a0ba757dSStefano Zampini if(same_set) add_to_where[k]=global_where_counter; 4398a0ba757dSStefano Zampini } 4399a0ba757dSStefano Zampini } 4400a0ba757dSStefano Zampini } 4401a0ba757dSStefano Zampini /* insert new data in where array */ 4402a0ba757dSStefano Zampini temp_buffer_size=0; 4403a0ba757dSStefano Zampini for(j=0;j<mat_graph->nvtxs;j++){ 4404a0ba757dSStefano Zampini if(mat_graph->where[j]==i+1) { 4405a0ba757dSStefano Zampini mat_graph->where[j]=where_values+add_to_where[temp_buffer_size]; 4406a0ba757dSStefano Zampini temp_buffer_size++; 4407a0ba757dSStefano Zampini } 4408a0ba757dSStefano Zampini } 4409a0ba757dSStefano Zampini ierr = PetscFree(temp_buffer[0]);CHKERRQ(ierr); 4410a0ba757dSStefano Zampini ierr = PetscFree(temp_buffer);CHKERRQ(ierr); 4411a0ba757dSStefano Zampini ierr = PetscFree(add_to_where);CHKERRQ(ierr); 4412a0ba757dSStefano Zampini } 4413a0ba757dSStefano Zampini } 4414a0ba757dSStefano Zampini ierr = PetscFree(nodes_to_temp_buffer_indices);CHKERRQ(ierr); 4415a0ba757dSStefano Zampini ierr = PetscFree(sizes_of_sends);CHKERRQ(ierr); 4416a0ba757dSStefano Zampini ierr = PetscFree(send_requests);CHKERRQ(ierr); 4417a0ba757dSStefano Zampini ierr = PetscFree(recv_requests);CHKERRQ(ierr); 4418a0ba757dSStefano Zampini ierr = PetscFree(petsc_buffer);CHKERRQ(ierr); 4419a0ba757dSStefano Zampini ierr = PetscFree(recv_buffer);CHKERRQ(ierr); 4420a0ba757dSStefano Zampini ierr = 
PetscFree(recv_buffer_where);CHKERRQ(ierr); 4421a0ba757dSStefano Zampini ierr = PetscFree(send_buffer);CHKERRQ(ierr); 4422a0ba757dSStefano Zampini ierr = PetscFree(cum_recv_counts);CHKERRQ(ierr); 4423a0ba757dSStefano Zampini ierr = PetscFree(where_to_nodes_indices);CHKERRQ(ierr); 442423d4d1a5SStefano Zampini ierr = PetscFree(where_cc_adapt);CHKERRQ(ierr); 4425a0ba757dSStefano Zampini /* We are ready to evaluate consistent connected components on each part of the shared interface */ 4426a0ba757dSStefano Zampini if(global_where_counter) { 4427a0ba757dSStefano Zampini for(i=0;i<mat_graph->nvtxs;i++){ mat_graph->touched[i]=PETSC_FALSE; } 4428a0ba757dSStefano Zampini global_where_counter=0; 4429a0ba757dSStefano Zampini for(i=0;i<mat_graph->nvtxs;i++){ 4430a0ba757dSStefano Zampini if(mat_graph->where[i] && !mat_graph->touched[i]) { 4431a0ba757dSStefano Zampini global_where_counter++; 4432a0ba757dSStefano Zampini for(j=i+1;j<mat_graph->nvtxs;j++){ 4433a0ba757dSStefano Zampini if(!mat_graph->touched[j] && mat_graph->where[j]==mat_graph->where[i]) { 4434a0ba757dSStefano Zampini mat_graph->where[j]=global_where_counter; 4435a0ba757dSStefano Zampini mat_graph->touched[j]=PETSC_TRUE; 4436a0ba757dSStefano Zampini } 4437a0ba757dSStefano Zampini } 4438a0ba757dSStefano Zampini mat_graph->where[i]=global_where_counter; 4439a0ba757dSStefano Zampini mat_graph->touched[i]=PETSC_TRUE; 4440a0ba757dSStefano Zampini } 4441a0ba757dSStefano Zampini } 4442a0ba757dSStefano Zampini where_values=global_where_counter; 4443a0ba757dSStefano Zampini } 4444a0ba757dSStefano Zampini if(global_where_counter) { 4445a0ba757dSStefano Zampini ierr = PetscMemzero(mat_graph->cptr,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr); 4446a0ba757dSStefano Zampini ierr = PetscMemzero(mat_graph->queue,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr); 4447a0ba757dSStefano Zampini ierr = PetscFree(mat_graph->where_ncmps);CHKERRQ(ierr); 4448a0ba757dSStefano Zampini ierr = 
PetscMalloc(where_values*sizeof(PetscMPIInt),&mat_graph->where_ncmps);CHKERRQ(ierr); 4449a0ba757dSStefano Zampini ierr = PCBDDCFindConnectedComponents(mat_graph, where_values); 4450a0ba757dSStefano Zampini for(i=0;i<mat_graph->ncmps;i++) { 4451a0ba757dSStefano Zampini ierr = ISLocalToGlobalMappingApply(matis->mapping,mat_graph->cptr[i+1]-mat_graph->cptr[i],&mat_graph->queue[mat_graph->cptr[i]],&queue_in_global_numbering[mat_graph->cptr[i]]);CHKERRQ(ierr); 4452a0ba757dSStefano Zampini ierr = PetscSortIntWithArray(mat_graph->cptr[i+1]-mat_graph->cptr[i],&queue_in_global_numbering[mat_graph->cptr[i]],&mat_graph->queue[mat_graph->cptr[i]]);CHKERRQ(ierr); 4453a0ba757dSStefano Zampini } 4454a0ba757dSStefano Zampini } 44553b03a366Sstefano_zampini } /* Finished adapting interface */ 44560c7d97c5SJed Brown PetscInt nfc=0; 44570c7d97c5SJed Brown PetscInt nec=0; 44580c7d97c5SJed Brown PetscInt nvc=0; 44593b03a366Sstefano_zampini PetscBool twodim_flag=PETSC_FALSE; 44600c7d97c5SJed Brown for (i=0; i<mat_graph->ncmps; i++) { 44613b03a366Sstefano_zampini if( mat_graph->cptr[i+1]-mat_graph->cptr[i] > vertex_size ){ 4462534831adSStefano Zampini if(mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]==1){ /* 1 neigh Neumann fake included */ 44630c7d97c5SJed Brown nfc++; 44643b03a366Sstefano_zampini } else { /* note that nec will be zero in 2d */ 44653b03a366Sstefano_zampini nec++; 44663b03a366Sstefano_zampini } 44670c7d97c5SJed Brown } else { 44683b03a366Sstefano_zampini nvc+=mat_graph->cptr[i+1]-mat_graph->cptr[i]; 44693b03a366Sstefano_zampini } 44703b03a366Sstefano_zampini } 44713b03a366Sstefano_zampini 44723b03a366Sstefano_zampini if(!nec) { /* we are in a 2d case -> no faces, only edges */ 44733b03a366Sstefano_zampini nec = nfc; 44743b03a366Sstefano_zampini nfc = 0; 44753b03a366Sstefano_zampini twodim_flag = PETSC_TRUE; 44763b03a366Sstefano_zampini } 44773972b0daSStefano Zampini /* allocate IS arrays for faces, edges. Vertices need a single index set. 
*/ 44783972b0daSStefano Zampini k=0; 44793972b0daSStefano Zampini for (i=0; i<mat_graph->ncmps; i++) { 44803972b0daSStefano Zampini j=mat_graph->cptr[i+1]-mat_graph->cptr[i]; 44813972b0daSStefano Zampini if( j > k) { 44823972b0daSStefano Zampini k=j; 44833972b0daSStefano Zampini } 4484ba1573a8SStefano Zampini if(j<=vertex_size) { 4485ba1573a8SStefano Zampini k+=vertex_size; 4486ba1573a8SStefano Zampini } 44873972b0daSStefano Zampini } 44883972b0daSStefano Zampini ierr = PetscMalloc(k*sizeof(PetscInt),&auxis);CHKERRQ(ierr); 44893972b0daSStefano Zampini 44903b03a366Sstefano_zampini if(!pcbddc->vertices_flag && !pcbddc->edges_flag) { 44913b03a366Sstefano_zampini ierr = PetscMalloc(nfc*sizeof(IS),&pcbddc->ISForFaces);CHKERRQ(ierr); 44923b03a366Sstefano_zampini use_faces=PETSC_TRUE; 44933b03a366Sstefano_zampini } 44943b03a366Sstefano_zampini if(!pcbddc->vertices_flag && !pcbddc->faces_flag) { 44953b03a366Sstefano_zampini ierr = PetscMalloc(nec*sizeof(IS),&pcbddc->ISForEdges);CHKERRQ(ierr); 44963b03a366Sstefano_zampini use_edges=PETSC_TRUE; 44973b03a366Sstefano_zampini } 44983b03a366Sstefano_zampini nfc=0; 44993b03a366Sstefano_zampini nec=0; 45003b03a366Sstefano_zampini for (i=0; i<mat_graph->ncmps; i++) { 45013b03a366Sstefano_zampini if( mat_graph->cptr[i+1]-mat_graph->cptr[i] > vertex_size ){ 45023b03a366Sstefano_zampini for(j=0;j<mat_graph->cptr[i+1]-mat_graph->cptr[i];j++) { 45033972b0daSStefano Zampini auxis[j]=mat_graph->queue[mat_graph->cptr[i]+j]; 45043b03a366Sstefano_zampini } 45053b03a366Sstefano_zampini if(mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]==1){ 45063b03a366Sstefano_zampini if(twodim_flag) { 45073b03a366Sstefano_zampini if(use_edges) { 45083972b0daSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForEdges[nec]);CHKERRQ(ierr); 45093b03a366Sstefano_zampini nec++; 45103b03a366Sstefano_zampini } 45113b03a366Sstefano_zampini } else { 45123b03a366Sstefano_zampini if(use_faces) { 45133972b0daSStefano 
Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForFaces[nfc]);CHKERRQ(ierr); 45143b03a366Sstefano_zampini nfc++; 45153b03a366Sstefano_zampini } 45163b03a366Sstefano_zampini } 45173b03a366Sstefano_zampini } else { 45183b03a366Sstefano_zampini if(use_edges) { 45193972b0daSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForEdges[nec]);CHKERRQ(ierr); 45200c7d97c5SJed Brown nec++; 45210c7d97c5SJed Brown } 45220c7d97c5SJed Brown } 45230c7d97c5SJed Brown } 45243b03a366Sstefano_zampini } 45253b03a366Sstefano_zampini pcbddc->n_ISForFaces=nfc; 45263b03a366Sstefano_zampini pcbddc->n_ISForEdges=nec; 45273b03a366Sstefano_zampini nvc=0; 45280c7d97c5SJed Brown if( !pcbddc->constraints_flag ) { 45293b03a366Sstefano_zampini for (i=0; i<mat_graph->ncmps; i++) { 45303b03a366Sstefano_zampini if( mat_graph->cptr[i+1]-mat_graph->cptr[i] <= vertex_size ){ 45313b03a366Sstefano_zampini for( j=mat_graph->cptr[i];j<mat_graph->cptr[i+1];j++) { 45323972b0daSStefano Zampini auxis[nvc]=mat_graph->queue[j]; 45330c7d97c5SJed Brown nvc++; 45340c7d97c5SJed Brown } 45350c7d97c5SJed Brown } 45360c7d97c5SJed Brown } 45370c7d97c5SJed Brown } 4538a0ba757dSStefano Zampini /* sort vertex set (by local ordering) */ 45393972b0daSStefano Zampini ierr = PetscSortInt(nvc,auxis);CHKERRQ(ierr); 45403972b0daSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,nvc,auxis,PETSC_COPY_VALUES,&pcbddc->ISForVertices);CHKERRQ(ierr); 45410c7d97c5SJed Brown 4542e269702eSStefano Zampini if(pcbddc->dbg_flag) { 4543e269702eSStefano Zampini 4544d49ef151SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr); 4545d49ef151SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Details from PCBDDCManageLocalBoundaries for subdomain %04d\n",PetscGlobalRank);CHKERRQ(ierr); 4546d49ef151SStefano Zampini ierr = 
PetscViewerASCIISynchronizedPrintf(viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr); 4547a0ba757dSStefano Zampini /* ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Graph (adjacency structure) of local Neumann mat\n");CHKERRQ(ierr); 4548a0ba757dSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr); 4549e269702eSStefano Zampini for(i=0;i<mat_graph->nvtxs;i++) { 4550a0ba757dSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Nodes connected to node number %d are %d\n",i,mat_graph->xadj[i+1]-mat_graph->xadj[i]);CHKERRQ(ierr); 4551e269702eSStefano Zampini for(j=mat_graph->xadj[i];j<mat_graph->xadj[i+1];j++){ 4552a0ba757dSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d ",mat_graph->adjncy[j]);CHKERRQ(ierr); 4553e269702eSStefano Zampini } 4554a0ba757dSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n--------------------------------------------------------------\n");CHKERRQ(ierr); 4555da1bb401SStefano Zampini }*/ 4556d49ef151SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Matrix graph has %d connected components", mat_graph->ncmps);CHKERRQ(ierr); 45570c7d97c5SJed Brown for(i=0;i<mat_graph->ncmps;i++) { 45583b03a366Sstefano_zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\nDetails for connected component number %02d: size %04d, count %01d. 
Nodes follow.\n", 45593b03a366Sstefano_zampini i,mat_graph->cptr[i+1]-mat_graph->cptr[i],mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]);CHKERRQ(ierr); 4560da1bb401SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"subdomains: "); 4561da1bb401SStefano Zampini for (j=0;j<mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]; j++) { 4562da1bb401SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d ",mat_graph->neighbours_set[mat_graph->queue[mat_graph->cptr[i]]][j]); 4563da1bb401SStefano Zampini } 4564da1bb401SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n"); 45650c7d97c5SJed Brown for (j=mat_graph->cptr[i]; j<mat_graph->cptr[i+1]; j++){ 4566da1bb401SStefano Zampini /* ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d (%d), ",queue_in_global_numbering[j],mat_graph->queue[j]);CHKERRQ(ierr); */ 4567da1bb401SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d, ",mat_graph->queue[j]);CHKERRQ(ierr); 45680c7d97c5SJed Brown } 45690c7d97c5SJed Brown } 4570da1bb401SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n--------------------------------------------------------------\n");CHKERRQ(ierr); 45713b03a366Sstefano_zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local vertices\n",PetscGlobalRank,nvc);CHKERRQ(ierr); 45723b03a366Sstefano_zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local faces\n",PetscGlobalRank,nfc);CHKERRQ(ierr); 45733b03a366Sstefano_zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local edges\n",PetscGlobalRank,nec);CHKERRQ(ierr); 4574d49ef151SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 45750c7d97c5SJed Brown } 45760c7d97c5SJed Brown 45773972b0daSStefano Zampini ierr = PetscFree(queue_in_global_numbering);CHKERRQ(ierr); 45783972b0daSStefano Zampini ierr = PetscFree(auxis);CHKERRQ(ierr); 45790c7d97c5SJed Brown 
PetscFunctionReturn(0); 45800c7d97c5SJed Brown 45810c7d97c5SJed Brown } 45820c7d97c5SJed Brown 45830c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 45840c7d97c5SJed Brown 45850c7d97c5SJed Brown /* The following code has been adapted from function IsConnectedSubdomain contained 4586da1bb401SStefano Zampini in source file contig.c of METIS library (version 5.0.1) 4587da1bb401SStefano Zampini It finds connected components of each partition labeled from 1 to n_dist */ 45880c7d97c5SJed Brown 45890c7d97c5SJed Brown #undef __FUNCT__ 45900c7d97c5SJed Brown #define __FUNCT__ "PCBDDCFindConnectedComponents" 45919c0446d6SStefano Zampini static PetscErrorCode PCBDDCFindConnectedComponents(PCBDDCGraph graph, PetscInt n_dist ) 45920c7d97c5SJed Brown { 45930c7d97c5SJed Brown PetscInt i, j, k, nvtxs, first, last, nleft, ncmps,pid,cum_queue,n,ncmps_pid; 45940c7d97c5SJed Brown PetscInt *xadj, *adjncy, *where, *queue; 45950c7d97c5SJed Brown PetscInt *cptr; 45960c7d97c5SJed Brown PetscBool *touched; 45970c7d97c5SJed Brown 45980c7d97c5SJed Brown PetscFunctionBegin; 45990c7d97c5SJed Brown 46000c7d97c5SJed Brown nvtxs = graph->nvtxs; 46010c7d97c5SJed Brown xadj = graph->xadj; 46020c7d97c5SJed Brown adjncy = graph->adjncy; 46030c7d97c5SJed Brown where = graph->where; 46040c7d97c5SJed Brown touched = graph->touched; 46050c7d97c5SJed Brown queue = graph->queue; 46060c7d97c5SJed Brown cptr = graph->cptr; 46070c7d97c5SJed Brown 46080c7d97c5SJed Brown for (i=0; i<nvtxs; i++) 46090c7d97c5SJed Brown touched[i] = PETSC_FALSE; 46100c7d97c5SJed Brown 46110c7d97c5SJed Brown cum_queue=0; 46120c7d97c5SJed Brown ncmps=0; 46130c7d97c5SJed Brown 46140c7d97c5SJed Brown for(n=0; n<n_dist; n++) { 4615da1bb401SStefano Zampini pid = n+1; /* partition labeled by 0 is discarded */ 46160c7d97c5SJed Brown nleft = 0; 46170c7d97c5SJed Brown for (i=0; i<nvtxs; i++) { 46180c7d97c5SJed Brown if (where[i] == pid) 46190c7d97c5SJed Brown nleft++; 46200c7d97c5SJed Brown } 
46210c7d97c5SJed Brown for (i=0; i<nvtxs; i++) { 46220c7d97c5SJed Brown if (where[i] == pid) 46230c7d97c5SJed Brown break; 46240c7d97c5SJed Brown } 46250c7d97c5SJed Brown touched[i] = PETSC_TRUE; 46260c7d97c5SJed Brown queue[cum_queue] = i; 46270c7d97c5SJed Brown first = 0; last = 1; 46280c7d97c5SJed Brown cptr[ncmps] = cum_queue; /* This actually points to queue */ 46290c7d97c5SJed Brown ncmps_pid = 0; 46300c7d97c5SJed Brown while (first != nleft) { 46310c7d97c5SJed Brown if (first == last) { /* Find another starting vertex */ 46320c7d97c5SJed Brown cptr[++ncmps] = first+cum_queue; 46330c7d97c5SJed Brown ncmps_pid++; 46340c7d97c5SJed Brown for (i=0; i<nvtxs; i++) { 46350c7d97c5SJed Brown if (where[i] == pid && !touched[i]) 46360c7d97c5SJed Brown break; 46370c7d97c5SJed Brown } 46380c7d97c5SJed Brown queue[cum_queue+last] = i; 46390c7d97c5SJed Brown last++; 46400c7d97c5SJed Brown touched[i] = PETSC_TRUE; 46410c7d97c5SJed Brown } 46420c7d97c5SJed Brown i = queue[cum_queue+first]; 46430c7d97c5SJed Brown first++; 46440c7d97c5SJed Brown for (j=xadj[i]; j<xadj[i+1]; j++) { 46450c7d97c5SJed Brown k = adjncy[j]; 46460c7d97c5SJed Brown if (where[k] == pid && !touched[k]) { 46470c7d97c5SJed Brown queue[cum_queue+last] = k; 46480c7d97c5SJed Brown last++; 46490c7d97c5SJed Brown touched[k] = PETSC_TRUE; 46500c7d97c5SJed Brown } 46510c7d97c5SJed Brown } 46520c7d97c5SJed Brown } 46530c7d97c5SJed Brown cptr[++ncmps] = first+cum_queue; 46540c7d97c5SJed Brown ncmps_pid++; 46550c7d97c5SJed Brown cum_queue=cptr[ncmps]; 4656a0ba757dSStefano Zampini graph->where_ncmps[n] = ncmps_pid; 46570c7d97c5SJed Brown } 46580c7d97c5SJed Brown graph->ncmps = ncmps; 46590c7d97c5SJed Brown 46600c7d97c5SJed Brown PetscFunctionReturn(0); 46610c7d97c5SJed Brown } 4662