/* TODOLIST
   DofSplitting and DM attached to pc?
   Change SetNeumannBoundaries to SetNeumannBoundariesLocal and provide new SetNeumannBoundaries (same Dirichlet)
     - change prec_type to switch_inexact_prec_type
   Inexact solvers: global preconditioner application is ready, ask the developers (Jed?) how to best implement Dohrmann's approach (PCSHELL?)
   change how to deal with the coarse problem (PCBDDCSetCoarseEnvironment):
     - mind the problem with coarsening_factor
     - simplify coarse problem structure -> PCBDDC or PCREDUNDANT, nothing else -> same comm for all levels?
     - remove coarse enums and allow use of PCBDDCGetCoarseKSP
     - remove metis dependency -> use MatPartitioning for multilevel -> Assemble serial adjacency in ManageLocalBoundaries?
     - Add levels' slot to bddc data structure and associated Set/Get functions
   code refactoring:
     - pick up better names for static functions
   change options structure:
     - insert BDDC into MG framework?
   provide other ops? Ask the developers
   remove all unused printf
   man pages
*/

/* ----------------------------------------------------------------------------------------------------------------------------------------------
   Implementation of BDDC preconditioner based on:
   C.
Dohrmann "An approximate BDDC preconditioner", Numerical Linear Algebra with Applications Volume 14, Issue 2, pages 149-168, March 2007 2453cdbc3dSStefano Zampini ---------------------------------------------------------------------------------------------------------------------------------------------- */ 2553cdbc3dSStefano Zampini 2653cdbc3dSStefano Zampini #include "bddc.h" /*I "petscpc.h" I*/ /* includes for fortran wrappers */ 273b03a366Sstefano_zampini #include <petscblaslapack.h> 280c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 290c7d97c5SJed Brown #undef __FUNCT__ 300c7d97c5SJed Brown #define __FUNCT__ "PCSetFromOptions_BDDC" 310c7d97c5SJed Brown PetscErrorCode PCSetFromOptions_BDDC(PC pc) 320c7d97c5SJed Brown { 330c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 340c7d97c5SJed Brown PetscErrorCode ierr; 350c7d97c5SJed Brown 360c7d97c5SJed Brown PetscFunctionBegin; 370c7d97c5SJed Brown ierr = PetscOptionsHead("BDDC options");CHKERRQ(ierr); 380c7d97c5SJed Brown /* Verbose debugging of main data structures */ 39e269702eSStefano Zampini ierr = PetscOptionsBool("-pc_bddc_check_all" ,"Verbose (debugging) output for PCBDDC" ,"none",pcbddc->dbg_flag ,&pcbddc->dbg_flag ,PETSC_NULL);CHKERRQ(ierr); 400c7d97c5SJed Brown /* Some customization for default primal space */ 41da1bb401SStefano Zampini ierr = PetscOptionsBool("-pc_bddc_vertices_only" ,"Use only vertices in coarse space (i.e. discard constraints)","none",pcbddc->vertices_flag ,&pcbddc->vertices_flag ,PETSC_NULL);CHKERRQ(ierr); 42da1bb401SStefano Zampini ierr = PetscOptionsBool("-pc_bddc_constraints_only","Use only constraints in coarse space (i.e. discard vertices)","none",pcbddc->constraints_flag,&pcbddc->constraints_flag,PETSC_NULL);CHKERRQ(ierr); 43da1bb401SStefano Zampini ierr = PetscOptionsBool("-pc_bddc_faces_only" ,"Use only faces among constraints of coarse space (i.e. 
discard edges)" ,"none",pcbddc->faces_flag ,&pcbddc->faces_flag ,PETSC_NULL);CHKERRQ(ierr); 44da1bb401SStefano Zampini ierr = PetscOptionsBool("-pc_bddc_edges_only" ,"Use only edges among constraints of coarse space (i.e. discard faces)" ,"none",pcbddc->edges_flag ,&pcbddc->edges_flag ,PETSC_NULL);CHKERRQ(ierr); 450c7d97c5SJed Brown /* Coarse solver context */ 46da1bb401SStefano Zampini static const char *avail_coarse_problems[] = {"sequential","replicated","parallel","multilevel",""}; /*order of choiches depends on ENUM defined in bddc.h */ 470c7d97c5SJed Brown ierr = PetscOptionsEnum("-pc_bddc_coarse_problem_type","Set coarse problem type","none",avail_coarse_problems,(PetscEnum)pcbddc->coarse_problem_type,(PetscEnum*)&pcbddc->coarse_problem_type,PETSC_NULL);CHKERRQ(ierr); 480c7d97c5SJed Brown /* Two different application of BDDC to the whole set of dofs, internal and interface */ 490c7d97c5SJed Brown ierr = PetscOptionsBool("-pc_bddc_switch_preconditioning_type","Switch between M_2 (default) and M_3 preconditioners (as defined by Dohrmann)","none",pcbddc->prec_type,&pcbddc->prec_type,PETSC_NULL);CHKERRQ(ierr); 50534831adSStefano Zampini ierr = PetscOptionsBool("-pc_bddc_use_change_of_basis","Use change of basis approach for primal space","none",pcbddc->usechangeofbasis,&pcbddc->usechangeofbasis,PETSC_NULL);CHKERRQ(ierr); 51534831adSStefano Zampini ierr = PetscOptionsBool("-pc_bddc_use_change_on_faces","Use change of basis approach for face constraints","none",pcbddc->usechangeonfaces,&pcbddc->usechangeonfaces,PETSC_NULL);CHKERRQ(ierr); 52534831adSStefano Zampini pcbddc->usechangeonfaces = pcbddc->usechangeonfaces && pcbddc->usechangeofbasis; 530c7d97c5SJed Brown ierr = PetscOptionsInt("-pc_bddc_coarsening_ratio","Set coarsening ratio used in multilevel coarsening","none",pcbddc->coarsening_ratio,&pcbddc->coarsening_ratio,PETSC_NULL);CHKERRQ(ierr); 540c7d97c5SJed Brown ierr = PetscOptionsTail();CHKERRQ(ierr); 550c7d97c5SJed Brown PetscFunctionReturn(0); 
560c7d97c5SJed Brown } 570c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 580c7d97c5SJed Brown EXTERN_C_BEGIN 590c7d97c5SJed Brown #undef __FUNCT__ 600c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetCoarseProblemType_BDDC" 6153cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetCoarseProblemType_BDDC(PC pc, CoarseProblemType CPT) 620c7d97c5SJed Brown { 630c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 640c7d97c5SJed Brown 650c7d97c5SJed Brown PetscFunctionBegin; 660c7d97c5SJed Brown pcbddc->coarse_problem_type = CPT; 670c7d97c5SJed Brown PetscFunctionReturn(0); 680c7d97c5SJed Brown } 690c7d97c5SJed Brown EXTERN_C_END 700c7d97c5SJed Brown #undef __FUNCT__ 710c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetCoarseProblemType" 7253cdbc3dSStefano Zampini /*@ 739c0446d6SStefano Zampini PCBDDCSetCoarseProblemType - Set coarse problem type in PCBDDC. 7453cdbc3dSStefano Zampini 759c0446d6SStefano Zampini Not collective 7653cdbc3dSStefano Zampini 7753cdbc3dSStefano Zampini Input Parameters: 7853cdbc3dSStefano Zampini + pc - the preconditioning context 7953cdbc3dSStefano Zampini - CoarseProblemType - pick a better name and explain what this is 8053cdbc3dSStefano Zampini 8153cdbc3dSStefano Zampini Level: intermediate 8253cdbc3dSStefano Zampini 8353cdbc3dSStefano Zampini Notes: 84da1bb401SStefano Zampini Not collective but all procs must call with same arguments. 
8553cdbc3dSStefano Zampini 8653cdbc3dSStefano Zampini .seealso: PCBDDC 8753cdbc3dSStefano Zampini @*/ 880c7d97c5SJed Brown PetscErrorCode PCBDDCSetCoarseProblemType(PC pc, CoarseProblemType CPT) 890c7d97c5SJed Brown { 900c7d97c5SJed Brown PetscErrorCode ierr; 910c7d97c5SJed Brown 920c7d97c5SJed Brown PetscFunctionBegin; 930c7d97c5SJed Brown PetscValidHeaderSpecific(pc,PC_CLASSID,1); 940c7d97c5SJed Brown ierr = PetscTryMethod(pc,"PCBDDCSetCoarseProblemType_C",(PC,CoarseProblemType),(pc,CPT));CHKERRQ(ierr); 950c7d97c5SJed Brown PetscFunctionReturn(0); 960c7d97c5SJed Brown } 970c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 980c7d97c5SJed Brown EXTERN_C_BEGIN 990c7d97c5SJed Brown #undef __FUNCT__ 1003b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCSetDirichletBoundaries_BDDC" 1013b03a366Sstefano_zampini static PetscErrorCode PCBDDCSetDirichletBoundaries_BDDC(PC pc,IS DirichletBoundaries) 1023b03a366Sstefano_zampini { 1033b03a366Sstefano_zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 1043b03a366Sstefano_zampini PetscErrorCode ierr; 1053b03a366Sstefano_zampini 1063b03a366Sstefano_zampini PetscFunctionBegin; 1073b03a366Sstefano_zampini ierr = ISDestroy(&pcbddc->DirichletBoundaries);CHKERRQ(ierr); 10836e030ebSStefano Zampini ierr = PetscObjectReference((PetscObject)DirichletBoundaries);CHKERRQ(ierr); 10936e030ebSStefano Zampini pcbddc->DirichletBoundaries=DirichletBoundaries; 1103b03a366Sstefano_zampini PetscFunctionReturn(0); 1113b03a366Sstefano_zampini } 1123b03a366Sstefano_zampini EXTERN_C_END 1133b03a366Sstefano_zampini #undef __FUNCT__ 1143b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCSetDirichletBoundaries" 1153b03a366Sstefano_zampini /*@ 116da1bb401SStefano Zampini PCBDDCSetDirichletBoundaries - Set index set defining subdomain part (in local ordering) 117da1bb401SStefano Zampini of Dirichlet boundaries for the global problem. 
1183b03a366Sstefano_zampini 1193b03a366Sstefano_zampini Not collective 1203b03a366Sstefano_zampini 1213b03a366Sstefano_zampini Input Parameters: 1223b03a366Sstefano_zampini + pc - the preconditioning context 1233b03a366Sstefano_zampini - DirichletBoundaries - sequential index set defining the subdomain part of Dirichlet boundaries (can be PETSC_NULL) 1243b03a366Sstefano_zampini 1253b03a366Sstefano_zampini Level: intermediate 1263b03a366Sstefano_zampini 1273b03a366Sstefano_zampini Notes: 1283b03a366Sstefano_zampini 1293b03a366Sstefano_zampini .seealso: PCBDDC 1303b03a366Sstefano_zampini @*/ 1313b03a366Sstefano_zampini PetscErrorCode PCBDDCSetDirichletBoundaries(PC pc,IS DirichletBoundaries) 1323b03a366Sstefano_zampini { 1333b03a366Sstefano_zampini PetscErrorCode ierr; 1343b03a366Sstefano_zampini 1353b03a366Sstefano_zampini PetscFunctionBegin; 1363b03a366Sstefano_zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 1373b03a366Sstefano_zampini ierr = PetscTryMethod(pc,"PCBDDCSetDirichletBoundaries_C",(PC,IS),(pc,DirichletBoundaries));CHKERRQ(ierr); 1383b03a366Sstefano_zampini PetscFunctionReturn(0); 1393b03a366Sstefano_zampini } 1403b03a366Sstefano_zampini /* -------------------------------------------------------------------------- */ 1413b03a366Sstefano_zampini EXTERN_C_BEGIN 1423b03a366Sstefano_zampini #undef __FUNCT__ 1430c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetNeumannBoundaries_BDDC" 14453cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetNeumannBoundaries_BDDC(PC pc,IS NeumannBoundaries) 1450c7d97c5SJed Brown { 1460c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 14753cdbc3dSStefano Zampini PetscErrorCode ierr; 1480c7d97c5SJed Brown 1490c7d97c5SJed Brown PetscFunctionBegin; 15053cdbc3dSStefano Zampini ierr = ISDestroy(&pcbddc->NeumannBoundaries);CHKERRQ(ierr); 15136e030ebSStefano Zampini ierr = PetscObjectReference((PetscObject)NeumannBoundaries);CHKERRQ(ierr); 15236e030ebSStefano Zampini pcbddc->NeumannBoundaries=NeumannBoundaries; 1530c7d97c5SJed 
Brown PetscFunctionReturn(0); 1540c7d97c5SJed Brown } 1550c7d97c5SJed Brown EXTERN_C_END 1560c7d97c5SJed Brown #undef __FUNCT__ 1570c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetNeumannBoundaries" 15857527edcSJed Brown /*@ 159da1bb401SStefano Zampini PCBDDCSetNeumannBoundaries - Set index set defining subdomain part (in local ordering) 160da1bb401SStefano Zampini of Neumann boundaries for the global problem. 16157527edcSJed Brown 1629c0446d6SStefano Zampini Not collective 16357527edcSJed Brown 16457527edcSJed Brown Input Parameters: 16557527edcSJed Brown + pc - the preconditioning context 1669c0446d6SStefano Zampini - NeumannBoundaries - sequential index set defining the subdomain part of Neumann boundaries (can be PETSC_NULL) 16757527edcSJed Brown 16857527edcSJed Brown Level: intermediate 16957527edcSJed Brown 17057527edcSJed Brown Notes: 17157527edcSJed Brown 17257527edcSJed Brown .seealso: PCBDDC 17357527edcSJed Brown @*/ 17453cdbc3dSStefano Zampini PetscErrorCode PCBDDCSetNeumannBoundaries(PC pc,IS NeumannBoundaries) 1750c7d97c5SJed Brown { 1760c7d97c5SJed Brown PetscErrorCode ierr; 1770c7d97c5SJed Brown 1780c7d97c5SJed Brown PetscFunctionBegin; 1790c7d97c5SJed Brown PetscValidHeaderSpecific(pc,PC_CLASSID,1); 18053cdbc3dSStefano Zampini ierr = PetscTryMethod(pc,"PCBDDCSetNeumannBoundaries_C",(PC,IS),(pc,NeumannBoundaries));CHKERRQ(ierr); 18153cdbc3dSStefano Zampini PetscFunctionReturn(0); 18253cdbc3dSStefano Zampini } 18353cdbc3dSStefano Zampini /* -------------------------------------------------------------------------- */ 18453cdbc3dSStefano Zampini EXTERN_C_BEGIN 18553cdbc3dSStefano Zampini #undef __FUNCT__ 186da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCGetDirichletBoundaries_BDDC" 187da1bb401SStefano Zampini static PetscErrorCode PCBDDCGetDirichletBoundaries_BDDC(PC pc,IS *DirichletBoundaries) 188da1bb401SStefano Zampini { 189da1bb401SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 190da1bb401SStefano Zampini 191da1bb401SStefano Zampini 
PetscFunctionBegin; 192da1bb401SStefano Zampini *DirichletBoundaries = pcbddc->DirichletBoundaries; 193da1bb401SStefano Zampini PetscFunctionReturn(0); 194da1bb401SStefano Zampini } 195da1bb401SStefano Zampini EXTERN_C_END 196da1bb401SStefano Zampini #undef __FUNCT__ 197da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCGetDirichletBoundaries" 198da1bb401SStefano Zampini /*@ 199da1bb401SStefano Zampini PCBDDCGetDirichletBoundaries - Get index set defining subdomain part (in local ordering) 200da1bb401SStefano Zampini of Dirichlet boundaries for the global problem. 201da1bb401SStefano Zampini 202da1bb401SStefano Zampini Not collective 203da1bb401SStefano Zampini 204da1bb401SStefano Zampini Input Parameters: 205da1bb401SStefano Zampini + pc - the preconditioning context 206da1bb401SStefano Zampini 207da1bb401SStefano Zampini Output Parameters: 208da1bb401SStefano Zampini + DirichletBoundaries - index set defining the subdomain part of Dirichlet boundaries 209da1bb401SStefano Zampini 210da1bb401SStefano Zampini Level: intermediate 211da1bb401SStefano Zampini 212da1bb401SStefano Zampini Notes: 213da1bb401SStefano Zampini 214da1bb401SStefano Zampini .seealso: PCBDDC 215da1bb401SStefano Zampini @*/ 216da1bb401SStefano Zampini PetscErrorCode PCBDDCGetDirichletBoundaries(PC pc,IS *DirichletBoundaries) 217da1bb401SStefano Zampini { 218da1bb401SStefano Zampini PetscErrorCode ierr; 219da1bb401SStefano Zampini 220da1bb401SStefano Zampini PetscFunctionBegin; 221da1bb401SStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 222da1bb401SStefano Zampini ierr = PetscUseMethod(pc,"PCBDDCGetDirichletBoundaries_C",(PC,IS*),(pc,DirichletBoundaries));CHKERRQ(ierr); 223da1bb401SStefano Zampini PetscFunctionReturn(0); 224da1bb401SStefano Zampini } 225da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */ 226da1bb401SStefano Zampini EXTERN_C_BEGIN 227da1bb401SStefano Zampini #undef __FUNCT__ 22853cdbc3dSStefano Zampini #define 
__FUNCT__ "PCBDDCGetNeumannBoundaries_BDDC" 22953cdbc3dSStefano Zampini static PetscErrorCode PCBDDCGetNeumannBoundaries_BDDC(PC pc,IS *NeumannBoundaries) 23053cdbc3dSStefano Zampini { 23153cdbc3dSStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 23253cdbc3dSStefano Zampini 23353cdbc3dSStefano Zampini PetscFunctionBegin; 23453cdbc3dSStefano Zampini *NeumannBoundaries = pcbddc->NeumannBoundaries; 23553cdbc3dSStefano Zampini PetscFunctionReturn(0); 23653cdbc3dSStefano Zampini } 23753cdbc3dSStefano Zampini EXTERN_C_END 23853cdbc3dSStefano Zampini #undef __FUNCT__ 23953cdbc3dSStefano Zampini #define __FUNCT__ "PCBDDCGetNeumannBoundaries" 24053cdbc3dSStefano Zampini /*@ 241da1bb401SStefano Zampini PCBDDCGetNeumannBoundaries - Get index set defining subdomain part (in local ordering) 242da1bb401SStefano Zampini of Neumann boundaries for the global problem. 24353cdbc3dSStefano Zampini 2449c0446d6SStefano Zampini Not collective 24553cdbc3dSStefano Zampini 24653cdbc3dSStefano Zampini Input Parameters: 24753cdbc3dSStefano Zampini + pc - the preconditioning context 24853cdbc3dSStefano Zampini 24953cdbc3dSStefano Zampini Output Parameters: 25053cdbc3dSStefano Zampini + NeumannBoundaries - index set defining the subdomain part of Neumann boundaries 25153cdbc3dSStefano Zampini 25253cdbc3dSStefano Zampini Level: intermediate 25353cdbc3dSStefano Zampini 25453cdbc3dSStefano Zampini Notes: 25553cdbc3dSStefano Zampini 25653cdbc3dSStefano Zampini .seealso: PCBDDC 25753cdbc3dSStefano Zampini @*/ 25853cdbc3dSStefano Zampini PetscErrorCode PCBDDCGetNeumannBoundaries(PC pc,IS *NeumannBoundaries) 25953cdbc3dSStefano Zampini { 26053cdbc3dSStefano Zampini PetscErrorCode ierr; 26153cdbc3dSStefano Zampini 26253cdbc3dSStefano Zampini PetscFunctionBegin; 26353cdbc3dSStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 26453cdbc3dSStefano Zampini ierr = PetscUseMethod(pc,"PCBDDCGetNeumannBoundaries_C",(PC,IS*),(pc,NeumannBoundaries));CHKERRQ(ierr); 2650c7d97c5SJed Brown 
PetscFunctionReturn(0); 2660c7d97c5SJed Brown } 26736e030ebSStefano Zampini /* -------------------------------------------------------------------------- */ 26836e030ebSStefano Zampini EXTERN_C_BEGIN 26936e030ebSStefano Zampini #undef __FUNCT__ 270da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetLocalAdjacencyGraph_BDDC" 271da1bb401SStefano Zampini static PetscErrorCode PCBDDCSetLocalAdjacencyGraph_BDDC(PC pc, PetscInt nvtxs, PetscInt xadj[], PetscInt adjncy[], PetscCopyMode copymode) 27236e030ebSStefano Zampini { 27336e030ebSStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 274da1bb401SStefano Zampini PCBDDCGraph mat_graph=pcbddc->mat_graph; 275da1bb401SStefano Zampini PetscErrorCode ierr; 27636e030ebSStefano Zampini 27736e030ebSStefano Zampini PetscFunctionBegin; 278da1bb401SStefano Zampini mat_graph->nvtxs=nvtxs; 279da1bb401SStefano Zampini ierr = PetscFree(mat_graph->xadj);CHKERRQ(ierr); 280da1bb401SStefano Zampini ierr = PetscFree(mat_graph->adjncy);CHKERRQ(ierr); 281da1bb401SStefano Zampini if(copymode == PETSC_COPY_VALUES) { 282da1bb401SStefano Zampini ierr = PetscMalloc((mat_graph->nvtxs+1)*sizeof(PetscInt),&mat_graph->xadj);CHKERRQ(ierr); 283da1bb401SStefano Zampini ierr = PetscMalloc(xadj[mat_graph->nvtxs]*sizeof(PetscInt),&mat_graph->adjncy);CHKERRQ(ierr); 284da1bb401SStefano Zampini ierr = PetscMemcpy(mat_graph->xadj,xadj,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr); 285da1bb401SStefano Zampini ierr = PetscMemcpy(mat_graph->adjncy,adjncy,xadj[mat_graph->nvtxs]*sizeof(PetscInt));CHKERRQ(ierr); 286da1bb401SStefano Zampini } else if(copymode == PETSC_OWN_POINTER) { 287da1bb401SStefano Zampini mat_graph->xadj=xadj; 288da1bb401SStefano Zampini mat_graph->adjncy=adjncy; 289da1bb401SStefano Zampini } else { 290da1bb401SStefano Zampini SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_SUP,"Unsupported copy mode %d in %s\n",copymode,__FUNCT__); 291da1bb401SStefano Zampini } 29236e030ebSStefano Zampini PetscFunctionReturn(0); 29336e030ebSStefano Zampini } 
29436e030ebSStefano Zampini EXTERN_C_END 29536e030ebSStefano Zampini #undef __FUNCT__ 296da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetLocalAdjacencyGraph" 29736e030ebSStefano Zampini /*@ 298da1bb401SStefano Zampini PCBDDCSetLocalAdjacencyGraph - Set CSR graph of local matrix for use of PCBDDC. 29936e030ebSStefano Zampini 30036e030ebSStefano Zampini Not collective 30136e030ebSStefano Zampini 30236e030ebSStefano Zampini Input Parameters: 30336e030ebSStefano Zampini + pc - the preconditioning context 304da1bb401SStefano Zampini - nvtxs - number of local vertices of the graph 305da1bb401SStefano Zampini - xadj, adjncy - the CSR graph 306da1bb401SStefano Zampini - copymode - either PETSC_COPY_VALUES or PETSC_OWN_POINTER. In the former case the user must free the array passed in; 307da1bb401SStefano Zampini in the latter case, memory must be obtained with PetscMalloc. 30836e030ebSStefano Zampini 30936e030ebSStefano Zampini Level: intermediate 31036e030ebSStefano Zampini 31136e030ebSStefano Zampini Notes: 31236e030ebSStefano Zampini 31336e030ebSStefano Zampini .seealso: PCBDDC 31436e030ebSStefano Zampini @*/ 315da1bb401SStefano Zampini PetscErrorCode PCBDDCSetLocalAdjacencyGraph(PC pc,PetscInt nvtxs,PetscInt xadj[],PetscInt adjncy[], PetscCopyMode copymode) 31636e030ebSStefano Zampini { 317da1bb401SStefano Zampini PetscInt nrows,ncols; 318da1bb401SStefano Zampini Mat_IS *matis = (Mat_IS*)pc->pmat->data; 31936e030ebSStefano Zampini PetscErrorCode ierr; 32036e030ebSStefano Zampini 32136e030ebSStefano Zampini PetscFunctionBegin; 32236e030ebSStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 323da1bb401SStefano Zampini ierr = MatGetSize(matis->A,&nrows,&ncols);CHKERRQ(ierr); 324da1bb401SStefano Zampini if(nvtxs != nrows) { 325da1bb401SStefano Zampini SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Local adjacency size %d passed in %s differs from local problem size %d!\n",nvtxs,__FUNCT__,nrows); 326da1bb401SStefano Zampini } else { 327da1bb401SStefano Zampini ierr 
= PetscTryMethod(pc,"PCBDDCSetLocalAdjacencyGraph_C",(PC,PetscInt,PetscInt[],PetscInt[],PetscCopyMode),(pc,nvtxs,xadj,adjncy,copymode));CHKERRQ(ierr); 328da1bb401SStefano Zampini } 32936e030ebSStefano Zampini PetscFunctionReturn(0); 33036e030ebSStefano Zampini } 3319c0446d6SStefano Zampini /* -------------------------------------------------------------------------- */ 3329c0446d6SStefano Zampini EXTERN_C_BEGIN 3339c0446d6SStefano Zampini #undef __FUNCT__ 3349c0446d6SStefano Zampini #define __FUNCT__ "PCBDDCSetDofsSplitting_BDDC" 3359c0446d6SStefano Zampini static PetscErrorCode PCBDDCSetDofsSplitting_BDDC(PC pc,PetscInt n_is, IS ISForDofs[]) 3369c0446d6SStefano Zampini { 3379c0446d6SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 3389c0446d6SStefano Zampini PetscInt i; 3399c0446d6SStefano Zampini PetscErrorCode ierr; 3409c0446d6SStefano Zampini 3419c0446d6SStefano Zampini PetscFunctionBegin; 342da1bb401SStefano Zampini /* Destroy ISes if they were already set */ 3439c0446d6SStefano Zampini for(i=0;i<pcbddc->n_ISForDofs;i++) { 3449c0446d6SStefano Zampini ierr = ISDestroy(&pcbddc->ISForDofs[i]);CHKERRQ(ierr); 3459c0446d6SStefano Zampini } 346d11ae9bbSstefano_zampini ierr = PetscFree(pcbddc->ISForDofs);CHKERRQ(ierr); 347da1bb401SStefano Zampini /* allocate space then set */ 3489c0446d6SStefano Zampini ierr = PetscMalloc(n_is*sizeof(IS),&pcbddc->ISForDofs);CHKERRQ(ierr); 3499c0446d6SStefano Zampini for(i=0;i<n_is;i++) { 350da1bb401SStefano Zampini ierr = PetscObjectReference((PetscObject)ISForDofs[i]);CHKERRQ(ierr); 351da1bb401SStefano Zampini pcbddc->ISForDofs[i]=ISForDofs[i]; 3529c0446d6SStefano Zampini } 3539c0446d6SStefano Zampini pcbddc->n_ISForDofs=n_is; 3549c0446d6SStefano Zampini PetscFunctionReturn(0); 3559c0446d6SStefano Zampini } 3569c0446d6SStefano Zampini EXTERN_C_END 3579c0446d6SStefano Zampini #undef __FUNCT__ 3589c0446d6SStefano Zampini #define __FUNCT__ "PCBDDCSetDofsSplitting" 3599c0446d6SStefano Zampini /*@ 360da1bb401SStefano Zampini 
PCBDDCSetDofsSplitting - Set index sets defining fields of local mat. 3619c0446d6SStefano Zampini 3629c0446d6SStefano Zampini Not collective 3639c0446d6SStefano Zampini 3649c0446d6SStefano Zampini Input Parameters: 3659c0446d6SStefano Zampini + pc - the preconditioning context 366da1bb401SStefano Zampini - n - number of index sets defining the fields 367da1bb401SStefano Zampini - IS[] - array of IS describing the fields 3689c0446d6SStefano Zampini 3699c0446d6SStefano Zampini Level: intermediate 3709c0446d6SStefano Zampini 3719c0446d6SStefano Zampini Notes: 3729c0446d6SStefano Zampini 3739c0446d6SStefano Zampini .seealso: PCBDDC 3749c0446d6SStefano Zampini @*/ 3759c0446d6SStefano Zampini PetscErrorCode PCBDDCSetDofsSplitting(PC pc,PetscInt n_is, IS ISForDofs[]) 3769c0446d6SStefano Zampini { 3779c0446d6SStefano Zampini PetscErrorCode ierr; 3789c0446d6SStefano Zampini 3799c0446d6SStefano Zampini PetscFunctionBegin; 3809c0446d6SStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 3819c0446d6SStefano Zampini ierr = PetscTryMethod(pc,"PCBDDCSetDofsSplitting_C",(PC,PetscInt,IS[]),(pc,n_is,ISForDofs));CHKERRQ(ierr); 3829c0446d6SStefano Zampini PetscFunctionReturn(0); 3839c0446d6SStefano Zampini } 384da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */ 385534831adSStefano Zampini #undef __FUNCT__ 386534831adSStefano Zampini #define __FUNCT__ "PCPreSolve_BDDC" 387534831adSStefano Zampini /* -------------------------------------------------------------------------- */ 388534831adSStefano Zampini /* 389534831adSStefano Zampini PCPreSolve_BDDC - Changes the right hand side and (if necessary) the initial 390534831adSStefano Zampini guess if a transformation of basis approach has been selected. 
3919c0446d6SStefano Zampini 392534831adSStefano Zampini Input Parameter: 393534831adSStefano Zampini + pc - the preconditioner contex 394534831adSStefano Zampini 395534831adSStefano Zampini Application Interface Routine: PCPreSolve() 396534831adSStefano Zampini 397534831adSStefano Zampini Notes: 398534831adSStefano Zampini The interface routine PCPreSolve() is not usually called directly by 399534831adSStefano Zampini the user, but instead is called by KSPSolve(). 400534831adSStefano Zampini */ 401534831adSStefano Zampini static PetscErrorCode PCPreSolve_BDDC(PC pc, KSP ksp, Vec rhs, Vec x) 402534831adSStefano Zampini { 403534831adSStefano Zampini PetscErrorCode ierr; 404534831adSStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 405534831adSStefano Zampini PC_IS *pcis = (PC_IS*)(pc->data); 406534831adSStefano Zampini Mat_IS *matis = (Mat_IS*)pc->pmat->data; 407534831adSStefano Zampini Mat temp_mat; 4083972b0daSStefano Zampini IS dirIS; 4093972b0daSStefano Zampini PetscInt dirsize,i,*is_indices; 4103972b0daSStefano Zampini PetscScalar *array_x,*array_diagonal; 4113972b0daSStefano Zampini Vec used_vec; 4123972b0daSStefano Zampini PetscBool guess_nonzero; 413534831adSStefano Zampini 414534831adSStefano Zampini PetscFunctionBegin; 4153972b0daSStefano Zampini if(x) { 4163972b0daSStefano Zampini ierr = PetscObjectReference((PetscObject)x);CHKERRQ(ierr); 4173972b0daSStefano Zampini used_vec = x; 4183972b0daSStefano Zampini } else { 4193972b0daSStefano Zampini ierr = PetscObjectReference((PetscObject)pcbddc->temp_solution);CHKERRQ(ierr); 4203972b0daSStefano Zampini used_vec = pcbddc->temp_solution; 4213972b0daSStefano Zampini ierr = VecSet(used_vec,0.0);CHKERRQ(ierr); 4223972b0daSStefano Zampini } 4233972b0daSStefano Zampini /* hack into ksp data structure PCPreSolve comes earlier in src/ksp/ksp/interface/itfunc.c */ 4243972b0daSStefano Zampini if (ksp) { 4253972b0daSStefano Zampini ierr = KSPGetInitialGuessNonzero(ksp,&guess_nonzero);CHKERRQ(ierr); 4263972b0daSStefano 
Zampini if( !guess_nonzero ) { 4273972b0daSStefano Zampini ierr = VecSet(used_vec,0.0);CHKERRQ(ierr); 4283972b0daSStefano Zampini } 4293972b0daSStefano Zampini } 4303972b0daSStefano Zampini /* store the original rhs */ 4313972b0daSStefano Zampini ierr = VecCopy(rhs,pcbddc->original_rhs);CHKERRQ(ierr); 4323972b0daSStefano Zampini 4333972b0daSStefano Zampini /* Take into account zeroed rows -> change rhs and store solution removed */ 4343972b0daSStefano Zampini ierr = MatGetDiagonal(pc->pmat,pcis->vec1_global);CHKERRQ(ierr); 4353972b0daSStefano Zampini ierr = VecPointwiseDivide(pcis->vec1_global,rhs,pcis->vec1_global);CHKERRQ(ierr); 4363972b0daSStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 4373972b0daSStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 4383972b0daSStefano Zampini ierr = VecScatterBegin(matis->ctx,used_vec,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 4393972b0daSStefano Zampini ierr = VecScatterEnd (matis->ctx,used_vec,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 4403972b0daSStefano Zampini ierr = PCBDDCGetDirichletBoundaries(pc,&dirIS);CHKERRQ(ierr); 4413972b0daSStefano Zampini if(dirIS) { 4423972b0daSStefano Zampini ierr = ISGetSize(dirIS,&dirsize);CHKERRQ(ierr); 4433972b0daSStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array_x);CHKERRQ(ierr); 4443972b0daSStefano Zampini ierr = VecGetArray(pcis->vec2_N,&array_diagonal);CHKERRQ(ierr); 4453972b0daSStefano Zampini ierr = ISGetIndices(dirIS,(const PetscInt**)&is_indices);CHKERRQ(ierr); 4463972b0daSStefano Zampini for(i=0;i<dirsize;i++) { 4473972b0daSStefano Zampini array_x[is_indices[i]]=array_diagonal[is_indices[i]]; 4483972b0daSStefano Zampini } 4493972b0daSStefano Zampini ierr = ISRestoreIndices(dirIS,(const PetscInt**)&is_indices);CHKERRQ(ierr); 4503972b0daSStefano Zampini ierr = 
VecRestoreArray(pcis->vec2_N,&array_diagonal);CHKERRQ(ierr); 4513972b0daSStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array_x);CHKERRQ(ierr); 4523972b0daSStefano Zampini } 4533972b0daSStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 4543972b0daSStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 455b76ba322SStefano Zampini 4563972b0daSStefano Zampini /* remove the computed solution from the rhs */ 4573972b0daSStefano Zampini ierr = VecScale(used_vec,-1.0);CHKERRQ(ierr); 4583972b0daSStefano Zampini ierr = MatMultAdd(pc->pmat,used_vec,rhs,rhs);CHKERRQ(ierr); 4593972b0daSStefano Zampini ierr = VecScale(used_vec,-1.0);CHKERRQ(ierr); 460b76ba322SStefano Zampini 461b76ba322SStefano Zampini /* store partially computed solution and set initial guess */ 4623972b0daSStefano Zampini if(x) { 4633972b0daSStefano Zampini ierr = VecCopy(used_vec,pcbddc->temp_solution);CHKERRQ(ierr); 4643972b0daSStefano Zampini ierr = VecSet(used_vec,0.0);CHKERRQ(ierr); 465b76ba322SStefano Zampini if(pcbddc->use_exact_dirichlet) { 466b76ba322SStefano Zampini ierr = VecScatterBegin(pcis->global_to_D,rhs,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 467b76ba322SStefano Zampini ierr = VecScatterEnd (pcis->global_to_D,rhs,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 468b76ba322SStefano Zampini ierr = KSPSolve(pcbddc->ksp_D,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr); 469b76ba322SStefano Zampini ierr = VecScatterBegin(pcis->global_to_D,pcis->vec2_D,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 470b76ba322SStefano Zampini ierr = VecScatterEnd (pcis->global_to_D,pcis->vec2_D,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 471b76ba322SStefano Zampini if(ksp) { 472b76ba322SStefano Zampini ierr = KSPSetInitialGuessNonzero(ksp,PETSC_TRUE);CHKERRQ(ierr); 473b76ba322SStefano Zampini } 474b76ba322SStefano Zampini } 
4753972b0daSStefano Zampini } 4763972b0daSStefano Zampini ierr = VecDestroy(&used_vec);CHKERRQ(ierr); 477b76ba322SStefano Zampini 478b76ba322SStefano Zampini /* rhs change of basis */ 479b76ba322SStefano Zampini if(pcbddc->usechangeofbasis) { 480b76ba322SStefano Zampini /* swap pointers for local matrices */ 481b76ba322SStefano Zampini temp_mat = matis->A; 482b76ba322SStefano Zampini matis->A = pcbddc->local_mat; 483b76ba322SStefano Zampini pcbddc->local_mat = temp_mat; 484b76ba322SStefano Zampini /* Get local rhs and apply transformation of basis */ 485b76ba322SStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,rhs,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 486b76ba322SStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,rhs,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 487b76ba322SStefano Zampini /* from original basis to modified basis */ 488b76ba322SStefano Zampini ierr = MatMultTranspose(pcbddc->ChangeOfBasisMatrix,pcis->vec1_B,pcis->vec2_B);CHKERRQ(ierr); 489b76ba322SStefano Zampini /* put back modified values into the global vec using INSERT_VALUES copy mode */ 490b76ba322SStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,pcis->vec2_B,rhs,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 491b76ba322SStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,pcis->vec2_B,rhs,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 492b76ba322SStefano Zampini } 493534831adSStefano Zampini PetscFunctionReturn(0); 494534831adSStefano Zampini } 495534831adSStefano Zampini /* -------------------------------------------------------------------------- */ 496534831adSStefano Zampini #undef __FUNCT__ 497534831adSStefano Zampini #define __FUNCT__ "PCPostSolve_BDDC" 498534831adSStefano Zampini /* -------------------------------------------------------------------------- */ 499534831adSStefano Zampini /* 500534831adSStefano Zampini PCPostSolve_BDDC - Changes the computed solution if a transformation of basis 501534831adSStefano Zampini approach 
has been selected. Also, restores rhs to its original state. 502534831adSStefano Zampini 503534831adSStefano Zampini Input Parameter: 504534831adSStefano Zampini + pc - the preconditioner contex 505534831adSStefano Zampini 506534831adSStefano Zampini Application Interface Routine: PCPostSolve() 507534831adSStefano Zampini 508534831adSStefano Zampini Notes: 509534831adSStefano Zampini The interface routine PCPostSolve() is not usually called directly by 510534831adSStefano Zampini the user, but instead is called by KSPSolve(). 511534831adSStefano Zampini */ 512534831adSStefano Zampini static PetscErrorCode PCPostSolve_BDDC(PC pc, KSP ksp, Vec rhs, Vec x) 513534831adSStefano Zampini { 514534831adSStefano Zampini PetscErrorCode ierr; 515534831adSStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 516534831adSStefano Zampini PC_IS *pcis = (PC_IS*)(pc->data); 517534831adSStefano Zampini Mat_IS *matis = (Mat_IS*)pc->pmat->data; 518534831adSStefano Zampini Mat temp_mat; 519534831adSStefano Zampini 520534831adSStefano Zampini PetscFunctionBegin; 521534831adSStefano Zampini if(pcbddc->usechangeofbasis) { 522534831adSStefano Zampini /* swap pointers for local matrices */ 523534831adSStefano Zampini temp_mat = matis->A; 524534831adSStefano Zampini matis->A = pcbddc->local_mat; 525534831adSStefano Zampini pcbddc->local_mat = temp_mat; 526534831adSStefano Zampini /* restore rhs to its original state */ 5273425bc38SStefano Zampini if(rhs) { 5283425bc38SStefano Zampini ierr = VecCopy(pcbddc->original_rhs,rhs);CHKERRQ(ierr); 5293425bc38SStefano Zampini } 530534831adSStefano Zampini /* Get Local boundary and apply transformation of basis to solution vector */ 531534831adSStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,x,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 532534831adSStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,x,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 533534831adSStefano Zampini /* from modified basis to original 
basis */ 534534831adSStefano Zampini ierr = MatMult(pcbddc->ChangeOfBasisMatrix,pcis->vec1_B,pcis->vec2_B);CHKERRQ(ierr); 535534831adSStefano Zampini /* put back modified values into the global vec using INSERT_VALUES copy mode */ 536534831adSStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,pcis->vec2_B,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 537534831adSStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,pcis->vec2_B,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 538534831adSStefano Zampini } 5393972b0daSStefano Zampini /* add solution removed in presolve */ 5403425bc38SStefano Zampini if(x) { 5413425bc38SStefano Zampini ierr = VecAXPY(x,1.0,pcbddc->temp_solution);CHKERRQ(ierr); 5423425bc38SStefano Zampini } 543534831adSStefano Zampini PetscFunctionReturn(0); 544534831adSStefano Zampini } 545534831adSStefano Zampini /* -------------------------------------------------------------------------- */ 54653cdbc3dSStefano Zampini #undef __FUNCT__ 54753cdbc3dSStefano Zampini #define __FUNCT__ "PCSetUp_BDDC" 5480c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 5490c7d97c5SJed Brown /* 5500c7d97c5SJed Brown PCSetUp_BDDC - Prepares for the use of the BDDC preconditioner 5510c7d97c5SJed Brown by setting data structures and options. 5520c7d97c5SJed Brown 5530c7d97c5SJed Brown Input Parameter: 55453cdbc3dSStefano Zampini + pc - the preconditioner context 5550c7d97c5SJed Brown 5560c7d97c5SJed Brown Application Interface Routine: PCSetUp() 5570c7d97c5SJed Brown 5580c7d97c5SJed Brown Notes: 5590c7d97c5SJed Brown The interface routine PCSetUp() is not usually called directly by 5600c7d97c5SJed Brown the user, but instead is called by PCApply() if necessary. 
5610c7d97c5SJed Brown */ 56253cdbc3dSStefano Zampini PetscErrorCode PCSetUp_BDDC(PC pc) 5630c7d97c5SJed Brown { 5640c7d97c5SJed Brown PetscErrorCode ierr; 5650c7d97c5SJed Brown PC_BDDC* pcbddc = (PC_BDDC*)pc->data; 5660c7d97c5SJed Brown PC_IS *pcis = (PC_IS*)(pc->data); 5670c7d97c5SJed Brown 5680c7d97c5SJed Brown PetscFunctionBegin; 5690c7d97c5SJed Brown if (!pc->setupcalled) { 5703b03a366Sstefano_zampini /* For BDDC we need to define a local "Neumann" problem different to that defined in PCISSetup 5719c0446d6SStefano Zampini So, we set to pcnone the Neumann problem of pcis in order to avoid unneeded computation 5720c7d97c5SJed Brown Also, we decide to directly build the (same) Dirichlet problem */ 5730c7d97c5SJed Brown ierr = PetscOptionsSetValue("-is_localN_pc_type","none");CHKERRQ(ierr); 5740c7d97c5SJed Brown ierr = PetscOptionsSetValue("-is_localD_pc_type","none");CHKERRQ(ierr); 5750c7d97c5SJed Brown /* Set up all the "iterative substructuring" common block */ 5760c7d97c5SJed Brown ierr = PCISSetUp(pc);CHKERRQ(ierr); 5773b03a366Sstefano_zampini /* Get stdout for dbg */ 578e269702eSStefano Zampini if(pcbddc->dbg_flag) { 579e269702eSStefano Zampini ierr = PetscViewerASCIIGetStdout(((PetscObject)pc)->comm,&pcbddc->dbg_viewer);CHKERRQ(ierr); 580e269702eSStefano Zampini ierr = PetscViewerASCIISynchronizedAllow(pcbddc->dbg_viewer,PETSC_TRUE);CHKERRQ(ierr); 581e269702eSStefano Zampini } 5823b03a366Sstefano_zampini /* TODO MOVE CODE FRAGMENT */ 5830c7d97c5SJed Brown PetscInt im_active=0; 5840c7d97c5SJed Brown if(pcis->n) im_active = 1; 58553cdbc3dSStefano Zampini ierr = MPI_Allreduce(&im_active,&pcbddc->active_procs,1,MPIU_INT,MPI_SUM,((PetscObject)pc)->comm);CHKERRQ(ierr); 5863b03a366Sstefano_zampini /* Analyze local interface */ 5870c7d97c5SJed Brown ierr = PCBDDCManageLocalBoundaries(pc);CHKERRQ(ierr); 5883b03a366Sstefano_zampini /* Set up local constraint matrix */ 5893b03a366Sstefano_zampini ierr = PCBDDCCreateConstraintMatrix(pc);CHKERRQ(ierr); 5900c7d97c5SJed 
Brown /* Create coarse and local stuffs used for evaluating action of preconditioner */ 5910c7d97c5SJed Brown ierr = PCBDDCCoarseSetUp(pc);CHKERRQ(ierr); 5923b03a366Sstefano_zampini /* Processes fakely involved in multilevel should not call ISLocalToGlobalMappingRestoreInfo */ 5933b03a366Sstefano_zampini if ( !pcis->n_neigh ) pcis->ISLocalToGlobalMappingGetInfoWasCalled=PETSC_FALSE; 5940c7d97c5SJed Brown } 5950c7d97c5SJed Brown PetscFunctionReturn(0); 5960c7d97c5SJed Brown } 5970c7d97c5SJed Brown 5980c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 5990c7d97c5SJed Brown /* 6000c7d97c5SJed Brown PCApply_BDDC - Applies the BDDC preconditioner to a vector. 6010c7d97c5SJed Brown 6020c7d97c5SJed Brown Input Parameters: 6030c7d97c5SJed Brown . pc - the preconditioner context 6040c7d97c5SJed Brown . r - input vector (global) 6050c7d97c5SJed Brown 6060c7d97c5SJed Brown Output Parameter: 6070c7d97c5SJed Brown . z - output vector (global) 6080c7d97c5SJed Brown 6090c7d97c5SJed Brown Application Interface Routine: PCApply() 6100c7d97c5SJed Brown */ 6110c7d97c5SJed Brown #undef __FUNCT__ 6120c7d97c5SJed Brown #define __FUNCT__ "PCApply_BDDC" 61353cdbc3dSStefano Zampini PetscErrorCode PCApply_BDDC(PC pc,Vec r,Vec z) 6140c7d97c5SJed Brown { 6150c7d97c5SJed Brown PC_IS *pcis = (PC_IS*)(pc->data); 6160c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)(pc->data); 6170c7d97c5SJed Brown PetscErrorCode ierr; 6183b03a366Sstefano_zampini const PetscScalar one = 1.0; 6193b03a366Sstefano_zampini const PetscScalar m_one = -1.0; 6202617d88aSStefano Zampini const PetscScalar zero = 0.0; 6210c7d97c5SJed Brown 6220c7d97c5SJed Brown /* This code is similar to that provided in nn.c for PCNN 6230c7d97c5SJed Brown NN interface preconditioner changed to BDDC 6240c7d97c5SJed Brown Added support for M_3 preconditioenr in the reference article (code is active if pcbddc->prec_type = PETSC_TRUE) */ 6250c7d97c5SJed Brown 6260c7d97c5SJed Brown 
PetscFunctionBegin; 627b76ba322SStefano Zampini if(!pcbddc->use_exact_dirichlet) { 6280c7d97c5SJed Brown /* First Dirichlet solve */ 6290c7d97c5SJed Brown ierr = VecScatterBegin(pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 6300c7d97c5SJed Brown ierr = VecScatterEnd (pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 63153cdbc3dSStefano Zampini ierr = KSPSolve(pcbddc->ksp_D,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr); 6320c7d97c5SJed Brown /* 6330c7d97c5SJed Brown Assembling right hand side for BDDC operator 6340c7d97c5SJed Brown - vec1_D for the Dirichlet part (if needed, i.e. prec_flag=PETSC_TRUE) 6350c7d97c5SJed Brown - the interface part of the global vector z 6360c7d97c5SJed Brown */ 6370c7d97c5SJed Brown ierr = VecScale(pcis->vec2_D,m_one);CHKERRQ(ierr); 6380c7d97c5SJed Brown ierr = MatMult(pcis->A_BI,pcis->vec2_D,pcis->vec1_B);CHKERRQ(ierr); 6390c7d97c5SJed Brown if(pcbddc->prec_type) { ierr = MatMultAdd(pcis->A_II,pcis->vec2_D,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); } 6400c7d97c5SJed Brown ierr = VecScale(pcis->vec2_D,m_one);CHKERRQ(ierr); 6410c7d97c5SJed Brown ierr = VecCopy(r,z);CHKERRQ(ierr); 6420c7d97c5SJed Brown ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 6430c7d97c5SJed Brown ierr = VecScatterEnd (pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 6442617d88aSStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 6452617d88aSStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 646b76ba322SStefano Zampini } else { 647b76ba322SStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,r,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 648b76ba322SStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,r,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 649b76ba322SStefano 
Zampini ierr = VecSet(pcis->vec2_D,zero);CHKERRQ(ierr); 650b76ba322SStefano Zampini } 651b76ba322SStefano Zampini 652b76ba322SStefano Zampini /* Apply partition of unity */ 6532617d88aSStefano Zampini ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr); 6542617d88aSStefano Zampini 6552617d88aSStefano Zampini /* Apply interface preconditioner 6562617d88aSStefano Zampini input/output vecs: pcis->vec1_B and pcis->vec1_D */ 6572617d88aSStefano Zampini ierr = PCBDDCApplyInterfacePreconditioner(pc);CHKERRQ(ierr); 6582617d88aSStefano Zampini 6592617d88aSStefano Zampini /* Apply partition of unity and sum boundary values */ 6602617d88aSStefano Zampini ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr); 6612617d88aSStefano Zampini ierr = VecSet(z,zero);CHKERRQ(ierr); 6622617d88aSStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 6632617d88aSStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 6640c7d97c5SJed Brown 6653b03a366Sstefano_zampini /* Second Dirichlet solve and assembling of output */ 6660c7d97c5SJed Brown ierr = VecScatterBegin(pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 6670c7d97c5SJed Brown ierr = VecScatterEnd (pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 6680c7d97c5SJed Brown ierr = MatMult(pcis->A_IB,pcis->vec1_B,pcis->vec3_D);CHKERRQ(ierr); 6690c7d97c5SJed Brown if(pcbddc->prec_type) { ierr = MatMultAdd(pcis->A_II,pcis->vec1_D,pcis->vec3_D,pcis->vec3_D);CHKERRQ(ierr); } 67053cdbc3dSStefano Zampini ierr = KSPSolve(pcbddc->ksp_D,pcis->vec3_D,pcbddc->vec4_D);CHKERRQ(ierr); 6710c7d97c5SJed Brown ierr = VecScale(pcbddc->vec4_D,m_one);CHKERRQ(ierr); 6720c7d97c5SJed Brown if(pcbddc->prec_type) { ierr = VecAXPY (pcbddc->vec4_D,one,pcis->vec1_D);CHKERRQ(ierr); } 6730c7d97c5SJed Brown ierr = VecAXPY 
(pcis->vec2_D,one,pcbddc->vec4_D);CHKERRQ(ierr); 6740c7d97c5SJed Brown ierr = VecScatterBegin(pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 6750c7d97c5SJed Brown ierr = VecScatterEnd (pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 6760c7d97c5SJed Brown PetscFunctionReturn(0); 6770c7d97c5SJed Brown 6780c7d97c5SJed Brown } 679da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */ 680da1bb401SStefano Zampini #undef __FUNCT__ 681da1bb401SStefano Zampini #define __FUNCT__ "PCDestroy_BDDC" 682da1bb401SStefano Zampini PetscErrorCode PCDestroy_BDDC(PC pc) 683da1bb401SStefano Zampini { 684da1bb401SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 685da1bb401SStefano Zampini PetscErrorCode ierr; 686da1bb401SStefano Zampini 687da1bb401SStefano Zampini PetscFunctionBegin; 688da1bb401SStefano Zampini /* free data created by PCIS */ 689da1bb401SStefano Zampini ierr = PCISDestroy(pc);CHKERRQ(ierr); 690da1bb401SStefano Zampini /* free BDDC data */ 6913972b0daSStefano Zampini ierr = VecDestroy(&pcbddc->temp_solution);CHKERRQ(ierr); 692534831adSStefano Zampini ierr = VecDestroy(&pcbddc->original_rhs);CHKERRQ(ierr); 693534831adSStefano Zampini ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr); 694534831adSStefano Zampini ierr = MatDestroy(&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr); 695da1bb401SStefano Zampini ierr = VecDestroy(&pcbddc->coarse_vec);CHKERRQ(ierr); 696da1bb401SStefano Zampini ierr = VecDestroy(&pcbddc->coarse_rhs);CHKERRQ(ierr); 697da1bb401SStefano Zampini ierr = KSPDestroy(&pcbddc->coarse_ksp);CHKERRQ(ierr); 698da1bb401SStefano Zampini ierr = MatDestroy(&pcbddc->coarse_mat);CHKERRQ(ierr); 699da1bb401SStefano Zampini ierr = MatDestroy(&pcbddc->coarse_phi_B);CHKERRQ(ierr); 700da1bb401SStefano Zampini ierr = MatDestroy(&pcbddc->coarse_phi_D);CHKERRQ(ierr); 701da1bb401SStefano Zampini ierr = VecDestroy(&pcbddc->vec1_P);CHKERRQ(ierr); 
702da1bb401SStefano Zampini ierr = VecDestroy(&pcbddc->vec1_C);CHKERRQ(ierr); 703da1bb401SStefano Zampini ierr = MatDestroy(&pcbddc->local_auxmat1);CHKERRQ(ierr); 704da1bb401SStefano Zampini ierr = MatDestroy(&pcbddc->local_auxmat2);CHKERRQ(ierr); 705da1bb401SStefano Zampini ierr = VecDestroy(&pcbddc->vec1_R);CHKERRQ(ierr); 706da1bb401SStefano Zampini ierr = VecDestroy(&pcbddc->vec2_R);CHKERRQ(ierr); 707da1bb401SStefano Zampini ierr = VecDestroy(&pcbddc->vec4_D);CHKERRQ(ierr); 708da1bb401SStefano Zampini ierr = VecScatterDestroy(&pcbddc->R_to_B);CHKERRQ(ierr); 709da1bb401SStefano Zampini ierr = VecScatterDestroy(&pcbddc->R_to_D);CHKERRQ(ierr); 710da1bb401SStefano Zampini ierr = VecScatterDestroy(&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr); 711da1bb401SStefano Zampini ierr = KSPDestroy(&pcbddc->ksp_D);CHKERRQ(ierr); 712da1bb401SStefano Zampini ierr = KSPDestroy(&pcbddc->ksp_R);CHKERRQ(ierr); 713da1bb401SStefano Zampini ierr = ISDestroy(&pcbddc->NeumannBoundaries);CHKERRQ(ierr); 714da1bb401SStefano Zampini ierr = ISDestroy(&pcbddc->DirichletBoundaries);CHKERRQ(ierr); 715da1bb401SStefano Zampini ierr = MatDestroy(&pcbddc->ConstraintMatrix);CHKERRQ(ierr); 716da1bb401SStefano Zampini ierr = PetscFree(pcbddc->local_primal_indices);CHKERRQ(ierr); 717da1bb401SStefano Zampini ierr = PetscFree(pcbddc->replicated_local_primal_indices);CHKERRQ(ierr); 718da1bb401SStefano Zampini if (pcbddc->replicated_local_primal_values) { free(pcbddc->replicated_local_primal_values); } 719da1bb401SStefano Zampini ierr = PetscFree(pcbddc->local_primal_displacements);CHKERRQ(ierr); 720da1bb401SStefano Zampini ierr = PetscFree(pcbddc->local_primal_sizes);CHKERRQ(ierr); 721da1bb401SStefano Zampini PetscInt i; 722da1bb401SStefano Zampini for(i=0;i<pcbddc->n_ISForDofs;i++) { ierr = ISDestroy(&pcbddc->ISForDofs[i]);CHKERRQ(ierr); } 723da1bb401SStefano Zampini ierr = PetscFree(pcbddc->ISForDofs);CHKERRQ(ierr); 724da1bb401SStefano Zampini for(i=0;i<pcbddc->n_ISForFaces;i++) { ierr = 
ISDestroy(&pcbddc->ISForFaces[i]);CHKERRQ(ierr); } 725da1bb401SStefano Zampini ierr = PetscFree(pcbddc->ISForFaces);CHKERRQ(ierr); 726da1bb401SStefano Zampini for(i=0;i<pcbddc->n_ISForEdges;i++) { ierr = ISDestroy(&pcbddc->ISForEdges[i]);CHKERRQ(ierr); } 727da1bb401SStefano Zampini ierr = PetscFree(pcbddc->ISForEdges);CHKERRQ(ierr); 728da1bb401SStefano Zampini ierr = ISDestroy(&pcbddc->ISForVertices);CHKERRQ(ierr); 7293972b0daSStefano Zampini /* Free graph structure */ 730da1bb401SStefano Zampini ierr = PetscFree(pcbddc->mat_graph->xadj);CHKERRQ(ierr); 731da1bb401SStefano Zampini ierr = PetscFree(pcbddc->mat_graph->adjncy);CHKERRQ(ierr); 732da1bb401SStefano Zampini ierr = PetscFree(pcbddc->mat_graph->neighbours_set[0]);CHKERRQ(ierr); 733da1bb401SStefano Zampini ierr = PetscFree(pcbddc->mat_graph->neighbours_set);CHKERRQ(ierr); 7343972b0daSStefano Zampini ierr = PetscFree4(pcbddc->mat_graph->where,pcbddc->mat_graph->count,pcbddc->mat_graph->cptr,pcbddc->mat_graph->queue);CHKERRQ(ierr); 7353972b0daSStefano Zampini ierr = PetscFree2(pcbddc->mat_graph->which_dof,pcbddc->mat_graph->touched);CHKERRQ(ierr); 7363972b0daSStefano Zampini ierr = PetscFree(pcbddc->mat_graph->where_ncmps);CHKERRQ(ierr); 737da1bb401SStefano Zampini ierr = PetscFree(pcbddc->mat_graph);CHKERRQ(ierr); 7383425bc38SStefano Zampini /* remove functions */ 7393425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDirichletBoundaries_C","",PETSC_NULL);CHKERRQ(ierr); 7403425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNeumannBoundaries_C","",PETSC_NULL);CHKERRQ(ierr); 7413425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetDirichletBoundaries_C","",PETSC_NULL);CHKERRQ(ierr); 7423425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetNeumannBoundaries_C","",PETSC_NULL);CHKERRQ(ierr); 7433425bc38SStefano Zampini ierr = 
PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseProblemType_C","",PETSC_NULL);CHKERRQ(ierr); 7443425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDofsSplitting_C","",PETSC_NULL);CHKERRQ(ierr); 7453425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetLocalAdjacencyGraph_C","",PETSC_NULL);CHKERRQ(ierr); 7463425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPreSolve_C","",PETSC_NULL);CHKERRQ(ierr); 7473425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPostSolve_C","",PETSC_NULL);CHKERRQ(ierr); 7483425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCCreateFETIDPOperators_C","",PETSC_NULL);CHKERRQ(ierr); 7493425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetRHS_C","",PETSC_NULL);CHKERRQ(ierr); 7503425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetSolution_C","",PETSC_NULL);CHKERRQ(ierr); 751da1bb401SStefano Zampini /* Free the private data structure that was hanging off the PC */ 752da1bb401SStefano Zampini ierr = PetscFree(pcbddc);CHKERRQ(ierr); 753da1bb401SStefano Zampini PetscFunctionReturn(0); 754da1bb401SStefano Zampini } 7553425bc38SStefano Zampini /* -------------------------------------------------------------------------- */ 7563425bc38SStefano Zampini EXTERN_C_BEGIN 7573425bc38SStefano Zampini #undef __FUNCT__ 7583425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetRHS_BDDC" 7593425bc38SStefano Zampini static PetscErrorCode PCBDDCMatFETIDPGetRHS_BDDC(Mat fetidp_mat, Vec standard_rhs, Vec fetidp_flux_rhs) 7603425bc38SStefano Zampini { 7613425bc38SStefano Zampini FETIDPMat_ctx *mat_ctx; 7623425bc38SStefano Zampini PC_IS* pcis; 7633425bc38SStefano Zampini PC_BDDC* pcbddc; 7643425bc38SStefano Zampini Mat_IS* matis; 7653425bc38SStefano Zampini PetscErrorCode 
ierr; 7660c7d97c5SJed Brown 7673425bc38SStefano Zampini PetscFunctionBegin; 7683425bc38SStefano Zampini ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr); 7693425bc38SStefano Zampini pcis = (PC_IS*)mat_ctx->pc->data; 7703425bc38SStefano Zampini pcbddc = (PC_BDDC*)mat_ctx->pc->data; 7713425bc38SStefano Zampini matis = (Mat_IS*)mat_ctx->pc->pmat->data; 7723425bc38SStefano Zampini 7733425bc38SStefano Zampini /* change of basis for physical rhs if needed 7743425bc38SStefano Zampini It also changes the rhs in case of dirichlet boundaries */ 7753425bc38SStefano Zampini (*mat_ctx->pc->ops->presolve)(mat_ctx->pc,PETSC_NULL,standard_rhs,PETSC_NULL); 7763425bc38SStefano Zampini /* store vectors for computation of fetidp final solution */ 7773425bc38SStefano Zampini ierr = VecScatterBegin(pcis->global_to_D,standard_rhs,mat_ctx->temp_solution_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 7783425bc38SStefano Zampini ierr = VecScatterEnd (pcis->global_to_D,standard_rhs,mat_ctx->temp_solution_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 7793425bc38SStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 7803425bc38SStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 7813425bc38SStefano Zampini /* scale rhs since it should be unassembled */ 7823425bc38SStefano Zampini ierr = VecPointwiseMult(mat_ctx->temp_solution_B,pcis->D,mat_ctx->temp_solution_B);CHKERRQ(ierr); 7833425bc38SStefano Zampini if(!pcbddc->prec_type) { 7843425bc38SStefano Zampini /* compute partially subassembled Schur complement right-hand side */ 7853425bc38SStefano Zampini ierr = KSPSolve(pcbddc->ksp_D,mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr); 7863425bc38SStefano Zampini ierr = MatMult(pcis->A_BI,pcis->vec1_D,pcis->vec1_B);CHKERRQ(ierr); 7873425bc38SStefano Zampini ierr = 
VecAXPY(mat_ctx->temp_solution_B,-1.0,pcis->vec1_B);CHKERRQ(ierr); 7883425bc38SStefano Zampini ierr = VecSet(standard_rhs,0.0);CHKERRQ(ierr); 7893425bc38SStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,mat_ctx->temp_solution_B,standard_rhs,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 7903425bc38SStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,mat_ctx->temp_solution_B,standard_rhs,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 7913425bc38SStefano Zampini ierr = VecScatterBegin(pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 7923425bc38SStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 7933425bc38SStefano Zampini ierr = VecPointwiseMult(mat_ctx->temp_solution_B,pcis->D,mat_ctx->temp_solution_B);CHKERRQ(ierr); 7943425bc38SStefano Zampini } 7953425bc38SStefano Zampini /* BDDC rhs */ 7963425bc38SStefano Zampini ierr = VecCopy(mat_ctx->temp_solution_B,pcis->vec1_B);CHKERRQ(ierr); 7973425bc38SStefano Zampini if(pcbddc->prec_type) { 7983425bc38SStefano Zampini ierr = VecCopy(mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr); 7993425bc38SStefano Zampini } 8003425bc38SStefano Zampini /* apply BDDC */ 8013425bc38SStefano Zampini ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr); 8023425bc38SStefano Zampini /* Application of B_delta and assembling of rhs for fetidp fluxes */ 8033425bc38SStefano Zampini ierr = VecSet(fetidp_flux_rhs,0.0);CHKERRQ(ierr); 8043425bc38SStefano Zampini ierr = MatMult(mat_ctx->B_delta,pcis->vec1_B,mat_ctx->lambda_local);CHKERRQ(ierr); 8053425bc38SStefano Zampini ierr = VecScatterBegin(mat_ctx->l2g_lambda,mat_ctx->lambda_local,fetidp_flux_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8063425bc38SStefano Zampini ierr = VecScatterEnd (mat_ctx->l2g_lambda,mat_ctx->lambda_local,fetidp_flux_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 8073425bc38SStefano Zampini /* restore 
original rhs */ 8083425bc38SStefano Zampini ierr = VecCopy(pcbddc->original_rhs,standard_rhs);CHKERRQ(ierr); 8093425bc38SStefano Zampini PetscFunctionReturn(0); 8103425bc38SStefano Zampini } 8113425bc38SStefano Zampini EXTERN_C_END 8123425bc38SStefano Zampini #undef __FUNCT__ 8133425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetRHS" 8143425bc38SStefano Zampini /*@ 8153425bc38SStefano Zampini PCBDDCMatFETIDPGetRHS - Get rhs for FETIDP linear system. 8163425bc38SStefano Zampini 8173425bc38SStefano Zampini Collective 8183425bc38SStefano Zampini 8193425bc38SStefano Zampini Input Parameters: 8203425bc38SStefano Zampini + fetidp_mat - the FETIDP mat obtained by a call to PCBDDCCreateFETIDPOperators 8213425bc38SStefano Zampini + standard_rhs - the rhs of your linear system 8223425bc38SStefano Zampini 8233425bc38SStefano Zampini Output Parameters: 8243425bc38SStefano Zampini + fetidp_flux_rhs - the rhs of the FETIDP linear system 8253425bc38SStefano Zampini 8263425bc38SStefano Zampini Level: developer 8273425bc38SStefano Zampini 8283425bc38SStefano Zampini Notes: 8293425bc38SStefano Zampini 8303425bc38SStefano Zampini .seealso: PCBDDC 8313425bc38SStefano Zampini @*/ 8323425bc38SStefano Zampini PetscErrorCode PCBDDCMatFETIDPGetRHS(Mat fetidp_mat, Vec standard_rhs, Vec fetidp_flux_rhs) 8333425bc38SStefano Zampini { 8343425bc38SStefano Zampini FETIDPMat_ctx *mat_ctx; 8353425bc38SStefano Zampini PetscErrorCode ierr; 8363425bc38SStefano Zampini 8373425bc38SStefano Zampini PetscFunctionBegin; 8383425bc38SStefano Zampini ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr); 8393425bc38SStefano Zampini ierr = PetscTryMethod(mat_ctx->pc,"PCBDDCMatFETIDPGetRHS_C",(Mat,Vec,Vec),(fetidp_mat,standard_rhs,fetidp_flux_rhs));CHKERRQ(ierr); 8403425bc38SStefano Zampini PetscFunctionReturn(0); 8413425bc38SStefano Zampini } 8423425bc38SStefano Zampini /* -------------------------------------------------------------------------- */ 8433425bc38SStefano Zampini EXTERN_C_BEGIN 
8443425bc38SStefano Zampini #undef __FUNCT__ 8453425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetSolution_BDDC" 8463425bc38SStefano Zampini static PetscErrorCode PCBDDCMatFETIDPGetSolution_BDDC(Mat fetidp_mat, Vec fetidp_flux_sol, Vec standard_sol) 8473425bc38SStefano Zampini { 8483425bc38SStefano Zampini FETIDPMat_ctx *mat_ctx; 8493425bc38SStefano Zampini PC_IS* pcis; 8503425bc38SStefano Zampini PC_BDDC* pcbddc; 8513425bc38SStefano Zampini Mat_IS* matis; 8523425bc38SStefano Zampini PetscErrorCode ierr; 8533425bc38SStefano Zampini 8543425bc38SStefano Zampini PetscFunctionBegin; 8553425bc38SStefano Zampini ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr); 8563425bc38SStefano Zampini pcis = (PC_IS*)mat_ctx->pc->data; 8573425bc38SStefano Zampini pcbddc = (PC_BDDC*)mat_ctx->pc->data; 8583425bc38SStefano Zampini matis = (Mat_IS*)mat_ctx->pc->pmat->data; 8593425bc38SStefano Zampini 8603425bc38SStefano Zampini /* apply B_delta^T */ 8613425bc38SStefano Zampini ierr = VecScatterBegin(mat_ctx->l2g_lambda,fetidp_flux_sol,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8623425bc38SStefano Zampini ierr = VecScatterEnd (mat_ctx->l2g_lambda,fetidp_flux_sol,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8633425bc38SStefano Zampini ierr = MatMultTranspose(mat_ctx->B_delta,mat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr); 8643425bc38SStefano Zampini /* compute rhs for BDDC application */ 8653425bc38SStefano Zampini ierr = VecAYPX(pcis->vec1_B,-1.0,mat_ctx->temp_solution_B);CHKERRQ(ierr); 8663425bc38SStefano Zampini if(pcbddc->prec_type) { 8673425bc38SStefano Zampini ierr = VecCopy(mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr); 8683425bc38SStefano Zampini } 8693425bc38SStefano Zampini /* apply BDDC */ 8703425bc38SStefano Zampini ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr); 8713425bc38SStefano Zampini /* put values into standard global vector */ 8723425bc38SStefano Zampini ierr = 
VecScatterBegin(pcis->global_to_B,pcis->vec1_B,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8733425bc38SStefano Zampini ierr = VecScatterEnd (pcis->global_to_B,pcis->vec1_B,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8743425bc38SStefano Zampini if(!pcbddc->prec_type) { 8753425bc38SStefano Zampini /* compute values into the interior if solved for the partially subassembled Schur complement */ 8763425bc38SStefano Zampini ierr = MatMult(pcis->A_IB,pcis->vec1_B,pcis->vec1_D);CHKERRQ(ierr); 8773425bc38SStefano Zampini ierr = VecAXPY(mat_ctx->temp_solution_D,-1.0,pcis->vec1_D);CHKERRQ(ierr); 8783425bc38SStefano Zampini ierr = KSPSolve(pcbddc->ksp_D,mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr); 8793425bc38SStefano Zampini } 8803425bc38SStefano Zampini ierr = VecScatterBegin(pcis->global_to_D,pcis->vec1_D,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8813425bc38SStefano Zampini ierr = VecScatterEnd (pcis->global_to_D,pcis->vec1_D,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 8823425bc38SStefano Zampini /* final change of basis if needed 8833425bc38SStefano Zampini Is also sums the dirichlet part removed during RHS assembling */ 8843425bc38SStefano Zampini (*mat_ctx->pc->ops->postsolve)(mat_ctx->pc,PETSC_NULL,PETSC_NULL,standard_sol); 8853425bc38SStefano Zampini PetscFunctionReturn(0); 8863425bc38SStefano Zampini 8873425bc38SStefano Zampini } 8883425bc38SStefano Zampini EXTERN_C_END 8893425bc38SStefano Zampini #undef __FUNCT__ 8903425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetSolution" 8913425bc38SStefano Zampini /*@ 8923425bc38SStefano Zampini PCBDDCMatFETIDPGetSolution - Get Solution for FETIDP linear system. 
8933425bc38SStefano Zampini 8943425bc38SStefano Zampini Collective 8953425bc38SStefano Zampini 8963425bc38SStefano Zampini Input Parameters: 8973425bc38SStefano Zampini + fetidp_mat - the FETIDP mat obtained by a call to PCBDDCCreateFETIDPOperators 8983425bc38SStefano Zampini + fetidp_flux_sol - the solution of the FETIDP linear system 8993425bc38SStefano Zampini 9003425bc38SStefano Zampini Output Parameters: 9013425bc38SStefano Zampini + standard_sol - the solution on the global domain 9023425bc38SStefano Zampini 9033425bc38SStefano Zampini Level: developer 9043425bc38SStefano Zampini 9053425bc38SStefano Zampini Notes: 9063425bc38SStefano Zampini 9073425bc38SStefano Zampini .seealso: PCBDDC 9083425bc38SStefano Zampini @*/ 9093425bc38SStefano Zampini PetscErrorCode PCBDDCMatFETIDPGetSolution(Mat fetidp_mat, Vec fetidp_flux_sol, Vec standard_sol) 9103425bc38SStefano Zampini { 9113425bc38SStefano Zampini FETIDPMat_ctx *mat_ctx; 9123425bc38SStefano Zampini PetscErrorCode ierr; 9133425bc38SStefano Zampini 9143425bc38SStefano Zampini PetscFunctionBegin; 9153425bc38SStefano Zampini ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr); 9163425bc38SStefano Zampini ierr = PetscTryMethod(mat_ctx->pc,"PCBDDCMatFETIDPGetSolution_C",(Mat,Vec,Vec),(fetidp_mat,fetidp_flux_sol,standard_sol));CHKERRQ(ierr); 9173425bc38SStefano Zampini PetscFunctionReturn(0); 9183425bc38SStefano Zampini } 9193425bc38SStefano Zampini /* -------------------------------------------------------------------------- */ 9203425bc38SStefano Zampini EXTERN_C_BEGIN 9213425bc38SStefano Zampini #undef __FUNCT__ 9223425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPOperators_BDDC" 9233425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPOperators_BDDC(PC pc, Mat *fetidp_mat, PC *fetidp_pc) 9243425bc38SStefano Zampini { 9253425bc38SStefano Zampini PETSC_EXTERN PetscErrorCode FETIDPMatMult(Mat,Vec,Vec); 9263425bc38SStefano Zampini PETSC_EXTERN PetscErrorCode 
PCBDDCDestroyFETIDPMat(Mat); 9273425bc38SStefano Zampini PETSC_EXTERN PetscErrorCode FETIDPPCApply(PC,Vec,Vec); 9283425bc38SStefano Zampini PETSC_EXTERN PetscErrorCode PCBDDCDestroyFETIDPPC(PC); 9293425bc38SStefano Zampini 9303425bc38SStefano Zampini FETIDPMat_ctx *fetidpmat_ctx; 9313425bc38SStefano Zampini Mat newmat; 9323425bc38SStefano Zampini FETIDPPC_ctx *fetidppc_ctx; 9333425bc38SStefano Zampini PC newpc; 9343425bc38SStefano Zampini MPI_Comm comm = ((PetscObject)pc)->comm; 9353425bc38SStefano Zampini PetscErrorCode ierr; 9363425bc38SStefano Zampini 9373425bc38SStefano Zampini PetscFunctionBegin; 9383425bc38SStefano Zampini /* FETIDP linear matrix */ 9393425bc38SStefano Zampini ierr = PCBDDCCreateFETIDPMatContext(pc, &fetidpmat_ctx);CHKERRQ(ierr); 9403425bc38SStefano Zampini ierr = PCBDDCSetupFETIDPMatContext(fetidpmat_ctx);CHKERRQ(ierr); 9413425bc38SStefano Zampini ierr = MatCreateShell(comm,PETSC_DECIDE,PETSC_DECIDE,fetidpmat_ctx->n_lambda,fetidpmat_ctx->n_lambda,fetidpmat_ctx,&newmat);CHKERRQ(ierr); 9423425bc38SStefano Zampini ierr = MatShellSetOperation(newmat,MATOP_MULT,(void (*)(void))FETIDPMatMult);CHKERRQ(ierr); 9433425bc38SStefano Zampini ierr = MatShellSetOperation(newmat,MATOP_DESTROY,(void (*)(void))PCBDDCDestroyFETIDPMat);CHKERRQ(ierr); 9443425bc38SStefano Zampini ierr = MatSetUp(newmat);CHKERRQ(ierr); 9453425bc38SStefano Zampini /* FETIDP preconditioner */ 9463425bc38SStefano Zampini ierr = PCBDDCCreateFETIDPPCContext(pc, &fetidppc_ctx);CHKERRQ(ierr); 9473425bc38SStefano Zampini ierr = PCBDDCSetupFETIDPPCContext(newmat,fetidppc_ctx);CHKERRQ(ierr); 9483425bc38SStefano Zampini ierr = PCCreate(comm,&newpc);CHKERRQ(ierr); 9493425bc38SStefano Zampini ierr = PCSetType(newpc,PCSHELL);CHKERRQ(ierr); 9503425bc38SStefano Zampini ierr = PCShellSetContext(newpc,fetidppc_ctx);CHKERRQ(ierr); 9513425bc38SStefano Zampini ierr = PCShellSetApply(newpc,FETIDPPCApply);CHKERRQ(ierr); 9523425bc38SStefano Zampini ierr = 
PCShellSetDestroy(newpc,PCBDDCDestroyFETIDPPC);CHKERRQ(ierr); 9533425bc38SStefano Zampini ierr = PCSetOperators(newpc,newmat,newmat,SAME_PRECONDITIONER);CHKERRQ(ierr); 9543425bc38SStefano Zampini ierr = PCSetUp(newpc);CHKERRQ(ierr); 9553425bc38SStefano Zampini /* return pointers for objects created */ 9563425bc38SStefano Zampini *fetidp_mat=newmat; 9573425bc38SStefano Zampini *fetidp_pc=newpc; 9583425bc38SStefano Zampini 9593425bc38SStefano Zampini PetscFunctionReturn(0); 9603425bc38SStefano Zampini } 9613425bc38SStefano Zampini EXTERN_C_END 9623425bc38SStefano Zampini #undef __FUNCT__ 9633425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPOperators" 9643425bc38SStefano Zampini /*@ 9653425bc38SStefano Zampini PCBDDCCreateFETIDPOperators - Create operators for FETIDP. 9663425bc38SStefano Zampini 9673425bc38SStefano Zampini Collective 9683425bc38SStefano Zampini 9693425bc38SStefano Zampini Input Parameters: 9703425bc38SStefano Zampini + pc - the BDDC preconditioning context (setup must be already called) 9713425bc38SStefano Zampini 9723425bc38SStefano Zampini Level: developer 9733425bc38SStefano Zampini 9743425bc38SStefano Zampini Notes: 9753425bc38SStefano Zampini 9763425bc38SStefano Zampini .seealso: PCBDDC 9773425bc38SStefano Zampini @*/ 9783425bc38SStefano Zampini PetscErrorCode PCBDDCCreateFETIDPOperators(PC pc, Mat *fetidp_mat, PC *fetidp_pc) 9793425bc38SStefano Zampini { 9803425bc38SStefano Zampini PetscErrorCode ierr; 9813425bc38SStefano Zampini 9823425bc38SStefano Zampini PetscFunctionBegin; 9833425bc38SStefano Zampini PetscValidHeaderSpecific(pc,PC_CLASSID,1); 9843425bc38SStefano Zampini if (pc->setupcalled) { 9853425bc38SStefano Zampini ierr = PetscTryMethod(pc,"PCBDDCCreateFETIDPOperators_C",(PC,Mat*,PC*),(pc,fetidp_mat,fetidp_pc));CHKERRQ(ierr); 9863425bc38SStefano Zampini } else { 9873425bc38SStefano Zampini SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"You must call PCSetup_BDDC before calling %s\n",__FUNCT__); 9883425bc38SStefano Zampini } 
9893425bc38SStefano Zampini PetscFunctionReturn(0); 9903425bc38SStefano Zampini } 9910c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 992da1bb401SStefano Zampini /*MC 993da1bb401SStefano Zampini PCBDDC - Balancing Domain Decomposition by Constraints. 9940c7d97c5SJed Brown 995da1bb401SStefano Zampini Options Database Keys: 996da1bb401SStefano Zampini . -pcbddc ??? - 997da1bb401SStefano Zampini 998da1bb401SStefano Zampini Level: intermediate 999da1bb401SStefano Zampini 1000da1bb401SStefano Zampini Notes: The matrix used with this preconditioner must be of type MATIS 1001da1bb401SStefano Zampini 1002da1bb401SStefano Zampini Unlike more 'conventional' interface preconditioners, this iterates over ALL the 1003da1bb401SStefano Zampini degrees of freedom, NOT just those on the interface (this allows the use of approximate solvers 1004da1bb401SStefano Zampini on the subdomains). 1005da1bb401SStefano Zampini 1006da1bb401SStefano Zampini Options for the coarse grid preconditioner can be set with - 1007da1bb401SStefano Zampini Options for the Dirichlet subproblem can be set with - 1008da1bb401SStefano Zampini Options for the Neumann subproblem can be set with - 1009da1bb401SStefano Zampini 1010da1bb401SStefano Zampini Contributed by Stefano Zampini 1011da1bb401SStefano Zampini 1012da1bb401SStefano Zampini .seealso: PCCreate(), PCSetType(), PCType (for list of available types), PC, MATIS 1013da1bb401SStefano Zampini M*/ 1014da1bb401SStefano Zampini EXTERN_C_BEGIN 1015da1bb401SStefano Zampini #undef __FUNCT__ 1016da1bb401SStefano Zampini #define __FUNCT__ "PCCreate_BDDC" 1017da1bb401SStefano Zampini PetscErrorCode PCCreate_BDDC(PC pc) 1018da1bb401SStefano Zampini { 1019da1bb401SStefano Zampini PetscErrorCode ierr; 1020da1bb401SStefano Zampini PC_BDDC *pcbddc; 1021da1bb401SStefano Zampini PCBDDCGraph mat_graph; 1022da1bb401SStefano Zampini 1023da1bb401SStefano Zampini PetscFunctionBegin; 1024da1bb401SStefano Zampini /* Creates 
the private data structure for this preconditioner and attach it to the PC object. */ 1025da1bb401SStefano Zampini ierr = PetscNewLog(pc,PC_BDDC,&pcbddc);CHKERRQ(ierr); 1026da1bb401SStefano Zampini pc->data = (void*)pcbddc; 1027da1bb401SStefano Zampini 1028da1bb401SStefano Zampini /* create PCIS data structure */ 1029da1bb401SStefano Zampini ierr = PCISCreate(pc);CHKERRQ(ierr); 1030da1bb401SStefano Zampini 1031da1bb401SStefano Zampini /* BDDC specific */ 10323972b0daSStefano Zampini pcbddc->temp_solution = 0; 1033534831adSStefano Zampini pcbddc->original_rhs = 0; 1034534831adSStefano Zampini pcbddc->local_mat = 0; 1035534831adSStefano Zampini pcbddc->ChangeOfBasisMatrix = 0; 1036534831adSStefano Zampini pcbddc->usechangeofbasis = PETSC_TRUE; 1037534831adSStefano Zampini pcbddc->usechangeonfaces = PETSC_FALSE; 1038da1bb401SStefano Zampini pcbddc->coarse_vec = 0; 1039da1bb401SStefano Zampini pcbddc->coarse_rhs = 0; 1040da1bb401SStefano Zampini pcbddc->coarse_ksp = 0; 1041da1bb401SStefano Zampini pcbddc->coarse_phi_B = 0; 1042da1bb401SStefano Zampini pcbddc->coarse_phi_D = 0; 1043da1bb401SStefano Zampini pcbddc->vec1_P = 0; 1044da1bb401SStefano Zampini pcbddc->vec1_R = 0; 1045da1bb401SStefano Zampini pcbddc->vec2_R = 0; 1046da1bb401SStefano Zampini pcbddc->local_auxmat1 = 0; 1047da1bb401SStefano Zampini pcbddc->local_auxmat2 = 0; 1048da1bb401SStefano Zampini pcbddc->R_to_B = 0; 1049da1bb401SStefano Zampini pcbddc->R_to_D = 0; 1050da1bb401SStefano Zampini pcbddc->ksp_D = 0; 1051da1bb401SStefano Zampini pcbddc->ksp_R = 0; 1052da1bb401SStefano Zampini pcbddc->local_primal_indices = 0; 1053da1bb401SStefano Zampini pcbddc->prec_type = PETSC_FALSE; 1054da1bb401SStefano Zampini pcbddc->NeumannBoundaries = 0; 1055da1bb401SStefano Zampini pcbddc->ISForDofs = 0; 1056da1bb401SStefano Zampini pcbddc->ISForVertices = 0; 1057da1bb401SStefano Zampini pcbddc->n_ISForFaces = 0; 1058da1bb401SStefano Zampini pcbddc->n_ISForEdges = 0; 1059da1bb401SStefano Zampini pcbddc->ConstraintMatrix 
= 0; 1060da1bb401SStefano Zampini pcbddc->use_nnsp_true = PETSC_FALSE; 1061da1bb401SStefano Zampini pcbddc->local_primal_sizes = 0; 1062da1bb401SStefano Zampini pcbddc->local_primal_displacements = 0; 1063da1bb401SStefano Zampini pcbddc->replicated_local_primal_indices = 0; 1064da1bb401SStefano Zampini pcbddc->replicated_local_primal_values = 0; 1065da1bb401SStefano Zampini pcbddc->coarse_loc_to_glob = 0; 1066da1bb401SStefano Zampini pcbddc->dbg_flag = PETSC_FALSE; 1067da1bb401SStefano Zampini pcbddc->coarsening_ratio = 8; 1068b76ba322SStefano Zampini pcbddc->use_exact_dirichlet = PETSC_TRUE; 1069da1bb401SStefano Zampini 1070da1bb401SStefano Zampini /* allocate and initialize needed graph structure */ 1071da1bb401SStefano Zampini ierr = PetscMalloc(sizeof(*mat_graph),&pcbddc->mat_graph);CHKERRQ(ierr); 1072da1bb401SStefano Zampini pcbddc->mat_graph->xadj = 0; 1073da1bb401SStefano Zampini pcbddc->mat_graph->adjncy = 0; 1074da1bb401SStefano Zampini 1075da1bb401SStefano Zampini /* function pointers */ 1076da1bb401SStefano Zampini pc->ops->apply = PCApply_BDDC; 1077da1bb401SStefano Zampini pc->ops->applytranspose = 0; 1078da1bb401SStefano Zampini pc->ops->setup = PCSetUp_BDDC; 1079da1bb401SStefano Zampini pc->ops->destroy = PCDestroy_BDDC; 1080da1bb401SStefano Zampini pc->ops->setfromoptions = PCSetFromOptions_BDDC; 1081da1bb401SStefano Zampini pc->ops->view = 0; 1082da1bb401SStefano Zampini pc->ops->applyrichardson = 0; 1083da1bb401SStefano Zampini pc->ops->applysymmetricleft = 0; 1084da1bb401SStefano Zampini pc->ops->applysymmetricright = 0; 1085534831adSStefano Zampini pc->ops->presolve = PCPreSolve_BDDC; 1086534831adSStefano Zampini pc->ops->postsolve = PCPostSolve_BDDC; 1087da1bb401SStefano Zampini 1088da1bb401SStefano Zampini /* composing function */ 1089da1bb401SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDirichletBoundaries_C","PCBDDCSetDirichletBoundaries_BDDC", 1090da1bb401SStefano Zampini 
PCBDDCSetDirichletBoundaries_BDDC);CHKERRQ(ierr); 1091da1bb401SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNeumannBoundaries_C","PCBDDCSetNeumannBoundaries_BDDC", 1092da1bb401SStefano Zampini PCBDDCSetNeumannBoundaries_BDDC);CHKERRQ(ierr); 1093da1bb401SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetDirichletBoundaries_C","PCBDDCGetDirichletBoundaries_BDDC", 1094da1bb401SStefano Zampini PCBDDCGetDirichletBoundaries_BDDC);CHKERRQ(ierr); 1095da1bb401SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetNeumannBoundaries_C","PCBDDCGetNeumannBoundaries_BDDC", 1096da1bb401SStefano Zampini PCBDDCGetNeumannBoundaries_BDDC);CHKERRQ(ierr); 1097da1bb401SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseProblemType_C","PCBDDCSetCoarseProblemType_BDDC", 1098da1bb401SStefano Zampini PCBDDCSetCoarseProblemType_BDDC);CHKERRQ(ierr); 1099da1bb401SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDofsSplitting_C","PCBDDCSetDofsSplitting_BDDC", 1100da1bb401SStefano Zampini PCBDDCSetDofsSplitting_BDDC);CHKERRQ(ierr); 1101da1bb401SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetLocalAdjacencyGraph_C","PCBDDCSetLocalAdjacencyGraph_BDDC", 1102da1bb401SStefano Zampini PCBDDCSetLocalAdjacencyGraph_BDDC);CHKERRQ(ierr); 1103534831adSStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPreSolve_C","PCPreSolve_BDDC", 1104534831adSStefano Zampini PCPreSolve_BDDC);CHKERRQ(ierr); 1105534831adSStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPostSolve_C","PCPostSolve_BDDC", 1106534831adSStefano Zampini PCPostSolve_BDDC);CHKERRQ(ierr); 11073425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCCreateFETIDPOperators_C","PCBDDCCreateFETIDPOperators_BDDC", 11083425bc38SStefano Zampini 
PCBDDCCreateFETIDPOperators_BDDC);CHKERRQ(ierr); 11093425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetRHS_C","PCBDDCMatFETIDPGetRHS_BDDC", 11103425bc38SStefano Zampini PCBDDCMatFETIDPGetRHS_BDDC);CHKERRQ(ierr); 11113425bc38SStefano Zampini ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetSolution_C","PCBDDCMatFETIDPGetSolution_BDDC", 11123425bc38SStefano Zampini PCBDDCMatFETIDPGetSolution_BDDC);CHKERRQ(ierr); 1113da1bb401SStefano Zampini PetscFunctionReturn(0); 1114da1bb401SStefano Zampini } 1115da1bb401SStefano Zampini EXTERN_C_END 11163425bc38SStefano Zampini 1117da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */ 1118da1bb401SStefano Zampini /* All static functions from now on */ 1119da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */ 11203425bc38SStefano Zampini 11213425bc38SStefano Zampini #undef __FUNCT__ 11223425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPMatContext" 11233425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPMatContext(PC pc, FETIDPMat_ctx **fetidpmat_ctx) 11243425bc38SStefano Zampini { 11253425bc38SStefano Zampini FETIDPMat_ctx *newctx; 11263425bc38SStefano Zampini PetscErrorCode ierr; 11273425bc38SStefano Zampini 11283425bc38SStefano Zampini PetscFunctionBegin; 11293425bc38SStefano Zampini ierr = PetscMalloc(sizeof(*newctx),&newctx);CHKERRQ(ierr); 11303425bc38SStefano Zampini newctx->lambda_local = 0; 11313425bc38SStefano Zampini newctx->temp_solution_B = 0; 11323425bc38SStefano Zampini newctx->temp_solution_D = 0; 11333425bc38SStefano Zampini newctx->B_delta = 0; 11343425bc38SStefano Zampini newctx->B_Ddelta = 0; /* theoretically belongs to the FETIDP preconditioner */ 11353425bc38SStefano Zampini newctx->l2g_lambda = 0; 11363425bc38SStefano Zampini /* increase the reference count for BDDC preconditioner */ 11373425bc38SStefano 
Zampini ierr = PetscObjectReference((PetscObject)pc);CHKERRQ(ierr); 11383425bc38SStefano Zampini newctx->pc = pc; 11393425bc38SStefano Zampini *fetidpmat_ctx = newctx; 11403425bc38SStefano Zampini PetscFunctionReturn(0); 11413425bc38SStefano Zampini } 11423425bc38SStefano Zampini 11433425bc38SStefano Zampini #undef __FUNCT__ 11443425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPPCContext" 11453425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPPCContext(PC pc, FETIDPPC_ctx **fetidppc_ctx) 11463425bc38SStefano Zampini { 11473425bc38SStefano Zampini FETIDPPC_ctx *newctx; 11483425bc38SStefano Zampini PetscErrorCode ierr; 11493425bc38SStefano Zampini 11503425bc38SStefano Zampini PetscFunctionBegin; 11513425bc38SStefano Zampini ierr = PetscMalloc(sizeof(*newctx),&newctx);CHKERRQ(ierr); 11523425bc38SStefano Zampini newctx->lambda_local = 0; 11533425bc38SStefano Zampini newctx->B_Ddelta = 0; 11543425bc38SStefano Zampini newctx->l2g_lambda = 0; 11553425bc38SStefano Zampini /* increase the reference count for BDDC preconditioner */ 11563425bc38SStefano Zampini ierr = PetscObjectReference((PetscObject)pc);CHKERRQ(ierr); 11573425bc38SStefano Zampini newctx->pc = pc; 11583425bc38SStefano Zampini *fetidppc_ctx = newctx; 11593425bc38SStefano Zampini PetscFunctionReturn(0); 11603425bc38SStefano Zampini } 11613425bc38SStefano Zampini 11623425bc38SStefano Zampini #undef __FUNCT__ 11633425bc38SStefano Zampini #define __FUNCT__ "PCBDDCDestroyFETIDPMat" 11643425bc38SStefano Zampini static PetscErrorCode PCBDDCDestroyFETIDPMat(Mat A) 11653425bc38SStefano Zampini { 11663425bc38SStefano Zampini FETIDPMat_ctx *mat_ctx; 11673425bc38SStefano Zampini PetscErrorCode ierr; 11683425bc38SStefano Zampini 11693425bc38SStefano Zampini PetscFunctionBegin; 11703425bc38SStefano Zampini ierr = MatShellGetContext(A,(void**)&mat_ctx);CHKERRQ(ierr); 11713425bc38SStefano Zampini ierr = VecDestroy(&mat_ctx->lambda_local);CHKERRQ(ierr); 11723425bc38SStefano Zampini ierr = 
VecDestroy(&mat_ctx->temp_solution_D);CHKERRQ(ierr); 11733425bc38SStefano Zampini ierr = VecDestroy(&mat_ctx->temp_solution_B);CHKERRQ(ierr); 11743425bc38SStefano Zampini ierr = MatDestroy(&mat_ctx->B_delta);CHKERRQ(ierr); 11753425bc38SStefano Zampini ierr = MatDestroy(&mat_ctx->B_Ddelta);CHKERRQ(ierr); 11763425bc38SStefano Zampini ierr = VecScatterDestroy(&mat_ctx->l2g_lambda);CHKERRQ(ierr); 11773425bc38SStefano Zampini ierr = PCDestroy(&mat_ctx->pc);CHKERRQ(ierr); /* actually it does not destroy BDDC, only decrease its reference count */ 11783425bc38SStefano Zampini ierr = PetscFree(mat_ctx);CHKERRQ(ierr); 11793425bc38SStefano Zampini PetscFunctionReturn(0); 11803425bc38SStefano Zampini } 11813425bc38SStefano Zampini 11823425bc38SStefano Zampini #undef __FUNCT__ 11833425bc38SStefano Zampini #define __FUNCT__ "PCBDDCDestroyFETIDPPC" 11843425bc38SStefano Zampini static PetscErrorCode PCBDDCDestroyFETIDPPC(PC pc) 11853425bc38SStefano Zampini { 11863425bc38SStefano Zampini FETIDPPC_ctx *pc_ctx; 11873425bc38SStefano Zampini PetscErrorCode ierr; 11883425bc38SStefano Zampini 11893425bc38SStefano Zampini PetscFunctionBegin; 11903425bc38SStefano Zampini ierr = PCShellGetContext(pc,(void**)&pc_ctx);CHKERRQ(ierr); 11913425bc38SStefano Zampini ierr = VecDestroy(&pc_ctx->lambda_local);CHKERRQ(ierr); 11923425bc38SStefano Zampini ierr = MatDestroy(&pc_ctx->B_Ddelta);CHKERRQ(ierr); 11933425bc38SStefano Zampini ierr = VecScatterDestroy(&pc_ctx->l2g_lambda);CHKERRQ(ierr); 11943425bc38SStefano Zampini ierr = PCDestroy(&pc_ctx->pc);CHKERRQ(ierr); /* actually it does not destroy BDDC, only decrease its reference count */ 11953425bc38SStefano Zampini ierr = PetscFree(pc_ctx);CHKERRQ(ierr); 11963425bc38SStefano Zampini PetscFunctionReturn(0); 11973425bc38SStefano Zampini } 11983425bc38SStefano Zampini 11993425bc38SStefano Zampini #undef __FUNCT__ 12003425bc38SStefano Zampini #define __FUNCT__ "PCBDDCSetupFETIDPMatContext" 12013425bc38SStefano Zampini static PetscErrorCode 
PCBDDCSetupFETIDPMatContext(FETIDPMat_ctx *fetidpmat_ctx ) 12023425bc38SStefano Zampini { 12033425bc38SStefano Zampini PetscErrorCode ierr; 12043425bc38SStefano Zampini PC_IS *pcis=(PC_IS*)fetidpmat_ctx->pc->data; 12053425bc38SStefano Zampini PC_BDDC *pcbddc=(PC_BDDC*)fetidpmat_ctx->pc->data; 12063425bc38SStefano Zampini PCBDDCGraph mat_graph=pcbddc->mat_graph; 12073425bc38SStefano Zampini Mat_IS *matis = (Mat_IS*)fetidpmat_ctx->pc->pmat->data; 12083425bc38SStefano Zampini MPI_Comm comm = ((PetscObject)(fetidpmat_ctx->pc))->comm; 12093425bc38SStefano Zampini 12103425bc38SStefano Zampini Mat ScalingMat; 12113425bc38SStefano Zampini Vec lambda_global; 12123425bc38SStefano Zampini IS IS_l2g_lambda; 12133425bc38SStefano Zampini 12143425bc38SStefano Zampini PetscBool skip_node,fully_redundant; 12153425bc38SStefano Zampini PetscInt i,j,k,s,n_boundary_dofs,sum_dof_sizes,n_global_lambda,n_vertices; 12163425bc38SStefano Zampini PetscInt n_local_lambda,n_lambda_for_dof,dual_size,n_neg_values,n_pos_values; 12173425bc38SStefano Zampini PetscMPIInt rank,nprocs,partial_sum; 12183425bc38SStefano Zampini PetscScalar scalar_value; 12193425bc38SStefano Zampini 12203425bc38SStefano Zampini PetscInt *vertex_indices,*temp_indices; 12213425bc38SStefano Zampini PetscInt *dual_dofs_boundary_indices,*aux_local_numbering_1,*aux_global_numbering; 12223425bc38SStefano Zampini PetscInt *aux_sums,*cols_B_delta,*l2g_indices; 12233425bc38SStefano Zampini PetscMPIInt *aux_local_numbering_2,*aux_global_numbering_mpi,*dof_sizes,*dof_displs; 12243425bc38SStefano Zampini PetscMPIInt *all_aux_global_numbering_mpi_1,*all_aux_global_numbering_mpi_2,*global_dofs_numbering; 12253425bc38SStefano Zampini PetscScalar *array,*scaling_factors,*vals_B_delta; 12263425bc38SStefano Zampini 12273425bc38SStefano Zampini /* For communication of scaling factors */ 12283425bc38SStefano Zampini PetscInt *ptrs_buffer,neigh_position; 12293425bc38SStefano Zampini PetscScalar **all_factors,*send_buffer,*recv_buffer; 
12303425bc38SStefano Zampini MPI_Request *send_reqs,*recv_reqs; 12313425bc38SStefano Zampini 12323425bc38SStefano Zampini /* tests */ 12333425bc38SStefano Zampini Vec test_vec; 12343425bc38SStefano Zampini PetscBool test_fetidp; 12353425bc38SStefano Zampini PetscViewer viewer; 12363425bc38SStefano Zampini 12373425bc38SStefano Zampini PetscFunctionBegin; 12383425bc38SStefano Zampini ierr = MPI_Comm_rank(comm,&rank);CHKERRQ(ierr); 12393425bc38SStefano Zampini ierr = MPI_Comm_size(comm,&nprocs);CHKERRQ(ierr); 12403425bc38SStefano Zampini 12413425bc38SStefano Zampini /* Default type of lagrange multipliers is non-redundant */ 12423425bc38SStefano Zampini fully_redundant = PETSC_FALSE; 12433425bc38SStefano Zampini ierr = PetscOptionsGetBool(PETSC_NULL,"-fetidp_fullyredundant",&fully_redundant,PETSC_NULL);CHKERRQ(ierr); 12443425bc38SStefano Zampini 12453425bc38SStefano Zampini /* Evaluate local and global number of lagrange multipliers */ 12463425bc38SStefano Zampini ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr); 12473425bc38SStefano Zampini n_local_lambda = 0; 12483425bc38SStefano Zampini partial_sum = 0; 12493425bc38SStefano Zampini n_boundary_dofs = 0; 12503425bc38SStefano Zampini s = 0; 12513425bc38SStefano Zampini n_vertices = 0; 12523425bc38SStefano Zampini /* Get Vertices used to define the BDDC */ 12533425bc38SStefano Zampini ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(*vertex_indices),&vertex_indices);CHKERRQ(ierr); 12543425bc38SStefano Zampini for(i=0;i<pcbddc->local_primal_size;i++) { 12553425bc38SStefano Zampini ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&j,(const PetscInt**)&temp_indices,PETSC_NULL);CHKERRQ(ierr); 12563425bc38SStefano Zampini if(j == 1) { 12573425bc38SStefano Zampini vertex_indices[n_vertices]=temp_indices[0]; 12583425bc38SStefano Zampini n_vertices++; 12593425bc38SStefano Zampini } 12603425bc38SStefano Zampini ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&j,(const PetscInt**)&temp_indices,PETSC_NULL);CHKERRQ(ierr); 
12613425bc38SStefano Zampini } 12623425bc38SStefano Zampini dual_size = pcis->n_B-n_vertices; 12633425bc38SStefano Zampini ierr = PetscMalloc(dual_size*sizeof(*dual_dofs_boundary_indices),&dual_dofs_boundary_indices);CHKERRQ(ierr); 12643425bc38SStefano Zampini ierr = PetscMalloc(dual_size*sizeof(*aux_local_numbering_1),&aux_local_numbering_1);CHKERRQ(ierr); 12653425bc38SStefano Zampini ierr = PetscMalloc(dual_size*sizeof(*aux_local_numbering_2),&aux_local_numbering_2);CHKERRQ(ierr); 12663425bc38SStefano Zampini 12673425bc38SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 12683425bc38SStefano Zampini for(i=0;i<pcis->n;i++){ 12693425bc38SStefano Zampini j = mat_graph->count[i]; /* RECALL: mat_graph->count[i] does not count myself */ 1270c6582918SStefano Zampini k = 0; 1271c6582918SStefano Zampini if(j > 0) { 12723425bc38SStefano Zampini k = (mat_graph->neighbours_set[i][0] == -1 ? 1 : 0); 1273c6582918SStefano Zampini } 12743425bc38SStefano Zampini j = j - k ; 12753425bc38SStefano Zampini if( j > 0 ) { n_boundary_dofs++; } 12763425bc38SStefano Zampini 12773425bc38SStefano Zampini skip_node = PETSC_FALSE; 1278c6582918SStefano Zampini if( s < n_vertices && vertex_indices[s]==i) { /* it works for a sorted set of vertices */ 12793425bc38SStefano Zampini skip_node = PETSC_TRUE; 12803425bc38SStefano Zampini s++; 12813425bc38SStefano Zampini } 12823425bc38SStefano Zampini if(j < 1) {skip_node = PETSC_TRUE;} 12833425bc38SStefano Zampini if( !skip_node ) { 12843425bc38SStefano Zampini if(fully_redundant) { 12853425bc38SStefano Zampini /* fully redundant set of lagrange multipliers */ 12863425bc38SStefano Zampini n_lambda_for_dof = (j*(j+1))/2; 12873425bc38SStefano Zampini } else { 12883425bc38SStefano Zampini n_lambda_for_dof = j; 12893425bc38SStefano Zampini } 12903425bc38SStefano Zampini n_local_lambda += j; 12913425bc38SStefano Zampini /* needed to evaluate global number of lagrange multipliers */ 12923425bc38SStefano Zampini 
array[i]=(1.0*n_lambda_for_dof)/(j+1.0); /* already scaled for the next global sum */ 12933425bc38SStefano Zampini /* store some data needed */ 12943425bc38SStefano Zampini dual_dofs_boundary_indices[partial_sum] = n_boundary_dofs-1; 12953425bc38SStefano Zampini aux_local_numbering_1[partial_sum] = i; 12963425bc38SStefano Zampini aux_local_numbering_2[partial_sum] = (PetscMPIInt)n_lambda_for_dof; 12973425bc38SStefano Zampini partial_sum++; 12983425bc38SStefano Zampini } 12993425bc38SStefano Zampini } 13003425bc38SStefano Zampini /*printf("I found %d local lambda dofs\n",n_local_lambda); 13013425bc38SStefano Zampini printf("I found %d boundary dofs (should be %d)\n",n_boundary_dofs,pcis->n_B); 13023425bc38SStefano Zampini printf("Partial sum %d should be %d\n",partial_sum,dual_size);*/ 13033425bc38SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 13043425bc38SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 13053425bc38SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 13063425bc38SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 13073425bc38SStefano Zampini ierr = VecSum(pcis->vec1_global,&scalar_value);CHKERRQ(ierr); 13083425bc38SStefano Zampini fetidpmat_ctx->n_lambda = (PetscInt) scalar_value; 13093425bc38SStefano Zampini /* printf("I found %d global multipliers (%f)\n",fetidpmat_ctx->n_lambda,scalar_value); */ 13103425bc38SStefano Zampini ierr = VecCreate(PETSC_COMM_SELF,&fetidpmat_ctx->lambda_local);CHKERRQ(ierr); 13113425bc38SStefano Zampini ierr = VecSetSizes(fetidpmat_ctx->lambda_local,n_local_lambda,n_local_lambda);CHKERRQ(ierr); 13123425bc38SStefano Zampini ierr = VecSetType(fetidpmat_ctx->lambda_local,VECSEQ);CHKERRQ(ierr); 13133425bc38SStefano Zampini ierr = VecCreate(comm,&lambda_global);CHKERRQ(ierr); 13143425bc38SStefano Zampini ierr = 
VecSetSizes(lambda_global,PETSC_DECIDE,fetidpmat_ctx->n_lambda);CHKERRQ(ierr); 13153425bc38SStefano Zampini ierr = VecSetType(lambda_global,VECMPI);CHKERRQ(ierr); 13163425bc38SStefano Zampini 13173425bc38SStefano Zampini /* compute global ordering of lagrange multipliers and associate l2g map */ 13183425bc38SStefano Zampini 13193425bc38SStefano Zampini ierr = PetscMalloc(dual_size*sizeof(*aux_global_numbering),&aux_global_numbering);CHKERRQ(ierr); 13203425bc38SStefano Zampini ierr = PetscMalloc(dual_size*sizeof(*aux_global_numbering_mpi),&aux_global_numbering_mpi);CHKERRQ(ierr); 13213425bc38SStefano Zampini j = (rank == 0 ? nprocs : 0); 13223425bc38SStefano Zampini ierr = PetscMalloc(j*sizeof(*dof_sizes),&dof_sizes);CHKERRQ(ierr); 13233425bc38SStefano Zampini ierr = PetscMalloc(j*sizeof(*dof_displs),&dof_displs);CHKERRQ(ierr); 13243425bc38SStefano Zampini ierr = ISLocalToGlobalMappingApply(matis->mapping,dual_size,aux_local_numbering_1,aux_global_numbering);CHKERRQ(ierr); 13253425bc38SStefano Zampini ierr = MPI_Gather(&dual_size,1,MPIU_INT,dof_sizes,1,MPIU_INT,0,comm);CHKERRQ(ierr); 13263425bc38SStefano Zampini sum_dof_sizes=0; 13273425bc38SStefano Zampini if ( rank == 0 ) { 13283425bc38SStefano Zampini dof_displs[0]=0; 13293425bc38SStefano Zampini sum_dof_sizes=dual_size; 13303425bc38SStefano Zampini for(i=1;i<nprocs;i++) { 13313425bc38SStefano Zampini dof_displs[i] = dof_displs[i-1]+dof_sizes[i-1]; 13323425bc38SStefano Zampini sum_dof_sizes += dof_sizes[i]; 13333425bc38SStefano Zampini } 13343425bc38SStefano Zampini } 13353425bc38SStefano Zampini for(i=0;i<dual_size;i++) { 13363425bc38SStefano Zampini aux_global_numbering_mpi[i]=(PetscMPIInt)aux_global_numbering[i]; 13373425bc38SStefano Zampini } 13383425bc38SStefano Zampini ierr = PetscMalloc(sum_dof_sizes*sizeof(*all_aux_global_numbering_mpi_1),&all_aux_global_numbering_mpi_1);CHKERRQ(ierr); 13393425bc38SStefano Zampini ierr = 
PetscMalloc(sum_dof_sizes*sizeof(*all_aux_global_numbering_mpi_2),&all_aux_global_numbering_mpi_2);CHKERRQ(ierr); 13403425bc38SStefano Zampini ierr = MPI_Gatherv(aux_global_numbering_mpi,dual_size,MPIU_INT,all_aux_global_numbering_mpi_1,dof_sizes,dof_displs,MPIU_INT,0,comm);CHKERRQ(ierr); 13413425bc38SStefano Zampini ierr = MPI_Gatherv(aux_local_numbering_2,dual_size,MPIU_INT,all_aux_global_numbering_mpi_2,dof_sizes,dof_displs,MPIU_INT,0,comm);CHKERRQ(ierr); 13423425bc38SStefano Zampini 13433425bc38SStefano Zampini ierr = PetscMalloc(fetidpmat_ctx->n_lambda*sizeof(*global_dofs_numbering),&global_dofs_numbering);CHKERRQ(ierr); 13443425bc38SStefano Zampini if( rank == 0 ) { 13453425bc38SStefano Zampini ierr = PetscSortMPIIntWithArray(sum_dof_sizes,all_aux_global_numbering_mpi_1,all_aux_global_numbering_mpi_2);CHKERRQ(ierr); 13463425bc38SStefano Zampini j=-1; 13473425bc38SStefano Zampini partial_sum = 0; 13483425bc38SStefano Zampini for(i=0;i<sum_dof_sizes;i++) { 13493425bc38SStefano Zampini if(j != all_aux_global_numbering_mpi_1[i] ) { 13503425bc38SStefano Zampini j=all_aux_global_numbering_mpi_1[i]; 13513425bc38SStefano Zampini for(k=0;k<all_aux_global_numbering_mpi_2[i];k++) { 13523425bc38SStefano Zampini global_dofs_numbering[partial_sum+k]=all_aux_global_numbering_mpi_1[i]; 13533425bc38SStefano Zampini } 13543425bc38SStefano Zampini partial_sum += all_aux_global_numbering_mpi_2[i]; 13553425bc38SStefano Zampini } 13563425bc38SStefano Zampini } 13573425bc38SStefano Zampini /* printf("Partial sum for global dofs %d should be %d\n",partial_sum,fetidpmat_ctx->n_lambda); */ 13583425bc38SStefano Zampini } 13593425bc38SStefano Zampini ierr = MPI_Bcast(global_dofs_numbering,fetidpmat_ctx->n_lambda,MPIU_INT,0,comm);CHKERRQ(ierr); 13603425bc38SStefano Zampini 13613425bc38SStefano Zampini /* init data for scaling factors exchange */ 13623425bc38SStefano Zampini partial_sum = 0; 13633425bc38SStefano Zampini j = 0; 13643425bc38SStefano Zampini ierr = PetscMalloc( 
pcis->n_neigh*sizeof(PetscInt),&ptrs_buffer);CHKERRQ(ierr); 13653425bc38SStefano Zampini ierr = PetscMalloc( (pcis->n_neigh-1)*sizeof(MPI_Request),&send_reqs);CHKERRQ(ierr); 13663425bc38SStefano Zampini ierr = PetscMalloc( (pcis->n_neigh-1)*sizeof(MPI_Request),&recv_reqs);CHKERRQ(ierr); 13673425bc38SStefano Zampini ierr = PetscMalloc( pcis->n*sizeof(PetscScalar*),&all_factors);CHKERRQ(ierr); 13683425bc38SStefano Zampini ptrs_buffer[0]=0; 13693425bc38SStefano Zampini for(i=1;i<pcis->n_neigh;i++) { 13703425bc38SStefano Zampini partial_sum += pcis->n_shared[i]; 13713425bc38SStefano Zampini ptrs_buffer[i] = ptrs_buffer[i-1]+pcis->n_shared[i]; 13723425bc38SStefano Zampini } 13733425bc38SStefano Zampini ierr = PetscMalloc( partial_sum*sizeof(PetscScalar),&send_buffer);CHKERRQ(ierr); 13743425bc38SStefano Zampini ierr = PetscMalloc( partial_sum*sizeof(PetscScalar),&recv_buffer);CHKERRQ(ierr); 13753425bc38SStefano Zampini ierr = PetscMalloc( partial_sum*sizeof(PetscScalar),&all_factors[0]);CHKERRQ(ierr); 13763425bc38SStefano Zampini for(i=0;i<pcis->n-1;i++) { 13773425bc38SStefano Zampini j = mat_graph->count[i]; 13783425bc38SStefano Zampini if(j>0) { 13793425bc38SStefano Zampini k = (mat_graph->neighbours_set[i][0] == -1 ? 
1 : 0); 13803425bc38SStefano Zampini j = j - k; 13813425bc38SStefano Zampini } 13823425bc38SStefano Zampini all_factors[i+1]=all_factors[i]+j; 13833425bc38SStefano Zampini } 13843425bc38SStefano Zampini /* scatter B scaling to N vec */ 13853425bc38SStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->D,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 13863425bc38SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->D,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 13873425bc38SStefano Zampini /* communications */ 13883425bc38SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 13893425bc38SStefano Zampini for(i=1;i<pcis->n_neigh;i++) { 13903425bc38SStefano Zampini for(j=0;j<pcis->n_shared[i];j++) { 13913425bc38SStefano Zampini send_buffer[ptrs_buffer[i-1]+j]=array[pcis->shared[i][j]]; 13923425bc38SStefano Zampini } 13933425bc38SStefano Zampini j = ptrs_buffer[i]-ptrs_buffer[i-1]; 1394*ea7e1babSStefano Zampini ierr = MPI_Isend(&send_buffer[ptrs_buffer[i-1]],j,MPIU_SCALAR,pcis->neigh[i],0,comm,&send_reqs[i-1]);CHKERRQ(ierr); 1395*ea7e1babSStefano Zampini ierr = MPI_Irecv(&recv_buffer[ptrs_buffer[i-1]],j,MPIU_SCALAR,pcis->neigh[i],0,comm,&recv_reqs[i-1]);CHKERRQ(ierr); 13963425bc38SStefano Zampini } 13973425bc38SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 1398*ea7e1babSStefano Zampini ierr = MPI_Waitall((pcis->n_neigh-1),recv_reqs,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 13993425bc38SStefano Zampini /* put values in correct places */ 14003425bc38SStefano Zampini for(i=1;i<pcis->n_neigh;i++) { 14013425bc38SStefano Zampini for(j=0;j<pcis->n_shared[i];j++) { 14023425bc38SStefano Zampini k = pcis->shared[i][j]; 14033425bc38SStefano Zampini neigh_position = 0; 14043425bc38SStefano Zampini while(mat_graph->neighbours_set[k][neigh_position] != pcis->neigh[i]) {neigh_position++;} 14053425bc38SStefano Zampini s = (mat_graph->neighbours_set[k][0] == -1 ? 
1 : 0); 14063425bc38SStefano Zampini neigh_position = neigh_position - s; 14073425bc38SStefano Zampini all_factors[k][neigh_position]=recv_buffer[ptrs_buffer[i-1]+j]; 14083425bc38SStefano Zampini } 14093425bc38SStefano Zampini } 1410*ea7e1babSStefano Zampini ierr = MPI_Waitall((pcis->n_neigh-1),send_reqs,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 14113425bc38SStefano Zampini ierr = PetscFree(send_reqs);CHKERRQ(ierr); 14123425bc38SStefano Zampini ierr = PetscFree(recv_reqs);CHKERRQ(ierr); 14133425bc38SStefano Zampini ierr = PetscFree(send_buffer);CHKERRQ(ierr); 14143425bc38SStefano Zampini ierr = PetscFree(recv_buffer);CHKERRQ(ierr); 14153425bc38SStefano Zampini ierr = PetscFree(ptrs_buffer);CHKERRQ(ierr); 14163425bc38SStefano Zampini 14173425bc38SStefano Zampini /* Compute B and B_delta (local actions) */ 14183425bc38SStefano Zampini ierr = PetscMalloc(pcis->n_neigh*sizeof(*aux_sums),&aux_sums);CHKERRQ(ierr); 14193425bc38SStefano Zampini ierr = PetscMalloc(n_local_lambda*sizeof(*l2g_indices),&l2g_indices);CHKERRQ(ierr); 14203425bc38SStefano Zampini ierr = PetscMalloc(n_local_lambda*sizeof(*vals_B_delta),&vals_B_delta);CHKERRQ(ierr); 14213425bc38SStefano Zampini ierr = PetscMalloc(n_local_lambda*sizeof(*cols_B_delta),&cols_B_delta);CHKERRQ(ierr); 14223425bc38SStefano Zampini ierr = PetscMalloc(n_local_lambda*sizeof(*scaling_factors),&scaling_factors);CHKERRQ(ierr); 14233425bc38SStefano Zampini n_global_lambda=0; 14243425bc38SStefano Zampini partial_sum=0; 14253425bc38SStefano Zampini for(i=0;i<dual_size;i++) { 14263425bc38SStefano Zampini while( global_dofs_numbering[n_global_lambda] != aux_global_numbering_mpi[i] ) { n_global_lambda++; } 14273425bc38SStefano Zampini j = mat_graph->count[aux_local_numbering_1[i]]; 14283425bc38SStefano Zampini k = (mat_graph->neighbours_set[aux_local_numbering_1[i]][0] == -1 ? 
1 : 0); 14293425bc38SStefano Zampini j = j - k; 14303425bc38SStefano Zampini aux_sums[0]=0; 14313425bc38SStefano Zampini for(s=1;s<j;s++) { 14323425bc38SStefano Zampini aux_sums[s]=aux_sums[s-1]+j-s+1; 14333425bc38SStefano Zampini } 14343425bc38SStefano Zampini array = all_factors[aux_local_numbering_1[i]]; 14353425bc38SStefano Zampini n_neg_values = 0; 14363425bc38SStefano Zampini while(n_neg_values < j && mat_graph->neighbours_set[aux_local_numbering_1[i]][n_neg_values+k] < rank) {n_neg_values++;} 14373425bc38SStefano Zampini n_pos_values = j - n_neg_values; 14383425bc38SStefano Zampini if(fully_redundant) { 14393425bc38SStefano Zampini for(s=0;s<n_neg_values;s++) { 14403425bc38SStefano Zampini l2g_indices [partial_sum+s]=aux_sums[s]+n_neg_values-s-1+n_global_lambda; 14413425bc38SStefano Zampini cols_B_delta [partial_sum+s]=dual_dofs_boundary_indices[i]; 14423425bc38SStefano Zampini vals_B_delta [partial_sum+s]=-1.0; 14433425bc38SStefano Zampini scaling_factors[partial_sum+s]=array[s]; 14443425bc38SStefano Zampini } 14453425bc38SStefano Zampini for(s=0;s<n_pos_values;s++) { 14463425bc38SStefano Zampini l2g_indices [partial_sum+s+n_neg_values]=aux_sums[n_neg_values]+s+n_global_lambda; 14473425bc38SStefano Zampini cols_B_delta [partial_sum+s+n_neg_values]=dual_dofs_boundary_indices[i]; 14483425bc38SStefano Zampini vals_B_delta [partial_sum+s+n_neg_values]=1.0; 14493425bc38SStefano Zampini scaling_factors[partial_sum+s+n_neg_values]=array[s+n_neg_values]; 14503425bc38SStefano Zampini } 14513425bc38SStefano Zampini partial_sum += j; 14523425bc38SStefano Zampini } else { 14533425bc38SStefano Zampini /* l2g_indices and default cols and vals of B_delta */ 14543425bc38SStefano Zampini for(s=0;s<j;s++) { 14553425bc38SStefano Zampini l2g_indices [partial_sum+s]=n_global_lambda+s; 14563425bc38SStefano Zampini cols_B_delta [partial_sum+s]=dual_dofs_boundary_indices[i]; 14573425bc38SStefano Zampini vals_B_delta [partial_sum+s]=0.0; 14583425bc38SStefano Zampini } 
14593425bc38SStefano Zampini /* B_delta */ 14603425bc38SStefano Zampini if( n_neg_values > 0 ) { /* there's a rank next to me to the left */ 14613425bc38SStefano Zampini vals_B_delta [partial_sum+n_neg_values-1]=-1.0; 14623425bc38SStefano Zampini } 14633425bc38SStefano Zampini if ( n_neg_values < j ) { /* there's a rank next to me to the right */ 14643425bc38SStefano Zampini vals_B_delta [partial_sum+n_neg_values]=1.0; 14653425bc38SStefano Zampini } 14663425bc38SStefano Zampini /* scaling as in Klawonn-Widlund 1999*/ 14673425bc38SStefano Zampini for(s=0;s<n_neg_values;s++) { 14683425bc38SStefano Zampini scalar_value = 0.0; 14693425bc38SStefano Zampini for(k=0;k<s+1;k++) { 14703425bc38SStefano Zampini scalar_value += array[k]; 14713425bc38SStefano Zampini } 14723425bc38SStefano Zampini scalar_value = -scalar_value; 14733425bc38SStefano Zampini scaling_factors[partial_sum+s] = scalar_value; 14743425bc38SStefano Zampini } 14753425bc38SStefano Zampini for(s=0;s<n_pos_values;s++) { 14763425bc38SStefano Zampini scalar_value = 0.0; 14773425bc38SStefano Zampini for(k=s+n_neg_values;k<j;k++) { 14783425bc38SStefano Zampini scalar_value += array[k]; 14793425bc38SStefano Zampini } 14803425bc38SStefano Zampini scaling_factors[partial_sum+s+n_neg_values] = scalar_value; 14813425bc38SStefano Zampini } 14823425bc38SStefano Zampini partial_sum += j; 14833425bc38SStefano Zampini } 14843425bc38SStefano Zampini } 14853425bc38SStefano Zampini ierr = PetscFree(all_factors[0]);CHKERRQ(ierr); 14863425bc38SStefano Zampini ierr = PetscFree(all_factors);CHKERRQ(ierr); 14873425bc38SStefano Zampini /* printf("I found %d local lambda dofs when numbering them (should be %d)\n",partial_sum,n_local_lambda); */ 14883425bc38SStefano Zampini ierr = ISCreateGeneral(comm,n_local_lambda,l2g_indices,PETSC_OWN_POINTER,&IS_l2g_lambda);CHKERRQ(ierr); 14893425bc38SStefano Zampini ierr = VecScatterCreate(fetidpmat_ctx->lambda_local,(IS)0,lambda_global,IS_l2g_lambda,&fetidpmat_ctx->l2g_lambda);CHKERRQ(ierr); 
14903425bc38SStefano Zampini 14913425bc38SStefano Zampini /* Create local part of B_delta */ 14923425bc38SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&fetidpmat_ctx->B_delta); 14933425bc38SStefano Zampini ierr = MatSetSizes(fetidpmat_ctx->B_delta,n_local_lambda,pcis->n_B,n_local_lambda,pcis->n_B);CHKERRQ(ierr); 14943425bc38SStefano Zampini ierr = MatSetType(fetidpmat_ctx->B_delta,MATSEQAIJ);CHKERRQ(ierr); 14953425bc38SStefano Zampini ierr = MatSeqAIJSetPreallocation(fetidpmat_ctx->B_delta,1,PETSC_NULL);CHKERRQ(ierr); 14963425bc38SStefano Zampini ierr = MatSetOption(fetidpmat_ctx->B_delta,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr); 14973425bc38SStefano Zampini for(i=0;i<n_local_lambda;i++) { 14983425bc38SStefano Zampini ierr = MatSetValue(fetidpmat_ctx->B_delta,i,cols_B_delta[i],vals_B_delta[i],INSERT_VALUES);CHKERRQ(ierr); 14993425bc38SStefano Zampini } 15003425bc38SStefano Zampini ierr = MatAssemblyBegin(fetidpmat_ctx->B_delta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 15013425bc38SStefano Zampini ierr = MatAssemblyEnd (fetidpmat_ctx->B_delta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 15023425bc38SStefano Zampini 15033425bc38SStefano Zampini if(fully_redundant) { 15043425bc38SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&ScalingMat); 15053425bc38SStefano Zampini ierr = MatSetSizes(ScalingMat,n_local_lambda,n_local_lambda,n_local_lambda,n_local_lambda);CHKERRQ(ierr); 15063425bc38SStefano Zampini ierr = MatSetType(ScalingMat,MATSEQAIJ);CHKERRQ(ierr); 15073425bc38SStefano Zampini ierr = MatSeqAIJSetPreallocation(ScalingMat,1,PETSC_NULL);CHKERRQ(ierr); 15083425bc38SStefano Zampini for(i=0;i<n_local_lambda;i++) { 15093425bc38SStefano Zampini ierr = MatSetValue(ScalingMat,i,i,scaling_factors[i],INSERT_VALUES);CHKERRQ(ierr); 15103425bc38SStefano Zampini } 15113425bc38SStefano Zampini ierr = MatAssemblyBegin(ScalingMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 15123425bc38SStefano Zampini ierr = MatAssemblyEnd (ScalingMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 15133425bc38SStefano 
Zampini ierr = MatMatMult(ScalingMat,fetidpmat_ctx->B_delta,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&fetidpmat_ctx->B_Ddelta);CHKERRQ(ierr); 15143425bc38SStefano Zampini ierr = MatDestroy(&ScalingMat);CHKERRQ(ierr); 15153425bc38SStefano Zampini } else { 15163425bc38SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&fetidpmat_ctx->B_Ddelta); 15173425bc38SStefano Zampini ierr = MatSetSizes(fetidpmat_ctx->B_Ddelta,n_local_lambda,pcis->n_B,n_local_lambda,pcis->n_B);CHKERRQ(ierr); 15183425bc38SStefano Zampini ierr = MatSetType(fetidpmat_ctx->B_Ddelta,MATSEQAIJ);CHKERRQ(ierr); 15193425bc38SStefano Zampini ierr = MatSeqAIJSetPreallocation(fetidpmat_ctx->B_Ddelta,1,PETSC_NULL);CHKERRQ(ierr); 15203425bc38SStefano Zampini for(i=0;i<n_local_lambda;i++) { 15213425bc38SStefano Zampini ierr = MatSetValue(fetidpmat_ctx->B_Ddelta,i,cols_B_delta[i],scaling_factors[i],INSERT_VALUES);CHKERRQ(ierr); 15223425bc38SStefano Zampini } 15233425bc38SStefano Zampini ierr = MatAssemblyBegin(fetidpmat_ctx->B_Ddelta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 15243425bc38SStefano Zampini ierr = MatAssemblyEnd (fetidpmat_ctx->B_Ddelta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 15253425bc38SStefano Zampini } 15263425bc38SStefano Zampini 15273425bc38SStefano Zampini /* Create some vectors needed by fetidp */ 15283425bc38SStefano Zampini ierr = VecDuplicate(pcis->vec1_B,&fetidpmat_ctx->temp_solution_B);CHKERRQ(ierr); 15293425bc38SStefano Zampini ierr = VecDuplicate(pcis->vec1_D,&fetidpmat_ctx->temp_solution_D);CHKERRQ(ierr); 15303425bc38SStefano Zampini 15313425bc38SStefano Zampini test_fetidp = PETSC_FALSE; 15323425bc38SStefano Zampini ierr = PetscOptionsGetBool(PETSC_NULL,"-fetidp_check",&test_fetidp,PETSC_NULL);CHKERRQ(ierr); 15333425bc38SStefano Zampini 15343425bc38SStefano Zampini if(test_fetidp) { 15353425bc38SStefano Zampini 15363425bc38SStefano Zampini ierr = PetscViewerASCIIGetStdout(((PetscObject)(fetidpmat_ctx->pc))->comm,&viewer);CHKERRQ(ierr); 15373425bc38SStefano Zampini ierr = 
PetscViewerASCIISynchronizedAllow(viewer,PETSC_TRUE);CHKERRQ(ierr); 15383425bc38SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"----------FETI_DP TESTS--------------\n");CHKERRQ(ierr); 15393425bc38SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"All tests should return zero!\n");CHKERRQ(ierr); 15403425bc38SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"FETIDP MAT context in the ");CHKERRQ(ierr); 15413425bc38SStefano Zampini if(fully_redundant) { 15423425bc38SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"fully redundant case for lagrange multipliers.\n");CHKERRQ(ierr); 15433425bc38SStefano Zampini } else { 15443425bc38SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Non-fully redundant case for lagrange multiplier.\n");CHKERRQ(ierr); 15453425bc38SStefano Zampini } 15463425bc38SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 15473425bc38SStefano Zampini 15483425bc38SStefano Zampini /******************************************************************/ 15493425bc38SStefano Zampini /* TEST A/B: Test numbering of global lambda dofs */ 15503425bc38SStefano Zampini /******************************************************************/ 15513425bc38SStefano Zampini 15523425bc38SStefano Zampini ierr = VecDuplicate(fetidpmat_ctx->lambda_local,&test_vec);CHKERRQ(ierr); 15533425bc38SStefano Zampini ierr = VecSet(lambda_global,1.0);CHKERRQ(ierr); 15543425bc38SStefano Zampini ierr = VecSet(test_vec,1.0);CHKERRQ(ierr); 15553425bc38SStefano Zampini ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 15563425bc38SStefano Zampini ierr = VecScatterEnd (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 15573425bc38SStefano Zampini scalar_value = -1.0; 15583425bc38SStefano Zampini ierr = VecAXPY(test_vec,scalar_value,fetidpmat_ctx->lambda_local);CHKERRQ(ierr); 15593425bc38SStefano Zampini ierr = 
VecNorm(test_vec,NORM_INFINITY,&scalar_value);CHKERRQ(ierr); 15603425bc38SStefano Zampini ierr = VecDestroy(&test_vec);CHKERRQ(ierr); 15613425bc38SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"A[%04d]: CHECK glob to loc: % 1.14e\n",rank,scalar_value);CHKERRQ(ierr); 15623425bc38SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 15633425bc38SStefano Zampini if(fully_redundant) { 15643425bc38SStefano Zampini ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr); 15653425bc38SStefano Zampini ierr = VecSet(fetidpmat_ctx->lambda_local,0.5);CHKERRQ(ierr); 15663425bc38SStefano Zampini ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 15673425bc38SStefano Zampini ierr = VecScatterEnd (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 15683425bc38SStefano Zampini ierr = VecSum(lambda_global,&scalar_value);CHKERRQ(ierr); 15693425bc38SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"B[%04d]: CHECK loc to glob: % 1.14e\n",rank,scalar_value-fetidpmat_ctx->n_lambda);CHKERRQ(ierr); 15703425bc38SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 15713425bc38SStefano Zampini } 15723425bc38SStefano Zampini 15733425bc38SStefano Zampini /******************************************************************/ 15743425bc38SStefano Zampini /* TEST C: It should holds B_delta*w=0, w\in\widehat{W} */ 15753425bc38SStefano Zampini /* This is the meaning of the B matrix */ 15763425bc38SStefano Zampini /******************************************************************/ 15773425bc38SStefano Zampini 15783425bc38SStefano Zampini ierr = VecSetRandom(pcis->vec1_N,PETSC_NULL);CHKERRQ(ierr); 15793425bc38SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 15803425bc38SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 
15813425bc38SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 15823425bc38SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 15833425bc38SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 15843425bc38SStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 15853425bc38SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 15863425bc38SStefano Zampini /* Action of B_delta */ 15873425bc38SStefano Zampini ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr); 15883425bc38SStefano Zampini ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr); 15893425bc38SStefano Zampini ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 15903425bc38SStefano Zampini ierr = VecScatterEnd (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 15913425bc38SStefano Zampini ierr = VecNorm(lambda_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr); 15923425bc38SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"C[coll]: CHECK infty norm of B_delta*w (w continuous): % 1.14e\n",scalar_value);CHKERRQ(ierr); 15933425bc38SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 15943425bc38SStefano Zampini 15953425bc38SStefano Zampini /******************************************************************/ 15963425bc38SStefano Zampini /* TEST D: It should holds E_Dw = w - P_Dw w\in\widetilde{W} */ 15973425bc38SStefano Zampini /* E_D = R_D^TR */ 15983425bc38SStefano Zampini /* P_D = B_{D,delta}^T B_{delta} */ 15993425bc38SStefano Zampini /* eq.44 Mandel Tezaur and 
Dohrmann 2005 */ 16003425bc38SStefano Zampini /******************************************************************/ 16013425bc38SStefano Zampini 16023425bc38SStefano Zampini /* compute a random vector in \widetilde{W} */ 16033425bc38SStefano Zampini ierr = VecSetRandom(pcis->vec1_N,PETSC_NULL);CHKERRQ(ierr); 16043425bc38SStefano Zampini scalar_value = 0.0; /* set zero at vertices */ 16053425bc38SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 16063425bc38SStefano Zampini for(i=0;i<n_vertices;i++) { array[vertex_indices[i]]=scalar_value; } 16073425bc38SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 16083425bc38SStefano Zampini /* store w for final comparison */ 16093425bc38SStefano Zampini ierr = VecDuplicate(pcis->vec1_B,&test_vec);CHKERRQ(ierr); 16103425bc38SStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,test_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 16113425bc38SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_N,test_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 16123425bc38SStefano Zampini 16133425bc38SStefano Zampini /* Jump operator P_D : results stored in pcis->vec1_B */ 16143425bc38SStefano Zampini 16153425bc38SStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 16163425bc38SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 16173425bc38SStefano Zampini /* Action of B_delta */ 16183425bc38SStefano Zampini ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr); 16193425bc38SStefano Zampini ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr); 16203425bc38SStefano Zampini ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 16213425bc38SStefano Zampini ierr = VecScatterEnd 
(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 16223425bc38SStefano Zampini /* Action of B_Ddelta^T */ 16233425bc38SStefano Zampini ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 16243425bc38SStefano Zampini ierr = VecScatterEnd (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 16253425bc38SStefano Zampini ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr); 16263425bc38SStefano Zampini 16273425bc38SStefano Zampini /* Average operator E_D : results stored in pcis->vec2_B */ 16283425bc38SStefano Zampini 16293425bc38SStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 16303425bc38SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 16313425bc38SStefano Zampini ierr = VecPointwiseMult(pcis->vec2_B,pcis->D,pcis->vec2_B);CHKERRQ(ierr); 16323425bc38SStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec2_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 16333425bc38SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec2_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 16343425bc38SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 16353425bc38SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 16363425bc38SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 16373425bc38SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 16383425bc38SStefano Zampini ierr = VecScatterEnd 
(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 16393425bc38SStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 16403425bc38SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 16413425bc38SStefano Zampini 16423425bc38SStefano Zampini /* test E_D=I-P_D */ 16433425bc38SStefano Zampini scalar_value = 1.0; 16443425bc38SStefano Zampini ierr = VecAXPY(pcis->vec1_B,scalar_value,pcis->vec2_B);CHKERRQ(ierr); 16453425bc38SStefano Zampini scalar_value = -1.0; 16463425bc38SStefano Zampini ierr = VecAXPY(pcis->vec1_B,scalar_value,test_vec);CHKERRQ(ierr); 16473425bc38SStefano Zampini ierr = VecNorm(pcis->vec1_B,NORM_INFINITY,&scalar_value);CHKERRQ(ierr); 16483425bc38SStefano Zampini ierr = VecDestroy(&test_vec);CHKERRQ(ierr); 16493425bc38SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"D[%04d] CHECK infty norm of E_D + P_D - I: % 1.14e\n",rank,scalar_value);CHKERRQ(ierr); 16503425bc38SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 16513425bc38SStefano Zampini 16523425bc38SStefano Zampini /******************************************************************/ 16533425bc38SStefano Zampini /* TEST E: It should holds R_D^TP_Dw=0 w\in\widetilde{W} */ 16543425bc38SStefano Zampini /* eq.48 Mandel Tezaur and Dohrmann 2005 */ 16553425bc38SStefano Zampini /******************************************************************/ 16563425bc38SStefano Zampini 16573425bc38SStefano Zampini ierr = VecSetRandom(pcis->vec1_N,PETSC_NULL);CHKERRQ(ierr); 16583425bc38SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 16593425bc38SStefano Zampini scalar_value = 0.0; /* set zero at vertices */ 16603425bc38SStefano Zampini for(i=0;i<n_vertices;i++) { array[vertex_indices[i]]=scalar_value; } 16613425bc38SStefano Zampini ierr = 
VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 16623425bc38SStefano Zampini 16633425bc38SStefano Zampini /* Jump operator P_D : results stored in pcis->vec1_B */ 16643425bc38SStefano Zampini 16653425bc38SStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 16663425bc38SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 16673425bc38SStefano Zampini /* Action of B_delta */ 16683425bc38SStefano Zampini ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr); 16693425bc38SStefano Zampini ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr); 16703425bc38SStefano Zampini ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 16713425bc38SStefano Zampini ierr = VecScatterEnd (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 16723425bc38SStefano Zampini /* Action of B_Ddelta^T */ 16733425bc38SStefano Zampini ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 16743425bc38SStefano Zampini ierr = VecScatterEnd (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 16753425bc38SStefano Zampini ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr); 16763425bc38SStefano Zampini /* diagonal scaling */ 16773425bc38SStefano Zampini ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr); 16783425bc38SStefano Zampini /* sum on the interface */ 16793425bc38SStefano Zampini ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr); 16803425bc38SStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 
16813425bc38SStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 16823425bc38SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 16833425bc38SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 16843425bc38SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 16853425bc38SStefano Zampini ierr = VecNorm(pcis->vec1_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr); 16863425bc38SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"E[coll]: CHECK infty norm of R^T_D P_D: % 1.14e\n",scalar_value);CHKERRQ(ierr); 16873425bc38SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 16883425bc38SStefano Zampini 16893425bc38SStefano Zampini if(!fully_redundant) { 16903425bc38SStefano Zampini /******************************************************************/ 16913425bc38SStefano Zampini /* TEST F: It should holds B_{delta}B^T_{D,delta}=I */ 16923425bc38SStefano Zampini /* Corollary thm 14 Mandel Tezaur and Dohrmann 2005 */ 16933425bc38SStefano Zampini /******************************************************************/ 16943425bc38SStefano Zampini ierr = VecDuplicate(lambda_global,&test_vec);CHKERRQ(ierr); 16953425bc38SStefano Zampini ierr = VecSetRandom(lambda_global,PETSC_NULL);CHKERRQ(ierr); 16963425bc38SStefano Zampini /* Action of B_Ddelta^T */ 16973425bc38SStefano Zampini ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 16983425bc38SStefano Zampini ierr = VecScatterEnd (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 16993425bc38SStefano Zampini ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr); 17003425bc38SStefano Zampini /* 
Action of B_delta */ 17013425bc38SStefano Zampini ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr); 17023425bc38SStefano Zampini ierr = VecSet(test_vec,0.0);CHKERRQ(ierr); 17033425bc38SStefano Zampini ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,test_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 17043425bc38SStefano Zampini ierr = VecScatterEnd (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,test_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 17053425bc38SStefano Zampini scalar_value = -1.0; 17063425bc38SStefano Zampini ierr = VecAXPY(lambda_global,scalar_value,test_vec);CHKERRQ(ierr); 17073425bc38SStefano Zampini ierr = VecNorm(lambda_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr); 17083425bc38SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"E[coll]: CHECK infty norm of P^T_D - I: % 1.14e\n",scalar_value);CHKERRQ(ierr); 17093425bc38SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 17103425bc38SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 17113425bc38SStefano Zampini ierr = VecDestroy(&test_vec);CHKERRQ(ierr); 17123425bc38SStefano Zampini } 17133425bc38SStefano Zampini } 17143425bc38SStefano Zampini /* final cleanup */ 17153425bc38SStefano Zampini ierr = PetscFree(dual_dofs_boundary_indices);CHKERRQ(ierr); 17163425bc38SStefano Zampini ierr = PetscFree(vertex_indices);CHKERRQ(ierr); 17173425bc38SStefano Zampini ierr = PetscFree(aux_local_numbering_1);CHKERRQ(ierr); 17183425bc38SStefano Zampini ierr = PetscFree(aux_local_numbering_2);CHKERRQ(ierr); 17193425bc38SStefano Zampini ierr = PetscFree(aux_global_numbering);CHKERRQ(ierr); 17203425bc38SStefano Zampini ierr = PetscFree(aux_global_numbering_mpi);CHKERRQ(ierr); 17213425bc38SStefano Zampini ierr = PetscFree(dof_sizes);CHKERRQ(ierr); 17223425bc38SStefano Zampini ierr = PetscFree(dof_displs);CHKERRQ(ierr); 17233425bc38SStefano Zampini ierr = 
PetscFree(all_aux_global_numbering_mpi_1);CHKERRQ(ierr); 17243425bc38SStefano Zampini ierr = PetscFree(all_aux_global_numbering_mpi_2);CHKERRQ(ierr); 17253425bc38SStefano Zampini ierr = PetscFree(global_dofs_numbering);CHKERRQ(ierr); 17263425bc38SStefano Zampini ierr = PetscFree(aux_sums);CHKERRQ(ierr); 17273425bc38SStefano Zampini ierr = PetscFree(cols_B_delta);CHKERRQ(ierr); 17283425bc38SStefano Zampini ierr = PetscFree(vals_B_delta);CHKERRQ(ierr); 17293425bc38SStefano Zampini ierr = PetscFree(scaling_factors);CHKERRQ(ierr); 17303425bc38SStefano Zampini ierr = VecDestroy(&lambda_global);CHKERRQ(ierr); 17313425bc38SStefano Zampini ierr = ISDestroy(&IS_l2g_lambda);CHKERRQ(ierr); 17323425bc38SStefano Zampini 17333425bc38SStefano Zampini PetscFunctionReturn(0); 17343425bc38SStefano Zampini } 17353425bc38SStefano Zampini 17363425bc38SStefano Zampini #undef __FUNCT__ 17373425bc38SStefano Zampini #define __FUNCT__ "PCBDDCSetupFETIDPPCContext" 17383425bc38SStefano Zampini static PetscErrorCode PCBDDCSetupFETIDPPCContext(Mat fetimat, FETIDPPC_ctx *fetidppc_ctx) 17393425bc38SStefano Zampini { 17403425bc38SStefano Zampini FETIDPMat_ctx *mat_ctx; 17413425bc38SStefano Zampini PetscErrorCode ierr; 17423425bc38SStefano Zampini 17433425bc38SStefano Zampini PetscFunctionBegin; 17443425bc38SStefano Zampini ierr = MatShellGetContext(fetimat,&mat_ctx);CHKERRQ(ierr); 17453425bc38SStefano Zampini /* get references from objects created when setting up feti mat context */ 17463425bc38SStefano Zampini ierr = PetscObjectReference((PetscObject)mat_ctx->lambda_local);CHKERRQ(ierr); 17473425bc38SStefano Zampini fetidppc_ctx->lambda_local = mat_ctx->lambda_local; 17483425bc38SStefano Zampini ierr = PetscObjectReference((PetscObject)mat_ctx->B_Ddelta);CHKERRQ(ierr); 17493425bc38SStefano Zampini fetidppc_ctx->B_Ddelta = mat_ctx->B_Ddelta; 17503425bc38SStefano Zampini ierr = PetscObjectReference((PetscObject)mat_ctx->l2g_lambda);CHKERRQ(ierr); 17513425bc38SStefano Zampini 
fetidppc_ctx->l2g_lambda = mat_ctx->l2g_lambda; 17523425bc38SStefano Zampini PetscFunctionReturn(0); 17533425bc38SStefano Zampini } 17543425bc38SStefano Zampini 17553425bc38SStefano Zampini #undef __FUNCT__ 17563425bc38SStefano Zampini #define __FUNCT__ "FETIDPMatMult" 17573425bc38SStefano Zampini static PetscErrorCode FETIDPMatMult(Mat fetimat, Vec x, Vec y) 17583425bc38SStefano Zampini { 17593425bc38SStefano Zampini FETIDPMat_ctx *mat_ctx; 17603425bc38SStefano Zampini PC_IS *pcis; 17613425bc38SStefano Zampini PetscErrorCode ierr; 17623425bc38SStefano Zampini 17633425bc38SStefano Zampini PetscFunctionBegin; 17643425bc38SStefano Zampini ierr = MatShellGetContext(fetimat,&mat_ctx);CHKERRQ(ierr); 17653425bc38SStefano Zampini pcis = (PC_IS*)mat_ctx->pc->data; 17663425bc38SStefano Zampini /* Application of B_delta^T */ 17673425bc38SStefano Zampini ierr = VecScatterBegin(mat_ctx->l2g_lambda,x,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 17683425bc38SStefano Zampini ierr = VecScatterEnd(mat_ctx->l2g_lambda,x,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 17693425bc38SStefano Zampini ierr = MatMultTranspose(mat_ctx->B_delta,mat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr); 17703425bc38SStefano Zampini /* Application of \widetilde{S}^-1 */ 17713425bc38SStefano Zampini ierr = VecSet(pcis->vec1_D,0.0);CHKERRQ(ierr); 17723425bc38SStefano Zampini ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr); 17733425bc38SStefano Zampini /* Application of B_delta */ 17743425bc38SStefano Zampini ierr = MatMult(mat_ctx->B_delta,pcis->vec1_B,mat_ctx->lambda_local);CHKERRQ(ierr); 17753425bc38SStefano Zampini ierr = VecSet(y,0.0);CHKERRQ(ierr); 17763425bc38SStefano Zampini ierr = VecScatterBegin(mat_ctx->l2g_lambda,mat_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 17773425bc38SStefano Zampini ierr = VecScatterEnd(mat_ctx->l2g_lambda,mat_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 
17783425bc38SStefano Zampini PetscFunctionReturn(0); 17793425bc38SStefano Zampini } 17803425bc38SStefano Zampini 17813425bc38SStefano Zampini #undef __FUNCT__ 17823425bc38SStefano Zampini #define __FUNCT__ "FETIDPPCApply" 17833425bc38SStefano Zampini static PetscErrorCode FETIDPPCApply(PC fetipc, Vec x, Vec y) 17843425bc38SStefano Zampini { 17853425bc38SStefano Zampini FETIDPPC_ctx *pc_ctx; 17863425bc38SStefano Zampini PC_IS *pcis; 17873425bc38SStefano Zampini PetscErrorCode ierr; 17883425bc38SStefano Zampini 17893425bc38SStefano Zampini PetscFunctionBegin; 17903425bc38SStefano Zampini ierr = PCShellGetContext(fetipc,(void**)&pc_ctx); 17913425bc38SStefano Zampini pcis = (PC_IS*)pc_ctx->pc->data; 17923425bc38SStefano Zampini /* Application of B_Ddelta^T */ 17933425bc38SStefano Zampini ierr = VecScatterBegin(pc_ctx->l2g_lambda,x,pc_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 17943425bc38SStefano Zampini ierr = VecScatterEnd(pc_ctx->l2g_lambda,x,pc_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 17953425bc38SStefano Zampini ierr = VecSet(pcis->vec2_B,0.0);CHKERRQ(ierr); 17963425bc38SStefano Zampini ierr = MatMultTranspose(pc_ctx->B_Ddelta,pc_ctx->lambda_local,pcis->vec2_B);CHKERRQ(ierr); 17973425bc38SStefano Zampini /* Application of S */ 17983425bc38SStefano Zampini ierr = PCISApplySchur(pc_ctx->pc,pcis->vec2_B,pcis->vec1_B,(Vec)0,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr); 17993425bc38SStefano Zampini /* Application of B_Ddelta */ 18003425bc38SStefano Zampini ierr = MatMult(pc_ctx->B_Ddelta,pcis->vec1_B,pc_ctx->lambda_local);CHKERRQ(ierr); 18013425bc38SStefano Zampini ierr = VecSet(y,0.0);CHKERRQ(ierr); 18023425bc38SStefano Zampini ierr = VecScatterBegin(pc_ctx->l2g_lambda,pc_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 18033425bc38SStefano Zampini ierr = VecScatterEnd(pc_ctx->l2g_lambda,pc_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 18043425bc38SStefano Zampini PetscFunctionReturn(0); 
18053425bc38SStefano Zampini } 18063425bc38SStefano Zampini 1807da1bb401SStefano Zampini #undef __FUNCT__ 1808da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetupLocalAdjacencyGraph" 1809da1bb401SStefano Zampini static PetscErrorCode PCBDDCSetupLocalAdjacencyGraph(PC pc) 1810da1bb401SStefano Zampini { 1811da1bb401SStefano Zampini PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 1812da1bb401SStefano Zampini Mat_IS *matis = (Mat_IS*)pc->pmat->data; 1813da1bb401SStefano Zampini PetscInt nvtxs,*xadj,*adjncy; 1814da1bb401SStefano Zampini Mat mat_adj; 1815da1bb401SStefano Zampini PetscBool symmetrize_rowij=PETSC_TRUE,compressed_rowij=PETSC_FALSE,flg_row=PETSC_TRUE; 1816da1bb401SStefano Zampini PCBDDCGraph mat_graph=pcbddc->mat_graph; 1817da1bb401SStefano Zampini PetscErrorCode ierr; 1818da1bb401SStefano Zampini 1819da1bb401SStefano Zampini PetscFunctionBegin; 1820da1bb401SStefano Zampini /* get CSR adjacency from local matrix if user has not yet provided local graph using PCBDDCSetLocalAdjacencyGraph function */ 1821da1bb401SStefano Zampini if(!mat_graph->xadj) { 1822da1bb401SStefano Zampini ierr = MatConvert(matis->A,MATMPIADJ,MAT_INITIAL_MATRIX,&mat_adj);CHKERRQ(ierr); 1823da1bb401SStefano Zampini ierr = MatGetRowIJ(mat_adj,0,symmetrize_rowij,compressed_rowij,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr); 1824da1bb401SStefano Zampini if(!flg_row) { 1825da1bb401SStefano Zampini SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in MatGetRowIJ called in %s\n",__FUNCT__); 1826da1bb401SStefano Zampini } 1827da1bb401SStefano Zampini /* Get adjacency into BDDC workspace */ 1828da1bb401SStefano Zampini ierr = PCBDDCSetLocalAdjacencyGraph(pc,nvtxs,xadj,adjncy,PETSC_COPY_VALUES);CHKERRQ(ierr); 1829da1bb401SStefano Zampini ierr = MatRestoreRowIJ(mat_adj,0,symmetrize_rowij,compressed_rowij,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr); 1830da1bb401SStefano Zampini if(!flg_row) { 1831da1bb401SStefano Zampini SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in MatRestoreRowIJ called in 
%s\n",__FUNCT__); 1832da1bb401SStefano Zampini } 1833da1bb401SStefano Zampini ierr = MatDestroy(&mat_adj);CHKERRQ(ierr); 1834da1bb401SStefano Zampini } 1835da1bb401SStefano Zampini PetscFunctionReturn(0); 1836da1bb401SStefano Zampini } 1837da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */ 18380c7d97c5SJed Brown #undef __FUNCT__ 18390c7d97c5SJed Brown #define __FUNCT__ "PCBDDCApplyInterfacePreconditioner" 18402617d88aSStefano Zampini static PetscErrorCode PCBDDCApplyInterfacePreconditioner(PC pc) 18410c7d97c5SJed Brown { 18420c7d97c5SJed Brown PetscErrorCode ierr; 18430c7d97c5SJed Brown PC_BDDC* pcbddc = (PC_BDDC*)(pc->data); 18440c7d97c5SJed Brown PC_IS* pcis = (PC_IS*) (pc->data); 18453b03a366Sstefano_zampini const PetscScalar zero = 0.0; 18460c7d97c5SJed Brown 18470c7d97c5SJed Brown PetscFunctionBegin; 18480c7d97c5SJed Brown /* Application of PHI^T */ 18490c7d97c5SJed Brown ierr = MatMultTranspose(pcbddc->coarse_phi_B,pcis->vec1_B,pcbddc->vec1_P);CHKERRQ(ierr); 18500c7d97c5SJed Brown if(pcbddc->prec_type) { ierr = MatMultTransposeAdd(pcbddc->coarse_phi_D,pcis->vec1_D,pcbddc->vec1_P,pcbddc->vec1_P);CHKERRQ(ierr); } 18510c7d97c5SJed Brown 18520c7d97c5SJed Brown /* Scatter data of coarse_rhs */ 18530c7d97c5SJed Brown if(pcbddc->coarse_rhs) ierr = VecSet(pcbddc->coarse_rhs,zero);CHKERRQ(ierr); 18540c7d97c5SJed Brown ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->vec1_P,pcbddc->coarse_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 18550c7d97c5SJed Brown 18560c7d97c5SJed Brown /* Local solution on R nodes */ 18570c7d97c5SJed Brown ierr = VecSet(pcbddc->vec1_R,zero);CHKERRQ(ierr); 18580c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_B,pcis->vec1_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 18590c7d97c5SJed Brown ierr = VecScatterEnd (pcbddc->R_to_B,pcis->vec1_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 18600c7d97c5SJed Brown if(pcbddc->prec_type) { 18610c7d97c5SJed Brown 
ierr = VecScatterBegin(pcbddc->R_to_D,pcis->vec1_D,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 18620c7d97c5SJed Brown ierr = VecScatterEnd (pcbddc->R_to_D,pcis->vec1_D,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 18630c7d97c5SJed Brown } 18640c7d97c5SJed Brown ierr = PCBDDCSolveSaddlePoint(pc);CHKERRQ(ierr); 18650c7d97c5SJed Brown ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr); 18660c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec2_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 18670c7d97c5SJed Brown ierr = VecScatterEnd (pcbddc->R_to_B,pcbddc->vec2_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 18680c7d97c5SJed Brown if(pcbddc->prec_type) { 18690c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec2_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 18700c7d97c5SJed Brown ierr = VecScatterEnd (pcbddc->R_to_D,pcbddc->vec2_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 18710c7d97c5SJed Brown } 18720c7d97c5SJed Brown 18730c7d97c5SJed Brown /* Coarse solution */ 18740c7d97c5SJed Brown ierr = PCBDDCScatterCoarseDataEnd(pc,pcbddc->vec1_P,pcbddc->coarse_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 187553cdbc3dSStefano Zampini if(pcbddc->coarse_rhs) ierr = KSPSolve(pcbddc->coarse_ksp,pcbddc->coarse_rhs,pcbddc->coarse_vec);CHKERRQ(ierr); 18760c7d97c5SJed Brown ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 18770c7d97c5SJed Brown ierr = PCBDDCScatterCoarseDataEnd (pc,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 18780c7d97c5SJed Brown 18790c7d97c5SJed Brown /* Sum contributions from two levels */ 18800c7d97c5SJed Brown ierr = MatMultAdd(pcbddc->coarse_phi_B,pcbddc->vec1_P,pcis->vec1_B,pcis->vec1_B);CHKERRQ(ierr); 18810c7d97c5SJed Brown if(pcbddc->prec_type) { ierr = 
MatMultAdd(pcbddc->coarse_phi_D,pcbddc->vec1_P,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); } 18820c7d97c5SJed Brown PetscFunctionReturn(0); 18830c7d97c5SJed Brown } 18840c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 18850c7d97c5SJed Brown #undef __FUNCT__ 18860c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSolveSaddlePoint" 188753cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSolveSaddlePoint(PC pc) 18880c7d97c5SJed Brown { 18890c7d97c5SJed Brown PetscErrorCode ierr; 18900c7d97c5SJed Brown PC_BDDC* pcbddc = (PC_BDDC*)(pc->data); 18910c7d97c5SJed Brown 18920c7d97c5SJed Brown PetscFunctionBegin; 189353cdbc3dSStefano Zampini ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr); 1894534831adSStefano Zampini if(pcbddc->local_auxmat1) { 18950c7d97c5SJed Brown ierr = MatMult(pcbddc->local_auxmat1,pcbddc->vec2_R,pcbddc->vec1_C);CHKERRQ(ierr); 18960c7d97c5SJed Brown ierr = MatMultAdd(pcbddc->local_auxmat2,pcbddc->vec1_C,pcbddc->vec2_R,pcbddc->vec2_R);CHKERRQ(ierr); 18970c7d97c5SJed Brown } 18980c7d97c5SJed Brown PetscFunctionReturn(0); 18990c7d97c5SJed Brown } 19000c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 19010c7d97c5SJed Brown #undef __FUNCT__ 19020c7d97c5SJed Brown #define __FUNCT__ "PCBDDCScatterCoarseDataBegin" 190353cdbc3dSStefano Zampini static PetscErrorCode PCBDDCScatterCoarseDataBegin(PC pc,Vec vec_from, Vec vec_to, InsertMode imode, ScatterMode smode) 19040c7d97c5SJed Brown { 19050c7d97c5SJed Brown PetscErrorCode ierr; 19060c7d97c5SJed Brown PC_BDDC* pcbddc = (PC_BDDC*)(pc->data); 19070c7d97c5SJed Brown 19080c7d97c5SJed Brown PetscFunctionBegin; 19090c7d97c5SJed Brown switch(pcbddc->coarse_communications_type){ 19100c7d97c5SJed Brown case SCATTERS_BDDC: 19110c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->coarse_loc_to_glob,vec_from,vec_to,imode,smode);CHKERRQ(ierr); 19120c7d97c5SJed Brown break; 19130c7d97c5SJed Brown case 
GATHERS_BDDC: 19140c7d97c5SJed Brown break; 19150c7d97c5SJed Brown } 19160c7d97c5SJed Brown PetscFunctionReturn(0); 19170c7d97c5SJed Brown } 19180c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 19190c7d97c5SJed Brown #undef __FUNCT__ 19200c7d97c5SJed Brown #define __FUNCT__ "PCBDDCScatterCoarseDataEnd" 192153cdbc3dSStefano Zampini static PetscErrorCode PCBDDCScatterCoarseDataEnd(PC pc,Vec vec_from, Vec vec_to, InsertMode imode, ScatterMode smode) 19220c7d97c5SJed Brown { 19230c7d97c5SJed Brown PetscErrorCode ierr; 19240c7d97c5SJed Brown PC_BDDC* pcbddc = (PC_BDDC*)(pc->data); 19250c7d97c5SJed Brown PetscScalar* array_to; 19260c7d97c5SJed Brown PetscScalar* array_from; 19270c7d97c5SJed Brown MPI_Comm comm=((PetscObject)pc)->comm; 19280c7d97c5SJed Brown PetscInt i; 19290c7d97c5SJed Brown 19300c7d97c5SJed Brown PetscFunctionBegin; 19310c7d97c5SJed Brown 19320c7d97c5SJed Brown switch(pcbddc->coarse_communications_type){ 19330c7d97c5SJed Brown case SCATTERS_BDDC: 19340c7d97c5SJed Brown ierr = VecScatterEnd(pcbddc->coarse_loc_to_glob,vec_from,vec_to,imode,smode);CHKERRQ(ierr); 19350c7d97c5SJed Brown break; 19360c7d97c5SJed Brown case GATHERS_BDDC: 19370c7d97c5SJed Brown if(vec_from) VecGetArray(vec_from,&array_from); 19380c7d97c5SJed Brown if(vec_to) VecGetArray(vec_to,&array_to); 19390c7d97c5SJed Brown switch(pcbddc->coarse_problem_type){ 19400c7d97c5SJed Brown case SEQUENTIAL_BDDC: 19410c7d97c5SJed Brown if(smode == SCATTER_FORWARD) { 194253cdbc3dSStefano Zampini ierr = MPI_Gatherv(&array_from[0],pcbddc->local_primal_size,MPIU_SCALAR,&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,0,comm);CHKERRQ(ierr); 19430c7d97c5SJed Brown if(vec_to) { 19440c7d97c5SJed Brown for(i=0;i<pcbddc->replicated_primal_size;i++) 19450c7d97c5SJed Brown array_to[pcbddc->replicated_local_primal_indices[i]]+=pcbddc->replicated_local_primal_values[i]; 19460c7d97c5SJed Brown } 
19470c7d97c5SJed Brown } else { 19480c7d97c5SJed Brown if(vec_from) 19490c7d97c5SJed Brown for(i=0;i<pcbddc->replicated_primal_size;i++) 19500c7d97c5SJed Brown pcbddc->replicated_local_primal_values[i]=array_from[pcbddc->replicated_local_primal_indices[i]]; 195153cdbc3dSStefano Zampini ierr = MPI_Scatterv(&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,&array_to[0],pcbddc->local_primal_size,MPIU_SCALAR,0,comm);CHKERRQ(ierr); 19520c7d97c5SJed Brown } 19530c7d97c5SJed Brown break; 19540c7d97c5SJed Brown case REPLICATED_BDDC: 19550c7d97c5SJed Brown if(smode == SCATTER_FORWARD) { 195653cdbc3dSStefano Zampini ierr = MPI_Allgatherv(&array_from[0],pcbddc->local_primal_size,MPIU_SCALAR,&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,comm);CHKERRQ(ierr); 19570c7d97c5SJed Brown for(i=0;i<pcbddc->replicated_primal_size;i++) 19580c7d97c5SJed Brown array_to[pcbddc->replicated_local_primal_indices[i]]+=pcbddc->replicated_local_primal_values[i]; 19590c7d97c5SJed Brown } else { /* no communications needed for SCATTER_REVERSE since needed data is already present */ 19600c7d97c5SJed Brown for(i=0;i<pcbddc->local_primal_size;i++) 19610c7d97c5SJed Brown array_to[i]=array_from[pcbddc->local_primal_indices[i]]; 19620c7d97c5SJed Brown } 19630c7d97c5SJed Brown break; 196453cdbc3dSStefano Zampini case MULTILEVEL_BDDC: 196553cdbc3dSStefano Zampini break; 196653cdbc3dSStefano Zampini case PARALLEL_BDDC: 196753cdbc3dSStefano Zampini break; 19680c7d97c5SJed Brown } 19690c7d97c5SJed Brown if(vec_from) VecRestoreArray(vec_from,&array_from); 19700c7d97c5SJed Brown if(vec_to) VecRestoreArray(vec_to,&array_to); 19710c7d97c5SJed Brown break; 19720c7d97c5SJed Brown } 19730c7d97c5SJed Brown PetscFunctionReturn(0); 19740c7d97c5SJed Brown } 19750c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 
19763b03a366Sstefano_zampini #undef __FUNCT__ 19773b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCCreateConstraintMatrix" 19783b03a366Sstefano_zampini static PetscErrorCode PCBDDCCreateConstraintMatrix(PC pc) 19793b03a366Sstefano_zampini { 19803b03a366Sstefano_zampini PetscErrorCode ierr; 19813b03a366Sstefano_zampini PC_IS* pcis = (PC_IS*)(pc->data); 19823b03a366Sstefano_zampini PC_BDDC* pcbddc = (PC_BDDC*)pc->data; 19833b03a366Sstefano_zampini Mat_IS *matis = (Mat_IS*)pc->pmat->data; 198423d4d1a5SStefano Zampini PetscInt *nnz,*is_indices; 19853b03a366Sstefano_zampini PetscScalar *temp_quadrature_constraint; 1986534831adSStefano Zampini PetscInt *temp_indices,*temp_indices_to_constraint,*temp_indices_to_constraint_B,*local_to_B; 19873b03a366Sstefano_zampini PetscInt local_primal_size,i,j,k,total_counts,max_size_of_constraint; 19883b03a366Sstefano_zampini PetscInt n_constraints,n_vertices,size_of_constraint; 1989534831adSStefano Zampini PetscScalar quad_value; 19903b03a366Sstefano_zampini PetscBool nnsp_has_cnst=PETSC_FALSE,use_nnsp_true=pcbddc->use_nnsp_true; 19913b03a366Sstefano_zampini PetscInt nnsp_size=0,nnsp_addone=0,temp_constraints,temp_start_ptr; 19923b03a366Sstefano_zampini IS *used_IS; 19933b03a366Sstefano_zampini const MatType impMatType=MATSEQAIJ; 19943b03a366Sstefano_zampini PetscBLASInt Bs,Bt,lwork,lierr; 19953b03a366Sstefano_zampini PetscReal tol=1.0e-8; 1996fcda91b4SJed Brown MatNullSpace nearnullsp; 1997fcda91b4SJed Brown const Vec *nearnullvecs; 19983b03a366Sstefano_zampini Vec *localnearnullsp; 19993b03a366Sstefano_zampini PetscScalar *work,*temp_basis,*array_vector,*correlation_mat; 20003b03a366Sstefano_zampini PetscReal *rwork,*singular_vals; 2001534831adSStefano Zampini PetscBLASInt Bone=1,*ipiv; 2002534831adSStefano Zampini Vec temp_vec; 2003534831adSStefano Zampini Mat temp_mat; 2004534831adSStefano Zampini KSP temp_ksp; 2005ffe5efe1SStefano Zampini PC temp_pc; 2006534831adSStefano Zampini PetscInt s,start_constraint,dual_dofs; 
2007534831adSStefano Zampini PetscBool compute_submatrix,useksp=PETSC_FALSE; 2008534831adSStefano Zampini PetscInt *aux_primal_permutation,*aux_primal_numbering; 2009534831adSStefano Zampini PetscBool boolforface,*change_basis; 2010de534f79Sstefano_zampini /* some ugly conditional declarations */ 20113b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD) 20123b03a366Sstefano_zampini PetscScalar dot_result; 20133b03a366Sstefano_zampini PetscScalar one=1.0,zero=0.0; 20143b03a366Sstefano_zampini PetscInt ii; 20153425bc38SStefano Zampini PetscScalar *singular_vectors; 20163425bc38SStefano Zampini PetscBLASInt *iwork,*ifail; 20173425bc38SStefano Zampini PetscReal dummy_real,abs_tol; 20183425bc38SStefano Zampini PetscBLASInt eigs_found; 20193b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX) 20203b03a366Sstefano_zampini PetscScalar val1,val2; 20213b03a366Sstefano_zampini #endif 20223425bc38SStefano Zampini #endif 20233b03a366Sstefano_zampini PetscBLASInt dummy_int; 20243b03a366Sstefano_zampini PetscScalar dummy_scalar; 20253b03a366Sstefano_zampini 20263b03a366Sstefano_zampini PetscFunctionBegin; 20273b03a366Sstefano_zampini /* check if near null space is attached to global mat */ 2028fcda91b4SJed Brown ierr = MatGetNearNullSpace(pc->pmat,&nearnullsp);CHKERRQ(ierr); 2029fcda91b4SJed Brown if (nearnullsp) { 2030fcda91b4SJed Brown ierr = MatNullSpaceGetVecs(nearnullsp,&nnsp_has_cnst,&nnsp_size,&nearnullvecs);CHKERRQ(ierr); 20313b03a366Sstefano_zampini } else { /* if near null space is not provided it uses constants */ 20323b03a366Sstefano_zampini nnsp_has_cnst = PETSC_TRUE; 20333b03a366Sstefano_zampini use_nnsp_true = PETSC_TRUE; 20343b03a366Sstefano_zampini } 20353b03a366Sstefano_zampini if(nnsp_has_cnst) { 20363b03a366Sstefano_zampini nnsp_addone = 1; 20373b03a366Sstefano_zampini } 20383b03a366Sstefano_zampini /* 20393b03a366Sstefano_zampini Evaluate maximum storage size needed by the procedure 20403b03a366Sstefano_zampini - temp_indices will contain start 
index of each constraint stored as follows 20413b03a366Sstefano_zampini - temp_indices_to_constraint [temp_indices[i],...,temp[indices[i+1]-1] will contain the indices (in local numbering) on which the constraint acts 2042534831adSStefano Zampini - temp_indices_to_constraint_B[temp_indices[i],...,temp[indices[i+1]-1] will contain the indices (in boundary numbering) on which the constraint acts 20433b03a366Sstefano_zampini - temp_quadrature_constraint [temp_indices[i],...,temp[indices[i+1]-1] will contain the scalars representing the constraint itself 20443b03a366Sstefano_zampini */ 2045da1bb401SStefano Zampini 20463b03a366Sstefano_zampini total_counts = pcbddc->n_ISForFaces+pcbddc->n_ISForEdges; 20473b03a366Sstefano_zampini total_counts *= (nnsp_addone+nnsp_size); 2048da1bb401SStefano Zampini ierr = ISGetSize(pcbddc->ISForVertices,&n_vertices);CHKERRQ(ierr); 2049da1bb401SStefano Zampini total_counts += n_vertices; 20503b03a366Sstefano_zampini ierr = PetscMalloc((total_counts+1)*sizeof(PetscInt),&temp_indices);CHKERRQ(ierr); 2051534831adSStefano Zampini ierr = PetscMalloc((total_counts+1)*sizeof(PetscBool),&change_basis);CHKERRQ(ierr); 20523b03a366Sstefano_zampini total_counts = 0; 20533b03a366Sstefano_zampini max_size_of_constraint = 0; 20543b03a366Sstefano_zampini for(i=0;i<pcbddc->n_ISForEdges+pcbddc->n_ISForFaces;i++){ 20553b03a366Sstefano_zampini if(i<pcbddc->n_ISForEdges){ 20563b03a366Sstefano_zampini used_IS = &pcbddc->ISForEdges[i]; 20573b03a366Sstefano_zampini } else { 20583b03a366Sstefano_zampini used_IS = &pcbddc->ISForFaces[i-pcbddc->n_ISForEdges]; 20593b03a366Sstefano_zampini } 20603b03a366Sstefano_zampini ierr = ISGetSize(*used_IS,&j);CHKERRQ(ierr); 20613b03a366Sstefano_zampini total_counts += j; 20623b03a366Sstefano_zampini if(j>max_size_of_constraint) max_size_of_constraint=j; 20633b03a366Sstefano_zampini } 20643b03a366Sstefano_zampini total_counts *= (nnsp_addone+nnsp_size); 2065da1bb401SStefano Zampini total_counts += n_vertices; 
20663b03a366Sstefano_zampini ierr = PetscMalloc(total_counts*sizeof(PetscScalar),&temp_quadrature_constraint);CHKERRQ(ierr); 20673b03a366Sstefano_zampini ierr = PetscMalloc(total_counts*sizeof(PetscInt),&temp_indices_to_constraint);CHKERRQ(ierr); 2068534831adSStefano Zampini ierr = PetscMalloc(total_counts*sizeof(PetscInt),&temp_indices_to_constraint_B);CHKERRQ(ierr); 2069534831adSStefano Zampini ierr = PetscMalloc(pcis->n*sizeof(PetscInt),&local_to_B);CHKERRQ(ierr); 2070534831adSStefano Zampini ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 2071534831adSStefano Zampini for(i=0;i<pcis->n;i++) { 2072534831adSStefano Zampini local_to_B[i]=-1; 2073534831adSStefano Zampini } 2074534831adSStefano Zampini for(i=0;i<pcis->n_B;i++) { 2075534831adSStefano Zampini local_to_B[is_indices[i]]=i; 2076534831adSStefano Zampini } 2077534831adSStefano Zampini ierr = ISRestoreIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 2078534831adSStefano Zampini 20793b03a366Sstefano_zampini /* First we issue queries to allocate optimal workspace for LAPACKgesvd or LAPACKsyev/LAPACKheev */ 20803b03a366Sstefano_zampini rwork = 0; 20813b03a366Sstefano_zampini work = 0; 20823b03a366Sstefano_zampini singular_vals = 0; 20833b03a366Sstefano_zampini temp_basis = 0; 20843b03a366Sstefano_zampini correlation_mat = 0; 20853b03a366Sstefano_zampini if(!pcbddc->use_nnsp_true) { 20863b03a366Sstefano_zampini PetscScalar temp_work; 20873b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD) 20883b03a366Sstefano_zampini /* POD */ 20893b03a366Sstefano_zampini PetscInt max_n; 20903b03a366Sstefano_zampini max_n = nnsp_addone+nnsp_size; 20913b03a366Sstefano_zampini /* using some techniques borrowed from Proper Orthogonal Decomposition */ 20923b03a366Sstefano_zampini ierr = PetscMalloc(max_n*max_n*sizeof(PetscScalar),&correlation_mat);CHKERRQ(ierr); 20933425bc38SStefano Zampini ierr = 
PetscMalloc(max_n*max_n*sizeof(PetscScalar),&singular_vectors);CHKERRQ(ierr); 20943b03a366Sstefano_zampini ierr = PetscMalloc(max_n*sizeof(PetscReal),&singular_vals);CHKERRQ(ierr); 20953b03a366Sstefano_zampini ierr = PetscMalloc(max_size_of_constraint*(nnsp_addone+nnsp_size)*sizeof(PetscScalar),&temp_basis);CHKERRQ(ierr); 20963b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX) 20973b03a366Sstefano_zampini ierr = PetscMalloc(3*max_n*sizeof(PetscReal),&rwork);CHKERRQ(ierr); 20983b03a366Sstefano_zampini #endif 20993425bc38SStefano Zampini ierr = PetscMalloc(5*max_n*sizeof(PetscBLASInt),&iwork);CHKERRQ(ierr); 21003425bc38SStefano Zampini ierr = PetscMalloc(max_n*sizeof(PetscBLASInt),&ifail);CHKERRQ(ierr); 21013b03a366Sstefano_zampini /* now we evaluate the optimal workspace using query with lwork=-1 */ 21023b03a366Sstefano_zampini Bt = PetscBLASIntCast(max_n); 21033b03a366Sstefano_zampini lwork=-1; 21043425bc38SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 21053b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX) 21063425bc38SStefano Zampini abs_tol=1.e-8; 21073425bc38SStefano Zampini /* LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,&temp_work,&lwork,&lierr); */ 21083425bc38SStefano Zampini LAPACKsyevx_("V","A","U",&Bt,correlation_mat,&Bt,&dummy_real,&dummy_real,&dummy_int,&dummy_int, 21093425bc38SStefano Zampini &abs_tol,&eigs_found,singular_vals,singular_vectors,&Bt,&temp_work,&lwork,iwork,ifail,&lierr); 21103b03a366Sstefano_zampini #else 21113425bc38SStefano Zampini /* LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,&temp_work,&lwork,rwork,&lierr); */ 21123425bc38SStefano Zampini /* LAPACK call is missing here! 
TODO */ 21133425bc38SStefano Zampini SETERRQ(((PetscObject) pc)->comm, PETSC_ERR_SUP, "Not yet implemented for complexes when PETSC_MISSING_GESVD = 1"); 21143b03a366Sstefano_zampini #endif 21153425bc38SStefano Zampini if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SYEVX Lapack routine %d",(int)lierr); 21163425bc38SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 21173b03a366Sstefano_zampini #else /* on missing GESVD */ 21183b03a366Sstefano_zampini /* SVD */ 21193b03a366Sstefano_zampini PetscInt max_n,min_n; 21203b03a366Sstefano_zampini max_n = max_size_of_constraint; 21213b03a366Sstefano_zampini min_n = nnsp_addone+nnsp_size; 21223b03a366Sstefano_zampini if(max_size_of_constraint < ( nnsp_addone+nnsp_size ) ) { 21233b03a366Sstefano_zampini min_n = max_size_of_constraint; 21243b03a366Sstefano_zampini max_n = nnsp_addone+nnsp_size; 21253b03a366Sstefano_zampini } 21263b03a366Sstefano_zampini ierr = PetscMalloc(min_n*sizeof(PetscReal),&singular_vals);CHKERRQ(ierr); 21273b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX) 21283b03a366Sstefano_zampini ierr = PetscMalloc(5*min_n*sizeof(PetscReal),&rwork);CHKERRQ(ierr); 21293b03a366Sstefano_zampini #endif 21303b03a366Sstefano_zampini /* now we evaluate the optimal workspace using query with lwork=-1 */ 21313b03a366Sstefano_zampini lwork=-1; 21323b03a366Sstefano_zampini Bs = PetscBLASIntCast(max_n); 21333b03a366Sstefano_zampini Bt = PetscBLASIntCast(min_n); 21343b03a366Sstefano_zampini dummy_int = Bs; 2135670f3ff9SJed Brown ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 21363b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX) 21373b03a366Sstefano_zampini LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[0],&Bs,singular_vals, 21383b03a366Sstefano_zampini &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,&temp_work,&lwork,&lierr); 21393b03a366Sstefano_zampini #else 21403b03a366Sstefano_zampini LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[0],&Bs,singular_vals, 
21413b03a366Sstefano_zampini &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,&temp_work,&lwork,rwork,&lierr); 21423b03a366Sstefano_zampini #endif 21433b03a366Sstefano_zampini if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SVD Lapack routine %d",(int)lierr); 2144670f3ff9SJed Brown ierr = PetscFPTrapPop();CHKERRQ(ierr); 21453b03a366Sstefano_zampini #endif 21463b03a366Sstefano_zampini /* Allocate optimal workspace */ 21473b03a366Sstefano_zampini lwork = PetscBLASIntCast((PetscInt)PetscRealPart(temp_work)); 21483b03a366Sstefano_zampini total_counts = (PetscInt)lwork; 21493b03a366Sstefano_zampini ierr = PetscMalloc(total_counts*sizeof(PetscScalar),&work);CHKERRQ(ierr); 21503b03a366Sstefano_zampini } 21513b03a366Sstefano_zampini /* get local part of global near null space vectors */ 21523b03a366Sstefano_zampini ierr = PetscMalloc(nnsp_size*sizeof(Vec),&localnearnullsp);CHKERRQ(ierr); 21533b03a366Sstefano_zampini for(k=0;k<nnsp_size;k++) { 21543b03a366Sstefano_zampini ierr = VecDuplicate(pcis->vec1_N,&localnearnullsp[k]);CHKERRQ(ierr); 2155fcda91b4SJed Brown ierr = VecScatterBegin(matis->ctx,nearnullvecs[k],localnearnullsp[k],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 2156fcda91b4SJed Brown ierr = VecScatterEnd (matis->ctx,nearnullvecs[k],localnearnullsp[k],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 21573b03a366Sstefano_zampini } 21583b03a366Sstefano_zampini /* Now we can loop on constraining sets */ 21593b03a366Sstefano_zampini total_counts=0; 21603b03a366Sstefano_zampini temp_indices[0]=0; 2161da1bb401SStefano Zampini /* vertices */ 2162da1bb401SStefano Zampini PetscBool used_vertex; 2163da1bb401SStefano Zampini ierr = ISGetIndices(pcbddc->ISForVertices,(const PetscInt**)&is_indices);CHKERRQ(ierr); 2164da1bb401SStefano Zampini if(nnsp_has_cnst) { /* consider all vertices */ 2165da1bb401SStefano Zampini for(i=0;i<n_vertices;i++) { 2166da1bb401SStefano Zampini temp_indices_to_constraint[temp_indices[total_counts]]=is_indices[i]; 
2167534831adSStefano Zampini temp_indices_to_constraint_B[temp_indices[total_counts]]=local_to_B[is_indices[i]]; 2168da1bb401SStefano Zampini temp_quadrature_constraint[temp_indices[total_counts]]=1.0; 2169da1bb401SStefano Zampini temp_indices[total_counts+1]=temp_indices[total_counts]+1; 2170534831adSStefano Zampini change_basis[total_counts]=PETSC_FALSE; 2171da1bb401SStefano Zampini total_counts++; 2172da1bb401SStefano Zampini } 2173da1bb401SStefano Zampini } else { /* consider vertices for which exist at least a localnearnullsp which is not null there */ 2174da1bb401SStefano Zampini for(i=0;i<n_vertices;i++) { 2175da1bb401SStefano Zampini used_vertex=PETSC_FALSE; 2176da1bb401SStefano Zampini k=0; 2177da1bb401SStefano Zampini while(!used_vertex && k<nnsp_size) { 2178da1bb401SStefano Zampini ierr = VecGetArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr); 2179da1bb401SStefano Zampini if(PetscAbsScalar(array_vector[is_indices[i]])>0.0) { 2180da1bb401SStefano Zampini temp_indices_to_constraint[temp_indices[total_counts]]=is_indices[i]; 2181534831adSStefano Zampini temp_indices_to_constraint_B[temp_indices[total_counts]]=local_to_B[is_indices[i]]; 2182da1bb401SStefano Zampini temp_quadrature_constraint[temp_indices[total_counts]]=1.0; 2183da1bb401SStefano Zampini temp_indices[total_counts+1]=temp_indices[total_counts]+1; 2184534831adSStefano Zampini change_basis[total_counts]=PETSC_FALSE; 2185da1bb401SStefano Zampini total_counts++; 2186da1bb401SStefano Zampini used_vertex=PETSC_TRUE; 2187da1bb401SStefano Zampini } 2188da1bb401SStefano Zampini ierr = VecRestoreArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr); 2189da1bb401SStefano Zampini k++; 2190da1bb401SStefano Zampini } 2191da1bb401SStefano Zampini } 2192da1bb401SStefano Zampini } 2193da1bb401SStefano Zampini ierr = ISRestoreIndices(pcbddc->ISForVertices,(const PetscInt**)&is_indices);CHKERRQ(ierr); 2194da1bb401SStefano Zampini n_vertices=total_counts; 
2195da1bb401SStefano Zampini /* edges and faces */ 21963b03a366Sstefano_zampini for(i=0;i<pcbddc->n_ISForEdges+pcbddc->n_ISForFaces;i++){ 21973b03a366Sstefano_zampini if(i<pcbddc->n_ISForEdges){ 21983b03a366Sstefano_zampini used_IS = &pcbddc->ISForEdges[i]; 2199534831adSStefano Zampini boolforface = pcbddc->usechangeofbasis; 22003b03a366Sstefano_zampini } else { 22013b03a366Sstefano_zampini used_IS = &pcbddc->ISForFaces[i-pcbddc->n_ISForEdges]; 2202534831adSStefano Zampini boolforface = pcbddc->usechangeonfaces; 22033b03a366Sstefano_zampini } 22043b03a366Sstefano_zampini temp_constraints = 0; /* zero the number of constraints I have on this conn comp */ 22053b03a366Sstefano_zampini temp_start_ptr = total_counts; /* need to know the starting index of constraints stored */ 22063b03a366Sstefano_zampini ierr = ISGetSize(*used_IS,&size_of_constraint);CHKERRQ(ierr); 22073b03a366Sstefano_zampini ierr = ISGetIndices(*used_IS,(const PetscInt**)&is_indices);CHKERRQ(ierr); 22083b03a366Sstefano_zampini if(nnsp_has_cnst) { 22093b03a366Sstefano_zampini temp_constraints++; 2210534831adSStefano Zampini quad_value = (PetscScalar) (1.0/PetscSqrtReal((PetscReal)size_of_constraint)); 22113b03a366Sstefano_zampini for(j=0;j<size_of_constraint;j++) { 22123b03a366Sstefano_zampini temp_indices_to_constraint[temp_indices[total_counts]+j]=is_indices[j]; 2213534831adSStefano Zampini temp_indices_to_constraint_B[temp_indices[total_counts]+j]=local_to_B[is_indices[j]]; 22143b03a366Sstefano_zampini temp_quadrature_constraint[temp_indices[total_counts]+j]=quad_value; 22153b03a366Sstefano_zampini } 22163b03a366Sstefano_zampini temp_indices[total_counts+1]=temp_indices[total_counts]+size_of_constraint; /* store new starting point */ 2217534831adSStefano Zampini change_basis[total_counts]=boolforface; 22183b03a366Sstefano_zampini total_counts++; 22193b03a366Sstefano_zampini } 22203b03a366Sstefano_zampini for(k=0;k<nnsp_size;k++) { 22213b03a366Sstefano_zampini ierr = 
VecGetArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr); 22223b03a366Sstefano_zampini for(j=0;j<size_of_constraint;j++) { 22233b03a366Sstefano_zampini temp_indices_to_constraint[temp_indices[total_counts]+j]=is_indices[j]; 2224534831adSStefano Zampini temp_indices_to_constraint_B[temp_indices[total_counts]+j]=local_to_B[is_indices[j]]; 22253b03a366Sstefano_zampini temp_quadrature_constraint[temp_indices[total_counts]+j]=array_vector[is_indices[j]]; 22263b03a366Sstefano_zampini } 22273b03a366Sstefano_zampini ierr = VecRestoreArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr); 2228de534f79Sstefano_zampini quad_value = 1.0; 2229de534f79Sstefano_zampini if( use_nnsp_true ) { /* check if array is null on the connected component in case use_nnsp_true has been requested */ 2230de534f79Sstefano_zampini Bs = PetscBLASIntCast(size_of_constraint); 2231de534f79Sstefano_zampini quad_value = BLASasum_(&Bs,&temp_quadrature_constraint[temp_indices[total_counts]],&Bone); 2232de534f79Sstefano_zampini } 2233de534f79Sstefano_zampini if ( quad_value > 0.0 ) { /* keep indices and values */ 2234de534f79Sstefano_zampini temp_constraints++; 22353b03a366Sstefano_zampini temp_indices[total_counts+1]=temp_indices[total_counts]+size_of_constraint; /* store new starting point */ 2236534831adSStefano Zampini change_basis[total_counts]=boolforface; 22373b03a366Sstefano_zampini total_counts++; 22383b03a366Sstefano_zampini } 2239de534f79Sstefano_zampini } 22403b03a366Sstefano_zampini ierr = ISRestoreIndices(*used_IS,(const PetscInt**)&is_indices);CHKERRQ(ierr); 2241de534f79Sstefano_zampini /* perform SVD on the constraint if use_nnsp_true has not be requested by the user */ 22423b03a366Sstefano_zampini if(!use_nnsp_true) { 2243de534f79Sstefano_zampini 22443b03a366Sstefano_zampini Bs = PetscBLASIntCast(size_of_constraint); 22453b03a366Sstefano_zampini Bt = PetscBLASIntCast(temp_constraints); 2246de534f79Sstefano_zampini 
22473b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD) 22483b03a366Sstefano_zampini ierr = PetscMemzero(correlation_mat,Bt*Bt*sizeof(PetscScalar));CHKERRQ(ierr); 22493b03a366Sstefano_zampini /* Store upper triangular part of correlation matrix */ 22503b03a366Sstefano_zampini for(j=0;j<temp_constraints;j++) { 22513b03a366Sstefano_zampini for(k=0;k<j+1;k++) { 22523b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX) 22533425bc38SStefano Zampini /* hand made complex dot product -> replace */ 22543b03a366Sstefano_zampini dot_result = 0.0; 22553b03a366Sstefano_zampini for (ii=0; ii<size_of_constraint; ii++) { 22563b03a366Sstefano_zampini val1 = temp_quadrature_constraint[temp_indices[temp_start_ptr+j]+ii]; 22573b03a366Sstefano_zampini val2 = temp_quadrature_constraint[temp_indices[temp_start_ptr+k]+ii]; 22583b03a366Sstefano_zampini dot_result += val1*PetscConj(val2); 22593b03a366Sstefano_zampini } 22603b03a366Sstefano_zampini #else 22613b03a366Sstefano_zampini dot_result = BLASdot_(&Bs,&temp_quadrature_constraint[temp_indices[temp_start_ptr+j]],&Bone, 22623b03a366Sstefano_zampini &temp_quadrature_constraint[temp_indices[temp_start_ptr+k]],&Bone); 22633b03a366Sstefano_zampini #endif 22643b03a366Sstefano_zampini correlation_mat[j*temp_constraints+k]=dot_result; 22653b03a366Sstefano_zampini } 22663b03a366Sstefano_zampini } 22673425bc38SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 22683b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX) 22693425bc38SStefano Zampini /* LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,work,&lwork,&lierr); */ 22703425bc38SStefano Zampini LAPACKsyevx_("V","A","U",&Bt,correlation_mat,&Bt,&dummy_real,&dummy_real,&dummy_int,&dummy_int, 22713425bc38SStefano Zampini &abs_tol,&eigs_found,singular_vals,singular_vectors,&Bt,work,&lwork,iwork,ifail,&lierr); 22723b03a366Sstefano_zampini #else 22733425bc38SStefano Zampini /* LAPACK call is missing here! 
TODO */ 22743425bc38SStefano Zampini SETERRQ(((PetscObject) pc)->comm, PETSC_ERR_SUP, "Not yet implemented for complexes when PETSC_MISSING_GESVD = 1"); 22753b03a366Sstefano_zampini #endif 22763425bc38SStefano Zampini if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYEVX Lapack routine %d",(int)lierr); 22773425bc38SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 22783b03a366Sstefano_zampini /* retain eigenvalues greater than tol: note that lapack SYEV gives eigs in ascending order */ 22793b03a366Sstefano_zampini j=0; 22803b03a366Sstefano_zampini while( j < Bt && singular_vals[j] < tol) j++; 22813b03a366Sstefano_zampini total_counts=total_counts-j; 22823b03a366Sstefano_zampini if(j<temp_constraints) { 22833b03a366Sstefano_zampini for(k=j;k<Bt;k++) { singular_vals[k]=1.0/PetscSqrtReal(singular_vals[k]); } 22843425bc38SStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 22853b03a366Sstefano_zampini BLASgemm_("N","N",&Bs,&Bt,&Bt,&one,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,correlation_mat,&Bt,&zero,temp_basis,&Bs); 22863425bc38SStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 22873b03a366Sstefano_zampini /* copy POD basis into used quadrature memory */ 22883b03a366Sstefano_zampini for(k=0;k<Bt-j;k++) { 22893b03a366Sstefano_zampini for(ii=0;ii<size_of_constraint;ii++) { 22903b03a366Sstefano_zampini temp_quadrature_constraint[temp_indices[temp_start_ptr+k]+ii]=singular_vals[Bt-1-k]*temp_basis[(Bt-1-k)*size_of_constraint+ii]; 22913b03a366Sstefano_zampini } 22923b03a366Sstefano_zampini } 22933b03a366Sstefano_zampini } 2294de534f79Sstefano_zampini 22953b03a366Sstefano_zampini #else /* on missing GESVD */ 22963b03a366Sstefano_zampini PetscInt min_n = temp_constraints; 22973b03a366Sstefano_zampini if(min_n > size_of_constraint) min_n = size_of_constraint; 22983b03a366Sstefano_zampini dummy_int = Bs; 2299670f3ff9SJed Brown ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 23003b03a366Sstefano_zampini 
#if !defined(PETSC_USE_COMPLEX) 23013b03a366Sstefano_zampini LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,singular_vals, 23023b03a366Sstefano_zampini &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,work,&lwork,&lierr); 23033b03a366Sstefano_zampini #else 23043b03a366Sstefano_zampini LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,singular_vals, 23053b03a366Sstefano_zampini &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,work,&lwork,rwork,&lierr); 23063b03a366Sstefano_zampini #endif 23073b03a366Sstefano_zampini if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SVD Lapack routine %d",(int)lierr); 2308670f3ff9SJed Brown ierr = PetscFPTrapPop();CHKERRQ(ierr); 23093b03a366Sstefano_zampini /* retain eigenvalues greater than tol: note that lapack SVD gives eigs in descending order */ 23103b03a366Sstefano_zampini j=0; 23113b03a366Sstefano_zampini while( j < min_n && singular_vals[min_n-j-1] < tol) j++; 23123b03a366Sstefano_zampini total_counts = total_counts-(PetscInt)Bt+(min_n-j); 23133b03a366Sstefano_zampini #endif 23143b03a366Sstefano_zampini } 23153b03a366Sstefano_zampini } 2316534831adSStefano Zampini 2317da1bb401SStefano Zampini n_constraints=total_counts-n_vertices; 2318da1bb401SStefano Zampini local_primal_size = total_counts; 23193b03a366Sstefano_zampini /* set quantities in pcbddc data structure */ 23203b03a366Sstefano_zampini pcbddc->n_vertices = n_vertices; 23213b03a366Sstefano_zampini pcbddc->n_constraints = n_constraints; 2322da1bb401SStefano Zampini pcbddc->local_primal_size = local_primal_size; 2323534831adSStefano Zampini 2324534831adSStefano Zampini /* Create constraint matrix */ 2325534831adSStefano Zampini /* The constraint matrix is used to compute the l2g map of primal dofs */ 2326534831adSStefano Zampini /* so we need to set it up properly either with or without change of basis */ 2327534831adSStefano Zampini ierr = 
MatCreate(PETSC_COMM_SELF,&pcbddc->ConstraintMatrix);CHKERRQ(ierr); 2328534831adSStefano Zampini ierr = MatSetType(pcbddc->ConstraintMatrix,impMatType);CHKERRQ(ierr); 2329534831adSStefano Zampini ierr = MatSetSizes(pcbddc->ConstraintMatrix,local_primal_size,pcis->n,local_primal_size,pcis->n);CHKERRQ(ierr); 2330534831adSStefano Zampini /* compute a local numbering of constraints : vertices first then constraints */ 2331534831adSStefano Zampini ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr); 2332534831adSStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array_vector);CHKERRQ(ierr); 2333534831adSStefano Zampini ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&aux_primal_numbering);CHKERRQ(ierr); 2334534831adSStefano Zampini ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&aux_primal_permutation);CHKERRQ(ierr); 2335534831adSStefano Zampini total_counts=0; 2336534831adSStefano Zampini /* find vertices: subdomain corners plus dofs with basis changed */ 2337534831adSStefano Zampini for(i=0;i<local_primal_size;i++) { 2338534831adSStefano Zampini size_of_constraint=temp_indices[i+1]-temp_indices[i]; 2339534831adSStefano Zampini if(change_basis[i] || size_of_constraint == 1) { 2340534831adSStefano Zampini k=0; 2341534831adSStefano Zampini while(k < size_of_constraint && array_vector[temp_indices_to_constraint[temp_indices[i]+size_of_constraint-k-1]] != 0.0) { 2342534831adSStefano Zampini k=k+1; 2343534831adSStefano Zampini } 2344534831adSStefano Zampini j=temp_indices_to_constraint[temp_indices[i]+size_of_constraint-k-1]; 2345534831adSStefano Zampini array_vector[j] = 1.0; 2346534831adSStefano Zampini aux_primal_numbering[total_counts]=j; 2347534831adSStefano Zampini aux_primal_permutation[total_counts]=total_counts; 2348534831adSStefano Zampini total_counts++; 2349534831adSStefano Zampini } 2350534831adSStefano Zampini } 2351534831adSStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array_vector);CHKERRQ(ierr); 2352534831adSStefano Zampini /* permute indices in 
order to have a sorted set of vertices */ 2353534831adSStefano Zampini ierr = PetscSortIntWithPermutation(total_counts,aux_primal_numbering,aux_primal_permutation); 2354534831adSStefano Zampini /* nonzero structure */ 2355534831adSStefano Zampini ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&nnz);CHKERRQ(ierr); 2356534831adSStefano Zampini for(i=0;i<total_counts;i++) { 2357534831adSStefano Zampini nnz[i]=1; 2358534831adSStefano Zampini } 2359534831adSStefano Zampini j=total_counts; 2360534831adSStefano Zampini for(i=n_vertices;i<local_primal_size;i++) { 2361534831adSStefano Zampini if(!change_basis[i]) { 2362534831adSStefano Zampini nnz[j]=temp_indices[i+1]-temp_indices[i]; 2363534831adSStefano Zampini j++; 2364534831adSStefano Zampini } 2365534831adSStefano Zampini } 2366534831adSStefano Zampini ierr = MatSeqAIJSetPreallocation(pcbddc->ConstraintMatrix,0,nnz);CHKERRQ(ierr); 2367534831adSStefano Zampini ierr = PetscFree(nnz);CHKERRQ(ierr); 2368534831adSStefano Zampini /* set values in constraint matrix */ 2369534831adSStefano Zampini for(i=0;i<total_counts;i++) { 2370534831adSStefano Zampini j = aux_primal_permutation[i]; 2371534831adSStefano Zampini k = aux_primal_numbering[j]; 2372534831adSStefano Zampini ierr = MatSetValue(pcbddc->ConstraintMatrix,i,k,1.0,INSERT_VALUES);CHKERRQ(ierr); 2373534831adSStefano Zampini } 2374534831adSStefano Zampini for(i=n_vertices;i<local_primal_size;i++) { 2375534831adSStefano Zampini if(!change_basis[i]) { 2376534831adSStefano Zampini size_of_constraint=temp_indices[i+1]-temp_indices[i]; 2377534831adSStefano Zampini ierr = MatSetValues(pcbddc->ConstraintMatrix,1,&total_counts,size_of_constraint,&temp_indices_to_constraint[temp_indices[i]],&temp_quadrature_constraint[temp_indices[i]],INSERT_VALUES);CHKERRQ(ierr); 2378534831adSStefano Zampini total_counts++; 2379534831adSStefano Zampini } 2380534831adSStefano Zampini } 2381534831adSStefano Zampini ierr = PetscFree(aux_primal_numbering);CHKERRQ(ierr); 2382534831adSStefano 
Zampini ierr = PetscFree(aux_primal_permutation);CHKERRQ(ierr); 2383534831adSStefano Zampini /* assembling */ 2384534831adSStefano Zampini ierr = MatAssemblyBegin(pcbddc->ConstraintMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2385534831adSStefano Zampini ierr = MatAssemblyEnd(pcbddc->ConstraintMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2386534831adSStefano Zampini 2387534831adSStefano Zampini /* Create matrix for change of basis. We don't need it in case pcbddc->usechangeofbasis is FALSE */ 2388534831adSStefano Zampini if(pcbddc->usechangeofbasis) { 2389534831adSStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr); 2390534831adSStefano Zampini ierr = MatSetType(pcbddc->ChangeOfBasisMatrix,impMatType);CHKERRQ(ierr); 2391534831adSStefano Zampini ierr = MatSetSizes(pcbddc->ChangeOfBasisMatrix,pcis->n_B,pcis->n_B,pcis->n_B,pcis->n_B);CHKERRQ(ierr); 2392534831adSStefano Zampini /* work arrays */ 2393534831adSStefano Zampini /* we need to reuse these arrays, so we free them */ 2394534831adSStefano Zampini ierr = PetscFree(temp_basis);CHKERRQ(ierr); 2395534831adSStefano Zampini ierr = PetscFree(work);CHKERRQ(ierr); 2396534831adSStefano Zampini ierr = PetscMalloc(pcis->n_B*sizeof(PetscInt),&nnz);CHKERRQ(ierr); 2397534831adSStefano Zampini ierr = PetscMalloc((nnsp_addone+nnsp_size)*(nnsp_addone+nnsp_size)*sizeof(PetscScalar),&temp_basis);CHKERRQ(ierr); 2398534831adSStefano Zampini ierr = PetscMalloc((nnsp_addone+nnsp_size)*sizeof(PetscScalar),&work);CHKERRQ(ierr); 2399534831adSStefano Zampini ierr = PetscMalloc((nnsp_addone+nnsp_size)*sizeof(PetscBLASInt),&ipiv);CHKERRQ(ierr); 2400534831adSStefano Zampini for(i=0;i<pcis->n_B;i++) { 2401534831adSStefano Zampini nnz[i]=1; 2402534831adSStefano Zampini } 2403534831adSStefano Zampini /* Overestimated nonzeros per row */ 2404534831adSStefano Zampini k=1; 2405534831adSStefano Zampini for(i=pcbddc->n_vertices;i<local_primal_size;i++) { 2406534831adSStefano Zampini if(change_basis[i]) { 
2407534831adSStefano Zampini size_of_constraint = temp_indices[i+1]-temp_indices[i]; 2408534831adSStefano Zampini if(k < size_of_constraint) { 2409534831adSStefano Zampini k = size_of_constraint; 2410534831adSStefano Zampini } 2411534831adSStefano Zampini for(j=0;j<size_of_constraint;j++) { 2412534831adSStefano Zampini nnz[temp_indices_to_constraint_B[temp_indices[i]+j]] = size_of_constraint; 2413534831adSStefano Zampini } 2414534831adSStefano Zampini } 2415534831adSStefano Zampini } 2416534831adSStefano Zampini ierr = MatSeqAIJSetPreallocation(pcbddc->ChangeOfBasisMatrix,0,nnz);CHKERRQ(ierr); 2417534831adSStefano Zampini ierr = PetscFree(nnz);CHKERRQ(ierr); 2418534831adSStefano Zampini /* Temporary array to store indices */ 2419534831adSStefano Zampini ierr = PetscMalloc(k*sizeof(PetscInt),&is_indices);CHKERRQ(ierr); 2420534831adSStefano Zampini /* Set initial identity in the matrix */ 2421534831adSStefano Zampini for(i=0;i<pcis->n_B;i++) { 2422534831adSStefano Zampini ierr = MatSetValue(pcbddc->ChangeOfBasisMatrix,i,i,1.0,INSERT_VALUES);CHKERRQ(ierr); 2423534831adSStefano Zampini } 2424534831adSStefano Zampini /* Now we loop on the constraints which need a change of basis */ 2425534831adSStefano Zampini /* Change of basis matrix is evaluated as the FIRST APPROACH in */ 2426534831adSStefano Zampini /* Klawonn and Widlund, Dual-primal FETI-DP methods for linear elasticity, (6.2.1) */ 2427534831adSStefano Zampini temp_constraints = 0; 242893dc3b60SStefano Zampini if(pcbddc->n_vertices < local_primal_size) { 2429534831adSStefano Zampini temp_start_ptr = temp_indices_to_constraint_B[temp_indices[pcbddc->n_vertices]]; 243093dc3b60SStefano Zampini } 2431534831adSStefano Zampini for(i=pcbddc->n_vertices;i<local_primal_size;i++) { 2432534831adSStefano Zampini if(change_basis[i]) { 2433534831adSStefano Zampini compute_submatrix = PETSC_FALSE; 2434534831adSStefano Zampini useksp = PETSC_FALSE; 2435534831adSStefano Zampini if(temp_start_ptr == 
temp_indices_to_constraint_B[temp_indices[i]]) { 2436534831adSStefano Zampini temp_constraints++; 243704eaf177SStefano Zampini if(i == local_primal_size -1 || temp_start_ptr != temp_indices_to_constraint_B[temp_indices[i+1]]) { 2438534831adSStefano Zampini compute_submatrix = PETSC_TRUE; 2439534831adSStefano Zampini } 2440534831adSStefano Zampini } 2441534831adSStefano Zampini if(compute_submatrix) { 2442534831adSStefano Zampini if(temp_constraints > 1 || pcbddc->use_nnsp_true) { 2443534831adSStefano Zampini useksp = PETSC_TRUE; 2444534831adSStefano Zampini } 2445534831adSStefano Zampini size_of_constraint = temp_indices[i+1]-temp_indices[i]; 2446534831adSStefano Zampini if(useksp) { /* experimental */ 2447534831adSStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&temp_mat);CHKERRQ(ierr); 2448534831adSStefano Zampini ierr = MatSetType(temp_mat,impMatType);CHKERRQ(ierr); 2449534831adSStefano Zampini ierr = MatSetSizes(temp_mat,size_of_constraint,size_of_constraint,size_of_constraint,size_of_constraint);CHKERRQ(ierr); 2450534831adSStefano Zampini ierr = MatSeqAIJSetPreallocation(temp_mat,size_of_constraint,PETSC_NULL);CHKERRQ(ierr); 2451534831adSStefano Zampini } 2452534831adSStefano Zampini /* First _size_of_constraint-temp_constraints_ columns */ 2453534831adSStefano Zampini dual_dofs = size_of_constraint-temp_constraints; 2454534831adSStefano Zampini start_constraint = i+1-temp_constraints; 2455534831adSStefano Zampini for(s=0;s<dual_dofs;s++) { 2456534831adSStefano Zampini is_indices[0] = s; 2457534831adSStefano Zampini for(j=0;j<temp_constraints;j++) { 2458534831adSStefano Zampini for(k=0;k<temp_constraints;k++) { 2459534831adSStefano Zampini temp_basis[j*temp_constraints+k]=temp_quadrature_constraint[temp_indices[start_constraint+k]+s+j+1]; 2460534831adSStefano Zampini } 2461534831adSStefano Zampini work[j]=-temp_quadrature_constraint[temp_indices[start_constraint+j]+s]; 2462534831adSStefano Zampini is_indices[j+1]=s+j+1; 2463534831adSStefano Zampini } 
2464534831adSStefano Zampini Bt = temp_constraints; 2465534831adSStefano Zampini ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr); 2466534831adSStefano Zampini LAPACKgesv_(&Bt,&Bone,temp_basis,&Bt,ipiv,work,&Bt,&lierr); 2467534831adSStefano Zampini if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GESV Lapack routine %d",(int)lierr); 2468534831adSStefano Zampini ierr = PetscFPTrapPop();CHKERRQ(ierr); 2469534831adSStefano Zampini j = temp_indices_to_constraint_B[temp_indices[start_constraint]+s]; 2470534831adSStefano Zampini ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,temp_constraints,&temp_indices_to_constraint_B[temp_indices[start_constraint]+s+1],1,&j,work,INSERT_VALUES);CHKERRQ(ierr); 2471534831adSStefano Zampini if(useksp) { 2472534831adSStefano Zampini /* temp mat with transposed rows and columns */ 2473534831adSStefano Zampini ierr = MatSetValues(temp_mat,1,&s,temp_constraints,&is_indices[1],work,INSERT_VALUES);CHKERRQ(ierr); 2474534831adSStefano Zampini ierr = MatSetValue(temp_mat,is_indices[0],is_indices[0],1.0,INSERT_VALUES);CHKERRQ(ierr); 2475534831adSStefano Zampini } 2476534831adSStefano Zampini } 2477534831adSStefano Zampini if(useksp) { 2478534831adSStefano Zampini /* last rows of temp_mat */ 2479534831adSStefano Zampini for(j=0;j<size_of_constraint;j++) { 2480534831adSStefano Zampini is_indices[j] = j; 2481534831adSStefano Zampini } 2482534831adSStefano Zampini for(s=0;s<temp_constraints;s++) { 2483534831adSStefano Zampini k = s + dual_dofs; 2484534831adSStefano Zampini ierr = MatSetValues(temp_mat,1,&k,size_of_constraint,is_indices,&temp_quadrature_constraint[temp_indices[start_constraint+s]],INSERT_VALUES);CHKERRQ(ierr); 2485534831adSStefano Zampini } 2486534831adSStefano Zampini ierr = MatAssemblyBegin(temp_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2487534831adSStefano Zampini ierr = MatAssemblyEnd(temp_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2488534831adSStefano Zampini ierr = 
MatGetVecs(temp_mat,&temp_vec,PETSC_NULL);CHKERRQ(ierr); 2489534831adSStefano Zampini ierr = KSPCreate(PETSC_COMM_SELF,&temp_ksp);CHKERRQ(ierr); 2490534831adSStefano Zampini ierr = KSPSetOperators(temp_ksp,temp_mat,temp_mat,SAME_PRECONDITIONER);CHKERRQ(ierr); 2491534831adSStefano Zampini ierr = KSPSetType(temp_ksp,KSPPREONLY);CHKERRQ(ierr); 2492ffe5efe1SStefano Zampini ierr = KSPGetPC(temp_ksp,&temp_pc);CHKERRQ(ierr); 2493ffe5efe1SStefano Zampini ierr = PCSetType(temp_pc,PCLU);CHKERRQ(ierr); 2494534831adSStefano Zampini ierr = KSPSetUp(temp_ksp);CHKERRQ(ierr); 2495534831adSStefano Zampini for(s=0;s<temp_constraints;s++) { 2496534831adSStefano Zampini ierr = VecSet(temp_vec,0.0);CHKERRQ(ierr); 2497534831adSStefano Zampini ierr = VecSetValue(temp_vec,s+dual_dofs,1.0,INSERT_VALUES);CHKERRQ(ierr); 2498534831adSStefano Zampini ierr = VecAssemblyBegin(temp_vec);CHKERRQ(ierr); 2499534831adSStefano Zampini ierr = VecAssemblyEnd(temp_vec);CHKERRQ(ierr); 2500534831adSStefano Zampini ierr = KSPSolve(temp_ksp,temp_vec,temp_vec);CHKERRQ(ierr); 2501534831adSStefano Zampini ierr = VecGetArray(temp_vec,&array_vector);CHKERRQ(ierr); 2502534831adSStefano Zampini j = temp_indices_to_constraint_B[temp_indices[start_constraint+s]+size_of_constraint-s-1]; 2503534831adSStefano Zampini /* last columns of change of basis matrix associated to new primal dofs */ 2504534831adSStefano Zampini ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,size_of_constraint,&temp_indices_to_constraint_B[temp_indices[start_constraint+s]],1,&j,array_vector,INSERT_VALUES);CHKERRQ(ierr); 2505534831adSStefano Zampini ierr = VecRestoreArray(temp_vec,&array_vector);CHKERRQ(ierr); 2506534831adSStefano Zampini } 2507534831adSStefano Zampini ierr = MatDestroy(&temp_mat);CHKERRQ(ierr); 2508534831adSStefano Zampini ierr = KSPDestroy(&temp_ksp);CHKERRQ(ierr); 2509534831adSStefano Zampini ierr = VecDestroy(&temp_vec);CHKERRQ(ierr); 2510534831adSStefano Zampini } else { 2511534831adSStefano Zampini /* last columns of change 
of basis matrix associated to new primal dofs */ 2512534831adSStefano Zampini for(s=0;s<temp_constraints;s++) { 2513534831adSStefano Zampini j = temp_indices_to_constraint_B[temp_indices[start_constraint+s]+size_of_constraint-s-1]; 2514534831adSStefano Zampini ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,size_of_constraint,&temp_indices_to_constraint_B[temp_indices[start_constraint+s]],1,&j,&temp_quadrature_constraint[temp_indices[start_constraint+s]],INSERT_VALUES);CHKERRQ(ierr); 2515534831adSStefano Zampini } 2516534831adSStefano Zampini } 2517534831adSStefano Zampini /* prepare for the next cycle */ 2518534831adSStefano Zampini temp_constraints = 0; 251904eaf177SStefano Zampini if(i != local_primal_size -1 ) { 2520534831adSStefano Zampini temp_start_ptr = temp_indices_to_constraint_B[temp_indices[i+1]]; 2521534831adSStefano Zampini } 2522534831adSStefano Zampini } 2523534831adSStefano Zampini } 252404eaf177SStefano Zampini } 2525534831adSStefano Zampini /* assembling */ 2526534831adSStefano Zampini ierr = MatAssemblyBegin(pcbddc->ChangeOfBasisMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2527534831adSStefano Zampini ierr = MatAssemblyEnd(pcbddc->ChangeOfBasisMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2528534831adSStefano Zampini ierr = PetscFree(ipiv);CHKERRQ(ierr); 2529534831adSStefano Zampini ierr = PetscFree(is_indices);CHKERRQ(ierr); 2530534831adSStefano Zampini } 25313b03a366Sstefano_zampini /* free workspace no longer needed */ 25323b03a366Sstefano_zampini ierr = PetscFree(rwork);CHKERRQ(ierr); 25333b03a366Sstefano_zampini ierr = PetscFree(work);CHKERRQ(ierr); 25343b03a366Sstefano_zampini ierr = PetscFree(temp_basis);CHKERRQ(ierr); 25353b03a366Sstefano_zampini ierr = PetscFree(singular_vals);CHKERRQ(ierr); 25363b03a366Sstefano_zampini ierr = PetscFree(correlation_mat);CHKERRQ(ierr); 25373b03a366Sstefano_zampini ierr = PetscFree(temp_indices);CHKERRQ(ierr); 2538534831adSStefano Zampini ierr = PetscFree(change_basis);CHKERRQ(ierr); 25393b03a366Sstefano_zampini 
ierr = PetscFree(temp_indices_to_constraint);CHKERRQ(ierr); 2540534831adSStefano Zampini ierr = PetscFree(temp_indices_to_constraint_B);CHKERRQ(ierr); 2541534831adSStefano Zampini ierr = PetscFree(local_to_B);CHKERRQ(ierr); 25423b03a366Sstefano_zampini ierr = PetscFree(temp_quadrature_constraint);CHKERRQ(ierr); 25433425bc38SStefano Zampini #if defined(PETSC_MISSING_LAPACK_GESVD) 25443425bc38SStefano Zampini ierr = PetscFree(iwork);CHKERRQ(ierr); 25453425bc38SStefano Zampini ierr = PetscFree(ifail);CHKERRQ(ierr); 25463425bc38SStefano Zampini ierr = PetscFree(singular_vectors);CHKERRQ(ierr); 25473425bc38SStefano Zampini #endif 2548da1bb401SStefano Zampini for(k=0;k<nnsp_size;k++) { 2549da1bb401SStefano Zampini ierr = VecDestroy(&localnearnullsp[k]);CHKERRQ(ierr); 2550da1bb401SStefano Zampini } 25513b03a366Sstefano_zampini ierr = PetscFree(localnearnullsp);CHKERRQ(ierr); 25523b03a366Sstefano_zampini PetscFunctionReturn(0); 25533b03a366Sstefano_zampini } 25543b03a366Sstefano_zampini /* -------------------------------------------------------------------------- */ 25550c7d97c5SJed Brown #undef __FUNCT__ 25560c7d97c5SJed Brown #define __FUNCT__ "PCBDDCCoarseSetUp" 255753cdbc3dSStefano Zampini static PetscErrorCode PCBDDCCoarseSetUp(PC pc) 25580c7d97c5SJed Brown { 25590c7d97c5SJed Brown PetscErrorCode ierr; 25600c7d97c5SJed Brown 25610c7d97c5SJed Brown PC_IS* pcis = (PC_IS*)(pc->data); 25620c7d97c5SJed Brown PC_BDDC* pcbddc = (PC_BDDC*)pc->data; 25630c7d97c5SJed Brown Mat_IS *matis = (Mat_IS*)pc->pmat->data; 2564534831adSStefano Zampini Mat change_mat_all; 25650c7d97c5SJed Brown IS is_R_local; 25660c7d97c5SJed Brown IS is_V_local; 25670c7d97c5SJed Brown IS is_C_local; 25680c7d97c5SJed Brown IS is_aux1; 25690c7d97c5SJed Brown IS is_aux2; 25700c7d97c5SJed Brown const VecType impVecType; 25710c7d97c5SJed Brown const MatType impMatType; 25720c7d97c5SJed Brown PetscInt n_R=0; 25730c7d97c5SJed Brown PetscInt n_D=0; 25740c7d97c5SJed Brown PetscInt n_B=0; 25750c7d97c5SJed Brown 
PetscScalar zero=0.0; 25760c7d97c5SJed Brown PetscScalar one=1.0; 25770c7d97c5SJed Brown PetscScalar m_one=-1.0; 25780c7d97c5SJed Brown PetscScalar* array; 25790c7d97c5SJed Brown PetscScalar *coarse_submat_vals; 25800c7d97c5SJed Brown PetscInt *idx_R_local; 25810c7d97c5SJed Brown PetscInt *idx_V_B; 25820c7d97c5SJed Brown PetscScalar *coarsefunctions_errors; 25830c7d97c5SJed Brown PetscScalar *constraints_errors; 25840c7d97c5SJed Brown /* auxiliary indices */ 2585534831adSStefano Zampini PetscInt i,j,k; 2586e269702eSStefano Zampini /* for verbose output of bddc */ 2587e269702eSStefano Zampini PetscViewer viewer=pcbddc->dbg_viewer; 2588e269702eSStefano Zampini PetscBool dbg_flag=pcbddc->dbg_flag; 2589a0ba757dSStefano Zampini /* for counting coarse dofs */ 2590534831adSStefano Zampini PetscInt n_vertices,n_constraints; 25913b03a366Sstefano_zampini PetscInt size_of_constraint; 25923b03a366Sstefano_zampini PetscInt *row_cmat_indices; 25933b03a366Sstefano_zampini PetscScalar *row_cmat_values; 2594534831adSStefano Zampini PetscInt *vertices,*nnz,*is_indices,*temp_indices; 25950c7d97c5SJed Brown 25960c7d97c5SJed Brown PetscFunctionBegin; 25970c7d97c5SJed Brown /* Set Non-overlapping dimensions */ 25980c7d97c5SJed Brown n_B = pcis->n_B; n_D = pcis->n - n_B; 2599534831adSStefano Zampini /* Set types for local objects needed by BDDC precondtioner */ 2600534831adSStefano Zampini impMatType = MATSEQDENSE; 2601534831adSStefano Zampini impVecType = VECSEQ; 2602da1bb401SStefano Zampini /* get vertex indices from constraint matrix */ 2603534831adSStefano Zampini ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscInt),&vertices);CHKERRQ(ierr); 2604534831adSStefano Zampini n_vertices=0; 2605da1bb401SStefano Zampini for(i=0;i<pcbddc->local_primal_size;i++) { 2606da1bb401SStefano Zampini ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr); 2607da1bb401SStefano Zampini if(size_of_constraint == 1) { 
2608534831adSStefano Zampini vertices[n_vertices]=row_cmat_indices[0]; 2609534831adSStefano Zampini n_vertices++; 2610a0ba757dSStefano Zampini } 2611da1bb401SStefano Zampini ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr); 2612a0ba757dSStefano Zampini } 2613534831adSStefano Zampini /* Set number of constraints */ 2614534831adSStefano Zampini n_constraints = pcbddc->local_primal_size-n_vertices; 2615534831adSStefano Zampini 2616534831adSStefano Zampini /* vertices in boundary numbering */ 2617534831adSStefano Zampini if(n_vertices) { 2618534831adSStefano Zampini ierr = VecSet(pcis->vec1_N,m_one);CHKERRQ(ierr); 2619534831adSStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 2620534831adSStefano Zampini for (i=0; i<n_vertices; i++) { array[ vertices[i] ] = i; } 2621534831adSStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 2622534831adSStefano Zampini ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 2623534831adSStefano Zampini ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 2624534831adSStefano Zampini ierr = PetscMalloc(n_vertices*sizeof(PetscInt),&idx_V_B);CHKERRQ(ierr); 2625534831adSStefano Zampini ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr); 2626534831adSStefano Zampini for (i=0; i<n_vertices; i++) { 2627534831adSStefano Zampini j=0; 2628534831adSStefano Zampini while (array[j] != i ) {j++;} 2629534831adSStefano Zampini idx_V_B[i]=j; 2630534831adSStefano Zampini } 2631534831adSStefano Zampini ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr); 2632534831adSStefano Zampini } 2633534831adSStefano Zampini 2634534831adSStefano Zampini /* transform local matrices if needed */ 2635534831adSStefano Zampini if(pcbddc->usechangeofbasis) { 2636534831adSStefano Zampini ierr = 
PetscMalloc(pcis->n*sizeof(PetscInt),&nnz);CHKERRQ(ierr); 2637534831adSStefano Zampini ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 2638534831adSStefano Zampini for(i=0;i<n_D;i++) { 2639534831adSStefano Zampini nnz[is_indices[i]]=1; 2640534831adSStefano Zampini } 2641534831adSStefano Zampini ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 2642534831adSStefano Zampini ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 2643534831adSStefano Zampini k=1; 2644534831adSStefano Zampini for(i=0;i<n_B;i++) { 2645534831adSStefano Zampini ierr = MatGetRow(pcbddc->ChangeOfBasisMatrix,i,&j,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr); 2646534831adSStefano Zampini nnz[is_indices[i]]=j; 2647534831adSStefano Zampini if( k < j) { 2648534831adSStefano Zampini k = j; 2649534831adSStefano Zampini } 2650534831adSStefano Zampini ierr = MatRestoreRow(pcbddc->ChangeOfBasisMatrix,i,&j,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr); 2651534831adSStefano Zampini } 2652534831adSStefano Zampini ierr = ISRestoreIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 2653534831adSStefano Zampini /* assemble change of basis matrix on the whole set of local dofs */ 2654534831adSStefano Zampini ierr = PetscMalloc(k*sizeof(PetscInt),&temp_indices);CHKERRQ(ierr); 2655534831adSStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&change_mat_all);CHKERRQ(ierr); 2656534831adSStefano Zampini ierr = MatSetSizes(change_mat_all,pcis->n,pcis->n,pcis->n,pcis->n);CHKERRQ(ierr); 2657534831adSStefano Zampini ierr = MatSetType(change_mat_all,MATSEQAIJ);CHKERRQ(ierr); 2658534831adSStefano Zampini ierr = MatSeqAIJSetPreallocation(change_mat_all,0,nnz);CHKERRQ(ierr); 2659534831adSStefano Zampini ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 2660534831adSStefano Zampini for(i=0;i<n_D;i++) { 2661534831adSStefano Zampini ierr = 
MatSetValue(change_mat_all,is_indices[i],is_indices[i],1.0,INSERT_VALUES);CHKERRQ(ierr); 2662534831adSStefano Zampini } 2663534831adSStefano Zampini ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 2664534831adSStefano Zampini ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr); 2665534831adSStefano Zampini for(i=0;i<n_B;i++) { 2666534831adSStefano Zampini ierr = MatGetRow(pcbddc->ChangeOfBasisMatrix,i,&j,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr); 2667534831adSStefano Zampini for(k=0;k<j;k++) { 2668534831adSStefano Zampini temp_indices[k]=is_indices[row_cmat_indices[k]]; 2669534831adSStefano Zampini } 2670534831adSStefano Zampini ierr = MatSetValues(change_mat_all,1,&is_indices[i],j,temp_indices,row_cmat_values,INSERT_VALUES);CHKERRQ(ierr); 2671534831adSStefano Zampini ierr = MatRestoreRow(pcbddc->ChangeOfBasisMatrix,i,&j,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr); 2672534831adSStefano Zampini } 2673534831adSStefano Zampini ierr = MatAssemblyBegin(change_mat_all,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2674534831adSStefano Zampini ierr = MatAssemblyEnd(change_mat_all,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 2675534831adSStefano Zampini ierr = MatPtAP(matis->A,change_mat_all,MAT_INITIAL_MATRIX,1.0,&pcbddc->local_mat);CHKERRQ(ierr); 2676534831adSStefano Zampini ierr = MatDestroy(&pcis->A_IB);CHKERRQ(ierr); 2677534831adSStefano Zampini ierr = MatDestroy(&pcis->A_BI);CHKERRQ(ierr); 2678534831adSStefano Zampini ierr = MatDestroy(&pcis->A_BB);CHKERRQ(ierr); 2679534831adSStefano Zampini ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_I_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&pcis->A_IB);CHKERRQ(ierr); 2680534831adSStefano Zampini ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_B_local,pcis->is_I_local,MAT_INITIAL_MATRIX,&pcis->A_BI);CHKERRQ(ierr); 2681534831adSStefano Zampini ierr = 
MatGetSubMatrix(pcbddc->local_mat,pcis->is_B_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&pcis->A_BB);CHKERRQ(ierr); 2682534831adSStefano Zampini ierr = MatDestroy(&change_mat_all);CHKERRQ(ierr); 2683534831adSStefano Zampini ierr = PetscFree(nnz);CHKERRQ(ierr); 2684534831adSStefano Zampini ierr = PetscFree(temp_indices);CHKERRQ(ierr); 2685534831adSStefano Zampini } else { 2686534831adSStefano Zampini /* without change of basis, the local matrix is unchanged */ 2687534831adSStefano Zampini ierr = PetscObjectReference((PetscObject)matis->A);CHKERRQ(ierr); 2688534831adSStefano Zampini pcbddc->local_mat = matis->A; 2689534831adSStefano Zampini } 2690a0ba757dSStefano Zampini 26910c7d97c5SJed Brown /* Dohrmann's notation: dofs splitted in R (Remaining: all dofs but the vertices) and V (Vertices) */ 26920c7d97c5SJed Brown ierr = VecSet(pcis->vec1_N,one);CHKERRQ(ierr); 26930c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 26943b03a366Sstefano_zampini for (i=0;i<n_vertices;i++) { array[ vertices[i] ] = zero; } 26953b03a366Sstefano_zampini ierr = PetscMalloc(( pcis->n - n_vertices )*sizeof(PetscInt),&idx_R_local);CHKERRQ(ierr); 26960c7d97c5SJed Brown for (i=0, n_R=0; i<pcis->n; i++) { if (array[i] == one) { idx_R_local[n_R] = i; n_R++; } } 26970c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 2698e269702eSStefano Zampini if(dbg_flag) { 26990c7d97c5SJed Brown ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr); 27000c7d97c5SJed Brown ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 27010c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d local dimensions\n",PetscGlobalRank);CHKERRQ(ierr); 27020c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local_size = %d, dirichlet_size = %d, boundary_size = %d\n",pcis->n,n_D,n_B);CHKERRQ(ierr); 27033b03a366Sstefano_zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"r_size = %d, 
v_size = %d, constraints = %d, local_primal_size = %d\n",n_R,n_vertices,n_constraints,pcbddc->local_primal_size);CHKERRQ(ierr); 2704534831adSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"pcbddc->n_vertices = %d, pcbddc->n_constraints = %d\n",pcbddc->n_vertices,pcbddc->n_constraints);CHKERRQ(ierr); 27050c7d97c5SJed Brown ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 27060c7d97c5SJed Brown } 2707534831adSStefano Zampini 27080c7d97c5SJed Brown /* Allocate needed vectors */ 2709534831adSStefano Zampini ierr = VecDuplicate(pcis->vec1_global,&pcbddc->original_rhs);CHKERRQ(ierr); 27103972b0daSStefano Zampini ierr = VecDuplicate(pcis->vec1_global,&pcbddc->temp_solution);CHKERRQ(ierr); 27110c7d97c5SJed Brown ierr = VecDuplicate(pcis->vec1_D,&pcbddc->vec4_D);CHKERRQ(ierr); 27120c7d97c5SJed Brown ierr = VecCreate(PETSC_COMM_SELF,&pcbddc->vec1_R);CHKERRQ(ierr); 27130c7d97c5SJed Brown ierr = VecSetSizes(pcbddc->vec1_R,n_R,n_R);CHKERRQ(ierr); 27140c7d97c5SJed Brown ierr = VecSetType(pcbddc->vec1_R,impVecType);CHKERRQ(ierr); 2715d49ef151SStefano Zampini ierr = VecDuplicate(pcbddc->vec1_R,&pcbddc->vec2_R);CHKERRQ(ierr); 27160c7d97c5SJed Brown ierr = VecCreate(PETSC_COMM_SELF,&pcbddc->vec1_P);CHKERRQ(ierr); 27170c7d97c5SJed Brown ierr = VecSetSizes(pcbddc->vec1_P,pcbddc->local_primal_size,pcbddc->local_primal_size);CHKERRQ(ierr); 27180c7d97c5SJed Brown ierr = VecSetType(pcbddc->vec1_P,impVecType);CHKERRQ(ierr); 27190c7d97c5SJed Brown 27200c7d97c5SJed Brown /* Creating some index sets needed */ 27210c7d97c5SJed Brown /* For submatrices */ 2722da1bb401SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,n_R,idx_R_local,PETSC_OWN_POINTER,&is_R_local);CHKERRQ(ierr); 27233b03a366Sstefano_zampini if(n_vertices) { 2724da1bb401SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,n_vertices,vertices,PETSC_OWN_POINTER,&is_V_local);CHKERRQ(ierr); 27253b03a366Sstefano_zampini } 2726da1bb401SStefano Zampini if(n_constraints) { 2727da1bb401SStefano Zampini ierr = 
ISCreateStride(PETSC_COMM_SELF,n_constraints,n_vertices,1,&is_C_local);CHKERRQ(ierr); 2728da1bb401SStefano Zampini } 2729da1bb401SStefano Zampini 27300c7d97c5SJed Brown /* For VecScatters pcbddc->R_to_B and (optionally) pcbddc->R_to_D */ 27310c7d97c5SJed Brown { 27320c7d97c5SJed Brown PetscInt *aux_array1; 27330c7d97c5SJed Brown PetscInt *aux_array2; 27340c7d97c5SJed Brown 27353b03a366Sstefano_zampini ierr = PetscMalloc( (pcis->n_B-n_vertices)*sizeof(PetscInt),&aux_array1);CHKERRQ(ierr); 27363b03a366Sstefano_zampini ierr = PetscMalloc( (pcis->n_B-n_vertices)*sizeof(PetscInt),&aux_array2);CHKERRQ(ierr); 27370c7d97c5SJed Brown 2738d49ef151SStefano Zampini ierr = VecSet(pcis->vec1_global,zero);CHKERRQ(ierr); 27390c7d97c5SJed Brown ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 27400c7d97c5SJed Brown ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 27410c7d97c5SJed Brown ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 27420c7d97c5SJed Brown ierr = VecScatterEnd (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 27430c7d97c5SJed Brown ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 27440c7d97c5SJed Brown ierr = VecScatterEnd (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 27450c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 2746da1bb401SStefano Zampini for (i=0, j=0; i<n_R; i++) { if (array[idx_R_local[i]] > one) { aux_array1[j] = i; j++; } } 27470c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 2748da1bb401SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_COPY_VALUES,&is_aux1);CHKERRQ(ierr); 27490c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr); 
2750da1bb401SStefano Zampini for (i=0, j=0; i<n_B; i++) { if (array[i] > one) { aux_array2[j] = i; j++; } } 27513828260eSStefano Zampini ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr); 2752da1bb401SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array2,PETSC_COPY_VALUES,&is_aux2);CHKERRQ(ierr); 27530c7d97c5SJed Brown ierr = VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_B,is_aux2,&pcbddc->R_to_B);CHKERRQ(ierr); 27540c7d97c5SJed Brown ierr = PetscFree(aux_array1);CHKERRQ(ierr); 27550c7d97c5SJed Brown ierr = PetscFree(aux_array2);CHKERRQ(ierr); 27560c7d97c5SJed Brown ierr = ISDestroy(&is_aux1);CHKERRQ(ierr); 27570c7d97c5SJed Brown ierr = ISDestroy(&is_aux2);CHKERRQ(ierr); 27580c7d97c5SJed Brown 2759e269702eSStefano Zampini if(pcbddc->prec_type || dbg_flag ) { 27600c7d97c5SJed Brown ierr = PetscMalloc(n_D*sizeof(PetscInt),&aux_array1);CHKERRQ(ierr); 27610c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 2762da1bb401SStefano Zampini for (i=0, j=0; i<n_R; i++) { if (array[idx_R_local[i]] == one) { aux_array1[j] = i; j++; } } 27630c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 2764da1bb401SStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_COPY_VALUES,&is_aux1);CHKERRQ(ierr); 27650c7d97c5SJed Brown ierr = VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_D,(IS)0,&pcbddc->R_to_D);CHKERRQ(ierr); 27660c7d97c5SJed Brown ierr = PetscFree(aux_array1);CHKERRQ(ierr); 27670c7d97c5SJed Brown ierr = ISDestroy(&is_aux1);CHKERRQ(ierr); 27680c7d97c5SJed Brown } 27690c7d97c5SJed Brown } 27700c7d97c5SJed Brown 27710c7d97c5SJed Brown /* Creating PC contexts for local Dirichlet and Neumann problems */ 27720c7d97c5SJed Brown { 27730c7d97c5SJed Brown Mat A_RR; 277453cdbc3dSStefano Zampini PC pc_temp; 27750c7d97c5SJed Brown /* Matrix for Dirichlet problem is A_II -> we already have it from pcis.c code */ 277653cdbc3dSStefano Zampini ierr = 
KSPCreate(PETSC_COMM_SELF,&pcbddc->ksp_D);CHKERRQ(ierr); 277753cdbc3dSStefano Zampini ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->ksp_D,(PetscObject)pc,1);CHKERRQ(ierr); 277853cdbc3dSStefano Zampini ierr = KSPSetOperators(pcbddc->ksp_D,pcis->A_II,pcis->A_II,SAME_PRECONDITIONER);CHKERRQ(ierr); 277953cdbc3dSStefano Zampini ierr = KSPSetType(pcbddc->ksp_D,KSPPREONLY);CHKERRQ(ierr); 2780da1bb401SStefano Zampini ierr = KSPSetOptionsPrefix(pcbddc->ksp_D,"dirichlet_");CHKERRQ(ierr); 27810c7d97c5SJed Brown /* default */ 278253cdbc3dSStefano Zampini ierr = KSPGetPC(pcbddc->ksp_D,&pc_temp);CHKERRQ(ierr); 278353cdbc3dSStefano Zampini ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr); 27840c7d97c5SJed Brown /* Allow user's customization */ 278553cdbc3dSStefano Zampini ierr = KSPSetFromOptions(pcbddc->ksp_D);CHKERRQ(ierr); 278653cdbc3dSStefano Zampini /* Set Up KSP for Dirichlet problem of BDDC */ 278753cdbc3dSStefano Zampini ierr = KSPSetUp(pcbddc->ksp_D);CHKERRQ(ierr); 27883972b0daSStefano Zampini /* set ksp_D into pcis data */ 27893972b0daSStefano Zampini ierr = KSPDestroy(&pcis->ksp_D);CHKERRQ(ierr); 27903972b0daSStefano Zampini ierr = PetscObjectReference((PetscObject)pcbddc->ksp_D);CHKERRQ(ierr); 27913972b0daSStefano Zampini pcis->ksp_D = pcbddc->ksp_D; 27920c7d97c5SJed Brown /* Matrix for Neumann problem is A_RR -> we need to create it */ 2793534831adSStefano Zampini ierr = MatGetSubMatrix(pcbddc->local_mat,is_R_local,is_R_local,MAT_INITIAL_MATRIX,&A_RR);CHKERRQ(ierr); 279453cdbc3dSStefano Zampini ierr = KSPCreate(PETSC_COMM_SELF,&pcbddc->ksp_R);CHKERRQ(ierr); 279553cdbc3dSStefano Zampini ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->ksp_R,(PetscObject)pc,1);CHKERRQ(ierr); 279653cdbc3dSStefano Zampini ierr = KSPSetOperators(pcbddc->ksp_R,A_RR,A_RR,SAME_PRECONDITIONER);CHKERRQ(ierr); 279753cdbc3dSStefano Zampini ierr = KSPSetType(pcbddc->ksp_R,KSPPREONLY);CHKERRQ(ierr); 2798da1bb401SStefano Zampini ierr = 
KSPSetOptionsPrefix(pcbddc->ksp_R,"neumann_");CHKERRQ(ierr); 27990c7d97c5SJed Brown /* default */ 280053cdbc3dSStefano Zampini ierr = KSPGetPC(pcbddc->ksp_R,&pc_temp);CHKERRQ(ierr); 280153cdbc3dSStefano Zampini ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr); 28020c7d97c5SJed Brown /* Allow user's customization */ 280353cdbc3dSStefano Zampini ierr = KSPSetFromOptions(pcbddc->ksp_R);CHKERRQ(ierr); 280453cdbc3dSStefano Zampini /* Set Up KSP for Neumann problem of BDDC */ 280553cdbc3dSStefano Zampini ierr = KSPSetUp(pcbddc->ksp_R);CHKERRQ(ierr); 2806a0ba757dSStefano Zampini /* check Dirichlet and Neumann solvers */ 2807b76ba322SStefano Zampini { 28080c7d97c5SJed Brown Vec temp_vec; 2809b76ba322SStefano Zampini PetscReal value; 2810b76ba322SStefano Zampini PetscMPIInt use_exact,use_exact_reduced; 28110c7d97c5SJed Brown 2812a0ba757dSStefano Zampini ierr = VecDuplicate(pcis->vec1_D,&temp_vec);CHKERRQ(ierr); 2813a0ba757dSStefano Zampini ierr = VecSetRandom(pcis->vec1_D,PETSC_NULL);CHKERRQ(ierr); 2814a0ba757dSStefano Zampini ierr = MatMult(pcis->A_II,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr); 2815a0ba757dSStefano Zampini ierr = KSPSolve(pcbddc->ksp_D,pcis->vec2_D,temp_vec);CHKERRQ(ierr); 2816a0ba757dSStefano Zampini ierr = VecAXPY(temp_vec,m_one,pcis->vec1_D);CHKERRQ(ierr); 2817a0ba757dSStefano Zampini ierr = VecNorm(temp_vec,NORM_INFINITY,&value);CHKERRQ(ierr); 2818b76ba322SStefano Zampini use_exact = 1; 2819b76ba322SStefano Zampini if(PetscAbsReal(value) > 1.e-4) { 2820b76ba322SStefano Zampini use_exact = 0; 2821b76ba322SStefano Zampini } 2822b76ba322SStefano Zampini ierr = MPI_Allreduce(&use_exact,&use_exact_reduced,1,MPIU_INT,MPI_LAND,((PetscObject)pc)->comm);CHKERRQ(ierr); 2823b76ba322SStefano Zampini pcbddc->use_exact_dirichlet = (PetscBool) use_exact_reduced; 2824a0ba757dSStefano Zampini ierr = VecDestroy(&temp_vec);CHKERRQ(ierr); 2825b76ba322SStefano Zampini if(dbg_flag) { 2826a0ba757dSStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 2827a0ba757dSStefano 
Zampini ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr); 2828a0ba757dSStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Checking solution of Dirichlet and Neumann problems\n");CHKERRQ(ierr); 2829a0ba757dSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d infinity error for Dirichlet solve = % 1.14e \n",PetscGlobalRank,value);CHKERRQ(ierr); 2830d49ef151SStefano Zampini ierr = VecDuplicate(pcbddc->vec1_R,&temp_vec);CHKERRQ(ierr); 2831d49ef151SStefano Zampini ierr = VecSetRandom(pcbddc->vec1_R,PETSC_NULL);CHKERRQ(ierr); 2832d49ef151SStefano Zampini ierr = MatMult(A_RR,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr); 2833d49ef151SStefano Zampini ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec2_R,temp_vec);CHKERRQ(ierr); 2834d49ef151SStefano Zampini ierr = VecAXPY(temp_vec,m_one,pcbddc->vec1_R);CHKERRQ(ierr); 2835d49ef151SStefano Zampini ierr = VecNorm(temp_vec,NORM_INFINITY,&value);CHKERRQ(ierr); 2836e269702eSStefano Zampini ierr = VecDestroy(&temp_vec);CHKERRQ(ierr); 28370c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d infinity error for Neumann solve = % 1.14e \n",PetscGlobalRank,value);CHKERRQ(ierr); 2838d49ef151SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 28390c7d97c5SJed Brown } 2840b76ba322SStefano Zampini } 28410c7d97c5SJed Brown /* free Neumann problem's matrix */ 28420c7d97c5SJed Brown ierr = MatDestroy(&A_RR);CHKERRQ(ierr); 28430c7d97c5SJed Brown } 28440c7d97c5SJed Brown 28450c7d97c5SJed Brown /* Assemble all remaining stuff needed to apply BDDC */ 28460c7d97c5SJed Brown { 28470c7d97c5SJed Brown Mat A_RV,A_VR,A_VV; 28480c7d97c5SJed Brown Mat M1,M2; 28490c7d97c5SJed Brown Mat C_CR; 28503b03a366Sstefano_zampini Mat AUXMAT; 28510c7d97c5SJed Brown Vec vec1_C; 28520c7d97c5SJed Brown Vec vec2_C; 28530c7d97c5SJed Brown Vec vec1_V; 28540c7d97c5SJed Brown Vec vec2_V; 28550c7d97c5SJed Brown PetscInt *nnz; 28560c7d97c5SJed Brown 
PetscInt *auxindices; 285753cdbc3dSStefano Zampini PetscInt index; 28580c7d97c5SJed Brown PetscScalar* array2; 28590c7d97c5SJed Brown MatFactorInfo matinfo; 28600c7d97c5SJed Brown 28610c7d97c5SJed Brown /* Allocating some extra storage just to be safe */ 28620c7d97c5SJed Brown ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&nnz);CHKERRQ(ierr); 28630c7d97c5SJed Brown ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&auxindices);CHKERRQ(ierr); 28640c7d97c5SJed Brown for(i=0;i<pcis->n;i++) {auxindices[i]=i;} 28650c7d97c5SJed Brown 28660c7d97c5SJed Brown /* some work vectors on vertices and/or constraints */ 28673b03a366Sstefano_zampini if(n_vertices) { 28680c7d97c5SJed Brown ierr = VecCreate(PETSC_COMM_SELF,&vec1_V);CHKERRQ(ierr); 28693b03a366Sstefano_zampini ierr = VecSetSizes(vec1_V,n_vertices,n_vertices);CHKERRQ(ierr); 28700c7d97c5SJed Brown ierr = VecSetType(vec1_V,impVecType);CHKERRQ(ierr); 28710c7d97c5SJed Brown ierr = VecDuplicate(vec1_V,&vec2_V);CHKERRQ(ierr); 28720c7d97c5SJed Brown } 2873534831adSStefano Zampini if(n_constraints) { 28740c7d97c5SJed Brown ierr = VecCreate(PETSC_COMM_SELF,&vec1_C);CHKERRQ(ierr); 2875534831adSStefano Zampini ierr = VecSetSizes(vec1_C,n_constraints,n_constraints);CHKERRQ(ierr); 28760c7d97c5SJed Brown ierr = VecSetType(vec1_C,impVecType);CHKERRQ(ierr); 28770c7d97c5SJed Brown ierr = VecDuplicate(vec1_C,&vec2_C);CHKERRQ(ierr); 28780c7d97c5SJed Brown ierr = VecDuplicate(vec1_C,&pcbddc->vec1_C);CHKERRQ(ierr); 28790c7d97c5SJed Brown } 28800c7d97c5SJed Brown /* Precompute stuffs needed for preprocessing and application of BDDC*/ 28813b03a366Sstefano_zampini if(n_constraints) { 28820c7d97c5SJed Brown ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->local_auxmat2);CHKERRQ(ierr); 28833b03a366Sstefano_zampini ierr = MatSetSizes(pcbddc->local_auxmat2,n_R,n_constraints,n_R,n_constraints);CHKERRQ(ierr); 28840c7d97c5SJed Brown ierr = MatSetType(pcbddc->local_auxmat2,impMatType);CHKERRQ(ierr); 28853b03a366Sstefano_zampini ierr = 
MatSeqDenseSetPreallocation(pcbddc->local_auxmat2,PETSC_NULL);CHKERRQ(ierr); 28860c7d97c5SJed Brown 288757a90decSStefano Zampini /* Create Constraint matrix on R nodes: C_{CR} */ 288857a90decSStefano Zampini ierr = MatGetSubMatrix(pcbddc->ConstraintMatrix,is_C_local,is_R_local,MAT_INITIAL_MATRIX,&C_CR);CHKERRQ(ierr); 288957a90decSStefano Zampini ierr = ISDestroy(&is_C_local);CHKERRQ(ierr); 289057a90decSStefano Zampini 28910c7d97c5SJed Brown /* Assemble local_auxmat2 = - A_{RR}^{-1} C^T_{CR} needed by BDDC application */ 28923b03a366Sstefano_zampini for(i=0;i<n_constraints;i++) { 28933b03a366Sstefano_zampini ierr = VecSet(pcbddc->vec1_R,zero);CHKERRQ(ierr); 28943b03a366Sstefano_zampini /* Get row of constraint matrix in R numbering */ 289557a90decSStefano Zampini ierr = VecGetArray(pcbddc->vec1_R,&array);CHKERRQ(ierr); 289657a90decSStefano Zampini ierr = MatGetRow(C_CR,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr); 28973b03a366Sstefano_zampini for(j=0;j<size_of_constraint;j++) { array[ row_cmat_indices[j] ] = - row_cmat_values[j]; } 289857a90decSStefano Zampini ierr = MatRestoreRow(C_CR,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr); 289957a90decSStefano Zampini ierr = VecRestoreArray(pcbddc->vec1_R,&array);CHKERRQ(ierr); 29003b03a366Sstefano_zampini /* Solve for row of constraint matrix in R numbering */ 290153cdbc3dSStefano Zampini ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr); 29023b03a366Sstefano_zampini /* Set values */ 29030c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec2_R,&array);CHKERRQ(ierr); 29043b03a366Sstefano_zampini ierr = MatSetValues(pcbddc->local_auxmat2,n_R,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr); 29050c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec2_R,&array);CHKERRQ(ierr); 29060c7d97c5SJed Brown } 29070c7d97c5SJed Brown ierr = 
MatAssemblyBegin(pcbddc->local_auxmat2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 29080c7d97c5SJed Brown ierr = MatAssemblyEnd(pcbddc->local_auxmat2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 29090c7d97c5SJed Brown 29100c7d97c5SJed Brown /* Assemble AUXMAT = ( LUFactor )( -C_{CR} A_{RR}^{-1} C^T_{CR} )^{-1} */ 29110c7d97c5SJed Brown ierr = MatMatMult(C_CR,pcbddc->local_auxmat2,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&AUXMAT);CHKERRQ(ierr); 2912d49ef151SStefano Zampini ierr = MatFactorInfoInitialize(&matinfo);CHKERRQ(ierr); 29133b03a366Sstefano_zampini ierr = ISCreateStride(PETSC_COMM_SELF,n_constraints,0,1,&is_aux1);CHKERRQ(ierr); 29140c7d97c5SJed Brown ierr = MatLUFactor(AUXMAT,is_aux1,is_aux1,&matinfo);CHKERRQ(ierr); 29150c7d97c5SJed Brown ierr = ISDestroy(&is_aux1);CHKERRQ(ierr); 29160c7d97c5SJed Brown 29173b03a366Sstefano_zampini /* Assemble explicitly M1 = ( C_{CR} A_{RR}^{-1} C^T_{CR} )^{-1} needed in preproc */ 2918d49ef151SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&M1);CHKERRQ(ierr); 29193b03a366Sstefano_zampini ierr = MatSetSizes(M1,n_constraints,n_constraints,n_constraints,n_constraints);CHKERRQ(ierr); 29200c7d97c5SJed Brown ierr = MatSetType(M1,impMatType);CHKERRQ(ierr); 29213b03a366Sstefano_zampini ierr = MatSeqDenseSetPreallocation(M1,PETSC_NULL);CHKERRQ(ierr); 29223b03a366Sstefano_zampini for(i=0;i<n_constraints;i++) { 29230c7d97c5SJed Brown ierr = VecSet(vec1_C,zero);CHKERRQ(ierr); 29240c7d97c5SJed Brown ierr = VecSetValue(vec1_C,i,one,INSERT_VALUES);CHKERRQ(ierr); 29250c7d97c5SJed Brown ierr = VecAssemblyBegin(vec1_C);CHKERRQ(ierr); 29260c7d97c5SJed Brown ierr = VecAssemblyEnd(vec1_C);CHKERRQ(ierr); 29270c7d97c5SJed Brown ierr = MatSolve(AUXMAT,vec1_C,vec2_C);CHKERRQ(ierr); 29280c7d97c5SJed Brown ierr = VecScale(vec2_C,m_one);CHKERRQ(ierr); 29290c7d97c5SJed Brown ierr = VecGetArray(vec2_C,&array);CHKERRQ(ierr); 29303b03a366Sstefano_zampini ierr = MatSetValues(M1,n_constraints,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr); 29310c7d97c5SJed Brown ierr = 
VecRestoreArray(vec2_C,&array);CHKERRQ(ierr); 29320c7d97c5SJed Brown } 29330c7d97c5SJed Brown ierr = MatAssemblyBegin(M1,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 29340c7d97c5SJed Brown ierr = MatAssemblyEnd(M1,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 29350c7d97c5SJed Brown ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr); 29360c7d97c5SJed Brown /* Assemble local_auxmat1 = M1*C_{CR} needed by BDDC application in KSP and in preproc */ 29370c7d97c5SJed Brown ierr = MatMatMult(M1,C_CR,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&pcbddc->local_auxmat1);CHKERRQ(ierr); 29380c7d97c5SJed Brown 29390c7d97c5SJed Brown } 29400c7d97c5SJed Brown 29410c7d97c5SJed Brown /* Get submatrices from subdomain matrix */ 29423b03a366Sstefano_zampini if(n_vertices){ 2943534831adSStefano Zampini ierr = MatGetSubMatrix(pcbddc->local_mat,is_R_local,is_V_local,MAT_INITIAL_MATRIX,&A_RV);CHKERRQ(ierr); 2944534831adSStefano Zampini ierr = MatGetSubMatrix(pcbddc->local_mat,is_V_local,is_R_local,MAT_INITIAL_MATRIX,&A_VR);CHKERRQ(ierr); 2945534831adSStefano Zampini ierr = MatGetSubMatrix(pcbddc->local_mat,is_V_local,is_V_local,MAT_INITIAL_MATRIX,&A_VV);CHKERRQ(ierr); 29460c7d97c5SJed Brown /* Assemble M2 = A_RR^{-1}A_RV */ 2947d49ef151SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&M2);CHKERRQ(ierr); 29483b03a366Sstefano_zampini ierr = MatSetSizes(M2,n_R,n_vertices,n_R,n_vertices);CHKERRQ(ierr); 29490c7d97c5SJed Brown ierr = MatSetType(M2,impMatType);CHKERRQ(ierr); 29503b03a366Sstefano_zampini ierr = MatSeqDenseSetPreallocation(M2,PETSC_NULL);CHKERRQ(ierr); 29513b03a366Sstefano_zampini for(i=0;i<n_vertices;i++) { 29520c7d97c5SJed Brown ierr = VecSet(vec1_V,zero);CHKERRQ(ierr); 29530c7d97c5SJed Brown ierr = VecSetValue(vec1_V,i,one,INSERT_VALUES);CHKERRQ(ierr); 29540c7d97c5SJed Brown ierr = VecAssemblyBegin(vec1_V);CHKERRQ(ierr); 29550c7d97c5SJed Brown ierr = VecAssemblyEnd(vec1_V);CHKERRQ(ierr); 29560c7d97c5SJed Brown ierr = MatMult(A_RV,vec1_V,pcbddc->vec1_R);CHKERRQ(ierr); 295753cdbc3dSStefano Zampini ierr = 
KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr); 29580c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec2_R,&array);CHKERRQ(ierr); 29593b03a366Sstefano_zampini ierr = MatSetValues(M2,n_R,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr); 29600c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec2_R,&array);CHKERRQ(ierr); 29610c7d97c5SJed Brown } 29620c7d97c5SJed Brown ierr = MatAssemblyBegin(M2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 29630c7d97c5SJed Brown ierr = MatAssemblyEnd(M2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 29640c7d97c5SJed Brown } 29650c7d97c5SJed Brown 29660c7d97c5SJed Brown /* Matrix of coarse basis functions (local) */ 2967d49ef151SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->coarse_phi_B);CHKERRQ(ierr); 29680c7d97c5SJed Brown ierr = MatSetSizes(pcbddc->coarse_phi_B,n_B,pcbddc->local_primal_size,n_B,pcbddc->local_primal_size);CHKERRQ(ierr); 29690c7d97c5SJed Brown ierr = MatSetType(pcbddc->coarse_phi_B,impMatType);CHKERRQ(ierr); 29703b03a366Sstefano_zampini ierr = MatSeqDenseSetPreallocation(pcbddc->coarse_phi_B,PETSC_NULL);CHKERRQ(ierr); 2971e269702eSStefano Zampini if(pcbddc->prec_type || dbg_flag ) { 2972d49ef151SStefano Zampini ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->coarse_phi_D);CHKERRQ(ierr); 29730c7d97c5SJed Brown ierr = MatSetSizes(pcbddc->coarse_phi_D,n_D,pcbddc->local_primal_size,n_D,pcbddc->local_primal_size);CHKERRQ(ierr); 29740c7d97c5SJed Brown ierr = MatSetType(pcbddc->coarse_phi_D,impMatType);CHKERRQ(ierr); 29753b03a366Sstefano_zampini ierr = MatSeqDenseSetPreallocation(pcbddc->coarse_phi_D,PETSC_NULL);CHKERRQ(ierr); 29760c7d97c5SJed Brown } 29770c7d97c5SJed Brown 2978e269702eSStefano Zampini if(dbg_flag) { 29790c7d97c5SJed Brown ierr = PetscMalloc( pcbddc->local_primal_size*sizeof(PetscScalar),&coarsefunctions_errors);CHKERRQ(ierr); 29800c7d97c5SJed Brown ierr = PetscMalloc( pcbddc->local_primal_size*sizeof(PetscScalar),&constraints_errors);CHKERRQ(ierr); 29810c7d97c5SJed Brown } 29823b03a366Sstefano_zampini 
/* Subdomain contribution (Non-overlapping) to coarse matrix */ 29830c7d97c5SJed Brown ierr = PetscMalloc ((pcbddc->local_primal_size)*(pcbddc->local_primal_size)*sizeof(PetscScalar),&coarse_submat_vals);CHKERRQ(ierr); 29840c7d97c5SJed Brown 29850c7d97c5SJed Brown /* We are now ready to evaluate coarse basis functions and subdomain contribution to coarse problem */ 29863b03a366Sstefano_zampini for(i=0;i<n_vertices;i++){ 29870c7d97c5SJed Brown ierr = VecSet(vec1_V,zero);CHKERRQ(ierr); 29880c7d97c5SJed Brown ierr = VecSetValue(vec1_V,i,one,INSERT_VALUES);CHKERRQ(ierr); 29890c7d97c5SJed Brown ierr = VecAssemblyBegin(vec1_V);CHKERRQ(ierr); 29900c7d97c5SJed Brown ierr = VecAssemblyEnd(vec1_V);CHKERRQ(ierr); 29910c7d97c5SJed Brown /* solution of saddle point problem */ 29920c7d97c5SJed Brown ierr = MatMult(M2,vec1_V,pcbddc->vec1_R);CHKERRQ(ierr); 29930c7d97c5SJed Brown ierr = VecScale(pcbddc->vec1_R,m_one);CHKERRQ(ierr); 29943b03a366Sstefano_zampini if(n_constraints) { 29950c7d97c5SJed Brown ierr = MatMult(pcbddc->local_auxmat1,pcbddc->vec1_R,vec1_C);CHKERRQ(ierr); 29960c7d97c5SJed Brown ierr = MatMultAdd(pcbddc->local_auxmat2,vec1_C,pcbddc->vec1_R,pcbddc->vec1_R);CHKERRQ(ierr); 29970c7d97c5SJed Brown ierr = VecScale(vec1_C,m_one);CHKERRQ(ierr); 29980c7d97c5SJed Brown } 29990c7d97c5SJed Brown ierr = MatMult(A_VR,pcbddc->vec1_R,vec2_V);CHKERRQ(ierr); 30000c7d97c5SJed Brown ierr = MatMultAdd(A_VV,vec1_V,vec2_V,vec2_V);CHKERRQ(ierr); 30010c7d97c5SJed Brown 30020c7d97c5SJed Brown /* Set values in coarse basis function and subdomain part of coarse_mat */ 30030c7d97c5SJed Brown /* coarse basis functions */ 30040c7d97c5SJed Brown ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr); 30050c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 30060c7d97c5SJed Brown ierr = VecScatterEnd (pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 30070c7d97c5SJed Brown ierr = 
VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr); 30083b03a366Sstefano_zampini ierr = MatSetValues(pcbddc->coarse_phi_B,n_B,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr); 30090c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr); 30100c7d97c5SJed Brown ierr = MatSetValue(pcbddc->coarse_phi_B,idx_V_B[i],i,one,INSERT_VALUES);CHKERRQ(ierr); 3011e269702eSStefano Zampini if( pcbddc->prec_type || dbg_flag ) { 30120c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 30130c7d97c5SJed Brown ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 30140c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_D,&array);CHKERRQ(ierr); 30153b03a366Sstefano_zampini ierr = MatSetValues(pcbddc->coarse_phi_D,n_D,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr); 30160c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_D,&array);CHKERRQ(ierr); 30170c7d97c5SJed Brown } 30180c7d97c5SJed Brown /* subdomain contribution to coarse matrix */ 30190c7d97c5SJed Brown ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr); 3020da1bb401SStefano Zampini for(j=0;j<n_vertices;j++) { coarse_submat_vals[i*pcbddc->local_primal_size+j] = array[j]; } /* WARNING -> column major ordering */ 30210c7d97c5SJed Brown ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr); 30223b03a366Sstefano_zampini if(n_constraints) { 30230c7d97c5SJed Brown ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr); 3024da1bb401SStefano Zampini for(j=0;j<n_constraints;j++) { coarse_submat_vals[i*pcbddc->local_primal_size+j+n_vertices] = array[j]; } /* WARNING -> column major ordering */ 30250c7d97c5SJed Brown ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr); 30260c7d97c5SJed Brown } 30270c7d97c5SJed Brown 3028e269702eSStefano Zampini if( dbg_flag ) { 30290c7d97c5SJed Brown /* assemble subdomain vector on nodes */ 3030d49ef151SStefano Zampini ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr); 
30310c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 30320c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr); 30330c7d97c5SJed Brown for(j=0;j<n_R;j++) { array[idx_R_local[j]] = array2[j]; } 30343b03a366Sstefano_zampini array[ vertices[i] ] = one; 30350c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr); 30360c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 30370c7d97c5SJed Brown /* assemble subdomain vector of lagrange multipliers (i.e. primal nodes) */ 3038d49ef151SStefano Zampini ierr = VecSet(pcbddc->vec1_P,zero);CHKERRQ(ierr); 30390c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr); 30400c7d97c5SJed Brown ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr); 30413b03a366Sstefano_zampini for(j=0;j<n_vertices;j++) { array2[j]=array[j]; } 30420c7d97c5SJed Brown ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr); 30433b03a366Sstefano_zampini if(n_constraints) { 30440c7d97c5SJed Brown ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr); 30453b03a366Sstefano_zampini for(j=0;j<n_constraints;j++) { array2[j+n_vertices]=array[j]; } 30460c7d97c5SJed Brown ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr); 30470c7d97c5SJed Brown } 30480c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr); 30490c7d97c5SJed Brown ierr = VecScale(pcbddc->vec1_P,m_one);CHKERRQ(ierr); 30500c7d97c5SJed Brown /* check saddle point solution */ 3051534831adSStefano Zampini ierr = MatMult(pcbddc->local_mat,pcis->vec1_N,pcis->vec2_N);CHKERRQ(ierr); 30523b03a366Sstefano_zampini ierr = MatMultTransposeAdd(pcbddc->ConstraintMatrix,pcbddc->vec1_P,pcis->vec2_N,pcis->vec2_N);CHKERRQ(ierr); 30533b03a366Sstefano_zampini ierr = VecNorm(pcis->vec2_N,NORM_INFINITY,&coarsefunctions_errors[i]);CHKERRQ(ierr); 30543b03a366Sstefano_zampini ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr); 30550c7d97c5SJed Brown ierr = 
VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 30563b03a366Sstefano_zampini array[i]=array[i]+m_one; /* shift by the identity matrix */ 30570c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 30583b03a366Sstefano_zampini ierr = VecNorm(pcbddc->vec1_P,NORM_INFINITY,&constraints_errors[i]);CHKERRQ(ierr); 30590c7d97c5SJed Brown } 30600c7d97c5SJed Brown } 30610c7d97c5SJed Brown 30623b03a366Sstefano_zampini for(i=0;i<n_constraints;i++){ 3063d49ef151SStefano Zampini ierr = VecSet(vec2_C,zero);CHKERRQ(ierr); 30640c7d97c5SJed Brown ierr = VecSetValue(vec2_C,i,m_one,INSERT_VALUES);CHKERRQ(ierr); 30650c7d97c5SJed Brown ierr = VecAssemblyBegin(vec2_C);CHKERRQ(ierr); 30660c7d97c5SJed Brown ierr = VecAssemblyEnd(vec2_C);CHKERRQ(ierr); 30670c7d97c5SJed Brown /* solution of saddle point problem */ 30680c7d97c5SJed Brown ierr = MatMult(M1,vec2_C,vec1_C);CHKERRQ(ierr); 30690c7d97c5SJed Brown ierr = MatMult(pcbddc->local_auxmat2,vec1_C,pcbddc->vec1_R);CHKERRQ(ierr); 30700c7d97c5SJed Brown ierr = VecScale(vec1_C,m_one);CHKERRQ(ierr); 30713b03a366Sstefano_zampini if(n_vertices) { ierr = MatMult(A_VR,pcbddc->vec1_R,vec2_V);CHKERRQ(ierr); } 30720c7d97c5SJed Brown /* Set values in coarse basis function and subdomain part of coarse_mat */ 30730c7d97c5SJed Brown /* coarse basis functions */ 30743b03a366Sstefano_zampini index=i+n_vertices; 30750c7d97c5SJed Brown ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr); 30760c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 30770c7d97c5SJed Brown ierr = VecScatterEnd (pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 30780c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr); 307953cdbc3dSStefano Zampini ierr = MatSetValues(pcbddc->coarse_phi_B,n_B,auxindices,1,&index,array,INSERT_VALUES);CHKERRQ(ierr); 30800c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr); 
3081e269702eSStefano Zampini if( pcbddc->prec_type || dbg_flag ) { 30820c7d97c5SJed Brown ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 30830c7d97c5SJed Brown ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 30840c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_D,&array);CHKERRQ(ierr); 308553cdbc3dSStefano Zampini ierr = MatSetValues(pcbddc->coarse_phi_D,n_D,auxindices,1,&index,array,INSERT_VALUES);CHKERRQ(ierr); 30860c7d97c5SJed Brown ierr = VecRestoreArray(pcis->vec1_D,&array);CHKERRQ(ierr); 30870c7d97c5SJed Brown } 30880c7d97c5SJed Brown /* subdomain contribution to coarse matrix */ 30893b03a366Sstefano_zampini if(n_vertices) { 30900c7d97c5SJed Brown ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr); 3091da1bb401SStefano Zampini for(j=0;j<n_vertices;j++) {coarse_submat_vals[index*pcbddc->local_primal_size+j]=array[j];} /* WARNING -> column major ordering */ 30920c7d97c5SJed Brown ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr); 30930c7d97c5SJed Brown } 30940c7d97c5SJed Brown ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr); 3095da1bb401SStefano Zampini for(j=0;j<n_constraints;j++) {coarse_submat_vals[index*pcbddc->local_primal_size+j+n_vertices]=array[j];} /* WARNING -> column major ordering */ 30960c7d97c5SJed Brown ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr); 30970c7d97c5SJed Brown 3098e269702eSStefano Zampini if( dbg_flag ) { 30990c7d97c5SJed Brown /* assemble subdomain vector on nodes */ 310053cdbc3dSStefano Zampini ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr); 31010c7d97c5SJed Brown ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 31020c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr); 31030c7d97c5SJed Brown for(j=0;j<n_R;j++){ array[ idx_R_local[j] ] = array2[j]; } 31040c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr); 31050c7d97c5SJed Brown ierr = 
VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 31060c7d97c5SJed Brown /* assemble subdomain vector of lagrange multipliers */ 310753cdbc3dSStefano Zampini ierr = VecSet(pcbddc->vec1_P,zero);CHKERRQ(ierr); 31080c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr); 31093b03a366Sstefano_zampini if( n_vertices) { 31100c7d97c5SJed Brown ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr); 31113b03a366Sstefano_zampini for(j=0;j<n_vertices;j++) {array2[j]=-array[j];} 31120c7d97c5SJed Brown ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr); 31130c7d97c5SJed Brown } 31140c7d97c5SJed Brown ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr); 31153b03a366Sstefano_zampini for(j=0;j<n_constraints;j++) {array2[j+n_vertices]=-array[j];} 31160c7d97c5SJed Brown ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr); 31170c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr); 31183972b0daSStefano Zampini /* check saddle point solution */ 3119534831adSStefano Zampini ierr = MatMult(pcbddc->local_mat,pcis->vec1_N,pcis->vec2_N);CHKERRQ(ierr); 31203b03a366Sstefano_zampini ierr = MatMultTransposeAdd(pcbddc->ConstraintMatrix,pcbddc->vec1_P,pcis->vec2_N,pcis->vec2_N);CHKERRQ(ierr); 312153cdbc3dSStefano Zampini ierr = VecNorm(pcis->vec2_N,NORM_INFINITY,&coarsefunctions_errors[index]);CHKERRQ(ierr); 31223b03a366Sstefano_zampini ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr); 31230c7d97c5SJed Brown ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 312453cdbc3dSStefano Zampini array[index]=array[index]+m_one; /* shift by the identity matrix */ 31250c7d97c5SJed Brown ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr); 312653cdbc3dSStefano Zampini ierr = VecNorm(pcbddc->vec1_P,NORM_INFINITY,&constraints_errors[index]);CHKERRQ(ierr); 31270c7d97c5SJed Brown } 31280c7d97c5SJed Brown } 31290c7d97c5SJed Brown ierr = MatAssemblyBegin(pcbddc->coarse_phi_B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 31300c7d97c5SJed 
Brown ierr = MatAssemblyEnd (pcbddc->coarse_phi_B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 3131e269702eSStefano Zampini if( pcbddc->prec_type || dbg_flag ) { 31320c7d97c5SJed Brown ierr = MatAssemblyBegin(pcbddc->coarse_phi_D,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 31330c7d97c5SJed Brown ierr = MatAssemblyEnd (pcbddc->coarse_phi_D,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 31340c7d97c5SJed Brown } 31350c7d97c5SJed Brown /* Checking coarse_sub_mat and coarse basis functios */ 31360c7d97c5SJed Brown /* It shuld be \Phi^{(j)^T} A^{(j)} \Phi^{(j)}=coarse_sub_mat */ 31379d2fce94SStefano Zampini if(dbg_flag) { 31380c7d97c5SJed Brown 31390c7d97c5SJed Brown Mat coarse_sub_mat; 31400c7d97c5SJed Brown Mat TM1,TM2,TM3,TM4; 31410c7d97c5SJed Brown Mat coarse_phi_D,coarse_phi_B,A_II,A_BB,A_IB,A_BI; 3142a0ba757dSStefano Zampini const MatType checkmattype=MATSEQAIJ; 31430c7d97c5SJed Brown PetscScalar value; 31440c7d97c5SJed Brown 3145c042a7c3SStefano Zampini ierr = MatConvert(pcis->A_II,checkmattype,MAT_INITIAL_MATRIX,&A_II);CHKERRQ(ierr); 3146c042a7c3SStefano Zampini ierr = MatConvert(pcis->A_IB,checkmattype,MAT_INITIAL_MATRIX,&A_IB);CHKERRQ(ierr); 3147c042a7c3SStefano Zampini ierr = MatConvert(pcis->A_BI,checkmattype,MAT_INITIAL_MATRIX,&A_BI);CHKERRQ(ierr); 3148c042a7c3SStefano Zampini ierr = MatConvert(pcis->A_BB,checkmattype,MAT_INITIAL_MATRIX,&A_BB);CHKERRQ(ierr); 3149c042a7c3SStefano Zampini ierr = MatConvert(pcbddc->coarse_phi_D,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_D);CHKERRQ(ierr); 3150c042a7c3SStefano Zampini ierr = MatConvert(pcbddc->coarse_phi_B,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_B);CHKERRQ(ierr); 3151c042a7c3SStefano Zampini ierr = MatCreateSeqDense(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_size,coarse_submat_vals,&coarse_sub_mat);CHKERRQ(ierr); 3152c042a7c3SStefano Zampini ierr = MatConvert(coarse_sub_mat,checkmattype,MAT_REUSE_MATRIX,&coarse_sub_mat);CHKERRQ(ierr); 31530c7d97c5SJed Brown 3154da1bb401SStefano Zampini /*PetscViewer view_out; 
3155da1bb401SStefano Zampini PetscMPIInt myrank; 3156da1bb401SStefano Zampini char filename[256]; 3157da1bb401SStefano Zampini MPI_Comm_rank(((PetscObject)pc)->comm,&myrank); 3158da1bb401SStefano Zampini sprintf(filename,"coarsesubmat_%04d.m",myrank); 3159da1bb401SStefano Zampini ierr = PetscViewerASCIIOpen(PETSC_COMM_SELF,filename,&view_out);CHKERRQ(ierr); 3160da1bb401SStefano Zampini ierr = PetscViewerSetFormat(view_out,PETSC_VIEWER_ASCII_MATLAB);CHKERRQ(ierr); 3161da1bb401SStefano Zampini ierr = MatView(coarse_sub_mat,view_out);CHKERRQ(ierr); 3162da1bb401SStefano Zampini ierr = PetscViewerDestroy(&view_out);CHKERRQ(ierr);*/ 3163da1bb401SStefano Zampini 31640c7d97c5SJed Brown ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr); 31650c7d97c5SJed Brown ierr = PetscViewerASCIIPrintf(viewer,"Check coarse sub mat and local basis functions\n");CHKERRQ(ierr); 31660c7d97c5SJed Brown ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 316753cdbc3dSStefano Zampini ierr = MatPtAP(A_II,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&TM1);CHKERRQ(ierr); 316853cdbc3dSStefano Zampini ierr = MatPtAP(A_BB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&TM2);CHKERRQ(ierr); 316953cdbc3dSStefano Zampini ierr = MatMatMult(A_IB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr); 3170c042a7c3SStefano Zampini ierr = MatTransposeMatMult(coarse_phi_D,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM3);CHKERRQ(ierr); 317153cdbc3dSStefano Zampini ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr); 317253cdbc3dSStefano Zampini ierr = MatMatMult(A_BI,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr); 3173c042a7c3SStefano Zampini ierr = MatTransposeMatMult(coarse_phi_B,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM4);CHKERRQ(ierr); 317453cdbc3dSStefano Zampini ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr); 317553cdbc3dSStefano Zampini ierr = MatAXPY(TM1,one,TM2,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr); 317653cdbc3dSStefano Zampini ierr = 
MatAXPY(TM1,one,TM3,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr); 317753cdbc3dSStefano Zampini ierr = MatAXPY(TM1,one,TM4,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr); 317853cdbc3dSStefano Zampini ierr = MatAXPY(TM1,m_one,coarse_sub_mat,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr); 317953cdbc3dSStefano Zampini ierr = MatNorm(TM1,NORM_INFINITY,&value);CHKERRQ(ierr); 31800c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"----------------------------------\n");CHKERRQ(ierr); 31810c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d \n",PetscGlobalRank);CHKERRQ(ierr); 31820c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"matrix error = % 1.14e\n",value);CHKERRQ(ierr); 31830c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"coarse functions errors\n");CHKERRQ(ierr); 318453cdbc3dSStefano Zampini for(i=0;i<pcbddc->local_primal_size;i++) { ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local %02d-th function error = % 1.14e\n",i,coarsefunctions_errors[i]);CHKERRQ(ierr); } 31850c7d97c5SJed Brown ierr = PetscViewerASCIISynchronizedPrintf(viewer,"constraints errors\n");CHKERRQ(ierr); 318653cdbc3dSStefano Zampini for(i=0;i<pcbddc->local_primal_size;i++) { ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local %02d-th function error = % 1.14e\n",i,constraints_errors[i]);CHKERRQ(ierr); } 31870c7d97c5SJed Brown ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 318853cdbc3dSStefano Zampini ierr = MatDestroy(&A_II);CHKERRQ(ierr); 318953cdbc3dSStefano Zampini ierr = MatDestroy(&A_BB);CHKERRQ(ierr); 319053cdbc3dSStefano Zampini ierr = MatDestroy(&A_IB);CHKERRQ(ierr); 319153cdbc3dSStefano Zampini ierr = MatDestroy(&A_BI);CHKERRQ(ierr); 319253cdbc3dSStefano Zampini ierr = MatDestroy(&TM1);CHKERRQ(ierr); 319353cdbc3dSStefano Zampini ierr = MatDestroy(&TM2);CHKERRQ(ierr); 319453cdbc3dSStefano Zampini ierr = MatDestroy(&TM3);CHKERRQ(ierr); 319553cdbc3dSStefano Zampini ierr = MatDestroy(&TM4);CHKERRQ(ierr); 
319653cdbc3dSStefano Zampini ierr = MatDestroy(&coarse_phi_D);CHKERRQ(ierr); 319753cdbc3dSStefano Zampini ierr = MatDestroy(&coarse_sub_mat);CHKERRQ(ierr); 319853cdbc3dSStefano Zampini ierr = MatDestroy(&coarse_phi_B);CHKERRQ(ierr); 31990c7d97c5SJed Brown ierr = PetscFree(coarsefunctions_errors);CHKERRQ(ierr); 32000c7d97c5SJed Brown ierr = PetscFree(constraints_errors);CHKERRQ(ierr); 32010c7d97c5SJed Brown } 32020c7d97c5SJed Brown 32030c7d97c5SJed Brown /* create coarse matrix and data structures for message passing associated actual choice of coarse problem type */ 32040c7d97c5SJed Brown ierr = PCBDDCSetupCoarseEnvironment(pc,coarse_submat_vals);CHKERRQ(ierr); 32050c7d97c5SJed Brown /* free memory */ 32060c7d97c5SJed Brown ierr = PetscFree(coarse_submat_vals);CHKERRQ(ierr); 32070c7d97c5SJed Brown ierr = PetscFree(auxindices);CHKERRQ(ierr); 32080c7d97c5SJed Brown ierr = PetscFree(nnz);CHKERRQ(ierr); 32093b03a366Sstefano_zampini if(n_vertices) { 32100c7d97c5SJed Brown ierr = VecDestroy(&vec1_V);CHKERRQ(ierr); 32110c7d97c5SJed Brown ierr = VecDestroy(&vec2_V);CHKERRQ(ierr); 32120c7d97c5SJed Brown ierr = MatDestroy(&M2);CHKERRQ(ierr); 32130c7d97c5SJed Brown ierr = MatDestroy(&A_RV);CHKERRQ(ierr); 32140c7d97c5SJed Brown ierr = MatDestroy(&A_VR);CHKERRQ(ierr); 32150c7d97c5SJed Brown ierr = MatDestroy(&A_VV);CHKERRQ(ierr); 32160c7d97c5SJed Brown } 3217534831adSStefano Zampini if(n_constraints) { 32180c7d97c5SJed Brown ierr = VecDestroy(&vec1_C);CHKERRQ(ierr); 32190c7d97c5SJed Brown ierr = VecDestroy(&vec2_C);CHKERRQ(ierr); 32200c7d97c5SJed Brown ierr = MatDestroy(&M1);CHKERRQ(ierr); 32210c7d97c5SJed Brown ierr = MatDestroy(&C_CR);CHKERRQ(ierr); 32220c7d97c5SJed Brown } 32230c7d97c5SJed Brown } 32240c7d97c5SJed Brown /* free memory */ 32253b03a366Sstefano_zampini if(n_vertices) { 32260c7d97c5SJed Brown ierr = PetscFree(idx_V_B);CHKERRQ(ierr); 32270c7d97c5SJed Brown ierr = ISDestroy(&is_V_local);CHKERRQ(ierr); 32280c7d97c5SJed Brown } 32290c7d97c5SJed Brown ierr = 
ISDestroy(&is_R_local);CHKERRQ(ierr); 32300c7d97c5SJed Brown 32310c7d97c5SJed Brown PetscFunctionReturn(0); 32320c7d97c5SJed Brown } 32330c7d97c5SJed Brown 32340c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 32350c7d97c5SJed Brown 32360c7d97c5SJed Brown #undef __FUNCT__ 32370c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetupCoarseEnvironment" 323853cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetupCoarseEnvironment(PC pc,PetscScalar* coarse_submat_vals) 32390c7d97c5SJed Brown { 32400c7d97c5SJed Brown 32410c7d97c5SJed Brown 32420c7d97c5SJed Brown Mat_IS *matis = (Mat_IS*)pc->pmat->data; 32430c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 32440c7d97c5SJed Brown PC_IS *pcis = (PC_IS*)pc->data; 32450c7d97c5SJed Brown MPI_Comm prec_comm = ((PetscObject)pc)->comm; 32460c7d97c5SJed Brown MPI_Comm coarse_comm; 32470c7d97c5SJed Brown 32480c7d97c5SJed Brown /* common to all choiches */ 32490c7d97c5SJed Brown PetscScalar *temp_coarse_mat_vals; 32500c7d97c5SJed Brown PetscScalar *ins_coarse_mat_vals; 32510c7d97c5SJed Brown PetscInt *ins_local_primal_indices; 32520c7d97c5SJed Brown PetscMPIInt *localsizes2,*localdispl2; 32530c7d97c5SJed Brown PetscMPIInt size_prec_comm; 32540c7d97c5SJed Brown PetscMPIInt rank_prec_comm; 32550c7d97c5SJed Brown PetscMPIInt active_rank=MPI_PROC_NULL; 32560c7d97c5SJed Brown PetscMPIInt master_proc=0; 32570c7d97c5SJed Brown PetscInt ins_local_primal_size; 32580c7d97c5SJed Brown /* specific to MULTILEVEL_BDDC */ 32590c7d97c5SJed Brown PetscMPIInt *ranks_recv; 32600c7d97c5SJed Brown PetscMPIInt count_recv=0; 32610c7d97c5SJed Brown PetscMPIInt rank_coarse_proc_send_to; 32620c7d97c5SJed Brown PetscMPIInt coarse_color = MPI_UNDEFINED; 32630c7d97c5SJed Brown ISLocalToGlobalMapping coarse_ISLG; 32640c7d97c5SJed Brown /* some other variables */ 32650c7d97c5SJed Brown PetscErrorCode ierr; 32660c7d97c5SJed Brown const MatType coarse_mat_type; 32670c7d97c5SJed Brown const PCType coarse_pc_type; 
326853cdbc3dSStefano Zampini const KSPType coarse_ksp_type; 326953cdbc3dSStefano Zampini PC pc_temp; 32700c7d97c5SJed Brown PetscInt i,j,k,bs; 32713b03a366Sstefano_zampini PetscInt max_it_coarse_ksp=1; /* don't increase this value */ 3272e269702eSStefano Zampini /* verbose output viewer */ 3273e269702eSStefano Zampini PetscViewer viewer=pcbddc->dbg_viewer; 3274e269702eSStefano Zampini PetscBool dbg_flag=pcbddc->dbg_flag; 3275*ea7e1babSStefano Zampini PetscInt offset,offset2; 32760c7d97c5SJed Brown 32770c7d97c5SJed Brown PetscFunctionBegin; 32780c7d97c5SJed Brown ins_local_primal_indices = 0; 32790c7d97c5SJed Brown ins_coarse_mat_vals = 0; 32800c7d97c5SJed Brown localsizes2 = 0; 32810c7d97c5SJed Brown localdispl2 = 0; 32820c7d97c5SJed Brown temp_coarse_mat_vals = 0; 32830c7d97c5SJed Brown coarse_ISLG = 0; 32840c7d97c5SJed Brown 328553cdbc3dSStefano Zampini ierr = MPI_Comm_size(prec_comm,&size_prec_comm);CHKERRQ(ierr); 328653cdbc3dSStefano Zampini ierr = MPI_Comm_rank(prec_comm,&rank_prec_comm);CHKERRQ(ierr); 32870c7d97c5SJed Brown ierr = MatGetBlockSize(matis->A,&bs);CHKERRQ(ierr); 32880c7d97c5SJed Brown 3289ffe5efe1SStefano Zampini /* adapt coarse problem type */ 3290ffe5efe1SStefano Zampini if(pcbddc->coarse_problem_type == MULTILEVEL_BDDC && pcbddc->active_procs < MIN_PROCS_FOR_BDDC ) 3291ffe5efe1SStefano Zampini pcbddc->coarse_problem_type = PARALLEL_BDDC; 3292ffe5efe1SStefano Zampini 3293beed3852SStefano Zampini /* Assign global numbering to coarse dofs */ 3294beed3852SStefano Zampini { 3295a0ba757dSStefano Zampini PetscScalar one=1.,zero=0.; 3296beed3852SStefano Zampini PetscScalar *array; 3297beed3852SStefano Zampini PetscMPIInt *auxlocal_primal; 3298beed3852SStefano Zampini PetscMPIInt *auxglobal_primal; 3299beed3852SStefano Zampini PetscMPIInt *all_auxglobal_primal; 3300beed3852SStefano Zampini PetscMPIInt mpi_local_primal_size = (PetscMPIInt)pcbddc->local_primal_size; 3301da1bb401SStefano Zampini PetscInt *row_cmat_indices; 33023b03a366Sstefano_zampini 
PetscInt size_of_constraint; 3303da1bb401SStefano Zampini PetscScalar coarsesum; 3304beed3852SStefano Zampini 3305beed3852SStefano Zampini /* Construct needed data structures for message passing */ 3306beed3852SStefano Zampini ierr = PetscMalloc(mpi_local_primal_size*sizeof(PetscMPIInt),&pcbddc->local_primal_indices);CHKERRQ(ierr); 3307ffe5efe1SStefano Zampini j = 0; 3308ffe5efe1SStefano Zampini if(rank_prec_comm == 0 || pcbddc->coarse_problem_type == REPLICATED_BDDC) { 3309ffe5efe1SStefano Zampini j = size_prec_comm; 3310ffe5efe1SStefano Zampini } 3311ffe5efe1SStefano Zampini ierr = PetscMalloc(j*sizeof(PetscMPIInt),&pcbddc->local_primal_sizes);CHKERRQ(ierr); 3312ffe5efe1SStefano Zampini ierr = PetscMalloc(j*sizeof(PetscMPIInt),&pcbddc->local_primal_displacements);CHKERRQ(ierr); 3313beed3852SStefano Zampini /* Gather local_primal_size information for all processes */ 3314ffe5efe1SStefano Zampini if(pcbddc->coarse_problem_type == REPLICATED_BDDC) { 33155619798eSStefano Zampini ierr = MPI_Allgather(&mpi_local_primal_size,1,MPIU_INT,&pcbddc->local_primal_sizes[0],1,MPIU_INT,prec_comm);CHKERRQ(ierr); 3316ffe5efe1SStefano Zampini } else { 3317ffe5efe1SStefano Zampini ierr = MPI_Gather(&mpi_local_primal_size,1,MPIU_INT,&pcbddc->local_primal_sizes[0],1,MPIU_INT,0,prec_comm);CHKERRQ(ierr); 3318ffe5efe1SStefano Zampini } 3319beed3852SStefano Zampini pcbddc->replicated_primal_size = 0; 3320ffe5efe1SStefano Zampini for (i=0; i<j; i++) { 3321beed3852SStefano Zampini pcbddc->local_primal_displacements[i] = pcbddc->replicated_primal_size ; 3322beed3852SStefano Zampini pcbddc->replicated_primal_size += pcbddc->local_primal_sizes[i]; 3323beed3852SStefano Zampini } 33245619798eSStefano Zampini if(rank_prec_comm == 0) { 3325beed3852SStefano Zampini /* allocate some auxiliary space */ 3326beed3852SStefano Zampini ierr = PetscMalloc(pcbddc->replicated_primal_size*sizeof(*all_auxglobal_primal),&all_auxglobal_primal);CHKERRQ(ierr); 3327beed3852SStefano Zampini } 3328beed3852SStefano 
Zampini ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscMPIInt),&auxlocal_primal);CHKERRQ(ierr); 3329beed3852SStefano Zampini ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscMPIInt),&auxglobal_primal);CHKERRQ(ierr); 3330beed3852SStefano Zampini 3331da1bb401SStefano Zampini /* First let's count coarse dofs. 3332beed3852SStefano Zampini This code fragment assumes that the number of local constraints per connected component 3333beed3852SStefano Zampini is not greater than the number of nodes defined for the connected component 3334beed3852SStefano Zampini (otherwise we will surely have linear dependence between constraints and thus a singular coarse problem) */ 33353b03a366Sstefano_zampini /* auxlocal_primal : primal indices in local nodes numbering (internal and interface) with complete queue sorted by global ordering */ 3336beed3852SStefano Zampini ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr); 3337beed3852SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 3338da1bb401SStefano Zampini for(i=0;i<pcbddc->local_primal_size;i++) { 3339da1bb401SStefano Zampini ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr); 33403b03a366Sstefano_zampini for (j=0; j<size_of_constraint; j++) { 33413b03a366Sstefano_zampini k = row_cmat_indices[j]; 3342beed3852SStefano Zampini if( array[k] == zero ) { 3343beed3852SStefano Zampini array[k] = one; 3344da1bb401SStefano Zampini auxlocal_primal[i] = k; 3345beed3852SStefano Zampini break; 3346beed3852SStefano Zampini } 3347beed3852SStefano Zampini } 3348da1bb401SStefano Zampini ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr); 3349beed3852SStefano Zampini } 3350beed3852SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 3351da1bb401SStefano Zampini ierr = VecSet(pcis->vec1_global,zero);CHKERRQ(ierr); 3352da1bb401SStefano Zampini 
ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 3353da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 3354da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 3355da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 3356da1bb401SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 3357da1bb401SStefano Zampini for(i=0;i<pcis->n;i++) { if( array[i] > zero) array[i] = one/array[i]; } 3358da1bb401SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 3359da1bb401SStefano Zampini ierr = VecSet(pcis->vec1_global,zero);CHKERRQ(ierr); 3360da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 3361da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 3362da1bb401SStefano Zampini ierr = VecSum(pcis->vec1_global,&coarsesum);CHKERRQ(ierr); 3363da1bb401SStefano Zampini pcbddc->coarse_size = (PetscInt) coarsesum; 3364a0ba757dSStefano Zampini 3365beed3852SStefano Zampini /* Now assign them a global numbering */ 3366beed3852SStefano Zampini /* auxglobal_primal contains indices in global nodes numbering (internal and interface) */ 3367beed3852SStefano Zampini ierr = ISLocalToGlobalMappingApply(matis->mapping,pcbddc->local_primal_size,auxlocal_primal,auxglobal_primal);CHKERRQ(ierr); 3368beed3852SStefano Zampini /* all_auxglobal_primal contains all primal nodes indices in global nodes numbering (internal and interface) */ 3369beed3852SStefano Zampini ierr = 
MPI_Gatherv(&auxglobal_primal[0],pcbddc->local_primal_size,MPIU_INT,&all_auxglobal_primal[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,0,prec_comm);CHKERRQ(ierr); 3370beed3852SStefano Zampini 3371beed3852SStefano Zampini /* After this block all_auxglobal_primal should contains one copy of each primal node's indices in global nodes numbering */ 3372beed3852SStefano Zampini if(rank_prec_comm==0) { 337317d7d925SStefano Zampini j=pcbddc->replicated_primal_size; 337417d7d925SStefano Zampini ierr = PetscSortRemoveDupsMPIInt(&j,all_auxglobal_primal);CHKERRQ(ierr); 3375beed3852SStefano Zampini } else { 3376beed3852SStefano Zampini ierr = PetscMalloc(pcbddc->coarse_size*sizeof(PetscMPIInt),&all_auxglobal_primal);CHKERRQ(ierr); 3377beed3852SStefano Zampini } 33785619798eSStefano Zampini /* We only need to broadcast the indices from 0 to pcbddc->coarse_size. Remaning elements of array all_aux_global_primal are garbage. */ 3379beed3852SStefano Zampini ierr = MPI_Bcast(all_auxglobal_primal,pcbddc->coarse_size,MPIU_INT,0,prec_comm);CHKERRQ(ierr); 3380beed3852SStefano Zampini 3381beed3852SStefano Zampini /* Now get global coarse numbering of local primal nodes */ 3382beed3852SStefano Zampini for(i=0;i<pcbddc->local_primal_size;i++) { 3383beed3852SStefano Zampini k=0; 3384beed3852SStefano Zampini while( all_auxglobal_primal[k] != auxglobal_primal[i] ) { k++;} 3385beed3852SStefano Zampini pcbddc->local_primal_indices[i]=k; 3386beed3852SStefano Zampini } 3387e269702eSStefano Zampini if(dbg_flag) { 3388e269702eSStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr); 3389da1bb401SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Size of coarse problem %d\n",pcbddc->coarse_size);CHKERRQ(ierr); 3390e269702eSStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 3391e269702eSStefano Zampini } 3392beed3852SStefano Zampini /* free allocated memory */ 3393beed3852SStefano Zampini 
ierr = PetscFree(auxlocal_primal);CHKERRQ(ierr); 3394beed3852SStefano Zampini ierr = PetscFree(auxglobal_primal);CHKERRQ(ierr); 3395beed3852SStefano Zampini ierr = PetscFree(all_auxglobal_primal);CHKERRQ(ierr); 3396e269702eSStefano Zampini } 3397beed3852SStefano Zampini 33980c7d97c5SJed Brown switch(pcbddc->coarse_problem_type){ 33990c7d97c5SJed Brown 3400da1bb401SStefano Zampini case(MULTILEVEL_BDDC): /* we define a coarse mesh where subdomains are elements */ 34010c7d97c5SJed Brown { 34020c7d97c5SJed Brown /* we need additional variables */ 34030c7d97c5SJed Brown MetisInt n_subdomains,n_parts,objval,ncon,faces_nvtxs; 34040c7d97c5SJed Brown MetisInt *metis_coarse_subdivision; 34050c7d97c5SJed Brown MetisInt options[METIS_NOPTIONS]; 34060c7d97c5SJed Brown PetscMPIInt size_coarse_comm,rank_coarse_comm; 34070c7d97c5SJed Brown PetscMPIInt procs_jumps_coarse_comm; 34080c7d97c5SJed Brown PetscMPIInt *coarse_subdivision; 34090c7d97c5SJed Brown PetscMPIInt *total_count_recv; 34100c7d97c5SJed Brown PetscMPIInt *total_ranks_recv; 34110c7d97c5SJed Brown PetscMPIInt *displacements_recv; 34120c7d97c5SJed Brown PetscMPIInt *my_faces_connectivity; 34130c7d97c5SJed Brown PetscMPIInt *petsc_faces_adjncy; 34140c7d97c5SJed Brown MetisInt *faces_adjncy; 34150c7d97c5SJed Brown MetisInt *faces_xadj; 34160c7d97c5SJed Brown PetscMPIInt *number_of_faces; 34170c7d97c5SJed Brown PetscMPIInt *faces_displacements; 34180c7d97c5SJed Brown PetscInt *array_int; 34190c7d97c5SJed Brown PetscMPIInt my_faces=0; 34200c7d97c5SJed Brown PetscMPIInt total_faces=0; 34213828260eSStefano Zampini PetscInt ranks_stretching_ratio; 34220c7d97c5SJed Brown 34230c7d97c5SJed Brown /* define some quantities */ 34240c7d97c5SJed Brown pcbddc->coarse_communications_type = SCATTERS_BDDC; 34250c7d97c5SJed Brown coarse_mat_type = MATIS; 34260c7d97c5SJed Brown coarse_pc_type = PCBDDC; 34276c9de887SHong Zhang coarse_ksp_type = KSPCHEBYSHEV; 34280c7d97c5SJed Brown 34290c7d97c5SJed Brown /* details of coarse decomposition */ 
34300c7d97c5SJed Brown n_subdomains = pcbddc->active_procs; 34310c7d97c5SJed Brown n_parts = n_subdomains/pcbddc->coarsening_ratio; 34323828260eSStefano Zampini ranks_stretching_ratio = size_prec_comm/pcbddc->active_procs; 34333828260eSStefano Zampini procs_jumps_coarse_comm = pcbddc->coarsening_ratio*ranks_stretching_ratio; 34343828260eSStefano Zampini 3435da1bb401SStefano Zampini /*printf("Coarse algorithm details: \n"); 3436da1bb401SStefano Zampini printf("n_subdomains %d, n_parts %d\nstretch %d,jumps %d,coarse_ratio %d\nlevel should be log_%d(%d)\n",n_subdomains,n_parts,ranks_stretching_ratio,procs_jumps_coarse_comm,pcbddc->coarsening_ratio,pcbddc->coarsening_ratio,(ranks_stretching_ratio/pcbddc->coarsening_ratio+1));*/ 34370c7d97c5SJed Brown 34380c7d97c5SJed Brown /* build CSR graph of subdomains' connectivity through faces */ 34390c7d97c5SJed Brown ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&array_int);CHKERRQ(ierr); 34403828260eSStefano Zampini ierr = PetscMemzero(array_int,pcis->n*sizeof(PetscInt));CHKERRQ(ierr); 34410c7d97c5SJed Brown for(i=1;i<pcis->n_neigh;i++){/* i=1 so I don't count myself -> faces nodes counts to 1 */ 34420c7d97c5SJed Brown for(j=0;j<pcis->n_shared[i];j++){ 34430c7d97c5SJed Brown array_int[ pcis->shared[i][j] ]+=1; 34440c7d97c5SJed Brown } 34450c7d97c5SJed Brown } 34460c7d97c5SJed Brown for(i=1;i<pcis->n_neigh;i++){ 34470c7d97c5SJed Brown for(j=0;j<pcis->n_shared[i];j++){ 34480c7d97c5SJed Brown if(array_int[ pcis->shared[i][j] ] == 1 ){ 34490c7d97c5SJed Brown my_faces++; 34500c7d97c5SJed Brown break; 34510c7d97c5SJed Brown } 34520c7d97c5SJed Brown } 34530c7d97c5SJed Brown } 34540c7d97c5SJed Brown 345553cdbc3dSStefano Zampini ierr = MPI_Reduce(&my_faces,&total_faces,1,MPIU_INT,MPI_SUM,master_proc,prec_comm);CHKERRQ(ierr); 34560c7d97c5SJed Brown ierr = PetscMalloc (my_faces*sizeof(PetscInt),&my_faces_connectivity);CHKERRQ(ierr); 34570c7d97c5SJed Brown my_faces=0; 34580c7d97c5SJed Brown for(i=1;i<pcis->n_neigh;i++){ 34590c7d97c5SJed 
Brown for(j=0;j<pcis->n_shared[i];j++){ 34600c7d97c5SJed Brown if(array_int[ pcis->shared[i][j] ] == 1 ){ 34610c7d97c5SJed Brown my_faces_connectivity[my_faces]=pcis->neigh[i]; 34620c7d97c5SJed Brown my_faces++; 34630c7d97c5SJed Brown break; 34640c7d97c5SJed Brown } 34650c7d97c5SJed Brown } 34660c7d97c5SJed Brown } 34670c7d97c5SJed Brown if(rank_prec_comm == master_proc) { 34680c7d97c5SJed Brown ierr = PetscMalloc (total_faces*sizeof(PetscMPIInt),&petsc_faces_adjncy);CHKERRQ(ierr); 34690c7d97c5SJed Brown ierr = PetscMalloc (size_prec_comm*sizeof(PetscMPIInt),&number_of_faces);CHKERRQ(ierr); 34700c7d97c5SJed Brown ierr = PetscMalloc (total_faces*sizeof(MetisInt),&faces_adjncy);CHKERRQ(ierr); 34710c7d97c5SJed Brown ierr = PetscMalloc ((n_subdomains+1)*sizeof(MetisInt),&faces_xadj);CHKERRQ(ierr); 34720c7d97c5SJed Brown ierr = PetscMalloc ((size_prec_comm+1)*sizeof(PetscMPIInt),&faces_displacements);CHKERRQ(ierr); 34730c7d97c5SJed Brown } 347453cdbc3dSStefano Zampini ierr = MPI_Gather(&my_faces,1,MPIU_INT,&number_of_faces[0],1,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr); 34750c7d97c5SJed Brown if(rank_prec_comm == master_proc) { 34760c7d97c5SJed Brown faces_xadj[0]=0; 34770c7d97c5SJed Brown faces_displacements[0]=0; 34780c7d97c5SJed Brown j=0; 34790c7d97c5SJed Brown for(i=1;i<size_prec_comm+1;i++) { 34800c7d97c5SJed Brown faces_displacements[i]=faces_displacements[i-1]+number_of_faces[i-1]; 34810c7d97c5SJed Brown if(number_of_faces[i-1]) { 34820c7d97c5SJed Brown j++; 34830c7d97c5SJed Brown faces_xadj[j]=faces_xadj[j-1]+number_of_faces[i-1]; 34840c7d97c5SJed Brown } 34850c7d97c5SJed Brown } 3486da1bb401SStefano Zampini /*printf("The J I count is %d and should be %d\n",j,n_subdomains); 3487da1bb401SStefano Zampini printf("Total faces seem %d and should be %d\n",faces_xadj[j],total_faces);*/ 34880c7d97c5SJed Brown } 348953cdbc3dSStefano Zampini ierr = 
MPI_Gatherv(&my_faces_connectivity[0],my_faces,MPIU_INT,&petsc_faces_adjncy[0],number_of_faces,faces_displacements,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr); 34900c7d97c5SJed Brown ierr = PetscFree(my_faces_connectivity);CHKERRQ(ierr); 34910c7d97c5SJed Brown ierr = PetscFree(array_int);CHKERRQ(ierr); 34920c7d97c5SJed Brown if(rank_prec_comm == master_proc) { 34933828260eSStefano Zampini for(i=0;i<total_faces;i++) faces_adjncy[i]=(MetisInt)(petsc_faces_adjncy[i]/ranks_stretching_ratio); /* cast to MetisInt */ 3494da1bb401SStefano Zampini /*printf("This is the face connectivity (actual ranks)\n"); 34950c7d97c5SJed Brown for(i=0;i<n_subdomains;i++){ 34960c7d97c5SJed Brown printf("proc %d is connected with \n",i); 34970c7d97c5SJed Brown for(j=faces_xadj[i];j<faces_xadj[i+1];j++) 34980c7d97c5SJed Brown printf("%d ",faces_adjncy[j]); 34990c7d97c5SJed Brown printf("\n"); 3500da1bb401SStefano Zampini }*/ 35010c7d97c5SJed Brown ierr = PetscFree(faces_displacements);CHKERRQ(ierr); 35020c7d97c5SJed Brown ierr = PetscFree(number_of_faces);CHKERRQ(ierr); 35030c7d97c5SJed Brown ierr = PetscFree(petsc_faces_adjncy);CHKERRQ(ierr); 35040c7d97c5SJed Brown } 35050c7d97c5SJed Brown 35060c7d97c5SJed Brown if( rank_prec_comm == master_proc ) { 35070c7d97c5SJed Brown 35083828260eSStefano Zampini PetscInt heuristic_for_metis=3; 35093828260eSStefano Zampini 35100c7d97c5SJed Brown ncon=1; 35110c7d97c5SJed Brown faces_nvtxs=n_subdomains; 35120c7d97c5SJed Brown /* partition graoh induced by face connectivity */ 35130c7d97c5SJed Brown ierr = PetscMalloc (n_subdomains*sizeof(MetisInt),&metis_coarse_subdivision);CHKERRQ(ierr); 35140c7d97c5SJed Brown ierr = METIS_SetDefaultOptions(options); 35150c7d97c5SJed Brown /* we need a contiguous partition of the coarse mesh */ 35160c7d97c5SJed Brown options[METIS_OPTION_CONTIG]=1; 35170c7d97c5SJed Brown options[METIS_OPTION_DBGLVL]=1; 35180c7d97c5SJed Brown options[METIS_OPTION_NITER]=30; 35193828260eSStefano Zampini 
if(n_subdomains>n_parts*heuristic_for_metis) { 35203828260eSStefano Zampini options[METIS_OPTION_IPTYPE]=METIS_IPTYPE_EDGE; 35213828260eSStefano Zampini options[METIS_OPTION_OBJTYPE]=METIS_OBJTYPE_CUT; 35220c7d97c5SJed Brown ierr = METIS_PartGraphKway(&faces_nvtxs,&ncon,faces_xadj,faces_adjncy,NULL,NULL,NULL,&n_parts,NULL,NULL,options,&objval,metis_coarse_subdivision); 35233828260eSStefano Zampini } else { 35243828260eSStefano Zampini ierr = METIS_PartGraphRecursive(&faces_nvtxs,&ncon,faces_xadj,faces_adjncy,NULL,NULL,NULL,&n_parts,NULL,NULL,options,&objval,metis_coarse_subdivision); 35253828260eSStefano Zampini } 35260c7d97c5SJed Brown if(ierr != METIS_OK) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in METIS_PartGraphKway (metis error code %D) called from PCBDDCSetupCoarseEnvironment\n",ierr); 35270c7d97c5SJed Brown ierr = PetscFree(faces_xadj);CHKERRQ(ierr); 35280c7d97c5SJed Brown ierr = PetscFree(faces_adjncy);CHKERRQ(ierr); 35290c7d97c5SJed Brown coarse_subdivision = (PetscMPIInt*)calloc(size_prec_comm,sizeof(PetscMPIInt)); /* calloc for contiguous memory since we need to scatter these values later */ 35300c7d97c5SJed Brown /* copy/cast values avoiding possible type conflicts between PETSc, MPI and METIS */ 35313828260eSStefano Zampini for(i=0;i<size_prec_comm;i++) coarse_subdivision[i]=MPI_PROC_NULL; 35323828260eSStefano Zampini for(i=0;i<n_subdomains;i++) coarse_subdivision[ranks_stretching_ratio*i]=(PetscInt)(metis_coarse_subdivision[i]); 35330c7d97c5SJed Brown ierr = PetscFree(metis_coarse_subdivision);CHKERRQ(ierr); 35340c7d97c5SJed Brown } 35350c7d97c5SJed Brown 35360c7d97c5SJed Brown /* Create new communicator for coarse problem splitting the old one */ 35370c7d97c5SJed Brown if( !(rank_prec_comm%procs_jumps_coarse_comm) && rank_prec_comm < procs_jumps_coarse_comm*n_parts ){ 3538da1bb401SStefano Zampini coarse_color=0; /* for communicator splitting */ 3539da1bb401SStefano Zampini active_rank=rank_prec_comm; /* for insertion of matrix values */ 
35400c7d97c5SJed Brown } 3541da1bb401SStefano Zampini /* procs with coarse_color = MPI_UNDEFINED will have coarse_comm = MPI_COMM_NULL (from mpi standards) 3542da1bb401SStefano Zampini key = rank_prec_comm -> keep same ordering of ranks from the old to the new communicator */ 354353cdbc3dSStefano Zampini ierr = MPI_Comm_split(prec_comm,coarse_color,rank_prec_comm,&coarse_comm);CHKERRQ(ierr); 35440c7d97c5SJed Brown 35450c7d97c5SJed Brown if( coarse_color == 0 ) { 354653cdbc3dSStefano Zampini ierr = MPI_Comm_size(coarse_comm,&size_coarse_comm);CHKERRQ(ierr); 354753cdbc3dSStefano Zampini ierr = MPI_Comm_rank(coarse_comm,&rank_coarse_comm);CHKERRQ(ierr); 3548da1bb401SStefano Zampini /*printf("Details of coarse comm\n"); 35493828260eSStefano Zampini printf("size = %d, myrank = %d\n",size_coarse_comm,rank_coarse_comm); 3550da1bb401SStefano Zampini printf("jumps = %d, coarse_color = %d, n_parts = %d\n",procs_jumps_coarse_comm,coarse_color,n_parts);*/ 35510c7d97c5SJed Brown } else { 35520c7d97c5SJed Brown rank_coarse_comm = MPI_PROC_NULL; 35530c7d97c5SJed Brown } 35540c7d97c5SJed Brown 35550c7d97c5SJed Brown /* master proc take care of arranging and distributing coarse informations */ 35560c7d97c5SJed Brown if(rank_coarse_comm == master_proc) { 35570c7d97c5SJed Brown ierr = PetscMalloc (size_coarse_comm*sizeof(PetscMPIInt),&displacements_recv);CHKERRQ(ierr); 3558da1bb401SStefano Zampini /*ierr = PetscMalloc (size_coarse_comm*sizeof(PetscMPIInt),&total_count_recv);CHKERRQ(ierr); 3559da1bb401SStefano Zampini ierr = PetscMalloc (n_subdomains*sizeof(PetscMPIInt),&total_ranks_recv);CHKERRQ(ierr);*/ 35600c7d97c5SJed Brown total_count_recv = (PetscMPIInt*)calloc(size_prec_comm,sizeof(PetscMPIInt)); 35610c7d97c5SJed Brown total_ranks_recv = (PetscMPIInt*)calloc(n_subdomains,sizeof(PetscMPIInt)); 35620c7d97c5SJed Brown /* some initializations */ 35630c7d97c5SJed Brown displacements_recv[0]=0; 3564da1bb401SStefano Zampini /* 
PetscMemzero(total_count_recv,size_coarse_comm*sizeof(PetscMPIInt)); not needed -> calloc initializes to zero */ 35650c7d97c5SJed Brown /* count from how many processes the j-th process of the coarse decomposition will receive data */ 35660c7d97c5SJed Brown for(j=0;j<size_coarse_comm;j++) 35673828260eSStefano Zampini for(i=0;i<size_prec_comm;i++) 35680c7d97c5SJed Brown if(coarse_subdivision[i]==j) 35690c7d97c5SJed Brown total_count_recv[j]++; 35700c7d97c5SJed Brown /* displacements needed for scatterv of total_ranks_recv */ 35710c7d97c5SJed Brown for(i=1;i<size_coarse_comm;i++) displacements_recv[i]=displacements_recv[i-1]+total_count_recv[i-1]; 35720c7d97c5SJed Brown /* Now fill properly total_ranks_recv -> each coarse process will receive the ranks (in prec_comm communicator) of its friend (sending) processes */ 35730c7d97c5SJed Brown ierr = PetscMemzero(total_count_recv,size_coarse_comm*sizeof(PetscMPIInt));CHKERRQ(ierr); 35740c7d97c5SJed Brown for(j=0;j<size_coarse_comm;j++) { 35753828260eSStefano Zampini for(i=0;i<size_prec_comm;i++) { 35760c7d97c5SJed Brown if(coarse_subdivision[i]==j) { 35770c7d97c5SJed Brown total_ranks_recv[displacements_recv[j]+total_count_recv[j]]=i; 35783828260eSStefano Zampini total_count_recv[j]+=1; 35790c7d97c5SJed Brown } 35800c7d97c5SJed Brown } 35810c7d97c5SJed Brown } 3582da1bb401SStefano Zampini /*for(j=0;j<size_coarse_comm;j++) { 35833828260eSStefano Zampini printf("process %d in new rank will receive from %d processes (original ranks follows)\n",j,total_count_recv[j]); 35843828260eSStefano Zampini for(i=0;i<total_count_recv[j];i++) { 35853828260eSStefano Zampini printf("%d ",total_ranks_recv[displacements_recv[j]+i]); 35863828260eSStefano Zampini } 35873828260eSStefano Zampini printf("\n"); 3588da1bb401SStefano Zampini }*/ 35890c7d97c5SJed Brown 35900c7d97c5SJed Brown /* identify new decomposition in terms of ranks in the old communicator */ 35913828260eSStefano Zampini for(i=0;i<n_subdomains;i++) 
coarse_subdivision[ranks_stretching_ratio*i]=coarse_subdivision[ranks_stretching_ratio*i]*procs_jumps_coarse_comm; 3592da1bb401SStefano Zampini /*printf("coarse_subdivision in old end new ranks\n"); 35930c7d97c5SJed Brown for(i=0;i<size_prec_comm;i++) 35943828260eSStefano Zampini if(coarse_subdivision[i]!=MPI_PROC_NULL) { 35953828260eSStefano Zampini printf("%d=(%d %d), ",i,coarse_subdivision[i],coarse_subdivision[i]/procs_jumps_coarse_comm); 35963828260eSStefano Zampini } else { 35973828260eSStefano Zampini printf("%d=(%d %d), ",i,coarse_subdivision[i],coarse_subdivision[i]); 35983828260eSStefano Zampini } 3599da1bb401SStefano Zampini printf("\n");*/ 36000c7d97c5SJed Brown } 36010c7d97c5SJed Brown 36020c7d97c5SJed Brown /* Scatter new decomposition for send details */ 360353cdbc3dSStefano Zampini ierr = MPI_Scatter(&coarse_subdivision[0],1,MPIU_INT,&rank_coarse_proc_send_to,1,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr); 36040c7d97c5SJed Brown /* Scatter receiving details to members of coarse decomposition */ 36050c7d97c5SJed Brown if( coarse_color == 0) { 360653cdbc3dSStefano Zampini ierr = MPI_Scatter(&total_count_recv[0],1,MPIU_INT,&count_recv,1,MPIU_INT,master_proc,coarse_comm);CHKERRQ(ierr); 36070c7d97c5SJed Brown ierr = PetscMalloc (count_recv*sizeof(PetscMPIInt),&ranks_recv);CHKERRQ(ierr); 360853cdbc3dSStefano Zampini ierr = MPI_Scatterv(&total_ranks_recv[0],total_count_recv,displacements_recv,MPIU_INT,&ranks_recv[0],count_recv,MPIU_INT,master_proc,coarse_comm);CHKERRQ(ierr); 36090c7d97c5SJed Brown } 36100c7d97c5SJed Brown 3611da1bb401SStefano Zampini /*printf("I will send my matrix data to proc %d\n",rank_coarse_proc_send_to); 3612da1bb401SStefano Zampini if(coarse_color == 0) { 3613da1bb401SStefano Zampini printf("I will receive some matrix data from %d processes (ranks follows)\n",count_recv); 3614da1bb401SStefano Zampini for(i=0;i<count_recv;i++) 3615da1bb401SStefano Zampini printf("%d ",ranks_recv[i]); 3616da1bb401SStefano Zampini printf("\n"); 
3617da1bb401SStefano Zampini }*/ 36180c7d97c5SJed Brown 36190c7d97c5SJed Brown if(rank_prec_comm == master_proc) { 3620da1bb401SStefano Zampini /*ierr = PetscFree(coarse_subdivision);CHKERRQ(ierr); 3621da1bb401SStefano Zampini ierr = PetscFree(total_count_recv);CHKERRQ(ierr); 3622da1bb401SStefano Zampini ierr = PetscFree(total_ranks_recv);CHKERRQ(ierr);*/ 36230c7d97c5SJed Brown free(coarse_subdivision); 36240c7d97c5SJed Brown free(total_count_recv); 36250c7d97c5SJed Brown free(total_ranks_recv); 36260c7d97c5SJed Brown ierr = PetscFree(displacements_recv);CHKERRQ(ierr); 36270c7d97c5SJed Brown } 36280c7d97c5SJed Brown break; 36290c7d97c5SJed Brown } 36300c7d97c5SJed Brown 36310c7d97c5SJed Brown case(REPLICATED_BDDC): 36320c7d97c5SJed Brown 36330c7d97c5SJed Brown pcbddc->coarse_communications_type = GATHERS_BDDC; 36340c7d97c5SJed Brown coarse_mat_type = MATSEQAIJ; 36350c7d97c5SJed Brown coarse_pc_type = PCLU; 363653cdbc3dSStefano Zampini coarse_ksp_type = KSPPREONLY; 36370c7d97c5SJed Brown coarse_comm = PETSC_COMM_SELF; 36380c7d97c5SJed Brown active_rank = rank_prec_comm; 36390c7d97c5SJed Brown break; 36400c7d97c5SJed Brown 36410c7d97c5SJed Brown case(PARALLEL_BDDC): 36420c7d97c5SJed Brown 36430c7d97c5SJed Brown pcbddc->coarse_communications_type = SCATTERS_BDDC; 36440c7d97c5SJed Brown coarse_mat_type = MATMPIAIJ; 36450c7d97c5SJed Brown coarse_pc_type = PCREDUNDANT; 364653cdbc3dSStefano Zampini coarse_ksp_type = KSPPREONLY; 36470c7d97c5SJed Brown coarse_comm = prec_comm; 36480c7d97c5SJed Brown active_rank = rank_prec_comm; 36490c7d97c5SJed Brown break; 36500c7d97c5SJed Brown 36510c7d97c5SJed Brown case(SEQUENTIAL_BDDC): 36520c7d97c5SJed Brown pcbddc->coarse_communications_type = GATHERS_BDDC; 36530c7d97c5SJed Brown coarse_mat_type = MATSEQAIJ; 36540c7d97c5SJed Brown coarse_pc_type = PCLU; 365553cdbc3dSStefano Zampini coarse_ksp_type = KSPPREONLY; 36560c7d97c5SJed Brown coarse_comm = PETSC_COMM_SELF; 36570c7d97c5SJed Brown active_rank = master_proc; 36580c7d97c5SJed 
Brown break; 36590c7d97c5SJed Brown } 36600c7d97c5SJed Brown 36610c7d97c5SJed Brown switch(pcbddc->coarse_communications_type){ 36620c7d97c5SJed Brown 36630c7d97c5SJed Brown case(SCATTERS_BDDC): 36640c7d97c5SJed Brown { 36650c7d97c5SJed Brown if(pcbddc->coarse_problem_type==MULTILEVEL_BDDC) { 36660c7d97c5SJed Brown 36670c7d97c5SJed Brown PetscMPIInt send_size; 36680c7d97c5SJed Brown PetscInt *aux_ins_indices; 36690c7d97c5SJed Brown PetscInt ii,jj; 36700c7d97c5SJed Brown MPI_Request *requests; 36710c7d97c5SJed Brown 36720c7d97c5SJed Brown /* allocate auxiliary space */ 36735619798eSStefano Zampini ierr = PetscMalloc (pcbddc->replicated_primal_size*sizeof(PetscMPIInt),&pcbddc->replicated_local_primal_indices);CHKERRQ(ierr); 36745619798eSStefano Zampini ierr = MPI_Allgatherv(&pcbddc->local_primal_indices[0],pcbddc->local_primal_size,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,prec_comm);CHKERRQ(ierr); 36750c7d97c5SJed Brown ierr = PetscMalloc ( pcbddc->coarse_size*sizeof(PetscInt),&aux_ins_indices);CHKERRQ(ierr); 36760c7d97c5SJed Brown ierr = PetscMemzero(aux_ins_indices,pcbddc->coarse_size*sizeof(PetscInt));CHKERRQ(ierr); 36770c7d97c5SJed Brown /* allocate stuffs for message massing */ 36780c7d97c5SJed Brown ierr = PetscMalloc ( (count_recv+1)*sizeof(MPI_Request),&requests);CHKERRQ(ierr); 36790c7d97c5SJed Brown for(i=0;i<count_recv+1;i++) requests[i]=MPI_REQUEST_NULL; 36800c7d97c5SJed Brown ierr = PetscMalloc ( count_recv*sizeof(PetscMPIInt),&localsizes2);CHKERRQ(ierr); 36810c7d97c5SJed Brown ierr = PetscMalloc ( count_recv*sizeof(PetscMPIInt),&localdispl2);CHKERRQ(ierr); 36820c7d97c5SJed Brown /* fill up quantities */ 36830c7d97c5SJed Brown j=0; 36840c7d97c5SJed Brown for(i=0;i<count_recv;i++){ 36850c7d97c5SJed Brown ii = ranks_recv[i]; 36860c7d97c5SJed Brown localsizes2[i]=pcbddc->local_primal_sizes[ii]*pcbddc->local_primal_sizes[ii]; 36870c7d97c5SJed Brown localdispl2[i]=j; 
36880c7d97c5SJed Brown j+=localsizes2[i]; 36890c7d97c5SJed Brown jj = pcbddc->local_primal_displacements[ii]; 3690da1bb401SStefano Zampini for(k=0;k<pcbddc->local_primal_sizes[ii];k++) aux_ins_indices[pcbddc->replicated_local_primal_indices[jj+k]]+=1; /* it counts the coarse subdomains sharing the coarse node */ 36910c7d97c5SJed Brown } 3692da1bb401SStefano Zampini /*printf("aux_ins_indices 1\n"); 3693da1bb401SStefano Zampini for(i=0;i<pcbddc->coarse_size;i++) 3694da1bb401SStefano Zampini printf("%d ",aux_ins_indices[i]); 3695da1bb401SStefano Zampini printf("\n");*/ 36960c7d97c5SJed Brown /* temp_coarse_mat_vals used to store temporarly received matrix values */ 36970c7d97c5SJed Brown ierr = PetscMalloc ( j*sizeof(PetscScalar),&temp_coarse_mat_vals);CHKERRQ(ierr); 36980c7d97c5SJed Brown /* evaluate how many values I will insert in coarse mat */ 36990c7d97c5SJed Brown ins_local_primal_size=0; 3700*ea7e1babSStefano Zampini for(i=0;i<pcbddc->coarse_size;i++){ 3701*ea7e1babSStefano Zampini if(aux_ins_indices[i]){ 37020c7d97c5SJed Brown ins_local_primal_size++; 3703*ea7e1babSStefano Zampini } 3704*ea7e1babSStefano Zampini } 37050c7d97c5SJed Brown /* evaluate indices I will insert in coarse mat */ 37060c7d97c5SJed Brown ierr = PetscMalloc ( ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr); 37070c7d97c5SJed Brown j=0; 3708*ea7e1babSStefano Zampini for(i=0;i<pcbddc->coarse_size;i++){ 3709*ea7e1babSStefano Zampini if(aux_ins_indices[i]){ 37100c7d97c5SJed Brown ins_local_primal_indices[j++]=i; 3711*ea7e1babSStefano Zampini } 3712*ea7e1babSStefano Zampini } 37130c7d97c5SJed Brown /* use aux_ins_indices to realize a global to local mapping */ 37140c7d97c5SJed Brown j=0; 37150c7d97c5SJed Brown for(i=0;i<pcbddc->coarse_size;i++){ 37160c7d97c5SJed Brown if(aux_ins_indices[i]==0){ 37170c7d97c5SJed Brown aux_ins_indices[i]=-1; 37180c7d97c5SJed Brown } else { 37190c7d97c5SJed Brown aux_ins_indices[i]=j; 37200c7d97c5SJed Brown j++; 37210c7d97c5SJed 
Brown } 37220c7d97c5SJed Brown } 37230c7d97c5SJed Brown 3724da1bb401SStefano Zampini /*printf("New details localsizes2 localdispl2\n"); 3725da1bb401SStefano Zampini for(i=0;i<count_recv;i++) 3726da1bb401SStefano Zampini printf("(%d %d) ",localsizes2[i],localdispl2[i]); 3727da1bb401SStefano Zampini printf("\n"); 3728da1bb401SStefano Zampini printf("aux_ins_indices 2\n"); 3729da1bb401SStefano Zampini for(i=0;i<pcbddc->coarse_size;i++) 3730da1bb401SStefano Zampini printf("%d ",aux_ins_indices[i]); 3731da1bb401SStefano Zampini printf("\n"); 3732da1bb401SStefano Zampini printf("ins_local_primal_indices\n"); 3733da1bb401SStefano Zampini for(i=0;i<ins_local_primal_size;i++) 3734da1bb401SStefano Zampini printf("%d ",ins_local_primal_indices[i]); 3735da1bb401SStefano Zampini printf("\n"); 3736da1bb401SStefano Zampini printf("coarse_submat_vals\n"); 3737da1bb401SStefano Zampini for(i=0;i<pcbddc->local_primal_size;i++) 3738da1bb401SStefano Zampini for(j=0;j<pcbddc->local_primal_size;j++) 3739da1bb401SStefano Zampini printf("(%lf %d %d)\n",coarse_submat_vals[j*pcbddc->local_primal_size+i],pcbddc->local_primal_indices[i],pcbddc->local_primal_indices[j]); 3740da1bb401SStefano Zampini printf("\n");*/ 37410c7d97c5SJed Brown 37420c7d97c5SJed Brown /* processes partecipating in coarse problem receive matrix data from their friends */ 374353cdbc3dSStefano Zampini for(i=0;i<count_recv;i++) ierr = MPI_Irecv(&temp_coarse_mat_vals[localdispl2[i]],localsizes2[i],MPIU_SCALAR,ranks_recv[i],666,prec_comm,&requests[i]);CHKERRQ(ierr); 37440c7d97c5SJed Brown if(rank_coarse_proc_send_to != MPI_PROC_NULL ) { 37450c7d97c5SJed Brown send_size=pcbddc->local_primal_size*pcbddc->local_primal_size; 374653cdbc3dSStefano Zampini ierr = MPI_Isend(&coarse_submat_vals[0],send_size,MPIU_SCALAR,rank_coarse_proc_send_to,666,prec_comm,&requests[count_recv]);CHKERRQ(ierr); 37470c7d97c5SJed Brown } 374853cdbc3dSStefano Zampini ierr = MPI_Waitall(count_recv+1,requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 
37490c7d97c5SJed Brown 3750da1bb401SStefano Zampini /*if(coarse_color == 0) { 3751da1bb401SStefano Zampini printf("temp_coarse_mat_vals\n"); 3752da1bb401SStefano Zampini for(k=0;k<count_recv;k++){ 3753da1bb401SStefano Zampini printf("---- %d ----\n",ranks_recv[k]); 3754da1bb401SStefano Zampini for(i=0;i<pcbddc->local_primal_sizes[ranks_recv[k]];i++) 3755da1bb401SStefano Zampini for(j=0;j<pcbddc->local_primal_sizes[ranks_recv[k]];j++) 3756da1bb401SStefano Zampini printf("(%lf %d %d)\n",temp_coarse_mat_vals[localdispl2[k]+j*pcbddc->local_primal_sizes[ranks_recv[k]]+i],pcbddc->replicated_local_primal_indices[pcbddc->local_primal_displacements[ranks_recv[k]]+i],pcbddc->replicated_local_primal_indices[pcbddc->local_primal_displacements[ranks_recv[k]]+j]); 3757da1bb401SStefano Zampini printf("\n"); 3758da1bb401SStefano Zampini } 3759da1bb401SStefano Zampini }*/ 37600c7d97c5SJed Brown /* calculate data to insert in coarse mat */ 37610c7d97c5SJed Brown ierr = PetscMalloc ( ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar),&ins_coarse_mat_vals);CHKERRQ(ierr); 37620c7d97c5SJed Brown PetscMemzero(ins_coarse_mat_vals,ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar)); 37630c7d97c5SJed Brown 37640c7d97c5SJed Brown PetscMPIInt rr,kk,lps,lpd; 37650c7d97c5SJed Brown PetscInt row_ind,col_ind; 37660c7d97c5SJed Brown for(k=0;k<count_recv;k++){ 37670c7d97c5SJed Brown rr = ranks_recv[k]; 37680c7d97c5SJed Brown kk = localdispl2[k]; 37690c7d97c5SJed Brown lps = pcbddc->local_primal_sizes[rr]; 37700c7d97c5SJed Brown lpd = pcbddc->local_primal_displacements[rr]; 3771da1bb401SStefano Zampini /*printf("Inserting the following indices (received from %d)\n",rr);*/ 37720c7d97c5SJed Brown for(j=0;j<lps;j++){ 37730c7d97c5SJed Brown col_ind=aux_ins_indices[pcbddc->replicated_local_primal_indices[lpd+j]]; 37740c7d97c5SJed Brown for(i=0;i<lps;i++){ 37750c7d97c5SJed Brown row_ind=aux_ins_indices[pcbddc->replicated_local_primal_indices[lpd+i]]; 3776da1bb401SStefano Zampini 
/*printf("%d %d\n",row_ind,col_ind);*/ 37770c7d97c5SJed Brown ins_coarse_mat_vals[col_ind*ins_local_primal_size+row_ind]+=temp_coarse_mat_vals[kk+j*lps+i]; 37780c7d97c5SJed Brown } 37790c7d97c5SJed Brown } 37800c7d97c5SJed Brown } 37810c7d97c5SJed Brown ierr = PetscFree(requests);CHKERRQ(ierr); 37820c7d97c5SJed Brown ierr = PetscFree(aux_ins_indices);CHKERRQ(ierr); 37830c7d97c5SJed Brown ierr = PetscFree(temp_coarse_mat_vals);CHKERRQ(ierr); 37840c7d97c5SJed Brown if(coarse_color == 0) { ierr = PetscFree(ranks_recv);CHKERRQ(ierr); } 37850c7d97c5SJed Brown 37860c7d97c5SJed Brown /* create local to global mapping needed by coarse MATIS */ 37870c7d97c5SJed Brown { 37880c7d97c5SJed Brown IS coarse_IS; 378953cdbc3dSStefano Zampini if(coarse_comm != MPI_COMM_NULL ) ierr = MPI_Comm_free(&coarse_comm);CHKERRQ(ierr); 37900c7d97c5SJed Brown coarse_comm = prec_comm; 37910c7d97c5SJed Brown active_rank=rank_prec_comm; 37920c7d97c5SJed Brown ierr = ISCreateGeneral(coarse_comm,ins_local_primal_size,ins_local_primal_indices,PETSC_COPY_VALUES,&coarse_IS);CHKERRQ(ierr); 37930c7d97c5SJed Brown ierr = ISLocalToGlobalMappingCreateIS(coarse_IS,&coarse_ISLG);CHKERRQ(ierr); 37940c7d97c5SJed Brown ierr = ISDestroy(&coarse_IS);CHKERRQ(ierr); 37950c7d97c5SJed Brown } 37960c7d97c5SJed Brown } 37970c7d97c5SJed Brown if(pcbddc->coarse_problem_type==PARALLEL_BDDC) { 37980c7d97c5SJed Brown /* arrays for values insertion */ 37990c7d97c5SJed Brown ins_local_primal_size = pcbddc->local_primal_size; 38000c7d97c5SJed Brown ierr = PetscMalloc ( ins_local_primal_size*sizeof(PetscMPIInt),&ins_local_primal_indices);CHKERRQ(ierr); 38010c7d97c5SJed Brown ierr = PetscMalloc ( ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar),&ins_coarse_mat_vals);CHKERRQ(ierr); 38020c7d97c5SJed Brown for(j=0;j<ins_local_primal_size;j++){ 38030c7d97c5SJed Brown ins_local_primal_indices[j]=pcbddc->local_primal_indices[j]; 38040c7d97c5SJed Brown for(i=0;i<ins_local_primal_size;i++) 
ins_coarse_mat_vals[j*ins_local_primal_size+i]=coarse_submat_vals[j*ins_local_primal_size+i]; 38050c7d97c5SJed Brown } 38060c7d97c5SJed Brown } 38070c7d97c5SJed Brown break; 38080c7d97c5SJed Brown 38090c7d97c5SJed Brown } 38100c7d97c5SJed Brown 38110c7d97c5SJed Brown case(GATHERS_BDDC): 38120c7d97c5SJed Brown { 38130c7d97c5SJed Brown 38140c7d97c5SJed Brown PetscMPIInt mysize,mysize2; 38150c7d97c5SJed Brown 38160c7d97c5SJed Brown if(rank_prec_comm==active_rank) { 38170c7d97c5SJed Brown ierr = PetscMalloc ( pcbddc->replicated_primal_size*sizeof(PetscMPIInt),&pcbddc->replicated_local_primal_indices);CHKERRQ(ierr); 38180c7d97c5SJed Brown pcbddc->replicated_local_primal_values = (PetscScalar*)calloc(pcbddc->replicated_primal_size,sizeof(PetscScalar)); 38190c7d97c5SJed Brown ierr = PetscMalloc ( size_prec_comm*sizeof(PetscMPIInt),&localsizes2);CHKERRQ(ierr); 38200c7d97c5SJed Brown ierr = PetscMalloc ( size_prec_comm*sizeof(PetscMPIInt),&localdispl2);CHKERRQ(ierr); 38210c7d97c5SJed Brown /* arrays for values insertion */ 38220c7d97c5SJed Brown for(i=0;i<size_prec_comm;i++) localsizes2[i]=pcbddc->local_primal_sizes[i]*pcbddc->local_primal_sizes[i]; 38230c7d97c5SJed Brown localdispl2[0]=0; 38240c7d97c5SJed Brown for(i=1;i<size_prec_comm;i++) localdispl2[i]=localsizes2[i-1]+localdispl2[i-1]; 38250c7d97c5SJed Brown j=0; 38260c7d97c5SJed Brown for(i=0;i<size_prec_comm;i++) j+=localsizes2[i]; 38270c7d97c5SJed Brown ierr = PetscMalloc ( j*sizeof(PetscScalar),&temp_coarse_mat_vals);CHKERRQ(ierr); 38280c7d97c5SJed Brown } 38290c7d97c5SJed Brown 38300c7d97c5SJed Brown mysize=pcbddc->local_primal_size; 38310c7d97c5SJed Brown mysize2=pcbddc->local_primal_size*pcbddc->local_primal_size; 38320c7d97c5SJed Brown if(pcbddc->coarse_problem_type == SEQUENTIAL_BDDC){ 383353cdbc3dSStefano Zampini ierr = 
MPI_Gatherv(&pcbddc->local_primal_indices[0],mysize,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr); 383453cdbc3dSStefano Zampini ierr = MPI_Gatherv(&coarse_submat_vals[0],mysize2,MPIU_SCALAR,&temp_coarse_mat_vals[0],localsizes2,localdispl2,MPIU_SCALAR,master_proc,prec_comm);CHKERRQ(ierr); 38350c7d97c5SJed Brown } else { 383653cdbc3dSStefano Zampini ierr = MPI_Allgatherv(&pcbddc->local_primal_indices[0],mysize,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,prec_comm);CHKERRQ(ierr); 383753cdbc3dSStefano Zampini ierr = MPI_Allgatherv(&coarse_submat_vals[0],mysize2,MPIU_SCALAR,&temp_coarse_mat_vals[0],localsizes2,localdispl2,MPIU_SCALAR,prec_comm);CHKERRQ(ierr); 38380c7d97c5SJed Brown } 38390c7d97c5SJed Brown break; 3840da1bb401SStefano Zampini }/* switch on coarse problem and communications associated with finished */ 38410c7d97c5SJed Brown } 38420c7d97c5SJed Brown 38430c7d97c5SJed Brown /* Now create and fill up coarse matrix */ 38440c7d97c5SJed Brown if( rank_prec_comm == active_rank ) { 38450c7d97c5SJed Brown if(pcbddc->coarse_problem_type != MULTILEVEL_BDDC) { 38460c7d97c5SJed Brown ierr = MatCreate(coarse_comm,&pcbddc->coarse_mat);CHKERRQ(ierr); 38470c7d97c5SJed Brown ierr = MatSetSizes(pcbddc->coarse_mat,PETSC_DECIDE,PETSC_DECIDE,pcbddc->coarse_size,pcbddc->coarse_size);CHKERRQ(ierr); 38480c7d97c5SJed Brown ierr = MatSetType(pcbddc->coarse_mat,coarse_mat_type);CHKERRQ(ierr); 38493b03a366Sstefano_zampini ierr = MatSetUp(pcbddc->coarse_mat);CHKERRQ(ierr); 3850da1bb401SStefano Zampini ierr = MatSetOption(pcbddc->coarse_mat,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr); /* local values stored in column major */ 38513b03a366Sstefano_zampini ierr = MatSetOption(pcbddc->coarse_mat,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr); 38520c7d97c5SJed Brown } else { 38530c7d97c5SJed 
Brown Mat matis_coarse_local_mat; 3854d3ee2243SStefano Zampini /* remind bs */ 3855d3ee2243SStefano Zampini ierr = MatCreateIS(coarse_comm,bs,PETSC_DECIDE,PETSC_DECIDE,pcbddc->coarse_size,pcbddc->coarse_size,coarse_ISLG,&pcbddc->coarse_mat);CHKERRQ(ierr); 38563b03a366Sstefano_zampini ierr = MatSetUp(pcbddc->coarse_mat);CHKERRQ(ierr); 38570c7d97c5SJed Brown ierr = MatISGetLocalMat(pcbddc->coarse_mat,&matis_coarse_local_mat);CHKERRQ(ierr); 38583b03a366Sstefano_zampini ierr = MatSetUp(matis_coarse_local_mat);CHKERRQ(ierr); 3859da1bb401SStefano Zampini ierr = MatSetOption(matis_coarse_local_mat,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr); /* local values stored in column major */ 3860a0ba757dSStefano Zampini ierr = MatSetOption(matis_coarse_local_mat,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr); 38610c7d97c5SJed Brown } 3862a0ba757dSStefano Zampini ierr = MatSetOption(pcbddc->coarse_mat,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_FALSE);CHKERRQ(ierr); 3863*ea7e1babSStefano Zampini if(pcbddc->coarse_communications_type != GATHERS_BDDC) { 38640c7d97c5SJed Brown ierr = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,ADD_VALUES);CHKERRQ(ierr); 3865*ea7e1babSStefano Zampini } else { 3866*ea7e1babSStefano Zampini for(k=0;k<size_prec_comm;k++){ 3867*ea7e1babSStefano Zampini offset=pcbddc->local_primal_displacements[k]; 3868*ea7e1babSStefano Zampini offset2=localdispl2[k]; 3869*ea7e1babSStefano Zampini ins_local_primal_size = pcbddc->local_primal_sizes[k]; 3870*ea7e1babSStefano Zampini ins_local_primal_indices = &pcbddc->replicated_local_primal_indices[offset]; 3871*ea7e1babSStefano Zampini ins_coarse_mat_vals = &temp_coarse_mat_vals[offset2]; 3872*ea7e1babSStefano Zampini ierr = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,ADD_VALUES);CHKERRQ(ierr); 3873*ea7e1babSStefano Zampini } 
3874*ea7e1babSStefano Zampini ins_local_primal_indices = 0; 3875*ea7e1babSStefano Zampini ins_coarse_mat_vals = 0; 3876*ea7e1babSStefano Zampini } 38770c7d97c5SJed Brown ierr = MatAssemblyBegin(pcbddc->coarse_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 38780c7d97c5SJed Brown ierr = MatAssemblyEnd(pcbddc->coarse_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr); 38790c7d97c5SJed Brown 3880da1bb401SStefano Zampini /* PetscViewer view_out; 3881da1bb401SStefano Zampini ierr = PetscViewerASCIIOpen(PETSC_COMM_SELF,"coarsematfull.m",&view_out);CHKERRQ(ierr); 3882da1bb401SStefano Zampini ierr = PetscViewerSetFormat(view_out,PETSC_VIEWER_ASCII_MATLAB);CHKERRQ(ierr); 3883da1bb401SStefano Zampini ierr = MatView(pcbddc->coarse_mat,view_out);CHKERRQ(ierr); 3884da1bb401SStefano Zampini ierr = PetscViewerDestroy(&view_out);CHKERRQ(ierr);*/ 3885da1bb401SStefano Zampini 38860c7d97c5SJed Brown ierr = MatGetVecs(pcbddc->coarse_mat,&pcbddc->coarse_vec,&pcbddc->coarse_rhs);CHKERRQ(ierr); 38870c7d97c5SJed Brown /* Preconditioner for coarse problem */ 388853cdbc3dSStefano Zampini ierr = KSPCreate(coarse_comm,&pcbddc->coarse_ksp);CHKERRQ(ierr); 388953cdbc3dSStefano Zampini ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->coarse_ksp,(PetscObject)pc,1);CHKERRQ(ierr); 389053cdbc3dSStefano Zampini ierr = KSPSetOperators(pcbddc->coarse_ksp,pcbddc->coarse_mat,pcbddc->coarse_mat,SAME_PRECONDITIONER);CHKERRQ(ierr); 38913b03a366Sstefano_zampini ierr = KSPSetTolerances(pcbddc->coarse_ksp,PETSC_DEFAULT,PETSC_DEFAULT,PETSC_DEFAULT,max_it_coarse_ksp);CHKERRQ(ierr); 389253cdbc3dSStefano Zampini ierr = KSPSetType(pcbddc->coarse_ksp,coarse_ksp_type);CHKERRQ(ierr); 389353cdbc3dSStefano Zampini ierr = KSPGetPC(pcbddc->coarse_ksp,&pc_temp);CHKERRQ(ierr); 389453cdbc3dSStefano Zampini ierr = PCSetType(pc_temp,coarse_pc_type);CHKERRQ(ierr); 38950c7d97c5SJed Brown /* Allow user's customization */ 3896da1bb401SStefano Zampini ierr = KSPSetOptionsPrefix(pcbddc->coarse_ksp,"coarse_");CHKERRQ(ierr); 389753cdbc3dSStefano 
Zampini ierr = KSPSetFromOptions(pcbddc->coarse_ksp);CHKERRQ(ierr); 38980c7d97c5SJed Brown /* Set Up PC for coarse problem BDDC */ 389953cdbc3dSStefano Zampini if(pcbddc->coarse_problem_type == MULTILEVEL_BDDC) { 3900e269702eSStefano Zampini if(dbg_flag) { 3901e269702eSStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"----------------Setting up a new level---------------\n");CHKERRQ(ierr); 3902e269702eSStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 3903e269702eSStefano Zampini } 390453cdbc3dSStefano Zampini ierr = PCBDDCSetCoarseProblemType(pc_temp,MULTILEVEL_BDDC);CHKERRQ(ierr); 390553cdbc3dSStefano Zampini } 390653cdbc3dSStefano Zampini ierr = KSPSetUp(pcbddc->coarse_ksp);CHKERRQ(ierr); 39075619798eSStefano Zampini if(pcbddc->coarse_problem_type == MULTILEVEL_BDDC) { 39085619798eSStefano Zampini if(dbg_flag) { 39095619798eSStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"----------------New level set------------------------\n");CHKERRQ(ierr); 39105619798eSStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 39115619798eSStefano Zampini } 39125619798eSStefano Zampini } 39130c7d97c5SJed Brown } 39140c7d97c5SJed Brown if(pcbddc->coarse_communications_type == SCATTERS_BDDC) { 39150c7d97c5SJed Brown IS local_IS,global_IS; 39160c7d97c5SJed Brown ierr = ISCreateStride(PETSC_COMM_SELF,pcbddc->local_primal_size,0,1,&local_IS);CHKERRQ(ierr); 39170c7d97c5SJed Brown ierr = ISCreateGeneral(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_indices,PETSC_COPY_VALUES,&global_IS);CHKERRQ(ierr); 39180c7d97c5SJed Brown ierr = VecScatterCreate(pcbddc->vec1_P,local_IS,pcbddc->coarse_vec,global_IS,&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr); 39190c7d97c5SJed Brown ierr = ISDestroy(&local_IS);CHKERRQ(ierr); 39200c7d97c5SJed Brown ierr = ISDestroy(&global_IS);CHKERRQ(ierr); 39210c7d97c5SJed Brown } 39220c7d97c5SJed Brown 39230c7d97c5SJed Brown 39243b03a366Sstefano_zampini /* Evaluate condition number of coarse problem for cheby (and verbose 
output if requested) */ 39253b03a366Sstefano_zampini if( pcbddc->coarse_problem_type == MULTILEVEL_BDDC && rank_prec_comm == active_rank ) { 39260c7d97c5SJed Brown PetscScalar m_one=-1.0; 39275619798eSStefano Zampini PetscReal infty_error,lambda_min,lambda_max,kappa_2; 39283b03a366Sstefano_zampini const KSPType check_ksp_type=KSPGMRES; 39290c7d97c5SJed Brown 39305619798eSStefano Zampini /* change coarse ksp object to an iterative method suitable for extreme eigenvalues' estimation */ 39313b03a366Sstefano_zampini ierr = KSPSetType(pcbddc->coarse_ksp,check_ksp_type);CHKERRQ(ierr); 3932d49ef151SStefano Zampini ierr = KSPSetComputeSingularValues(pcbddc->coarse_ksp,PETSC_TRUE);CHKERRQ(ierr); 39335619798eSStefano Zampini ierr = KSPSetTolerances(pcbddc->coarse_ksp,1.e-8,1.e-8,PETSC_DEFAULT,pcbddc->coarse_size);CHKERRQ(ierr); 39345619798eSStefano Zampini ierr = KSPSetUp(pcbddc->coarse_ksp);CHKERRQ(ierr); 3935d49ef151SStefano Zampini ierr = VecSetRandom(pcbddc->coarse_rhs,PETSC_NULL);CHKERRQ(ierr); 3936d49ef151SStefano Zampini ierr = MatMult(pcbddc->coarse_mat,pcbddc->coarse_rhs,pcbddc->coarse_vec);CHKERRQ(ierr); 3937d49ef151SStefano Zampini ierr = MatMult(pcbddc->coarse_mat,pcbddc->coarse_vec,pcbddc->coarse_rhs);CHKERRQ(ierr); 3938d49ef151SStefano Zampini ierr = KSPSolve(pcbddc->coarse_ksp,pcbddc->coarse_rhs,pcbddc->coarse_rhs);CHKERRQ(ierr); 3939d49ef151SStefano Zampini ierr = KSPComputeExtremeSingularValues(pcbddc->coarse_ksp,&lambda_max,&lambda_min);CHKERRQ(ierr); 39403b03a366Sstefano_zampini if(dbg_flag) { 39415619798eSStefano Zampini kappa_2=lambda_max/lambda_min; 39425619798eSStefano Zampini ierr = KSPGetIterationNumber(pcbddc->coarse_ksp,&k);CHKERRQ(ierr); 3943d49ef151SStefano Zampini ierr = VecAXPY(pcbddc->coarse_rhs,m_one,pcbddc->coarse_vec);CHKERRQ(ierr); 3944d49ef151SStefano Zampini ierr = VecNorm(pcbddc->coarse_rhs,NORM_INFINITY,&infty_error);CHKERRQ(ierr); 39453b03a366Sstefano_zampini ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem condition number 
estimated with %d iterations of %s is: % 1.14e\n",k,check_ksp_type,kappa_2);CHKERRQ(ierr); 3946e269702eSStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem eigenvalues: % 1.14e %1.14e\n",lambda_min,lambda_max);CHKERRQ(ierr); 3947e269702eSStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem infty_error: %1.14e\n",infty_error);CHKERRQ(ierr); 39483b03a366Sstefano_zampini } 39495619798eSStefano Zampini /* restore coarse ksp to default values */ 3950d49ef151SStefano Zampini ierr = KSPSetComputeSingularValues(pcbddc->coarse_ksp,PETSC_FALSE);CHKERRQ(ierr); 39515619798eSStefano Zampini ierr = KSPSetType(pcbddc->coarse_ksp,coarse_ksp_type);CHKERRQ(ierr); 39526c9de887SHong Zhang ierr = KSPChebyshevSetEigenvalues(pcbddc->coarse_ksp,lambda_max,lambda_min);CHKERRQ(ierr); 39533b03a366Sstefano_zampini ierr = KSPSetTolerances(pcbddc->coarse_ksp,PETSC_DEFAULT,PETSC_DEFAULT,PETSC_DEFAULT,max_it_coarse_ksp);CHKERRQ(ierr); 39545619798eSStefano Zampini ierr = KSPSetFromOptions(pcbddc->coarse_ksp);CHKERRQ(ierr); 39555619798eSStefano Zampini ierr = KSPSetUp(pcbddc->coarse_ksp);CHKERRQ(ierr); 395653cdbc3dSStefano Zampini } 39570c7d97c5SJed Brown 39580c7d97c5SJed Brown /* free data structures no longer needed */ 39590c7d97c5SJed Brown if(coarse_ISLG) { ierr = ISLocalToGlobalMappingDestroy(&coarse_ISLG);CHKERRQ(ierr); } 39600c7d97c5SJed Brown if(ins_local_primal_indices) { ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr); } 39610c7d97c5SJed Brown if(ins_coarse_mat_vals) { ierr = PetscFree(ins_coarse_mat_vals);CHKERRQ(ierr);} 39620c7d97c5SJed Brown if(localsizes2) { ierr = PetscFree(localsizes2);CHKERRQ(ierr);} 39630c7d97c5SJed Brown if(localdispl2) { ierr = PetscFree(localdispl2);CHKERRQ(ierr);} 39640c7d97c5SJed Brown if(temp_coarse_mat_vals) { ierr = PetscFree(temp_coarse_mat_vals);CHKERRQ(ierr);} 39650c7d97c5SJed Brown 39660c7d97c5SJed Brown PetscFunctionReturn(0); 39670c7d97c5SJed Brown } 39680c7d97c5SJed Brown 39690c7d97c5SJed Brown #undef 
__FUNCT__ 39700c7d97c5SJed Brown #define __FUNCT__ "PCBDDCManageLocalBoundaries" 397153cdbc3dSStefano Zampini static PetscErrorCode PCBDDCManageLocalBoundaries(PC pc) 39720c7d97c5SJed Brown { 39730c7d97c5SJed Brown 39740c7d97c5SJed Brown PC_BDDC *pcbddc = (PC_BDDC*)pc->data; 39750c7d97c5SJed Brown PC_IS *pcis = (PC_IS*)pc->data; 39760c7d97c5SJed Brown Mat_IS *matis = (Mat_IS*)pc->pmat->data; 3977da1bb401SStefano Zampini PCBDDCGraph mat_graph=pcbddc->mat_graph; 39783972b0daSStefano Zampini PetscInt *queue_in_global_numbering,*is_indices,*auxis; 39793b03a366Sstefano_zampini PetscInt bs,ierr,i,j,s,k,iindex,neumann_bsize,dirichlet_bsize; 3980da1bb401SStefano Zampini PetscInt total_counts,nodes_touched,where_values=1,vertex_size; 3981534831adSStefano Zampini PetscMPIInt adapt_interface=0,adapt_interface_reduced=0,NEUMANNCNT=0; 3982da1bb401SStefano Zampini PetscBool same_set; 3983a0ba757dSStefano Zampini MPI_Comm interface_comm=((PetscObject)pc)->comm; 39843b03a366Sstefano_zampini PetscBool use_faces=PETSC_FALSE,use_edges=PETSC_FALSE; 39853b03a366Sstefano_zampini const PetscInt *neumann_nodes; 39863b03a366Sstefano_zampini const PetscInt *dirichlet_nodes; 3987a81d60d8SStefano Zampini IS used_IS,*custom_ISForDofs; 3988da1bb401SStefano Zampini PetscScalar *array; 3989da1bb401SStefano Zampini PetscScalar *array2; 3990da1bb401SStefano Zampini PetscViewer viewer=pcbddc->dbg_viewer; 39910c7d97c5SJed Brown 39920c7d97c5SJed Brown PetscFunctionBegin; 3993da1bb401SStefano Zampini /* Setup local adjacency graph */ 3994da1bb401SStefano Zampini mat_graph->nvtxs=pcis->n; 3995534831adSStefano Zampini if(!mat_graph->xadj) { NEUMANNCNT = 1; } 3996da1bb401SStefano Zampini ierr = PCBDDCSetupLocalAdjacencyGraph(pc);CHKERRQ(ierr); 3997a0ba757dSStefano Zampini i = mat_graph->nvtxs; 3998a0ba757dSStefano Zampini ierr = PetscMalloc4(i,PetscInt,&mat_graph->where,i,PetscInt,&mat_graph->count,i+1,PetscInt,&mat_graph->cptr,i,PetscInt,&mat_graph->queue);CHKERRQ(ierr); 39993972b0daSStefano Zampini ierr 
= PetscMalloc2(i,PetscInt,&mat_graph->which_dof,i,PetscBool,&mat_graph->touched);CHKERRQ(ierr); 40003972b0daSStefano Zampini ierr = PetscMalloc(i*sizeof(PetscInt),&queue_in_global_numbering);CHKERRQ(ierr); 4001a0ba757dSStefano Zampini ierr = PetscMemzero(mat_graph->where,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr); 4002a0ba757dSStefano Zampini ierr = PetscMemzero(mat_graph->count,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr); 4003a0ba757dSStefano Zampini ierr = PetscMemzero(mat_graph->which_dof,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr); 4004a0ba757dSStefano Zampini ierr = PetscMemzero(mat_graph->queue,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr); 40053828260eSStefano Zampini ierr = PetscMemzero(mat_graph->cptr,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr); 4006a0ba757dSStefano Zampini 4007a81d60d8SStefano Zampini /* Setting dofs splitting in mat_graph->which_dof 4008a81d60d8SStefano Zampini Get information about dofs' splitting if provided by the user 4009a81d60d8SStefano Zampini Otherwise it assumes a constant block size */ 4010a81d60d8SStefano Zampini vertex_size=0; 4011a81d60d8SStefano Zampini if(!pcbddc->n_ISForDofs) { 4012a81d60d8SStefano Zampini ierr = MatGetBlockSize(matis->A,&bs);CHKERRQ(ierr); 4013a81d60d8SStefano Zampini ierr = PetscMalloc(bs*sizeof(IS),&custom_ISForDofs);CHKERRQ(ierr); 4014a81d60d8SStefano Zampini for(i=0;i<bs;i++) { 4015a81d60d8SStefano Zampini ierr = ISCreateStride(PETSC_COMM_SELF,pcis->n/bs,i,bs,&custom_ISForDofs[i]);CHKERRQ(ierr); 4016a81d60d8SStefano Zampini } 4017a81d60d8SStefano Zampini ierr = PCBDDCSetDofsSplitting(pc,bs,custom_ISForDofs);CHKERRQ(ierr); 4018a81d60d8SStefano Zampini vertex_size=1; 4019a81d60d8SStefano Zampini /* remove my references to IS objects */ 4020a81d60d8SStefano Zampini for(i=0;i<bs;i++) { 4021a81d60d8SStefano Zampini ierr = ISDestroy(&custom_ISForDofs[i]);CHKERRQ(ierr); 4022a81d60d8SStefano Zampini } 4023a81d60d8SStefano Zampini ierr = PetscFree(custom_ISForDofs);CHKERRQ(ierr); 
4024a81d60d8SStefano Zampini } 40259c0446d6SStefano Zampini for(i=0;i<pcbddc->n_ISForDofs;i++) { 4026a81d60d8SStefano Zampini ierr = ISGetSize(pcbddc->ISForDofs[i],&k);CHKERRQ(ierr); 40279c0446d6SStefano Zampini ierr = ISGetIndices(pcbddc->ISForDofs[i],(const PetscInt**)&is_indices);CHKERRQ(ierr); 4028a81d60d8SStefano Zampini for(j=0;j<k;j++) { 40299c0446d6SStefano Zampini mat_graph->which_dof[is_indices[j]]=i; 40309c0446d6SStefano Zampini } 40319c0446d6SStefano Zampini ierr = ISRestoreIndices(pcbddc->ISForDofs[i],(const PetscInt**)&is_indices);CHKERRQ(ierr); 40329c0446d6SStefano Zampini } 4033a81d60d8SStefano Zampini /* use mat block size as vertex size if it has not yet set */ 4034a81d60d8SStefano Zampini if(!vertex_size) { 40353b03a366Sstefano_zampini ierr = MatGetBlockSize(matis->A,&vertex_size);CHKERRQ(ierr); 40360c7d97c5SJed Brown } 4037a81d60d8SStefano Zampini 40383b03a366Sstefano_zampini /* count number of neigh per node */ 40390c7d97c5SJed Brown total_counts=0; 40403b03a366Sstefano_zampini for(i=1;i<pcis->n_neigh;i++){ 40410c7d97c5SJed Brown s=pcis->n_shared[i]; 40420c7d97c5SJed Brown total_counts+=s; 404353cdbc3dSStefano Zampini for(j=0;j<s;j++){ 40440c7d97c5SJed Brown mat_graph->count[pcis->shared[i][j]] += 1; 40450c7d97c5SJed Brown } 40460c7d97c5SJed Brown } 4047534831adSStefano Zampini /* Take into account Neumann data -> it increments number of sharing subdomains for nodes lying on the interface */ 404836e030ebSStefano Zampini ierr = PCBDDCGetNeumannBoundaries(pc,&used_IS);CHKERRQ(ierr); 4049da1bb401SStefano Zampini ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr); 4050da1bb401SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 405136e030ebSStefano Zampini if(used_IS) { 405236e030ebSStefano Zampini ierr = ISGetSize(used_IS,&neumann_bsize);CHKERRQ(ierr); 405336e030ebSStefano Zampini ierr = ISGetIndices(used_IS,&neumann_nodes);CHKERRQ(ierr); 405453cdbc3dSStefano Zampini for(i=0;i<neumann_bsize;i++){ 405553cdbc3dSStefano Zampini iindex = 
neumann_nodes[i]; 4056534831adSStefano Zampini if(mat_graph->count[iindex] > NEUMANNCNT && array[iindex]==0.0){ 405753cdbc3dSStefano Zampini mat_graph->count[iindex]+=1; 40580c7d97c5SJed Brown total_counts++; 4059da1bb401SStefano Zampini array[iindex]=array[iindex]+1.0; 4060da1bb401SStefano Zampini } else if(array[iindex]>0.0) { 4061da1bb401SStefano Zampini SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"Error for neumann nodes provided to BDDC! They must be uniquely listed! Found duplicate node %d\n",iindex); 40620c7d97c5SJed Brown } 40630c7d97c5SJed Brown } 40640c7d97c5SJed Brown } 4065da1bb401SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 4066da1bb401SStefano Zampini /* allocate space for storing the set of neighbours for each node */ 4067da1bb401SStefano Zampini ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt*),&mat_graph->neighbours_set);CHKERRQ(ierr); 4068da1bb401SStefano Zampini if(mat_graph->nvtxs) { ierr = PetscMalloc(total_counts*sizeof(PetscInt),&mat_graph->neighbours_set[0]);CHKERRQ(ierr); } 4069da1bb401SStefano Zampini for(i=1;i<mat_graph->nvtxs;i++) mat_graph->neighbours_set[i]=mat_graph->neighbours_set[i-1]+mat_graph->count[i-1]; 4070a0ba757dSStefano Zampini ierr = PetscMemzero(mat_graph->count,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr); 40713b03a366Sstefano_zampini for(i=1;i<pcis->n_neigh;i++){ 40720c7d97c5SJed Brown s=pcis->n_shared[i]; 40730c7d97c5SJed Brown for(j=0;j<s;j++) { 40740c7d97c5SJed Brown k=pcis->shared[i][j]; 4075da1bb401SStefano Zampini mat_graph->neighbours_set[k][mat_graph->count[k]] = pcis->neigh[i]; 40760c7d97c5SJed Brown mat_graph->count[k]+=1; 40770c7d97c5SJed Brown } 40780c7d97c5SJed Brown } 4079da1bb401SStefano Zampini /* Check consistency of Neumann nodes */ 4080da1bb401SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 4081da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 4082da1bb401SStefano 
Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 4083da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 4084da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 4085da1bb401SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 40863b03a366Sstefano_zampini /* set -1 fake neighbour to mimic Neumann boundary */ 408736e030ebSStefano Zampini if(used_IS) { 408853cdbc3dSStefano Zampini for(i=0;i<neumann_bsize;i++){ 408953cdbc3dSStefano Zampini iindex = neumann_nodes[i]; 4090534831adSStefano Zampini if(mat_graph->count[iindex] > NEUMANNCNT){ 4091da1bb401SStefano Zampini if(mat_graph->count[iindex]+1 != (PetscInt)array[iindex]) { 4092da1bb401SStefano Zampini SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_USER,"Neumann nodes provided to BDDC must be consistent among neighbours!\nNode %d: number of sharing subdomains %d != number of subdomains for which it is a neumann node %d\n",iindex,mat_graph->count[iindex]+1,(PetscInt)array[iindex]); 4093da1bb401SStefano Zampini } 4094da1bb401SStefano Zampini mat_graph->neighbours_set[iindex][mat_graph->count[iindex]] = -1; 409553cdbc3dSStefano Zampini mat_graph->count[iindex]+=1; 40960c7d97c5SJed Brown } 40970c7d97c5SJed Brown } 409836e030ebSStefano Zampini ierr = ISRestoreIndices(used_IS,&neumann_nodes);CHKERRQ(ierr); 40990c7d97c5SJed Brown } 4100da1bb401SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 4101da1bb401SStefano Zampini /* sort set of sharing subdomains */ 4102da1bb401SStefano Zampini for(i=0;i<mat_graph->nvtxs;i++) { ierr = PetscSortInt(mat_graph->count[i],mat_graph->neighbours_set[i]);CHKERRQ(ierr); } 41033b03a366Sstefano_zampini /* remove interior nodes and dirichlet boundary nodes from the next search into the graph */ 4104da1bb401SStefano Zampini 
for(i=0;i<mat_graph->nvtxs;i++){mat_graph->touched[i]=PETSC_FALSE;} 4105da1bb401SStefano Zampini nodes_touched=0; 410636e030ebSStefano Zampini ierr = PCBDDCGetDirichletBoundaries(pc,&used_IS);CHKERRQ(ierr); 4107da1bb401SStefano Zampini ierr = VecSet(pcis->vec2_N,0.0);CHKERRQ(ierr); 4108da1bb401SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 4109da1bb401SStefano Zampini ierr = VecGetArray(pcis->vec2_N,&array2);CHKERRQ(ierr); 4110da1bb401SStefano Zampini if(used_IS) { 4111da1bb401SStefano Zampini ierr = ISGetSize(used_IS,&dirichlet_bsize);CHKERRQ(ierr); 4112da1bb401SStefano Zampini if(dirichlet_bsize && matis->pure_neumann) { 4113da1bb401SStefano Zampini SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"Dirichlet boundaries are intended to be used with matrices with zeroed rows!\n"); 4114da1bb401SStefano Zampini } 4115da1bb401SStefano Zampini ierr = ISGetIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr); 4116da1bb401SStefano Zampini for(i=0;i<dirichlet_bsize;i++){ 4117da1bb401SStefano Zampini iindex=dirichlet_nodes[i]; 4118da1bb401SStefano Zampini if(mat_graph->count[iindex] && !mat_graph->touched[iindex]) { 4119da1bb401SStefano Zampini if(array[iindex]>0.0) { 4120da1bb401SStefano Zampini SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"BDDC cannot have nodes which are marked as Neumann and Dirichlet at the same time! 
Wrong node %d\n",iindex); 4121da1bb401SStefano Zampini } 4122da1bb401SStefano Zampini mat_graph->touched[iindex]=PETSC_TRUE; 4123da1bb401SStefano Zampini mat_graph->where[iindex]=0; 4124da1bb401SStefano Zampini nodes_touched++; 4125da1bb401SStefano Zampini array2[iindex]=array2[iindex]+1.0; 4126da1bb401SStefano Zampini } 4127da1bb401SStefano Zampini } 4128da1bb401SStefano Zampini ierr = ISRestoreIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr); 4129da1bb401SStefano Zampini } 4130da1bb401SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 4131da1bb401SStefano Zampini ierr = VecRestoreArray(pcis->vec2_N,&array2);CHKERRQ(ierr); 4132da1bb401SStefano Zampini /* Check consistency of Dirichlet nodes */ 4133da1bb401SStefano Zampini ierr = VecSet(pcis->vec1_N,1.0);CHKERRQ(ierr); 4134da1bb401SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 4135da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 4136da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 4137da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 4138da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 4139da1bb401SStefano Zampini ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr); 4140da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec2_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 4141da1bb401SStefano Zampini ierr = VecScatterEnd (matis->ctx,pcis->vec2_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr); 4142da1bb401SStefano Zampini ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 4143da1bb401SStefano Zampini ierr = VecScatterEnd 
(matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr); 4144da1bb401SStefano Zampini ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr); 4145da1bb401SStefano Zampini ierr = VecGetArray(pcis->vec2_N,&array2);CHKERRQ(ierr); 414636e030ebSStefano Zampini if(used_IS) { 414736e030ebSStefano Zampini ierr = ISGetSize(used_IS,&dirichlet_bsize);CHKERRQ(ierr); 414836e030ebSStefano Zampini ierr = ISGetIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr); 41493b03a366Sstefano_zampini for(i=0;i<dirichlet_bsize;i++){ 4150da1bb401SStefano Zampini iindex=dirichlet_nodes[i]; 4151da1bb401SStefano Zampini if(array[iindex]>1.0 && array[iindex]!=array2[iindex] ) { 4152da1bb401SStefano Zampini SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_USER,"Dirichlet nodes provided to BDDC must be consistent among neighbours!\nNode %d: number of sharing subdomains %d != number of subdomains for which it is a neumann node %d\n",iindex,(PetscInt)array[iindex],(PetscInt)array2[iindex]); 4153da1bb401SStefano Zampini } 41543b03a366Sstefano_zampini } 415536e030ebSStefano Zampini ierr = ISRestoreIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr); 41563b03a366Sstefano_zampini } 4157da1bb401SStefano Zampini ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr); 4158da1bb401SStefano Zampini ierr = VecRestoreArray(pcis->vec2_N,&array2);CHKERRQ(ierr); 4159da1bb401SStefano Zampini 41600c7d97c5SJed Brown for(i=0;i<mat_graph->nvtxs;i++){ 41613b03a366Sstefano_zampini if(!mat_graph->count[i]){ /* interior nodes */ 41620c7d97c5SJed Brown mat_graph->touched[i]=PETSC_TRUE; 41630c7d97c5SJed Brown mat_graph->where[i]=0; 41640c7d97c5SJed Brown nodes_touched++; 41650c7d97c5SJed Brown } 41660c7d97c5SJed Brown } 41670c7d97c5SJed Brown mat_graph->ncmps = 0; 4168da1bb401SStefano Zampini i=0; 41690c7d97c5SJed Brown while(nodes_touched<mat_graph->nvtxs) { 4170a0ba757dSStefano Zampini /* find first untouched node in local ordering */ 41710c7d97c5SJed Brown while(mat_graph->touched[i]) i++; 41720c7d97c5SJed 
Brown mat_graph->touched[i]=PETSC_TRUE; 4173a0ba757dSStefano Zampini mat_graph->where[i]=where_values; 41740c7d97c5SJed Brown nodes_touched++; 4175a0ba757dSStefano Zampini /* now find all other nodes having the same set of sharing subdomains */ 41760c7d97c5SJed Brown for(j=i+1;j<mat_graph->nvtxs;j++){ 4177a0ba757dSStefano Zampini /* check for same number of sharing subdomains and dof number */ 4178da1bb401SStefano Zampini if(!mat_graph->touched[j] && mat_graph->count[i]==mat_graph->count[j] && mat_graph->which_dof[i] == mat_graph->which_dof[j] ){ 4179a0ba757dSStefano Zampini /* check for same set of sharing subdomains */ 41800c7d97c5SJed Brown same_set=PETSC_TRUE; 41810c7d97c5SJed Brown for(k=0;k<mat_graph->count[j];k++){ 4182da1bb401SStefano Zampini if(mat_graph->neighbours_set[i][k]!=mat_graph->neighbours_set[j][k]) { 41830c7d97c5SJed Brown same_set=PETSC_FALSE; 41840c7d97c5SJed Brown } 41850c7d97c5SJed Brown } 4186a0ba757dSStefano Zampini /* I found a friend of mine */ 41870c7d97c5SJed Brown if(same_set) { 4188a0ba757dSStefano Zampini mat_graph->where[j]=where_values; 41890c7d97c5SJed Brown mat_graph->touched[j]=PETSC_TRUE; 41900c7d97c5SJed Brown nodes_touched++; 41910c7d97c5SJed Brown } 41920c7d97c5SJed Brown } 41930c7d97c5SJed Brown } 4194a0ba757dSStefano Zampini where_values++; 41950c7d97c5SJed Brown } 4196a0ba757dSStefano Zampini where_values--; if(where_values<0) where_values=0; 4197a0ba757dSStefano Zampini ierr = PetscMalloc(where_values*sizeof(PetscMPIInt),&mat_graph->where_ncmps);CHKERRQ(ierr); 4198a0ba757dSStefano Zampini /* Find connected components defined on the shared interface */ 4199a0ba757dSStefano Zampini if(where_values) { 4200a0ba757dSStefano Zampini ierr = PCBDDCFindConnectedComponents(mat_graph, where_values); 42013b03a366Sstefano_zampini /* For consistency among neughbouring procs, I need to sort (by global ordering) each connected component */ 4202a0ba757dSStefano Zampini for(i=0;i<mat_graph->ncmps;i++) { 4203a0ba757dSStefano Zampini ierr 
= ISLocalToGlobalMappingApply(matis->mapping,mat_graph->cptr[i+1]-mat_graph->cptr[i],&mat_graph->queue[mat_graph->cptr[i]],&queue_in_global_numbering[mat_graph->cptr[i]]);CHKERRQ(ierr); 4204a0ba757dSStefano Zampini ierr = PetscSortIntWithArray(mat_graph->cptr[i+1]-mat_graph->cptr[i],&queue_in_global_numbering[mat_graph->cptr[i]],&mat_graph->queue[mat_graph->cptr[i]]);CHKERRQ(ierr); 4205a0ba757dSStefano Zampini } 4206a0ba757dSStefano Zampini } 4207a0ba757dSStefano Zampini /* check consistency of connected components among neighbouring subdomains -> it adapt them in case it is needed */ 4208a0ba757dSStefano Zampini for(i=0;i<where_values;i++) { 42093b03a366Sstefano_zampini /* We are not sure that two connected components will be the same among subdomains sharing a subset of local interface */ 42103b03a366Sstefano_zampini if(mat_graph->where_ncmps[i]>1) { 4211a0ba757dSStefano Zampini adapt_interface=1; 4212a0ba757dSStefano Zampini break; 4213a0ba757dSStefano Zampini } 4214a0ba757dSStefano Zampini } 4215a0ba757dSStefano Zampini ierr = MPI_Allreduce(&adapt_interface,&adapt_interface_reduced,1,MPIU_INT,MPI_LOR,interface_comm);CHKERRQ(ierr); 4216da1bb401SStefano Zampini if(pcbddc->dbg_flag && adapt_interface_reduced) { 4217da1bb401SStefano Zampini ierr = PetscViewerASCIIPrintf(viewer,"Interface adapted\n");CHKERRQ(ierr); 4218da1bb401SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 4219da1bb401SStefano Zampini } 4220a0ba757dSStefano Zampini if(where_values && adapt_interface_reduced) { 42210c7d97c5SJed Brown 4222a0ba757dSStefano Zampini PetscInt sum_requests=0,my_rank; 4223a0ba757dSStefano Zampini PetscInt buffer_size,start_of_recv,size_of_recv,start_of_send; 4224a0ba757dSStefano Zampini PetscInt temp_buffer_size,ins_val,global_where_counter; 4225a0ba757dSStefano Zampini PetscInt *cum_recv_counts; 4226a0ba757dSStefano Zampini PetscInt *where_to_nodes_indices; 4227a0ba757dSStefano Zampini PetscInt *petsc_buffer; 4228a0ba757dSStefano Zampini PetscMPIInt 
*recv_buffer; 4229a0ba757dSStefano Zampini PetscMPIInt *recv_buffer_where; 4230a0ba757dSStefano Zampini PetscMPIInt *send_buffer; 4231a0ba757dSStefano Zampini PetscMPIInt size_of_send; 4232a0ba757dSStefano Zampini PetscInt *sizes_of_sends; 4233a0ba757dSStefano Zampini MPI_Request *send_requests; 4234a0ba757dSStefano Zampini MPI_Request *recv_requests; 4235a0ba757dSStefano Zampini PetscInt *where_cc_adapt; 4236a0ba757dSStefano Zampini PetscInt **temp_buffer; 4237a0ba757dSStefano Zampini PetscInt *nodes_to_temp_buffer_indices; 4238a0ba757dSStefano Zampini PetscInt *add_to_where; 4239a0ba757dSStefano Zampini 4240a0ba757dSStefano Zampini ierr = MPI_Comm_rank(interface_comm,&my_rank);CHKERRQ(ierr); 4241a0ba757dSStefano Zampini ierr = PetscMalloc((where_values+1)*sizeof(PetscInt),&cum_recv_counts);CHKERRQ(ierr); 4242a0ba757dSStefano Zampini ierr = PetscMemzero(cum_recv_counts,(where_values+1)*sizeof(PetscInt));CHKERRQ(ierr); 4243a0ba757dSStefano Zampini ierr = PetscMalloc(where_values*sizeof(PetscInt),&where_to_nodes_indices);CHKERRQ(ierr); 4244a0ba757dSStefano Zampini /* first count how many neighbours per connected component I will receive from */ 4245a0ba757dSStefano Zampini cum_recv_counts[0]=0; 4246a0ba757dSStefano Zampini for(i=1;i<where_values+1;i++){ 4247a0ba757dSStefano Zampini j=0; 4248a0ba757dSStefano Zampini while(mat_graph->where[j] != i) j++; 4249a0ba757dSStefano Zampini where_to_nodes_indices[i-1]=j; 4250da1bb401SStefano Zampini if(mat_graph->neighbours_set[j][0]!=-1) { cum_recv_counts[i]=cum_recv_counts[i-1]+mat_graph->count[j]; } /* We don't want sends/recvs_to/from_self -> here I don't count myself */ 42513b03a366Sstefano_zampini else { cum_recv_counts[i]=cum_recv_counts[i-1]+mat_graph->count[j]-1; } 4252a0ba757dSStefano Zampini } 4253a0ba757dSStefano Zampini buffer_size=2*cum_recv_counts[where_values]+mat_graph->nvtxs; 4254a0ba757dSStefano Zampini ierr = PetscMalloc(2*cum_recv_counts[where_values]*sizeof(PetscMPIInt),&recv_buffer_where);CHKERRQ(ierr); 
4255a0ba757dSStefano Zampini ierr = PetscMalloc(buffer_size*sizeof(PetscMPIInt),&send_buffer);CHKERRQ(ierr); 4256a0ba757dSStefano Zampini ierr = PetscMalloc(cum_recv_counts[where_values]*sizeof(MPI_Request),&send_requests);CHKERRQ(ierr); 4257a0ba757dSStefano Zampini ierr = PetscMalloc(cum_recv_counts[where_values]*sizeof(MPI_Request),&recv_requests);CHKERRQ(ierr); 4258a0ba757dSStefano Zampini for(i=0;i<cum_recv_counts[where_values];i++) { 4259a0ba757dSStefano Zampini send_requests[i]=MPI_REQUEST_NULL; 4260a0ba757dSStefano Zampini recv_requests[i]=MPI_REQUEST_NULL; 4261a0ba757dSStefano Zampini } 4262a0ba757dSStefano Zampini /* exchange with my neighbours the number of my connected components on the shared interface */ 4263a0ba757dSStefano Zampini for(i=0;i<where_values;i++){ 4264a0ba757dSStefano Zampini j=where_to_nodes_indices[i]; 4265da1bb401SStefano Zampini k = (mat_graph->neighbours_set[j][0] == -1 ? 1 : 0); 4266a0ba757dSStefano Zampini for(;k<mat_graph->count[j];k++){ 4267da1bb401SStefano Zampini ierr = MPI_Isend(&mat_graph->where_ncmps[i],1,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr); 4268da1bb401SStefano Zampini ierr = MPI_Irecv(&recv_buffer_where[sum_requests],1,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr); 4269a0ba757dSStefano Zampini sum_requests++; 4270a0ba757dSStefano Zampini } 4271a0ba757dSStefano Zampini } 4272a0ba757dSStefano Zampini ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 4273a0ba757dSStefano Zampini ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 4274a0ba757dSStefano Zampini /* determine the connected component I need to adapt */ 4275a0ba757dSStefano Zampini ierr = PetscMalloc(where_values*sizeof(PetscInt),&where_cc_adapt);CHKERRQ(ierr); 4276a0ba757dSStefano Zampini ierr = 
PetscMemzero(where_cc_adapt,where_values*sizeof(PetscInt));CHKERRQ(ierr); 4277a0ba757dSStefano Zampini for(i=0;i<where_values;i++){ 4278a0ba757dSStefano Zampini for(j=cum_recv_counts[i];j<cum_recv_counts[i+1];j++){ 42793b03a366Sstefano_zampini /* The first condition is natural (i.e someone has a different number of cc than me), the second one is just to be safe */ 42803b03a366Sstefano_zampini if( mat_graph->where_ncmps[i]!=recv_buffer_where[j] || mat_graph->where_ncmps[i] > 1 ) { 4281a0ba757dSStefano Zampini where_cc_adapt[i]=PETSC_TRUE; 4282a0ba757dSStefano Zampini break; 4283a0ba757dSStefano Zampini } 4284a0ba757dSStefano Zampini } 4285a0ba757dSStefano Zampini } 4286a0ba757dSStefano Zampini /* now get from neighbours their ccs (in global numbering) and adapt them (in case it is needed) */ 4287a0ba757dSStefano Zampini /* first determine how much data to send (size of each queue plus the global indices) and communicate it to neighbours */ 4288a0ba757dSStefano Zampini ierr = PetscMalloc(where_values*sizeof(PetscInt),&sizes_of_sends);CHKERRQ(ierr); 4289a0ba757dSStefano Zampini ierr = PetscMemzero(sizes_of_sends,where_values*sizeof(PetscInt));CHKERRQ(ierr); 4290a0ba757dSStefano Zampini sum_requests=0; 4291a0ba757dSStefano Zampini start_of_send=0; 4292a0ba757dSStefano Zampini start_of_recv=cum_recv_counts[where_values]; 4293a0ba757dSStefano Zampini for(i=0;i<where_values;i++) { 4294a0ba757dSStefano Zampini if(where_cc_adapt[i]) { 4295a0ba757dSStefano Zampini size_of_send=0; 4296a0ba757dSStefano Zampini for(j=i;j<mat_graph->ncmps;j++) { 4297a0ba757dSStefano Zampini if(mat_graph->where[mat_graph->queue[mat_graph->cptr[j]]] == i+1) { /* WARNING -> where values goes from 1 to where_values included */ 4298a0ba757dSStefano Zampini send_buffer[start_of_send+size_of_send]=mat_graph->cptr[j+1]-mat_graph->cptr[j]; 4299a0ba757dSStefano Zampini size_of_send+=1; 4300a0ba757dSStefano Zampini for(k=0;k<mat_graph->cptr[j+1]-mat_graph->cptr[j];k++) { 4301a0ba757dSStefano Zampini 
send_buffer[start_of_send+size_of_send+k]=queue_in_global_numbering[mat_graph->cptr[j]+k]; 4302a0ba757dSStefano Zampini } 4303a0ba757dSStefano Zampini size_of_send=size_of_send+mat_graph->cptr[j+1]-mat_graph->cptr[j]; 4304a0ba757dSStefano Zampini } 4305a0ba757dSStefano Zampini } 4306a0ba757dSStefano Zampini j = where_to_nodes_indices[i]; 4307da1bb401SStefano Zampini k = (mat_graph->neighbours_set[j][0] == -1 ? 1 : 0); 430811d8f4c2SStefano Zampini sizes_of_sends[i]=size_of_send; 4309a0ba757dSStefano Zampini for(;k<mat_graph->count[j];k++){ 431011d8f4c2SStefano Zampini ierr = MPI_Isend(&sizes_of_sends[i],1,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr); 4311da1bb401SStefano Zampini ierr = MPI_Irecv(&recv_buffer_where[sum_requests+start_of_recv],1,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr); 4312a0ba757dSStefano Zampini sum_requests++; 4313a0ba757dSStefano Zampini } 4314a0ba757dSStefano Zampini start_of_send+=size_of_send; 4315a0ba757dSStefano Zampini } 4316a0ba757dSStefano Zampini } 4317a0ba757dSStefano Zampini ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 4318a0ba757dSStefano Zampini ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 4319a0ba757dSStefano Zampini buffer_size=0; 4320a0ba757dSStefano Zampini for(k=0;k<sum_requests;k++) { buffer_size+=recv_buffer_where[start_of_recv+k]; } 4321a0ba757dSStefano Zampini ierr = PetscMalloc(buffer_size*sizeof(PetscMPIInt),&recv_buffer);CHKERRQ(ierr); 4322a0ba757dSStefano Zampini /* now exchange the data */ 4323a0ba757dSStefano Zampini start_of_recv=0; 4324a0ba757dSStefano Zampini start_of_send=0; 4325a0ba757dSStefano Zampini sum_requests=0; 4326a0ba757dSStefano Zampini for(i=0;i<where_values;i++) { 4327a0ba757dSStefano Zampini if(where_cc_adapt[i]) { 
4328a0ba757dSStefano Zampini size_of_send = sizes_of_sends[i]; 4329a0ba757dSStefano Zampini j = where_to_nodes_indices[i]; 4330da1bb401SStefano Zampini k = (mat_graph->neighbours_set[j][0] == -1 ? 1 : 0); 4331a0ba757dSStefano Zampini for(;k<mat_graph->count[j];k++){ 4332da1bb401SStefano Zampini ierr = MPI_Isend(&send_buffer[start_of_send],size_of_send,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr); 4333a0ba757dSStefano Zampini size_of_recv=recv_buffer_where[cum_recv_counts[where_values]+sum_requests]; 4334da1bb401SStefano Zampini ierr = MPI_Irecv(&recv_buffer[start_of_recv],size_of_recv,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr); 4335a0ba757dSStefano Zampini start_of_recv+=size_of_recv; 4336a0ba757dSStefano Zampini sum_requests++; 4337a0ba757dSStefano Zampini } 4338a0ba757dSStefano Zampini start_of_send+=size_of_send; 4339a0ba757dSStefano Zampini } 4340a0ba757dSStefano Zampini } 4341a0ba757dSStefano Zampini ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 4342a0ba757dSStefano Zampini ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr); 4343a0ba757dSStefano Zampini ierr = PetscMalloc(buffer_size*sizeof(PetscInt),&petsc_buffer);CHKERRQ(ierr); 4344a0ba757dSStefano Zampini for(k=0;k<start_of_recv;k++) { petsc_buffer[k]=(PetscInt)recv_buffer[k]; } 4345a0ba757dSStefano Zampini for(j=0;j<buffer_size;) { 4346a0ba757dSStefano Zampini ierr = ISGlobalToLocalMappingApply(matis->mapping,IS_GTOLM_MASK,petsc_buffer[j],&petsc_buffer[j+1],&petsc_buffer[j],&petsc_buffer[j+1]);CHKERRQ(ierr); 4347a0ba757dSStefano Zampini k=petsc_buffer[j]+1; 4348a0ba757dSStefano Zampini j+=k; 4349a0ba757dSStefano Zampini } 4350a0ba757dSStefano Zampini sum_requests=cum_recv_counts[where_values]; 4351a0ba757dSStefano Zampini start_of_recv=0; 
4352a0ba757dSStefano Zampini ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt),&nodes_to_temp_buffer_indices);CHKERRQ(ierr); 4353a0ba757dSStefano Zampini global_where_counter=0; 4354a0ba757dSStefano Zampini for(i=0;i<where_values;i++){ 4355a0ba757dSStefano Zampini if(where_cc_adapt[i]){ 4356a0ba757dSStefano Zampini temp_buffer_size=0; 4357a0ba757dSStefano Zampini /* find nodes on the shared interface we need to adapt */ 4358a0ba757dSStefano Zampini for(j=0;j<mat_graph->nvtxs;j++){ 4359a0ba757dSStefano Zampini if(mat_graph->where[j]==i+1) { 4360a0ba757dSStefano Zampini nodes_to_temp_buffer_indices[j]=temp_buffer_size; 4361a0ba757dSStefano Zampini temp_buffer_size++; 4362a0ba757dSStefano Zampini } else { 4363a0ba757dSStefano Zampini nodes_to_temp_buffer_indices[j]=-1; 4364a0ba757dSStefano Zampini } 4365a0ba757dSStefano Zampini } 4366a0ba757dSStefano Zampini /* allocate some temporary space */ 4367a0ba757dSStefano Zampini ierr = PetscMalloc(temp_buffer_size*sizeof(PetscInt*),&temp_buffer);CHKERRQ(ierr); 4368a0ba757dSStefano Zampini ierr = PetscMalloc(temp_buffer_size*(cum_recv_counts[i+1]-cum_recv_counts[i])*sizeof(PetscInt),&temp_buffer[0]);CHKERRQ(ierr); 4369a0ba757dSStefano Zampini ierr = PetscMemzero(temp_buffer[0],temp_buffer_size*(cum_recv_counts[i+1]-cum_recv_counts[i])*sizeof(PetscInt));CHKERRQ(ierr); 4370a0ba757dSStefano Zampini for(j=1;j<temp_buffer_size;j++){ 4371a0ba757dSStefano Zampini temp_buffer[j]=temp_buffer[j-1]+cum_recv_counts[i+1]-cum_recv_counts[i]; 4372a0ba757dSStefano Zampini } 4373a0ba757dSStefano Zampini /* analyze contributions from neighbouring subdomains for i-th conn comp 4374a0ba757dSStefano Zampini temp buffer structure: 4375a0ba757dSStefano Zampini supposing part of the interface has dimension 5 (global nodes 0,1,2,3,4) 4376a0ba757dSStefano Zampini 3 neighs procs with structured connected components: 4377a0ba757dSStefano Zampini neigh 0: [0 1 4], [2 3]; (2 connected components) 4378a0ba757dSStefano Zampini neigh 1: [0 1], [2 3 4]; (2 
connected components) 4379a0ba757dSStefano Zampini neigh 2: [0 4], [1], [2 3]; (3 connected components) 4380a0ba757dSStefano Zampini tempbuffer (row-oriented) should be filled as: 4381a0ba757dSStefano Zampini [ 0, 0, 0; 4382a0ba757dSStefano Zampini 0, 0, 1; 4383a0ba757dSStefano Zampini 1, 1, 2; 4384a0ba757dSStefano Zampini 1, 1, 2; 4385a0ba757dSStefano Zampini 0, 1, 0; ]; 4386a0ba757dSStefano Zampini This way we can simply recover the resulting structure account for possible intersections of ccs among neighs. 4387a0ba757dSStefano Zampini The mat_graph->where array will be modified to reproduce the following 4 connected components [0], [1], [2 3], [4]; 4388a0ba757dSStefano Zampini */ 4389a0ba757dSStefano Zampini for(j=0;j<cum_recv_counts[i+1]-cum_recv_counts[i];j++) { 4390a0ba757dSStefano Zampini ins_val=0; 4391a0ba757dSStefano Zampini size_of_recv=recv_buffer_where[sum_requests]; /* total size of recv from neighs */ 4392a0ba757dSStefano Zampini for(buffer_size=0;buffer_size<size_of_recv;) { /* loop until all data from neighs has been taken into account */ 4393a0ba757dSStefano Zampini for(k=1;k<petsc_buffer[buffer_size+start_of_recv]+1;k++) { /* filling properly temp_buffer using data from a single recv */ 4394a0ba757dSStefano Zampini temp_buffer[ nodes_to_temp_buffer_indices[ petsc_buffer[ start_of_recv+buffer_size+k ] ] ][j]=ins_val; 4395a0ba757dSStefano Zampini } 4396a0ba757dSStefano Zampini buffer_size+=k; 4397a0ba757dSStefano Zampini ins_val++; 4398a0ba757dSStefano Zampini } 4399a0ba757dSStefano Zampini start_of_recv+=size_of_recv; 4400a0ba757dSStefano Zampini sum_requests++; 4401a0ba757dSStefano Zampini } 4402a0ba757dSStefano Zampini ierr = PetscMalloc(temp_buffer_size*sizeof(PetscInt),&add_to_where);CHKERRQ(ierr); 4403a0ba757dSStefano Zampini ierr = PetscMemzero(add_to_where,temp_buffer_size*sizeof(PetscInt));CHKERRQ(ierr); 4404a0ba757dSStefano Zampini for(j=0;j<temp_buffer_size;j++){ 4405a0ba757dSStefano Zampini if(!add_to_where[j]){ /* found a new cc */ 
4406a0ba757dSStefano Zampini global_where_counter++; 4407a0ba757dSStefano Zampini add_to_where[j]=global_where_counter; 4408a0ba757dSStefano Zampini for(k=j+1;k<temp_buffer_size;k++){ /* check for other nodes in new cc */ 4409a0ba757dSStefano Zampini same_set=PETSC_TRUE; 4410a0ba757dSStefano Zampini for(s=0;s<cum_recv_counts[i+1]-cum_recv_counts[i];s++){ 4411a0ba757dSStefano Zampini if(temp_buffer[j][s]!=temp_buffer[k][s]) { 4412a0ba757dSStefano Zampini same_set=PETSC_FALSE; 4413a0ba757dSStefano Zampini break; 4414a0ba757dSStefano Zampini } 4415a0ba757dSStefano Zampini } 4416a0ba757dSStefano Zampini if(same_set) add_to_where[k]=global_where_counter; 4417a0ba757dSStefano Zampini } 4418a0ba757dSStefano Zampini } 4419a0ba757dSStefano Zampini } 4420a0ba757dSStefano Zampini /* insert new data in where array */ 4421a0ba757dSStefano Zampini temp_buffer_size=0; 4422a0ba757dSStefano Zampini for(j=0;j<mat_graph->nvtxs;j++){ 4423a0ba757dSStefano Zampini if(mat_graph->where[j]==i+1) { 4424a0ba757dSStefano Zampini mat_graph->where[j]=where_values+add_to_where[temp_buffer_size]; 4425a0ba757dSStefano Zampini temp_buffer_size++; 4426a0ba757dSStefano Zampini } 4427a0ba757dSStefano Zampini } 4428a0ba757dSStefano Zampini ierr = PetscFree(temp_buffer[0]);CHKERRQ(ierr); 4429a0ba757dSStefano Zampini ierr = PetscFree(temp_buffer);CHKERRQ(ierr); 4430a0ba757dSStefano Zampini ierr = PetscFree(add_to_where);CHKERRQ(ierr); 4431a0ba757dSStefano Zampini } 4432a0ba757dSStefano Zampini } 4433a0ba757dSStefano Zampini ierr = PetscFree(nodes_to_temp_buffer_indices);CHKERRQ(ierr); 4434a0ba757dSStefano Zampini ierr = PetscFree(sizes_of_sends);CHKERRQ(ierr); 4435a0ba757dSStefano Zampini ierr = PetscFree(send_requests);CHKERRQ(ierr); 4436a0ba757dSStefano Zampini ierr = PetscFree(recv_requests);CHKERRQ(ierr); 4437a0ba757dSStefano Zampini ierr = PetscFree(petsc_buffer);CHKERRQ(ierr); 4438a0ba757dSStefano Zampini ierr = PetscFree(recv_buffer);CHKERRQ(ierr); 4439a0ba757dSStefano Zampini ierr = 
PetscFree(recv_buffer_where);CHKERRQ(ierr); 4440a0ba757dSStefano Zampini ierr = PetscFree(send_buffer);CHKERRQ(ierr); 4441a0ba757dSStefano Zampini ierr = PetscFree(cum_recv_counts);CHKERRQ(ierr); 4442a0ba757dSStefano Zampini ierr = PetscFree(where_to_nodes_indices);CHKERRQ(ierr); 444323d4d1a5SStefano Zampini ierr = PetscFree(where_cc_adapt);CHKERRQ(ierr); 4444a0ba757dSStefano Zampini /* We are ready to evaluate consistent connected components on each part of the shared interface */ 4445a0ba757dSStefano Zampini if(global_where_counter) { 4446a0ba757dSStefano Zampini for(i=0;i<mat_graph->nvtxs;i++){ mat_graph->touched[i]=PETSC_FALSE; } 4447a0ba757dSStefano Zampini global_where_counter=0; 4448a0ba757dSStefano Zampini for(i=0;i<mat_graph->nvtxs;i++){ 4449a0ba757dSStefano Zampini if(mat_graph->where[i] && !mat_graph->touched[i]) { 4450a0ba757dSStefano Zampini global_where_counter++; 4451a0ba757dSStefano Zampini for(j=i+1;j<mat_graph->nvtxs;j++){ 4452a0ba757dSStefano Zampini if(!mat_graph->touched[j] && mat_graph->where[j]==mat_graph->where[i]) { 4453a0ba757dSStefano Zampini mat_graph->where[j]=global_where_counter; 4454a0ba757dSStefano Zampini mat_graph->touched[j]=PETSC_TRUE; 4455a0ba757dSStefano Zampini } 4456a0ba757dSStefano Zampini } 4457a0ba757dSStefano Zampini mat_graph->where[i]=global_where_counter; 4458a0ba757dSStefano Zampini mat_graph->touched[i]=PETSC_TRUE; 4459a0ba757dSStefano Zampini } 4460a0ba757dSStefano Zampini } 4461a0ba757dSStefano Zampini where_values=global_where_counter; 4462a0ba757dSStefano Zampini } 4463a0ba757dSStefano Zampini if(global_where_counter) { 4464a0ba757dSStefano Zampini ierr = PetscMemzero(mat_graph->cptr,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr); 4465a0ba757dSStefano Zampini ierr = PetscMemzero(mat_graph->queue,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr); 4466a0ba757dSStefano Zampini ierr = PetscFree(mat_graph->where_ncmps);CHKERRQ(ierr); 4467a0ba757dSStefano Zampini ierr = 
PetscMalloc(where_values*sizeof(PetscMPIInt),&mat_graph->where_ncmps);CHKERRQ(ierr); 4468a0ba757dSStefano Zampini ierr = PCBDDCFindConnectedComponents(mat_graph, where_values); 4469a0ba757dSStefano Zampini for(i=0;i<mat_graph->ncmps;i++) { 4470a0ba757dSStefano Zampini ierr = ISLocalToGlobalMappingApply(matis->mapping,mat_graph->cptr[i+1]-mat_graph->cptr[i],&mat_graph->queue[mat_graph->cptr[i]],&queue_in_global_numbering[mat_graph->cptr[i]]);CHKERRQ(ierr); 4471a0ba757dSStefano Zampini ierr = PetscSortIntWithArray(mat_graph->cptr[i+1]-mat_graph->cptr[i],&queue_in_global_numbering[mat_graph->cptr[i]],&mat_graph->queue[mat_graph->cptr[i]]);CHKERRQ(ierr); 4472a0ba757dSStefano Zampini } 4473a0ba757dSStefano Zampini } 44743b03a366Sstefano_zampini } /* Finished adapting interface */ 44750c7d97c5SJed Brown PetscInt nfc=0; 44760c7d97c5SJed Brown PetscInt nec=0; 44770c7d97c5SJed Brown PetscInt nvc=0; 44783b03a366Sstefano_zampini PetscBool twodim_flag=PETSC_FALSE; 44790c7d97c5SJed Brown for (i=0; i<mat_graph->ncmps; i++) { 44803b03a366Sstefano_zampini if( mat_graph->cptr[i+1]-mat_graph->cptr[i] > vertex_size ){ 4481534831adSStefano Zampini if(mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]==1){ /* 1 neigh Neumann fake included */ 44820c7d97c5SJed Brown nfc++; 44833b03a366Sstefano_zampini } else { /* note that nec will be zero in 2d */ 44843b03a366Sstefano_zampini nec++; 44853b03a366Sstefano_zampini } 44860c7d97c5SJed Brown } else { 44873b03a366Sstefano_zampini nvc+=mat_graph->cptr[i+1]-mat_graph->cptr[i]; 44883b03a366Sstefano_zampini } 44893b03a366Sstefano_zampini } 44903b03a366Sstefano_zampini 44913b03a366Sstefano_zampini if(!nec) { /* we are in a 2d case -> no faces, only edges */ 44923b03a366Sstefano_zampini nec = nfc; 44933b03a366Sstefano_zampini nfc = 0; 44943b03a366Sstefano_zampini twodim_flag = PETSC_TRUE; 44953b03a366Sstefano_zampini } 44963972b0daSStefano Zampini /* allocate IS arrays for faces, edges. Vertices need a single index set. 
*/ 44973972b0daSStefano Zampini k=0; 44983972b0daSStefano Zampini for (i=0; i<mat_graph->ncmps; i++) { 44993972b0daSStefano Zampini j=mat_graph->cptr[i+1]-mat_graph->cptr[i]; 45003972b0daSStefano Zampini if( j > k) { 45013972b0daSStefano Zampini k=j; 45023972b0daSStefano Zampini } 4503ba1573a8SStefano Zampini if(j<=vertex_size) { 4504ba1573a8SStefano Zampini k+=vertex_size; 4505ba1573a8SStefano Zampini } 45063972b0daSStefano Zampini } 45073972b0daSStefano Zampini ierr = PetscMalloc(k*sizeof(PetscInt),&auxis);CHKERRQ(ierr); 45083972b0daSStefano Zampini 45093b03a366Sstefano_zampini if(!pcbddc->vertices_flag && !pcbddc->edges_flag) { 45103b03a366Sstefano_zampini ierr = PetscMalloc(nfc*sizeof(IS),&pcbddc->ISForFaces);CHKERRQ(ierr); 45113b03a366Sstefano_zampini use_faces=PETSC_TRUE; 45123b03a366Sstefano_zampini } 45133b03a366Sstefano_zampini if(!pcbddc->vertices_flag && !pcbddc->faces_flag) { 45143b03a366Sstefano_zampini ierr = PetscMalloc(nec*sizeof(IS),&pcbddc->ISForEdges);CHKERRQ(ierr); 45153b03a366Sstefano_zampini use_edges=PETSC_TRUE; 45163b03a366Sstefano_zampini } 45173b03a366Sstefano_zampini nfc=0; 45183b03a366Sstefano_zampini nec=0; 45193b03a366Sstefano_zampini for (i=0; i<mat_graph->ncmps; i++) { 45203b03a366Sstefano_zampini if( mat_graph->cptr[i+1]-mat_graph->cptr[i] > vertex_size ){ 45213b03a366Sstefano_zampini for(j=0;j<mat_graph->cptr[i+1]-mat_graph->cptr[i];j++) { 45223972b0daSStefano Zampini auxis[j]=mat_graph->queue[mat_graph->cptr[i]+j]; 45233b03a366Sstefano_zampini } 45243b03a366Sstefano_zampini if(mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]==1){ 45253b03a366Sstefano_zampini if(twodim_flag) { 45263b03a366Sstefano_zampini if(use_edges) { 45273972b0daSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForEdges[nec]);CHKERRQ(ierr); 45283b03a366Sstefano_zampini nec++; 45293b03a366Sstefano_zampini } 45303b03a366Sstefano_zampini } else { 45313b03a366Sstefano_zampini if(use_faces) { 45323972b0daSStefano 
Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForFaces[nfc]);CHKERRQ(ierr); 45333b03a366Sstefano_zampini nfc++; 45343b03a366Sstefano_zampini } 45353b03a366Sstefano_zampini } 45363b03a366Sstefano_zampini } else { 45373b03a366Sstefano_zampini if(use_edges) { 45383972b0daSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForEdges[nec]);CHKERRQ(ierr); 45390c7d97c5SJed Brown nec++; 45400c7d97c5SJed Brown } 45410c7d97c5SJed Brown } 45420c7d97c5SJed Brown } 45433b03a366Sstefano_zampini } 45443b03a366Sstefano_zampini pcbddc->n_ISForFaces=nfc; 45453b03a366Sstefano_zampini pcbddc->n_ISForEdges=nec; 45463b03a366Sstefano_zampini nvc=0; 45470c7d97c5SJed Brown if( !pcbddc->constraints_flag ) { 45483b03a366Sstefano_zampini for (i=0; i<mat_graph->ncmps; i++) { 45493b03a366Sstefano_zampini if( mat_graph->cptr[i+1]-mat_graph->cptr[i] <= vertex_size ){ 45503b03a366Sstefano_zampini for( j=mat_graph->cptr[i];j<mat_graph->cptr[i+1];j++) { 45513972b0daSStefano Zampini auxis[nvc]=mat_graph->queue[j]; 45520c7d97c5SJed Brown nvc++; 45530c7d97c5SJed Brown } 45540c7d97c5SJed Brown } 45550c7d97c5SJed Brown } 45560c7d97c5SJed Brown } 4557a0ba757dSStefano Zampini /* sort vertex set (by local ordering) */ 45583972b0daSStefano Zampini ierr = PetscSortInt(nvc,auxis);CHKERRQ(ierr); 45593972b0daSStefano Zampini ierr = ISCreateGeneral(PETSC_COMM_SELF,nvc,auxis,PETSC_COPY_VALUES,&pcbddc->ISForVertices);CHKERRQ(ierr); 45600c7d97c5SJed Brown 4561e269702eSStefano Zampini if(pcbddc->dbg_flag) { 4562e269702eSStefano Zampini 4563d49ef151SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr); 4564d49ef151SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Details from PCBDDCManageLocalBoundaries for subdomain %04d\n",PetscGlobalRank);CHKERRQ(ierr); 4565d49ef151SStefano Zampini ierr = 
PetscViewerASCIISynchronizedPrintf(viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr); 4566a0ba757dSStefano Zampini /* ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Graph (adjacency structure) of local Neumann mat\n");CHKERRQ(ierr); 4567a0ba757dSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr); 4568e269702eSStefano Zampini for(i=0;i<mat_graph->nvtxs;i++) { 4569a0ba757dSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Nodes connected to node number %d are %d\n",i,mat_graph->xadj[i+1]-mat_graph->xadj[i]);CHKERRQ(ierr); 4570e269702eSStefano Zampini for(j=mat_graph->xadj[i];j<mat_graph->xadj[i+1];j++){ 4571a0ba757dSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d ",mat_graph->adjncy[j]);CHKERRQ(ierr); 4572e269702eSStefano Zampini } 4573a0ba757dSStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n--------------------------------------------------------------\n");CHKERRQ(ierr); 4574da1bb401SStefano Zampini }*/ 4575d49ef151SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Matrix graph has %d connected components", mat_graph->ncmps);CHKERRQ(ierr); 45760c7d97c5SJed Brown for(i=0;i<mat_graph->ncmps;i++) { 45773b03a366Sstefano_zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\nDetails for connected component number %02d: size %04d, count %01d. 
Nodes follow.\n", 45783b03a366Sstefano_zampini i,mat_graph->cptr[i+1]-mat_graph->cptr[i],mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]);CHKERRQ(ierr); 4579da1bb401SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"subdomains: "); 4580da1bb401SStefano Zampini for (j=0;j<mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]; j++) { 4581da1bb401SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d ",mat_graph->neighbours_set[mat_graph->queue[mat_graph->cptr[i]]][j]); 4582da1bb401SStefano Zampini } 4583da1bb401SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n"); 45840c7d97c5SJed Brown for (j=mat_graph->cptr[i]; j<mat_graph->cptr[i+1]; j++){ 4585da1bb401SStefano Zampini /* ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d (%d), ",queue_in_global_numbering[j],mat_graph->queue[j]);CHKERRQ(ierr); */ 4586da1bb401SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d, ",mat_graph->queue[j]);CHKERRQ(ierr); 45870c7d97c5SJed Brown } 45880c7d97c5SJed Brown } 4589da1bb401SStefano Zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n--------------------------------------------------------------\n");CHKERRQ(ierr); 45903b03a366Sstefano_zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local vertices\n",PetscGlobalRank,nvc);CHKERRQ(ierr); 45913b03a366Sstefano_zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local faces\n",PetscGlobalRank,nfc);CHKERRQ(ierr); 45923b03a366Sstefano_zampini ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local edges\n",PetscGlobalRank,nec);CHKERRQ(ierr); 4593d49ef151SStefano Zampini ierr = PetscViewerFlush(viewer);CHKERRQ(ierr); 45940c7d97c5SJed Brown } 45950c7d97c5SJed Brown 45963972b0daSStefano Zampini ierr = PetscFree(queue_in_global_numbering);CHKERRQ(ierr); 45973972b0daSStefano Zampini ierr = PetscFree(auxis);CHKERRQ(ierr); 45980c7d97c5SJed Brown 
PetscFunctionReturn(0); 45990c7d97c5SJed Brown 46000c7d97c5SJed Brown } 46010c7d97c5SJed Brown 46020c7d97c5SJed Brown /* -------------------------------------------------------------------------- */ 46030c7d97c5SJed Brown 46040c7d97c5SJed Brown /* The following code has been adapted from function IsConnectedSubdomain contained 4605da1bb401SStefano Zampini in source file contig.c of METIS library (version 5.0.1) 4606da1bb401SStefano Zampini It finds connected components of each partition labeled from 1 to n_dist */ 46070c7d97c5SJed Brown 46080c7d97c5SJed Brown #undef __FUNCT__ 46090c7d97c5SJed Brown #define __FUNCT__ "PCBDDCFindConnectedComponents" 46109c0446d6SStefano Zampini static PetscErrorCode PCBDDCFindConnectedComponents(PCBDDCGraph graph, PetscInt n_dist ) 46110c7d97c5SJed Brown { 46120c7d97c5SJed Brown PetscInt i, j, k, nvtxs, first, last, nleft, ncmps,pid,cum_queue,n,ncmps_pid; 46130c7d97c5SJed Brown PetscInt *xadj, *adjncy, *where, *queue; 46140c7d97c5SJed Brown PetscInt *cptr; 46150c7d97c5SJed Brown PetscBool *touched; 46160c7d97c5SJed Brown 46170c7d97c5SJed Brown PetscFunctionBegin; 46180c7d97c5SJed Brown 46190c7d97c5SJed Brown nvtxs = graph->nvtxs; 46200c7d97c5SJed Brown xadj = graph->xadj; 46210c7d97c5SJed Brown adjncy = graph->adjncy; 46220c7d97c5SJed Brown where = graph->where; 46230c7d97c5SJed Brown touched = graph->touched; 46240c7d97c5SJed Brown queue = graph->queue; 46250c7d97c5SJed Brown cptr = graph->cptr; 46260c7d97c5SJed Brown 46270c7d97c5SJed Brown for (i=0; i<nvtxs; i++) 46280c7d97c5SJed Brown touched[i] = PETSC_FALSE; 46290c7d97c5SJed Brown 46300c7d97c5SJed Brown cum_queue=0; 46310c7d97c5SJed Brown ncmps=0; 46320c7d97c5SJed Brown 46330c7d97c5SJed Brown for(n=0; n<n_dist; n++) { 4634da1bb401SStefano Zampini pid = n+1; /* partition labeled by 0 is discarded */ 46350c7d97c5SJed Brown nleft = 0; 46360c7d97c5SJed Brown for (i=0; i<nvtxs; i++) { 46370c7d97c5SJed Brown if (where[i] == pid) 46380c7d97c5SJed Brown nleft++; 46390c7d97c5SJed Brown } 
46400c7d97c5SJed Brown for (i=0; i<nvtxs; i++) { 46410c7d97c5SJed Brown if (where[i] == pid) 46420c7d97c5SJed Brown break; 46430c7d97c5SJed Brown } 46440c7d97c5SJed Brown touched[i] = PETSC_TRUE; 46450c7d97c5SJed Brown queue[cum_queue] = i; 46460c7d97c5SJed Brown first = 0; last = 1; 46470c7d97c5SJed Brown cptr[ncmps] = cum_queue; /* This actually points to queue */ 46480c7d97c5SJed Brown ncmps_pid = 0; 46490c7d97c5SJed Brown while (first != nleft) { 46500c7d97c5SJed Brown if (first == last) { /* Find another starting vertex */ 46510c7d97c5SJed Brown cptr[++ncmps] = first+cum_queue; 46520c7d97c5SJed Brown ncmps_pid++; 46530c7d97c5SJed Brown for (i=0; i<nvtxs; i++) { 46540c7d97c5SJed Brown if (where[i] == pid && !touched[i]) 46550c7d97c5SJed Brown break; 46560c7d97c5SJed Brown } 46570c7d97c5SJed Brown queue[cum_queue+last] = i; 46580c7d97c5SJed Brown last++; 46590c7d97c5SJed Brown touched[i] = PETSC_TRUE; 46600c7d97c5SJed Brown } 46610c7d97c5SJed Brown i = queue[cum_queue+first]; 46620c7d97c5SJed Brown first++; 46630c7d97c5SJed Brown for (j=xadj[i]; j<xadj[i+1]; j++) { 46640c7d97c5SJed Brown k = adjncy[j]; 46650c7d97c5SJed Brown if (where[k] == pid && !touched[k]) { 46660c7d97c5SJed Brown queue[cum_queue+last] = k; 46670c7d97c5SJed Brown last++; 46680c7d97c5SJed Brown touched[k] = PETSC_TRUE; 46690c7d97c5SJed Brown } 46700c7d97c5SJed Brown } 46710c7d97c5SJed Brown } 46720c7d97c5SJed Brown cptr[++ncmps] = first+cum_queue; 46730c7d97c5SJed Brown ncmps_pid++; 46740c7d97c5SJed Brown cum_queue=cptr[ncmps]; 4675a0ba757dSStefano Zampini graph->where_ncmps[n] = ncmps_pid; 46760c7d97c5SJed Brown } 46770c7d97c5SJed Brown graph->ncmps = ncmps; 46780c7d97c5SJed Brown 46790c7d97c5SJed Brown PetscFunctionReturn(0); 46800c7d97c5SJed Brown } 4681