xref: /petsc/src/ksp/pc/impls/bddc/bddc.c (revision 3425bc38356cbc0d49875b3b7bc7d76134e20c58)
/* TODOLIST
   DofSplitting and DM attached to pc?
   Change SetNeumannBoundaries to SetNeumannBoundariesLocal and provide new SetNeumannBoundaries (same for Dirichlet)
   Exact solvers: Solve local saddle point directly
     - change prec_type to switch_inexact_prec_type
     - add bool solve_exact_saddle_point slot to pcbddc data
   Inexact solvers: global preconditioner application is ready, ask the developers (Jed?) how to best implement Dohrmann's approach (PCSHELL?)
   Change how to deal with the coarse problem (PCBDDCSetCoarseEnvironment):
     - mind the problem with coarsening_factor
     - simplify coarse problem structure -> PCBDDC or PCREDUNDANT, nothing else -> same comm for all levels?
     - remove coarse enums and allow use of PCBDDCGetCoarseKSP
     - remove metis dependency -> use MatPartitioning for multilevel -> Assemble serial adjacency in ManageLocalBoundaries?
     - Add levels' slot to bddc data structure and associated Set/Get functions
   Code refactoring:
     - pick better names for static functions
   Change options structure:
     - insert BDDC into MG framework?
   Provide other ops? Ask the developers
   Remove all unused printf
   Man pages
*/
220c7d97c5SJed Brown 
2353cdbc3dSStefano Zampini /* ----------------------------------------------------------------------------------------------------------------------------------------------
240c7d97c5SJed Brown    Implementation of BDDC preconditioner based on:
250c7d97c5SJed Brown    C. Dohrmann "An approximate BDDC preconditioner", Numerical Linear Algebra with Applications Volume 14, Issue 2, pages 149-168, March 2007
2653cdbc3dSStefano Zampini    ---------------------------------------------------------------------------------------------------------------------------------------------- */
2753cdbc3dSStefano Zampini 
2853cdbc3dSStefano Zampini #include "bddc.h" /*I "petscpc.h" I*/  /* includes for fortran wrappers */
293b03a366Sstefano_zampini #include <petscblaslapack.h>
300c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
310c7d97c5SJed Brown #undef __FUNCT__
320c7d97c5SJed Brown #define __FUNCT__ "PCSetFromOptions_BDDC"
330c7d97c5SJed Brown PetscErrorCode PCSetFromOptions_BDDC(PC pc)
340c7d97c5SJed Brown {
350c7d97c5SJed Brown   PC_BDDC         *pcbddc = (PC_BDDC*)pc->data;
360c7d97c5SJed Brown   PetscErrorCode ierr;
370c7d97c5SJed Brown 
380c7d97c5SJed Brown   PetscFunctionBegin;
390c7d97c5SJed Brown   ierr = PetscOptionsHead("BDDC options");CHKERRQ(ierr);
400c7d97c5SJed Brown   /* Verbose debugging of main data structures */
41e269702eSStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_check_all"       ,"Verbose (debugging) output for PCBDDC"                       ,"none",pcbddc->dbg_flag      ,&pcbddc->dbg_flag      ,PETSC_NULL);CHKERRQ(ierr);
420c7d97c5SJed Brown   /* Some customization for default primal space */
43da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_vertices_only"   ,"Use only vertices in coarse space (i.e. discard constraints)","none",pcbddc->vertices_flag   ,&pcbddc->vertices_flag   ,PETSC_NULL);CHKERRQ(ierr);
44da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_constraints_only","Use only constraints in coarse space (i.e. discard vertices)","none",pcbddc->constraints_flag,&pcbddc->constraints_flag,PETSC_NULL);CHKERRQ(ierr);
45da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_faces_only"      ,"Use only faces among constraints of coarse space (i.e. discard edges)"         ,"none",pcbddc->faces_flag      ,&pcbddc->faces_flag      ,PETSC_NULL);CHKERRQ(ierr);
46da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_edges_only"      ,"Use only edges among constraints of coarse space (i.e. discard faces)"         ,"none",pcbddc->edges_flag      ,&pcbddc->edges_flag      ,PETSC_NULL);CHKERRQ(ierr);
470c7d97c5SJed Brown   /* Coarse solver context */
48da1bb401SStefano Zampini   static const char *avail_coarse_problems[] = {"sequential","replicated","parallel","multilevel",""}; /*order of choiches depends on ENUM defined in bddc.h */
490c7d97c5SJed Brown   ierr = PetscOptionsEnum("-pc_bddc_coarse_problem_type","Set coarse problem type","none",avail_coarse_problems,(PetscEnum)pcbddc->coarse_problem_type,(PetscEnum*)&pcbddc->coarse_problem_type,PETSC_NULL);CHKERRQ(ierr);
500c7d97c5SJed Brown   /* Two different application of BDDC to the whole set of dofs, internal and interface */
510c7d97c5SJed Brown   ierr = PetscOptionsBool("-pc_bddc_switch_preconditioning_type","Switch between M_2 (default) and M_3 preconditioners (as defined by Dohrmann)","none",pcbddc->prec_type,&pcbddc->prec_type,PETSC_NULL);CHKERRQ(ierr);
52534831adSStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_use_change_of_basis","Use change of basis approach for primal space","none",pcbddc->usechangeofbasis,&pcbddc->usechangeofbasis,PETSC_NULL);CHKERRQ(ierr);
53534831adSStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_use_change_on_faces","Use change of basis approach for face constraints","none",pcbddc->usechangeonfaces,&pcbddc->usechangeonfaces,PETSC_NULL);CHKERRQ(ierr);
54534831adSStefano Zampini   pcbddc->usechangeonfaces = pcbddc->usechangeonfaces && pcbddc->usechangeofbasis;
550c7d97c5SJed Brown   ierr = PetscOptionsInt("-pc_bddc_coarsening_ratio","Set coarsening ratio used in multilevel coarsening","none",pcbddc->coarsening_ratio,&pcbddc->coarsening_ratio,PETSC_NULL);CHKERRQ(ierr);
560c7d97c5SJed Brown   ierr = PetscOptionsTail();CHKERRQ(ierr);
570c7d97c5SJed Brown   PetscFunctionReturn(0);
580c7d97c5SJed Brown }
590c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
600c7d97c5SJed Brown EXTERN_C_BEGIN
610c7d97c5SJed Brown #undef __FUNCT__
620c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetCoarseProblemType_BDDC"
6353cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetCoarseProblemType_BDDC(PC pc, CoarseProblemType CPT)
640c7d97c5SJed Brown {
650c7d97c5SJed Brown   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
660c7d97c5SJed Brown 
670c7d97c5SJed Brown   PetscFunctionBegin;
680c7d97c5SJed Brown   pcbddc->coarse_problem_type = CPT;
690c7d97c5SJed Brown   PetscFunctionReturn(0);
700c7d97c5SJed Brown }
710c7d97c5SJed Brown EXTERN_C_END
720c7d97c5SJed Brown #undef __FUNCT__
730c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetCoarseProblemType"
7453cdbc3dSStefano Zampini /*@
759c0446d6SStefano Zampini  PCBDDCSetCoarseProblemType - Set coarse problem type in PCBDDC.
7653cdbc3dSStefano Zampini 
779c0446d6SStefano Zampini    Not collective
7853cdbc3dSStefano Zampini 
7953cdbc3dSStefano Zampini    Input Parameters:
8053cdbc3dSStefano Zampini +  pc - the preconditioning context
8153cdbc3dSStefano Zampini -  CoarseProblemType - pick a better name and explain what this is
8253cdbc3dSStefano Zampini 
8353cdbc3dSStefano Zampini    Level: intermediate
8453cdbc3dSStefano Zampini 
8553cdbc3dSStefano Zampini    Notes:
86da1bb401SStefano Zampini    Not collective but all procs must call with same arguments.
8753cdbc3dSStefano Zampini 
8853cdbc3dSStefano Zampini .seealso: PCBDDC
8953cdbc3dSStefano Zampini @*/
900c7d97c5SJed Brown PetscErrorCode PCBDDCSetCoarseProblemType(PC pc, CoarseProblemType CPT)
910c7d97c5SJed Brown {
920c7d97c5SJed Brown   PetscErrorCode ierr;
930c7d97c5SJed Brown 
940c7d97c5SJed Brown   PetscFunctionBegin;
950c7d97c5SJed Brown   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
960c7d97c5SJed Brown   ierr = PetscTryMethod(pc,"PCBDDCSetCoarseProblemType_C",(PC,CoarseProblemType),(pc,CPT));CHKERRQ(ierr);
970c7d97c5SJed Brown   PetscFunctionReturn(0);
980c7d97c5SJed Brown }
990c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
1000c7d97c5SJed Brown EXTERN_C_BEGIN
1010c7d97c5SJed Brown #undef __FUNCT__
1023b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCSetDirichletBoundaries_BDDC"
1033b03a366Sstefano_zampini static PetscErrorCode PCBDDCSetDirichletBoundaries_BDDC(PC pc,IS DirichletBoundaries)
1043b03a366Sstefano_zampini {
1053b03a366Sstefano_zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
1063b03a366Sstefano_zampini   PetscErrorCode ierr;
1073b03a366Sstefano_zampini 
1083b03a366Sstefano_zampini   PetscFunctionBegin;
1093b03a366Sstefano_zampini   ierr = ISDestroy(&pcbddc->DirichletBoundaries);CHKERRQ(ierr);
11036e030ebSStefano Zampini   ierr = PetscObjectReference((PetscObject)DirichletBoundaries);CHKERRQ(ierr);
11136e030ebSStefano Zampini   pcbddc->DirichletBoundaries=DirichletBoundaries;
1123b03a366Sstefano_zampini   PetscFunctionReturn(0);
1133b03a366Sstefano_zampini }
1143b03a366Sstefano_zampini EXTERN_C_END
1153b03a366Sstefano_zampini #undef __FUNCT__
1163b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCSetDirichletBoundaries"
1173b03a366Sstefano_zampini /*@
118da1bb401SStefano Zampini  PCBDDCSetDirichletBoundaries - Set index set defining subdomain part (in local ordering)
119da1bb401SStefano Zampini                               of Dirichlet boundaries for the global problem.
1203b03a366Sstefano_zampini 
1213b03a366Sstefano_zampini    Not collective
1223b03a366Sstefano_zampini 
1233b03a366Sstefano_zampini    Input Parameters:
1243b03a366Sstefano_zampini +  pc - the preconditioning context
1253b03a366Sstefano_zampini -  DirichletBoundaries - sequential index set defining the subdomain part of Dirichlet boundaries (can be PETSC_NULL)
1263b03a366Sstefano_zampini 
1273b03a366Sstefano_zampini    Level: intermediate
1283b03a366Sstefano_zampini 
1293b03a366Sstefano_zampini    Notes:
1303b03a366Sstefano_zampini 
1313b03a366Sstefano_zampini .seealso: PCBDDC
1323b03a366Sstefano_zampini @*/
1333b03a366Sstefano_zampini PetscErrorCode PCBDDCSetDirichletBoundaries(PC pc,IS DirichletBoundaries)
1343b03a366Sstefano_zampini {
1353b03a366Sstefano_zampini   PetscErrorCode ierr;
1363b03a366Sstefano_zampini 
1373b03a366Sstefano_zampini   PetscFunctionBegin;
1383b03a366Sstefano_zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
1393b03a366Sstefano_zampini   ierr = PetscTryMethod(pc,"PCBDDCSetDirichletBoundaries_C",(PC,IS),(pc,DirichletBoundaries));CHKERRQ(ierr);
1403b03a366Sstefano_zampini   PetscFunctionReturn(0);
1413b03a366Sstefano_zampini }
1423b03a366Sstefano_zampini /* -------------------------------------------------------------------------- */
1433b03a366Sstefano_zampini EXTERN_C_BEGIN
1443b03a366Sstefano_zampini #undef __FUNCT__
1450c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetNeumannBoundaries_BDDC"
14653cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetNeumannBoundaries_BDDC(PC pc,IS NeumannBoundaries)
1470c7d97c5SJed Brown {
1480c7d97c5SJed Brown   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
14953cdbc3dSStefano Zampini   PetscErrorCode ierr;
1500c7d97c5SJed Brown 
1510c7d97c5SJed Brown   PetscFunctionBegin;
15253cdbc3dSStefano Zampini   ierr = ISDestroy(&pcbddc->NeumannBoundaries);CHKERRQ(ierr);
15336e030ebSStefano Zampini   ierr = PetscObjectReference((PetscObject)NeumannBoundaries);CHKERRQ(ierr);
15436e030ebSStefano Zampini   pcbddc->NeumannBoundaries=NeumannBoundaries;
1550c7d97c5SJed Brown   PetscFunctionReturn(0);
1560c7d97c5SJed Brown }
1570c7d97c5SJed Brown EXTERN_C_END
1580c7d97c5SJed Brown #undef __FUNCT__
1590c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetNeumannBoundaries"
16057527edcSJed Brown /*@
161da1bb401SStefano Zampini  PCBDDCSetNeumannBoundaries - Set index set defining subdomain part (in local ordering)
162da1bb401SStefano Zampini                               of Neumann boundaries for the global problem.
16357527edcSJed Brown 
1649c0446d6SStefano Zampini    Not collective
16557527edcSJed Brown 
16657527edcSJed Brown    Input Parameters:
16757527edcSJed Brown +  pc - the preconditioning context
1689c0446d6SStefano Zampini -  NeumannBoundaries - sequential index set defining the subdomain part of Neumann boundaries (can be PETSC_NULL)
16957527edcSJed Brown 
17057527edcSJed Brown    Level: intermediate
17157527edcSJed Brown 
17257527edcSJed Brown    Notes:
17357527edcSJed Brown 
17457527edcSJed Brown .seealso: PCBDDC
17557527edcSJed Brown @*/
17653cdbc3dSStefano Zampini PetscErrorCode PCBDDCSetNeumannBoundaries(PC pc,IS NeumannBoundaries)
1770c7d97c5SJed Brown {
1780c7d97c5SJed Brown   PetscErrorCode ierr;
1790c7d97c5SJed Brown 
1800c7d97c5SJed Brown   PetscFunctionBegin;
1810c7d97c5SJed Brown   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
18253cdbc3dSStefano Zampini   ierr = PetscTryMethod(pc,"PCBDDCSetNeumannBoundaries_C",(PC,IS),(pc,NeumannBoundaries));CHKERRQ(ierr);
18353cdbc3dSStefano Zampini   PetscFunctionReturn(0);
18453cdbc3dSStefano Zampini }
18553cdbc3dSStefano Zampini /* -------------------------------------------------------------------------- */
18653cdbc3dSStefano Zampini EXTERN_C_BEGIN
18753cdbc3dSStefano Zampini #undef __FUNCT__
188da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCGetDirichletBoundaries_BDDC"
189da1bb401SStefano Zampini static PetscErrorCode PCBDDCGetDirichletBoundaries_BDDC(PC pc,IS *DirichletBoundaries)
190da1bb401SStefano Zampini {
191da1bb401SStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
192da1bb401SStefano Zampini 
193da1bb401SStefano Zampini   PetscFunctionBegin;
194da1bb401SStefano Zampini   *DirichletBoundaries = pcbddc->DirichletBoundaries;
195da1bb401SStefano Zampini   PetscFunctionReturn(0);
196da1bb401SStefano Zampini }
197da1bb401SStefano Zampini EXTERN_C_END
198da1bb401SStefano Zampini #undef __FUNCT__
199da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCGetDirichletBoundaries"
200da1bb401SStefano Zampini /*@
201da1bb401SStefano Zampini  PCBDDCGetDirichletBoundaries - Get index set defining subdomain part (in local ordering)
202da1bb401SStefano Zampini                                 of Dirichlet boundaries for the global problem.
203da1bb401SStefano Zampini 
204da1bb401SStefano Zampini    Not collective
205da1bb401SStefano Zampini 
206da1bb401SStefano Zampini    Input Parameters:
207da1bb401SStefano Zampini +  pc - the preconditioning context
208da1bb401SStefano Zampini 
209da1bb401SStefano Zampini    Output Parameters:
210da1bb401SStefano Zampini +  DirichletBoundaries - index set defining the subdomain part of Dirichlet boundaries
211da1bb401SStefano Zampini 
212da1bb401SStefano Zampini    Level: intermediate
213da1bb401SStefano Zampini 
214da1bb401SStefano Zampini    Notes:
215da1bb401SStefano Zampini 
216da1bb401SStefano Zampini .seealso: PCBDDC
217da1bb401SStefano Zampini @*/
218da1bb401SStefano Zampini PetscErrorCode PCBDDCGetDirichletBoundaries(PC pc,IS *DirichletBoundaries)
219da1bb401SStefano Zampini {
220da1bb401SStefano Zampini   PetscErrorCode ierr;
221da1bb401SStefano Zampini 
222da1bb401SStefano Zampini   PetscFunctionBegin;
223da1bb401SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
224da1bb401SStefano Zampini   ierr = PetscUseMethod(pc,"PCBDDCGetDirichletBoundaries_C",(PC,IS*),(pc,DirichletBoundaries));CHKERRQ(ierr);
225da1bb401SStefano Zampini   PetscFunctionReturn(0);
226da1bb401SStefano Zampini }
227da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
228da1bb401SStefano Zampini EXTERN_C_BEGIN
229da1bb401SStefano Zampini #undef __FUNCT__
23053cdbc3dSStefano Zampini #define __FUNCT__ "PCBDDCGetNeumannBoundaries_BDDC"
23153cdbc3dSStefano Zampini static PetscErrorCode PCBDDCGetNeumannBoundaries_BDDC(PC pc,IS *NeumannBoundaries)
23253cdbc3dSStefano Zampini {
23353cdbc3dSStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
23453cdbc3dSStefano Zampini 
23553cdbc3dSStefano Zampini   PetscFunctionBegin;
23653cdbc3dSStefano Zampini   *NeumannBoundaries = pcbddc->NeumannBoundaries;
23753cdbc3dSStefano Zampini   PetscFunctionReturn(0);
23853cdbc3dSStefano Zampini }
23953cdbc3dSStefano Zampini EXTERN_C_END
24053cdbc3dSStefano Zampini #undef __FUNCT__
24153cdbc3dSStefano Zampini #define __FUNCT__ "PCBDDCGetNeumannBoundaries"
24253cdbc3dSStefano Zampini /*@
243da1bb401SStefano Zampini  PCBDDCGetNeumannBoundaries - Get index set defining subdomain part (in local ordering)
244da1bb401SStefano Zampini                               of Neumann boundaries for the global problem.
24553cdbc3dSStefano Zampini 
2469c0446d6SStefano Zampini    Not collective
24753cdbc3dSStefano Zampini 
24853cdbc3dSStefano Zampini    Input Parameters:
24953cdbc3dSStefano Zampini +  pc - the preconditioning context
25053cdbc3dSStefano Zampini 
25153cdbc3dSStefano Zampini    Output Parameters:
25253cdbc3dSStefano Zampini +  NeumannBoundaries - index set defining the subdomain part of Neumann boundaries
25353cdbc3dSStefano Zampini 
25453cdbc3dSStefano Zampini    Level: intermediate
25553cdbc3dSStefano Zampini 
25653cdbc3dSStefano Zampini    Notes:
25753cdbc3dSStefano Zampini 
25853cdbc3dSStefano Zampini .seealso: PCBDDC
25953cdbc3dSStefano Zampini @*/
26053cdbc3dSStefano Zampini PetscErrorCode PCBDDCGetNeumannBoundaries(PC pc,IS *NeumannBoundaries)
26153cdbc3dSStefano Zampini {
26253cdbc3dSStefano Zampini   PetscErrorCode ierr;
26353cdbc3dSStefano Zampini 
26453cdbc3dSStefano Zampini   PetscFunctionBegin;
26553cdbc3dSStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
26653cdbc3dSStefano Zampini   ierr = PetscUseMethod(pc,"PCBDDCGetNeumannBoundaries_C",(PC,IS*),(pc,NeumannBoundaries));CHKERRQ(ierr);
2670c7d97c5SJed Brown   PetscFunctionReturn(0);
2680c7d97c5SJed Brown }
26936e030ebSStefano Zampini /* -------------------------------------------------------------------------- */
27036e030ebSStefano Zampini EXTERN_C_BEGIN
27136e030ebSStefano Zampini #undef __FUNCT__
272da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetLocalAdjacencyGraph_BDDC"
273da1bb401SStefano Zampini static PetscErrorCode PCBDDCSetLocalAdjacencyGraph_BDDC(PC pc, PetscInt nvtxs, PetscInt xadj[], PetscInt adjncy[], PetscCopyMode copymode)
27436e030ebSStefano Zampini {
27536e030ebSStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
276da1bb401SStefano Zampini   PCBDDCGraph    mat_graph=pcbddc->mat_graph;
277da1bb401SStefano Zampini   PetscErrorCode ierr;
27836e030ebSStefano Zampini 
27936e030ebSStefano Zampini   PetscFunctionBegin;
280da1bb401SStefano Zampini   mat_graph->nvtxs=nvtxs;
281da1bb401SStefano Zampini   ierr = PetscFree(mat_graph->xadj);CHKERRQ(ierr);
282da1bb401SStefano Zampini   ierr = PetscFree(mat_graph->adjncy);CHKERRQ(ierr);
283da1bb401SStefano Zampini   if(copymode == PETSC_COPY_VALUES) {
284da1bb401SStefano Zampini     ierr = PetscMalloc((mat_graph->nvtxs+1)*sizeof(PetscInt),&mat_graph->xadj);CHKERRQ(ierr);
285da1bb401SStefano Zampini     ierr = PetscMalloc(xadj[mat_graph->nvtxs]*sizeof(PetscInt),&mat_graph->adjncy);CHKERRQ(ierr);
286da1bb401SStefano Zampini     ierr = PetscMemcpy(mat_graph->xadj,xadj,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr);
287da1bb401SStefano Zampini     ierr = PetscMemcpy(mat_graph->adjncy,adjncy,xadj[mat_graph->nvtxs]*sizeof(PetscInt));CHKERRQ(ierr);
288da1bb401SStefano Zampini   } else if(copymode == PETSC_OWN_POINTER) {
289da1bb401SStefano Zampini     mat_graph->xadj=xadj;
290da1bb401SStefano Zampini     mat_graph->adjncy=adjncy;
291da1bb401SStefano Zampini   } else {
292da1bb401SStefano Zampini     SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_SUP,"Unsupported copy mode %d in %s\n",copymode,__FUNCT__);
293da1bb401SStefano Zampini   }
29436e030ebSStefano Zampini   PetscFunctionReturn(0);
29536e030ebSStefano Zampini }
29636e030ebSStefano Zampini EXTERN_C_END
29736e030ebSStefano Zampini #undef __FUNCT__
298da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetLocalAdjacencyGraph"
29936e030ebSStefano Zampini /*@
300da1bb401SStefano Zampini  PCBDDCSetLocalAdjacencyGraph - Set CSR graph of local matrix for use of PCBDDC.
30136e030ebSStefano Zampini 
30236e030ebSStefano Zampini    Not collective
30336e030ebSStefano Zampini 
30436e030ebSStefano Zampini    Input Parameters:
30536e030ebSStefano Zampini +  pc - the preconditioning context
306da1bb401SStefano Zampini -  nvtxs - number of local vertices of the graph
307da1bb401SStefano Zampini -  xadj, adjncy - the CSR graph
308da1bb401SStefano Zampini -  copymode - either PETSC_COPY_VALUES or PETSC_OWN_POINTER. In the former case the user must free the array passed in;
309da1bb401SStefano Zampini                                                              in the latter case, memory must be obtained with PetscMalloc.
31036e030ebSStefano Zampini 
31136e030ebSStefano Zampini    Level: intermediate
31236e030ebSStefano Zampini 
31336e030ebSStefano Zampini    Notes:
31436e030ebSStefano Zampini 
31536e030ebSStefano Zampini .seealso: PCBDDC
31636e030ebSStefano Zampini @*/
317da1bb401SStefano Zampini PetscErrorCode PCBDDCSetLocalAdjacencyGraph(PC pc,PetscInt nvtxs,PetscInt xadj[],PetscInt adjncy[], PetscCopyMode copymode)
31836e030ebSStefano Zampini {
319da1bb401SStefano Zampini   PetscInt       nrows,ncols;
320da1bb401SStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
32136e030ebSStefano Zampini   PetscErrorCode ierr;
32236e030ebSStefano Zampini 
32336e030ebSStefano Zampini   PetscFunctionBegin;
32436e030ebSStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
325da1bb401SStefano Zampini   ierr = MatGetSize(matis->A,&nrows,&ncols);CHKERRQ(ierr);
326da1bb401SStefano Zampini   if(nvtxs != nrows) {
327da1bb401SStefano Zampini     SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Local adjacency size %d passed in %s differs from local problem size %d!\n",nvtxs,__FUNCT__,nrows);
328da1bb401SStefano Zampini   } else {
329da1bb401SStefano Zampini     ierr = PetscTryMethod(pc,"PCBDDCSetLocalAdjacencyGraph_C",(PC,PetscInt,PetscInt[],PetscInt[],PetscCopyMode),(pc,nvtxs,xadj,adjncy,copymode));CHKERRQ(ierr);
330da1bb401SStefano Zampini   }
33136e030ebSStefano Zampini   PetscFunctionReturn(0);
33236e030ebSStefano Zampini }
3339c0446d6SStefano Zampini /* -------------------------------------------------------------------------- */
3349c0446d6SStefano Zampini EXTERN_C_BEGIN
3359c0446d6SStefano Zampini #undef __FUNCT__
3369c0446d6SStefano Zampini #define __FUNCT__ "PCBDDCSetDofsSplitting_BDDC"
3379c0446d6SStefano Zampini static PetscErrorCode PCBDDCSetDofsSplitting_BDDC(PC pc,PetscInt n_is, IS ISForDofs[])
3389c0446d6SStefano Zampini {
3399c0446d6SStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
3409c0446d6SStefano Zampini   PetscInt i;
3419c0446d6SStefano Zampini   PetscErrorCode ierr;
3429c0446d6SStefano Zampini 
3439c0446d6SStefano Zampini   PetscFunctionBegin;
344da1bb401SStefano Zampini   /* Destroy ISes if they were already set */
3459c0446d6SStefano Zampini   for(i=0;i<pcbddc->n_ISForDofs;i++) {
3469c0446d6SStefano Zampini     ierr = ISDestroy(&pcbddc->ISForDofs[i]);CHKERRQ(ierr);
3479c0446d6SStefano Zampini   }
348d11ae9bbSstefano_zampini   ierr = PetscFree(pcbddc->ISForDofs);CHKERRQ(ierr);
349da1bb401SStefano Zampini   /* allocate space then set */
3509c0446d6SStefano Zampini   ierr = PetscMalloc(n_is*sizeof(IS),&pcbddc->ISForDofs);CHKERRQ(ierr);
3519c0446d6SStefano Zampini   for(i=0;i<n_is;i++) {
352da1bb401SStefano Zampini     ierr = PetscObjectReference((PetscObject)ISForDofs[i]);CHKERRQ(ierr);
353da1bb401SStefano Zampini     pcbddc->ISForDofs[i]=ISForDofs[i];
3549c0446d6SStefano Zampini   }
3559c0446d6SStefano Zampini   pcbddc->n_ISForDofs=n_is;
3569c0446d6SStefano Zampini   PetscFunctionReturn(0);
3579c0446d6SStefano Zampini }
3589c0446d6SStefano Zampini EXTERN_C_END
3599c0446d6SStefano Zampini #undef __FUNCT__
3609c0446d6SStefano Zampini #define __FUNCT__ "PCBDDCSetDofsSplitting"
3619c0446d6SStefano Zampini /*@
362da1bb401SStefano Zampini  PCBDDCSetDofsSplitting - Set index sets defining fields of local mat.
3639c0446d6SStefano Zampini 
3649c0446d6SStefano Zampini    Not collective
3659c0446d6SStefano Zampini 
3669c0446d6SStefano Zampini    Input Parameters:
3679c0446d6SStefano Zampini +  pc - the preconditioning context
368da1bb401SStefano Zampini -  n - number of index sets defining the fields
369da1bb401SStefano Zampini -  IS[] - array of IS describing the fields
3709c0446d6SStefano Zampini 
3719c0446d6SStefano Zampini    Level: intermediate
3729c0446d6SStefano Zampini 
3739c0446d6SStefano Zampini    Notes:
3749c0446d6SStefano Zampini 
3759c0446d6SStefano Zampini .seealso: PCBDDC
3769c0446d6SStefano Zampini @*/
3779c0446d6SStefano Zampini PetscErrorCode PCBDDCSetDofsSplitting(PC pc,PetscInt n_is, IS ISForDofs[])
3789c0446d6SStefano Zampini {
3799c0446d6SStefano Zampini   PetscErrorCode ierr;
3809c0446d6SStefano Zampini 
3819c0446d6SStefano Zampini   PetscFunctionBegin;
3829c0446d6SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
3839c0446d6SStefano Zampini   ierr = PetscTryMethod(pc,"PCBDDCSetDofsSplitting_C",(PC,PetscInt,IS[]),(pc,n_is,ISForDofs));CHKERRQ(ierr);
3849c0446d6SStefano Zampini   PetscFunctionReturn(0);
3859c0446d6SStefano Zampini }
386da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
387534831adSStefano Zampini #undef __FUNCT__
388534831adSStefano Zampini #define __FUNCT__ "PCPreSolve_BDDC"
389534831adSStefano Zampini /* -------------------------------------------------------------------------- */
390534831adSStefano Zampini /*
391534831adSStefano Zampini    PCPreSolve_BDDC - Changes the right hand side and (if necessary) the initial
392534831adSStefano Zampini                      guess if a transformation of basis approach has been selected.
3939c0446d6SStefano Zampini 
394534831adSStefano Zampini    Input Parameter:
395534831adSStefano Zampini +  pc - the preconditioner contex
396534831adSStefano Zampini 
397534831adSStefano Zampini    Application Interface Routine: PCPreSolve()
398534831adSStefano Zampini 
399534831adSStefano Zampini    Notes:
400534831adSStefano Zampini    The interface routine PCPreSolve() is not usually called directly by
401534831adSStefano Zampini    the user, but instead is called by KSPSolve().
402534831adSStefano Zampini */
403534831adSStefano Zampini static PetscErrorCode PCPreSolve_BDDC(PC pc, KSP ksp, Vec rhs, Vec x)
404534831adSStefano Zampini {
405534831adSStefano Zampini   PetscErrorCode ierr;
406534831adSStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
407534831adSStefano Zampini   PC_IS          *pcis = (PC_IS*)(pc->data);
408534831adSStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
409534831adSStefano Zampini   Mat            temp_mat;
4103972b0daSStefano Zampini   IS             dirIS;
4113972b0daSStefano Zampini   PetscInt       dirsize,i,*is_indices;
4123972b0daSStefano Zampini   PetscScalar    *array_x,*array_diagonal;
4133972b0daSStefano Zampini   Vec            used_vec;
4143972b0daSStefano Zampini   PetscBool      guess_nonzero;
415534831adSStefano Zampini 
416534831adSStefano Zampini   PetscFunctionBegin;
4173972b0daSStefano Zampini   if(x) {
4183972b0daSStefano Zampini     ierr = PetscObjectReference((PetscObject)x);CHKERRQ(ierr);
4193972b0daSStefano Zampini     used_vec = x;
4203972b0daSStefano Zampini   } else {
4213972b0daSStefano Zampini     ierr = PetscObjectReference((PetscObject)pcbddc->temp_solution);CHKERRQ(ierr);
4223972b0daSStefano Zampini     used_vec = pcbddc->temp_solution;
4233972b0daSStefano Zampini     ierr = VecSet(used_vec,0.0);CHKERRQ(ierr);
4243972b0daSStefano Zampini   }
4253972b0daSStefano Zampini   /* hack into ksp data structure PCPreSolve comes earlier in src/ksp/ksp/interface/itfunc.c */
4263972b0daSStefano Zampini   if (ksp) {
4273972b0daSStefano Zampini     ierr = KSPGetInitialGuessNonzero(ksp,&guess_nonzero);CHKERRQ(ierr);
4283972b0daSStefano Zampini     if( !guess_nonzero ) {
4293972b0daSStefano Zampini       ierr = VecSet(used_vec,0.0);CHKERRQ(ierr);
4303972b0daSStefano Zampini     }
4313972b0daSStefano Zampini   }
4323972b0daSStefano Zampini   /* store the original rhs */
4333972b0daSStefano Zampini   ierr = VecCopy(rhs,pcbddc->original_rhs);CHKERRQ(ierr);
434534831adSStefano Zampini   if(pcbddc->usechangeofbasis) {
435534831adSStefano Zampini     /* swap pointers for local matrices */
436534831adSStefano Zampini     temp_mat = matis->A;
437534831adSStefano Zampini     matis->A = pcbddc->local_mat;
438534831adSStefano Zampini     pcbddc->local_mat = temp_mat;
439534831adSStefano Zampini     /* Get local rhs and apply transformation of basis */
440534831adSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,rhs,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
441534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,rhs,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
442534831adSStefano Zampini     /* from original basis to modified basis */
443534831adSStefano Zampini     ierr = MatMultTranspose(pcbddc->ChangeOfBasisMatrix,pcis->vec1_B,pcis->vec2_B);CHKERRQ(ierr);
444534831adSStefano Zampini     /* put back modified values into the global vec using INSERT_VALUES copy mode */
445534831adSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec2_B,rhs,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
446534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec2_B,rhs,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
447534831adSStefano Zampini   }
4483972b0daSStefano Zampini 
4493972b0daSStefano Zampini   /* Take into account zeroed rows -> change rhs and store solution removed */
4503972b0daSStefano Zampini   ierr = MatGetDiagonal(pc->pmat,pcis->vec1_global);CHKERRQ(ierr);
4513972b0daSStefano Zampini   ierr = VecPointwiseDivide(pcis->vec1_global,rhs,pcis->vec1_global);CHKERRQ(ierr);
4523972b0daSStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4533972b0daSStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4543972b0daSStefano Zampini   ierr = VecScatterBegin(matis->ctx,used_vec,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4553972b0daSStefano Zampini   ierr = VecScatterEnd  (matis->ctx,used_vec,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4563972b0daSStefano Zampini   ierr = PCBDDCGetDirichletBoundaries(pc,&dirIS);CHKERRQ(ierr);
4573972b0daSStefano Zampini   if(dirIS) {
4583972b0daSStefano Zampini     ierr = ISGetSize(dirIS,&dirsize);CHKERRQ(ierr);
4593972b0daSStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array_x);CHKERRQ(ierr);
4603972b0daSStefano Zampini     ierr = VecGetArray(pcis->vec2_N,&array_diagonal);CHKERRQ(ierr);
4613972b0daSStefano Zampini     ierr = ISGetIndices(dirIS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
4623972b0daSStefano Zampini     for(i=0;i<dirsize;i++) {
4633972b0daSStefano Zampini       array_x[is_indices[i]]=array_diagonal[is_indices[i]];
4643972b0daSStefano Zampini     }
4653972b0daSStefano Zampini     ierr = ISRestoreIndices(dirIS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
4663972b0daSStefano Zampini     ierr = VecRestoreArray(pcis->vec2_N,&array_diagonal);CHKERRQ(ierr);
4673972b0daSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array_x);CHKERRQ(ierr);
4683972b0daSStefano Zampini   }
4693972b0daSStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4703972b0daSStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4713972b0daSStefano Zampini   /* remove the computed solution from the rhs */
4723972b0daSStefano Zampini   ierr = VecScale(used_vec,-1.0);CHKERRQ(ierr);
4733972b0daSStefano Zampini   ierr = MatMultAdd(pc->pmat,used_vec,rhs,rhs);CHKERRQ(ierr);
4743972b0daSStefano Zampini   ierr = VecScale(used_vec,-1.0);CHKERRQ(ierr);
4753972b0daSStefano Zampini   if(x) {
4763972b0daSStefano Zampini     /* store partially computed solution and set initial guess to 0 */
4773972b0daSStefano Zampini     ierr = VecCopy(used_vec,pcbddc->temp_solution);CHKERRQ(ierr);
4783972b0daSStefano Zampini     ierr = VecSet(used_vec,0.0);CHKERRQ(ierr);
4793972b0daSStefano Zampini   }
4803972b0daSStefano Zampini   ierr = VecDestroy(&used_vec);CHKERRQ(ierr);
481534831adSStefano Zampini   PetscFunctionReturn(0);
482534831adSStefano Zampini }
483534831adSStefano Zampini /* -------------------------------------------------------------------------- */
484534831adSStefano Zampini #undef __FUNCT__
485534831adSStefano Zampini #define __FUNCT__ "PCPostSolve_BDDC"
486534831adSStefano Zampini /* -------------------------------------------------------------------------- */
487534831adSStefano Zampini /*
488534831adSStefano Zampini    PCPostSolve_BDDC - Changes the computed solution if a transformation of basis
489534831adSStefano Zampini                      approach has been selected. Also, restores rhs to its original state.
490534831adSStefano Zampini 
491534831adSStefano Zampini    Input Parameter:
492534831adSStefano Zampini +  pc - the preconditioner contex
493534831adSStefano Zampini 
494534831adSStefano Zampini    Application Interface Routine: PCPostSolve()
495534831adSStefano Zampini 
496534831adSStefano Zampini    Notes:
497534831adSStefano Zampini    The interface routine PCPostSolve() is not usually called directly by
498534831adSStefano Zampini    the user, but instead is called by KSPSolve().
499534831adSStefano Zampini */
500534831adSStefano Zampini static PetscErrorCode PCPostSolve_BDDC(PC pc, KSP ksp, Vec rhs, Vec x)
501534831adSStefano Zampini {
502534831adSStefano Zampini   PetscErrorCode ierr;
503534831adSStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
504534831adSStefano Zampini   PC_IS          *pcis = (PC_IS*)(pc->data);
505534831adSStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
506534831adSStefano Zampini   Mat            temp_mat;
507534831adSStefano Zampini 
508534831adSStefano Zampini   PetscFunctionBegin;
509534831adSStefano Zampini   if(pcbddc->usechangeofbasis) {
510534831adSStefano Zampini     /* swap pointers for local matrices */
511534831adSStefano Zampini     temp_mat = matis->A;
512534831adSStefano Zampini     matis->A = pcbddc->local_mat;
513534831adSStefano Zampini     pcbddc->local_mat = temp_mat;
514534831adSStefano Zampini     /* restore rhs to its original state */
515*3425bc38SStefano Zampini     if(rhs) {
516*3425bc38SStefano Zampini       ierr = VecCopy(pcbddc->original_rhs,rhs);CHKERRQ(ierr);
517*3425bc38SStefano Zampini     }
518534831adSStefano Zampini     /* Get Local boundary and apply transformation of basis to solution vector */
519534831adSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,x,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
520534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,x,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
521534831adSStefano Zampini     /* from modified basis to original basis */
522534831adSStefano Zampini     ierr = MatMult(pcbddc->ChangeOfBasisMatrix,pcis->vec1_B,pcis->vec2_B);CHKERRQ(ierr);
523534831adSStefano Zampini     /* put back modified values into the global vec using INSERT_VALUES copy mode */
524534831adSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec2_B,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
525534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec2_B,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
526534831adSStefano Zampini   }
5273972b0daSStefano Zampini   /* add solution removed in presolve */
528*3425bc38SStefano Zampini   if(x) {
529*3425bc38SStefano Zampini     ierr = VecAXPY(x,1.0,pcbddc->temp_solution);CHKERRQ(ierr);
530*3425bc38SStefano Zampini   }
531534831adSStefano Zampini   PetscFunctionReturn(0);
532534831adSStefano Zampini }
533534831adSStefano Zampini /* -------------------------------------------------------------------------- */
53453cdbc3dSStefano Zampini #undef __FUNCT__
53553cdbc3dSStefano Zampini #define __FUNCT__ "PCSetUp_BDDC"
5360c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
5370c7d97c5SJed Brown /*
5380c7d97c5SJed Brown    PCSetUp_BDDC - Prepares for the use of the BDDC preconditioner
5390c7d97c5SJed Brown                   by setting data structures and options.
5400c7d97c5SJed Brown 
5410c7d97c5SJed Brown    Input Parameter:
54253cdbc3dSStefano Zampini +  pc - the preconditioner context
5430c7d97c5SJed Brown 
5440c7d97c5SJed Brown    Application Interface Routine: PCSetUp()
5450c7d97c5SJed Brown 
5460c7d97c5SJed Brown    Notes:
5470c7d97c5SJed Brown    The interface routine PCSetUp() is not usually called directly by
5480c7d97c5SJed Brown    the user, but instead is called by PCApply() if necessary.
5490c7d97c5SJed Brown */
55053cdbc3dSStefano Zampini PetscErrorCode PCSetUp_BDDC(PC pc)
5510c7d97c5SJed Brown {
5520c7d97c5SJed Brown   PetscErrorCode ierr;
5530c7d97c5SJed Brown   PC_BDDC*       pcbddc   = (PC_BDDC*)pc->data;
5540c7d97c5SJed Brown   PC_IS            *pcis = (PC_IS*)(pc->data);
5550c7d97c5SJed Brown 
5560c7d97c5SJed Brown   PetscFunctionBegin;
5570c7d97c5SJed Brown   if (!pc->setupcalled) {
5583b03a366Sstefano_zampini     /* For BDDC we need to define a local "Neumann" problem different to that defined in PCISSetup
5599c0446d6SStefano Zampini        So, we set to pcnone the Neumann problem of pcis in order to avoid unneeded computation
5600c7d97c5SJed Brown        Also, we decide to directly build the (same) Dirichlet problem */
5610c7d97c5SJed Brown     ierr = PetscOptionsSetValue("-is_localN_pc_type","none");CHKERRQ(ierr);
5620c7d97c5SJed Brown     ierr = PetscOptionsSetValue("-is_localD_pc_type","none");CHKERRQ(ierr);
5630c7d97c5SJed Brown     /* Set up all the "iterative substructuring" common block */
5640c7d97c5SJed Brown     ierr = PCISSetUp(pc);CHKERRQ(ierr);
5653b03a366Sstefano_zampini     /* Get stdout for dbg */
566e269702eSStefano Zampini     if(pcbddc->dbg_flag) {
567e269702eSStefano Zampini       ierr = PetscViewerASCIIGetStdout(((PetscObject)pc)->comm,&pcbddc->dbg_viewer);CHKERRQ(ierr);
568e269702eSStefano Zampini       ierr = PetscViewerASCIISynchronizedAllow(pcbddc->dbg_viewer,PETSC_TRUE);CHKERRQ(ierr);
569e269702eSStefano Zampini     }
5703b03a366Sstefano_zampini     /* TODO MOVE CODE FRAGMENT */
5710c7d97c5SJed Brown     PetscInt im_active=0;
5720c7d97c5SJed Brown     if(pcis->n) im_active = 1;
57353cdbc3dSStefano Zampini     ierr = MPI_Allreduce(&im_active,&pcbddc->active_procs,1,MPIU_INT,MPI_SUM,((PetscObject)pc)->comm);CHKERRQ(ierr);
5743b03a366Sstefano_zampini     /* Analyze local interface */
5750c7d97c5SJed Brown     ierr = PCBDDCManageLocalBoundaries(pc);CHKERRQ(ierr);
5763b03a366Sstefano_zampini     /* Set up local constraint matrix */
5773b03a366Sstefano_zampini     ierr = PCBDDCCreateConstraintMatrix(pc);CHKERRQ(ierr);
5780c7d97c5SJed Brown     /* Create coarse and local stuffs used for evaluating action of preconditioner */
5790c7d97c5SJed Brown     ierr = PCBDDCCoarseSetUp(pc);CHKERRQ(ierr);
5803b03a366Sstefano_zampini     /* Processes fakely involved in multilevel should not call ISLocalToGlobalMappingRestoreInfo */
5813b03a366Sstefano_zampini     if ( !pcis->n_neigh ) pcis->ISLocalToGlobalMappingGetInfoWasCalled=PETSC_FALSE;
5820c7d97c5SJed Brown   }
5830c7d97c5SJed Brown   PetscFunctionReturn(0);
5840c7d97c5SJed Brown }
5850c7d97c5SJed Brown 
5860c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
5870c7d97c5SJed Brown /*
5880c7d97c5SJed Brown    PCApply_BDDC - Applies the BDDC preconditioner to a vector.
5890c7d97c5SJed Brown 
5900c7d97c5SJed Brown    Input Parameters:
5910c7d97c5SJed Brown .  pc - the preconditioner context
5920c7d97c5SJed Brown .  r - input vector (global)
5930c7d97c5SJed Brown 
5940c7d97c5SJed Brown    Output Parameter:
5950c7d97c5SJed Brown .  z - output vector (global)
5960c7d97c5SJed Brown 
5970c7d97c5SJed Brown    Application Interface Routine: PCApply()
5980c7d97c5SJed Brown  */
5990c7d97c5SJed Brown #undef __FUNCT__
6000c7d97c5SJed Brown #define __FUNCT__ "PCApply_BDDC"
60153cdbc3dSStefano Zampini PetscErrorCode PCApply_BDDC(PC pc,Vec r,Vec z)
6020c7d97c5SJed Brown {
6030c7d97c5SJed Brown   PC_IS             *pcis = (PC_IS*)(pc->data);
6040c7d97c5SJed Brown   PC_BDDC           *pcbddc = (PC_BDDC*)(pc->data);
6050c7d97c5SJed Brown   PetscErrorCode    ierr;
6063b03a366Sstefano_zampini   const PetscScalar one = 1.0;
6073b03a366Sstefano_zampini   const PetscScalar m_one = -1.0;
6082617d88aSStefano Zampini   const PetscScalar zero = 0.0;
6090c7d97c5SJed Brown 
6100c7d97c5SJed Brown /* This code is similar to that provided in nn.c for PCNN
6110c7d97c5SJed Brown    NN interface preconditioner changed to BDDC
6120c7d97c5SJed Brown    Added support for M_3 preconditioenr in the reference article (code is active if pcbddc->prec_type = PETSC_TRUE) */
6130c7d97c5SJed Brown 
6140c7d97c5SJed Brown   PetscFunctionBegin;
6150c7d97c5SJed Brown   /* First Dirichlet solve */
6160c7d97c5SJed Brown   ierr = VecScatterBegin(pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
6170c7d97c5SJed Brown   ierr = VecScatterEnd  (pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
61853cdbc3dSStefano Zampini   ierr = KSPSolve(pcbddc->ksp_D,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
6190c7d97c5SJed Brown   /*
6200c7d97c5SJed Brown     Assembling right hand side for BDDC operator
6210c7d97c5SJed Brown     - vec1_D for the Dirichlet part (if needed, i.e. prec_flag=PETSC_TRUE)
6220c7d97c5SJed Brown     - the interface part of the global vector z
6230c7d97c5SJed Brown   */
6240c7d97c5SJed Brown   ierr = VecScale(pcis->vec2_D,m_one);CHKERRQ(ierr);
6250c7d97c5SJed Brown   ierr = MatMult(pcis->A_BI,pcis->vec2_D,pcis->vec1_B);CHKERRQ(ierr);
6260c7d97c5SJed Brown   if(pcbddc->prec_type) { ierr = MatMultAdd(pcis->A_II,pcis->vec2_D,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); }
6270c7d97c5SJed Brown   ierr = VecScale(pcis->vec2_D,m_one);CHKERRQ(ierr);
6280c7d97c5SJed Brown   ierr = VecCopy(r,z);CHKERRQ(ierr);
6290c7d97c5SJed Brown   ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
6300c7d97c5SJed Brown   ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
6310c7d97c5SJed Brown 
6322617d88aSStefano Zampini   /* Get Local boundary and apply partition of unity */
6332617d88aSStefano Zampini   ierr = VecScatterBegin(pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
6342617d88aSStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
6352617d88aSStefano Zampini   ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr);
6362617d88aSStefano Zampini 
6372617d88aSStefano Zampini   /* Apply interface preconditioner
6382617d88aSStefano Zampini      input/output vecs: pcis->vec1_B and pcis->vec1_D */
6392617d88aSStefano Zampini   ierr = PCBDDCApplyInterfacePreconditioner(pc);CHKERRQ(ierr);
6402617d88aSStefano Zampini 
6412617d88aSStefano Zampini   /* Apply partition of unity and sum boundary values */
6422617d88aSStefano Zampini   ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr);
6432617d88aSStefano Zampini   ierr = VecSet(z,zero);CHKERRQ(ierr);
6442617d88aSStefano Zampini   ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
6452617d88aSStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
6460c7d97c5SJed Brown 
6473b03a366Sstefano_zampini   /* Second Dirichlet solve and assembling of output */
6480c7d97c5SJed Brown   ierr = VecScatterBegin(pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
6490c7d97c5SJed Brown   ierr = VecScatterEnd  (pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
6500c7d97c5SJed Brown   ierr = MatMult(pcis->A_IB,pcis->vec1_B,pcis->vec3_D);CHKERRQ(ierr);
6510c7d97c5SJed Brown   if(pcbddc->prec_type) { ierr = MatMultAdd(pcis->A_II,pcis->vec1_D,pcis->vec3_D,pcis->vec3_D);CHKERRQ(ierr); }
65253cdbc3dSStefano Zampini   ierr = KSPSolve(pcbddc->ksp_D,pcis->vec3_D,pcbddc->vec4_D);CHKERRQ(ierr);
6530c7d97c5SJed Brown   ierr = VecScale(pcbddc->vec4_D,m_one);CHKERRQ(ierr);
6540c7d97c5SJed Brown   if(pcbddc->prec_type) { ierr = VecAXPY (pcbddc->vec4_D,one,pcis->vec1_D);CHKERRQ(ierr); }
6550c7d97c5SJed Brown   ierr = VecAXPY (pcis->vec2_D,one,pcbddc->vec4_D);CHKERRQ(ierr);
6560c7d97c5SJed Brown   ierr = VecScatterBegin(pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
6570c7d97c5SJed Brown   ierr = VecScatterEnd  (pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
6580c7d97c5SJed Brown   PetscFunctionReturn(0);
6590c7d97c5SJed Brown 
6600c7d97c5SJed Brown }
661da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
662da1bb401SStefano Zampini #undef __FUNCT__
663da1bb401SStefano Zampini #define __FUNCT__ "PCDestroy_BDDC"
664da1bb401SStefano Zampini PetscErrorCode PCDestroy_BDDC(PC pc)
665da1bb401SStefano Zampini {
666da1bb401SStefano Zampini   PC_BDDC          *pcbddc = (PC_BDDC*)pc->data;
667da1bb401SStefano Zampini   PetscErrorCode ierr;
668da1bb401SStefano Zampini 
669da1bb401SStefano Zampini   PetscFunctionBegin;
670da1bb401SStefano Zampini   /* free data created by PCIS */
671da1bb401SStefano Zampini   ierr = PCISDestroy(pc);CHKERRQ(ierr);
672da1bb401SStefano Zampini   /* free BDDC data  */
6733972b0daSStefano Zampini   ierr = VecDestroy(&pcbddc->temp_solution);CHKERRQ(ierr);
674534831adSStefano Zampini   ierr = VecDestroy(&pcbddc->original_rhs);CHKERRQ(ierr);
675534831adSStefano Zampini   ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr);
676534831adSStefano Zampini   ierr = MatDestroy(&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr);
677da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->coarse_vec);CHKERRQ(ierr);
678da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->coarse_rhs);CHKERRQ(ierr);
679da1bb401SStefano Zampini   ierr = KSPDestroy(&pcbddc->coarse_ksp);CHKERRQ(ierr);
680da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->coarse_mat);CHKERRQ(ierr);
681da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->coarse_phi_B);CHKERRQ(ierr);
682da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->coarse_phi_D);CHKERRQ(ierr);
683da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec1_P);CHKERRQ(ierr);
684da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec1_C);CHKERRQ(ierr);
685da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->local_auxmat1);CHKERRQ(ierr);
686da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->local_auxmat2);CHKERRQ(ierr);
687da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec1_R);CHKERRQ(ierr);
688da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec2_R);CHKERRQ(ierr);
689da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec4_D);CHKERRQ(ierr);
690da1bb401SStefano Zampini   ierr = VecScatterDestroy(&pcbddc->R_to_B);CHKERRQ(ierr);
691da1bb401SStefano Zampini   ierr = VecScatterDestroy(&pcbddc->R_to_D);CHKERRQ(ierr);
692da1bb401SStefano Zampini   ierr = VecScatterDestroy(&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr);
693da1bb401SStefano Zampini   ierr = KSPDestroy(&pcbddc->ksp_D);CHKERRQ(ierr);
694da1bb401SStefano Zampini   ierr = KSPDestroy(&pcbddc->ksp_R);CHKERRQ(ierr);
695da1bb401SStefano Zampini   ierr = ISDestroy(&pcbddc->NeumannBoundaries);CHKERRQ(ierr);
696da1bb401SStefano Zampini   ierr = ISDestroy(&pcbddc->DirichletBoundaries);CHKERRQ(ierr);
697da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->ConstraintMatrix);CHKERRQ(ierr);
698da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->local_primal_indices);CHKERRQ(ierr);
699da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->replicated_local_primal_indices);CHKERRQ(ierr);
700da1bb401SStefano Zampini   if (pcbddc->replicated_local_primal_values)    { free(pcbddc->replicated_local_primal_values); }
701da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->local_primal_displacements);CHKERRQ(ierr);
702da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->local_primal_sizes);CHKERRQ(ierr);
703da1bb401SStefano Zampini   PetscInt i;
704da1bb401SStefano Zampini   for(i=0;i<pcbddc->n_ISForDofs;i++) { ierr = ISDestroy(&pcbddc->ISForDofs[i]);CHKERRQ(ierr); }
705da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->ISForDofs);CHKERRQ(ierr);
706da1bb401SStefano Zampini   for(i=0;i<pcbddc->n_ISForFaces;i++) { ierr = ISDestroy(&pcbddc->ISForFaces[i]);CHKERRQ(ierr); }
707da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->ISForFaces);CHKERRQ(ierr);
708da1bb401SStefano Zampini   for(i=0;i<pcbddc->n_ISForEdges;i++) { ierr = ISDestroy(&pcbddc->ISForEdges[i]);CHKERRQ(ierr); }
709da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->ISForEdges);CHKERRQ(ierr);
710da1bb401SStefano Zampini   ierr = ISDestroy(&pcbddc->ISForVertices);CHKERRQ(ierr);
7113972b0daSStefano Zampini   /* Free graph structure */
712da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->xadj);CHKERRQ(ierr);
713da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->adjncy);CHKERRQ(ierr);
714da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->neighbours_set[0]);CHKERRQ(ierr);
715da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->neighbours_set);CHKERRQ(ierr);
7163972b0daSStefano Zampini   ierr = PetscFree4(pcbddc->mat_graph->where,pcbddc->mat_graph->count,pcbddc->mat_graph->cptr,pcbddc->mat_graph->queue);CHKERRQ(ierr);
7173972b0daSStefano Zampini   ierr = PetscFree2(pcbddc->mat_graph->which_dof,pcbddc->mat_graph->touched);CHKERRQ(ierr);
7183972b0daSStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->where_ncmps);CHKERRQ(ierr);
719da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph);CHKERRQ(ierr);
720*3425bc38SStefano Zampini   /* remove functions */
721*3425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDirichletBoundaries_C","",PETSC_NULL);CHKERRQ(ierr);
722*3425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNeumannBoundaries_C","",PETSC_NULL);CHKERRQ(ierr);
723*3425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetDirichletBoundaries_C","",PETSC_NULL);CHKERRQ(ierr);
724*3425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetNeumannBoundaries_C","",PETSC_NULL);CHKERRQ(ierr);
725*3425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseProblemType_C","",PETSC_NULL);CHKERRQ(ierr);
726*3425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDofsSplitting_C","",PETSC_NULL);CHKERRQ(ierr);
727*3425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetLocalAdjacencyGraph_C","",PETSC_NULL);CHKERRQ(ierr);
728*3425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPreSolve_C","",PETSC_NULL);CHKERRQ(ierr);
729*3425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPostSolve_C","",PETSC_NULL);CHKERRQ(ierr);
730*3425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCCreateFETIDPOperators_C","",PETSC_NULL);CHKERRQ(ierr);
731*3425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetRHS_C","",PETSC_NULL);CHKERRQ(ierr);
732*3425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetSolution_C","",PETSC_NULL);CHKERRQ(ierr);
733da1bb401SStefano Zampini   /* Free the private data structure that was hanging off the PC */
734da1bb401SStefano Zampini   ierr = PetscFree(pcbddc);CHKERRQ(ierr);
735da1bb401SStefano Zampini   PetscFunctionReturn(0);
736da1bb401SStefano Zampini }
737*3425bc38SStefano Zampini /* -------------------------------------------------------------------------- */
738*3425bc38SStefano Zampini EXTERN_C_BEGIN
739*3425bc38SStefano Zampini #undef __FUNCT__
740*3425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetRHS_BDDC"
741*3425bc38SStefano Zampini static PetscErrorCode PCBDDCMatFETIDPGetRHS_BDDC(Mat fetidp_mat, Vec standard_rhs, Vec fetidp_flux_rhs)
742*3425bc38SStefano Zampini {
743*3425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
744*3425bc38SStefano Zampini   PC_IS*         pcis;
745*3425bc38SStefano Zampini   PC_BDDC*       pcbddc;
746*3425bc38SStefano Zampini   Mat_IS*        matis;
747*3425bc38SStefano Zampini   PetscErrorCode ierr;
7480c7d97c5SJed Brown 
749*3425bc38SStefano Zampini   PetscFunctionBegin;
750*3425bc38SStefano Zampini   ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr);
751*3425bc38SStefano Zampini   pcis = (PC_IS*)mat_ctx->pc->data;
752*3425bc38SStefano Zampini   pcbddc = (PC_BDDC*)mat_ctx->pc->data;
753*3425bc38SStefano Zampini   matis = (Mat_IS*)mat_ctx->pc->pmat->data;
754*3425bc38SStefano Zampini 
755*3425bc38SStefano Zampini   /* change of basis for physical rhs if needed
756*3425bc38SStefano Zampini      It also changes the rhs in case of dirichlet boundaries */
757*3425bc38SStefano Zampini   (*mat_ctx->pc->ops->presolve)(mat_ctx->pc,PETSC_NULL,standard_rhs,PETSC_NULL);
758*3425bc38SStefano Zampini   /* store vectors for computation of fetidp final solution */
759*3425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->global_to_D,standard_rhs,mat_ctx->temp_solution_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
760*3425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_D,standard_rhs,mat_ctx->temp_solution_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
761*3425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
762*3425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
763*3425bc38SStefano Zampini   /* scale rhs since it should be unassembled */
764*3425bc38SStefano Zampini   ierr = VecPointwiseMult(mat_ctx->temp_solution_B,pcis->D,mat_ctx->temp_solution_B);CHKERRQ(ierr);
765*3425bc38SStefano Zampini   if(!pcbddc->prec_type) {
766*3425bc38SStefano Zampini     /* compute partially subassembled Schur complement right-hand side */
767*3425bc38SStefano Zampini     ierr = KSPSolve(pcbddc->ksp_D,mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr);
768*3425bc38SStefano Zampini     ierr = MatMult(pcis->A_BI,pcis->vec1_D,pcis->vec1_B);CHKERRQ(ierr);
769*3425bc38SStefano Zampini     ierr = VecAXPY(mat_ctx->temp_solution_B,-1.0,pcis->vec1_B);CHKERRQ(ierr);
770*3425bc38SStefano Zampini     ierr = VecSet(standard_rhs,0.0);CHKERRQ(ierr);
771*3425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,mat_ctx->temp_solution_B,standard_rhs,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
772*3425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,mat_ctx->temp_solution_B,standard_rhs,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
773*3425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
774*3425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
775*3425bc38SStefano Zampini     ierr = VecPointwiseMult(mat_ctx->temp_solution_B,pcis->D,mat_ctx->temp_solution_B);CHKERRQ(ierr);
776*3425bc38SStefano Zampini   }
777*3425bc38SStefano Zampini   /* BDDC rhs */
778*3425bc38SStefano Zampini   ierr = VecCopy(mat_ctx->temp_solution_B,pcis->vec1_B);CHKERRQ(ierr);
779*3425bc38SStefano Zampini   if(pcbddc->prec_type) {
780*3425bc38SStefano Zampini     ierr = VecCopy(mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr);
781*3425bc38SStefano Zampini   }
782*3425bc38SStefano Zampini   /* apply BDDC */
783*3425bc38SStefano Zampini   ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr);
784*3425bc38SStefano Zampini   /* Application of B_delta and assembling of rhs for fetidp fluxes */
785*3425bc38SStefano Zampini   ierr = VecSet(fetidp_flux_rhs,0.0);CHKERRQ(ierr);
786*3425bc38SStefano Zampini   ierr = MatMult(mat_ctx->B_delta,pcis->vec1_B,mat_ctx->lambda_local);CHKERRQ(ierr);
787*3425bc38SStefano Zampini   ierr = VecScatterBegin(mat_ctx->l2g_lambda,mat_ctx->lambda_local,fetidp_flux_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
788*3425bc38SStefano Zampini   ierr = VecScatterEnd  (mat_ctx->l2g_lambda,mat_ctx->lambda_local,fetidp_flux_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
789*3425bc38SStefano Zampini   /* restore original rhs */
790*3425bc38SStefano Zampini   ierr = VecCopy(pcbddc->original_rhs,standard_rhs);CHKERRQ(ierr);
791*3425bc38SStefano Zampini   PetscFunctionReturn(0);
792*3425bc38SStefano Zampini }
793*3425bc38SStefano Zampini EXTERN_C_END
794*3425bc38SStefano Zampini #undef __FUNCT__
795*3425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetRHS"
796*3425bc38SStefano Zampini /*@
797*3425bc38SStefano Zampini  PCBDDCMatFETIDPGetRHS - Get rhs for FETIDP linear system.
798*3425bc38SStefano Zampini 
799*3425bc38SStefano Zampini    Collective
800*3425bc38SStefano Zampini 
801*3425bc38SStefano Zampini    Input Parameters:
802*3425bc38SStefano Zampini +  fetidp_mat   - the FETIDP mat obtained by a call to PCBDDCCreateFETIDPOperators
803*3425bc38SStefano Zampini +  standard_rhs - the rhs of your linear system
804*3425bc38SStefano Zampini 
805*3425bc38SStefano Zampini    Output Parameters:
806*3425bc38SStefano Zampini +  fetidp_flux_rhs   - the rhs of the FETIDP linear system
807*3425bc38SStefano Zampini 
808*3425bc38SStefano Zampini    Level: developer
809*3425bc38SStefano Zampini 
810*3425bc38SStefano Zampini    Notes:
811*3425bc38SStefano Zampini 
812*3425bc38SStefano Zampini .seealso: PCBDDC
813*3425bc38SStefano Zampini @*/
814*3425bc38SStefano Zampini PetscErrorCode PCBDDCMatFETIDPGetRHS(Mat fetidp_mat, Vec standard_rhs, Vec fetidp_flux_rhs)
815*3425bc38SStefano Zampini {
816*3425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
817*3425bc38SStefano Zampini   PetscErrorCode ierr;
818*3425bc38SStefano Zampini 
819*3425bc38SStefano Zampini   PetscFunctionBegin;
820*3425bc38SStefano Zampini   ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr);
821*3425bc38SStefano Zampini   ierr = PetscTryMethod(mat_ctx->pc,"PCBDDCMatFETIDPGetRHS_C",(Mat,Vec,Vec),(fetidp_mat,standard_rhs,fetidp_flux_rhs));CHKERRQ(ierr);
822*3425bc38SStefano Zampini   PetscFunctionReturn(0);
823*3425bc38SStefano Zampini }
824*3425bc38SStefano Zampini /* -------------------------------------------------------------------------- */
825*3425bc38SStefano Zampini EXTERN_C_BEGIN
826*3425bc38SStefano Zampini #undef __FUNCT__
827*3425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetSolution_BDDC"
828*3425bc38SStefano Zampini static PetscErrorCode PCBDDCMatFETIDPGetSolution_BDDC(Mat fetidp_mat, Vec fetidp_flux_sol, Vec standard_sol)
829*3425bc38SStefano Zampini {
830*3425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
831*3425bc38SStefano Zampini   PC_IS*         pcis;
832*3425bc38SStefano Zampini   PC_BDDC*       pcbddc;
833*3425bc38SStefano Zampini   Mat_IS*        matis;
834*3425bc38SStefano Zampini   PetscErrorCode ierr;
835*3425bc38SStefano Zampini 
836*3425bc38SStefano Zampini   PetscFunctionBegin;
837*3425bc38SStefano Zampini   ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr);
838*3425bc38SStefano Zampini   pcis = (PC_IS*)mat_ctx->pc->data;
839*3425bc38SStefano Zampini   pcbddc = (PC_BDDC*)mat_ctx->pc->data;
840*3425bc38SStefano Zampini   matis = (Mat_IS*)mat_ctx->pc->pmat->data;
841*3425bc38SStefano Zampini 
842*3425bc38SStefano Zampini   /* apply B_delta^T */
843*3425bc38SStefano Zampini   ierr = VecScatterBegin(mat_ctx->l2g_lambda,fetidp_flux_sol,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
844*3425bc38SStefano Zampini   ierr = VecScatterEnd  (mat_ctx->l2g_lambda,fetidp_flux_sol,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
845*3425bc38SStefano Zampini   ierr = MatMultTranspose(mat_ctx->B_delta,mat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
846*3425bc38SStefano Zampini   /* compute rhs for BDDC application */
847*3425bc38SStefano Zampini   ierr = VecAYPX(pcis->vec1_B,-1.0,mat_ctx->temp_solution_B);CHKERRQ(ierr);
848*3425bc38SStefano Zampini   if(pcbddc->prec_type) {
849*3425bc38SStefano Zampini     ierr = VecCopy(mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr);
850*3425bc38SStefano Zampini   }
851*3425bc38SStefano Zampini   /* apply BDDC */
852*3425bc38SStefano Zampini   ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr);
853*3425bc38SStefano Zampini   /* put values into standard global vector */
854*3425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
855*3425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
856*3425bc38SStefano Zampini   if(!pcbddc->prec_type) {
857*3425bc38SStefano Zampini     /* compute values into the interior if solved for the partially subassembled Schur complement */
858*3425bc38SStefano Zampini     ierr = MatMult(pcis->A_IB,pcis->vec1_B,pcis->vec1_D);CHKERRQ(ierr);
859*3425bc38SStefano Zampini     ierr = VecAXPY(mat_ctx->temp_solution_D,-1.0,pcis->vec1_D);CHKERRQ(ierr);
860*3425bc38SStefano Zampini     ierr = KSPSolve(pcbddc->ksp_D,mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr);
861*3425bc38SStefano Zampini   }
862*3425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->global_to_D,pcis->vec1_D,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
863*3425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_D,pcis->vec1_D,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
864*3425bc38SStefano Zampini   /* final change of basis if needed
865*3425bc38SStefano Zampini      Is also sums the dirichlet part removed during RHS assembling */
866*3425bc38SStefano Zampini   (*mat_ctx->pc->ops->postsolve)(mat_ctx->pc,PETSC_NULL,PETSC_NULL,standard_sol);
867*3425bc38SStefano Zampini   PetscFunctionReturn(0);
868*3425bc38SStefano Zampini 
869*3425bc38SStefano Zampini }
870*3425bc38SStefano Zampini EXTERN_C_END
871*3425bc38SStefano Zampini #undef __FUNCT__
872*3425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetSolution"
873*3425bc38SStefano Zampini /*@
874*3425bc38SStefano Zampini  PCBDDCMatFETIDPGetSolution - Get Solution for FETIDP linear system.
875*3425bc38SStefano Zampini 
876*3425bc38SStefano Zampini    Collective
877*3425bc38SStefano Zampini 
878*3425bc38SStefano Zampini    Input Parameters:
879*3425bc38SStefano Zampini +  fetidp_mat        - the FETIDP mat obtained by a call to PCBDDCCreateFETIDPOperators
880*3425bc38SStefano Zampini +  fetidp_flux_sol - the solution of the FETIDP linear system
881*3425bc38SStefano Zampini 
882*3425bc38SStefano Zampini    Output Parameters:
883*3425bc38SStefano Zampini +  standard_sol      - the solution on the global domain
884*3425bc38SStefano Zampini 
885*3425bc38SStefano Zampini    Level: developer
886*3425bc38SStefano Zampini 
887*3425bc38SStefano Zampini    Notes:
888*3425bc38SStefano Zampini 
889*3425bc38SStefano Zampini .seealso: PCBDDC
890*3425bc38SStefano Zampini @*/
891*3425bc38SStefano Zampini PetscErrorCode PCBDDCMatFETIDPGetSolution(Mat fetidp_mat, Vec fetidp_flux_sol, Vec standard_sol)
892*3425bc38SStefano Zampini {
893*3425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
894*3425bc38SStefano Zampini   PetscErrorCode ierr;
895*3425bc38SStefano Zampini 
896*3425bc38SStefano Zampini   PetscFunctionBegin;
897*3425bc38SStefano Zampini   ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr);
898*3425bc38SStefano Zampini   ierr = PetscTryMethod(mat_ctx->pc,"PCBDDCMatFETIDPGetSolution_C",(Mat,Vec,Vec),(fetidp_mat,fetidp_flux_sol,standard_sol));CHKERRQ(ierr);
899*3425bc38SStefano Zampini   PetscFunctionReturn(0);
900*3425bc38SStefano Zampini }
901*3425bc38SStefano Zampini /* -------------------------------------------------------------------------- */
902*3425bc38SStefano Zampini EXTERN_C_BEGIN
903*3425bc38SStefano Zampini #undef __FUNCT__
904*3425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPOperators_BDDC"
905*3425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPOperators_BDDC(PC pc, Mat *fetidp_mat, PC *fetidp_pc)
906*3425bc38SStefano Zampini {
907*3425bc38SStefano Zampini   PETSC_EXTERN PetscErrorCode FETIDPMatMult(Mat,Vec,Vec);
908*3425bc38SStefano Zampini   PETSC_EXTERN PetscErrorCode PCBDDCDestroyFETIDPMat(Mat);
909*3425bc38SStefano Zampini   PETSC_EXTERN PetscErrorCode FETIDPPCApply(PC,Vec,Vec);
910*3425bc38SStefano Zampini   PETSC_EXTERN PetscErrorCode PCBDDCDestroyFETIDPPC(PC);
911*3425bc38SStefano Zampini 
912*3425bc38SStefano Zampini   FETIDPMat_ctx  *fetidpmat_ctx;
913*3425bc38SStefano Zampini   Mat            newmat;
914*3425bc38SStefano Zampini   FETIDPPC_ctx  *fetidppc_ctx;
915*3425bc38SStefano Zampini   PC             newpc;
916*3425bc38SStefano Zampini   MPI_Comm       comm = ((PetscObject)pc)->comm;
917*3425bc38SStefano Zampini   PetscErrorCode ierr;
918*3425bc38SStefano Zampini 
919*3425bc38SStefano Zampini   PetscFunctionBegin;
920*3425bc38SStefano Zampini   /* FETIDP linear matrix */
921*3425bc38SStefano Zampini   ierr = PCBDDCCreateFETIDPMatContext(pc, &fetidpmat_ctx);CHKERRQ(ierr);
922*3425bc38SStefano Zampini   ierr = PCBDDCSetupFETIDPMatContext(fetidpmat_ctx);CHKERRQ(ierr);
923*3425bc38SStefano Zampini   ierr = MatCreateShell(comm,PETSC_DECIDE,PETSC_DECIDE,fetidpmat_ctx->n_lambda,fetidpmat_ctx->n_lambda,fetidpmat_ctx,&newmat);CHKERRQ(ierr);
924*3425bc38SStefano Zampini   ierr = MatShellSetOperation(newmat,MATOP_MULT,(void (*)(void))FETIDPMatMult);CHKERRQ(ierr);
925*3425bc38SStefano Zampini   ierr = MatShellSetOperation(newmat,MATOP_DESTROY,(void (*)(void))PCBDDCDestroyFETIDPMat);CHKERRQ(ierr);
926*3425bc38SStefano Zampini   ierr = MatSetUp(newmat);CHKERRQ(ierr);
927*3425bc38SStefano Zampini   /* FETIDP preconditioner */
928*3425bc38SStefano Zampini   ierr = PCBDDCCreateFETIDPPCContext(pc, &fetidppc_ctx);CHKERRQ(ierr);
929*3425bc38SStefano Zampini   ierr = PCBDDCSetupFETIDPPCContext(newmat,fetidppc_ctx);CHKERRQ(ierr);
930*3425bc38SStefano Zampini   ierr = PCCreate(comm,&newpc);CHKERRQ(ierr);
931*3425bc38SStefano Zampini   ierr = PCSetType(newpc,PCSHELL);CHKERRQ(ierr);
932*3425bc38SStefano Zampini   ierr = PCShellSetContext(newpc,fetidppc_ctx);CHKERRQ(ierr);
933*3425bc38SStefano Zampini   ierr = PCShellSetApply(newpc,FETIDPPCApply);CHKERRQ(ierr);
934*3425bc38SStefano Zampini   ierr = PCShellSetDestroy(newpc,PCBDDCDestroyFETIDPPC);CHKERRQ(ierr);
935*3425bc38SStefano Zampini   ierr = PCSetOperators(newpc,newmat,newmat,SAME_PRECONDITIONER);CHKERRQ(ierr);
936*3425bc38SStefano Zampini   ierr = PCSetUp(newpc);CHKERRQ(ierr);
937*3425bc38SStefano Zampini   /* return pointers for objects created */
938*3425bc38SStefano Zampini   *fetidp_mat=newmat;
939*3425bc38SStefano Zampini   *fetidp_pc=newpc;
940*3425bc38SStefano Zampini 
941*3425bc38SStefano Zampini   PetscFunctionReturn(0);
942*3425bc38SStefano Zampini }
943*3425bc38SStefano Zampini EXTERN_C_END
944*3425bc38SStefano Zampini #undef __FUNCT__
945*3425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPOperators"
946*3425bc38SStefano Zampini /*@
947*3425bc38SStefano Zampini  PCBDDCCreateFETIDPOperators - Create operators for FETIDP.
948*3425bc38SStefano Zampini 
949*3425bc38SStefano Zampini    Collective
950*3425bc38SStefano Zampini 
951*3425bc38SStefano Zampini    Input Parameters:
952*3425bc38SStefano Zampini +  pc - the BDDC preconditioning context (setup must be already called)
953*3425bc38SStefano Zampini 
954*3425bc38SStefano Zampini    Level: developer
955*3425bc38SStefano Zampini 
956*3425bc38SStefano Zampini    Notes:
957*3425bc38SStefano Zampini 
958*3425bc38SStefano Zampini .seealso: PCBDDC
959*3425bc38SStefano Zampini @*/
960*3425bc38SStefano Zampini PetscErrorCode PCBDDCCreateFETIDPOperators(PC pc, Mat *fetidp_mat, PC *fetidp_pc)
961*3425bc38SStefano Zampini {
962*3425bc38SStefano Zampini   PetscErrorCode ierr;
963*3425bc38SStefano Zampini 
964*3425bc38SStefano Zampini   PetscFunctionBegin;
965*3425bc38SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
966*3425bc38SStefano Zampini   if (pc->setupcalled) {
967*3425bc38SStefano Zampini     ierr = PetscTryMethod(pc,"PCBDDCCreateFETIDPOperators_C",(PC,Mat*,PC*),(pc,fetidp_mat,fetidp_pc));CHKERRQ(ierr);
968*3425bc38SStefano Zampini   } else {
969*3425bc38SStefano Zampini     SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"You must call PCSetup_BDDC before calling %s\n",__FUNCT__);
970*3425bc38SStefano Zampini   }
971*3425bc38SStefano Zampini   PetscFunctionReturn(0);
972*3425bc38SStefano Zampini }
9730c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
974da1bb401SStefano Zampini /*MC
975da1bb401SStefano Zampini    PCBDDC - Balancing Domain Decomposition by Constraints.
9760c7d97c5SJed Brown 
977da1bb401SStefano Zampini    Options Database Keys:
978da1bb401SStefano Zampini .    -pcbddc ??? -
979da1bb401SStefano Zampini 
980da1bb401SStefano Zampini    Level: intermediate
981da1bb401SStefano Zampini 
982da1bb401SStefano Zampini    Notes: The matrix used with this preconditioner must be of type MATIS
983da1bb401SStefano Zampini 
984da1bb401SStefano Zampini           Unlike more 'conventional' interface preconditioners, this iterates over ALL the
985da1bb401SStefano Zampini           degrees of freedom, NOT just those on the interface (this allows the use of approximate solvers
986da1bb401SStefano Zampini           on the subdomains).
987da1bb401SStefano Zampini 
988da1bb401SStefano Zampini           Options for the coarse grid preconditioner can be set with -
989da1bb401SStefano Zampini           Options for the Dirichlet subproblem can be set with -
990da1bb401SStefano Zampini           Options for the Neumann subproblem can be set with -
991da1bb401SStefano Zampini 
992da1bb401SStefano Zampini    Contributed by Stefano Zampini
993da1bb401SStefano Zampini 
994da1bb401SStefano Zampini .seealso:  PCCreate(), PCSetType(), PCType (for list of available types), PC,  MATIS
995da1bb401SStefano Zampini M*/
996da1bb401SStefano Zampini EXTERN_C_BEGIN
997da1bb401SStefano Zampini #undef __FUNCT__
998da1bb401SStefano Zampini #define __FUNCT__ "PCCreate_BDDC"
999da1bb401SStefano Zampini PetscErrorCode PCCreate_BDDC(PC pc)
1000da1bb401SStefano Zampini {
1001da1bb401SStefano Zampini   PetscErrorCode ierr;
1002da1bb401SStefano Zampini   PC_BDDC        *pcbddc;
1003da1bb401SStefano Zampini   PCBDDCGraph    mat_graph;
1004da1bb401SStefano Zampini 
1005da1bb401SStefano Zampini   PetscFunctionBegin;
1006da1bb401SStefano Zampini   /* Creates the private data structure for this preconditioner and attach it to the PC object. */
1007da1bb401SStefano Zampini   ierr      = PetscNewLog(pc,PC_BDDC,&pcbddc);CHKERRQ(ierr);
1008da1bb401SStefano Zampini   pc->data  = (void*)pcbddc;
1009da1bb401SStefano Zampini 
1010da1bb401SStefano Zampini   /* create PCIS data structure */
1011da1bb401SStefano Zampini   ierr = PCISCreate(pc);CHKERRQ(ierr);
1012da1bb401SStefano Zampini 
1013da1bb401SStefano Zampini   /* BDDC specific */
10143972b0daSStefano Zampini   pcbddc->temp_solution              = 0;
1015534831adSStefano Zampini   pcbddc->original_rhs               = 0;
1016534831adSStefano Zampini   pcbddc->local_mat                  = 0;
1017534831adSStefano Zampini   pcbddc->ChangeOfBasisMatrix        = 0;
1018534831adSStefano Zampini   pcbddc->usechangeofbasis           = PETSC_TRUE;
1019534831adSStefano Zampini   pcbddc->usechangeonfaces           = PETSC_FALSE;
1020da1bb401SStefano Zampini   pcbddc->coarse_vec                 = 0;
1021da1bb401SStefano Zampini   pcbddc->coarse_rhs                 = 0;
1022da1bb401SStefano Zampini   pcbddc->coarse_ksp                 = 0;
1023da1bb401SStefano Zampini   pcbddc->coarse_phi_B               = 0;
1024da1bb401SStefano Zampini   pcbddc->coarse_phi_D               = 0;
1025da1bb401SStefano Zampini   pcbddc->vec1_P                     = 0;
1026da1bb401SStefano Zampini   pcbddc->vec1_R                     = 0;
1027da1bb401SStefano Zampini   pcbddc->vec2_R                     = 0;
1028da1bb401SStefano Zampini   pcbddc->local_auxmat1              = 0;
1029da1bb401SStefano Zampini   pcbddc->local_auxmat2              = 0;
1030da1bb401SStefano Zampini   pcbddc->R_to_B                     = 0;
1031da1bb401SStefano Zampini   pcbddc->R_to_D                     = 0;
1032da1bb401SStefano Zampini   pcbddc->ksp_D                      = 0;
1033da1bb401SStefano Zampini   pcbddc->ksp_R                      = 0;
1034da1bb401SStefano Zampini   pcbddc->local_primal_indices       = 0;
1035da1bb401SStefano Zampini   pcbddc->prec_type                  = PETSC_FALSE;
1036da1bb401SStefano Zampini   pcbddc->NeumannBoundaries          = 0;
1037da1bb401SStefano Zampini   pcbddc->ISForDofs                  = 0;
1038da1bb401SStefano Zampini   pcbddc->ISForVertices              = 0;
1039da1bb401SStefano Zampini   pcbddc->n_ISForFaces               = 0;
1040da1bb401SStefano Zampini   pcbddc->n_ISForEdges               = 0;
1041da1bb401SStefano Zampini   pcbddc->ConstraintMatrix           = 0;
1042da1bb401SStefano Zampini   pcbddc->use_nnsp_true              = PETSC_FALSE;
1043da1bb401SStefano Zampini   pcbddc->local_primal_sizes         = 0;
1044da1bb401SStefano Zampini   pcbddc->local_primal_displacements = 0;
1045da1bb401SStefano Zampini   pcbddc->replicated_local_primal_indices = 0;
1046da1bb401SStefano Zampini   pcbddc->replicated_local_primal_values  = 0;
1047da1bb401SStefano Zampini   pcbddc->coarse_loc_to_glob         = 0;
1048da1bb401SStefano Zampini   pcbddc->dbg_flag                   = PETSC_FALSE;
1049da1bb401SStefano Zampini   pcbddc->coarsening_ratio           = 8;
1050da1bb401SStefano Zampini 
1051da1bb401SStefano Zampini   /* allocate and initialize needed graph structure */
1052da1bb401SStefano Zampini   ierr = PetscMalloc(sizeof(*mat_graph),&pcbddc->mat_graph);CHKERRQ(ierr);
1053da1bb401SStefano Zampini   pcbddc->mat_graph->xadj            = 0;
1054da1bb401SStefano Zampini   pcbddc->mat_graph->adjncy          = 0;
1055da1bb401SStefano Zampini 
1056da1bb401SStefano Zampini   /* function pointers */
1057da1bb401SStefano Zampini   pc->ops->apply               = PCApply_BDDC;
1058da1bb401SStefano Zampini   pc->ops->applytranspose      = 0;
1059da1bb401SStefano Zampini   pc->ops->setup               = PCSetUp_BDDC;
1060da1bb401SStefano Zampini   pc->ops->destroy             = PCDestroy_BDDC;
1061da1bb401SStefano Zampini   pc->ops->setfromoptions      = PCSetFromOptions_BDDC;
1062da1bb401SStefano Zampini   pc->ops->view                = 0;
1063da1bb401SStefano Zampini   pc->ops->applyrichardson     = 0;
1064da1bb401SStefano Zampini   pc->ops->applysymmetricleft  = 0;
1065da1bb401SStefano Zampini   pc->ops->applysymmetricright = 0;
1066534831adSStefano Zampini   pc->ops->presolve            = PCPreSolve_BDDC;
1067534831adSStefano Zampini   pc->ops->postsolve           = PCPostSolve_BDDC;
1068da1bb401SStefano Zampini 
1069da1bb401SStefano Zampini   /* composing function */
1070da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDirichletBoundaries_C","PCBDDCSetDirichletBoundaries_BDDC",
1071da1bb401SStefano Zampini                     PCBDDCSetDirichletBoundaries_BDDC);CHKERRQ(ierr);
1072da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNeumannBoundaries_C","PCBDDCSetNeumannBoundaries_BDDC",
1073da1bb401SStefano Zampini                     PCBDDCSetNeumannBoundaries_BDDC);CHKERRQ(ierr);
1074da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetDirichletBoundaries_C","PCBDDCGetDirichletBoundaries_BDDC",
1075da1bb401SStefano Zampini                     PCBDDCGetDirichletBoundaries_BDDC);CHKERRQ(ierr);
1076da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetNeumannBoundaries_C","PCBDDCGetNeumannBoundaries_BDDC",
1077da1bb401SStefano Zampini                     PCBDDCGetNeumannBoundaries_BDDC);CHKERRQ(ierr);
1078da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseProblemType_C","PCBDDCSetCoarseProblemType_BDDC",
1079da1bb401SStefano Zampini                     PCBDDCSetCoarseProblemType_BDDC);CHKERRQ(ierr);
1080da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDofsSplitting_C","PCBDDCSetDofsSplitting_BDDC",
1081da1bb401SStefano Zampini                     PCBDDCSetDofsSplitting_BDDC);CHKERRQ(ierr);
1082da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetLocalAdjacencyGraph_C","PCBDDCSetLocalAdjacencyGraph_BDDC",
1083da1bb401SStefano Zampini                     PCBDDCSetLocalAdjacencyGraph_BDDC);CHKERRQ(ierr);
1084534831adSStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPreSolve_C","PCPreSolve_BDDC",
1085534831adSStefano Zampini                     PCPreSolve_BDDC);CHKERRQ(ierr);
1086534831adSStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPostSolve_C","PCPostSolve_BDDC",
1087534831adSStefano Zampini                     PCPostSolve_BDDC);CHKERRQ(ierr);
1088*3425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCCreateFETIDPOperators_C","PCBDDCCreateFETIDPOperators_BDDC",
1089*3425bc38SStefano Zampini                     PCBDDCCreateFETIDPOperators_BDDC);CHKERRQ(ierr);
1090*3425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetRHS_C","PCBDDCMatFETIDPGetRHS_BDDC",
1091*3425bc38SStefano Zampini                     PCBDDCMatFETIDPGetRHS_BDDC);CHKERRQ(ierr);
1092*3425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetSolution_C","PCBDDCMatFETIDPGetSolution_BDDC",
1093*3425bc38SStefano Zampini                     PCBDDCMatFETIDPGetSolution_BDDC);CHKERRQ(ierr);
1094da1bb401SStefano Zampini   PetscFunctionReturn(0);
1095da1bb401SStefano Zampini }
1096da1bb401SStefano Zampini EXTERN_C_END
1097*3425bc38SStefano Zampini 
1098da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
1099da1bb401SStefano Zampini /* All static functions from now on                                           */
1100da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
1101*3425bc38SStefano Zampini 
1102*3425bc38SStefano Zampini #undef __FUNCT__
1103*3425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPMatContext"
1104*3425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPMatContext(PC pc, FETIDPMat_ctx **fetidpmat_ctx)
1105*3425bc38SStefano Zampini {
1106*3425bc38SStefano Zampini   FETIDPMat_ctx  *newctx;
1107*3425bc38SStefano Zampini   PetscErrorCode ierr;
1108*3425bc38SStefano Zampini 
1109*3425bc38SStefano Zampini   PetscFunctionBegin;
1110*3425bc38SStefano Zampini   ierr = PetscMalloc(sizeof(*newctx),&newctx);CHKERRQ(ierr);
1111*3425bc38SStefano Zampini   newctx->lambda_local    = 0;
1112*3425bc38SStefano Zampini   newctx->temp_solution_B = 0;
1113*3425bc38SStefano Zampini   newctx->temp_solution_D = 0;
1114*3425bc38SStefano Zampini   newctx->B_delta         = 0;
1115*3425bc38SStefano Zampini   newctx->B_Ddelta        = 0; /* theoretically belongs to the FETIDP preconditioner */
1116*3425bc38SStefano Zampini   newctx->l2g_lambda      = 0;
1117*3425bc38SStefano Zampini   /* increase the reference count for BDDC preconditioner */
1118*3425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)pc);CHKERRQ(ierr);
1119*3425bc38SStefano Zampini   newctx->pc              = pc;
1120*3425bc38SStefano Zampini   *fetidpmat_ctx          = newctx;
1121*3425bc38SStefano Zampini   PetscFunctionReturn(0);
1122*3425bc38SStefano Zampini }
1123*3425bc38SStefano Zampini 
1124*3425bc38SStefano Zampini #undef __FUNCT__
1125*3425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPPCContext"
1126*3425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPPCContext(PC pc, FETIDPPC_ctx **fetidppc_ctx)
1127*3425bc38SStefano Zampini {
1128*3425bc38SStefano Zampini   FETIDPPC_ctx  *newctx;
1129*3425bc38SStefano Zampini   PetscErrorCode ierr;
1130*3425bc38SStefano Zampini 
1131*3425bc38SStefano Zampini   PetscFunctionBegin;
1132*3425bc38SStefano Zampini   ierr = PetscMalloc(sizeof(*newctx),&newctx);CHKERRQ(ierr);
1133*3425bc38SStefano Zampini   newctx->lambda_local    = 0;
1134*3425bc38SStefano Zampini   newctx->B_Ddelta        = 0;
1135*3425bc38SStefano Zampini   newctx->l2g_lambda      = 0;
1136*3425bc38SStefano Zampini   /* increase the reference count for BDDC preconditioner */
1137*3425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)pc);CHKERRQ(ierr);
1138*3425bc38SStefano Zampini   newctx->pc              = pc;
1139*3425bc38SStefano Zampini   *fetidppc_ctx           = newctx;
1140*3425bc38SStefano Zampini   PetscFunctionReturn(0);
1141*3425bc38SStefano Zampini }
1142*3425bc38SStefano Zampini 
1143*3425bc38SStefano Zampini #undef __FUNCT__
1144*3425bc38SStefano Zampini #define __FUNCT__ "PCBDDCDestroyFETIDPMat"
1145*3425bc38SStefano Zampini static PetscErrorCode PCBDDCDestroyFETIDPMat(Mat A)
1146*3425bc38SStefano Zampini {
1147*3425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
1148*3425bc38SStefano Zampini   PetscErrorCode ierr;
1149*3425bc38SStefano Zampini 
1150*3425bc38SStefano Zampini   PetscFunctionBegin;
1151*3425bc38SStefano Zampini   ierr = MatShellGetContext(A,(void**)&mat_ctx);CHKERRQ(ierr);
1152*3425bc38SStefano Zampini   ierr = VecDestroy(&mat_ctx->lambda_local);CHKERRQ(ierr);
1153*3425bc38SStefano Zampini   ierr = VecDestroy(&mat_ctx->temp_solution_D);CHKERRQ(ierr);
1154*3425bc38SStefano Zampini   ierr = VecDestroy(&mat_ctx->temp_solution_B);CHKERRQ(ierr);
1155*3425bc38SStefano Zampini   ierr = MatDestroy(&mat_ctx->B_delta);CHKERRQ(ierr);
1156*3425bc38SStefano Zampini   ierr = MatDestroy(&mat_ctx->B_Ddelta);CHKERRQ(ierr);
1157*3425bc38SStefano Zampini   ierr = VecScatterDestroy(&mat_ctx->l2g_lambda);CHKERRQ(ierr);
1158*3425bc38SStefano Zampini   ierr = PCDestroy(&mat_ctx->pc);CHKERRQ(ierr); /* actually it does not destroy BDDC, only decrease its reference count */
1159*3425bc38SStefano Zampini   ierr = PetscFree(mat_ctx);CHKERRQ(ierr);
1160*3425bc38SStefano Zampini   PetscFunctionReturn(0);
1161*3425bc38SStefano Zampini }
1162*3425bc38SStefano Zampini 
1163*3425bc38SStefano Zampini #undef __FUNCT__
1164*3425bc38SStefano Zampini #define __FUNCT__ "PCBDDCDestroyFETIDPPC"
1165*3425bc38SStefano Zampini static PetscErrorCode PCBDDCDestroyFETIDPPC(PC pc)
1166*3425bc38SStefano Zampini {
1167*3425bc38SStefano Zampini   FETIDPPC_ctx  *pc_ctx;
1168*3425bc38SStefano Zampini   PetscErrorCode ierr;
1169*3425bc38SStefano Zampini 
1170*3425bc38SStefano Zampini   PetscFunctionBegin;
1171*3425bc38SStefano Zampini   ierr = PCShellGetContext(pc,(void**)&pc_ctx);CHKERRQ(ierr);
1172*3425bc38SStefano Zampini   ierr = VecDestroy(&pc_ctx->lambda_local);CHKERRQ(ierr);
1173*3425bc38SStefano Zampini   ierr = MatDestroy(&pc_ctx->B_Ddelta);CHKERRQ(ierr);
1174*3425bc38SStefano Zampini   ierr = VecScatterDestroy(&pc_ctx->l2g_lambda);CHKERRQ(ierr);
1175*3425bc38SStefano Zampini   ierr = PCDestroy(&pc_ctx->pc);CHKERRQ(ierr); /* actually it does not destroy BDDC, only decrease its reference count */
1176*3425bc38SStefano Zampini   ierr = PetscFree(pc_ctx);CHKERRQ(ierr);
1177*3425bc38SStefano Zampini   PetscFunctionReturn(0);
1178*3425bc38SStefano Zampini }
1179*3425bc38SStefano Zampini 
1180*3425bc38SStefano Zampini #undef __FUNCT__
1181*3425bc38SStefano Zampini #define __FUNCT__ "PCBDDCSetupFETIDPMatContext"
1182*3425bc38SStefano Zampini static PetscErrorCode PCBDDCSetupFETIDPMatContext(FETIDPMat_ctx *fetidpmat_ctx )
1183*3425bc38SStefano Zampini {
1184*3425bc38SStefano Zampini   PetscErrorCode ierr;
1185*3425bc38SStefano Zampini   PC_IS          *pcis=(PC_IS*)fetidpmat_ctx->pc->data;
1186*3425bc38SStefano Zampini   PC_BDDC        *pcbddc=(PC_BDDC*)fetidpmat_ctx->pc->data;
1187*3425bc38SStefano Zampini   PCBDDCGraph    mat_graph=pcbddc->mat_graph;
1188*3425bc38SStefano Zampini   Mat_IS         *matis  = (Mat_IS*)fetidpmat_ctx->pc->pmat->data;
1189*3425bc38SStefano Zampini   MPI_Comm       comm = ((PetscObject)(fetidpmat_ctx->pc))->comm;
1190*3425bc38SStefano Zampini 
1191*3425bc38SStefano Zampini   Mat            ScalingMat;
1192*3425bc38SStefano Zampini   Vec            lambda_global;
1193*3425bc38SStefano Zampini   IS             IS_l2g_lambda;
1194*3425bc38SStefano Zampini 
1195*3425bc38SStefano Zampini   PetscBool      skip_node,fully_redundant;
1196*3425bc38SStefano Zampini   PetscInt       i,j,k,s,n_boundary_dofs,sum_dof_sizes,n_global_lambda,n_vertices;
1197*3425bc38SStefano Zampini   PetscInt       n_local_lambda,n_lambda_for_dof,dual_size,n_neg_values,n_pos_values;
1198*3425bc38SStefano Zampini   PetscMPIInt    rank,nprocs,partial_sum;
1199*3425bc38SStefano Zampini   PetscScalar    scalar_value;
1200*3425bc38SStefano Zampini 
1201*3425bc38SStefano Zampini   PetscInt       *vertex_indices,*temp_indices;
1202*3425bc38SStefano Zampini   PetscInt       *dual_dofs_boundary_indices,*aux_local_numbering_1,*aux_global_numbering;
1203*3425bc38SStefano Zampini   PetscInt       *aux_sums,*cols_B_delta,*l2g_indices;
1204*3425bc38SStefano Zampini   PetscMPIInt    *aux_local_numbering_2,*aux_global_numbering_mpi,*dof_sizes,*dof_displs;
1205*3425bc38SStefano Zampini   PetscMPIInt    *all_aux_global_numbering_mpi_1,*all_aux_global_numbering_mpi_2,*global_dofs_numbering;
1206*3425bc38SStefano Zampini   PetscScalar    *array,*scaling_factors,*vals_B_delta;
1207*3425bc38SStefano Zampini 
1208*3425bc38SStefano Zampini   /* For communication of scaling factors */
1209*3425bc38SStefano Zampini   PetscInt       *ptrs_buffer,neigh_position;
1210*3425bc38SStefano Zampini   PetscScalar    **all_factors,*send_buffer,*recv_buffer;
1211*3425bc38SStefano Zampini   MPI_Request    *send_reqs,*recv_reqs;
1212*3425bc38SStefano Zampini 
1213*3425bc38SStefano Zampini   /* tests */
1214*3425bc38SStefano Zampini   Vec            test_vec;
1215*3425bc38SStefano Zampini   PetscBool      test_fetidp;
1216*3425bc38SStefano Zampini   PetscViewer    viewer;
1217*3425bc38SStefano Zampini 
1218*3425bc38SStefano Zampini   PetscFunctionBegin;
1219*3425bc38SStefano Zampini   ierr = MPI_Comm_rank(comm,&rank);CHKERRQ(ierr);
1220*3425bc38SStefano Zampini   ierr = MPI_Comm_size(comm,&nprocs);CHKERRQ(ierr);
1221*3425bc38SStefano Zampini 
1222*3425bc38SStefano Zampini   /* Default type of lagrange multipliers is non-redundant */
1223*3425bc38SStefano Zampini   fully_redundant = PETSC_FALSE;
1224*3425bc38SStefano Zampini   ierr = PetscOptionsGetBool(PETSC_NULL,"-fetidp_fullyredundant",&fully_redundant,PETSC_NULL);CHKERRQ(ierr);
1225*3425bc38SStefano Zampini 
1226*3425bc38SStefano Zampini   /* Evaluate local and global number of lagrange multipliers */
1227*3425bc38SStefano Zampini   ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
1228*3425bc38SStefano Zampini   n_local_lambda = 0;
1229*3425bc38SStefano Zampini   partial_sum = 0;
1230*3425bc38SStefano Zampini   n_boundary_dofs = 0;
1231*3425bc38SStefano Zampini   s = 0;
1232*3425bc38SStefano Zampini   n_vertices = 0;
1233*3425bc38SStefano Zampini   /* Get Vertices used to define the BDDC */
1234*3425bc38SStefano Zampini   ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(*vertex_indices),&vertex_indices);CHKERRQ(ierr);
1235*3425bc38SStefano Zampini   for(i=0;i<pcbddc->local_primal_size;i++) {
1236*3425bc38SStefano Zampini     ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&j,(const PetscInt**)&temp_indices,PETSC_NULL);CHKERRQ(ierr);
1237*3425bc38SStefano Zampini     if(j == 1) {
1238*3425bc38SStefano Zampini       vertex_indices[n_vertices]=temp_indices[0];
1239*3425bc38SStefano Zampini       n_vertices++;
1240*3425bc38SStefano Zampini     }
1241*3425bc38SStefano Zampini     ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&j,(const PetscInt**)&temp_indices,PETSC_NULL);CHKERRQ(ierr);
1242*3425bc38SStefano Zampini   }
1243*3425bc38SStefano Zampini   dual_size = pcis->n_B-n_vertices;
1244*3425bc38SStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*dual_dofs_boundary_indices),&dual_dofs_boundary_indices);CHKERRQ(ierr);
1245*3425bc38SStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*aux_local_numbering_1),&aux_local_numbering_1);CHKERRQ(ierr);
1246*3425bc38SStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*aux_local_numbering_2),&aux_local_numbering_2);CHKERRQ(ierr);
1247*3425bc38SStefano Zampini 
1248*3425bc38SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1249*3425bc38SStefano Zampini   for(i=0;i<pcis->n;i++){
1250*3425bc38SStefano Zampini     j = mat_graph->count[i]; /* RECALL: mat_graph->count[i] does not count myself */
1251*3425bc38SStefano Zampini     k = (mat_graph->neighbours_set[i][0] == -1 ?  1 : 0);
1252*3425bc38SStefano Zampini     j = j - k ;
1253*3425bc38SStefano Zampini     if( j > 0 ) { n_boundary_dofs++; }
1254*3425bc38SStefano Zampini 
1255*3425bc38SStefano Zampini     skip_node = PETSC_FALSE;
1256*3425bc38SStefano Zampini     if(vertex_indices[s]==i) { /* it works for a sorted set of vertices */
1257*3425bc38SStefano Zampini       skip_node = PETSC_TRUE;
1258*3425bc38SStefano Zampini       s++;
1259*3425bc38SStefano Zampini     }
1260*3425bc38SStefano Zampini     if(j < 1) {skip_node = PETSC_TRUE;}
1261*3425bc38SStefano Zampini     if( !skip_node ) {
1262*3425bc38SStefano Zampini       if(fully_redundant) {
1263*3425bc38SStefano Zampini         /* fully redundant set of lagrange multipliers */
1264*3425bc38SStefano Zampini         n_lambda_for_dof = (j*(j+1))/2;
1265*3425bc38SStefano Zampini       } else {
1266*3425bc38SStefano Zampini         n_lambda_for_dof = j;
1267*3425bc38SStefano Zampini       }
1268*3425bc38SStefano Zampini       n_local_lambda += j;
1269*3425bc38SStefano Zampini       /* needed to evaluate global number of lagrange multipliers */
1270*3425bc38SStefano Zampini       array[i]=(1.0*n_lambda_for_dof)/(j+1.0); /* already scaled for the next global sum */
1271*3425bc38SStefano Zampini       /* store some data needed */
1272*3425bc38SStefano Zampini       dual_dofs_boundary_indices[partial_sum] = n_boundary_dofs-1;
1273*3425bc38SStefano Zampini       aux_local_numbering_1[partial_sum] = i;
1274*3425bc38SStefano Zampini       aux_local_numbering_2[partial_sum] = (PetscMPIInt)n_lambda_for_dof;
1275*3425bc38SStefano Zampini       partial_sum++;
1276*3425bc38SStefano Zampini     }
1277*3425bc38SStefano Zampini   }
1278*3425bc38SStefano Zampini   /*printf("I found %d local lambda dofs\n",n_local_lambda);
1279*3425bc38SStefano Zampini   printf("I found %d boundary dofs (should be %d)\n",n_boundary_dofs,pcis->n_B);
1280*3425bc38SStefano Zampini   printf("Partial sum %d should be %d\n",partial_sum,dual_size);*/
1281*3425bc38SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1282*3425bc38SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
1283*3425bc38SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
1284*3425bc38SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
1285*3425bc38SStefano Zampini   ierr = VecSum(pcis->vec1_global,&scalar_value);CHKERRQ(ierr);
1286*3425bc38SStefano Zampini   fetidpmat_ctx->n_lambda = (PetscInt) scalar_value;
1287*3425bc38SStefano Zampini   /* printf("I found %d global multipliers (%f)\n",fetidpmat_ctx->n_lambda,scalar_value); */
1288*3425bc38SStefano Zampini   ierr = VecCreate(PETSC_COMM_SELF,&fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
1289*3425bc38SStefano Zampini   ierr = VecSetSizes(fetidpmat_ctx->lambda_local,n_local_lambda,n_local_lambda);CHKERRQ(ierr);
1290*3425bc38SStefano Zampini   ierr = VecSetType(fetidpmat_ctx->lambda_local,VECSEQ);CHKERRQ(ierr);
1291*3425bc38SStefano Zampini   ierr = VecCreate(comm,&lambda_global);CHKERRQ(ierr);
1292*3425bc38SStefano Zampini   ierr = VecSetSizes(lambda_global,PETSC_DECIDE,fetidpmat_ctx->n_lambda);CHKERRQ(ierr);
1293*3425bc38SStefano Zampini   ierr = VecSetType(lambda_global,VECMPI);CHKERRQ(ierr);
1294*3425bc38SStefano Zampini 
1295*3425bc38SStefano Zampini   /* compute global ordering of lagrange multipliers and associate l2g map */
1296*3425bc38SStefano Zampini 
1297*3425bc38SStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*aux_global_numbering),&aux_global_numbering);CHKERRQ(ierr);
1298*3425bc38SStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*aux_global_numbering_mpi),&aux_global_numbering_mpi);CHKERRQ(ierr);
1299*3425bc38SStefano Zampini   j = (rank == 0 ? nprocs : 0);
1300*3425bc38SStefano Zampini   ierr = PetscMalloc(j*sizeof(*dof_sizes),&dof_sizes);CHKERRQ(ierr);
1301*3425bc38SStefano Zampini   ierr = PetscMalloc(j*sizeof(*dof_displs),&dof_displs);CHKERRQ(ierr);
1302*3425bc38SStefano Zampini   ierr = ISLocalToGlobalMappingApply(matis->mapping,dual_size,aux_local_numbering_1,aux_global_numbering);CHKERRQ(ierr);
1303*3425bc38SStefano Zampini   ierr = MPI_Gather(&dual_size,1,MPIU_INT,dof_sizes,1,MPIU_INT,0,comm);CHKERRQ(ierr);
1304*3425bc38SStefano Zampini   sum_dof_sizes=0;
1305*3425bc38SStefano Zampini   if ( rank == 0 ) {
1306*3425bc38SStefano Zampini     dof_displs[0]=0;
1307*3425bc38SStefano Zampini     sum_dof_sizes=dual_size;
1308*3425bc38SStefano Zampini     for(i=1;i<nprocs;i++) {
1309*3425bc38SStefano Zampini       dof_displs[i] = dof_displs[i-1]+dof_sizes[i-1];
1310*3425bc38SStefano Zampini       sum_dof_sizes += dof_sizes[i];
1311*3425bc38SStefano Zampini     }
1312*3425bc38SStefano Zampini   }
1313*3425bc38SStefano Zampini   for(i=0;i<dual_size;i++) {
1314*3425bc38SStefano Zampini     aux_global_numbering_mpi[i]=(PetscMPIInt)aux_global_numbering[i];
1315*3425bc38SStefano Zampini   }
1316*3425bc38SStefano Zampini   ierr = PetscMalloc(sum_dof_sizes*sizeof(*all_aux_global_numbering_mpi_1),&all_aux_global_numbering_mpi_1);CHKERRQ(ierr);
1317*3425bc38SStefano Zampini   ierr = PetscMalloc(sum_dof_sizes*sizeof(*all_aux_global_numbering_mpi_2),&all_aux_global_numbering_mpi_2);CHKERRQ(ierr);
1318*3425bc38SStefano Zampini   ierr = MPI_Gatherv(aux_global_numbering_mpi,dual_size,MPIU_INT,all_aux_global_numbering_mpi_1,dof_sizes,dof_displs,MPIU_INT,0,comm);CHKERRQ(ierr);
1319*3425bc38SStefano Zampini   ierr = MPI_Gatherv(aux_local_numbering_2,dual_size,MPIU_INT,all_aux_global_numbering_mpi_2,dof_sizes,dof_displs,MPIU_INT,0,comm);CHKERRQ(ierr);
1320*3425bc38SStefano Zampini 
1321*3425bc38SStefano Zampini   ierr = PetscMalloc(fetidpmat_ctx->n_lambda*sizeof(*global_dofs_numbering),&global_dofs_numbering);CHKERRQ(ierr);
1322*3425bc38SStefano Zampini   if( rank == 0 ) {
1323*3425bc38SStefano Zampini     ierr = PetscSortMPIIntWithArray(sum_dof_sizes,all_aux_global_numbering_mpi_1,all_aux_global_numbering_mpi_2);CHKERRQ(ierr);
1324*3425bc38SStefano Zampini     j=-1;
1325*3425bc38SStefano Zampini     partial_sum = 0;
1326*3425bc38SStefano Zampini     for(i=0;i<sum_dof_sizes;i++) {
1327*3425bc38SStefano Zampini       if(j != all_aux_global_numbering_mpi_1[i] ) {
1328*3425bc38SStefano Zampini         j=all_aux_global_numbering_mpi_1[i];
1329*3425bc38SStefano Zampini         for(k=0;k<all_aux_global_numbering_mpi_2[i];k++) {
1330*3425bc38SStefano Zampini           global_dofs_numbering[partial_sum+k]=all_aux_global_numbering_mpi_1[i];
1331*3425bc38SStefano Zampini         }
1332*3425bc38SStefano Zampini         partial_sum += all_aux_global_numbering_mpi_2[i];
1333*3425bc38SStefano Zampini       }
1334*3425bc38SStefano Zampini     }
1335*3425bc38SStefano Zampini     /* printf("Partial sum for global dofs %d should be %d\n",partial_sum,fetidpmat_ctx->n_lambda); */
1336*3425bc38SStefano Zampini   }
1337*3425bc38SStefano Zampini   ierr = MPI_Bcast(global_dofs_numbering,fetidpmat_ctx->n_lambda,MPIU_INT,0,comm);CHKERRQ(ierr);
1338*3425bc38SStefano Zampini 
1339*3425bc38SStefano Zampini   /* init data for scaling factors exchange */
1340*3425bc38SStefano Zampini   partial_sum = 0;
1341*3425bc38SStefano Zampini   j = 0;
1342*3425bc38SStefano Zampini   ierr = PetscMalloc( pcis->n_neigh*sizeof(PetscInt),&ptrs_buffer);CHKERRQ(ierr);
1343*3425bc38SStefano Zampini   ierr = PetscMalloc( (pcis->n_neigh-1)*sizeof(MPI_Request),&send_reqs);CHKERRQ(ierr);
1344*3425bc38SStefano Zampini   ierr = PetscMalloc( (pcis->n_neigh-1)*sizeof(MPI_Request),&recv_reqs);CHKERRQ(ierr);
1345*3425bc38SStefano Zampini   ierr = PetscMalloc( pcis->n*sizeof(PetscScalar*),&all_factors);CHKERRQ(ierr);
1346*3425bc38SStefano Zampini   ptrs_buffer[0]=0;
1347*3425bc38SStefano Zampini   for(i=1;i<pcis->n_neigh;i++) {
1348*3425bc38SStefano Zampini     partial_sum += pcis->n_shared[i];
1349*3425bc38SStefano Zampini     ptrs_buffer[i] = ptrs_buffer[i-1]+pcis->n_shared[i];
1350*3425bc38SStefano Zampini   }
1351*3425bc38SStefano Zampini   ierr = PetscMalloc( partial_sum*sizeof(PetscScalar),&send_buffer);CHKERRQ(ierr);
1352*3425bc38SStefano Zampini   ierr = PetscMalloc( partial_sum*sizeof(PetscScalar),&recv_buffer);CHKERRQ(ierr);
1353*3425bc38SStefano Zampini   ierr = PetscMalloc( partial_sum*sizeof(PetscScalar),&all_factors[0]);CHKERRQ(ierr);
1354*3425bc38SStefano Zampini   for(i=0;i<pcis->n-1;i++) {
1355*3425bc38SStefano Zampini     j = mat_graph->count[i];
1356*3425bc38SStefano Zampini     if(j>0) {
1357*3425bc38SStefano Zampini       k = (mat_graph->neighbours_set[i][0] == -1 ?  1 : 0);
1358*3425bc38SStefano Zampini       j = j - k;
1359*3425bc38SStefano Zampini     }
1360*3425bc38SStefano Zampini     all_factors[i+1]=all_factors[i]+j;
1361*3425bc38SStefano Zampini   }
1362*3425bc38SStefano Zampini   /* scatter B scaling to N vec */
1363*3425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->N_to_B,pcis->D,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
1364*3425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->N_to_B,pcis->D,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
1365*3425bc38SStefano Zampini   /* communications */
1366*3425bc38SStefano Zampini   k = 0;
1367*3425bc38SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1368*3425bc38SStefano Zampini   for(i=1;i<pcis->n_neigh;i++) {
1369*3425bc38SStefano Zampini     for(j=0;j<pcis->n_shared[i];j++) {
1370*3425bc38SStefano Zampini       send_buffer[ptrs_buffer[i-1]+j]=array[pcis->shared[i][j]];
1371*3425bc38SStefano Zampini     }
1372*3425bc38SStefano Zampini     j = ptrs_buffer[i]-ptrs_buffer[i-1];
1373*3425bc38SStefano Zampini     ierr = MPI_Isend(&send_buffer[ptrs_buffer[i-1]],j,MPIU_SCALAR,pcis->neigh[i],0,comm,&send_reqs[k]);CHKERRQ(ierr);
1374*3425bc38SStefano Zampini     ierr = MPI_Irecv(&recv_buffer[ptrs_buffer[i-1]],j,MPIU_SCALAR,pcis->neigh[i],0,comm,&recv_reqs[k]);CHKERRQ(ierr);
1375*3425bc38SStefano Zampini     k++;
1376*3425bc38SStefano Zampini   }
1377*3425bc38SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1378*3425bc38SStefano Zampini   ierr = MPI_Waitall(k,recv_reqs,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
1379*3425bc38SStefano Zampini   ierr = MPI_Waitall(k,send_reqs,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
1380*3425bc38SStefano Zampini   /* put values in correct places */
1381*3425bc38SStefano Zampini   for(i=1;i<pcis->n_neigh;i++) {
1382*3425bc38SStefano Zampini     for(j=0;j<pcis->n_shared[i];j++) {
1383*3425bc38SStefano Zampini       k = pcis->shared[i][j];
1384*3425bc38SStefano Zampini       neigh_position = 0;
1385*3425bc38SStefano Zampini       while(mat_graph->neighbours_set[k][neigh_position] != pcis->neigh[i]) {neigh_position++;}
1386*3425bc38SStefano Zampini       s = (mat_graph->neighbours_set[k][0] == -1 ?  1 : 0);
1387*3425bc38SStefano Zampini       neigh_position = neigh_position - s;
1388*3425bc38SStefano Zampini       all_factors[k][neigh_position]=recv_buffer[ptrs_buffer[i-1]+j];
1389*3425bc38SStefano Zampini     }
1390*3425bc38SStefano Zampini   }
1391*3425bc38SStefano Zampini   ierr = PetscFree(send_reqs);CHKERRQ(ierr);
1392*3425bc38SStefano Zampini   ierr = PetscFree(recv_reqs);CHKERRQ(ierr);
1393*3425bc38SStefano Zampini   ierr = PetscFree(send_buffer);CHKERRQ(ierr);
1394*3425bc38SStefano Zampini   ierr = PetscFree(recv_buffer);CHKERRQ(ierr);
1395*3425bc38SStefano Zampini   ierr = PetscFree(ptrs_buffer);CHKERRQ(ierr);
1396*3425bc38SStefano Zampini 
1397*3425bc38SStefano Zampini   /* Compute B and B_delta (local actions) */
1398*3425bc38SStefano Zampini   ierr = PetscMalloc(pcis->n_neigh*sizeof(*aux_sums),&aux_sums);CHKERRQ(ierr);
1399*3425bc38SStefano Zampini   ierr = PetscMalloc(n_local_lambda*sizeof(*l2g_indices),&l2g_indices);CHKERRQ(ierr);
1400*3425bc38SStefano Zampini   ierr = PetscMalloc(n_local_lambda*sizeof(*vals_B_delta),&vals_B_delta);CHKERRQ(ierr);
1401*3425bc38SStefano Zampini   ierr = PetscMalloc(n_local_lambda*sizeof(*cols_B_delta),&cols_B_delta);CHKERRQ(ierr);
1402*3425bc38SStefano Zampini   ierr = PetscMalloc(n_local_lambda*sizeof(*scaling_factors),&scaling_factors);CHKERRQ(ierr);
1403*3425bc38SStefano Zampini   n_global_lambda=0;
1404*3425bc38SStefano Zampini   partial_sum=0;
1405*3425bc38SStefano Zampini   for(i=0;i<dual_size;i++) {
1406*3425bc38SStefano Zampini     while( global_dofs_numbering[n_global_lambda] != aux_global_numbering_mpi[i] ) { n_global_lambda++; }
1407*3425bc38SStefano Zampini     j = mat_graph->count[aux_local_numbering_1[i]];
1408*3425bc38SStefano Zampini     k = (mat_graph->neighbours_set[aux_local_numbering_1[i]][0] == -1 ?  1 : 0);
1409*3425bc38SStefano Zampini     j = j - k;
1410*3425bc38SStefano Zampini     aux_sums[0]=0;
1411*3425bc38SStefano Zampini     for(s=1;s<j;s++) {
1412*3425bc38SStefano Zampini       aux_sums[s]=aux_sums[s-1]+j-s+1;
1413*3425bc38SStefano Zampini     }
1414*3425bc38SStefano Zampini     array = all_factors[aux_local_numbering_1[i]];
1415*3425bc38SStefano Zampini     n_neg_values = 0;
1416*3425bc38SStefano Zampini     while(n_neg_values < j && mat_graph->neighbours_set[aux_local_numbering_1[i]][n_neg_values+k] < rank) {n_neg_values++;}
1417*3425bc38SStefano Zampini     n_pos_values = j - n_neg_values;
1418*3425bc38SStefano Zampini     if(fully_redundant) {
1419*3425bc38SStefano Zampini       for(s=0;s<n_neg_values;s++) {
1420*3425bc38SStefano Zampini         l2g_indices    [partial_sum+s]=aux_sums[s]+n_neg_values-s-1+n_global_lambda;
1421*3425bc38SStefano Zampini         cols_B_delta   [partial_sum+s]=dual_dofs_boundary_indices[i];
1422*3425bc38SStefano Zampini         vals_B_delta   [partial_sum+s]=-1.0;
1423*3425bc38SStefano Zampini         scaling_factors[partial_sum+s]=array[s];
1424*3425bc38SStefano Zampini       }
1425*3425bc38SStefano Zampini       for(s=0;s<n_pos_values;s++) {
1426*3425bc38SStefano Zampini         l2g_indices    [partial_sum+s+n_neg_values]=aux_sums[n_neg_values]+s+n_global_lambda;
1427*3425bc38SStefano Zampini         cols_B_delta   [partial_sum+s+n_neg_values]=dual_dofs_boundary_indices[i];
1428*3425bc38SStefano Zampini         vals_B_delta   [partial_sum+s+n_neg_values]=1.0;
1429*3425bc38SStefano Zampini         scaling_factors[partial_sum+s+n_neg_values]=array[s+n_neg_values];
1430*3425bc38SStefano Zampini       }
1431*3425bc38SStefano Zampini       partial_sum += j;
1432*3425bc38SStefano Zampini     } else {
1433*3425bc38SStefano Zampini       /* l2g_indices and default cols and vals of B_delta */
1434*3425bc38SStefano Zampini       for(s=0;s<j;s++) {
1435*3425bc38SStefano Zampini         l2g_indices    [partial_sum+s]=n_global_lambda+s;
1436*3425bc38SStefano Zampini         cols_B_delta   [partial_sum+s]=dual_dofs_boundary_indices[i];
1437*3425bc38SStefano Zampini         vals_B_delta   [partial_sum+s]=0.0;
1438*3425bc38SStefano Zampini       }
1439*3425bc38SStefano Zampini       /* B_delta */
1440*3425bc38SStefano Zampini       if( n_neg_values > 0 ) { /* there's a rank next to me to the left */
1441*3425bc38SStefano Zampini         vals_B_delta   [partial_sum+n_neg_values-1]=-1.0;
1442*3425bc38SStefano Zampini       }
1443*3425bc38SStefano Zampini       if ( n_neg_values < j ) { /* there's a rank next to me to the right */
1444*3425bc38SStefano Zampini         vals_B_delta   [partial_sum+n_neg_values]=1.0;
1445*3425bc38SStefano Zampini       }
1446*3425bc38SStefano Zampini       /* scaling as in Klawonn-Widlund 1999*/
1447*3425bc38SStefano Zampini       for(s=0;s<n_neg_values;s++) {
1448*3425bc38SStefano Zampini         scalar_value = 0.0;
1449*3425bc38SStefano Zampini         for(k=0;k<s+1;k++) {
1450*3425bc38SStefano Zampini           scalar_value += array[k];
1451*3425bc38SStefano Zampini         }
1452*3425bc38SStefano Zampini         scalar_value = -scalar_value;
1453*3425bc38SStefano Zampini         scaling_factors[partial_sum+s] = scalar_value;
1454*3425bc38SStefano Zampini       }
1455*3425bc38SStefano Zampini       for(s=0;s<n_pos_values;s++) {
1456*3425bc38SStefano Zampini         scalar_value = 0.0;
1457*3425bc38SStefano Zampini         for(k=s+n_neg_values;k<j;k++) {
1458*3425bc38SStefano Zampini           scalar_value += array[k];
1459*3425bc38SStefano Zampini         }
1460*3425bc38SStefano Zampini         scaling_factors[partial_sum+s+n_neg_values] = scalar_value;
1461*3425bc38SStefano Zampini       }
1462*3425bc38SStefano Zampini       partial_sum += j;
1463*3425bc38SStefano Zampini     }
1464*3425bc38SStefano Zampini   }
1465*3425bc38SStefano Zampini   ierr = PetscFree(all_factors[0]);CHKERRQ(ierr);
1466*3425bc38SStefano Zampini   ierr = PetscFree(all_factors);CHKERRQ(ierr);
1467*3425bc38SStefano Zampini   /* printf("I found %d local lambda dofs when numbering them (should be %d)\n",partial_sum,n_local_lambda); */
1468*3425bc38SStefano Zampini   ierr = ISCreateGeneral(comm,n_local_lambda,l2g_indices,PETSC_OWN_POINTER,&IS_l2g_lambda);CHKERRQ(ierr);
1469*3425bc38SStefano Zampini   ierr = VecScatterCreate(fetidpmat_ctx->lambda_local,(IS)0,lambda_global,IS_l2g_lambda,&fetidpmat_ctx->l2g_lambda);CHKERRQ(ierr);
1470*3425bc38SStefano Zampini 
1471*3425bc38SStefano Zampini   /* Create local part of B_delta */
1472*3425bc38SStefano Zampini   ierr = MatCreate(PETSC_COMM_SELF,&fetidpmat_ctx->B_delta);
1473*3425bc38SStefano Zampini   ierr = MatSetSizes(fetidpmat_ctx->B_delta,n_local_lambda,pcis->n_B,n_local_lambda,pcis->n_B);CHKERRQ(ierr);
1474*3425bc38SStefano Zampini   ierr = MatSetType(fetidpmat_ctx->B_delta,MATSEQAIJ);CHKERRQ(ierr);
1475*3425bc38SStefano Zampini   ierr = MatSeqAIJSetPreallocation(fetidpmat_ctx->B_delta,1,PETSC_NULL);CHKERRQ(ierr);
1476*3425bc38SStefano Zampini   ierr = MatSetOption(fetidpmat_ctx->B_delta,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr);
1477*3425bc38SStefano Zampini   for(i=0;i<n_local_lambda;i++) {
1478*3425bc38SStefano Zampini     ierr = MatSetValue(fetidpmat_ctx->B_delta,i,cols_B_delta[i],vals_B_delta[i],INSERT_VALUES);CHKERRQ(ierr);
1479*3425bc38SStefano Zampini   }
1480*3425bc38SStefano Zampini   ierr = MatAssemblyBegin(fetidpmat_ctx->B_delta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1481*3425bc38SStefano Zampini   ierr = MatAssemblyEnd  (fetidpmat_ctx->B_delta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1482*3425bc38SStefano Zampini 
1483*3425bc38SStefano Zampini   if(fully_redundant) {
1484*3425bc38SStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&ScalingMat);
1485*3425bc38SStefano Zampini     ierr = MatSetSizes(ScalingMat,n_local_lambda,n_local_lambda,n_local_lambda,n_local_lambda);CHKERRQ(ierr);
1486*3425bc38SStefano Zampini     ierr = MatSetType(ScalingMat,MATSEQAIJ);CHKERRQ(ierr);
1487*3425bc38SStefano Zampini     ierr = MatSeqAIJSetPreallocation(ScalingMat,1,PETSC_NULL);CHKERRQ(ierr);
1488*3425bc38SStefano Zampini     for(i=0;i<n_local_lambda;i++) {
1489*3425bc38SStefano Zampini       ierr = MatSetValue(ScalingMat,i,i,scaling_factors[i],INSERT_VALUES);CHKERRQ(ierr);
1490*3425bc38SStefano Zampini     }
1491*3425bc38SStefano Zampini     ierr = MatAssemblyBegin(ScalingMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1492*3425bc38SStefano Zampini     ierr = MatAssemblyEnd  (ScalingMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1493*3425bc38SStefano Zampini     ierr = MatMatMult(ScalingMat,fetidpmat_ctx->B_delta,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&fetidpmat_ctx->B_Ddelta);CHKERRQ(ierr);
1494*3425bc38SStefano Zampini     ierr = MatDestroy(&ScalingMat);CHKERRQ(ierr);
1495*3425bc38SStefano Zampini   } else {
1496*3425bc38SStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&fetidpmat_ctx->B_Ddelta);
1497*3425bc38SStefano Zampini     ierr = MatSetSizes(fetidpmat_ctx->B_Ddelta,n_local_lambda,pcis->n_B,n_local_lambda,pcis->n_B);CHKERRQ(ierr);
1498*3425bc38SStefano Zampini     ierr = MatSetType(fetidpmat_ctx->B_Ddelta,MATSEQAIJ);CHKERRQ(ierr);
1499*3425bc38SStefano Zampini     ierr = MatSeqAIJSetPreallocation(fetidpmat_ctx->B_Ddelta,1,PETSC_NULL);CHKERRQ(ierr);
1500*3425bc38SStefano Zampini     for(i=0;i<n_local_lambda;i++) {
1501*3425bc38SStefano Zampini       ierr = MatSetValue(fetidpmat_ctx->B_Ddelta,i,cols_B_delta[i],scaling_factors[i],INSERT_VALUES);CHKERRQ(ierr);
1502*3425bc38SStefano Zampini     }
1503*3425bc38SStefano Zampini     ierr = MatAssemblyBegin(fetidpmat_ctx->B_Ddelta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1504*3425bc38SStefano Zampini     ierr = MatAssemblyEnd  (fetidpmat_ctx->B_Ddelta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1505*3425bc38SStefano Zampini   }
1506*3425bc38SStefano Zampini 
1507*3425bc38SStefano Zampini   /* Create some vectors needed by fetidp */
1508*3425bc38SStefano Zampini   ierr = VecDuplicate(pcis->vec1_B,&fetidpmat_ctx->temp_solution_B);CHKERRQ(ierr);
1509*3425bc38SStefano Zampini   ierr = VecDuplicate(pcis->vec1_D,&fetidpmat_ctx->temp_solution_D);CHKERRQ(ierr);
1510*3425bc38SStefano Zampini 
1511*3425bc38SStefano Zampini   test_fetidp = PETSC_FALSE;
1512*3425bc38SStefano Zampini   ierr = PetscOptionsGetBool(PETSC_NULL,"-fetidp_check",&test_fetidp,PETSC_NULL);CHKERRQ(ierr);
1513*3425bc38SStefano Zampini 
1514*3425bc38SStefano Zampini   if(test_fetidp) {
1515*3425bc38SStefano Zampini 
1516*3425bc38SStefano Zampini     ierr = PetscViewerASCIIGetStdout(((PetscObject)(fetidpmat_ctx->pc))->comm,&viewer);CHKERRQ(ierr);
1517*3425bc38SStefano Zampini     ierr = PetscViewerASCIISynchronizedAllow(viewer,PETSC_TRUE);CHKERRQ(ierr);
1518*3425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"----------FETI_DP TESTS--------------\n");CHKERRQ(ierr);
1519*3425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"All tests should return zero!\n");CHKERRQ(ierr);
1520*3425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"FETIDP MAT context in the ");CHKERRQ(ierr);
1521*3425bc38SStefano Zampini     if(fully_redundant) {
1522*3425bc38SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"fully redundant case for lagrange multipliers.\n");CHKERRQ(ierr);
1523*3425bc38SStefano Zampini     } else {
1524*3425bc38SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Non-fully redundant case for lagrange multiplier.\n");CHKERRQ(ierr);
1525*3425bc38SStefano Zampini     }
1526*3425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
1527*3425bc38SStefano Zampini 
1528*3425bc38SStefano Zampini     /******************************************************************/
1529*3425bc38SStefano Zampini     /* TEST A/B: Test numbering of global lambda dofs             */
1530*3425bc38SStefano Zampini     /******************************************************************/
1531*3425bc38SStefano Zampini 
1532*3425bc38SStefano Zampini     ierr = VecDuplicate(fetidpmat_ctx->lambda_local,&test_vec);CHKERRQ(ierr);
1533*3425bc38SStefano Zampini     ierr = VecSet(lambda_global,1.0);CHKERRQ(ierr);
1534*3425bc38SStefano Zampini     ierr = VecSet(test_vec,1.0);CHKERRQ(ierr);
1535*3425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
1536*3425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
1537*3425bc38SStefano Zampini     scalar_value = -1.0;
1538*3425bc38SStefano Zampini     ierr = VecAXPY(test_vec,scalar_value,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
1539*3425bc38SStefano Zampini     ierr = VecNorm(test_vec,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
1540*3425bc38SStefano Zampini     ierr = VecDestroy(&test_vec);CHKERRQ(ierr);
1541*3425bc38SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"A[%04d]: CHECK glob to loc: % 1.14e\n",rank,scalar_value);CHKERRQ(ierr);
1542*3425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
1543*3425bc38SStefano Zampini     if(fully_redundant) {
1544*3425bc38SStefano Zampini       ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr);
1545*3425bc38SStefano Zampini       ierr = VecSet(fetidpmat_ctx->lambda_local,0.5);CHKERRQ(ierr);
1546*3425bc38SStefano Zampini       ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1547*3425bc38SStefano Zampini       ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1548*3425bc38SStefano Zampini       ierr = VecSum(lambda_global,&scalar_value);CHKERRQ(ierr);
1549*3425bc38SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"B[%04d]: CHECK loc to glob: % 1.14e\n",rank,scalar_value-fetidpmat_ctx->n_lambda);CHKERRQ(ierr);
1550*3425bc38SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
1551*3425bc38SStefano Zampini     }
1552*3425bc38SStefano Zampini 
1553*3425bc38SStefano Zampini     /******************************************************************/
1554*3425bc38SStefano Zampini     /* TEST C: It should holds B_delta*w=0, w\in\widehat{W}           */
1555*3425bc38SStefano Zampini     /* This is the meaning of the B matrix                            */
1556*3425bc38SStefano Zampini     /******************************************************************/
1557*3425bc38SStefano Zampini 
1558*3425bc38SStefano Zampini     ierr = VecSetRandom(pcis->vec1_N,PETSC_NULL);CHKERRQ(ierr);
1559*3425bc38SStefano Zampini     ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
1560*3425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
1561*3425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
1562*3425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1563*3425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1564*3425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1565*3425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1566*3425bc38SStefano Zampini     /* Action of B_delta */
1567*3425bc38SStefano Zampini     ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
1568*3425bc38SStefano Zampini     ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr);
1569*3425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1570*3425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1571*3425bc38SStefano Zampini     ierr = VecNorm(lambda_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
1572*3425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"C[coll]: CHECK infty norm of B_delta*w (w continuous): % 1.14e\n",scalar_value);CHKERRQ(ierr);
1573*3425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
1574*3425bc38SStefano Zampini 
1575*3425bc38SStefano Zampini     /******************************************************************/
1576*3425bc38SStefano Zampini     /* TEST D: It should holds E_Dw = w - P_Dw w\in\widetilde{W}     */
1577*3425bc38SStefano Zampini     /* E_D = R_D^TR                                                   */
1578*3425bc38SStefano Zampini     /* P_D = B_{D,delta}^T B_{delta}                                  */
1579*3425bc38SStefano Zampini     /* eq.44 Mandel Tezaur and Dohrmann 2005                          */
1580*3425bc38SStefano Zampini     /******************************************************************/
1581*3425bc38SStefano Zampini 
1582*3425bc38SStefano Zampini     /* compute a random vector in \widetilde{W} */
1583*3425bc38SStefano Zampini     ierr = VecSetRandom(pcis->vec1_N,PETSC_NULL);CHKERRQ(ierr);
1584*3425bc38SStefano Zampini     scalar_value = 0.0;  /* set zero at vertices */
1585*3425bc38SStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1586*3425bc38SStefano Zampini     for(i=0;i<n_vertices;i++) { array[vertex_indices[i]]=scalar_value; }
1587*3425bc38SStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1588*3425bc38SStefano Zampini     /* store w for final comparison */
1589*3425bc38SStefano Zampini     ierr = VecDuplicate(pcis->vec1_B,&test_vec);CHKERRQ(ierr);
1590*3425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,test_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1591*3425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,test_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1592*3425bc38SStefano Zampini 
1593*3425bc38SStefano Zampini     /* Jump operator P_D : results stored in pcis->vec1_B */
1594*3425bc38SStefano Zampini 
1595*3425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1596*3425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1597*3425bc38SStefano Zampini     /* Action of B_delta */
1598*3425bc38SStefano Zampini     ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
1599*3425bc38SStefano Zampini     ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr);
1600*3425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1601*3425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1602*3425bc38SStefano Zampini     /* Action of B_Ddelta^T */
1603*3425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
1604*3425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
1605*3425bc38SStefano Zampini     ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
1606*3425bc38SStefano Zampini 
1607*3425bc38SStefano Zampini     /* Average operator E_D : results stored in pcis->vec2_B */
1608*3425bc38SStefano Zampini 
1609*3425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1610*3425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1611*3425bc38SStefano Zampini     ierr = VecPointwiseMult(pcis->vec2_B,pcis->D,pcis->vec2_B);CHKERRQ(ierr);
1612*3425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec2_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
1613*3425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec2_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
1614*3425bc38SStefano Zampini     ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
1615*3425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
1616*3425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
1617*3425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1618*3425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1619*3425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1620*3425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1621*3425bc38SStefano Zampini 
1622*3425bc38SStefano Zampini     /* test E_D=I-P_D */
1623*3425bc38SStefano Zampini     scalar_value = 1.0;
1624*3425bc38SStefano Zampini     ierr = VecAXPY(pcis->vec1_B,scalar_value,pcis->vec2_B);CHKERRQ(ierr);
1625*3425bc38SStefano Zampini     scalar_value = -1.0;
1626*3425bc38SStefano Zampini     ierr = VecAXPY(pcis->vec1_B,scalar_value,test_vec);CHKERRQ(ierr);
1627*3425bc38SStefano Zampini     ierr = VecNorm(pcis->vec1_B,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
1628*3425bc38SStefano Zampini     ierr = VecDestroy(&test_vec);CHKERRQ(ierr);
1629*3425bc38SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"D[%04d] CHECK infty norm of E_D + P_D - I: % 1.14e\n",rank,scalar_value);CHKERRQ(ierr);
1630*3425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
1631*3425bc38SStefano Zampini 
1632*3425bc38SStefano Zampini     /******************************************************************/
1633*3425bc38SStefano Zampini     /* TEST E: It should holds R_D^TP_Dw=0 w\in\widetilde{W}          */
1634*3425bc38SStefano Zampini     /* eq.48 Mandel Tezaur and Dohrmann 2005                          */
1635*3425bc38SStefano Zampini     /******************************************************************/
1636*3425bc38SStefano Zampini 
1637*3425bc38SStefano Zampini     ierr = VecSetRandom(pcis->vec1_N,PETSC_NULL);CHKERRQ(ierr);
1638*3425bc38SStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1639*3425bc38SStefano Zampini     scalar_value = 0.0;  /* set zero at vertices */
1640*3425bc38SStefano Zampini     for(i=0;i<n_vertices;i++) { array[vertex_indices[i]]=scalar_value; }
1641*3425bc38SStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1642*3425bc38SStefano Zampini 
1643*3425bc38SStefano Zampini     /* Jump operator P_D : results stored in pcis->vec1_B */
1644*3425bc38SStefano Zampini 
1645*3425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1646*3425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1647*3425bc38SStefano Zampini     /* Action of B_delta */
1648*3425bc38SStefano Zampini     ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
1649*3425bc38SStefano Zampini     ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr);
1650*3425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1651*3425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1652*3425bc38SStefano Zampini     /* Action of B_Ddelta^T */
1653*3425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
1654*3425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
1655*3425bc38SStefano Zampini     ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
1656*3425bc38SStefano Zampini     /* diagonal scaling */
1657*3425bc38SStefano Zampini     ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr);
1658*3425bc38SStefano Zampini     /* sum on the interface */
1659*3425bc38SStefano Zampini     ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
1660*3425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
1661*3425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
1662*3425bc38SStefano Zampini     ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
1663*3425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
1664*3425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
1665*3425bc38SStefano Zampini     ierr = VecNorm(pcis->vec1_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
1666*3425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"E[coll]: CHECK infty norm of R^T_D P_D: % 1.14e\n",scalar_value);CHKERRQ(ierr);
1667*3425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
1668*3425bc38SStefano Zampini 
1669*3425bc38SStefano Zampini     if(!fully_redundant) {
1670*3425bc38SStefano Zampini       /******************************************************************/
1671*3425bc38SStefano Zampini       /* TEST F: It should holds B_{delta}B^T_{D,delta}=I               */
1672*3425bc38SStefano Zampini       /* Corollary thm 14 Mandel Tezaur and Dohrmann 2005               */
1673*3425bc38SStefano Zampini       /******************************************************************/
1674*3425bc38SStefano Zampini       ierr = VecDuplicate(lambda_global,&test_vec);CHKERRQ(ierr);
1675*3425bc38SStefano Zampini       ierr = VecSetRandom(lambda_global,PETSC_NULL);CHKERRQ(ierr);
1676*3425bc38SStefano Zampini       /* Action of B_Ddelta^T */
1677*3425bc38SStefano Zampini       ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
1678*3425bc38SStefano Zampini       ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
1679*3425bc38SStefano Zampini       ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
1680*3425bc38SStefano Zampini       /* Action of B_delta */
1681*3425bc38SStefano Zampini       ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
1682*3425bc38SStefano Zampini       ierr = VecSet(test_vec,0.0);CHKERRQ(ierr);
1683*3425bc38SStefano Zampini       ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,test_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1684*3425bc38SStefano Zampini       ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,test_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1685*3425bc38SStefano Zampini       scalar_value = -1.0;
1686*3425bc38SStefano Zampini       ierr = VecAXPY(lambda_global,scalar_value,test_vec);CHKERRQ(ierr);
1687*3425bc38SStefano Zampini       ierr = VecNorm(lambda_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
1688*3425bc38SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"E[coll]: CHECK infty norm of P^T_D - I: % 1.14e\n",scalar_value);CHKERRQ(ierr);
1689*3425bc38SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
1690*3425bc38SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
1691*3425bc38SStefano Zampini       ierr = VecDestroy(&test_vec);CHKERRQ(ierr);
1692*3425bc38SStefano Zampini     }
1693*3425bc38SStefano Zampini   }
1694*3425bc38SStefano Zampini   /* final cleanup */
1695*3425bc38SStefano Zampini   ierr = PetscFree(dual_dofs_boundary_indices);CHKERRQ(ierr);
1696*3425bc38SStefano Zampini   ierr = PetscFree(vertex_indices);CHKERRQ(ierr);
1697*3425bc38SStefano Zampini   ierr = PetscFree(aux_local_numbering_1);CHKERRQ(ierr);
1698*3425bc38SStefano Zampini   ierr = PetscFree(aux_local_numbering_2);CHKERRQ(ierr);
1699*3425bc38SStefano Zampini   ierr = PetscFree(aux_global_numbering);CHKERRQ(ierr);
1700*3425bc38SStefano Zampini   ierr = PetscFree(aux_global_numbering_mpi);CHKERRQ(ierr);
1701*3425bc38SStefano Zampini   ierr = PetscFree(dof_sizes);CHKERRQ(ierr);
1702*3425bc38SStefano Zampini   ierr = PetscFree(dof_displs);CHKERRQ(ierr);
1703*3425bc38SStefano Zampini   ierr = PetscFree(all_aux_global_numbering_mpi_1);CHKERRQ(ierr);
1704*3425bc38SStefano Zampini   ierr = PetscFree(all_aux_global_numbering_mpi_2);CHKERRQ(ierr);
1705*3425bc38SStefano Zampini   ierr = PetscFree(global_dofs_numbering);CHKERRQ(ierr);
1706*3425bc38SStefano Zampini   ierr = PetscFree(aux_sums);CHKERRQ(ierr);
1707*3425bc38SStefano Zampini   ierr = PetscFree(cols_B_delta);CHKERRQ(ierr);
1708*3425bc38SStefano Zampini   ierr = PetscFree(vals_B_delta);CHKERRQ(ierr);
1709*3425bc38SStefano Zampini   ierr = PetscFree(scaling_factors);CHKERRQ(ierr);
1710*3425bc38SStefano Zampini   ierr = VecDestroy(&lambda_global);CHKERRQ(ierr);
1711*3425bc38SStefano Zampini   ierr = ISDestroy(&IS_l2g_lambda);CHKERRQ(ierr);
1712*3425bc38SStefano Zampini 
1713*3425bc38SStefano Zampini   PetscFunctionReturn(0);
1714*3425bc38SStefano Zampini }
1715*3425bc38SStefano Zampini 
1716*3425bc38SStefano Zampini #undef __FUNCT__
1717*3425bc38SStefano Zampini #define __FUNCT__ "PCBDDCSetupFETIDPPCContext"
1718*3425bc38SStefano Zampini static PetscErrorCode PCBDDCSetupFETIDPPCContext(Mat fetimat, FETIDPPC_ctx *fetidppc_ctx)
1719*3425bc38SStefano Zampini {
1720*3425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
1721*3425bc38SStefano Zampini   PetscErrorCode ierr;
1722*3425bc38SStefano Zampini 
1723*3425bc38SStefano Zampini   PetscFunctionBegin;
1724*3425bc38SStefano Zampini   ierr = MatShellGetContext(fetimat,&mat_ctx);CHKERRQ(ierr);
1725*3425bc38SStefano Zampini   /* get references from objects created when setting up feti mat context */
1726*3425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)mat_ctx->lambda_local);CHKERRQ(ierr);
1727*3425bc38SStefano Zampini   fetidppc_ctx->lambda_local = mat_ctx->lambda_local;
1728*3425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)mat_ctx->B_Ddelta);CHKERRQ(ierr);
1729*3425bc38SStefano Zampini   fetidppc_ctx->B_Ddelta = mat_ctx->B_Ddelta;
1730*3425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)mat_ctx->l2g_lambda);CHKERRQ(ierr);
1731*3425bc38SStefano Zampini   fetidppc_ctx->l2g_lambda = mat_ctx->l2g_lambda;
1732*3425bc38SStefano Zampini   PetscFunctionReturn(0);
1733*3425bc38SStefano Zampini }
1734*3425bc38SStefano Zampini 
1735*3425bc38SStefano Zampini #undef __FUNCT__
1736*3425bc38SStefano Zampini #define __FUNCT__ "FETIDPMatMult"
1737*3425bc38SStefano Zampini static PetscErrorCode FETIDPMatMult(Mat fetimat, Vec x, Vec y)
1738*3425bc38SStefano Zampini {
1739*3425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
1740*3425bc38SStefano Zampini   PC_IS          *pcis;
1741*3425bc38SStefano Zampini   PetscErrorCode ierr;
1742*3425bc38SStefano Zampini 
1743*3425bc38SStefano Zampini   PetscFunctionBegin;
1744*3425bc38SStefano Zampini   ierr = MatShellGetContext(fetimat,&mat_ctx);CHKERRQ(ierr);
1745*3425bc38SStefano Zampini   pcis = (PC_IS*)mat_ctx->pc->data;
1746*3425bc38SStefano Zampini   /* Application of B_delta^T */
1747*3425bc38SStefano Zampini   ierr = VecScatterBegin(mat_ctx->l2g_lambda,x,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
1748*3425bc38SStefano Zampini   ierr = VecScatterEnd(mat_ctx->l2g_lambda,x,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
1749*3425bc38SStefano Zampini   ierr = MatMultTranspose(mat_ctx->B_delta,mat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
1750*3425bc38SStefano Zampini   /* Application of \widetilde{S}^-1 */
1751*3425bc38SStefano Zampini   ierr = VecSet(pcis->vec1_D,0.0);CHKERRQ(ierr);
1752*3425bc38SStefano Zampini   ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr);
1753*3425bc38SStefano Zampini   /* Application of B_delta */
1754*3425bc38SStefano Zampini   ierr = MatMult(mat_ctx->B_delta,pcis->vec1_B,mat_ctx->lambda_local);CHKERRQ(ierr);
1755*3425bc38SStefano Zampini   ierr = VecSet(y,0.0);CHKERRQ(ierr);
1756*3425bc38SStefano Zampini   ierr = VecScatterBegin(mat_ctx->l2g_lambda,mat_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1757*3425bc38SStefano Zampini   ierr = VecScatterEnd(mat_ctx->l2g_lambda,mat_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1758*3425bc38SStefano Zampini   PetscFunctionReturn(0);
1759*3425bc38SStefano Zampini }
1760*3425bc38SStefano Zampini 
1761*3425bc38SStefano Zampini #undef __FUNCT__
1762*3425bc38SStefano Zampini #define __FUNCT__ "FETIDPPCApply"
1763*3425bc38SStefano Zampini static PetscErrorCode FETIDPPCApply(PC fetipc, Vec x, Vec y)
1764*3425bc38SStefano Zampini {
1765*3425bc38SStefano Zampini   FETIDPPC_ctx   *pc_ctx;
1766*3425bc38SStefano Zampini   PC_IS          *pcis;
1767*3425bc38SStefano Zampini   PetscErrorCode ierr;
1768*3425bc38SStefano Zampini 
1769*3425bc38SStefano Zampini   PetscFunctionBegin;
1770*3425bc38SStefano Zampini   ierr = PCShellGetContext(fetipc,(void**)&pc_ctx);
1771*3425bc38SStefano Zampini   pcis = (PC_IS*)pc_ctx->pc->data;
1772*3425bc38SStefano Zampini   /* Application of B_Ddelta^T */
1773*3425bc38SStefano Zampini   ierr = VecScatterBegin(pc_ctx->l2g_lambda,x,pc_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
1774*3425bc38SStefano Zampini   ierr = VecScatterEnd(pc_ctx->l2g_lambda,x,pc_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
1775*3425bc38SStefano Zampini   ierr = VecSet(pcis->vec2_B,0.0);CHKERRQ(ierr);
1776*3425bc38SStefano Zampini   ierr = MatMultTranspose(pc_ctx->B_Ddelta,pc_ctx->lambda_local,pcis->vec2_B);CHKERRQ(ierr);
1777*3425bc38SStefano Zampini   /* Application of S */
1778*3425bc38SStefano Zampini   ierr = PCISApplySchur(pc_ctx->pc,pcis->vec2_B,pcis->vec1_B,(Vec)0,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
1779*3425bc38SStefano Zampini   /* Application of B_Ddelta */
1780*3425bc38SStefano Zampini   ierr = MatMult(pc_ctx->B_Ddelta,pcis->vec1_B,pc_ctx->lambda_local);CHKERRQ(ierr);
1781*3425bc38SStefano Zampini   ierr = VecSet(y,0.0);CHKERRQ(ierr);
1782*3425bc38SStefano Zampini   ierr = VecScatterBegin(pc_ctx->l2g_lambda,pc_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1783*3425bc38SStefano Zampini   ierr = VecScatterEnd(pc_ctx->l2g_lambda,pc_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1784*3425bc38SStefano Zampini   PetscFunctionReturn(0);
1785*3425bc38SStefano Zampini }
1786*3425bc38SStefano Zampini 
1787da1bb401SStefano Zampini #undef __FUNCT__
1788da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetupLocalAdjacencyGraph"
1789da1bb401SStefano Zampini static PetscErrorCode PCBDDCSetupLocalAdjacencyGraph(PC pc)
1790da1bb401SStefano Zampini {
1791da1bb401SStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
1792da1bb401SStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
1793da1bb401SStefano Zampini   PetscInt       nvtxs,*xadj,*adjncy;
1794da1bb401SStefano Zampini   Mat            mat_adj;
1795da1bb401SStefano Zampini   PetscBool      symmetrize_rowij=PETSC_TRUE,compressed_rowij=PETSC_FALSE,flg_row=PETSC_TRUE;
1796da1bb401SStefano Zampini   PCBDDCGraph    mat_graph=pcbddc->mat_graph;
1797da1bb401SStefano Zampini   PetscErrorCode ierr;
1798da1bb401SStefano Zampini 
1799da1bb401SStefano Zampini   PetscFunctionBegin;
1800da1bb401SStefano Zampini   /* get CSR adjacency from local matrix if user has not yet provided local graph using PCBDDCSetLocalAdjacencyGraph function */
1801da1bb401SStefano Zampini   if(!mat_graph->xadj) {
1802da1bb401SStefano Zampini     ierr = MatConvert(matis->A,MATMPIADJ,MAT_INITIAL_MATRIX,&mat_adj);CHKERRQ(ierr);
1803da1bb401SStefano Zampini     ierr = MatGetRowIJ(mat_adj,0,symmetrize_rowij,compressed_rowij,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr);
1804da1bb401SStefano Zampini     if(!flg_row) {
1805da1bb401SStefano Zampini       SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in MatGetRowIJ called in %s\n",__FUNCT__);
1806da1bb401SStefano Zampini     }
1807da1bb401SStefano Zampini     /* Get adjacency into BDDC workspace */
1808da1bb401SStefano Zampini     ierr = PCBDDCSetLocalAdjacencyGraph(pc,nvtxs,xadj,adjncy,PETSC_COPY_VALUES);CHKERRQ(ierr);
1809da1bb401SStefano Zampini     ierr = MatRestoreRowIJ(mat_adj,0,symmetrize_rowij,compressed_rowij,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr);
1810da1bb401SStefano Zampini     if(!flg_row) {
1811da1bb401SStefano Zampini       SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in MatRestoreRowIJ called in %s\n",__FUNCT__);
1812da1bb401SStefano Zampini     }
1813da1bb401SStefano Zampini     ierr = MatDestroy(&mat_adj);CHKERRQ(ierr);
1814da1bb401SStefano Zampini   }
1815da1bb401SStefano Zampini   PetscFunctionReturn(0);
1816da1bb401SStefano Zampini }
1817da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
18180c7d97c5SJed Brown #undef __FUNCT__
18190c7d97c5SJed Brown #define __FUNCT__ "PCBDDCApplyInterfacePreconditioner"
18202617d88aSStefano Zampini static PetscErrorCode  PCBDDCApplyInterfacePreconditioner(PC pc)
18210c7d97c5SJed Brown {
18220c7d97c5SJed Brown   PetscErrorCode ierr;
18230c7d97c5SJed Brown   PC_BDDC*        pcbddc = (PC_BDDC*)(pc->data);
18240c7d97c5SJed Brown   PC_IS*            pcis = (PC_IS*)  (pc->data);
18253b03a366Sstefano_zampini   const PetscScalar zero = 0.0;
18260c7d97c5SJed Brown 
18270c7d97c5SJed Brown   PetscFunctionBegin;
18280c7d97c5SJed Brown   /* Application of PHI^T  */
18290c7d97c5SJed Brown   ierr = MatMultTranspose(pcbddc->coarse_phi_B,pcis->vec1_B,pcbddc->vec1_P);CHKERRQ(ierr);
18300c7d97c5SJed Brown   if(pcbddc->prec_type) { ierr = MatMultTransposeAdd(pcbddc->coarse_phi_D,pcis->vec1_D,pcbddc->vec1_P,pcbddc->vec1_P);CHKERRQ(ierr); }
18310c7d97c5SJed Brown 
18320c7d97c5SJed Brown   /* Scatter data of coarse_rhs */
18330c7d97c5SJed Brown   if(pcbddc->coarse_rhs) ierr = VecSet(pcbddc->coarse_rhs,zero);CHKERRQ(ierr);
18340c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->vec1_P,pcbddc->coarse_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18350c7d97c5SJed Brown 
18360c7d97c5SJed Brown   /* Local solution on R nodes */
18370c7d97c5SJed Brown   ierr = VecSet(pcbddc->vec1_R,zero);CHKERRQ(ierr);
18380c7d97c5SJed Brown   ierr = VecScatterBegin(pcbddc->R_to_B,pcis->vec1_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18390c7d97c5SJed Brown   ierr = VecScatterEnd  (pcbddc->R_to_B,pcis->vec1_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18400c7d97c5SJed Brown   if(pcbddc->prec_type) {
18410c7d97c5SJed Brown     ierr = VecScatterBegin(pcbddc->R_to_D,pcis->vec1_D,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18420c7d97c5SJed Brown     ierr = VecScatterEnd  (pcbddc->R_to_D,pcis->vec1_D,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18430c7d97c5SJed Brown   }
18440c7d97c5SJed Brown   ierr = PCBDDCSolveSaddlePoint(pc);CHKERRQ(ierr);
18450c7d97c5SJed Brown   ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr);
18460c7d97c5SJed Brown   ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec2_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18470c7d97c5SJed Brown   ierr = VecScatterEnd  (pcbddc->R_to_B,pcbddc->vec2_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18480c7d97c5SJed Brown   if(pcbddc->prec_type) {
18490c7d97c5SJed Brown     ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec2_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18500c7d97c5SJed Brown     ierr = VecScatterEnd  (pcbddc->R_to_D,pcbddc->vec2_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18510c7d97c5SJed Brown   }
18520c7d97c5SJed Brown 
18530c7d97c5SJed Brown   /* Coarse solution */
18540c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataEnd(pc,pcbddc->vec1_P,pcbddc->coarse_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
185553cdbc3dSStefano Zampini   if(pcbddc->coarse_rhs) ierr = KSPSolve(pcbddc->coarse_ksp,pcbddc->coarse_rhs,pcbddc->coarse_vec);CHKERRQ(ierr);
18560c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18570c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataEnd  (pc,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18580c7d97c5SJed Brown 
18590c7d97c5SJed Brown   /* Sum contributions from two levels */
18600c7d97c5SJed Brown   ierr = MatMultAdd(pcbddc->coarse_phi_B,pcbddc->vec1_P,pcis->vec1_B,pcis->vec1_B);CHKERRQ(ierr);
18610c7d97c5SJed Brown   if(pcbddc->prec_type) { ierr = MatMultAdd(pcbddc->coarse_phi_D,pcbddc->vec1_P,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); }
18620c7d97c5SJed Brown   PetscFunctionReturn(0);
18630c7d97c5SJed Brown }
18640c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
18650c7d97c5SJed Brown #undef __FUNCT__
18660c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSolveSaddlePoint"
186753cdbc3dSStefano Zampini static PetscErrorCode  PCBDDCSolveSaddlePoint(PC pc)
18680c7d97c5SJed Brown {
18690c7d97c5SJed Brown   PetscErrorCode ierr;
18700c7d97c5SJed Brown   PC_BDDC*       pcbddc = (PC_BDDC*)(pc->data);
18710c7d97c5SJed Brown 
18720c7d97c5SJed Brown   PetscFunctionBegin;
187353cdbc3dSStefano Zampini   ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
1874534831adSStefano Zampini   if(pcbddc->local_auxmat1) {
18750c7d97c5SJed Brown     ierr = MatMult(pcbddc->local_auxmat1,pcbddc->vec2_R,pcbddc->vec1_C);CHKERRQ(ierr);
18760c7d97c5SJed Brown     ierr = MatMultAdd(pcbddc->local_auxmat2,pcbddc->vec1_C,pcbddc->vec2_R,pcbddc->vec2_R);CHKERRQ(ierr);
18770c7d97c5SJed Brown   }
18780c7d97c5SJed Brown   PetscFunctionReturn(0);
18790c7d97c5SJed Brown }
18800c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
18810c7d97c5SJed Brown #undef __FUNCT__
18820c7d97c5SJed Brown #define __FUNCT__ "PCBDDCScatterCoarseDataBegin"
188353cdbc3dSStefano Zampini static PetscErrorCode  PCBDDCScatterCoarseDataBegin(PC pc,Vec vec_from, Vec vec_to, InsertMode imode, ScatterMode smode)
18840c7d97c5SJed Brown {
18850c7d97c5SJed Brown   PetscErrorCode ierr;
18860c7d97c5SJed Brown   PC_BDDC*       pcbddc = (PC_BDDC*)(pc->data);
18870c7d97c5SJed Brown 
18880c7d97c5SJed Brown   PetscFunctionBegin;
18890c7d97c5SJed Brown   switch(pcbddc->coarse_communications_type){
18900c7d97c5SJed Brown     case SCATTERS_BDDC:
18910c7d97c5SJed Brown       ierr = VecScatterBegin(pcbddc->coarse_loc_to_glob,vec_from,vec_to,imode,smode);CHKERRQ(ierr);
18920c7d97c5SJed Brown       break;
18930c7d97c5SJed Brown     case GATHERS_BDDC:
18940c7d97c5SJed Brown       break;
18950c7d97c5SJed Brown   }
18960c7d97c5SJed Brown   PetscFunctionReturn(0);
18970c7d97c5SJed Brown }
18980c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
18990c7d97c5SJed Brown #undef __FUNCT__
19000c7d97c5SJed Brown #define __FUNCT__ "PCBDDCScatterCoarseDataEnd"
190153cdbc3dSStefano Zampini static PetscErrorCode  PCBDDCScatterCoarseDataEnd(PC pc,Vec vec_from, Vec vec_to, InsertMode imode, ScatterMode smode)
19020c7d97c5SJed Brown {
19030c7d97c5SJed Brown   PetscErrorCode ierr;
19040c7d97c5SJed Brown   PC_BDDC*       pcbddc = (PC_BDDC*)(pc->data);
19050c7d97c5SJed Brown   PetscScalar*   array_to;
19060c7d97c5SJed Brown   PetscScalar*   array_from;
19070c7d97c5SJed Brown   MPI_Comm       comm=((PetscObject)pc)->comm;
19080c7d97c5SJed Brown   PetscInt i;
19090c7d97c5SJed Brown 
19100c7d97c5SJed Brown   PetscFunctionBegin;
19110c7d97c5SJed Brown 
19120c7d97c5SJed Brown   switch(pcbddc->coarse_communications_type){
19130c7d97c5SJed Brown     case SCATTERS_BDDC:
19140c7d97c5SJed Brown       ierr = VecScatterEnd(pcbddc->coarse_loc_to_glob,vec_from,vec_to,imode,smode);CHKERRQ(ierr);
19150c7d97c5SJed Brown       break;
19160c7d97c5SJed Brown     case GATHERS_BDDC:
19170c7d97c5SJed Brown       if(vec_from) VecGetArray(vec_from,&array_from);
19180c7d97c5SJed Brown       if(vec_to)   VecGetArray(vec_to,&array_to);
19190c7d97c5SJed Brown       switch(pcbddc->coarse_problem_type){
19200c7d97c5SJed Brown         case SEQUENTIAL_BDDC:
19210c7d97c5SJed Brown           if(smode == SCATTER_FORWARD) {
192253cdbc3dSStefano Zampini             ierr = MPI_Gatherv(&array_from[0],pcbddc->local_primal_size,MPIU_SCALAR,&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,0,comm);CHKERRQ(ierr);
19230c7d97c5SJed Brown             if(vec_to) {
19240c7d97c5SJed Brown               for(i=0;i<pcbddc->replicated_primal_size;i++)
19250c7d97c5SJed Brown                 array_to[pcbddc->replicated_local_primal_indices[i]]+=pcbddc->replicated_local_primal_values[i];
19260c7d97c5SJed Brown             }
19270c7d97c5SJed Brown           } else {
19280c7d97c5SJed Brown             if(vec_from)
19290c7d97c5SJed Brown               for(i=0;i<pcbddc->replicated_primal_size;i++)
19300c7d97c5SJed Brown                 pcbddc->replicated_local_primal_values[i]=array_from[pcbddc->replicated_local_primal_indices[i]];
193153cdbc3dSStefano Zampini             ierr = MPI_Scatterv(&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,&array_to[0],pcbddc->local_primal_size,MPIU_SCALAR,0,comm);CHKERRQ(ierr);
19320c7d97c5SJed Brown           }
19330c7d97c5SJed Brown           break;
19340c7d97c5SJed Brown         case REPLICATED_BDDC:
19350c7d97c5SJed Brown           if(smode == SCATTER_FORWARD) {
193653cdbc3dSStefano Zampini             ierr = MPI_Allgatherv(&array_from[0],pcbddc->local_primal_size,MPIU_SCALAR,&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,comm);CHKERRQ(ierr);
19370c7d97c5SJed Brown             for(i=0;i<pcbddc->replicated_primal_size;i++)
19380c7d97c5SJed Brown               array_to[pcbddc->replicated_local_primal_indices[i]]+=pcbddc->replicated_local_primal_values[i];
19390c7d97c5SJed Brown           } else { /* no communications needed for SCATTER_REVERSE since needed data is already present */
19400c7d97c5SJed Brown             for(i=0;i<pcbddc->local_primal_size;i++)
19410c7d97c5SJed Brown               array_to[i]=array_from[pcbddc->local_primal_indices[i]];
19420c7d97c5SJed Brown           }
19430c7d97c5SJed Brown           break;
194453cdbc3dSStefano Zampini         case MULTILEVEL_BDDC:
194553cdbc3dSStefano Zampini           break;
194653cdbc3dSStefano Zampini         case PARALLEL_BDDC:
194753cdbc3dSStefano Zampini           break;
19480c7d97c5SJed Brown       }
19490c7d97c5SJed Brown       if(vec_from) VecRestoreArray(vec_from,&array_from);
19500c7d97c5SJed Brown       if(vec_to)   VecRestoreArray(vec_to,&array_to);
19510c7d97c5SJed Brown       break;
19520c7d97c5SJed Brown   }
19530c7d97c5SJed Brown   PetscFunctionReturn(0);
19540c7d97c5SJed Brown }
19550c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
19563b03a366Sstefano_zampini #undef __FUNCT__
19573b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCCreateConstraintMatrix"
19583b03a366Sstefano_zampini static PetscErrorCode PCBDDCCreateConstraintMatrix(PC pc)
19593b03a366Sstefano_zampini {
19603b03a366Sstefano_zampini   PetscErrorCode ierr;
19613b03a366Sstefano_zampini   PC_IS*         pcis = (PC_IS*)(pc->data);
19623b03a366Sstefano_zampini   PC_BDDC*       pcbddc = (PC_BDDC*)pc->data;
19633b03a366Sstefano_zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
196423d4d1a5SStefano Zampini   PetscInt       *nnz,*is_indices;
19653b03a366Sstefano_zampini   PetscScalar    *temp_quadrature_constraint;
1966534831adSStefano Zampini   PetscInt       *temp_indices,*temp_indices_to_constraint,*temp_indices_to_constraint_B,*local_to_B;
19673b03a366Sstefano_zampini   PetscInt       local_primal_size,i,j,k,total_counts,max_size_of_constraint;
19683b03a366Sstefano_zampini   PetscInt       n_constraints,n_vertices,size_of_constraint;
1969534831adSStefano Zampini   PetscScalar    quad_value;
19703b03a366Sstefano_zampini   PetscBool      nnsp_has_cnst=PETSC_FALSE,use_nnsp_true=pcbddc->use_nnsp_true;
19713b03a366Sstefano_zampini   PetscInt       nnsp_size=0,nnsp_addone=0,temp_constraints,temp_start_ptr;
19723b03a366Sstefano_zampini   IS             *used_IS;
19733b03a366Sstefano_zampini   const MatType  impMatType=MATSEQAIJ;
19743b03a366Sstefano_zampini   PetscBLASInt   Bs,Bt,lwork,lierr;
19753b03a366Sstefano_zampini   PetscReal      tol=1.0e-8;
1976fcda91b4SJed Brown   MatNullSpace   nearnullsp;
1977fcda91b4SJed Brown   const Vec      *nearnullvecs;
19783b03a366Sstefano_zampini   Vec            *localnearnullsp;
19793b03a366Sstefano_zampini   PetscScalar    *work,*temp_basis,*array_vector,*correlation_mat;
19803b03a366Sstefano_zampini   PetscReal      *rwork,*singular_vals;
1981534831adSStefano Zampini   PetscBLASInt   Bone=1,*ipiv;
1982534831adSStefano Zampini   Vec            temp_vec;
1983534831adSStefano Zampini   Mat            temp_mat;
1984534831adSStefano Zampini   KSP            temp_ksp;
1985534831adSStefano Zampini   PetscInt       s,start_constraint,dual_dofs;
1986534831adSStefano Zampini   PetscBool      compute_submatrix,useksp=PETSC_FALSE;
1987534831adSStefano Zampini   PetscInt       *aux_primal_permutation,*aux_primal_numbering;
1988534831adSStefano Zampini   PetscBool      boolforface,*change_basis;
1989de534f79Sstefano_zampini /* some ugly conditional declarations */
19903b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
19913b03a366Sstefano_zampini   PetscScalar    dot_result;
19923b03a366Sstefano_zampini   PetscScalar    one=1.0,zero=0.0;
19933b03a366Sstefano_zampini   PetscInt       ii;
1994*3425bc38SStefano Zampini   PetscScalar    *singular_vectors;
1995*3425bc38SStefano Zampini   PetscBLASInt   *iwork,*ifail;
1996*3425bc38SStefano Zampini   PetscReal      dummy_real,abs_tol;
1997*3425bc38SStefano Zampini   PetscBLASInt   eigs_found;
19983b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
19993b03a366Sstefano_zampini   PetscScalar    val1,val2;
20003b03a366Sstefano_zampini #endif
2001*3425bc38SStefano Zampini #endif
20023b03a366Sstefano_zampini   PetscBLASInt   dummy_int;
20033b03a366Sstefano_zampini   PetscScalar    dummy_scalar;
20043b03a366Sstefano_zampini 
20053b03a366Sstefano_zampini   PetscFunctionBegin;
20063b03a366Sstefano_zampini   /* check if near null space is attached to global mat */
2007fcda91b4SJed Brown   ierr = MatGetNearNullSpace(pc->pmat,&nearnullsp);CHKERRQ(ierr);
2008fcda91b4SJed Brown   if (nearnullsp) {
2009fcda91b4SJed Brown     ierr = MatNullSpaceGetVecs(nearnullsp,&nnsp_has_cnst,&nnsp_size,&nearnullvecs);CHKERRQ(ierr);
20103b03a366Sstefano_zampini   } else { /* if near null space is not provided it uses constants */
20113b03a366Sstefano_zampini     nnsp_has_cnst = PETSC_TRUE;
20123b03a366Sstefano_zampini     use_nnsp_true = PETSC_TRUE;
20133b03a366Sstefano_zampini   }
20143b03a366Sstefano_zampini   if(nnsp_has_cnst) {
20153b03a366Sstefano_zampini     nnsp_addone = 1;
20163b03a366Sstefano_zampini   }
20173b03a366Sstefano_zampini   /*
20183b03a366Sstefano_zampini        Evaluate maximum storage size needed by the procedure
20193b03a366Sstefano_zampini        - temp_indices will contain start index of each constraint stored as follows
20203b03a366Sstefano_zampini        - temp_indices_to_constraint  [temp_indices[i],...,temp[indices[i+1]-1] will contain the indices (in local numbering) on which the constraint acts
2021534831adSStefano Zampini        - temp_indices_to_constraint_B[temp_indices[i],...,temp[indices[i+1]-1] will contain the indices (in boundary numbering) on which the constraint acts
20223b03a366Sstefano_zampini        - temp_quadrature_constraint  [temp_indices[i],...,temp[indices[i+1]-1] will contain the scalars representing the constraint itself
20233b03a366Sstefano_zampini                                                                                                                                                          */
2024da1bb401SStefano Zampini 
20253b03a366Sstefano_zampini   total_counts = pcbddc->n_ISForFaces+pcbddc->n_ISForEdges;
20263b03a366Sstefano_zampini   total_counts *= (nnsp_addone+nnsp_size);
2027da1bb401SStefano Zampini   ierr = ISGetSize(pcbddc->ISForVertices,&n_vertices);CHKERRQ(ierr);
2028da1bb401SStefano Zampini   total_counts += n_vertices;
20293b03a366Sstefano_zampini   ierr = PetscMalloc((total_counts+1)*sizeof(PetscInt),&temp_indices);CHKERRQ(ierr);
2030534831adSStefano Zampini   ierr = PetscMalloc((total_counts+1)*sizeof(PetscBool),&change_basis);CHKERRQ(ierr);
20313b03a366Sstefano_zampini   total_counts = 0;
20323b03a366Sstefano_zampini   max_size_of_constraint = 0;
20333b03a366Sstefano_zampini   for(i=0;i<pcbddc->n_ISForEdges+pcbddc->n_ISForFaces;i++){
20343b03a366Sstefano_zampini     if(i<pcbddc->n_ISForEdges){
20353b03a366Sstefano_zampini       used_IS = &pcbddc->ISForEdges[i];
20363b03a366Sstefano_zampini     } else {
20373b03a366Sstefano_zampini       used_IS = &pcbddc->ISForFaces[i-pcbddc->n_ISForEdges];
20383b03a366Sstefano_zampini     }
20393b03a366Sstefano_zampini     ierr = ISGetSize(*used_IS,&j);CHKERRQ(ierr);
20403b03a366Sstefano_zampini     total_counts += j;
20413b03a366Sstefano_zampini     if(j>max_size_of_constraint) max_size_of_constraint=j;
20423b03a366Sstefano_zampini   }
20433b03a366Sstefano_zampini   total_counts *= (nnsp_addone+nnsp_size);
2044da1bb401SStefano Zampini   total_counts += n_vertices;
20453b03a366Sstefano_zampini   ierr = PetscMalloc(total_counts*sizeof(PetscScalar),&temp_quadrature_constraint);CHKERRQ(ierr);
20463b03a366Sstefano_zampini   ierr = PetscMalloc(total_counts*sizeof(PetscInt),&temp_indices_to_constraint);CHKERRQ(ierr);
2047534831adSStefano Zampini   ierr = PetscMalloc(total_counts*sizeof(PetscInt),&temp_indices_to_constraint_B);CHKERRQ(ierr);
2048534831adSStefano Zampini   ierr = PetscMalloc(pcis->n*sizeof(PetscInt),&local_to_B);CHKERRQ(ierr);
2049534831adSStefano Zampini   ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2050534831adSStefano Zampini   for(i=0;i<pcis->n;i++) {
2051534831adSStefano Zampini     local_to_B[i]=-1;
2052534831adSStefano Zampini   }
2053534831adSStefano Zampini   for(i=0;i<pcis->n_B;i++) {
2054534831adSStefano Zampini     local_to_B[is_indices[i]]=i;
2055534831adSStefano Zampini   }
2056534831adSStefano Zampini   ierr = ISRestoreIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2057534831adSStefano Zampini 
20583b03a366Sstefano_zampini   /* First we issue queries to allocate optimal workspace for LAPACKgesvd or LAPACKsyev/LAPACKheev */
20593b03a366Sstefano_zampini   rwork = 0;
20603b03a366Sstefano_zampini   work = 0;
20613b03a366Sstefano_zampini   singular_vals = 0;
20623b03a366Sstefano_zampini   temp_basis = 0;
20633b03a366Sstefano_zampini   correlation_mat = 0;
20643b03a366Sstefano_zampini   if(!pcbddc->use_nnsp_true) {
20653b03a366Sstefano_zampini     PetscScalar temp_work;
20663b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
20673b03a366Sstefano_zampini     /* POD */
20683b03a366Sstefano_zampini     PetscInt max_n;
20693b03a366Sstefano_zampini     max_n = nnsp_addone+nnsp_size;
20703b03a366Sstefano_zampini     /* using some techniques borrowed from Proper Orthogonal Decomposition */
20713b03a366Sstefano_zampini     ierr = PetscMalloc(max_n*max_n*sizeof(PetscScalar),&correlation_mat);CHKERRQ(ierr);
2072*3425bc38SStefano Zampini     ierr = PetscMalloc(max_n*max_n*sizeof(PetscScalar),&singular_vectors);CHKERRQ(ierr);
20733b03a366Sstefano_zampini     ierr = PetscMalloc(max_n*sizeof(PetscReal),&singular_vals);CHKERRQ(ierr);
20743b03a366Sstefano_zampini     ierr = PetscMalloc(max_size_of_constraint*(nnsp_addone+nnsp_size)*sizeof(PetscScalar),&temp_basis);CHKERRQ(ierr);
20753b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
20763b03a366Sstefano_zampini     ierr = PetscMalloc(3*max_n*sizeof(PetscReal),&rwork);CHKERRQ(ierr);
20773b03a366Sstefano_zampini #endif
2078*3425bc38SStefano Zampini     ierr = PetscMalloc(5*max_n*sizeof(PetscBLASInt),&iwork);CHKERRQ(ierr);
2079*3425bc38SStefano Zampini     ierr = PetscMalloc(max_n*sizeof(PetscBLASInt),&ifail);CHKERRQ(ierr);
20803b03a366Sstefano_zampini     /* now we evaluate the optimal workspace using query with lwork=-1 */
20813b03a366Sstefano_zampini     Bt = PetscBLASIntCast(max_n);
20823b03a366Sstefano_zampini     lwork=-1;
2083*3425bc38SStefano Zampini     ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
20843b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
2085*3425bc38SStefano Zampini     abs_tol=1.e-8;
2086*3425bc38SStefano Zampini /*    LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,&temp_work,&lwork,&lierr); */
2087*3425bc38SStefano Zampini     LAPACKsyevx_("V","A","U",&Bt,correlation_mat,&Bt,&dummy_real,&dummy_real,&dummy_int,&dummy_int,
2088*3425bc38SStefano Zampini                  &abs_tol,&eigs_found,singular_vals,singular_vectors,&Bt,&temp_work,&lwork,iwork,ifail,&lierr);
20893b03a366Sstefano_zampini #else
2090*3425bc38SStefano Zampini /*    LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,&temp_work,&lwork,rwork,&lierr); */
2091*3425bc38SStefano Zampini /*  LAPACK call is missing here! TODO */
2092*3425bc38SStefano Zampini     SETERRQ(((PetscObject) pc)->comm, PETSC_ERR_SUP, "Not yet implemented for complexes when PETSC_MISSING_GESVD = 1");
20933b03a366Sstefano_zampini #endif
2094*3425bc38SStefano Zampini     if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SYEVX Lapack routine %d",(int)lierr);
2095*3425bc38SStefano Zampini     ierr = PetscFPTrapPop();CHKERRQ(ierr);
20963b03a366Sstefano_zampini #else /* on missing GESVD */
20973b03a366Sstefano_zampini     /* SVD */
20983b03a366Sstefano_zampini     PetscInt max_n,min_n;
20993b03a366Sstefano_zampini     max_n = max_size_of_constraint;
21003b03a366Sstefano_zampini     min_n = nnsp_addone+nnsp_size;
21013b03a366Sstefano_zampini     if(max_size_of_constraint < ( nnsp_addone+nnsp_size ) ) {
21023b03a366Sstefano_zampini       min_n = max_size_of_constraint;
21033b03a366Sstefano_zampini       max_n = nnsp_addone+nnsp_size;
21043b03a366Sstefano_zampini     }
21053b03a366Sstefano_zampini     ierr = PetscMalloc(min_n*sizeof(PetscReal),&singular_vals);CHKERRQ(ierr);
21063b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
21073b03a366Sstefano_zampini     ierr = PetscMalloc(5*min_n*sizeof(PetscReal),&rwork);CHKERRQ(ierr);
21083b03a366Sstefano_zampini #endif
21093b03a366Sstefano_zampini     /* now we evaluate the optimal workspace using query with lwork=-1 */
21103b03a366Sstefano_zampini     lwork=-1;
21113b03a366Sstefano_zampini     Bs = PetscBLASIntCast(max_n);
21123b03a366Sstefano_zampini     Bt = PetscBLASIntCast(min_n);
21133b03a366Sstefano_zampini     dummy_int = Bs;
2114670f3ff9SJed Brown     ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
21153b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
21163b03a366Sstefano_zampini     LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[0],&Bs,singular_vals,
21173b03a366Sstefano_zampini                  &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,&temp_work,&lwork,&lierr);
21183b03a366Sstefano_zampini #else
21193b03a366Sstefano_zampini     LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[0],&Bs,singular_vals,
21203b03a366Sstefano_zampini                  &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,&temp_work,&lwork,rwork,&lierr);
21213b03a366Sstefano_zampini #endif
21223b03a366Sstefano_zampini     if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SVD Lapack routine %d",(int)lierr);
2123670f3ff9SJed Brown     ierr = PetscFPTrapPop();CHKERRQ(ierr);
21243b03a366Sstefano_zampini #endif
21253b03a366Sstefano_zampini     /* Allocate optimal workspace */
21263b03a366Sstefano_zampini     lwork = PetscBLASIntCast((PetscInt)PetscRealPart(temp_work));
21273b03a366Sstefano_zampini     total_counts = (PetscInt)lwork;
21283b03a366Sstefano_zampini     ierr = PetscMalloc(total_counts*sizeof(PetscScalar),&work);CHKERRQ(ierr);
21293b03a366Sstefano_zampini   }
21303b03a366Sstefano_zampini   /* get local part of global near null space vectors */
21313b03a366Sstefano_zampini   ierr = PetscMalloc(nnsp_size*sizeof(Vec),&localnearnullsp);CHKERRQ(ierr);
21323b03a366Sstefano_zampini   for(k=0;k<nnsp_size;k++) {
21333b03a366Sstefano_zampini     ierr = VecDuplicate(pcis->vec1_N,&localnearnullsp[k]);CHKERRQ(ierr);
2134fcda91b4SJed Brown     ierr = VecScatterBegin(matis->ctx,nearnullvecs[k],localnearnullsp[k],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
2135fcda91b4SJed Brown     ierr = VecScatterEnd  (matis->ctx,nearnullvecs[k],localnearnullsp[k],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21363b03a366Sstefano_zampini   }
21373b03a366Sstefano_zampini   /* Now we can loop on constraining sets */
21383b03a366Sstefano_zampini   total_counts=0;
21393b03a366Sstefano_zampini   temp_indices[0]=0;
2140da1bb401SStefano Zampini   /* vertices */
2141da1bb401SStefano Zampini   PetscBool used_vertex;
2142da1bb401SStefano Zampini   ierr = ISGetIndices(pcbddc->ISForVertices,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2143da1bb401SStefano Zampini   if(nnsp_has_cnst) { /* consider all vertices */
2144da1bb401SStefano Zampini     for(i=0;i<n_vertices;i++) {
2145da1bb401SStefano Zampini       temp_indices_to_constraint[temp_indices[total_counts]]=is_indices[i];
2146534831adSStefano Zampini       temp_indices_to_constraint_B[temp_indices[total_counts]]=local_to_B[is_indices[i]];
2147da1bb401SStefano Zampini       temp_quadrature_constraint[temp_indices[total_counts]]=1.0;
2148da1bb401SStefano Zampini       temp_indices[total_counts+1]=temp_indices[total_counts]+1;
2149534831adSStefano Zampini       change_basis[total_counts]=PETSC_FALSE;
2150da1bb401SStefano Zampini       total_counts++;
2151da1bb401SStefano Zampini     }
2152da1bb401SStefano Zampini   } else { /* consider vertices for which exist at least a localnearnullsp which is not null there */
2153da1bb401SStefano Zampini     for(i=0;i<n_vertices;i++) {
2154da1bb401SStefano Zampini       used_vertex=PETSC_FALSE;
2155da1bb401SStefano Zampini       k=0;
2156da1bb401SStefano Zampini       while(!used_vertex && k<nnsp_size) {
2157da1bb401SStefano Zampini         ierr = VecGetArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
2158da1bb401SStefano Zampini         if(PetscAbsScalar(array_vector[is_indices[i]])>0.0) {
2159da1bb401SStefano Zampini           temp_indices_to_constraint[temp_indices[total_counts]]=is_indices[i];
2160534831adSStefano Zampini           temp_indices_to_constraint_B[temp_indices[total_counts]]=local_to_B[is_indices[i]];
2161da1bb401SStefano Zampini           temp_quadrature_constraint[temp_indices[total_counts]]=1.0;
2162da1bb401SStefano Zampini           temp_indices[total_counts+1]=temp_indices[total_counts]+1;
2163534831adSStefano Zampini           change_basis[total_counts]=PETSC_FALSE;
2164da1bb401SStefano Zampini           total_counts++;
2165da1bb401SStefano Zampini           used_vertex=PETSC_TRUE;
2166da1bb401SStefano Zampini         }
2167da1bb401SStefano Zampini         ierr = VecRestoreArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
2168da1bb401SStefano Zampini         k++;
2169da1bb401SStefano Zampini       }
2170da1bb401SStefano Zampini     }
2171da1bb401SStefano Zampini   }
2172da1bb401SStefano Zampini   ierr = ISRestoreIndices(pcbddc->ISForVertices,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2173da1bb401SStefano Zampini   n_vertices=total_counts;
2174da1bb401SStefano Zampini   /* edges and faces */
21753b03a366Sstefano_zampini   for(i=0;i<pcbddc->n_ISForEdges+pcbddc->n_ISForFaces;i++){
21763b03a366Sstefano_zampini     if(i<pcbddc->n_ISForEdges){
21773b03a366Sstefano_zampini       used_IS = &pcbddc->ISForEdges[i];
2178534831adSStefano Zampini       boolforface = pcbddc->usechangeofbasis;
21793b03a366Sstefano_zampini     } else {
21803b03a366Sstefano_zampini       used_IS = &pcbddc->ISForFaces[i-pcbddc->n_ISForEdges];
2181534831adSStefano Zampini       boolforface = pcbddc->usechangeonfaces;
21823b03a366Sstefano_zampini     }
21833b03a366Sstefano_zampini     temp_constraints = 0;          /* zero the number of constraints I have on this conn comp */
21843b03a366Sstefano_zampini     temp_start_ptr = total_counts; /* need to know the starting index of constraints stored */
21853b03a366Sstefano_zampini     ierr = ISGetSize(*used_IS,&size_of_constraint);CHKERRQ(ierr);
21863b03a366Sstefano_zampini     ierr = ISGetIndices(*used_IS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
21873b03a366Sstefano_zampini     if(nnsp_has_cnst) {
21883b03a366Sstefano_zampini       temp_constraints++;
2189534831adSStefano Zampini       quad_value = (PetscScalar) (1.0/PetscSqrtReal((PetscReal)size_of_constraint));
21903b03a366Sstefano_zampini       for(j=0;j<size_of_constraint;j++) {
21913b03a366Sstefano_zampini         temp_indices_to_constraint[temp_indices[total_counts]+j]=is_indices[j];
2192534831adSStefano Zampini         temp_indices_to_constraint_B[temp_indices[total_counts]+j]=local_to_B[is_indices[j]];
21933b03a366Sstefano_zampini         temp_quadrature_constraint[temp_indices[total_counts]+j]=quad_value;
21943b03a366Sstefano_zampini       }
21953b03a366Sstefano_zampini       temp_indices[total_counts+1]=temp_indices[total_counts]+size_of_constraint;  /* store new starting point */
2196534831adSStefano Zampini       change_basis[total_counts]=boolforface;
21973b03a366Sstefano_zampini       total_counts++;
21983b03a366Sstefano_zampini     }
21993b03a366Sstefano_zampini     for(k=0;k<nnsp_size;k++) {
22003b03a366Sstefano_zampini       ierr = VecGetArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
22013b03a366Sstefano_zampini       for(j=0;j<size_of_constraint;j++) {
22023b03a366Sstefano_zampini         temp_indices_to_constraint[temp_indices[total_counts]+j]=is_indices[j];
2203534831adSStefano Zampini         temp_indices_to_constraint_B[temp_indices[total_counts]+j]=local_to_B[is_indices[j]];
22043b03a366Sstefano_zampini         temp_quadrature_constraint[temp_indices[total_counts]+j]=array_vector[is_indices[j]];
22053b03a366Sstefano_zampini       }
22063b03a366Sstefano_zampini       ierr = VecRestoreArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
2207de534f79Sstefano_zampini       quad_value = 1.0;
2208de534f79Sstefano_zampini       if( use_nnsp_true ) { /* check if array is null on the connected component in case use_nnsp_true has been requested */
2209de534f79Sstefano_zampini         Bs = PetscBLASIntCast(size_of_constraint);
2210de534f79Sstefano_zampini         quad_value = BLASasum_(&Bs,&temp_quadrature_constraint[temp_indices[total_counts]],&Bone);
2211de534f79Sstefano_zampini       }
2212de534f79Sstefano_zampini       if ( quad_value > 0.0 ) { /* keep indices and values */
2213de534f79Sstefano_zampini         temp_constraints++;
22143b03a366Sstefano_zampini         temp_indices[total_counts+1]=temp_indices[total_counts]+size_of_constraint;  /* store new starting point */
2215534831adSStefano Zampini         change_basis[total_counts]=boolforface;
22163b03a366Sstefano_zampini         total_counts++;
22173b03a366Sstefano_zampini       }
2218de534f79Sstefano_zampini     }
22193b03a366Sstefano_zampini     ierr = ISRestoreIndices(*used_IS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2220de534f79Sstefano_zampini     /* perform SVD on the constraint if use_nnsp_true has not been requested by the user */
22213b03a366Sstefano_zampini     if(!use_nnsp_true) {
2222de534f79Sstefano_zampini 
22233b03a366Sstefano_zampini       Bs = PetscBLASIntCast(size_of_constraint);
22243b03a366Sstefano_zampini       Bt = PetscBLASIntCast(temp_constraints);
2225de534f79Sstefano_zampini 
22263b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
22273b03a366Sstefano_zampini       ierr = PetscMemzero(correlation_mat,Bt*Bt*sizeof(PetscScalar));CHKERRQ(ierr);
22283b03a366Sstefano_zampini       /* Store upper triangular part of correlation matrix */
22293b03a366Sstefano_zampini       for(j=0;j<temp_constraints;j++) {
22303b03a366Sstefano_zampini         for(k=0;k<j+1;k++) {
22313b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
2232*3425bc38SStefano Zampini           /* hand made complex dot product -> replace */
22333b03a366Sstefano_zampini           dot_result = 0.0;
22343b03a366Sstefano_zampini           for (ii=0; ii<size_of_constraint; ii++) {
22353b03a366Sstefano_zampini             val1 = temp_quadrature_constraint[temp_indices[temp_start_ptr+j]+ii];
22363b03a366Sstefano_zampini             val2 = temp_quadrature_constraint[temp_indices[temp_start_ptr+k]+ii];
22373b03a366Sstefano_zampini             dot_result += val1*PetscConj(val2);
22383b03a366Sstefano_zampini           }
22393b03a366Sstefano_zampini #else
22403b03a366Sstefano_zampini           dot_result = BLASdot_(&Bs,&temp_quadrature_constraint[temp_indices[temp_start_ptr+j]],&Bone,
22413b03a366Sstefano_zampini                                     &temp_quadrature_constraint[temp_indices[temp_start_ptr+k]],&Bone);
22423b03a366Sstefano_zampini #endif
22433b03a366Sstefano_zampini           correlation_mat[j*temp_constraints+k]=dot_result;
22443b03a366Sstefano_zampini         }
22453b03a366Sstefano_zampini       }
2246*3425bc38SStefano Zampini       ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
22473b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
2248*3425bc38SStefano Zampini /*      LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,work,&lwork,&lierr); */
2249*3425bc38SStefano Zampini       LAPACKsyevx_("V","A","U",&Bt,correlation_mat,&Bt,&dummy_real,&dummy_real,&dummy_int,&dummy_int,
2250*3425bc38SStefano Zampini                  &abs_tol,&eigs_found,singular_vals,singular_vectors,&Bt,work,&lwork,iwork,ifail,&lierr);
22513b03a366Sstefano_zampini #else
2252*3425bc38SStefano Zampini /*  LAPACK call is missing here! TODO */
2253*3425bc38SStefano Zampini       SETERRQ(((PetscObject) pc)->comm, PETSC_ERR_SUP, "Not yet implemented for complexes when PETSC_MISSING_GESVD = 1");
22543b03a366Sstefano_zampini #endif
2255*3425bc38SStefano Zampini       if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYEVX Lapack routine %d",(int)lierr);
2256*3425bc38SStefano Zampini       ierr = PetscFPTrapPop();CHKERRQ(ierr);
22573b03a366Sstefano_zampini       /* retain eigenvalues greater than tol: note that LAPACK SYEVX returns eigenvalues in ascending order */
22583b03a366Sstefano_zampini       j=0;
22593b03a366Sstefano_zampini       while( j < Bt && singular_vals[j] < tol) j++;
22603b03a366Sstefano_zampini       total_counts=total_counts-j;
22613b03a366Sstefano_zampini       if(j<temp_constraints) {
22623b03a366Sstefano_zampini         for(k=j;k<Bt;k++) { singular_vals[k]=1.0/PetscSqrtReal(singular_vals[k]); }
2263*3425bc38SStefano Zampini         ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
22643b03a366Sstefano_zampini         BLASgemm_("N","N",&Bs,&Bt,&Bt,&one,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,correlation_mat,&Bt,&zero,temp_basis,&Bs);
2265*3425bc38SStefano Zampini         ierr = PetscFPTrapPop();CHKERRQ(ierr);
22663b03a366Sstefano_zampini         /* copy POD basis into used quadrature memory */
22673b03a366Sstefano_zampini         for(k=0;k<Bt-j;k++) {
22683b03a366Sstefano_zampini           for(ii=0;ii<size_of_constraint;ii++) {
22693b03a366Sstefano_zampini             temp_quadrature_constraint[temp_indices[temp_start_ptr+k]+ii]=singular_vals[Bt-1-k]*temp_basis[(Bt-1-k)*size_of_constraint+ii];
22703b03a366Sstefano_zampini           }
22713b03a366Sstefano_zampini         }
22723b03a366Sstefano_zampini       }
2273de534f79Sstefano_zampini 
22743b03a366Sstefano_zampini #else  /* on missing GESVD */
22753b03a366Sstefano_zampini       PetscInt min_n = temp_constraints;
22763b03a366Sstefano_zampini       if(min_n > size_of_constraint) min_n = size_of_constraint;
22773b03a366Sstefano_zampini       dummy_int = Bs;
2278670f3ff9SJed Brown       ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
22793b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
22803b03a366Sstefano_zampini       LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,singular_vals,
22813b03a366Sstefano_zampini                    &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,work,&lwork,&lierr);
22823b03a366Sstefano_zampini #else
22833b03a366Sstefano_zampini       LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,singular_vals,
22843b03a366Sstefano_zampini                    &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,work,&lwork,rwork,&lierr);
22853b03a366Sstefano_zampini #endif
22863b03a366Sstefano_zampini       if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SVD Lapack routine %d",(int)lierr);
2287670f3ff9SJed Brown       ierr = PetscFPTrapPop();CHKERRQ(ierr);
22883b03a366Sstefano_zampini       /* retain singular values greater than tol: note that LAPACK GESVD returns singular values in descending order */
22893b03a366Sstefano_zampini       j=0;
22903b03a366Sstefano_zampini       while( j < min_n && singular_vals[min_n-j-1] < tol) j++;
22913b03a366Sstefano_zampini       total_counts = total_counts-(PetscInt)Bt+(min_n-j);
22923b03a366Sstefano_zampini #endif
22933b03a366Sstefano_zampini     }
22943b03a366Sstefano_zampini   }
2295534831adSStefano Zampini 
2296da1bb401SStefano Zampini   n_constraints=total_counts-n_vertices;
2297da1bb401SStefano Zampini   local_primal_size = total_counts;
22983b03a366Sstefano_zampini   /* set quantities in pcbddc data structure */
22993b03a366Sstefano_zampini   pcbddc->n_vertices = n_vertices;
23003b03a366Sstefano_zampini   pcbddc->n_constraints = n_constraints;
2301da1bb401SStefano Zampini   pcbddc->local_primal_size = local_primal_size;
2302534831adSStefano Zampini 
2303534831adSStefano Zampini   /* Create constraint matrix */
2304534831adSStefano Zampini   /* The constraint matrix is used to compute the l2g map of primal dofs */
2305534831adSStefano Zampini   /* so we need to set it up properly either with or without change of basis */
2306534831adSStefano Zampini   ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->ConstraintMatrix);CHKERRQ(ierr);
2307534831adSStefano Zampini   ierr = MatSetType(pcbddc->ConstraintMatrix,impMatType);CHKERRQ(ierr);
2308534831adSStefano Zampini   ierr = MatSetSizes(pcbddc->ConstraintMatrix,local_primal_size,pcis->n,local_primal_size,pcis->n);CHKERRQ(ierr);
2309534831adSStefano Zampini   /* compute a local numbering of constraints : vertices first then constraints */
2310534831adSStefano Zampini   ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
2311534831adSStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array_vector);CHKERRQ(ierr);
2312534831adSStefano Zampini   ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&aux_primal_numbering);CHKERRQ(ierr);
2313534831adSStefano Zampini   ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&aux_primal_permutation);CHKERRQ(ierr);
2314534831adSStefano Zampini   total_counts=0;
2315534831adSStefano Zampini   /* find vertices: subdomain corners plus dofs with basis changed */
2316534831adSStefano Zampini   for(i=0;i<local_primal_size;i++) {
2317534831adSStefano Zampini     size_of_constraint=temp_indices[i+1]-temp_indices[i];
2318534831adSStefano Zampini     if(change_basis[i] || size_of_constraint == 1) {
2319534831adSStefano Zampini       k=0;
2320534831adSStefano Zampini       while(k < size_of_constraint && array_vector[temp_indices_to_constraint[temp_indices[i]+size_of_constraint-k-1]] != 0.0) {
2321534831adSStefano Zampini         k=k+1;
2322534831adSStefano Zampini       }
2323534831adSStefano Zampini       j=temp_indices_to_constraint[temp_indices[i]+size_of_constraint-k-1];
2324534831adSStefano Zampini       array_vector[j] = 1.0;
2325534831adSStefano Zampini       aux_primal_numbering[total_counts]=j;
2326534831adSStefano Zampini       aux_primal_permutation[total_counts]=total_counts;
2327534831adSStefano Zampini       total_counts++;
2328534831adSStefano Zampini     }
2329534831adSStefano Zampini   }
2330534831adSStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array_vector);CHKERRQ(ierr);
2331534831adSStefano Zampini   /* permute indices in order to have a sorted set of vertices */
2332534831adSStefano Zampini   ierr = PetscSortIntWithPermutation(total_counts,aux_primal_numbering,aux_primal_permutation);
2333534831adSStefano Zampini   /* nonzero structure */
2334534831adSStefano Zampini   ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
2335534831adSStefano Zampini   for(i=0;i<total_counts;i++) {
2336534831adSStefano Zampini     nnz[i]=1;
2337534831adSStefano Zampini   }
2338534831adSStefano Zampini   j=total_counts;
2339534831adSStefano Zampini   for(i=n_vertices;i<local_primal_size;i++) {
2340534831adSStefano Zampini     if(!change_basis[i]) {
2341534831adSStefano Zampini       nnz[j]=temp_indices[i+1]-temp_indices[i];
2342534831adSStefano Zampini       j++;
2343534831adSStefano Zampini     }
2344534831adSStefano Zampini   }
2345534831adSStefano Zampini   ierr = MatSeqAIJSetPreallocation(pcbddc->ConstraintMatrix,0,nnz);CHKERRQ(ierr);
2346534831adSStefano Zampini   ierr = PetscFree(nnz);CHKERRQ(ierr);
2347534831adSStefano Zampini   /* set values in constraint matrix */
2348534831adSStefano Zampini   for(i=0;i<total_counts;i++) {
2349534831adSStefano Zampini     j = aux_primal_permutation[i];
2350534831adSStefano Zampini     k = aux_primal_numbering[j];
2351534831adSStefano Zampini     ierr = MatSetValue(pcbddc->ConstraintMatrix,i,k,1.0,INSERT_VALUES);CHKERRQ(ierr);
2352534831adSStefano Zampini   }
2353534831adSStefano Zampini   for(i=n_vertices;i<local_primal_size;i++) {
2354534831adSStefano Zampini     if(!change_basis[i]) {
2355534831adSStefano Zampini       size_of_constraint=temp_indices[i+1]-temp_indices[i];
2356534831adSStefano Zampini       ierr = MatSetValues(pcbddc->ConstraintMatrix,1,&total_counts,size_of_constraint,&temp_indices_to_constraint[temp_indices[i]],&temp_quadrature_constraint[temp_indices[i]],INSERT_VALUES);CHKERRQ(ierr);
2357534831adSStefano Zampini       total_counts++;
2358534831adSStefano Zampini     }
2359534831adSStefano Zampini   }
2360534831adSStefano Zampini   ierr = PetscFree(aux_primal_numbering);CHKERRQ(ierr);
2361534831adSStefano Zampini   ierr = PetscFree(aux_primal_permutation);CHKERRQ(ierr);
2362534831adSStefano Zampini   /* assembling */
2363534831adSStefano Zampini   ierr = MatAssemblyBegin(pcbddc->ConstraintMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2364534831adSStefano Zampini   ierr = MatAssemblyEnd(pcbddc->ConstraintMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2365534831adSStefano Zampini 
2366534831adSStefano Zampini   /* Create matrix for change of basis. We don't need it in case pcbddc->usechangeofbasis is FALSE */
2367534831adSStefano Zampini   if(pcbddc->usechangeofbasis) {
2368534831adSStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr);
2369534831adSStefano Zampini     ierr = MatSetType(pcbddc->ChangeOfBasisMatrix,impMatType);CHKERRQ(ierr);
2370534831adSStefano Zampini     ierr = MatSetSizes(pcbddc->ChangeOfBasisMatrix,pcis->n_B,pcis->n_B,pcis->n_B,pcis->n_B);CHKERRQ(ierr);
2371534831adSStefano Zampini     /* work arrays */
2372534831adSStefano Zampini     /* we need to reuse these arrays, so we free them */
2373534831adSStefano Zampini     ierr = PetscFree(temp_basis);CHKERRQ(ierr);
2374534831adSStefano Zampini     ierr = PetscFree(work);CHKERRQ(ierr);
2375534831adSStefano Zampini     ierr = PetscMalloc(pcis->n_B*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
2376534831adSStefano Zampini     ierr = PetscMalloc((nnsp_addone+nnsp_size)*(nnsp_addone+nnsp_size)*sizeof(PetscScalar),&temp_basis);CHKERRQ(ierr);
2377534831adSStefano Zampini     ierr = PetscMalloc((nnsp_addone+nnsp_size)*sizeof(PetscScalar),&work);CHKERRQ(ierr);
2378534831adSStefano Zampini     ierr = PetscMalloc((nnsp_addone+nnsp_size)*sizeof(PetscBLASInt),&ipiv);CHKERRQ(ierr);
2379534831adSStefano Zampini     for(i=0;i<pcis->n_B;i++) {
2380534831adSStefano Zampini       nnz[i]=1;
2381534831adSStefano Zampini     }
2382534831adSStefano Zampini     /* Overestimated nonzeros per row */
2383534831adSStefano Zampini     k=1;
2384534831adSStefano Zampini     for(i=pcbddc->n_vertices;i<local_primal_size;i++) {
2385534831adSStefano Zampini       if(change_basis[i]) {
2386534831adSStefano Zampini         size_of_constraint = temp_indices[i+1]-temp_indices[i];
2387534831adSStefano Zampini         if(k < size_of_constraint) {
2388534831adSStefano Zampini           k = size_of_constraint;
2389534831adSStefano Zampini         }
2390534831adSStefano Zampini         for(j=0;j<size_of_constraint;j++) {
2391534831adSStefano Zampini           nnz[temp_indices_to_constraint_B[temp_indices[i]+j]] = size_of_constraint;
2392534831adSStefano Zampini         }
2393534831adSStefano Zampini       }
2394534831adSStefano Zampini     }
2395534831adSStefano Zampini     ierr = MatSeqAIJSetPreallocation(pcbddc->ChangeOfBasisMatrix,0,nnz);CHKERRQ(ierr);
2396534831adSStefano Zampini     ierr = PetscFree(nnz);CHKERRQ(ierr);
2397534831adSStefano Zampini     /* Temporary array to store indices */
2398534831adSStefano Zampini     ierr = PetscMalloc(k*sizeof(PetscInt),&is_indices);CHKERRQ(ierr);
2399534831adSStefano Zampini     /* Set initial identity in the matrix */
2400534831adSStefano Zampini     for(i=0;i<pcis->n_B;i++) {
2401534831adSStefano Zampini       ierr = MatSetValue(pcbddc->ChangeOfBasisMatrix,i,i,1.0,INSERT_VALUES);CHKERRQ(ierr);
2402534831adSStefano Zampini     }
2403534831adSStefano Zampini     /* Now we loop on the constraints which need a change of basis */
2404534831adSStefano Zampini     /* Change of basis matrix is evaluated as the FIRST APPROACH in */
2405534831adSStefano Zampini     /* Klawonn and Widlund, Dual-primal FETI-DP methods for linear elasticity, (6.2.1) */
2406534831adSStefano Zampini     temp_constraints = 0;
2407534831adSStefano Zampini     temp_start_ptr = temp_indices_to_constraint_B[temp_indices[pcbddc->n_vertices]];
2408534831adSStefano Zampini     for(i=pcbddc->n_vertices;i<local_primal_size;i++) {
2409534831adSStefano Zampini       if(change_basis[i]) {
2410534831adSStefano Zampini         compute_submatrix = PETSC_FALSE;
2411534831adSStefano Zampini         useksp = PETSC_FALSE;
2412534831adSStefano Zampini         if(temp_start_ptr == temp_indices_to_constraint_B[temp_indices[i]]) {
2413534831adSStefano Zampini           temp_constraints++;
2414534831adSStefano Zampini           if(temp_start_ptr != temp_indices_to_constraint_B[temp_indices[i+1]]) {
2415534831adSStefano Zampini             compute_submatrix = PETSC_TRUE;
2416534831adSStefano Zampini           }
2417534831adSStefano Zampini         }
2418534831adSStefano Zampini         if(compute_submatrix) {
2419534831adSStefano Zampini           if(temp_constraints > 1 || pcbddc->use_nnsp_true) {
2420534831adSStefano Zampini             useksp = PETSC_TRUE;
2421534831adSStefano Zampini           }
2422534831adSStefano Zampini           size_of_constraint = temp_indices[i+1]-temp_indices[i];
2423534831adSStefano Zampini           if(useksp) { /* experimental */
2424534831adSStefano Zampini             ierr = MatCreate(PETSC_COMM_SELF,&temp_mat);CHKERRQ(ierr);
2425534831adSStefano Zampini             ierr = MatSetType(temp_mat,impMatType);CHKERRQ(ierr);
2426534831adSStefano Zampini             ierr = MatSetSizes(temp_mat,size_of_constraint,size_of_constraint,size_of_constraint,size_of_constraint);CHKERRQ(ierr);
2427534831adSStefano Zampini             ierr = MatSeqAIJSetPreallocation(temp_mat,size_of_constraint,PETSC_NULL);CHKERRQ(ierr);
2428534831adSStefano Zampini           }
2429534831adSStefano Zampini           /* First _size_of_constraint-temp_constraints_ columns */
2430534831adSStefano Zampini           dual_dofs = size_of_constraint-temp_constraints;
2431534831adSStefano Zampini           start_constraint = i+1-temp_constraints;
2432534831adSStefano Zampini           for(s=0;s<dual_dofs;s++) {
2433534831adSStefano Zampini             is_indices[0] = s;
2434534831adSStefano Zampini             for(j=0;j<temp_constraints;j++) {
2435534831adSStefano Zampini               for(k=0;k<temp_constraints;k++) {
2436534831adSStefano Zampini                 temp_basis[j*temp_constraints+k]=temp_quadrature_constraint[temp_indices[start_constraint+k]+s+j+1];
2437534831adSStefano Zampini               }
2438534831adSStefano Zampini               work[j]=-temp_quadrature_constraint[temp_indices[start_constraint+j]+s];
2439534831adSStefano Zampini               is_indices[j+1]=s+j+1;
2440534831adSStefano Zampini             }
2441534831adSStefano Zampini             Bt = temp_constraints;
2442534831adSStefano Zampini             ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
2443534831adSStefano Zampini             LAPACKgesv_(&Bt,&Bone,temp_basis,&Bt,ipiv,work,&Bt,&lierr);
2444534831adSStefano Zampini             if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GESV Lapack routine %d",(int)lierr);
2445534831adSStefano Zampini             ierr = PetscFPTrapPop();CHKERRQ(ierr);
2446534831adSStefano Zampini             j = temp_indices_to_constraint_B[temp_indices[start_constraint]+s];
2447534831adSStefano Zampini             ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,temp_constraints,&temp_indices_to_constraint_B[temp_indices[start_constraint]+s+1],1,&j,work,INSERT_VALUES);CHKERRQ(ierr);
2448534831adSStefano Zampini             if(useksp) {
2449534831adSStefano Zampini               /* temp mat with transposed rows and columns */
2450534831adSStefano Zampini               ierr = MatSetValues(temp_mat,1,&s,temp_constraints,&is_indices[1],work,INSERT_VALUES);CHKERRQ(ierr);
2451534831adSStefano Zampini               ierr = MatSetValue(temp_mat,is_indices[0],is_indices[0],1.0,INSERT_VALUES);CHKERRQ(ierr);
2452534831adSStefano Zampini             }
2453534831adSStefano Zampini           }
2454534831adSStefano Zampini           if(useksp) {
2455534831adSStefano Zampini             /* last rows of temp_mat */
2456534831adSStefano Zampini             for(j=0;j<size_of_constraint;j++) {
2457534831adSStefano Zampini               is_indices[j] = j;
2458534831adSStefano Zampini             }
2459534831adSStefano Zampini             for(s=0;s<temp_constraints;s++) {
2460534831adSStefano Zampini               k = s + dual_dofs;
2461534831adSStefano Zampini               ierr = MatSetValues(temp_mat,1,&k,size_of_constraint,is_indices,&temp_quadrature_constraint[temp_indices[start_constraint+s]],INSERT_VALUES);CHKERRQ(ierr);
2462534831adSStefano Zampini             }
2463534831adSStefano Zampini             ierr = MatAssemblyBegin(temp_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2464534831adSStefano Zampini             ierr = MatAssemblyEnd(temp_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2465534831adSStefano Zampini             ierr = MatGetVecs(temp_mat,&temp_vec,PETSC_NULL);CHKERRQ(ierr);
2466534831adSStefano Zampini             ierr = KSPCreate(PETSC_COMM_SELF,&temp_ksp);CHKERRQ(ierr);
2467534831adSStefano Zampini             ierr = KSPSetOperators(temp_ksp,temp_mat,temp_mat,SAME_PRECONDITIONER);CHKERRQ(ierr);
2468534831adSStefano Zampini             ierr = KSPSetType(temp_ksp,KSPPREONLY);CHKERRQ(ierr);
2469534831adSStefano Zampini             ierr = KSPSetUp(temp_ksp);CHKERRQ(ierr);
2470534831adSStefano Zampini             for(s=0;s<temp_constraints;s++) {
2471534831adSStefano Zampini               ierr = VecSet(temp_vec,0.0);CHKERRQ(ierr);
2472534831adSStefano Zampini               ierr = VecSetValue(temp_vec,s+dual_dofs,1.0,INSERT_VALUES);CHKERRQ(ierr);
2473534831adSStefano Zampini               ierr = VecAssemblyBegin(temp_vec);CHKERRQ(ierr);
2474534831adSStefano Zampini               ierr = VecAssemblyEnd(temp_vec);CHKERRQ(ierr);
2475534831adSStefano Zampini               ierr = KSPSolve(temp_ksp,temp_vec,temp_vec);CHKERRQ(ierr);
2476534831adSStefano Zampini               ierr = VecGetArray(temp_vec,&array_vector);CHKERRQ(ierr);
2477534831adSStefano Zampini               j = temp_indices_to_constraint_B[temp_indices[start_constraint+s]+size_of_constraint-s-1];
2478534831adSStefano Zampini               /* last columns of change of basis matrix associated to new primal dofs */
2479534831adSStefano Zampini               ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,size_of_constraint,&temp_indices_to_constraint_B[temp_indices[start_constraint+s]],1,&j,array_vector,INSERT_VALUES);CHKERRQ(ierr);
2480534831adSStefano Zampini               ierr = VecRestoreArray(temp_vec,&array_vector);CHKERRQ(ierr);
2481534831adSStefano Zampini             }
2482534831adSStefano Zampini             ierr = MatDestroy(&temp_mat);CHKERRQ(ierr);
2483534831adSStefano Zampini             ierr = KSPDestroy(&temp_ksp);CHKERRQ(ierr);
2484534831adSStefano Zampini             ierr = VecDestroy(&temp_vec);CHKERRQ(ierr);
2485534831adSStefano Zampini           } else {
2486534831adSStefano Zampini             /* last columns of change of basis matrix associated to new primal dofs */
2487534831adSStefano Zampini             for(s=0;s<temp_constraints;s++) {
2488534831adSStefano Zampini               j = temp_indices_to_constraint_B[temp_indices[start_constraint+s]+size_of_constraint-s-1];
2489534831adSStefano Zampini               ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,size_of_constraint,&temp_indices_to_constraint_B[temp_indices[start_constraint+s]],1,&j,&temp_quadrature_constraint[temp_indices[start_constraint+s]],INSERT_VALUES);CHKERRQ(ierr);
2490534831adSStefano Zampini             }
2491534831adSStefano Zampini           }
2492534831adSStefano Zampini           /* prepare for the next cycle */
2493534831adSStefano Zampini           temp_constraints = 0;
2494534831adSStefano Zampini           temp_start_ptr = temp_indices_to_constraint_B[temp_indices[i+1]];
2495534831adSStefano Zampini         }
2496534831adSStefano Zampini       }
2497534831adSStefano Zampini     }
2498534831adSStefano Zampini     /* assembling */
2499534831adSStefano Zampini     ierr = MatAssemblyBegin(pcbddc->ChangeOfBasisMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2500534831adSStefano Zampini     ierr = MatAssemblyEnd(pcbddc->ChangeOfBasisMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2501534831adSStefano Zampini     ierr = PetscFree(ipiv);CHKERRQ(ierr);
2502534831adSStefano Zampini     ierr = PetscFree(is_indices);CHKERRQ(ierr);
2503534831adSStefano Zampini   }
25043b03a366Sstefano_zampini   /* free workspace no longer needed */
25053b03a366Sstefano_zampini   ierr = PetscFree(rwork);CHKERRQ(ierr);
25063b03a366Sstefano_zampini   ierr = PetscFree(work);CHKERRQ(ierr);
25073b03a366Sstefano_zampini   ierr = PetscFree(temp_basis);CHKERRQ(ierr);
25083b03a366Sstefano_zampini   ierr = PetscFree(singular_vals);CHKERRQ(ierr);
25093b03a366Sstefano_zampini   ierr = PetscFree(correlation_mat);CHKERRQ(ierr);
25103b03a366Sstefano_zampini   ierr = PetscFree(temp_indices);CHKERRQ(ierr);
2511534831adSStefano Zampini   ierr = PetscFree(change_basis);CHKERRQ(ierr);
25123b03a366Sstefano_zampini   ierr = PetscFree(temp_indices_to_constraint);CHKERRQ(ierr);
2513534831adSStefano Zampini   ierr = PetscFree(temp_indices_to_constraint_B);CHKERRQ(ierr);
2514534831adSStefano Zampini   ierr = PetscFree(local_to_B);CHKERRQ(ierr);
25153b03a366Sstefano_zampini   ierr = PetscFree(temp_quadrature_constraint);CHKERRQ(ierr);
2516*3425bc38SStefano Zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
2517*3425bc38SStefano Zampini   ierr = PetscFree(iwork);CHKERRQ(ierr);
2518*3425bc38SStefano Zampini   ierr = PetscFree(ifail);CHKERRQ(ierr);
2519*3425bc38SStefano Zampini   ierr = PetscFree(singular_vectors);CHKERRQ(ierr);
2520*3425bc38SStefano Zampini #endif
2521da1bb401SStefano Zampini   for(k=0;k<nnsp_size;k++) {
2522da1bb401SStefano Zampini     ierr = VecDestroy(&localnearnullsp[k]);CHKERRQ(ierr);
2523da1bb401SStefano Zampini   }
25243b03a366Sstefano_zampini   ierr = PetscFree(localnearnullsp);CHKERRQ(ierr);
25253b03a366Sstefano_zampini   PetscFunctionReturn(0);
25263b03a366Sstefano_zampini }
25273b03a366Sstefano_zampini /* -------------------------------------------------------------------------- */
25280c7d97c5SJed Brown #undef __FUNCT__
25290c7d97c5SJed Brown #define __FUNCT__ "PCBDDCCoarseSetUp"
253053cdbc3dSStefano Zampini static PetscErrorCode PCBDDCCoarseSetUp(PC pc)
25310c7d97c5SJed Brown {
25320c7d97c5SJed Brown   PetscErrorCode  ierr;
25330c7d97c5SJed Brown 
25340c7d97c5SJed Brown   PC_IS*            pcis = (PC_IS*)(pc->data);
25350c7d97c5SJed Brown   PC_BDDC*          pcbddc = (PC_BDDC*)pc->data;
25360c7d97c5SJed Brown   Mat_IS            *matis = (Mat_IS*)pc->pmat->data;
2537534831adSStefano Zampini   Mat               change_mat_all;
25380c7d97c5SJed Brown   IS                is_R_local;
25390c7d97c5SJed Brown   IS                is_V_local;
25400c7d97c5SJed Brown   IS                is_C_local;
25410c7d97c5SJed Brown   IS                is_aux1;
25420c7d97c5SJed Brown   IS                is_aux2;
25430c7d97c5SJed Brown   const VecType     impVecType;
25440c7d97c5SJed Brown   const MatType     impMatType;
25450c7d97c5SJed Brown   PetscInt          n_R=0;
25460c7d97c5SJed Brown   PetscInt          n_D=0;
25470c7d97c5SJed Brown   PetscInt          n_B=0;
25480c7d97c5SJed Brown   PetscScalar       zero=0.0;
25490c7d97c5SJed Brown   PetscScalar       one=1.0;
25500c7d97c5SJed Brown   PetscScalar       m_one=-1.0;
25510c7d97c5SJed Brown   PetscScalar*      array;
25520c7d97c5SJed Brown   PetscScalar       *coarse_submat_vals;
25530c7d97c5SJed Brown   PetscInt          *idx_R_local;
25540c7d97c5SJed Brown   PetscInt          *idx_V_B;
25550c7d97c5SJed Brown   PetscScalar       *coarsefunctions_errors;
25560c7d97c5SJed Brown   PetscScalar       *constraints_errors;
25570c7d97c5SJed Brown   /* auxiliary indices */
2558534831adSStefano Zampini   PetscInt i,j,k;
2559e269702eSStefano Zampini   /* for verbose output of bddc */
2560e269702eSStefano Zampini   PetscViewer       viewer=pcbddc->dbg_viewer;
2561e269702eSStefano Zampini   PetscBool         dbg_flag=pcbddc->dbg_flag;
2562a0ba757dSStefano Zampini   /* for counting coarse dofs */
2563534831adSStefano Zampini   PetscInt          n_vertices,n_constraints;
25643b03a366Sstefano_zampini   PetscInt          size_of_constraint;
25653b03a366Sstefano_zampini   PetscInt          *row_cmat_indices;
25663b03a366Sstefano_zampini   PetscScalar       *row_cmat_values;
2567534831adSStefano Zampini   PetscInt          *vertices,*nnz,*is_indices,*temp_indices;
25680c7d97c5SJed Brown 
25690c7d97c5SJed Brown   PetscFunctionBegin;
25700c7d97c5SJed Brown   /* Set Non-overlapping dimensions */
25710c7d97c5SJed Brown   n_B = pcis->n_B; n_D = pcis->n - n_B;
2572534831adSStefano Zampini   /* Set types for local objects needed by BDDC preconditioner */
2573534831adSStefano Zampini   impMatType = MATSEQDENSE;
2574534831adSStefano Zampini   impVecType = VECSEQ;
2575da1bb401SStefano Zampini   /* get vertex indices from constraint matrix */
2576534831adSStefano Zampini   ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscInt),&vertices);CHKERRQ(ierr);
2577534831adSStefano Zampini   n_vertices=0;
2578da1bb401SStefano Zampini   for(i=0;i<pcbddc->local_primal_size;i++) {
2579da1bb401SStefano Zampini     ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
2580da1bb401SStefano Zampini     if(size_of_constraint == 1) {
2581534831adSStefano Zampini       vertices[n_vertices]=row_cmat_indices[0];
2582534831adSStefano Zampini       n_vertices++;
2583a0ba757dSStefano Zampini     }
2584da1bb401SStefano Zampini     ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
2585a0ba757dSStefano Zampini   }
2586534831adSStefano Zampini   /* Set number of constraints */
2587534831adSStefano Zampini   n_constraints = pcbddc->local_primal_size-n_vertices;
2588534831adSStefano Zampini 
2589534831adSStefano Zampini   /* vertices in boundary numbering */
2590534831adSStefano Zampini   if(n_vertices) {
2591534831adSStefano Zampini     ierr = VecSet(pcis->vec1_N,m_one);CHKERRQ(ierr);
2592534831adSStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2593534831adSStefano Zampini     for (i=0; i<n_vertices; i++) { array[ vertices[i] ] = i; }
2594534831adSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2595534831adSStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
2596534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
2597534831adSStefano Zampini     ierr = PetscMalloc(n_vertices*sizeof(PetscInt),&idx_V_B);CHKERRQ(ierr);
2598534831adSStefano Zampini     ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
2599534831adSStefano Zampini     for (i=0; i<n_vertices; i++) {
2600534831adSStefano Zampini       j=0;
2601534831adSStefano Zampini       while (array[j] != i ) {j++;}
2602534831adSStefano Zampini       idx_V_B[i]=j;
2603534831adSStefano Zampini     }
2604534831adSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
2605534831adSStefano Zampini   }
2606534831adSStefano Zampini 
2607534831adSStefano Zampini   /* transform local matrices if needed */
2608534831adSStefano Zampini   if(pcbddc->usechangeofbasis) {
2609534831adSStefano Zampini     ierr = PetscMalloc(pcis->n*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
2610534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2611534831adSStefano Zampini     for(i=0;i<n_D;i++) {
2612534831adSStefano Zampini       nnz[is_indices[i]]=1;
2613534831adSStefano Zampini     }
2614534831adSStefano Zampini     ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2615534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2616534831adSStefano Zampini     k=1;
2617534831adSStefano Zampini     for(i=0;i<n_B;i++) {
2618534831adSStefano Zampini       ierr = MatGetRow(pcbddc->ChangeOfBasisMatrix,i,&j,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr);
2619534831adSStefano Zampini       nnz[is_indices[i]]=j;
2620534831adSStefano Zampini       if( k < j) {
2621534831adSStefano Zampini         k = j;
2622534831adSStefano Zampini       }
2623534831adSStefano Zampini       ierr = MatRestoreRow(pcbddc->ChangeOfBasisMatrix,i,&j,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr);
2624534831adSStefano Zampini     }
2625534831adSStefano Zampini     ierr = ISRestoreIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2626534831adSStefano Zampini     /* assemble change of basis matrix on the whole set of local dofs */
2627534831adSStefano Zampini     ierr = PetscMalloc(k*sizeof(PetscInt),&temp_indices);CHKERRQ(ierr);
2628534831adSStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&change_mat_all);CHKERRQ(ierr);
2629534831adSStefano Zampini     ierr = MatSetSizes(change_mat_all,pcis->n,pcis->n,pcis->n,pcis->n);CHKERRQ(ierr);
2630534831adSStefano Zampini     ierr = MatSetType(change_mat_all,MATSEQAIJ);CHKERRQ(ierr);
2631534831adSStefano Zampini     ierr = MatSeqAIJSetPreallocation(change_mat_all,0,nnz);CHKERRQ(ierr);
2632534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2633534831adSStefano Zampini     for(i=0;i<n_D;i++) {
2634534831adSStefano Zampini       ierr = MatSetValue(change_mat_all,is_indices[i],is_indices[i],1.0,INSERT_VALUES);CHKERRQ(ierr);
2635534831adSStefano Zampini     }
2636534831adSStefano Zampini     ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2637534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2638534831adSStefano Zampini     for(i=0;i<n_B;i++) {
2639534831adSStefano Zampini       ierr = MatGetRow(pcbddc->ChangeOfBasisMatrix,i,&j,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
2640534831adSStefano Zampini       for(k=0;k<j;k++) {
2641534831adSStefano Zampini         temp_indices[k]=is_indices[row_cmat_indices[k]];
2642534831adSStefano Zampini       }
2643534831adSStefano Zampini       ierr = MatSetValues(change_mat_all,1,&is_indices[i],j,temp_indices,row_cmat_values,INSERT_VALUES);CHKERRQ(ierr);
2644534831adSStefano Zampini       ierr = MatRestoreRow(pcbddc->ChangeOfBasisMatrix,i,&j,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
2645534831adSStefano Zampini     }
2646534831adSStefano Zampini     ierr = MatAssemblyBegin(change_mat_all,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2647534831adSStefano Zampini     ierr = MatAssemblyEnd(change_mat_all,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2648534831adSStefano Zampini     ierr = MatPtAP(matis->A,change_mat_all,MAT_INITIAL_MATRIX,1.0,&pcbddc->local_mat);CHKERRQ(ierr);
2649534831adSStefano Zampini     ierr = MatDestroy(&pcis->A_IB);CHKERRQ(ierr);
2650534831adSStefano Zampini     ierr = MatDestroy(&pcis->A_BI);CHKERRQ(ierr);
2651534831adSStefano Zampini     ierr = MatDestroy(&pcis->A_BB);CHKERRQ(ierr);
2652534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_I_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&pcis->A_IB);CHKERRQ(ierr);
2653534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_B_local,pcis->is_I_local,MAT_INITIAL_MATRIX,&pcis->A_BI);CHKERRQ(ierr);
2654534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_B_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&pcis->A_BB);CHKERRQ(ierr);
2655534831adSStefano Zampini     ierr = MatDestroy(&change_mat_all);CHKERRQ(ierr);
2656534831adSStefano Zampini     ierr = PetscFree(nnz);CHKERRQ(ierr);
2657534831adSStefano Zampini     ierr = PetscFree(temp_indices);CHKERRQ(ierr);
2658534831adSStefano Zampini   } else {
2659534831adSStefano Zampini     /* without change of basis, the local matrix is unchanged */
2660534831adSStefano Zampini     ierr = PetscObjectReference((PetscObject)matis->A);CHKERRQ(ierr);
2661534831adSStefano Zampini     pcbddc->local_mat = matis->A;
2662534831adSStefano Zampini   }
2663a0ba757dSStefano Zampini 
26640c7d97c5SJed Brown   /* Dohrmann's notation: dofs split into R (Remaining: all dofs but the vertices) and V (Vertices) */
26650c7d97c5SJed Brown   ierr = VecSet(pcis->vec1_N,one);CHKERRQ(ierr);
26660c7d97c5SJed Brown   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
26673b03a366Sstefano_zampini   for (i=0;i<n_vertices;i++) { array[ vertices[i] ] = zero; }
26683b03a366Sstefano_zampini   ierr = PetscMalloc(( pcis->n - n_vertices )*sizeof(PetscInt),&idx_R_local);CHKERRQ(ierr);
26690c7d97c5SJed Brown   for (i=0, n_R=0; i<pcis->n; i++) { if (array[i] == one) { idx_R_local[n_R] = i; n_R++; } }
26700c7d97c5SJed Brown   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2671e269702eSStefano Zampini   if(dbg_flag) {
26720c7d97c5SJed Brown     ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
26730c7d97c5SJed Brown     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
26740c7d97c5SJed Brown     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d local dimensions\n",PetscGlobalRank);CHKERRQ(ierr);
26750c7d97c5SJed Brown     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local_size = %d, dirichlet_size = %d, boundary_size = %d\n",pcis->n,n_D,n_B);CHKERRQ(ierr);
26763b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"r_size = %d, v_size = %d, constraints = %d, local_primal_size = %d\n",n_R,n_vertices,n_constraints,pcbddc->local_primal_size);CHKERRQ(ierr);
2677534831adSStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"pcbddc->n_vertices = %d, pcbddc->n_constraints = %d\n",pcbddc->n_vertices,pcbddc->n_constraints);CHKERRQ(ierr);
26780c7d97c5SJed Brown     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
26790c7d97c5SJed Brown   }
2680534831adSStefano Zampini 
26810c7d97c5SJed Brown   /* Allocate needed vectors */
2682534831adSStefano Zampini   ierr = VecDuplicate(pcis->vec1_global,&pcbddc->original_rhs);CHKERRQ(ierr);
26833972b0daSStefano Zampini   ierr = VecDuplicate(pcis->vec1_global,&pcbddc->temp_solution);CHKERRQ(ierr);
26840c7d97c5SJed Brown   ierr = VecDuplicate(pcis->vec1_D,&pcbddc->vec4_D);CHKERRQ(ierr);
26850c7d97c5SJed Brown   ierr = VecCreate(PETSC_COMM_SELF,&pcbddc->vec1_R);CHKERRQ(ierr);
26860c7d97c5SJed Brown   ierr = VecSetSizes(pcbddc->vec1_R,n_R,n_R);CHKERRQ(ierr);
26870c7d97c5SJed Brown   ierr = VecSetType(pcbddc->vec1_R,impVecType);CHKERRQ(ierr);
2688d49ef151SStefano Zampini   ierr = VecDuplicate(pcbddc->vec1_R,&pcbddc->vec2_R);CHKERRQ(ierr);
26890c7d97c5SJed Brown   ierr = VecCreate(PETSC_COMM_SELF,&pcbddc->vec1_P);CHKERRQ(ierr);
26900c7d97c5SJed Brown   ierr = VecSetSizes(pcbddc->vec1_P,pcbddc->local_primal_size,pcbddc->local_primal_size);CHKERRQ(ierr);
26910c7d97c5SJed Brown   ierr = VecSetType(pcbddc->vec1_P,impVecType);CHKERRQ(ierr);
26920c7d97c5SJed Brown 
26930c7d97c5SJed Brown   /* Creating some index sets needed  */
26940c7d97c5SJed Brown   /* For submatrices */
2695da1bb401SStefano Zampini   ierr = ISCreateGeneral(PETSC_COMM_SELF,n_R,idx_R_local,PETSC_OWN_POINTER,&is_R_local);CHKERRQ(ierr);
26963b03a366Sstefano_zampini   if(n_vertices)    {
2697da1bb401SStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,n_vertices,vertices,PETSC_OWN_POINTER,&is_V_local);CHKERRQ(ierr);
26983b03a366Sstefano_zampini   }
2699da1bb401SStefano Zampini   if(n_constraints) {
2700da1bb401SStefano Zampini     ierr = ISCreateStride(PETSC_COMM_SELF,n_constraints,n_vertices,1,&is_C_local);CHKERRQ(ierr);
2701da1bb401SStefano Zampini   }
2702da1bb401SStefano Zampini 
27030c7d97c5SJed Brown   /* For VecScatters pcbddc->R_to_B and (optionally) pcbddc->R_to_D */
27040c7d97c5SJed Brown   {
27050c7d97c5SJed Brown     PetscInt   *aux_array1;
27060c7d97c5SJed Brown     PetscInt   *aux_array2;
27070c7d97c5SJed Brown 
27083b03a366Sstefano_zampini     ierr = PetscMalloc( (pcis->n_B-n_vertices)*sizeof(PetscInt),&aux_array1);CHKERRQ(ierr);
27093b03a366Sstefano_zampini     ierr = PetscMalloc( (pcis->n_B-n_vertices)*sizeof(PetscInt),&aux_array2);CHKERRQ(ierr);
27100c7d97c5SJed Brown 
2711d49ef151SStefano Zampini     ierr = VecSet(pcis->vec1_global,zero);CHKERRQ(ierr);
27120c7d97c5SJed Brown     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
27130c7d97c5SJed Brown     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
27140c7d97c5SJed Brown     ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
27150c7d97c5SJed Brown     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
27160c7d97c5SJed Brown     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
27170c7d97c5SJed Brown     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
27180c7d97c5SJed Brown     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2719da1bb401SStefano Zampini     for (i=0, j=0; i<n_R; i++) { if (array[idx_R_local[i]] > one) { aux_array1[j] = i; j++; } }
27200c7d97c5SJed Brown     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2721da1bb401SStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_COPY_VALUES,&is_aux1);CHKERRQ(ierr);
27220c7d97c5SJed Brown     ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
2723da1bb401SStefano Zampini     for (i=0, j=0; i<n_B; i++) { if (array[i] > one) { aux_array2[j] = i; j++; } }
27243828260eSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
2725da1bb401SStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array2,PETSC_COPY_VALUES,&is_aux2);CHKERRQ(ierr);
27260c7d97c5SJed Brown     ierr = VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_B,is_aux2,&pcbddc->R_to_B);CHKERRQ(ierr);
27270c7d97c5SJed Brown     ierr = PetscFree(aux_array1);CHKERRQ(ierr);
27280c7d97c5SJed Brown     ierr = PetscFree(aux_array2);CHKERRQ(ierr);
27290c7d97c5SJed Brown     ierr = ISDestroy(&is_aux1);CHKERRQ(ierr);
27300c7d97c5SJed Brown     ierr = ISDestroy(&is_aux2);CHKERRQ(ierr);
27310c7d97c5SJed Brown 
2732e269702eSStefano Zampini     if(pcbddc->prec_type || dbg_flag ) {
27330c7d97c5SJed Brown       ierr = PetscMalloc(n_D*sizeof(PetscInt),&aux_array1);CHKERRQ(ierr);
27340c7d97c5SJed Brown       ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2735da1bb401SStefano Zampini       for (i=0, j=0; i<n_R; i++) { if (array[idx_R_local[i]] == one) { aux_array1[j] = i; j++; } }
27360c7d97c5SJed Brown       ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2737da1bb401SStefano Zampini       ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_COPY_VALUES,&is_aux1);CHKERRQ(ierr);
27380c7d97c5SJed Brown       ierr = VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_D,(IS)0,&pcbddc->R_to_D);CHKERRQ(ierr);
27390c7d97c5SJed Brown       ierr = PetscFree(aux_array1);CHKERRQ(ierr);
27400c7d97c5SJed Brown       ierr = ISDestroy(&is_aux1);CHKERRQ(ierr);
27410c7d97c5SJed Brown     }
27420c7d97c5SJed Brown   }
27430c7d97c5SJed Brown 
27440c7d97c5SJed Brown   /* Creating PC contexts for local Dirichlet and Neumann problems */
27450c7d97c5SJed Brown   {
27460c7d97c5SJed Brown     Mat  A_RR;
274753cdbc3dSStefano Zampini     PC   pc_temp;
27480c7d97c5SJed Brown     /* Matrix for Dirichlet problem is A_II -> we already have it from pcis.c code */
274953cdbc3dSStefano Zampini     ierr = KSPCreate(PETSC_COMM_SELF,&pcbddc->ksp_D);CHKERRQ(ierr);
275053cdbc3dSStefano Zampini     ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->ksp_D,(PetscObject)pc,1);CHKERRQ(ierr);
275153cdbc3dSStefano Zampini     ierr = KSPSetOperators(pcbddc->ksp_D,pcis->A_II,pcis->A_II,SAME_PRECONDITIONER);CHKERRQ(ierr);
275253cdbc3dSStefano Zampini     ierr = KSPSetType(pcbddc->ksp_D,KSPPREONLY);CHKERRQ(ierr);
2753da1bb401SStefano Zampini     ierr = KSPSetOptionsPrefix(pcbddc->ksp_D,"dirichlet_");CHKERRQ(ierr);
27540c7d97c5SJed Brown     /* default */
275553cdbc3dSStefano Zampini     ierr = KSPGetPC(pcbddc->ksp_D,&pc_temp);CHKERRQ(ierr);
275653cdbc3dSStefano Zampini     ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr);
27570c7d97c5SJed Brown     /* Allow user's customization */
275853cdbc3dSStefano Zampini     ierr = KSPSetFromOptions(pcbddc->ksp_D);CHKERRQ(ierr);
275953cdbc3dSStefano Zampini     /* Set Up KSP for Dirichlet problem of BDDC */
276053cdbc3dSStefano Zampini     ierr = KSPSetUp(pcbddc->ksp_D);CHKERRQ(ierr);
27613972b0daSStefano Zampini     /* set ksp_D into pcis data */
27623972b0daSStefano Zampini     ierr = KSPDestroy(&pcis->ksp_D);CHKERRQ(ierr);
27633972b0daSStefano Zampini     ierr = PetscObjectReference((PetscObject)pcbddc->ksp_D);CHKERRQ(ierr);
27643972b0daSStefano Zampini     pcis->ksp_D = pcbddc->ksp_D;
2765da1bb401SStefano Zampini     if(pcbddc->dbg_flag) ierr = KSPView(pcbddc->ksp_D,PETSC_VIEWER_STDOUT_SELF);
27660c7d97c5SJed Brown     /* Matrix for Neumann problem is A_RR -> we need to create it */
2767534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,is_R_local,is_R_local,MAT_INITIAL_MATRIX,&A_RR);CHKERRQ(ierr);
276853cdbc3dSStefano Zampini     ierr = KSPCreate(PETSC_COMM_SELF,&pcbddc->ksp_R);CHKERRQ(ierr);
276953cdbc3dSStefano Zampini     ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->ksp_R,(PetscObject)pc,1);CHKERRQ(ierr);
277053cdbc3dSStefano Zampini     ierr = KSPSetOperators(pcbddc->ksp_R,A_RR,A_RR,SAME_PRECONDITIONER);CHKERRQ(ierr);
277153cdbc3dSStefano Zampini     ierr = KSPSetType(pcbddc->ksp_R,KSPPREONLY);CHKERRQ(ierr);
2772da1bb401SStefano Zampini     ierr = KSPSetOptionsPrefix(pcbddc->ksp_R,"neumann_");CHKERRQ(ierr);
27730c7d97c5SJed Brown     /* default */
277453cdbc3dSStefano Zampini     ierr = KSPGetPC(pcbddc->ksp_R,&pc_temp);CHKERRQ(ierr);
277553cdbc3dSStefano Zampini     ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr);
27760c7d97c5SJed Brown     /* Allow user's customization */
277753cdbc3dSStefano Zampini     ierr = KSPSetFromOptions(pcbddc->ksp_R);CHKERRQ(ierr);
277853cdbc3dSStefano Zampini     /* Set Up KSP for Neumann problem of BDDC */
277953cdbc3dSStefano Zampini     ierr = KSPSetUp(pcbddc->ksp_R);CHKERRQ(ierr);
2780da1bb401SStefano Zampini     if(pcbddc->dbg_flag) ierr = KSPView(pcbddc->ksp_R,PETSC_VIEWER_STDOUT_SELF);
2781a0ba757dSStefano Zampini     /* check Dirichlet and Neumann solvers */
2782ba1573a8SStefano Zampini     if(dbg_flag) {
27830c7d97c5SJed Brown       Vec temp_vec;
27840c7d97c5SJed Brown       PetscScalar value;
27850c7d97c5SJed Brown 
2786a0ba757dSStefano Zampini       ierr = VecDuplicate(pcis->vec1_D,&temp_vec);CHKERRQ(ierr);
2787a0ba757dSStefano Zampini       ierr = VecSetRandom(pcis->vec1_D,PETSC_NULL);CHKERRQ(ierr);
2788a0ba757dSStefano Zampini       ierr = MatMult(pcis->A_II,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
2789a0ba757dSStefano Zampini       ierr = KSPSolve(pcbddc->ksp_D,pcis->vec2_D,temp_vec);CHKERRQ(ierr);
2790a0ba757dSStefano Zampini       ierr = VecAXPY(temp_vec,m_one,pcis->vec1_D);CHKERRQ(ierr);
2791a0ba757dSStefano Zampini       ierr = VecNorm(temp_vec,NORM_INFINITY,&value);CHKERRQ(ierr);
2792a0ba757dSStefano Zampini       ierr = VecDestroy(&temp_vec);CHKERRQ(ierr);
2793a0ba757dSStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
2794a0ba757dSStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
2795a0ba757dSStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Checking solution of Dirichlet and Neumann problems\n");CHKERRQ(ierr);
2796a0ba757dSStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d infinity error for Dirichlet solve = % 1.14e \n",PetscGlobalRank,value);CHKERRQ(ierr);
2797d49ef151SStefano Zampini       ierr = VecDuplicate(pcbddc->vec1_R,&temp_vec);CHKERRQ(ierr);
2798d49ef151SStefano Zampini       ierr = VecSetRandom(pcbddc->vec1_R,PETSC_NULL);CHKERRQ(ierr);
2799d49ef151SStefano Zampini       ierr = MatMult(A_RR,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
2800d49ef151SStefano Zampini       ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec2_R,temp_vec);CHKERRQ(ierr);
2801d49ef151SStefano Zampini       ierr = VecAXPY(temp_vec,m_one,pcbddc->vec1_R);CHKERRQ(ierr);
2802d49ef151SStefano Zampini       ierr = VecNorm(temp_vec,NORM_INFINITY,&value);CHKERRQ(ierr);
2803e269702eSStefano Zampini       ierr = VecDestroy(&temp_vec);CHKERRQ(ierr);
28040c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d infinity error for  Neumann  solve = % 1.14e \n",PetscGlobalRank,value);CHKERRQ(ierr);
2805d49ef151SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
28060c7d97c5SJed Brown     }
28070c7d97c5SJed Brown     /* free Neumann problem's matrix */
28080c7d97c5SJed Brown     ierr = MatDestroy(&A_RR);CHKERRQ(ierr);
28090c7d97c5SJed Brown   }
28100c7d97c5SJed Brown 
28110c7d97c5SJed Brown   /* Assemble all remaining stuff needed to apply BDDC  */
28120c7d97c5SJed Brown   {
28130c7d97c5SJed Brown     Mat          A_RV,A_VR,A_VV;
28140c7d97c5SJed Brown     Mat          M1,M2;
28150c7d97c5SJed Brown     Mat          C_CR;
28163b03a366Sstefano_zampini     Mat          AUXMAT;
28170c7d97c5SJed Brown     Vec          vec1_C;
28180c7d97c5SJed Brown     Vec          vec2_C;
28190c7d97c5SJed Brown     Vec          vec1_V;
28200c7d97c5SJed Brown     Vec          vec2_V;
28210c7d97c5SJed Brown     PetscInt     *nnz;
28220c7d97c5SJed Brown     PetscInt     *auxindices;
282353cdbc3dSStefano Zampini     PetscInt     index;
28240c7d97c5SJed Brown     PetscScalar* array2;
28250c7d97c5SJed Brown     MatFactorInfo matinfo;
28260c7d97c5SJed Brown 
28270c7d97c5SJed Brown     /* Allocating some extra storage just to be safe */
28280c7d97c5SJed Brown     ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
28290c7d97c5SJed Brown     ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&auxindices);CHKERRQ(ierr);
28300c7d97c5SJed Brown     for(i=0;i<pcis->n;i++) {auxindices[i]=i;}
28310c7d97c5SJed Brown 
28320c7d97c5SJed Brown     /* some work vectors on vertices and/or constraints */
28333b03a366Sstefano_zampini     if(n_vertices) {
28340c7d97c5SJed Brown       ierr = VecCreate(PETSC_COMM_SELF,&vec1_V);CHKERRQ(ierr);
28353b03a366Sstefano_zampini       ierr = VecSetSizes(vec1_V,n_vertices,n_vertices);CHKERRQ(ierr);
28360c7d97c5SJed Brown       ierr = VecSetType(vec1_V,impVecType);CHKERRQ(ierr);
28370c7d97c5SJed Brown       ierr = VecDuplicate(vec1_V,&vec2_V);CHKERRQ(ierr);
28380c7d97c5SJed Brown     }
2839534831adSStefano Zampini     if(n_constraints) {
28400c7d97c5SJed Brown       ierr = VecCreate(PETSC_COMM_SELF,&vec1_C);CHKERRQ(ierr);
2841534831adSStefano Zampini       ierr = VecSetSizes(vec1_C,n_constraints,n_constraints);CHKERRQ(ierr);
28420c7d97c5SJed Brown       ierr = VecSetType(vec1_C,impVecType);CHKERRQ(ierr);
28430c7d97c5SJed Brown       ierr = VecDuplicate(vec1_C,&vec2_C);CHKERRQ(ierr);
28440c7d97c5SJed Brown       ierr = VecDuplicate(vec1_C,&pcbddc->vec1_C);CHKERRQ(ierr);
28450c7d97c5SJed Brown     }
28460c7d97c5SJed Brown     /* Precompute data needed for preprocessing and application of BDDC */
28473b03a366Sstefano_zampini     if(n_constraints) {
28480c7d97c5SJed Brown       ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->local_auxmat2);CHKERRQ(ierr);
28493b03a366Sstefano_zampini       ierr = MatSetSizes(pcbddc->local_auxmat2,n_R,n_constraints,n_R,n_constraints);CHKERRQ(ierr);
28500c7d97c5SJed Brown       ierr = MatSetType(pcbddc->local_auxmat2,impMatType);CHKERRQ(ierr);
28513b03a366Sstefano_zampini       ierr = MatSeqDenseSetPreallocation(pcbddc->local_auxmat2,PETSC_NULL);CHKERRQ(ierr);
28520c7d97c5SJed Brown 
285357a90decSStefano Zampini       /* Create Constraint matrix on R nodes: C_{CR}  */
285457a90decSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->ConstraintMatrix,is_C_local,is_R_local,MAT_INITIAL_MATRIX,&C_CR);CHKERRQ(ierr);
285557a90decSStefano Zampini       ierr = ISDestroy(&is_C_local);CHKERRQ(ierr);
285657a90decSStefano Zampini 
28570c7d97c5SJed Brown       /* Assemble local_auxmat2 = - A_{RR}^{-1} C^T_{CR} needed by BDDC application */
28583b03a366Sstefano_zampini       for(i=0;i<n_constraints;i++) {
28593b03a366Sstefano_zampini         ierr = VecSet(pcbddc->vec1_R,zero);CHKERRQ(ierr);
28603b03a366Sstefano_zampini         /* Get row of constraint matrix in R numbering */
286157a90decSStefano Zampini         ierr = VecGetArray(pcbddc->vec1_R,&array);CHKERRQ(ierr);
286257a90decSStefano Zampini         ierr = MatGetRow(C_CR,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
28633b03a366Sstefano_zampini         for(j=0;j<size_of_constraint;j++) { array[ row_cmat_indices[j] ] = - row_cmat_values[j]; }
286457a90decSStefano Zampini         ierr = MatRestoreRow(C_CR,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
286557a90decSStefano Zampini         ierr = VecRestoreArray(pcbddc->vec1_R,&array);CHKERRQ(ierr);
28663b03a366Sstefano_zampini         /* Solve for row of constraint matrix in R numbering */
286753cdbc3dSStefano Zampini         ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
28683b03a366Sstefano_zampini         /* Set values */
28690c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec2_R,&array);CHKERRQ(ierr);
28703b03a366Sstefano_zampini         ierr = MatSetValues(pcbddc->local_auxmat2,n_R,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
28710c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec2_R,&array);CHKERRQ(ierr);
28720c7d97c5SJed Brown       }
28730c7d97c5SJed Brown       ierr = MatAssemblyBegin(pcbddc->local_auxmat2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
28740c7d97c5SJed Brown       ierr = MatAssemblyEnd(pcbddc->local_auxmat2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
28750c7d97c5SJed Brown 
28760c7d97c5SJed Brown       /* Assemble AUXMAT = ( LUFactor )( -C_{CR} A_{RR}^{-1} C^T_{CR} )^{-1} */
28770c7d97c5SJed Brown       ierr = MatMatMult(C_CR,pcbddc->local_auxmat2,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&AUXMAT);CHKERRQ(ierr);
2878d49ef151SStefano Zampini       ierr = MatFactorInfoInitialize(&matinfo);CHKERRQ(ierr);
28793b03a366Sstefano_zampini       ierr = ISCreateStride(PETSC_COMM_SELF,n_constraints,0,1,&is_aux1);CHKERRQ(ierr);
28800c7d97c5SJed Brown       ierr = MatLUFactor(AUXMAT,is_aux1,is_aux1,&matinfo);CHKERRQ(ierr);
28810c7d97c5SJed Brown       ierr = ISDestroy(&is_aux1);CHKERRQ(ierr);
28820c7d97c5SJed Brown 
28833b03a366Sstefano_zampini       /* Assemble explicitly M1 = ( C_{CR} A_{RR}^{-1} C^T_{CR} )^{-1} needed in preproc  */
2884d49ef151SStefano Zampini       ierr = MatCreate(PETSC_COMM_SELF,&M1);CHKERRQ(ierr);
28853b03a366Sstefano_zampini       ierr = MatSetSizes(M1,n_constraints,n_constraints,n_constraints,n_constraints);CHKERRQ(ierr);
28860c7d97c5SJed Brown       ierr = MatSetType(M1,impMatType);CHKERRQ(ierr);
28873b03a366Sstefano_zampini       ierr = MatSeqDenseSetPreallocation(M1,PETSC_NULL);CHKERRQ(ierr);
28883b03a366Sstefano_zampini       for(i=0;i<n_constraints;i++) {
28890c7d97c5SJed Brown         ierr = VecSet(vec1_C,zero);CHKERRQ(ierr);
28900c7d97c5SJed Brown         ierr = VecSetValue(vec1_C,i,one,INSERT_VALUES);CHKERRQ(ierr);
28910c7d97c5SJed Brown         ierr = VecAssemblyBegin(vec1_C);CHKERRQ(ierr);
28920c7d97c5SJed Brown         ierr = VecAssemblyEnd(vec1_C);CHKERRQ(ierr);
28930c7d97c5SJed Brown         ierr = MatSolve(AUXMAT,vec1_C,vec2_C);CHKERRQ(ierr);
28940c7d97c5SJed Brown         ierr = VecScale(vec2_C,m_one);CHKERRQ(ierr);
28950c7d97c5SJed Brown         ierr = VecGetArray(vec2_C,&array);CHKERRQ(ierr);
28963b03a366Sstefano_zampini         ierr = MatSetValues(M1,n_constraints,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
28970c7d97c5SJed Brown         ierr = VecRestoreArray(vec2_C,&array);CHKERRQ(ierr);
28980c7d97c5SJed Brown       }
28990c7d97c5SJed Brown       ierr = MatAssemblyBegin(M1,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
29000c7d97c5SJed Brown       ierr = MatAssemblyEnd(M1,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
29010c7d97c5SJed Brown       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
29020c7d97c5SJed Brown       /* Assemble local_auxmat1 = M1*C_{CR} needed by BDDC application in KSP and in preproc */
29030c7d97c5SJed Brown       ierr = MatMatMult(M1,C_CR,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&pcbddc->local_auxmat1);CHKERRQ(ierr);
29040c7d97c5SJed Brown 
29050c7d97c5SJed Brown     }
29060c7d97c5SJed Brown 
29070c7d97c5SJed Brown     /* Get submatrices from subdomain matrix */
29083b03a366Sstefano_zampini     if(n_vertices){
2909534831adSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->local_mat,is_R_local,is_V_local,MAT_INITIAL_MATRIX,&A_RV);CHKERRQ(ierr);
2910534831adSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->local_mat,is_V_local,is_R_local,MAT_INITIAL_MATRIX,&A_VR);CHKERRQ(ierr);
2911534831adSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->local_mat,is_V_local,is_V_local,MAT_INITIAL_MATRIX,&A_VV);CHKERRQ(ierr);
29120c7d97c5SJed Brown       /* Assemble M2 = A_RR^{-1}A_RV */
2913d49ef151SStefano Zampini       ierr = MatCreate(PETSC_COMM_SELF,&M2);CHKERRQ(ierr);
29143b03a366Sstefano_zampini       ierr = MatSetSizes(M2,n_R,n_vertices,n_R,n_vertices);CHKERRQ(ierr);
29150c7d97c5SJed Brown       ierr = MatSetType(M2,impMatType);CHKERRQ(ierr);
29163b03a366Sstefano_zampini       ierr = MatSeqDenseSetPreallocation(M2,PETSC_NULL);CHKERRQ(ierr);
29173b03a366Sstefano_zampini       for(i=0;i<n_vertices;i++) {
29180c7d97c5SJed Brown         ierr = VecSet(vec1_V,zero);CHKERRQ(ierr);
29190c7d97c5SJed Brown         ierr = VecSetValue(vec1_V,i,one,INSERT_VALUES);CHKERRQ(ierr);
29200c7d97c5SJed Brown         ierr = VecAssemblyBegin(vec1_V);CHKERRQ(ierr);
29210c7d97c5SJed Brown         ierr = VecAssemblyEnd(vec1_V);CHKERRQ(ierr);
29220c7d97c5SJed Brown         ierr = MatMult(A_RV,vec1_V,pcbddc->vec1_R);CHKERRQ(ierr);
292353cdbc3dSStefano Zampini         ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
29240c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec2_R,&array);CHKERRQ(ierr);
29253b03a366Sstefano_zampini         ierr = MatSetValues(M2,n_R,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
29260c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec2_R,&array);CHKERRQ(ierr);
29270c7d97c5SJed Brown       }
29280c7d97c5SJed Brown       ierr = MatAssemblyBegin(M2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
29290c7d97c5SJed Brown       ierr = MatAssemblyEnd(M2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
29300c7d97c5SJed Brown     }
29310c7d97c5SJed Brown 
29320c7d97c5SJed Brown     /* Matrix of coarse basis functions (local) */
2933d49ef151SStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->coarse_phi_B);CHKERRQ(ierr);
29340c7d97c5SJed Brown     ierr = MatSetSizes(pcbddc->coarse_phi_B,n_B,pcbddc->local_primal_size,n_B,pcbddc->local_primal_size);CHKERRQ(ierr);
29350c7d97c5SJed Brown     ierr = MatSetType(pcbddc->coarse_phi_B,impMatType);CHKERRQ(ierr);
29363b03a366Sstefano_zampini     ierr = MatSeqDenseSetPreallocation(pcbddc->coarse_phi_B,PETSC_NULL);CHKERRQ(ierr);
2937e269702eSStefano Zampini     if(pcbddc->prec_type || dbg_flag ) {
2938d49ef151SStefano Zampini       ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->coarse_phi_D);CHKERRQ(ierr);
29390c7d97c5SJed Brown       ierr = MatSetSizes(pcbddc->coarse_phi_D,n_D,pcbddc->local_primal_size,n_D,pcbddc->local_primal_size);CHKERRQ(ierr);
29400c7d97c5SJed Brown       ierr = MatSetType(pcbddc->coarse_phi_D,impMatType);CHKERRQ(ierr);
29413b03a366Sstefano_zampini       ierr = MatSeqDenseSetPreallocation(pcbddc->coarse_phi_D,PETSC_NULL);CHKERRQ(ierr);
29420c7d97c5SJed Brown     }
29430c7d97c5SJed Brown 
2944e269702eSStefano Zampini     if(dbg_flag) {
29450c7d97c5SJed Brown       ierr = PetscMalloc( pcbddc->local_primal_size*sizeof(PetscScalar),&coarsefunctions_errors);CHKERRQ(ierr);
29460c7d97c5SJed Brown       ierr = PetscMalloc( pcbddc->local_primal_size*sizeof(PetscScalar),&constraints_errors);CHKERRQ(ierr);
29470c7d97c5SJed Brown     }
29483b03a366Sstefano_zampini     /* Subdomain contribution (Non-overlapping) to coarse matrix  */
29490c7d97c5SJed Brown     ierr = PetscMalloc ((pcbddc->local_primal_size)*(pcbddc->local_primal_size)*sizeof(PetscScalar),&coarse_submat_vals);CHKERRQ(ierr);
29500c7d97c5SJed Brown 
29510c7d97c5SJed Brown     /* We are now ready to evaluate coarse basis functions and subdomain contribution to coarse problem */
29523b03a366Sstefano_zampini     for(i=0;i<n_vertices;i++){
29530c7d97c5SJed Brown       ierr = VecSet(vec1_V,zero);CHKERRQ(ierr);
29540c7d97c5SJed Brown       ierr = VecSetValue(vec1_V,i,one,INSERT_VALUES);CHKERRQ(ierr);
29550c7d97c5SJed Brown       ierr = VecAssemblyBegin(vec1_V);CHKERRQ(ierr);
29560c7d97c5SJed Brown       ierr = VecAssemblyEnd(vec1_V);CHKERRQ(ierr);
29570c7d97c5SJed Brown       /* solution of saddle point problem */
29580c7d97c5SJed Brown       ierr = MatMult(M2,vec1_V,pcbddc->vec1_R);CHKERRQ(ierr);
29590c7d97c5SJed Brown       ierr = VecScale(pcbddc->vec1_R,m_one);CHKERRQ(ierr);
29603b03a366Sstefano_zampini       if(n_constraints) {
29610c7d97c5SJed Brown         ierr = MatMult(pcbddc->local_auxmat1,pcbddc->vec1_R,vec1_C);CHKERRQ(ierr);
29620c7d97c5SJed Brown         ierr = MatMultAdd(pcbddc->local_auxmat2,vec1_C,pcbddc->vec1_R,pcbddc->vec1_R);CHKERRQ(ierr);
29630c7d97c5SJed Brown         ierr = VecScale(vec1_C,m_one);CHKERRQ(ierr);
29640c7d97c5SJed Brown       }
29650c7d97c5SJed Brown       ierr = MatMult(A_VR,pcbddc->vec1_R,vec2_V);CHKERRQ(ierr);
29660c7d97c5SJed Brown       ierr = MatMultAdd(A_VV,vec1_V,vec2_V,vec2_V);CHKERRQ(ierr);
29670c7d97c5SJed Brown 
29680c7d97c5SJed Brown       /* Set values in coarse basis function and subdomain part of coarse_mat */
29690c7d97c5SJed Brown       /* coarse basis functions */
29700c7d97c5SJed Brown       ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr);
29710c7d97c5SJed Brown       ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
29720c7d97c5SJed Brown       ierr = VecScatterEnd  (pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
29730c7d97c5SJed Brown       ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
29743b03a366Sstefano_zampini       ierr = MatSetValues(pcbddc->coarse_phi_B,n_B,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
29750c7d97c5SJed Brown       ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
29760c7d97c5SJed Brown       ierr = MatSetValue(pcbddc->coarse_phi_B,idx_V_B[i],i,one,INSERT_VALUES);CHKERRQ(ierr);
2977e269702eSStefano Zampini       if( pcbddc->prec_type || dbg_flag  ) {
29780c7d97c5SJed Brown         ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
29790c7d97c5SJed Brown         ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
29800c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_D,&array);CHKERRQ(ierr);
29813b03a366Sstefano_zampini         ierr = MatSetValues(pcbddc->coarse_phi_D,n_D,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
29820c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_D,&array);CHKERRQ(ierr);
29830c7d97c5SJed Brown       }
29840c7d97c5SJed Brown       /* subdomain contribution to coarse matrix */
29850c7d97c5SJed Brown       ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
2986da1bb401SStefano Zampini       for(j=0;j<n_vertices;j++) { coarse_submat_vals[i*pcbddc->local_primal_size+j] = array[j]; } /* WARNING -> column major ordering */
29870c7d97c5SJed Brown       ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
29883b03a366Sstefano_zampini       if(n_constraints) {
29890c7d97c5SJed Brown         ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
2990da1bb401SStefano Zampini         for(j=0;j<n_constraints;j++) { coarse_submat_vals[i*pcbddc->local_primal_size+j+n_vertices] = array[j]; } /* WARNING -> column major ordering */
29910c7d97c5SJed Brown         ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
29920c7d97c5SJed Brown       }
29930c7d97c5SJed Brown 
2994e269702eSStefano Zampini       if( dbg_flag ) {
29950c7d97c5SJed Brown         /* assemble subdomain vector on nodes */
2996d49ef151SStefano Zampini         ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr);
29970c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
29980c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
29990c7d97c5SJed Brown         for(j=0;j<n_R;j++) { array[idx_R_local[j]] = array2[j]; }
30003b03a366Sstefano_zampini         array[ vertices[i] ] = one;
30010c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
30020c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
30030c7d97c5SJed Brown         /* assemble subdomain vector of lagrange multipliers (i.e. primal nodes) */
3004d49ef151SStefano Zampini         ierr = VecSet(pcbddc->vec1_P,zero);CHKERRQ(ierr);
30050c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
30060c7d97c5SJed Brown         ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
30073b03a366Sstefano_zampini         for(j=0;j<n_vertices;j++) { array2[j]=array[j]; }
30080c7d97c5SJed Brown         ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
30093b03a366Sstefano_zampini         if(n_constraints) {
30100c7d97c5SJed Brown           ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
30113b03a366Sstefano_zampini           for(j=0;j<n_constraints;j++) { array2[j+n_vertices]=array[j]; }
30120c7d97c5SJed Brown           ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
30130c7d97c5SJed Brown         }
30140c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
30150c7d97c5SJed Brown         ierr = VecScale(pcbddc->vec1_P,m_one);CHKERRQ(ierr);
30160c7d97c5SJed Brown         /* check saddle point solution */
3017534831adSStefano Zampini         ierr = MatMult(pcbddc->local_mat,pcis->vec1_N,pcis->vec2_N);CHKERRQ(ierr);
30183b03a366Sstefano_zampini         ierr = MatMultTransposeAdd(pcbddc->ConstraintMatrix,pcbddc->vec1_P,pcis->vec2_N,pcis->vec2_N);CHKERRQ(ierr);
30193b03a366Sstefano_zampini         ierr = VecNorm(pcis->vec2_N,NORM_INFINITY,&coarsefunctions_errors[i]);CHKERRQ(ierr);
30203b03a366Sstefano_zampini         ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr);
30210c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
30223b03a366Sstefano_zampini         array[i]=array[i]+m_one;  /* shift by the identity matrix */
30230c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
30243b03a366Sstefano_zampini         ierr = VecNorm(pcbddc->vec1_P,NORM_INFINITY,&constraints_errors[i]);CHKERRQ(ierr);
30250c7d97c5SJed Brown       }
30260c7d97c5SJed Brown     }
30270c7d97c5SJed Brown 
30283b03a366Sstefano_zampini     for(i=0;i<n_constraints;i++){
3029d49ef151SStefano Zampini       ierr = VecSet(vec2_C,zero);CHKERRQ(ierr);
30300c7d97c5SJed Brown       ierr = VecSetValue(vec2_C,i,m_one,INSERT_VALUES);CHKERRQ(ierr);
30310c7d97c5SJed Brown       ierr = VecAssemblyBegin(vec2_C);CHKERRQ(ierr);
30320c7d97c5SJed Brown       ierr = VecAssemblyEnd(vec2_C);CHKERRQ(ierr);
30330c7d97c5SJed Brown       /* solution of saddle point problem */
30340c7d97c5SJed Brown       ierr = MatMult(M1,vec2_C,vec1_C);CHKERRQ(ierr);
30350c7d97c5SJed Brown       ierr = MatMult(pcbddc->local_auxmat2,vec1_C,pcbddc->vec1_R);CHKERRQ(ierr);
30360c7d97c5SJed Brown       ierr = VecScale(vec1_C,m_one);CHKERRQ(ierr);
30373b03a366Sstefano_zampini       if(n_vertices) { ierr = MatMult(A_VR,pcbddc->vec1_R,vec2_V);CHKERRQ(ierr); }
30380c7d97c5SJed Brown       /* Set values in coarse basis function and subdomain part of coarse_mat */
30390c7d97c5SJed Brown       /* coarse basis functions */
30403b03a366Sstefano_zampini       index=i+n_vertices;
30410c7d97c5SJed Brown       ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr);
30420c7d97c5SJed Brown       ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
30430c7d97c5SJed Brown       ierr = VecScatterEnd  (pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
30440c7d97c5SJed Brown       ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
304553cdbc3dSStefano Zampini       ierr = MatSetValues(pcbddc->coarse_phi_B,n_B,auxindices,1,&index,array,INSERT_VALUES);CHKERRQ(ierr);
30460c7d97c5SJed Brown       ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
3047e269702eSStefano Zampini       if( pcbddc->prec_type || dbg_flag ) {
30480c7d97c5SJed Brown         ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
30490c7d97c5SJed Brown         ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
30500c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_D,&array);CHKERRQ(ierr);
305153cdbc3dSStefano Zampini         ierr = MatSetValues(pcbddc->coarse_phi_D,n_D,auxindices,1,&index,array,INSERT_VALUES);CHKERRQ(ierr);
30520c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_D,&array);CHKERRQ(ierr);
30530c7d97c5SJed Brown       }
30540c7d97c5SJed Brown       /* subdomain contribution to coarse matrix */
30553b03a366Sstefano_zampini       if(n_vertices) {
30560c7d97c5SJed Brown         ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
3057da1bb401SStefano Zampini         for(j=0;j<n_vertices;j++) {coarse_submat_vals[index*pcbddc->local_primal_size+j]=array[j];} /* WARNING -> column major ordering */
30580c7d97c5SJed Brown         ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
30590c7d97c5SJed Brown       }
30600c7d97c5SJed Brown       ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
3061da1bb401SStefano Zampini       for(j=0;j<n_constraints;j++) {coarse_submat_vals[index*pcbddc->local_primal_size+j+n_vertices]=array[j];} /* WARNING -> column major ordering */
30620c7d97c5SJed Brown       ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
30630c7d97c5SJed Brown 
3064e269702eSStefano Zampini       if( dbg_flag ) {
30650c7d97c5SJed Brown         /* assemble subdomain vector on nodes */
306653cdbc3dSStefano Zampini         ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr);
30670c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
30680c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
30690c7d97c5SJed Brown         for(j=0;j<n_R;j++){ array[ idx_R_local[j] ] = array2[j]; }
30700c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
30710c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
30720c7d97c5SJed Brown         /* assemble subdomain vector of lagrange multipliers */
307353cdbc3dSStefano Zampini         ierr = VecSet(pcbddc->vec1_P,zero);CHKERRQ(ierr);
30740c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
30753b03a366Sstefano_zampini         if( n_vertices) {
30760c7d97c5SJed Brown           ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
30773b03a366Sstefano_zampini           for(j=0;j<n_vertices;j++) {array2[j]=-array[j];}
30780c7d97c5SJed Brown           ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
30790c7d97c5SJed Brown         }
30800c7d97c5SJed Brown         ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
30813b03a366Sstefano_zampini         for(j=0;j<n_constraints;j++) {array2[j+n_vertices]=-array[j];}
30820c7d97c5SJed Brown         ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
30830c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
30843972b0daSStefano Zampini         /* check saddle point solution */
3085534831adSStefano Zampini         ierr = MatMult(pcbddc->local_mat,pcis->vec1_N,pcis->vec2_N);CHKERRQ(ierr);
30863b03a366Sstefano_zampini         ierr = MatMultTransposeAdd(pcbddc->ConstraintMatrix,pcbddc->vec1_P,pcis->vec2_N,pcis->vec2_N);CHKERRQ(ierr);
308753cdbc3dSStefano Zampini         ierr = VecNorm(pcis->vec2_N,NORM_INFINITY,&coarsefunctions_errors[index]);CHKERRQ(ierr);
30883b03a366Sstefano_zampini         ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr);
30890c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
309053cdbc3dSStefano Zampini         array[index]=array[index]+m_one; /* shift by the identity matrix */
30910c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
309253cdbc3dSStefano Zampini         ierr = VecNorm(pcbddc->vec1_P,NORM_INFINITY,&constraints_errors[index]);CHKERRQ(ierr);
30930c7d97c5SJed Brown       }
30940c7d97c5SJed Brown     }
30950c7d97c5SJed Brown     ierr = MatAssemblyBegin(pcbddc->coarse_phi_B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
30960c7d97c5SJed Brown     ierr = MatAssemblyEnd  (pcbddc->coarse_phi_B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
3097e269702eSStefano Zampini     if( pcbddc->prec_type || dbg_flag ) {
30980c7d97c5SJed Brown       ierr = MatAssemblyBegin(pcbddc->coarse_phi_D,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
30990c7d97c5SJed Brown       ierr = MatAssemblyEnd  (pcbddc->coarse_phi_D,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
31000c7d97c5SJed Brown     }
31010c7d97c5SJed Brown     /* Checking coarse_sub_mat and coarse basis functions */
31020c7d97c5SJed Brown     /* It should be \Phi^{(j)^T} A^{(j)} \Phi^{(j)}=coarse_sub_mat */
31039d2fce94SStefano Zampini     if(dbg_flag) {
31040c7d97c5SJed Brown 
31050c7d97c5SJed Brown       Mat coarse_sub_mat;
31060c7d97c5SJed Brown       Mat TM1,TM2,TM3,TM4;
31070c7d97c5SJed Brown       Mat coarse_phi_D,coarse_phi_B,A_II,A_BB,A_IB,A_BI;
3108a0ba757dSStefano Zampini       const MatType checkmattype=MATSEQAIJ;
31090c7d97c5SJed Brown       PetscScalar      value;
31100c7d97c5SJed Brown 
3111c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_II,checkmattype,MAT_INITIAL_MATRIX,&A_II);CHKERRQ(ierr);
3112c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_IB,checkmattype,MAT_INITIAL_MATRIX,&A_IB);CHKERRQ(ierr);
3113c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_BI,checkmattype,MAT_INITIAL_MATRIX,&A_BI);CHKERRQ(ierr);
3114c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_BB,checkmattype,MAT_INITIAL_MATRIX,&A_BB);CHKERRQ(ierr);
3115c042a7c3SStefano Zampini       ierr = MatConvert(pcbddc->coarse_phi_D,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_D);CHKERRQ(ierr);
3116c042a7c3SStefano Zampini       ierr = MatConvert(pcbddc->coarse_phi_B,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_B);CHKERRQ(ierr);
3117c042a7c3SStefano Zampini       ierr = MatCreateSeqDense(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_size,coarse_submat_vals,&coarse_sub_mat);CHKERRQ(ierr);
3118c042a7c3SStefano Zampini       ierr = MatConvert(coarse_sub_mat,checkmattype,MAT_REUSE_MATRIX,&coarse_sub_mat);CHKERRQ(ierr);
31190c7d97c5SJed Brown 
3120da1bb401SStefano Zampini       /*PetscViewer view_out;
3121da1bb401SStefano Zampini       PetscMPIInt myrank;
3122da1bb401SStefano Zampini       char filename[256];
3123da1bb401SStefano Zampini       MPI_Comm_rank(((PetscObject)pc)->comm,&myrank);
3124da1bb401SStefano Zampini       sprintf(filename,"coarsesubmat_%04d.m",myrank);
3125da1bb401SStefano Zampini       ierr = PetscViewerASCIIOpen(PETSC_COMM_SELF,filename,&view_out);CHKERRQ(ierr);
3126da1bb401SStefano Zampini       ierr = PetscViewerSetFormat(view_out,PETSC_VIEWER_ASCII_MATLAB);CHKERRQ(ierr);
3127da1bb401SStefano Zampini       ierr = MatView(coarse_sub_mat,view_out);CHKERRQ(ierr);
3128da1bb401SStefano Zampini       ierr = PetscViewerDestroy(&view_out);CHKERRQ(ierr);*/
3129da1bb401SStefano Zampini 
31300c7d97c5SJed Brown       ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
31310c7d97c5SJed Brown       ierr = PetscViewerASCIIPrintf(viewer,"Check coarse sub mat and local basis functions\n");CHKERRQ(ierr);
31320c7d97c5SJed Brown       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
313353cdbc3dSStefano Zampini       ierr = MatPtAP(A_II,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&TM1);CHKERRQ(ierr);
313453cdbc3dSStefano Zampini       ierr = MatPtAP(A_BB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&TM2);CHKERRQ(ierr);
313553cdbc3dSStefano Zampini       ierr = MatMatMult(A_IB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr);
3136c042a7c3SStefano Zampini       ierr = MatTransposeMatMult(coarse_phi_D,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM3);CHKERRQ(ierr);
313753cdbc3dSStefano Zampini       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
313853cdbc3dSStefano Zampini       ierr = MatMatMult(A_BI,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr);
3139c042a7c3SStefano Zampini       ierr = MatTransposeMatMult(coarse_phi_B,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM4);CHKERRQ(ierr);
314053cdbc3dSStefano Zampini       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
314153cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,one,TM2,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
314253cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,one,TM3,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
314353cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,one,TM4,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
314453cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,m_one,coarse_sub_mat,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
314553cdbc3dSStefano Zampini       ierr = MatNorm(TM1,NORM_INFINITY,&value);CHKERRQ(ierr);
31460c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"----------------------------------\n");CHKERRQ(ierr);
31470c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d \n",PetscGlobalRank);CHKERRQ(ierr);
31480c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"matrix error = % 1.14e\n",value);CHKERRQ(ierr);
31490c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"coarse functions errors\n");CHKERRQ(ierr);
315053cdbc3dSStefano Zampini       for(i=0;i<pcbddc->local_primal_size;i++) { ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local %02d-th function error = % 1.14e\n",i,coarsefunctions_errors[i]);CHKERRQ(ierr); }
31510c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"constraints errors\n");CHKERRQ(ierr);
315253cdbc3dSStefano Zampini       for(i=0;i<pcbddc->local_primal_size;i++) { ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local %02d-th function error = % 1.14e\n",i,constraints_errors[i]);CHKERRQ(ierr); }
31530c7d97c5SJed Brown       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
315453cdbc3dSStefano Zampini       ierr = MatDestroy(&A_II);CHKERRQ(ierr);
315553cdbc3dSStefano Zampini       ierr = MatDestroy(&A_BB);CHKERRQ(ierr);
315653cdbc3dSStefano Zampini       ierr = MatDestroy(&A_IB);CHKERRQ(ierr);
315753cdbc3dSStefano Zampini       ierr = MatDestroy(&A_BI);CHKERRQ(ierr);
315853cdbc3dSStefano Zampini       ierr = MatDestroy(&TM1);CHKERRQ(ierr);
315953cdbc3dSStefano Zampini       ierr = MatDestroy(&TM2);CHKERRQ(ierr);
316053cdbc3dSStefano Zampini       ierr = MatDestroy(&TM3);CHKERRQ(ierr);
316153cdbc3dSStefano Zampini       ierr = MatDestroy(&TM4);CHKERRQ(ierr);
316253cdbc3dSStefano Zampini       ierr = MatDestroy(&coarse_phi_D);CHKERRQ(ierr);
316353cdbc3dSStefano Zampini       ierr = MatDestroy(&coarse_sub_mat);CHKERRQ(ierr);
316453cdbc3dSStefano Zampini       ierr = MatDestroy(&coarse_phi_B);CHKERRQ(ierr);
31650c7d97c5SJed Brown       ierr = PetscFree(coarsefunctions_errors);CHKERRQ(ierr);
31660c7d97c5SJed Brown       ierr = PetscFree(constraints_errors);CHKERRQ(ierr);
31670c7d97c5SJed Brown     }
31680c7d97c5SJed Brown 
31690c7d97c5SJed Brown     /* create coarse matrix and data structures for message passing associated with the actual choice of coarse problem type */
31700c7d97c5SJed Brown     ierr = PCBDDCSetupCoarseEnvironment(pc,coarse_submat_vals);CHKERRQ(ierr);
31710c7d97c5SJed Brown     /* free memory */
31720c7d97c5SJed Brown     ierr = PetscFree(coarse_submat_vals);CHKERRQ(ierr);
31730c7d97c5SJed Brown     ierr = PetscFree(auxindices);CHKERRQ(ierr);
31740c7d97c5SJed Brown     ierr = PetscFree(nnz);CHKERRQ(ierr);
31753b03a366Sstefano_zampini     if(n_vertices) {
31760c7d97c5SJed Brown       ierr = VecDestroy(&vec1_V);CHKERRQ(ierr);
31770c7d97c5SJed Brown       ierr = VecDestroy(&vec2_V);CHKERRQ(ierr);
31780c7d97c5SJed Brown       ierr = MatDestroy(&M2);CHKERRQ(ierr);
31790c7d97c5SJed Brown       ierr = MatDestroy(&A_RV);CHKERRQ(ierr);
31800c7d97c5SJed Brown       ierr = MatDestroy(&A_VR);CHKERRQ(ierr);
31810c7d97c5SJed Brown       ierr = MatDestroy(&A_VV);CHKERRQ(ierr);
31820c7d97c5SJed Brown     }
3183534831adSStefano Zampini     if(n_constraints) {
31840c7d97c5SJed Brown       ierr = VecDestroy(&vec1_C);CHKERRQ(ierr);
31850c7d97c5SJed Brown       ierr = VecDestroy(&vec2_C);CHKERRQ(ierr);
31860c7d97c5SJed Brown       ierr = MatDestroy(&M1);CHKERRQ(ierr);
31870c7d97c5SJed Brown       ierr = MatDestroy(&C_CR);CHKERRQ(ierr);
31880c7d97c5SJed Brown     }
31890c7d97c5SJed Brown   }
31900c7d97c5SJed Brown   /* free memory */
31913b03a366Sstefano_zampini   if(n_vertices) {
31920c7d97c5SJed Brown     ierr = PetscFree(idx_V_B);CHKERRQ(ierr);
31930c7d97c5SJed Brown     ierr = ISDestroy(&is_V_local);CHKERRQ(ierr);
31940c7d97c5SJed Brown   }
31950c7d97c5SJed Brown   ierr = ISDestroy(&is_R_local);CHKERRQ(ierr);
31960c7d97c5SJed Brown 
31970c7d97c5SJed Brown   PetscFunctionReturn(0);
31980c7d97c5SJed Brown }
31990c7d97c5SJed Brown 
32000c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
32010c7d97c5SJed Brown 
32020c7d97c5SJed Brown #undef __FUNCT__
32030c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetupCoarseEnvironment"
320453cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetupCoarseEnvironment(PC pc,PetscScalar* coarse_submat_vals)
32050c7d97c5SJed Brown {
32060c7d97c5SJed Brown 
32070c7d97c5SJed Brown 
32080c7d97c5SJed Brown   Mat_IS    *matis    = (Mat_IS*)pc->pmat->data;
32090c7d97c5SJed Brown   PC_BDDC   *pcbddc   = (PC_BDDC*)pc->data;
32100c7d97c5SJed Brown   PC_IS     *pcis     = (PC_IS*)pc->data;
32110c7d97c5SJed Brown   MPI_Comm  prec_comm = ((PetscObject)pc)->comm;
32120c7d97c5SJed Brown   MPI_Comm  coarse_comm;
32130c7d97c5SJed Brown 
32140c7d97c5SJed Brown   /* common to all choices */
32150c7d97c5SJed Brown   PetscScalar *temp_coarse_mat_vals;
32160c7d97c5SJed Brown   PetscScalar *ins_coarse_mat_vals;
32170c7d97c5SJed Brown   PetscInt    *ins_local_primal_indices;
32180c7d97c5SJed Brown   PetscMPIInt *localsizes2,*localdispl2;
32190c7d97c5SJed Brown   PetscMPIInt size_prec_comm;
32200c7d97c5SJed Brown   PetscMPIInt rank_prec_comm;
32210c7d97c5SJed Brown   PetscMPIInt active_rank=MPI_PROC_NULL;
32220c7d97c5SJed Brown   PetscMPIInt master_proc=0;
32230c7d97c5SJed Brown   PetscInt    ins_local_primal_size;
32240c7d97c5SJed Brown   /* specific to MULTILEVEL_BDDC */
32250c7d97c5SJed Brown   PetscMPIInt *ranks_recv;
32260c7d97c5SJed Brown   PetscMPIInt count_recv=0;
32270c7d97c5SJed Brown   PetscMPIInt rank_coarse_proc_send_to;
32280c7d97c5SJed Brown   PetscMPIInt coarse_color = MPI_UNDEFINED;
32290c7d97c5SJed Brown   ISLocalToGlobalMapping coarse_ISLG;
32300c7d97c5SJed Brown   /* some other variables */
32310c7d97c5SJed Brown   PetscErrorCode ierr;
32320c7d97c5SJed Brown   const MatType coarse_mat_type;
32330c7d97c5SJed Brown   const PCType  coarse_pc_type;
323453cdbc3dSStefano Zampini   const KSPType  coarse_ksp_type;
323553cdbc3dSStefano Zampini   PC pc_temp;
32360c7d97c5SJed Brown   PetscInt i,j,k,bs;
32373b03a366Sstefano_zampini   PetscInt max_it_coarse_ksp=1;  /* don't increase this value */
3238e269702eSStefano Zampini   /* verbose output viewer */
3239e269702eSStefano Zampini   PetscViewer viewer=pcbddc->dbg_viewer;
3240e269702eSStefano Zampini   PetscBool   dbg_flag=pcbddc->dbg_flag;
32410c7d97c5SJed Brown 
32420c7d97c5SJed Brown   PetscFunctionBegin;
32430c7d97c5SJed Brown 
32440c7d97c5SJed Brown   ins_local_primal_indices = 0;
32450c7d97c5SJed Brown   ins_coarse_mat_vals      = 0;
32460c7d97c5SJed Brown   localsizes2              = 0;
32470c7d97c5SJed Brown   localdispl2              = 0;
32480c7d97c5SJed Brown   temp_coarse_mat_vals     = 0;
32490c7d97c5SJed Brown   coarse_ISLG              = 0;
32500c7d97c5SJed Brown 
325153cdbc3dSStefano Zampini   ierr = MPI_Comm_size(prec_comm,&size_prec_comm);CHKERRQ(ierr);
325253cdbc3dSStefano Zampini   ierr = MPI_Comm_rank(prec_comm,&rank_prec_comm);CHKERRQ(ierr);
32530c7d97c5SJed Brown   ierr = MatGetBlockSize(matis->A,&bs);CHKERRQ(ierr);
32540c7d97c5SJed Brown 
3255beed3852SStefano Zampini   /* Assign global numbering to coarse dofs */
3256beed3852SStefano Zampini   {
3257a0ba757dSStefano Zampini     PetscScalar    one=1.,zero=0.;
3258beed3852SStefano Zampini     PetscScalar    *array;
3259beed3852SStefano Zampini     PetscMPIInt    *auxlocal_primal;
3260beed3852SStefano Zampini     PetscMPIInt    *auxglobal_primal;
3261beed3852SStefano Zampini     PetscMPIInt    *all_auxglobal_primal;
3262beed3852SStefano Zampini     PetscMPIInt    *all_auxglobal_primal_dummy;
3263beed3852SStefano Zampini     PetscMPIInt    mpi_local_primal_size = (PetscMPIInt)pcbddc->local_primal_size;
3264da1bb401SStefano Zampini     PetscInt       *row_cmat_indices;
32653b03a366Sstefano_zampini     PetscInt       size_of_constraint;
3266da1bb401SStefano Zampini     PetscScalar    coarsesum;
3267beed3852SStefano Zampini 
3268beed3852SStefano Zampini     /* Construct needed data structures for message passing */
3269beed3852SStefano Zampini     ierr = PetscMalloc(mpi_local_primal_size*sizeof(PetscMPIInt),&pcbddc->local_primal_indices);CHKERRQ(ierr);
3270beed3852SStefano Zampini     ierr = PetscMalloc(size_prec_comm*sizeof(PetscMPIInt),&pcbddc->local_primal_sizes);CHKERRQ(ierr);
3271beed3852SStefano Zampini     ierr = PetscMalloc(size_prec_comm*sizeof(PetscMPIInt),&pcbddc->local_primal_displacements);CHKERRQ(ierr);
3272beed3852SStefano Zampini     /* Gather local_primal_size information for all processes  */
32735619798eSStefano Zampini     ierr = MPI_Allgather(&mpi_local_primal_size,1,MPIU_INT,&pcbddc->local_primal_sizes[0],1,MPIU_INT,prec_comm);CHKERRQ(ierr);
3274beed3852SStefano Zampini     pcbddc->replicated_primal_size = 0;
3275beed3852SStefano Zampini     for (i=0; i<size_prec_comm; i++) {
3276beed3852SStefano Zampini       pcbddc->local_primal_displacements[i] = pcbddc->replicated_primal_size ;
3277beed3852SStefano Zampini       pcbddc->replicated_primal_size += pcbddc->local_primal_sizes[i];
3278beed3852SStefano Zampini     }
32795619798eSStefano Zampini     if(rank_prec_comm == 0) {
3280beed3852SStefano Zampini       /* allocate some auxiliary space */
3281beed3852SStefano Zampini       ierr = PetscMalloc(pcbddc->replicated_primal_size*sizeof(*all_auxglobal_primal),&all_auxglobal_primal);CHKERRQ(ierr);
3282beed3852SStefano Zampini       ierr = PetscMalloc(pcbddc->replicated_primal_size*sizeof(*all_auxglobal_primal_dummy),&all_auxglobal_primal_dummy);CHKERRQ(ierr);
3283beed3852SStefano Zampini     }
3284beed3852SStefano Zampini     ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscMPIInt),&auxlocal_primal);CHKERRQ(ierr);
3285beed3852SStefano Zampini     ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscMPIInt),&auxglobal_primal);CHKERRQ(ierr);
3286beed3852SStefano Zampini 
3287da1bb401SStefano Zampini     /* First let's count coarse dofs.
3288beed3852SStefano Zampini        This code fragment assumes that the number of local constraints per connected component
3289beed3852SStefano Zampini        is not greater than the number of nodes defined for the connected component
3290beed3852SStefano Zampini        (otherwise we will surely have linear dependence between constraints and thus a singular coarse problem) */
32913b03a366Sstefano_zampini     /* auxlocal_primal      : primal indices in local nodes numbering (internal and interface) with complete queue sorted by global ordering */
3292beed3852SStefano Zampini     ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr);
3293beed3852SStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3294da1bb401SStefano Zampini     for(i=0;i<pcbddc->local_primal_size;i++) {
3295da1bb401SStefano Zampini       ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
32963b03a366Sstefano_zampini       for (j=0; j<size_of_constraint; j++) {
32973b03a366Sstefano_zampini         k = row_cmat_indices[j];
3298beed3852SStefano Zampini         if( array[k] == zero ) {
3299beed3852SStefano Zampini           array[k] = one;
3300da1bb401SStefano Zampini           auxlocal_primal[i] = k;
3301beed3852SStefano Zampini           break;
3302beed3852SStefano Zampini         }
3303beed3852SStefano Zampini       }
3304da1bb401SStefano Zampini       ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
3305beed3852SStefano Zampini     }
3306beed3852SStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3307da1bb401SStefano Zampini     ierr = VecSet(pcis->vec1_global,zero);CHKERRQ(ierr);
3308da1bb401SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3309da1bb401SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3310da1bb401SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3311da1bb401SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3312da1bb401SStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3313da1bb401SStefano Zampini     for(i=0;i<pcis->n;i++) { if( array[i] > zero) array[i] = one/array[i]; }
3314da1bb401SStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3315da1bb401SStefano Zampini     ierr = VecSet(pcis->vec1_global,zero);CHKERRQ(ierr);
3316da1bb401SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3317da1bb401SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3318da1bb401SStefano Zampini     ierr = VecSum(pcis->vec1_global,&coarsesum);CHKERRQ(ierr);
3319da1bb401SStefano Zampini     pcbddc->coarse_size = (PetscInt) coarsesum;
3320a0ba757dSStefano Zampini 
3321beed3852SStefano Zampini     /* Now assign them a global numbering */
3322beed3852SStefano Zampini     /* auxglobal_primal contains indices in global nodes numbering (internal and interface) */
3323beed3852SStefano Zampini     ierr = ISLocalToGlobalMappingApply(matis->mapping,pcbddc->local_primal_size,auxlocal_primal,auxglobal_primal);CHKERRQ(ierr);
3324beed3852SStefano Zampini     /* all_auxglobal_primal contains all primal nodes indices in global nodes numbering (internal and interface) */
3325beed3852SStefano Zampini     ierr = MPI_Gatherv(&auxglobal_primal[0],pcbddc->local_primal_size,MPIU_INT,&all_auxglobal_primal[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,0,prec_comm);CHKERRQ(ierr);
3326beed3852SStefano Zampini 
3327beed3852SStefano Zampini     /* After this block all_auxglobal_primal should contain one copy of each primal node's index in global nodes numbering */
3328beed3852SStefano Zampini     /* It implements a function similar to PetscSortRemoveDupsInt */
3329beed3852SStefano Zampini     if(rank_prec_comm==0) {
3330beed3852SStefano Zampini       /* dummy argument since PetscSortMPIInt doesn't exist! */
3331beed3852SStefano Zampini       ierr = PetscSortMPIIntWithArray(pcbddc->replicated_primal_size,all_auxglobal_primal,all_auxglobal_primal_dummy);CHKERRQ(ierr);
3332beed3852SStefano Zampini       k=1;
3333beed3852SStefano Zampini       j=all_auxglobal_primal[0];  /* first dof in global numbering */
3334beed3852SStefano Zampini       for(i=1;i< pcbddc->replicated_primal_size ;i++) {
3335beed3852SStefano Zampini         if(j != all_auxglobal_primal[i] ) {
3336beed3852SStefano Zampini           all_auxglobal_primal[k]=all_auxglobal_primal[i];
3337beed3852SStefano Zampini           k++;
3338beed3852SStefano Zampini           j=all_auxglobal_primal[i];
3339beed3852SStefano Zampini         }
3340beed3852SStefano Zampini       }
3341beed3852SStefano Zampini     } else {
3342beed3852SStefano Zampini       ierr = PetscMalloc(pcbddc->coarse_size*sizeof(PetscMPIInt),&all_auxglobal_primal);CHKERRQ(ierr);
3343beed3852SStefano Zampini     }
33445619798eSStefano Zampini     /* We only need to broadcast the indices from 0 to pcbddc->coarse_size. Remaining elements of array all_auxglobal_primal are garbage. */
3345beed3852SStefano Zampini     ierr = MPI_Bcast(all_auxglobal_primal,pcbddc->coarse_size,MPIU_INT,0,prec_comm);CHKERRQ(ierr);
3346beed3852SStefano Zampini 
3347beed3852SStefano Zampini     /* Now get global coarse numbering of local primal nodes */
3348beed3852SStefano Zampini     for(i=0;i<pcbddc->local_primal_size;i++) {
3349beed3852SStefano Zampini       k=0;
3350beed3852SStefano Zampini       while( all_auxglobal_primal[k] != auxglobal_primal[i] ) { k++;}
3351beed3852SStefano Zampini       pcbddc->local_primal_indices[i]=k;
3352beed3852SStefano Zampini     }
3353e269702eSStefano Zampini     if(dbg_flag) {
3354e269702eSStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
3355da1bb401SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Size of coarse problem %d\n",pcbddc->coarse_size);CHKERRQ(ierr);
3356e269702eSStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
3357e269702eSStefano Zampini     }
3358beed3852SStefano Zampini     /* free allocated memory */
3359beed3852SStefano Zampini     ierr = PetscFree(auxlocal_primal);CHKERRQ(ierr);
3360beed3852SStefano Zampini     ierr = PetscFree(auxglobal_primal);CHKERRQ(ierr);
3361beed3852SStefano Zampini     ierr = PetscFree(all_auxglobal_primal);CHKERRQ(ierr);
3362e269702eSStefano Zampini     if(rank_prec_comm == 0) {
3363beed3852SStefano Zampini       ierr = PetscFree(all_auxglobal_primal_dummy);CHKERRQ(ierr);
3364beed3852SStefano Zampini     }
3365e269702eSStefano Zampini   }
3366beed3852SStefano Zampini 
33670c7d97c5SJed Brown   /* adapt coarse problem type */
33680c7d97c5SJed Brown   if(pcbddc->coarse_problem_type == MULTILEVEL_BDDC && pcbddc->active_procs < MIN_PROCS_FOR_BDDC )
33690c7d97c5SJed Brown     pcbddc->coarse_problem_type = PARALLEL_BDDC;
33700c7d97c5SJed Brown 
33710c7d97c5SJed Brown   switch(pcbddc->coarse_problem_type){
33720c7d97c5SJed Brown 
3373da1bb401SStefano Zampini     case(MULTILEVEL_BDDC):   /* we define a coarse mesh where subdomains are elements */
33740c7d97c5SJed Brown     {
33750c7d97c5SJed Brown       /* we need additional variables */
33760c7d97c5SJed Brown       MetisInt   n_subdomains,n_parts,objval,ncon,faces_nvtxs;
33770c7d97c5SJed Brown       MetisInt   *metis_coarse_subdivision;
33780c7d97c5SJed Brown       MetisInt   options[METIS_NOPTIONS];
33790c7d97c5SJed Brown       PetscMPIInt size_coarse_comm,rank_coarse_comm;
33800c7d97c5SJed Brown       PetscMPIInt procs_jumps_coarse_comm;
33810c7d97c5SJed Brown       PetscMPIInt *coarse_subdivision;
33820c7d97c5SJed Brown       PetscMPIInt *total_count_recv;
33830c7d97c5SJed Brown       PetscMPIInt *total_ranks_recv;
33840c7d97c5SJed Brown       PetscMPIInt *displacements_recv;
33850c7d97c5SJed Brown       PetscMPIInt *my_faces_connectivity;
33860c7d97c5SJed Brown       PetscMPIInt *petsc_faces_adjncy;
33870c7d97c5SJed Brown       MetisInt    *faces_adjncy;
33880c7d97c5SJed Brown       MetisInt    *faces_xadj;
33890c7d97c5SJed Brown       PetscMPIInt *number_of_faces;
33900c7d97c5SJed Brown       PetscMPIInt *faces_displacements;
33910c7d97c5SJed Brown       PetscInt    *array_int;
33920c7d97c5SJed Brown       PetscMPIInt my_faces=0;
33930c7d97c5SJed Brown       PetscMPIInt total_faces=0;
33943828260eSStefano Zampini       PetscInt    ranks_stretching_ratio;
33950c7d97c5SJed Brown 
33960c7d97c5SJed Brown       /* define some quantities */
33970c7d97c5SJed Brown       pcbddc->coarse_communications_type = SCATTERS_BDDC;
33980c7d97c5SJed Brown       coarse_mat_type = MATIS;
33990c7d97c5SJed Brown       coarse_pc_type  = PCBDDC;
34006c9de887SHong Zhang       coarse_ksp_type  = KSPCHEBYSHEV;
34010c7d97c5SJed Brown 
34020c7d97c5SJed Brown       /* details of coarse decomposition */
34030c7d97c5SJed Brown       n_subdomains = pcbddc->active_procs;
34040c7d97c5SJed Brown       n_parts      = n_subdomains/pcbddc->coarsening_ratio;
34053828260eSStefano Zampini       ranks_stretching_ratio = size_prec_comm/pcbddc->active_procs;
34063828260eSStefano Zampini       procs_jumps_coarse_comm = pcbddc->coarsening_ratio*ranks_stretching_ratio;
34073828260eSStefano Zampini 
3408da1bb401SStefano Zampini       /*printf("Coarse algorithm details: \n");
3409da1bb401SStefano Zampini       printf("n_subdomains %d, n_parts %d\nstretch %d,jumps %d,coarse_ratio %d\nlevel should be log_%d(%d)\n",n_subdomains,n_parts,ranks_stretching_ratio,procs_jumps_coarse_comm,pcbddc->coarsening_ratio,pcbddc->coarsening_ratio,(ranks_stretching_ratio/pcbddc->coarsening_ratio+1));*/
34100c7d97c5SJed Brown 
34110c7d97c5SJed Brown       /* build CSR graph of subdomains' connectivity through faces */
34120c7d97c5SJed Brown       ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&array_int);CHKERRQ(ierr);
34133828260eSStefano Zampini       ierr = PetscMemzero(array_int,pcis->n*sizeof(PetscInt));CHKERRQ(ierr);
34140c7d97c5SJed Brown       for(i=1;i<pcis->n_neigh;i++){/* i=1 so I don't count myself -> faces nodes counts to 1 */
34150c7d97c5SJed Brown         for(j=0;j<pcis->n_shared[i];j++){
34160c7d97c5SJed Brown           array_int[ pcis->shared[i][j] ]+=1;
34170c7d97c5SJed Brown         }
34180c7d97c5SJed Brown       }
34190c7d97c5SJed Brown       for(i=1;i<pcis->n_neigh;i++){
34200c7d97c5SJed Brown         for(j=0;j<pcis->n_shared[i];j++){
34210c7d97c5SJed Brown           if(array_int[ pcis->shared[i][j] ] == 1 ){
34220c7d97c5SJed Brown             my_faces++;
34230c7d97c5SJed Brown             break;
34240c7d97c5SJed Brown           }
34250c7d97c5SJed Brown         }
34260c7d97c5SJed Brown       }
34270c7d97c5SJed Brown 
342853cdbc3dSStefano Zampini       ierr = MPI_Reduce(&my_faces,&total_faces,1,MPIU_INT,MPI_SUM,master_proc,prec_comm);CHKERRQ(ierr);
34290c7d97c5SJed Brown       ierr = PetscMalloc (my_faces*sizeof(PetscInt),&my_faces_connectivity);CHKERRQ(ierr);
34300c7d97c5SJed Brown       my_faces=0;
34310c7d97c5SJed Brown       for(i=1;i<pcis->n_neigh;i++){
34320c7d97c5SJed Brown         for(j=0;j<pcis->n_shared[i];j++){
34330c7d97c5SJed Brown           if(array_int[ pcis->shared[i][j] ] == 1 ){
34340c7d97c5SJed Brown             my_faces_connectivity[my_faces]=pcis->neigh[i];
34350c7d97c5SJed Brown             my_faces++;
34360c7d97c5SJed Brown             break;
34370c7d97c5SJed Brown           }
34380c7d97c5SJed Brown         }
34390c7d97c5SJed Brown       }
34400c7d97c5SJed Brown       if(rank_prec_comm == master_proc) {
34410c7d97c5SJed Brown         ierr = PetscMalloc (total_faces*sizeof(PetscMPIInt),&petsc_faces_adjncy);CHKERRQ(ierr);
34420c7d97c5SJed Brown         ierr = PetscMalloc (size_prec_comm*sizeof(PetscMPIInt),&number_of_faces);CHKERRQ(ierr);
34430c7d97c5SJed Brown         ierr = PetscMalloc (total_faces*sizeof(MetisInt),&faces_adjncy);CHKERRQ(ierr);
34440c7d97c5SJed Brown         ierr = PetscMalloc ((n_subdomains+1)*sizeof(MetisInt),&faces_xadj);CHKERRQ(ierr);
34450c7d97c5SJed Brown         ierr = PetscMalloc ((size_prec_comm+1)*sizeof(PetscMPIInt),&faces_displacements);CHKERRQ(ierr);
34460c7d97c5SJed Brown       }
344753cdbc3dSStefano Zampini       ierr = MPI_Gather(&my_faces,1,MPIU_INT,&number_of_faces[0],1,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
34480c7d97c5SJed Brown       if(rank_prec_comm == master_proc) {
34490c7d97c5SJed Brown         faces_xadj[0]=0;
34500c7d97c5SJed Brown         faces_displacements[0]=0;
34510c7d97c5SJed Brown         j=0;
34520c7d97c5SJed Brown         for(i=1;i<size_prec_comm+1;i++) {
34530c7d97c5SJed Brown           faces_displacements[i]=faces_displacements[i-1]+number_of_faces[i-1];
34540c7d97c5SJed Brown           if(number_of_faces[i-1]) {
34550c7d97c5SJed Brown             j++;
34560c7d97c5SJed Brown             faces_xadj[j]=faces_xadj[j-1]+number_of_faces[i-1];
34570c7d97c5SJed Brown           }
34580c7d97c5SJed Brown         }
3459da1bb401SStefano Zampini         /*printf("The J I count is %d and should be %d\n",j,n_subdomains);
3460da1bb401SStefano Zampini         printf("Total faces seem %d and should be %d\n",faces_xadj[j],total_faces);*/
34610c7d97c5SJed Brown       }
346253cdbc3dSStefano Zampini       ierr = MPI_Gatherv(&my_faces_connectivity[0],my_faces,MPIU_INT,&petsc_faces_adjncy[0],number_of_faces,faces_displacements,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
34630c7d97c5SJed Brown       ierr = PetscFree(my_faces_connectivity);CHKERRQ(ierr);
34640c7d97c5SJed Brown       ierr = PetscFree(array_int);CHKERRQ(ierr);
34650c7d97c5SJed Brown       if(rank_prec_comm == master_proc) {
34663828260eSStefano Zampini         for(i=0;i<total_faces;i++) faces_adjncy[i]=(MetisInt)(petsc_faces_adjncy[i]/ranks_stretching_ratio); /* cast to MetisInt */
3467da1bb401SStefano Zampini         /*printf("This is the face connectivity (actual ranks)\n");
34680c7d97c5SJed Brown         for(i=0;i<n_subdomains;i++){
34690c7d97c5SJed Brown           printf("proc %d is connected with \n",i);
34700c7d97c5SJed Brown           for(j=faces_xadj[i];j<faces_xadj[i+1];j++)
34710c7d97c5SJed Brown             printf("%d ",faces_adjncy[j]);
34720c7d97c5SJed Brown           printf("\n");
3473da1bb401SStefano Zampini         }*/
34740c7d97c5SJed Brown         ierr = PetscFree(faces_displacements);CHKERRQ(ierr);
34750c7d97c5SJed Brown         ierr = PetscFree(number_of_faces);CHKERRQ(ierr);
34760c7d97c5SJed Brown         ierr = PetscFree(petsc_faces_adjncy);CHKERRQ(ierr);
34770c7d97c5SJed Brown       }
34780c7d97c5SJed Brown 
34790c7d97c5SJed Brown       if( rank_prec_comm == master_proc ) {
34800c7d97c5SJed Brown 
34813828260eSStefano Zampini         PetscInt heuristic_for_metis=3;
34823828260eSStefano Zampini 
34830c7d97c5SJed Brown         ncon=1;
34840c7d97c5SJed Brown         faces_nvtxs=n_subdomains;
34850c7d97c5SJed Brown         /* partition graph induced by face connectivity */
34860c7d97c5SJed Brown         ierr = PetscMalloc (n_subdomains*sizeof(MetisInt),&metis_coarse_subdivision);CHKERRQ(ierr);
34870c7d97c5SJed Brown         ierr = METIS_SetDefaultOptions(options);
34880c7d97c5SJed Brown         /* we need a contiguous partition of the coarse mesh */
34890c7d97c5SJed Brown         options[METIS_OPTION_CONTIG]=1;
34900c7d97c5SJed Brown         options[METIS_OPTION_DBGLVL]=1;
34910c7d97c5SJed Brown         options[METIS_OPTION_NITER]=30;
34923828260eSStefano Zampini         if(n_subdomains>n_parts*heuristic_for_metis) {
34933828260eSStefano Zampini           options[METIS_OPTION_IPTYPE]=METIS_IPTYPE_EDGE;
34943828260eSStefano Zampini           options[METIS_OPTION_OBJTYPE]=METIS_OBJTYPE_CUT;
34950c7d97c5SJed Brown           ierr = METIS_PartGraphKway(&faces_nvtxs,&ncon,faces_xadj,faces_adjncy,NULL,NULL,NULL,&n_parts,NULL,NULL,options,&objval,metis_coarse_subdivision);
34963828260eSStefano Zampini         } else {
34973828260eSStefano Zampini           ierr = METIS_PartGraphRecursive(&faces_nvtxs,&ncon,faces_xadj,faces_adjncy,NULL,NULL,NULL,&n_parts,NULL,NULL,options,&objval,metis_coarse_subdivision);
34983828260eSStefano Zampini         }
34990c7d97c5SJed Brown         if(ierr != METIS_OK) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in METIS_PartGraphKway (metis error code %D) called from PCBDDCSetupCoarseEnvironment\n",ierr);
35000c7d97c5SJed Brown         ierr = PetscFree(faces_xadj);CHKERRQ(ierr);
35010c7d97c5SJed Brown         ierr = PetscFree(faces_adjncy);CHKERRQ(ierr);
35020c7d97c5SJed Brown         coarse_subdivision = (PetscMPIInt*)calloc(size_prec_comm,sizeof(PetscMPIInt)); /* calloc for contiguous memory since we need to scatter these values later */
35030c7d97c5SJed Brown         /* copy/cast values avoiding possible type conflicts between PETSc, MPI and METIS */
35043828260eSStefano Zampini         for(i=0;i<size_prec_comm;i++) coarse_subdivision[i]=MPI_PROC_NULL;
35053828260eSStefano Zampini         for(i=0;i<n_subdomains;i++)   coarse_subdivision[ranks_stretching_ratio*i]=(PetscInt)(metis_coarse_subdivision[i]);
35060c7d97c5SJed Brown         ierr = PetscFree(metis_coarse_subdivision);CHKERRQ(ierr);
35070c7d97c5SJed Brown       }
35080c7d97c5SJed Brown 
35090c7d97c5SJed Brown       /* Create new communicator for coarse problem splitting the old one */
35100c7d97c5SJed Brown       if( !(rank_prec_comm%procs_jumps_coarse_comm) && rank_prec_comm < procs_jumps_coarse_comm*n_parts ){
3511da1bb401SStefano Zampini         coarse_color=0;              /* for communicator splitting */
3512da1bb401SStefano Zampini         active_rank=rank_prec_comm;  /* for insertion of matrix values */
35130c7d97c5SJed Brown       }
3514da1bb401SStefano Zampini       /* procs with coarse_color = MPI_UNDEFINED will have coarse_comm = MPI_COMM_NULL (from mpi standards)
3515da1bb401SStefano Zampini          key = rank_prec_comm -> keep same ordering of ranks from the old to the new communicator */
351653cdbc3dSStefano Zampini       ierr = MPI_Comm_split(prec_comm,coarse_color,rank_prec_comm,&coarse_comm);CHKERRQ(ierr);
35170c7d97c5SJed Brown 
35180c7d97c5SJed Brown       if( coarse_color == 0 ) {
351953cdbc3dSStefano Zampini         ierr = MPI_Comm_size(coarse_comm,&size_coarse_comm);CHKERRQ(ierr);
352053cdbc3dSStefano Zampini         ierr = MPI_Comm_rank(coarse_comm,&rank_coarse_comm);CHKERRQ(ierr);
3521da1bb401SStefano Zampini         /*printf("Details of coarse comm\n");
35223828260eSStefano Zampini         printf("size = %d, myrank = %d\n",size_coarse_comm,rank_coarse_comm);
3523da1bb401SStefano Zampini         printf("jumps = %d, coarse_color = %d, n_parts = %d\n",procs_jumps_coarse_comm,coarse_color,n_parts);*/
35240c7d97c5SJed Brown       } else {
35250c7d97c5SJed Brown         rank_coarse_comm = MPI_PROC_NULL;
35260c7d97c5SJed Brown       }
35270c7d97c5SJed Brown 
35280c7d97c5SJed Brown       /* master proc takes care of arranging and distributing coarse information */
35290c7d97c5SJed Brown       if(rank_coarse_comm == master_proc) {
35300c7d97c5SJed Brown         ierr = PetscMalloc (size_coarse_comm*sizeof(PetscMPIInt),&displacements_recv);CHKERRQ(ierr);
3531da1bb401SStefano Zampini         /*ierr = PetscMalloc (size_coarse_comm*sizeof(PetscMPIInt),&total_count_recv);CHKERRQ(ierr);
3532da1bb401SStefano Zampini           ierr = PetscMalloc (n_subdomains*sizeof(PetscMPIInt),&total_ranks_recv);CHKERRQ(ierr);*/
35330c7d97c5SJed Brown         total_count_recv = (PetscMPIInt*)calloc(size_prec_comm,sizeof(PetscMPIInt));
35340c7d97c5SJed Brown         total_ranks_recv = (PetscMPIInt*)calloc(n_subdomains,sizeof(PetscMPIInt));
35350c7d97c5SJed Brown         /* some initializations */
35360c7d97c5SJed Brown         displacements_recv[0]=0;
3537da1bb401SStefano Zampini         /* PetscMemzero(total_count_recv,size_coarse_comm*sizeof(PetscMPIInt)); not needed -> calloc initializes to zero */
35380c7d97c5SJed Brown         /* count from how many processes the j-th process of the coarse decomposition will receive data */
35390c7d97c5SJed Brown         for(j=0;j<size_coarse_comm;j++)
35403828260eSStefano Zampini           for(i=0;i<size_prec_comm;i++)
35410c7d97c5SJed Brown             if(coarse_subdivision[i]==j)
35420c7d97c5SJed Brown               total_count_recv[j]++;
35430c7d97c5SJed Brown         /* displacements needed for scatterv of total_ranks_recv */
35440c7d97c5SJed Brown         for(i=1;i<size_coarse_comm;i++) displacements_recv[i]=displacements_recv[i-1]+total_count_recv[i-1];
35450c7d97c5SJed Brown         /* Now fill properly total_ranks_recv -> each coarse process will receive the ranks (in prec_comm communicator) of its friend (sending) processes */
35460c7d97c5SJed Brown         ierr = PetscMemzero(total_count_recv,size_coarse_comm*sizeof(PetscMPIInt));CHKERRQ(ierr);
35470c7d97c5SJed Brown         for(j=0;j<size_coarse_comm;j++) {
35483828260eSStefano Zampini           for(i=0;i<size_prec_comm;i++) {
35490c7d97c5SJed Brown             if(coarse_subdivision[i]==j) {
35500c7d97c5SJed Brown               total_ranks_recv[displacements_recv[j]+total_count_recv[j]]=i;
35513828260eSStefano Zampini               total_count_recv[j]+=1;
35520c7d97c5SJed Brown             }
35530c7d97c5SJed Brown           }
35540c7d97c5SJed Brown         }
3555da1bb401SStefano Zampini         /*for(j=0;j<size_coarse_comm;j++) {
35563828260eSStefano Zampini           printf("process %d in new rank will receive from %d processes (original ranks follows)\n",j,total_count_recv[j]);
35573828260eSStefano Zampini           for(i=0;i<total_count_recv[j];i++) {
35583828260eSStefano Zampini             printf("%d ",total_ranks_recv[displacements_recv[j]+i]);
35593828260eSStefano Zampini           }
35603828260eSStefano Zampini           printf("\n");
3561da1bb401SStefano Zampini         }*/
35620c7d97c5SJed Brown 
35630c7d97c5SJed Brown         /* identify new decomposition in terms of ranks in the old communicator */
35643828260eSStefano Zampini         for(i=0;i<n_subdomains;i++) coarse_subdivision[ranks_stretching_ratio*i]=coarse_subdivision[ranks_stretching_ratio*i]*procs_jumps_coarse_comm;
3565da1bb401SStefano Zampini         /*printf("coarse_subdivision in old end new ranks\n");
35660c7d97c5SJed Brown         for(i=0;i<size_prec_comm;i++)
35673828260eSStefano Zampini           if(coarse_subdivision[i]!=MPI_PROC_NULL) {
35683828260eSStefano Zampini             printf("%d=(%d %d), ",i,coarse_subdivision[i],coarse_subdivision[i]/procs_jumps_coarse_comm);
35693828260eSStefano Zampini           } else {
35703828260eSStefano Zampini             printf("%d=(%d %d), ",i,coarse_subdivision[i],coarse_subdivision[i]);
35713828260eSStefano Zampini           }
3572da1bb401SStefano Zampini         printf("\n");*/
35730c7d97c5SJed Brown       }
35740c7d97c5SJed Brown 
35750c7d97c5SJed Brown       /* Scatter new decomposition for send details */
357653cdbc3dSStefano Zampini       ierr = MPI_Scatter(&coarse_subdivision[0],1,MPIU_INT,&rank_coarse_proc_send_to,1,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
35770c7d97c5SJed Brown       /* Scatter receiving details to members of coarse decomposition */
35780c7d97c5SJed Brown       if( coarse_color == 0) {
357953cdbc3dSStefano Zampini         ierr = MPI_Scatter(&total_count_recv[0],1,MPIU_INT,&count_recv,1,MPIU_INT,master_proc,coarse_comm);CHKERRQ(ierr);
35800c7d97c5SJed Brown         ierr = PetscMalloc (count_recv*sizeof(PetscMPIInt),&ranks_recv);CHKERRQ(ierr);
358153cdbc3dSStefano Zampini         ierr = MPI_Scatterv(&total_ranks_recv[0],total_count_recv,displacements_recv,MPIU_INT,&ranks_recv[0],count_recv,MPIU_INT,master_proc,coarse_comm);CHKERRQ(ierr);
35820c7d97c5SJed Brown       }
35830c7d97c5SJed Brown 
3584da1bb401SStefano Zampini       /*printf("I will send my matrix data to proc  %d\n",rank_coarse_proc_send_to);
3585da1bb401SStefano Zampini       if(coarse_color == 0) {
3586da1bb401SStefano Zampini         printf("I will receive some matrix data from %d processes (ranks follows)\n",count_recv);
3587da1bb401SStefano Zampini         for(i=0;i<count_recv;i++)
3588da1bb401SStefano Zampini           printf("%d ",ranks_recv[i]);
3589da1bb401SStefano Zampini         printf("\n");
3590da1bb401SStefano Zampini       }*/
35910c7d97c5SJed Brown 
35920c7d97c5SJed Brown       if(rank_prec_comm == master_proc) {
3593da1bb401SStefano Zampini         /*ierr = PetscFree(coarse_subdivision);CHKERRQ(ierr);
3594da1bb401SStefano Zampini         ierr = PetscFree(total_count_recv);CHKERRQ(ierr);
3595da1bb401SStefano Zampini         ierr = PetscFree(total_ranks_recv);CHKERRQ(ierr);*/
35960c7d97c5SJed Brown         free(coarse_subdivision);
35970c7d97c5SJed Brown         free(total_count_recv);
35980c7d97c5SJed Brown         free(total_ranks_recv);
35990c7d97c5SJed Brown         ierr = PetscFree(displacements_recv);CHKERRQ(ierr);
36000c7d97c5SJed Brown       }
36010c7d97c5SJed Brown       break;
36020c7d97c5SJed Brown     }
36030c7d97c5SJed Brown 
36040c7d97c5SJed Brown     case(REPLICATED_BDDC):
36050c7d97c5SJed Brown 
36060c7d97c5SJed Brown       pcbddc->coarse_communications_type = GATHERS_BDDC;
36070c7d97c5SJed Brown       coarse_mat_type = MATSEQAIJ;
36080c7d97c5SJed Brown       coarse_pc_type  = PCLU;
360953cdbc3dSStefano Zampini       coarse_ksp_type  = KSPPREONLY;
36100c7d97c5SJed Brown       coarse_comm = PETSC_COMM_SELF;
36110c7d97c5SJed Brown       active_rank = rank_prec_comm;
36120c7d97c5SJed Brown       break;
36130c7d97c5SJed Brown 
36140c7d97c5SJed Brown     case(PARALLEL_BDDC):
36150c7d97c5SJed Brown 
36160c7d97c5SJed Brown       pcbddc->coarse_communications_type = SCATTERS_BDDC;
36170c7d97c5SJed Brown       coarse_mat_type = MATMPIAIJ;
36180c7d97c5SJed Brown       coarse_pc_type  = PCREDUNDANT;
361953cdbc3dSStefano Zampini       coarse_ksp_type  = KSPPREONLY;
36200c7d97c5SJed Brown       coarse_comm = prec_comm;
36210c7d97c5SJed Brown       active_rank = rank_prec_comm;
36220c7d97c5SJed Brown       break;
36230c7d97c5SJed Brown 
36240c7d97c5SJed Brown     case(SEQUENTIAL_BDDC):
36250c7d97c5SJed Brown       pcbddc->coarse_communications_type = GATHERS_BDDC;
36260c7d97c5SJed Brown       coarse_mat_type = MATSEQAIJ;
36270c7d97c5SJed Brown       coarse_pc_type = PCLU;
362853cdbc3dSStefano Zampini       coarse_ksp_type  = KSPPREONLY;
36290c7d97c5SJed Brown       coarse_comm = PETSC_COMM_SELF;
36300c7d97c5SJed Brown       active_rank = master_proc;
36310c7d97c5SJed Brown       break;
36320c7d97c5SJed Brown   }
36330c7d97c5SJed Brown 
36340c7d97c5SJed Brown   switch(pcbddc->coarse_communications_type){
36350c7d97c5SJed Brown 
36360c7d97c5SJed Brown     case(SCATTERS_BDDC):
36370c7d97c5SJed Brown       {
36380c7d97c5SJed Brown         if(pcbddc->coarse_problem_type==MULTILEVEL_BDDC) {
36390c7d97c5SJed Brown 
36400c7d97c5SJed Brown           PetscMPIInt send_size;
36410c7d97c5SJed Brown           PetscInt    *aux_ins_indices;
36420c7d97c5SJed Brown           PetscInt    ii,jj;
36430c7d97c5SJed Brown           MPI_Request *requests;
36440c7d97c5SJed Brown 
36450c7d97c5SJed Brown           /* allocate auxiliary space */
36465619798eSStefano Zampini           ierr = PetscMalloc (pcbddc->replicated_primal_size*sizeof(PetscMPIInt),&pcbddc->replicated_local_primal_indices);CHKERRQ(ierr);
36475619798eSStefano Zampini           ierr = MPI_Allgatherv(&pcbddc->local_primal_indices[0],pcbddc->local_primal_size,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,prec_comm);CHKERRQ(ierr);
36480c7d97c5SJed Brown           ierr = PetscMalloc ( pcbddc->coarse_size*sizeof(PetscInt),&aux_ins_indices);CHKERRQ(ierr);
36490c7d97c5SJed Brown           ierr = PetscMemzero(aux_ins_indices,pcbddc->coarse_size*sizeof(PetscInt));CHKERRQ(ierr);
36500c7d97c5SJed Brown           /* allocate storage for message passing */
36510c7d97c5SJed Brown           ierr = PetscMalloc ( (count_recv+1)*sizeof(MPI_Request),&requests);CHKERRQ(ierr);
36520c7d97c5SJed Brown           for(i=0;i<count_recv+1;i++) requests[i]=MPI_REQUEST_NULL;
36530c7d97c5SJed Brown           ierr = PetscMalloc ( count_recv*sizeof(PetscMPIInt),&localsizes2);CHKERRQ(ierr);
36540c7d97c5SJed Brown           ierr = PetscMalloc ( count_recv*sizeof(PetscMPIInt),&localdispl2);CHKERRQ(ierr);
36550c7d97c5SJed Brown           /* fill up quantities */
36560c7d97c5SJed Brown           j=0;
36570c7d97c5SJed Brown           for(i=0;i<count_recv;i++){
36580c7d97c5SJed Brown             ii = ranks_recv[i];
36590c7d97c5SJed Brown             localsizes2[i]=pcbddc->local_primal_sizes[ii]*pcbddc->local_primal_sizes[ii];
36600c7d97c5SJed Brown             localdispl2[i]=j;
36610c7d97c5SJed Brown             j+=localsizes2[i];
36620c7d97c5SJed Brown             jj = pcbddc->local_primal_displacements[ii];
3663da1bb401SStefano Zampini             for(k=0;k<pcbddc->local_primal_sizes[ii];k++) aux_ins_indices[pcbddc->replicated_local_primal_indices[jj+k]]+=1;  /* it counts the coarse subdomains sharing the coarse node */
36640c7d97c5SJed Brown           }
3665da1bb401SStefano Zampini           /*printf("aux_ins_indices 1\n");
3666da1bb401SStefano Zampini           for(i=0;i<pcbddc->coarse_size;i++)
3667da1bb401SStefano Zampini             printf("%d ",aux_ins_indices[i]);
3668da1bb401SStefano Zampini           printf("\n");*/
36690c7d97c5SJed Brown           /* temp_coarse_mat_vals used to store temporarily received matrix values */
36700c7d97c5SJed Brown           ierr = PetscMalloc ( j*sizeof(PetscScalar),&temp_coarse_mat_vals);CHKERRQ(ierr);
36710c7d97c5SJed Brown           /* evaluate how many values I will insert in coarse mat */
36720c7d97c5SJed Brown           ins_local_primal_size=0;
36730c7d97c5SJed Brown           for(i=0;i<pcbddc->coarse_size;i++)
36740c7d97c5SJed Brown             if(aux_ins_indices[i])
36750c7d97c5SJed Brown               ins_local_primal_size++;
36760c7d97c5SJed Brown           /* evaluate indices I will insert in coarse mat */
36770c7d97c5SJed Brown           ierr = PetscMalloc ( ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr);
36780c7d97c5SJed Brown           j=0;
36790c7d97c5SJed Brown           for(i=0;i<pcbddc->coarse_size;i++)
36800c7d97c5SJed Brown             if(aux_ins_indices[i])
36810c7d97c5SJed Brown               ins_local_primal_indices[j++]=i;
36820c7d97c5SJed Brown           /* use aux_ins_indices to realize a global to local mapping */
36830c7d97c5SJed Brown           j=0;
36840c7d97c5SJed Brown           for(i=0;i<pcbddc->coarse_size;i++){
36850c7d97c5SJed Brown             if(aux_ins_indices[i]==0){
36860c7d97c5SJed Brown               aux_ins_indices[i]=-1;
36870c7d97c5SJed Brown             } else {
36880c7d97c5SJed Brown               aux_ins_indices[i]=j;
36890c7d97c5SJed Brown               j++;
36900c7d97c5SJed Brown             }
36910c7d97c5SJed Brown           }
36920c7d97c5SJed Brown 
3693da1bb401SStefano Zampini           /*printf("New details localsizes2 localdispl2\n");
3694da1bb401SStefano Zampini           for(i=0;i<count_recv;i++)
3695da1bb401SStefano Zampini             printf("(%d %d) ",localsizes2[i],localdispl2[i]);
3696da1bb401SStefano Zampini           printf("\n");
3697da1bb401SStefano Zampini           printf("aux_ins_indices 2\n");
3698da1bb401SStefano Zampini           for(i=0;i<pcbddc->coarse_size;i++)
3699da1bb401SStefano Zampini             printf("%d ",aux_ins_indices[i]);
3700da1bb401SStefano Zampini           printf("\n");
3701da1bb401SStefano Zampini           printf("ins_local_primal_indices\n");
3702da1bb401SStefano Zampini           for(i=0;i<ins_local_primal_size;i++)
3703da1bb401SStefano Zampini             printf("%d ",ins_local_primal_indices[i]);
3704da1bb401SStefano Zampini           printf("\n");
3705da1bb401SStefano Zampini           printf("coarse_submat_vals\n");
3706da1bb401SStefano Zampini           for(i=0;i<pcbddc->local_primal_size;i++)
3707da1bb401SStefano Zampini             for(j=0;j<pcbddc->local_primal_size;j++)
3708da1bb401SStefano Zampini               printf("(%lf %d %d)\n",coarse_submat_vals[j*pcbddc->local_primal_size+i],pcbddc->local_primal_indices[i],pcbddc->local_primal_indices[j]);
3709da1bb401SStefano Zampini           printf("\n");*/
37100c7d97c5SJed Brown 
37110c7d97c5SJed Brown           /* processes participating in coarse problem receive matrix data from their friends */
371253cdbc3dSStefano Zampini           for(i=0;i<count_recv;i++) ierr = MPI_Irecv(&temp_coarse_mat_vals[localdispl2[i]],localsizes2[i],MPIU_SCALAR,ranks_recv[i],666,prec_comm,&requests[i]);CHKERRQ(ierr);
37130c7d97c5SJed Brown           if(rank_coarse_proc_send_to != MPI_PROC_NULL ) {
37140c7d97c5SJed Brown             send_size=pcbddc->local_primal_size*pcbddc->local_primal_size;
371553cdbc3dSStefano Zampini             ierr = MPI_Isend(&coarse_submat_vals[0],send_size,MPIU_SCALAR,rank_coarse_proc_send_to,666,prec_comm,&requests[count_recv]);CHKERRQ(ierr);
37160c7d97c5SJed Brown           }
371753cdbc3dSStefano Zampini           ierr = MPI_Waitall(count_recv+1,requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
37180c7d97c5SJed Brown 
3719da1bb401SStefano Zampini           /*if(coarse_color == 0) {
3720da1bb401SStefano Zampini             printf("temp_coarse_mat_vals\n");
3721da1bb401SStefano Zampini             for(k=0;k<count_recv;k++){
3722da1bb401SStefano Zampini               printf("---- %d ----\n",ranks_recv[k]);
3723da1bb401SStefano Zampini               for(i=0;i<pcbddc->local_primal_sizes[ranks_recv[k]];i++)
3724da1bb401SStefano Zampini                 for(j=0;j<pcbddc->local_primal_sizes[ranks_recv[k]];j++)
3725da1bb401SStefano Zampini                   printf("(%lf %d %d)\n",temp_coarse_mat_vals[localdispl2[k]+j*pcbddc->local_primal_sizes[ranks_recv[k]]+i],pcbddc->replicated_local_primal_indices[pcbddc->local_primal_displacements[ranks_recv[k]]+i],pcbddc->replicated_local_primal_indices[pcbddc->local_primal_displacements[ranks_recv[k]]+j]);
3726da1bb401SStefano Zampini               printf("\n");
3727da1bb401SStefano Zampini             }
3728da1bb401SStefano Zampini           }*/
37290c7d97c5SJed Brown           /* calculate data to insert in coarse mat */
37300c7d97c5SJed Brown           ierr = PetscMalloc ( ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar),&ins_coarse_mat_vals);CHKERRQ(ierr);
37310c7d97c5SJed Brown           PetscMemzero(ins_coarse_mat_vals,ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar));
37320c7d97c5SJed Brown 
37330c7d97c5SJed Brown           PetscMPIInt rr,kk,lps,lpd;
37340c7d97c5SJed Brown           PetscInt row_ind,col_ind;
37350c7d97c5SJed Brown           for(k=0;k<count_recv;k++){
37360c7d97c5SJed Brown             rr = ranks_recv[k];
37370c7d97c5SJed Brown             kk = localdispl2[k];
37380c7d97c5SJed Brown             lps = pcbddc->local_primal_sizes[rr];
37390c7d97c5SJed Brown             lpd = pcbddc->local_primal_displacements[rr];
3740da1bb401SStefano Zampini             /*printf("Inserting the following indices (received from %d)\n",rr);*/
37410c7d97c5SJed Brown             for(j=0;j<lps;j++){
37420c7d97c5SJed Brown               col_ind=aux_ins_indices[pcbddc->replicated_local_primal_indices[lpd+j]];
37430c7d97c5SJed Brown               for(i=0;i<lps;i++){
37440c7d97c5SJed Brown                 row_ind=aux_ins_indices[pcbddc->replicated_local_primal_indices[lpd+i]];
3745da1bb401SStefano Zampini                 /*printf("%d %d\n",row_ind,col_ind);*/
37460c7d97c5SJed Brown                 ins_coarse_mat_vals[col_ind*ins_local_primal_size+row_ind]+=temp_coarse_mat_vals[kk+j*lps+i];
37470c7d97c5SJed Brown               }
37480c7d97c5SJed Brown             }
37490c7d97c5SJed Brown           }
37500c7d97c5SJed Brown           ierr = PetscFree(requests);CHKERRQ(ierr);
37510c7d97c5SJed Brown           ierr = PetscFree(aux_ins_indices);CHKERRQ(ierr);
37520c7d97c5SJed Brown           ierr = PetscFree(temp_coarse_mat_vals);CHKERRQ(ierr);
37530c7d97c5SJed Brown           if(coarse_color == 0) { ierr = PetscFree(ranks_recv);CHKERRQ(ierr); }
37540c7d97c5SJed Brown 
37550c7d97c5SJed Brown           /* create local to global mapping needed by coarse MATIS */
37560c7d97c5SJed Brown           {
37570c7d97c5SJed Brown             IS coarse_IS;
375853cdbc3dSStefano Zampini             if(coarse_comm != MPI_COMM_NULL ) ierr = MPI_Comm_free(&coarse_comm);CHKERRQ(ierr);
37590c7d97c5SJed Brown             coarse_comm = prec_comm;
37600c7d97c5SJed Brown             active_rank=rank_prec_comm;
37610c7d97c5SJed Brown             ierr = ISCreateGeneral(coarse_comm,ins_local_primal_size,ins_local_primal_indices,PETSC_COPY_VALUES,&coarse_IS);CHKERRQ(ierr);
37620c7d97c5SJed Brown             ierr = ISLocalToGlobalMappingCreateIS(coarse_IS,&coarse_ISLG);CHKERRQ(ierr);
37630c7d97c5SJed Brown             ierr = ISDestroy(&coarse_IS);CHKERRQ(ierr);
37640c7d97c5SJed Brown           }
37650c7d97c5SJed Brown         }
37660c7d97c5SJed Brown         if(pcbddc->coarse_problem_type==PARALLEL_BDDC) {
37670c7d97c5SJed Brown           /* arrays for values insertion */
37680c7d97c5SJed Brown           ins_local_primal_size = pcbddc->local_primal_size;
37690c7d97c5SJed Brown           ierr = PetscMalloc ( ins_local_primal_size*sizeof(PetscMPIInt),&ins_local_primal_indices);CHKERRQ(ierr);
37700c7d97c5SJed Brown           ierr = PetscMalloc ( ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar),&ins_coarse_mat_vals);CHKERRQ(ierr);
37710c7d97c5SJed Brown           for(j=0;j<ins_local_primal_size;j++){
37720c7d97c5SJed Brown             ins_local_primal_indices[j]=pcbddc->local_primal_indices[j];
37730c7d97c5SJed Brown             for(i=0;i<ins_local_primal_size;i++) ins_coarse_mat_vals[j*ins_local_primal_size+i]=coarse_submat_vals[j*ins_local_primal_size+i];
37740c7d97c5SJed Brown           }
37750c7d97c5SJed Brown         }
37760c7d97c5SJed Brown         break;
37770c7d97c5SJed Brown 
37780c7d97c5SJed Brown     }
37790c7d97c5SJed Brown 
37800c7d97c5SJed Brown     case(GATHERS_BDDC):
37810c7d97c5SJed Brown       {
37820c7d97c5SJed Brown 
37830c7d97c5SJed Brown         PetscMPIInt mysize,mysize2;
37840c7d97c5SJed Brown 
37850c7d97c5SJed Brown         if(rank_prec_comm==active_rank) {
37860c7d97c5SJed Brown           ierr = PetscMalloc ( pcbddc->replicated_primal_size*sizeof(PetscMPIInt),&pcbddc->replicated_local_primal_indices);CHKERRQ(ierr);
37870c7d97c5SJed Brown           pcbddc->replicated_local_primal_values = (PetscScalar*)calloc(pcbddc->replicated_primal_size,sizeof(PetscScalar));
37880c7d97c5SJed Brown           ierr = PetscMalloc ( size_prec_comm*sizeof(PetscMPIInt),&localsizes2);CHKERRQ(ierr);
37890c7d97c5SJed Brown           ierr = PetscMalloc ( size_prec_comm*sizeof(PetscMPIInt),&localdispl2);CHKERRQ(ierr);
37900c7d97c5SJed Brown           /* arrays for values insertion */
37910c7d97c5SJed Brown           ins_local_primal_size = pcbddc->coarse_size;
37920c7d97c5SJed Brown           ierr = PetscMalloc ( ins_local_primal_size*sizeof(PetscMPIInt),&ins_local_primal_indices);CHKERRQ(ierr);
37930c7d97c5SJed Brown           ierr = PetscMalloc ( ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar),&ins_coarse_mat_vals);CHKERRQ(ierr);
37940c7d97c5SJed Brown           for(i=0;i<size_prec_comm;i++) localsizes2[i]=pcbddc->local_primal_sizes[i]*pcbddc->local_primal_sizes[i];
37950c7d97c5SJed Brown           localdispl2[0]=0;
37960c7d97c5SJed Brown           for(i=1;i<size_prec_comm;i++) localdispl2[i]=localsizes2[i-1]+localdispl2[i-1];
37970c7d97c5SJed Brown           j=0;
37980c7d97c5SJed Brown           for(i=0;i<size_prec_comm;i++) j+=localsizes2[i];
37990c7d97c5SJed Brown           ierr = PetscMalloc ( j*sizeof(PetscScalar),&temp_coarse_mat_vals);CHKERRQ(ierr);
38000c7d97c5SJed Brown         }
38010c7d97c5SJed Brown 
38020c7d97c5SJed Brown         mysize=pcbddc->local_primal_size;
38030c7d97c5SJed Brown         mysize2=pcbddc->local_primal_size*pcbddc->local_primal_size;
38040c7d97c5SJed Brown         if(pcbddc->coarse_problem_type == SEQUENTIAL_BDDC){
380553cdbc3dSStefano Zampini           ierr = MPI_Gatherv(&pcbddc->local_primal_indices[0],mysize,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
380653cdbc3dSStefano Zampini           ierr = MPI_Gatherv(&coarse_submat_vals[0],mysize2,MPIU_SCALAR,&temp_coarse_mat_vals[0],localsizes2,localdispl2,MPIU_SCALAR,master_proc,prec_comm);CHKERRQ(ierr);
38070c7d97c5SJed Brown         } else {
380853cdbc3dSStefano Zampini           ierr = MPI_Allgatherv(&pcbddc->local_primal_indices[0],mysize,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,prec_comm);CHKERRQ(ierr);
380953cdbc3dSStefano Zampini           ierr = MPI_Allgatherv(&coarse_submat_vals[0],mysize2,MPIU_SCALAR,&temp_coarse_mat_vals[0],localsizes2,localdispl2,MPIU_SCALAR,prec_comm);CHKERRQ(ierr);
38100c7d97c5SJed Brown         }
38110c7d97c5SJed Brown 
38120c7d97c5SJed Brown   /* free data structures no longer needed and allocate some space which will be needed in BDDC application */
38130c7d97c5SJed Brown         if(rank_prec_comm==active_rank) {
38140c7d97c5SJed Brown           PetscInt offset,offset2,row_ind,col_ind;
38150c7d97c5SJed Brown           for(j=0;j<ins_local_primal_size;j++){
38160c7d97c5SJed Brown             ins_local_primal_indices[j]=j;
38170c7d97c5SJed Brown             for(i=0;i<ins_local_primal_size;i++) ins_coarse_mat_vals[j*ins_local_primal_size+i]=0.0;
38180c7d97c5SJed Brown           }
38190c7d97c5SJed Brown           for(k=0;k<size_prec_comm;k++){
38200c7d97c5SJed Brown             offset=pcbddc->local_primal_displacements[k];
38210c7d97c5SJed Brown             offset2=localdispl2[k];
38220c7d97c5SJed Brown             for(j=0;j<pcbddc->local_primal_sizes[k];j++){
38230c7d97c5SJed Brown               col_ind=pcbddc->replicated_local_primal_indices[offset+j];
38240c7d97c5SJed Brown               for(i=0;i<pcbddc->local_primal_sizes[k];i++){
38250c7d97c5SJed Brown                 row_ind=pcbddc->replicated_local_primal_indices[offset+i];
38260c7d97c5SJed Brown                 ins_coarse_mat_vals[col_ind*pcbddc->coarse_size+row_ind]+=temp_coarse_mat_vals[offset2+j*pcbddc->local_primal_sizes[k]+i];
38270c7d97c5SJed Brown               }
38280c7d97c5SJed Brown             }
38290c7d97c5SJed Brown           }
38300c7d97c5SJed Brown         }
38310c7d97c5SJed Brown         break;
3832da1bb401SStefano Zampini       }/* switch on coarse problem and communications associated with finished */
38330c7d97c5SJed Brown   }
38340c7d97c5SJed Brown 
38350c7d97c5SJed Brown   /* Now create and fill up coarse matrix */
38360c7d97c5SJed Brown   if( rank_prec_comm == active_rank ) {
38370c7d97c5SJed Brown     if(pcbddc->coarse_problem_type != MULTILEVEL_BDDC) {
38380c7d97c5SJed Brown       ierr = MatCreate(coarse_comm,&pcbddc->coarse_mat);CHKERRQ(ierr);
38390c7d97c5SJed Brown       ierr = MatSetSizes(pcbddc->coarse_mat,PETSC_DECIDE,PETSC_DECIDE,pcbddc->coarse_size,pcbddc->coarse_size);CHKERRQ(ierr);
38400c7d97c5SJed Brown       ierr = MatSetType(pcbddc->coarse_mat,coarse_mat_type);CHKERRQ(ierr);
38413b03a366Sstefano_zampini       ierr = MatSetUp(pcbddc->coarse_mat);CHKERRQ(ierr);
3842da1bb401SStefano Zampini       ierr = MatSetOption(pcbddc->coarse_mat,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr); /* local values stored in column major */
38433b03a366Sstefano_zampini       ierr = MatSetOption(pcbddc->coarse_mat,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr);
38440c7d97c5SJed Brown     } else {
38450c7d97c5SJed Brown       Mat matis_coarse_local_mat;
3846d3ee2243SStefano Zampini       /* remind bs */
3847d3ee2243SStefano Zampini       ierr = MatCreateIS(coarse_comm,bs,PETSC_DECIDE,PETSC_DECIDE,pcbddc->coarse_size,pcbddc->coarse_size,coarse_ISLG,&pcbddc->coarse_mat);CHKERRQ(ierr);
38483b03a366Sstefano_zampini       ierr = MatSetUp(pcbddc->coarse_mat);CHKERRQ(ierr);
38490c7d97c5SJed Brown       ierr = MatISGetLocalMat(pcbddc->coarse_mat,&matis_coarse_local_mat);CHKERRQ(ierr);
38503b03a366Sstefano_zampini       ierr = MatSetUp(matis_coarse_local_mat);CHKERRQ(ierr);
3851da1bb401SStefano Zampini       ierr = MatSetOption(matis_coarse_local_mat,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr); /* local values stored in column major */
3852a0ba757dSStefano Zampini       ierr = MatSetOption(matis_coarse_local_mat,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr);
38530c7d97c5SJed Brown     }
3854a0ba757dSStefano Zampini     ierr = MatSetOption(pcbddc->coarse_mat,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_FALSE);CHKERRQ(ierr);
38550c7d97c5SJed Brown     ierr = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,ADD_VALUES);CHKERRQ(ierr);
38560c7d97c5SJed Brown     ierr = MatAssemblyBegin(pcbddc->coarse_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
38570c7d97c5SJed Brown     ierr = MatAssemblyEnd(pcbddc->coarse_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
38580c7d97c5SJed Brown 
3859da1bb401SStefano Zampini     /*  PetscViewer view_out;
3860da1bb401SStefano Zampini       ierr = PetscViewerASCIIOpen(PETSC_COMM_SELF,"coarsematfull.m",&view_out);CHKERRQ(ierr);
3861da1bb401SStefano Zampini       ierr = PetscViewerSetFormat(view_out,PETSC_VIEWER_ASCII_MATLAB);CHKERRQ(ierr);
3862da1bb401SStefano Zampini       ierr = MatView(pcbddc->coarse_mat,view_out);CHKERRQ(ierr);
3863da1bb401SStefano Zampini       ierr = PetscViewerDestroy(&view_out);CHKERRQ(ierr);*/
3864da1bb401SStefano Zampini 
38650c7d97c5SJed Brown     ierr = MatGetVecs(pcbddc->coarse_mat,&pcbddc->coarse_vec,&pcbddc->coarse_rhs);CHKERRQ(ierr);
38660c7d97c5SJed Brown     /* Preconditioner for coarse problem */
386753cdbc3dSStefano Zampini     ierr = KSPCreate(coarse_comm,&pcbddc->coarse_ksp);CHKERRQ(ierr);
386853cdbc3dSStefano Zampini     ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->coarse_ksp,(PetscObject)pc,1);CHKERRQ(ierr);
386953cdbc3dSStefano Zampini     ierr = KSPSetOperators(pcbddc->coarse_ksp,pcbddc->coarse_mat,pcbddc->coarse_mat,SAME_PRECONDITIONER);CHKERRQ(ierr);
38703b03a366Sstefano_zampini     ierr = KSPSetTolerances(pcbddc->coarse_ksp,PETSC_DEFAULT,PETSC_DEFAULT,PETSC_DEFAULT,max_it_coarse_ksp);CHKERRQ(ierr);
387153cdbc3dSStefano Zampini     ierr = KSPSetType(pcbddc->coarse_ksp,coarse_ksp_type);CHKERRQ(ierr);
387253cdbc3dSStefano Zampini     ierr = KSPGetPC(pcbddc->coarse_ksp,&pc_temp);CHKERRQ(ierr);
387353cdbc3dSStefano Zampini     ierr = PCSetType(pc_temp,coarse_pc_type);CHKERRQ(ierr);
38740c7d97c5SJed Brown     /* Allow user's customization */
3875da1bb401SStefano Zampini     ierr = KSPSetOptionsPrefix(pcbddc->coarse_ksp,"coarse_");CHKERRQ(ierr);
387653cdbc3dSStefano Zampini     ierr = KSPSetFromOptions(pcbddc->coarse_ksp);CHKERRQ(ierr);
38770c7d97c5SJed Brown     /* Set Up PC for coarse problem BDDC */
387853cdbc3dSStefano Zampini     if(pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
3879e269702eSStefano Zampini       if(dbg_flag) {
3880e269702eSStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"----------------Setting up a new level---------------\n");CHKERRQ(ierr);
3881e269702eSStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
3882e269702eSStefano Zampini       }
388353cdbc3dSStefano Zampini       ierr = PCBDDCSetCoarseProblemType(pc_temp,MULTILEVEL_BDDC);CHKERRQ(ierr);
388453cdbc3dSStefano Zampini     }
388553cdbc3dSStefano Zampini     ierr = KSPSetUp(pcbddc->coarse_ksp);CHKERRQ(ierr);
38865619798eSStefano Zampini     if(pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
38875619798eSStefano Zampini       if(dbg_flag) {
38885619798eSStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"----------------New level set------------------------\n");CHKERRQ(ierr);
38895619798eSStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
38905619798eSStefano Zampini       }
38915619798eSStefano Zampini     }
38920c7d97c5SJed Brown   }
38930c7d97c5SJed Brown   if(pcbddc->coarse_communications_type == SCATTERS_BDDC) {
38940c7d97c5SJed Brown      IS local_IS,global_IS;
38950c7d97c5SJed Brown      ierr = ISCreateStride(PETSC_COMM_SELF,pcbddc->local_primal_size,0,1,&local_IS);CHKERRQ(ierr);
38960c7d97c5SJed Brown      ierr = ISCreateGeneral(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_indices,PETSC_COPY_VALUES,&global_IS);CHKERRQ(ierr);
38970c7d97c5SJed Brown      ierr = VecScatterCreate(pcbddc->vec1_P,local_IS,pcbddc->coarse_vec,global_IS,&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr);
38980c7d97c5SJed Brown      ierr = ISDestroy(&local_IS);CHKERRQ(ierr);
38990c7d97c5SJed Brown      ierr = ISDestroy(&global_IS);CHKERRQ(ierr);
39000c7d97c5SJed Brown   }
39010c7d97c5SJed Brown 
39020c7d97c5SJed Brown 
39033b03a366Sstefano_zampini   /* Evaluate condition number of coarse problem for cheby (and verbose output if requested) */
39043b03a366Sstefano_zampini   if( pcbddc->coarse_problem_type == MULTILEVEL_BDDC && rank_prec_comm == active_rank ) {
39050c7d97c5SJed Brown     PetscScalar m_one=-1.0;
39065619798eSStefano Zampini     PetscReal   infty_error,lambda_min,lambda_max,kappa_2;
39073b03a366Sstefano_zampini     const KSPType check_ksp_type=KSPGMRES;
39080c7d97c5SJed Brown 
39095619798eSStefano Zampini     /* change coarse ksp object to an iterative method suitable for extreme eigenvalues' estimation */
39103b03a366Sstefano_zampini     ierr = KSPSetType(pcbddc->coarse_ksp,check_ksp_type);CHKERRQ(ierr);
3911d49ef151SStefano Zampini     ierr = KSPSetComputeSingularValues(pcbddc->coarse_ksp,PETSC_TRUE);CHKERRQ(ierr);
39125619798eSStefano Zampini     ierr = KSPSetTolerances(pcbddc->coarse_ksp,1.e-8,1.e-8,PETSC_DEFAULT,pcbddc->coarse_size);CHKERRQ(ierr);
39135619798eSStefano Zampini     ierr = KSPSetUp(pcbddc->coarse_ksp);CHKERRQ(ierr);
3914d49ef151SStefano Zampini     ierr = VecSetRandom(pcbddc->coarse_rhs,PETSC_NULL);CHKERRQ(ierr);
3915d49ef151SStefano Zampini     ierr = MatMult(pcbddc->coarse_mat,pcbddc->coarse_rhs,pcbddc->coarse_vec);CHKERRQ(ierr);
3916d49ef151SStefano Zampini     ierr = MatMult(pcbddc->coarse_mat,pcbddc->coarse_vec,pcbddc->coarse_rhs);CHKERRQ(ierr);
3917d49ef151SStefano Zampini     ierr = KSPSolve(pcbddc->coarse_ksp,pcbddc->coarse_rhs,pcbddc->coarse_rhs);CHKERRQ(ierr);
3918d49ef151SStefano Zampini     ierr = KSPComputeExtremeSingularValues(pcbddc->coarse_ksp,&lambda_max,&lambda_min);CHKERRQ(ierr);
39193b03a366Sstefano_zampini     if(dbg_flag) {
39205619798eSStefano Zampini       kappa_2=lambda_max/lambda_min;
39215619798eSStefano Zampini       ierr = KSPGetIterationNumber(pcbddc->coarse_ksp,&k);CHKERRQ(ierr);
3922d49ef151SStefano Zampini       ierr = VecAXPY(pcbddc->coarse_rhs,m_one,pcbddc->coarse_vec);CHKERRQ(ierr);
3923d49ef151SStefano Zampini       ierr = VecNorm(pcbddc->coarse_rhs,NORM_INFINITY,&infty_error);CHKERRQ(ierr);
39243b03a366Sstefano_zampini       ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem condition number estimated with %d iterations of %s is: % 1.14e\n",k,check_ksp_type,kappa_2);CHKERRQ(ierr);
3925e269702eSStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem eigenvalues: % 1.14e %1.14e\n",lambda_min,lambda_max);CHKERRQ(ierr);
3926e269702eSStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem infty_error: %1.14e\n",infty_error);CHKERRQ(ierr);
39273b03a366Sstefano_zampini     }
39285619798eSStefano Zampini     /* restore coarse ksp to default values */
3929d49ef151SStefano Zampini     ierr = KSPSetComputeSingularValues(pcbddc->coarse_ksp,PETSC_FALSE);CHKERRQ(ierr);
39305619798eSStefano Zampini     ierr = KSPSetType(pcbddc->coarse_ksp,coarse_ksp_type);CHKERRQ(ierr);
39316c9de887SHong Zhang     ierr = KSPChebyshevSetEigenvalues(pcbddc->coarse_ksp,lambda_max,lambda_min);CHKERRQ(ierr);
39323b03a366Sstefano_zampini     ierr = KSPSetTolerances(pcbddc->coarse_ksp,PETSC_DEFAULT,PETSC_DEFAULT,PETSC_DEFAULT,max_it_coarse_ksp);CHKERRQ(ierr);
39335619798eSStefano Zampini     ierr = KSPSetFromOptions(pcbddc->coarse_ksp);CHKERRQ(ierr);
39345619798eSStefano Zampini     ierr = KSPSetUp(pcbddc->coarse_ksp);CHKERRQ(ierr);
393553cdbc3dSStefano Zampini   }
39360c7d97c5SJed Brown 
39370c7d97c5SJed Brown   /* free data structures no longer needed */
39380c7d97c5SJed Brown   if(coarse_ISLG)                { ierr = ISLocalToGlobalMappingDestroy(&coarse_ISLG);CHKERRQ(ierr); }
39390c7d97c5SJed Brown   if(ins_local_primal_indices)   { ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr);  }
39400c7d97c5SJed Brown   if(ins_coarse_mat_vals)        { ierr = PetscFree(ins_coarse_mat_vals);CHKERRQ(ierr);}
39410c7d97c5SJed Brown   if(localsizes2)                { ierr = PetscFree(localsizes2);CHKERRQ(ierr);}
39420c7d97c5SJed Brown   if(localdispl2)                { ierr = PetscFree(localdispl2);CHKERRQ(ierr);}
39430c7d97c5SJed Brown   if(temp_coarse_mat_vals)       { ierr = PetscFree(temp_coarse_mat_vals);CHKERRQ(ierr);}
39440c7d97c5SJed Brown 
39450c7d97c5SJed Brown   PetscFunctionReturn(0);
39460c7d97c5SJed Brown }
39470c7d97c5SJed Brown 
39480c7d97c5SJed Brown #undef __FUNCT__
39490c7d97c5SJed Brown #define __FUNCT__ "PCBDDCManageLocalBoundaries"
395053cdbc3dSStefano Zampini static PetscErrorCode PCBDDCManageLocalBoundaries(PC pc)
39510c7d97c5SJed Brown {
39520c7d97c5SJed Brown 
39530c7d97c5SJed Brown   PC_BDDC     *pcbddc = (PC_BDDC*)pc->data;
39540c7d97c5SJed Brown   PC_IS         *pcis = (PC_IS*)pc->data;
39550c7d97c5SJed Brown   Mat_IS      *matis  = (Mat_IS*)pc->pmat->data;
3956da1bb401SStefano Zampini   PCBDDCGraph mat_graph=pcbddc->mat_graph;
39573972b0daSStefano Zampini   PetscInt    *queue_in_global_numbering,*is_indices,*auxis;
39583b03a366Sstefano_zampini   PetscInt    bs,ierr,i,j,s,k,iindex,neumann_bsize,dirichlet_bsize;
3959da1bb401SStefano Zampini   PetscInt    total_counts,nodes_touched,where_values=1,vertex_size;
3960534831adSStefano Zampini   PetscMPIInt adapt_interface=0,adapt_interface_reduced=0,NEUMANNCNT=0;
3961da1bb401SStefano Zampini   PetscBool   same_set;
3962a0ba757dSStefano Zampini   MPI_Comm    interface_comm=((PetscObject)pc)->comm;
39633b03a366Sstefano_zampini   PetscBool   use_faces=PETSC_FALSE,use_edges=PETSC_FALSE;
39643b03a366Sstefano_zampini   const PetscInt *neumann_nodes;
39653b03a366Sstefano_zampini   const PetscInt *dirichlet_nodes;
3966a81d60d8SStefano Zampini   IS          used_IS,*custom_ISForDofs;
3967da1bb401SStefano Zampini   PetscScalar *array;
3968da1bb401SStefano Zampini   PetscScalar *array2;
3969da1bb401SStefano Zampini   PetscViewer viewer=pcbddc->dbg_viewer;
39700c7d97c5SJed Brown 
39710c7d97c5SJed Brown   PetscFunctionBegin;
3972da1bb401SStefano Zampini   /* Setup local adjacency graph */
3973da1bb401SStefano Zampini   mat_graph->nvtxs=pcis->n;
3974534831adSStefano Zampini   if(!mat_graph->xadj) { NEUMANNCNT = 1; }
3975da1bb401SStefano Zampini   ierr = PCBDDCSetupLocalAdjacencyGraph(pc);CHKERRQ(ierr);
3976a0ba757dSStefano Zampini   i = mat_graph->nvtxs;
3977a0ba757dSStefano Zampini   ierr = PetscMalloc4(i,PetscInt,&mat_graph->where,i,PetscInt,&mat_graph->count,i+1,PetscInt,&mat_graph->cptr,i,PetscInt,&mat_graph->queue);CHKERRQ(ierr);
39783972b0daSStefano Zampini   ierr = PetscMalloc2(i,PetscInt,&mat_graph->which_dof,i,PetscBool,&mat_graph->touched);CHKERRQ(ierr);
39793972b0daSStefano Zampini   ierr = PetscMalloc(i*sizeof(PetscInt),&queue_in_global_numbering);CHKERRQ(ierr);
3980a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->where,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
3981a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->count,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
3982a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->which_dof,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
3983a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->queue,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
39843828260eSStefano Zampini   ierr = PetscMemzero(mat_graph->cptr,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr);
3985a0ba757dSStefano Zampini 
3986a81d60d8SStefano Zampini   /* Setting dofs splitting in mat_graph->which_dof
3987a81d60d8SStefano Zampini      Get information about dofs' splitting if provided by the user
3988a81d60d8SStefano Zampini      Otherwise it assumes a constant block size */
3989a81d60d8SStefano Zampini   vertex_size=0;
3990a81d60d8SStefano Zampini   if(!pcbddc->n_ISForDofs) {
3991a81d60d8SStefano Zampini     ierr = MatGetBlockSize(matis->A,&bs);CHKERRQ(ierr);
3992a81d60d8SStefano Zampini     ierr = PetscMalloc(bs*sizeof(IS),&custom_ISForDofs);CHKERRQ(ierr);
3993a81d60d8SStefano Zampini     for(i=0;i<bs;i++) {
3994a81d60d8SStefano Zampini       ierr = ISCreateStride(PETSC_COMM_SELF,pcis->n/bs,i,bs,&custom_ISForDofs[i]);CHKERRQ(ierr);
3995a81d60d8SStefano Zampini     }
3996a81d60d8SStefano Zampini     ierr = PCBDDCSetDofsSplitting(pc,bs,custom_ISForDofs);CHKERRQ(ierr);
3997a81d60d8SStefano Zampini     vertex_size=1;
3998a81d60d8SStefano Zampini     /* remove my references to IS objects */
3999a81d60d8SStefano Zampini     for(i=0;i<bs;i++) {
4000a81d60d8SStefano Zampini       ierr = ISDestroy(&custom_ISForDofs[i]);CHKERRQ(ierr);
4001a81d60d8SStefano Zampini     }
4002a81d60d8SStefano Zampini     ierr = PetscFree(custom_ISForDofs);CHKERRQ(ierr);
4003a81d60d8SStefano Zampini   }
40049c0446d6SStefano Zampini   for(i=0;i<pcbddc->n_ISForDofs;i++) {
4005a81d60d8SStefano Zampini     ierr = ISGetSize(pcbddc->ISForDofs[i],&k);CHKERRQ(ierr);
40069c0446d6SStefano Zampini     ierr = ISGetIndices(pcbddc->ISForDofs[i],(const PetscInt**)&is_indices);CHKERRQ(ierr);
4007a81d60d8SStefano Zampini     for(j=0;j<k;j++) {
40089c0446d6SStefano Zampini       mat_graph->which_dof[is_indices[j]]=i;
40099c0446d6SStefano Zampini     }
40109c0446d6SStefano Zampini     ierr = ISRestoreIndices(pcbddc->ISForDofs[i],(const PetscInt**)&is_indices);CHKERRQ(ierr);
40119c0446d6SStefano Zampini   }
4012a81d60d8SStefano Zampini   /* use mat block size as vertex size if it has not yet been set */
4013a81d60d8SStefano Zampini   if(!vertex_size) {
40143b03a366Sstefano_zampini     ierr = MatGetBlockSize(matis->A,&vertex_size);CHKERRQ(ierr);
40150c7d97c5SJed Brown   }
4016a81d60d8SStefano Zampini 
40173b03a366Sstefano_zampini   /* count number of neigh per node */
40180c7d97c5SJed Brown   total_counts=0;
40193b03a366Sstefano_zampini   for(i=1;i<pcis->n_neigh;i++){
40200c7d97c5SJed Brown     s=pcis->n_shared[i];
40210c7d97c5SJed Brown     total_counts+=s;
402253cdbc3dSStefano Zampini     for(j=0;j<s;j++){
40230c7d97c5SJed Brown       mat_graph->count[pcis->shared[i][j]] += 1;
40240c7d97c5SJed Brown     }
40250c7d97c5SJed Brown   }
4026534831adSStefano Zampini   /* Take into account Neumann data -> it increments number of sharing subdomains for nodes lying on the interface */
402736e030ebSStefano Zampini   ierr = PCBDDCGetNeumannBoundaries(pc,&used_IS);CHKERRQ(ierr);
4028da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
4029da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
403036e030ebSStefano Zampini   if(used_IS) {
403136e030ebSStefano Zampini     ierr = ISGetSize(used_IS,&neumann_bsize);CHKERRQ(ierr);
403236e030ebSStefano Zampini     ierr = ISGetIndices(used_IS,&neumann_nodes);CHKERRQ(ierr);
403353cdbc3dSStefano Zampini     for(i=0;i<neumann_bsize;i++){
403453cdbc3dSStefano Zampini       iindex = neumann_nodes[i];
4035534831adSStefano Zampini       if(mat_graph->count[iindex] > NEUMANNCNT && array[iindex]==0.0){
403653cdbc3dSStefano Zampini         mat_graph->count[iindex]+=1;
40370c7d97c5SJed Brown         total_counts++;
4038da1bb401SStefano Zampini         array[iindex]=array[iindex]+1.0;
4039da1bb401SStefano Zampini       } else if(array[iindex]>0.0) {
4040da1bb401SStefano Zampini         SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"Error for neumann nodes provided to BDDC! They must be uniquely listed! Found duplicate node %d\n",iindex);
40410c7d97c5SJed Brown       }
40420c7d97c5SJed Brown     }
40430c7d97c5SJed Brown   }
4044da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4045da1bb401SStefano Zampini   /* allocate space for storing the set of neighbours for each node */
4046da1bb401SStefano Zampini   ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt*),&mat_graph->neighbours_set);CHKERRQ(ierr);
4047da1bb401SStefano Zampini   if(mat_graph->nvtxs) { ierr = PetscMalloc(total_counts*sizeof(PetscInt),&mat_graph->neighbours_set[0]);CHKERRQ(ierr); }
4048da1bb401SStefano Zampini   for(i=1;i<mat_graph->nvtxs;i++) mat_graph->neighbours_set[i]=mat_graph->neighbours_set[i-1]+mat_graph->count[i-1];
4049a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->count,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
40503b03a366Sstefano_zampini   for(i=1;i<pcis->n_neigh;i++){
40510c7d97c5SJed Brown     s=pcis->n_shared[i];
40520c7d97c5SJed Brown     for(j=0;j<s;j++) {
40530c7d97c5SJed Brown       k=pcis->shared[i][j];
4054da1bb401SStefano Zampini       mat_graph->neighbours_set[k][mat_graph->count[k]] = pcis->neigh[i];
40550c7d97c5SJed Brown       mat_graph->count[k]+=1;
40560c7d97c5SJed Brown     }
40570c7d97c5SJed Brown   }
4058da1bb401SStefano Zampini   /* Check consistency of Neumann nodes */
4059da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
4060da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4061da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4062da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4063da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4064da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
40653b03a366Sstefano_zampini   /* set -1 fake neighbour to mimic Neumann boundary */
406636e030ebSStefano Zampini   if(used_IS) {
406753cdbc3dSStefano Zampini     for(i=0;i<neumann_bsize;i++){
406853cdbc3dSStefano Zampini       iindex = neumann_nodes[i];
4069534831adSStefano Zampini       if(mat_graph->count[iindex] > NEUMANNCNT){
4070da1bb401SStefano Zampini         if(mat_graph->count[iindex]+1 != (PetscInt)array[iindex]) {
4071da1bb401SStefano Zampini           SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_USER,"Neumann nodes provided to BDDC must be consistent among neighbours!\nNode %d: number of sharing subdomains %d != number of subdomains for which it is a neumann node %d\n",iindex,mat_graph->count[iindex]+1,(PetscInt)array[iindex]);
4072da1bb401SStefano Zampini         }
4073da1bb401SStefano Zampini         mat_graph->neighbours_set[iindex][mat_graph->count[iindex]] = -1;
407453cdbc3dSStefano Zampini         mat_graph->count[iindex]+=1;
40750c7d97c5SJed Brown       }
40760c7d97c5SJed Brown     }
407736e030ebSStefano Zampini     ierr = ISRestoreIndices(used_IS,&neumann_nodes);CHKERRQ(ierr);
40780c7d97c5SJed Brown   }
4079da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4080da1bb401SStefano Zampini   /* sort set of sharing subdomains */
4081da1bb401SStefano Zampini   for(i=0;i<mat_graph->nvtxs;i++) { ierr = PetscSortInt(mat_graph->count[i],mat_graph->neighbours_set[i]);CHKERRQ(ierr); }
40823b03a366Sstefano_zampini   /* remove interior nodes and dirichlet boundary nodes from the next search into the graph */
4083da1bb401SStefano Zampini   for(i=0;i<mat_graph->nvtxs;i++){mat_graph->touched[i]=PETSC_FALSE;}
4084da1bb401SStefano Zampini   nodes_touched=0;
408536e030ebSStefano Zampini   ierr = PCBDDCGetDirichletBoundaries(pc,&used_IS);CHKERRQ(ierr);
4086da1bb401SStefano Zampini   ierr = VecSet(pcis->vec2_N,0.0);CHKERRQ(ierr);
4087da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4088da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
4089da1bb401SStefano Zampini   if(used_IS) {
4090da1bb401SStefano Zampini     ierr = ISGetSize(used_IS,&dirichlet_bsize);CHKERRQ(ierr);
4091da1bb401SStefano Zampini     if(dirichlet_bsize && matis->pure_neumann) {
4092da1bb401SStefano Zampini       SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"Dirichlet boundaries are intended to be used with matrices with zeroed rows!\n");
4093da1bb401SStefano Zampini     }
4094da1bb401SStefano Zampini     ierr = ISGetIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
4095da1bb401SStefano Zampini     for(i=0;i<dirichlet_bsize;i++){
4096da1bb401SStefano Zampini       iindex=dirichlet_nodes[i];
4097da1bb401SStefano Zampini       if(mat_graph->count[iindex] && !mat_graph->touched[iindex]) {
4098da1bb401SStefano Zampini         if(array[iindex]>0.0) {
4099da1bb401SStefano Zampini           SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"BDDC cannot have nodes which are marked as Neumann and Dirichlet at the same time! Wrong node %d\n",iindex);
4100da1bb401SStefano Zampini         }
4101da1bb401SStefano Zampini         mat_graph->touched[iindex]=PETSC_TRUE;
4102da1bb401SStefano Zampini         mat_graph->where[iindex]=0;
4103da1bb401SStefano Zampini         nodes_touched++;
4104da1bb401SStefano Zampini         array2[iindex]=array2[iindex]+1.0;
4105da1bb401SStefano Zampini       }
4106da1bb401SStefano Zampini     }
4107da1bb401SStefano Zampini     ierr = ISRestoreIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
4108da1bb401SStefano Zampini   }
4109da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4110da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
4111da1bb401SStefano Zampini   /* Check consistency of Dirichlet nodes */
4112da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_N,1.0);CHKERRQ(ierr);
4113da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
4114da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4115da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4116da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4117da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4118da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
4119da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec2_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4120da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec2_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4121da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4122da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4123da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4124da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
412536e030ebSStefano Zampini   if(used_IS) {
412636e030ebSStefano Zampini     ierr = ISGetSize(used_IS,&dirichlet_bsize);CHKERRQ(ierr);
412736e030ebSStefano Zampini     ierr = ISGetIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
41283b03a366Sstefano_zampini     for(i=0;i<dirichlet_bsize;i++){
4129da1bb401SStefano Zampini       iindex=dirichlet_nodes[i];
4130da1bb401SStefano Zampini       if(array[iindex]>1.0 && array[iindex]!=array2[iindex] ) {
4131da1bb401SStefano Zampini          SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_USER,"Dirichlet nodes provided to BDDC must be consistent among neighbours!\nNode %d: number of sharing subdomains %d != number of subdomains for which it is a neumann node %d\n",iindex,(PetscInt)array[iindex],(PetscInt)array2[iindex]);
4132da1bb401SStefano Zampini       }
41333b03a366Sstefano_zampini     }
413436e030ebSStefano Zampini     ierr = ISRestoreIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
41353b03a366Sstefano_zampini   }
4136da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4137da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
4138da1bb401SStefano Zampini 
41390c7d97c5SJed Brown   for(i=0;i<mat_graph->nvtxs;i++){
41403b03a366Sstefano_zampini     if(!mat_graph->count[i]){  /* interior nodes */
41410c7d97c5SJed Brown       mat_graph->touched[i]=PETSC_TRUE;
41420c7d97c5SJed Brown       mat_graph->where[i]=0;
41430c7d97c5SJed Brown       nodes_touched++;
41440c7d97c5SJed Brown     }
41450c7d97c5SJed Brown   }
41460c7d97c5SJed Brown   mat_graph->ncmps = 0;
4147da1bb401SStefano Zampini   i=0;
41480c7d97c5SJed Brown   while(nodes_touched<mat_graph->nvtxs) {
4149a0ba757dSStefano Zampini     /*  find first untouched node in local ordering */
41500c7d97c5SJed Brown     while(mat_graph->touched[i]) i++;
41510c7d97c5SJed Brown     mat_graph->touched[i]=PETSC_TRUE;
4152a0ba757dSStefano Zampini     mat_graph->where[i]=where_values;
41530c7d97c5SJed Brown     nodes_touched++;
4154a0ba757dSStefano Zampini     /* now find all other nodes having the same set of sharing subdomains */
41550c7d97c5SJed Brown     for(j=i+1;j<mat_graph->nvtxs;j++){
4156a0ba757dSStefano Zampini       /* check for same number of sharing subdomains and dof number */
4157da1bb401SStefano Zampini       if(!mat_graph->touched[j] && mat_graph->count[i]==mat_graph->count[j] && mat_graph->which_dof[i] == mat_graph->which_dof[j] ){
4158a0ba757dSStefano Zampini         /* check for same set of sharing subdomains */
41590c7d97c5SJed Brown         same_set=PETSC_TRUE;
41600c7d97c5SJed Brown         for(k=0;k<mat_graph->count[j];k++){
4161da1bb401SStefano Zampini           if(mat_graph->neighbours_set[i][k]!=mat_graph->neighbours_set[j][k]) {
41620c7d97c5SJed Brown             same_set=PETSC_FALSE;
41630c7d97c5SJed Brown           }
41640c7d97c5SJed Brown         }
4165a0ba757dSStefano Zampini         /* I found a friend of mine */
41660c7d97c5SJed Brown         if(same_set) {
4167a0ba757dSStefano Zampini           mat_graph->where[j]=where_values;
41680c7d97c5SJed Brown           mat_graph->touched[j]=PETSC_TRUE;
41690c7d97c5SJed Brown           nodes_touched++;
41700c7d97c5SJed Brown         }
41710c7d97c5SJed Brown       }
41720c7d97c5SJed Brown     }
4173a0ba757dSStefano Zampini     where_values++;
41740c7d97c5SJed Brown   }
4175a0ba757dSStefano Zampini   where_values--; if(where_values<0) where_values=0;
4176a0ba757dSStefano Zampini   ierr = PetscMalloc(where_values*sizeof(PetscMPIInt),&mat_graph->where_ncmps);CHKERRQ(ierr);
4177a0ba757dSStefano Zampini   /* Find connected components defined on the shared interface */
4178a0ba757dSStefano Zampini   if(where_values) {
4179a0ba757dSStefano Zampini     ierr = PCBDDCFindConnectedComponents(mat_graph, where_values);
41803b03a366Sstefano_zampini     /* For consistency among neighbouring procs, I need to sort (by global ordering) each connected component */
4181a0ba757dSStefano Zampini     for(i=0;i<mat_graph->ncmps;i++) {
4182a0ba757dSStefano Zampini       ierr = ISLocalToGlobalMappingApply(matis->mapping,mat_graph->cptr[i+1]-mat_graph->cptr[i],&mat_graph->queue[mat_graph->cptr[i]],&queue_in_global_numbering[mat_graph->cptr[i]]);CHKERRQ(ierr);
4183a0ba757dSStefano Zampini       ierr = PetscSortIntWithArray(mat_graph->cptr[i+1]-mat_graph->cptr[i],&queue_in_global_numbering[mat_graph->cptr[i]],&mat_graph->queue[mat_graph->cptr[i]]);CHKERRQ(ierr);
4184a0ba757dSStefano Zampini     }
4185a0ba757dSStefano Zampini   }
4186a0ba757dSStefano Zampini   /* check consistency of connected components among neighbouring subdomains -> adapt them if needed */
4187a0ba757dSStefano Zampini   for(i=0;i<where_values;i++) {
41883b03a366Sstefano_zampini     /* We are not sure that two connected components will be the same among subdomains sharing a subset of local interface */
41893b03a366Sstefano_zampini     if(mat_graph->where_ncmps[i]>1) {
4190a0ba757dSStefano Zampini       adapt_interface=1;
4191a0ba757dSStefano Zampini       break;
4192a0ba757dSStefano Zampini     }
4193a0ba757dSStefano Zampini   }
4194a0ba757dSStefano Zampini   ierr = MPI_Allreduce(&adapt_interface,&adapt_interface_reduced,1,MPIU_INT,MPI_LOR,interface_comm);CHKERRQ(ierr);
4195da1bb401SStefano Zampini   if(pcbddc->dbg_flag && adapt_interface_reduced) {
4196da1bb401SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"Interface adapted\n");CHKERRQ(ierr);
4197da1bb401SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
4198da1bb401SStefano Zampini   }
4199a0ba757dSStefano Zampini   if(where_values && adapt_interface_reduced) {
42000c7d97c5SJed Brown 
4201a0ba757dSStefano Zampini     PetscInt sum_requests=0,my_rank;
4202a0ba757dSStefano Zampini     PetscInt buffer_size,start_of_recv,size_of_recv,start_of_send;
4203a0ba757dSStefano Zampini     PetscInt temp_buffer_size,ins_val,global_where_counter;
4204a0ba757dSStefano Zampini     PetscInt *cum_recv_counts;
4205a0ba757dSStefano Zampini     PetscInt *where_to_nodes_indices;
4206a0ba757dSStefano Zampini     PetscInt *petsc_buffer;
4207a0ba757dSStefano Zampini     PetscMPIInt *recv_buffer;
4208a0ba757dSStefano Zampini     PetscMPIInt *recv_buffer_where;
4209a0ba757dSStefano Zampini     PetscMPIInt *send_buffer;
4210a0ba757dSStefano Zampini     PetscMPIInt size_of_send;
4211a0ba757dSStefano Zampini     PetscInt *sizes_of_sends;
4212a0ba757dSStefano Zampini     MPI_Request *send_requests;
4213a0ba757dSStefano Zampini     MPI_Request *recv_requests;
4214a0ba757dSStefano Zampini     PetscInt *where_cc_adapt;
4215a0ba757dSStefano Zampini     PetscInt **temp_buffer;
4216a0ba757dSStefano Zampini     PetscInt *nodes_to_temp_buffer_indices;
4217a0ba757dSStefano Zampini     PetscInt *add_to_where;
4218a0ba757dSStefano Zampini 
4219a0ba757dSStefano Zampini     ierr = MPI_Comm_rank(interface_comm,&my_rank);CHKERRQ(ierr);
4220a0ba757dSStefano Zampini     ierr = PetscMalloc((where_values+1)*sizeof(PetscInt),&cum_recv_counts);CHKERRQ(ierr);
4221a0ba757dSStefano Zampini     ierr = PetscMemzero(cum_recv_counts,(where_values+1)*sizeof(PetscInt));CHKERRQ(ierr);
4222a0ba757dSStefano Zampini     ierr = PetscMalloc(where_values*sizeof(PetscInt),&where_to_nodes_indices);CHKERRQ(ierr);
4223a0ba757dSStefano Zampini     /* first count how many neighbours per connected component I will receive from */
4224a0ba757dSStefano Zampini     cum_recv_counts[0]=0;
4225a0ba757dSStefano Zampini     for(i=1;i<where_values+1;i++){
4226a0ba757dSStefano Zampini       j=0;
4227a0ba757dSStefano Zampini       while(mat_graph->where[j] != i) j++;
4228a0ba757dSStefano Zampini       where_to_nodes_indices[i-1]=j;
4229da1bb401SStefano Zampini       if(mat_graph->neighbours_set[j][0]!=-1) { cum_recv_counts[i]=cum_recv_counts[i-1]+mat_graph->count[j]; } /* We don't want sends/recvs_to/from_self -> here I don't count myself  */
42303b03a366Sstefano_zampini       else { cum_recv_counts[i]=cum_recv_counts[i-1]+mat_graph->count[j]-1; }
4231a0ba757dSStefano Zampini     }
4232a0ba757dSStefano Zampini     buffer_size=2*cum_recv_counts[where_values]+mat_graph->nvtxs;
4233a0ba757dSStefano Zampini     ierr = PetscMalloc(2*cum_recv_counts[where_values]*sizeof(PetscMPIInt),&recv_buffer_where);CHKERRQ(ierr);
4234a0ba757dSStefano Zampini     ierr = PetscMalloc(buffer_size*sizeof(PetscMPIInt),&send_buffer);CHKERRQ(ierr);
4235a0ba757dSStefano Zampini     ierr = PetscMalloc(cum_recv_counts[where_values]*sizeof(MPI_Request),&send_requests);CHKERRQ(ierr);
4236a0ba757dSStefano Zampini     ierr = PetscMalloc(cum_recv_counts[where_values]*sizeof(MPI_Request),&recv_requests);CHKERRQ(ierr);
4237a0ba757dSStefano Zampini     for(i=0;i<cum_recv_counts[where_values];i++) {
4238a0ba757dSStefano Zampini       send_requests[i]=MPI_REQUEST_NULL;
4239a0ba757dSStefano Zampini       recv_requests[i]=MPI_REQUEST_NULL;
4240a0ba757dSStefano Zampini     }
4241a0ba757dSStefano Zampini     /* exchange with my neighbours the number of my connected components on the shared interface */
4242a0ba757dSStefano Zampini     for(i=0;i<where_values;i++){
4243a0ba757dSStefano Zampini       j=where_to_nodes_indices[i];
4244da1bb401SStefano Zampini       k = (mat_graph->neighbours_set[j][0] == -1 ?  1 : 0);
4245a0ba757dSStefano Zampini       for(;k<mat_graph->count[j];k++){
4246da1bb401SStefano Zampini         ierr = MPI_Isend(&mat_graph->where_ncmps[i],1,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr);
4247da1bb401SStefano Zampini         ierr = MPI_Irecv(&recv_buffer_where[sum_requests],1,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr);
4248a0ba757dSStefano Zampini         sum_requests++;
4249a0ba757dSStefano Zampini       }
4250a0ba757dSStefano Zampini     }
4251a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4252a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4253a0ba757dSStefano Zampini     /* determine the connected component I need to adapt */
4254a0ba757dSStefano Zampini     ierr = PetscMalloc(where_values*sizeof(PetscInt),&where_cc_adapt);CHKERRQ(ierr);
4255a0ba757dSStefano Zampini     ierr = PetscMemzero(where_cc_adapt,where_values*sizeof(PetscInt));CHKERRQ(ierr);
4256a0ba757dSStefano Zampini     for(i=0;i<where_values;i++){
4257a0ba757dSStefano Zampini       for(j=cum_recv_counts[i];j<cum_recv_counts[i+1];j++){
42583b03a366Sstefano_zampini         /* The first condition is natural (i.e someone has a different number of cc than me), the second one is just to be safe */
42593b03a366Sstefano_zampini         if( mat_graph->where_ncmps[i]!=recv_buffer_where[j] || mat_graph->where_ncmps[i] > 1 ) {
4260a0ba757dSStefano Zampini           where_cc_adapt[i]=PETSC_TRUE;
4261a0ba757dSStefano Zampini           break;
4262a0ba757dSStefano Zampini         }
4263a0ba757dSStefano Zampini       }
4264a0ba757dSStefano Zampini     }
4265a0ba757dSStefano Zampini     /* now get from neighbours their ccs (in global numbering) and adapt them (in case it is needed) */
4266a0ba757dSStefano Zampini     /* first determine how much data to send (size of each queue plus the global indices) and communicate it to neighbours */
4267a0ba757dSStefano Zampini     ierr = PetscMalloc(where_values*sizeof(PetscInt),&sizes_of_sends);CHKERRQ(ierr);
4268a0ba757dSStefano Zampini     ierr = PetscMemzero(sizes_of_sends,where_values*sizeof(PetscInt));CHKERRQ(ierr);
4269a0ba757dSStefano Zampini     sum_requests=0;
4270a0ba757dSStefano Zampini     start_of_send=0;
4271a0ba757dSStefano Zampini     start_of_recv=cum_recv_counts[where_values];
4272a0ba757dSStefano Zampini     for(i=0;i<where_values;i++) {
4273a0ba757dSStefano Zampini       if(where_cc_adapt[i]) {
4274a0ba757dSStefano Zampini         size_of_send=0;
4275a0ba757dSStefano Zampini         for(j=i;j<mat_graph->ncmps;j++) {
4276a0ba757dSStefano Zampini           if(mat_graph->where[mat_graph->queue[mat_graph->cptr[j]]] == i+1) { /* WARNING -> where values goes from 1 to where_values included */
4277a0ba757dSStefano Zampini             send_buffer[start_of_send+size_of_send]=mat_graph->cptr[j+1]-mat_graph->cptr[j];
4278a0ba757dSStefano Zampini             size_of_send+=1;
4279a0ba757dSStefano Zampini             for(k=0;k<mat_graph->cptr[j+1]-mat_graph->cptr[j];k++) {
4280a0ba757dSStefano Zampini               send_buffer[start_of_send+size_of_send+k]=queue_in_global_numbering[mat_graph->cptr[j]+k];
4281a0ba757dSStefano Zampini             }
4282a0ba757dSStefano Zampini             size_of_send=size_of_send+mat_graph->cptr[j+1]-mat_graph->cptr[j];
4283a0ba757dSStefano Zampini           }
4284a0ba757dSStefano Zampini         }
4285a0ba757dSStefano Zampini         j = where_to_nodes_indices[i];
4286da1bb401SStefano Zampini         k = (mat_graph->neighbours_set[j][0] == -1 ?  1 : 0);
428711d8f4c2SStefano Zampini         sizes_of_sends[i]=size_of_send;
4288a0ba757dSStefano Zampini         for(;k<mat_graph->count[j];k++){
428911d8f4c2SStefano Zampini           ierr = MPI_Isend(&sizes_of_sends[i],1,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr);
4290da1bb401SStefano Zampini           ierr = MPI_Irecv(&recv_buffer_where[sum_requests+start_of_recv],1,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr);
4291a0ba757dSStefano Zampini           sum_requests++;
4292a0ba757dSStefano Zampini         }
4293a0ba757dSStefano Zampini         start_of_send+=size_of_send;
4294a0ba757dSStefano Zampini       }
4295a0ba757dSStefano Zampini     }
4296a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4297a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4298a0ba757dSStefano Zampini     buffer_size=0;
4299a0ba757dSStefano Zampini     for(k=0;k<sum_requests;k++) { buffer_size+=recv_buffer_where[start_of_recv+k]; }
4300a0ba757dSStefano Zampini     ierr = PetscMalloc(buffer_size*sizeof(PetscMPIInt),&recv_buffer);CHKERRQ(ierr);
4301a0ba757dSStefano Zampini     /* now exchange the data */
4302a0ba757dSStefano Zampini     start_of_recv=0;
4303a0ba757dSStefano Zampini     start_of_send=0;
4304a0ba757dSStefano Zampini     sum_requests=0;
4305a0ba757dSStefano Zampini     for(i=0;i<where_values;i++) {
4306a0ba757dSStefano Zampini       if(where_cc_adapt[i]) {
4307a0ba757dSStefano Zampini         size_of_send = sizes_of_sends[i];
4308a0ba757dSStefano Zampini         j = where_to_nodes_indices[i];
4309da1bb401SStefano Zampini         k = (mat_graph->neighbours_set[j][0] == -1 ?  1 : 0);
4310a0ba757dSStefano Zampini         for(;k<mat_graph->count[j];k++){
4311da1bb401SStefano Zampini           ierr = MPI_Isend(&send_buffer[start_of_send],size_of_send,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr);
4312a0ba757dSStefano Zampini           size_of_recv=recv_buffer_where[cum_recv_counts[where_values]+sum_requests];
4313da1bb401SStefano Zampini           ierr = MPI_Irecv(&recv_buffer[start_of_recv],size_of_recv,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr);
4314a0ba757dSStefano Zampini           start_of_recv+=size_of_recv;
4315a0ba757dSStefano Zampini           sum_requests++;
4316a0ba757dSStefano Zampini         }
4317a0ba757dSStefano Zampini         start_of_send+=size_of_send;
4318a0ba757dSStefano Zampini       }
4319a0ba757dSStefano Zampini     }
4320a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4321a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4322a0ba757dSStefano Zampini     ierr = PetscMalloc(buffer_size*sizeof(PetscInt),&petsc_buffer);CHKERRQ(ierr);
4323a0ba757dSStefano Zampini     for(k=0;k<start_of_recv;k++) { petsc_buffer[k]=(PetscInt)recv_buffer[k]; }
4324a0ba757dSStefano Zampini     for(j=0;j<buffer_size;) {
4325a0ba757dSStefano Zampini        ierr = ISGlobalToLocalMappingApply(matis->mapping,IS_GTOLM_MASK,petsc_buffer[j],&petsc_buffer[j+1],&petsc_buffer[j],&petsc_buffer[j+1]);CHKERRQ(ierr);
4326a0ba757dSStefano Zampini        k=petsc_buffer[j]+1;
4327a0ba757dSStefano Zampini        j+=k;
4328a0ba757dSStefano Zampini     }
4329a0ba757dSStefano Zampini     sum_requests=cum_recv_counts[where_values];
4330a0ba757dSStefano Zampini     start_of_recv=0;
4331a0ba757dSStefano Zampini     ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt),&nodes_to_temp_buffer_indices);CHKERRQ(ierr);
4332a0ba757dSStefano Zampini     global_where_counter=0;
4333a0ba757dSStefano Zampini     for(i=0;i<where_values;i++){
4334a0ba757dSStefano Zampini       if(where_cc_adapt[i]){
4335a0ba757dSStefano Zampini         temp_buffer_size=0;
4336a0ba757dSStefano Zampini         /* find nodes on the shared interface we need to adapt */
4337a0ba757dSStefano Zampini         for(j=0;j<mat_graph->nvtxs;j++){
4338a0ba757dSStefano Zampini           if(mat_graph->where[j]==i+1) {
4339a0ba757dSStefano Zampini             nodes_to_temp_buffer_indices[j]=temp_buffer_size;
4340a0ba757dSStefano Zampini             temp_buffer_size++;
4341a0ba757dSStefano Zampini           } else {
4342a0ba757dSStefano Zampini             nodes_to_temp_buffer_indices[j]=-1;
4343a0ba757dSStefano Zampini           }
4344a0ba757dSStefano Zampini         }
4345a0ba757dSStefano Zampini         /* allocate some temporary space */
4346a0ba757dSStefano Zampini         ierr = PetscMalloc(temp_buffer_size*sizeof(PetscInt*),&temp_buffer);CHKERRQ(ierr);
4347a0ba757dSStefano Zampini         ierr = PetscMalloc(temp_buffer_size*(cum_recv_counts[i+1]-cum_recv_counts[i])*sizeof(PetscInt),&temp_buffer[0]);CHKERRQ(ierr);
4348a0ba757dSStefano Zampini         ierr = PetscMemzero(temp_buffer[0],temp_buffer_size*(cum_recv_counts[i+1]-cum_recv_counts[i])*sizeof(PetscInt));CHKERRQ(ierr);
4349a0ba757dSStefano Zampini         for(j=1;j<temp_buffer_size;j++){
4350a0ba757dSStefano Zampini           temp_buffer[j]=temp_buffer[j-1]+cum_recv_counts[i+1]-cum_recv_counts[i];
4351a0ba757dSStefano Zampini         }
4352a0ba757dSStefano Zampini         /* analyze contributions from neighbouring subdomains for i-th conn comp
4353a0ba757dSStefano Zampini            temp buffer structure:
4354a0ba757dSStefano Zampini            supposing part of the interface has dimension 5 (global nodes 0,1,2,3,4)
4355a0ba757dSStefano Zampini            3 neighs procs with structured connected components:
4356a0ba757dSStefano Zampini              neigh 0: [0 1 4], [2 3];  (2 connected components)
4357a0ba757dSStefano Zampini              neigh 1: [0 1], [2 3 4];  (2 connected components)
4358a0ba757dSStefano Zampini              neigh 2: [0 4], [1], [2 3]; (3 connected components)
4359a0ba757dSStefano Zampini            tempbuffer (row-oriented) should be filled as:
4360a0ba757dSStefano Zampini              [ 0, 0, 0;
4361a0ba757dSStefano Zampini                0, 0, 1;
4362a0ba757dSStefano Zampini                1, 1, 2;
4363a0ba757dSStefano Zampini                1, 1, 2;
4364a0ba757dSStefano Zampini                0, 1, 0; ];
4365a0ba757dSStefano Zampini            This way we can simply recover the resulting structure, accounting for possible intersections of ccs among neighs.
4366a0ba757dSStefano Zampini            The mat_graph->where array will be modified to reproduce the following 4 connected components [0], [1], [2 3], [4];
4367a0ba757dSStefano Zampini                                                                                                                                    */
4368a0ba757dSStefano Zampini         for(j=0;j<cum_recv_counts[i+1]-cum_recv_counts[i];j++) {
4369a0ba757dSStefano Zampini           ins_val=0;
4370a0ba757dSStefano Zampini           size_of_recv=recv_buffer_where[sum_requests];  /* total size of recv from neighs */
4371a0ba757dSStefano Zampini           for(buffer_size=0;buffer_size<size_of_recv;) {  /* loop until all data from neighs has been taken into account */
4372a0ba757dSStefano Zampini             for(k=1;k<petsc_buffer[buffer_size+start_of_recv]+1;k++) { /* filling properly temp_buffer using data from a single recv */
4373a0ba757dSStefano Zampini               temp_buffer[ nodes_to_temp_buffer_indices[ petsc_buffer[ start_of_recv+buffer_size+k ] ] ][j]=ins_val;
4374a0ba757dSStefano Zampini             }
4375a0ba757dSStefano Zampini             buffer_size+=k;
4376a0ba757dSStefano Zampini             ins_val++;
4377a0ba757dSStefano Zampini           }
4378a0ba757dSStefano Zampini           start_of_recv+=size_of_recv;
4379a0ba757dSStefano Zampini           sum_requests++;
4380a0ba757dSStefano Zampini         }
4381a0ba757dSStefano Zampini         ierr = PetscMalloc(temp_buffer_size*sizeof(PetscInt),&add_to_where);CHKERRQ(ierr);
4382a0ba757dSStefano Zampini         ierr = PetscMemzero(add_to_where,temp_buffer_size*sizeof(PetscInt));CHKERRQ(ierr);
4383a0ba757dSStefano Zampini         for(j=0;j<temp_buffer_size;j++){
4384a0ba757dSStefano Zampini           if(!add_to_where[j]){ /* found a new cc  */
4385a0ba757dSStefano Zampini             global_where_counter++;
4386a0ba757dSStefano Zampini             add_to_where[j]=global_where_counter;
4387a0ba757dSStefano Zampini             for(k=j+1;k<temp_buffer_size;k++){ /* check for other nodes in new cc */
4388a0ba757dSStefano Zampini               same_set=PETSC_TRUE;
4389a0ba757dSStefano Zampini               for(s=0;s<cum_recv_counts[i+1]-cum_recv_counts[i];s++){
4390a0ba757dSStefano Zampini                 if(temp_buffer[j][s]!=temp_buffer[k][s]) {
4391a0ba757dSStefano Zampini                   same_set=PETSC_FALSE;
4392a0ba757dSStefano Zampini                   break;
4393a0ba757dSStefano Zampini                 }
4394a0ba757dSStefano Zampini               }
4395a0ba757dSStefano Zampini               if(same_set) add_to_where[k]=global_where_counter;
4396a0ba757dSStefano Zampini             }
4397a0ba757dSStefano Zampini           }
4398a0ba757dSStefano Zampini         }
4399a0ba757dSStefano Zampini         /* insert new data in where array */
4400a0ba757dSStefano Zampini         temp_buffer_size=0;
4401a0ba757dSStefano Zampini         for(j=0;j<mat_graph->nvtxs;j++){
4402a0ba757dSStefano Zampini           if(mat_graph->where[j]==i+1) {
4403a0ba757dSStefano Zampini             mat_graph->where[j]=where_values+add_to_where[temp_buffer_size];
4404a0ba757dSStefano Zampini             temp_buffer_size++;
4405a0ba757dSStefano Zampini           }
4406a0ba757dSStefano Zampini         }
4407a0ba757dSStefano Zampini         ierr = PetscFree(temp_buffer[0]);CHKERRQ(ierr);
4408a0ba757dSStefano Zampini         ierr = PetscFree(temp_buffer);CHKERRQ(ierr);
4409a0ba757dSStefano Zampini         ierr = PetscFree(add_to_where);CHKERRQ(ierr);
4410a0ba757dSStefano Zampini       }
4411a0ba757dSStefano Zampini     }
4412a0ba757dSStefano Zampini     ierr = PetscFree(nodes_to_temp_buffer_indices);CHKERRQ(ierr);
4413a0ba757dSStefano Zampini     ierr = PetscFree(sizes_of_sends);CHKERRQ(ierr);
4414a0ba757dSStefano Zampini     ierr = PetscFree(send_requests);CHKERRQ(ierr);
4415a0ba757dSStefano Zampini     ierr = PetscFree(recv_requests);CHKERRQ(ierr);
4416a0ba757dSStefano Zampini     ierr = PetscFree(petsc_buffer);CHKERRQ(ierr);
4417a0ba757dSStefano Zampini     ierr = PetscFree(recv_buffer);CHKERRQ(ierr);
4418a0ba757dSStefano Zampini     ierr = PetscFree(recv_buffer_where);CHKERRQ(ierr);
4419a0ba757dSStefano Zampini     ierr = PetscFree(send_buffer);CHKERRQ(ierr);
4420a0ba757dSStefano Zampini     ierr = PetscFree(cum_recv_counts);CHKERRQ(ierr);
4421a0ba757dSStefano Zampini     ierr = PetscFree(where_to_nodes_indices);CHKERRQ(ierr);
442223d4d1a5SStefano Zampini     ierr = PetscFree(where_cc_adapt);CHKERRQ(ierr);
4423a0ba757dSStefano Zampini     /* We are ready to evaluate consistent connected components on each part of the shared interface */
4424a0ba757dSStefano Zampini     if(global_where_counter) {
4425a0ba757dSStefano Zampini       for(i=0;i<mat_graph->nvtxs;i++){ mat_graph->touched[i]=PETSC_FALSE; }
4426a0ba757dSStefano Zampini       global_where_counter=0;
4427a0ba757dSStefano Zampini       for(i=0;i<mat_graph->nvtxs;i++){
4428a0ba757dSStefano Zampini         if(mat_graph->where[i] && !mat_graph->touched[i]) {
4429a0ba757dSStefano Zampini           global_where_counter++;
4430a0ba757dSStefano Zampini           for(j=i+1;j<mat_graph->nvtxs;j++){
4431a0ba757dSStefano Zampini             if(!mat_graph->touched[j] && mat_graph->where[j]==mat_graph->where[i]) {
4432a0ba757dSStefano Zampini               mat_graph->where[j]=global_where_counter;
4433a0ba757dSStefano Zampini               mat_graph->touched[j]=PETSC_TRUE;
4434a0ba757dSStefano Zampini             }
4435a0ba757dSStefano Zampini           }
4436a0ba757dSStefano Zampini           mat_graph->where[i]=global_where_counter;
4437a0ba757dSStefano Zampini           mat_graph->touched[i]=PETSC_TRUE;
4438a0ba757dSStefano Zampini         }
4439a0ba757dSStefano Zampini       }
4440a0ba757dSStefano Zampini       where_values=global_where_counter;
4441a0ba757dSStefano Zampini     }
4442a0ba757dSStefano Zampini     if(global_where_counter) {
4443a0ba757dSStefano Zampini       ierr = PetscMemzero(mat_graph->cptr,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr);
4444a0ba757dSStefano Zampini       ierr = PetscMemzero(mat_graph->queue,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
4445a0ba757dSStefano Zampini       ierr = PetscFree(mat_graph->where_ncmps);CHKERRQ(ierr);
4446a0ba757dSStefano Zampini       ierr = PetscMalloc(where_values*sizeof(PetscMPIInt),&mat_graph->where_ncmps);CHKERRQ(ierr);
4447a0ba757dSStefano Zampini       ierr = PCBDDCFindConnectedComponents(mat_graph, where_values);
4448a0ba757dSStefano Zampini       for(i=0;i<mat_graph->ncmps;i++) {
4449a0ba757dSStefano Zampini         ierr = ISLocalToGlobalMappingApply(matis->mapping,mat_graph->cptr[i+1]-mat_graph->cptr[i],&mat_graph->queue[mat_graph->cptr[i]],&queue_in_global_numbering[mat_graph->cptr[i]]);CHKERRQ(ierr);
4450a0ba757dSStefano Zampini         ierr = PetscSortIntWithArray(mat_graph->cptr[i+1]-mat_graph->cptr[i],&queue_in_global_numbering[mat_graph->cptr[i]],&mat_graph->queue[mat_graph->cptr[i]]);CHKERRQ(ierr);
4451a0ba757dSStefano Zampini       }
4452a0ba757dSStefano Zampini     }
44533b03a366Sstefano_zampini   } /* Finished adapting interface */
44540c7d97c5SJed Brown   PetscInt nfc=0;
44550c7d97c5SJed Brown   PetscInt nec=0;
44560c7d97c5SJed Brown   PetscInt nvc=0;
44573b03a366Sstefano_zampini   PetscBool twodim_flag=PETSC_FALSE;
44580c7d97c5SJed Brown   for (i=0; i<mat_graph->ncmps; i++) {
44593b03a366Sstefano_zampini     if( mat_graph->cptr[i+1]-mat_graph->cptr[i] > vertex_size ){
4460534831adSStefano Zampini       if(mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]==1){ /* 1 neigh Neumann fake included */
44610c7d97c5SJed Brown         nfc++;
44623b03a366Sstefano_zampini       } else { /* note that nec will be zero in 2d */
44633b03a366Sstefano_zampini         nec++;
44643b03a366Sstefano_zampini       }
44650c7d97c5SJed Brown     } else {
44663b03a366Sstefano_zampini       nvc+=mat_graph->cptr[i+1]-mat_graph->cptr[i];
44673b03a366Sstefano_zampini     }
44683b03a366Sstefano_zampini   }
44693b03a366Sstefano_zampini 
44703b03a366Sstefano_zampini   if(!nec) { /* we are in a 2d case -> no faces, only edges */
44713b03a366Sstefano_zampini     nec = nfc;
44723b03a366Sstefano_zampini     nfc = 0;
44733b03a366Sstefano_zampini     twodim_flag = PETSC_TRUE;
44743b03a366Sstefano_zampini   }
44753972b0daSStefano Zampini   /* allocate IS arrays for faces, edges. Vertices need a single index set. */
44763972b0daSStefano Zampini   k=0;
44773972b0daSStefano Zampini   for (i=0; i<mat_graph->ncmps; i++) {
44783972b0daSStefano Zampini     j=mat_graph->cptr[i+1]-mat_graph->cptr[i];
44793972b0daSStefano Zampini     if( j > k) {
44803972b0daSStefano Zampini       k=j;
44813972b0daSStefano Zampini     }
4482ba1573a8SStefano Zampini     if(j<=vertex_size) {
4483ba1573a8SStefano Zampini       k+=vertex_size;
4484ba1573a8SStefano Zampini     }
44853972b0daSStefano Zampini   }
44863972b0daSStefano Zampini   ierr = PetscMalloc(k*sizeof(PetscInt),&auxis);CHKERRQ(ierr);
44873972b0daSStefano Zampini 
44883b03a366Sstefano_zampini   if(!pcbddc->vertices_flag && !pcbddc->edges_flag) {
44893b03a366Sstefano_zampini     ierr = PetscMalloc(nfc*sizeof(IS),&pcbddc->ISForFaces);CHKERRQ(ierr);
44903b03a366Sstefano_zampini     use_faces=PETSC_TRUE;
44913b03a366Sstefano_zampini   }
44923b03a366Sstefano_zampini   if(!pcbddc->vertices_flag && !pcbddc->faces_flag) {
44933b03a366Sstefano_zampini     ierr = PetscMalloc(nec*sizeof(IS),&pcbddc->ISForEdges);CHKERRQ(ierr);
44943b03a366Sstefano_zampini     use_edges=PETSC_TRUE;
44953b03a366Sstefano_zampini   }
44963b03a366Sstefano_zampini   nfc=0;
44973b03a366Sstefano_zampini   nec=0;
44983b03a366Sstefano_zampini   for (i=0; i<mat_graph->ncmps; i++) {
44993b03a366Sstefano_zampini     if( mat_graph->cptr[i+1]-mat_graph->cptr[i] > vertex_size ){
45003b03a366Sstefano_zampini       for(j=0;j<mat_graph->cptr[i+1]-mat_graph->cptr[i];j++) {
45013972b0daSStefano Zampini         auxis[j]=mat_graph->queue[mat_graph->cptr[i]+j];
45023b03a366Sstefano_zampini       }
45033b03a366Sstefano_zampini       if(mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]==1){
45043b03a366Sstefano_zampini         if(twodim_flag) {
45053b03a366Sstefano_zampini           if(use_edges) {
45063972b0daSStefano Zampini             ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForEdges[nec]);CHKERRQ(ierr);
45073b03a366Sstefano_zampini             nec++;
45083b03a366Sstefano_zampini           }
45093b03a366Sstefano_zampini         } else {
45103b03a366Sstefano_zampini           if(use_faces) {
45113972b0daSStefano Zampini             ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForFaces[nfc]);CHKERRQ(ierr);
45123b03a366Sstefano_zampini             nfc++;
45133b03a366Sstefano_zampini           }
45143b03a366Sstefano_zampini         }
45153b03a366Sstefano_zampini       } else {
45163b03a366Sstefano_zampini         if(use_edges) {
45173972b0daSStefano Zampini           ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForEdges[nec]);CHKERRQ(ierr);
45180c7d97c5SJed Brown           nec++;
45190c7d97c5SJed Brown         }
45200c7d97c5SJed Brown       }
45210c7d97c5SJed Brown     }
45223b03a366Sstefano_zampini   }
45233b03a366Sstefano_zampini   pcbddc->n_ISForFaces=nfc;
45243b03a366Sstefano_zampini   pcbddc->n_ISForEdges=nec;
45253b03a366Sstefano_zampini   nvc=0;
45260c7d97c5SJed Brown   if( !pcbddc->constraints_flag ) {
45273b03a366Sstefano_zampini     for (i=0; i<mat_graph->ncmps; i++) {
45283b03a366Sstefano_zampini       if( mat_graph->cptr[i+1]-mat_graph->cptr[i] <= vertex_size ){
45293b03a366Sstefano_zampini         for( j=mat_graph->cptr[i];j<mat_graph->cptr[i+1];j++) {
45303972b0daSStefano Zampini           auxis[nvc]=mat_graph->queue[j];
45310c7d97c5SJed Brown           nvc++;
45320c7d97c5SJed Brown         }
45330c7d97c5SJed Brown       }
45340c7d97c5SJed Brown     }
45350c7d97c5SJed Brown   }
4536a0ba757dSStefano Zampini   /* sort vertex set (by local ordering) */
45373972b0daSStefano Zampini   ierr = PetscSortInt(nvc,auxis);CHKERRQ(ierr);
45383972b0daSStefano Zampini   ierr = ISCreateGeneral(PETSC_COMM_SELF,nvc,auxis,PETSC_COPY_VALUES,&pcbddc->ISForVertices);CHKERRQ(ierr);
45390c7d97c5SJed Brown 
4540e269702eSStefano Zampini   if(pcbddc->dbg_flag) {
4541e269702eSStefano Zampini 
4542d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr);
4543d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Details from PCBDDCManageLocalBoundaries for subdomain %04d\n",PetscGlobalRank);CHKERRQ(ierr);
4544d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr);
4545a0ba757dSStefano Zampini /*    ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Graph (adjacency structure) of local Neumann mat\n");CHKERRQ(ierr);
4546a0ba757dSStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr);
4547e269702eSStefano Zampini     for(i=0;i<mat_graph->nvtxs;i++) {
4548a0ba757dSStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Nodes connected to node number %d are %d\n",i,mat_graph->xadj[i+1]-mat_graph->xadj[i]);CHKERRQ(ierr);
4549e269702eSStefano Zampini       for(j=mat_graph->xadj[i];j<mat_graph->xadj[i+1];j++){
4550a0ba757dSStefano Zampini         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d ",mat_graph->adjncy[j]);CHKERRQ(ierr);
4551e269702eSStefano Zampini       }
4552a0ba757dSStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n--------------------------------------------------------------\n");CHKERRQ(ierr);
4553da1bb401SStefano Zampini     }*/
4554d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Matrix graph has %d connected components", mat_graph->ncmps);CHKERRQ(ierr);
45550c7d97c5SJed Brown     for(i=0;i<mat_graph->ncmps;i++) {
45563b03a366Sstefano_zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\nDetails for connected component number %02d: size %04d, count %01d. Nodes follow.\n",
45573b03a366Sstefano_zampini              i,mat_graph->cptr[i+1]-mat_graph->cptr[i],mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]);CHKERRQ(ierr);
4558da1bb401SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"subdomains: ");
4559da1bb401SStefano Zampini       for (j=0;j<mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]; j++) {
4560da1bb401SStefano Zampini         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d ",mat_graph->neighbours_set[mat_graph->queue[mat_graph->cptr[i]]][j]);
4561da1bb401SStefano Zampini       }
4562da1bb401SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n");
45630c7d97c5SJed Brown       for (j=mat_graph->cptr[i]; j<mat_graph->cptr[i+1]; j++){
4564da1bb401SStefano Zampini         /* ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d (%d), ",queue_in_global_numbering[j],mat_graph->queue[j]);CHKERRQ(ierr); */
4565da1bb401SStefano Zampini         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d, ",mat_graph->queue[j]);CHKERRQ(ierr);
45660c7d97c5SJed Brown       }
45670c7d97c5SJed Brown     }
4568da1bb401SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n--------------------------------------------------------------\n");CHKERRQ(ierr);
45693b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local vertices\n",PetscGlobalRank,nvc);CHKERRQ(ierr);
45703b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local faces\n",PetscGlobalRank,nfc);CHKERRQ(ierr);
45713b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local edges\n",PetscGlobalRank,nec);CHKERRQ(ierr);
4572d49ef151SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
45730c7d97c5SJed Brown   }
45740c7d97c5SJed Brown 
45753972b0daSStefano Zampini   ierr = PetscFree(queue_in_global_numbering);CHKERRQ(ierr);
45763972b0daSStefano Zampini   ierr = PetscFree(auxis);CHKERRQ(ierr);
45770c7d97c5SJed Brown   PetscFunctionReturn(0);
45780c7d97c5SJed Brown 
45790c7d97c5SJed Brown }
45800c7d97c5SJed Brown 
45810c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
45820c7d97c5SJed Brown 
/* The following code has been adapted from function IsConnectedSubdomain contained
   in source file contig.c of METIS library (version 5.0.1).
   It finds the connected components of each partition labeled from 1 to n_dist. */
45860c7d97c5SJed Brown 
45870c7d97c5SJed Brown #undef __FUNCT__
45880c7d97c5SJed Brown #define __FUNCT__ "PCBDDCFindConnectedComponents"
45899c0446d6SStefano Zampini static PetscErrorCode PCBDDCFindConnectedComponents(PCBDDCGraph graph, PetscInt n_dist )
45900c7d97c5SJed Brown {
45910c7d97c5SJed Brown   PetscInt i, j, k, nvtxs, first, last, nleft, ncmps,pid,cum_queue,n,ncmps_pid;
45920c7d97c5SJed Brown   PetscInt *xadj, *adjncy, *where, *queue;
45930c7d97c5SJed Brown   PetscInt *cptr;
45940c7d97c5SJed Brown   PetscBool *touched;
45950c7d97c5SJed Brown 
45960c7d97c5SJed Brown   PetscFunctionBegin;
45970c7d97c5SJed Brown 
45980c7d97c5SJed Brown   nvtxs   = graph->nvtxs;
45990c7d97c5SJed Brown   xadj    = graph->xadj;
46000c7d97c5SJed Brown   adjncy  = graph->adjncy;
46010c7d97c5SJed Brown   where   = graph->where;
46020c7d97c5SJed Brown   touched = graph->touched;
46030c7d97c5SJed Brown   queue   = graph->queue;
46040c7d97c5SJed Brown   cptr    = graph->cptr;
46050c7d97c5SJed Brown 
46060c7d97c5SJed Brown   for (i=0; i<nvtxs; i++)
46070c7d97c5SJed Brown     touched[i] = PETSC_FALSE;
46080c7d97c5SJed Brown 
46090c7d97c5SJed Brown   cum_queue=0;
46100c7d97c5SJed Brown   ncmps=0;
46110c7d97c5SJed Brown 
46120c7d97c5SJed Brown   for(n=0; n<n_dist; n++) {
4613da1bb401SStefano Zampini     pid = n+1;  /* partition labeled by 0 is discarded */
46140c7d97c5SJed Brown     nleft = 0;
46150c7d97c5SJed Brown     for (i=0; i<nvtxs; i++) {
46160c7d97c5SJed Brown       if (where[i] == pid)
46170c7d97c5SJed Brown         nleft++;
46180c7d97c5SJed Brown     }
46190c7d97c5SJed Brown     for (i=0; i<nvtxs; i++) {
46200c7d97c5SJed Brown       if (where[i] == pid)
46210c7d97c5SJed Brown         break;
46220c7d97c5SJed Brown     }
46230c7d97c5SJed Brown     touched[i] = PETSC_TRUE;
46240c7d97c5SJed Brown     queue[cum_queue] = i;
46250c7d97c5SJed Brown     first = 0; last = 1;
46260c7d97c5SJed Brown     cptr[ncmps] = cum_queue;  /* This actually points to queue */
46270c7d97c5SJed Brown     ncmps_pid = 0;
46280c7d97c5SJed Brown     while (first != nleft) {
46290c7d97c5SJed Brown       if (first == last) { /* Find another starting vertex */
46300c7d97c5SJed Brown         cptr[++ncmps] = first+cum_queue;
46310c7d97c5SJed Brown         ncmps_pid++;
46320c7d97c5SJed Brown         for (i=0; i<nvtxs; i++) {
46330c7d97c5SJed Brown           if (where[i] == pid && !touched[i])
46340c7d97c5SJed Brown             break;
46350c7d97c5SJed Brown         }
46360c7d97c5SJed Brown         queue[cum_queue+last] = i;
46370c7d97c5SJed Brown         last++;
46380c7d97c5SJed Brown         touched[i] = PETSC_TRUE;
46390c7d97c5SJed Brown       }
46400c7d97c5SJed Brown       i = queue[cum_queue+first];
46410c7d97c5SJed Brown       first++;
46420c7d97c5SJed Brown       for (j=xadj[i]; j<xadj[i+1]; j++) {
46430c7d97c5SJed Brown         k = adjncy[j];
46440c7d97c5SJed Brown         if (where[k] == pid && !touched[k]) {
46450c7d97c5SJed Brown           queue[cum_queue+last] = k;
46460c7d97c5SJed Brown           last++;
46470c7d97c5SJed Brown           touched[k] = PETSC_TRUE;
46480c7d97c5SJed Brown         }
46490c7d97c5SJed Brown       }
46500c7d97c5SJed Brown     }
46510c7d97c5SJed Brown     cptr[++ncmps] = first+cum_queue;
46520c7d97c5SJed Brown     ncmps_pid++;
46530c7d97c5SJed Brown     cum_queue=cptr[ncmps];
4654a0ba757dSStefano Zampini     graph->where_ncmps[n] = ncmps_pid;
46550c7d97c5SJed Brown   }
46560c7d97c5SJed Brown   graph->ncmps = ncmps;
46570c7d97c5SJed Brown 
46580c7d97c5SJed Brown   PetscFunctionReturn(0);
46590c7d97c5SJed Brown }
4660