xref: /petsc/src/ksp/pc/impls/bddc/bddc.c (revision 93dc3b609793c36ad3d3a530f4e276bb50cf9238)
/* TODOLIST
   DofSplitting and DM attached to pc?
   Change SetNeumannBoundaries to SetNeumannBoundariesLocal and provide new SetNeumannBoundaries (same for Dirichlet)
     - change prec_type to switch_inexact_prec_type
   Inexact solvers: global preconditioner application is ready, ask the developers (Jed?) how to best implement Dohrmann's approach (PCSHELL?)
   change how to deal with the coarse problem (PCBDDCSetCoarseEnvironment):
     - mind the problem with coarsening_factor
     - simplify coarse problem structure -> PCBDDC or PCREDUNDANT, nothing else -> same comm for all levels?
     - remove coarse enums and allow use of PCBDDCGetCoarseKSP
     - remove metis dependency -> use MatPartitioning for multilevel -> Assemble serial adjacency in ManageLocalBoundaries?
     - Add levels' slot to bddc data structure and associated Set/Get functions
   code refactoring:
     - pick up better names for static functions
   change options structure:
     - insert BDDC into MG framework?
   provide other ops? Ask the developers
   remove all unused printf
   man pages
*/
200c7d97c5SJed Brown 
2153cdbc3dSStefano Zampini /* ----------------------------------------------------------------------------------------------------------------------------------------------
220c7d97c5SJed Brown    Implementation of BDDC preconditioner based on:
230c7d97c5SJed Brown    C. Dohrmann "An approximate BDDC preconditioner", Numerical Linear Algebra with Applications Volume 14, Issue 2, pages 149-168, March 2007
2453cdbc3dSStefano Zampini    ---------------------------------------------------------------------------------------------------------------------------------------------- */
2553cdbc3dSStefano Zampini 
2653cdbc3dSStefano Zampini #include "bddc.h" /*I "petscpc.h" I*/  /* includes for fortran wrappers */
273b03a366Sstefano_zampini #include <petscblaslapack.h>
280c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
290c7d97c5SJed Brown #undef __FUNCT__
300c7d97c5SJed Brown #define __FUNCT__ "PCSetFromOptions_BDDC"
310c7d97c5SJed Brown PetscErrorCode PCSetFromOptions_BDDC(PC pc)
320c7d97c5SJed Brown {
330c7d97c5SJed Brown   PC_BDDC         *pcbddc = (PC_BDDC*)pc->data;
340c7d97c5SJed Brown   PetscErrorCode ierr;
350c7d97c5SJed Brown 
360c7d97c5SJed Brown   PetscFunctionBegin;
370c7d97c5SJed Brown   ierr = PetscOptionsHead("BDDC options");CHKERRQ(ierr);
380c7d97c5SJed Brown   /* Verbose debugging of main data structures */
39e269702eSStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_check_all"       ,"Verbose (debugging) output for PCBDDC"                       ,"none",pcbddc->dbg_flag      ,&pcbddc->dbg_flag      ,PETSC_NULL);CHKERRQ(ierr);
400c7d97c5SJed Brown   /* Some customization for default primal space */
41da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_vertices_only"   ,"Use only vertices in coarse space (i.e. discard constraints)","none",pcbddc->vertices_flag   ,&pcbddc->vertices_flag   ,PETSC_NULL);CHKERRQ(ierr);
42da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_constraints_only","Use only constraints in coarse space (i.e. discard vertices)","none",pcbddc->constraints_flag,&pcbddc->constraints_flag,PETSC_NULL);CHKERRQ(ierr);
43da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_faces_only"      ,"Use only faces among constraints of coarse space (i.e. discard edges)"         ,"none",pcbddc->faces_flag      ,&pcbddc->faces_flag      ,PETSC_NULL);CHKERRQ(ierr);
44da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_edges_only"      ,"Use only edges among constraints of coarse space (i.e. discard faces)"         ,"none",pcbddc->edges_flag      ,&pcbddc->edges_flag      ,PETSC_NULL);CHKERRQ(ierr);
450c7d97c5SJed Brown   /* Coarse solver context */
46da1bb401SStefano Zampini   static const char *avail_coarse_problems[] = {"sequential","replicated","parallel","multilevel",""}; /*order of choiches depends on ENUM defined in bddc.h */
470c7d97c5SJed Brown   ierr = PetscOptionsEnum("-pc_bddc_coarse_problem_type","Set coarse problem type","none",avail_coarse_problems,(PetscEnum)pcbddc->coarse_problem_type,(PetscEnum*)&pcbddc->coarse_problem_type,PETSC_NULL);CHKERRQ(ierr);
480c7d97c5SJed Brown   /* Two different application of BDDC to the whole set of dofs, internal and interface */
490c7d97c5SJed Brown   ierr = PetscOptionsBool("-pc_bddc_switch_preconditioning_type","Switch between M_2 (default) and M_3 preconditioners (as defined by Dohrmann)","none",pcbddc->prec_type,&pcbddc->prec_type,PETSC_NULL);CHKERRQ(ierr);
50534831adSStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_use_change_of_basis","Use change of basis approach for primal space","none",pcbddc->usechangeofbasis,&pcbddc->usechangeofbasis,PETSC_NULL);CHKERRQ(ierr);
51534831adSStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_use_change_on_faces","Use change of basis approach for face constraints","none",pcbddc->usechangeonfaces,&pcbddc->usechangeonfaces,PETSC_NULL);CHKERRQ(ierr);
52534831adSStefano Zampini   pcbddc->usechangeonfaces = pcbddc->usechangeonfaces && pcbddc->usechangeofbasis;
530c7d97c5SJed Brown   ierr = PetscOptionsInt("-pc_bddc_coarsening_ratio","Set coarsening ratio used in multilevel coarsening","none",pcbddc->coarsening_ratio,&pcbddc->coarsening_ratio,PETSC_NULL);CHKERRQ(ierr);
540c7d97c5SJed Brown   ierr = PetscOptionsTail();CHKERRQ(ierr);
550c7d97c5SJed Brown   PetscFunctionReturn(0);
560c7d97c5SJed Brown }
570c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
580c7d97c5SJed Brown EXTERN_C_BEGIN
590c7d97c5SJed Brown #undef __FUNCT__
600c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetCoarseProblemType_BDDC"
6153cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetCoarseProblemType_BDDC(PC pc, CoarseProblemType CPT)
620c7d97c5SJed Brown {
630c7d97c5SJed Brown   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
640c7d97c5SJed Brown 
650c7d97c5SJed Brown   PetscFunctionBegin;
660c7d97c5SJed Brown   pcbddc->coarse_problem_type = CPT;
670c7d97c5SJed Brown   PetscFunctionReturn(0);
680c7d97c5SJed Brown }
690c7d97c5SJed Brown EXTERN_C_END
700c7d97c5SJed Brown #undef __FUNCT__
710c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetCoarseProblemType"
7253cdbc3dSStefano Zampini /*@
739c0446d6SStefano Zampini  PCBDDCSetCoarseProblemType - Set coarse problem type in PCBDDC.
7453cdbc3dSStefano Zampini 
759c0446d6SStefano Zampini    Not collective
7653cdbc3dSStefano Zampini 
7753cdbc3dSStefano Zampini    Input Parameters:
7853cdbc3dSStefano Zampini +  pc - the preconditioning context
7953cdbc3dSStefano Zampini -  CoarseProblemType - pick a better name and explain what this is
8053cdbc3dSStefano Zampini 
8153cdbc3dSStefano Zampini    Level: intermediate
8253cdbc3dSStefano Zampini 
8353cdbc3dSStefano Zampini    Notes:
84da1bb401SStefano Zampini    Not collective but all procs must call with same arguments.
8553cdbc3dSStefano Zampini 
8653cdbc3dSStefano Zampini .seealso: PCBDDC
8753cdbc3dSStefano Zampini @*/
880c7d97c5SJed Brown PetscErrorCode PCBDDCSetCoarseProblemType(PC pc, CoarseProblemType CPT)
890c7d97c5SJed Brown {
900c7d97c5SJed Brown   PetscErrorCode ierr;
910c7d97c5SJed Brown 
920c7d97c5SJed Brown   PetscFunctionBegin;
930c7d97c5SJed Brown   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
940c7d97c5SJed Brown   ierr = PetscTryMethod(pc,"PCBDDCSetCoarseProblemType_C",(PC,CoarseProblemType),(pc,CPT));CHKERRQ(ierr);
950c7d97c5SJed Brown   PetscFunctionReturn(0);
960c7d97c5SJed Brown }
970c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
980c7d97c5SJed Brown EXTERN_C_BEGIN
990c7d97c5SJed Brown #undef __FUNCT__
1003b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCSetDirichletBoundaries_BDDC"
1013b03a366Sstefano_zampini static PetscErrorCode PCBDDCSetDirichletBoundaries_BDDC(PC pc,IS DirichletBoundaries)
1023b03a366Sstefano_zampini {
1033b03a366Sstefano_zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
1043b03a366Sstefano_zampini   PetscErrorCode ierr;
1053b03a366Sstefano_zampini 
1063b03a366Sstefano_zampini   PetscFunctionBegin;
1073b03a366Sstefano_zampini   ierr = ISDestroy(&pcbddc->DirichletBoundaries);CHKERRQ(ierr);
10836e030ebSStefano Zampini   ierr = PetscObjectReference((PetscObject)DirichletBoundaries);CHKERRQ(ierr);
10936e030ebSStefano Zampini   pcbddc->DirichletBoundaries=DirichletBoundaries;
1103b03a366Sstefano_zampini   PetscFunctionReturn(0);
1113b03a366Sstefano_zampini }
1123b03a366Sstefano_zampini EXTERN_C_END
1133b03a366Sstefano_zampini #undef __FUNCT__
1143b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCSetDirichletBoundaries"
1153b03a366Sstefano_zampini /*@
116da1bb401SStefano Zampini  PCBDDCSetDirichletBoundaries - Set index set defining subdomain part (in local ordering)
117da1bb401SStefano Zampini                               of Dirichlet boundaries for the global problem.
1183b03a366Sstefano_zampini 
1193b03a366Sstefano_zampini    Not collective
1203b03a366Sstefano_zampini 
1213b03a366Sstefano_zampini    Input Parameters:
1223b03a366Sstefano_zampini +  pc - the preconditioning context
1233b03a366Sstefano_zampini -  DirichletBoundaries - sequential index set defining the subdomain part of Dirichlet boundaries (can be PETSC_NULL)
1243b03a366Sstefano_zampini 
1253b03a366Sstefano_zampini    Level: intermediate
1263b03a366Sstefano_zampini 
1273b03a366Sstefano_zampini    Notes:
1283b03a366Sstefano_zampini 
1293b03a366Sstefano_zampini .seealso: PCBDDC
1303b03a366Sstefano_zampini @*/
1313b03a366Sstefano_zampini PetscErrorCode PCBDDCSetDirichletBoundaries(PC pc,IS DirichletBoundaries)
1323b03a366Sstefano_zampini {
1333b03a366Sstefano_zampini   PetscErrorCode ierr;
1343b03a366Sstefano_zampini 
1353b03a366Sstefano_zampini   PetscFunctionBegin;
1363b03a366Sstefano_zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
1373b03a366Sstefano_zampini   ierr = PetscTryMethod(pc,"PCBDDCSetDirichletBoundaries_C",(PC,IS),(pc,DirichletBoundaries));CHKERRQ(ierr);
1383b03a366Sstefano_zampini   PetscFunctionReturn(0);
1393b03a366Sstefano_zampini }
1403b03a366Sstefano_zampini /* -------------------------------------------------------------------------- */
1413b03a366Sstefano_zampini EXTERN_C_BEGIN
1423b03a366Sstefano_zampini #undef __FUNCT__
1430c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetNeumannBoundaries_BDDC"
14453cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetNeumannBoundaries_BDDC(PC pc,IS NeumannBoundaries)
1450c7d97c5SJed Brown {
1460c7d97c5SJed Brown   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
14753cdbc3dSStefano Zampini   PetscErrorCode ierr;
1480c7d97c5SJed Brown 
1490c7d97c5SJed Brown   PetscFunctionBegin;
15053cdbc3dSStefano Zampini   ierr = ISDestroy(&pcbddc->NeumannBoundaries);CHKERRQ(ierr);
15136e030ebSStefano Zampini   ierr = PetscObjectReference((PetscObject)NeumannBoundaries);CHKERRQ(ierr);
15236e030ebSStefano Zampini   pcbddc->NeumannBoundaries=NeumannBoundaries;
1530c7d97c5SJed Brown   PetscFunctionReturn(0);
1540c7d97c5SJed Brown }
1550c7d97c5SJed Brown EXTERN_C_END
1560c7d97c5SJed Brown #undef __FUNCT__
1570c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetNeumannBoundaries"
15857527edcSJed Brown /*@
159da1bb401SStefano Zampini  PCBDDCSetNeumannBoundaries - Set index set defining subdomain part (in local ordering)
160da1bb401SStefano Zampini                               of Neumann boundaries for the global problem.
16157527edcSJed Brown 
1629c0446d6SStefano Zampini    Not collective
16357527edcSJed Brown 
16457527edcSJed Brown    Input Parameters:
16557527edcSJed Brown +  pc - the preconditioning context
1669c0446d6SStefano Zampini -  NeumannBoundaries - sequential index set defining the subdomain part of Neumann boundaries (can be PETSC_NULL)
16757527edcSJed Brown 
16857527edcSJed Brown    Level: intermediate
16957527edcSJed Brown 
17057527edcSJed Brown    Notes:
17157527edcSJed Brown 
17257527edcSJed Brown .seealso: PCBDDC
17357527edcSJed Brown @*/
17453cdbc3dSStefano Zampini PetscErrorCode PCBDDCSetNeumannBoundaries(PC pc,IS NeumannBoundaries)
1750c7d97c5SJed Brown {
1760c7d97c5SJed Brown   PetscErrorCode ierr;
1770c7d97c5SJed Brown 
1780c7d97c5SJed Brown   PetscFunctionBegin;
1790c7d97c5SJed Brown   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
18053cdbc3dSStefano Zampini   ierr = PetscTryMethod(pc,"PCBDDCSetNeumannBoundaries_C",(PC,IS),(pc,NeumannBoundaries));CHKERRQ(ierr);
18153cdbc3dSStefano Zampini   PetscFunctionReturn(0);
18253cdbc3dSStefano Zampini }
18353cdbc3dSStefano Zampini /* -------------------------------------------------------------------------- */
18453cdbc3dSStefano Zampini EXTERN_C_BEGIN
18553cdbc3dSStefano Zampini #undef __FUNCT__
186da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCGetDirichletBoundaries_BDDC"
187da1bb401SStefano Zampini static PetscErrorCode PCBDDCGetDirichletBoundaries_BDDC(PC pc,IS *DirichletBoundaries)
188da1bb401SStefano Zampini {
189da1bb401SStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
190da1bb401SStefano Zampini 
191da1bb401SStefano Zampini   PetscFunctionBegin;
192da1bb401SStefano Zampini   *DirichletBoundaries = pcbddc->DirichletBoundaries;
193da1bb401SStefano Zampini   PetscFunctionReturn(0);
194da1bb401SStefano Zampini }
195da1bb401SStefano Zampini EXTERN_C_END
196da1bb401SStefano Zampini #undef __FUNCT__
197da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCGetDirichletBoundaries"
198da1bb401SStefano Zampini /*@
199da1bb401SStefano Zampini  PCBDDCGetDirichletBoundaries - Get index set defining subdomain part (in local ordering)
200da1bb401SStefano Zampini                                 of Dirichlet boundaries for the global problem.
201da1bb401SStefano Zampini 
202da1bb401SStefano Zampini    Not collective
203da1bb401SStefano Zampini 
204da1bb401SStefano Zampini    Input Parameters:
205da1bb401SStefano Zampini +  pc - the preconditioning context
206da1bb401SStefano Zampini 
207da1bb401SStefano Zampini    Output Parameters:
208da1bb401SStefano Zampini +  DirichletBoundaries - index set defining the subdomain part of Dirichlet boundaries
209da1bb401SStefano Zampini 
210da1bb401SStefano Zampini    Level: intermediate
211da1bb401SStefano Zampini 
212da1bb401SStefano Zampini    Notes:
213da1bb401SStefano Zampini 
214da1bb401SStefano Zampini .seealso: PCBDDC
215da1bb401SStefano Zampini @*/
216da1bb401SStefano Zampini PetscErrorCode PCBDDCGetDirichletBoundaries(PC pc,IS *DirichletBoundaries)
217da1bb401SStefano Zampini {
218da1bb401SStefano Zampini   PetscErrorCode ierr;
219da1bb401SStefano Zampini 
220da1bb401SStefano Zampini   PetscFunctionBegin;
221da1bb401SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
222da1bb401SStefano Zampini   ierr = PetscUseMethod(pc,"PCBDDCGetDirichletBoundaries_C",(PC,IS*),(pc,DirichletBoundaries));CHKERRQ(ierr);
223da1bb401SStefano Zampini   PetscFunctionReturn(0);
224da1bb401SStefano Zampini }
225da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
226da1bb401SStefano Zampini EXTERN_C_BEGIN
227da1bb401SStefano Zampini #undef __FUNCT__
22853cdbc3dSStefano Zampini #define __FUNCT__ "PCBDDCGetNeumannBoundaries_BDDC"
22953cdbc3dSStefano Zampini static PetscErrorCode PCBDDCGetNeumannBoundaries_BDDC(PC pc,IS *NeumannBoundaries)
23053cdbc3dSStefano Zampini {
23153cdbc3dSStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
23253cdbc3dSStefano Zampini 
23353cdbc3dSStefano Zampini   PetscFunctionBegin;
23453cdbc3dSStefano Zampini   *NeumannBoundaries = pcbddc->NeumannBoundaries;
23553cdbc3dSStefano Zampini   PetscFunctionReturn(0);
23653cdbc3dSStefano Zampini }
23753cdbc3dSStefano Zampini EXTERN_C_END
23853cdbc3dSStefano Zampini #undef __FUNCT__
23953cdbc3dSStefano Zampini #define __FUNCT__ "PCBDDCGetNeumannBoundaries"
24053cdbc3dSStefano Zampini /*@
241da1bb401SStefano Zampini  PCBDDCGetNeumannBoundaries - Get index set defining subdomain part (in local ordering)
242da1bb401SStefano Zampini                               of Neumann boundaries for the global problem.
24353cdbc3dSStefano Zampini 
2449c0446d6SStefano Zampini    Not collective
24553cdbc3dSStefano Zampini 
24653cdbc3dSStefano Zampini    Input Parameters:
24753cdbc3dSStefano Zampini +  pc - the preconditioning context
24853cdbc3dSStefano Zampini 
24953cdbc3dSStefano Zampini    Output Parameters:
25053cdbc3dSStefano Zampini +  NeumannBoundaries - index set defining the subdomain part of Neumann boundaries
25153cdbc3dSStefano Zampini 
25253cdbc3dSStefano Zampini    Level: intermediate
25353cdbc3dSStefano Zampini 
25453cdbc3dSStefano Zampini    Notes:
25553cdbc3dSStefano Zampini 
25653cdbc3dSStefano Zampini .seealso: PCBDDC
25753cdbc3dSStefano Zampini @*/
25853cdbc3dSStefano Zampini PetscErrorCode PCBDDCGetNeumannBoundaries(PC pc,IS *NeumannBoundaries)
25953cdbc3dSStefano Zampini {
26053cdbc3dSStefano Zampini   PetscErrorCode ierr;
26153cdbc3dSStefano Zampini 
26253cdbc3dSStefano Zampini   PetscFunctionBegin;
26353cdbc3dSStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
26453cdbc3dSStefano Zampini   ierr = PetscUseMethod(pc,"PCBDDCGetNeumannBoundaries_C",(PC,IS*),(pc,NeumannBoundaries));CHKERRQ(ierr);
2650c7d97c5SJed Brown   PetscFunctionReturn(0);
2660c7d97c5SJed Brown }
26736e030ebSStefano Zampini /* -------------------------------------------------------------------------- */
26836e030ebSStefano Zampini EXTERN_C_BEGIN
26936e030ebSStefano Zampini #undef __FUNCT__
270da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetLocalAdjacencyGraph_BDDC"
271da1bb401SStefano Zampini static PetscErrorCode PCBDDCSetLocalAdjacencyGraph_BDDC(PC pc, PetscInt nvtxs, PetscInt xadj[], PetscInt adjncy[], PetscCopyMode copymode)
27236e030ebSStefano Zampini {
27336e030ebSStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
274da1bb401SStefano Zampini   PCBDDCGraph    mat_graph=pcbddc->mat_graph;
275da1bb401SStefano Zampini   PetscErrorCode ierr;
27636e030ebSStefano Zampini 
27736e030ebSStefano Zampini   PetscFunctionBegin;
278da1bb401SStefano Zampini   mat_graph->nvtxs=nvtxs;
279da1bb401SStefano Zampini   ierr = PetscFree(mat_graph->xadj);CHKERRQ(ierr);
280da1bb401SStefano Zampini   ierr = PetscFree(mat_graph->adjncy);CHKERRQ(ierr);
281da1bb401SStefano Zampini   if(copymode == PETSC_COPY_VALUES) {
282da1bb401SStefano Zampini     ierr = PetscMalloc((mat_graph->nvtxs+1)*sizeof(PetscInt),&mat_graph->xadj);CHKERRQ(ierr);
283da1bb401SStefano Zampini     ierr = PetscMalloc(xadj[mat_graph->nvtxs]*sizeof(PetscInt),&mat_graph->adjncy);CHKERRQ(ierr);
284da1bb401SStefano Zampini     ierr = PetscMemcpy(mat_graph->xadj,xadj,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr);
285da1bb401SStefano Zampini     ierr = PetscMemcpy(mat_graph->adjncy,adjncy,xadj[mat_graph->nvtxs]*sizeof(PetscInt));CHKERRQ(ierr);
286da1bb401SStefano Zampini   } else if(copymode == PETSC_OWN_POINTER) {
287da1bb401SStefano Zampini     mat_graph->xadj=xadj;
288da1bb401SStefano Zampini     mat_graph->adjncy=adjncy;
289da1bb401SStefano Zampini   } else {
290da1bb401SStefano Zampini     SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_SUP,"Unsupported copy mode %d in %s\n",copymode,__FUNCT__);
291da1bb401SStefano Zampini   }
29236e030ebSStefano Zampini   PetscFunctionReturn(0);
29336e030ebSStefano Zampini }
29436e030ebSStefano Zampini EXTERN_C_END
29536e030ebSStefano Zampini #undef __FUNCT__
296da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetLocalAdjacencyGraph"
29736e030ebSStefano Zampini /*@
298da1bb401SStefano Zampini  PCBDDCSetLocalAdjacencyGraph - Set CSR graph of local matrix for use of PCBDDC.
29936e030ebSStefano Zampini 
30036e030ebSStefano Zampini    Not collective
30136e030ebSStefano Zampini 
30236e030ebSStefano Zampini    Input Parameters:
30336e030ebSStefano Zampini +  pc - the preconditioning context
304da1bb401SStefano Zampini -  nvtxs - number of local vertices of the graph
305da1bb401SStefano Zampini -  xadj, adjncy - the CSR graph
306da1bb401SStefano Zampini -  copymode - either PETSC_COPY_VALUES or PETSC_OWN_POINTER. In the former case the user must free the array passed in;
307da1bb401SStefano Zampini                                                              in the latter case, memory must be obtained with PetscMalloc.
30836e030ebSStefano Zampini 
30936e030ebSStefano Zampini    Level: intermediate
31036e030ebSStefano Zampini 
31136e030ebSStefano Zampini    Notes:
31236e030ebSStefano Zampini 
31336e030ebSStefano Zampini .seealso: PCBDDC
31436e030ebSStefano Zampini @*/
315da1bb401SStefano Zampini PetscErrorCode PCBDDCSetLocalAdjacencyGraph(PC pc,PetscInt nvtxs,PetscInt xadj[],PetscInt adjncy[], PetscCopyMode copymode)
31636e030ebSStefano Zampini {
317da1bb401SStefano Zampini   PetscInt       nrows,ncols;
318da1bb401SStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
31936e030ebSStefano Zampini   PetscErrorCode ierr;
32036e030ebSStefano Zampini 
32136e030ebSStefano Zampini   PetscFunctionBegin;
32236e030ebSStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
323da1bb401SStefano Zampini   ierr = MatGetSize(matis->A,&nrows,&ncols);CHKERRQ(ierr);
324da1bb401SStefano Zampini   if(nvtxs != nrows) {
325da1bb401SStefano Zampini     SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Local adjacency size %d passed in %s differs from local problem size %d!\n",nvtxs,__FUNCT__,nrows);
326da1bb401SStefano Zampini   } else {
327da1bb401SStefano Zampini     ierr = PetscTryMethod(pc,"PCBDDCSetLocalAdjacencyGraph_C",(PC,PetscInt,PetscInt[],PetscInt[],PetscCopyMode),(pc,nvtxs,xadj,adjncy,copymode));CHKERRQ(ierr);
328da1bb401SStefano Zampini   }
32936e030ebSStefano Zampini   PetscFunctionReturn(0);
33036e030ebSStefano Zampini }
3319c0446d6SStefano Zampini /* -------------------------------------------------------------------------- */
3329c0446d6SStefano Zampini EXTERN_C_BEGIN
3339c0446d6SStefano Zampini #undef __FUNCT__
3349c0446d6SStefano Zampini #define __FUNCT__ "PCBDDCSetDofsSplitting_BDDC"
3359c0446d6SStefano Zampini static PetscErrorCode PCBDDCSetDofsSplitting_BDDC(PC pc,PetscInt n_is, IS ISForDofs[])
3369c0446d6SStefano Zampini {
3379c0446d6SStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
3389c0446d6SStefano Zampini   PetscInt i;
3399c0446d6SStefano Zampini   PetscErrorCode ierr;
3409c0446d6SStefano Zampini 
3419c0446d6SStefano Zampini   PetscFunctionBegin;
342da1bb401SStefano Zampini   /* Destroy ISes if they were already set */
3439c0446d6SStefano Zampini   for(i=0;i<pcbddc->n_ISForDofs;i++) {
3449c0446d6SStefano Zampini     ierr = ISDestroy(&pcbddc->ISForDofs[i]);CHKERRQ(ierr);
3459c0446d6SStefano Zampini   }
346d11ae9bbSstefano_zampini   ierr = PetscFree(pcbddc->ISForDofs);CHKERRQ(ierr);
347da1bb401SStefano Zampini   /* allocate space then set */
3489c0446d6SStefano Zampini   ierr = PetscMalloc(n_is*sizeof(IS),&pcbddc->ISForDofs);CHKERRQ(ierr);
3499c0446d6SStefano Zampini   for(i=0;i<n_is;i++) {
350da1bb401SStefano Zampini     ierr = PetscObjectReference((PetscObject)ISForDofs[i]);CHKERRQ(ierr);
351da1bb401SStefano Zampini     pcbddc->ISForDofs[i]=ISForDofs[i];
3529c0446d6SStefano Zampini   }
3539c0446d6SStefano Zampini   pcbddc->n_ISForDofs=n_is;
3549c0446d6SStefano Zampini   PetscFunctionReturn(0);
3559c0446d6SStefano Zampini }
3569c0446d6SStefano Zampini EXTERN_C_END
3579c0446d6SStefano Zampini #undef __FUNCT__
3589c0446d6SStefano Zampini #define __FUNCT__ "PCBDDCSetDofsSplitting"
3599c0446d6SStefano Zampini /*@
360da1bb401SStefano Zampini  PCBDDCSetDofsSplitting - Set index sets defining fields of local mat.
3619c0446d6SStefano Zampini 
3629c0446d6SStefano Zampini    Not collective
3639c0446d6SStefano Zampini 
3649c0446d6SStefano Zampini    Input Parameters:
3659c0446d6SStefano Zampini +  pc - the preconditioning context
366da1bb401SStefano Zampini -  n - number of index sets defining the fields
367da1bb401SStefano Zampini -  IS[] - array of IS describing the fields
3689c0446d6SStefano Zampini 
3699c0446d6SStefano Zampini    Level: intermediate
3709c0446d6SStefano Zampini 
3719c0446d6SStefano Zampini    Notes:
3729c0446d6SStefano Zampini 
3739c0446d6SStefano Zampini .seealso: PCBDDC
3749c0446d6SStefano Zampini @*/
3759c0446d6SStefano Zampini PetscErrorCode PCBDDCSetDofsSplitting(PC pc,PetscInt n_is, IS ISForDofs[])
3769c0446d6SStefano Zampini {
3779c0446d6SStefano Zampini   PetscErrorCode ierr;
3789c0446d6SStefano Zampini 
3799c0446d6SStefano Zampini   PetscFunctionBegin;
3809c0446d6SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
3819c0446d6SStefano Zampini   ierr = PetscTryMethod(pc,"PCBDDCSetDofsSplitting_C",(PC,PetscInt,IS[]),(pc,n_is,ISForDofs));CHKERRQ(ierr);
3829c0446d6SStefano Zampini   PetscFunctionReturn(0);
3839c0446d6SStefano Zampini }
384da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
385534831adSStefano Zampini #undef __FUNCT__
386534831adSStefano Zampini #define __FUNCT__ "PCPreSolve_BDDC"
387534831adSStefano Zampini /* -------------------------------------------------------------------------- */
388534831adSStefano Zampini /*
389534831adSStefano Zampini    PCPreSolve_BDDC - Changes the right hand side and (if necessary) the initial
390534831adSStefano Zampini                      guess if a transformation of basis approach has been selected.
3919c0446d6SStefano Zampini 
392534831adSStefano Zampini    Input Parameter:
393534831adSStefano Zampini +  pc - the preconditioner contex
394534831adSStefano Zampini 
395534831adSStefano Zampini    Application Interface Routine: PCPreSolve()
396534831adSStefano Zampini 
397534831adSStefano Zampini    Notes:
398534831adSStefano Zampini    The interface routine PCPreSolve() is not usually called directly by
399534831adSStefano Zampini    the user, but instead is called by KSPSolve().
400534831adSStefano Zampini */
401534831adSStefano Zampini static PetscErrorCode PCPreSolve_BDDC(PC pc, KSP ksp, Vec rhs, Vec x)
402534831adSStefano Zampini {
403534831adSStefano Zampini   PetscErrorCode ierr;
404534831adSStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
405534831adSStefano Zampini   PC_IS          *pcis = (PC_IS*)(pc->data);
406534831adSStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
407534831adSStefano Zampini   Mat            temp_mat;
4083972b0daSStefano Zampini   IS             dirIS;
4093972b0daSStefano Zampini   PetscInt       dirsize,i,*is_indices;
4103972b0daSStefano Zampini   PetscScalar    *array_x,*array_diagonal;
4113972b0daSStefano Zampini   Vec            used_vec;
4123972b0daSStefano Zampini   PetscBool      guess_nonzero;
413534831adSStefano Zampini 
414534831adSStefano Zampini   PetscFunctionBegin;
4153972b0daSStefano Zampini   if(x) {
4163972b0daSStefano Zampini     ierr = PetscObjectReference((PetscObject)x);CHKERRQ(ierr);
4173972b0daSStefano Zampini     used_vec = x;
4183972b0daSStefano Zampini   } else {
4193972b0daSStefano Zampini     ierr = PetscObjectReference((PetscObject)pcbddc->temp_solution);CHKERRQ(ierr);
4203972b0daSStefano Zampini     used_vec = pcbddc->temp_solution;
4213972b0daSStefano Zampini     ierr = VecSet(used_vec,0.0);CHKERRQ(ierr);
4223972b0daSStefano Zampini   }
4233972b0daSStefano Zampini   /* hack into ksp data structure PCPreSolve comes earlier in src/ksp/ksp/interface/itfunc.c */
4243972b0daSStefano Zampini   if (ksp) {
4253972b0daSStefano Zampini     ierr = KSPGetInitialGuessNonzero(ksp,&guess_nonzero);CHKERRQ(ierr);
4263972b0daSStefano Zampini     if( !guess_nonzero ) {
4273972b0daSStefano Zampini       ierr = VecSet(used_vec,0.0);CHKERRQ(ierr);
4283972b0daSStefano Zampini     }
4293972b0daSStefano Zampini   }
4303972b0daSStefano Zampini   /* store the original rhs */
4313972b0daSStefano Zampini   ierr = VecCopy(rhs,pcbddc->original_rhs);CHKERRQ(ierr);
4323972b0daSStefano Zampini 
4333972b0daSStefano Zampini   /* Take into account zeroed rows -> change rhs and store solution removed */
4343972b0daSStefano Zampini   ierr = MatGetDiagonal(pc->pmat,pcis->vec1_global);CHKERRQ(ierr);
4353972b0daSStefano Zampini   ierr = VecPointwiseDivide(pcis->vec1_global,rhs,pcis->vec1_global);CHKERRQ(ierr);
4363972b0daSStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4373972b0daSStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4383972b0daSStefano Zampini   ierr = VecScatterBegin(matis->ctx,used_vec,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4393972b0daSStefano Zampini   ierr = VecScatterEnd  (matis->ctx,used_vec,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4403972b0daSStefano Zampini   ierr = PCBDDCGetDirichletBoundaries(pc,&dirIS);CHKERRQ(ierr);
4413972b0daSStefano Zampini   if(dirIS) {
4423972b0daSStefano Zampini     ierr = ISGetSize(dirIS,&dirsize);CHKERRQ(ierr);
4433972b0daSStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array_x);CHKERRQ(ierr);
4443972b0daSStefano Zampini     ierr = VecGetArray(pcis->vec2_N,&array_diagonal);CHKERRQ(ierr);
4453972b0daSStefano Zampini     ierr = ISGetIndices(dirIS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
4463972b0daSStefano Zampini     for(i=0;i<dirsize;i++) {
4473972b0daSStefano Zampini       array_x[is_indices[i]]=array_diagonal[is_indices[i]];
4483972b0daSStefano Zampini     }
4493972b0daSStefano Zampini     ierr = ISRestoreIndices(dirIS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
4503972b0daSStefano Zampini     ierr = VecRestoreArray(pcis->vec2_N,&array_diagonal);CHKERRQ(ierr);
4513972b0daSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array_x);CHKERRQ(ierr);
4523972b0daSStefano Zampini   }
4533972b0daSStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4543972b0daSStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
455b76ba322SStefano Zampini 
4563972b0daSStefano Zampini   /* remove the computed solution from the rhs */
4573972b0daSStefano Zampini   ierr = VecScale(used_vec,-1.0);CHKERRQ(ierr);
4583972b0daSStefano Zampini   ierr = MatMultAdd(pc->pmat,used_vec,rhs,rhs);CHKERRQ(ierr);
4593972b0daSStefano Zampini   ierr = VecScale(used_vec,-1.0);CHKERRQ(ierr);
460b76ba322SStefano Zampini 
461b76ba322SStefano Zampini   /* store partially computed solution and set initial guess */
4623972b0daSStefano Zampini   if(x) {
4633972b0daSStefano Zampini     ierr = VecCopy(used_vec,pcbddc->temp_solution);CHKERRQ(ierr);
4643972b0daSStefano Zampini     ierr = VecSet(used_vec,0.0);CHKERRQ(ierr);
465b76ba322SStefano Zampini     if(pcbddc->use_exact_dirichlet) {
466b76ba322SStefano Zampini       ierr = VecScatterBegin(pcis->global_to_D,rhs,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
467b76ba322SStefano Zampini       ierr = VecScatterEnd  (pcis->global_to_D,rhs,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
468b76ba322SStefano Zampini       ierr = KSPSolve(pcbddc->ksp_D,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
469b76ba322SStefano Zampini       ierr = VecScatterBegin(pcis->global_to_D,pcis->vec2_D,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
470b76ba322SStefano Zampini       ierr = VecScatterEnd  (pcis->global_to_D,pcis->vec2_D,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
471b76ba322SStefano Zampini       if(ksp) {
472b76ba322SStefano Zampini         ierr = KSPSetInitialGuessNonzero(ksp,PETSC_TRUE);CHKERRQ(ierr);
473b76ba322SStefano Zampini       }
474b76ba322SStefano Zampini     }
4753972b0daSStefano Zampini   }
4763972b0daSStefano Zampini   ierr = VecDestroy(&used_vec);CHKERRQ(ierr);
477b76ba322SStefano Zampini 
478b76ba322SStefano Zampini   /* rhs change of basis */
479b76ba322SStefano Zampini   if(pcbddc->usechangeofbasis) {
480b76ba322SStefano Zampini     /* swap pointers for local matrices */
481b76ba322SStefano Zampini     temp_mat = matis->A;
482b76ba322SStefano Zampini     matis->A = pcbddc->local_mat;
483b76ba322SStefano Zampini     pcbddc->local_mat = temp_mat;
484b76ba322SStefano Zampini     /* Get local rhs and apply transformation of basis */
485b76ba322SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,rhs,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
486b76ba322SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,rhs,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
487b76ba322SStefano Zampini     /* from original basis to modified basis */
488b76ba322SStefano Zampini     ierr = MatMultTranspose(pcbddc->ChangeOfBasisMatrix,pcis->vec1_B,pcis->vec2_B);CHKERRQ(ierr);
489b76ba322SStefano Zampini     /* put back modified values into the global vec using INSERT_VALUES copy mode */
490b76ba322SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec2_B,rhs,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
491b76ba322SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec2_B,rhs,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
492b76ba322SStefano Zampini   }
493534831adSStefano Zampini   PetscFunctionReturn(0);
494534831adSStefano Zampini }
495534831adSStefano Zampini /* -------------------------------------------------------------------------- */
496534831adSStefano Zampini #undef __FUNCT__
497534831adSStefano Zampini #define __FUNCT__ "PCPostSolve_BDDC"
498534831adSStefano Zampini /* -------------------------------------------------------------------------- */
499534831adSStefano Zampini /*
500534831adSStefano Zampini    PCPostSolve_BDDC - Changes the computed solution if a transformation of basis
501534831adSStefano Zampini                      approach has been selected. Also, restores rhs to its original state.
502534831adSStefano Zampini 
503534831adSStefano Zampini    Input Parameter:
504534831adSStefano Zampini +  pc - the preconditioner context
505534831adSStefano Zampini 
506534831adSStefano Zampini    Application Interface Routine: PCPostSolve()
507534831adSStefano Zampini 
508534831adSStefano Zampini    Notes:
509534831adSStefano Zampini    The interface routine PCPostSolve() is not usually called directly by
510534831adSStefano Zampini    the user, but instead is called by KSPSolve().
511534831adSStefano Zampini */
512534831adSStefano Zampini static PetscErrorCode PCPostSolve_BDDC(PC pc, KSP ksp, Vec rhs, Vec x)
513534831adSStefano Zampini {
514534831adSStefano Zampini   PetscErrorCode ierr;
515534831adSStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
516534831adSStefano Zampini   PC_IS          *pcis = (PC_IS*)(pc->data);
517534831adSStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
518534831adSStefano Zampini   Mat            temp_mat;
519534831adSStefano Zampini 
520534831adSStefano Zampini   PetscFunctionBegin;
521534831adSStefano Zampini   if(pcbddc->usechangeofbasis) {
522534831adSStefano Zampini     /* swap pointers for local matrices */
523534831adSStefano Zampini     temp_mat = matis->A;
524534831adSStefano Zampini     matis->A = pcbddc->local_mat;
525534831adSStefano Zampini     pcbddc->local_mat = temp_mat;
526534831adSStefano Zampini     /* restore rhs to its original state */
5273425bc38SStefano Zampini     if(rhs) {
5283425bc38SStefano Zampini       ierr = VecCopy(pcbddc->original_rhs,rhs);CHKERRQ(ierr);
5293425bc38SStefano Zampini     }
530534831adSStefano Zampini     /* Get Local boundary and apply transformation of basis to solution vector */
531534831adSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,x,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
532534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,x,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
533534831adSStefano Zampini     /* from modified basis to original basis */
534534831adSStefano Zampini     ierr = MatMult(pcbddc->ChangeOfBasisMatrix,pcis->vec1_B,pcis->vec2_B);CHKERRQ(ierr);
535534831adSStefano Zampini     /* put back modified values into the global vec using INSERT_VALUES copy mode */
536534831adSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec2_B,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
537534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec2_B,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
538534831adSStefano Zampini   }
5393972b0daSStefano Zampini   /* add solution removed in presolve */
5403425bc38SStefano Zampini   if(x) {
5413425bc38SStefano Zampini     ierr = VecAXPY(x,1.0,pcbddc->temp_solution);CHKERRQ(ierr);
5423425bc38SStefano Zampini   }
543534831adSStefano Zampini   PetscFunctionReturn(0);
544534831adSStefano Zampini }
545534831adSStefano Zampini /* -------------------------------------------------------------------------- */
54653cdbc3dSStefano Zampini #undef __FUNCT__
54753cdbc3dSStefano Zampini #define __FUNCT__ "PCSetUp_BDDC"
5480c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
5490c7d97c5SJed Brown /*
5500c7d97c5SJed Brown    PCSetUp_BDDC - Prepares for the use of the BDDC preconditioner
5510c7d97c5SJed Brown                   by setting data structures and options.
5520c7d97c5SJed Brown 
5530c7d97c5SJed Brown    Input Parameter:
55453cdbc3dSStefano Zampini +  pc - the preconditioner context
5550c7d97c5SJed Brown 
5560c7d97c5SJed Brown    Application Interface Routine: PCSetUp()
5570c7d97c5SJed Brown 
5580c7d97c5SJed Brown    Notes:
5590c7d97c5SJed Brown    The interface routine PCSetUp() is not usually called directly by
5600c7d97c5SJed Brown    the user, but instead is called by PCApply() if necessary.
5610c7d97c5SJed Brown */
56253cdbc3dSStefano Zampini PetscErrorCode PCSetUp_BDDC(PC pc)
5630c7d97c5SJed Brown {
5640c7d97c5SJed Brown   PetscErrorCode ierr;
5650c7d97c5SJed Brown   PC_BDDC*       pcbddc   = (PC_BDDC*)pc->data;
5660c7d97c5SJed Brown   PC_IS            *pcis = (PC_IS*)(pc->data);
5670c7d97c5SJed Brown 
5680c7d97c5SJed Brown   PetscFunctionBegin;
5690c7d97c5SJed Brown   if (!pc->setupcalled) {
5703b03a366Sstefano_zampini     /* For BDDC we need to define a local "Neumann" problem different to that defined in PCISSetup
5719c0446d6SStefano Zampini        So, we set to pcnone the Neumann problem of pcis in order to avoid unneeded computation
5720c7d97c5SJed Brown        Also, we decide to directly build the (same) Dirichlet problem */
5730c7d97c5SJed Brown     ierr = PetscOptionsSetValue("-is_localN_pc_type","none");CHKERRQ(ierr);
5740c7d97c5SJed Brown     ierr = PetscOptionsSetValue("-is_localD_pc_type","none");CHKERRQ(ierr);
5750c7d97c5SJed Brown     /* Set up all the "iterative substructuring" common block */
5760c7d97c5SJed Brown     ierr = PCISSetUp(pc);CHKERRQ(ierr);
5773b03a366Sstefano_zampini     /* Get stdout for dbg */
578e269702eSStefano Zampini     if(pcbddc->dbg_flag) {
579e269702eSStefano Zampini       ierr = PetscViewerASCIIGetStdout(((PetscObject)pc)->comm,&pcbddc->dbg_viewer);CHKERRQ(ierr);
580e269702eSStefano Zampini       ierr = PetscViewerASCIISynchronizedAllow(pcbddc->dbg_viewer,PETSC_TRUE);CHKERRQ(ierr);
581e269702eSStefano Zampini     }
5823b03a366Sstefano_zampini     /* TODO MOVE CODE FRAGMENT */
5830c7d97c5SJed Brown     PetscInt im_active=0;
5840c7d97c5SJed Brown     if(pcis->n) im_active = 1;
58553cdbc3dSStefano Zampini     ierr = MPI_Allreduce(&im_active,&pcbddc->active_procs,1,MPIU_INT,MPI_SUM,((PetscObject)pc)->comm);CHKERRQ(ierr);
5863b03a366Sstefano_zampini     /* Analyze local interface */
5870c7d97c5SJed Brown     ierr = PCBDDCManageLocalBoundaries(pc);CHKERRQ(ierr);
5883b03a366Sstefano_zampini     /* Set up local constraint matrix */
5893b03a366Sstefano_zampini     ierr = PCBDDCCreateConstraintMatrix(pc);CHKERRQ(ierr);
5900c7d97c5SJed Brown     /* Create coarse and local stuffs used for evaluating action of preconditioner */
5910c7d97c5SJed Brown     ierr = PCBDDCCoarseSetUp(pc);CHKERRQ(ierr);
5923b03a366Sstefano_zampini     /* Processes fakely involved in multilevel should not call ISLocalToGlobalMappingRestoreInfo */
5933b03a366Sstefano_zampini     if ( !pcis->n_neigh ) pcis->ISLocalToGlobalMappingGetInfoWasCalled=PETSC_FALSE;
5940c7d97c5SJed Brown   }
5950c7d97c5SJed Brown   PetscFunctionReturn(0);
5960c7d97c5SJed Brown }
5970c7d97c5SJed Brown 
5980c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
5990c7d97c5SJed Brown /*
6000c7d97c5SJed Brown    PCApply_BDDC - Applies the BDDC preconditioner to a vector.
6010c7d97c5SJed Brown 
6020c7d97c5SJed Brown    Input Parameters:
6030c7d97c5SJed Brown .  pc - the preconditioner context
6040c7d97c5SJed Brown .  r - input vector (global)
6050c7d97c5SJed Brown 
6060c7d97c5SJed Brown    Output Parameter:
6070c7d97c5SJed Brown .  z - output vector (global)
6080c7d97c5SJed Brown 
6090c7d97c5SJed Brown    Application Interface Routine: PCApply()
6100c7d97c5SJed Brown  */
6110c7d97c5SJed Brown #undef __FUNCT__
6120c7d97c5SJed Brown #define __FUNCT__ "PCApply_BDDC"
61353cdbc3dSStefano Zampini PetscErrorCode PCApply_BDDC(PC pc,Vec r,Vec z)
6140c7d97c5SJed Brown {
6150c7d97c5SJed Brown   PC_IS             *pcis = (PC_IS*)(pc->data);
6160c7d97c5SJed Brown   PC_BDDC           *pcbddc = (PC_BDDC*)(pc->data);
6170c7d97c5SJed Brown   PetscErrorCode    ierr;
6183b03a366Sstefano_zampini   const PetscScalar one = 1.0;
6193b03a366Sstefano_zampini   const PetscScalar m_one = -1.0;
6202617d88aSStefano Zampini   const PetscScalar zero = 0.0;
6210c7d97c5SJed Brown 
6220c7d97c5SJed Brown /* This code is similar to that provided in nn.c for PCNN
6230c7d97c5SJed Brown    NN interface preconditioner changed to BDDC
6240c7d97c5SJed Brown    Added support for M_3 preconditioenr in the reference article (code is active if pcbddc->prec_type = PETSC_TRUE) */
6250c7d97c5SJed Brown 
6260c7d97c5SJed Brown   PetscFunctionBegin;
627b76ba322SStefano Zampini   if(!pcbddc->use_exact_dirichlet) {
6280c7d97c5SJed Brown     /* First Dirichlet solve */
6290c7d97c5SJed Brown     ierr = VecScatterBegin(pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
6300c7d97c5SJed Brown     ierr = VecScatterEnd  (pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
63153cdbc3dSStefano Zampini     ierr = KSPSolve(pcbddc->ksp_D,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
6320c7d97c5SJed Brown     /*
6330c7d97c5SJed Brown       Assembling right hand side for BDDC operator
6340c7d97c5SJed Brown       - vec1_D for the Dirichlet part (if needed, i.e. prec_flag=PETSC_TRUE)
6350c7d97c5SJed Brown       - the interface part of the global vector z
6360c7d97c5SJed Brown     */
6370c7d97c5SJed Brown     ierr = VecScale(pcis->vec2_D,m_one);CHKERRQ(ierr);
6380c7d97c5SJed Brown     ierr = MatMult(pcis->A_BI,pcis->vec2_D,pcis->vec1_B);CHKERRQ(ierr);
6390c7d97c5SJed Brown     if(pcbddc->prec_type) { ierr = MatMultAdd(pcis->A_II,pcis->vec2_D,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); }
6400c7d97c5SJed Brown     ierr = VecScale(pcis->vec2_D,m_one);CHKERRQ(ierr);
6410c7d97c5SJed Brown     ierr = VecCopy(r,z);CHKERRQ(ierr);
6420c7d97c5SJed Brown     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
6430c7d97c5SJed Brown     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
6442617d88aSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
6452617d88aSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
646b76ba322SStefano Zampini   } else {
647b76ba322SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,r,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
648b76ba322SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,r,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
649b76ba322SStefano Zampini     ierr = VecSet(pcis->vec2_D,zero);CHKERRQ(ierr);
650b76ba322SStefano Zampini   }
651b76ba322SStefano Zampini 
652b76ba322SStefano Zampini   /* Apply partition of unity */
6532617d88aSStefano Zampini   ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr);
6542617d88aSStefano Zampini 
6552617d88aSStefano Zampini   /* Apply interface preconditioner
6562617d88aSStefano Zampini      input/output vecs: pcis->vec1_B and pcis->vec1_D */
6572617d88aSStefano Zampini   ierr = PCBDDCApplyInterfacePreconditioner(pc);CHKERRQ(ierr);
6582617d88aSStefano Zampini 
6592617d88aSStefano Zampini   /* Apply partition of unity and sum boundary values */
6602617d88aSStefano Zampini   ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr);
6612617d88aSStefano Zampini   ierr = VecSet(z,zero);CHKERRQ(ierr);
6622617d88aSStefano Zampini   ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
6632617d88aSStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
6640c7d97c5SJed Brown 
6653b03a366Sstefano_zampini   /* Second Dirichlet solve and assembling of output */
6660c7d97c5SJed Brown   ierr = VecScatterBegin(pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
6670c7d97c5SJed Brown   ierr = VecScatterEnd  (pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
6680c7d97c5SJed Brown   ierr = MatMult(pcis->A_IB,pcis->vec1_B,pcis->vec3_D);CHKERRQ(ierr);
6690c7d97c5SJed Brown   if(pcbddc->prec_type) { ierr = MatMultAdd(pcis->A_II,pcis->vec1_D,pcis->vec3_D,pcis->vec3_D);CHKERRQ(ierr); }
67053cdbc3dSStefano Zampini   ierr = KSPSolve(pcbddc->ksp_D,pcis->vec3_D,pcbddc->vec4_D);CHKERRQ(ierr);
6710c7d97c5SJed Brown   ierr = VecScale(pcbddc->vec4_D,m_one);CHKERRQ(ierr);
6720c7d97c5SJed Brown   if(pcbddc->prec_type) { ierr = VecAXPY (pcbddc->vec4_D,one,pcis->vec1_D);CHKERRQ(ierr); }
6730c7d97c5SJed Brown   ierr = VecAXPY (pcis->vec2_D,one,pcbddc->vec4_D);CHKERRQ(ierr);
6740c7d97c5SJed Brown   ierr = VecScatterBegin(pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
6750c7d97c5SJed Brown   ierr = VecScatterEnd  (pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
6760c7d97c5SJed Brown   PetscFunctionReturn(0);
6770c7d97c5SJed Brown 
6780c7d97c5SJed Brown }
679da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
680da1bb401SStefano Zampini #undef __FUNCT__
681da1bb401SStefano Zampini #define __FUNCT__ "PCDestroy_BDDC"
682da1bb401SStefano Zampini PetscErrorCode PCDestroy_BDDC(PC pc)
683da1bb401SStefano Zampini {
684da1bb401SStefano Zampini   PC_BDDC          *pcbddc = (PC_BDDC*)pc->data;
685da1bb401SStefano Zampini   PetscErrorCode ierr;
686da1bb401SStefano Zampini 
687da1bb401SStefano Zampini   PetscFunctionBegin;
688da1bb401SStefano Zampini   /* free data created by PCIS */
689da1bb401SStefano Zampini   ierr = PCISDestroy(pc);CHKERRQ(ierr);
690da1bb401SStefano Zampini   /* free BDDC data  */
6913972b0daSStefano Zampini   ierr = VecDestroy(&pcbddc->temp_solution);CHKERRQ(ierr);
692534831adSStefano Zampini   ierr = VecDestroy(&pcbddc->original_rhs);CHKERRQ(ierr);
693534831adSStefano Zampini   ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr);
694534831adSStefano Zampini   ierr = MatDestroy(&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr);
695da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->coarse_vec);CHKERRQ(ierr);
696da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->coarse_rhs);CHKERRQ(ierr);
697da1bb401SStefano Zampini   ierr = KSPDestroy(&pcbddc->coarse_ksp);CHKERRQ(ierr);
698da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->coarse_mat);CHKERRQ(ierr);
699da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->coarse_phi_B);CHKERRQ(ierr);
700da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->coarse_phi_D);CHKERRQ(ierr);
701da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec1_P);CHKERRQ(ierr);
702da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec1_C);CHKERRQ(ierr);
703da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->local_auxmat1);CHKERRQ(ierr);
704da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->local_auxmat2);CHKERRQ(ierr);
705da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec1_R);CHKERRQ(ierr);
706da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec2_R);CHKERRQ(ierr);
707da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec4_D);CHKERRQ(ierr);
708da1bb401SStefano Zampini   ierr = VecScatterDestroy(&pcbddc->R_to_B);CHKERRQ(ierr);
709da1bb401SStefano Zampini   ierr = VecScatterDestroy(&pcbddc->R_to_D);CHKERRQ(ierr);
710da1bb401SStefano Zampini   ierr = VecScatterDestroy(&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr);
711da1bb401SStefano Zampini   ierr = KSPDestroy(&pcbddc->ksp_D);CHKERRQ(ierr);
712da1bb401SStefano Zampini   ierr = KSPDestroy(&pcbddc->ksp_R);CHKERRQ(ierr);
713da1bb401SStefano Zampini   ierr = ISDestroy(&pcbddc->NeumannBoundaries);CHKERRQ(ierr);
714da1bb401SStefano Zampini   ierr = ISDestroy(&pcbddc->DirichletBoundaries);CHKERRQ(ierr);
715da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->ConstraintMatrix);CHKERRQ(ierr);
716da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->local_primal_indices);CHKERRQ(ierr);
717da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->replicated_local_primal_indices);CHKERRQ(ierr);
718da1bb401SStefano Zampini   if (pcbddc->replicated_local_primal_values)    { free(pcbddc->replicated_local_primal_values); }
719da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->local_primal_displacements);CHKERRQ(ierr);
720da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->local_primal_sizes);CHKERRQ(ierr);
721da1bb401SStefano Zampini   PetscInt i;
722da1bb401SStefano Zampini   for(i=0;i<pcbddc->n_ISForDofs;i++) { ierr = ISDestroy(&pcbddc->ISForDofs[i]);CHKERRQ(ierr); }
723da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->ISForDofs);CHKERRQ(ierr);
724da1bb401SStefano Zampini   for(i=0;i<pcbddc->n_ISForFaces;i++) { ierr = ISDestroy(&pcbddc->ISForFaces[i]);CHKERRQ(ierr); }
725da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->ISForFaces);CHKERRQ(ierr);
726da1bb401SStefano Zampini   for(i=0;i<pcbddc->n_ISForEdges;i++) { ierr = ISDestroy(&pcbddc->ISForEdges[i]);CHKERRQ(ierr); }
727da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->ISForEdges);CHKERRQ(ierr);
728da1bb401SStefano Zampini   ierr = ISDestroy(&pcbddc->ISForVertices);CHKERRQ(ierr);
7293972b0daSStefano Zampini   /* Free graph structure */
730da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->xadj);CHKERRQ(ierr);
731da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->adjncy);CHKERRQ(ierr);
732da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->neighbours_set[0]);CHKERRQ(ierr);
733da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->neighbours_set);CHKERRQ(ierr);
7343972b0daSStefano Zampini   ierr = PetscFree4(pcbddc->mat_graph->where,pcbddc->mat_graph->count,pcbddc->mat_graph->cptr,pcbddc->mat_graph->queue);CHKERRQ(ierr);
7353972b0daSStefano Zampini   ierr = PetscFree2(pcbddc->mat_graph->which_dof,pcbddc->mat_graph->touched);CHKERRQ(ierr);
7363972b0daSStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->where_ncmps);CHKERRQ(ierr);
737da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph);CHKERRQ(ierr);
7383425bc38SStefano Zampini   /* remove functions */
7393425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDirichletBoundaries_C","",PETSC_NULL);CHKERRQ(ierr);
7403425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNeumannBoundaries_C","",PETSC_NULL);CHKERRQ(ierr);
7413425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetDirichletBoundaries_C","",PETSC_NULL);CHKERRQ(ierr);
7423425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetNeumannBoundaries_C","",PETSC_NULL);CHKERRQ(ierr);
7433425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseProblemType_C","",PETSC_NULL);CHKERRQ(ierr);
7443425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDofsSplitting_C","",PETSC_NULL);CHKERRQ(ierr);
7453425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetLocalAdjacencyGraph_C","",PETSC_NULL);CHKERRQ(ierr);
7463425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPreSolve_C","",PETSC_NULL);CHKERRQ(ierr);
7473425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPostSolve_C","",PETSC_NULL);CHKERRQ(ierr);
7483425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCCreateFETIDPOperators_C","",PETSC_NULL);CHKERRQ(ierr);
7493425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetRHS_C","",PETSC_NULL);CHKERRQ(ierr);
7503425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetSolution_C","",PETSC_NULL);CHKERRQ(ierr);
751da1bb401SStefano Zampini   /* Free the private data structure that was hanging off the PC */
752da1bb401SStefano Zampini   ierr = PetscFree(pcbddc);CHKERRQ(ierr);
753da1bb401SStefano Zampini   PetscFunctionReturn(0);
754da1bb401SStefano Zampini }
7553425bc38SStefano Zampini /* -------------------------------------------------------------------------- */
7563425bc38SStefano Zampini EXTERN_C_BEGIN
7573425bc38SStefano Zampini #undef __FUNCT__
7583425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetRHS_BDDC"
7593425bc38SStefano Zampini static PetscErrorCode PCBDDCMatFETIDPGetRHS_BDDC(Mat fetidp_mat, Vec standard_rhs, Vec fetidp_flux_rhs)
7603425bc38SStefano Zampini {
7613425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
7623425bc38SStefano Zampini   PC_IS*         pcis;
7633425bc38SStefano Zampini   PC_BDDC*       pcbddc;
7643425bc38SStefano Zampini   Mat_IS*        matis;
7653425bc38SStefano Zampini   PetscErrorCode ierr;
7660c7d97c5SJed Brown 
7673425bc38SStefano Zampini   PetscFunctionBegin;
7683425bc38SStefano Zampini   ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr);
7693425bc38SStefano Zampini   pcis = (PC_IS*)mat_ctx->pc->data;
7703425bc38SStefano Zampini   pcbddc = (PC_BDDC*)mat_ctx->pc->data;
7713425bc38SStefano Zampini   matis = (Mat_IS*)mat_ctx->pc->pmat->data;
7723425bc38SStefano Zampini 
7733425bc38SStefano Zampini   /* change of basis for physical rhs if needed
7743425bc38SStefano Zampini      It also changes the rhs in case of dirichlet boundaries */
7753425bc38SStefano Zampini   (*mat_ctx->pc->ops->presolve)(mat_ctx->pc,PETSC_NULL,standard_rhs,PETSC_NULL);
7763425bc38SStefano Zampini   /* store vectors for computation of fetidp final solution */
7773425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->global_to_D,standard_rhs,mat_ctx->temp_solution_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7783425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_D,standard_rhs,mat_ctx->temp_solution_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7793425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7803425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7813425bc38SStefano Zampini   /* scale rhs since it should be unassembled */
7823425bc38SStefano Zampini   ierr = VecPointwiseMult(mat_ctx->temp_solution_B,pcis->D,mat_ctx->temp_solution_B);CHKERRQ(ierr);
7833425bc38SStefano Zampini   if(!pcbddc->prec_type) {
7843425bc38SStefano Zampini     /* compute partially subassembled Schur complement right-hand side */
7853425bc38SStefano Zampini     ierr = KSPSolve(pcbddc->ksp_D,mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr);
7863425bc38SStefano Zampini     ierr = MatMult(pcis->A_BI,pcis->vec1_D,pcis->vec1_B);CHKERRQ(ierr);
7873425bc38SStefano Zampini     ierr = VecAXPY(mat_ctx->temp_solution_B,-1.0,pcis->vec1_B);CHKERRQ(ierr);
7883425bc38SStefano Zampini     ierr = VecSet(standard_rhs,0.0);CHKERRQ(ierr);
7893425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,mat_ctx->temp_solution_B,standard_rhs,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
7903425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,mat_ctx->temp_solution_B,standard_rhs,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
7913425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7923425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,standard_rhs,mat_ctx->temp_solution_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
7933425bc38SStefano Zampini     ierr = VecPointwiseMult(mat_ctx->temp_solution_B,pcis->D,mat_ctx->temp_solution_B);CHKERRQ(ierr);
7943425bc38SStefano Zampini   }
7953425bc38SStefano Zampini   /* BDDC rhs */
7963425bc38SStefano Zampini   ierr = VecCopy(mat_ctx->temp_solution_B,pcis->vec1_B);CHKERRQ(ierr);
7973425bc38SStefano Zampini   if(pcbddc->prec_type) {
7983425bc38SStefano Zampini     ierr = VecCopy(mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr);
7993425bc38SStefano Zampini   }
8003425bc38SStefano Zampini   /* apply BDDC */
8013425bc38SStefano Zampini   ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr);
8023425bc38SStefano Zampini   /* Application of B_delta and assembling of rhs for fetidp fluxes */
8033425bc38SStefano Zampini   ierr = VecSet(fetidp_flux_rhs,0.0);CHKERRQ(ierr);
8043425bc38SStefano Zampini   ierr = MatMult(mat_ctx->B_delta,pcis->vec1_B,mat_ctx->lambda_local);CHKERRQ(ierr);
8053425bc38SStefano Zampini   ierr = VecScatterBegin(mat_ctx->l2g_lambda,mat_ctx->lambda_local,fetidp_flux_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
8063425bc38SStefano Zampini   ierr = VecScatterEnd  (mat_ctx->l2g_lambda,mat_ctx->lambda_local,fetidp_flux_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
8073425bc38SStefano Zampini   /* restore original rhs */
8083425bc38SStefano Zampini   ierr = VecCopy(pcbddc->original_rhs,standard_rhs);CHKERRQ(ierr);
8093425bc38SStefano Zampini   PetscFunctionReturn(0);
8103425bc38SStefano Zampini }
8113425bc38SStefano Zampini EXTERN_C_END
8123425bc38SStefano Zampini #undef __FUNCT__
8133425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetRHS"
8143425bc38SStefano Zampini /*@
8153425bc38SStefano Zampini  PCBDDCMatFETIDPGetRHS - Get rhs for FETIDP linear system.
8163425bc38SStefano Zampini 
8173425bc38SStefano Zampini    Collective
8183425bc38SStefano Zampini 
8193425bc38SStefano Zampini    Input Parameters:
8203425bc38SStefano Zampini +  fetidp_mat   - the FETIDP mat obtained by a call to PCBDDCCreateFETIDPOperators
8213425bc38SStefano Zampini -  standard_rhs - the rhs of your linear system
8223425bc38SStefano Zampini 
8233425bc38SStefano Zampini    Output Parameters:
8243425bc38SStefano Zampini .  fetidp_flux_rhs   - the rhs of the FETIDP linear system
8253425bc38SStefano Zampini 
8263425bc38SStefano Zampini    Level: developer
8273425bc38SStefano Zampini 
8283425bc38SStefano Zampini    Notes:
8293425bc38SStefano Zampini 
8303425bc38SStefano Zampini .seealso: PCBDDC
8313425bc38SStefano Zampini @*/
8323425bc38SStefano Zampini PetscErrorCode PCBDDCMatFETIDPGetRHS(Mat fetidp_mat, Vec standard_rhs, Vec fetidp_flux_rhs)
8333425bc38SStefano Zampini {
8343425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
8353425bc38SStefano Zampini   PetscErrorCode ierr;
8363425bc38SStefano Zampini 
8373425bc38SStefano Zampini   PetscFunctionBegin;
8383425bc38SStefano Zampini   ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr);
8393425bc38SStefano Zampini   ierr = PetscTryMethod(mat_ctx->pc,"PCBDDCMatFETIDPGetRHS_C",(Mat,Vec,Vec),(fetidp_mat,standard_rhs,fetidp_flux_rhs));CHKERRQ(ierr);
8403425bc38SStefano Zampini   PetscFunctionReturn(0);
8413425bc38SStefano Zampini }
8423425bc38SStefano Zampini /* -------------------------------------------------------------------------- */
8433425bc38SStefano Zampini EXTERN_C_BEGIN
8443425bc38SStefano Zampini #undef __FUNCT__
8453425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetSolution_BDDC"
8463425bc38SStefano Zampini static PetscErrorCode PCBDDCMatFETIDPGetSolution_BDDC(Mat fetidp_mat, Vec fetidp_flux_sol, Vec standard_sol)
8473425bc38SStefano Zampini {
8483425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
8493425bc38SStefano Zampini   PC_IS*         pcis;
8503425bc38SStefano Zampini   PC_BDDC*       pcbddc;
8513425bc38SStefano Zampini   Mat_IS*        matis;
8523425bc38SStefano Zampini   PetscErrorCode ierr;
8533425bc38SStefano Zampini 
8543425bc38SStefano Zampini   PetscFunctionBegin;
8553425bc38SStefano Zampini   ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr);
8563425bc38SStefano Zampini   pcis = (PC_IS*)mat_ctx->pc->data;
8573425bc38SStefano Zampini   pcbddc = (PC_BDDC*)mat_ctx->pc->data;
8583425bc38SStefano Zampini   matis = (Mat_IS*)mat_ctx->pc->pmat->data;
8593425bc38SStefano Zampini 
8603425bc38SStefano Zampini   /* apply B_delta^T */
8613425bc38SStefano Zampini   ierr = VecScatterBegin(mat_ctx->l2g_lambda,fetidp_flux_sol,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8623425bc38SStefano Zampini   ierr = VecScatterEnd  (mat_ctx->l2g_lambda,fetidp_flux_sol,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8633425bc38SStefano Zampini   ierr = MatMultTranspose(mat_ctx->B_delta,mat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
8643425bc38SStefano Zampini   /* compute rhs for BDDC application */
8653425bc38SStefano Zampini   ierr = VecAYPX(pcis->vec1_B,-1.0,mat_ctx->temp_solution_B);CHKERRQ(ierr);
8663425bc38SStefano Zampini   if(pcbddc->prec_type) {
8673425bc38SStefano Zampini     ierr = VecCopy(mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr);
8683425bc38SStefano Zampini   }
8693425bc38SStefano Zampini   /* apply BDDC */
8703425bc38SStefano Zampini   ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr);
8713425bc38SStefano Zampini   /* put values into standard global vector */
8723425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8733425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8743425bc38SStefano Zampini   if(!pcbddc->prec_type) {
8753425bc38SStefano Zampini     /* compute values into the interior if solved for the partially subassembled Schur complement */
8763425bc38SStefano Zampini     ierr = MatMult(pcis->A_IB,pcis->vec1_B,pcis->vec1_D);CHKERRQ(ierr);
8773425bc38SStefano Zampini     ierr = VecAXPY(mat_ctx->temp_solution_D,-1.0,pcis->vec1_D);CHKERRQ(ierr);
8783425bc38SStefano Zampini     ierr = KSPSolve(pcbddc->ksp_D,mat_ctx->temp_solution_D,pcis->vec1_D);CHKERRQ(ierr);
8793425bc38SStefano Zampini   }
8803425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->global_to_D,pcis->vec1_D,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8813425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_D,pcis->vec1_D,standard_sol,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8823425bc38SStefano Zampini   /* final change of basis if needed
8833425bc38SStefano Zampini      Is also sums the dirichlet part removed during RHS assembling */
8843425bc38SStefano Zampini   (*mat_ctx->pc->ops->postsolve)(mat_ctx->pc,PETSC_NULL,PETSC_NULL,standard_sol);
8853425bc38SStefano Zampini   PetscFunctionReturn(0);
8863425bc38SStefano Zampini 
8873425bc38SStefano Zampini }
8883425bc38SStefano Zampini EXTERN_C_END
8893425bc38SStefano Zampini #undef __FUNCT__
8903425bc38SStefano Zampini #define __FUNCT__ "PCBDDCMatFETIDPGetSolution"
8913425bc38SStefano Zampini /*@
8923425bc38SStefano Zampini  PCBDDCMatFETIDPGetSolution - Get Solution for FETIDP linear system.
8933425bc38SStefano Zampini 
8943425bc38SStefano Zampini    Collective
8953425bc38SStefano Zampini 
8963425bc38SStefano Zampini    Input Parameters:
8973425bc38SStefano Zampini +  fetidp_mat        - the FETIDP mat obtained by a call to PCBDDCCreateFETIDPOperators
8983425bc38SStefano Zampini +  fetidp_flux_sol - the solution of the FETIDP linear system
8993425bc38SStefano Zampini 
9003425bc38SStefano Zampini    Output Parameters:
9013425bc38SStefano Zampini +  standard_sol      - the solution on the global domain
9023425bc38SStefano Zampini 
9033425bc38SStefano Zampini    Level: developer
9043425bc38SStefano Zampini 
9053425bc38SStefano Zampini    Notes:
9063425bc38SStefano Zampini 
9073425bc38SStefano Zampini .seealso: PCBDDC
9083425bc38SStefano Zampini @*/
9093425bc38SStefano Zampini PetscErrorCode PCBDDCMatFETIDPGetSolution(Mat fetidp_mat, Vec fetidp_flux_sol, Vec standard_sol)
9103425bc38SStefano Zampini {
9113425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
9123425bc38SStefano Zampini   PetscErrorCode ierr;
9133425bc38SStefano Zampini 
9143425bc38SStefano Zampini   PetscFunctionBegin;
9153425bc38SStefano Zampini   ierr = MatShellGetContext(fetidp_mat,&mat_ctx);CHKERRQ(ierr);
9163425bc38SStefano Zampini   ierr = PetscTryMethod(mat_ctx->pc,"PCBDDCMatFETIDPGetSolution_C",(Mat,Vec,Vec),(fetidp_mat,fetidp_flux_sol,standard_sol));CHKERRQ(ierr);
9173425bc38SStefano Zampini   PetscFunctionReturn(0);
9183425bc38SStefano Zampini }
9193425bc38SStefano Zampini /* -------------------------------------------------------------------------- */
9203425bc38SStefano Zampini EXTERN_C_BEGIN
9213425bc38SStefano Zampini #undef __FUNCT__
9223425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPOperators_BDDC"
9233425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPOperators_BDDC(PC pc, Mat *fetidp_mat, PC *fetidp_pc)
9243425bc38SStefano Zampini {
9253425bc38SStefano Zampini   PETSC_EXTERN PetscErrorCode FETIDPMatMult(Mat,Vec,Vec);
9263425bc38SStefano Zampini   PETSC_EXTERN PetscErrorCode PCBDDCDestroyFETIDPMat(Mat);
9273425bc38SStefano Zampini   PETSC_EXTERN PetscErrorCode FETIDPPCApply(PC,Vec,Vec);
9283425bc38SStefano Zampini   PETSC_EXTERN PetscErrorCode PCBDDCDestroyFETIDPPC(PC);
9293425bc38SStefano Zampini 
9303425bc38SStefano Zampini   FETIDPMat_ctx  *fetidpmat_ctx;
9313425bc38SStefano Zampini   Mat            newmat;
9323425bc38SStefano Zampini   FETIDPPC_ctx  *fetidppc_ctx;
9333425bc38SStefano Zampini   PC             newpc;
9343425bc38SStefano Zampini   MPI_Comm       comm = ((PetscObject)pc)->comm;
9353425bc38SStefano Zampini   PetscErrorCode ierr;
9363425bc38SStefano Zampini 
9373425bc38SStefano Zampini   PetscFunctionBegin;
9383425bc38SStefano Zampini   /* FETIDP linear matrix */
9393425bc38SStefano Zampini   ierr = PCBDDCCreateFETIDPMatContext(pc, &fetidpmat_ctx);CHKERRQ(ierr);
9403425bc38SStefano Zampini   ierr = PCBDDCSetupFETIDPMatContext(fetidpmat_ctx);CHKERRQ(ierr);
9413425bc38SStefano Zampini   ierr = MatCreateShell(comm,PETSC_DECIDE,PETSC_DECIDE,fetidpmat_ctx->n_lambda,fetidpmat_ctx->n_lambda,fetidpmat_ctx,&newmat);CHKERRQ(ierr);
9423425bc38SStefano Zampini   ierr = MatShellSetOperation(newmat,MATOP_MULT,(void (*)(void))FETIDPMatMult);CHKERRQ(ierr);
9433425bc38SStefano Zampini   ierr = MatShellSetOperation(newmat,MATOP_DESTROY,(void (*)(void))PCBDDCDestroyFETIDPMat);CHKERRQ(ierr);
9443425bc38SStefano Zampini   ierr = MatSetUp(newmat);CHKERRQ(ierr);
9453425bc38SStefano Zampini   /* FETIDP preconditioner */
9463425bc38SStefano Zampini   ierr = PCBDDCCreateFETIDPPCContext(pc, &fetidppc_ctx);CHKERRQ(ierr);
9473425bc38SStefano Zampini   ierr = PCBDDCSetupFETIDPPCContext(newmat,fetidppc_ctx);CHKERRQ(ierr);
9483425bc38SStefano Zampini   ierr = PCCreate(comm,&newpc);CHKERRQ(ierr);
9493425bc38SStefano Zampini   ierr = PCSetType(newpc,PCSHELL);CHKERRQ(ierr);
9503425bc38SStefano Zampini   ierr = PCShellSetContext(newpc,fetidppc_ctx);CHKERRQ(ierr);
9513425bc38SStefano Zampini   ierr = PCShellSetApply(newpc,FETIDPPCApply);CHKERRQ(ierr);
9523425bc38SStefano Zampini   ierr = PCShellSetDestroy(newpc,PCBDDCDestroyFETIDPPC);CHKERRQ(ierr);
9533425bc38SStefano Zampini   ierr = PCSetOperators(newpc,newmat,newmat,SAME_PRECONDITIONER);CHKERRQ(ierr);
9543425bc38SStefano Zampini   ierr = PCSetUp(newpc);CHKERRQ(ierr);
9553425bc38SStefano Zampini   /* return pointers for objects created */
9563425bc38SStefano Zampini   *fetidp_mat=newmat;
9573425bc38SStefano Zampini   *fetidp_pc=newpc;
9583425bc38SStefano Zampini 
9593425bc38SStefano Zampini   PetscFunctionReturn(0);
9603425bc38SStefano Zampini }
9613425bc38SStefano Zampini EXTERN_C_END
9623425bc38SStefano Zampini #undef __FUNCT__
9633425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPOperators"
9643425bc38SStefano Zampini /*@
9653425bc38SStefano Zampini  PCBDDCCreateFETIDPOperators - Create operators for FETIDP.
9663425bc38SStefano Zampini 
9673425bc38SStefano Zampini    Collective
9683425bc38SStefano Zampini 
9693425bc38SStefano Zampini    Input Parameters:
9703425bc38SStefano Zampini +  pc - the BDDC preconditioning context (setup must be already called)
9713425bc38SStefano Zampini 
9723425bc38SStefano Zampini    Level: developer
9733425bc38SStefano Zampini 
9743425bc38SStefano Zampini    Notes:
9753425bc38SStefano Zampini 
9763425bc38SStefano Zampini .seealso: PCBDDC
9773425bc38SStefano Zampini @*/
9783425bc38SStefano Zampini PetscErrorCode PCBDDCCreateFETIDPOperators(PC pc, Mat *fetidp_mat, PC *fetidp_pc)
9793425bc38SStefano Zampini {
9803425bc38SStefano Zampini   PetscErrorCode ierr;
9813425bc38SStefano Zampini 
9823425bc38SStefano Zampini   PetscFunctionBegin;
9833425bc38SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
9843425bc38SStefano Zampini   if (pc->setupcalled) {
9853425bc38SStefano Zampini     ierr = PetscTryMethod(pc,"PCBDDCCreateFETIDPOperators_C",(PC,Mat*,PC*),(pc,fetidp_mat,fetidp_pc));CHKERRQ(ierr);
9863425bc38SStefano Zampini   } else {
9873425bc38SStefano Zampini     SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_SUP,"You must call PCSetup_BDDC before calling %s\n",__FUNCT__);
9883425bc38SStefano Zampini   }
9893425bc38SStefano Zampini   PetscFunctionReturn(0);
9903425bc38SStefano Zampini }
9910c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
992da1bb401SStefano Zampini /*MC
993da1bb401SStefano Zampini    PCBDDC - Balancing Domain Decomposition by Constraints.
9940c7d97c5SJed Brown 
995da1bb401SStefano Zampini    Options Database Keys:
996da1bb401SStefano Zampini .    -pcbddc ??? -
997da1bb401SStefano Zampini 
998da1bb401SStefano Zampini    Level: intermediate
999da1bb401SStefano Zampini 
1000da1bb401SStefano Zampini    Notes: The matrix used with this preconditioner must be of type MATIS
1001da1bb401SStefano Zampini 
1002da1bb401SStefano Zampini           Unlike more 'conventional' interface preconditioners, this iterates over ALL the
1003da1bb401SStefano Zampini           degrees of freedom, NOT just those on the interface (this allows the use of approximate solvers
1004da1bb401SStefano Zampini           on the subdomains).
1005da1bb401SStefano Zampini 
1006da1bb401SStefano Zampini           Options for the coarse grid preconditioner can be set with -
1007da1bb401SStefano Zampini           Options for the Dirichlet subproblem can be set with -
1008da1bb401SStefano Zampini           Options for the Neumann subproblem can be set with -
1009da1bb401SStefano Zampini 
1010da1bb401SStefano Zampini    Contributed by Stefano Zampini
1011da1bb401SStefano Zampini 
1012da1bb401SStefano Zampini .seealso:  PCCreate(), PCSetType(), PCType (for list of available types), PC,  MATIS
1013da1bb401SStefano Zampini M*/
1014da1bb401SStefano Zampini EXTERN_C_BEGIN
1015da1bb401SStefano Zampini #undef __FUNCT__
1016da1bb401SStefano Zampini #define __FUNCT__ "PCCreate_BDDC"
1017da1bb401SStefano Zampini PetscErrorCode PCCreate_BDDC(PC pc)
1018da1bb401SStefano Zampini {
1019da1bb401SStefano Zampini   PetscErrorCode ierr;
1020da1bb401SStefano Zampini   PC_BDDC        *pcbddc;
1021da1bb401SStefano Zampini   PCBDDCGraph    mat_graph;
1022da1bb401SStefano Zampini 
1023da1bb401SStefano Zampini   PetscFunctionBegin;
1024da1bb401SStefano Zampini   /* Creates the private data structure for this preconditioner and attach it to the PC object. */
1025da1bb401SStefano Zampini   ierr      = PetscNewLog(pc,PC_BDDC,&pcbddc);CHKERRQ(ierr);
1026da1bb401SStefano Zampini   pc->data  = (void*)pcbddc;
1027da1bb401SStefano Zampini 
1028da1bb401SStefano Zampini   /* create PCIS data structure */
1029da1bb401SStefano Zampini   ierr = PCISCreate(pc);CHKERRQ(ierr);
1030da1bb401SStefano Zampini 
1031da1bb401SStefano Zampini   /* BDDC specific */
10323972b0daSStefano Zampini   pcbddc->temp_solution              = 0;
1033534831adSStefano Zampini   pcbddc->original_rhs               = 0;
1034534831adSStefano Zampini   pcbddc->local_mat                  = 0;
1035534831adSStefano Zampini   pcbddc->ChangeOfBasisMatrix        = 0;
1036534831adSStefano Zampini   pcbddc->usechangeofbasis           = PETSC_TRUE;
1037534831adSStefano Zampini   pcbddc->usechangeonfaces           = PETSC_FALSE;
1038da1bb401SStefano Zampini   pcbddc->coarse_vec                 = 0;
1039da1bb401SStefano Zampini   pcbddc->coarse_rhs                 = 0;
1040da1bb401SStefano Zampini   pcbddc->coarse_ksp                 = 0;
1041da1bb401SStefano Zampini   pcbddc->coarse_phi_B               = 0;
1042da1bb401SStefano Zampini   pcbddc->coarse_phi_D               = 0;
1043da1bb401SStefano Zampini   pcbddc->vec1_P                     = 0;
1044da1bb401SStefano Zampini   pcbddc->vec1_R                     = 0;
1045da1bb401SStefano Zampini   pcbddc->vec2_R                     = 0;
1046da1bb401SStefano Zampini   pcbddc->local_auxmat1              = 0;
1047da1bb401SStefano Zampini   pcbddc->local_auxmat2              = 0;
1048da1bb401SStefano Zampini   pcbddc->R_to_B                     = 0;
1049da1bb401SStefano Zampini   pcbddc->R_to_D                     = 0;
1050da1bb401SStefano Zampini   pcbddc->ksp_D                      = 0;
1051da1bb401SStefano Zampini   pcbddc->ksp_R                      = 0;
1052da1bb401SStefano Zampini   pcbddc->local_primal_indices       = 0;
1053da1bb401SStefano Zampini   pcbddc->prec_type                  = PETSC_FALSE;
1054da1bb401SStefano Zampini   pcbddc->NeumannBoundaries          = 0;
1055da1bb401SStefano Zampini   pcbddc->ISForDofs                  = 0;
1056da1bb401SStefano Zampini   pcbddc->ISForVertices              = 0;
1057da1bb401SStefano Zampini   pcbddc->n_ISForFaces               = 0;
1058da1bb401SStefano Zampini   pcbddc->n_ISForEdges               = 0;
1059da1bb401SStefano Zampini   pcbddc->ConstraintMatrix           = 0;
1060da1bb401SStefano Zampini   pcbddc->use_nnsp_true              = PETSC_FALSE;
1061da1bb401SStefano Zampini   pcbddc->local_primal_sizes         = 0;
1062da1bb401SStefano Zampini   pcbddc->local_primal_displacements = 0;
1063da1bb401SStefano Zampini   pcbddc->replicated_local_primal_indices = 0;
1064da1bb401SStefano Zampini   pcbddc->replicated_local_primal_values  = 0;
1065da1bb401SStefano Zampini   pcbddc->coarse_loc_to_glob         = 0;
1066da1bb401SStefano Zampini   pcbddc->dbg_flag                   = PETSC_FALSE;
1067da1bb401SStefano Zampini   pcbddc->coarsening_ratio           = 8;
1068b76ba322SStefano Zampini   pcbddc->use_exact_dirichlet        = PETSC_TRUE;
1069da1bb401SStefano Zampini 
1070da1bb401SStefano Zampini   /* allocate and initialize needed graph structure */
1071da1bb401SStefano Zampini   ierr = PetscMalloc(sizeof(*mat_graph),&pcbddc->mat_graph);CHKERRQ(ierr);
1072da1bb401SStefano Zampini   pcbddc->mat_graph->xadj            = 0;
1073da1bb401SStefano Zampini   pcbddc->mat_graph->adjncy          = 0;
1074da1bb401SStefano Zampini 
1075da1bb401SStefano Zampini   /* function pointers */
1076da1bb401SStefano Zampini   pc->ops->apply               = PCApply_BDDC;
1077da1bb401SStefano Zampini   pc->ops->applytranspose      = 0;
1078da1bb401SStefano Zampini   pc->ops->setup               = PCSetUp_BDDC;
1079da1bb401SStefano Zampini   pc->ops->destroy             = PCDestroy_BDDC;
1080da1bb401SStefano Zampini   pc->ops->setfromoptions      = PCSetFromOptions_BDDC;
1081da1bb401SStefano Zampini   pc->ops->view                = 0;
1082da1bb401SStefano Zampini   pc->ops->applyrichardson     = 0;
1083da1bb401SStefano Zampini   pc->ops->applysymmetricleft  = 0;
1084da1bb401SStefano Zampini   pc->ops->applysymmetricright = 0;
1085534831adSStefano Zampini   pc->ops->presolve            = PCPreSolve_BDDC;
1086534831adSStefano Zampini   pc->ops->postsolve           = PCPostSolve_BDDC;
1087da1bb401SStefano Zampini 
1088da1bb401SStefano Zampini   /* composing function */
1089da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDirichletBoundaries_C","PCBDDCSetDirichletBoundaries_BDDC",
1090da1bb401SStefano Zampini                     PCBDDCSetDirichletBoundaries_BDDC);CHKERRQ(ierr);
1091da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNeumannBoundaries_C","PCBDDCSetNeumannBoundaries_BDDC",
1092da1bb401SStefano Zampini                     PCBDDCSetNeumannBoundaries_BDDC);CHKERRQ(ierr);
1093da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetDirichletBoundaries_C","PCBDDCGetDirichletBoundaries_BDDC",
1094da1bb401SStefano Zampini                     PCBDDCGetDirichletBoundaries_BDDC);CHKERRQ(ierr);
1095da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetNeumannBoundaries_C","PCBDDCGetNeumannBoundaries_BDDC",
1096da1bb401SStefano Zampini                     PCBDDCGetNeumannBoundaries_BDDC);CHKERRQ(ierr);
1097da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseProblemType_C","PCBDDCSetCoarseProblemType_BDDC",
1098da1bb401SStefano Zampini                     PCBDDCSetCoarseProblemType_BDDC);CHKERRQ(ierr);
1099da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDofsSplitting_C","PCBDDCSetDofsSplitting_BDDC",
1100da1bb401SStefano Zampini                     PCBDDCSetDofsSplitting_BDDC);CHKERRQ(ierr);
1101da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetLocalAdjacencyGraph_C","PCBDDCSetLocalAdjacencyGraph_BDDC",
1102da1bb401SStefano Zampini                     PCBDDCSetLocalAdjacencyGraph_BDDC);CHKERRQ(ierr);
1103534831adSStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPreSolve_C","PCPreSolve_BDDC",
1104534831adSStefano Zampini                     PCPreSolve_BDDC);CHKERRQ(ierr);
1105534831adSStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPostSolve_C","PCPostSolve_BDDC",
1106534831adSStefano Zampini                     PCPostSolve_BDDC);CHKERRQ(ierr);
11073425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCCreateFETIDPOperators_C","PCBDDCCreateFETIDPOperators_BDDC",
11083425bc38SStefano Zampini                     PCBDDCCreateFETIDPOperators_BDDC);CHKERRQ(ierr);
11093425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetRHS_C","PCBDDCMatFETIDPGetRHS_BDDC",
11103425bc38SStefano Zampini                     PCBDDCMatFETIDPGetRHS_BDDC);CHKERRQ(ierr);
11113425bc38SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCMatFETIDPGetSolution_C","PCBDDCMatFETIDPGetSolution_BDDC",
11123425bc38SStefano Zampini                     PCBDDCMatFETIDPGetSolution_BDDC);CHKERRQ(ierr);
1113da1bb401SStefano Zampini   PetscFunctionReturn(0);
1114da1bb401SStefano Zampini }
1115da1bb401SStefano Zampini EXTERN_C_END
11163425bc38SStefano Zampini 
1117da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
1118da1bb401SStefano Zampini /* All static functions from now on                                           */
1119da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
11203425bc38SStefano Zampini 
11213425bc38SStefano Zampini #undef __FUNCT__
11223425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPMatContext"
11233425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPMatContext(PC pc, FETIDPMat_ctx **fetidpmat_ctx)
11243425bc38SStefano Zampini {
11253425bc38SStefano Zampini   FETIDPMat_ctx  *newctx;
11263425bc38SStefano Zampini   PetscErrorCode ierr;
11273425bc38SStefano Zampini 
11283425bc38SStefano Zampini   PetscFunctionBegin;
11293425bc38SStefano Zampini   ierr = PetscMalloc(sizeof(*newctx),&newctx);CHKERRQ(ierr);
11303425bc38SStefano Zampini   newctx->lambda_local    = 0;
11313425bc38SStefano Zampini   newctx->temp_solution_B = 0;
11323425bc38SStefano Zampini   newctx->temp_solution_D = 0;
11333425bc38SStefano Zampini   newctx->B_delta         = 0;
11343425bc38SStefano Zampini   newctx->B_Ddelta        = 0; /* theoretically belongs to the FETIDP preconditioner */
11353425bc38SStefano Zampini   newctx->l2g_lambda      = 0;
11363425bc38SStefano Zampini   /* increase the reference count for BDDC preconditioner */
11373425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)pc);CHKERRQ(ierr);
11383425bc38SStefano Zampini   newctx->pc              = pc;
11393425bc38SStefano Zampini   *fetidpmat_ctx          = newctx;
11403425bc38SStefano Zampini   PetscFunctionReturn(0);
11413425bc38SStefano Zampini }
11423425bc38SStefano Zampini 
11433425bc38SStefano Zampini #undef __FUNCT__
11443425bc38SStefano Zampini #define __FUNCT__ "PCBDDCCreateFETIDPPCContext"
11453425bc38SStefano Zampini static PetscErrorCode PCBDDCCreateFETIDPPCContext(PC pc, FETIDPPC_ctx **fetidppc_ctx)
11463425bc38SStefano Zampini {
11473425bc38SStefano Zampini   FETIDPPC_ctx  *newctx;
11483425bc38SStefano Zampini   PetscErrorCode ierr;
11493425bc38SStefano Zampini 
11503425bc38SStefano Zampini   PetscFunctionBegin;
11513425bc38SStefano Zampini   ierr = PetscMalloc(sizeof(*newctx),&newctx);CHKERRQ(ierr);
11523425bc38SStefano Zampini   newctx->lambda_local    = 0;
11533425bc38SStefano Zampini   newctx->B_Ddelta        = 0;
11543425bc38SStefano Zampini   newctx->l2g_lambda      = 0;
11553425bc38SStefano Zampini   /* increase the reference count for BDDC preconditioner */
11563425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)pc);CHKERRQ(ierr);
11573425bc38SStefano Zampini   newctx->pc              = pc;
11583425bc38SStefano Zampini   *fetidppc_ctx           = newctx;
11593425bc38SStefano Zampini   PetscFunctionReturn(0);
11603425bc38SStefano Zampini }
11613425bc38SStefano Zampini 
11623425bc38SStefano Zampini #undef __FUNCT__
11633425bc38SStefano Zampini #define __FUNCT__ "PCBDDCDestroyFETIDPMat"
11643425bc38SStefano Zampini static PetscErrorCode PCBDDCDestroyFETIDPMat(Mat A)
11653425bc38SStefano Zampini {
11663425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
11673425bc38SStefano Zampini   PetscErrorCode ierr;
11683425bc38SStefano Zampini 
11693425bc38SStefano Zampini   PetscFunctionBegin;
11703425bc38SStefano Zampini   ierr = MatShellGetContext(A,(void**)&mat_ctx);CHKERRQ(ierr);
11713425bc38SStefano Zampini   ierr = VecDestroy(&mat_ctx->lambda_local);CHKERRQ(ierr);
11723425bc38SStefano Zampini   ierr = VecDestroy(&mat_ctx->temp_solution_D);CHKERRQ(ierr);
11733425bc38SStefano Zampini   ierr = VecDestroy(&mat_ctx->temp_solution_B);CHKERRQ(ierr);
11743425bc38SStefano Zampini   ierr = MatDestroy(&mat_ctx->B_delta);CHKERRQ(ierr);
11753425bc38SStefano Zampini   ierr = MatDestroy(&mat_ctx->B_Ddelta);CHKERRQ(ierr);
11763425bc38SStefano Zampini   ierr = VecScatterDestroy(&mat_ctx->l2g_lambda);CHKERRQ(ierr);
11773425bc38SStefano Zampini   ierr = PCDestroy(&mat_ctx->pc);CHKERRQ(ierr); /* actually it does not destroy BDDC, only decrease its reference count */
11783425bc38SStefano Zampini   ierr = PetscFree(mat_ctx);CHKERRQ(ierr);
11793425bc38SStefano Zampini   PetscFunctionReturn(0);
11803425bc38SStefano Zampini }
11813425bc38SStefano Zampini 
11823425bc38SStefano Zampini #undef __FUNCT__
11833425bc38SStefano Zampini #define __FUNCT__ "PCBDDCDestroyFETIDPPC"
11843425bc38SStefano Zampini static PetscErrorCode PCBDDCDestroyFETIDPPC(PC pc)
11853425bc38SStefano Zampini {
11863425bc38SStefano Zampini   FETIDPPC_ctx  *pc_ctx;
11873425bc38SStefano Zampini   PetscErrorCode ierr;
11883425bc38SStefano Zampini 
11893425bc38SStefano Zampini   PetscFunctionBegin;
11903425bc38SStefano Zampini   ierr = PCShellGetContext(pc,(void**)&pc_ctx);CHKERRQ(ierr);
11913425bc38SStefano Zampini   ierr = VecDestroy(&pc_ctx->lambda_local);CHKERRQ(ierr);
11923425bc38SStefano Zampini   ierr = MatDestroy(&pc_ctx->B_Ddelta);CHKERRQ(ierr);
11933425bc38SStefano Zampini   ierr = VecScatterDestroy(&pc_ctx->l2g_lambda);CHKERRQ(ierr);
11943425bc38SStefano Zampini   ierr = PCDestroy(&pc_ctx->pc);CHKERRQ(ierr); /* actually it does not destroy BDDC, only decrease its reference count */
11953425bc38SStefano Zampini   ierr = PetscFree(pc_ctx);CHKERRQ(ierr);
11963425bc38SStefano Zampini   PetscFunctionReturn(0);
11973425bc38SStefano Zampini }
11983425bc38SStefano Zampini 
11993425bc38SStefano Zampini #undef __FUNCT__
12003425bc38SStefano Zampini #define __FUNCT__ "PCBDDCSetupFETIDPMatContext"
12013425bc38SStefano Zampini static PetscErrorCode PCBDDCSetupFETIDPMatContext(FETIDPMat_ctx *fetidpmat_ctx )
12023425bc38SStefano Zampini {
12033425bc38SStefano Zampini   PetscErrorCode ierr;
12043425bc38SStefano Zampini   PC_IS          *pcis=(PC_IS*)fetidpmat_ctx->pc->data;
12053425bc38SStefano Zampini   PC_BDDC        *pcbddc=(PC_BDDC*)fetidpmat_ctx->pc->data;
12063425bc38SStefano Zampini   PCBDDCGraph    mat_graph=pcbddc->mat_graph;
12073425bc38SStefano Zampini   Mat_IS         *matis  = (Mat_IS*)fetidpmat_ctx->pc->pmat->data;
12083425bc38SStefano Zampini   MPI_Comm       comm = ((PetscObject)(fetidpmat_ctx->pc))->comm;
12093425bc38SStefano Zampini 
12103425bc38SStefano Zampini   Mat            ScalingMat;
12113425bc38SStefano Zampini   Vec            lambda_global;
12123425bc38SStefano Zampini   IS             IS_l2g_lambda;
12133425bc38SStefano Zampini 
12143425bc38SStefano Zampini   PetscBool      skip_node,fully_redundant;
12153425bc38SStefano Zampini   PetscInt       i,j,k,s,n_boundary_dofs,sum_dof_sizes,n_global_lambda,n_vertices;
12163425bc38SStefano Zampini   PetscInt       n_local_lambda,n_lambda_for_dof,dual_size,n_neg_values,n_pos_values;
12173425bc38SStefano Zampini   PetscMPIInt    rank,nprocs,partial_sum;
12183425bc38SStefano Zampini   PetscScalar    scalar_value;
12193425bc38SStefano Zampini 
12203425bc38SStefano Zampini   PetscInt       *vertex_indices,*temp_indices;
12213425bc38SStefano Zampini   PetscInt       *dual_dofs_boundary_indices,*aux_local_numbering_1,*aux_global_numbering;
12223425bc38SStefano Zampini   PetscInt       *aux_sums,*cols_B_delta,*l2g_indices;
12233425bc38SStefano Zampini   PetscMPIInt    *aux_local_numbering_2,*aux_global_numbering_mpi,*dof_sizes,*dof_displs;
12243425bc38SStefano Zampini   PetscMPIInt    *all_aux_global_numbering_mpi_1,*all_aux_global_numbering_mpi_2,*global_dofs_numbering;
12253425bc38SStefano Zampini   PetscScalar    *array,*scaling_factors,*vals_B_delta;
12263425bc38SStefano Zampini 
12273425bc38SStefano Zampini   /* For communication of scaling factors */
12283425bc38SStefano Zampini   PetscInt       *ptrs_buffer,neigh_position;
12293425bc38SStefano Zampini   PetscScalar    **all_factors,*send_buffer,*recv_buffer;
12303425bc38SStefano Zampini   MPI_Request    *send_reqs,*recv_reqs;
12313425bc38SStefano Zampini 
12323425bc38SStefano Zampini   /* tests */
12333425bc38SStefano Zampini   Vec            test_vec;
12343425bc38SStefano Zampini   PetscBool      test_fetidp;
12353425bc38SStefano Zampini   PetscViewer    viewer;
12363425bc38SStefano Zampini 
12373425bc38SStefano Zampini   PetscFunctionBegin;
12383425bc38SStefano Zampini   ierr = MPI_Comm_rank(comm,&rank);CHKERRQ(ierr);
12393425bc38SStefano Zampini   ierr = MPI_Comm_size(comm,&nprocs);CHKERRQ(ierr);
12403425bc38SStefano Zampini 
12413425bc38SStefano Zampini   /* Default type of lagrange multipliers is non-redundant */
12423425bc38SStefano Zampini   fully_redundant = PETSC_FALSE;
12433425bc38SStefano Zampini   ierr = PetscOptionsGetBool(PETSC_NULL,"-fetidp_fullyredundant",&fully_redundant,PETSC_NULL);CHKERRQ(ierr);
12443425bc38SStefano Zampini 
12453425bc38SStefano Zampini   /* Evaluate local and global number of lagrange multipliers */
12463425bc38SStefano Zampini   ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
12473425bc38SStefano Zampini   n_local_lambda = 0;
12483425bc38SStefano Zampini   partial_sum = 0;
12493425bc38SStefano Zampini   n_boundary_dofs = 0;
12503425bc38SStefano Zampini   s = 0;
12513425bc38SStefano Zampini   n_vertices = 0;
12523425bc38SStefano Zampini   /* Get Vertices used to define the BDDC */
12533425bc38SStefano Zampini   ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(*vertex_indices),&vertex_indices);CHKERRQ(ierr);
12543425bc38SStefano Zampini   for(i=0;i<pcbddc->local_primal_size;i++) {
12553425bc38SStefano Zampini     ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&j,(const PetscInt**)&temp_indices,PETSC_NULL);CHKERRQ(ierr);
12563425bc38SStefano Zampini     if(j == 1) {
12573425bc38SStefano Zampini       vertex_indices[n_vertices]=temp_indices[0];
12583425bc38SStefano Zampini       n_vertices++;
12593425bc38SStefano Zampini     }
12603425bc38SStefano Zampini     ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&j,(const PetscInt**)&temp_indices,PETSC_NULL);CHKERRQ(ierr);
12613425bc38SStefano Zampini   }
12623425bc38SStefano Zampini   dual_size = pcis->n_B-n_vertices;
12633425bc38SStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*dual_dofs_boundary_indices),&dual_dofs_boundary_indices);CHKERRQ(ierr);
12643425bc38SStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*aux_local_numbering_1),&aux_local_numbering_1);CHKERRQ(ierr);
12653425bc38SStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*aux_local_numbering_2),&aux_local_numbering_2);CHKERRQ(ierr);
12663425bc38SStefano Zampini 
12673425bc38SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
12683425bc38SStefano Zampini   for(i=0;i<pcis->n;i++){
12693425bc38SStefano Zampini     j = mat_graph->count[i]; /* RECALL: mat_graph->count[i] does not count myself */
1270c6582918SStefano Zampini     k = 0;
1271c6582918SStefano Zampini     if(j > 0) {
12723425bc38SStefano Zampini       k = (mat_graph->neighbours_set[i][0] == -1 ?  1 : 0);
1273c6582918SStefano Zampini     }
12743425bc38SStefano Zampini     j = j - k ;
12753425bc38SStefano Zampini     if( j > 0 ) { n_boundary_dofs++; }
12763425bc38SStefano Zampini 
12773425bc38SStefano Zampini     skip_node = PETSC_FALSE;
1278c6582918SStefano Zampini     if( s < n_vertices && vertex_indices[s]==i) { /* it works for a sorted set of vertices */
12793425bc38SStefano Zampini       skip_node = PETSC_TRUE;
12803425bc38SStefano Zampini       s++;
12813425bc38SStefano Zampini     }
12823425bc38SStefano Zampini     if(j < 1) {skip_node = PETSC_TRUE;}
12833425bc38SStefano Zampini     if( !skip_node ) {
12843425bc38SStefano Zampini       if(fully_redundant) {
12853425bc38SStefano Zampini         /* fully redundant set of lagrange multipliers */
12863425bc38SStefano Zampini         n_lambda_for_dof = (j*(j+1))/2;
12873425bc38SStefano Zampini       } else {
12883425bc38SStefano Zampini         n_lambda_for_dof = j;
12893425bc38SStefano Zampini       }
12903425bc38SStefano Zampini       n_local_lambda += j;
12913425bc38SStefano Zampini       /* needed to evaluate global number of lagrange multipliers */
12923425bc38SStefano Zampini       array[i]=(1.0*n_lambda_for_dof)/(j+1.0); /* already scaled for the next global sum */
12933425bc38SStefano Zampini       /* store some data needed */
12943425bc38SStefano Zampini       dual_dofs_boundary_indices[partial_sum] = n_boundary_dofs-1;
12953425bc38SStefano Zampini       aux_local_numbering_1[partial_sum] = i;
12963425bc38SStefano Zampini       aux_local_numbering_2[partial_sum] = (PetscMPIInt)n_lambda_for_dof;
12973425bc38SStefano Zampini       partial_sum++;
12983425bc38SStefano Zampini     }
12993425bc38SStefano Zampini   }
13003425bc38SStefano Zampini   /*printf("I found %d local lambda dofs\n",n_local_lambda);
13013425bc38SStefano Zampini   printf("I found %d boundary dofs (should be %d)\n",n_boundary_dofs,pcis->n_B);
13023425bc38SStefano Zampini   printf("Partial sum %d should be %d\n",partial_sum,dual_size);*/
13033425bc38SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
13043425bc38SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
13053425bc38SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
13063425bc38SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
13073425bc38SStefano Zampini   ierr = VecSum(pcis->vec1_global,&scalar_value);CHKERRQ(ierr);
13083425bc38SStefano Zampini   fetidpmat_ctx->n_lambda = (PetscInt) scalar_value;
13093425bc38SStefano Zampini   /* printf("I found %d global multipliers (%f)\n",fetidpmat_ctx->n_lambda,scalar_value); */
13103425bc38SStefano Zampini   ierr = VecCreate(PETSC_COMM_SELF,&fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
13113425bc38SStefano Zampini   ierr = VecSetSizes(fetidpmat_ctx->lambda_local,n_local_lambda,n_local_lambda);CHKERRQ(ierr);
13123425bc38SStefano Zampini   ierr = VecSetType(fetidpmat_ctx->lambda_local,VECSEQ);CHKERRQ(ierr);
13133425bc38SStefano Zampini   ierr = VecCreate(comm,&lambda_global);CHKERRQ(ierr);
13143425bc38SStefano Zampini   ierr = VecSetSizes(lambda_global,PETSC_DECIDE,fetidpmat_ctx->n_lambda);CHKERRQ(ierr);
13153425bc38SStefano Zampini   ierr = VecSetType(lambda_global,VECMPI);CHKERRQ(ierr);
13163425bc38SStefano Zampini 
13173425bc38SStefano Zampini   /* compute global ordering of lagrange multipliers and associate l2g map */
13183425bc38SStefano Zampini 
13193425bc38SStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*aux_global_numbering),&aux_global_numbering);CHKERRQ(ierr);
13203425bc38SStefano Zampini   ierr = PetscMalloc(dual_size*sizeof(*aux_global_numbering_mpi),&aux_global_numbering_mpi);CHKERRQ(ierr);
13213425bc38SStefano Zampini   j = (rank == 0 ? nprocs : 0);
13223425bc38SStefano Zampini   ierr = PetscMalloc(j*sizeof(*dof_sizes),&dof_sizes);CHKERRQ(ierr);
13233425bc38SStefano Zampini   ierr = PetscMalloc(j*sizeof(*dof_displs),&dof_displs);CHKERRQ(ierr);
13243425bc38SStefano Zampini   ierr = ISLocalToGlobalMappingApply(matis->mapping,dual_size,aux_local_numbering_1,aux_global_numbering);CHKERRQ(ierr);
13253425bc38SStefano Zampini   ierr = MPI_Gather(&dual_size,1,MPIU_INT,dof_sizes,1,MPIU_INT,0,comm);CHKERRQ(ierr);
13263425bc38SStefano Zampini   sum_dof_sizes=0;
13273425bc38SStefano Zampini   if ( rank == 0 ) {
13283425bc38SStefano Zampini     dof_displs[0]=0;
13293425bc38SStefano Zampini     sum_dof_sizes=dual_size;
13303425bc38SStefano Zampini     for(i=1;i<nprocs;i++) {
13313425bc38SStefano Zampini       dof_displs[i] = dof_displs[i-1]+dof_sizes[i-1];
13323425bc38SStefano Zampini       sum_dof_sizes += dof_sizes[i];
13333425bc38SStefano Zampini     }
13343425bc38SStefano Zampini   }
13353425bc38SStefano Zampini   for(i=0;i<dual_size;i++) {
13363425bc38SStefano Zampini     aux_global_numbering_mpi[i]=(PetscMPIInt)aux_global_numbering[i];
13373425bc38SStefano Zampini   }
13383425bc38SStefano Zampini   ierr = PetscMalloc(sum_dof_sizes*sizeof(*all_aux_global_numbering_mpi_1),&all_aux_global_numbering_mpi_1);CHKERRQ(ierr);
13393425bc38SStefano Zampini   ierr = PetscMalloc(sum_dof_sizes*sizeof(*all_aux_global_numbering_mpi_2),&all_aux_global_numbering_mpi_2);CHKERRQ(ierr);
13403425bc38SStefano Zampini   ierr = MPI_Gatherv(aux_global_numbering_mpi,dual_size,MPIU_INT,all_aux_global_numbering_mpi_1,dof_sizes,dof_displs,MPIU_INT,0,comm);CHKERRQ(ierr);
13413425bc38SStefano Zampini   ierr = MPI_Gatherv(aux_local_numbering_2,dual_size,MPIU_INT,all_aux_global_numbering_mpi_2,dof_sizes,dof_displs,MPIU_INT,0,comm);CHKERRQ(ierr);
13423425bc38SStefano Zampini 
13433425bc38SStefano Zampini   ierr = PetscMalloc(fetidpmat_ctx->n_lambda*sizeof(*global_dofs_numbering),&global_dofs_numbering);CHKERRQ(ierr);
13443425bc38SStefano Zampini   if( rank == 0 ) {
13453425bc38SStefano Zampini     ierr = PetscSortMPIIntWithArray(sum_dof_sizes,all_aux_global_numbering_mpi_1,all_aux_global_numbering_mpi_2);CHKERRQ(ierr);
13463425bc38SStefano Zampini     j=-1;
13473425bc38SStefano Zampini     partial_sum = 0;
13483425bc38SStefano Zampini     for(i=0;i<sum_dof_sizes;i++) {
13493425bc38SStefano Zampini       if(j != all_aux_global_numbering_mpi_1[i] ) {
13503425bc38SStefano Zampini         j=all_aux_global_numbering_mpi_1[i];
13513425bc38SStefano Zampini         for(k=0;k<all_aux_global_numbering_mpi_2[i];k++) {
13523425bc38SStefano Zampini           global_dofs_numbering[partial_sum+k]=all_aux_global_numbering_mpi_1[i];
13533425bc38SStefano Zampini         }
13543425bc38SStefano Zampini         partial_sum += all_aux_global_numbering_mpi_2[i];
13553425bc38SStefano Zampini       }
13563425bc38SStefano Zampini     }
13573425bc38SStefano Zampini     /* printf("Partial sum for global dofs %d should be %d\n",partial_sum,fetidpmat_ctx->n_lambda); */
13583425bc38SStefano Zampini   }
13593425bc38SStefano Zampini   ierr = MPI_Bcast(global_dofs_numbering,fetidpmat_ctx->n_lambda,MPIU_INT,0,comm);CHKERRQ(ierr);
13603425bc38SStefano Zampini 
13613425bc38SStefano Zampini   /* init data for scaling factors exchange */
13623425bc38SStefano Zampini   partial_sum = 0;
13633425bc38SStefano Zampini   j = 0;
13643425bc38SStefano Zampini   ierr = PetscMalloc( pcis->n_neigh*sizeof(PetscInt),&ptrs_buffer);CHKERRQ(ierr);
13653425bc38SStefano Zampini   ierr = PetscMalloc( (pcis->n_neigh-1)*sizeof(MPI_Request),&send_reqs);CHKERRQ(ierr);
13663425bc38SStefano Zampini   ierr = PetscMalloc( (pcis->n_neigh-1)*sizeof(MPI_Request),&recv_reqs);CHKERRQ(ierr);
13673425bc38SStefano Zampini   ierr = PetscMalloc( pcis->n*sizeof(PetscScalar*),&all_factors);CHKERRQ(ierr);
13683425bc38SStefano Zampini   ptrs_buffer[0]=0;
13693425bc38SStefano Zampini   for(i=1;i<pcis->n_neigh;i++) {
13703425bc38SStefano Zampini     partial_sum += pcis->n_shared[i];
13713425bc38SStefano Zampini     ptrs_buffer[i] = ptrs_buffer[i-1]+pcis->n_shared[i];
13723425bc38SStefano Zampini   }
13733425bc38SStefano Zampini   ierr = PetscMalloc( partial_sum*sizeof(PetscScalar),&send_buffer);CHKERRQ(ierr);
13743425bc38SStefano Zampini   ierr = PetscMalloc( partial_sum*sizeof(PetscScalar),&recv_buffer);CHKERRQ(ierr);
13753425bc38SStefano Zampini   ierr = PetscMalloc( partial_sum*sizeof(PetscScalar),&all_factors[0]);CHKERRQ(ierr);
13763425bc38SStefano Zampini   for(i=0;i<pcis->n-1;i++) {
13773425bc38SStefano Zampini     j = mat_graph->count[i];
13783425bc38SStefano Zampini     if(j>0) {
13793425bc38SStefano Zampini       k = (mat_graph->neighbours_set[i][0] == -1 ?  1 : 0);
13803425bc38SStefano Zampini       j = j - k;
13813425bc38SStefano Zampini     }
13823425bc38SStefano Zampini     all_factors[i+1]=all_factors[i]+j;
13833425bc38SStefano Zampini   }
13843425bc38SStefano Zampini   /* scatter B scaling to N vec */
13853425bc38SStefano Zampini   ierr = VecScatterBegin(pcis->N_to_B,pcis->D,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
13863425bc38SStefano Zampini   ierr = VecScatterEnd  (pcis->N_to_B,pcis->D,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
13873425bc38SStefano Zampini   /* communications */
13883425bc38SStefano Zampini   k = 0;
13893425bc38SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
13903425bc38SStefano Zampini   for(i=1;i<pcis->n_neigh;i++) {
13913425bc38SStefano Zampini     for(j=0;j<pcis->n_shared[i];j++) {
13923425bc38SStefano Zampini       send_buffer[ptrs_buffer[i-1]+j]=array[pcis->shared[i][j]];
13933425bc38SStefano Zampini     }
13943425bc38SStefano Zampini     j = ptrs_buffer[i]-ptrs_buffer[i-1];
13953425bc38SStefano Zampini     ierr = MPI_Isend(&send_buffer[ptrs_buffer[i-1]],j,MPIU_SCALAR,pcis->neigh[i],0,comm,&send_reqs[k]);CHKERRQ(ierr);
13963425bc38SStefano Zampini     ierr = MPI_Irecv(&recv_buffer[ptrs_buffer[i-1]],j,MPIU_SCALAR,pcis->neigh[i],0,comm,&recv_reqs[k]);CHKERRQ(ierr);
13973425bc38SStefano Zampini     k++;
13983425bc38SStefano Zampini   }
13993425bc38SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
14003425bc38SStefano Zampini   ierr = MPI_Waitall(k,recv_reqs,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
14013425bc38SStefano Zampini   ierr = MPI_Waitall(k,send_reqs,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
14023425bc38SStefano Zampini   /* put values in correct places */
14033425bc38SStefano Zampini   for(i=1;i<pcis->n_neigh;i++) {
14043425bc38SStefano Zampini     for(j=0;j<pcis->n_shared[i];j++) {
14053425bc38SStefano Zampini       k = pcis->shared[i][j];
14063425bc38SStefano Zampini       neigh_position = 0;
14073425bc38SStefano Zampini       while(mat_graph->neighbours_set[k][neigh_position] != pcis->neigh[i]) {neigh_position++;}
14083425bc38SStefano Zampini       s = (mat_graph->neighbours_set[k][0] == -1 ?  1 : 0);
14093425bc38SStefano Zampini       neigh_position = neigh_position - s;
14103425bc38SStefano Zampini       all_factors[k][neigh_position]=recv_buffer[ptrs_buffer[i-1]+j];
14113425bc38SStefano Zampini     }
14123425bc38SStefano Zampini   }
14133425bc38SStefano Zampini   ierr = PetscFree(send_reqs);CHKERRQ(ierr);
14143425bc38SStefano Zampini   ierr = PetscFree(recv_reqs);CHKERRQ(ierr);
14153425bc38SStefano Zampini   ierr = PetscFree(send_buffer);CHKERRQ(ierr);
14163425bc38SStefano Zampini   ierr = PetscFree(recv_buffer);CHKERRQ(ierr);
14173425bc38SStefano Zampini   ierr = PetscFree(ptrs_buffer);CHKERRQ(ierr);
14183425bc38SStefano Zampini 
14193425bc38SStefano Zampini   /* Compute B and B_delta (local actions) */
14203425bc38SStefano Zampini   ierr = PetscMalloc(pcis->n_neigh*sizeof(*aux_sums),&aux_sums);CHKERRQ(ierr);
14213425bc38SStefano Zampini   ierr = PetscMalloc(n_local_lambda*sizeof(*l2g_indices),&l2g_indices);CHKERRQ(ierr);
14223425bc38SStefano Zampini   ierr = PetscMalloc(n_local_lambda*sizeof(*vals_B_delta),&vals_B_delta);CHKERRQ(ierr);
14233425bc38SStefano Zampini   ierr = PetscMalloc(n_local_lambda*sizeof(*cols_B_delta),&cols_B_delta);CHKERRQ(ierr);
14243425bc38SStefano Zampini   ierr = PetscMalloc(n_local_lambda*sizeof(*scaling_factors),&scaling_factors);CHKERRQ(ierr);
14253425bc38SStefano Zampini   n_global_lambda=0;
14263425bc38SStefano Zampini   partial_sum=0;
14273425bc38SStefano Zampini   for(i=0;i<dual_size;i++) {
14283425bc38SStefano Zampini     while( global_dofs_numbering[n_global_lambda] != aux_global_numbering_mpi[i] ) { n_global_lambda++; }
14293425bc38SStefano Zampini     j = mat_graph->count[aux_local_numbering_1[i]];
14303425bc38SStefano Zampini     k = (mat_graph->neighbours_set[aux_local_numbering_1[i]][0] == -1 ?  1 : 0);
14313425bc38SStefano Zampini     j = j - k;
14323425bc38SStefano Zampini     aux_sums[0]=0;
14333425bc38SStefano Zampini     for(s=1;s<j;s++) {
14343425bc38SStefano Zampini       aux_sums[s]=aux_sums[s-1]+j-s+1;
14353425bc38SStefano Zampini     }
14363425bc38SStefano Zampini     array = all_factors[aux_local_numbering_1[i]];
14373425bc38SStefano Zampini     n_neg_values = 0;
14383425bc38SStefano Zampini     while(n_neg_values < j && mat_graph->neighbours_set[aux_local_numbering_1[i]][n_neg_values+k] < rank) {n_neg_values++;}
14393425bc38SStefano Zampini     n_pos_values = j - n_neg_values;
14403425bc38SStefano Zampini     if(fully_redundant) {
14413425bc38SStefano Zampini       for(s=0;s<n_neg_values;s++) {
14423425bc38SStefano Zampini         l2g_indices    [partial_sum+s]=aux_sums[s]+n_neg_values-s-1+n_global_lambda;
14433425bc38SStefano Zampini         cols_B_delta   [partial_sum+s]=dual_dofs_boundary_indices[i];
14443425bc38SStefano Zampini         vals_B_delta   [partial_sum+s]=-1.0;
14453425bc38SStefano Zampini         scaling_factors[partial_sum+s]=array[s];
14463425bc38SStefano Zampini       }
14473425bc38SStefano Zampini       for(s=0;s<n_pos_values;s++) {
14483425bc38SStefano Zampini         l2g_indices    [partial_sum+s+n_neg_values]=aux_sums[n_neg_values]+s+n_global_lambda;
14493425bc38SStefano Zampini         cols_B_delta   [partial_sum+s+n_neg_values]=dual_dofs_boundary_indices[i];
14503425bc38SStefano Zampini         vals_B_delta   [partial_sum+s+n_neg_values]=1.0;
14513425bc38SStefano Zampini         scaling_factors[partial_sum+s+n_neg_values]=array[s+n_neg_values];
14523425bc38SStefano Zampini       }
14533425bc38SStefano Zampini       partial_sum += j;
14543425bc38SStefano Zampini     } else {
14553425bc38SStefano Zampini       /* l2g_indices and default cols and vals of B_delta */
14563425bc38SStefano Zampini       for(s=0;s<j;s++) {
14573425bc38SStefano Zampini         l2g_indices    [partial_sum+s]=n_global_lambda+s;
14583425bc38SStefano Zampini         cols_B_delta   [partial_sum+s]=dual_dofs_boundary_indices[i];
14593425bc38SStefano Zampini         vals_B_delta   [partial_sum+s]=0.0;
14603425bc38SStefano Zampini       }
14613425bc38SStefano Zampini       /* B_delta */
14623425bc38SStefano Zampini       if( n_neg_values > 0 ) { /* there's a rank next to me to the left */
14633425bc38SStefano Zampini         vals_B_delta   [partial_sum+n_neg_values-1]=-1.0;
14643425bc38SStefano Zampini       }
14653425bc38SStefano Zampini       if ( n_neg_values < j ) { /* there's a rank next to me to the right */
14663425bc38SStefano Zampini         vals_B_delta   [partial_sum+n_neg_values]=1.0;
14673425bc38SStefano Zampini       }
14683425bc38SStefano Zampini       /* scaling as in Klawonn-Widlund 1999*/
14693425bc38SStefano Zampini       for(s=0;s<n_neg_values;s++) {
14703425bc38SStefano Zampini         scalar_value = 0.0;
14713425bc38SStefano Zampini         for(k=0;k<s+1;k++) {
14723425bc38SStefano Zampini           scalar_value += array[k];
14733425bc38SStefano Zampini         }
14743425bc38SStefano Zampini         scalar_value = -scalar_value;
14753425bc38SStefano Zampini         scaling_factors[partial_sum+s] = scalar_value;
14763425bc38SStefano Zampini       }
14773425bc38SStefano Zampini       for(s=0;s<n_pos_values;s++) {
14783425bc38SStefano Zampini         scalar_value = 0.0;
14793425bc38SStefano Zampini         for(k=s+n_neg_values;k<j;k++) {
14803425bc38SStefano Zampini           scalar_value += array[k];
14813425bc38SStefano Zampini         }
14823425bc38SStefano Zampini         scaling_factors[partial_sum+s+n_neg_values] = scalar_value;
14833425bc38SStefano Zampini       }
14843425bc38SStefano Zampini       partial_sum += j;
14853425bc38SStefano Zampini     }
14863425bc38SStefano Zampini   }
14873425bc38SStefano Zampini   ierr = PetscFree(all_factors[0]);CHKERRQ(ierr);
14883425bc38SStefano Zampini   ierr = PetscFree(all_factors);CHKERRQ(ierr);
14893425bc38SStefano Zampini   /* printf("I found %d local lambda dofs when numbering them (should be %d)\n",partial_sum,n_local_lambda); */
14903425bc38SStefano Zampini   ierr = ISCreateGeneral(comm,n_local_lambda,l2g_indices,PETSC_OWN_POINTER,&IS_l2g_lambda);CHKERRQ(ierr);
14913425bc38SStefano Zampini   ierr = VecScatterCreate(fetidpmat_ctx->lambda_local,(IS)0,lambda_global,IS_l2g_lambda,&fetidpmat_ctx->l2g_lambda);CHKERRQ(ierr);
14923425bc38SStefano Zampini 
14933425bc38SStefano Zampini   /* Create local part of B_delta */
14943425bc38SStefano Zampini   ierr = MatCreate(PETSC_COMM_SELF,&fetidpmat_ctx->B_delta);
14953425bc38SStefano Zampini   ierr = MatSetSizes(fetidpmat_ctx->B_delta,n_local_lambda,pcis->n_B,n_local_lambda,pcis->n_B);CHKERRQ(ierr);
14963425bc38SStefano Zampini   ierr = MatSetType(fetidpmat_ctx->B_delta,MATSEQAIJ);CHKERRQ(ierr);
14973425bc38SStefano Zampini   ierr = MatSeqAIJSetPreallocation(fetidpmat_ctx->B_delta,1,PETSC_NULL);CHKERRQ(ierr);
14983425bc38SStefano Zampini   ierr = MatSetOption(fetidpmat_ctx->B_delta,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr);
14993425bc38SStefano Zampini   for(i=0;i<n_local_lambda;i++) {
15003425bc38SStefano Zampini     ierr = MatSetValue(fetidpmat_ctx->B_delta,i,cols_B_delta[i],vals_B_delta[i],INSERT_VALUES);CHKERRQ(ierr);
15013425bc38SStefano Zampini   }
15023425bc38SStefano Zampini   ierr = MatAssemblyBegin(fetidpmat_ctx->B_delta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
15033425bc38SStefano Zampini   ierr = MatAssemblyEnd  (fetidpmat_ctx->B_delta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
15043425bc38SStefano Zampini 
15053425bc38SStefano Zampini   if(fully_redundant) {
15063425bc38SStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&ScalingMat);
15073425bc38SStefano Zampini     ierr = MatSetSizes(ScalingMat,n_local_lambda,n_local_lambda,n_local_lambda,n_local_lambda);CHKERRQ(ierr);
15083425bc38SStefano Zampini     ierr = MatSetType(ScalingMat,MATSEQAIJ);CHKERRQ(ierr);
15093425bc38SStefano Zampini     ierr = MatSeqAIJSetPreallocation(ScalingMat,1,PETSC_NULL);CHKERRQ(ierr);
15103425bc38SStefano Zampini     for(i=0;i<n_local_lambda;i++) {
15113425bc38SStefano Zampini       ierr = MatSetValue(ScalingMat,i,i,scaling_factors[i],INSERT_VALUES);CHKERRQ(ierr);
15123425bc38SStefano Zampini     }
15133425bc38SStefano Zampini     ierr = MatAssemblyBegin(ScalingMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
15143425bc38SStefano Zampini     ierr = MatAssemblyEnd  (ScalingMat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
15153425bc38SStefano Zampini     ierr = MatMatMult(ScalingMat,fetidpmat_ctx->B_delta,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&fetidpmat_ctx->B_Ddelta);CHKERRQ(ierr);
15163425bc38SStefano Zampini     ierr = MatDestroy(&ScalingMat);CHKERRQ(ierr);
15173425bc38SStefano Zampini   } else {
15183425bc38SStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&fetidpmat_ctx->B_Ddelta);
15193425bc38SStefano Zampini     ierr = MatSetSizes(fetidpmat_ctx->B_Ddelta,n_local_lambda,pcis->n_B,n_local_lambda,pcis->n_B);CHKERRQ(ierr);
15203425bc38SStefano Zampini     ierr = MatSetType(fetidpmat_ctx->B_Ddelta,MATSEQAIJ);CHKERRQ(ierr);
15213425bc38SStefano Zampini     ierr = MatSeqAIJSetPreallocation(fetidpmat_ctx->B_Ddelta,1,PETSC_NULL);CHKERRQ(ierr);
15223425bc38SStefano Zampini     for(i=0;i<n_local_lambda;i++) {
15233425bc38SStefano Zampini       ierr = MatSetValue(fetidpmat_ctx->B_Ddelta,i,cols_B_delta[i],scaling_factors[i],INSERT_VALUES);CHKERRQ(ierr);
15243425bc38SStefano Zampini     }
15253425bc38SStefano Zampini     ierr = MatAssemblyBegin(fetidpmat_ctx->B_Ddelta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
15263425bc38SStefano Zampini     ierr = MatAssemblyEnd  (fetidpmat_ctx->B_Ddelta,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
15273425bc38SStefano Zampini   }
15283425bc38SStefano Zampini 
15293425bc38SStefano Zampini   /* Create some vectors needed by fetidp */
15303425bc38SStefano Zampini   ierr = VecDuplicate(pcis->vec1_B,&fetidpmat_ctx->temp_solution_B);CHKERRQ(ierr);
15313425bc38SStefano Zampini   ierr = VecDuplicate(pcis->vec1_D,&fetidpmat_ctx->temp_solution_D);CHKERRQ(ierr);
15323425bc38SStefano Zampini 
15333425bc38SStefano Zampini   test_fetidp = PETSC_FALSE;
15343425bc38SStefano Zampini   ierr = PetscOptionsGetBool(PETSC_NULL,"-fetidp_check",&test_fetidp,PETSC_NULL);CHKERRQ(ierr);
15353425bc38SStefano Zampini 
15363425bc38SStefano Zampini   if(test_fetidp) {
15373425bc38SStefano Zampini 
15383425bc38SStefano Zampini     ierr = PetscViewerASCIIGetStdout(((PetscObject)(fetidpmat_ctx->pc))->comm,&viewer);CHKERRQ(ierr);
15393425bc38SStefano Zampini     ierr = PetscViewerASCIISynchronizedAllow(viewer,PETSC_TRUE);CHKERRQ(ierr);
15403425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"----------FETI_DP TESTS--------------\n");CHKERRQ(ierr);
15413425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"All tests should return zero!\n");CHKERRQ(ierr);
15423425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"FETIDP MAT context in the ");CHKERRQ(ierr);
15433425bc38SStefano Zampini     if(fully_redundant) {
15443425bc38SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"fully redundant case for lagrange multipliers.\n");CHKERRQ(ierr);
15453425bc38SStefano Zampini     } else {
15463425bc38SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Non-fully redundant case for lagrange multiplier.\n");CHKERRQ(ierr);
15473425bc38SStefano Zampini     }
15483425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
15493425bc38SStefano Zampini 
15503425bc38SStefano Zampini     /******************************************************************/
15513425bc38SStefano Zampini     /* TEST A/B: Test numbering of global lambda dofs             */
15523425bc38SStefano Zampini     /******************************************************************/
15533425bc38SStefano Zampini 
15543425bc38SStefano Zampini     ierr = VecDuplicate(fetidpmat_ctx->lambda_local,&test_vec);CHKERRQ(ierr);
15553425bc38SStefano Zampini     ierr = VecSet(lambda_global,1.0);CHKERRQ(ierr);
15563425bc38SStefano Zampini     ierr = VecSet(test_vec,1.0);CHKERRQ(ierr);
15573425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
15583425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
15593425bc38SStefano Zampini     scalar_value = -1.0;
15603425bc38SStefano Zampini     ierr = VecAXPY(test_vec,scalar_value,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
15613425bc38SStefano Zampini     ierr = VecNorm(test_vec,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
15623425bc38SStefano Zampini     ierr = VecDestroy(&test_vec);CHKERRQ(ierr);
15633425bc38SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"A[%04d]: CHECK glob to loc: % 1.14e\n",rank,scalar_value);CHKERRQ(ierr);
15643425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
15653425bc38SStefano Zampini     if(fully_redundant) {
15663425bc38SStefano Zampini       ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr);
15673425bc38SStefano Zampini       ierr = VecSet(fetidpmat_ctx->lambda_local,0.5);CHKERRQ(ierr);
15683425bc38SStefano Zampini       ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
15693425bc38SStefano Zampini       ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
15703425bc38SStefano Zampini       ierr = VecSum(lambda_global,&scalar_value);CHKERRQ(ierr);
15713425bc38SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"B[%04d]: CHECK loc to glob: % 1.14e\n",rank,scalar_value-fetidpmat_ctx->n_lambda);CHKERRQ(ierr);
15723425bc38SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
15733425bc38SStefano Zampini     }
15743425bc38SStefano Zampini 
15753425bc38SStefano Zampini     /******************************************************************/
15763425bc38SStefano Zampini     /* TEST C: It should hold B_delta*w=0, w\in\widehat{W}            */
15773425bc38SStefano Zampini     /* This is the meaning of the B matrix                            */
15783425bc38SStefano Zampini     /******************************************************************/
15793425bc38SStefano Zampini 
15803425bc38SStefano Zampini     ierr = VecSetRandom(pcis->vec1_N,PETSC_NULL);CHKERRQ(ierr);
15813425bc38SStefano Zampini     ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
15823425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
15833425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
15843425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
15853425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
15863425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
15873425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
15883425bc38SStefano Zampini     /* Action of B_delta */
15893425bc38SStefano Zampini     ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
15903425bc38SStefano Zampini     ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr);
15913425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
15923425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
15933425bc38SStefano Zampini     ierr = VecNorm(lambda_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
15943425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"C[coll]: CHECK infty norm of B_delta*w (w continuous): % 1.14e\n",scalar_value);CHKERRQ(ierr);
15953425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
15963425bc38SStefano Zampini 
15973425bc38SStefano Zampini     /******************************************************************/
15983425bc38SStefano Zampini     /* TEST D: It should hold E_Dw = w - P_Dw, w\in\widetilde{W}     */
15993425bc38SStefano Zampini     /* E_D = R_D^TR                                                   */
16003425bc38SStefano Zampini     /* P_D = B_{D,delta}^T B_{delta}                                  */
16013425bc38SStefano Zampini     /* eq.44 Mandel Tezaur and Dohrmann 2005                          */
16023425bc38SStefano Zampini     /******************************************************************/
16033425bc38SStefano Zampini 
16043425bc38SStefano Zampini     /* compute a random vector in \widetilde{W} */
16053425bc38SStefano Zampini     ierr = VecSetRandom(pcis->vec1_N,PETSC_NULL);CHKERRQ(ierr);
16063425bc38SStefano Zampini     scalar_value = 0.0;  /* set zero at vertices */
16073425bc38SStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
16083425bc38SStefano Zampini     for(i=0;i<n_vertices;i++) { array[vertex_indices[i]]=scalar_value; }
16093425bc38SStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
16103425bc38SStefano Zampini     /* store w for final comparison */
16113425bc38SStefano Zampini     ierr = VecDuplicate(pcis->vec1_B,&test_vec);CHKERRQ(ierr);
16123425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,test_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
16133425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,test_vec,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
16143425bc38SStefano Zampini 
16153425bc38SStefano Zampini     /* Jump operator P_D : results stored in pcis->vec1_B */
16163425bc38SStefano Zampini 
16173425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
16183425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
16193425bc38SStefano Zampini     /* Action of B_delta */
16203425bc38SStefano Zampini     ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
16213425bc38SStefano Zampini     ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr);
16223425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
16233425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
16243425bc38SStefano Zampini     /* Action of B_Ddelta^T */
16253425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
16263425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
16273425bc38SStefano Zampini     ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
16283425bc38SStefano Zampini 
16293425bc38SStefano Zampini     /* Average operator E_D : results stored in pcis->vec2_B */
16303425bc38SStefano Zampini 
16313425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
16323425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
16333425bc38SStefano Zampini     ierr = VecPointwiseMult(pcis->vec2_B,pcis->D,pcis->vec2_B);CHKERRQ(ierr);
16343425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec2_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
16353425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec2_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
16363425bc38SStefano Zampini     ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
16373425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
16383425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
16393425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
16403425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
16413425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
16423425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec2_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
16433425bc38SStefano Zampini 
16443425bc38SStefano Zampini     /* test E_D=I-P_D */
16453425bc38SStefano Zampini     scalar_value = 1.0;
16463425bc38SStefano Zampini     ierr = VecAXPY(pcis->vec1_B,scalar_value,pcis->vec2_B);CHKERRQ(ierr);
16473425bc38SStefano Zampini     scalar_value = -1.0;
16483425bc38SStefano Zampini     ierr = VecAXPY(pcis->vec1_B,scalar_value,test_vec);CHKERRQ(ierr);
16493425bc38SStefano Zampini     ierr = VecNorm(pcis->vec1_B,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
16503425bc38SStefano Zampini     ierr = VecDestroy(&test_vec);CHKERRQ(ierr);
16513425bc38SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"D[%04d] CHECK infty norm of E_D + P_D - I: % 1.14e\n",rank,scalar_value);CHKERRQ(ierr);
16523425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
16533425bc38SStefano Zampini 
16543425bc38SStefano Zampini     /******************************************************************/
16553425bc38SStefano Zampini     /* TEST E: It should hold R_D^TP_Dw=0, w\in\widetilde{W}          */
16563425bc38SStefano Zampini     /* eq.48 Mandel Tezaur and Dohrmann 2005                          */
16573425bc38SStefano Zampini     /******************************************************************/
16583425bc38SStefano Zampini 
16593425bc38SStefano Zampini     ierr = VecSetRandom(pcis->vec1_N,PETSC_NULL);CHKERRQ(ierr);
16603425bc38SStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
16613425bc38SStefano Zampini     scalar_value = 0.0;  /* set zero at vertices */
16623425bc38SStefano Zampini     for(i=0;i<n_vertices;i++) { array[vertex_indices[i]]=scalar_value; }
16633425bc38SStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
16643425bc38SStefano Zampini 
16653425bc38SStefano Zampini     /* Jump operator P_D : results stored in pcis->vec1_B */
16663425bc38SStefano Zampini 
16673425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
16683425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
16693425bc38SStefano Zampini     /* Action of B_delta */
16703425bc38SStefano Zampini     ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
16713425bc38SStefano Zampini     ierr = VecSet(lambda_global,0.0);CHKERRQ(ierr);
16723425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
16733425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,lambda_global,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
16743425bc38SStefano Zampini     /* Action of B_Ddelta^T */
16753425bc38SStefano Zampini     ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
16763425bc38SStefano Zampini     ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
16773425bc38SStefano Zampini     ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
16783425bc38SStefano Zampini     /* diagonal scaling */
16793425bc38SStefano Zampini     ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr);
16803425bc38SStefano Zampini     /* sum on the interface */
16813425bc38SStefano Zampini     ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
16823425bc38SStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
16833425bc38SStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_B,pcis->vec1_N,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
16843425bc38SStefano Zampini     ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
16853425bc38SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
16863425bc38SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
16873425bc38SStefano Zampini     ierr = VecNorm(pcis->vec1_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
16883425bc38SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"E[coll]: CHECK infty norm of R^T_D P_D: % 1.14e\n",scalar_value);CHKERRQ(ierr);
16893425bc38SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
16903425bc38SStefano Zampini 
16913425bc38SStefano Zampini     if(!fully_redundant) {
16923425bc38SStefano Zampini       /******************************************************************/
16933425bc38SStefano Zampini       /* TEST F: It should hold B_{delta}B^T_{D,delta}=I                */
16943425bc38SStefano Zampini       /* Corollary thm 14 Mandel Tezaur and Dohrmann 2005               */
16953425bc38SStefano Zampini       /******************************************************************/
16963425bc38SStefano Zampini       ierr = VecDuplicate(lambda_global,&test_vec);CHKERRQ(ierr);
16973425bc38SStefano Zampini       ierr = VecSetRandom(lambda_global,PETSC_NULL);CHKERRQ(ierr);
16983425bc38SStefano Zampini       /* Action of B_Ddelta^T */
16993425bc38SStefano Zampini       ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
17003425bc38SStefano Zampini       ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,lambda_global,fetidpmat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
17013425bc38SStefano Zampini       ierr = MatMultTranspose(fetidpmat_ctx->B_Ddelta,fetidpmat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
17023425bc38SStefano Zampini       /* Action of B_delta */
17033425bc38SStefano Zampini       ierr = MatMult(fetidpmat_ctx->B_delta,pcis->vec1_B,fetidpmat_ctx->lambda_local);CHKERRQ(ierr);
17043425bc38SStefano Zampini       ierr = VecSet(test_vec,0.0);CHKERRQ(ierr);
17053425bc38SStefano Zampini       ierr = VecScatterBegin(fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,test_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
17063425bc38SStefano Zampini       ierr = VecScatterEnd  (fetidpmat_ctx->l2g_lambda,fetidpmat_ctx->lambda_local,test_vec,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
17073425bc38SStefano Zampini       scalar_value = -1.0;
17083425bc38SStefano Zampini       ierr = VecAXPY(lambda_global,scalar_value,test_vec);CHKERRQ(ierr);
17093425bc38SStefano Zampini       ierr = VecNorm(lambda_global,NORM_INFINITY,&scalar_value);CHKERRQ(ierr);
17103425bc38SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"E[coll]: CHECK infty norm of P^T_D - I: % 1.14e\n",scalar_value);CHKERRQ(ierr);
17113425bc38SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
17123425bc38SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
17133425bc38SStefano Zampini       ierr = VecDestroy(&test_vec);CHKERRQ(ierr);
17143425bc38SStefano Zampini     }
17153425bc38SStefano Zampini   }
17163425bc38SStefano Zampini   /* final cleanup */
17173425bc38SStefano Zampini   ierr = PetscFree(dual_dofs_boundary_indices);CHKERRQ(ierr);
17183425bc38SStefano Zampini   ierr = PetscFree(vertex_indices);CHKERRQ(ierr);
17193425bc38SStefano Zampini   ierr = PetscFree(aux_local_numbering_1);CHKERRQ(ierr);
17203425bc38SStefano Zampini   ierr = PetscFree(aux_local_numbering_2);CHKERRQ(ierr);
17213425bc38SStefano Zampini   ierr = PetscFree(aux_global_numbering);CHKERRQ(ierr);
17223425bc38SStefano Zampini   ierr = PetscFree(aux_global_numbering_mpi);CHKERRQ(ierr);
17233425bc38SStefano Zampini   ierr = PetscFree(dof_sizes);CHKERRQ(ierr);
17243425bc38SStefano Zampini   ierr = PetscFree(dof_displs);CHKERRQ(ierr);
17253425bc38SStefano Zampini   ierr = PetscFree(all_aux_global_numbering_mpi_1);CHKERRQ(ierr);
17263425bc38SStefano Zampini   ierr = PetscFree(all_aux_global_numbering_mpi_2);CHKERRQ(ierr);
17273425bc38SStefano Zampini   ierr = PetscFree(global_dofs_numbering);CHKERRQ(ierr);
17283425bc38SStefano Zampini   ierr = PetscFree(aux_sums);CHKERRQ(ierr);
17293425bc38SStefano Zampini   ierr = PetscFree(cols_B_delta);CHKERRQ(ierr);
17303425bc38SStefano Zampini   ierr = PetscFree(vals_B_delta);CHKERRQ(ierr);
17313425bc38SStefano Zampini   ierr = PetscFree(scaling_factors);CHKERRQ(ierr);
17323425bc38SStefano Zampini   ierr = VecDestroy(&lambda_global);CHKERRQ(ierr);
17333425bc38SStefano Zampini   ierr = ISDestroy(&IS_l2g_lambda);CHKERRQ(ierr);
17343425bc38SStefano Zampini 
17353425bc38SStefano Zampini   PetscFunctionReturn(0);
17363425bc38SStefano Zampini }
17373425bc38SStefano Zampini 
17383425bc38SStefano Zampini #undef __FUNCT__
17393425bc38SStefano Zampini #define __FUNCT__ "PCBDDCSetupFETIDPPCContext"
17403425bc38SStefano Zampini static PetscErrorCode PCBDDCSetupFETIDPPCContext(Mat fetimat, FETIDPPC_ctx *fetidppc_ctx)
17413425bc38SStefano Zampini {
17423425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
17433425bc38SStefano Zampini   PetscErrorCode ierr;
17443425bc38SStefano Zampini 
17453425bc38SStefano Zampini   PetscFunctionBegin;
17463425bc38SStefano Zampini   ierr = MatShellGetContext(fetimat,&mat_ctx);CHKERRQ(ierr);
17473425bc38SStefano Zampini   /* get references from objects created when setting up feti mat context */
17483425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)mat_ctx->lambda_local);CHKERRQ(ierr);
17493425bc38SStefano Zampini   fetidppc_ctx->lambda_local = mat_ctx->lambda_local;
17503425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)mat_ctx->B_Ddelta);CHKERRQ(ierr);
17513425bc38SStefano Zampini   fetidppc_ctx->B_Ddelta = mat_ctx->B_Ddelta;
17523425bc38SStefano Zampini   ierr = PetscObjectReference((PetscObject)mat_ctx->l2g_lambda);CHKERRQ(ierr);
17533425bc38SStefano Zampini   fetidppc_ctx->l2g_lambda = mat_ctx->l2g_lambda;
17543425bc38SStefano Zampini   PetscFunctionReturn(0);
17553425bc38SStefano Zampini }
17563425bc38SStefano Zampini 
17573425bc38SStefano Zampini #undef __FUNCT__
17583425bc38SStefano Zampini #define __FUNCT__ "FETIDPMatMult"
17593425bc38SStefano Zampini static PetscErrorCode FETIDPMatMult(Mat fetimat, Vec x, Vec y)
17603425bc38SStefano Zampini {
17613425bc38SStefano Zampini   FETIDPMat_ctx  *mat_ctx;
17623425bc38SStefano Zampini   PC_IS          *pcis;
17633425bc38SStefano Zampini   PetscErrorCode ierr;
17643425bc38SStefano Zampini 
17653425bc38SStefano Zampini   PetscFunctionBegin;
17663425bc38SStefano Zampini   ierr = MatShellGetContext(fetimat,&mat_ctx);CHKERRQ(ierr);
17673425bc38SStefano Zampini   pcis = (PC_IS*)mat_ctx->pc->data;
17683425bc38SStefano Zampini   /* Application of B_delta^T */
17693425bc38SStefano Zampini   ierr = VecScatterBegin(mat_ctx->l2g_lambda,x,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
17703425bc38SStefano Zampini   ierr = VecScatterEnd(mat_ctx->l2g_lambda,x,mat_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
17713425bc38SStefano Zampini   ierr = MatMultTranspose(mat_ctx->B_delta,mat_ctx->lambda_local,pcis->vec1_B);CHKERRQ(ierr);
17723425bc38SStefano Zampini   /* Application of \widetilde{S}^-1 */
17733425bc38SStefano Zampini   ierr = VecSet(pcis->vec1_D,0.0);CHKERRQ(ierr);
17743425bc38SStefano Zampini   ierr = PCBDDCApplyInterfacePreconditioner(mat_ctx->pc);CHKERRQ(ierr);
17753425bc38SStefano Zampini   /* Application of B_delta */
17763425bc38SStefano Zampini   ierr = MatMult(mat_ctx->B_delta,pcis->vec1_B,mat_ctx->lambda_local);CHKERRQ(ierr);
17773425bc38SStefano Zampini   ierr = VecSet(y,0.0);CHKERRQ(ierr);
17783425bc38SStefano Zampini   ierr = VecScatterBegin(mat_ctx->l2g_lambda,mat_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
17793425bc38SStefano Zampini   ierr = VecScatterEnd(mat_ctx->l2g_lambda,mat_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
17803425bc38SStefano Zampini   PetscFunctionReturn(0);
17813425bc38SStefano Zampini }
17823425bc38SStefano Zampini 
17833425bc38SStefano Zampini #undef __FUNCT__
17843425bc38SStefano Zampini #define __FUNCT__ "FETIDPPCApply"
17853425bc38SStefano Zampini static PetscErrorCode FETIDPPCApply(PC fetipc, Vec x, Vec y)
17863425bc38SStefano Zampini {
17873425bc38SStefano Zampini   FETIDPPC_ctx   *pc_ctx;
17883425bc38SStefano Zampini   PC_IS          *pcis;
17893425bc38SStefano Zampini   PetscErrorCode ierr;
17903425bc38SStefano Zampini 
17913425bc38SStefano Zampini   PetscFunctionBegin;
17923425bc38SStefano Zampini   ierr = PCShellGetContext(fetipc,(void**)&pc_ctx);
17933425bc38SStefano Zampini   pcis = (PC_IS*)pc_ctx->pc->data;
17943425bc38SStefano Zampini   /* Application of B_Ddelta^T */
17953425bc38SStefano Zampini   ierr = VecScatterBegin(pc_ctx->l2g_lambda,x,pc_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
17963425bc38SStefano Zampini   ierr = VecScatterEnd(pc_ctx->l2g_lambda,x,pc_ctx->lambda_local,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
17973425bc38SStefano Zampini   ierr = VecSet(pcis->vec2_B,0.0);CHKERRQ(ierr);
17983425bc38SStefano Zampini   ierr = MatMultTranspose(pc_ctx->B_Ddelta,pc_ctx->lambda_local,pcis->vec2_B);CHKERRQ(ierr);
17993425bc38SStefano Zampini   /* Application of S */
18003425bc38SStefano Zampini   ierr = PCISApplySchur(pc_ctx->pc,pcis->vec2_B,pcis->vec1_B,(Vec)0,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
18013425bc38SStefano Zampini   /* Application of B_Ddelta */
18023425bc38SStefano Zampini   ierr = MatMult(pc_ctx->B_Ddelta,pcis->vec1_B,pc_ctx->lambda_local);CHKERRQ(ierr);
18033425bc38SStefano Zampini   ierr = VecSet(y,0.0);CHKERRQ(ierr);
18043425bc38SStefano Zampini   ierr = VecScatterBegin(pc_ctx->l2g_lambda,pc_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18053425bc38SStefano Zampini   ierr = VecScatterEnd(pc_ctx->l2g_lambda,pc_ctx->lambda_local,y,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18063425bc38SStefano Zampini   PetscFunctionReturn(0);
18073425bc38SStefano Zampini }
18083425bc38SStefano Zampini 
1809da1bb401SStefano Zampini #undef __FUNCT__
1810da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetupLocalAdjacencyGraph"
1811da1bb401SStefano Zampini static PetscErrorCode PCBDDCSetupLocalAdjacencyGraph(PC pc)
1812da1bb401SStefano Zampini {
1813da1bb401SStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
1814da1bb401SStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
1815da1bb401SStefano Zampini   PetscInt       nvtxs,*xadj,*adjncy;
1816da1bb401SStefano Zampini   Mat            mat_adj;
1817da1bb401SStefano Zampini   PetscBool      symmetrize_rowij=PETSC_TRUE,compressed_rowij=PETSC_FALSE,flg_row=PETSC_TRUE;
1818da1bb401SStefano Zampini   PCBDDCGraph    mat_graph=pcbddc->mat_graph;
1819da1bb401SStefano Zampini   PetscErrorCode ierr;
1820da1bb401SStefano Zampini 
1821da1bb401SStefano Zampini   PetscFunctionBegin;
1822da1bb401SStefano Zampini   /* get CSR adjacency from local matrix if user has not yet provided local graph using PCBDDCSetLocalAdjacencyGraph function */
1823da1bb401SStefano Zampini   if(!mat_graph->xadj) {
1824da1bb401SStefano Zampini     ierr = MatConvert(matis->A,MATMPIADJ,MAT_INITIAL_MATRIX,&mat_adj);CHKERRQ(ierr);
1825da1bb401SStefano Zampini     ierr = MatGetRowIJ(mat_adj,0,symmetrize_rowij,compressed_rowij,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr);
1826da1bb401SStefano Zampini     if(!flg_row) {
1827da1bb401SStefano Zampini       SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in MatGetRowIJ called in %s\n",__FUNCT__);
1828da1bb401SStefano Zampini     }
1829da1bb401SStefano Zampini     /* Get adjacency into BDDC workspace */
1830da1bb401SStefano Zampini     ierr = PCBDDCSetLocalAdjacencyGraph(pc,nvtxs,xadj,adjncy,PETSC_COPY_VALUES);CHKERRQ(ierr);
1831da1bb401SStefano Zampini     ierr = MatRestoreRowIJ(mat_adj,0,symmetrize_rowij,compressed_rowij,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr);
1832da1bb401SStefano Zampini     if(!flg_row) {
1833da1bb401SStefano Zampini       SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in MatRestoreRowIJ called in %s\n",__FUNCT__);
1834da1bb401SStefano Zampini     }
1835da1bb401SStefano Zampini     ierr = MatDestroy(&mat_adj);CHKERRQ(ierr);
1836da1bb401SStefano Zampini   }
1837da1bb401SStefano Zampini   PetscFunctionReturn(0);
1838da1bb401SStefano Zampini }
1839da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
18400c7d97c5SJed Brown #undef __FUNCT__
18410c7d97c5SJed Brown #define __FUNCT__ "PCBDDCApplyInterfacePreconditioner"
18422617d88aSStefano Zampini static PetscErrorCode  PCBDDCApplyInterfacePreconditioner(PC pc)
18430c7d97c5SJed Brown {
18440c7d97c5SJed Brown   PetscErrorCode ierr;
18450c7d97c5SJed Brown   PC_BDDC*        pcbddc = (PC_BDDC*)(pc->data);
18460c7d97c5SJed Brown   PC_IS*            pcis = (PC_IS*)  (pc->data);
18473b03a366Sstefano_zampini   const PetscScalar zero = 0.0;
18480c7d97c5SJed Brown 
18490c7d97c5SJed Brown   PetscFunctionBegin;
18500c7d97c5SJed Brown   /* Application of PHI^T  */
18510c7d97c5SJed Brown   ierr = MatMultTranspose(pcbddc->coarse_phi_B,pcis->vec1_B,pcbddc->vec1_P);CHKERRQ(ierr);
18520c7d97c5SJed Brown   if(pcbddc->prec_type) { ierr = MatMultTransposeAdd(pcbddc->coarse_phi_D,pcis->vec1_D,pcbddc->vec1_P,pcbddc->vec1_P);CHKERRQ(ierr); }
18530c7d97c5SJed Brown 
18540c7d97c5SJed Brown   /* Scatter data of coarse_rhs */
18550c7d97c5SJed Brown   if(pcbddc->coarse_rhs) ierr = VecSet(pcbddc->coarse_rhs,zero);CHKERRQ(ierr);
18560c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->vec1_P,pcbddc->coarse_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18570c7d97c5SJed Brown 
18580c7d97c5SJed Brown   /* Local solution on R nodes */
18590c7d97c5SJed Brown   ierr = VecSet(pcbddc->vec1_R,zero);CHKERRQ(ierr);
18600c7d97c5SJed Brown   ierr = VecScatterBegin(pcbddc->R_to_B,pcis->vec1_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18610c7d97c5SJed Brown   ierr = VecScatterEnd  (pcbddc->R_to_B,pcis->vec1_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18620c7d97c5SJed Brown   if(pcbddc->prec_type) {
18630c7d97c5SJed Brown     ierr = VecScatterBegin(pcbddc->R_to_D,pcis->vec1_D,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18640c7d97c5SJed Brown     ierr = VecScatterEnd  (pcbddc->R_to_D,pcis->vec1_D,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18650c7d97c5SJed Brown   }
18660c7d97c5SJed Brown   ierr = PCBDDCSolveSaddlePoint(pc);CHKERRQ(ierr);
18670c7d97c5SJed Brown   ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr);
18680c7d97c5SJed Brown   ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec2_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18690c7d97c5SJed Brown   ierr = VecScatterEnd  (pcbddc->R_to_B,pcbddc->vec2_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18700c7d97c5SJed Brown   if(pcbddc->prec_type) {
18710c7d97c5SJed Brown     ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec2_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18720c7d97c5SJed Brown     ierr = VecScatterEnd  (pcbddc->R_to_D,pcbddc->vec2_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
18730c7d97c5SJed Brown   }
18740c7d97c5SJed Brown 
18750c7d97c5SJed Brown   /* Coarse solution */
18760c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataEnd(pc,pcbddc->vec1_P,pcbddc->coarse_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
187753cdbc3dSStefano Zampini   if(pcbddc->coarse_rhs) ierr = KSPSolve(pcbddc->coarse_ksp,pcbddc->coarse_rhs,pcbddc->coarse_vec);CHKERRQ(ierr);
18780c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18790c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataEnd  (pc,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
18800c7d97c5SJed Brown 
18810c7d97c5SJed Brown   /* Sum contributions from two levels */
18820c7d97c5SJed Brown   ierr = MatMultAdd(pcbddc->coarse_phi_B,pcbddc->vec1_P,pcis->vec1_B,pcis->vec1_B);CHKERRQ(ierr);
18830c7d97c5SJed Brown   if(pcbddc->prec_type) { ierr = MatMultAdd(pcbddc->coarse_phi_D,pcbddc->vec1_P,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); }
18840c7d97c5SJed Brown   PetscFunctionReturn(0);
18850c7d97c5SJed Brown }
18860c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
18870c7d97c5SJed Brown #undef __FUNCT__
18880c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSolveSaddlePoint"
188953cdbc3dSStefano Zampini static PetscErrorCode  PCBDDCSolveSaddlePoint(PC pc)
18900c7d97c5SJed Brown {
18910c7d97c5SJed Brown   PetscErrorCode ierr;
18920c7d97c5SJed Brown   PC_BDDC*       pcbddc = (PC_BDDC*)(pc->data);
18930c7d97c5SJed Brown 
18940c7d97c5SJed Brown   PetscFunctionBegin;
189553cdbc3dSStefano Zampini   ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
1896534831adSStefano Zampini   if(pcbddc->local_auxmat1) {
18970c7d97c5SJed Brown     ierr = MatMult(pcbddc->local_auxmat1,pcbddc->vec2_R,pcbddc->vec1_C);CHKERRQ(ierr);
18980c7d97c5SJed Brown     ierr = MatMultAdd(pcbddc->local_auxmat2,pcbddc->vec1_C,pcbddc->vec2_R,pcbddc->vec2_R);CHKERRQ(ierr);
18990c7d97c5SJed Brown   }
19000c7d97c5SJed Brown   PetscFunctionReturn(0);
19010c7d97c5SJed Brown }
19020c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
19030c7d97c5SJed Brown #undef __FUNCT__
19040c7d97c5SJed Brown #define __FUNCT__ "PCBDDCScatterCoarseDataBegin"
190553cdbc3dSStefano Zampini static PetscErrorCode  PCBDDCScatterCoarseDataBegin(PC pc,Vec vec_from, Vec vec_to, InsertMode imode, ScatterMode smode)
19060c7d97c5SJed Brown {
19070c7d97c5SJed Brown   PetscErrorCode ierr;
19080c7d97c5SJed Brown   PC_BDDC*       pcbddc = (PC_BDDC*)(pc->data);
19090c7d97c5SJed Brown 
19100c7d97c5SJed Brown   PetscFunctionBegin;
19110c7d97c5SJed Brown   switch(pcbddc->coarse_communications_type){
19120c7d97c5SJed Brown     case SCATTERS_BDDC:
19130c7d97c5SJed Brown       ierr = VecScatterBegin(pcbddc->coarse_loc_to_glob,vec_from,vec_to,imode,smode);CHKERRQ(ierr);
19140c7d97c5SJed Brown       break;
19150c7d97c5SJed Brown     case GATHERS_BDDC:
19160c7d97c5SJed Brown       break;
19170c7d97c5SJed Brown   }
19180c7d97c5SJed Brown   PetscFunctionReturn(0);
19190c7d97c5SJed Brown }
19200c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
19210c7d97c5SJed Brown #undef __FUNCT__
19220c7d97c5SJed Brown #define __FUNCT__ "PCBDDCScatterCoarseDataEnd"
192353cdbc3dSStefano Zampini static PetscErrorCode  PCBDDCScatterCoarseDataEnd(PC pc,Vec vec_from, Vec vec_to, InsertMode imode, ScatterMode smode)
19240c7d97c5SJed Brown {
19250c7d97c5SJed Brown   PetscErrorCode ierr;
19260c7d97c5SJed Brown   PC_BDDC*       pcbddc = (PC_BDDC*)(pc->data);
19270c7d97c5SJed Brown   PetscScalar*   array_to;
19280c7d97c5SJed Brown   PetscScalar*   array_from;
19290c7d97c5SJed Brown   MPI_Comm       comm=((PetscObject)pc)->comm;
19300c7d97c5SJed Brown   PetscInt i;
19310c7d97c5SJed Brown 
19320c7d97c5SJed Brown   PetscFunctionBegin;
19330c7d97c5SJed Brown 
19340c7d97c5SJed Brown   switch(pcbddc->coarse_communications_type){
19350c7d97c5SJed Brown     case SCATTERS_BDDC:
19360c7d97c5SJed Brown       ierr = VecScatterEnd(pcbddc->coarse_loc_to_glob,vec_from,vec_to,imode,smode);CHKERRQ(ierr);
19370c7d97c5SJed Brown       break;
19380c7d97c5SJed Brown     case GATHERS_BDDC:
19390c7d97c5SJed Brown       if(vec_from) VecGetArray(vec_from,&array_from);
19400c7d97c5SJed Brown       if(vec_to)   VecGetArray(vec_to,&array_to);
19410c7d97c5SJed Brown       switch(pcbddc->coarse_problem_type){
19420c7d97c5SJed Brown         case SEQUENTIAL_BDDC:
19430c7d97c5SJed Brown           if(smode == SCATTER_FORWARD) {
194453cdbc3dSStefano Zampini             ierr = MPI_Gatherv(&array_from[0],pcbddc->local_primal_size,MPIU_SCALAR,&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,0,comm);CHKERRQ(ierr);
19450c7d97c5SJed Brown             if(vec_to) {
19460c7d97c5SJed Brown               for(i=0;i<pcbddc->replicated_primal_size;i++)
19470c7d97c5SJed Brown                 array_to[pcbddc->replicated_local_primal_indices[i]]+=pcbddc->replicated_local_primal_values[i];
19480c7d97c5SJed Brown             }
19490c7d97c5SJed Brown           } else {
19500c7d97c5SJed Brown             if(vec_from)
19510c7d97c5SJed Brown               for(i=0;i<pcbddc->replicated_primal_size;i++)
19520c7d97c5SJed Brown                 pcbddc->replicated_local_primal_values[i]=array_from[pcbddc->replicated_local_primal_indices[i]];
195353cdbc3dSStefano Zampini             ierr = MPI_Scatterv(&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,&array_to[0],pcbddc->local_primal_size,MPIU_SCALAR,0,comm);CHKERRQ(ierr);
19540c7d97c5SJed Brown           }
19550c7d97c5SJed Brown           break;
19560c7d97c5SJed Brown         case REPLICATED_BDDC:
19570c7d97c5SJed Brown           if(smode == SCATTER_FORWARD) {
195853cdbc3dSStefano Zampini             ierr = MPI_Allgatherv(&array_from[0],pcbddc->local_primal_size,MPIU_SCALAR,&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,comm);CHKERRQ(ierr);
19590c7d97c5SJed Brown             for(i=0;i<pcbddc->replicated_primal_size;i++)
19600c7d97c5SJed Brown               array_to[pcbddc->replicated_local_primal_indices[i]]+=pcbddc->replicated_local_primal_values[i];
19610c7d97c5SJed Brown           } else { /* no communications needed for SCATTER_REVERSE since needed data is already present */
19620c7d97c5SJed Brown             for(i=0;i<pcbddc->local_primal_size;i++)
19630c7d97c5SJed Brown               array_to[i]=array_from[pcbddc->local_primal_indices[i]];
19640c7d97c5SJed Brown           }
19650c7d97c5SJed Brown           break;
196653cdbc3dSStefano Zampini         case MULTILEVEL_BDDC:
196753cdbc3dSStefano Zampini           break;
196853cdbc3dSStefano Zampini         case PARALLEL_BDDC:
196953cdbc3dSStefano Zampini           break;
19700c7d97c5SJed Brown       }
19710c7d97c5SJed Brown       if(vec_from) VecRestoreArray(vec_from,&array_from);
19720c7d97c5SJed Brown       if(vec_to)   VecRestoreArray(vec_to,&array_to);
19730c7d97c5SJed Brown       break;
19740c7d97c5SJed Brown   }
19750c7d97c5SJed Brown   PetscFunctionReturn(0);
19760c7d97c5SJed Brown }
19770c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
19783b03a366Sstefano_zampini #undef __FUNCT__
19793b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCCreateConstraintMatrix"
19803b03a366Sstefano_zampini static PetscErrorCode PCBDDCCreateConstraintMatrix(PC pc)
19813b03a366Sstefano_zampini {
19823b03a366Sstefano_zampini   PetscErrorCode ierr;
19833b03a366Sstefano_zampini   PC_IS*         pcis = (PC_IS*)(pc->data);
19843b03a366Sstefano_zampini   PC_BDDC*       pcbddc = (PC_BDDC*)pc->data;
19853b03a366Sstefano_zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
198623d4d1a5SStefano Zampini   PetscInt       *nnz,*is_indices;
19873b03a366Sstefano_zampini   PetscScalar    *temp_quadrature_constraint;
1988534831adSStefano Zampini   PetscInt       *temp_indices,*temp_indices_to_constraint,*temp_indices_to_constraint_B,*local_to_B;
19893b03a366Sstefano_zampini   PetscInt       local_primal_size,i,j,k,total_counts,max_size_of_constraint;
19903b03a366Sstefano_zampini   PetscInt       n_constraints,n_vertices,size_of_constraint;
1991534831adSStefano Zampini   PetscScalar    quad_value;
19923b03a366Sstefano_zampini   PetscBool      nnsp_has_cnst=PETSC_FALSE,use_nnsp_true=pcbddc->use_nnsp_true;
19933b03a366Sstefano_zampini   PetscInt       nnsp_size=0,nnsp_addone=0,temp_constraints,temp_start_ptr;
19943b03a366Sstefano_zampini   IS             *used_IS;
19953b03a366Sstefano_zampini   const MatType  impMatType=MATSEQAIJ;
19963b03a366Sstefano_zampini   PetscBLASInt   Bs,Bt,lwork,lierr;
19973b03a366Sstefano_zampini   PetscReal      tol=1.0e-8;
1998fcda91b4SJed Brown   MatNullSpace   nearnullsp;
1999fcda91b4SJed Brown   const Vec      *nearnullvecs;
20003b03a366Sstefano_zampini   Vec            *localnearnullsp;
20013b03a366Sstefano_zampini   PetscScalar    *work,*temp_basis,*array_vector,*correlation_mat;
20023b03a366Sstefano_zampini   PetscReal      *rwork,*singular_vals;
2003534831adSStefano Zampini   PetscBLASInt   Bone=1,*ipiv;
2004534831adSStefano Zampini   Vec            temp_vec;
2005534831adSStefano Zampini   Mat            temp_mat;
2006534831adSStefano Zampini   KSP            temp_ksp;
2007534831adSStefano Zampini   PetscInt       s,start_constraint,dual_dofs;
2008534831adSStefano Zampini   PetscBool      compute_submatrix,useksp=PETSC_FALSE;
2009534831adSStefano Zampini   PetscInt       *aux_primal_permutation,*aux_primal_numbering;
2010534831adSStefano Zampini   PetscBool      boolforface,*change_basis;
2011de534f79Sstefano_zampini /* some ugly conditional declarations */
20123b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
20133b03a366Sstefano_zampini   PetscScalar    dot_result;
20143b03a366Sstefano_zampini   PetscScalar    one=1.0,zero=0.0;
20153b03a366Sstefano_zampini   PetscInt       ii;
20163425bc38SStefano Zampini   PetscScalar    *singular_vectors;
20173425bc38SStefano Zampini   PetscBLASInt   *iwork,*ifail;
20183425bc38SStefano Zampini   PetscReal      dummy_real,abs_tol;
20193425bc38SStefano Zampini   PetscBLASInt   eigs_found;
20203b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
20213b03a366Sstefano_zampini   PetscScalar    val1,val2;
20223b03a366Sstefano_zampini #endif
20233425bc38SStefano Zampini #endif
20243b03a366Sstefano_zampini   PetscBLASInt   dummy_int;
20253b03a366Sstefano_zampini   PetscScalar    dummy_scalar;
20263b03a366Sstefano_zampini 
20273b03a366Sstefano_zampini   PetscFunctionBegin;
20283b03a366Sstefano_zampini   /* check if near null space is attached to global mat */
2029fcda91b4SJed Brown   ierr = MatGetNearNullSpace(pc->pmat,&nearnullsp);CHKERRQ(ierr);
2030fcda91b4SJed Brown   if (nearnullsp) {
2031fcda91b4SJed Brown     ierr = MatNullSpaceGetVecs(nearnullsp,&nnsp_has_cnst,&nnsp_size,&nearnullvecs);CHKERRQ(ierr);
20323b03a366Sstefano_zampini   } else { /* if near null space is not provided it uses constants */
20333b03a366Sstefano_zampini     nnsp_has_cnst = PETSC_TRUE;
20343b03a366Sstefano_zampini     use_nnsp_true = PETSC_TRUE;
20353b03a366Sstefano_zampini   }
20363b03a366Sstefano_zampini   if(nnsp_has_cnst) {
20373b03a366Sstefano_zampini     nnsp_addone = 1;
20383b03a366Sstefano_zampini   }
20393b03a366Sstefano_zampini   /*
20403b03a366Sstefano_zampini        Evaluate maximum storage size needed by the procedure
20413b03a366Sstefano_zampini        - temp_indices will contain start index of each constraint stored as follows
20423b03a366Sstefano_zampini        - temp_indices_to_constraint  [temp_indices[i],...,temp[indices[i+1]-1] will contain the indices (in local numbering) on which the constraint acts
2043534831adSStefano Zampini        - temp_indices_to_constraint_B[temp_indices[i],...,temp[indices[i+1]-1] will contain the indices (in boundary numbering) on which the constraint acts
20443b03a366Sstefano_zampini        - temp_quadrature_constraint  [temp_indices[i],...,temp[indices[i+1]-1] will contain the scalars representing the constraint itself
20453b03a366Sstefano_zampini                                                                                                                                                          */
2046da1bb401SStefano Zampini 
20473b03a366Sstefano_zampini   total_counts = pcbddc->n_ISForFaces+pcbddc->n_ISForEdges;
20483b03a366Sstefano_zampini   total_counts *= (nnsp_addone+nnsp_size);
2049da1bb401SStefano Zampini   ierr = ISGetSize(pcbddc->ISForVertices,&n_vertices);CHKERRQ(ierr);
2050da1bb401SStefano Zampini   total_counts += n_vertices;
20513b03a366Sstefano_zampini   ierr = PetscMalloc((total_counts+1)*sizeof(PetscInt),&temp_indices);CHKERRQ(ierr);
2052534831adSStefano Zampini   ierr = PetscMalloc((total_counts+1)*sizeof(PetscBool),&change_basis);CHKERRQ(ierr);
20533b03a366Sstefano_zampini   total_counts = 0;
20543b03a366Sstefano_zampini   max_size_of_constraint = 0;
20553b03a366Sstefano_zampini   for(i=0;i<pcbddc->n_ISForEdges+pcbddc->n_ISForFaces;i++){
20563b03a366Sstefano_zampini     if(i<pcbddc->n_ISForEdges){
20573b03a366Sstefano_zampini       used_IS = &pcbddc->ISForEdges[i];
20583b03a366Sstefano_zampini     } else {
20593b03a366Sstefano_zampini       used_IS = &pcbddc->ISForFaces[i-pcbddc->n_ISForEdges];
20603b03a366Sstefano_zampini     }
20613b03a366Sstefano_zampini     ierr = ISGetSize(*used_IS,&j);CHKERRQ(ierr);
20623b03a366Sstefano_zampini     total_counts += j;
20633b03a366Sstefano_zampini     if(j>max_size_of_constraint) max_size_of_constraint=j;
20643b03a366Sstefano_zampini   }
20653b03a366Sstefano_zampini   total_counts *= (nnsp_addone+nnsp_size);
2066da1bb401SStefano Zampini   total_counts += n_vertices;
20673b03a366Sstefano_zampini   ierr = PetscMalloc(total_counts*sizeof(PetscScalar),&temp_quadrature_constraint);CHKERRQ(ierr);
20683b03a366Sstefano_zampini   ierr = PetscMalloc(total_counts*sizeof(PetscInt),&temp_indices_to_constraint);CHKERRQ(ierr);
2069534831adSStefano Zampini   ierr = PetscMalloc(total_counts*sizeof(PetscInt),&temp_indices_to_constraint_B);CHKERRQ(ierr);
2070534831adSStefano Zampini   ierr = PetscMalloc(pcis->n*sizeof(PetscInt),&local_to_B);CHKERRQ(ierr);
2071534831adSStefano Zampini   ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2072534831adSStefano Zampini   for(i=0;i<pcis->n;i++) {
2073534831adSStefano Zampini     local_to_B[i]=-1;
2074534831adSStefano Zampini   }
2075534831adSStefano Zampini   for(i=0;i<pcis->n_B;i++) {
2076534831adSStefano Zampini     local_to_B[is_indices[i]]=i;
2077534831adSStefano Zampini   }
2078534831adSStefano Zampini   ierr = ISRestoreIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2079534831adSStefano Zampini 
20803b03a366Sstefano_zampini   /* First we issue queries to allocate optimal workspace for LAPACKgesvd or LAPACKsyev/LAPACKheev */
20813b03a366Sstefano_zampini   rwork = 0;
20823b03a366Sstefano_zampini   work = 0;
20833b03a366Sstefano_zampini   singular_vals = 0;
20843b03a366Sstefano_zampini   temp_basis = 0;
20853b03a366Sstefano_zampini   correlation_mat = 0;
20863b03a366Sstefano_zampini   if(!pcbddc->use_nnsp_true) {
20873b03a366Sstefano_zampini     PetscScalar temp_work;
20883b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
20893b03a366Sstefano_zampini     /* POD */
20903b03a366Sstefano_zampini     PetscInt max_n;
20913b03a366Sstefano_zampini     max_n = nnsp_addone+nnsp_size;
20923b03a366Sstefano_zampini     /* using some techniques borrowed from Proper Orthogonal Decomposition */
20933b03a366Sstefano_zampini     ierr = PetscMalloc(max_n*max_n*sizeof(PetscScalar),&correlation_mat);CHKERRQ(ierr);
20943425bc38SStefano Zampini     ierr = PetscMalloc(max_n*max_n*sizeof(PetscScalar),&singular_vectors);CHKERRQ(ierr);
20953b03a366Sstefano_zampini     ierr = PetscMalloc(max_n*sizeof(PetscReal),&singular_vals);CHKERRQ(ierr);
20963b03a366Sstefano_zampini     ierr = PetscMalloc(max_size_of_constraint*(nnsp_addone+nnsp_size)*sizeof(PetscScalar),&temp_basis);CHKERRQ(ierr);
20973b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
20983b03a366Sstefano_zampini     ierr = PetscMalloc(3*max_n*sizeof(PetscReal),&rwork);CHKERRQ(ierr);
20993b03a366Sstefano_zampini #endif
21003425bc38SStefano Zampini     ierr = PetscMalloc(5*max_n*sizeof(PetscBLASInt),&iwork);CHKERRQ(ierr);
21013425bc38SStefano Zampini     ierr = PetscMalloc(max_n*sizeof(PetscBLASInt),&ifail);CHKERRQ(ierr);
21023b03a366Sstefano_zampini     /* now we evaluate the optimal workspace using query with lwork=-1 */
21033b03a366Sstefano_zampini     Bt = PetscBLASIntCast(max_n);
21043b03a366Sstefano_zampini     lwork=-1;
21053425bc38SStefano Zampini     ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
21063b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
21073425bc38SStefano Zampini     abs_tol=1.e-8;
21083425bc38SStefano Zampini /*    LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,&temp_work,&lwork,&lierr); */
21093425bc38SStefano Zampini     LAPACKsyevx_("V","A","U",&Bt,correlation_mat,&Bt,&dummy_real,&dummy_real,&dummy_int,&dummy_int,
21103425bc38SStefano Zampini                  &abs_tol,&eigs_found,singular_vals,singular_vectors,&Bt,&temp_work,&lwork,iwork,ifail,&lierr);
21113b03a366Sstefano_zampini #else
21123425bc38SStefano Zampini /*    LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,&temp_work,&lwork,rwork,&lierr); */
21133425bc38SStefano Zampini /*  LAPACK call is missing here! TODO */
21143425bc38SStefano Zampini     SETERRQ(((PetscObject) pc)->comm, PETSC_ERR_SUP, "Not yet implemented for complexes when PETSC_MISSING_GESVD = 1");
21153b03a366Sstefano_zampini #endif
21163425bc38SStefano Zampini     if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SYEVX Lapack routine %d",(int)lierr);
21173425bc38SStefano Zampini     ierr = PetscFPTrapPop();CHKERRQ(ierr);
21183b03a366Sstefano_zampini #else /* on missing GESVD */
21193b03a366Sstefano_zampini     /* SVD */
21203b03a366Sstefano_zampini     PetscInt max_n,min_n;
21213b03a366Sstefano_zampini     max_n = max_size_of_constraint;
21223b03a366Sstefano_zampini     min_n = nnsp_addone+nnsp_size;
21233b03a366Sstefano_zampini     if(max_size_of_constraint < ( nnsp_addone+nnsp_size ) ) {
21243b03a366Sstefano_zampini       min_n = max_size_of_constraint;
21253b03a366Sstefano_zampini       max_n = nnsp_addone+nnsp_size;
21263b03a366Sstefano_zampini     }
21273b03a366Sstefano_zampini     ierr = PetscMalloc(min_n*sizeof(PetscReal),&singular_vals);CHKERRQ(ierr);
21283b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
21293b03a366Sstefano_zampini     ierr = PetscMalloc(5*min_n*sizeof(PetscReal),&rwork);CHKERRQ(ierr);
21303b03a366Sstefano_zampini #endif
21313b03a366Sstefano_zampini     /* now we evaluate the optimal workspace using query with lwork=-1 */
21323b03a366Sstefano_zampini     lwork=-1;
21333b03a366Sstefano_zampini     Bs = PetscBLASIntCast(max_n);
21343b03a366Sstefano_zampini     Bt = PetscBLASIntCast(min_n);
21353b03a366Sstefano_zampini     dummy_int = Bs;
2136670f3ff9SJed Brown     ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
21373b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
21383b03a366Sstefano_zampini     LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[0],&Bs,singular_vals,
21393b03a366Sstefano_zampini                  &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,&temp_work,&lwork,&lierr);
21403b03a366Sstefano_zampini #else
21413b03a366Sstefano_zampini     LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[0],&Bs,singular_vals,
21423b03a366Sstefano_zampini                  &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,&temp_work,&lwork,rwork,&lierr);
21433b03a366Sstefano_zampini #endif
21443b03a366Sstefano_zampini     if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SVD Lapack routine %d",(int)lierr);
2145670f3ff9SJed Brown     ierr = PetscFPTrapPop();CHKERRQ(ierr);
21463b03a366Sstefano_zampini #endif
21473b03a366Sstefano_zampini     /* Allocate optimal workspace */
21483b03a366Sstefano_zampini     lwork = PetscBLASIntCast((PetscInt)PetscRealPart(temp_work));
21493b03a366Sstefano_zampini     total_counts = (PetscInt)lwork;
21503b03a366Sstefano_zampini     ierr = PetscMalloc(total_counts*sizeof(PetscScalar),&work);CHKERRQ(ierr);
21513b03a366Sstefano_zampini   }
21523b03a366Sstefano_zampini   /* get local part of global near null space vectors */
21533b03a366Sstefano_zampini   ierr = PetscMalloc(nnsp_size*sizeof(Vec),&localnearnullsp);CHKERRQ(ierr);
21543b03a366Sstefano_zampini   for(k=0;k<nnsp_size;k++) {
21553b03a366Sstefano_zampini     ierr = VecDuplicate(pcis->vec1_N,&localnearnullsp[k]);CHKERRQ(ierr);
2156fcda91b4SJed Brown     ierr = VecScatterBegin(matis->ctx,nearnullvecs[k],localnearnullsp[k],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
2157fcda91b4SJed Brown     ierr = VecScatterEnd  (matis->ctx,nearnullvecs[k],localnearnullsp[k],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
21583b03a366Sstefano_zampini   }
21593b03a366Sstefano_zampini   /* Now we can loop on constraining sets */
21603b03a366Sstefano_zampini   total_counts=0;
21613b03a366Sstefano_zampini   temp_indices[0]=0;
2162da1bb401SStefano Zampini   /* vertices */
2163da1bb401SStefano Zampini   PetscBool used_vertex;
2164da1bb401SStefano Zampini   ierr = ISGetIndices(pcbddc->ISForVertices,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2165da1bb401SStefano Zampini   if(nnsp_has_cnst) { /* consider all vertices */
2166da1bb401SStefano Zampini     for(i=0;i<n_vertices;i++) {
2167da1bb401SStefano Zampini       temp_indices_to_constraint[temp_indices[total_counts]]=is_indices[i];
2168534831adSStefano Zampini       temp_indices_to_constraint_B[temp_indices[total_counts]]=local_to_B[is_indices[i]];
2169da1bb401SStefano Zampini       temp_quadrature_constraint[temp_indices[total_counts]]=1.0;
2170da1bb401SStefano Zampini       temp_indices[total_counts+1]=temp_indices[total_counts]+1;
2171534831adSStefano Zampini       change_basis[total_counts]=PETSC_FALSE;
2172da1bb401SStefano Zampini       total_counts++;
2173da1bb401SStefano Zampini     }
2174da1bb401SStefano Zampini   } else { /* consider vertices for which exist at least a localnearnullsp which is not null there */
2175da1bb401SStefano Zampini     for(i=0;i<n_vertices;i++) {
2176da1bb401SStefano Zampini       used_vertex=PETSC_FALSE;
2177da1bb401SStefano Zampini       k=0;
2178da1bb401SStefano Zampini       while(!used_vertex && k<nnsp_size) {
2179da1bb401SStefano Zampini         ierr = VecGetArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
2180da1bb401SStefano Zampini         if(PetscAbsScalar(array_vector[is_indices[i]])>0.0) {
2181da1bb401SStefano Zampini           temp_indices_to_constraint[temp_indices[total_counts]]=is_indices[i];
2182534831adSStefano Zampini           temp_indices_to_constraint_B[temp_indices[total_counts]]=local_to_B[is_indices[i]];
2183da1bb401SStefano Zampini           temp_quadrature_constraint[temp_indices[total_counts]]=1.0;
2184da1bb401SStefano Zampini           temp_indices[total_counts+1]=temp_indices[total_counts]+1;
2185534831adSStefano Zampini           change_basis[total_counts]=PETSC_FALSE;
2186da1bb401SStefano Zampini           total_counts++;
2187da1bb401SStefano Zampini           used_vertex=PETSC_TRUE;
2188da1bb401SStefano Zampini         }
2189da1bb401SStefano Zampini         ierr = VecRestoreArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
2190da1bb401SStefano Zampini         k++;
2191da1bb401SStefano Zampini       }
2192da1bb401SStefano Zampini     }
2193da1bb401SStefano Zampini   }
2194da1bb401SStefano Zampini   ierr = ISRestoreIndices(pcbddc->ISForVertices,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2195da1bb401SStefano Zampini   n_vertices=total_counts;
2196da1bb401SStefano Zampini   /* edges and faces */
21973b03a366Sstefano_zampini   for(i=0;i<pcbddc->n_ISForEdges+pcbddc->n_ISForFaces;i++){
21983b03a366Sstefano_zampini     if(i<pcbddc->n_ISForEdges){
21993b03a366Sstefano_zampini       used_IS = &pcbddc->ISForEdges[i];
2200534831adSStefano Zampini       boolforface = pcbddc->usechangeofbasis;
22013b03a366Sstefano_zampini     } else {
22023b03a366Sstefano_zampini       used_IS = &pcbddc->ISForFaces[i-pcbddc->n_ISForEdges];
2203534831adSStefano Zampini       boolforface = pcbddc->usechangeonfaces;
22043b03a366Sstefano_zampini     }
22053b03a366Sstefano_zampini     temp_constraints = 0;          /* zero the number of constraints I have on this conn comp */
22063b03a366Sstefano_zampini     temp_start_ptr = total_counts; /* need to know the starting index of constraints stored */
22073b03a366Sstefano_zampini     ierr = ISGetSize(*used_IS,&size_of_constraint);CHKERRQ(ierr);
22083b03a366Sstefano_zampini     ierr = ISGetIndices(*used_IS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
22093b03a366Sstefano_zampini     if(nnsp_has_cnst) {
22103b03a366Sstefano_zampini       temp_constraints++;
2211534831adSStefano Zampini       quad_value = (PetscScalar) (1.0/PetscSqrtReal((PetscReal)size_of_constraint));
22123b03a366Sstefano_zampini       for(j=0;j<size_of_constraint;j++) {
22133b03a366Sstefano_zampini         temp_indices_to_constraint[temp_indices[total_counts]+j]=is_indices[j];
2214534831adSStefano Zampini         temp_indices_to_constraint_B[temp_indices[total_counts]+j]=local_to_B[is_indices[j]];
22153b03a366Sstefano_zampini         temp_quadrature_constraint[temp_indices[total_counts]+j]=quad_value;
22163b03a366Sstefano_zampini       }
22173b03a366Sstefano_zampini       temp_indices[total_counts+1]=temp_indices[total_counts]+size_of_constraint;  /* store new starting point */
2218534831adSStefano Zampini       change_basis[total_counts]=boolforface;
22193b03a366Sstefano_zampini       total_counts++;
22203b03a366Sstefano_zampini     }
22213b03a366Sstefano_zampini     for(k=0;k<nnsp_size;k++) {
22223b03a366Sstefano_zampini       ierr = VecGetArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
22233b03a366Sstefano_zampini       for(j=0;j<size_of_constraint;j++) {
22243b03a366Sstefano_zampini         temp_indices_to_constraint[temp_indices[total_counts]+j]=is_indices[j];
2225534831adSStefano Zampini         temp_indices_to_constraint_B[temp_indices[total_counts]+j]=local_to_B[is_indices[j]];
22263b03a366Sstefano_zampini         temp_quadrature_constraint[temp_indices[total_counts]+j]=array_vector[is_indices[j]];
22273b03a366Sstefano_zampini       }
22283b03a366Sstefano_zampini       ierr = VecRestoreArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
2229de534f79Sstefano_zampini       quad_value = 1.0;
2230de534f79Sstefano_zampini       if( use_nnsp_true ) { /* check if array is null on the connected component in case use_nnsp_true has been requested */
2231de534f79Sstefano_zampini         Bs = PetscBLASIntCast(size_of_constraint);
2232de534f79Sstefano_zampini         quad_value = BLASasum_(&Bs,&temp_quadrature_constraint[temp_indices[total_counts]],&Bone);
2233de534f79Sstefano_zampini       }
2234de534f79Sstefano_zampini       if ( quad_value > 0.0 ) { /* keep indices and values */
2235de534f79Sstefano_zampini         temp_constraints++;
22363b03a366Sstefano_zampini         temp_indices[total_counts+1]=temp_indices[total_counts]+size_of_constraint;  /* store new starting point */
2237534831adSStefano Zampini         change_basis[total_counts]=boolforface;
22383b03a366Sstefano_zampini         total_counts++;
22393b03a366Sstefano_zampini       }
2240de534f79Sstefano_zampini     }
22413b03a366Sstefano_zampini     ierr = ISRestoreIndices(*used_IS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2242de534f79Sstefano_zampini     /* perform SVD on the constraint if use_nnsp_true has not been requested by the user */
22433b03a366Sstefano_zampini     if(!use_nnsp_true) {
2244de534f79Sstefano_zampini 
22453b03a366Sstefano_zampini       Bs = PetscBLASIntCast(size_of_constraint);
22463b03a366Sstefano_zampini       Bt = PetscBLASIntCast(temp_constraints);
2247de534f79Sstefano_zampini 
22483b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
22493b03a366Sstefano_zampini       ierr = PetscMemzero(correlation_mat,Bt*Bt*sizeof(PetscScalar));CHKERRQ(ierr);
22503b03a366Sstefano_zampini       /* Store upper triangular part of correlation matrix */
22513b03a366Sstefano_zampini       for(j=0;j<temp_constraints;j++) {
22523b03a366Sstefano_zampini         for(k=0;k<j+1;k++) {
22533b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
22543425bc38SStefano Zampini           /* hand made complex dot product -> replace */
22553b03a366Sstefano_zampini           dot_result = 0.0;
22563b03a366Sstefano_zampini           for (ii=0; ii<size_of_constraint; ii++) {
22573b03a366Sstefano_zampini             val1 = temp_quadrature_constraint[temp_indices[temp_start_ptr+j]+ii];
22583b03a366Sstefano_zampini             val2 = temp_quadrature_constraint[temp_indices[temp_start_ptr+k]+ii];
22593b03a366Sstefano_zampini             dot_result += val1*PetscConj(val2);
22603b03a366Sstefano_zampini           }
22613b03a366Sstefano_zampini #else
22623b03a366Sstefano_zampini           dot_result = BLASdot_(&Bs,&temp_quadrature_constraint[temp_indices[temp_start_ptr+j]],&Bone,
22633b03a366Sstefano_zampini                                     &temp_quadrature_constraint[temp_indices[temp_start_ptr+k]],&Bone);
22643b03a366Sstefano_zampini #endif
22653b03a366Sstefano_zampini           correlation_mat[j*temp_constraints+k]=dot_result;
22663b03a366Sstefano_zampini         }
22673b03a366Sstefano_zampini       }
22683425bc38SStefano Zampini       ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
22693b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
22703425bc38SStefano Zampini /*      LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,work,&lwork,&lierr); */
22713425bc38SStefano Zampini       LAPACKsyevx_("V","A","U",&Bt,correlation_mat,&Bt,&dummy_real,&dummy_real,&dummy_int,&dummy_int,
22723425bc38SStefano Zampini                  &abs_tol,&eigs_found,singular_vals,singular_vectors,&Bt,work,&lwork,iwork,ifail,&lierr);
22733b03a366Sstefano_zampini #else
22743425bc38SStefano Zampini /*  LAPACK call is missing here! TODO */
22753425bc38SStefano Zampini       SETERRQ(((PetscObject) pc)->comm, PETSC_ERR_SUP, "Not yet implemented for complexes when PETSC_MISSING_GESVD = 1");
22763b03a366Sstefano_zampini #endif
22773425bc38SStefano Zampini       if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SYEVX Lapack routine %d",(int)lierr);
22783425bc38SStefano Zampini       ierr = PetscFPTrapPop();CHKERRQ(ierr);
22793b03a366Sstefano_zampini       /* retain eigenvalues greater than tol: note that lapack SYEV gives eigs in ascending order */
22803b03a366Sstefano_zampini       j=0;
22813b03a366Sstefano_zampini       while( j < Bt && singular_vals[j] < tol) j++;
22823b03a366Sstefano_zampini       total_counts=total_counts-j;
22833b03a366Sstefano_zampini       if(j<temp_constraints) {
22843b03a366Sstefano_zampini         for(k=j;k<Bt;k++) { singular_vals[k]=1.0/PetscSqrtReal(singular_vals[k]); }
22853425bc38SStefano Zampini         ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
22863b03a366Sstefano_zampini         BLASgemm_("N","N",&Bs,&Bt,&Bt,&one,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,correlation_mat,&Bt,&zero,temp_basis,&Bs);
22873425bc38SStefano Zampini         ierr = PetscFPTrapPop();CHKERRQ(ierr);
22883b03a366Sstefano_zampini         /* copy POD basis into used quadrature memory */
22893b03a366Sstefano_zampini         for(k=0;k<Bt-j;k++) {
22903b03a366Sstefano_zampini           for(ii=0;ii<size_of_constraint;ii++) {
22913b03a366Sstefano_zampini             temp_quadrature_constraint[temp_indices[temp_start_ptr+k]+ii]=singular_vals[Bt-1-k]*temp_basis[(Bt-1-k)*size_of_constraint+ii];
22923b03a366Sstefano_zampini           }
22933b03a366Sstefano_zampini         }
22943b03a366Sstefano_zampini       }
2295de534f79Sstefano_zampini 
22963b03a366Sstefano_zampini #else  /* on missing GESVD */
22973b03a366Sstefano_zampini       PetscInt min_n = temp_constraints;
22983b03a366Sstefano_zampini       if(min_n > size_of_constraint) min_n = size_of_constraint;
22993b03a366Sstefano_zampini       dummy_int = Bs;
2300670f3ff9SJed Brown       ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
23013b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
23023b03a366Sstefano_zampini       LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,singular_vals,
23033b03a366Sstefano_zampini                    &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,work,&lwork,&lierr);
23043b03a366Sstefano_zampini #else
23053b03a366Sstefano_zampini       LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,singular_vals,
23063b03a366Sstefano_zampini                    &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,work,&lwork,rwork,&lierr);
23073b03a366Sstefano_zampini #endif
23083b03a366Sstefano_zampini       if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SVD Lapack routine %d",(int)lierr);
2309670f3ff9SJed Brown       ierr = PetscFPTrapPop();CHKERRQ(ierr);
23103b03a366Sstefano_zampini       /* retain singular values greater than tol: note that lapack SVD gives singular values in descending order */
23113b03a366Sstefano_zampini       j=0;
23123b03a366Sstefano_zampini       while( j < min_n && singular_vals[min_n-j-1] < tol) j++;
23133b03a366Sstefano_zampini       total_counts = total_counts-(PetscInt)Bt+(min_n-j);
23143b03a366Sstefano_zampini #endif
23153b03a366Sstefano_zampini     }
23163b03a366Sstefano_zampini   }
2317534831adSStefano Zampini 
2318da1bb401SStefano Zampini   n_constraints=total_counts-n_vertices;
2319da1bb401SStefano Zampini   local_primal_size = total_counts;
23203b03a366Sstefano_zampini   /* set quantities in pcbddc data structure */
23213b03a366Sstefano_zampini   pcbddc->n_vertices = n_vertices;
23223b03a366Sstefano_zampini   pcbddc->n_constraints = n_constraints;
2323da1bb401SStefano Zampini   pcbddc->local_primal_size = local_primal_size;
2324534831adSStefano Zampini 
2325534831adSStefano Zampini   /* Create constraint matrix */
2326534831adSStefano Zampini   /* The constraint matrix is used to compute the l2g map of primal dofs */
2327534831adSStefano Zampini   /* so we need to set it up properly either with or without change of basis */
2328534831adSStefano Zampini   ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->ConstraintMatrix);CHKERRQ(ierr);
2329534831adSStefano Zampini   ierr = MatSetType(pcbddc->ConstraintMatrix,impMatType);CHKERRQ(ierr);
2330534831adSStefano Zampini   ierr = MatSetSizes(pcbddc->ConstraintMatrix,local_primal_size,pcis->n,local_primal_size,pcis->n);CHKERRQ(ierr);
2331534831adSStefano Zampini   /* compute a local numbering of constraints : vertices first then constraints */
2332534831adSStefano Zampini   ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
2333534831adSStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array_vector);CHKERRQ(ierr);
2334534831adSStefano Zampini   ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&aux_primal_numbering);CHKERRQ(ierr);
2335534831adSStefano Zampini   ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&aux_primal_permutation);CHKERRQ(ierr);
2336534831adSStefano Zampini   total_counts=0;
2337534831adSStefano Zampini   /* find vertices: subdomain corners plus dofs with basis changed */
2338534831adSStefano Zampini   for(i=0;i<local_primal_size;i++) {
2339534831adSStefano Zampini     size_of_constraint=temp_indices[i+1]-temp_indices[i];
2340534831adSStefano Zampini     if(change_basis[i] || size_of_constraint == 1) {
2341534831adSStefano Zampini       k=0;
2342534831adSStefano Zampini       while(k < size_of_constraint && array_vector[temp_indices_to_constraint[temp_indices[i]+size_of_constraint-k-1]] != 0.0) {
2343534831adSStefano Zampini         k=k+1;
2344534831adSStefano Zampini       }
2345534831adSStefano Zampini       j=temp_indices_to_constraint[temp_indices[i]+size_of_constraint-k-1];
2346534831adSStefano Zampini       array_vector[j] = 1.0;
2347534831adSStefano Zampini       aux_primal_numbering[total_counts]=j;
2348534831adSStefano Zampini       aux_primal_permutation[total_counts]=total_counts;
2349534831adSStefano Zampini       total_counts++;
2350534831adSStefano Zampini     }
2351534831adSStefano Zampini   }
2352534831adSStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array_vector);CHKERRQ(ierr);
2353534831adSStefano Zampini   /* permute indices in order to have a sorted set of vertices */
2354534831adSStefano Zampini   ierr = PetscSortIntWithPermutation(total_counts,aux_primal_numbering,aux_primal_permutation);
2355534831adSStefano Zampini   /* nonzero structure */
2356534831adSStefano Zampini   ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
2357534831adSStefano Zampini   for(i=0;i<total_counts;i++) {
2358534831adSStefano Zampini     nnz[i]=1;
2359534831adSStefano Zampini   }
2360534831adSStefano Zampini   j=total_counts;
2361534831adSStefano Zampini   for(i=n_vertices;i<local_primal_size;i++) {
2362534831adSStefano Zampini     if(!change_basis[i]) {
2363534831adSStefano Zampini       nnz[j]=temp_indices[i+1]-temp_indices[i];
2364534831adSStefano Zampini       j++;
2365534831adSStefano Zampini     }
2366534831adSStefano Zampini   }
2367534831adSStefano Zampini   ierr = MatSeqAIJSetPreallocation(pcbddc->ConstraintMatrix,0,nnz);CHKERRQ(ierr);
2368534831adSStefano Zampini   ierr = PetscFree(nnz);CHKERRQ(ierr);
2369534831adSStefano Zampini   /* set values in constraint matrix */
2370534831adSStefano Zampini   for(i=0;i<total_counts;i++) {
2371534831adSStefano Zampini     j = aux_primal_permutation[i];
2372534831adSStefano Zampini     k = aux_primal_numbering[j];
2373534831adSStefano Zampini     ierr = MatSetValue(pcbddc->ConstraintMatrix,i,k,1.0,INSERT_VALUES);CHKERRQ(ierr);
2374534831adSStefano Zampini   }
2375534831adSStefano Zampini   for(i=n_vertices;i<local_primal_size;i++) {
2376534831adSStefano Zampini     if(!change_basis[i]) {
2377534831adSStefano Zampini       size_of_constraint=temp_indices[i+1]-temp_indices[i];
2378534831adSStefano Zampini       ierr = MatSetValues(pcbddc->ConstraintMatrix,1,&total_counts,size_of_constraint,&temp_indices_to_constraint[temp_indices[i]],&temp_quadrature_constraint[temp_indices[i]],INSERT_VALUES);CHKERRQ(ierr);
2379534831adSStefano Zampini       total_counts++;
2380534831adSStefano Zampini     }
2381534831adSStefano Zampini   }
2382534831adSStefano Zampini   ierr = PetscFree(aux_primal_numbering);CHKERRQ(ierr);
2383534831adSStefano Zampini   ierr = PetscFree(aux_primal_permutation);CHKERRQ(ierr);
2384534831adSStefano Zampini   /* assembling */
2385534831adSStefano Zampini   ierr = MatAssemblyBegin(pcbddc->ConstraintMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2386534831adSStefano Zampini   ierr = MatAssemblyEnd(pcbddc->ConstraintMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2387534831adSStefano Zampini 
2388534831adSStefano Zampini   /* Create matrix for change of basis. We don't need it in case pcbddc->usechangeofbasis is FALSE */
2389534831adSStefano Zampini   if(pcbddc->usechangeofbasis) {
2390534831adSStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr);
2391534831adSStefano Zampini     ierr = MatSetType(pcbddc->ChangeOfBasisMatrix,impMatType);CHKERRQ(ierr);
2392534831adSStefano Zampini     ierr = MatSetSizes(pcbddc->ChangeOfBasisMatrix,pcis->n_B,pcis->n_B,pcis->n_B,pcis->n_B);CHKERRQ(ierr);
2393534831adSStefano Zampini     /* work arrays */
2394534831adSStefano Zampini     /* we need to reuse these arrays, so we free them */
2395534831adSStefano Zampini     ierr = PetscFree(temp_basis);CHKERRQ(ierr);
2396534831adSStefano Zampini     ierr = PetscFree(work);CHKERRQ(ierr);
2397534831adSStefano Zampini     ierr = PetscMalloc(pcis->n_B*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
2398534831adSStefano Zampini     ierr = PetscMalloc((nnsp_addone+nnsp_size)*(nnsp_addone+nnsp_size)*sizeof(PetscScalar),&temp_basis);CHKERRQ(ierr);
2399534831adSStefano Zampini     ierr = PetscMalloc((nnsp_addone+nnsp_size)*sizeof(PetscScalar),&work);CHKERRQ(ierr);
2400534831adSStefano Zampini     ierr = PetscMalloc((nnsp_addone+nnsp_size)*sizeof(PetscBLASInt),&ipiv);CHKERRQ(ierr);
2401534831adSStefano Zampini     for(i=0;i<pcis->n_B;i++) {
2402534831adSStefano Zampini       nnz[i]=1;
2403534831adSStefano Zampini     }
2404534831adSStefano Zampini     /* Overestimated nonzeros per row */
2405534831adSStefano Zampini     k=1;
2406534831adSStefano Zampini     for(i=pcbddc->n_vertices;i<local_primal_size;i++) {
2407534831adSStefano Zampini       if(change_basis[i]) {
2408534831adSStefano Zampini         size_of_constraint = temp_indices[i+1]-temp_indices[i];
2409534831adSStefano Zampini         if(k < size_of_constraint) {
2410534831adSStefano Zampini           k = size_of_constraint;
2411534831adSStefano Zampini         }
2412534831adSStefano Zampini         for(j=0;j<size_of_constraint;j++) {
2413534831adSStefano Zampini           nnz[temp_indices_to_constraint_B[temp_indices[i]+j]] = size_of_constraint;
2414534831adSStefano Zampini         }
2415534831adSStefano Zampini       }
2416534831adSStefano Zampini     }
2417534831adSStefano Zampini     ierr = MatSeqAIJSetPreallocation(pcbddc->ChangeOfBasisMatrix,0,nnz);CHKERRQ(ierr);
2418534831adSStefano Zampini     ierr = PetscFree(nnz);CHKERRQ(ierr);
2419534831adSStefano Zampini     /* Temporary array to store indices */
2420534831adSStefano Zampini     ierr = PetscMalloc(k*sizeof(PetscInt),&is_indices);CHKERRQ(ierr);
2421534831adSStefano Zampini     /* Set initial identity in the matrix */
2422534831adSStefano Zampini     for(i=0;i<pcis->n_B;i++) {
2423534831adSStefano Zampini       ierr = MatSetValue(pcbddc->ChangeOfBasisMatrix,i,i,1.0,INSERT_VALUES);CHKERRQ(ierr);
2424534831adSStefano Zampini     }
2425534831adSStefano Zampini     /* Now we loop on the constraints which need a change of basis */
2426534831adSStefano Zampini     /* Change of basis matrix is evaluated as the FIRST APPROACH in */
2427534831adSStefano Zampini     /* Klawonn and Widlund, Dual-primal FETI-DP methods for linear elasticity, (6.2.1) */
2428534831adSStefano Zampini     temp_constraints = 0;
2429*93dc3b60SStefano Zampini     if(pcbddc->n_vertices < local_primal_size) {
2430534831adSStefano Zampini       temp_start_ptr = temp_indices_to_constraint_B[temp_indices[pcbddc->n_vertices]];
2431*93dc3b60SStefano Zampini     }
2432534831adSStefano Zampini     for(i=pcbddc->n_vertices;i<local_primal_size;i++) {
2433534831adSStefano Zampini       if(change_basis[i]) {
2434534831adSStefano Zampini         compute_submatrix = PETSC_FALSE;
2435534831adSStefano Zampini         useksp = PETSC_FALSE;
2436534831adSStefano Zampini         if(temp_start_ptr == temp_indices_to_constraint_B[temp_indices[i]]) {
2437534831adSStefano Zampini           temp_constraints++;
243804eaf177SStefano Zampini           if(i == local_primal_size -1 ||  temp_start_ptr != temp_indices_to_constraint_B[temp_indices[i+1]]) {
2439534831adSStefano Zampini             compute_submatrix = PETSC_TRUE;
2440534831adSStefano Zampini           }
2441534831adSStefano Zampini         }
2442534831adSStefano Zampini         if(compute_submatrix) {
2443534831adSStefano Zampini           if(temp_constraints > 1 || pcbddc->use_nnsp_true) {
2444534831adSStefano Zampini             useksp = PETSC_TRUE;
2445534831adSStefano Zampini           }
2446534831adSStefano Zampini           size_of_constraint = temp_indices[i+1]-temp_indices[i];
2447534831adSStefano Zampini           if(useksp) { /* experimental */
2448534831adSStefano Zampini             ierr = MatCreate(PETSC_COMM_SELF,&temp_mat);CHKERRQ(ierr);
2449534831adSStefano Zampini             ierr = MatSetType(temp_mat,impMatType);CHKERRQ(ierr);
2450534831adSStefano Zampini             ierr = MatSetSizes(temp_mat,size_of_constraint,size_of_constraint,size_of_constraint,size_of_constraint);CHKERRQ(ierr);
2451534831adSStefano Zampini             ierr = MatSeqAIJSetPreallocation(temp_mat,size_of_constraint,PETSC_NULL);CHKERRQ(ierr);
2452534831adSStefano Zampini           }
2453534831adSStefano Zampini           /* First _size_of_constraint-temp_constraints_ columns */
2454534831adSStefano Zampini           dual_dofs = size_of_constraint-temp_constraints;
2455534831adSStefano Zampini           start_constraint = i+1-temp_constraints;
2456534831adSStefano Zampini           for(s=0;s<dual_dofs;s++) {
2457534831adSStefano Zampini             is_indices[0] = s;
2458534831adSStefano Zampini             for(j=0;j<temp_constraints;j++) {
2459534831adSStefano Zampini               for(k=0;k<temp_constraints;k++) {
2460534831adSStefano Zampini                 temp_basis[j*temp_constraints+k]=temp_quadrature_constraint[temp_indices[start_constraint+k]+s+j+1];
2461534831adSStefano Zampini               }
2462534831adSStefano Zampini               work[j]=-temp_quadrature_constraint[temp_indices[start_constraint+j]+s];
2463534831adSStefano Zampini               is_indices[j+1]=s+j+1;
2464534831adSStefano Zampini             }
2465534831adSStefano Zampini             Bt = temp_constraints;
2466534831adSStefano Zampini             ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
2467534831adSStefano Zampini             LAPACKgesv_(&Bt,&Bone,temp_basis,&Bt,ipiv,work,&Bt,&lierr);
2468534831adSStefano Zampini             if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GESV Lapack routine %d",(int)lierr);
2469534831adSStefano Zampini             ierr = PetscFPTrapPop();CHKERRQ(ierr);
2470534831adSStefano Zampini             j = temp_indices_to_constraint_B[temp_indices[start_constraint]+s];
2471534831adSStefano Zampini             ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,temp_constraints,&temp_indices_to_constraint_B[temp_indices[start_constraint]+s+1],1,&j,work,INSERT_VALUES);CHKERRQ(ierr);
2472534831adSStefano Zampini             if(useksp) {
2473534831adSStefano Zampini               /* temp mat with transposed rows and columns */
2474534831adSStefano Zampini               ierr = MatSetValues(temp_mat,1,&s,temp_constraints,&is_indices[1],work,INSERT_VALUES);CHKERRQ(ierr);
2475534831adSStefano Zampini               ierr = MatSetValue(temp_mat,is_indices[0],is_indices[0],1.0,INSERT_VALUES);CHKERRQ(ierr);
2476534831adSStefano Zampini             }
2477534831adSStefano Zampini           }
2478534831adSStefano Zampini           if(useksp) {
2479534831adSStefano Zampini             /* last rows of temp_mat */
2480534831adSStefano Zampini             for(j=0;j<size_of_constraint;j++) {
2481534831adSStefano Zampini               is_indices[j] = j;
2482534831adSStefano Zampini             }
2483534831adSStefano Zampini             for(s=0;s<temp_constraints;s++) {
2484534831adSStefano Zampini               k = s + dual_dofs;
2485534831adSStefano Zampini               ierr = MatSetValues(temp_mat,1,&k,size_of_constraint,is_indices,&temp_quadrature_constraint[temp_indices[start_constraint+s]],INSERT_VALUES);CHKERRQ(ierr);
2486534831adSStefano Zampini             }
2487534831adSStefano Zampini             ierr = MatAssemblyBegin(temp_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2488534831adSStefano Zampini             ierr = MatAssemblyEnd(temp_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2489534831adSStefano Zampini             ierr = MatGetVecs(temp_mat,&temp_vec,PETSC_NULL);CHKERRQ(ierr);
2490534831adSStefano Zampini             ierr = KSPCreate(PETSC_COMM_SELF,&temp_ksp);CHKERRQ(ierr);
2491534831adSStefano Zampini             ierr = KSPSetOperators(temp_ksp,temp_mat,temp_mat,SAME_PRECONDITIONER);CHKERRQ(ierr);
2492534831adSStefano Zampini             ierr = KSPSetType(temp_ksp,KSPPREONLY);CHKERRQ(ierr);
2493534831adSStefano Zampini             ierr = KSPSetUp(temp_ksp);CHKERRQ(ierr);
2494534831adSStefano Zampini             for(s=0;s<temp_constraints;s++) {
2495534831adSStefano Zampini               ierr = VecSet(temp_vec,0.0);CHKERRQ(ierr);
2496534831adSStefano Zampini               ierr = VecSetValue(temp_vec,s+dual_dofs,1.0,INSERT_VALUES);CHKERRQ(ierr);
2497534831adSStefano Zampini               ierr = VecAssemblyBegin(temp_vec);CHKERRQ(ierr);
2498534831adSStefano Zampini               ierr = VecAssemblyEnd(temp_vec);CHKERRQ(ierr);
2499534831adSStefano Zampini               ierr = KSPSolve(temp_ksp,temp_vec,temp_vec);CHKERRQ(ierr);
2500534831adSStefano Zampini               ierr = VecGetArray(temp_vec,&array_vector);CHKERRQ(ierr);
2501534831adSStefano Zampini               j = temp_indices_to_constraint_B[temp_indices[start_constraint+s]+size_of_constraint-s-1];
2502534831adSStefano Zampini               /* last columns of change of basis matrix associated to new primal dofs */
2503534831adSStefano Zampini               ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,size_of_constraint,&temp_indices_to_constraint_B[temp_indices[start_constraint+s]],1,&j,array_vector,INSERT_VALUES);CHKERRQ(ierr);
2504534831adSStefano Zampini               ierr = VecRestoreArray(temp_vec,&array_vector);CHKERRQ(ierr);
2505534831adSStefano Zampini             }
2506534831adSStefano Zampini             ierr = MatDestroy(&temp_mat);CHKERRQ(ierr);
2507534831adSStefano Zampini             ierr = KSPDestroy(&temp_ksp);CHKERRQ(ierr);
2508534831adSStefano Zampini             ierr = VecDestroy(&temp_vec);CHKERRQ(ierr);
2509534831adSStefano Zampini           } else {
2510534831adSStefano Zampini             /* last columns of change of basis matrix associated to new primal dofs */
2511534831adSStefano Zampini             for(s=0;s<temp_constraints;s++) {
2512534831adSStefano Zampini               j = temp_indices_to_constraint_B[temp_indices[start_constraint+s]+size_of_constraint-s-1];
2513534831adSStefano Zampini               ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,size_of_constraint,&temp_indices_to_constraint_B[temp_indices[start_constraint+s]],1,&j,&temp_quadrature_constraint[temp_indices[start_constraint+s]],INSERT_VALUES);CHKERRQ(ierr);
2514534831adSStefano Zampini             }
2515534831adSStefano Zampini           }
2516534831adSStefano Zampini           /* prepare for the next cycle */
2517534831adSStefano Zampini           temp_constraints = 0;
251804eaf177SStefano Zampini           if(i != local_primal_size -1 ) {
2519534831adSStefano Zampini             temp_start_ptr = temp_indices_to_constraint_B[temp_indices[i+1]];
2520534831adSStefano Zampini           }
2521534831adSStefano Zampini         }
2522534831adSStefano Zampini       }
252304eaf177SStefano Zampini     }
2524534831adSStefano Zampini     /* assembling */
2525534831adSStefano Zampini     ierr = MatAssemblyBegin(pcbddc->ChangeOfBasisMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2526534831adSStefano Zampini     ierr = MatAssemblyEnd(pcbddc->ChangeOfBasisMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2527534831adSStefano Zampini     ierr = PetscFree(ipiv);CHKERRQ(ierr);
2528534831adSStefano Zampini     ierr = PetscFree(is_indices);CHKERRQ(ierr);
2529534831adSStefano Zampini   }
25303b03a366Sstefano_zampini   /* free workspace no longer needed */
25313b03a366Sstefano_zampini   ierr = PetscFree(rwork);CHKERRQ(ierr);
25323b03a366Sstefano_zampini   ierr = PetscFree(work);CHKERRQ(ierr);
25333b03a366Sstefano_zampini   ierr = PetscFree(temp_basis);CHKERRQ(ierr);
25343b03a366Sstefano_zampini   ierr = PetscFree(singular_vals);CHKERRQ(ierr);
25353b03a366Sstefano_zampini   ierr = PetscFree(correlation_mat);CHKERRQ(ierr);
25363b03a366Sstefano_zampini   ierr = PetscFree(temp_indices);CHKERRQ(ierr);
2537534831adSStefano Zampini   ierr = PetscFree(change_basis);CHKERRQ(ierr);
25383b03a366Sstefano_zampini   ierr = PetscFree(temp_indices_to_constraint);CHKERRQ(ierr);
2539534831adSStefano Zampini   ierr = PetscFree(temp_indices_to_constraint_B);CHKERRQ(ierr);
2540534831adSStefano Zampini   ierr = PetscFree(local_to_B);CHKERRQ(ierr);
25413b03a366Sstefano_zampini   ierr = PetscFree(temp_quadrature_constraint);CHKERRQ(ierr);
25423425bc38SStefano Zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
25433425bc38SStefano Zampini   ierr = PetscFree(iwork);CHKERRQ(ierr);
25443425bc38SStefano Zampini   ierr = PetscFree(ifail);CHKERRQ(ierr);
25453425bc38SStefano Zampini   ierr = PetscFree(singular_vectors);CHKERRQ(ierr);
25463425bc38SStefano Zampini #endif
2547da1bb401SStefano Zampini   for(k=0;k<nnsp_size;k++) {
2548da1bb401SStefano Zampini     ierr = VecDestroy(&localnearnullsp[k]);CHKERRQ(ierr);
2549da1bb401SStefano Zampini   }
25503b03a366Sstefano_zampini   ierr = PetscFree(localnearnullsp);CHKERRQ(ierr);
25513b03a366Sstefano_zampini   PetscFunctionReturn(0);
25523b03a366Sstefano_zampini }
25533b03a366Sstefano_zampini /* -------------------------------------------------------------------------- */
25540c7d97c5SJed Brown #undef __FUNCT__
25550c7d97c5SJed Brown #define __FUNCT__ "PCBDDCCoarseSetUp"
255653cdbc3dSStefano Zampini static PetscErrorCode PCBDDCCoarseSetUp(PC pc)
25570c7d97c5SJed Brown {
25580c7d97c5SJed Brown   PetscErrorCode  ierr;
25590c7d97c5SJed Brown 
25600c7d97c5SJed Brown   PC_IS*            pcis = (PC_IS*)(pc->data);
25610c7d97c5SJed Brown   PC_BDDC*          pcbddc = (PC_BDDC*)pc->data;
25620c7d97c5SJed Brown   Mat_IS            *matis = (Mat_IS*)pc->pmat->data;
2563534831adSStefano Zampini   Mat               change_mat_all;
25640c7d97c5SJed Brown   IS                is_R_local;
25650c7d97c5SJed Brown   IS                is_V_local;
25660c7d97c5SJed Brown   IS                is_C_local;
25670c7d97c5SJed Brown   IS                is_aux1;
25680c7d97c5SJed Brown   IS                is_aux2;
25690c7d97c5SJed Brown   const VecType     impVecType;
25700c7d97c5SJed Brown   const MatType     impMatType;
25710c7d97c5SJed Brown   PetscInt          n_R=0;
25720c7d97c5SJed Brown   PetscInt          n_D=0;
25730c7d97c5SJed Brown   PetscInt          n_B=0;
25740c7d97c5SJed Brown   PetscScalar       zero=0.0;
25750c7d97c5SJed Brown   PetscScalar       one=1.0;
25760c7d97c5SJed Brown   PetscScalar       m_one=-1.0;
25770c7d97c5SJed Brown   PetscScalar*      array;
25780c7d97c5SJed Brown   PetscScalar       *coarse_submat_vals;
25790c7d97c5SJed Brown   PetscInt          *idx_R_local;
25800c7d97c5SJed Brown   PetscInt          *idx_V_B;
25810c7d97c5SJed Brown   PetscScalar       *coarsefunctions_errors;
25820c7d97c5SJed Brown   PetscScalar       *constraints_errors;
25830c7d97c5SJed Brown   /* auxiliary indices */
2584534831adSStefano Zampini   PetscInt i,j,k;
2585e269702eSStefano Zampini   /* for verbose output of bddc */
2586e269702eSStefano Zampini   PetscViewer       viewer=pcbddc->dbg_viewer;
2587e269702eSStefano Zampini   PetscBool         dbg_flag=pcbddc->dbg_flag;
2588a0ba757dSStefano Zampini   /* for counting coarse dofs */
2589534831adSStefano Zampini   PetscInt          n_vertices,n_constraints;
25903b03a366Sstefano_zampini   PetscInt          size_of_constraint;
25913b03a366Sstefano_zampini   PetscInt          *row_cmat_indices;
25923b03a366Sstefano_zampini   PetscScalar       *row_cmat_values;
2593534831adSStefano Zampini   PetscInt          *vertices,*nnz,*is_indices,*temp_indices;
25940c7d97c5SJed Brown 
25950c7d97c5SJed Brown   PetscFunctionBegin;
25960c7d97c5SJed Brown   /* Set Non-overlapping dimensions */
25970c7d97c5SJed Brown   n_B = pcis->n_B; n_D = pcis->n - n_B;
2598534831adSStefano Zampini   /* Set types for local objects needed by BDDC preconditioner */
2599534831adSStefano Zampini   impMatType = MATSEQDENSE;
2600534831adSStefano Zampini   impVecType = VECSEQ;
2601da1bb401SStefano Zampini   /* get vertex indices from constraint matrix */
2602534831adSStefano Zampini   ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscInt),&vertices);CHKERRQ(ierr);
2603534831adSStefano Zampini   n_vertices=0;
2604da1bb401SStefano Zampini   for(i=0;i<pcbddc->local_primal_size;i++) {
2605da1bb401SStefano Zampini     ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
2606da1bb401SStefano Zampini     if(size_of_constraint == 1) {
2607534831adSStefano Zampini       vertices[n_vertices]=row_cmat_indices[0];
2608534831adSStefano Zampini       n_vertices++;
2609a0ba757dSStefano Zampini     }
2610da1bb401SStefano Zampini     ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
2611a0ba757dSStefano Zampini   }
2612534831adSStefano Zampini   /* Set number of constraints */
2613534831adSStefano Zampini   n_constraints = pcbddc->local_primal_size-n_vertices;
2614534831adSStefano Zampini 
2615534831adSStefano Zampini   /* vertices in boundary numbering */
2616534831adSStefano Zampini   if(n_vertices) {
2617534831adSStefano Zampini     ierr = VecSet(pcis->vec1_N,m_one);CHKERRQ(ierr);
2618534831adSStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2619534831adSStefano Zampini     for (i=0; i<n_vertices; i++) { array[ vertices[i] ] = i; }
2620534831adSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2621534831adSStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
2622534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
2623534831adSStefano Zampini     ierr = PetscMalloc(n_vertices*sizeof(PetscInt),&idx_V_B);CHKERRQ(ierr);
2624534831adSStefano Zampini     ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
2625534831adSStefano Zampini     for (i=0; i<n_vertices; i++) {
2626534831adSStefano Zampini       j=0;
2627534831adSStefano Zampini       while (array[j] != i ) {j++;}
2628534831adSStefano Zampini       idx_V_B[i]=j;
2629534831adSStefano Zampini     }
2630534831adSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
2631534831adSStefano Zampini   }
2632534831adSStefano Zampini 
2633534831adSStefano Zampini   /* transform local matrices if needed */
2634534831adSStefano Zampini   if(pcbddc->usechangeofbasis) {
2635534831adSStefano Zampini     ierr = PetscMalloc(pcis->n*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
2636534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2637534831adSStefano Zampini     for(i=0;i<n_D;i++) {
2638534831adSStefano Zampini       nnz[is_indices[i]]=1;
2639534831adSStefano Zampini     }
2640534831adSStefano Zampini     ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2641534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2642534831adSStefano Zampini     k=1;
2643534831adSStefano Zampini     for(i=0;i<n_B;i++) {
2644534831adSStefano Zampini       ierr = MatGetRow(pcbddc->ChangeOfBasisMatrix,i,&j,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr);
2645534831adSStefano Zampini       nnz[is_indices[i]]=j;
2646534831adSStefano Zampini       if( k < j) {
2647534831adSStefano Zampini         k = j;
2648534831adSStefano Zampini       }
2649534831adSStefano Zampini       ierr = MatRestoreRow(pcbddc->ChangeOfBasisMatrix,i,&j,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr);
2650534831adSStefano Zampini     }
2651534831adSStefano Zampini     ierr = ISRestoreIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2652534831adSStefano Zampini     /* assemble change of basis matrix on the whole set of local dofs */
2653534831adSStefano Zampini     ierr = PetscMalloc(k*sizeof(PetscInt),&temp_indices);CHKERRQ(ierr);
2654534831adSStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&change_mat_all);CHKERRQ(ierr);
2655534831adSStefano Zampini     ierr = MatSetSizes(change_mat_all,pcis->n,pcis->n,pcis->n,pcis->n);CHKERRQ(ierr);
2656534831adSStefano Zampini     ierr = MatSetType(change_mat_all,MATSEQAIJ);CHKERRQ(ierr);
2657534831adSStefano Zampini     ierr = MatSeqAIJSetPreallocation(change_mat_all,0,nnz);CHKERRQ(ierr);
2658534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2659534831adSStefano Zampini     for(i=0;i<n_D;i++) {
2660534831adSStefano Zampini       ierr = MatSetValue(change_mat_all,is_indices[i],is_indices[i],1.0,INSERT_VALUES);CHKERRQ(ierr);
2661534831adSStefano Zampini     }
2662534831adSStefano Zampini     ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2663534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
2664534831adSStefano Zampini     for(i=0;i<n_B;i++) {
2665534831adSStefano Zampini       ierr = MatGetRow(pcbddc->ChangeOfBasisMatrix,i,&j,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
2666534831adSStefano Zampini       for(k=0;k<j;k++) {
2667534831adSStefano Zampini         temp_indices[k]=is_indices[row_cmat_indices[k]];
2668534831adSStefano Zampini       }
2669534831adSStefano Zampini       ierr = MatSetValues(change_mat_all,1,&is_indices[i],j,temp_indices,row_cmat_values,INSERT_VALUES);CHKERRQ(ierr);
2670534831adSStefano Zampini       ierr = MatRestoreRow(pcbddc->ChangeOfBasisMatrix,i,&j,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
2671534831adSStefano Zampini     }
2672534831adSStefano Zampini     ierr = MatAssemblyBegin(change_mat_all,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2673534831adSStefano Zampini     ierr = MatAssemblyEnd(change_mat_all,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2674534831adSStefano Zampini     ierr = MatPtAP(matis->A,change_mat_all,MAT_INITIAL_MATRIX,1.0,&pcbddc->local_mat);CHKERRQ(ierr);
2675534831adSStefano Zampini     ierr = MatDestroy(&pcis->A_IB);CHKERRQ(ierr);
2676534831adSStefano Zampini     ierr = MatDestroy(&pcis->A_BI);CHKERRQ(ierr);
2677534831adSStefano Zampini     ierr = MatDestroy(&pcis->A_BB);CHKERRQ(ierr);
2678534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_I_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&pcis->A_IB);CHKERRQ(ierr);
2679534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_B_local,pcis->is_I_local,MAT_INITIAL_MATRIX,&pcis->A_BI);CHKERRQ(ierr);
2680534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_B_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&pcis->A_BB);CHKERRQ(ierr);
2681534831adSStefano Zampini     ierr = MatDestroy(&change_mat_all);CHKERRQ(ierr);
2682534831adSStefano Zampini     ierr = PetscFree(nnz);CHKERRQ(ierr);
2683534831adSStefano Zampini     ierr = PetscFree(temp_indices);CHKERRQ(ierr);
2684534831adSStefano Zampini   } else {
2685534831adSStefano Zampini     /* without change of basis, the local matrix is unchanged */
2686534831adSStefano Zampini     ierr = PetscObjectReference((PetscObject)matis->A);CHKERRQ(ierr);
2687534831adSStefano Zampini     pcbddc->local_mat = matis->A;
2688534831adSStefano Zampini   }
2689a0ba757dSStefano Zampini 
26900c7d97c5SJed Brown   /* Dohrmann's notation: dofs split into R (Remaining: all dofs but the vertices) and V (Vertices) */
26910c7d97c5SJed Brown   ierr = VecSet(pcis->vec1_N,one);CHKERRQ(ierr);
26920c7d97c5SJed Brown   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
26933b03a366Sstefano_zampini   for (i=0;i<n_vertices;i++) { array[ vertices[i] ] = zero; }
26943b03a366Sstefano_zampini   ierr = PetscMalloc(( pcis->n - n_vertices )*sizeof(PetscInt),&idx_R_local);CHKERRQ(ierr);
26950c7d97c5SJed Brown   for (i=0, n_R=0; i<pcis->n; i++) { if (array[i] == one) { idx_R_local[n_R] = i; n_R++; } }
26960c7d97c5SJed Brown   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2697e269702eSStefano Zampini   if(dbg_flag) {
26980c7d97c5SJed Brown     ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
26990c7d97c5SJed Brown     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
27000c7d97c5SJed Brown     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d local dimensions\n",PetscGlobalRank);CHKERRQ(ierr);
27010c7d97c5SJed Brown     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local_size = %d, dirichlet_size = %d, boundary_size = %d\n",pcis->n,n_D,n_B);CHKERRQ(ierr);
27023b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"r_size = %d, v_size = %d, constraints = %d, local_primal_size = %d\n",n_R,n_vertices,n_constraints,pcbddc->local_primal_size);CHKERRQ(ierr);
2703534831adSStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"pcbddc->n_vertices = %d, pcbddc->n_constraints = %d\n",pcbddc->n_vertices,pcbddc->n_constraints);CHKERRQ(ierr);
27040c7d97c5SJed Brown     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
27050c7d97c5SJed Brown   }
2706534831adSStefano Zampini 
27070c7d97c5SJed Brown   /* Allocate needed vectors */
2708534831adSStefano Zampini   ierr = VecDuplicate(pcis->vec1_global,&pcbddc->original_rhs);CHKERRQ(ierr);
27093972b0daSStefano Zampini   ierr = VecDuplicate(pcis->vec1_global,&pcbddc->temp_solution);CHKERRQ(ierr);
27100c7d97c5SJed Brown   ierr = VecDuplicate(pcis->vec1_D,&pcbddc->vec4_D);CHKERRQ(ierr);
27110c7d97c5SJed Brown   ierr = VecCreate(PETSC_COMM_SELF,&pcbddc->vec1_R);CHKERRQ(ierr);
27120c7d97c5SJed Brown   ierr = VecSetSizes(pcbddc->vec1_R,n_R,n_R);CHKERRQ(ierr);
27130c7d97c5SJed Brown   ierr = VecSetType(pcbddc->vec1_R,impVecType);CHKERRQ(ierr);
2714d49ef151SStefano Zampini   ierr = VecDuplicate(pcbddc->vec1_R,&pcbddc->vec2_R);CHKERRQ(ierr);
27150c7d97c5SJed Brown   ierr = VecCreate(PETSC_COMM_SELF,&pcbddc->vec1_P);CHKERRQ(ierr);
27160c7d97c5SJed Brown   ierr = VecSetSizes(pcbddc->vec1_P,pcbddc->local_primal_size,pcbddc->local_primal_size);CHKERRQ(ierr);
27170c7d97c5SJed Brown   ierr = VecSetType(pcbddc->vec1_P,impVecType);CHKERRQ(ierr);
27180c7d97c5SJed Brown 
27190c7d97c5SJed Brown   /* Creating some index sets needed  */
27200c7d97c5SJed Brown   /* For submatrices */
2721da1bb401SStefano Zampini   ierr = ISCreateGeneral(PETSC_COMM_SELF,n_R,idx_R_local,PETSC_OWN_POINTER,&is_R_local);CHKERRQ(ierr);
27223b03a366Sstefano_zampini   if(n_vertices)    {
2723da1bb401SStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,n_vertices,vertices,PETSC_OWN_POINTER,&is_V_local);CHKERRQ(ierr);
27243b03a366Sstefano_zampini   }
2725da1bb401SStefano Zampini   if(n_constraints) {
2726da1bb401SStefano Zampini     ierr = ISCreateStride(PETSC_COMM_SELF,n_constraints,n_vertices,1,&is_C_local);CHKERRQ(ierr);
2727da1bb401SStefano Zampini   }
2728da1bb401SStefano Zampini 
27290c7d97c5SJed Brown   /* For VecScatters pcbddc->R_to_B and (optionally) pcbddc->R_to_D */
27300c7d97c5SJed Brown   {
27310c7d97c5SJed Brown     PetscInt   *aux_array1;
27320c7d97c5SJed Brown     PetscInt   *aux_array2;
27330c7d97c5SJed Brown 
27343b03a366Sstefano_zampini     ierr = PetscMalloc( (pcis->n_B-n_vertices)*sizeof(PetscInt),&aux_array1);CHKERRQ(ierr);
27353b03a366Sstefano_zampini     ierr = PetscMalloc( (pcis->n_B-n_vertices)*sizeof(PetscInt),&aux_array2);CHKERRQ(ierr);
27360c7d97c5SJed Brown 
2737d49ef151SStefano Zampini     ierr = VecSet(pcis->vec1_global,zero);CHKERRQ(ierr);
27380c7d97c5SJed Brown     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
27390c7d97c5SJed Brown     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
27400c7d97c5SJed Brown     ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
27410c7d97c5SJed Brown     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
27420c7d97c5SJed Brown     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
27430c7d97c5SJed Brown     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
27440c7d97c5SJed Brown     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2745da1bb401SStefano Zampini     for (i=0, j=0; i<n_R; i++) { if (array[idx_R_local[i]] > one) { aux_array1[j] = i; j++; } }
27460c7d97c5SJed Brown     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2747da1bb401SStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_COPY_VALUES,&is_aux1);CHKERRQ(ierr);
27480c7d97c5SJed Brown     ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
2749da1bb401SStefano Zampini     for (i=0, j=0; i<n_B; i++) { if (array[i] > one) { aux_array2[j] = i; j++; } }
27503828260eSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
2751da1bb401SStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array2,PETSC_COPY_VALUES,&is_aux2);CHKERRQ(ierr);
27520c7d97c5SJed Brown     ierr = VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_B,is_aux2,&pcbddc->R_to_B);CHKERRQ(ierr);
27530c7d97c5SJed Brown     ierr = PetscFree(aux_array1);CHKERRQ(ierr);
27540c7d97c5SJed Brown     ierr = PetscFree(aux_array2);CHKERRQ(ierr);
27550c7d97c5SJed Brown     ierr = ISDestroy(&is_aux1);CHKERRQ(ierr);
27560c7d97c5SJed Brown     ierr = ISDestroy(&is_aux2);CHKERRQ(ierr);
27570c7d97c5SJed Brown 
2758e269702eSStefano Zampini     if(pcbddc->prec_type || dbg_flag ) {
27590c7d97c5SJed Brown       ierr = PetscMalloc(n_D*sizeof(PetscInt),&aux_array1);CHKERRQ(ierr);
27600c7d97c5SJed Brown       ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2761da1bb401SStefano Zampini       for (i=0, j=0; i<n_R; i++) { if (array[idx_R_local[i]] == one) { aux_array1[j] = i; j++; } }
27620c7d97c5SJed Brown       ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2763da1bb401SStefano Zampini       ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_COPY_VALUES,&is_aux1);CHKERRQ(ierr);
27640c7d97c5SJed Brown       ierr = VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_D,(IS)0,&pcbddc->R_to_D);CHKERRQ(ierr);
27650c7d97c5SJed Brown       ierr = PetscFree(aux_array1);CHKERRQ(ierr);
27660c7d97c5SJed Brown       ierr = ISDestroy(&is_aux1);CHKERRQ(ierr);
27670c7d97c5SJed Brown     }
27680c7d97c5SJed Brown   }
27690c7d97c5SJed Brown 
27700c7d97c5SJed Brown   /* Creating PC contexts for local Dirichlet and Neumann problems */
27710c7d97c5SJed Brown   {
27720c7d97c5SJed Brown     Mat  A_RR;
277353cdbc3dSStefano Zampini     PC   pc_temp;
27740c7d97c5SJed Brown     /* Matrix for Dirichlet problem is A_II -> we already have it from pcis.c code */
277553cdbc3dSStefano Zampini     ierr = KSPCreate(PETSC_COMM_SELF,&pcbddc->ksp_D);CHKERRQ(ierr);
277653cdbc3dSStefano Zampini     ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->ksp_D,(PetscObject)pc,1);CHKERRQ(ierr);
277753cdbc3dSStefano Zampini     ierr = KSPSetOperators(pcbddc->ksp_D,pcis->A_II,pcis->A_II,SAME_PRECONDITIONER);CHKERRQ(ierr);
277853cdbc3dSStefano Zampini     ierr = KSPSetType(pcbddc->ksp_D,KSPPREONLY);CHKERRQ(ierr);
2779da1bb401SStefano Zampini     ierr = KSPSetOptionsPrefix(pcbddc->ksp_D,"dirichlet_");CHKERRQ(ierr);
27800c7d97c5SJed Brown     /* default */
278153cdbc3dSStefano Zampini     ierr = KSPGetPC(pcbddc->ksp_D,&pc_temp);CHKERRQ(ierr);
278253cdbc3dSStefano Zampini     ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr);
27830c7d97c5SJed Brown     /* Allow user's customization */
278453cdbc3dSStefano Zampini     ierr = KSPSetFromOptions(pcbddc->ksp_D);CHKERRQ(ierr);
278553cdbc3dSStefano Zampini     /* Set Up KSP for Dirichlet problem of BDDC */
278653cdbc3dSStefano Zampini     ierr = KSPSetUp(pcbddc->ksp_D);CHKERRQ(ierr);
27873972b0daSStefano Zampini     /* set ksp_D into pcis data */
27883972b0daSStefano Zampini     ierr = KSPDestroy(&pcis->ksp_D);CHKERRQ(ierr);
27893972b0daSStefano Zampini     ierr = PetscObjectReference((PetscObject)pcbddc->ksp_D);CHKERRQ(ierr);
27903972b0daSStefano Zampini     pcis->ksp_D = pcbddc->ksp_D;
27910c7d97c5SJed Brown     /* Matrix for Neumann problem is A_RR -> we need to create it */
2792534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,is_R_local,is_R_local,MAT_INITIAL_MATRIX,&A_RR);CHKERRQ(ierr);
279353cdbc3dSStefano Zampini     ierr = KSPCreate(PETSC_COMM_SELF,&pcbddc->ksp_R);CHKERRQ(ierr);
279453cdbc3dSStefano Zampini     ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->ksp_R,(PetscObject)pc,1);CHKERRQ(ierr);
279553cdbc3dSStefano Zampini     ierr = KSPSetOperators(pcbddc->ksp_R,A_RR,A_RR,SAME_PRECONDITIONER);CHKERRQ(ierr);
279653cdbc3dSStefano Zampini     ierr = KSPSetType(pcbddc->ksp_R,KSPPREONLY);CHKERRQ(ierr);
2797da1bb401SStefano Zampini     ierr = KSPSetOptionsPrefix(pcbddc->ksp_R,"neumann_");CHKERRQ(ierr);
27980c7d97c5SJed Brown     /* default */
279953cdbc3dSStefano Zampini     ierr = KSPGetPC(pcbddc->ksp_R,&pc_temp);CHKERRQ(ierr);
280053cdbc3dSStefano Zampini     ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr);
28010c7d97c5SJed Brown     /* Allow user's customization */
280253cdbc3dSStefano Zampini     ierr = KSPSetFromOptions(pcbddc->ksp_R);CHKERRQ(ierr);
280353cdbc3dSStefano Zampini     /* Set Up KSP for Neumann problem of BDDC */
280453cdbc3dSStefano Zampini     ierr = KSPSetUp(pcbddc->ksp_R);CHKERRQ(ierr);
2805a0ba757dSStefano Zampini     /* check Dirichlet and Neumann solvers */
2806b76ba322SStefano Zampini     {
28070c7d97c5SJed Brown       Vec         temp_vec;
2808b76ba322SStefano Zampini       PetscReal   value;
2809b76ba322SStefano Zampini       PetscMPIInt use_exact,use_exact_reduced;
28100c7d97c5SJed Brown 
2811a0ba757dSStefano Zampini       ierr = VecDuplicate(pcis->vec1_D,&temp_vec);CHKERRQ(ierr);
2812a0ba757dSStefano Zampini       ierr = VecSetRandom(pcis->vec1_D,PETSC_NULL);CHKERRQ(ierr);
2813a0ba757dSStefano Zampini       ierr = MatMult(pcis->A_II,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
2814a0ba757dSStefano Zampini       ierr = KSPSolve(pcbddc->ksp_D,pcis->vec2_D,temp_vec);CHKERRQ(ierr);
2815a0ba757dSStefano Zampini       ierr = VecAXPY(temp_vec,m_one,pcis->vec1_D);CHKERRQ(ierr);
2816a0ba757dSStefano Zampini       ierr = VecNorm(temp_vec,NORM_INFINITY,&value);CHKERRQ(ierr);
2817b76ba322SStefano Zampini       use_exact = 1;
2818b76ba322SStefano Zampini       if(PetscAbsReal(value) > 1.e-4) {
2819b76ba322SStefano Zampini         use_exact = 0;
2820b76ba322SStefano Zampini       }
2821b76ba322SStefano Zampini       ierr = MPI_Allreduce(&use_exact,&use_exact_reduced,1,MPIU_INT,MPI_LAND,((PetscObject)pc)->comm);CHKERRQ(ierr);
2822b76ba322SStefano Zampini       pcbddc->use_exact_dirichlet = (PetscBool) use_exact_reduced;
2823a0ba757dSStefano Zampini       ierr = VecDestroy(&temp_vec);CHKERRQ(ierr);
2824b76ba322SStefano Zampini       if(dbg_flag) {
2825a0ba757dSStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
2826a0ba757dSStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
2827a0ba757dSStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"Checking solution of Dirichlet and Neumann problems\n");CHKERRQ(ierr);
2828a0ba757dSStefano Zampini         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d infinity error for Dirichlet solve = % 1.14e \n",PetscGlobalRank,value);CHKERRQ(ierr);
2829d49ef151SStefano Zampini         ierr = VecDuplicate(pcbddc->vec1_R,&temp_vec);CHKERRQ(ierr);
2830d49ef151SStefano Zampini         ierr = VecSetRandom(pcbddc->vec1_R,PETSC_NULL);CHKERRQ(ierr);
2831d49ef151SStefano Zampini         ierr = MatMult(A_RR,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
2832d49ef151SStefano Zampini         ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec2_R,temp_vec);CHKERRQ(ierr);
2833d49ef151SStefano Zampini         ierr = VecAXPY(temp_vec,m_one,pcbddc->vec1_R);CHKERRQ(ierr);
2834d49ef151SStefano Zampini         ierr = VecNorm(temp_vec,NORM_INFINITY,&value);CHKERRQ(ierr);
2835e269702eSStefano Zampini         ierr = VecDestroy(&temp_vec);CHKERRQ(ierr);
28360c7d97c5SJed Brown         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d infinity error for  Neumann  solve = % 1.14e \n",PetscGlobalRank,value);CHKERRQ(ierr);
2837d49ef151SStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
28380c7d97c5SJed Brown       }
2839b76ba322SStefano Zampini     }
28400c7d97c5SJed Brown     /* free Neumann problem's matrix */
28410c7d97c5SJed Brown     ierr = MatDestroy(&A_RR);CHKERRQ(ierr);
28420c7d97c5SJed Brown   }
28430c7d97c5SJed Brown 
28440c7d97c5SJed Brown   /* Assemble all remaining stuff needed to apply BDDC  */
28450c7d97c5SJed Brown   {
28460c7d97c5SJed Brown     Mat          A_RV,A_VR,A_VV;
28470c7d97c5SJed Brown     Mat          M1,M2;
28480c7d97c5SJed Brown     Mat          C_CR;
28493b03a366Sstefano_zampini     Mat          AUXMAT;
28500c7d97c5SJed Brown     Vec          vec1_C;
28510c7d97c5SJed Brown     Vec          vec2_C;
28520c7d97c5SJed Brown     Vec          vec1_V;
28530c7d97c5SJed Brown     Vec          vec2_V;
28540c7d97c5SJed Brown     PetscInt     *nnz;
28550c7d97c5SJed Brown     PetscInt     *auxindices;
285653cdbc3dSStefano Zampini     PetscInt     index;
28570c7d97c5SJed Brown     PetscScalar* array2;
28580c7d97c5SJed Brown     MatFactorInfo matinfo;
28590c7d97c5SJed Brown 
28600c7d97c5SJed Brown     /* Allocating some extra storage just to be safe */
28610c7d97c5SJed Brown     ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
28620c7d97c5SJed Brown     ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&auxindices);CHKERRQ(ierr);
28630c7d97c5SJed Brown     for(i=0;i<pcis->n;i++) {auxindices[i]=i;}
28640c7d97c5SJed Brown 
28650c7d97c5SJed Brown     /* some work vectors on vertices and/or constraints */
28663b03a366Sstefano_zampini     if(n_vertices) {
28670c7d97c5SJed Brown       ierr = VecCreate(PETSC_COMM_SELF,&vec1_V);CHKERRQ(ierr);
28683b03a366Sstefano_zampini       ierr = VecSetSizes(vec1_V,n_vertices,n_vertices);CHKERRQ(ierr);
28690c7d97c5SJed Brown       ierr = VecSetType(vec1_V,impVecType);CHKERRQ(ierr);
28700c7d97c5SJed Brown       ierr = VecDuplicate(vec1_V,&vec2_V);CHKERRQ(ierr);
28710c7d97c5SJed Brown     }
2872534831adSStefano Zampini     if(n_constraints) {
28730c7d97c5SJed Brown       ierr = VecCreate(PETSC_COMM_SELF,&vec1_C);CHKERRQ(ierr);
2874534831adSStefano Zampini       ierr = VecSetSizes(vec1_C,n_constraints,n_constraints);CHKERRQ(ierr);
28750c7d97c5SJed Brown       ierr = VecSetType(vec1_C,impVecType);CHKERRQ(ierr);
28760c7d97c5SJed Brown       ierr = VecDuplicate(vec1_C,&vec2_C);CHKERRQ(ierr);
28770c7d97c5SJed Brown       ierr = VecDuplicate(vec1_C,&pcbddc->vec1_C);CHKERRQ(ierr);
28780c7d97c5SJed Brown     }
28790c7d97c5SJed Brown     /* Precompute quantities needed for preprocessing and application of BDDC */
28803b03a366Sstefano_zampini     if(n_constraints) {
28810c7d97c5SJed Brown       ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->local_auxmat2);CHKERRQ(ierr);
28823b03a366Sstefano_zampini       ierr = MatSetSizes(pcbddc->local_auxmat2,n_R,n_constraints,n_R,n_constraints);CHKERRQ(ierr);
28830c7d97c5SJed Brown       ierr = MatSetType(pcbddc->local_auxmat2,impMatType);CHKERRQ(ierr);
28843b03a366Sstefano_zampini       ierr = MatSeqDenseSetPreallocation(pcbddc->local_auxmat2,PETSC_NULL);CHKERRQ(ierr);
28850c7d97c5SJed Brown 
288657a90decSStefano Zampini       /* Create Constraint matrix on R nodes: C_{CR}  */
288757a90decSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->ConstraintMatrix,is_C_local,is_R_local,MAT_INITIAL_MATRIX,&C_CR);CHKERRQ(ierr);
288857a90decSStefano Zampini       ierr = ISDestroy(&is_C_local);CHKERRQ(ierr);
288957a90decSStefano Zampini 
28900c7d97c5SJed Brown       /* Assemble local_auxmat2 = - A_{RR}^{-1} C^T_{CR} needed by BDDC application */
28913b03a366Sstefano_zampini       for(i=0;i<n_constraints;i++) {
28923b03a366Sstefano_zampini         ierr = VecSet(pcbddc->vec1_R,zero);CHKERRQ(ierr);
28933b03a366Sstefano_zampini         /* Get row of constraint matrix in R numbering */
289457a90decSStefano Zampini         ierr = VecGetArray(pcbddc->vec1_R,&array);CHKERRQ(ierr);
289557a90decSStefano Zampini         ierr = MatGetRow(C_CR,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
28963b03a366Sstefano_zampini         for(j=0;j<size_of_constraint;j++) { array[ row_cmat_indices[j] ] = - row_cmat_values[j]; }
289757a90decSStefano Zampini         ierr = MatRestoreRow(C_CR,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
289857a90decSStefano Zampini         ierr = VecRestoreArray(pcbddc->vec1_R,&array);CHKERRQ(ierr);
28993b03a366Sstefano_zampini         /* Solve for row of constraint matrix in R numbering */
290053cdbc3dSStefano Zampini         ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
29013b03a366Sstefano_zampini         /* Set values */
29020c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec2_R,&array);CHKERRQ(ierr);
29033b03a366Sstefano_zampini         ierr = MatSetValues(pcbddc->local_auxmat2,n_R,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
29040c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec2_R,&array);CHKERRQ(ierr);
29050c7d97c5SJed Brown       }
29060c7d97c5SJed Brown       ierr = MatAssemblyBegin(pcbddc->local_auxmat2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
29070c7d97c5SJed Brown       ierr = MatAssemblyEnd(pcbddc->local_auxmat2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
29080c7d97c5SJed Brown 
29090c7d97c5SJed Brown       /* Assemble AUXMAT = ( LUFactor )( -C_{CR} A_{RR}^{-1} C^T_{CR} )^{-1} */
29100c7d97c5SJed Brown       ierr = MatMatMult(C_CR,pcbddc->local_auxmat2,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&AUXMAT);CHKERRQ(ierr);
2911d49ef151SStefano Zampini       ierr = MatFactorInfoInitialize(&matinfo);CHKERRQ(ierr);
29123b03a366Sstefano_zampini       ierr = ISCreateStride(PETSC_COMM_SELF,n_constraints,0,1,&is_aux1);CHKERRQ(ierr);
29130c7d97c5SJed Brown       ierr = MatLUFactor(AUXMAT,is_aux1,is_aux1,&matinfo);CHKERRQ(ierr);
29140c7d97c5SJed Brown       ierr = ISDestroy(&is_aux1);CHKERRQ(ierr);
29150c7d97c5SJed Brown 
29163b03a366Sstefano_zampini       /* Assemble explicitly M1 = ( C_{CR} A_{RR}^{-1} C^T_{CR} )^{-1} needed in preproc  */
2917d49ef151SStefano Zampini       ierr = MatCreate(PETSC_COMM_SELF,&M1);CHKERRQ(ierr);
29183b03a366Sstefano_zampini       ierr = MatSetSizes(M1,n_constraints,n_constraints,n_constraints,n_constraints);CHKERRQ(ierr);
29190c7d97c5SJed Brown       ierr = MatSetType(M1,impMatType);CHKERRQ(ierr);
29203b03a366Sstefano_zampini       ierr = MatSeqDenseSetPreallocation(M1,PETSC_NULL);CHKERRQ(ierr);
29213b03a366Sstefano_zampini       for(i=0;i<n_constraints;i++) {
29220c7d97c5SJed Brown         ierr = VecSet(vec1_C,zero);CHKERRQ(ierr);
29230c7d97c5SJed Brown         ierr = VecSetValue(vec1_C,i,one,INSERT_VALUES);CHKERRQ(ierr);
29240c7d97c5SJed Brown         ierr = VecAssemblyBegin(vec1_C);CHKERRQ(ierr);
29250c7d97c5SJed Brown         ierr = VecAssemblyEnd(vec1_C);CHKERRQ(ierr);
29260c7d97c5SJed Brown         ierr = MatSolve(AUXMAT,vec1_C,vec2_C);CHKERRQ(ierr);
29270c7d97c5SJed Brown         ierr = VecScale(vec2_C,m_one);CHKERRQ(ierr);
29280c7d97c5SJed Brown         ierr = VecGetArray(vec2_C,&array);CHKERRQ(ierr);
29293b03a366Sstefano_zampini         ierr = MatSetValues(M1,n_constraints,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
29300c7d97c5SJed Brown         ierr = VecRestoreArray(vec2_C,&array);CHKERRQ(ierr);
29310c7d97c5SJed Brown       }
29320c7d97c5SJed Brown       ierr = MatAssemblyBegin(M1,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
29330c7d97c5SJed Brown       ierr = MatAssemblyEnd(M1,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
29340c7d97c5SJed Brown       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
29350c7d97c5SJed Brown       /* Assemble local_auxmat1 = M1*C_{CR} needed by BDDC application in KSP and in preproc */
29360c7d97c5SJed Brown       ierr = MatMatMult(M1,C_CR,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&pcbddc->local_auxmat1);CHKERRQ(ierr);
29370c7d97c5SJed Brown 
29380c7d97c5SJed Brown     }
29390c7d97c5SJed Brown 
29400c7d97c5SJed Brown     /* Get submatrices from subdomain matrix */
29413b03a366Sstefano_zampini     if(n_vertices){
2942534831adSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->local_mat,is_R_local,is_V_local,MAT_INITIAL_MATRIX,&A_RV);CHKERRQ(ierr);
2943534831adSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->local_mat,is_V_local,is_R_local,MAT_INITIAL_MATRIX,&A_VR);CHKERRQ(ierr);
2944534831adSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->local_mat,is_V_local,is_V_local,MAT_INITIAL_MATRIX,&A_VV);CHKERRQ(ierr);
29450c7d97c5SJed Brown       /* Assemble M2 = A_RR^{-1}A_RV */
2946d49ef151SStefano Zampini       ierr = MatCreate(PETSC_COMM_SELF,&M2);CHKERRQ(ierr);
29473b03a366Sstefano_zampini       ierr = MatSetSizes(M2,n_R,n_vertices,n_R,n_vertices);CHKERRQ(ierr);
29480c7d97c5SJed Brown       ierr = MatSetType(M2,impMatType);CHKERRQ(ierr);
29493b03a366Sstefano_zampini       ierr = MatSeqDenseSetPreallocation(M2,PETSC_NULL);CHKERRQ(ierr);
29503b03a366Sstefano_zampini       for(i=0;i<n_vertices;i++) {
29510c7d97c5SJed Brown         ierr = VecSet(vec1_V,zero);CHKERRQ(ierr);
29520c7d97c5SJed Brown         ierr = VecSetValue(vec1_V,i,one,INSERT_VALUES);CHKERRQ(ierr);
29530c7d97c5SJed Brown         ierr = VecAssemblyBegin(vec1_V);CHKERRQ(ierr);
29540c7d97c5SJed Brown         ierr = VecAssemblyEnd(vec1_V);CHKERRQ(ierr);
29550c7d97c5SJed Brown         ierr = MatMult(A_RV,vec1_V,pcbddc->vec1_R);CHKERRQ(ierr);
295653cdbc3dSStefano Zampini         ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
29570c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec2_R,&array);CHKERRQ(ierr);
29583b03a366Sstefano_zampini         ierr = MatSetValues(M2,n_R,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
29590c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec2_R,&array);CHKERRQ(ierr);
29600c7d97c5SJed Brown       }
29610c7d97c5SJed Brown       ierr = MatAssemblyBegin(M2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
29620c7d97c5SJed Brown       ierr = MatAssemblyEnd(M2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
29630c7d97c5SJed Brown     }
29640c7d97c5SJed Brown 
29650c7d97c5SJed Brown     /* Matrix of coarse basis functions (local) */
2966d49ef151SStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->coarse_phi_B);CHKERRQ(ierr);
29670c7d97c5SJed Brown     ierr = MatSetSizes(pcbddc->coarse_phi_B,n_B,pcbddc->local_primal_size,n_B,pcbddc->local_primal_size);CHKERRQ(ierr);
29680c7d97c5SJed Brown     ierr = MatSetType(pcbddc->coarse_phi_B,impMatType);CHKERRQ(ierr);
29693b03a366Sstefano_zampini     ierr = MatSeqDenseSetPreallocation(pcbddc->coarse_phi_B,PETSC_NULL);CHKERRQ(ierr);
2970e269702eSStefano Zampini     if(pcbddc->prec_type || dbg_flag ) {
2971d49ef151SStefano Zampini       ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->coarse_phi_D);CHKERRQ(ierr);
29720c7d97c5SJed Brown       ierr = MatSetSizes(pcbddc->coarse_phi_D,n_D,pcbddc->local_primal_size,n_D,pcbddc->local_primal_size);CHKERRQ(ierr);
29730c7d97c5SJed Brown       ierr = MatSetType(pcbddc->coarse_phi_D,impMatType);CHKERRQ(ierr);
29743b03a366Sstefano_zampini       ierr = MatSeqDenseSetPreallocation(pcbddc->coarse_phi_D,PETSC_NULL);CHKERRQ(ierr);
29750c7d97c5SJed Brown     }
29760c7d97c5SJed Brown 
2977e269702eSStefano Zampini     if(dbg_flag) {
29780c7d97c5SJed Brown       ierr = PetscMalloc( pcbddc->local_primal_size*sizeof(PetscScalar),&coarsefunctions_errors);CHKERRQ(ierr);
29790c7d97c5SJed Brown       ierr = PetscMalloc( pcbddc->local_primal_size*sizeof(PetscScalar),&constraints_errors);CHKERRQ(ierr);
29800c7d97c5SJed Brown     }
29813b03a366Sstefano_zampini     /* Subdomain contribution (Non-overlapping) to coarse matrix  */
29820c7d97c5SJed Brown     ierr = PetscMalloc ((pcbddc->local_primal_size)*(pcbddc->local_primal_size)*sizeof(PetscScalar),&coarse_submat_vals);CHKERRQ(ierr);
29830c7d97c5SJed Brown 
29840c7d97c5SJed Brown     /* We are now ready to evaluate coarse basis functions and subdomain contribution to coarse problem */
29853b03a366Sstefano_zampini     for(i=0;i<n_vertices;i++){
29860c7d97c5SJed Brown       ierr = VecSet(vec1_V,zero);CHKERRQ(ierr);
29870c7d97c5SJed Brown       ierr = VecSetValue(vec1_V,i,one,INSERT_VALUES);CHKERRQ(ierr);
29880c7d97c5SJed Brown       ierr = VecAssemblyBegin(vec1_V);CHKERRQ(ierr);
29890c7d97c5SJed Brown       ierr = VecAssemblyEnd(vec1_V);CHKERRQ(ierr);
29900c7d97c5SJed Brown       /* solution of saddle point problem */
29910c7d97c5SJed Brown       ierr = MatMult(M2,vec1_V,pcbddc->vec1_R);CHKERRQ(ierr);
29920c7d97c5SJed Brown       ierr = VecScale(pcbddc->vec1_R,m_one);CHKERRQ(ierr);
29933b03a366Sstefano_zampini       if(n_constraints) {
29940c7d97c5SJed Brown         ierr = MatMult(pcbddc->local_auxmat1,pcbddc->vec1_R,vec1_C);CHKERRQ(ierr);
29950c7d97c5SJed Brown         ierr = MatMultAdd(pcbddc->local_auxmat2,vec1_C,pcbddc->vec1_R,pcbddc->vec1_R);CHKERRQ(ierr);
29960c7d97c5SJed Brown         ierr = VecScale(vec1_C,m_one);CHKERRQ(ierr);
29970c7d97c5SJed Brown       }
29980c7d97c5SJed Brown       ierr = MatMult(A_VR,pcbddc->vec1_R,vec2_V);CHKERRQ(ierr);
29990c7d97c5SJed Brown       ierr = MatMultAdd(A_VV,vec1_V,vec2_V,vec2_V);CHKERRQ(ierr);
30000c7d97c5SJed Brown 
30010c7d97c5SJed Brown       /* Set values in coarse basis function and subdomain part of coarse_mat */
30020c7d97c5SJed Brown       /* coarse basis functions */
30030c7d97c5SJed Brown       ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr);
30040c7d97c5SJed Brown       ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
30050c7d97c5SJed Brown       ierr = VecScatterEnd  (pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
30060c7d97c5SJed Brown       ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
30073b03a366Sstefano_zampini       ierr = MatSetValues(pcbddc->coarse_phi_B,n_B,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
30080c7d97c5SJed Brown       ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
30090c7d97c5SJed Brown       ierr = MatSetValue(pcbddc->coarse_phi_B,idx_V_B[i],i,one,INSERT_VALUES);CHKERRQ(ierr);
3010e269702eSStefano Zampini       if( pcbddc->prec_type || dbg_flag  ) {
30110c7d97c5SJed Brown         ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
30120c7d97c5SJed Brown         ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
30130c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_D,&array);CHKERRQ(ierr);
30143b03a366Sstefano_zampini         ierr = MatSetValues(pcbddc->coarse_phi_D,n_D,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
30150c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_D,&array);CHKERRQ(ierr);
30160c7d97c5SJed Brown       }
30170c7d97c5SJed Brown       /* subdomain contribution to coarse matrix */
30180c7d97c5SJed Brown       ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
3019da1bb401SStefano Zampini       for(j=0;j<n_vertices;j++) { coarse_submat_vals[i*pcbddc->local_primal_size+j] = array[j]; } /* WARNING -> column major ordering */
30200c7d97c5SJed Brown       ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
30213b03a366Sstefano_zampini       if(n_constraints) {
30220c7d97c5SJed Brown         ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
3023da1bb401SStefano Zampini         for(j=0;j<n_constraints;j++) { coarse_submat_vals[i*pcbddc->local_primal_size+j+n_vertices] = array[j]; } /* WARNING -> column major ordering */
30240c7d97c5SJed Brown         ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
30250c7d97c5SJed Brown       }
30260c7d97c5SJed Brown 
3027e269702eSStefano Zampini       if( dbg_flag ) {
30280c7d97c5SJed Brown         /* assemble subdomain vector on nodes */
3029d49ef151SStefano Zampini         ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr);
30300c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
30310c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
30320c7d97c5SJed Brown         for(j=0;j<n_R;j++) { array[idx_R_local[j]] = array2[j]; }
30333b03a366Sstefano_zampini         array[ vertices[i] ] = one;
30340c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
30350c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
30360c7d97c5SJed Brown         /* assemble subdomain vector of lagrange multipliers (i.e. primal nodes) */
3037d49ef151SStefano Zampini         ierr = VecSet(pcbddc->vec1_P,zero);CHKERRQ(ierr);
30380c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
30390c7d97c5SJed Brown         ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
30403b03a366Sstefano_zampini         for(j=0;j<n_vertices;j++) { array2[j]=array[j]; }
30410c7d97c5SJed Brown         ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
30423b03a366Sstefano_zampini         if(n_constraints) {
30430c7d97c5SJed Brown           ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
30443b03a366Sstefano_zampini           for(j=0;j<n_constraints;j++) { array2[j+n_vertices]=array[j]; }
30450c7d97c5SJed Brown           ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
30460c7d97c5SJed Brown         }
30470c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
30480c7d97c5SJed Brown         ierr = VecScale(pcbddc->vec1_P,m_one);CHKERRQ(ierr);
30490c7d97c5SJed Brown         /* check saddle point solution */
3050534831adSStefano Zampini         ierr = MatMult(pcbddc->local_mat,pcis->vec1_N,pcis->vec2_N);CHKERRQ(ierr);
30513b03a366Sstefano_zampini         ierr = MatMultTransposeAdd(pcbddc->ConstraintMatrix,pcbddc->vec1_P,pcis->vec2_N,pcis->vec2_N);CHKERRQ(ierr);
30523b03a366Sstefano_zampini         ierr = VecNorm(pcis->vec2_N,NORM_INFINITY,&coarsefunctions_errors[i]);CHKERRQ(ierr);
30533b03a366Sstefano_zampini         ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr);
30540c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
30553b03a366Sstefano_zampini         array[i]=array[i]+m_one;  /* shift by the identity matrix */
30560c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
30573b03a366Sstefano_zampini         ierr = VecNorm(pcbddc->vec1_P,NORM_INFINITY,&constraints_errors[i]);CHKERRQ(ierr);
30580c7d97c5SJed Brown       }
30590c7d97c5SJed Brown     }
30600c7d97c5SJed Brown 
30613b03a366Sstefano_zampini     for(i=0;i<n_constraints;i++){
3062d49ef151SStefano Zampini       ierr = VecSet(vec2_C,zero);CHKERRQ(ierr);
30630c7d97c5SJed Brown       ierr = VecSetValue(vec2_C,i,m_one,INSERT_VALUES);CHKERRQ(ierr);
30640c7d97c5SJed Brown       ierr = VecAssemblyBegin(vec2_C);CHKERRQ(ierr);
30650c7d97c5SJed Brown       ierr = VecAssemblyEnd(vec2_C);CHKERRQ(ierr);
30660c7d97c5SJed Brown       /* solution of saddle point problem */
30670c7d97c5SJed Brown       ierr = MatMult(M1,vec2_C,vec1_C);CHKERRQ(ierr);
30680c7d97c5SJed Brown       ierr = MatMult(pcbddc->local_auxmat2,vec1_C,pcbddc->vec1_R);CHKERRQ(ierr);
30690c7d97c5SJed Brown       ierr = VecScale(vec1_C,m_one);CHKERRQ(ierr);
30703b03a366Sstefano_zampini       if(n_vertices) { ierr = MatMult(A_VR,pcbddc->vec1_R,vec2_V);CHKERRQ(ierr); }
30710c7d97c5SJed Brown       /* Set values in coarse basis function and subdomain part of coarse_mat */
30720c7d97c5SJed Brown       /* coarse basis functions */
30733b03a366Sstefano_zampini       index=i+n_vertices;
30740c7d97c5SJed Brown       ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr);
30750c7d97c5SJed Brown       ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
30760c7d97c5SJed Brown       ierr = VecScatterEnd  (pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
30770c7d97c5SJed Brown       ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
307853cdbc3dSStefano Zampini       ierr = MatSetValues(pcbddc->coarse_phi_B,n_B,auxindices,1,&index,array,INSERT_VALUES);CHKERRQ(ierr);
30790c7d97c5SJed Brown       ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
3080e269702eSStefano Zampini       if( pcbddc->prec_type || dbg_flag ) {
30810c7d97c5SJed Brown         ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
30820c7d97c5SJed Brown         ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
30830c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_D,&array);CHKERRQ(ierr);
308453cdbc3dSStefano Zampini         ierr = MatSetValues(pcbddc->coarse_phi_D,n_D,auxindices,1,&index,array,INSERT_VALUES);CHKERRQ(ierr);
30850c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_D,&array);CHKERRQ(ierr);
30860c7d97c5SJed Brown       }
30870c7d97c5SJed Brown       /* subdomain contribution to coarse matrix */
30883b03a366Sstefano_zampini       if(n_vertices) {
30890c7d97c5SJed Brown         ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
3090da1bb401SStefano Zampini         for(j=0;j<n_vertices;j++) {coarse_submat_vals[index*pcbddc->local_primal_size+j]=array[j];} /* WARNING -> column major ordering */
30910c7d97c5SJed Brown         ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
30920c7d97c5SJed Brown       }
30930c7d97c5SJed Brown       ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
3094da1bb401SStefano Zampini       for(j=0;j<n_constraints;j++) {coarse_submat_vals[index*pcbddc->local_primal_size+j+n_vertices]=array[j];} /* WARNING -> column major ordering */
30950c7d97c5SJed Brown       ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
30960c7d97c5SJed Brown 
3097e269702eSStefano Zampini       if( dbg_flag ) {
30980c7d97c5SJed Brown         /* assemble subdomain vector on nodes */
309953cdbc3dSStefano Zampini         ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr);
31000c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
31010c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
31020c7d97c5SJed Brown         for(j=0;j<n_R;j++){ array[ idx_R_local[j] ] = array2[j]; }
31030c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
31040c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
31050c7d97c5SJed Brown         /* assemble subdomain vector of lagrange multipliers */
310653cdbc3dSStefano Zampini         ierr = VecSet(pcbddc->vec1_P,zero);CHKERRQ(ierr);
31070c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
31083b03a366Sstefano_zampini         if( n_vertices) {
31090c7d97c5SJed Brown           ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
31103b03a366Sstefano_zampini           for(j=0;j<n_vertices;j++) {array2[j]=-array[j];}
31110c7d97c5SJed Brown           ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
31120c7d97c5SJed Brown         }
31130c7d97c5SJed Brown         ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
31143b03a366Sstefano_zampini         for(j=0;j<n_constraints;j++) {array2[j+n_vertices]=-array[j];}
31150c7d97c5SJed Brown         ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
31160c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
31173972b0daSStefano Zampini         /* check saddle point solution */
3118534831adSStefano Zampini         ierr = MatMult(pcbddc->local_mat,pcis->vec1_N,pcis->vec2_N);CHKERRQ(ierr);
31193b03a366Sstefano_zampini         ierr = MatMultTransposeAdd(pcbddc->ConstraintMatrix,pcbddc->vec1_P,pcis->vec2_N,pcis->vec2_N);CHKERRQ(ierr);
312053cdbc3dSStefano Zampini         ierr = VecNorm(pcis->vec2_N,NORM_INFINITY,&coarsefunctions_errors[index]);CHKERRQ(ierr);
31213b03a366Sstefano_zampini         ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr);
31220c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
312353cdbc3dSStefano Zampini         array[index]=array[index]+m_one; /* shift by the identity matrix */
31240c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
312553cdbc3dSStefano Zampini         ierr = VecNorm(pcbddc->vec1_P,NORM_INFINITY,&constraints_errors[index]);CHKERRQ(ierr);
31260c7d97c5SJed Brown       }
31270c7d97c5SJed Brown     }
31280c7d97c5SJed Brown     ierr = MatAssemblyBegin(pcbddc->coarse_phi_B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
31290c7d97c5SJed Brown     ierr = MatAssemblyEnd  (pcbddc->coarse_phi_B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
3130e269702eSStefano Zampini     if( pcbddc->prec_type || dbg_flag ) {
31310c7d97c5SJed Brown       ierr = MatAssemblyBegin(pcbddc->coarse_phi_D,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
31320c7d97c5SJed Brown       ierr = MatAssemblyEnd  (pcbddc->coarse_phi_D,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
31330c7d97c5SJed Brown     }
31340c7d97c5SJed Brown     /* Checking coarse_sub_mat and coarse basis functions */
31350c7d97c5SJed Brown     /* It should be \Phi^{(j)^T} A^{(j)} \Phi^{(j)}=coarse_sub_mat */
31369d2fce94SStefano Zampini     if(dbg_flag) {
31370c7d97c5SJed Brown 
31380c7d97c5SJed Brown       Mat coarse_sub_mat;
31390c7d97c5SJed Brown       Mat TM1,TM2,TM3,TM4;
31400c7d97c5SJed Brown       Mat coarse_phi_D,coarse_phi_B,A_II,A_BB,A_IB,A_BI;
3141a0ba757dSStefano Zampini       const MatType checkmattype=MATSEQAIJ;
31420c7d97c5SJed Brown       PetscScalar      value;
31430c7d97c5SJed Brown 
3144c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_II,checkmattype,MAT_INITIAL_MATRIX,&A_II);CHKERRQ(ierr);
3145c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_IB,checkmattype,MAT_INITIAL_MATRIX,&A_IB);CHKERRQ(ierr);
3146c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_BI,checkmattype,MAT_INITIAL_MATRIX,&A_BI);CHKERRQ(ierr);
3147c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_BB,checkmattype,MAT_INITIAL_MATRIX,&A_BB);CHKERRQ(ierr);
3148c042a7c3SStefano Zampini       ierr = MatConvert(pcbddc->coarse_phi_D,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_D);CHKERRQ(ierr);
3149c042a7c3SStefano Zampini       ierr = MatConvert(pcbddc->coarse_phi_B,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_B);CHKERRQ(ierr);
3150c042a7c3SStefano Zampini       ierr = MatCreateSeqDense(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_size,coarse_submat_vals,&coarse_sub_mat);CHKERRQ(ierr);
3151c042a7c3SStefano Zampini       ierr = MatConvert(coarse_sub_mat,checkmattype,MAT_REUSE_MATRIX,&coarse_sub_mat);CHKERRQ(ierr);
31520c7d97c5SJed Brown 
3153da1bb401SStefano Zampini       /*PetscViewer view_out;
3154da1bb401SStefano Zampini       PetscMPIInt myrank;
3155da1bb401SStefano Zampini       char filename[256];
3156da1bb401SStefano Zampini       MPI_Comm_rank(((PetscObject)pc)->comm,&myrank);
3157da1bb401SStefano Zampini       sprintf(filename,"coarsesubmat_%04d.m",myrank);
3158da1bb401SStefano Zampini       ierr = PetscViewerASCIIOpen(PETSC_COMM_SELF,filename,&view_out);CHKERRQ(ierr);
3159da1bb401SStefano Zampini       ierr = PetscViewerSetFormat(view_out,PETSC_VIEWER_ASCII_MATLAB);CHKERRQ(ierr);
3160da1bb401SStefano Zampini       ierr = MatView(coarse_sub_mat,view_out);CHKERRQ(ierr);
3161da1bb401SStefano Zampini       ierr = PetscViewerDestroy(&view_out);CHKERRQ(ierr);*/
3162da1bb401SStefano Zampini 
31630c7d97c5SJed Brown       ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
31640c7d97c5SJed Brown       ierr = PetscViewerASCIIPrintf(viewer,"Check coarse sub mat and local basis functions\n");CHKERRQ(ierr);
31650c7d97c5SJed Brown       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
316653cdbc3dSStefano Zampini       ierr = MatPtAP(A_II,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&TM1);CHKERRQ(ierr);
316753cdbc3dSStefano Zampini       ierr = MatPtAP(A_BB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&TM2);CHKERRQ(ierr);
316853cdbc3dSStefano Zampini       ierr = MatMatMult(A_IB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr);
3169c042a7c3SStefano Zampini       ierr = MatTransposeMatMult(coarse_phi_D,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM3);CHKERRQ(ierr);
317053cdbc3dSStefano Zampini       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
317153cdbc3dSStefano Zampini       ierr = MatMatMult(A_BI,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr);
3172c042a7c3SStefano Zampini       ierr = MatTransposeMatMult(coarse_phi_B,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM4);CHKERRQ(ierr);
317353cdbc3dSStefano Zampini       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
317453cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,one,TM2,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
317553cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,one,TM3,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
317653cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,one,TM4,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
317753cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,m_one,coarse_sub_mat,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
317853cdbc3dSStefano Zampini       ierr = MatNorm(TM1,NORM_INFINITY,&value);CHKERRQ(ierr);
31790c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"----------------------------------\n");CHKERRQ(ierr);
31800c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d \n",PetscGlobalRank);CHKERRQ(ierr);
31810c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"matrix error = % 1.14e\n",value);CHKERRQ(ierr);
31820c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"coarse functions errors\n");CHKERRQ(ierr);
318353cdbc3dSStefano Zampini       for(i=0;i<pcbddc->local_primal_size;i++) { ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local %02d-th function error = % 1.14e\n",i,coarsefunctions_errors[i]);CHKERRQ(ierr); }
31840c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"constraints errors\n");CHKERRQ(ierr);
318553cdbc3dSStefano Zampini       for(i=0;i<pcbddc->local_primal_size;i++) { ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local %02d-th function error = % 1.14e\n",i,constraints_errors[i]);CHKERRQ(ierr); }
31860c7d97c5SJed Brown       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
318753cdbc3dSStefano Zampini       ierr = MatDestroy(&A_II);CHKERRQ(ierr);
318853cdbc3dSStefano Zampini       ierr = MatDestroy(&A_BB);CHKERRQ(ierr);
318953cdbc3dSStefano Zampini       ierr = MatDestroy(&A_IB);CHKERRQ(ierr);
319053cdbc3dSStefano Zampini       ierr = MatDestroy(&A_BI);CHKERRQ(ierr);
319153cdbc3dSStefano Zampini       ierr = MatDestroy(&TM1);CHKERRQ(ierr);
319253cdbc3dSStefano Zampini       ierr = MatDestroy(&TM2);CHKERRQ(ierr);
319353cdbc3dSStefano Zampini       ierr = MatDestroy(&TM3);CHKERRQ(ierr);
319453cdbc3dSStefano Zampini       ierr = MatDestroy(&TM4);CHKERRQ(ierr);
319553cdbc3dSStefano Zampini       ierr = MatDestroy(&coarse_phi_D);CHKERRQ(ierr);
319653cdbc3dSStefano Zampini       ierr = MatDestroy(&coarse_sub_mat);CHKERRQ(ierr);
319753cdbc3dSStefano Zampini       ierr = MatDestroy(&coarse_phi_B);CHKERRQ(ierr);
31980c7d97c5SJed Brown       ierr = PetscFree(coarsefunctions_errors);CHKERRQ(ierr);
31990c7d97c5SJed Brown       ierr = PetscFree(constraints_errors);CHKERRQ(ierr);
32000c7d97c5SJed Brown     }
32010c7d97c5SJed Brown 
32020c7d97c5SJed Brown     /* create coarse matrix and data structures for message passing associated with the actual choice of coarse problem type */
32030c7d97c5SJed Brown     ierr = PCBDDCSetupCoarseEnvironment(pc,coarse_submat_vals);CHKERRQ(ierr);
32040c7d97c5SJed Brown     /* free memory */
32050c7d97c5SJed Brown     ierr = PetscFree(coarse_submat_vals);CHKERRQ(ierr);
32060c7d97c5SJed Brown     ierr = PetscFree(auxindices);CHKERRQ(ierr);
32070c7d97c5SJed Brown     ierr = PetscFree(nnz);CHKERRQ(ierr);
32083b03a366Sstefano_zampini     if(n_vertices) {
32090c7d97c5SJed Brown       ierr = VecDestroy(&vec1_V);CHKERRQ(ierr);
32100c7d97c5SJed Brown       ierr = VecDestroy(&vec2_V);CHKERRQ(ierr);
32110c7d97c5SJed Brown       ierr = MatDestroy(&M2);CHKERRQ(ierr);
32120c7d97c5SJed Brown       ierr = MatDestroy(&A_RV);CHKERRQ(ierr);
32130c7d97c5SJed Brown       ierr = MatDestroy(&A_VR);CHKERRQ(ierr);
32140c7d97c5SJed Brown       ierr = MatDestroy(&A_VV);CHKERRQ(ierr);
32150c7d97c5SJed Brown     }
3216534831adSStefano Zampini     if(n_constraints) {
32170c7d97c5SJed Brown       ierr = VecDestroy(&vec1_C);CHKERRQ(ierr);
32180c7d97c5SJed Brown       ierr = VecDestroy(&vec2_C);CHKERRQ(ierr);
32190c7d97c5SJed Brown       ierr = MatDestroy(&M1);CHKERRQ(ierr);
32200c7d97c5SJed Brown       ierr = MatDestroy(&C_CR);CHKERRQ(ierr);
32210c7d97c5SJed Brown     }
32220c7d97c5SJed Brown   }
32230c7d97c5SJed Brown   /* free memory */
32243b03a366Sstefano_zampini   if(n_vertices) {
32250c7d97c5SJed Brown     ierr = PetscFree(idx_V_B);CHKERRQ(ierr);
32260c7d97c5SJed Brown     ierr = ISDestroy(&is_V_local);CHKERRQ(ierr);
32270c7d97c5SJed Brown   }
32280c7d97c5SJed Brown   ierr = ISDestroy(&is_R_local);CHKERRQ(ierr);
32290c7d97c5SJed Brown 
32300c7d97c5SJed Brown   PetscFunctionReturn(0);
32310c7d97c5SJed Brown }
32320c7d97c5SJed Brown 
32330c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
32340c7d97c5SJed Brown 
32350c7d97c5SJed Brown #undef __FUNCT__
32360c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetupCoarseEnvironment"
323753cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetupCoarseEnvironment(PC pc,PetscScalar* coarse_submat_vals)
32380c7d97c5SJed Brown {
32390c7d97c5SJed Brown 
32400c7d97c5SJed Brown 
32410c7d97c5SJed Brown   Mat_IS    *matis    = (Mat_IS*)pc->pmat->data;
32420c7d97c5SJed Brown   PC_BDDC   *pcbddc   = (PC_BDDC*)pc->data;
32430c7d97c5SJed Brown   PC_IS     *pcis     = (PC_IS*)pc->data;
32440c7d97c5SJed Brown   MPI_Comm  prec_comm = ((PetscObject)pc)->comm;
32450c7d97c5SJed Brown   MPI_Comm  coarse_comm;
32460c7d97c5SJed Brown 
32470c7d97c5SJed Brown   /* common to all choices */
32480c7d97c5SJed Brown   PetscScalar *temp_coarse_mat_vals;
32490c7d97c5SJed Brown   PetscScalar *ins_coarse_mat_vals;
32500c7d97c5SJed Brown   PetscInt    *ins_local_primal_indices;
32510c7d97c5SJed Brown   PetscMPIInt *localsizes2,*localdispl2;
32520c7d97c5SJed Brown   PetscMPIInt size_prec_comm;
32530c7d97c5SJed Brown   PetscMPIInt rank_prec_comm;
32540c7d97c5SJed Brown   PetscMPIInt active_rank=MPI_PROC_NULL;
32550c7d97c5SJed Brown   PetscMPIInt master_proc=0;
32560c7d97c5SJed Brown   PetscInt    ins_local_primal_size;
32570c7d97c5SJed Brown   /* specific to MULTILEVEL_BDDC */
32580c7d97c5SJed Brown   PetscMPIInt *ranks_recv;
32590c7d97c5SJed Brown   PetscMPIInt count_recv=0;
32600c7d97c5SJed Brown   PetscMPIInt rank_coarse_proc_send_to;
32610c7d97c5SJed Brown   PetscMPIInt coarse_color = MPI_UNDEFINED;
32620c7d97c5SJed Brown   ISLocalToGlobalMapping coarse_ISLG;
32630c7d97c5SJed Brown   /* some other variables */
32640c7d97c5SJed Brown   PetscErrorCode ierr;
32650c7d97c5SJed Brown   const MatType coarse_mat_type;
32660c7d97c5SJed Brown   const PCType  coarse_pc_type;
326753cdbc3dSStefano Zampini   const KSPType  coarse_ksp_type;
326853cdbc3dSStefano Zampini   PC pc_temp;
32690c7d97c5SJed Brown   PetscInt i,j,k,bs;
32703b03a366Sstefano_zampini   PetscInt max_it_coarse_ksp=1;  /* don't increase this value */
3271e269702eSStefano Zampini   /* verbose output viewer */
3272e269702eSStefano Zampini   PetscViewer viewer=pcbddc->dbg_viewer;
3273e269702eSStefano Zampini   PetscBool   dbg_flag=pcbddc->dbg_flag;
32740c7d97c5SJed Brown 
32750c7d97c5SJed Brown   PetscFunctionBegin;
32760c7d97c5SJed Brown 
32770c7d97c5SJed Brown   ins_local_primal_indices = 0;
32780c7d97c5SJed Brown   ins_coarse_mat_vals      = 0;
32790c7d97c5SJed Brown   localsizes2              = 0;
32800c7d97c5SJed Brown   localdispl2              = 0;
32810c7d97c5SJed Brown   temp_coarse_mat_vals     = 0;
32820c7d97c5SJed Brown   coarse_ISLG              = 0;
32830c7d97c5SJed Brown 
328453cdbc3dSStefano Zampini   ierr = MPI_Comm_size(prec_comm,&size_prec_comm);CHKERRQ(ierr);
328553cdbc3dSStefano Zampini   ierr = MPI_Comm_rank(prec_comm,&rank_prec_comm);CHKERRQ(ierr);
32860c7d97c5SJed Brown   ierr = MatGetBlockSize(matis->A,&bs);CHKERRQ(ierr);
32870c7d97c5SJed Brown 
3288beed3852SStefano Zampini   /* Assign global numbering to coarse dofs */
3289beed3852SStefano Zampini   {
3290a0ba757dSStefano Zampini     PetscScalar    one=1.,zero=0.;
3291beed3852SStefano Zampini     PetscScalar    *array;
3292beed3852SStefano Zampini     PetscMPIInt    *auxlocal_primal;
3293beed3852SStefano Zampini     PetscMPIInt    *auxglobal_primal;
3294beed3852SStefano Zampini     PetscMPIInt    *all_auxglobal_primal;
3295beed3852SStefano Zampini     PetscMPIInt    *all_auxglobal_primal_dummy;
3296beed3852SStefano Zampini     PetscMPIInt    mpi_local_primal_size = (PetscMPIInt)pcbddc->local_primal_size;
3297da1bb401SStefano Zampini     PetscInt       *row_cmat_indices;
32983b03a366Sstefano_zampini     PetscInt       size_of_constraint;
3299da1bb401SStefano Zampini     PetscScalar    coarsesum;
3300beed3852SStefano Zampini 
3301beed3852SStefano Zampini     /* Construct needed data structures for message passing */
3302beed3852SStefano Zampini     ierr = PetscMalloc(mpi_local_primal_size*sizeof(PetscMPIInt),&pcbddc->local_primal_indices);CHKERRQ(ierr);
3303beed3852SStefano Zampini     ierr = PetscMalloc(size_prec_comm*sizeof(PetscMPIInt),&pcbddc->local_primal_sizes);CHKERRQ(ierr);
3304beed3852SStefano Zampini     ierr = PetscMalloc(size_prec_comm*sizeof(PetscMPIInt),&pcbddc->local_primal_displacements);CHKERRQ(ierr);
3305beed3852SStefano Zampini     /* Gather local_primal_size information for all processes  */
33065619798eSStefano Zampini     ierr = MPI_Allgather(&mpi_local_primal_size,1,MPIU_INT,&pcbddc->local_primal_sizes[0],1,MPIU_INT,prec_comm);CHKERRQ(ierr);
3307beed3852SStefano Zampini     pcbddc->replicated_primal_size = 0;
3308beed3852SStefano Zampini     for (i=0; i<size_prec_comm; i++) {
3309beed3852SStefano Zampini       pcbddc->local_primal_displacements[i] = pcbddc->replicated_primal_size ;
3310beed3852SStefano Zampini       pcbddc->replicated_primal_size += pcbddc->local_primal_sizes[i];
3311beed3852SStefano Zampini     }
33125619798eSStefano Zampini     if(rank_prec_comm == 0) {
3313beed3852SStefano Zampini       /* allocate some auxiliary space */
3314beed3852SStefano Zampini       ierr = PetscMalloc(pcbddc->replicated_primal_size*sizeof(*all_auxglobal_primal),&all_auxglobal_primal);CHKERRQ(ierr);
3315beed3852SStefano Zampini       ierr = PetscMalloc(pcbddc->replicated_primal_size*sizeof(*all_auxglobal_primal_dummy),&all_auxglobal_primal_dummy);CHKERRQ(ierr);
3316beed3852SStefano Zampini     }
3317beed3852SStefano Zampini     ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscMPIInt),&auxlocal_primal);CHKERRQ(ierr);
3318beed3852SStefano Zampini     ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscMPIInt),&auxglobal_primal);CHKERRQ(ierr);
3319beed3852SStefano Zampini 
3320da1bb401SStefano Zampini     /* First let's count coarse dofs.
3321beed3852SStefano Zampini        This code fragment assumes that the number of local constraints per connected component
3322beed3852SStefano Zampini        is not greater than the number of nodes defined for the connected component
3323beed3852SStefano Zampini        (otherwise we will surely have linear dependence between constraints and thus a singular coarse problem) */
33243b03a366Sstefano_zampini     /* auxlocal_primal      : primal indices in local nodes numbering (internal and interface) with complete queue sorted by global ordering */
3325beed3852SStefano Zampini     ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr);
3326beed3852SStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3327da1bb401SStefano Zampini     for(i=0;i<pcbddc->local_primal_size;i++) {
3328da1bb401SStefano Zampini       ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
33293b03a366Sstefano_zampini       for (j=0; j<size_of_constraint; j++) {
33303b03a366Sstefano_zampini         k = row_cmat_indices[j];
3331beed3852SStefano Zampini         if( array[k] == zero ) {
3332beed3852SStefano Zampini           array[k] = one;
3333da1bb401SStefano Zampini           auxlocal_primal[i] = k;
3334beed3852SStefano Zampini           break;
3335beed3852SStefano Zampini         }
3336beed3852SStefano Zampini       }
3337da1bb401SStefano Zampini       ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
3338beed3852SStefano Zampini     }
3339beed3852SStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3340da1bb401SStefano Zampini     ierr = VecSet(pcis->vec1_global,zero);CHKERRQ(ierr);
3341da1bb401SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3342da1bb401SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3343da1bb401SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3344da1bb401SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3345da1bb401SStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3346da1bb401SStefano Zampini     for(i=0;i<pcis->n;i++) { if( array[i] > zero) array[i] = one/array[i]; }
3347da1bb401SStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3348da1bb401SStefano Zampini     ierr = VecSet(pcis->vec1_global,zero);CHKERRQ(ierr);
3349da1bb401SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3350da1bb401SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3351da1bb401SStefano Zampini     ierr = VecSum(pcis->vec1_global,&coarsesum);CHKERRQ(ierr);
3352da1bb401SStefano Zampini     pcbddc->coarse_size = (PetscInt) coarsesum;
3353a0ba757dSStefano Zampini 
3354beed3852SStefano Zampini     /* Now assign them a global numbering */
3355beed3852SStefano Zampini     /* auxglobal_primal contains indices in global nodes numbering (internal and interface) */
3356beed3852SStefano Zampini     ierr = ISLocalToGlobalMappingApply(matis->mapping,pcbddc->local_primal_size,auxlocal_primal,auxglobal_primal);CHKERRQ(ierr);
3357beed3852SStefano Zampini     /* all_auxglobal_primal contains all primal nodes indices in global nodes numbering (internal and interface) */
3358beed3852SStefano Zampini     ierr = MPI_Gatherv(&auxglobal_primal[0],pcbddc->local_primal_size,MPIU_INT,&all_auxglobal_primal[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,0,prec_comm);CHKERRQ(ierr);
3359beed3852SStefano Zampini 
3360beed3852SStefano Zampini     /* After this block all_auxglobal_primal should contain one copy of each primal node's indices in global nodes numbering */
3361beed3852SStefano Zampini     /* It implements a function similar to PetscSortRemoveDupsInt */
3362beed3852SStefano Zampini     if(rank_prec_comm==0) {
3363beed3852SStefano Zampini       /* dummy argument since PetscSortMPIInt doesn't exist! */
3364beed3852SStefano Zampini       ierr = PetscSortMPIIntWithArray(pcbddc->replicated_primal_size,all_auxglobal_primal,all_auxglobal_primal_dummy);CHKERRQ(ierr);
3365beed3852SStefano Zampini       k=1;
3366beed3852SStefano Zampini       j=all_auxglobal_primal[0];  /* first dof in global numbering */
3367beed3852SStefano Zampini       for(i=1;i< pcbddc->replicated_primal_size ;i++) {
3368beed3852SStefano Zampini         if(j != all_auxglobal_primal[i] ) {
3369beed3852SStefano Zampini           all_auxglobal_primal[k]=all_auxglobal_primal[i];
3370beed3852SStefano Zampini           k++;
3371beed3852SStefano Zampini           j=all_auxglobal_primal[i];
3372beed3852SStefano Zampini         }
3373beed3852SStefano Zampini       }
3374beed3852SStefano Zampini     } else {
3375beed3852SStefano Zampini       ierr = PetscMalloc(pcbddc->coarse_size*sizeof(PetscMPIInt),&all_auxglobal_primal);CHKERRQ(ierr);
3376beed3852SStefano Zampini     }
33775619798eSStefano Zampini     /* We only need to broadcast the indices from 0 to pcbddc->coarse_size. Remaining elements of array all_auxglobal_primal are garbage. */
3378beed3852SStefano Zampini     ierr = MPI_Bcast(all_auxglobal_primal,pcbddc->coarse_size,MPIU_INT,0,prec_comm);CHKERRQ(ierr);
3379beed3852SStefano Zampini 
3380beed3852SStefano Zampini     /* Now get global coarse numbering of local primal nodes */
3381beed3852SStefano Zampini     for(i=0;i<pcbddc->local_primal_size;i++) {
3382beed3852SStefano Zampini       k=0;
3383beed3852SStefano Zampini       while( all_auxglobal_primal[k] != auxglobal_primal[i] ) { k++;}
3384beed3852SStefano Zampini       pcbddc->local_primal_indices[i]=k;
3385beed3852SStefano Zampini     }
3386e269702eSStefano Zampini     if(dbg_flag) {
3387e269702eSStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
3388da1bb401SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Size of coarse problem %d\n",pcbddc->coarse_size);CHKERRQ(ierr);
3389e269702eSStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
3390e269702eSStefano Zampini     }
3391beed3852SStefano Zampini     /* free allocated memory */
3392beed3852SStefano Zampini     ierr = PetscFree(auxlocal_primal);CHKERRQ(ierr);
3393beed3852SStefano Zampini     ierr = PetscFree(auxglobal_primal);CHKERRQ(ierr);
3394beed3852SStefano Zampini     ierr = PetscFree(all_auxglobal_primal);CHKERRQ(ierr);
3395e269702eSStefano Zampini     if(rank_prec_comm == 0) {
3396beed3852SStefano Zampini       ierr = PetscFree(all_auxglobal_primal_dummy);CHKERRQ(ierr);
3397beed3852SStefano Zampini     }
3398e269702eSStefano Zampini   }
3399beed3852SStefano Zampini 
34000c7d97c5SJed Brown   /* adapt coarse problem type */
34010c7d97c5SJed Brown   if(pcbddc->coarse_problem_type == MULTILEVEL_BDDC && pcbddc->active_procs < MIN_PROCS_FOR_BDDC )
34020c7d97c5SJed Brown     pcbddc->coarse_problem_type = PARALLEL_BDDC;
34030c7d97c5SJed Brown 
34040c7d97c5SJed Brown   switch(pcbddc->coarse_problem_type){
34050c7d97c5SJed Brown 
3406da1bb401SStefano Zampini     case(MULTILEVEL_BDDC):   /* we define a coarse mesh where subdomains are elements */
34070c7d97c5SJed Brown     {
34080c7d97c5SJed Brown       /* we need additional variables */
34090c7d97c5SJed Brown       MetisInt   n_subdomains,n_parts,objval,ncon,faces_nvtxs;
34100c7d97c5SJed Brown       MetisInt   *metis_coarse_subdivision;
34110c7d97c5SJed Brown       MetisInt   options[METIS_NOPTIONS];
34120c7d97c5SJed Brown       PetscMPIInt size_coarse_comm,rank_coarse_comm;
34130c7d97c5SJed Brown       PetscMPIInt procs_jumps_coarse_comm;
34140c7d97c5SJed Brown       PetscMPIInt *coarse_subdivision;
34150c7d97c5SJed Brown       PetscMPIInt *total_count_recv;
34160c7d97c5SJed Brown       PetscMPIInt *total_ranks_recv;
34170c7d97c5SJed Brown       PetscMPIInt *displacements_recv;
34180c7d97c5SJed Brown       PetscMPIInt *my_faces_connectivity;
34190c7d97c5SJed Brown       PetscMPIInt *petsc_faces_adjncy;
34200c7d97c5SJed Brown       MetisInt    *faces_adjncy;
34210c7d97c5SJed Brown       MetisInt    *faces_xadj;
34220c7d97c5SJed Brown       PetscMPIInt *number_of_faces;
34230c7d97c5SJed Brown       PetscMPIInt *faces_displacements;
34240c7d97c5SJed Brown       PetscInt    *array_int;
34250c7d97c5SJed Brown       PetscMPIInt my_faces=0;
34260c7d97c5SJed Brown       PetscMPIInt total_faces=0;
34273828260eSStefano Zampini       PetscInt    ranks_stretching_ratio;
34280c7d97c5SJed Brown 
34290c7d97c5SJed Brown       /* define some quantities */
34300c7d97c5SJed Brown       pcbddc->coarse_communications_type = SCATTERS_BDDC;
34310c7d97c5SJed Brown       coarse_mat_type = MATIS;
34320c7d97c5SJed Brown       coarse_pc_type  = PCBDDC;
34336c9de887SHong Zhang       coarse_ksp_type  = KSPCHEBYSHEV;
34340c7d97c5SJed Brown 
34350c7d97c5SJed Brown       /* details of coarse decomposition */
34360c7d97c5SJed Brown       n_subdomains = pcbddc->active_procs;
34370c7d97c5SJed Brown       n_parts      = n_subdomains/pcbddc->coarsening_ratio;
34383828260eSStefano Zampini       ranks_stretching_ratio = size_prec_comm/pcbddc->active_procs;
34393828260eSStefano Zampini       procs_jumps_coarse_comm = pcbddc->coarsening_ratio*ranks_stretching_ratio;
34403828260eSStefano Zampini 
3441da1bb401SStefano Zampini       /*printf("Coarse algorithm details: \n");
3442da1bb401SStefano Zampini       printf("n_subdomains %d, n_parts %d\nstretch %d,jumps %d,coarse_ratio %d\nlevel should be log_%d(%d)\n",n_subdomains,n_parts,ranks_stretching_ratio,procs_jumps_coarse_comm,pcbddc->coarsening_ratio,pcbddc->coarsening_ratio,(ranks_stretching_ratio/pcbddc->coarsening_ratio+1));*/
34430c7d97c5SJed Brown 
34440c7d97c5SJed Brown       /* build CSR graph of subdomains' connectivity through faces */
34450c7d97c5SJed Brown       ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&array_int);CHKERRQ(ierr);
34463828260eSStefano Zampini       ierr = PetscMemzero(array_int,pcis->n*sizeof(PetscInt));CHKERRQ(ierr);
34470c7d97c5SJed Brown       for(i=1;i<pcis->n_neigh;i++){/* i=1 so I don't count myself -> faces nodes counts to 1 */
34480c7d97c5SJed Brown         for(j=0;j<pcis->n_shared[i];j++){
34490c7d97c5SJed Brown           array_int[ pcis->shared[i][j] ]+=1;
34500c7d97c5SJed Brown         }
34510c7d97c5SJed Brown       }
34520c7d97c5SJed Brown       for(i=1;i<pcis->n_neigh;i++){
34530c7d97c5SJed Brown         for(j=0;j<pcis->n_shared[i];j++){
34540c7d97c5SJed Brown           if(array_int[ pcis->shared[i][j] ] == 1 ){
34550c7d97c5SJed Brown             my_faces++;
34560c7d97c5SJed Brown             break;
34570c7d97c5SJed Brown           }
34580c7d97c5SJed Brown         }
34590c7d97c5SJed Brown       }
34600c7d97c5SJed Brown 
346153cdbc3dSStefano Zampini       ierr = MPI_Reduce(&my_faces,&total_faces,1,MPIU_INT,MPI_SUM,master_proc,prec_comm);CHKERRQ(ierr);
34620c7d97c5SJed Brown       ierr = PetscMalloc (my_faces*sizeof(PetscInt),&my_faces_connectivity);CHKERRQ(ierr);
34630c7d97c5SJed Brown       my_faces=0;
34640c7d97c5SJed Brown       for(i=1;i<pcis->n_neigh;i++){
34650c7d97c5SJed Brown         for(j=0;j<pcis->n_shared[i];j++){
34660c7d97c5SJed Brown           if(array_int[ pcis->shared[i][j] ] == 1 ){
34670c7d97c5SJed Brown             my_faces_connectivity[my_faces]=pcis->neigh[i];
34680c7d97c5SJed Brown             my_faces++;
34690c7d97c5SJed Brown             break;
34700c7d97c5SJed Brown           }
34710c7d97c5SJed Brown         }
34720c7d97c5SJed Brown       }
34730c7d97c5SJed Brown       if(rank_prec_comm == master_proc) {
34740c7d97c5SJed Brown         ierr = PetscMalloc (total_faces*sizeof(PetscMPIInt),&petsc_faces_adjncy);CHKERRQ(ierr);
34750c7d97c5SJed Brown         ierr = PetscMalloc (size_prec_comm*sizeof(PetscMPIInt),&number_of_faces);CHKERRQ(ierr);
34760c7d97c5SJed Brown         ierr = PetscMalloc (total_faces*sizeof(MetisInt),&faces_adjncy);CHKERRQ(ierr);
34770c7d97c5SJed Brown         ierr = PetscMalloc ((n_subdomains+1)*sizeof(MetisInt),&faces_xadj);CHKERRQ(ierr);
34780c7d97c5SJed Brown         ierr = PetscMalloc ((size_prec_comm+1)*sizeof(PetscMPIInt),&faces_displacements);CHKERRQ(ierr);
34790c7d97c5SJed Brown       }
348053cdbc3dSStefano Zampini       ierr = MPI_Gather(&my_faces,1,MPIU_INT,&number_of_faces[0],1,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
34810c7d97c5SJed Brown       if(rank_prec_comm == master_proc) {
34820c7d97c5SJed Brown         faces_xadj[0]=0;
34830c7d97c5SJed Brown         faces_displacements[0]=0;
34840c7d97c5SJed Brown         j=0;
34850c7d97c5SJed Brown         for(i=1;i<size_prec_comm+1;i++) {
34860c7d97c5SJed Brown           faces_displacements[i]=faces_displacements[i-1]+number_of_faces[i-1];
34870c7d97c5SJed Brown           if(number_of_faces[i-1]) {
34880c7d97c5SJed Brown             j++;
34890c7d97c5SJed Brown             faces_xadj[j]=faces_xadj[j-1]+number_of_faces[i-1];
34900c7d97c5SJed Brown           }
34910c7d97c5SJed Brown         }
3492da1bb401SStefano Zampini         /*printf("The J I count is %d and should be %d\n",j,n_subdomains);
3493da1bb401SStefano Zampini         printf("Total faces seem %d and should be %d\n",faces_xadj[j],total_faces);*/
34940c7d97c5SJed Brown       }
349553cdbc3dSStefano Zampini       ierr = MPI_Gatherv(&my_faces_connectivity[0],my_faces,MPIU_INT,&petsc_faces_adjncy[0],number_of_faces,faces_displacements,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
34960c7d97c5SJed Brown       ierr = PetscFree(my_faces_connectivity);CHKERRQ(ierr);
34970c7d97c5SJed Brown       ierr = PetscFree(array_int);CHKERRQ(ierr);
34980c7d97c5SJed Brown       if(rank_prec_comm == master_proc) {
34993828260eSStefano Zampini         for(i=0;i<total_faces;i++) faces_adjncy[i]=(MetisInt)(petsc_faces_adjncy[i]/ranks_stretching_ratio); /* cast to MetisInt */
3500da1bb401SStefano Zampini         /*printf("This is the face connectivity (actual ranks)\n");
35010c7d97c5SJed Brown         for(i=0;i<n_subdomains;i++){
35020c7d97c5SJed Brown           printf("proc %d is connected with \n",i);
35030c7d97c5SJed Brown           for(j=faces_xadj[i];j<faces_xadj[i+1];j++)
35040c7d97c5SJed Brown             printf("%d ",faces_adjncy[j]);
35050c7d97c5SJed Brown           printf("\n");
3506da1bb401SStefano Zampini         }*/
35070c7d97c5SJed Brown         ierr = PetscFree(faces_displacements);CHKERRQ(ierr);
35080c7d97c5SJed Brown         ierr = PetscFree(number_of_faces);CHKERRQ(ierr);
35090c7d97c5SJed Brown         ierr = PetscFree(petsc_faces_adjncy);CHKERRQ(ierr);
35100c7d97c5SJed Brown       }
35110c7d97c5SJed Brown 
35120c7d97c5SJed Brown       if( rank_prec_comm == master_proc ) {
35130c7d97c5SJed Brown 
35143828260eSStefano Zampini         PetscInt heuristic_for_metis=3;
35153828260eSStefano Zampini 
35160c7d97c5SJed Brown         ncon=1;
35170c7d97c5SJed Brown         faces_nvtxs=n_subdomains;
35180c7d97c5SJed Brown         /* partition graph induced by face connectivity */
35190c7d97c5SJed Brown         ierr = PetscMalloc (n_subdomains*sizeof(MetisInt),&metis_coarse_subdivision);CHKERRQ(ierr);
35200c7d97c5SJed Brown         ierr = METIS_SetDefaultOptions(options);
35210c7d97c5SJed Brown         /* we need a contiguous partition of the coarse mesh */
35220c7d97c5SJed Brown         options[METIS_OPTION_CONTIG]=1;
35230c7d97c5SJed Brown         options[METIS_OPTION_DBGLVL]=1;
35240c7d97c5SJed Brown         options[METIS_OPTION_NITER]=30;
35253828260eSStefano Zampini         if(n_subdomains>n_parts*heuristic_for_metis) {
35263828260eSStefano Zampini           options[METIS_OPTION_IPTYPE]=METIS_IPTYPE_EDGE;
35273828260eSStefano Zampini           options[METIS_OPTION_OBJTYPE]=METIS_OBJTYPE_CUT;
35280c7d97c5SJed Brown           ierr = METIS_PartGraphKway(&faces_nvtxs,&ncon,faces_xadj,faces_adjncy,NULL,NULL,NULL,&n_parts,NULL,NULL,options,&objval,metis_coarse_subdivision);
35293828260eSStefano Zampini         } else {
35303828260eSStefano Zampini           ierr = METIS_PartGraphRecursive(&faces_nvtxs,&ncon,faces_xadj,faces_adjncy,NULL,NULL,NULL,&n_parts,NULL,NULL,options,&objval,metis_coarse_subdivision);
35313828260eSStefano Zampini         }
35320c7d97c5SJed Brown         if(ierr != METIS_OK) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in METIS_PartGraphKway (metis error code %D) called from PCBDDCSetupCoarseEnvironment\n",ierr);
35330c7d97c5SJed Brown         ierr = PetscFree(faces_xadj);CHKERRQ(ierr);
35340c7d97c5SJed Brown         ierr = PetscFree(faces_adjncy);CHKERRQ(ierr);
35350c7d97c5SJed Brown         coarse_subdivision = (PetscMPIInt*)calloc(size_prec_comm,sizeof(PetscMPIInt)); /* calloc for contiguous memory since we need to scatter these values later */
35360c7d97c5SJed Brown         /* copy/cast values avoiding possible type conflicts between PETSc, MPI and METIS */
35373828260eSStefano Zampini         for(i=0;i<size_prec_comm;i++) coarse_subdivision[i]=MPI_PROC_NULL;
35383828260eSStefano Zampini         for(i=0;i<n_subdomains;i++)   coarse_subdivision[ranks_stretching_ratio*i]=(PetscInt)(metis_coarse_subdivision[i]);
35390c7d97c5SJed Brown         ierr = PetscFree(metis_coarse_subdivision);CHKERRQ(ierr);
35400c7d97c5SJed Brown       }
35410c7d97c5SJed Brown 
35420c7d97c5SJed Brown       /* Create new communicator for coarse problem splitting the old one */
35430c7d97c5SJed Brown       if( !(rank_prec_comm%procs_jumps_coarse_comm) && rank_prec_comm < procs_jumps_coarse_comm*n_parts ){
3544da1bb401SStefano Zampini         coarse_color=0;              /* for communicator splitting */
3545da1bb401SStefano Zampini         active_rank=rank_prec_comm;  /* for insertion of matrix values */
35460c7d97c5SJed Brown       }
3547da1bb401SStefano Zampini       /* procs with coarse_color = MPI_UNDEFINED will have coarse_comm = MPI_COMM_NULL (from mpi standards)
3548da1bb401SStefano Zampini          key = rank_prec_comm -> keep same ordering of ranks from the old to the new communicator */
354953cdbc3dSStefano Zampini       ierr = MPI_Comm_split(prec_comm,coarse_color,rank_prec_comm,&coarse_comm);CHKERRQ(ierr);
35500c7d97c5SJed Brown 
35510c7d97c5SJed Brown       if( coarse_color == 0 ) {
355253cdbc3dSStefano Zampini         ierr = MPI_Comm_size(coarse_comm,&size_coarse_comm);CHKERRQ(ierr);
355353cdbc3dSStefano Zampini         ierr = MPI_Comm_rank(coarse_comm,&rank_coarse_comm);CHKERRQ(ierr);
3554da1bb401SStefano Zampini         /*printf("Details of coarse comm\n");
35553828260eSStefano Zampini         printf("size = %d, myrank = %d\n",size_coarse_comm,rank_coarse_comm);
3556da1bb401SStefano Zampini         printf("jumps = %d, coarse_color = %d, n_parts = %d\n",procs_jumps_coarse_comm,coarse_color,n_parts);*/
35570c7d97c5SJed Brown       } else {
35580c7d97c5SJed Brown         rank_coarse_comm = MPI_PROC_NULL;
35590c7d97c5SJed Brown       }
35600c7d97c5SJed Brown 
35610c7d97c5SJed Brown       /* master proc takes care of arranging and distributing coarse information */
35620c7d97c5SJed Brown       if(rank_coarse_comm == master_proc) {
35630c7d97c5SJed Brown         ierr = PetscMalloc (size_coarse_comm*sizeof(PetscMPIInt),&displacements_recv);CHKERRQ(ierr);
3564da1bb401SStefano Zampini         /*ierr = PetscMalloc (size_coarse_comm*sizeof(PetscMPIInt),&total_count_recv);CHKERRQ(ierr);
3565da1bb401SStefano Zampini           ierr = PetscMalloc (n_subdomains*sizeof(PetscMPIInt),&total_ranks_recv);CHKERRQ(ierr);*/
35660c7d97c5SJed Brown         total_count_recv = (PetscMPIInt*)calloc(size_prec_comm,sizeof(PetscMPIInt));
35670c7d97c5SJed Brown         total_ranks_recv = (PetscMPIInt*)calloc(n_subdomains,sizeof(PetscMPIInt));
35680c7d97c5SJed Brown         /* some initializations */
35690c7d97c5SJed Brown         displacements_recv[0]=0;
3570da1bb401SStefano Zampini         /* PetscMemzero(total_count_recv,size_coarse_comm*sizeof(PetscMPIInt)); not needed -> calloc initializes to zero */
35710c7d97c5SJed Brown         /* count from how many processes the j-th process of the coarse decomposition will receive data */
35720c7d97c5SJed Brown         for(j=0;j<size_coarse_comm;j++)
35733828260eSStefano Zampini           for(i=0;i<size_prec_comm;i++)
35740c7d97c5SJed Brown             if(coarse_subdivision[i]==j)
35750c7d97c5SJed Brown               total_count_recv[j]++;
35760c7d97c5SJed Brown         /* displacements needed for scatterv of total_ranks_recv */
35770c7d97c5SJed Brown         for(i=1;i<size_coarse_comm;i++) displacements_recv[i]=displacements_recv[i-1]+total_count_recv[i-1];
35780c7d97c5SJed Brown         /* Now fill properly total_ranks_recv -> each coarse process will receive the ranks (in prec_comm communicator) of its friend (sending) processes */
35790c7d97c5SJed Brown         ierr = PetscMemzero(total_count_recv,size_coarse_comm*sizeof(PetscMPIInt));CHKERRQ(ierr);
35800c7d97c5SJed Brown         for(j=0;j<size_coarse_comm;j++) {
35813828260eSStefano Zampini           for(i=0;i<size_prec_comm;i++) {
35820c7d97c5SJed Brown             if(coarse_subdivision[i]==j) {
35830c7d97c5SJed Brown               total_ranks_recv[displacements_recv[j]+total_count_recv[j]]=i;
35843828260eSStefano Zampini               total_count_recv[j]+=1;
35850c7d97c5SJed Brown             }
35860c7d97c5SJed Brown           }
35870c7d97c5SJed Brown         }
3588da1bb401SStefano Zampini         /*for(j=0;j<size_coarse_comm;j++) {
35893828260eSStefano Zampini           printf("process %d in new rank will receive from %d processes (original ranks follows)\n",j,total_count_recv[j]);
35903828260eSStefano Zampini           for(i=0;i<total_count_recv[j];i++) {
35913828260eSStefano Zampini             printf("%d ",total_ranks_recv[displacements_recv[j]+i]);
35923828260eSStefano Zampini           }
35933828260eSStefano Zampini           printf("\n");
3594da1bb401SStefano Zampini         }*/
35950c7d97c5SJed Brown 
35960c7d97c5SJed Brown         /* identify new decomposition in terms of ranks in the old communicator */
35973828260eSStefano Zampini         for(i=0;i<n_subdomains;i++) coarse_subdivision[ranks_stretching_ratio*i]=coarse_subdivision[ranks_stretching_ratio*i]*procs_jumps_coarse_comm;
3598da1bb401SStefano Zampini         /*printf("coarse_subdivision in old end new ranks\n");
35990c7d97c5SJed Brown         for(i=0;i<size_prec_comm;i++)
36003828260eSStefano Zampini           if(coarse_subdivision[i]!=MPI_PROC_NULL) {
36013828260eSStefano Zampini             printf("%d=(%d %d), ",i,coarse_subdivision[i],coarse_subdivision[i]/procs_jumps_coarse_comm);
36023828260eSStefano Zampini           } else {
36033828260eSStefano Zampini             printf("%d=(%d %d), ",i,coarse_subdivision[i],coarse_subdivision[i]);
36043828260eSStefano Zampini           }
3605da1bb401SStefano Zampini         printf("\n");*/
36060c7d97c5SJed Brown       }
36070c7d97c5SJed Brown 
36080c7d97c5SJed Brown       /* Scatter new decomposition for send details */
360953cdbc3dSStefano Zampini       ierr = MPI_Scatter(&coarse_subdivision[0],1,MPIU_INT,&rank_coarse_proc_send_to,1,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
36100c7d97c5SJed Brown       /* Scatter receiving details to members of coarse decomposition */
36110c7d97c5SJed Brown       if( coarse_color == 0) {
361253cdbc3dSStefano Zampini         ierr = MPI_Scatter(&total_count_recv[0],1,MPIU_INT,&count_recv,1,MPIU_INT,master_proc,coarse_comm);CHKERRQ(ierr);
36130c7d97c5SJed Brown         ierr = PetscMalloc (count_recv*sizeof(PetscMPIInt),&ranks_recv);CHKERRQ(ierr);
361453cdbc3dSStefano Zampini         ierr = MPI_Scatterv(&total_ranks_recv[0],total_count_recv,displacements_recv,MPIU_INT,&ranks_recv[0],count_recv,MPIU_INT,master_proc,coarse_comm);CHKERRQ(ierr);
36150c7d97c5SJed Brown       }
36160c7d97c5SJed Brown 
3617da1bb401SStefano Zampini       /*printf("I will send my matrix data to proc  %d\n",rank_coarse_proc_send_to);
3618da1bb401SStefano Zampini       if(coarse_color == 0) {
3619da1bb401SStefano Zampini         printf("I will receive some matrix data from %d processes (ranks follows)\n",count_recv);
3620da1bb401SStefano Zampini         for(i=0;i<count_recv;i++)
3621da1bb401SStefano Zampini           printf("%d ",ranks_recv[i]);
3622da1bb401SStefano Zampini         printf("\n");
3623da1bb401SStefano Zampini       }*/
36240c7d97c5SJed Brown 
36250c7d97c5SJed Brown       if(rank_prec_comm == master_proc) {
3626da1bb401SStefano Zampini         /*ierr = PetscFree(coarse_subdivision);CHKERRQ(ierr);
3627da1bb401SStefano Zampini         ierr = PetscFree(total_count_recv);CHKERRQ(ierr);
3628da1bb401SStefano Zampini         ierr = PetscFree(total_ranks_recv);CHKERRQ(ierr);*/
36290c7d97c5SJed Brown         free(coarse_subdivision);
36300c7d97c5SJed Brown         free(total_count_recv);
36310c7d97c5SJed Brown         free(total_ranks_recv);
36320c7d97c5SJed Brown         ierr = PetscFree(displacements_recv);CHKERRQ(ierr);
36330c7d97c5SJed Brown       }
36340c7d97c5SJed Brown       break;
36350c7d97c5SJed Brown     }
36360c7d97c5SJed Brown 
36370c7d97c5SJed Brown     case(REPLICATED_BDDC):
36380c7d97c5SJed Brown 
36390c7d97c5SJed Brown       pcbddc->coarse_communications_type = GATHERS_BDDC;
36400c7d97c5SJed Brown       coarse_mat_type = MATSEQAIJ;
36410c7d97c5SJed Brown       coarse_pc_type  = PCLU;
364253cdbc3dSStefano Zampini       coarse_ksp_type  = KSPPREONLY;
36430c7d97c5SJed Brown       coarse_comm = PETSC_COMM_SELF;
36440c7d97c5SJed Brown       active_rank = rank_prec_comm;
36450c7d97c5SJed Brown       break;
36460c7d97c5SJed Brown 
36470c7d97c5SJed Brown     case(PARALLEL_BDDC):
36480c7d97c5SJed Brown 
36490c7d97c5SJed Brown       pcbddc->coarse_communications_type = SCATTERS_BDDC;
36500c7d97c5SJed Brown       coarse_mat_type = MATMPIAIJ;
36510c7d97c5SJed Brown       coarse_pc_type  = PCREDUNDANT;
365253cdbc3dSStefano Zampini       coarse_ksp_type  = KSPPREONLY;
36530c7d97c5SJed Brown       coarse_comm = prec_comm;
36540c7d97c5SJed Brown       active_rank = rank_prec_comm;
36550c7d97c5SJed Brown       break;
36560c7d97c5SJed Brown 
36570c7d97c5SJed Brown     case(SEQUENTIAL_BDDC):
36580c7d97c5SJed Brown       pcbddc->coarse_communications_type = GATHERS_BDDC;
36590c7d97c5SJed Brown       coarse_mat_type = MATSEQAIJ;
36600c7d97c5SJed Brown       coarse_pc_type = PCLU;
366153cdbc3dSStefano Zampini       coarse_ksp_type  = KSPPREONLY;
36620c7d97c5SJed Brown       coarse_comm = PETSC_COMM_SELF;
36630c7d97c5SJed Brown       active_rank = master_proc;
36640c7d97c5SJed Brown       break;
36650c7d97c5SJed Brown   }
36660c7d97c5SJed Brown 
36670c7d97c5SJed Brown   switch(pcbddc->coarse_communications_type){
36680c7d97c5SJed Brown 
36690c7d97c5SJed Brown     case(SCATTERS_BDDC):
36700c7d97c5SJed Brown       {
36710c7d97c5SJed Brown         if(pcbddc->coarse_problem_type==MULTILEVEL_BDDC) {
36720c7d97c5SJed Brown 
36730c7d97c5SJed Brown           PetscMPIInt send_size;
36740c7d97c5SJed Brown           PetscInt    *aux_ins_indices;
36750c7d97c5SJed Brown           PetscInt    ii,jj;
36760c7d97c5SJed Brown           MPI_Request *requests;
36770c7d97c5SJed Brown 
36780c7d97c5SJed Brown           /* allocate auxiliary space */
36795619798eSStefano Zampini           ierr = PetscMalloc (pcbddc->replicated_primal_size*sizeof(PetscMPIInt),&pcbddc->replicated_local_primal_indices);CHKERRQ(ierr);
36805619798eSStefano Zampini           ierr = MPI_Allgatherv(&pcbddc->local_primal_indices[0],pcbddc->local_primal_size,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,prec_comm);CHKERRQ(ierr);
36810c7d97c5SJed Brown           ierr = PetscMalloc ( pcbddc->coarse_size*sizeof(PetscInt),&aux_ins_indices);CHKERRQ(ierr);
36820c7d97c5SJed Brown           ierr = PetscMemzero(aux_ins_indices,pcbddc->coarse_size*sizeof(PetscInt));CHKERRQ(ierr);
36830c7d97c5SJed Brown           /* allocate storage for message passing */
36840c7d97c5SJed Brown           ierr = PetscMalloc ( (count_recv+1)*sizeof(MPI_Request),&requests);CHKERRQ(ierr);
36850c7d97c5SJed Brown           for(i=0;i<count_recv+1;i++) requests[i]=MPI_REQUEST_NULL;
36860c7d97c5SJed Brown           ierr = PetscMalloc ( count_recv*sizeof(PetscMPIInt),&localsizes2);CHKERRQ(ierr);
36870c7d97c5SJed Brown           ierr = PetscMalloc ( count_recv*sizeof(PetscMPIInt),&localdispl2);CHKERRQ(ierr);
36880c7d97c5SJed Brown           /* fill up quantities */
36890c7d97c5SJed Brown           j=0;
36900c7d97c5SJed Brown           for(i=0;i<count_recv;i++){
36910c7d97c5SJed Brown             ii = ranks_recv[i];
36920c7d97c5SJed Brown             localsizes2[i]=pcbddc->local_primal_sizes[ii]*pcbddc->local_primal_sizes[ii];
36930c7d97c5SJed Brown             localdispl2[i]=j;
36940c7d97c5SJed Brown             j+=localsizes2[i];
36950c7d97c5SJed Brown             jj = pcbddc->local_primal_displacements[ii];
3696da1bb401SStefano Zampini             for(k=0;k<pcbddc->local_primal_sizes[ii];k++) aux_ins_indices[pcbddc->replicated_local_primal_indices[jj+k]]+=1;  /* it counts the coarse subdomains sharing the coarse node */
36970c7d97c5SJed Brown           }
3698da1bb401SStefano Zampini           /*printf("aux_ins_indices 1\n");
3699da1bb401SStefano Zampini           for(i=0;i<pcbddc->coarse_size;i++)
3700da1bb401SStefano Zampini             printf("%d ",aux_ins_indices[i]);
3701da1bb401SStefano Zampini           printf("\n");*/
37020c7d97c5SJed Brown           /* temp_coarse_mat_vals used to store temporarily received matrix values */
37030c7d97c5SJed Brown           ierr = PetscMalloc ( j*sizeof(PetscScalar),&temp_coarse_mat_vals);CHKERRQ(ierr);
37040c7d97c5SJed Brown           /* evaluate how many values I will insert in coarse mat */
37050c7d97c5SJed Brown           ins_local_primal_size=0;
37060c7d97c5SJed Brown           for(i=0;i<pcbddc->coarse_size;i++)
37070c7d97c5SJed Brown             if(aux_ins_indices[i])
37080c7d97c5SJed Brown               ins_local_primal_size++;
37090c7d97c5SJed Brown           /* evaluate indices I will insert in coarse mat */
37100c7d97c5SJed Brown           ierr = PetscMalloc ( ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr);
37110c7d97c5SJed Brown           j=0;
37120c7d97c5SJed Brown           for(i=0;i<pcbddc->coarse_size;i++)
37130c7d97c5SJed Brown             if(aux_ins_indices[i])
37140c7d97c5SJed Brown               ins_local_primal_indices[j++]=i;
37150c7d97c5SJed Brown           /* use aux_ins_indices to realize a global to local mapping */
37160c7d97c5SJed Brown           j=0;
37170c7d97c5SJed Brown           for(i=0;i<pcbddc->coarse_size;i++){
37180c7d97c5SJed Brown             if(aux_ins_indices[i]==0){
37190c7d97c5SJed Brown               aux_ins_indices[i]=-1;
37200c7d97c5SJed Brown             } else {
37210c7d97c5SJed Brown               aux_ins_indices[i]=j;
37220c7d97c5SJed Brown               j++;
37230c7d97c5SJed Brown             }
37240c7d97c5SJed Brown           }
37250c7d97c5SJed Brown 
3726da1bb401SStefano Zampini           /*printf("New details localsizes2 localdispl2\n");
3727da1bb401SStefano Zampini           for(i=0;i<count_recv;i++)
3728da1bb401SStefano Zampini             printf("(%d %d) ",localsizes2[i],localdispl2[i]);
3729da1bb401SStefano Zampini           printf("\n");
3730da1bb401SStefano Zampini           printf("aux_ins_indices 2\n");
3731da1bb401SStefano Zampini           for(i=0;i<pcbddc->coarse_size;i++)
3732da1bb401SStefano Zampini             printf("%d ",aux_ins_indices[i]);
3733da1bb401SStefano Zampini           printf("\n");
3734da1bb401SStefano Zampini           printf("ins_local_primal_indices\n");
3735da1bb401SStefano Zampini           for(i=0;i<ins_local_primal_size;i++)
3736da1bb401SStefano Zampini             printf("%d ",ins_local_primal_indices[i]);
3737da1bb401SStefano Zampini           printf("\n");
3738da1bb401SStefano Zampini           printf("coarse_submat_vals\n");
3739da1bb401SStefano Zampini           for(i=0;i<pcbddc->local_primal_size;i++)
3740da1bb401SStefano Zampini             for(j=0;j<pcbddc->local_primal_size;j++)
3741da1bb401SStefano Zampini               printf("(%lf %d %d)\n",coarse_submat_vals[j*pcbddc->local_primal_size+i],pcbddc->local_primal_indices[i],pcbddc->local_primal_indices[j]);
3742da1bb401SStefano Zampini           printf("\n");*/
37430c7d97c5SJed Brown 
37440c7d97c5SJed Brown           /* processes participating in the coarse problem receive matrix data from their friends */
374553cdbc3dSStefano Zampini           for(i=0;i<count_recv;i++) ierr = MPI_Irecv(&temp_coarse_mat_vals[localdispl2[i]],localsizes2[i],MPIU_SCALAR,ranks_recv[i],666,prec_comm,&requests[i]);CHKERRQ(ierr);
37460c7d97c5SJed Brown           if(rank_coarse_proc_send_to != MPI_PROC_NULL ) {
37470c7d97c5SJed Brown             send_size=pcbddc->local_primal_size*pcbddc->local_primal_size;
374853cdbc3dSStefano Zampini             ierr = MPI_Isend(&coarse_submat_vals[0],send_size,MPIU_SCALAR,rank_coarse_proc_send_to,666,prec_comm,&requests[count_recv]);CHKERRQ(ierr);
37490c7d97c5SJed Brown           }
375053cdbc3dSStefano Zampini           ierr = MPI_Waitall(count_recv+1,requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
37510c7d97c5SJed Brown 
3752da1bb401SStefano Zampini           /*if(coarse_color == 0) {
3753da1bb401SStefano Zampini             printf("temp_coarse_mat_vals\n");
3754da1bb401SStefano Zampini             for(k=0;k<count_recv;k++){
3755da1bb401SStefano Zampini               printf("---- %d ----\n",ranks_recv[k]);
3756da1bb401SStefano Zampini               for(i=0;i<pcbddc->local_primal_sizes[ranks_recv[k]];i++)
3757da1bb401SStefano Zampini                 for(j=0;j<pcbddc->local_primal_sizes[ranks_recv[k]];j++)
3758da1bb401SStefano Zampini                   printf("(%lf %d %d)\n",temp_coarse_mat_vals[localdispl2[k]+j*pcbddc->local_primal_sizes[ranks_recv[k]]+i],pcbddc->replicated_local_primal_indices[pcbddc->local_primal_displacements[ranks_recv[k]]+i],pcbddc->replicated_local_primal_indices[pcbddc->local_primal_displacements[ranks_recv[k]]+j]);
3759da1bb401SStefano Zampini               printf("\n");
3760da1bb401SStefano Zampini             }
3761da1bb401SStefano Zampini           }*/
37620c7d97c5SJed Brown           /* calculate data to insert in coarse mat */
37630c7d97c5SJed Brown           ierr = PetscMalloc ( ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar),&ins_coarse_mat_vals);CHKERRQ(ierr);
37640c7d97c5SJed Brown           PetscMemzero(ins_coarse_mat_vals,ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar));
37650c7d97c5SJed Brown 
37660c7d97c5SJed Brown           PetscMPIInt rr,kk,lps,lpd;
37670c7d97c5SJed Brown           PetscInt row_ind,col_ind;
37680c7d97c5SJed Brown           for(k=0;k<count_recv;k++){
37690c7d97c5SJed Brown             rr = ranks_recv[k];
37700c7d97c5SJed Brown             kk = localdispl2[k];
37710c7d97c5SJed Brown             lps = pcbddc->local_primal_sizes[rr];
37720c7d97c5SJed Brown             lpd = pcbddc->local_primal_displacements[rr];
3773da1bb401SStefano Zampini             /*printf("Inserting the following indices (received from %d)\n",rr);*/
37740c7d97c5SJed Brown             for(j=0;j<lps;j++){
37750c7d97c5SJed Brown               col_ind=aux_ins_indices[pcbddc->replicated_local_primal_indices[lpd+j]];
37760c7d97c5SJed Brown               for(i=0;i<lps;i++){
37770c7d97c5SJed Brown                 row_ind=aux_ins_indices[pcbddc->replicated_local_primal_indices[lpd+i]];
3778da1bb401SStefano Zampini                 /*printf("%d %d\n",row_ind,col_ind);*/
37790c7d97c5SJed Brown                 ins_coarse_mat_vals[col_ind*ins_local_primal_size+row_ind]+=temp_coarse_mat_vals[kk+j*lps+i];
37800c7d97c5SJed Brown               }
37810c7d97c5SJed Brown             }
37820c7d97c5SJed Brown           }
37830c7d97c5SJed Brown           ierr = PetscFree(requests);CHKERRQ(ierr);
37840c7d97c5SJed Brown           ierr = PetscFree(aux_ins_indices);CHKERRQ(ierr);
37850c7d97c5SJed Brown           ierr = PetscFree(temp_coarse_mat_vals);CHKERRQ(ierr);
37860c7d97c5SJed Brown           if(coarse_color == 0) { ierr = PetscFree(ranks_recv);CHKERRQ(ierr); }
37870c7d97c5SJed Brown 
37880c7d97c5SJed Brown           /* create local to global mapping needed by coarse MATIS */
37890c7d97c5SJed Brown           {
37900c7d97c5SJed Brown             IS coarse_IS;
379153cdbc3dSStefano Zampini             if(coarse_comm != MPI_COMM_NULL ) ierr = MPI_Comm_free(&coarse_comm);CHKERRQ(ierr);
37920c7d97c5SJed Brown             coarse_comm = prec_comm;
37930c7d97c5SJed Brown             active_rank=rank_prec_comm;
37940c7d97c5SJed Brown             ierr = ISCreateGeneral(coarse_comm,ins_local_primal_size,ins_local_primal_indices,PETSC_COPY_VALUES,&coarse_IS);CHKERRQ(ierr);
37950c7d97c5SJed Brown             ierr = ISLocalToGlobalMappingCreateIS(coarse_IS,&coarse_ISLG);CHKERRQ(ierr);
37960c7d97c5SJed Brown             ierr = ISDestroy(&coarse_IS);CHKERRQ(ierr);
37970c7d97c5SJed Brown           }
37980c7d97c5SJed Brown         }
37990c7d97c5SJed Brown         if(pcbddc->coarse_problem_type==PARALLEL_BDDC) {
38000c7d97c5SJed Brown           /* arrays for values insertion */
38010c7d97c5SJed Brown           ins_local_primal_size = pcbddc->local_primal_size;
38020c7d97c5SJed Brown           ierr = PetscMalloc ( ins_local_primal_size*sizeof(PetscMPIInt),&ins_local_primal_indices);CHKERRQ(ierr);
38030c7d97c5SJed Brown           ierr = PetscMalloc ( ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar),&ins_coarse_mat_vals);CHKERRQ(ierr);
38040c7d97c5SJed Brown           for(j=0;j<ins_local_primal_size;j++){
38050c7d97c5SJed Brown             ins_local_primal_indices[j]=pcbddc->local_primal_indices[j];
38060c7d97c5SJed Brown             for(i=0;i<ins_local_primal_size;i++) ins_coarse_mat_vals[j*ins_local_primal_size+i]=coarse_submat_vals[j*ins_local_primal_size+i];
38070c7d97c5SJed Brown           }
38080c7d97c5SJed Brown         }
38090c7d97c5SJed Brown         break;
38100c7d97c5SJed Brown 
38110c7d97c5SJed Brown     }
38120c7d97c5SJed Brown 
38130c7d97c5SJed Brown     case(GATHERS_BDDC):
38140c7d97c5SJed Brown       {
38150c7d97c5SJed Brown 
38160c7d97c5SJed Brown         PetscMPIInt mysize,mysize2;
38170c7d97c5SJed Brown 
38180c7d97c5SJed Brown         if(rank_prec_comm==active_rank) {
38190c7d97c5SJed Brown           ierr = PetscMalloc ( pcbddc->replicated_primal_size*sizeof(PetscMPIInt),&pcbddc->replicated_local_primal_indices);CHKERRQ(ierr);
38200c7d97c5SJed Brown           pcbddc->replicated_local_primal_values = (PetscScalar*)calloc(pcbddc->replicated_primal_size,sizeof(PetscScalar));
38210c7d97c5SJed Brown           ierr = PetscMalloc ( size_prec_comm*sizeof(PetscMPIInt),&localsizes2);CHKERRQ(ierr);
38220c7d97c5SJed Brown           ierr = PetscMalloc ( size_prec_comm*sizeof(PetscMPIInt),&localdispl2);CHKERRQ(ierr);
38230c7d97c5SJed Brown           /* arrays for values insertion */
38240c7d97c5SJed Brown           ins_local_primal_size = pcbddc->coarse_size;
38250c7d97c5SJed Brown           ierr = PetscMalloc ( ins_local_primal_size*sizeof(PetscMPIInt),&ins_local_primal_indices);CHKERRQ(ierr);
38260c7d97c5SJed Brown           ierr = PetscMalloc ( ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar),&ins_coarse_mat_vals);CHKERRQ(ierr);
38270c7d97c5SJed Brown           for(i=0;i<size_prec_comm;i++) localsizes2[i]=pcbddc->local_primal_sizes[i]*pcbddc->local_primal_sizes[i];
38280c7d97c5SJed Brown           localdispl2[0]=0;
38290c7d97c5SJed Brown           for(i=1;i<size_prec_comm;i++) localdispl2[i]=localsizes2[i-1]+localdispl2[i-1];
38300c7d97c5SJed Brown           j=0;
38310c7d97c5SJed Brown           for(i=0;i<size_prec_comm;i++) j+=localsizes2[i];
38320c7d97c5SJed Brown           ierr = PetscMalloc ( j*sizeof(PetscScalar),&temp_coarse_mat_vals);CHKERRQ(ierr);
38330c7d97c5SJed Brown         }
38340c7d97c5SJed Brown 
38350c7d97c5SJed Brown         mysize=pcbddc->local_primal_size;
38360c7d97c5SJed Brown         mysize2=pcbddc->local_primal_size*pcbddc->local_primal_size;
38370c7d97c5SJed Brown         if(pcbddc->coarse_problem_type == SEQUENTIAL_BDDC){
383853cdbc3dSStefano Zampini           ierr = MPI_Gatherv(&pcbddc->local_primal_indices[0],mysize,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
383953cdbc3dSStefano Zampini           ierr = MPI_Gatherv(&coarse_submat_vals[0],mysize2,MPIU_SCALAR,&temp_coarse_mat_vals[0],localsizes2,localdispl2,MPIU_SCALAR,master_proc,prec_comm);CHKERRQ(ierr);
38400c7d97c5SJed Brown         } else {
384153cdbc3dSStefano Zampini           ierr = MPI_Allgatherv(&pcbddc->local_primal_indices[0],mysize,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,prec_comm);CHKERRQ(ierr);
384253cdbc3dSStefano Zampini           ierr = MPI_Allgatherv(&coarse_submat_vals[0],mysize2,MPIU_SCALAR,&temp_coarse_mat_vals[0],localsizes2,localdispl2,MPIU_SCALAR,prec_comm);CHKERRQ(ierr);
38430c7d97c5SJed Brown         }
38440c7d97c5SJed Brown 
38450c7d97c5SJed Brown   /* on the active rank: use identity insertion indices and sum the gathered local coarse submatrices (column major) into ins_coarse_mat_vals */
38460c7d97c5SJed Brown         if(rank_prec_comm==active_rank) {
38470c7d97c5SJed Brown           PetscInt offset,offset2,row_ind,col_ind;
38480c7d97c5SJed Brown           for(j=0;j<ins_local_primal_size;j++){
38490c7d97c5SJed Brown             ins_local_primal_indices[j]=j;
38500c7d97c5SJed Brown             for(i=0;i<ins_local_primal_size;i++) ins_coarse_mat_vals[j*ins_local_primal_size+i]=0.0;
38510c7d97c5SJed Brown           }
38520c7d97c5SJed Brown           for(k=0;k<size_prec_comm;k++){
38530c7d97c5SJed Brown             offset=pcbddc->local_primal_displacements[k];
38540c7d97c5SJed Brown             offset2=localdispl2[k];
38550c7d97c5SJed Brown             for(j=0;j<pcbddc->local_primal_sizes[k];j++){
38560c7d97c5SJed Brown               col_ind=pcbddc->replicated_local_primal_indices[offset+j];
38570c7d97c5SJed Brown               for(i=0;i<pcbddc->local_primal_sizes[k];i++){
38580c7d97c5SJed Brown                 row_ind=pcbddc->replicated_local_primal_indices[offset+i];
38590c7d97c5SJed Brown                 ins_coarse_mat_vals[col_ind*pcbddc->coarse_size+row_ind]+=temp_coarse_mat_vals[offset2+j*pcbddc->local_primal_sizes[k]+i];
38600c7d97c5SJed Brown               }
38610c7d97c5SJed Brown             }
38620c7d97c5SJed Brown           }
38630c7d97c5SJed Brown         }
38640c7d97c5SJed Brown         break;
3865da1bb401SStefano Zampini       }/* switch on coarse problem and communications associated with finished */
38660c7d97c5SJed Brown   }
38670c7d97c5SJed Brown 
38680c7d97c5SJed Brown   /* Now create and fill up coarse matrix */
38690c7d97c5SJed Brown   if( rank_prec_comm == active_rank ) {
38700c7d97c5SJed Brown     if(pcbddc->coarse_problem_type != MULTILEVEL_BDDC) {
38710c7d97c5SJed Brown       ierr = MatCreate(coarse_comm,&pcbddc->coarse_mat);CHKERRQ(ierr);
38720c7d97c5SJed Brown       ierr = MatSetSizes(pcbddc->coarse_mat,PETSC_DECIDE,PETSC_DECIDE,pcbddc->coarse_size,pcbddc->coarse_size);CHKERRQ(ierr);
38730c7d97c5SJed Brown       ierr = MatSetType(pcbddc->coarse_mat,coarse_mat_type);CHKERRQ(ierr);
38743b03a366Sstefano_zampini       ierr = MatSetUp(pcbddc->coarse_mat);CHKERRQ(ierr);
3875da1bb401SStefano Zampini       ierr = MatSetOption(pcbddc->coarse_mat,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr); /* local values stored in column major */
38763b03a366Sstefano_zampini       ierr = MatSetOption(pcbddc->coarse_mat,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr);
38770c7d97c5SJed Brown     } else {
38780c7d97c5SJed Brown       Mat matis_coarse_local_mat;
3879d3ee2243SStefano Zampini       /* remind bs */
3880d3ee2243SStefano Zampini       ierr = MatCreateIS(coarse_comm,bs,PETSC_DECIDE,PETSC_DECIDE,pcbddc->coarse_size,pcbddc->coarse_size,coarse_ISLG,&pcbddc->coarse_mat);CHKERRQ(ierr);
38813b03a366Sstefano_zampini       ierr = MatSetUp(pcbddc->coarse_mat);CHKERRQ(ierr);
38820c7d97c5SJed Brown       ierr = MatISGetLocalMat(pcbddc->coarse_mat,&matis_coarse_local_mat);CHKERRQ(ierr);
38833b03a366Sstefano_zampini       ierr = MatSetUp(matis_coarse_local_mat);CHKERRQ(ierr);
3884da1bb401SStefano Zampini       ierr = MatSetOption(matis_coarse_local_mat,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr); /* local values stored in column major */
3885a0ba757dSStefano Zampini       ierr = MatSetOption(matis_coarse_local_mat,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr);
38860c7d97c5SJed Brown     }
3887a0ba757dSStefano Zampini     ierr = MatSetOption(pcbddc->coarse_mat,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_FALSE);CHKERRQ(ierr);
38880c7d97c5SJed Brown     ierr = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,ADD_VALUES);CHKERRQ(ierr);
38890c7d97c5SJed Brown     ierr = MatAssemblyBegin(pcbddc->coarse_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
38900c7d97c5SJed Brown     ierr = MatAssemblyEnd(pcbddc->coarse_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
38910c7d97c5SJed Brown 
3892da1bb401SStefano Zampini     /*  PetscViewer view_out;
3893da1bb401SStefano Zampini       ierr = PetscViewerASCIIOpen(PETSC_COMM_SELF,"coarsematfull.m",&view_out);CHKERRQ(ierr);
3894da1bb401SStefano Zampini       ierr = PetscViewerSetFormat(view_out,PETSC_VIEWER_ASCII_MATLAB);CHKERRQ(ierr);
3895da1bb401SStefano Zampini       ierr = MatView(pcbddc->coarse_mat,view_out);CHKERRQ(ierr);
3896da1bb401SStefano Zampini       ierr = PetscViewerDestroy(&view_out);CHKERRQ(ierr);*/
3897da1bb401SStefano Zampini 
38980c7d97c5SJed Brown     ierr = MatGetVecs(pcbddc->coarse_mat,&pcbddc->coarse_vec,&pcbddc->coarse_rhs);CHKERRQ(ierr);
38990c7d97c5SJed Brown     /* Preconditioner for coarse problem */
390053cdbc3dSStefano Zampini     ierr = KSPCreate(coarse_comm,&pcbddc->coarse_ksp);CHKERRQ(ierr);
390153cdbc3dSStefano Zampini     ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->coarse_ksp,(PetscObject)pc,1);CHKERRQ(ierr);
390253cdbc3dSStefano Zampini     ierr = KSPSetOperators(pcbddc->coarse_ksp,pcbddc->coarse_mat,pcbddc->coarse_mat,SAME_PRECONDITIONER);CHKERRQ(ierr);
39033b03a366Sstefano_zampini     ierr = KSPSetTolerances(pcbddc->coarse_ksp,PETSC_DEFAULT,PETSC_DEFAULT,PETSC_DEFAULT,max_it_coarse_ksp);CHKERRQ(ierr);
390453cdbc3dSStefano Zampini     ierr = KSPSetType(pcbddc->coarse_ksp,coarse_ksp_type);CHKERRQ(ierr);
390553cdbc3dSStefano Zampini     ierr = KSPGetPC(pcbddc->coarse_ksp,&pc_temp);CHKERRQ(ierr);
390653cdbc3dSStefano Zampini     ierr = PCSetType(pc_temp,coarse_pc_type);CHKERRQ(ierr);
39070c7d97c5SJed Brown     /* Allow user's customization */
3908da1bb401SStefano Zampini     ierr = KSPSetOptionsPrefix(pcbddc->coarse_ksp,"coarse_");CHKERRQ(ierr);
390953cdbc3dSStefano Zampini     ierr = KSPSetFromOptions(pcbddc->coarse_ksp);CHKERRQ(ierr);
39100c7d97c5SJed Brown     /* Set Up PC for coarse problem BDDC */
391153cdbc3dSStefano Zampini     if(pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
3912e269702eSStefano Zampini       if(dbg_flag) {
3913e269702eSStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"----------------Setting up a new level---------------\n");CHKERRQ(ierr);
3914e269702eSStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
3915e269702eSStefano Zampini       }
391653cdbc3dSStefano Zampini       ierr = PCBDDCSetCoarseProblemType(pc_temp,MULTILEVEL_BDDC);CHKERRQ(ierr);
391753cdbc3dSStefano Zampini     }
391853cdbc3dSStefano Zampini     ierr = KSPSetUp(pcbddc->coarse_ksp);CHKERRQ(ierr);
39195619798eSStefano Zampini     if(pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
39205619798eSStefano Zampini       if(dbg_flag) {
39215619798eSStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"----------------New level set------------------------\n");CHKERRQ(ierr);
39225619798eSStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
39235619798eSStefano Zampini       }
39245619798eSStefano Zampini     }
39250c7d97c5SJed Brown   }
39260c7d97c5SJed Brown   if(pcbddc->coarse_communications_type == SCATTERS_BDDC) {
39270c7d97c5SJed Brown      IS local_IS,global_IS;
39280c7d97c5SJed Brown      ierr = ISCreateStride(PETSC_COMM_SELF,pcbddc->local_primal_size,0,1,&local_IS);CHKERRQ(ierr);
39290c7d97c5SJed Brown      ierr = ISCreateGeneral(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_indices,PETSC_COPY_VALUES,&global_IS);CHKERRQ(ierr);
39300c7d97c5SJed Brown      ierr = VecScatterCreate(pcbddc->vec1_P,local_IS,pcbddc->coarse_vec,global_IS,&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr);
39310c7d97c5SJed Brown      ierr = ISDestroy(&local_IS);CHKERRQ(ierr);
39320c7d97c5SJed Brown      ierr = ISDestroy(&global_IS);CHKERRQ(ierr);
39330c7d97c5SJed Brown   }
39340c7d97c5SJed Brown 
39350c7d97c5SJed Brown 
39363b03a366Sstefano_zampini   /* Evaluate condition number of coarse problem for cheby (and verbose output if requested) */
39373b03a366Sstefano_zampini   if( pcbddc->coarse_problem_type == MULTILEVEL_BDDC && rank_prec_comm == active_rank ) {
39380c7d97c5SJed Brown     PetscScalar m_one=-1.0;
39395619798eSStefano Zampini     PetscReal   infty_error,lambda_min,lambda_max,kappa_2;
39403b03a366Sstefano_zampini     const KSPType check_ksp_type=KSPGMRES;
39410c7d97c5SJed Brown 
39425619798eSStefano Zampini     /* change coarse ksp object to an iterative method suitable for extreme eigenvalues' estimation */
39433b03a366Sstefano_zampini     ierr = KSPSetType(pcbddc->coarse_ksp,check_ksp_type);CHKERRQ(ierr);
3944d49ef151SStefano Zampini     ierr = KSPSetComputeSingularValues(pcbddc->coarse_ksp,PETSC_TRUE);CHKERRQ(ierr);
39455619798eSStefano Zampini     ierr = KSPSetTolerances(pcbddc->coarse_ksp,1.e-8,1.e-8,PETSC_DEFAULT,pcbddc->coarse_size);CHKERRQ(ierr);
39465619798eSStefano Zampini     ierr = KSPSetUp(pcbddc->coarse_ksp);CHKERRQ(ierr);
3947d49ef151SStefano Zampini     ierr = VecSetRandom(pcbddc->coarse_rhs,PETSC_NULL);CHKERRQ(ierr);
3948d49ef151SStefano Zampini     ierr = MatMult(pcbddc->coarse_mat,pcbddc->coarse_rhs,pcbddc->coarse_vec);CHKERRQ(ierr);
3949d49ef151SStefano Zampini     ierr = MatMult(pcbddc->coarse_mat,pcbddc->coarse_vec,pcbddc->coarse_rhs);CHKERRQ(ierr);
3950d49ef151SStefano Zampini     ierr = KSPSolve(pcbddc->coarse_ksp,pcbddc->coarse_rhs,pcbddc->coarse_rhs);CHKERRQ(ierr);
3951d49ef151SStefano Zampini     ierr = KSPComputeExtremeSingularValues(pcbddc->coarse_ksp,&lambda_max,&lambda_min);CHKERRQ(ierr);
39523b03a366Sstefano_zampini     if(dbg_flag) {
39535619798eSStefano Zampini       kappa_2=lambda_max/lambda_min;
39545619798eSStefano Zampini       ierr = KSPGetIterationNumber(pcbddc->coarse_ksp,&k);CHKERRQ(ierr);
3955d49ef151SStefano Zampini       ierr = VecAXPY(pcbddc->coarse_rhs,m_one,pcbddc->coarse_vec);CHKERRQ(ierr);
3956d49ef151SStefano Zampini       ierr = VecNorm(pcbddc->coarse_rhs,NORM_INFINITY,&infty_error);CHKERRQ(ierr);
39573b03a366Sstefano_zampini       ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem condition number estimated with %d iterations of %s is: % 1.14e\n",k,check_ksp_type,kappa_2);CHKERRQ(ierr);
3958e269702eSStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem eigenvalues: % 1.14e %1.14e\n",lambda_min,lambda_max);CHKERRQ(ierr);
3959e269702eSStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem infty_error: %1.14e\n",infty_error);CHKERRQ(ierr);
39603b03a366Sstefano_zampini     }
39615619798eSStefano Zampini     /* restore coarse ksp to default values */
3962d49ef151SStefano Zampini     ierr = KSPSetComputeSingularValues(pcbddc->coarse_ksp,PETSC_FALSE);CHKERRQ(ierr);
39635619798eSStefano Zampini     ierr = KSPSetType(pcbddc->coarse_ksp,coarse_ksp_type);CHKERRQ(ierr);
39646c9de887SHong Zhang     ierr = KSPChebyshevSetEigenvalues(pcbddc->coarse_ksp,lambda_max,lambda_min);CHKERRQ(ierr);
39653b03a366Sstefano_zampini     ierr = KSPSetTolerances(pcbddc->coarse_ksp,PETSC_DEFAULT,PETSC_DEFAULT,PETSC_DEFAULT,max_it_coarse_ksp);CHKERRQ(ierr);
39665619798eSStefano Zampini     ierr = KSPSetFromOptions(pcbddc->coarse_ksp);CHKERRQ(ierr);
39675619798eSStefano Zampini     ierr = KSPSetUp(pcbddc->coarse_ksp);CHKERRQ(ierr);
396853cdbc3dSStefano Zampini   }
39690c7d97c5SJed Brown 
39700c7d97c5SJed Brown   /* free data structures no longer needed */
39710c7d97c5SJed Brown   if(coarse_ISLG)                { ierr = ISLocalToGlobalMappingDestroy(&coarse_ISLG);CHKERRQ(ierr); }
39720c7d97c5SJed Brown   if(ins_local_primal_indices)   { ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr);  }
39730c7d97c5SJed Brown   if(ins_coarse_mat_vals)        { ierr = PetscFree(ins_coarse_mat_vals);CHKERRQ(ierr);}
39740c7d97c5SJed Brown   if(localsizes2)                { ierr = PetscFree(localsizes2);CHKERRQ(ierr);}
39750c7d97c5SJed Brown   if(localdispl2)                { ierr = PetscFree(localdispl2);CHKERRQ(ierr);}
39760c7d97c5SJed Brown   if(temp_coarse_mat_vals)       { ierr = PetscFree(temp_coarse_mat_vals);CHKERRQ(ierr);}
39770c7d97c5SJed Brown 
39780c7d97c5SJed Brown   PetscFunctionReturn(0);
39790c7d97c5SJed Brown }
39800c7d97c5SJed Brown 
39810c7d97c5SJed Brown #undef __FUNCT__
39820c7d97c5SJed Brown #define __FUNCT__ "PCBDDCManageLocalBoundaries"
398353cdbc3dSStefano Zampini static PetscErrorCode PCBDDCManageLocalBoundaries(PC pc)
39840c7d97c5SJed Brown {
39850c7d97c5SJed Brown 
39860c7d97c5SJed Brown   PC_BDDC     *pcbddc = (PC_BDDC*)pc->data;
39870c7d97c5SJed Brown   PC_IS         *pcis = (PC_IS*)pc->data;
39880c7d97c5SJed Brown   Mat_IS      *matis  = (Mat_IS*)pc->pmat->data;
3989da1bb401SStefano Zampini   PCBDDCGraph mat_graph=pcbddc->mat_graph;
39903972b0daSStefano Zampini   PetscInt    *queue_in_global_numbering,*is_indices,*auxis;
39913b03a366Sstefano_zampini   PetscInt    bs,ierr,i,j,s,k,iindex,neumann_bsize,dirichlet_bsize;
3992da1bb401SStefano Zampini   PetscInt    total_counts,nodes_touched,where_values=1,vertex_size;
3993534831adSStefano Zampini   PetscMPIInt adapt_interface=0,adapt_interface_reduced=0,NEUMANNCNT=0;
3994da1bb401SStefano Zampini   PetscBool   same_set;
3995a0ba757dSStefano Zampini   MPI_Comm    interface_comm=((PetscObject)pc)->comm;
39963b03a366Sstefano_zampini   PetscBool   use_faces=PETSC_FALSE,use_edges=PETSC_FALSE;
39973b03a366Sstefano_zampini   const PetscInt *neumann_nodes;
39983b03a366Sstefano_zampini   const PetscInt *dirichlet_nodes;
3999a81d60d8SStefano Zampini   IS          used_IS,*custom_ISForDofs;
4000da1bb401SStefano Zampini   PetscScalar *array;
4001da1bb401SStefano Zampini   PetscScalar *array2;
4002da1bb401SStefano Zampini   PetscViewer viewer=pcbddc->dbg_viewer;
40030c7d97c5SJed Brown 
40040c7d97c5SJed Brown   PetscFunctionBegin;
4005da1bb401SStefano Zampini   /* Setup local adjacency graph */
4006da1bb401SStefano Zampini   mat_graph->nvtxs=pcis->n;
4007534831adSStefano Zampini   if(!mat_graph->xadj) { NEUMANNCNT = 1; }
4008da1bb401SStefano Zampini   ierr = PCBDDCSetupLocalAdjacencyGraph(pc);CHKERRQ(ierr);
4009a0ba757dSStefano Zampini   i = mat_graph->nvtxs;
4010a0ba757dSStefano Zampini   ierr = PetscMalloc4(i,PetscInt,&mat_graph->where,i,PetscInt,&mat_graph->count,i+1,PetscInt,&mat_graph->cptr,i,PetscInt,&mat_graph->queue);CHKERRQ(ierr);
40113972b0daSStefano Zampini   ierr = PetscMalloc2(i,PetscInt,&mat_graph->which_dof,i,PetscBool,&mat_graph->touched);CHKERRQ(ierr);
40123972b0daSStefano Zampini   ierr = PetscMalloc(i*sizeof(PetscInt),&queue_in_global_numbering);CHKERRQ(ierr);
4013a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->where,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
4014a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->count,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
4015a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->which_dof,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
4016a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->queue,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
40173828260eSStefano Zampini   ierr = PetscMemzero(mat_graph->cptr,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr);
4018a0ba757dSStefano Zampini 
4019a81d60d8SStefano Zampini   /* Setting dofs splitting in mat_graph->which_dof
4020a81d60d8SStefano Zampini      Get information about dofs' splitting if provided by the user
4021a81d60d8SStefano Zampini      Otherwise it assumes a constant block size */
4022a81d60d8SStefano Zampini   vertex_size=0;
4023a81d60d8SStefano Zampini   if(!pcbddc->n_ISForDofs) {
4024a81d60d8SStefano Zampini     ierr = MatGetBlockSize(matis->A,&bs);CHKERRQ(ierr);
4025a81d60d8SStefano Zampini     ierr = PetscMalloc(bs*sizeof(IS),&custom_ISForDofs);CHKERRQ(ierr);
4026a81d60d8SStefano Zampini     for(i=0;i<bs;i++) {
4027a81d60d8SStefano Zampini       ierr = ISCreateStride(PETSC_COMM_SELF,pcis->n/bs,i,bs,&custom_ISForDofs[i]);CHKERRQ(ierr);
4028a81d60d8SStefano Zampini     }
4029a81d60d8SStefano Zampini     ierr = PCBDDCSetDofsSplitting(pc,bs,custom_ISForDofs);CHKERRQ(ierr);
4030a81d60d8SStefano Zampini     vertex_size=1;
4031a81d60d8SStefano Zampini     /* remove my references to IS objects */
4032a81d60d8SStefano Zampini     for(i=0;i<bs;i++) {
4033a81d60d8SStefano Zampini       ierr = ISDestroy(&custom_ISForDofs[i]);CHKERRQ(ierr);
4034a81d60d8SStefano Zampini     }
4035a81d60d8SStefano Zampini     ierr = PetscFree(custom_ISForDofs);CHKERRQ(ierr);
4036a81d60d8SStefano Zampini   }
40379c0446d6SStefano Zampini   for(i=0;i<pcbddc->n_ISForDofs;i++) {
4038a81d60d8SStefano Zampini     ierr = ISGetSize(pcbddc->ISForDofs[i],&k);CHKERRQ(ierr);
40399c0446d6SStefano Zampini     ierr = ISGetIndices(pcbddc->ISForDofs[i],(const PetscInt**)&is_indices);CHKERRQ(ierr);
4040a81d60d8SStefano Zampini     for(j=0;j<k;j++) {
40419c0446d6SStefano Zampini       mat_graph->which_dof[is_indices[j]]=i;
40429c0446d6SStefano Zampini     }
40439c0446d6SStefano Zampini     ierr = ISRestoreIndices(pcbddc->ISForDofs[i],(const PetscInt**)&is_indices);CHKERRQ(ierr);
40449c0446d6SStefano Zampini   }
4045a81d60d8SStefano Zampini   /* use mat block size as vertex size if it has not yet been set */
4046a81d60d8SStefano Zampini   if(!vertex_size) {
40473b03a366Sstefano_zampini     ierr = MatGetBlockSize(matis->A,&vertex_size);CHKERRQ(ierr);
40480c7d97c5SJed Brown   }
4049a81d60d8SStefano Zampini 
40503b03a366Sstefano_zampini   /* count number of neigh per node */
40510c7d97c5SJed Brown   total_counts=0;
40523b03a366Sstefano_zampini   for(i=1;i<pcis->n_neigh;i++){
40530c7d97c5SJed Brown     s=pcis->n_shared[i];
40540c7d97c5SJed Brown     total_counts+=s;
405553cdbc3dSStefano Zampini     for(j=0;j<s;j++){
40560c7d97c5SJed Brown       mat_graph->count[pcis->shared[i][j]] += 1;
40570c7d97c5SJed Brown     }
40580c7d97c5SJed Brown   }
4059534831adSStefano Zampini   /* Take into account Neumann data -> it increments number of sharing subdomains for nodes lying on the interface */
406036e030ebSStefano Zampini   ierr = PCBDDCGetNeumannBoundaries(pc,&used_IS);CHKERRQ(ierr);
4061da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
4062da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
406336e030ebSStefano Zampini   if(used_IS) {
406436e030ebSStefano Zampini     ierr = ISGetSize(used_IS,&neumann_bsize);CHKERRQ(ierr);
406536e030ebSStefano Zampini     ierr = ISGetIndices(used_IS,&neumann_nodes);CHKERRQ(ierr);
406653cdbc3dSStefano Zampini     for(i=0;i<neumann_bsize;i++){
406753cdbc3dSStefano Zampini       iindex = neumann_nodes[i];
4068534831adSStefano Zampini       if(mat_graph->count[iindex] > NEUMANNCNT && array[iindex]==0.0){
406953cdbc3dSStefano Zampini         mat_graph->count[iindex]+=1;
40700c7d97c5SJed Brown         total_counts++;
4071da1bb401SStefano Zampini         array[iindex]=array[iindex]+1.0;
4072da1bb401SStefano Zampini       } else if(array[iindex]>0.0) {
4073da1bb401SStefano Zampini         SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"Error for neumann nodes provided to BDDC! They must be uniquely listed! Found duplicate node %d\n",iindex);
40740c7d97c5SJed Brown       }
40750c7d97c5SJed Brown     }
40760c7d97c5SJed Brown   }
4077da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4078da1bb401SStefano Zampini   /* allocate space for storing the set of neighbours for each node */
4079da1bb401SStefano Zampini   ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt*),&mat_graph->neighbours_set);CHKERRQ(ierr);
4080da1bb401SStefano Zampini   if(mat_graph->nvtxs) { ierr = PetscMalloc(total_counts*sizeof(PetscInt),&mat_graph->neighbours_set[0]);CHKERRQ(ierr); }
4081da1bb401SStefano Zampini   for(i=1;i<mat_graph->nvtxs;i++) mat_graph->neighbours_set[i]=mat_graph->neighbours_set[i-1]+mat_graph->count[i-1];
4082a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->count,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
40833b03a366Sstefano_zampini   for(i=1;i<pcis->n_neigh;i++){
40840c7d97c5SJed Brown     s=pcis->n_shared[i];
40850c7d97c5SJed Brown     for(j=0;j<s;j++) {
40860c7d97c5SJed Brown       k=pcis->shared[i][j];
4087da1bb401SStefano Zampini       mat_graph->neighbours_set[k][mat_graph->count[k]] = pcis->neigh[i];
40880c7d97c5SJed Brown       mat_graph->count[k]+=1;
40890c7d97c5SJed Brown     }
40900c7d97c5SJed Brown   }
4091da1bb401SStefano Zampini   /* Check consistency of Neumann nodes */
4092da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
4093da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4094da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4095da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4096da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4097da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
40983b03a366Sstefano_zampini   /* set -1 fake neighbour to mimic Neumann boundary */
409936e030ebSStefano Zampini   if(used_IS) {
410053cdbc3dSStefano Zampini     for(i=0;i<neumann_bsize;i++){
410153cdbc3dSStefano Zampini       iindex = neumann_nodes[i];
4102534831adSStefano Zampini       if(mat_graph->count[iindex] > NEUMANNCNT){
4103da1bb401SStefano Zampini         if(mat_graph->count[iindex]+1 != (PetscInt)array[iindex]) {
4104da1bb401SStefano Zampini           SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_USER,"Neumann nodes provided to BDDC must be consistent among neighbours!\nNode %d: number of sharing subdomains %d != number of subdomains for which it is a neumann node %d\n",iindex,mat_graph->count[iindex]+1,(PetscInt)array[iindex]);
4105da1bb401SStefano Zampini         }
4106da1bb401SStefano Zampini         mat_graph->neighbours_set[iindex][mat_graph->count[iindex]] = -1;
410753cdbc3dSStefano Zampini         mat_graph->count[iindex]+=1;
41080c7d97c5SJed Brown       }
41090c7d97c5SJed Brown     }
411036e030ebSStefano Zampini     ierr = ISRestoreIndices(used_IS,&neumann_nodes);CHKERRQ(ierr);
41110c7d97c5SJed Brown   }
4112da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4113da1bb401SStefano Zampini   /* sort set of sharing subdomains */
4114da1bb401SStefano Zampini   for(i=0;i<mat_graph->nvtxs;i++) { ierr = PetscSortInt(mat_graph->count[i],mat_graph->neighbours_set[i]);CHKERRQ(ierr); }
41153b03a366Sstefano_zampini   /* remove interior nodes and dirichlet boundary nodes from the next search into the graph */
4116da1bb401SStefano Zampini   for(i=0;i<mat_graph->nvtxs;i++){mat_graph->touched[i]=PETSC_FALSE;}
4117da1bb401SStefano Zampini   nodes_touched=0;
411836e030ebSStefano Zampini   ierr = PCBDDCGetDirichletBoundaries(pc,&used_IS);CHKERRQ(ierr);
4119da1bb401SStefano Zampini   ierr = VecSet(pcis->vec2_N,0.0);CHKERRQ(ierr);
4120da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4121da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
4122da1bb401SStefano Zampini   if(used_IS) {
4123da1bb401SStefano Zampini     ierr = ISGetSize(used_IS,&dirichlet_bsize);CHKERRQ(ierr);
4124da1bb401SStefano Zampini     if(dirichlet_bsize && matis->pure_neumann) {
4125da1bb401SStefano Zampini       SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"Dirichlet boundaries are intended to be used with matrices with zeroed rows!\n");
4126da1bb401SStefano Zampini     }
4127da1bb401SStefano Zampini     ierr = ISGetIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
4128da1bb401SStefano Zampini     for(i=0;i<dirichlet_bsize;i++){
4129da1bb401SStefano Zampini       iindex=dirichlet_nodes[i];
4130da1bb401SStefano Zampini       if(mat_graph->count[iindex] && !mat_graph->touched[iindex]) {
4131da1bb401SStefano Zampini         if(array[iindex]>0.0) {
4132da1bb401SStefano Zampini           SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"BDDC cannot have nodes which are marked as Neumann and Dirichlet at the same time! Wrong node %d\n",iindex);
4133da1bb401SStefano Zampini         }
4134da1bb401SStefano Zampini         mat_graph->touched[iindex]=PETSC_TRUE;
4135da1bb401SStefano Zampini         mat_graph->where[iindex]=0;
4136da1bb401SStefano Zampini         nodes_touched++;
4137da1bb401SStefano Zampini         array2[iindex]=array2[iindex]+1.0;
4138da1bb401SStefano Zampini       }
4139da1bb401SStefano Zampini     }
4140da1bb401SStefano Zampini     ierr = ISRestoreIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
4141da1bb401SStefano Zampini   }
4142da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4143da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
4144da1bb401SStefano Zampini   /* Check consistency of Dirichlet nodes */
4145da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_N,1.0);CHKERRQ(ierr);
4146da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
4147da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4148da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4149da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4150da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4151da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
4152da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec2_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4153da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec2_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4154da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4155da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4156da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4157da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
415836e030ebSStefano Zampini   if(used_IS) {
415936e030ebSStefano Zampini     ierr = ISGetSize(used_IS,&dirichlet_bsize);CHKERRQ(ierr);
416036e030ebSStefano Zampini     ierr = ISGetIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
41613b03a366Sstefano_zampini     for(i=0;i<dirichlet_bsize;i++){
4162da1bb401SStefano Zampini       iindex=dirichlet_nodes[i];
4163da1bb401SStefano Zampini       if(array[iindex]>1.0 && array[iindex]!=array2[iindex] ) {
4164da1bb401SStefano Zampini          SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_USER,"Dirichlet nodes provided to BDDC must be consistent among neighbours!\nNode %d: number of sharing subdomains %d != number of subdomains for which it is a neumann node %d\n",iindex,(PetscInt)array[iindex],(PetscInt)array2[iindex]);
4165da1bb401SStefano Zampini       }
41663b03a366Sstefano_zampini     }
416736e030ebSStefano Zampini     ierr = ISRestoreIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
41683b03a366Sstefano_zampini   }
4169da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
4170da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
4171da1bb401SStefano Zampini 
41720c7d97c5SJed Brown   for(i=0;i<mat_graph->nvtxs;i++){
41733b03a366Sstefano_zampini     if(!mat_graph->count[i]){  /* interior nodes */
41740c7d97c5SJed Brown       mat_graph->touched[i]=PETSC_TRUE;
41750c7d97c5SJed Brown       mat_graph->where[i]=0;
41760c7d97c5SJed Brown       nodes_touched++;
41770c7d97c5SJed Brown     }
41780c7d97c5SJed Brown   }
41790c7d97c5SJed Brown   mat_graph->ncmps = 0;
4180da1bb401SStefano Zampini   i=0;
41810c7d97c5SJed Brown   while(nodes_touched<mat_graph->nvtxs) {
4182a0ba757dSStefano Zampini     /*  find first untouched node in local ordering */
41830c7d97c5SJed Brown     while(mat_graph->touched[i]) i++;
41840c7d97c5SJed Brown     mat_graph->touched[i]=PETSC_TRUE;
4185a0ba757dSStefano Zampini     mat_graph->where[i]=where_values;
41860c7d97c5SJed Brown     nodes_touched++;
4187a0ba757dSStefano Zampini     /* now find all other nodes having the same set of sharing subdomains */
41880c7d97c5SJed Brown     for(j=i+1;j<mat_graph->nvtxs;j++){
4189a0ba757dSStefano Zampini       /* check for same number of sharing subdomains and dof number */
4190da1bb401SStefano Zampini       if(!mat_graph->touched[j] && mat_graph->count[i]==mat_graph->count[j] && mat_graph->which_dof[i] == mat_graph->which_dof[j] ){
4191a0ba757dSStefano Zampini         /* check for same set of sharing subdomains */
41920c7d97c5SJed Brown         same_set=PETSC_TRUE;
41930c7d97c5SJed Brown         for(k=0;k<mat_graph->count[j];k++){
4194da1bb401SStefano Zampini           if(mat_graph->neighbours_set[i][k]!=mat_graph->neighbours_set[j][k]) {
41950c7d97c5SJed Brown             same_set=PETSC_FALSE;
41960c7d97c5SJed Brown           }
41970c7d97c5SJed Brown         }
4198a0ba757dSStefano Zampini         /* I found a friend of mine */
41990c7d97c5SJed Brown         if(same_set) {
4200a0ba757dSStefano Zampini           mat_graph->where[j]=where_values;
42010c7d97c5SJed Brown           mat_graph->touched[j]=PETSC_TRUE;
42020c7d97c5SJed Brown           nodes_touched++;
42030c7d97c5SJed Brown         }
42040c7d97c5SJed Brown       }
42050c7d97c5SJed Brown     }
4206a0ba757dSStefano Zampini     where_values++;
42070c7d97c5SJed Brown   }
4208a0ba757dSStefano Zampini   where_values--; if(where_values<0) where_values=0;
4209a0ba757dSStefano Zampini   ierr = PetscMalloc(where_values*sizeof(PetscMPIInt),&mat_graph->where_ncmps);CHKERRQ(ierr);
4210a0ba757dSStefano Zampini   /* Find connected components defined on the shared interface */
4211a0ba757dSStefano Zampini   if(where_values) {
4212a0ba757dSStefano Zampini     ierr = PCBDDCFindConnectedComponents(mat_graph, where_values);
42133b03a366Sstefano_zampini     /* For consistency among neighbouring procs, I need to sort (by global ordering) each connected component */
4214a0ba757dSStefano Zampini     for(i=0;i<mat_graph->ncmps;i++) {
4215a0ba757dSStefano Zampini       ierr = ISLocalToGlobalMappingApply(matis->mapping,mat_graph->cptr[i+1]-mat_graph->cptr[i],&mat_graph->queue[mat_graph->cptr[i]],&queue_in_global_numbering[mat_graph->cptr[i]]);CHKERRQ(ierr);
4216a0ba757dSStefano Zampini       ierr = PetscSortIntWithArray(mat_graph->cptr[i+1]-mat_graph->cptr[i],&queue_in_global_numbering[mat_graph->cptr[i]],&mat_graph->queue[mat_graph->cptr[i]]);CHKERRQ(ierr);
4217a0ba757dSStefano Zampini     }
4218a0ba757dSStefano Zampini   }
4219a0ba757dSStefano Zampini   /* check consistency of connected components among neighbouring subdomains -> adapt them where needed */
4220a0ba757dSStefano Zampini   for(i=0;i<where_values;i++) {
42213b03a366Sstefano_zampini     /* We are not sure that two connected components will be the same among subdomains sharing a subset of local interface */
42223b03a366Sstefano_zampini     if(mat_graph->where_ncmps[i]>1) {
4223a0ba757dSStefano Zampini       adapt_interface=1;
4224a0ba757dSStefano Zampini       break;
4225a0ba757dSStefano Zampini     }
4226a0ba757dSStefano Zampini   }
4227a0ba757dSStefano Zampini   ierr = MPI_Allreduce(&adapt_interface,&adapt_interface_reduced,1,MPIU_INT,MPI_LOR,interface_comm);CHKERRQ(ierr);
4228da1bb401SStefano Zampini   if(pcbddc->dbg_flag && adapt_interface_reduced) {
4229da1bb401SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"Interface adapted\n");CHKERRQ(ierr);
4230da1bb401SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
4231da1bb401SStefano Zampini   }
4232a0ba757dSStefano Zampini   if(where_values && adapt_interface_reduced) {
42330c7d97c5SJed Brown 
4234a0ba757dSStefano Zampini     PetscInt sum_requests=0,my_rank;
4235a0ba757dSStefano Zampini     PetscInt buffer_size,start_of_recv,size_of_recv,start_of_send;
4236a0ba757dSStefano Zampini     PetscInt temp_buffer_size,ins_val,global_where_counter;
4237a0ba757dSStefano Zampini     PetscInt *cum_recv_counts;
4238a0ba757dSStefano Zampini     PetscInt *where_to_nodes_indices;
4239a0ba757dSStefano Zampini     PetscInt *petsc_buffer;
4240a0ba757dSStefano Zampini     PetscMPIInt *recv_buffer;
4241a0ba757dSStefano Zampini     PetscMPIInt *recv_buffer_where;
4242a0ba757dSStefano Zampini     PetscMPIInt *send_buffer;
4243a0ba757dSStefano Zampini     PetscMPIInt size_of_send;
4244a0ba757dSStefano Zampini     PetscInt *sizes_of_sends;
4245a0ba757dSStefano Zampini     MPI_Request *send_requests;
4246a0ba757dSStefano Zampini     MPI_Request *recv_requests;
4247a0ba757dSStefano Zampini     PetscInt *where_cc_adapt;
4248a0ba757dSStefano Zampini     PetscInt **temp_buffer;
4249a0ba757dSStefano Zampini     PetscInt *nodes_to_temp_buffer_indices;
4250a0ba757dSStefano Zampini     PetscInt *add_to_where;
4251a0ba757dSStefano Zampini 
4252a0ba757dSStefano Zampini     ierr = MPI_Comm_rank(interface_comm,&my_rank);CHKERRQ(ierr);
4253a0ba757dSStefano Zampini     ierr = PetscMalloc((where_values+1)*sizeof(PetscInt),&cum_recv_counts);CHKERRQ(ierr);
4254a0ba757dSStefano Zampini     ierr = PetscMemzero(cum_recv_counts,(where_values+1)*sizeof(PetscInt));CHKERRQ(ierr);
4255a0ba757dSStefano Zampini     ierr = PetscMalloc(where_values*sizeof(PetscInt),&where_to_nodes_indices);CHKERRQ(ierr);
4256a0ba757dSStefano Zampini     /* first count how many neighbours per connected component I will receive from */
4257a0ba757dSStefano Zampini     cum_recv_counts[0]=0;
4258a0ba757dSStefano Zampini     for(i=1;i<where_values+1;i++){
4259a0ba757dSStefano Zampini       j=0;
4260a0ba757dSStefano Zampini       while(mat_graph->where[j] != i) j++;
4261a0ba757dSStefano Zampini       where_to_nodes_indices[i-1]=j;
4262da1bb401SStefano Zampini       if(mat_graph->neighbours_set[j][0]!=-1) { cum_recv_counts[i]=cum_recv_counts[i-1]+mat_graph->count[j]; } /* We don't want sends/recvs_to/from_self -> here I don't count myself  */
42633b03a366Sstefano_zampini       else { cum_recv_counts[i]=cum_recv_counts[i-1]+mat_graph->count[j]-1; }
4264a0ba757dSStefano Zampini     }
4265a0ba757dSStefano Zampini     buffer_size=2*cum_recv_counts[where_values]+mat_graph->nvtxs;
4266a0ba757dSStefano Zampini     ierr = PetscMalloc(2*cum_recv_counts[where_values]*sizeof(PetscMPIInt),&recv_buffer_where);CHKERRQ(ierr);
4267a0ba757dSStefano Zampini     ierr = PetscMalloc(buffer_size*sizeof(PetscMPIInt),&send_buffer);CHKERRQ(ierr);
4268a0ba757dSStefano Zampini     ierr = PetscMalloc(cum_recv_counts[where_values]*sizeof(MPI_Request),&send_requests);CHKERRQ(ierr);
4269a0ba757dSStefano Zampini     ierr = PetscMalloc(cum_recv_counts[where_values]*sizeof(MPI_Request),&recv_requests);CHKERRQ(ierr);
4270a0ba757dSStefano Zampini     for(i=0;i<cum_recv_counts[where_values];i++) {
4271a0ba757dSStefano Zampini       send_requests[i]=MPI_REQUEST_NULL;
4272a0ba757dSStefano Zampini       recv_requests[i]=MPI_REQUEST_NULL;
4273a0ba757dSStefano Zampini     }
4274a0ba757dSStefano Zampini     /* exchange with my neighbours the number of my connected components on the shared interface */
4275a0ba757dSStefano Zampini     for(i=0;i<where_values;i++){
4276a0ba757dSStefano Zampini       j=where_to_nodes_indices[i];
4277da1bb401SStefano Zampini       k = (mat_graph->neighbours_set[j][0] == -1 ?  1 : 0);
4278a0ba757dSStefano Zampini       for(;k<mat_graph->count[j];k++){
4279da1bb401SStefano Zampini         ierr = MPI_Isend(&mat_graph->where_ncmps[i],1,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr);
4280da1bb401SStefano Zampini         ierr = MPI_Irecv(&recv_buffer_where[sum_requests],1,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr);
4281a0ba757dSStefano Zampini         sum_requests++;
4282a0ba757dSStefano Zampini       }
4283a0ba757dSStefano Zampini     }
4284a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4285a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4286a0ba757dSStefano Zampini     /* determine the connected component I need to adapt */
4287a0ba757dSStefano Zampini     ierr = PetscMalloc(where_values*sizeof(PetscInt),&where_cc_adapt);CHKERRQ(ierr);
4288a0ba757dSStefano Zampini     ierr = PetscMemzero(where_cc_adapt,where_values*sizeof(PetscInt));CHKERRQ(ierr);
4289a0ba757dSStefano Zampini     for(i=0;i<where_values;i++){
4290a0ba757dSStefano Zampini       for(j=cum_recv_counts[i];j<cum_recv_counts[i+1];j++){
42913b03a366Sstefano_zampini         /* The first condition is natural (i.e someone has a different number of cc than me), the second one is just to be safe */
42923b03a366Sstefano_zampini         if( mat_graph->where_ncmps[i]!=recv_buffer_where[j] || mat_graph->where_ncmps[i] > 1 ) {
4293a0ba757dSStefano Zampini           where_cc_adapt[i]=PETSC_TRUE;
4294a0ba757dSStefano Zampini           break;
4295a0ba757dSStefano Zampini         }
4296a0ba757dSStefano Zampini       }
4297a0ba757dSStefano Zampini     }
4298a0ba757dSStefano Zampini     /* now get from neighbours their ccs (in global numbering) and adapt them (in case it is needed) */
4299a0ba757dSStefano Zampini     /* first determine how much data to send (size of each queue plus the global indices) and communicate it to neighbours */
4300a0ba757dSStefano Zampini     ierr = PetscMalloc(where_values*sizeof(PetscInt),&sizes_of_sends);CHKERRQ(ierr);
4301a0ba757dSStefano Zampini     ierr = PetscMemzero(sizes_of_sends,where_values*sizeof(PetscInt));CHKERRQ(ierr);
4302a0ba757dSStefano Zampini     sum_requests=0;
4303a0ba757dSStefano Zampini     start_of_send=0;
4304a0ba757dSStefano Zampini     start_of_recv=cum_recv_counts[where_values];
4305a0ba757dSStefano Zampini     for(i=0;i<where_values;i++) {
4306a0ba757dSStefano Zampini       if(where_cc_adapt[i]) {
4307a0ba757dSStefano Zampini         size_of_send=0;
4308a0ba757dSStefano Zampini         for(j=i;j<mat_graph->ncmps;j++) {
4309a0ba757dSStefano Zampini           if(mat_graph->where[mat_graph->queue[mat_graph->cptr[j]]] == i+1) { /* WARNING -> where values goes from 1 to where_values included */
4310a0ba757dSStefano Zampini             send_buffer[start_of_send+size_of_send]=mat_graph->cptr[j+1]-mat_graph->cptr[j];
4311a0ba757dSStefano Zampini             size_of_send+=1;
4312a0ba757dSStefano Zampini             for(k=0;k<mat_graph->cptr[j+1]-mat_graph->cptr[j];k++) {
4313a0ba757dSStefano Zampini               send_buffer[start_of_send+size_of_send+k]=queue_in_global_numbering[mat_graph->cptr[j]+k];
4314a0ba757dSStefano Zampini             }
4315a0ba757dSStefano Zampini             size_of_send=size_of_send+mat_graph->cptr[j+1]-mat_graph->cptr[j];
4316a0ba757dSStefano Zampini           }
4317a0ba757dSStefano Zampini         }
4318a0ba757dSStefano Zampini         j = where_to_nodes_indices[i];
4319da1bb401SStefano Zampini         k = (mat_graph->neighbours_set[j][0] == -1 ?  1 : 0);
432011d8f4c2SStefano Zampini         sizes_of_sends[i]=size_of_send;
4321a0ba757dSStefano Zampini         for(;k<mat_graph->count[j];k++){
432211d8f4c2SStefano Zampini           ierr = MPI_Isend(&sizes_of_sends[i],1,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr);
4323da1bb401SStefano Zampini           ierr = MPI_Irecv(&recv_buffer_where[sum_requests+start_of_recv],1,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr);
4324a0ba757dSStefano Zampini           sum_requests++;
4325a0ba757dSStefano Zampini         }
4326a0ba757dSStefano Zampini         start_of_send+=size_of_send;
4327a0ba757dSStefano Zampini       }
4328a0ba757dSStefano Zampini     }
4329a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4330a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4331a0ba757dSStefano Zampini     buffer_size=0;
4332a0ba757dSStefano Zampini     for(k=0;k<sum_requests;k++) { buffer_size+=recv_buffer_where[start_of_recv+k]; }
4333a0ba757dSStefano Zampini     ierr = PetscMalloc(buffer_size*sizeof(PetscMPIInt),&recv_buffer);CHKERRQ(ierr);
4334a0ba757dSStefano Zampini     /* now exchange the data */
4335a0ba757dSStefano Zampini     start_of_recv=0;
4336a0ba757dSStefano Zampini     start_of_send=0;
4337a0ba757dSStefano Zampini     sum_requests=0;
4338a0ba757dSStefano Zampini     for(i=0;i<where_values;i++) {
4339a0ba757dSStefano Zampini       if(where_cc_adapt[i]) {
4340a0ba757dSStefano Zampini         size_of_send = sizes_of_sends[i];
4341a0ba757dSStefano Zampini         j = where_to_nodes_indices[i];
4342da1bb401SStefano Zampini         k = (mat_graph->neighbours_set[j][0] == -1 ?  1 : 0);
4343a0ba757dSStefano Zampini         for(;k<mat_graph->count[j];k++){
4344da1bb401SStefano Zampini           ierr = MPI_Isend(&send_buffer[start_of_send],size_of_send,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr);
4345a0ba757dSStefano Zampini           size_of_recv=recv_buffer_where[cum_recv_counts[where_values]+sum_requests];
4346da1bb401SStefano Zampini           ierr = MPI_Irecv(&recv_buffer[start_of_recv],size_of_recv,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr);
4347a0ba757dSStefano Zampini           start_of_recv+=size_of_recv;
4348a0ba757dSStefano Zampini           sum_requests++;
4349a0ba757dSStefano Zampini         }
4350a0ba757dSStefano Zampini         start_of_send+=size_of_send;
4351a0ba757dSStefano Zampini       }
4352a0ba757dSStefano Zampini     }
4353a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4354a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
4355a0ba757dSStefano Zampini     ierr = PetscMalloc(buffer_size*sizeof(PetscInt),&petsc_buffer);CHKERRQ(ierr);
4356a0ba757dSStefano Zampini     for(k=0;k<start_of_recv;k++) { petsc_buffer[k]=(PetscInt)recv_buffer[k]; }
4357a0ba757dSStefano Zampini     for(j=0;j<buffer_size;) {
4358a0ba757dSStefano Zampini        ierr = ISGlobalToLocalMappingApply(matis->mapping,IS_GTOLM_MASK,petsc_buffer[j],&petsc_buffer[j+1],&petsc_buffer[j],&petsc_buffer[j+1]);CHKERRQ(ierr);
4359a0ba757dSStefano Zampini        k=petsc_buffer[j]+1;
4360a0ba757dSStefano Zampini        j+=k;
4361a0ba757dSStefano Zampini     }
4362a0ba757dSStefano Zampini     sum_requests=cum_recv_counts[where_values];
4363a0ba757dSStefano Zampini     start_of_recv=0;
4364a0ba757dSStefano Zampini     ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt),&nodes_to_temp_buffer_indices);CHKERRQ(ierr);
4365a0ba757dSStefano Zampini     global_where_counter=0;
4366a0ba757dSStefano Zampini     for(i=0;i<where_values;i++){
4367a0ba757dSStefano Zampini       if(where_cc_adapt[i]){
4368a0ba757dSStefano Zampini         temp_buffer_size=0;
4369a0ba757dSStefano Zampini         /* find nodes on the shared interface we need to adapt */
4370a0ba757dSStefano Zampini         for(j=0;j<mat_graph->nvtxs;j++){
4371a0ba757dSStefano Zampini           if(mat_graph->where[j]==i+1) {
4372a0ba757dSStefano Zampini             nodes_to_temp_buffer_indices[j]=temp_buffer_size;
4373a0ba757dSStefano Zampini             temp_buffer_size++;
4374a0ba757dSStefano Zampini           } else {
4375a0ba757dSStefano Zampini             nodes_to_temp_buffer_indices[j]=-1;
4376a0ba757dSStefano Zampini           }
4377a0ba757dSStefano Zampini         }
4378a0ba757dSStefano Zampini         /* allocate some temporary space */
4379a0ba757dSStefano Zampini         ierr = PetscMalloc(temp_buffer_size*sizeof(PetscInt*),&temp_buffer);CHKERRQ(ierr);
4380a0ba757dSStefano Zampini         ierr = PetscMalloc(temp_buffer_size*(cum_recv_counts[i+1]-cum_recv_counts[i])*sizeof(PetscInt),&temp_buffer[0]);CHKERRQ(ierr);
4381a0ba757dSStefano Zampini         ierr = PetscMemzero(temp_buffer[0],temp_buffer_size*(cum_recv_counts[i+1]-cum_recv_counts[i])*sizeof(PetscInt));CHKERRQ(ierr);
4382a0ba757dSStefano Zampini         for(j=1;j<temp_buffer_size;j++){
4383a0ba757dSStefano Zampini           temp_buffer[j]=temp_buffer[j-1]+cum_recv_counts[i+1]-cum_recv_counts[i];
4384a0ba757dSStefano Zampini         }
4385a0ba757dSStefano Zampini         /* analyze contributions from neighbouring subdomains for i-th conn comp
4386a0ba757dSStefano Zampini            temp buffer structure:
4387a0ba757dSStefano Zampini            supposing part of the interface has dimension 5 (global nodes 0,1,2,3,4)
4388a0ba757dSStefano Zampini            3 neighs procs with structured connected components:
4389a0ba757dSStefano Zampini              neigh 0: [0 1 4], [2 3];  (2 connected components)
4390a0ba757dSStefano Zampini              neigh 1: [0 1], [2 3 4];  (2 connected components)
4391a0ba757dSStefano Zampini              neigh 2: [0 4], [1], [2 3]; (3 connected components)
4392a0ba757dSStefano Zampini            tempbuffer (row-oriented) should be filled as:
4393a0ba757dSStefano Zampini              [ 0, 0, 0;
4394a0ba757dSStefano Zampini                0, 0, 1;
4395a0ba757dSStefano Zampini                1, 1, 2;
4396a0ba757dSStefano Zampini                1, 1, 2;
4397a0ba757dSStefano Zampini                0, 1, 0; ];
4398a0ba757dSStefano Zampini            This way we can simply recover the resulting structure, accounting for possible intersections of ccs among neighs.
4399a0ba757dSStefano Zampini            The mat_graph->where array will be modified to reproduce the following 4 connected components [0], [1], [2 3], [4];
4400a0ba757dSStefano Zampini                                                                                                                                    */
4401a0ba757dSStefano Zampini         for(j=0;j<cum_recv_counts[i+1]-cum_recv_counts[i];j++) {
4402a0ba757dSStefano Zampini           ins_val=0;
4403a0ba757dSStefano Zampini           size_of_recv=recv_buffer_where[sum_requests];  /* total size of recv from neighs */
4404a0ba757dSStefano Zampini           for(buffer_size=0;buffer_size<size_of_recv;) {  /* loop until all data from neighs has been taken into account */
4405a0ba757dSStefano Zampini             for(k=1;k<petsc_buffer[buffer_size+start_of_recv]+1;k++) { /* filling properly temp_buffer using data from a single recv */
4406a0ba757dSStefano Zampini               temp_buffer[ nodes_to_temp_buffer_indices[ petsc_buffer[ start_of_recv+buffer_size+k ] ] ][j]=ins_val;
4407a0ba757dSStefano Zampini             }
4408a0ba757dSStefano Zampini             buffer_size+=k;
4409a0ba757dSStefano Zampini             ins_val++;
4410a0ba757dSStefano Zampini           }
4411a0ba757dSStefano Zampini           start_of_recv+=size_of_recv;
4412a0ba757dSStefano Zampini           sum_requests++;
4413a0ba757dSStefano Zampini         }
4414a0ba757dSStefano Zampini         ierr = PetscMalloc(temp_buffer_size*sizeof(PetscInt),&add_to_where);CHKERRQ(ierr);
4415a0ba757dSStefano Zampini         ierr = PetscMemzero(add_to_where,temp_buffer_size*sizeof(PetscInt));CHKERRQ(ierr);
4416a0ba757dSStefano Zampini         for(j=0;j<temp_buffer_size;j++){
4417a0ba757dSStefano Zampini           if(!add_to_where[j]){ /* found a new cc  */
4418a0ba757dSStefano Zampini             global_where_counter++;
4419a0ba757dSStefano Zampini             add_to_where[j]=global_where_counter;
4420a0ba757dSStefano Zampini             for(k=j+1;k<temp_buffer_size;k++){ /* check for other nodes in new cc */
4421a0ba757dSStefano Zampini               same_set=PETSC_TRUE;
4422a0ba757dSStefano Zampini               for(s=0;s<cum_recv_counts[i+1]-cum_recv_counts[i];s++){
4423a0ba757dSStefano Zampini                 if(temp_buffer[j][s]!=temp_buffer[k][s]) {
4424a0ba757dSStefano Zampini                   same_set=PETSC_FALSE;
4425a0ba757dSStefano Zampini                   break;
4426a0ba757dSStefano Zampini                 }
4427a0ba757dSStefano Zampini               }
4428a0ba757dSStefano Zampini               if(same_set) add_to_where[k]=global_where_counter;
4429a0ba757dSStefano Zampini             }
4430a0ba757dSStefano Zampini           }
4431a0ba757dSStefano Zampini         }
4432a0ba757dSStefano Zampini         /* insert new data in where array */
4433a0ba757dSStefano Zampini         temp_buffer_size=0;
4434a0ba757dSStefano Zampini         for(j=0;j<mat_graph->nvtxs;j++){
4435a0ba757dSStefano Zampini           if(mat_graph->where[j]==i+1) {
4436a0ba757dSStefano Zampini             mat_graph->where[j]=where_values+add_to_where[temp_buffer_size];
4437a0ba757dSStefano Zampini             temp_buffer_size++;
4438a0ba757dSStefano Zampini           }
4439a0ba757dSStefano Zampini         }
4440a0ba757dSStefano Zampini         ierr = PetscFree(temp_buffer[0]);CHKERRQ(ierr);
4441a0ba757dSStefano Zampini         ierr = PetscFree(temp_buffer);CHKERRQ(ierr);
4442a0ba757dSStefano Zampini         ierr = PetscFree(add_to_where);CHKERRQ(ierr);
4443a0ba757dSStefano Zampini       }
4444a0ba757dSStefano Zampini     }
4445a0ba757dSStefano Zampini     ierr = PetscFree(nodes_to_temp_buffer_indices);CHKERRQ(ierr);
4446a0ba757dSStefano Zampini     ierr = PetscFree(sizes_of_sends);CHKERRQ(ierr);
4447a0ba757dSStefano Zampini     ierr = PetscFree(send_requests);CHKERRQ(ierr);
4448a0ba757dSStefano Zampini     ierr = PetscFree(recv_requests);CHKERRQ(ierr);
4449a0ba757dSStefano Zampini     ierr = PetscFree(petsc_buffer);CHKERRQ(ierr);
4450a0ba757dSStefano Zampini     ierr = PetscFree(recv_buffer);CHKERRQ(ierr);
4451a0ba757dSStefano Zampini     ierr = PetscFree(recv_buffer_where);CHKERRQ(ierr);
4452a0ba757dSStefano Zampini     ierr = PetscFree(send_buffer);CHKERRQ(ierr);
4453a0ba757dSStefano Zampini     ierr = PetscFree(cum_recv_counts);CHKERRQ(ierr);
4454a0ba757dSStefano Zampini     ierr = PetscFree(where_to_nodes_indices);CHKERRQ(ierr);
445523d4d1a5SStefano Zampini     ierr = PetscFree(where_cc_adapt);CHKERRQ(ierr);
4456a0ba757dSStefano Zampini     /* We are ready to evaluate consistent connected components on each part of the shared interface */
4457a0ba757dSStefano Zampini     if(global_where_counter) {
4458a0ba757dSStefano Zampini       for(i=0;i<mat_graph->nvtxs;i++){ mat_graph->touched[i]=PETSC_FALSE; }
4459a0ba757dSStefano Zampini       global_where_counter=0;
4460a0ba757dSStefano Zampini       for(i=0;i<mat_graph->nvtxs;i++){
4461a0ba757dSStefano Zampini         if(mat_graph->where[i] && !mat_graph->touched[i]) {
4462a0ba757dSStefano Zampini           global_where_counter++;
4463a0ba757dSStefano Zampini           for(j=i+1;j<mat_graph->nvtxs;j++){
4464a0ba757dSStefano Zampini             if(!mat_graph->touched[j] && mat_graph->where[j]==mat_graph->where[i]) {
4465a0ba757dSStefano Zampini               mat_graph->where[j]=global_where_counter;
4466a0ba757dSStefano Zampini               mat_graph->touched[j]=PETSC_TRUE;
4467a0ba757dSStefano Zampini             }
4468a0ba757dSStefano Zampini           }
4469a0ba757dSStefano Zampini           mat_graph->where[i]=global_where_counter;
4470a0ba757dSStefano Zampini           mat_graph->touched[i]=PETSC_TRUE;
4471a0ba757dSStefano Zampini         }
4472a0ba757dSStefano Zampini       }
4473a0ba757dSStefano Zampini       where_values=global_where_counter;
4474a0ba757dSStefano Zampini     }
4475a0ba757dSStefano Zampini     if(global_where_counter) {
4476a0ba757dSStefano Zampini       ierr = PetscMemzero(mat_graph->cptr,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr);
4477a0ba757dSStefano Zampini       ierr = PetscMemzero(mat_graph->queue,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
4478a0ba757dSStefano Zampini       ierr = PetscFree(mat_graph->where_ncmps);CHKERRQ(ierr);
4479a0ba757dSStefano Zampini       ierr = PetscMalloc(where_values*sizeof(PetscMPIInt),&mat_graph->where_ncmps);CHKERRQ(ierr);
4480a0ba757dSStefano Zampini       ierr = PCBDDCFindConnectedComponents(mat_graph, where_values);
4481a0ba757dSStefano Zampini       for(i=0;i<mat_graph->ncmps;i++) {
4482a0ba757dSStefano Zampini         ierr = ISLocalToGlobalMappingApply(matis->mapping,mat_graph->cptr[i+1]-mat_graph->cptr[i],&mat_graph->queue[mat_graph->cptr[i]],&queue_in_global_numbering[mat_graph->cptr[i]]);CHKERRQ(ierr);
4483a0ba757dSStefano Zampini         ierr = PetscSortIntWithArray(mat_graph->cptr[i+1]-mat_graph->cptr[i],&queue_in_global_numbering[mat_graph->cptr[i]],&mat_graph->queue[mat_graph->cptr[i]]);CHKERRQ(ierr);
4484a0ba757dSStefano Zampini       }
4485a0ba757dSStefano Zampini     }
44863b03a366Sstefano_zampini   } /* Finished adapting interface */
44870c7d97c5SJed Brown   PetscInt nfc=0;
44880c7d97c5SJed Brown   PetscInt nec=0;
44890c7d97c5SJed Brown   PetscInt nvc=0;
44903b03a366Sstefano_zampini   PetscBool twodim_flag=PETSC_FALSE;
44910c7d97c5SJed Brown   for (i=0; i<mat_graph->ncmps; i++) {
44923b03a366Sstefano_zampini     if( mat_graph->cptr[i+1]-mat_graph->cptr[i] > vertex_size ){
4493534831adSStefano Zampini       if(mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]==1){ /* 1 neigh Neumann fake included */
44940c7d97c5SJed Brown         nfc++;
44953b03a366Sstefano_zampini       } else { /* note that nec will be zero in 2d */
44963b03a366Sstefano_zampini         nec++;
44973b03a366Sstefano_zampini       }
44980c7d97c5SJed Brown     } else {
44993b03a366Sstefano_zampini       nvc+=mat_graph->cptr[i+1]-mat_graph->cptr[i];
45003b03a366Sstefano_zampini     }
45013b03a366Sstefano_zampini   }
45023b03a366Sstefano_zampini 
45033b03a366Sstefano_zampini   if(!nec) { /* we are in a 2d case -> no faces, only edges */
45043b03a366Sstefano_zampini     nec = nfc;
45053b03a366Sstefano_zampini     nfc = 0;
45063b03a366Sstefano_zampini     twodim_flag = PETSC_TRUE;
45073b03a366Sstefano_zampini   }
45083972b0daSStefano Zampini   /* allocate IS arrays for faces, edges. Vertices need a single index set. */
45093972b0daSStefano Zampini   k=0;
45103972b0daSStefano Zampini   for (i=0; i<mat_graph->ncmps; i++) {
45113972b0daSStefano Zampini     j=mat_graph->cptr[i+1]-mat_graph->cptr[i];
45123972b0daSStefano Zampini     if( j > k) {
45133972b0daSStefano Zampini       k=j;
45143972b0daSStefano Zampini     }
4515ba1573a8SStefano Zampini     if(j<=vertex_size) {
4516ba1573a8SStefano Zampini       k+=vertex_size;
4517ba1573a8SStefano Zampini     }
45183972b0daSStefano Zampini   }
45193972b0daSStefano Zampini   ierr = PetscMalloc(k*sizeof(PetscInt),&auxis);CHKERRQ(ierr);
45203972b0daSStefano Zampini 
45213b03a366Sstefano_zampini   if(!pcbddc->vertices_flag && !pcbddc->edges_flag) {
45223b03a366Sstefano_zampini     ierr = PetscMalloc(nfc*sizeof(IS),&pcbddc->ISForFaces);CHKERRQ(ierr);
45233b03a366Sstefano_zampini     use_faces=PETSC_TRUE;
45243b03a366Sstefano_zampini   }
45253b03a366Sstefano_zampini   if(!pcbddc->vertices_flag && !pcbddc->faces_flag) {
45263b03a366Sstefano_zampini     ierr = PetscMalloc(nec*sizeof(IS),&pcbddc->ISForEdges);CHKERRQ(ierr);
45273b03a366Sstefano_zampini     use_edges=PETSC_TRUE;
45283b03a366Sstefano_zampini   }
45293b03a366Sstefano_zampini   nfc=0;
45303b03a366Sstefano_zampini   nec=0;
45313b03a366Sstefano_zampini   for (i=0; i<mat_graph->ncmps; i++) {
45323b03a366Sstefano_zampini     if( mat_graph->cptr[i+1]-mat_graph->cptr[i] > vertex_size ){
45333b03a366Sstefano_zampini       for(j=0;j<mat_graph->cptr[i+1]-mat_graph->cptr[i];j++) {
45343972b0daSStefano Zampini         auxis[j]=mat_graph->queue[mat_graph->cptr[i]+j];
45353b03a366Sstefano_zampini       }
45363b03a366Sstefano_zampini       if(mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]==1){
45373b03a366Sstefano_zampini         if(twodim_flag) {
45383b03a366Sstefano_zampini           if(use_edges) {
45393972b0daSStefano Zampini             ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForEdges[nec]);CHKERRQ(ierr);
45403b03a366Sstefano_zampini             nec++;
45413b03a366Sstefano_zampini           }
45423b03a366Sstefano_zampini         } else {
45433b03a366Sstefano_zampini           if(use_faces) {
45443972b0daSStefano Zampini             ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForFaces[nfc]);CHKERRQ(ierr);
45453b03a366Sstefano_zampini             nfc++;
45463b03a366Sstefano_zampini           }
45473b03a366Sstefano_zampini         }
45483b03a366Sstefano_zampini       } else {
45493b03a366Sstefano_zampini         if(use_edges) {
45503972b0daSStefano Zampini           ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForEdges[nec]);CHKERRQ(ierr);
45510c7d97c5SJed Brown           nec++;
45520c7d97c5SJed Brown         }
45530c7d97c5SJed Brown       }
45540c7d97c5SJed Brown     }
45553b03a366Sstefano_zampini   }
45563b03a366Sstefano_zampini   pcbddc->n_ISForFaces=nfc;
45573b03a366Sstefano_zampini   pcbddc->n_ISForEdges=nec;
45583b03a366Sstefano_zampini   nvc=0;
45590c7d97c5SJed Brown   if( !pcbddc->constraints_flag ) {
45603b03a366Sstefano_zampini     for (i=0; i<mat_graph->ncmps; i++) {
45613b03a366Sstefano_zampini       if( mat_graph->cptr[i+1]-mat_graph->cptr[i] <= vertex_size ){
45623b03a366Sstefano_zampini         for( j=mat_graph->cptr[i];j<mat_graph->cptr[i+1];j++) {
45633972b0daSStefano Zampini           auxis[nvc]=mat_graph->queue[j];
45640c7d97c5SJed Brown           nvc++;
45650c7d97c5SJed Brown         }
45660c7d97c5SJed Brown       }
45670c7d97c5SJed Brown     }
45680c7d97c5SJed Brown   }
4569a0ba757dSStefano Zampini   /* sort vertex set (by local ordering) */
45703972b0daSStefano Zampini   ierr = PetscSortInt(nvc,auxis);CHKERRQ(ierr);
45713972b0daSStefano Zampini   ierr = ISCreateGeneral(PETSC_COMM_SELF,nvc,auxis,PETSC_COPY_VALUES,&pcbddc->ISForVertices);CHKERRQ(ierr);
45720c7d97c5SJed Brown 
4573e269702eSStefano Zampini   if(pcbddc->dbg_flag) {
4574e269702eSStefano Zampini 
4575d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr);
4576d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Details from PCBDDCManageLocalBoundaries for subdomain %04d\n",PetscGlobalRank);CHKERRQ(ierr);
4577d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr);
4578a0ba757dSStefano Zampini /*    ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Graph (adjacency structure) of local Neumann mat\n");CHKERRQ(ierr);
4579a0ba757dSStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr);
4580e269702eSStefano Zampini     for(i=0;i<mat_graph->nvtxs;i++) {
4581a0ba757dSStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Nodes connected to node number %d are %d\n",i,mat_graph->xadj[i+1]-mat_graph->xadj[i]);CHKERRQ(ierr);
4582e269702eSStefano Zampini       for(j=mat_graph->xadj[i];j<mat_graph->xadj[i+1];j++){
4583a0ba757dSStefano Zampini         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d ",mat_graph->adjncy[j]);CHKERRQ(ierr);
4584e269702eSStefano Zampini       }
4585a0ba757dSStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n--------------------------------------------------------------\n");CHKERRQ(ierr);
4586da1bb401SStefano Zampini     }*/
4587d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Matrix graph has %d connected components", mat_graph->ncmps);CHKERRQ(ierr);
45880c7d97c5SJed Brown     for(i=0;i<mat_graph->ncmps;i++) {
45893b03a366Sstefano_zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\nDetails for connected component number %02d: size %04d, count %01d. Nodes follow.\n",
45903b03a366Sstefano_zampini              i,mat_graph->cptr[i+1]-mat_graph->cptr[i],mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]);CHKERRQ(ierr);
4591da1bb401SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"subdomains: ");
4592da1bb401SStefano Zampini       for (j=0;j<mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]; j++) {
4593da1bb401SStefano Zampini         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d ",mat_graph->neighbours_set[mat_graph->queue[mat_graph->cptr[i]]][j]);
4594da1bb401SStefano Zampini       }
4595da1bb401SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n");
45960c7d97c5SJed Brown       for (j=mat_graph->cptr[i]; j<mat_graph->cptr[i+1]; j++){
4597da1bb401SStefano Zampini         /* ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d (%d), ",queue_in_global_numbering[j],mat_graph->queue[j]);CHKERRQ(ierr); */
4598da1bb401SStefano Zampini         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d, ",mat_graph->queue[j]);CHKERRQ(ierr);
45990c7d97c5SJed Brown       }
46000c7d97c5SJed Brown     }
4601da1bb401SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n--------------------------------------------------------------\n");CHKERRQ(ierr);
46023b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local vertices\n",PetscGlobalRank,nvc);CHKERRQ(ierr);
46033b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local faces\n",PetscGlobalRank,nfc);CHKERRQ(ierr);
46043b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local edges\n",PetscGlobalRank,nec);CHKERRQ(ierr);
4605d49ef151SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
46060c7d97c5SJed Brown   }
46070c7d97c5SJed Brown 
46083972b0daSStefano Zampini   ierr = PetscFree(queue_in_global_numbering);CHKERRQ(ierr);
46093972b0daSStefano Zampini   ierr = PetscFree(auxis);CHKERRQ(ierr);
46100c7d97c5SJed Brown   PetscFunctionReturn(0);
46110c7d97c5SJed Brown 
46120c7d97c5SJed Brown }
46130c7d97c5SJed Brown 
46140c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
46150c7d97c5SJed Brown 
/* The following code has been adapted from the function IsConnectedSubdomain contained
   in the source file contig.c of the METIS library (version 5.0.1).
   It finds the connected components of each partition labeled from 1 to n_dist. */
46190c7d97c5SJed Brown 
46200c7d97c5SJed Brown #undef __FUNCT__
46210c7d97c5SJed Brown #define __FUNCT__ "PCBDDCFindConnectedComponents"
46229c0446d6SStefano Zampini static PetscErrorCode PCBDDCFindConnectedComponents(PCBDDCGraph graph, PetscInt n_dist )
46230c7d97c5SJed Brown {
46240c7d97c5SJed Brown   PetscInt i, j, k, nvtxs, first, last, nleft, ncmps,pid,cum_queue,n,ncmps_pid;
46250c7d97c5SJed Brown   PetscInt *xadj, *adjncy, *where, *queue;
46260c7d97c5SJed Brown   PetscInt *cptr;
46270c7d97c5SJed Brown   PetscBool *touched;
46280c7d97c5SJed Brown 
46290c7d97c5SJed Brown   PetscFunctionBegin;
46300c7d97c5SJed Brown 
46310c7d97c5SJed Brown   nvtxs   = graph->nvtxs;
46320c7d97c5SJed Brown   xadj    = graph->xadj;
46330c7d97c5SJed Brown   adjncy  = graph->adjncy;
46340c7d97c5SJed Brown   where   = graph->where;
46350c7d97c5SJed Brown   touched = graph->touched;
46360c7d97c5SJed Brown   queue   = graph->queue;
46370c7d97c5SJed Brown   cptr    = graph->cptr;
46380c7d97c5SJed Brown 
46390c7d97c5SJed Brown   for (i=0; i<nvtxs; i++)
46400c7d97c5SJed Brown     touched[i] = PETSC_FALSE;
46410c7d97c5SJed Brown 
46420c7d97c5SJed Brown   cum_queue=0;
46430c7d97c5SJed Brown   ncmps=0;
46440c7d97c5SJed Brown 
46450c7d97c5SJed Brown   for(n=0; n<n_dist; n++) {
4646da1bb401SStefano Zampini     pid = n+1;  /* partition labeled by 0 is discarded */
46470c7d97c5SJed Brown     nleft = 0;
46480c7d97c5SJed Brown     for (i=0; i<nvtxs; i++) {
46490c7d97c5SJed Brown       if (where[i] == pid)
46500c7d97c5SJed Brown         nleft++;
46510c7d97c5SJed Brown     }
46520c7d97c5SJed Brown     for (i=0; i<nvtxs; i++) {
46530c7d97c5SJed Brown       if (where[i] == pid)
46540c7d97c5SJed Brown         break;
46550c7d97c5SJed Brown     }
46560c7d97c5SJed Brown     touched[i] = PETSC_TRUE;
46570c7d97c5SJed Brown     queue[cum_queue] = i;
46580c7d97c5SJed Brown     first = 0; last = 1;
46590c7d97c5SJed Brown     cptr[ncmps] = cum_queue;  /* This actually points to queue */
46600c7d97c5SJed Brown     ncmps_pid = 0;
46610c7d97c5SJed Brown     while (first != nleft) {
46620c7d97c5SJed Brown       if (first == last) { /* Find another starting vertex */
46630c7d97c5SJed Brown         cptr[++ncmps] = first+cum_queue;
46640c7d97c5SJed Brown         ncmps_pid++;
46650c7d97c5SJed Brown         for (i=0; i<nvtxs; i++) {
46660c7d97c5SJed Brown           if (where[i] == pid && !touched[i])
46670c7d97c5SJed Brown             break;
46680c7d97c5SJed Brown         }
46690c7d97c5SJed Brown         queue[cum_queue+last] = i;
46700c7d97c5SJed Brown         last++;
46710c7d97c5SJed Brown         touched[i] = PETSC_TRUE;
46720c7d97c5SJed Brown       }
46730c7d97c5SJed Brown       i = queue[cum_queue+first];
46740c7d97c5SJed Brown       first++;
46750c7d97c5SJed Brown       for (j=xadj[i]; j<xadj[i+1]; j++) {
46760c7d97c5SJed Brown         k = adjncy[j];
46770c7d97c5SJed Brown         if (where[k] == pid && !touched[k]) {
46780c7d97c5SJed Brown           queue[cum_queue+last] = k;
46790c7d97c5SJed Brown           last++;
46800c7d97c5SJed Brown           touched[k] = PETSC_TRUE;
46810c7d97c5SJed Brown         }
46820c7d97c5SJed Brown       }
46830c7d97c5SJed Brown     }
46840c7d97c5SJed Brown     cptr[++ncmps] = first+cum_queue;
46850c7d97c5SJed Brown     ncmps_pid++;
46860c7d97c5SJed Brown     cum_queue=cptr[ncmps];
4687a0ba757dSStefano Zampini     graph->where_ncmps[n] = ncmps_pid;
46880c7d97c5SJed Brown   }
46890c7d97c5SJed Brown   graph->ncmps = ncmps;
46900c7d97c5SJed Brown 
46910c7d97c5SJed Brown   PetscFunctionReturn(0);
46920c7d97c5SJed Brown }
4693