xref: /petsc/src/ksp/pc/impls/bddc/bddc.c (revision 534831adffddd762cbff73f5893cfd24dcb6ad3c)
/* TODOLIST
   DofSplitting and DM attached to pc?
   Change SetNeumannBoundaries to SetNeumannBoundariesLocal and provide new SetNeumannBoundaries (same for Dirichlet)
   Exact solvers: Solve local saddle point directly
     - change prec_type to switch_inexact_prec_type
     - add bool solve_exact_saddle_point slot to pcbddc data
   Inexact solvers: global preconditioner application is ready, ask the developers (Jed?) how to best implement Dohrmann's approach (PCSHELL?)
   change how to deal with the coarse problem (PCBDDCSetCoarseEnvironment):
     - mind the problem with coarsening_factor
     - simplify coarse problem structure -> PCBDDC or PCREDUNDANT, nothing else -> same comm for all levels?
     - remove coarse enums and allow use of PCBDDCGetCoarseKSP
     - remove metis dependency -> use MatPartitioning for multilevel -> Assemble serial adjacency in ManageLocalBoundaries?
     - Add a levels slot to the bddc data structure and associated Set/Get functions
   code refactoring:
     - pick better names for static functions
   change options structure:
     - insert BDDC into MG framework?
   provide other ops? Ask the developers
   remove all unused printf
   man pages
*/
220c7d97c5SJed Brown 
/* ----------------------------------------------------------------------------------------------------------------------------------------------
   Implementation of BDDC preconditioner based on:
   C. Dohrmann "An approximate BDDC preconditioner", Numerical Linear Algebra with Applications Volume 14, Issue 2, pages 149-168, March 2007
   ---------------------------------------------------------------------------------------------------------------------------------------------- */

2753cdbc3dSStefano Zampini 
2853cdbc3dSStefano Zampini #include "bddc.h" /*I "petscpc.h" I*/  /* includes for fortran wrappers */
293b03a366Sstefano_zampini #include <petscblaslapack.h>
300c7d97c5SJed Brown 
310c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
320c7d97c5SJed Brown #undef __FUNCT__
330c7d97c5SJed Brown #define __FUNCT__ "PCSetFromOptions_BDDC"
340c7d97c5SJed Brown PetscErrorCode PCSetFromOptions_BDDC(PC pc)
350c7d97c5SJed Brown {
360c7d97c5SJed Brown   PC_BDDC         *pcbddc = (PC_BDDC*)pc->data;
370c7d97c5SJed Brown   PetscErrorCode ierr;
380c7d97c5SJed Brown 
390c7d97c5SJed Brown   PetscFunctionBegin;
400c7d97c5SJed Brown   ierr = PetscOptionsHead("BDDC options");CHKERRQ(ierr);
410c7d97c5SJed Brown   /* Verbose debugging of main data structures */
42e269702eSStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_check_all"       ,"Verbose (debugging) output for PCBDDC"                       ,"none",pcbddc->dbg_flag      ,&pcbddc->dbg_flag      ,PETSC_NULL);CHKERRQ(ierr);
430c7d97c5SJed Brown   /* Some customization for default primal space */
44da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_vertices_only"   ,"Use only vertices in coarse space (i.e. discard constraints)","none",pcbddc->vertices_flag   ,&pcbddc->vertices_flag   ,PETSC_NULL);CHKERRQ(ierr);
45da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_constraints_only","Use only constraints in coarse space (i.e. discard vertices)","none",pcbddc->constraints_flag,&pcbddc->constraints_flag,PETSC_NULL);CHKERRQ(ierr);
46da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_faces_only"      ,"Use only faces among constraints of coarse space (i.e. discard edges)"         ,"none",pcbddc->faces_flag      ,&pcbddc->faces_flag      ,PETSC_NULL);CHKERRQ(ierr);
47da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_edges_only"      ,"Use only edges among constraints of coarse space (i.e. discard faces)"         ,"none",pcbddc->edges_flag      ,&pcbddc->edges_flag      ,PETSC_NULL);CHKERRQ(ierr);
480c7d97c5SJed Brown   /* Coarse solver context */
49da1bb401SStefano Zampini   static const char *avail_coarse_problems[] = {"sequential","replicated","parallel","multilevel",""}; /*order of choiches depends on ENUM defined in bddc.h */
500c7d97c5SJed Brown   ierr = PetscOptionsEnum("-pc_bddc_coarse_problem_type","Set coarse problem type","none",avail_coarse_problems,(PetscEnum)pcbddc->coarse_problem_type,(PetscEnum*)&pcbddc->coarse_problem_type,PETSC_NULL);CHKERRQ(ierr);
510c7d97c5SJed Brown   /* Two different application of BDDC to the whole set of dofs, internal and interface */
520c7d97c5SJed Brown   ierr = PetscOptionsBool("-pc_bddc_switch_preconditioning_type","Switch between M_2 (default) and M_3 preconditioners (as defined by Dohrmann)","none",pcbddc->prec_type,&pcbddc->prec_type,PETSC_NULL);CHKERRQ(ierr);
53*534831adSStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_use_change_of_basis","Use change of basis approach for primal space","none",pcbddc->usechangeofbasis,&pcbddc->usechangeofbasis,PETSC_NULL);CHKERRQ(ierr);
54*534831adSStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_use_change_on_faces","Use change of basis approach for face constraints","none",pcbddc->usechangeonfaces,&pcbddc->usechangeonfaces,PETSC_NULL);CHKERRQ(ierr);
55*534831adSStefano Zampini   pcbddc->usechangeonfaces = pcbddc->usechangeonfaces && pcbddc->usechangeofbasis;
560c7d97c5SJed Brown   ierr = PetscOptionsInt("-pc_bddc_coarsening_ratio","Set coarsening ratio used in multilevel coarsening","none",pcbddc->coarsening_ratio,&pcbddc->coarsening_ratio,PETSC_NULL);CHKERRQ(ierr);
570c7d97c5SJed Brown   ierr = PetscOptionsTail();CHKERRQ(ierr);
580c7d97c5SJed Brown   PetscFunctionReturn(0);
590c7d97c5SJed Brown }
600c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
610c7d97c5SJed Brown EXTERN_C_BEGIN
620c7d97c5SJed Brown #undef __FUNCT__
630c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetCoarseProblemType_BDDC"
6453cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetCoarseProblemType_BDDC(PC pc, CoarseProblemType CPT)
650c7d97c5SJed Brown {
660c7d97c5SJed Brown   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
670c7d97c5SJed Brown 
680c7d97c5SJed Brown   PetscFunctionBegin;
690c7d97c5SJed Brown   pcbddc->coarse_problem_type = CPT;
700c7d97c5SJed Brown   PetscFunctionReturn(0);
710c7d97c5SJed Brown }
720c7d97c5SJed Brown EXTERN_C_END
730c7d97c5SJed Brown #undef __FUNCT__
740c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetCoarseProblemType"
7553cdbc3dSStefano Zampini /*@
769c0446d6SStefano Zampini  PCBDDCSetCoarseProblemType - Set coarse problem type in PCBDDC.
7753cdbc3dSStefano Zampini 
789c0446d6SStefano Zampini    Not collective
7953cdbc3dSStefano Zampini 
8053cdbc3dSStefano Zampini    Input Parameters:
8153cdbc3dSStefano Zampini +  pc - the preconditioning context
8253cdbc3dSStefano Zampini -  CoarseProblemType - pick a better name and explain what this is
8353cdbc3dSStefano Zampini 
8453cdbc3dSStefano Zampini    Level: intermediate
8553cdbc3dSStefano Zampini 
8653cdbc3dSStefano Zampini    Notes:
87da1bb401SStefano Zampini    Not collective but all procs must call with same arguments.
8853cdbc3dSStefano Zampini 
8953cdbc3dSStefano Zampini .seealso: PCBDDC
9053cdbc3dSStefano Zampini @*/
910c7d97c5SJed Brown PetscErrorCode PCBDDCSetCoarseProblemType(PC pc, CoarseProblemType CPT)
920c7d97c5SJed Brown {
930c7d97c5SJed Brown   PetscErrorCode ierr;
940c7d97c5SJed Brown 
950c7d97c5SJed Brown   PetscFunctionBegin;
960c7d97c5SJed Brown   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
970c7d97c5SJed Brown   ierr = PetscTryMethod(pc,"PCBDDCSetCoarseProblemType_C",(PC,CoarseProblemType),(pc,CPT));CHKERRQ(ierr);
980c7d97c5SJed Brown   PetscFunctionReturn(0);
990c7d97c5SJed Brown }
1000c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
1010c7d97c5SJed Brown EXTERN_C_BEGIN
1020c7d97c5SJed Brown #undef __FUNCT__
1033b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCSetDirichletBoundaries_BDDC"
1043b03a366Sstefano_zampini static PetscErrorCode PCBDDCSetDirichletBoundaries_BDDC(PC pc,IS DirichletBoundaries)
1053b03a366Sstefano_zampini {
1063b03a366Sstefano_zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
1073b03a366Sstefano_zampini   PetscErrorCode ierr;
1083b03a366Sstefano_zampini 
1093b03a366Sstefano_zampini   PetscFunctionBegin;
1103b03a366Sstefano_zampini   ierr = ISDestroy(&pcbddc->DirichletBoundaries);CHKERRQ(ierr);
11136e030ebSStefano Zampini   ierr = PetscObjectReference((PetscObject)DirichletBoundaries);CHKERRQ(ierr);
11236e030ebSStefano Zampini   pcbddc->DirichletBoundaries=DirichletBoundaries;
1133b03a366Sstefano_zampini   PetscFunctionReturn(0);
1143b03a366Sstefano_zampini }
1153b03a366Sstefano_zampini EXTERN_C_END
1163b03a366Sstefano_zampini #undef __FUNCT__
1173b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCSetDirichletBoundaries"
1183b03a366Sstefano_zampini /*@
119da1bb401SStefano Zampini  PCBDDCSetDirichletBoundaries - Set index set defining subdomain part (in local ordering)
120da1bb401SStefano Zampini                               of Dirichlet boundaries for the global problem.
1213b03a366Sstefano_zampini 
1223b03a366Sstefano_zampini    Not collective
1233b03a366Sstefano_zampini 
1243b03a366Sstefano_zampini    Input Parameters:
1253b03a366Sstefano_zampini +  pc - the preconditioning context
1263b03a366Sstefano_zampini -  DirichletBoundaries - sequential index set defining the subdomain part of Dirichlet boundaries (can be PETSC_NULL)
1273b03a366Sstefano_zampini 
1283b03a366Sstefano_zampini    Level: intermediate
1293b03a366Sstefano_zampini 
1303b03a366Sstefano_zampini    Notes:
1313b03a366Sstefano_zampini 
1323b03a366Sstefano_zampini .seealso: PCBDDC
1333b03a366Sstefano_zampini @*/
1343b03a366Sstefano_zampini PetscErrorCode PCBDDCSetDirichletBoundaries(PC pc,IS DirichletBoundaries)
1353b03a366Sstefano_zampini {
1363b03a366Sstefano_zampini   PetscErrorCode ierr;
1373b03a366Sstefano_zampini 
1383b03a366Sstefano_zampini   PetscFunctionBegin;
1393b03a366Sstefano_zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
1403b03a366Sstefano_zampini   ierr = PetscTryMethod(pc,"PCBDDCSetDirichletBoundaries_C",(PC,IS),(pc,DirichletBoundaries));CHKERRQ(ierr);
1413b03a366Sstefano_zampini   PetscFunctionReturn(0);
1423b03a366Sstefano_zampini }
1433b03a366Sstefano_zampini /* -------------------------------------------------------------------------- */
1443b03a366Sstefano_zampini EXTERN_C_BEGIN
1453b03a366Sstefano_zampini #undef __FUNCT__
1460c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetNeumannBoundaries_BDDC"
14753cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetNeumannBoundaries_BDDC(PC pc,IS NeumannBoundaries)
1480c7d97c5SJed Brown {
1490c7d97c5SJed Brown   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
15053cdbc3dSStefano Zampini   PetscErrorCode ierr;
1510c7d97c5SJed Brown 
1520c7d97c5SJed Brown   PetscFunctionBegin;
15353cdbc3dSStefano Zampini   ierr = ISDestroy(&pcbddc->NeumannBoundaries);CHKERRQ(ierr);
15436e030ebSStefano Zampini   ierr = PetscObjectReference((PetscObject)NeumannBoundaries);CHKERRQ(ierr);
15536e030ebSStefano Zampini   pcbddc->NeumannBoundaries=NeumannBoundaries;
1560c7d97c5SJed Brown   PetscFunctionReturn(0);
1570c7d97c5SJed Brown }
1580c7d97c5SJed Brown EXTERN_C_END
1590c7d97c5SJed Brown #undef __FUNCT__
1600c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetNeumannBoundaries"
16157527edcSJed Brown /*@
162da1bb401SStefano Zampini  PCBDDCSetNeumannBoundaries - Set index set defining subdomain part (in local ordering)
163da1bb401SStefano Zampini                               of Neumann boundaries for the global problem.
16457527edcSJed Brown 
1659c0446d6SStefano Zampini    Not collective
16657527edcSJed Brown 
16757527edcSJed Brown    Input Parameters:
16857527edcSJed Brown +  pc - the preconditioning context
1699c0446d6SStefano Zampini -  NeumannBoundaries - sequential index set defining the subdomain part of Neumann boundaries (can be PETSC_NULL)
17057527edcSJed Brown 
17157527edcSJed Brown    Level: intermediate
17257527edcSJed Brown 
17357527edcSJed Brown    Notes:
17457527edcSJed Brown 
17557527edcSJed Brown .seealso: PCBDDC
17657527edcSJed Brown @*/
17753cdbc3dSStefano Zampini PetscErrorCode PCBDDCSetNeumannBoundaries(PC pc,IS NeumannBoundaries)
1780c7d97c5SJed Brown {
1790c7d97c5SJed Brown   PetscErrorCode ierr;
1800c7d97c5SJed Brown 
1810c7d97c5SJed Brown   PetscFunctionBegin;
1820c7d97c5SJed Brown   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
18353cdbc3dSStefano Zampini   ierr = PetscTryMethod(pc,"PCBDDCSetNeumannBoundaries_C",(PC,IS),(pc,NeumannBoundaries));CHKERRQ(ierr);
18453cdbc3dSStefano Zampini   PetscFunctionReturn(0);
18553cdbc3dSStefano Zampini }
18653cdbc3dSStefano Zampini /* -------------------------------------------------------------------------- */
18753cdbc3dSStefano Zampini EXTERN_C_BEGIN
18853cdbc3dSStefano Zampini #undef __FUNCT__
189da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCGetDirichletBoundaries_BDDC"
190da1bb401SStefano Zampini static PetscErrorCode PCBDDCGetDirichletBoundaries_BDDC(PC pc,IS *DirichletBoundaries)
191da1bb401SStefano Zampini {
192da1bb401SStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
193da1bb401SStefano Zampini 
194da1bb401SStefano Zampini   PetscFunctionBegin;
195da1bb401SStefano Zampini   *DirichletBoundaries = pcbddc->DirichletBoundaries;
196da1bb401SStefano Zampini   PetscFunctionReturn(0);
197da1bb401SStefano Zampini }
198da1bb401SStefano Zampini EXTERN_C_END
199da1bb401SStefano Zampini #undef __FUNCT__
200da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCGetDirichletBoundaries"
201da1bb401SStefano Zampini /*@
202da1bb401SStefano Zampini  PCBDDCGetDirichletBoundaries - Get index set defining subdomain part (in local ordering)
203da1bb401SStefano Zampini                                 of Dirichlet boundaries for the global problem.
204da1bb401SStefano Zampini 
205da1bb401SStefano Zampini    Not collective
206da1bb401SStefano Zampini 
207da1bb401SStefano Zampini    Input Parameters:
208da1bb401SStefano Zampini +  pc - the preconditioning context
209da1bb401SStefano Zampini 
210da1bb401SStefano Zampini    Output Parameters:
211da1bb401SStefano Zampini +  DirichletBoundaries - index set defining the subdomain part of Dirichlet boundaries
212da1bb401SStefano Zampini 
213da1bb401SStefano Zampini    Level: intermediate
214da1bb401SStefano Zampini 
215da1bb401SStefano Zampini    Notes:
216da1bb401SStefano Zampini 
217da1bb401SStefano Zampini .seealso: PCBDDC
218da1bb401SStefano Zampini @*/
219da1bb401SStefano Zampini PetscErrorCode PCBDDCGetDirichletBoundaries(PC pc,IS *DirichletBoundaries)
220da1bb401SStefano Zampini {
221da1bb401SStefano Zampini   PetscErrorCode ierr;
222da1bb401SStefano Zampini 
223da1bb401SStefano Zampini   PetscFunctionBegin;
224da1bb401SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
225da1bb401SStefano Zampini   ierr = PetscUseMethod(pc,"PCBDDCGetDirichletBoundaries_C",(PC,IS*),(pc,DirichletBoundaries));CHKERRQ(ierr);
226da1bb401SStefano Zampini   PetscFunctionReturn(0);
227da1bb401SStefano Zampini }
228da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
229da1bb401SStefano Zampini EXTERN_C_BEGIN
230da1bb401SStefano Zampini #undef __FUNCT__
23153cdbc3dSStefano Zampini #define __FUNCT__ "PCBDDCGetNeumannBoundaries_BDDC"
23253cdbc3dSStefano Zampini static PetscErrorCode PCBDDCGetNeumannBoundaries_BDDC(PC pc,IS *NeumannBoundaries)
23353cdbc3dSStefano Zampini {
23453cdbc3dSStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
23553cdbc3dSStefano Zampini 
23653cdbc3dSStefano Zampini   PetscFunctionBegin;
23753cdbc3dSStefano Zampini   *NeumannBoundaries = pcbddc->NeumannBoundaries;
23853cdbc3dSStefano Zampini   PetscFunctionReturn(0);
23953cdbc3dSStefano Zampini }
24053cdbc3dSStefano Zampini EXTERN_C_END
24153cdbc3dSStefano Zampini #undef __FUNCT__
24253cdbc3dSStefano Zampini #define __FUNCT__ "PCBDDCGetNeumannBoundaries"
24353cdbc3dSStefano Zampini /*@
244da1bb401SStefano Zampini  PCBDDCGetNeumannBoundaries - Get index set defining subdomain part (in local ordering)
245da1bb401SStefano Zampini                               of Neumann boundaries for the global problem.
24653cdbc3dSStefano Zampini 
2479c0446d6SStefano Zampini    Not collective
24853cdbc3dSStefano Zampini 
24953cdbc3dSStefano Zampini    Input Parameters:
25053cdbc3dSStefano Zampini +  pc - the preconditioning context
25153cdbc3dSStefano Zampini 
25253cdbc3dSStefano Zampini    Output Parameters:
25353cdbc3dSStefano Zampini +  NeumannBoundaries - index set defining the subdomain part of Neumann boundaries
25453cdbc3dSStefano Zampini 
25553cdbc3dSStefano Zampini    Level: intermediate
25653cdbc3dSStefano Zampini 
25753cdbc3dSStefano Zampini    Notes:
25853cdbc3dSStefano Zampini 
25953cdbc3dSStefano Zampini .seealso: PCBDDC
26053cdbc3dSStefano Zampini @*/
26153cdbc3dSStefano Zampini PetscErrorCode PCBDDCGetNeumannBoundaries(PC pc,IS *NeumannBoundaries)
26253cdbc3dSStefano Zampini {
26353cdbc3dSStefano Zampini   PetscErrorCode ierr;
26453cdbc3dSStefano Zampini 
26553cdbc3dSStefano Zampini   PetscFunctionBegin;
26653cdbc3dSStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
26753cdbc3dSStefano Zampini   ierr = PetscUseMethod(pc,"PCBDDCGetNeumannBoundaries_C",(PC,IS*),(pc,NeumannBoundaries));CHKERRQ(ierr);
2680c7d97c5SJed Brown   PetscFunctionReturn(0);
2690c7d97c5SJed Brown }
27036e030ebSStefano Zampini /* -------------------------------------------------------------------------- */
27136e030ebSStefano Zampini EXTERN_C_BEGIN
27236e030ebSStefano Zampini #undef __FUNCT__
273da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetLocalAdjacencyGraph_BDDC"
274da1bb401SStefano Zampini static PetscErrorCode PCBDDCSetLocalAdjacencyGraph_BDDC(PC pc, PetscInt nvtxs, PetscInt xadj[], PetscInt adjncy[], PetscCopyMode copymode)
27536e030ebSStefano Zampini {
27636e030ebSStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
277da1bb401SStefano Zampini   PCBDDCGraph    mat_graph=pcbddc->mat_graph;
278da1bb401SStefano Zampini   PetscErrorCode ierr;
27936e030ebSStefano Zampini 
28036e030ebSStefano Zampini   PetscFunctionBegin;
281da1bb401SStefano Zampini   mat_graph->nvtxs=nvtxs;
282da1bb401SStefano Zampini   ierr = PetscFree(mat_graph->xadj);CHKERRQ(ierr);
283da1bb401SStefano Zampini   ierr = PetscFree(mat_graph->adjncy);CHKERRQ(ierr);
284da1bb401SStefano Zampini   if(copymode == PETSC_COPY_VALUES) {
285da1bb401SStefano Zampini     ierr = PetscMalloc((mat_graph->nvtxs+1)*sizeof(PetscInt),&mat_graph->xadj);CHKERRQ(ierr);
286da1bb401SStefano Zampini     ierr = PetscMalloc(xadj[mat_graph->nvtxs]*sizeof(PetscInt),&mat_graph->adjncy);CHKERRQ(ierr);
287da1bb401SStefano Zampini     ierr = PetscMemcpy(mat_graph->xadj,xadj,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr);
288da1bb401SStefano Zampini     ierr = PetscMemcpy(mat_graph->adjncy,adjncy,xadj[mat_graph->nvtxs]*sizeof(PetscInt));CHKERRQ(ierr);
289da1bb401SStefano Zampini   } else if(copymode == PETSC_OWN_POINTER) {
290da1bb401SStefano Zampini     mat_graph->xadj=xadj;
291da1bb401SStefano Zampini     mat_graph->adjncy=adjncy;
292da1bb401SStefano Zampini   } else {
293da1bb401SStefano Zampini     SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_SUP,"Unsupported copy mode %d in %s\n",copymode,__FUNCT__);
294da1bb401SStefano Zampini   }
29536e030ebSStefano Zampini   PetscFunctionReturn(0);
29636e030ebSStefano Zampini }
29736e030ebSStefano Zampini EXTERN_C_END
29836e030ebSStefano Zampini #undef __FUNCT__
299da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetLocalAdjacencyGraph"
30036e030ebSStefano Zampini /*@
301da1bb401SStefano Zampini  PCBDDCSetLocalAdjacencyGraph - Set CSR graph of local matrix for use of PCBDDC.
30236e030ebSStefano Zampini 
30336e030ebSStefano Zampini    Not collective
30436e030ebSStefano Zampini 
30536e030ebSStefano Zampini    Input Parameters:
30636e030ebSStefano Zampini +  pc - the preconditioning context
307da1bb401SStefano Zampini -  nvtxs - number of local vertices of the graph
308da1bb401SStefano Zampini -  xadj, adjncy - the CSR graph
309da1bb401SStefano Zampini -  copymode - either PETSC_COPY_VALUES or PETSC_OWN_POINTER. In the former case the user must free the array passed in;
310da1bb401SStefano Zampini                                                              in the latter case, memory must be obtained with PetscMalloc.
31136e030ebSStefano Zampini 
31236e030ebSStefano Zampini    Level: intermediate
31336e030ebSStefano Zampini 
31436e030ebSStefano Zampini    Notes:
31536e030ebSStefano Zampini 
31636e030ebSStefano Zampini .seealso: PCBDDC
31736e030ebSStefano Zampini @*/
318da1bb401SStefano Zampini PetscErrorCode PCBDDCSetLocalAdjacencyGraph(PC pc,PetscInt nvtxs,PetscInt xadj[],PetscInt adjncy[], PetscCopyMode copymode)
31936e030ebSStefano Zampini {
320da1bb401SStefano Zampini   PetscInt       nrows,ncols;
321da1bb401SStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
32236e030ebSStefano Zampini   PetscErrorCode ierr;
32336e030ebSStefano Zampini 
32436e030ebSStefano Zampini   PetscFunctionBegin;
32536e030ebSStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
326da1bb401SStefano Zampini   ierr = MatGetSize(matis->A,&nrows,&ncols);CHKERRQ(ierr);
327da1bb401SStefano Zampini   if(nvtxs != nrows) {
328da1bb401SStefano Zampini     SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Local adjacency size %d passed in %s differs from local problem size %d!\n",nvtxs,__FUNCT__,nrows);
329da1bb401SStefano Zampini   } else {
330da1bb401SStefano Zampini     ierr = PetscTryMethod(pc,"PCBDDCSetLocalAdjacencyGraph_C",(PC,PetscInt,PetscInt[],PetscInt[],PetscCopyMode),(pc,nvtxs,xadj,adjncy,copymode));CHKERRQ(ierr);
331da1bb401SStefano Zampini   }
33236e030ebSStefano Zampini   PetscFunctionReturn(0);
33336e030ebSStefano Zampini }
3349c0446d6SStefano Zampini /* -------------------------------------------------------------------------- */
3359c0446d6SStefano Zampini EXTERN_C_BEGIN
3369c0446d6SStefano Zampini #undef __FUNCT__
3379c0446d6SStefano Zampini #define __FUNCT__ "PCBDDCSetDofsSplitting_BDDC"
3389c0446d6SStefano Zampini static PetscErrorCode PCBDDCSetDofsSplitting_BDDC(PC pc,PetscInt n_is, IS ISForDofs[])
3399c0446d6SStefano Zampini {
3409c0446d6SStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
3419c0446d6SStefano Zampini   PetscInt i;
3429c0446d6SStefano Zampini   PetscErrorCode ierr;
3439c0446d6SStefano Zampini 
3449c0446d6SStefano Zampini   PetscFunctionBegin;
345da1bb401SStefano Zampini   /* Destroy ISes if they were already set */
3469c0446d6SStefano Zampini   for(i=0;i<pcbddc->n_ISForDofs;i++) {
3479c0446d6SStefano Zampini     ierr = ISDestroy(&pcbddc->ISForDofs[i]);CHKERRQ(ierr);
3489c0446d6SStefano Zampini   }
349d11ae9bbSstefano_zampini   ierr = PetscFree(pcbddc->ISForDofs);CHKERRQ(ierr);
350da1bb401SStefano Zampini   /* allocate space then set */
3519c0446d6SStefano Zampini   ierr = PetscMalloc(n_is*sizeof(IS),&pcbddc->ISForDofs);CHKERRQ(ierr);
3529c0446d6SStefano Zampini   for(i=0;i<n_is;i++) {
353da1bb401SStefano Zampini     ierr = PetscObjectReference((PetscObject)ISForDofs[i]);CHKERRQ(ierr);
354da1bb401SStefano Zampini     pcbddc->ISForDofs[i]=ISForDofs[i];
3559c0446d6SStefano Zampini   }
3569c0446d6SStefano Zampini   pcbddc->n_ISForDofs=n_is;
3579c0446d6SStefano Zampini   PetscFunctionReturn(0);
3589c0446d6SStefano Zampini }
3599c0446d6SStefano Zampini EXTERN_C_END
3609c0446d6SStefano Zampini #undef __FUNCT__
3619c0446d6SStefano Zampini #define __FUNCT__ "PCBDDCSetDofsSplitting"
3629c0446d6SStefano Zampini /*@
363da1bb401SStefano Zampini  PCBDDCSetDofsSplitting - Set index sets defining fields of local mat.
3649c0446d6SStefano Zampini 
3659c0446d6SStefano Zampini    Not collective
3669c0446d6SStefano Zampini 
3679c0446d6SStefano Zampini    Input Parameters:
3689c0446d6SStefano Zampini +  pc - the preconditioning context
369da1bb401SStefano Zampini -  n - number of index sets defining the fields
370da1bb401SStefano Zampini -  IS[] - array of IS describing the fields
3719c0446d6SStefano Zampini 
3729c0446d6SStefano Zampini    Level: intermediate
3739c0446d6SStefano Zampini 
3749c0446d6SStefano Zampini    Notes:
3759c0446d6SStefano Zampini 
3769c0446d6SStefano Zampini .seealso: PCBDDC
3779c0446d6SStefano Zampini @*/
3789c0446d6SStefano Zampini PetscErrorCode PCBDDCSetDofsSplitting(PC pc,PetscInt n_is, IS ISForDofs[])
3799c0446d6SStefano Zampini {
3809c0446d6SStefano Zampini   PetscErrorCode ierr;
3819c0446d6SStefano Zampini 
3829c0446d6SStefano Zampini   PetscFunctionBegin;
3839c0446d6SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
3849c0446d6SStefano Zampini   ierr = PetscTryMethod(pc,"PCBDDCSetDofsSplitting_C",(PC,PetscInt,IS[]),(pc,n_is,ISForDofs));CHKERRQ(ierr);
3859c0446d6SStefano Zampini   PetscFunctionReturn(0);
3869c0446d6SStefano Zampini }
387da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
388*534831adSStefano Zampini #undef __FUNCT__
389*534831adSStefano Zampini #define __FUNCT__ "PCPreSolve_BDDC"
390*534831adSStefano Zampini /* -------------------------------------------------------------------------- */
391*534831adSStefano Zampini /*
392*534831adSStefano Zampini    PCPreSolve_BDDC - Changes the right hand side and (if necessary) the initial
393*534831adSStefano Zampini                      guess if a transformation of basis approach has been selected.
3949c0446d6SStefano Zampini 
395*534831adSStefano Zampini    Input Parameter:
396*534831adSStefano Zampini +  pc - the preconditioner contex
397*534831adSStefano Zampini 
398*534831adSStefano Zampini    Application Interface Routine: PCPreSolve()
399*534831adSStefano Zampini 
400*534831adSStefano Zampini    Notes:
401*534831adSStefano Zampini    The interface routine PCPreSolve() is not usually called directly by
402*534831adSStefano Zampini    the user, but instead is called by KSPSolve().
403*534831adSStefano Zampini */
404*534831adSStefano Zampini static PetscErrorCode PCPreSolve_BDDC(PC pc, KSP ksp, Vec rhs, Vec x)
405*534831adSStefano Zampini {
406*534831adSStefano Zampini   PetscErrorCode ierr;
407*534831adSStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
408*534831adSStefano Zampini   PC_IS          *pcis = (PC_IS*)(pc->data);
409*534831adSStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
410*534831adSStefano Zampini   Mat            temp_mat;
411*534831adSStefano Zampini 
412*534831adSStefano Zampini   PetscFunctionBegin;
413*534831adSStefano Zampini   if(pcbddc->usechangeofbasis) {
414*534831adSStefano Zampini     /* swap pointers for local matrices */
415*534831adSStefano Zampini     temp_mat = matis->A;
416*534831adSStefano Zampini     matis->A = pcbddc->local_mat;
417*534831adSStefano Zampini     pcbddc->local_mat = temp_mat;
418*534831adSStefano Zampini     /* store the original rhs */
419*534831adSStefano Zampini     ierr = VecCopy(rhs,pcbddc->original_rhs);CHKERRQ(ierr);
420*534831adSStefano Zampini     /* Get local rhs and apply transformation of basis */
421*534831adSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,rhs,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
422*534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,rhs,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
423*534831adSStefano Zampini     /* from original basis to modified basis */
424*534831adSStefano Zampini     ierr = MatMultTranspose(pcbddc->ChangeOfBasisMatrix,pcis->vec1_B,pcis->vec2_B);CHKERRQ(ierr);
425*534831adSStefano Zampini     /* put back modified values into the global vec using INSERT_VALUES copy mode */
426*534831adSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec2_B,rhs,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
427*534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec2_B,rhs,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
428*534831adSStefano Zampini   }
429*534831adSStefano Zampini   PetscFunctionReturn(0);
430*534831adSStefano Zampini }
431*534831adSStefano Zampini /* -------------------------------------------------------------------------- */
432*534831adSStefano Zampini #undef __FUNCT__
433*534831adSStefano Zampini #define __FUNCT__ "PCPostSolve_BDDC"
434*534831adSStefano Zampini /* -------------------------------------------------------------------------- */
435*534831adSStefano Zampini /*
436*534831adSStefano Zampini    PCPostSolve_BDDC - Changes the computed solution if a transformation of basis
437*534831adSStefano Zampini                      approach has been selected. Also, restores rhs to its original state.
438*534831adSStefano Zampini 
439*534831adSStefano Zampini    Input Parameter:
440*534831adSStefano Zampini +  pc - the preconditioner contex
441*534831adSStefano Zampini 
442*534831adSStefano Zampini    Application Interface Routine: PCPostSolve()
443*534831adSStefano Zampini 
444*534831adSStefano Zampini    Notes:
445*534831adSStefano Zampini    The interface routine PCPostSolve() is not usually called directly by
446*534831adSStefano Zampini    the user, but instead is called by KSPSolve().
447*534831adSStefano Zampini */
448*534831adSStefano Zampini static PetscErrorCode PCPostSolve_BDDC(PC pc, KSP ksp, Vec rhs, Vec x)
449*534831adSStefano Zampini {
450*534831adSStefano Zampini   PetscErrorCode ierr;
451*534831adSStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
452*534831adSStefano Zampini   PC_IS          *pcis = (PC_IS*)(pc->data);
453*534831adSStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
454*534831adSStefano Zampini   Mat            temp_mat;
455*534831adSStefano Zampini 
456*534831adSStefano Zampini   PetscFunctionBegin;
457*534831adSStefano Zampini   if(pcbddc->usechangeofbasis) {
458*534831adSStefano Zampini     /* swap pointers for local matrices */
459*534831adSStefano Zampini     temp_mat = matis->A;
460*534831adSStefano Zampini     matis->A = pcbddc->local_mat;
461*534831adSStefano Zampini     pcbddc->local_mat = temp_mat;
462*534831adSStefano Zampini     /* restore rhs to its original state */
463*534831adSStefano Zampini     ierr = VecCopy(pcbddc->original_rhs,rhs);CHKERRQ(ierr);
464*534831adSStefano Zampini     /* Get Local boundary and apply transformation of basis to solution vector */
465*534831adSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,x,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
466*534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,x,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
467*534831adSStefano Zampini     /* from modified basis to original basis */
468*534831adSStefano Zampini     ierr = MatMult(pcbddc->ChangeOfBasisMatrix,pcis->vec1_B,pcis->vec2_B);CHKERRQ(ierr);
469*534831adSStefano Zampini     /* put back modified values into the global vec using INSERT_VALUES copy mode */
470*534831adSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec2_B,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
471*534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec2_B,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
472*534831adSStefano Zampini   }
473*534831adSStefano Zampini   PetscFunctionReturn(0);
474*534831adSStefano Zampini }
475*534831adSStefano Zampini /* -------------------------------------------------------------------------- */
47653cdbc3dSStefano Zampini #undef __FUNCT__
47753cdbc3dSStefano Zampini #define __FUNCT__ "PCSetUp_BDDC"
4780c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
4790c7d97c5SJed Brown /*
4800c7d97c5SJed Brown    PCSetUp_BDDC - Prepares for the use of the BDDC preconditioner
4810c7d97c5SJed Brown                   by setting data structures and options.
4820c7d97c5SJed Brown 
4830c7d97c5SJed Brown    Input Parameter:
48453cdbc3dSStefano Zampini +  pc - the preconditioner context
4850c7d97c5SJed Brown 
4860c7d97c5SJed Brown    Application Interface Routine: PCSetUp()
4870c7d97c5SJed Brown 
4880c7d97c5SJed Brown    Notes:
4890c7d97c5SJed Brown    The interface routine PCSetUp() is not usually called directly by
4900c7d97c5SJed Brown    the user, but instead is called by PCApply() if necessary.
4910c7d97c5SJed Brown */
49253cdbc3dSStefano Zampini PetscErrorCode PCSetUp_BDDC(PC pc)
4930c7d97c5SJed Brown {
4940c7d97c5SJed Brown   PetscErrorCode ierr;
4950c7d97c5SJed Brown   PC_BDDC*       pcbddc   = (PC_BDDC*)pc->data;
4960c7d97c5SJed Brown   PC_IS            *pcis = (PC_IS*)(pc->data);
4970c7d97c5SJed Brown 
4980c7d97c5SJed Brown   PetscFunctionBegin;
4990c7d97c5SJed Brown   if (!pc->setupcalled) {
5003b03a366Sstefano_zampini     /* For BDDC we need to define a local "Neumann" problem different to that defined in PCISSetup
5019c0446d6SStefano Zampini        So, we set to pcnone the Neumann problem of pcis in order to avoid unneeded computation
5020c7d97c5SJed Brown        Also, we decide to directly build the (same) Dirichlet problem */
5030c7d97c5SJed Brown     ierr = PetscOptionsSetValue("-is_localN_pc_type","none");CHKERRQ(ierr);
5040c7d97c5SJed Brown     ierr = PetscOptionsSetValue("-is_localD_pc_type","none");CHKERRQ(ierr);
5050c7d97c5SJed Brown     /* Set up all the "iterative substructuring" common block */
5060c7d97c5SJed Brown     ierr = PCISSetUp(pc);CHKERRQ(ierr);
5073b03a366Sstefano_zampini     /* Get stdout for dbg */
508e269702eSStefano Zampini     if(pcbddc->dbg_flag) {
509e269702eSStefano Zampini       ierr = PetscViewerASCIIGetStdout(((PetscObject)pc)->comm,&pcbddc->dbg_viewer);CHKERRQ(ierr);
510e269702eSStefano Zampini       ierr = PetscViewerASCIISynchronizedAllow(pcbddc->dbg_viewer,PETSC_TRUE);CHKERRQ(ierr);
511e269702eSStefano Zampini     }
5123b03a366Sstefano_zampini     /* TODO MOVE CODE FRAGMENT */
5130c7d97c5SJed Brown     PetscInt im_active=0;
5140c7d97c5SJed Brown     if(pcis->n) im_active = 1;
51553cdbc3dSStefano Zampini     ierr = MPI_Allreduce(&im_active,&pcbddc->active_procs,1,MPIU_INT,MPI_SUM,((PetscObject)pc)->comm);CHKERRQ(ierr);
5163b03a366Sstefano_zampini     /* Analyze local interface */
5170c7d97c5SJed Brown     ierr = PCBDDCManageLocalBoundaries(pc);CHKERRQ(ierr);
5183b03a366Sstefano_zampini     /* Set up local constraint matrix */
5193b03a366Sstefano_zampini     ierr = PCBDDCCreateConstraintMatrix(pc);CHKERRQ(ierr);
5200c7d97c5SJed Brown     /* Create coarse and local stuffs used for evaluating action of preconditioner */
5210c7d97c5SJed Brown     ierr = PCBDDCCoarseSetUp(pc);CHKERRQ(ierr);
5223b03a366Sstefano_zampini     /* Processes fakely involved in multilevel should not call ISLocalToGlobalMappingRestoreInfo */
5233b03a366Sstefano_zampini     if ( !pcis->n_neigh ) pcis->ISLocalToGlobalMappingGetInfoWasCalled=PETSC_FALSE;
5240c7d97c5SJed Brown   }
5250c7d97c5SJed Brown   PetscFunctionReturn(0);
5260c7d97c5SJed Brown }
5270c7d97c5SJed Brown 
5280c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
5290c7d97c5SJed Brown /*
5300c7d97c5SJed Brown    PCApply_BDDC - Applies the BDDC preconditioner to a vector.
5310c7d97c5SJed Brown 
5320c7d97c5SJed Brown    Input Parameters:
5330c7d97c5SJed Brown .  pc - the preconditioner context
5340c7d97c5SJed Brown .  r - input vector (global)
5350c7d97c5SJed Brown 
5360c7d97c5SJed Brown    Output Parameter:
5370c7d97c5SJed Brown .  z - output vector (global)
5380c7d97c5SJed Brown 
5390c7d97c5SJed Brown    Application Interface Routine: PCApply()
5400c7d97c5SJed Brown  */
5410c7d97c5SJed Brown #undef __FUNCT__
5420c7d97c5SJed Brown #define __FUNCT__ "PCApply_BDDC"
54353cdbc3dSStefano Zampini PetscErrorCode PCApply_BDDC(PC pc,Vec r,Vec z)
5440c7d97c5SJed Brown {
5450c7d97c5SJed Brown   PC_IS             *pcis = (PC_IS*)(pc->data);
5460c7d97c5SJed Brown   PC_BDDC           *pcbddc = (PC_BDDC*)(pc->data);
5470c7d97c5SJed Brown   PetscErrorCode    ierr;
5483b03a366Sstefano_zampini   const PetscScalar one = 1.0;
5493b03a366Sstefano_zampini   const PetscScalar m_one = -1.0;
5502617d88aSStefano Zampini   const PetscScalar zero = 0.0;
5510c7d97c5SJed Brown 
5520c7d97c5SJed Brown /* This code is similar to that provided in nn.c for PCNN
5530c7d97c5SJed Brown    NN interface preconditioner changed to BDDC
5540c7d97c5SJed Brown    Added support for M_3 preconditioenr in the reference article (code is active if pcbddc->prec_type = PETSC_TRUE) */
5550c7d97c5SJed Brown 
5560c7d97c5SJed Brown   PetscFunctionBegin;
5570c7d97c5SJed Brown   /* First Dirichlet solve */
5580c7d97c5SJed Brown   ierr = VecScatterBegin(pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5590c7d97c5SJed Brown   ierr = VecScatterEnd  (pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
56053cdbc3dSStefano Zampini   ierr = KSPSolve(pcbddc->ksp_D,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
5610c7d97c5SJed Brown   /*
5620c7d97c5SJed Brown     Assembling right hand side for BDDC operator
5630c7d97c5SJed Brown     - vec1_D for the Dirichlet part (if needed, i.e. prec_flag=PETSC_TRUE)
5640c7d97c5SJed Brown     - the interface part of the global vector z
5650c7d97c5SJed Brown   */
5660c7d97c5SJed Brown   ierr = VecScale(pcis->vec2_D,m_one);CHKERRQ(ierr);
5670c7d97c5SJed Brown   ierr = MatMult(pcis->A_BI,pcis->vec2_D,pcis->vec1_B);CHKERRQ(ierr);
5680c7d97c5SJed Brown   if(pcbddc->prec_type) { ierr = MatMultAdd(pcis->A_II,pcis->vec2_D,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); }
5690c7d97c5SJed Brown   ierr = VecScale(pcis->vec2_D,m_one);CHKERRQ(ierr);
5700c7d97c5SJed Brown   ierr = VecCopy(r,z);CHKERRQ(ierr);
5710c7d97c5SJed Brown   ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
5720c7d97c5SJed Brown   ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
5730c7d97c5SJed Brown 
5742617d88aSStefano Zampini   /* Get Local boundary and apply partition of unity */
5752617d88aSStefano Zampini   ierr = VecScatterBegin(pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5762617d88aSStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5772617d88aSStefano Zampini   ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr);
5782617d88aSStefano Zampini 
5792617d88aSStefano Zampini   /* Apply interface preconditioner
5802617d88aSStefano Zampini      input/output vecs: pcis->vec1_B and pcis->vec1_D */
5812617d88aSStefano Zampini   ierr = PCBDDCApplyInterfacePreconditioner(pc);CHKERRQ(ierr);
5822617d88aSStefano Zampini 
5832617d88aSStefano Zampini   /* Apply partition of unity and sum boundary values */
5842617d88aSStefano Zampini   ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr);
5852617d88aSStefano Zampini   ierr = VecSet(z,zero);CHKERRQ(ierr);
5862617d88aSStefano Zampini   ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
5872617d88aSStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
5880c7d97c5SJed Brown 
5893b03a366Sstefano_zampini   /* Second Dirichlet solve and assembling of output */
5900c7d97c5SJed Brown   ierr = VecScatterBegin(pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5910c7d97c5SJed Brown   ierr = VecScatterEnd  (pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
5920c7d97c5SJed Brown   ierr = MatMult(pcis->A_IB,pcis->vec1_B,pcis->vec3_D);CHKERRQ(ierr);
5930c7d97c5SJed Brown   if(pcbddc->prec_type) { ierr = MatMultAdd(pcis->A_II,pcis->vec1_D,pcis->vec3_D,pcis->vec3_D);CHKERRQ(ierr); }
59453cdbc3dSStefano Zampini   ierr = KSPSolve(pcbddc->ksp_D,pcis->vec3_D,pcbddc->vec4_D);CHKERRQ(ierr);
5950c7d97c5SJed Brown   ierr = VecScale(pcbddc->vec4_D,m_one);CHKERRQ(ierr);
5960c7d97c5SJed Brown   if(pcbddc->prec_type) { ierr = VecAXPY (pcbddc->vec4_D,one,pcis->vec1_D);CHKERRQ(ierr); }
5970c7d97c5SJed Brown   ierr = VecAXPY (pcis->vec2_D,one,pcbddc->vec4_D);CHKERRQ(ierr);
5980c7d97c5SJed Brown   ierr = VecScatterBegin(pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
5990c7d97c5SJed Brown   ierr = VecScatterEnd  (pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
6000c7d97c5SJed Brown 
6010c7d97c5SJed Brown   PetscFunctionReturn(0);
6020c7d97c5SJed Brown 
6030c7d97c5SJed Brown }
604da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
605da1bb401SStefano Zampini #undef __FUNCT__
606da1bb401SStefano Zampini #define __FUNCT__ "PCDestroy_BDDC"
607da1bb401SStefano Zampini PetscErrorCode PCDestroy_BDDC(PC pc)
608da1bb401SStefano Zampini {
609da1bb401SStefano Zampini   PC_BDDC          *pcbddc = (PC_BDDC*)pc->data;
610da1bb401SStefano Zampini   PetscErrorCode ierr;
611da1bb401SStefano Zampini 
612da1bb401SStefano Zampini   PetscFunctionBegin;
613da1bb401SStefano Zampini   /* free data created by PCIS */
614da1bb401SStefano Zampini   ierr = PCISDestroy(pc);CHKERRQ(ierr);
615da1bb401SStefano Zampini   /* free BDDC data  */
616*534831adSStefano Zampini   ierr = VecDestroy(&pcbddc->original_rhs);CHKERRQ(ierr);
617*534831adSStefano Zampini   ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr);
618*534831adSStefano Zampini   ierr = MatDestroy(&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr);
619da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->coarse_vec);CHKERRQ(ierr);
620da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->coarse_rhs);CHKERRQ(ierr);
621da1bb401SStefano Zampini   ierr = KSPDestroy(&pcbddc->coarse_ksp);CHKERRQ(ierr);
622da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->coarse_mat);CHKERRQ(ierr);
623da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->coarse_phi_B);CHKERRQ(ierr);
624da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->coarse_phi_D);CHKERRQ(ierr);
625da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec1_P);CHKERRQ(ierr);
626da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec1_C);CHKERRQ(ierr);
627da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->local_auxmat1);CHKERRQ(ierr);
628da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->local_auxmat2);CHKERRQ(ierr);
629da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec1_R);CHKERRQ(ierr);
630da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec2_R);CHKERRQ(ierr);
631da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec4_D);CHKERRQ(ierr);
632da1bb401SStefano Zampini   ierr = VecScatterDestroy(&pcbddc->R_to_B);CHKERRQ(ierr);
633da1bb401SStefano Zampini   ierr = VecScatterDestroy(&pcbddc->R_to_D);CHKERRQ(ierr);
634da1bb401SStefano Zampini   ierr = VecScatterDestroy(&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr);
635da1bb401SStefano Zampini   ierr = KSPDestroy(&pcbddc->ksp_D);CHKERRQ(ierr);
636da1bb401SStefano Zampini   ierr = KSPDestroy(&pcbddc->ksp_R);CHKERRQ(ierr);
637da1bb401SStefano Zampini   ierr = ISDestroy(&pcbddc->NeumannBoundaries);CHKERRQ(ierr);
638da1bb401SStefano Zampini   ierr = ISDestroy(&pcbddc->DirichletBoundaries);CHKERRQ(ierr);
639da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->ConstraintMatrix);CHKERRQ(ierr);
640da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->local_primal_indices);CHKERRQ(ierr);
641da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->replicated_local_primal_indices);CHKERRQ(ierr);
642da1bb401SStefano Zampini   if (pcbddc->replicated_local_primal_values)    { free(pcbddc->replicated_local_primal_values); }
643da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->local_primal_displacements);CHKERRQ(ierr);
644da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->local_primal_sizes);CHKERRQ(ierr);
645da1bb401SStefano Zampini   PetscInt i;
646da1bb401SStefano Zampini   for(i=0;i<pcbddc->n_ISForDofs;i++) { ierr = ISDestroy(&pcbddc->ISForDofs[i]);CHKERRQ(ierr); }
647da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->ISForDofs);CHKERRQ(ierr);
648da1bb401SStefano Zampini   for(i=0;i<pcbddc->n_ISForFaces;i++) { ierr = ISDestroy(&pcbddc->ISForFaces[i]);CHKERRQ(ierr); }
649da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->ISForFaces);CHKERRQ(ierr);
650da1bb401SStefano Zampini   for(i=0;i<pcbddc->n_ISForEdges;i++) { ierr = ISDestroy(&pcbddc->ISForEdges[i]);CHKERRQ(ierr); }
651da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->ISForEdges);CHKERRQ(ierr);
652da1bb401SStefano Zampini   ierr = ISDestroy(&pcbddc->ISForVertices);CHKERRQ(ierr);
653da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->xadj);CHKERRQ(ierr);
654da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->adjncy);CHKERRQ(ierr);
655da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->neighbours_set[0]);CHKERRQ(ierr);
656da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->neighbours_set);CHKERRQ(ierr);
657da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph);CHKERRQ(ierr);
658da1bb401SStefano Zampini   /* Free the private data structure that was hanging off the PC */
659da1bb401SStefano Zampini   ierr = PetscFree(pcbddc);CHKERRQ(ierr);
660da1bb401SStefano Zampini   PetscFunctionReturn(0);
661da1bb401SStefano Zampini }
6620c7d97c5SJed Brown 
6630c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
664da1bb401SStefano Zampini /*MC
665da1bb401SStefano Zampini    PCBDDC - Balancing Domain Decomposition by Constraints.
6660c7d97c5SJed Brown 
667da1bb401SStefano Zampini    Options Database Keys:
668da1bb401SStefano Zampini .    -pcbddc ??? -
669da1bb401SStefano Zampini 
670da1bb401SStefano Zampini    Level: intermediate
671da1bb401SStefano Zampini 
672da1bb401SStefano Zampini    Notes: The matrix used with this preconditioner must be of type MATIS
673da1bb401SStefano Zampini 
674da1bb401SStefano Zampini           Unlike more 'conventional' interface preconditioners, this iterates over ALL the
675da1bb401SStefano Zampini           degrees of freedom, NOT just those on the interface (this allows the use of approximate solvers
676da1bb401SStefano Zampini           on the subdomains).
677da1bb401SStefano Zampini 
678da1bb401SStefano Zampini           Options for the coarse grid preconditioner can be set with -
679da1bb401SStefano Zampini           Options for the Dirichlet subproblem can be set with -
680da1bb401SStefano Zampini           Options for the Neumann subproblem can be set with -
681da1bb401SStefano Zampini 
682da1bb401SStefano Zampini    Contributed by Stefano Zampini
683da1bb401SStefano Zampini 
684da1bb401SStefano Zampini .seealso:  PCCreate(), PCSetType(), PCType (for list of available types), PC,  MATIS
685da1bb401SStefano Zampini M*/
686da1bb401SStefano Zampini EXTERN_C_BEGIN
687da1bb401SStefano Zampini #undef __FUNCT__
688da1bb401SStefano Zampini #define __FUNCT__ "PCCreate_BDDC"
689da1bb401SStefano Zampini PetscErrorCode PCCreate_BDDC(PC pc)
690da1bb401SStefano Zampini {
691da1bb401SStefano Zampini   PetscErrorCode ierr;
692da1bb401SStefano Zampini   PC_BDDC        *pcbddc;
693da1bb401SStefano Zampini   PCBDDCGraph    mat_graph;
694da1bb401SStefano Zampini 
695da1bb401SStefano Zampini   PetscFunctionBegin;
696da1bb401SStefano Zampini   /* Creates the private data structure for this preconditioner and attach it to the PC object. */
697da1bb401SStefano Zampini   ierr      = PetscNewLog(pc,PC_BDDC,&pcbddc);CHKERRQ(ierr);
698da1bb401SStefano Zampini   pc->data  = (void*)pcbddc;
699da1bb401SStefano Zampini 
700da1bb401SStefano Zampini   /* create PCIS data structure */
701da1bb401SStefano Zampini   ierr = PCISCreate(pc);CHKERRQ(ierr);
702da1bb401SStefano Zampini 
703da1bb401SStefano Zampini   /* BDDC specific */
704*534831adSStefano Zampini   pcbddc->original_rhs               = 0;
705*534831adSStefano Zampini   pcbddc->local_mat                  = 0;
706*534831adSStefano Zampini   pcbddc->ChangeOfBasisMatrix        = 0;
707*534831adSStefano Zampini   pcbddc->usechangeofbasis           = PETSC_TRUE;
708*534831adSStefano Zampini   pcbddc->usechangeonfaces           = PETSC_FALSE;
709da1bb401SStefano Zampini   pcbddc->coarse_vec                 = 0;
710da1bb401SStefano Zampini   pcbddc->coarse_rhs                 = 0;
711da1bb401SStefano Zampini   pcbddc->coarse_ksp                 = 0;
712da1bb401SStefano Zampini   pcbddc->coarse_phi_B               = 0;
713da1bb401SStefano Zampini   pcbddc->coarse_phi_D               = 0;
714da1bb401SStefano Zampini   pcbddc->vec1_P                     = 0;
715da1bb401SStefano Zampini   pcbddc->vec1_R                     = 0;
716da1bb401SStefano Zampini   pcbddc->vec2_R                     = 0;
717da1bb401SStefano Zampini   pcbddc->local_auxmat1              = 0;
718da1bb401SStefano Zampini   pcbddc->local_auxmat2              = 0;
719da1bb401SStefano Zampini   pcbddc->R_to_B                     = 0;
720da1bb401SStefano Zampini   pcbddc->R_to_D                     = 0;
721da1bb401SStefano Zampini   pcbddc->ksp_D                      = 0;
722da1bb401SStefano Zampini   pcbddc->ksp_R                      = 0;
723da1bb401SStefano Zampini   pcbddc->local_primal_indices       = 0;
724da1bb401SStefano Zampini   pcbddc->prec_type                  = PETSC_FALSE;
725da1bb401SStefano Zampini   pcbddc->NeumannBoundaries          = 0;
726da1bb401SStefano Zampini   pcbddc->ISForDofs                  = 0;
727da1bb401SStefano Zampini   pcbddc->ISForVertices              = 0;
728da1bb401SStefano Zampini   pcbddc->n_ISForFaces               = 0;
729da1bb401SStefano Zampini   pcbddc->n_ISForEdges               = 0;
730da1bb401SStefano Zampini   pcbddc->ConstraintMatrix           = 0;
731da1bb401SStefano Zampini   pcbddc->use_nnsp_true              = PETSC_FALSE;
732da1bb401SStefano Zampini   pcbddc->local_primal_sizes         = 0;
733da1bb401SStefano Zampini   pcbddc->local_primal_displacements = 0;
734da1bb401SStefano Zampini   pcbddc->replicated_local_primal_indices = 0;
735da1bb401SStefano Zampini   pcbddc->replicated_local_primal_values  = 0;
736da1bb401SStefano Zampini   pcbddc->coarse_loc_to_glob         = 0;
737da1bb401SStefano Zampini   pcbddc->dbg_flag                   = PETSC_FALSE;
738da1bb401SStefano Zampini   pcbddc->coarsening_ratio           = 8;
739da1bb401SStefano Zampini 
740da1bb401SStefano Zampini   /* allocate and initialize needed graph structure */
741da1bb401SStefano Zampini   ierr = PetscMalloc(sizeof(*mat_graph),&pcbddc->mat_graph);CHKERRQ(ierr);
742da1bb401SStefano Zampini   pcbddc->mat_graph->xadj            = 0;
743da1bb401SStefano Zampini   pcbddc->mat_graph->adjncy          = 0;
744da1bb401SStefano Zampini 
745da1bb401SStefano Zampini   /* function pointers */
746da1bb401SStefano Zampini   pc->ops->apply               = PCApply_BDDC;
747da1bb401SStefano Zampini   pc->ops->applytranspose      = 0;
748da1bb401SStefano Zampini   pc->ops->setup               = PCSetUp_BDDC;
749da1bb401SStefano Zampini   pc->ops->destroy             = PCDestroy_BDDC;
750da1bb401SStefano Zampini   pc->ops->setfromoptions      = PCSetFromOptions_BDDC;
751da1bb401SStefano Zampini   pc->ops->view                = 0;
752da1bb401SStefano Zampini   pc->ops->applyrichardson     = 0;
753da1bb401SStefano Zampini   pc->ops->applysymmetricleft  = 0;
754da1bb401SStefano Zampini   pc->ops->applysymmetricright = 0;
755*534831adSStefano Zampini   pc->ops->presolve            = PCPreSolve_BDDC;
756*534831adSStefano Zampini   pc->ops->postsolve           = PCPostSolve_BDDC;
757da1bb401SStefano Zampini 
758da1bb401SStefano Zampini   /* composing function */
759da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDirichletBoundaries_C","PCBDDCSetDirichletBoundaries_BDDC",
760da1bb401SStefano Zampini                     PCBDDCSetDirichletBoundaries_BDDC);CHKERRQ(ierr);
761da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNeumannBoundaries_C","PCBDDCSetNeumannBoundaries_BDDC",
762da1bb401SStefano Zampini                     PCBDDCSetNeumannBoundaries_BDDC);CHKERRQ(ierr);
763da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetDirichletBoundaries_C","PCBDDCGetDirichletBoundaries_BDDC",
764da1bb401SStefano Zampini                     PCBDDCGetDirichletBoundaries_BDDC);CHKERRQ(ierr);
765da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetNeumannBoundaries_C","PCBDDCGetNeumannBoundaries_BDDC",
766da1bb401SStefano Zampini                     PCBDDCGetNeumannBoundaries_BDDC);CHKERRQ(ierr);
767da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseProblemType_C","PCBDDCSetCoarseProblemType_BDDC",
768da1bb401SStefano Zampini                     PCBDDCSetCoarseProblemType_BDDC);CHKERRQ(ierr);
769da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDofsSplitting_C","PCBDDCSetDofsSplitting_BDDC",
770da1bb401SStefano Zampini                     PCBDDCSetDofsSplitting_BDDC);CHKERRQ(ierr);
771da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetLocalAdjacencyGraph_C","PCBDDCSetLocalAdjacencyGraph_BDDC",
772da1bb401SStefano Zampini                     PCBDDCSetLocalAdjacencyGraph_BDDC);CHKERRQ(ierr);
773*534831adSStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPreSolve_C","PCPreSolve_BDDC",
774*534831adSStefano Zampini                     PCPreSolve_BDDC);CHKERRQ(ierr);
775*534831adSStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPostSolve_C","PCPostSolve_BDDC",
776*534831adSStefano Zampini                     PCPostSolve_BDDC);CHKERRQ(ierr);
777da1bb401SStefano Zampini   PetscFunctionReturn(0);
778da1bb401SStefano Zampini }
779da1bb401SStefano Zampini EXTERN_C_END
780da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
781da1bb401SStefano Zampini /* All static functions from now on                                           */
782da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
783da1bb401SStefano Zampini #undef __FUNCT__
784da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetupLocalAdjacencyGraph"
785da1bb401SStefano Zampini static PetscErrorCode PCBDDCSetupLocalAdjacencyGraph(PC pc)
786da1bb401SStefano Zampini {
787da1bb401SStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
788da1bb401SStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
789da1bb401SStefano Zampini   PetscInt       nvtxs,*xadj,*adjncy;
790da1bb401SStefano Zampini   Mat            mat_adj;
791da1bb401SStefano Zampini   PetscBool      symmetrize_rowij=PETSC_TRUE,compressed_rowij=PETSC_FALSE,flg_row=PETSC_TRUE;
792da1bb401SStefano Zampini   PCBDDCGraph    mat_graph=pcbddc->mat_graph;
793da1bb401SStefano Zampini   PetscErrorCode ierr;
794da1bb401SStefano Zampini 
795da1bb401SStefano Zampini   PetscFunctionBegin;
796da1bb401SStefano Zampini   /* get CSR adjacency from local matrix if user has not yet provided local graph using PCBDDCSetLocalAdjacencyGraph function */
797da1bb401SStefano Zampini   if(!mat_graph->xadj) {
798da1bb401SStefano Zampini     ierr = MatConvert(matis->A,MATMPIADJ,MAT_INITIAL_MATRIX,&mat_adj);CHKERRQ(ierr);
799da1bb401SStefano Zampini     ierr = MatGetRowIJ(mat_adj,0,symmetrize_rowij,compressed_rowij,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr);
800da1bb401SStefano Zampini     if(!flg_row) {
801da1bb401SStefano Zampini       SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in MatGetRowIJ called in %s\n",__FUNCT__);
802da1bb401SStefano Zampini     }
803da1bb401SStefano Zampini     /* Get adjacency into BDDC workspace */
804da1bb401SStefano Zampini     ierr = PCBDDCSetLocalAdjacencyGraph(pc,nvtxs,xadj,adjncy,PETSC_COPY_VALUES);CHKERRQ(ierr);
805da1bb401SStefano Zampini     ierr = MatRestoreRowIJ(mat_adj,0,symmetrize_rowij,compressed_rowij,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr);
806da1bb401SStefano Zampini     if(!flg_row) {
807da1bb401SStefano Zampini       SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in MatRestoreRowIJ called in %s\n",__FUNCT__);
808da1bb401SStefano Zampini     }
809da1bb401SStefano Zampini     ierr = MatDestroy(&mat_adj);CHKERRQ(ierr);
810da1bb401SStefano Zampini   }
811da1bb401SStefano Zampini   PetscFunctionReturn(0);
812da1bb401SStefano Zampini }
813da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
8140c7d97c5SJed Brown #undef __FUNCT__
8150c7d97c5SJed Brown #define __FUNCT__ "PCBDDCApplyInterfacePreconditioner"
8162617d88aSStefano Zampini static PetscErrorCode  PCBDDCApplyInterfacePreconditioner(PC pc)
8170c7d97c5SJed Brown {
8180c7d97c5SJed Brown   PetscErrorCode ierr;
8190c7d97c5SJed Brown   PC_BDDC*        pcbddc = (PC_BDDC*)(pc->data);
8200c7d97c5SJed Brown   PC_IS*            pcis = (PC_IS*)  (pc->data);
8213b03a366Sstefano_zampini   const PetscScalar zero = 0.0;
8220c7d97c5SJed Brown 
8230c7d97c5SJed Brown   PetscFunctionBegin;
8240c7d97c5SJed Brown   /* Application of PHI^T  */
8250c7d97c5SJed Brown   ierr = MatMultTranspose(pcbddc->coarse_phi_B,pcis->vec1_B,pcbddc->vec1_P);CHKERRQ(ierr);
8260c7d97c5SJed Brown   if(pcbddc->prec_type) { ierr = MatMultTransposeAdd(pcbddc->coarse_phi_D,pcis->vec1_D,pcbddc->vec1_P,pcbddc->vec1_P);CHKERRQ(ierr); }
8270c7d97c5SJed Brown 
8280c7d97c5SJed Brown   /* Scatter data of coarse_rhs */
8290c7d97c5SJed Brown   if(pcbddc->coarse_rhs) ierr = VecSet(pcbddc->coarse_rhs,zero);CHKERRQ(ierr);
8300c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->vec1_P,pcbddc->coarse_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
8310c7d97c5SJed Brown 
8320c7d97c5SJed Brown   /* Local solution on R nodes */
8330c7d97c5SJed Brown   ierr = VecSet(pcbddc->vec1_R,zero);CHKERRQ(ierr);
8340c7d97c5SJed Brown   ierr = VecScatterBegin(pcbddc->R_to_B,pcis->vec1_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8350c7d97c5SJed Brown   ierr = VecScatterEnd  (pcbddc->R_to_B,pcis->vec1_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8360c7d97c5SJed Brown   if(pcbddc->prec_type) {
8370c7d97c5SJed Brown     ierr = VecScatterBegin(pcbddc->R_to_D,pcis->vec1_D,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8380c7d97c5SJed Brown     ierr = VecScatterEnd  (pcbddc->R_to_D,pcis->vec1_D,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8390c7d97c5SJed Brown   }
8400c7d97c5SJed Brown   ierr = PCBDDCSolveSaddlePoint(pc);CHKERRQ(ierr);
8410c7d97c5SJed Brown   ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr);
8420c7d97c5SJed Brown   ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec2_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
8430c7d97c5SJed Brown   ierr = VecScatterEnd  (pcbddc->R_to_B,pcbddc->vec2_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
8440c7d97c5SJed Brown   if(pcbddc->prec_type) {
8450c7d97c5SJed Brown     ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec2_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
8460c7d97c5SJed Brown     ierr = VecScatterEnd  (pcbddc->R_to_D,pcbddc->vec2_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
8470c7d97c5SJed Brown   }
8480c7d97c5SJed Brown 
8490c7d97c5SJed Brown   /* Coarse solution */
8500c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataEnd(pc,pcbddc->vec1_P,pcbddc->coarse_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
85153cdbc3dSStefano Zampini   if(pcbddc->coarse_rhs) ierr = KSPSolve(pcbddc->coarse_ksp,pcbddc->coarse_rhs,pcbddc->coarse_vec);CHKERRQ(ierr);
8520c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8530c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataEnd  (pc,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8540c7d97c5SJed Brown 
8550c7d97c5SJed Brown   /* Sum contributions from two levels */
8560c7d97c5SJed Brown   ierr = MatMultAdd(pcbddc->coarse_phi_B,pcbddc->vec1_P,pcis->vec1_B,pcis->vec1_B);CHKERRQ(ierr);
8570c7d97c5SJed Brown   if(pcbddc->prec_type) { ierr = MatMultAdd(pcbddc->coarse_phi_D,pcbddc->vec1_P,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); }
8580c7d97c5SJed Brown   PetscFunctionReturn(0);
8590c7d97c5SJed Brown }
8600c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
8610c7d97c5SJed Brown #undef __FUNCT__
8620c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSolveSaddlePoint"
86353cdbc3dSStefano Zampini static PetscErrorCode  PCBDDCSolveSaddlePoint(PC pc)
8640c7d97c5SJed Brown {
8650c7d97c5SJed Brown   PetscErrorCode ierr;
8660c7d97c5SJed Brown   PC_BDDC*       pcbddc = (PC_BDDC*)(pc->data);
8670c7d97c5SJed Brown 
8680c7d97c5SJed Brown   PetscFunctionBegin;
86953cdbc3dSStefano Zampini   ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
870*534831adSStefano Zampini   if(pcbddc->local_auxmat1) {
8710c7d97c5SJed Brown     ierr = MatMult(pcbddc->local_auxmat1,pcbddc->vec2_R,pcbddc->vec1_C);CHKERRQ(ierr);
8720c7d97c5SJed Brown     ierr = MatMultAdd(pcbddc->local_auxmat2,pcbddc->vec1_C,pcbddc->vec2_R,pcbddc->vec2_R);CHKERRQ(ierr);
8730c7d97c5SJed Brown   }
8740c7d97c5SJed Brown   PetscFunctionReturn(0);
8750c7d97c5SJed Brown }
8760c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
8770c7d97c5SJed Brown #undef __FUNCT__
8780c7d97c5SJed Brown #define __FUNCT__ "PCBDDCScatterCoarseDataBegin"
87953cdbc3dSStefano Zampini static PetscErrorCode  PCBDDCScatterCoarseDataBegin(PC pc,Vec vec_from, Vec vec_to, InsertMode imode, ScatterMode smode)
8800c7d97c5SJed Brown {
8810c7d97c5SJed Brown   PetscErrorCode ierr;
8820c7d97c5SJed Brown   PC_BDDC*       pcbddc = (PC_BDDC*)(pc->data);
8830c7d97c5SJed Brown 
8840c7d97c5SJed Brown   PetscFunctionBegin;
8850c7d97c5SJed Brown   switch(pcbddc->coarse_communications_type){
8860c7d97c5SJed Brown     case SCATTERS_BDDC:
8870c7d97c5SJed Brown       ierr = VecScatterBegin(pcbddc->coarse_loc_to_glob,vec_from,vec_to,imode,smode);CHKERRQ(ierr);
8880c7d97c5SJed Brown       break;
8890c7d97c5SJed Brown     case GATHERS_BDDC:
8900c7d97c5SJed Brown       break;
8910c7d97c5SJed Brown   }
8920c7d97c5SJed Brown   PetscFunctionReturn(0);
8930c7d97c5SJed Brown }
8940c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
8950c7d97c5SJed Brown #undef __FUNCT__
8960c7d97c5SJed Brown #define __FUNCT__ "PCBDDCScatterCoarseDataEnd"
89753cdbc3dSStefano Zampini static PetscErrorCode  PCBDDCScatterCoarseDataEnd(PC pc,Vec vec_from, Vec vec_to, InsertMode imode, ScatterMode smode)
8980c7d97c5SJed Brown {
8990c7d97c5SJed Brown   PetscErrorCode ierr;
9000c7d97c5SJed Brown   PC_BDDC*       pcbddc = (PC_BDDC*)(pc->data);
9010c7d97c5SJed Brown   PetscScalar*   array_to;
9020c7d97c5SJed Brown   PetscScalar*   array_from;
9030c7d97c5SJed Brown   MPI_Comm       comm=((PetscObject)pc)->comm;
9040c7d97c5SJed Brown   PetscInt i;
9050c7d97c5SJed Brown 
9060c7d97c5SJed Brown   PetscFunctionBegin;
9070c7d97c5SJed Brown 
9080c7d97c5SJed Brown   switch(pcbddc->coarse_communications_type){
9090c7d97c5SJed Brown     case SCATTERS_BDDC:
9100c7d97c5SJed Brown       ierr = VecScatterEnd(pcbddc->coarse_loc_to_glob,vec_from,vec_to,imode,smode);CHKERRQ(ierr);
9110c7d97c5SJed Brown       break;
9120c7d97c5SJed Brown     case GATHERS_BDDC:
9130c7d97c5SJed Brown       if(vec_from) VecGetArray(vec_from,&array_from);
9140c7d97c5SJed Brown       if(vec_to)   VecGetArray(vec_to,&array_to);
9150c7d97c5SJed Brown       switch(pcbddc->coarse_problem_type){
9160c7d97c5SJed Brown         case SEQUENTIAL_BDDC:
9170c7d97c5SJed Brown           if(smode == SCATTER_FORWARD) {
91853cdbc3dSStefano Zampini             ierr = MPI_Gatherv(&array_from[0],pcbddc->local_primal_size,MPIU_SCALAR,&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,0,comm);CHKERRQ(ierr);
9190c7d97c5SJed Brown             if(vec_to) {
9200c7d97c5SJed Brown               for(i=0;i<pcbddc->replicated_primal_size;i++)
9210c7d97c5SJed Brown                 array_to[pcbddc->replicated_local_primal_indices[i]]+=pcbddc->replicated_local_primal_values[i];
9220c7d97c5SJed Brown             }
9230c7d97c5SJed Brown           } else {
9240c7d97c5SJed Brown             if(vec_from)
9250c7d97c5SJed Brown               for(i=0;i<pcbddc->replicated_primal_size;i++)
9260c7d97c5SJed Brown                 pcbddc->replicated_local_primal_values[i]=array_from[pcbddc->replicated_local_primal_indices[i]];
92753cdbc3dSStefano Zampini             ierr = MPI_Scatterv(&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,&array_to[0],pcbddc->local_primal_size,MPIU_SCALAR,0,comm);CHKERRQ(ierr);
9280c7d97c5SJed Brown           }
9290c7d97c5SJed Brown           break;
9300c7d97c5SJed Brown         case REPLICATED_BDDC:
9310c7d97c5SJed Brown           if(smode == SCATTER_FORWARD) {
93253cdbc3dSStefano Zampini             ierr = MPI_Allgatherv(&array_from[0],pcbddc->local_primal_size,MPIU_SCALAR,&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,comm);CHKERRQ(ierr);
9330c7d97c5SJed Brown             for(i=0;i<pcbddc->replicated_primal_size;i++)
9340c7d97c5SJed Brown               array_to[pcbddc->replicated_local_primal_indices[i]]+=pcbddc->replicated_local_primal_values[i];
9350c7d97c5SJed Brown           } else { /* no communications needed for SCATTER_REVERSE since needed data is already present */
9360c7d97c5SJed Brown             for(i=0;i<pcbddc->local_primal_size;i++)
9370c7d97c5SJed Brown               array_to[i]=array_from[pcbddc->local_primal_indices[i]];
9380c7d97c5SJed Brown           }
9390c7d97c5SJed Brown           break;
94053cdbc3dSStefano Zampini         case MULTILEVEL_BDDC:
94153cdbc3dSStefano Zampini           break;
94253cdbc3dSStefano Zampini         case PARALLEL_BDDC:
94353cdbc3dSStefano Zampini           break;
9440c7d97c5SJed Brown       }
9450c7d97c5SJed Brown       if(vec_from) VecRestoreArray(vec_from,&array_from);
9460c7d97c5SJed Brown       if(vec_to)   VecRestoreArray(vec_to,&array_to);
9470c7d97c5SJed Brown       break;
9480c7d97c5SJed Brown   }
9490c7d97c5SJed Brown   PetscFunctionReturn(0);
9500c7d97c5SJed Brown }
9510c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
/* When BDDC_USE_POD is defined and PETSC_MISSING_LAPACK_GESVD is not, define the latter here
   so that the code guarded by "#if defined(PETSC_MISSING_LAPACK_GESVD)" (the POD / LAPACKsyev
   branch of PCBDDCCreateConstraintMatrix) is compiled instead of the LAPACKgesvd branch.
   UNDEF_PETSC_MISSING_LAPACK_GESVD records that the macro was defined by this file.
   NOTE(review): presumably it is used later to #undef the macro again - confirm further down the file. */
952de534f79Sstefano_zampini #ifdef BDDC_USE_POD
953de534f79Sstefano_zampini #if !defined(PETSC_MISSING_LAPACK_GESVD)
9543b03a366Sstefano_zampini #define PETSC_MISSING_LAPACK_GESVD 1
955de534f79Sstefano_zampini #define UNDEF_PETSC_MISSING_LAPACK_GESVD 1
956de534f79Sstefano_zampini #endif
9573b03a366Sstefano_zampini #endif
9583b03a366Sstefano_zampini 
9593b03a366Sstefano_zampini #undef __FUNCT__
9603b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCCreateConstraintMatrix"
9613b03a366Sstefano_zampini static PetscErrorCode PCBDDCCreateConstraintMatrix(PC pc)
9623b03a366Sstefano_zampini {
9633b03a366Sstefano_zampini   PetscErrorCode ierr;
9643b03a366Sstefano_zampini   PC_IS*         pcis = (PC_IS*)(pc->data);
9653b03a366Sstefano_zampini   PC_BDDC*       pcbddc = (PC_BDDC*)pc->data;
9663b03a366Sstefano_zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
9673b03a366Sstefano_zampini   PetscInt       *nnz,*vertices,*is_indices;
9683b03a366Sstefano_zampini   PetscScalar    *temp_quadrature_constraint;
969*534831adSStefano Zampini   PetscInt       *temp_indices,*temp_indices_to_constraint,*temp_indices_to_constraint_B,*local_to_B;
9703b03a366Sstefano_zampini   PetscInt       local_primal_size,i,j,k,total_counts,max_size_of_constraint;
9713b03a366Sstefano_zampini   PetscInt       n_constraints,n_vertices,size_of_constraint;
972*534831adSStefano Zampini   PetscScalar    quad_value;
9733b03a366Sstefano_zampini   PetscBool      nnsp_has_cnst=PETSC_FALSE,use_nnsp_true=pcbddc->use_nnsp_true;
9743b03a366Sstefano_zampini   PetscInt       nnsp_size=0,nnsp_addone=0,temp_constraints,temp_start_ptr;
9753b03a366Sstefano_zampini   IS             *used_IS;
9763b03a366Sstefano_zampini   const MatType  impMatType=MATSEQAIJ;
9773b03a366Sstefano_zampini   PetscBLASInt   Bs,Bt,lwork,lierr;
9783b03a366Sstefano_zampini   PetscReal      tol=1.0e-8;
979fcda91b4SJed Brown   MatNullSpace   nearnullsp;
980fcda91b4SJed Brown   const Vec      *nearnullvecs;
9813b03a366Sstefano_zampini   Vec            *localnearnullsp;
9823b03a366Sstefano_zampini   PetscScalar    *work,*temp_basis,*array_vector,*correlation_mat;
9833b03a366Sstefano_zampini   PetscReal      *rwork,*singular_vals;
984*534831adSStefano Zampini   PetscBLASInt   Bone=1,*ipiv;
985*534831adSStefano Zampini   Vec            temp_vec;
986*534831adSStefano Zampini   Mat            temp_mat;
987*534831adSStefano Zampini   KSP            temp_ksp;
988*534831adSStefano Zampini   PetscInt       s,start_constraint,dual_dofs;
989*534831adSStefano Zampini   PetscBool      compute_submatrix,useksp=PETSC_FALSE;
990*534831adSStefano Zampini   PetscInt       *aux_primal_permutation,*aux_primal_numbering;
991*534831adSStefano Zampini   PetscBool      boolforface,*change_basis;
992de534f79Sstefano_zampini /* some ugly conditional declarations */
9933b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
9943b03a366Sstefano_zampini   PetscScalar    dot_result;
9953b03a366Sstefano_zampini   PetscScalar    one=1.0,zero=0.0;
9963b03a366Sstefano_zampini   PetscInt       ii;
9973b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
9983b03a366Sstefano_zampini   PetscScalar    val1,val2;
9993b03a366Sstefano_zampini #endif
10003b03a366Sstefano_zampini #else
10013b03a366Sstefano_zampini   PetscBLASInt   dummy_int;
10023b03a366Sstefano_zampini   PetscScalar    dummy_scalar;
10033b03a366Sstefano_zampini #endif
10043b03a366Sstefano_zampini 
10053b03a366Sstefano_zampini   PetscFunctionBegin;
10063b03a366Sstefano_zampini   /* check if near null space is attached to global mat */
1007fcda91b4SJed Brown   ierr = MatGetNearNullSpace(pc->pmat,&nearnullsp);CHKERRQ(ierr);
1008fcda91b4SJed Brown   if (nearnullsp) {
1009fcda91b4SJed Brown     ierr = MatNullSpaceGetVecs(nearnullsp,&nnsp_has_cnst,&nnsp_size,&nearnullvecs);CHKERRQ(ierr);
10103b03a366Sstefano_zampini   } else { /* if near null space is not provided it uses constants */
10113b03a366Sstefano_zampini     nnsp_has_cnst = PETSC_TRUE;
10123b03a366Sstefano_zampini     use_nnsp_true = PETSC_TRUE;
10133b03a366Sstefano_zampini   }
10143b03a366Sstefano_zampini   if(nnsp_has_cnst) {
10153b03a366Sstefano_zampini     nnsp_addone = 1;
10163b03a366Sstefano_zampini   }
10173b03a366Sstefano_zampini   /*
10183b03a366Sstefano_zampini        Evaluate maximum storage size needed by the procedure
10193b03a366Sstefano_zampini        - temp_indices will contain start index of each constraint stored as follows
10203b03a366Sstefano_zampini        - temp_indices_to_constraint  [temp_indices[i],...,temp[indices[i+1]-1] will contain the indices (in local numbering) on which the constraint acts
1021*534831adSStefano Zampini        - temp_indices_to_constraint_B[temp_indices[i],...,temp[indices[i+1]-1] will contain the indices (in boundary numbering) on which the constraint acts
10223b03a366Sstefano_zampini        - temp_quadrature_constraint  [temp_indices[i],...,temp[indices[i+1]-1] will contain the scalars representing the constraint itself
10233b03a366Sstefano_zampini                                                                                                                                                          */
1024da1bb401SStefano Zampini 
10253b03a366Sstefano_zampini   total_counts = pcbddc->n_ISForFaces+pcbddc->n_ISForEdges;
10263b03a366Sstefano_zampini   total_counts *= (nnsp_addone+nnsp_size);
1027da1bb401SStefano Zampini   ierr = ISGetSize(pcbddc->ISForVertices,&n_vertices);CHKERRQ(ierr);
1028da1bb401SStefano Zampini   total_counts += n_vertices;
10293b03a366Sstefano_zampini   ierr = PetscMalloc((total_counts+1)*sizeof(PetscInt),&temp_indices);CHKERRQ(ierr);
1030*534831adSStefano Zampini   ierr = PetscMalloc((total_counts+1)*sizeof(PetscBool),&change_basis);CHKERRQ(ierr);
10313b03a366Sstefano_zampini   total_counts = 0;
10323b03a366Sstefano_zampini   max_size_of_constraint = 0;
10333b03a366Sstefano_zampini   for(i=0;i<pcbddc->n_ISForEdges+pcbddc->n_ISForFaces;i++){
10343b03a366Sstefano_zampini     if(i<pcbddc->n_ISForEdges){
10353b03a366Sstefano_zampini       used_IS = &pcbddc->ISForEdges[i];
10363b03a366Sstefano_zampini     } else {
10373b03a366Sstefano_zampini       used_IS = &pcbddc->ISForFaces[i-pcbddc->n_ISForEdges];
10383b03a366Sstefano_zampini     }
10393b03a366Sstefano_zampini     ierr = ISGetSize(*used_IS,&j);CHKERRQ(ierr);
10403b03a366Sstefano_zampini     total_counts += j;
10413b03a366Sstefano_zampini     if(j>max_size_of_constraint) max_size_of_constraint=j;
10423b03a366Sstefano_zampini   }
10433b03a366Sstefano_zampini   total_counts *= (nnsp_addone+nnsp_size);
1044da1bb401SStefano Zampini   total_counts += n_vertices;
10453b03a366Sstefano_zampini   ierr = PetscMalloc(total_counts*sizeof(PetscScalar),&temp_quadrature_constraint);CHKERRQ(ierr);
10463b03a366Sstefano_zampini   ierr = PetscMalloc(total_counts*sizeof(PetscInt),&temp_indices_to_constraint);CHKERRQ(ierr);
1047*534831adSStefano Zampini   ierr = PetscMalloc(total_counts*sizeof(PetscInt),&temp_indices_to_constraint_B);CHKERRQ(ierr);
1048*534831adSStefano Zampini   ierr = PetscMalloc(pcis->n*sizeof(PetscInt),&local_to_B);CHKERRQ(ierr);
1049*534831adSStefano Zampini   ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
1050*534831adSStefano Zampini   for(i=0;i<pcis->n;i++) {
1051*534831adSStefano Zampini     local_to_B[i]=-1;
1052*534831adSStefano Zampini   }
1053*534831adSStefano Zampini   for(i=0;i<pcis->n_B;i++) {
1054*534831adSStefano Zampini     local_to_B[is_indices[i]]=i;
1055*534831adSStefano Zampini   }
1056*534831adSStefano Zampini   ierr = ISRestoreIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
1057*534831adSStefano Zampini 
10583b03a366Sstefano_zampini   /* First we issue queries to allocate optimal workspace for LAPACKgesvd or LAPACKsyev/LAPACKheev */
10593b03a366Sstefano_zampini   rwork = 0;
10603b03a366Sstefano_zampini   work = 0;
10613b03a366Sstefano_zampini   singular_vals = 0;
10623b03a366Sstefano_zampini   temp_basis = 0;
10633b03a366Sstefano_zampini   correlation_mat = 0;
10643b03a366Sstefano_zampini   if(!pcbddc->use_nnsp_true) {
10653b03a366Sstefano_zampini     PetscScalar temp_work;
10663b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
10673b03a366Sstefano_zampini     /* POD */
10683b03a366Sstefano_zampini     PetscInt max_n;
10693b03a366Sstefano_zampini     max_n = nnsp_addone+nnsp_size;
10703b03a366Sstefano_zampini     /* using some techniques borrowed from Proper Orthogonal Decomposition */
10713b03a366Sstefano_zampini     ierr = PetscMalloc(max_n*max_n*sizeof(PetscScalar),&correlation_mat);CHKERRQ(ierr);
10723b03a366Sstefano_zampini     ierr = PetscMalloc(max_n*sizeof(PetscReal),&singular_vals);CHKERRQ(ierr);
10733b03a366Sstefano_zampini     ierr = PetscMalloc(max_size_of_constraint*(nnsp_addone+nnsp_size)*sizeof(PetscScalar),&temp_basis);CHKERRQ(ierr);
10743b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
10753b03a366Sstefano_zampini     ierr = PetscMalloc(3*max_n*sizeof(PetscReal),&rwork);CHKERRQ(ierr);
10763b03a366Sstefano_zampini #endif
10773b03a366Sstefano_zampini     /* now we evaluate the optimal workspace using query with lwork=-1 */
10783b03a366Sstefano_zampini     Bt = PetscBLASIntCast(max_n);
10793b03a366Sstefano_zampini     lwork=-1;
10803b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
10813b03a366Sstefano_zampini     LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,&temp_work,&lwork,&lierr);
10823b03a366Sstefano_zampini #else
10833b03a366Sstefano_zampini     LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,&temp_work,&lwork,rwork,&lierr);
10843b03a366Sstefano_zampini #endif
10853b03a366Sstefano_zampini #else /* on missing GESVD */
10863b03a366Sstefano_zampini     /* SVD */
10873b03a366Sstefano_zampini     PetscInt max_n,min_n;
10883b03a366Sstefano_zampini     max_n = max_size_of_constraint;
10893b03a366Sstefano_zampini     min_n = nnsp_addone+nnsp_size;
10903b03a366Sstefano_zampini     if(max_size_of_constraint < ( nnsp_addone+nnsp_size ) ) {
10913b03a366Sstefano_zampini       min_n = max_size_of_constraint;
10923b03a366Sstefano_zampini       max_n = nnsp_addone+nnsp_size;
10933b03a366Sstefano_zampini     }
10943b03a366Sstefano_zampini     ierr = PetscMalloc(min_n*sizeof(PetscReal),&singular_vals);CHKERRQ(ierr);
10953b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
10963b03a366Sstefano_zampini     ierr = PetscMalloc(5*min_n*sizeof(PetscReal),&rwork);CHKERRQ(ierr);
10973b03a366Sstefano_zampini #endif
10983b03a366Sstefano_zampini     /* now we evaluate the optimal workspace using query with lwork=-1 */
10993b03a366Sstefano_zampini     lwork=-1;
11003b03a366Sstefano_zampini     Bs = PetscBLASIntCast(max_n);
11013b03a366Sstefano_zampini     Bt = PetscBLASIntCast(min_n);
11023b03a366Sstefano_zampini     dummy_int = Bs;
1103670f3ff9SJed Brown     ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
11043b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
11053b03a366Sstefano_zampini     LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[0],&Bs,singular_vals,
11063b03a366Sstefano_zampini                  &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,&temp_work,&lwork,&lierr);
11073b03a366Sstefano_zampini #else
11083b03a366Sstefano_zampini     LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[0],&Bs,singular_vals,
11093b03a366Sstefano_zampini                  &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,&temp_work,&lwork,rwork,&lierr);
11103b03a366Sstefano_zampini #endif
11113b03a366Sstefano_zampini     if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SVD Lapack routine %d",(int)lierr);
1112670f3ff9SJed Brown     ierr = PetscFPTrapPop();CHKERRQ(ierr);
11133b03a366Sstefano_zampini #endif
11143b03a366Sstefano_zampini     /* Allocate optimal workspace */
11153b03a366Sstefano_zampini     lwork = PetscBLASIntCast((PetscInt)PetscRealPart(temp_work));
11163b03a366Sstefano_zampini     total_counts = (PetscInt)lwork;
11173b03a366Sstefano_zampini     ierr = PetscMalloc(total_counts*sizeof(PetscScalar),&work);CHKERRQ(ierr);
11183b03a366Sstefano_zampini   }
11193b03a366Sstefano_zampini   /* get local part of global near null space vectors */
11203b03a366Sstefano_zampini   ierr = PetscMalloc(nnsp_size*sizeof(Vec),&localnearnullsp);CHKERRQ(ierr);
11213b03a366Sstefano_zampini   for(k=0;k<nnsp_size;k++) {
11223b03a366Sstefano_zampini     ierr = VecDuplicate(pcis->vec1_N,&localnearnullsp[k]);CHKERRQ(ierr);
1123fcda91b4SJed Brown     ierr = VecScatterBegin(matis->ctx,nearnullvecs[k],localnearnullsp[k],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1124fcda91b4SJed Brown     ierr = VecScatterEnd  (matis->ctx,nearnullvecs[k],localnearnullsp[k],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
11253b03a366Sstefano_zampini   }
11263b03a366Sstefano_zampini   /* Now we can loop on constraining sets */
11273b03a366Sstefano_zampini   total_counts=0;
11283b03a366Sstefano_zampini   temp_indices[0]=0;
1129da1bb401SStefano Zampini   /* vertices */
1130da1bb401SStefano Zampini   PetscBool used_vertex;
1131da1bb401SStefano Zampini   ierr = PetscMalloc(n_vertices*sizeof(PetscInt),&vertices);CHKERRQ(ierr);
1132da1bb401SStefano Zampini   ierr = ISGetIndices(pcbddc->ISForVertices,(const PetscInt**)&is_indices);CHKERRQ(ierr);
1133da1bb401SStefano Zampini   if(nnsp_has_cnst) { /* consider all vertices */
1134da1bb401SStefano Zampini     for(i=0;i<n_vertices;i++) {
1135da1bb401SStefano Zampini       temp_indices_to_constraint[temp_indices[total_counts]]=is_indices[i];
1136*534831adSStefano Zampini       temp_indices_to_constraint_B[temp_indices[total_counts]]=local_to_B[is_indices[i]];
1137da1bb401SStefano Zampini       temp_quadrature_constraint[temp_indices[total_counts]]=1.0;
1138da1bb401SStefano Zampini       temp_indices[total_counts+1]=temp_indices[total_counts]+1;
1139da1bb401SStefano Zampini       vertices[total_counts]=is_indices[i];
1140*534831adSStefano Zampini       change_basis[total_counts]=PETSC_FALSE;
1141da1bb401SStefano Zampini       total_counts++;
1142da1bb401SStefano Zampini     }
1143da1bb401SStefano Zampini   } else { /* consider vertices for which exist at least a localnearnullsp which is not null there */
1144da1bb401SStefano Zampini     for(i=0;i<n_vertices;i++) {
1145da1bb401SStefano Zampini       used_vertex=PETSC_FALSE;
1146da1bb401SStefano Zampini       k=0;
1147da1bb401SStefano Zampini       while(!used_vertex && k<nnsp_size) {
1148da1bb401SStefano Zampini         ierr = VecGetArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
1149da1bb401SStefano Zampini         if(PetscAbsScalar(array_vector[is_indices[i]])>0.0) {
1150da1bb401SStefano Zampini           temp_indices_to_constraint[temp_indices[total_counts]]=is_indices[i];
1151*534831adSStefano Zampini           temp_indices_to_constraint_B[temp_indices[total_counts]]=local_to_B[is_indices[i]];
1152da1bb401SStefano Zampini           temp_quadrature_constraint[temp_indices[total_counts]]=1.0;
1153da1bb401SStefano Zampini           temp_indices[total_counts+1]=temp_indices[total_counts]+1;
1154da1bb401SStefano Zampini           vertices[total_counts]=is_indices[i];
1155*534831adSStefano Zampini           change_basis[total_counts]=PETSC_FALSE;
1156da1bb401SStefano Zampini           total_counts++;
1157da1bb401SStefano Zampini           used_vertex=PETSC_TRUE;
1158da1bb401SStefano Zampini         }
1159da1bb401SStefano Zampini         ierr = VecRestoreArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
1160da1bb401SStefano Zampini         k++;
1161da1bb401SStefano Zampini       }
1162da1bb401SStefano Zampini     }
1163da1bb401SStefano Zampini   }
1164da1bb401SStefano Zampini   ierr = ISRestoreIndices(pcbddc->ISForVertices,(const PetscInt**)&is_indices);CHKERRQ(ierr);
1165da1bb401SStefano Zampini   n_vertices=total_counts;
1166da1bb401SStefano Zampini   /* edges and faces */
11673b03a366Sstefano_zampini   for(i=0;i<pcbddc->n_ISForEdges+pcbddc->n_ISForFaces;i++){
11683b03a366Sstefano_zampini     if(i<pcbddc->n_ISForEdges){
11693b03a366Sstefano_zampini       used_IS = &pcbddc->ISForEdges[i];
1170*534831adSStefano Zampini       boolforface = pcbddc->usechangeofbasis;
11713b03a366Sstefano_zampini     } else {
11723b03a366Sstefano_zampini       used_IS = &pcbddc->ISForFaces[i-pcbddc->n_ISForEdges];
1173*534831adSStefano Zampini       boolforface = pcbddc->usechangeonfaces;
11743b03a366Sstefano_zampini     }
11753b03a366Sstefano_zampini     temp_constraints = 0;          /* zero the number of constraints I have on this conn comp */
11763b03a366Sstefano_zampini     temp_start_ptr = total_counts; /* need to know the starting index of constraints stored */
11773b03a366Sstefano_zampini     ierr = ISGetSize(*used_IS,&size_of_constraint);CHKERRQ(ierr);
11783b03a366Sstefano_zampini     ierr = ISGetIndices(*used_IS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
11793b03a366Sstefano_zampini     if(nnsp_has_cnst) {
11803b03a366Sstefano_zampini       temp_constraints++;
1181*534831adSStefano Zampini       quad_value = (PetscScalar) (1.0/PetscSqrtReal((PetscReal)size_of_constraint));
11823b03a366Sstefano_zampini       for(j=0;j<size_of_constraint;j++) {
11833b03a366Sstefano_zampini         temp_indices_to_constraint[temp_indices[total_counts]+j]=is_indices[j];
1184*534831adSStefano Zampini         temp_indices_to_constraint_B[temp_indices[total_counts]+j]=local_to_B[is_indices[j]];
11853b03a366Sstefano_zampini         temp_quadrature_constraint[temp_indices[total_counts]+j]=quad_value;
11863b03a366Sstefano_zampini       }
11873b03a366Sstefano_zampini       temp_indices[total_counts+1]=temp_indices[total_counts]+size_of_constraint;  /* store new starting point */
1188*534831adSStefano Zampini       change_basis[total_counts]=boolforface;
11893b03a366Sstefano_zampini       total_counts++;
11903b03a366Sstefano_zampini     }
11913b03a366Sstefano_zampini     for(k=0;k<nnsp_size;k++) {
11923b03a366Sstefano_zampini       ierr = VecGetArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
11933b03a366Sstefano_zampini       for(j=0;j<size_of_constraint;j++) {
11943b03a366Sstefano_zampini         temp_indices_to_constraint[temp_indices[total_counts]+j]=is_indices[j];
1195*534831adSStefano Zampini         temp_indices_to_constraint_B[temp_indices[total_counts]+j]=local_to_B[is_indices[j]];
11963b03a366Sstefano_zampini         temp_quadrature_constraint[temp_indices[total_counts]+j]=array_vector[is_indices[j]];
11973b03a366Sstefano_zampini       }
11983b03a366Sstefano_zampini       ierr = VecRestoreArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
1199de534f79Sstefano_zampini       quad_value = 1.0;
1200de534f79Sstefano_zampini       if( use_nnsp_true ) { /* check if array is null on the connected component in case use_nnsp_true has been requested */
1201de534f79Sstefano_zampini         Bs = PetscBLASIntCast(size_of_constraint);
1202de534f79Sstefano_zampini         quad_value = BLASasum_(&Bs,&temp_quadrature_constraint[temp_indices[total_counts]],&Bone);
1203de534f79Sstefano_zampini       }
1204de534f79Sstefano_zampini       if ( quad_value > 0.0 ) { /* keep indices and values */
1205de534f79Sstefano_zampini         temp_constraints++;
12063b03a366Sstefano_zampini         temp_indices[total_counts+1]=temp_indices[total_counts]+size_of_constraint;  /* store new starting point */
1207*534831adSStefano Zampini         change_basis[total_counts]=boolforface;
12083b03a366Sstefano_zampini         total_counts++;
12093b03a366Sstefano_zampini       }
1210de534f79Sstefano_zampini     }
12113b03a366Sstefano_zampini     ierr = ISRestoreIndices(*used_IS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
1212de534f79Sstefano_zampini     /* perform SVD on the constraint if use_nnsp_true has not be requested by the user */
12133b03a366Sstefano_zampini     if(!use_nnsp_true) {
1214de534f79Sstefano_zampini 
12153b03a366Sstefano_zampini       Bs = PetscBLASIntCast(size_of_constraint);
12163b03a366Sstefano_zampini       Bt = PetscBLASIntCast(temp_constraints);
1217de534f79Sstefano_zampini 
12183b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
12193b03a366Sstefano_zampini       ierr = PetscMemzero(correlation_mat,Bt*Bt*sizeof(PetscScalar));CHKERRQ(ierr);
12203b03a366Sstefano_zampini       /* Store upper triangular part of correlation matrix */
12213b03a366Sstefano_zampini       for(j=0;j<temp_constraints;j++) {
12223b03a366Sstefano_zampini         for(k=0;k<j+1;k++) {
12233b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
12243b03a366Sstefano_zampini           /* hand made complex dot product */
12253b03a366Sstefano_zampini           dot_result = 0.0;
12263b03a366Sstefano_zampini           for (ii=0; ii<size_of_constraint; ii++) {
12273b03a366Sstefano_zampini             val1 = temp_quadrature_constraint[temp_indices[temp_start_ptr+j]+ii];
12283b03a366Sstefano_zampini             val2 = temp_quadrature_constraint[temp_indices[temp_start_ptr+k]+ii];
12293b03a366Sstefano_zampini             dot_result += val1*PetscConj(val2);
12303b03a366Sstefano_zampini           }
12313b03a366Sstefano_zampini #else
12323b03a366Sstefano_zampini           dot_result = BLASdot_(&Bs,&temp_quadrature_constraint[temp_indices[temp_start_ptr+j]],&Bone,
12333b03a366Sstefano_zampini                                     &temp_quadrature_constraint[temp_indices[temp_start_ptr+k]],&Bone);
12343b03a366Sstefano_zampini #endif
12353b03a366Sstefano_zampini           correlation_mat[j*temp_constraints+k]=dot_result;
12363b03a366Sstefano_zampini         }
12373b03a366Sstefano_zampini       }
12383b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
12393b03a366Sstefano_zampini       LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,work,&lwork,&lierr);
12403b03a366Sstefano_zampini #else
12413b03a366Sstefano_zampini       LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,work,&lwork,rwork,&lierr);
12423b03a366Sstefano_zampini #endif
12433b03a366Sstefano_zampini       if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in EV Lapack routine %d",(int)lierr);
12443b03a366Sstefano_zampini       /* retain eigenvalues greater than tol: note that lapack SYEV gives eigs in ascending order */
12453b03a366Sstefano_zampini       j=0;
12463b03a366Sstefano_zampini       while( j < Bt && singular_vals[j] < tol) j++;
12473b03a366Sstefano_zampini       total_counts=total_counts-j;
12483b03a366Sstefano_zampini       if(j<temp_constraints) {
12493b03a366Sstefano_zampini         for(k=j;k<Bt;k++) { singular_vals[k]=1.0/PetscSqrtReal(singular_vals[k]); }
12503b03a366Sstefano_zampini         BLASgemm_("N","N",&Bs,&Bt,&Bt,&one,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,correlation_mat,&Bt,&zero,temp_basis,&Bs);
12513b03a366Sstefano_zampini         /* copy POD basis into used quadrature memory */
12523b03a366Sstefano_zampini         for(k=0;k<Bt-j;k++) {
12533b03a366Sstefano_zampini           for(ii=0;ii<size_of_constraint;ii++) {
12543b03a366Sstefano_zampini             temp_quadrature_constraint[temp_indices[temp_start_ptr+k]+ii]=singular_vals[Bt-1-k]*temp_basis[(Bt-1-k)*size_of_constraint+ii];
12553b03a366Sstefano_zampini           }
12563b03a366Sstefano_zampini         }
12573b03a366Sstefano_zampini       }
1258de534f79Sstefano_zampini 
12593b03a366Sstefano_zampini #else  /* on missing GESVD */
1260de534f79Sstefano_zampini 
12613b03a366Sstefano_zampini       PetscInt min_n = temp_constraints;
12623b03a366Sstefano_zampini       if(min_n > size_of_constraint) min_n = size_of_constraint;
12633b03a366Sstefano_zampini       dummy_int = Bs;
1264670f3ff9SJed Brown       ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
12653b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
12663b03a366Sstefano_zampini       LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,singular_vals,
12673b03a366Sstefano_zampini                    &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,work,&lwork,&lierr);
12683b03a366Sstefano_zampini #else
12693b03a366Sstefano_zampini       LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,singular_vals,
12703b03a366Sstefano_zampini                    &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,work,&lwork,rwork,&lierr);
12713b03a366Sstefano_zampini #endif
12723b03a366Sstefano_zampini       if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SVD Lapack routine %d",(int)lierr);
1273670f3ff9SJed Brown       ierr = PetscFPTrapPop();CHKERRQ(ierr);
12743b03a366Sstefano_zampini       /* retain eigenvalues greater than tol: note that lapack SVD gives eigs in descending order */
12753b03a366Sstefano_zampini       j=0;
12763b03a366Sstefano_zampini       while( j < min_n && singular_vals[min_n-j-1] < tol) j++;
12773b03a366Sstefano_zampini       total_counts = total_counts-(PetscInt)Bt+(min_n-j);
12783b03a366Sstefano_zampini #endif
12793b03a366Sstefano_zampini     }
12803b03a366Sstefano_zampini   }
1281*534831adSStefano Zampini 
1282da1bb401SStefano Zampini   n_constraints=total_counts-n_vertices;
1283da1bb401SStefano Zampini   local_primal_size = total_counts;
12843b03a366Sstefano_zampini   /* set quantities in pcbddc data structure */
12853b03a366Sstefano_zampini   pcbddc->n_vertices = n_vertices;
12863b03a366Sstefano_zampini   pcbddc->n_constraints = n_constraints;
1287da1bb401SStefano Zampini   pcbddc->local_primal_size = local_primal_size;
1288*534831adSStefano Zampini 
1289*534831adSStefano Zampini   /* Create constraint matrix */
1290*534831adSStefano Zampini   /* The constraint matrix is used to compute the l2g map of primal dofs */
1291*534831adSStefano Zampini   /* so we need to set it up properly either with or without change of basis */
1292*534831adSStefano Zampini   ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->ConstraintMatrix);CHKERRQ(ierr);
1293*534831adSStefano Zampini   ierr = MatSetType(pcbddc->ConstraintMatrix,impMatType);CHKERRQ(ierr);
1294*534831adSStefano Zampini   ierr = MatSetSizes(pcbddc->ConstraintMatrix,local_primal_size,pcis->n,local_primal_size,pcis->n);CHKERRQ(ierr);
1295*534831adSStefano Zampini   /* compute a local numbering of constraints : vertices first then constraints */
1296*534831adSStefano Zampini   ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
1297*534831adSStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array_vector);CHKERRQ(ierr);
1298*534831adSStefano Zampini   ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&aux_primal_numbering);CHKERRQ(ierr);
1299*534831adSStefano Zampini   ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&aux_primal_permutation);CHKERRQ(ierr);
1300*534831adSStefano Zampini   total_counts=0;
1301*534831adSStefano Zampini   /* find vertices: subdomain corners plus dofs with basis changed */
1302*534831adSStefano Zampini   for(i=0;i<local_primal_size;i++) {
1303*534831adSStefano Zampini     size_of_constraint=temp_indices[i+1]-temp_indices[i];
1304*534831adSStefano Zampini     if(change_basis[i] || size_of_constraint == 1) {
1305*534831adSStefano Zampini       k=0;
1306*534831adSStefano Zampini       while(k < size_of_constraint && array_vector[temp_indices_to_constraint[temp_indices[i]+size_of_constraint-k-1]] != 0.0) {
1307*534831adSStefano Zampini         k=k+1;
1308*534831adSStefano Zampini       }
1309*534831adSStefano Zampini       j=temp_indices_to_constraint[temp_indices[i]+size_of_constraint-k-1];
1310*534831adSStefano Zampini       array_vector[j] = 1.0;
1311*534831adSStefano Zampini       aux_primal_numbering[total_counts]=j;
1312*534831adSStefano Zampini       aux_primal_permutation[total_counts]=total_counts;
1313*534831adSStefano Zampini       total_counts++;
1314*534831adSStefano Zampini     }
1315*534831adSStefano Zampini   }
1316*534831adSStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array_vector);CHKERRQ(ierr);
1317*534831adSStefano Zampini   /* permute indices in order to have a sorted set of vertices */
1318*534831adSStefano Zampini   ierr = PetscSortIntWithPermutation(total_counts,aux_primal_numbering,aux_primal_permutation);
1319*534831adSStefano Zampini   /* nonzero structure */
1320*534831adSStefano Zampini   ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
1321*534831adSStefano Zampini   for(i=0;i<total_counts;i++) {
1322*534831adSStefano Zampini     nnz[i]=1;
1323*534831adSStefano Zampini   }
1324*534831adSStefano Zampini   j=total_counts;
1325*534831adSStefano Zampini   for(i=n_vertices;i<local_primal_size;i++) {
1326*534831adSStefano Zampini     if(!change_basis[i]) {
1327*534831adSStefano Zampini       nnz[j]=temp_indices[i+1]-temp_indices[i];
1328*534831adSStefano Zampini       j++;
1329*534831adSStefano Zampini     }
1330*534831adSStefano Zampini   }
1331*534831adSStefano Zampini   ierr = MatSeqAIJSetPreallocation(pcbddc->ConstraintMatrix,0,nnz);CHKERRQ(ierr);
1332*534831adSStefano Zampini   ierr = PetscFree(nnz);CHKERRQ(ierr);
1333*534831adSStefano Zampini   /* set values in constraint matrix */
1334*534831adSStefano Zampini   for(i=0;i<total_counts;i++) {
1335*534831adSStefano Zampini     j = aux_primal_permutation[i];
1336*534831adSStefano Zampini     k = aux_primal_numbering[j];
1337*534831adSStefano Zampini     ierr = MatSetValue(pcbddc->ConstraintMatrix,i,k,1.0,INSERT_VALUES);CHKERRQ(ierr);
1338*534831adSStefano Zampini   }
1339*534831adSStefano Zampini   for(i=n_vertices;i<local_primal_size;i++) {
1340*534831adSStefano Zampini     if(!change_basis[i]) {
1341*534831adSStefano Zampini       size_of_constraint=temp_indices[i+1]-temp_indices[i];
1342*534831adSStefano Zampini       ierr = MatSetValues(pcbddc->ConstraintMatrix,1,&total_counts,size_of_constraint,&temp_indices_to_constraint[temp_indices[i]],&temp_quadrature_constraint[temp_indices[i]],INSERT_VALUES);CHKERRQ(ierr);
1343*534831adSStefano Zampini       total_counts++;
1344*534831adSStefano Zampini     }
1345*534831adSStefano Zampini   }
1346*534831adSStefano Zampini   ierr = PetscFree(aux_primal_numbering);CHKERRQ(ierr);
1347*534831adSStefano Zampini   ierr = PetscFree(aux_primal_permutation);CHKERRQ(ierr);
1348*534831adSStefano Zampini   /* assembling */
1349*534831adSStefano Zampini   ierr = MatAssemblyBegin(pcbddc->ConstraintMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1350*534831adSStefano Zampini   ierr = MatAssemblyEnd(pcbddc->ConstraintMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1351*534831adSStefano Zampini 
1352*534831adSStefano Zampini   /* Create matrix for change of basis. We don't need it in case pcbddc->usechangeofbasis is FALSE */
1353*534831adSStefano Zampini   if(pcbddc->usechangeofbasis) {
1354*534831adSStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr);
1355*534831adSStefano Zampini     ierr = MatSetType(pcbddc->ChangeOfBasisMatrix,impMatType);CHKERRQ(ierr);
1356*534831adSStefano Zampini     ierr = MatSetSizes(pcbddc->ChangeOfBasisMatrix,pcis->n_B,pcis->n_B,pcis->n_B,pcis->n_B);CHKERRQ(ierr);
1357*534831adSStefano Zampini     /* work arrays */
1358*534831adSStefano Zampini     /* we need to reuse these arrays, so we free them */
1359*534831adSStefano Zampini     ierr = PetscFree(temp_basis);CHKERRQ(ierr);
1360*534831adSStefano Zampini     ierr = PetscFree(work);CHKERRQ(ierr);
1361*534831adSStefano Zampini     ierr = PetscMalloc(pcis->n_B*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
1362*534831adSStefano Zampini     ierr = PetscMalloc((nnsp_addone+nnsp_size)*(nnsp_addone+nnsp_size)*sizeof(PetscScalar),&temp_basis);CHKERRQ(ierr);
1363*534831adSStefano Zampini     ierr = PetscMalloc((nnsp_addone+nnsp_size)*sizeof(PetscScalar),&work);CHKERRQ(ierr);
1364*534831adSStefano Zampini     ierr = PetscMalloc((nnsp_addone+nnsp_size)*sizeof(PetscBLASInt),&ipiv);CHKERRQ(ierr);
1365*534831adSStefano Zampini     for(i=0;i<pcis->n_B;i++) {
1366*534831adSStefano Zampini       nnz[i]=1;
1367*534831adSStefano Zampini     }
1368*534831adSStefano Zampini     /* Overestimated nonzeros per row */
1369*534831adSStefano Zampini     k=1;
1370*534831adSStefano Zampini     for(i=pcbddc->n_vertices;i<local_primal_size;i++) {
1371*534831adSStefano Zampini       if(change_basis[i]) {
1372*534831adSStefano Zampini         size_of_constraint = temp_indices[i+1]-temp_indices[i];
1373*534831adSStefano Zampini         if(k < size_of_constraint) {
1374*534831adSStefano Zampini           k = size_of_constraint;
1375*534831adSStefano Zampini         }
1376*534831adSStefano Zampini         for(j=0;j<size_of_constraint;j++) {
1377*534831adSStefano Zampini           nnz[temp_indices_to_constraint_B[temp_indices[i]+j]] = size_of_constraint;
1378*534831adSStefano Zampini         }
1379*534831adSStefano Zampini       }
1380*534831adSStefano Zampini     }
1381*534831adSStefano Zampini     ierr = MatSeqAIJSetPreallocation(pcbddc->ChangeOfBasisMatrix,0,nnz);CHKERRQ(ierr);
1382*534831adSStefano Zampini     ierr = PetscFree(nnz);CHKERRQ(ierr);
1383*534831adSStefano Zampini     /* Temporary array to store indices */
1384*534831adSStefano Zampini     ierr = PetscMalloc(k*sizeof(PetscInt),&is_indices);CHKERRQ(ierr);
1385*534831adSStefano Zampini     /* Set initial identity in the matrix */
1386*534831adSStefano Zampini     for(i=0;i<pcis->n_B;i++) {
1387*534831adSStefano Zampini       ierr = MatSetValue(pcbddc->ChangeOfBasisMatrix,i,i,1.0,INSERT_VALUES);CHKERRQ(ierr);
1388*534831adSStefano Zampini     }
1389*534831adSStefano Zampini     /* Now we loop on the constraints which need a change of basis */
1390*534831adSStefano Zampini     /* Change of basis matrix is evaluated as the FIRST APPROACH in */
1391*534831adSStefano Zampini     /* Klawonn and Widlund, Dual-primal FETI-DP methods for linear elasticity, (6.2.1) */
1392*534831adSStefano Zampini     temp_constraints = 0;
1393*534831adSStefano Zampini     temp_start_ptr = temp_indices_to_constraint_B[temp_indices[pcbddc->n_vertices]];
1394*534831adSStefano Zampini     for(i=pcbddc->n_vertices;i<local_primal_size;i++) {
1395*534831adSStefano Zampini       if(change_basis[i]) {
1396*534831adSStefano Zampini         compute_submatrix = PETSC_FALSE;
1397*534831adSStefano Zampini         useksp = PETSC_FALSE;
1398*534831adSStefano Zampini         if(temp_start_ptr == temp_indices_to_constraint_B[temp_indices[i]]) {
1399*534831adSStefano Zampini           temp_constraints++;
1400*534831adSStefano Zampini           if(temp_start_ptr != temp_indices_to_constraint_B[temp_indices[i+1]]) {
1401*534831adSStefano Zampini             compute_submatrix = PETSC_TRUE;
1402*534831adSStefano Zampini           }
1403*534831adSStefano Zampini         }
1404*534831adSStefano Zampini         if(compute_submatrix) {
1405*534831adSStefano Zampini           if(temp_constraints > 1 || pcbddc->use_nnsp_true) {
1406*534831adSStefano Zampini             useksp = PETSC_TRUE;
1407*534831adSStefano Zampini           }
1408*534831adSStefano Zampini           size_of_constraint = temp_indices[i+1]-temp_indices[i];
1409*534831adSStefano Zampini           if(useksp) { /* experimental */
1410*534831adSStefano Zampini             ierr = MatCreate(PETSC_COMM_SELF,&temp_mat);CHKERRQ(ierr);
1411*534831adSStefano Zampini             ierr = MatSetType(temp_mat,impMatType);CHKERRQ(ierr);
1412*534831adSStefano Zampini             ierr = MatSetSizes(temp_mat,size_of_constraint,size_of_constraint,size_of_constraint,size_of_constraint);CHKERRQ(ierr);
1413*534831adSStefano Zampini             ierr = MatSeqAIJSetPreallocation(temp_mat,size_of_constraint,PETSC_NULL);CHKERRQ(ierr);
1414*534831adSStefano Zampini           }
1415*534831adSStefano Zampini           /* First _size_of_constraint-temp_constraints_ columns */
1416*534831adSStefano Zampini           dual_dofs = size_of_constraint-temp_constraints;
1417*534831adSStefano Zampini           start_constraint = i+1-temp_constraints;
1418*534831adSStefano Zampini           for(s=0;s<dual_dofs;s++) {
1419*534831adSStefano Zampini             is_indices[0] = s;
1420*534831adSStefano Zampini             for(j=0;j<temp_constraints;j++) {
1421*534831adSStefano Zampini               for(k=0;k<temp_constraints;k++) {
1422*534831adSStefano Zampini                 temp_basis[j*temp_constraints+k]=temp_quadrature_constraint[temp_indices[start_constraint+k]+s+j+1];
1423*534831adSStefano Zampini               }
1424*534831adSStefano Zampini               work[j]=-temp_quadrature_constraint[temp_indices[start_constraint+j]+s];
1425*534831adSStefano Zampini               is_indices[j+1]=s+j+1;
1426*534831adSStefano Zampini             }
1427*534831adSStefano Zampini             Bt = temp_constraints;
1428*534831adSStefano Zampini             ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
1429*534831adSStefano Zampini             LAPACKgesv_(&Bt,&Bone,temp_basis,&Bt,ipiv,work,&Bt,&lierr);
1430*534831adSStefano Zampini             if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GESV Lapack routine %d",(int)lierr);
1431*534831adSStefano Zampini             ierr = PetscFPTrapPop();CHKERRQ(ierr);
1432*534831adSStefano Zampini             j = temp_indices_to_constraint_B[temp_indices[start_constraint]+s];
1433*534831adSStefano Zampini             ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,temp_constraints,&temp_indices_to_constraint_B[temp_indices[start_constraint]+s+1],1,&j,work,INSERT_VALUES);CHKERRQ(ierr);
1434*534831adSStefano Zampini             if(useksp) {
1435*534831adSStefano Zampini               /* temp mat with transposed rows and columns */
1436*534831adSStefano Zampini               ierr = MatSetValues(temp_mat,1,&s,temp_constraints,&is_indices[1],work,INSERT_VALUES);CHKERRQ(ierr);
1437*534831adSStefano Zampini               ierr = MatSetValue(temp_mat,is_indices[0],is_indices[0],1.0,INSERT_VALUES);CHKERRQ(ierr);
1438*534831adSStefano Zampini             }
1439*534831adSStefano Zampini           }
1440*534831adSStefano Zampini           if(useksp) {
1441*534831adSStefano Zampini             /* last rows of temp_mat */
1442*534831adSStefano Zampini             for(j=0;j<size_of_constraint;j++) {
1443*534831adSStefano Zampini               is_indices[j] = j;
1444*534831adSStefano Zampini             }
1445*534831adSStefano Zampini             for(s=0;s<temp_constraints;s++) {
1446*534831adSStefano Zampini               k = s + dual_dofs;
1447*534831adSStefano Zampini               ierr = MatSetValues(temp_mat,1,&k,size_of_constraint,is_indices,&temp_quadrature_constraint[temp_indices[start_constraint+s]],INSERT_VALUES);CHKERRQ(ierr);
1448*534831adSStefano Zampini             }
1449*534831adSStefano Zampini             ierr = MatAssemblyBegin(temp_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1450*534831adSStefano Zampini             ierr = MatAssemblyEnd(temp_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1451*534831adSStefano Zampini             ierr = MatGetVecs(temp_mat,&temp_vec,PETSC_NULL);CHKERRQ(ierr);
1452*534831adSStefano Zampini             ierr = KSPCreate(PETSC_COMM_SELF,&temp_ksp);CHKERRQ(ierr);
1453*534831adSStefano Zampini             ierr = KSPSetOperators(temp_ksp,temp_mat,temp_mat,SAME_PRECONDITIONER);CHKERRQ(ierr);
1454*534831adSStefano Zampini             ierr = KSPSetType(temp_ksp,KSPPREONLY);CHKERRQ(ierr);
1455*534831adSStefano Zampini             ierr = KSPSetUp(temp_ksp);CHKERRQ(ierr);
1456*534831adSStefano Zampini             for(s=0;s<temp_constraints;s++) {
1457*534831adSStefano Zampini               ierr = VecSet(temp_vec,0.0);CHKERRQ(ierr);
1458*534831adSStefano Zampini               ierr = VecSetValue(temp_vec,s+dual_dofs,1.0,INSERT_VALUES);CHKERRQ(ierr);
1459*534831adSStefano Zampini               ierr = VecAssemblyBegin(temp_vec);CHKERRQ(ierr);
1460*534831adSStefano Zampini               ierr = VecAssemblyEnd(temp_vec);CHKERRQ(ierr);
1461*534831adSStefano Zampini               ierr = KSPSolve(temp_ksp,temp_vec,temp_vec);CHKERRQ(ierr);
1462*534831adSStefano Zampini               ierr = VecGetArray(temp_vec,&array_vector);CHKERRQ(ierr);
1463*534831adSStefano Zampini               j = temp_indices_to_constraint_B[temp_indices[start_constraint+s]+size_of_constraint-s-1];
1464*534831adSStefano Zampini               /* last columns of change of basis matrix associated to new primal dofs */
1465*534831adSStefano Zampini               ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,size_of_constraint,&temp_indices_to_constraint_B[temp_indices[start_constraint+s]],1,&j,array_vector,INSERT_VALUES);CHKERRQ(ierr);
1466*534831adSStefano Zampini               ierr = VecRestoreArray(temp_vec,&array_vector);CHKERRQ(ierr);
1467*534831adSStefano Zampini             }
1468*534831adSStefano Zampini             ierr = MatDestroy(&temp_mat);CHKERRQ(ierr);
1469*534831adSStefano Zampini             ierr = KSPDestroy(&temp_ksp);CHKERRQ(ierr);
1470*534831adSStefano Zampini             ierr = VecDestroy(&temp_vec);CHKERRQ(ierr);
1471*534831adSStefano Zampini           } else {
1472*534831adSStefano Zampini             /* last columns of change of basis matrix associated to new primal dofs */
1473*534831adSStefano Zampini             for(s=0;s<temp_constraints;s++) {
1474*534831adSStefano Zampini               j = temp_indices_to_constraint_B[temp_indices[start_constraint+s]+size_of_constraint-s-1];
1475*534831adSStefano Zampini               ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,size_of_constraint,&temp_indices_to_constraint_B[temp_indices[start_constraint+s]],1,&j,&temp_quadrature_constraint[temp_indices[start_constraint+s]],INSERT_VALUES);CHKERRQ(ierr);
1476*534831adSStefano Zampini             }
1477*534831adSStefano Zampini           }
1478*534831adSStefano Zampini           /* prepare for the next cycle */
1479*534831adSStefano Zampini           temp_constraints = 0;
1480*534831adSStefano Zampini           temp_start_ptr = temp_indices_to_constraint_B[temp_indices[i+1]];
1481*534831adSStefano Zampini         }
1482*534831adSStefano Zampini       }
1483*534831adSStefano Zampini     }
1484*534831adSStefano Zampini     /* assembling */
1485*534831adSStefano Zampini     ierr = MatAssemblyBegin(pcbddc->ChangeOfBasisMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1486*534831adSStefano Zampini     ierr = MatAssemblyEnd(pcbddc->ChangeOfBasisMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1487*534831adSStefano Zampini     ierr = PetscFree(ipiv);CHKERRQ(ierr);
1488*534831adSStefano Zampini     ierr = PetscFree(is_indices);CHKERRQ(ierr);
1489*534831adSStefano Zampini   }
14903b03a366Sstefano_zampini   /* free workspace no longer needed */
14913b03a366Sstefano_zampini   ierr = PetscFree(rwork);CHKERRQ(ierr);
14923b03a366Sstefano_zampini   ierr = PetscFree(work);CHKERRQ(ierr);
14933b03a366Sstefano_zampini   ierr = PetscFree(temp_basis);CHKERRQ(ierr);
14943b03a366Sstefano_zampini   ierr = PetscFree(singular_vals);CHKERRQ(ierr);
14953b03a366Sstefano_zampini   ierr = PetscFree(correlation_mat);CHKERRQ(ierr);
14963b03a366Sstefano_zampini   ierr = PetscFree(temp_indices);CHKERRQ(ierr);
1497*534831adSStefano Zampini   ierr = PetscFree(change_basis);CHKERRQ(ierr);
14983b03a366Sstefano_zampini   ierr = PetscFree(temp_indices_to_constraint);CHKERRQ(ierr);
1499*534831adSStefano Zampini   ierr = PetscFree(temp_indices_to_constraint_B);CHKERRQ(ierr);
1500*534831adSStefano Zampini   ierr = PetscFree(local_to_B);CHKERRQ(ierr);
15013b03a366Sstefano_zampini   ierr = PetscFree(temp_quadrature_constraint);CHKERRQ(ierr);
1502da1bb401SStefano Zampini   for(k=0;k<nnsp_size;k++) {
1503da1bb401SStefano Zampini     ierr = VecDestroy(&localnearnullsp[k]);CHKERRQ(ierr);
1504da1bb401SStefano Zampini   }
15053b03a366Sstefano_zampini   ierr = PetscFree(localnearnullsp);CHKERRQ(ierr);
15063b03a366Sstefano_zampini   PetscFunctionReturn(0);
15073b03a366Sstefano_zampini }
/* Remove the PETSC_MISSING_LAPACK_GESVD macro when the guard macro
   UNDEF_PETSC_MISSING_LAPACK_GESVD is defined.
   NOTE(review): presumably the guard is set earlier in this file when
   PETSC_MISSING_LAPACK_GESVD was defined locally rather than by the PETSc
   configuration; the place that sets it is not visible here -- confirm. */
1508de534f79Sstefano_zampini #ifdef UNDEF_PETSC_MISSING_LAPACK_GESVD
15093b03a366Sstefano_zampini #undef PETSC_MISSING_LAPACK_GESVD
15103b03a366Sstefano_zampini #endif
15113b03a366Sstefano_zampini /* -------------------------------------------------------------------------- */
15120c7d97c5SJed Brown #undef __FUNCT__
15130c7d97c5SJed Brown #define __FUNCT__ "PCBDDCCoarseSetUp"
151453cdbc3dSStefano Zampini static PetscErrorCode PCBDDCCoarseSetUp(PC pc)
15150c7d97c5SJed Brown {
15160c7d97c5SJed Brown   PetscErrorCode  ierr;
15170c7d97c5SJed Brown 
15180c7d97c5SJed Brown   PC_IS*            pcis = (PC_IS*)(pc->data);
15190c7d97c5SJed Brown   PC_BDDC*          pcbddc = (PC_BDDC*)pc->data;
15200c7d97c5SJed Brown   Mat_IS            *matis = (Mat_IS*)pc->pmat->data;
1521*534831adSStefano Zampini   Mat               change_mat_all;
15220c7d97c5SJed Brown   IS                is_R_local;
15230c7d97c5SJed Brown   IS                is_V_local;
15240c7d97c5SJed Brown   IS                is_C_local;
15250c7d97c5SJed Brown   IS                is_aux1;
15260c7d97c5SJed Brown   IS                is_aux2;
15270c7d97c5SJed Brown   const VecType     impVecType;
15280c7d97c5SJed Brown   const MatType     impMatType;
15290c7d97c5SJed Brown   PetscInt          n_R=0;
15300c7d97c5SJed Brown   PetscInt          n_D=0;
15310c7d97c5SJed Brown   PetscInt          n_B=0;
15320c7d97c5SJed Brown   PetscScalar       zero=0.0;
15330c7d97c5SJed Brown   PetscScalar       one=1.0;
15340c7d97c5SJed Brown   PetscScalar       m_one=-1.0;
15350c7d97c5SJed Brown   PetscScalar*      array;
15360c7d97c5SJed Brown   PetscScalar       *coarse_submat_vals;
15370c7d97c5SJed Brown   PetscInt          *idx_R_local;
15380c7d97c5SJed Brown   PetscInt          *idx_V_B;
15390c7d97c5SJed Brown   PetscScalar       *coarsefunctions_errors;
15400c7d97c5SJed Brown   PetscScalar       *constraints_errors;
15410c7d97c5SJed Brown   /* auxiliary indices */
1542*534831adSStefano Zampini   PetscInt i,j,k;
1543e269702eSStefano Zampini   /* for verbose output of bddc */
1544e269702eSStefano Zampini   PetscViewer       viewer=pcbddc->dbg_viewer;
1545e269702eSStefano Zampini   PetscBool         dbg_flag=pcbddc->dbg_flag;
1546a0ba757dSStefano Zampini   /* for counting coarse dofs */
1547*534831adSStefano Zampini   PetscInt          n_vertices,n_constraints;
15483b03a366Sstefano_zampini   PetscInt          size_of_constraint;
15493b03a366Sstefano_zampini   PetscInt          *row_cmat_indices;
15503b03a366Sstefano_zampini   PetscScalar       *row_cmat_values;
1551*534831adSStefano Zampini   PetscInt          *vertices,*nnz,*is_indices,*temp_indices;
15520c7d97c5SJed Brown 
15530c7d97c5SJed Brown   PetscFunctionBegin;
15540c7d97c5SJed Brown   /* Set Non-overlapping dimensions */
15550c7d97c5SJed Brown   n_B = pcis->n_B; n_D = pcis->n - n_B;
1556*534831adSStefano Zampini   /* Set types for local objects needed by BDDC preconditioner */
1557*534831adSStefano Zampini   impMatType = MATSEQDENSE;
1558*534831adSStefano Zampini   impVecType = VECSEQ;
1559da1bb401SStefano Zampini   /* get vertex indices from constraint matrix */
1560*534831adSStefano Zampini   ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscInt),&vertices);CHKERRQ(ierr);
1561*534831adSStefano Zampini   n_vertices=0;
1562da1bb401SStefano Zampini   for(i=0;i<pcbddc->local_primal_size;i++) {
1563da1bb401SStefano Zampini     ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
1564da1bb401SStefano Zampini     if(size_of_constraint == 1) {
1565*534831adSStefano Zampini       vertices[n_vertices]=row_cmat_indices[0];
1566*534831adSStefano Zampini       n_vertices++;
1567a0ba757dSStefano Zampini     }
1568da1bb401SStefano Zampini     ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
1569a0ba757dSStefano Zampini   }
1570*534831adSStefano Zampini   /* Set number of constraints */
1571*534831adSStefano Zampini   n_constraints = pcbddc->local_primal_size-n_vertices;
1572*534831adSStefano Zampini 
1573*534831adSStefano Zampini   /* vertices in boundary numbering */
1574*534831adSStefano Zampini   if(n_vertices) {
1575*534831adSStefano Zampini     ierr = VecSet(pcis->vec1_N,m_one);CHKERRQ(ierr);
1576*534831adSStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1577*534831adSStefano Zampini     for (i=0; i<n_vertices; i++) { array[ vertices[i] ] = i; }
1578*534831adSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1579*534831adSStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1580*534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1581*534831adSStefano Zampini     ierr = PetscMalloc(n_vertices*sizeof(PetscInt),&idx_V_B);CHKERRQ(ierr);
1582*534831adSStefano Zampini     ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
1583*534831adSStefano Zampini     for (i=0; i<n_vertices; i++) {
1584*534831adSStefano Zampini       j=0;
1585*534831adSStefano Zampini       while (array[j] != i ) {j++;}
1586*534831adSStefano Zampini       idx_V_B[i]=j;
1587*534831adSStefano Zampini     }
1588*534831adSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
1589*534831adSStefano Zampini   }
1590*534831adSStefano Zampini 
1591*534831adSStefano Zampini   /* transform local matrices if needed */
1592*534831adSStefano Zampini   if(pcbddc->usechangeofbasis) {
1593*534831adSStefano Zampini     ierr = PetscMalloc(pcis->n*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
1594*534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
1595*534831adSStefano Zampini     for(i=0;i<n_D;i++) {
1596*534831adSStefano Zampini       nnz[is_indices[i]]=1;
1597*534831adSStefano Zampini     }
1598*534831adSStefano Zampini     ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
1599*534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
1600*534831adSStefano Zampini     k=1;
1601*534831adSStefano Zampini     for(i=0;i<n_B;i++) {
1602*534831adSStefano Zampini       ierr = MatGetRow(pcbddc->ChangeOfBasisMatrix,i,&j,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr);
1603*534831adSStefano Zampini       nnz[is_indices[i]]=j;
1604*534831adSStefano Zampini       if( k < j) {
1605*534831adSStefano Zampini         k = j;
1606*534831adSStefano Zampini       }
1607*534831adSStefano Zampini       ierr = MatRestoreRow(pcbddc->ChangeOfBasisMatrix,i,&j,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr);
1608*534831adSStefano Zampini     }
1609*534831adSStefano Zampini     ierr = ISRestoreIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
1610*534831adSStefano Zampini     /* assemble change of basis matrix on the whole set of local dofs */
1611*534831adSStefano Zampini     ierr = PetscMalloc(k*sizeof(PetscInt),&temp_indices);CHKERRQ(ierr);
1612*534831adSStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&change_mat_all);CHKERRQ(ierr);
1613*534831adSStefano Zampini     ierr = MatSetSizes(change_mat_all,pcis->n,pcis->n,pcis->n,pcis->n);CHKERRQ(ierr);
1614*534831adSStefano Zampini     ierr = MatSetType(change_mat_all,MATSEQAIJ);CHKERRQ(ierr);
1615*534831adSStefano Zampini     ierr = MatSeqAIJSetPreallocation(change_mat_all,0,nnz);CHKERRQ(ierr);
1616*534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
1617*534831adSStefano Zampini     for(i=0;i<n_D;i++) {
1618*534831adSStefano Zampini       ierr = MatSetValue(change_mat_all,is_indices[i],is_indices[i],1.0,INSERT_VALUES);CHKERRQ(ierr);
1619*534831adSStefano Zampini     }
1620*534831adSStefano Zampini     ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
1621*534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
1622*534831adSStefano Zampini     for(i=0;i<n_B;i++) {
1623*534831adSStefano Zampini       ierr = MatGetRow(pcbddc->ChangeOfBasisMatrix,i,&j,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
1624*534831adSStefano Zampini       for(k=0;k<j;k++) {
1625*534831adSStefano Zampini         temp_indices[k]=is_indices[row_cmat_indices[k]];
1626*534831adSStefano Zampini       }
1627*534831adSStefano Zampini       ierr = MatSetValues(change_mat_all,1,&is_indices[i],j,temp_indices,row_cmat_values,INSERT_VALUES);CHKERRQ(ierr);
1628*534831adSStefano Zampini       ierr = MatRestoreRow(pcbddc->ChangeOfBasisMatrix,i,&j,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
1629*534831adSStefano Zampini     }
1630*534831adSStefano Zampini     ierr = MatAssemblyBegin(change_mat_all,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1631*534831adSStefano Zampini     ierr = MatAssemblyEnd(change_mat_all,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1632*534831adSStefano Zampini     ierr = MatPtAP(matis->A,change_mat_all,MAT_INITIAL_MATRIX,1.0,&pcbddc->local_mat);CHKERRQ(ierr);
1633*534831adSStefano Zampini     ierr = MatDestroy(&pcis->A_IB);CHKERRQ(ierr);
1634*534831adSStefano Zampini     ierr = MatDestroy(&pcis->A_BI);CHKERRQ(ierr);
1635*534831adSStefano Zampini     ierr = MatDestroy(&pcis->A_BB);CHKERRQ(ierr);
1636*534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_I_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&pcis->A_IB);CHKERRQ(ierr);
1637*534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_B_local,pcis->is_I_local,MAT_INITIAL_MATRIX,&pcis->A_BI);CHKERRQ(ierr);
1638*534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_B_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&pcis->A_BB);CHKERRQ(ierr);
1639*534831adSStefano Zampini     ierr = MatDestroy(&change_mat_all);CHKERRQ(ierr);
1640*534831adSStefano Zampini     ierr = PetscFree(nnz);CHKERRQ(ierr);
1641*534831adSStefano Zampini     ierr = PetscFree(temp_indices);CHKERRQ(ierr);
1642*534831adSStefano Zampini   } else {
1643*534831adSStefano Zampini     /* without change of basis, the local matrix is unchanged */
1644*534831adSStefano Zampini     ierr = PetscObjectReference((PetscObject)matis->A);CHKERRQ(ierr);
1645*534831adSStefano Zampini     pcbddc->local_mat = matis->A;
1646*534831adSStefano Zampini   }
1647a0ba757dSStefano Zampini 
16480c7d97c5SJed Brown   /* Dohrmann's notation: dofs are split into R (Remaining: all dofs but the vertices) and V (Vertices) */
16490c7d97c5SJed Brown   ierr = VecSet(pcis->vec1_N,one);CHKERRQ(ierr);
16500c7d97c5SJed Brown   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
16513b03a366Sstefano_zampini   for (i=0;i<n_vertices;i++) { array[ vertices[i] ] = zero; }
16523b03a366Sstefano_zampini   ierr = PetscMalloc(( pcis->n - n_vertices )*sizeof(PetscInt),&idx_R_local);CHKERRQ(ierr);
16530c7d97c5SJed Brown   for (i=0, n_R=0; i<pcis->n; i++) { if (array[i] == one) { idx_R_local[n_R] = i; n_R++; } }
16540c7d97c5SJed Brown   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1655e269702eSStefano Zampini   if(dbg_flag) {
16560c7d97c5SJed Brown     ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
16570c7d97c5SJed Brown     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
16580c7d97c5SJed Brown     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d local dimensions\n",PetscGlobalRank);CHKERRQ(ierr);
16590c7d97c5SJed Brown     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local_size = %d, dirichlet_size = %d, boundary_size = %d\n",pcis->n,n_D,n_B);CHKERRQ(ierr);
16603b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"r_size = %d, v_size = %d, constraints = %d, local_primal_size = %d\n",n_R,n_vertices,n_constraints,pcbddc->local_primal_size);CHKERRQ(ierr);
1661*534831adSStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"pcbddc->n_vertices = %d, pcbddc->n_constraints = %d\n",pcbddc->n_vertices,pcbddc->n_constraints);CHKERRQ(ierr);
16620c7d97c5SJed Brown     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
16630c7d97c5SJed Brown   }
1664*534831adSStefano Zampini 
16650c7d97c5SJed Brown   /* Allocate needed vectors */
1666*534831adSStefano Zampini   ierr = VecDuplicate(pcis->vec1_global,&pcbddc->original_rhs);CHKERRQ(ierr);
16670c7d97c5SJed Brown   ierr = VecDuplicate(pcis->vec1_D,&pcbddc->vec4_D);CHKERRQ(ierr);
16680c7d97c5SJed Brown   ierr = VecCreate(PETSC_COMM_SELF,&pcbddc->vec1_R);CHKERRQ(ierr);
16690c7d97c5SJed Brown   ierr = VecSetSizes(pcbddc->vec1_R,n_R,n_R);CHKERRQ(ierr);
16700c7d97c5SJed Brown   ierr = VecSetType(pcbddc->vec1_R,impVecType);CHKERRQ(ierr);
1671d49ef151SStefano Zampini   ierr = VecDuplicate(pcbddc->vec1_R,&pcbddc->vec2_R);CHKERRQ(ierr);
16720c7d97c5SJed Brown   ierr = VecCreate(PETSC_COMM_SELF,&pcbddc->vec1_P);CHKERRQ(ierr);
16730c7d97c5SJed Brown   ierr = VecSetSizes(pcbddc->vec1_P,pcbddc->local_primal_size,pcbddc->local_primal_size);CHKERRQ(ierr);
16740c7d97c5SJed Brown   ierr = VecSetType(pcbddc->vec1_P,impVecType);CHKERRQ(ierr);
16750c7d97c5SJed Brown 
16760c7d97c5SJed Brown   /* Creating some index sets needed  */
16770c7d97c5SJed Brown   /* For submatrices */
1678da1bb401SStefano Zampini   ierr = ISCreateGeneral(PETSC_COMM_SELF,n_R,idx_R_local,PETSC_OWN_POINTER,&is_R_local);CHKERRQ(ierr);
16793b03a366Sstefano_zampini   if(n_vertices)    {
1680da1bb401SStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,n_vertices,vertices,PETSC_OWN_POINTER,&is_V_local);CHKERRQ(ierr);
16813b03a366Sstefano_zampini   }
1682da1bb401SStefano Zampini   if(n_constraints) {
1683da1bb401SStefano Zampini     ierr = ISCreateStride(PETSC_COMM_SELF,n_constraints,n_vertices,1,&is_C_local);CHKERRQ(ierr);
1684da1bb401SStefano Zampini   }
1685da1bb401SStefano Zampini 
16860c7d97c5SJed Brown   /* For VecScatters pcbddc->R_to_B and (optionally) pcbddc->R_to_D */
16870c7d97c5SJed Brown   {
16880c7d97c5SJed Brown     PetscInt   *aux_array1;
16890c7d97c5SJed Brown     PetscInt   *aux_array2;
16900c7d97c5SJed Brown 
16913b03a366Sstefano_zampini     ierr = PetscMalloc( (pcis->n_B-n_vertices)*sizeof(PetscInt),&aux_array1);CHKERRQ(ierr);
16923b03a366Sstefano_zampini     ierr = PetscMalloc( (pcis->n_B-n_vertices)*sizeof(PetscInt),&aux_array2);CHKERRQ(ierr);
16930c7d97c5SJed Brown 
1694d49ef151SStefano Zampini     ierr = VecSet(pcis->vec1_global,zero);CHKERRQ(ierr);
16950c7d97c5SJed Brown     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
16960c7d97c5SJed Brown     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
16970c7d97c5SJed Brown     ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
16980c7d97c5SJed Brown     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
16990c7d97c5SJed Brown     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
17000c7d97c5SJed Brown     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
17010c7d97c5SJed Brown     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1702da1bb401SStefano Zampini     for (i=0, j=0; i<n_R; i++) { if (array[idx_R_local[i]] > one) { aux_array1[j] = i; j++; } }
17030c7d97c5SJed Brown     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1704da1bb401SStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_COPY_VALUES,&is_aux1);CHKERRQ(ierr);
17050c7d97c5SJed Brown     ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
1706da1bb401SStefano Zampini     for (i=0, j=0; i<n_B; i++) { if (array[i] > one) { aux_array2[j] = i; j++; } }
17073828260eSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
1708da1bb401SStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array2,PETSC_COPY_VALUES,&is_aux2);CHKERRQ(ierr);
17090c7d97c5SJed Brown     ierr = VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_B,is_aux2,&pcbddc->R_to_B);CHKERRQ(ierr);
17100c7d97c5SJed Brown     ierr = PetscFree(aux_array1);CHKERRQ(ierr);
17110c7d97c5SJed Brown     ierr = PetscFree(aux_array2);CHKERRQ(ierr);
17120c7d97c5SJed Brown     ierr = ISDestroy(&is_aux1);CHKERRQ(ierr);
17130c7d97c5SJed Brown     ierr = ISDestroy(&is_aux2);CHKERRQ(ierr);
17140c7d97c5SJed Brown 
1715e269702eSStefano Zampini     if(pcbddc->prec_type || dbg_flag ) {
17160c7d97c5SJed Brown       ierr = PetscMalloc(n_D*sizeof(PetscInt),&aux_array1);CHKERRQ(ierr);
17170c7d97c5SJed Brown       ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1718da1bb401SStefano Zampini       for (i=0, j=0; i<n_R; i++) { if (array[idx_R_local[i]] == one) { aux_array1[j] = i; j++; } }
17190c7d97c5SJed Brown       ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1720da1bb401SStefano Zampini       ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_COPY_VALUES,&is_aux1);CHKERRQ(ierr);
17210c7d97c5SJed Brown       ierr = VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_D,(IS)0,&pcbddc->R_to_D);CHKERRQ(ierr);
17220c7d97c5SJed Brown       ierr = PetscFree(aux_array1);CHKERRQ(ierr);
17230c7d97c5SJed Brown       ierr = ISDestroy(&is_aux1);CHKERRQ(ierr);
17240c7d97c5SJed Brown     }
17250c7d97c5SJed Brown   }
17260c7d97c5SJed Brown 
17270c7d97c5SJed Brown   /* Creating PC contexts for local Dirichlet and Neumann problems */
17280c7d97c5SJed Brown   {
17290c7d97c5SJed Brown     Mat  A_RR;
173053cdbc3dSStefano Zampini     PC   pc_temp;
17310c7d97c5SJed Brown     /* Matrix for Dirichlet problem is A_II -> we already have it from pcis.c code */
173253cdbc3dSStefano Zampini     ierr = KSPCreate(PETSC_COMM_SELF,&pcbddc->ksp_D);CHKERRQ(ierr);
173353cdbc3dSStefano Zampini     ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->ksp_D,(PetscObject)pc,1);CHKERRQ(ierr);
173453cdbc3dSStefano Zampini     ierr = KSPSetOperators(pcbddc->ksp_D,pcis->A_II,pcis->A_II,SAME_PRECONDITIONER);CHKERRQ(ierr);
173553cdbc3dSStefano Zampini     ierr = KSPSetType(pcbddc->ksp_D,KSPPREONLY);CHKERRQ(ierr);
1736da1bb401SStefano Zampini     ierr = KSPSetOptionsPrefix(pcbddc->ksp_D,"dirichlet_");CHKERRQ(ierr);
17370c7d97c5SJed Brown     /* default */
173853cdbc3dSStefano Zampini     ierr = KSPGetPC(pcbddc->ksp_D,&pc_temp);CHKERRQ(ierr);
173953cdbc3dSStefano Zampini     ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr);
17400c7d97c5SJed Brown     /* Allow user's customization */
174153cdbc3dSStefano Zampini     ierr = KSPSetFromOptions(pcbddc->ksp_D);CHKERRQ(ierr);
174253cdbc3dSStefano Zampini     /* Set Up KSP for Dirichlet problem of BDDC */
174353cdbc3dSStefano Zampini     ierr = KSPSetUp(pcbddc->ksp_D);CHKERRQ(ierr);
1744da1bb401SStefano Zampini     if(pcbddc->dbg_flag) ierr = KSPView(pcbddc->ksp_D,PETSC_VIEWER_STDOUT_SELF);
17450c7d97c5SJed Brown     /* Matrix for Neumann problem is A_RR -> we need to create it */
1746*534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,is_R_local,is_R_local,MAT_INITIAL_MATRIX,&A_RR);CHKERRQ(ierr);
174753cdbc3dSStefano Zampini     ierr = KSPCreate(PETSC_COMM_SELF,&pcbddc->ksp_R);CHKERRQ(ierr);
174853cdbc3dSStefano Zampini     ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->ksp_R,(PetscObject)pc,1);CHKERRQ(ierr);
174953cdbc3dSStefano Zampini     ierr = KSPSetOperators(pcbddc->ksp_R,A_RR,A_RR,SAME_PRECONDITIONER);CHKERRQ(ierr);
175053cdbc3dSStefano Zampini     ierr = KSPSetType(pcbddc->ksp_R,KSPPREONLY);CHKERRQ(ierr);
1751da1bb401SStefano Zampini     ierr = KSPSetOptionsPrefix(pcbddc->ksp_R,"neumann_");CHKERRQ(ierr);
17520c7d97c5SJed Brown     /* default */
175353cdbc3dSStefano Zampini     ierr = KSPGetPC(pcbddc->ksp_R,&pc_temp);CHKERRQ(ierr);
175453cdbc3dSStefano Zampini     ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr);
17550c7d97c5SJed Brown     /* Allow user's customization */
175653cdbc3dSStefano Zampini     ierr = KSPSetFromOptions(pcbddc->ksp_R);CHKERRQ(ierr);
175753cdbc3dSStefano Zampini     /* Set Up KSP for Neumann problem of BDDC */
175853cdbc3dSStefano Zampini     ierr = KSPSetUp(pcbddc->ksp_R);CHKERRQ(ierr);
1759da1bb401SStefano Zampini     if(pcbddc->dbg_flag) ierr = KSPView(pcbddc->ksp_R,PETSC_VIEWER_STDOUT_SELF);
1760a0ba757dSStefano Zampini     /* check Dirichlet and Neumann solvers */
1761e269702eSStefano Zampini     if(pcbddc->dbg_flag) {
17620c7d97c5SJed Brown       Vec temp_vec;
17630c7d97c5SJed Brown       PetscScalar value;
17640c7d97c5SJed Brown 
1765a0ba757dSStefano Zampini       ierr = VecDuplicate(pcis->vec1_D,&temp_vec);CHKERRQ(ierr);
1766a0ba757dSStefano Zampini       ierr = VecSetRandom(pcis->vec1_D,PETSC_NULL);CHKERRQ(ierr);
1767a0ba757dSStefano Zampini       ierr = MatMult(pcis->A_II,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
1768a0ba757dSStefano Zampini       ierr = KSPSolve(pcbddc->ksp_D,pcis->vec2_D,temp_vec);CHKERRQ(ierr);
1769a0ba757dSStefano Zampini       ierr = VecAXPY(temp_vec,m_one,pcis->vec1_D);CHKERRQ(ierr);
1770a0ba757dSStefano Zampini       ierr = VecNorm(temp_vec,NORM_INFINITY,&value);CHKERRQ(ierr);
1771a0ba757dSStefano Zampini       ierr = VecDestroy(&temp_vec);CHKERRQ(ierr);
1772a0ba757dSStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
1773a0ba757dSStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
1774a0ba757dSStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Checking solution of Dirichlet and Neumann problems\n");CHKERRQ(ierr);
1775a0ba757dSStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d infinity error for Dirichlet solve = % 1.14e \n",PetscGlobalRank,value);CHKERRQ(ierr);
1776d49ef151SStefano Zampini       ierr = VecDuplicate(pcbddc->vec1_R,&temp_vec);CHKERRQ(ierr);
1777d49ef151SStefano Zampini       ierr = VecSetRandom(pcbddc->vec1_R,PETSC_NULL);CHKERRQ(ierr);
1778d49ef151SStefano Zampini       ierr = MatMult(A_RR,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
1779d49ef151SStefano Zampini       ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec2_R,temp_vec);CHKERRQ(ierr);
1780d49ef151SStefano Zampini       ierr = VecAXPY(temp_vec,m_one,pcbddc->vec1_R);CHKERRQ(ierr);
1781d49ef151SStefano Zampini       ierr = VecNorm(temp_vec,NORM_INFINITY,&value);CHKERRQ(ierr);
1782e269702eSStefano Zampini       ierr = VecDestroy(&temp_vec);CHKERRQ(ierr);
17830c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d infinity error for  Neumann  solve = % 1.14e \n",PetscGlobalRank,value);CHKERRQ(ierr);
1784d49ef151SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
17850c7d97c5SJed Brown     }
17860c7d97c5SJed Brown     /* free Neumann problem's matrix */
17870c7d97c5SJed Brown     ierr = MatDestroy(&A_RR);CHKERRQ(ierr);
17880c7d97c5SJed Brown   }
17890c7d97c5SJed Brown 
17900c7d97c5SJed Brown   /* Assemble all remaining stuff needed to apply BDDC  */
17910c7d97c5SJed Brown   {
17920c7d97c5SJed Brown     Mat          A_RV,A_VR,A_VV;
17930c7d97c5SJed Brown     Mat          M1,M2;
17940c7d97c5SJed Brown     Mat          C_CR;
17953b03a366Sstefano_zampini     Mat          AUXMAT;
17960c7d97c5SJed Brown     Vec          vec1_C;
17970c7d97c5SJed Brown     Vec          vec2_C;
17980c7d97c5SJed Brown     Vec          vec1_V;
17990c7d97c5SJed Brown     Vec          vec2_V;
18000c7d97c5SJed Brown     PetscInt     *nnz;
18010c7d97c5SJed Brown     PetscInt     *auxindices;
180253cdbc3dSStefano Zampini     PetscInt     index;
18030c7d97c5SJed Brown     PetscScalar* array2;
18040c7d97c5SJed Brown     MatFactorInfo matinfo;
18050c7d97c5SJed Brown 
18060c7d97c5SJed Brown     /* Allocating some extra storage just to be safe */
18070c7d97c5SJed Brown     ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
18080c7d97c5SJed Brown     ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&auxindices);CHKERRQ(ierr);
18090c7d97c5SJed Brown     for(i=0;i<pcis->n;i++) {auxindices[i]=i;}
18100c7d97c5SJed Brown 
18110c7d97c5SJed Brown     /* some work vectors on vertices and/or constraints */
18123b03a366Sstefano_zampini     if(n_vertices) {
18130c7d97c5SJed Brown       ierr = VecCreate(PETSC_COMM_SELF,&vec1_V);CHKERRQ(ierr);
18143b03a366Sstefano_zampini       ierr = VecSetSizes(vec1_V,n_vertices,n_vertices);CHKERRQ(ierr);
18150c7d97c5SJed Brown       ierr = VecSetType(vec1_V,impVecType);CHKERRQ(ierr);
18160c7d97c5SJed Brown       ierr = VecDuplicate(vec1_V,&vec2_V);CHKERRQ(ierr);
18170c7d97c5SJed Brown     }
1818*534831adSStefano Zampini     if(n_constraints) {
18190c7d97c5SJed Brown       ierr = VecCreate(PETSC_COMM_SELF,&vec1_C);CHKERRQ(ierr);
1820*534831adSStefano Zampini       ierr = VecSetSizes(vec1_C,n_constraints,n_constraints);CHKERRQ(ierr);
18210c7d97c5SJed Brown       ierr = VecSetType(vec1_C,impVecType);CHKERRQ(ierr);
18220c7d97c5SJed Brown       ierr = VecDuplicate(vec1_C,&vec2_C);CHKERRQ(ierr);
18230c7d97c5SJed Brown       ierr = VecDuplicate(vec1_C,&pcbddc->vec1_C);CHKERRQ(ierr);
18240c7d97c5SJed Brown     }
18250c7d97c5SJed Brown     /* Precompute data needed for preprocessing and application of BDDC */
18263b03a366Sstefano_zampini     if(n_constraints) {
18270c7d97c5SJed Brown       /* some work vectors */
18280c7d97c5SJed Brown       ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->local_auxmat2);CHKERRQ(ierr);
18293b03a366Sstefano_zampini       ierr = MatSetSizes(pcbddc->local_auxmat2,n_R,n_constraints,n_R,n_constraints);CHKERRQ(ierr);
18300c7d97c5SJed Brown       ierr = MatSetType(pcbddc->local_auxmat2,impMatType);CHKERRQ(ierr);
18313b03a366Sstefano_zampini       ierr = MatSeqDenseSetPreallocation(pcbddc->local_auxmat2,PETSC_NULL);CHKERRQ(ierr);
18320c7d97c5SJed Brown 
18330c7d97c5SJed Brown       /* Assemble local_auxmat2 = - A_{RR}^{-1} C^T_{CR} needed by BDDC application */
18343b03a366Sstefano_zampini       for(i=0;i<n_constraints;i++) {
1835d49ef151SStefano Zampini         ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr);
18363b03a366Sstefano_zampini         ierr = VecSet(pcbddc->vec1_R,zero);CHKERRQ(ierr);
18373b03a366Sstefano_zampini         /* Get row of constraint matrix in R numbering */
18380c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
18393b03a366Sstefano_zampini         ierr = MatGetRow(pcbddc->ConstraintMatrix,n_vertices+i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
18403b03a366Sstefano_zampini         for(j=0;j<size_of_constraint;j++) { array[ row_cmat_indices[j] ] = - row_cmat_values[j]; }
18413b03a366Sstefano_zampini         ierr = MatRestoreRow(pcbddc->ConstraintMatrix,n_vertices+i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
18420c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
18430c7d97c5SJed Brown         for(j=0;j<n_R;j++) { array2[j] = array[ idx_R_local[j] ]; }
18440c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
18450c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
18463b03a366Sstefano_zampini         /* Solve for row of constraint matrix in R numbering */
184753cdbc3dSStefano Zampini         ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
18483b03a366Sstefano_zampini         /* Set values */
18490c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec2_R,&array);CHKERRQ(ierr);
18503b03a366Sstefano_zampini         ierr = MatSetValues(pcbddc->local_auxmat2,n_R,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
18510c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec2_R,&array);CHKERRQ(ierr);
18520c7d97c5SJed Brown       }
18530c7d97c5SJed Brown       ierr = MatAssemblyBegin(pcbddc->local_auxmat2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
18540c7d97c5SJed Brown       ierr = MatAssemblyEnd(pcbddc->local_auxmat2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
18550c7d97c5SJed Brown 
18560c7d97c5SJed Brown       /* Create Constraint matrix on R nodes: C_{CR}  */
18573b03a366Sstefano_zampini       ierr = MatGetSubMatrix(pcbddc->ConstraintMatrix,is_C_local,is_R_local,MAT_INITIAL_MATRIX,&C_CR);CHKERRQ(ierr);
18580c7d97c5SJed Brown       ierr = ISDestroy(&is_C_local);CHKERRQ(ierr);
18590c7d97c5SJed Brown 
18600c7d97c5SJed Brown       /* Assemble AUXMAT = ( LUFactor )( -C_{CR} A_{RR}^{-1} C^T_{CR} )^{-1} */
18610c7d97c5SJed Brown       ierr = MatMatMult(C_CR,pcbddc->local_auxmat2,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&AUXMAT);CHKERRQ(ierr);
1862d49ef151SStefano Zampini       ierr = MatFactorInfoInitialize(&matinfo);CHKERRQ(ierr);
18633b03a366Sstefano_zampini       ierr = ISCreateStride(PETSC_COMM_SELF,n_constraints,0,1,&is_aux1);CHKERRQ(ierr);
18640c7d97c5SJed Brown       ierr = MatLUFactor(AUXMAT,is_aux1,is_aux1,&matinfo);CHKERRQ(ierr);
18650c7d97c5SJed Brown       ierr = ISDestroy(&is_aux1);CHKERRQ(ierr);
18660c7d97c5SJed Brown 
18673b03a366Sstefano_zampini       /* Assemble explicitly M1 = ( C_{CR} A_{RR}^{-1} C^T_{CR} )^{-1} needed in preproc  */
1868d49ef151SStefano Zampini       ierr = MatCreate(PETSC_COMM_SELF,&M1);CHKERRQ(ierr);
18693b03a366Sstefano_zampini       ierr = MatSetSizes(M1,n_constraints,n_constraints,n_constraints,n_constraints);CHKERRQ(ierr);
18700c7d97c5SJed Brown       ierr = MatSetType(M1,impMatType);CHKERRQ(ierr);
18713b03a366Sstefano_zampini       ierr = MatSeqDenseSetPreallocation(M1,PETSC_NULL);CHKERRQ(ierr);
18723b03a366Sstefano_zampini       for(i=0;i<n_constraints;i++) {
18730c7d97c5SJed Brown         ierr = VecSet(vec1_C,zero);CHKERRQ(ierr);
18740c7d97c5SJed Brown         ierr = VecSetValue(vec1_C,i,one,INSERT_VALUES);CHKERRQ(ierr);
18750c7d97c5SJed Brown         ierr = VecAssemblyBegin(vec1_C);CHKERRQ(ierr);
18760c7d97c5SJed Brown         ierr = VecAssemblyEnd(vec1_C);CHKERRQ(ierr);
18770c7d97c5SJed Brown         ierr = MatSolve(AUXMAT,vec1_C,vec2_C);CHKERRQ(ierr);
18780c7d97c5SJed Brown         ierr = VecScale(vec2_C,m_one);CHKERRQ(ierr);
18790c7d97c5SJed Brown         ierr = VecGetArray(vec2_C,&array);CHKERRQ(ierr);
18803b03a366Sstefano_zampini         ierr = MatSetValues(M1,n_constraints,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
18810c7d97c5SJed Brown         ierr = VecRestoreArray(vec2_C,&array);CHKERRQ(ierr);
18820c7d97c5SJed Brown       }
18830c7d97c5SJed Brown       ierr = MatAssemblyBegin(M1,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
18840c7d97c5SJed Brown       ierr = MatAssemblyEnd(M1,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
18850c7d97c5SJed Brown       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
18860c7d97c5SJed Brown       /* Assemble local_auxmat1 = M1*C_{CR} needed by BDDC application in KSP and in preproc */
18870c7d97c5SJed Brown       ierr = MatMatMult(M1,C_CR,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&pcbddc->local_auxmat1);CHKERRQ(ierr);
18880c7d97c5SJed Brown 
18890c7d97c5SJed Brown     }
18900c7d97c5SJed Brown 
18910c7d97c5SJed Brown     /* Get submatrices from subdomain matrix */
18923b03a366Sstefano_zampini     if(n_vertices){
1893*534831adSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->local_mat,is_R_local,is_V_local,MAT_INITIAL_MATRIX,&A_RV);CHKERRQ(ierr);
1894*534831adSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->local_mat,is_V_local,is_R_local,MAT_INITIAL_MATRIX,&A_VR);CHKERRQ(ierr);
1895*534831adSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->local_mat,is_V_local,is_V_local,MAT_INITIAL_MATRIX,&A_VV);CHKERRQ(ierr);
18960c7d97c5SJed Brown       /* Assemble M2 = A_RR^{-1}A_RV */
1897d49ef151SStefano Zampini       ierr = MatCreate(PETSC_COMM_SELF,&M2);CHKERRQ(ierr);
18983b03a366Sstefano_zampini       ierr = MatSetSizes(M2,n_R,n_vertices,n_R,n_vertices);CHKERRQ(ierr);
18990c7d97c5SJed Brown       ierr = MatSetType(M2,impMatType);CHKERRQ(ierr);
19003b03a366Sstefano_zampini       ierr = MatSeqDenseSetPreallocation(M2,PETSC_NULL);CHKERRQ(ierr);
19013b03a366Sstefano_zampini       for(i=0;i<n_vertices;i++) {
19020c7d97c5SJed Brown         ierr = VecSet(vec1_V,zero);CHKERRQ(ierr);
19030c7d97c5SJed Brown         ierr = VecSetValue(vec1_V,i,one,INSERT_VALUES);CHKERRQ(ierr);
19040c7d97c5SJed Brown         ierr = VecAssemblyBegin(vec1_V);CHKERRQ(ierr);
19050c7d97c5SJed Brown         ierr = VecAssemblyEnd(vec1_V);CHKERRQ(ierr);
19060c7d97c5SJed Brown         ierr = MatMult(A_RV,vec1_V,pcbddc->vec1_R);CHKERRQ(ierr);
190753cdbc3dSStefano Zampini         ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
19080c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec2_R,&array);CHKERRQ(ierr);
19093b03a366Sstefano_zampini         ierr = MatSetValues(M2,n_R,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
19100c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec2_R,&array);CHKERRQ(ierr);
19110c7d97c5SJed Brown       }
19120c7d97c5SJed Brown       ierr = MatAssemblyBegin(M2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
19130c7d97c5SJed Brown       ierr = MatAssemblyEnd(M2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
19140c7d97c5SJed Brown     }
19150c7d97c5SJed Brown 
19160c7d97c5SJed Brown     /* Matrix of coarse basis functions (local) */
1917d49ef151SStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->coarse_phi_B);CHKERRQ(ierr);
19180c7d97c5SJed Brown     ierr = MatSetSizes(pcbddc->coarse_phi_B,n_B,pcbddc->local_primal_size,n_B,pcbddc->local_primal_size);CHKERRQ(ierr);
19190c7d97c5SJed Brown     ierr = MatSetType(pcbddc->coarse_phi_B,impMatType);CHKERRQ(ierr);
19203b03a366Sstefano_zampini     ierr = MatSeqDenseSetPreallocation(pcbddc->coarse_phi_B,PETSC_NULL);CHKERRQ(ierr);
1921e269702eSStefano Zampini     if(pcbddc->prec_type || dbg_flag ) {
1922d49ef151SStefano Zampini       ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->coarse_phi_D);CHKERRQ(ierr);
19230c7d97c5SJed Brown       ierr = MatSetSizes(pcbddc->coarse_phi_D,n_D,pcbddc->local_primal_size,n_D,pcbddc->local_primal_size);CHKERRQ(ierr);
19240c7d97c5SJed Brown       ierr = MatSetType(pcbddc->coarse_phi_D,impMatType);CHKERRQ(ierr);
19253b03a366Sstefano_zampini       ierr = MatSeqDenseSetPreallocation(pcbddc->coarse_phi_D,PETSC_NULL);CHKERRQ(ierr);
19260c7d97c5SJed Brown     }
19270c7d97c5SJed Brown 
1928e269702eSStefano Zampini     if(dbg_flag) {
19290c7d97c5SJed Brown       ierr = PetscMalloc( pcbddc->local_primal_size*sizeof(PetscScalar),&coarsefunctions_errors);CHKERRQ(ierr);
19300c7d97c5SJed Brown       ierr = PetscMalloc( pcbddc->local_primal_size*sizeof(PetscScalar),&constraints_errors);CHKERRQ(ierr);
19310c7d97c5SJed Brown     }
19323b03a366Sstefano_zampini     /* Subdomain contribution (Non-overlapping) to coarse matrix  */
19330c7d97c5SJed Brown     ierr = PetscMalloc ((pcbddc->local_primal_size)*(pcbddc->local_primal_size)*sizeof(PetscScalar),&coarse_submat_vals);CHKERRQ(ierr);
19340c7d97c5SJed Brown 
19350c7d97c5SJed Brown     /* We are now ready to evaluate coarse basis functions and subdomain contribution to coarse problem */
19363b03a366Sstefano_zampini     for(i=0;i<n_vertices;i++){
19370c7d97c5SJed Brown       ierr = VecSet(vec1_V,zero);CHKERRQ(ierr);
19380c7d97c5SJed Brown       ierr = VecSetValue(vec1_V,i,one,INSERT_VALUES);CHKERRQ(ierr);
19390c7d97c5SJed Brown       ierr = VecAssemblyBegin(vec1_V);CHKERRQ(ierr);
19400c7d97c5SJed Brown       ierr = VecAssemblyEnd(vec1_V);CHKERRQ(ierr);
19410c7d97c5SJed Brown       /* solution of saddle point problem */
19420c7d97c5SJed Brown       ierr = MatMult(M2,vec1_V,pcbddc->vec1_R);CHKERRQ(ierr);
19430c7d97c5SJed Brown       ierr = VecScale(pcbddc->vec1_R,m_one);CHKERRQ(ierr);
19443b03a366Sstefano_zampini       if(n_constraints) {
19450c7d97c5SJed Brown         ierr = MatMult(pcbddc->local_auxmat1,pcbddc->vec1_R,vec1_C);CHKERRQ(ierr);
19460c7d97c5SJed Brown         ierr = MatMultAdd(pcbddc->local_auxmat2,vec1_C,pcbddc->vec1_R,pcbddc->vec1_R);CHKERRQ(ierr);
19470c7d97c5SJed Brown         ierr = VecScale(vec1_C,m_one);CHKERRQ(ierr);
19480c7d97c5SJed Brown       }
19490c7d97c5SJed Brown       ierr = MatMult(A_VR,pcbddc->vec1_R,vec2_V);CHKERRQ(ierr);
19500c7d97c5SJed Brown       ierr = MatMultAdd(A_VV,vec1_V,vec2_V,vec2_V);CHKERRQ(ierr);
19510c7d97c5SJed Brown 
19520c7d97c5SJed Brown       /* Set values in coarse basis function and subdomain part of coarse_mat */
19530c7d97c5SJed Brown       /* coarse basis functions */
19540c7d97c5SJed Brown       ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr);
19550c7d97c5SJed Brown       ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
19560c7d97c5SJed Brown       ierr = VecScatterEnd  (pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
19570c7d97c5SJed Brown       ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
19583b03a366Sstefano_zampini       ierr = MatSetValues(pcbddc->coarse_phi_B,n_B,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
19590c7d97c5SJed Brown       ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
19600c7d97c5SJed Brown       ierr = MatSetValue(pcbddc->coarse_phi_B,idx_V_B[i],i,one,INSERT_VALUES);CHKERRQ(ierr);
1961e269702eSStefano Zampini       if( pcbddc->prec_type || dbg_flag  ) {
19620c7d97c5SJed Brown         ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
19630c7d97c5SJed Brown         ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
19640c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_D,&array);CHKERRQ(ierr);
19653b03a366Sstefano_zampini         ierr = MatSetValues(pcbddc->coarse_phi_D,n_D,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
19660c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_D,&array);CHKERRQ(ierr);
19670c7d97c5SJed Brown       }
19680c7d97c5SJed Brown       /* subdomain contribution to coarse matrix */
19690c7d97c5SJed Brown       ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
1970da1bb401SStefano Zampini       for(j=0;j<n_vertices;j++) { coarse_submat_vals[i*pcbddc->local_primal_size+j] = array[j]; } /* WARNING -> column major ordering */
19710c7d97c5SJed Brown       ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
19723b03a366Sstefano_zampini       if(n_constraints) {
19730c7d97c5SJed Brown         ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
1974da1bb401SStefano Zampini         for(j=0;j<n_constraints;j++) { coarse_submat_vals[i*pcbddc->local_primal_size+j+n_vertices] = array[j]; } /* WARNING -> column major ordering */
19750c7d97c5SJed Brown         ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
19760c7d97c5SJed Brown       }
19770c7d97c5SJed Brown 
1978e269702eSStefano Zampini       if( dbg_flag ) {
19790c7d97c5SJed Brown         /* assemble subdomain vector on nodes */
1980d49ef151SStefano Zampini         ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr);
19810c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
19820c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
19830c7d97c5SJed Brown         for(j=0;j<n_R;j++) { array[idx_R_local[j]] = array2[j]; }
19843b03a366Sstefano_zampini         array[ vertices[i] ] = one;
19850c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
19860c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
19870c7d97c5SJed Brown         /* assemble subdomain vector of lagrange multipliers (i.e. primal nodes) */
1988d49ef151SStefano Zampini         ierr = VecSet(pcbddc->vec1_P,zero);CHKERRQ(ierr);
19890c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
19900c7d97c5SJed Brown         ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
19913b03a366Sstefano_zampini         for(j=0;j<n_vertices;j++) { array2[j]=array[j]; }
19920c7d97c5SJed Brown         ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
19933b03a366Sstefano_zampini         if(n_constraints) {
19940c7d97c5SJed Brown           ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
19953b03a366Sstefano_zampini           for(j=0;j<n_constraints;j++) { array2[j+n_vertices]=array[j]; }
19960c7d97c5SJed Brown           ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
19970c7d97c5SJed Brown         }
19980c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
19990c7d97c5SJed Brown         ierr = VecScale(pcbddc->vec1_P,m_one);CHKERRQ(ierr);
20000c7d97c5SJed Brown         /* check saddle point solution */
2001*534831adSStefano Zampini         ierr = MatMult(pcbddc->local_mat,pcis->vec1_N,pcis->vec2_N);CHKERRQ(ierr);
20023b03a366Sstefano_zampini         ierr = MatMultTransposeAdd(pcbddc->ConstraintMatrix,pcbddc->vec1_P,pcis->vec2_N,pcis->vec2_N);CHKERRQ(ierr);
20033b03a366Sstefano_zampini         ierr = VecNorm(pcis->vec2_N,NORM_INFINITY,&coarsefunctions_errors[i]);CHKERRQ(ierr);
20043b03a366Sstefano_zampini         ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr);
20050c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
20063b03a366Sstefano_zampini         array[i]=array[i]+m_one;  /* shift by the identity matrix */
20070c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
20083b03a366Sstefano_zampini         ierr = VecNorm(pcbddc->vec1_P,NORM_INFINITY,&constraints_errors[i]);CHKERRQ(ierr);
20090c7d97c5SJed Brown       }
20100c7d97c5SJed Brown     }
20110c7d97c5SJed Brown 
20123b03a366Sstefano_zampini     for(i=0;i<n_constraints;i++){
2013d49ef151SStefano Zampini       ierr = VecSet(vec2_C,zero);CHKERRQ(ierr);
20140c7d97c5SJed Brown       ierr = VecSetValue(vec2_C,i,m_one,INSERT_VALUES);CHKERRQ(ierr);
20150c7d97c5SJed Brown       ierr = VecAssemblyBegin(vec2_C);CHKERRQ(ierr);
20160c7d97c5SJed Brown       ierr = VecAssemblyEnd(vec2_C);CHKERRQ(ierr);
20170c7d97c5SJed Brown       /* solution of saddle point problem */
20180c7d97c5SJed Brown       ierr = MatMult(M1,vec2_C,vec1_C);CHKERRQ(ierr);
20190c7d97c5SJed Brown       ierr = MatMult(pcbddc->local_auxmat2,vec1_C,pcbddc->vec1_R);CHKERRQ(ierr);
20200c7d97c5SJed Brown       ierr = VecScale(vec1_C,m_one);CHKERRQ(ierr);
20213b03a366Sstefano_zampini       if(n_vertices) { ierr = MatMult(A_VR,pcbddc->vec1_R,vec2_V);CHKERRQ(ierr); }
20220c7d97c5SJed Brown       /* Set values in coarse basis function and subdomain part of coarse_mat */
20230c7d97c5SJed Brown       /* coarse basis functions */
20243b03a366Sstefano_zampini       index=i+n_vertices;
20250c7d97c5SJed Brown       ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr);
20260c7d97c5SJed Brown       ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20270c7d97c5SJed Brown       ierr = VecScatterEnd  (pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20280c7d97c5SJed Brown       ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
202953cdbc3dSStefano Zampini       ierr = MatSetValues(pcbddc->coarse_phi_B,n_B,auxindices,1,&index,array,INSERT_VALUES);CHKERRQ(ierr);
20300c7d97c5SJed Brown       ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
2031e269702eSStefano Zampini       if( pcbddc->prec_type || dbg_flag ) {
20320c7d97c5SJed Brown         ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20330c7d97c5SJed Brown         ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20340c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_D,&array);CHKERRQ(ierr);
203553cdbc3dSStefano Zampini         ierr = MatSetValues(pcbddc->coarse_phi_D,n_D,auxindices,1,&index,array,INSERT_VALUES);CHKERRQ(ierr);
20360c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_D,&array);CHKERRQ(ierr);
20370c7d97c5SJed Brown       }
20380c7d97c5SJed Brown       /* subdomain contribution to coarse matrix */
20393b03a366Sstefano_zampini       if(n_vertices) {
20400c7d97c5SJed Brown         ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
2041da1bb401SStefano Zampini         for(j=0;j<n_vertices;j++) {coarse_submat_vals[index*pcbddc->local_primal_size+j]=array[j];} /* WARNING -> column major ordering */
20420c7d97c5SJed Brown         ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
20430c7d97c5SJed Brown       }
20440c7d97c5SJed Brown       ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
2045da1bb401SStefano Zampini       for(j=0;j<n_constraints;j++) {coarse_submat_vals[index*pcbddc->local_primal_size+j+n_vertices]=array[j];} /* WARNING -> column major ordering */
20460c7d97c5SJed Brown       ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
20470c7d97c5SJed Brown 
2048e269702eSStefano Zampini       if( dbg_flag ) {
20490c7d97c5SJed Brown         /* assemble subdomain vector on nodes */
205053cdbc3dSStefano Zampini         ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr);
20510c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
20520c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
20530c7d97c5SJed Brown         for(j=0;j<n_R;j++){ array[ idx_R_local[j] ] = array2[j]; }
20540c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
20550c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
20560c7d97c5SJed Brown         /* assemble subdomain vector of lagrange multipliers */
205753cdbc3dSStefano Zampini         ierr = VecSet(pcbddc->vec1_P,zero);CHKERRQ(ierr);
20580c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
20593b03a366Sstefano_zampini         if( n_vertices) {
20600c7d97c5SJed Brown           ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
20613b03a366Sstefano_zampini           for(j=0;j<n_vertices;j++) {array2[j]=-array[j];}
20620c7d97c5SJed Brown           ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
20630c7d97c5SJed Brown         }
20640c7d97c5SJed Brown         ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
20653b03a366Sstefano_zampini         for(j=0;j<n_constraints;j++) {array2[j+n_vertices]=-array[j];}
20660c7d97c5SJed Brown         ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
20670c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
2068*534831adSStefano Zampini         /* check saddle point solution */
2069*534831adSStefano Zampini         ierr = MatMult(pcbddc->local_mat,pcis->vec1_N,pcis->vec2_N);CHKERRQ(ierr);
20703b03a366Sstefano_zampini         ierr = MatMultTransposeAdd(pcbddc->ConstraintMatrix,pcbddc->vec1_P,pcis->vec2_N,pcis->vec2_N);CHKERRQ(ierr);
207153cdbc3dSStefano Zampini         ierr = VecNorm(pcis->vec2_N,NORM_INFINITY,&coarsefunctions_errors[index]);CHKERRQ(ierr);
20723b03a366Sstefano_zampini         ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr);
20730c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
207453cdbc3dSStefano Zampini         array[index]=array[index]+m_one; /* shift by the identity matrix */
20750c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
207653cdbc3dSStefano Zampini         ierr = VecNorm(pcbddc->vec1_P,NORM_INFINITY,&constraints_errors[index]);CHKERRQ(ierr);
20770c7d97c5SJed Brown       }
20780c7d97c5SJed Brown     }
20790c7d97c5SJed Brown     ierr = MatAssemblyBegin(pcbddc->coarse_phi_B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
20800c7d97c5SJed Brown     ierr = MatAssemblyEnd  (pcbddc->coarse_phi_B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2081e269702eSStefano Zampini     if( pcbddc->prec_type || dbg_flag ) {
20820c7d97c5SJed Brown       ierr = MatAssemblyBegin(pcbddc->coarse_phi_D,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
20830c7d97c5SJed Brown       ierr = MatAssemblyEnd  (pcbddc->coarse_phi_D,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
20840c7d97c5SJed Brown     }
20850c7d97c5SJed Brown     /* Checking coarse_sub_mat and coarse basis functions */
20860c7d97c5SJed Brown     /* It should be \Phi^{(j)^T} A^{(j)} \Phi^{(j)}=coarse_sub_mat */
20879d2fce94SStefano Zampini     if(dbg_flag) {
20880c7d97c5SJed Brown 
20890c7d97c5SJed Brown       Mat coarse_sub_mat;
20900c7d97c5SJed Brown       Mat TM1,TM2,TM3,TM4;
20910c7d97c5SJed Brown       Mat coarse_phi_D,coarse_phi_B,A_II,A_BB,A_IB,A_BI;
2092a0ba757dSStefano Zampini       const MatType checkmattype=MATSEQAIJ;
20930c7d97c5SJed Brown       PetscScalar      value;
20940c7d97c5SJed Brown 
2095c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_II,checkmattype,MAT_INITIAL_MATRIX,&A_II);CHKERRQ(ierr);
2096c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_IB,checkmattype,MAT_INITIAL_MATRIX,&A_IB);CHKERRQ(ierr);
2097c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_BI,checkmattype,MAT_INITIAL_MATRIX,&A_BI);CHKERRQ(ierr);
2098c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_BB,checkmattype,MAT_INITIAL_MATRIX,&A_BB);CHKERRQ(ierr);
2099c042a7c3SStefano Zampini       ierr = MatConvert(pcbddc->coarse_phi_D,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_D);CHKERRQ(ierr);
2100c042a7c3SStefano Zampini       ierr = MatConvert(pcbddc->coarse_phi_B,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_B);CHKERRQ(ierr);
2101c042a7c3SStefano Zampini       ierr = MatCreateSeqDense(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_size,coarse_submat_vals,&coarse_sub_mat);CHKERRQ(ierr);
2102c042a7c3SStefano Zampini       ierr = MatConvert(coarse_sub_mat,checkmattype,MAT_REUSE_MATRIX,&coarse_sub_mat);CHKERRQ(ierr);
21030c7d97c5SJed Brown 
2104da1bb401SStefano Zampini       /*PetscViewer view_out;
2105da1bb401SStefano Zampini       PetscMPIInt myrank;
2106da1bb401SStefano Zampini       char filename[256];
2107da1bb401SStefano Zampini       MPI_Comm_rank(((PetscObject)pc)->comm,&myrank);
2108da1bb401SStefano Zampini       sprintf(filename,"coarsesubmat_%04d.m",myrank);
2109da1bb401SStefano Zampini       ierr = PetscViewerASCIIOpen(PETSC_COMM_SELF,filename,&view_out);CHKERRQ(ierr);
2110da1bb401SStefano Zampini       ierr = PetscViewerSetFormat(view_out,PETSC_VIEWER_ASCII_MATLAB);CHKERRQ(ierr);
2111da1bb401SStefano Zampini       ierr = MatView(coarse_sub_mat,view_out);CHKERRQ(ierr);
2112da1bb401SStefano Zampini       ierr = PetscViewerDestroy(&view_out);CHKERRQ(ierr);*/
2113da1bb401SStefano Zampini 
21140c7d97c5SJed Brown       ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
21150c7d97c5SJed Brown       ierr = PetscViewerASCIIPrintf(viewer,"Check coarse sub mat and local basis functions\n");CHKERRQ(ierr);
21160c7d97c5SJed Brown       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
211753cdbc3dSStefano Zampini       ierr = MatPtAP(A_II,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&TM1);CHKERRQ(ierr);
211853cdbc3dSStefano Zampini       ierr = MatPtAP(A_BB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&TM2);CHKERRQ(ierr);
211953cdbc3dSStefano Zampini       ierr = MatMatMult(A_IB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr);
2120c042a7c3SStefano Zampini       ierr = MatTransposeMatMult(coarse_phi_D,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM3);CHKERRQ(ierr);
212153cdbc3dSStefano Zampini       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
212253cdbc3dSStefano Zampini       ierr = MatMatMult(A_BI,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr);
2123c042a7c3SStefano Zampini       ierr = MatTransposeMatMult(coarse_phi_B,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM4);CHKERRQ(ierr);
212453cdbc3dSStefano Zampini       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
212553cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,one,TM2,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
212653cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,one,TM3,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
212753cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,one,TM4,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
212853cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,m_one,coarse_sub_mat,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
212953cdbc3dSStefano Zampini       ierr = MatNorm(TM1,NORM_INFINITY,&value);CHKERRQ(ierr);
21300c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"----------------------------------\n");CHKERRQ(ierr);
21310c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d \n",PetscGlobalRank);CHKERRQ(ierr);
21320c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"matrix error = % 1.14e\n",value);CHKERRQ(ierr);
21330c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"coarse functions errors\n");CHKERRQ(ierr);
213453cdbc3dSStefano Zampini       for(i=0;i<pcbddc->local_primal_size;i++) { ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local %02d-th function error = % 1.14e\n",i,coarsefunctions_errors[i]);CHKERRQ(ierr); }
21350c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"constraints errors\n");CHKERRQ(ierr);
213653cdbc3dSStefano Zampini       for(i=0;i<pcbddc->local_primal_size;i++) { ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local %02d-th function error = % 1.14e\n",i,constraints_errors[i]);CHKERRQ(ierr); }
21370c7d97c5SJed Brown       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
213853cdbc3dSStefano Zampini       ierr = MatDestroy(&A_II);CHKERRQ(ierr);
213953cdbc3dSStefano Zampini       ierr = MatDestroy(&A_BB);CHKERRQ(ierr);
214053cdbc3dSStefano Zampini       ierr = MatDestroy(&A_IB);CHKERRQ(ierr);
214153cdbc3dSStefano Zampini       ierr = MatDestroy(&A_BI);CHKERRQ(ierr);
214253cdbc3dSStefano Zampini       ierr = MatDestroy(&TM1);CHKERRQ(ierr);
214353cdbc3dSStefano Zampini       ierr = MatDestroy(&TM2);CHKERRQ(ierr);
214453cdbc3dSStefano Zampini       ierr = MatDestroy(&TM3);CHKERRQ(ierr);
214553cdbc3dSStefano Zampini       ierr = MatDestroy(&TM4);CHKERRQ(ierr);
214653cdbc3dSStefano Zampini       ierr = MatDestroy(&coarse_phi_D);CHKERRQ(ierr);
214753cdbc3dSStefano Zampini       ierr = MatDestroy(&coarse_sub_mat);CHKERRQ(ierr);
214853cdbc3dSStefano Zampini       ierr = MatDestroy(&coarse_phi_B);CHKERRQ(ierr);
21490c7d97c5SJed Brown       ierr = PetscFree(coarsefunctions_errors);CHKERRQ(ierr);
21500c7d97c5SJed Brown       ierr = PetscFree(constraints_errors);CHKERRQ(ierr);
21510c7d97c5SJed Brown     }
21520c7d97c5SJed Brown 
21530c7d97c5SJed Brown     /* create coarse matrix and data structures for message passing associated with the actual choice of coarse problem type */
21540c7d97c5SJed Brown     ierr = PCBDDCSetupCoarseEnvironment(pc,coarse_submat_vals);CHKERRQ(ierr);
21550c7d97c5SJed Brown     /* free memory */
21560c7d97c5SJed Brown     ierr = PetscFree(coarse_submat_vals);CHKERRQ(ierr);
21570c7d97c5SJed Brown     ierr = PetscFree(auxindices);CHKERRQ(ierr);
21580c7d97c5SJed Brown     ierr = PetscFree(nnz);CHKERRQ(ierr);
21593b03a366Sstefano_zampini     if(n_vertices) {
21600c7d97c5SJed Brown       ierr = VecDestroy(&vec1_V);CHKERRQ(ierr);
21610c7d97c5SJed Brown       ierr = VecDestroy(&vec2_V);CHKERRQ(ierr);
21620c7d97c5SJed Brown       ierr = MatDestroy(&M2);CHKERRQ(ierr);
21630c7d97c5SJed Brown       ierr = MatDestroy(&A_RV);CHKERRQ(ierr);
21640c7d97c5SJed Brown       ierr = MatDestroy(&A_VR);CHKERRQ(ierr);
21650c7d97c5SJed Brown       ierr = MatDestroy(&A_VV);CHKERRQ(ierr);
21660c7d97c5SJed Brown     }
2167*534831adSStefano Zampini     if(n_constraints) {
21680c7d97c5SJed Brown       ierr = VecDestroy(&vec1_C);CHKERRQ(ierr);
21690c7d97c5SJed Brown       ierr = VecDestroy(&vec2_C);CHKERRQ(ierr);
21700c7d97c5SJed Brown       ierr = MatDestroy(&M1);CHKERRQ(ierr);
21710c7d97c5SJed Brown       ierr = MatDestroy(&C_CR);CHKERRQ(ierr);
21720c7d97c5SJed Brown     }
21730c7d97c5SJed Brown   }
21740c7d97c5SJed Brown   /* free memory */
21753b03a366Sstefano_zampini   if(n_vertices) {
21760c7d97c5SJed Brown     ierr = PetscFree(idx_V_B);CHKERRQ(ierr);
21770c7d97c5SJed Brown     ierr = ISDestroy(&is_V_local);CHKERRQ(ierr);
21780c7d97c5SJed Brown   }
21790c7d97c5SJed Brown   ierr = ISDestroy(&is_R_local);CHKERRQ(ierr);
21800c7d97c5SJed Brown 
21810c7d97c5SJed Brown   PetscFunctionReturn(0);
21820c7d97c5SJed Brown }
21830c7d97c5SJed Brown 
21840c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
21850c7d97c5SJed Brown 
21860c7d97c5SJed Brown #undef __FUNCT__
21870c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetupCoarseEnvironment"
218853cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetupCoarseEnvironment(PC pc,PetscScalar* coarse_submat_vals)
21890c7d97c5SJed Brown {
21900c7d97c5SJed Brown 
21910c7d97c5SJed Brown 
21920c7d97c5SJed Brown   Mat_IS    *matis    = (Mat_IS*)pc->pmat->data;
21930c7d97c5SJed Brown   PC_BDDC   *pcbddc   = (PC_BDDC*)pc->data;
21940c7d97c5SJed Brown   PC_IS     *pcis     = (PC_IS*)pc->data;
21950c7d97c5SJed Brown   MPI_Comm  prec_comm = ((PetscObject)pc)->comm;
21960c7d97c5SJed Brown   MPI_Comm  coarse_comm;
21970c7d97c5SJed Brown 
21980c7d97c5SJed Brown   /* common to all choices */
21990c7d97c5SJed Brown   PetscScalar *temp_coarse_mat_vals;
22000c7d97c5SJed Brown   PetscScalar *ins_coarse_mat_vals;
22010c7d97c5SJed Brown   PetscInt    *ins_local_primal_indices;
22020c7d97c5SJed Brown   PetscMPIInt *localsizes2,*localdispl2;
22030c7d97c5SJed Brown   PetscMPIInt size_prec_comm;
22040c7d97c5SJed Brown   PetscMPIInt rank_prec_comm;
22050c7d97c5SJed Brown   PetscMPIInt active_rank=MPI_PROC_NULL;
22060c7d97c5SJed Brown   PetscMPIInt master_proc=0;
22070c7d97c5SJed Brown   PetscInt    ins_local_primal_size;
22080c7d97c5SJed Brown   /* specific to MULTILEVEL_BDDC */
22090c7d97c5SJed Brown   PetscMPIInt *ranks_recv;
22100c7d97c5SJed Brown   PetscMPIInt count_recv=0;
22110c7d97c5SJed Brown   PetscMPIInt rank_coarse_proc_send_to;
22120c7d97c5SJed Brown   PetscMPIInt coarse_color = MPI_UNDEFINED;
22130c7d97c5SJed Brown   ISLocalToGlobalMapping coarse_ISLG;
22140c7d97c5SJed Brown   /* some other variables */
22150c7d97c5SJed Brown   PetscErrorCode ierr;
22160c7d97c5SJed Brown   const MatType coarse_mat_type;
22170c7d97c5SJed Brown   const PCType  coarse_pc_type;
221853cdbc3dSStefano Zampini   const KSPType  coarse_ksp_type;
221953cdbc3dSStefano Zampini   PC pc_temp;
22200c7d97c5SJed Brown   PetscInt i,j,k,bs;
22213b03a366Sstefano_zampini   PetscInt max_it_coarse_ksp=1;  /* don't increase this value */
2222e269702eSStefano Zampini   /* verbose output viewer */
2223e269702eSStefano Zampini   PetscViewer viewer=pcbddc->dbg_viewer;
2224e269702eSStefano Zampini   PetscBool   dbg_flag=pcbddc->dbg_flag;
22250c7d97c5SJed Brown 
22260c7d97c5SJed Brown   PetscFunctionBegin;
22270c7d97c5SJed Brown 
22280c7d97c5SJed Brown   ins_local_primal_indices = 0;
22290c7d97c5SJed Brown   ins_coarse_mat_vals      = 0;
22300c7d97c5SJed Brown   localsizes2              = 0;
22310c7d97c5SJed Brown   localdispl2              = 0;
22320c7d97c5SJed Brown   temp_coarse_mat_vals     = 0;
22330c7d97c5SJed Brown   coarse_ISLG              = 0;
22340c7d97c5SJed Brown 
223553cdbc3dSStefano Zampini   ierr = MPI_Comm_size(prec_comm,&size_prec_comm);CHKERRQ(ierr);
223653cdbc3dSStefano Zampini   ierr = MPI_Comm_rank(prec_comm,&rank_prec_comm);CHKERRQ(ierr);
22370c7d97c5SJed Brown   ierr = MatGetBlockSize(matis->A,&bs);CHKERRQ(ierr);
22380c7d97c5SJed Brown 
2239beed3852SStefano Zampini   /* Assign global numbering to coarse dofs */
2240beed3852SStefano Zampini   {
2241a0ba757dSStefano Zampini     PetscScalar    one=1.,zero=0.;
2242beed3852SStefano Zampini     PetscScalar    *array;
2243beed3852SStefano Zampini     PetscMPIInt    *auxlocal_primal;
2244beed3852SStefano Zampini     PetscMPIInt    *auxglobal_primal;
2245beed3852SStefano Zampini     PetscMPIInt    *all_auxglobal_primal;
2246beed3852SStefano Zampini     PetscMPIInt    *all_auxglobal_primal_dummy;
2247beed3852SStefano Zampini     PetscMPIInt    mpi_local_primal_size = (PetscMPIInt)pcbddc->local_primal_size;
2248da1bb401SStefano Zampini     PetscInt       *row_cmat_indices;
22493b03a366Sstefano_zampini     PetscInt       size_of_constraint;
2250da1bb401SStefano Zampini     PetscScalar    coarsesum;
2251beed3852SStefano Zampini 
2252beed3852SStefano Zampini     /* Construct needed data structures for message passing */
2253beed3852SStefano Zampini     ierr = PetscMalloc(mpi_local_primal_size*sizeof(PetscMPIInt),&pcbddc->local_primal_indices);CHKERRQ(ierr);
2254beed3852SStefano Zampini     ierr = PetscMalloc(size_prec_comm*sizeof(PetscMPIInt),&pcbddc->local_primal_sizes);CHKERRQ(ierr);
2255beed3852SStefano Zampini     ierr = PetscMalloc(size_prec_comm*sizeof(PetscMPIInt),&pcbddc->local_primal_displacements);CHKERRQ(ierr);
2256beed3852SStefano Zampini     /* Gather local_primal_size information for all processes  */
22575619798eSStefano Zampini     ierr = MPI_Allgather(&mpi_local_primal_size,1,MPIU_INT,&pcbddc->local_primal_sizes[0],1,MPIU_INT,prec_comm);CHKERRQ(ierr);
2258beed3852SStefano Zampini     pcbddc->replicated_primal_size = 0;
2259beed3852SStefano Zampini     for (i=0; i<size_prec_comm; i++) {
2260beed3852SStefano Zampini       pcbddc->local_primal_displacements[i] = pcbddc->replicated_primal_size ;
2261beed3852SStefano Zampini       pcbddc->replicated_primal_size += pcbddc->local_primal_sizes[i];
2262beed3852SStefano Zampini     }
22635619798eSStefano Zampini     if(rank_prec_comm == 0) {
2264beed3852SStefano Zampini       /* allocate some auxiliary space */
2265beed3852SStefano Zampini       ierr = PetscMalloc(pcbddc->replicated_primal_size*sizeof(*all_auxglobal_primal),&all_auxglobal_primal);CHKERRQ(ierr);
2266beed3852SStefano Zampini       ierr = PetscMalloc(pcbddc->replicated_primal_size*sizeof(*all_auxglobal_primal_dummy),&all_auxglobal_primal_dummy);CHKERRQ(ierr);
2267beed3852SStefano Zampini     }
2268beed3852SStefano Zampini     ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscMPIInt),&auxlocal_primal);CHKERRQ(ierr);
2269beed3852SStefano Zampini     ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscMPIInt),&auxglobal_primal);CHKERRQ(ierr);
2270beed3852SStefano Zampini 
2271da1bb401SStefano Zampini     /* First let's count coarse dofs.
2272beed3852SStefano Zampini        This code fragment assumes that the number of local constraints per connected component
2273beed3852SStefano Zampini        is not greater than the number of nodes defined for the connected component
2274beed3852SStefano Zampini        (otherwise we will surely have linear dependence between constraints and thus a singular coarse problem) */
22753b03a366Sstefano_zampini     /* auxlocal_primal      : primal indices in local nodes numbering (internal and interface) with complete queue sorted by global ordering */
2276beed3852SStefano Zampini     ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr);
2277beed3852SStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2278da1bb401SStefano Zampini     for(i=0;i<pcbddc->local_primal_size;i++) {
2279da1bb401SStefano Zampini       ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
22803b03a366Sstefano_zampini       for (j=0; j<size_of_constraint; j++) {
22813b03a366Sstefano_zampini         k = row_cmat_indices[j];
2282beed3852SStefano Zampini         if( array[k] == zero ) {
2283beed3852SStefano Zampini           array[k] = one;
2284da1bb401SStefano Zampini           auxlocal_primal[i] = k;
2285beed3852SStefano Zampini           break;
2286beed3852SStefano Zampini         }
2287beed3852SStefano Zampini       }
2288da1bb401SStefano Zampini       ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
2289beed3852SStefano Zampini     }
2290beed3852SStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2291da1bb401SStefano Zampini     ierr = VecSet(pcis->vec1_global,zero);CHKERRQ(ierr);
2292da1bb401SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
2293da1bb401SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
2294da1bb401SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
2295da1bb401SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
2296da1bb401SStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2297da1bb401SStefano Zampini     for(i=0;i<pcis->n;i++) { if( array[i] > zero) array[i] = one/array[i]; }
2298da1bb401SStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2299da1bb401SStefano Zampini     ierr = VecSet(pcis->vec1_global,zero);CHKERRQ(ierr);
2300da1bb401SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
2301da1bb401SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
2302da1bb401SStefano Zampini     ierr = VecSum(pcis->vec1_global,&coarsesum);CHKERRQ(ierr);
2303da1bb401SStefano Zampini     pcbddc->coarse_size = (PetscInt) coarsesum;
2304a0ba757dSStefano Zampini 
2305beed3852SStefano Zampini     /* Now assign them a global numbering */
2306beed3852SStefano Zampini     /* auxglobal_primal contains indices in global nodes numbering (internal and interface) */
2307beed3852SStefano Zampini     ierr = ISLocalToGlobalMappingApply(matis->mapping,pcbddc->local_primal_size,auxlocal_primal,auxglobal_primal);CHKERRQ(ierr);
2308beed3852SStefano Zampini     /* all_auxglobal_primal contains all primal nodes indices in global nodes numbering (internal and interface) */
2309beed3852SStefano Zampini     ierr = MPI_Gatherv(&auxglobal_primal[0],pcbddc->local_primal_size,MPIU_INT,&all_auxglobal_primal[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,0,prec_comm);CHKERRQ(ierr);
2310beed3852SStefano Zampini 
2311beed3852SStefano Zampini     /* After this block all_auxglobal_primal should contain one copy of each primal node's indices in global nodes numbering */
2312beed3852SStefano Zampini     /* It implements a function similar to PetscSortRemoveDupsInt */
2313beed3852SStefano Zampini     if(rank_prec_comm==0) {
2314beed3852SStefano Zampini       /* dummy argument since PetscSortMPIInt doesn't exist! */
2315beed3852SStefano Zampini       ierr = PetscSortMPIIntWithArray(pcbddc->replicated_primal_size,all_auxglobal_primal,all_auxglobal_primal_dummy);CHKERRQ(ierr);
2316beed3852SStefano Zampini       k=1;
2317beed3852SStefano Zampini       j=all_auxglobal_primal[0];  /* first dof in global numbering */
2318beed3852SStefano Zampini       for(i=1;i< pcbddc->replicated_primal_size ;i++) {
2319beed3852SStefano Zampini         if(j != all_auxglobal_primal[i] ) {
2320beed3852SStefano Zampini           all_auxglobal_primal[k]=all_auxglobal_primal[i];
2321beed3852SStefano Zampini           k++;
2322beed3852SStefano Zampini           j=all_auxglobal_primal[i];
2323beed3852SStefano Zampini         }
2324beed3852SStefano Zampini       }
2325beed3852SStefano Zampini     } else {
2326beed3852SStefano Zampini       ierr = PetscMalloc(pcbddc->coarse_size*sizeof(PetscMPIInt),&all_auxglobal_primal);CHKERRQ(ierr);
2327beed3852SStefano Zampini     }
23285619798eSStefano Zampini     /* We only need to broadcast the indices from 0 to pcbddc->coarse_size. Remaining elements of array all_auxglobal_primal are garbage. */
2329beed3852SStefano Zampini     ierr = MPI_Bcast(all_auxglobal_primal,pcbddc->coarse_size,MPIU_INT,0,prec_comm);CHKERRQ(ierr);
2330beed3852SStefano Zampini 
2331beed3852SStefano Zampini     /* Now get global coarse numbering of local primal nodes */
2332beed3852SStefano Zampini     for(i=0;i<pcbddc->local_primal_size;i++) {
2333beed3852SStefano Zampini       k=0;
2334beed3852SStefano Zampini       while( all_auxglobal_primal[k] != auxglobal_primal[i] ) { k++;}
2335beed3852SStefano Zampini       pcbddc->local_primal_indices[i]=k;
2336beed3852SStefano Zampini     }
2337e269702eSStefano Zampini     if(dbg_flag) {
2338e269702eSStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
2339da1bb401SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Size of coarse problem %d\n",pcbddc->coarse_size);CHKERRQ(ierr);
2340e269702eSStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
2341e269702eSStefano Zampini     }
2342beed3852SStefano Zampini     /* free allocated memory */
2343beed3852SStefano Zampini     ierr = PetscFree(auxlocal_primal);CHKERRQ(ierr);
2344beed3852SStefano Zampini     ierr = PetscFree(auxglobal_primal);CHKERRQ(ierr);
2345beed3852SStefano Zampini     ierr = PetscFree(all_auxglobal_primal);CHKERRQ(ierr);
2346e269702eSStefano Zampini     if(rank_prec_comm == 0) {
2347beed3852SStefano Zampini       ierr = PetscFree(all_auxglobal_primal_dummy);CHKERRQ(ierr);
2348beed3852SStefano Zampini     }
2349e269702eSStefano Zampini   }
2350beed3852SStefano Zampini 
23510c7d97c5SJed Brown   /* adapt coarse problem type */
23520c7d97c5SJed Brown   if(pcbddc->coarse_problem_type == MULTILEVEL_BDDC && pcbddc->active_procs < MIN_PROCS_FOR_BDDC )
23530c7d97c5SJed Brown     pcbddc->coarse_problem_type = PARALLEL_BDDC;
23540c7d97c5SJed Brown 
23550c7d97c5SJed Brown   switch(pcbddc->coarse_problem_type){
23560c7d97c5SJed Brown 
2357da1bb401SStefano Zampini     case(MULTILEVEL_BDDC):   /* we define a coarse mesh where subdomains are elements */
23580c7d97c5SJed Brown     {
23590c7d97c5SJed Brown       /* we need additional variables */
23600c7d97c5SJed Brown       MetisInt   n_subdomains,n_parts,objval,ncon,faces_nvtxs;
23610c7d97c5SJed Brown       MetisInt   *metis_coarse_subdivision;
23620c7d97c5SJed Brown       MetisInt   options[METIS_NOPTIONS];
23630c7d97c5SJed Brown       PetscMPIInt size_coarse_comm,rank_coarse_comm;
23640c7d97c5SJed Brown       PetscMPIInt procs_jumps_coarse_comm;
23650c7d97c5SJed Brown       PetscMPIInt *coarse_subdivision;
23660c7d97c5SJed Brown       PetscMPIInt *total_count_recv;
23670c7d97c5SJed Brown       PetscMPIInt *total_ranks_recv;
23680c7d97c5SJed Brown       PetscMPIInt *displacements_recv;
23690c7d97c5SJed Brown       PetscMPIInt *my_faces_connectivity;
23700c7d97c5SJed Brown       PetscMPIInt *petsc_faces_adjncy;
23710c7d97c5SJed Brown       MetisInt    *faces_adjncy;
23720c7d97c5SJed Brown       MetisInt    *faces_xadj;
23730c7d97c5SJed Brown       PetscMPIInt *number_of_faces;
23740c7d97c5SJed Brown       PetscMPIInt *faces_displacements;
23750c7d97c5SJed Brown       PetscInt    *array_int;
23760c7d97c5SJed Brown       PetscMPIInt my_faces=0;
23770c7d97c5SJed Brown       PetscMPIInt total_faces=0;
23783828260eSStefano Zampini       PetscInt    ranks_stretching_ratio;
23790c7d97c5SJed Brown 
23800c7d97c5SJed Brown       /* define some quantities */
23810c7d97c5SJed Brown       pcbddc->coarse_communications_type = SCATTERS_BDDC;
23820c7d97c5SJed Brown       coarse_mat_type = MATIS;
23830c7d97c5SJed Brown       coarse_pc_type  = PCBDDC;
23846c9de887SHong Zhang       coarse_ksp_type  = KSPCHEBYSHEV;
23850c7d97c5SJed Brown 
23860c7d97c5SJed Brown       /* details of coarse decomposition */
23870c7d97c5SJed Brown       n_subdomains = pcbddc->active_procs;
23880c7d97c5SJed Brown       n_parts      = n_subdomains/pcbddc->coarsening_ratio;
23893828260eSStefano Zampini       ranks_stretching_ratio = size_prec_comm/pcbddc->active_procs;
23903828260eSStefano Zampini       procs_jumps_coarse_comm = pcbddc->coarsening_ratio*ranks_stretching_ratio;
23913828260eSStefano Zampini 
2392da1bb401SStefano Zampini       /*printf("Coarse algorithm details: \n");
2393da1bb401SStefano Zampini       printf("n_subdomains %d, n_parts %d\nstretch %d,jumps %d,coarse_ratio %d\nlevel should be log_%d(%d)\n",n_subdomains,n_parts,ranks_stretching_ratio,procs_jumps_coarse_comm,pcbddc->coarsening_ratio,pcbddc->coarsening_ratio,(ranks_stretching_ratio/pcbddc->coarsening_ratio+1));*/
23940c7d97c5SJed Brown 
23950c7d97c5SJed Brown       /* build CSR graph of subdomains' connectivity through faces */
23960c7d97c5SJed Brown       ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&array_int);CHKERRQ(ierr);
23973828260eSStefano Zampini       ierr = PetscMemzero(array_int,pcis->n*sizeof(PetscInt));CHKERRQ(ierr);
23980c7d97c5SJed Brown       for(i=1;i<pcis->n_neigh;i++){/* i=1 so I don't count myself -> faces nodes counts to 1 */
23990c7d97c5SJed Brown         for(j=0;j<pcis->n_shared[i];j++){
24000c7d97c5SJed Brown           array_int[ pcis->shared[i][j] ]+=1;
24010c7d97c5SJed Brown         }
24020c7d97c5SJed Brown       }
24030c7d97c5SJed Brown       for(i=1;i<pcis->n_neigh;i++){
24040c7d97c5SJed Brown         for(j=0;j<pcis->n_shared[i];j++){
24050c7d97c5SJed Brown           if(array_int[ pcis->shared[i][j] ] == 1 ){
24060c7d97c5SJed Brown             my_faces++;
24070c7d97c5SJed Brown             break;
24080c7d97c5SJed Brown           }
24090c7d97c5SJed Brown         }
24100c7d97c5SJed Brown       }
24110c7d97c5SJed Brown 
241253cdbc3dSStefano Zampini       ierr = MPI_Reduce(&my_faces,&total_faces,1,MPIU_INT,MPI_SUM,master_proc,prec_comm);CHKERRQ(ierr);
24130c7d97c5SJed Brown       ierr = PetscMalloc (my_faces*sizeof(PetscInt),&my_faces_connectivity);CHKERRQ(ierr);
24140c7d97c5SJed Brown       my_faces=0;
24150c7d97c5SJed Brown       for(i=1;i<pcis->n_neigh;i++){
24160c7d97c5SJed Brown         for(j=0;j<pcis->n_shared[i];j++){
24170c7d97c5SJed Brown           if(array_int[ pcis->shared[i][j] ] == 1 ){
24180c7d97c5SJed Brown             my_faces_connectivity[my_faces]=pcis->neigh[i];
24190c7d97c5SJed Brown             my_faces++;
24200c7d97c5SJed Brown             break;
24210c7d97c5SJed Brown           }
24220c7d97c5SJed Brown         }
24230c7d97c5SJed Brown       }
24240c7d97c5SJed Brown       if(rank_prec_comm == master_proc) {
24250c7d97c5SJed Brown         ierr = PetscMalloc (total_faces*sizeof(PetscMPIInt),&petsc_faces_adjncy);CHKERRQ(ierr);
24260c7d97c5SJed Brown         ierr = PetscMalloc (size_prec_comm*sizeof(PetscMPIInt),&number_of_faces);CHKERRQ(ierr);
24270c7d97c5SJed Brown         ierr = PetscMalloc (total_faces*sizeof(MetisInt),&faces_adjncy);CHKERRQ(ierr);
24280c7d97c5SJed Brown         ierr = PetscMalloc ((n_subdomains+1)*sizeof(MetisInt),&faces_xadj);CHKERRQ(ierr);
24290c7d97c5SJed Brown         ierr = PetscMalloc ((size_prec_comm+1)*sizeof(PetscMPIInt),&faces_displacements);CHKERRQ(ierr);
24300c7d97c5SJed Brown       }
243153cdbc3dSStefano Zampini       ierr = MPI_Gather(&my_faces,1,MPIU_INT,&number_of_faces[0],1,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
24320c7d97c5SJed Brown       if(rank_prec_comm == master_proc) {
24330c7d97c5SJed Brown         faces_xadj[0]=0;
24340c7d97c5SJed Brown         faces_displacements[0]=0;
24350c7d97c5SJed Brown         j=0;
24360c7d97c5SJed Brown         for(i=1;i<size_prec_comm+1;i++) {
24370c7d97c5SJed Brown           faces_displacements[i]=faces_displacements[i-1]+number_of_faces[i-1];
24380c7d97c5SJed Brown           if(number_of_faces[i-1]) {
24390c7d97c5SJed Brown             j++;
24400c7d97c5SJed Brown             faces_xadj[j]=faces_xadj[j-1]+number_of_faces[i-1];
24410c7d97c5SJed Brown           }
24420c7d97c5SJed Brown         }
2443da1bb401SStefano Zampini         /*printf("The J I count is %d and should be %d\n",j,n_subdomains);
2444da1bb401SStefano Zampini         printf("Total faces seem %d and should be %d\n",faces_xadj[j],total_faces);*/
24450c7d97c5SJed Brown       }
244653cdbc3dSStefano Zampini       ierr = MPI_Gatherv(&my_faces_connectivity[0],my_faces,MPIU_INT,&petsc_faces_adjncy[0],number_of_faces,faces_displacements,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
24470c7d97c5SJed Brown       ierr = PetscFree(my_faces_connectivity);CHKERRQ(ierr);
24480c7d97c5SJed Brown       ierr = PetscFree(array_int);CHKERRQ(ierr);
24490c7d97c5SJed Brown       if(rank_prec_comm == master_proc) {
24503828260eSStefano Zampini         for(i=0;i<total_faces;i++) faces_adjncy[i]=(MetisInt)(petsc_faces_adjncy[i]/ranks_stretching_ratio); /* cast to MetisInt */
2451da1bb401SStefano Zampini         /*printf("This is the face connectivity (actual ranks)\n");
24520c7d97c5SJed Brown         for(i=0;i<n_subdomains;i++){
24530c7d97c5SJed Brown           printf("proc %d is connected with \n",i);
24540c7d97c5SJed Brown           for(j=faces_xadj[i];j<faces_xadj[i+1];j++)
24550c7d97c5SJed Brown             printf("%d ",faces_adjncy[j]);
24560c7d97c5SJed Brown           printf("\n");
2457da1bb401SStefano Zampini         }*/
24580c7d97c5SJed Brown         ierr = PetscFree(faces_displacements);CHKERRQ(ierr);
24590c7d97c5SJed Brown         ierr = PetscFree(number_of_faces);CHKERRQ(ierr);
24600c7d97c5SJed Brown         ierr = PetscFree(petsc_faces_adjncy);CHKERRQ(ierr);
24610c7d97c5SJed Brown       }
24620c7d97c5SJed Brown 
24630c7d97c5SJed Brown       if( rank_prec_comm == master_proc ) {
24640c7d97c5SJed Brown 
24653828260eSStefano Zampini         PetscInt heuristic_for_metis=3;
24663828260eSStefano Zampini 
24670c7d97c5SJed Brown         ncon=1;
24680c7d97c5SJed Brown         faces_nvtxs=n_subdomains;
24690c7d97c5SJed Brown         /* partition graph induced by face connectivity */
24700c7d97c5SJed Brown         ierr = PetscMalloc (n_subdomains*sizeof(MetisInt),&metis_coarse_subdivision);CHKERRQ(ierr);
24710c7d97c5SJed Brown         ierr = METIS_SetDefaultOptions(options);
24720c7d97c5SJed Brown         /* we need a contiguous partition of the coarse mesh */
24730c7d97c5SJed Brown         options[METIS_OPTION_CONTIG]=1;
24740c7d97c5SJed Brown         options[METIS_OPTION_DBGLVL]=1;
24750c7d97c5SJed Brown         options[METIS_OPTION_NITER]=30;
24763828260eSStefano Zampini         if(n_subdomains>n_parts*heuristic_for_metis) {
24773828260eSStefano Zampini           options[METIS_OPTION_IPTYPE]=METIS_IPTYPE_EDGE;
24783828260eSStefano Zampini           options[METIS_OPTION_OBJTYPE]=METIS_OBJTYPE_CUT;
24790c7d97c5SJed Brown           ierr = METIS_PartGraphKway(&faces_nvtxs,&ncon,faces_xadj,faces_adjncy,NULL,NULL,NULL,&n_parts,NULL,NULL,options,&objval,metis_coarse_subdivision);
24803828260eSStefano Zampini         } else {
24813828260eSStefano Zampini           ierr = METIS_PartGraphRecursive(&faces_nvtxs,&ncon,faces_xadj,faces_adjncy,NULL,NULL,NULL,&n_parts,NULL,NULL,options,&objval,metis_coarse_subdivision);
24823828260eSStefano Zampini         }
24830c7d97c5SJed Brown         if(ierr != METIS_OK) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in METIS_PartGraphKway (metis error code %D) called from PCBDDCSetupCoarseEnvironment\n",ierr);
24840c7d97c5SJed Brown         ierr = PetscFree(faces_xadj);CHKERRQ(ierr);
24850c7d97c5SJed Brown         ierr = PetscFree(faces_adjncy);CHKERRQ(ierr);
24860c7d97c5SJed Brown         coarse_subdivision = (PetscMPIInt*)calloc(size_prec_comm,sizeof(PetscMPIInt)); /* calloc for contiguous memory since we need to scatter these values later */
24870c7d97c5SJed Brown         /* copy/cast values avoiding possible type conflicts between PETSc, MPI and METIS */
24883828260eSStefano Zampini         for(i=0;i<size_prec_comm;i++) coarse_subdivision[i]=MPI_PROC_NULL;
24893828260eSStefano Zampini         for(i=0;i<n_subdomains;i++)   coarse_subdivision[ranks_stretching_ratio*i]=(PetscInt)(metis_coarse_subdivision[i]);
24900c7d97c5SJed Brown         ierr = PetscFree(metis_coarse_subdivision);CHKERRQ(ierr);
24910c7d97c5SJed Brown       }
24920c7d97c5SJed Brown 
24930c7d97c5SJed Brown       /* Create new communicator for coarse problem splitting the old one */
24940c7d97c5SJed Brown       if( !(rank_prec_comm%procs_jumps_coarse_comm) && rank_prec_comm < procs_jumps_coarse_comm*n_parts ){
2495da1bb401SStefano Zampini         coarse_color=0;              /* for communicator splitting */
2496da1bb401SStefano Zampini         active_rank=rank_prec_comm;  /* for insertion of matrix values */
24970c7d97c5SJed Brown       }
2498da1bb401SStefano Zampini       /* procs with coarse_color = MPI_UNDEFINED will have coarse_comm = MPI_COMM_NULL (from mpi standards)
2499da1bb401SStefano Zampini          key = rank_prec_comm -> keep same ordering of ranks from the old to the new communicator */
250053cdbc3dSStefano Zampini       ierr = MPI_Comm_split(prec_comm,coarse_color,rank_prec_comm,&coarse_comm);CHKERRQ(ierr);
25010c7d97c5SJed Brown 
25020c7d97c5SJed Brown       if( coarse_color == 0 ) {
250353cdbc3dSStefano Zampini         ierr = MPI_Comm_size(coarse_comm,&size_coarse_comm);CHKERRQ(ierr);
250453cdbc3dSStefano Zampini         ierr = MPI_Comm_rank(coarse_comm,&rank_coarse_comm);CHKERRQ(ierr);
2505da1bb401SStefano Zampini         /*printf("Details of coarse comm\n");
25063828260eSStefano Zampini         printf("size = %d, myrank = %d\n",size_coarse_comm,rank_coarse_comm);
2507da1bb401SStefano Zampini         printf("jumps = %d, coarse_color = %d, n_parts = %d\n",procs_jumps_coarse_comm,coarse_color,n_parts);*/
25080c7d97c5SJed Brown       } else {
25090c7d97c5SJed Brown         rank_coarse_comm = MPI_PROC_NULL;
25100c7d97c5SJed Brown       }
25110c7d97c5SJed Brown 
25120c7d97c5SJed Brown       /* master proc takes care of arranging and distributing coarse information */
25130c7d97c5SJed Brown       if(rank_coarse_comm == master_proc) {
25140c7d97c5SJed Brown         ierr = PetscMalloc (size_coarse_comm*sizeof(PetscMPIInt),&displacements_recv);CHKERRQ(ierr);
2515da1bb401SStefano Zampini         /*ierr = PetscMalloc (size_coarse_comm*sizeof(PetscMPIInt),&total_count_recv);CHKERRQ(ierr);
2516da1bb401SStefano Zampini           ierr = PetscMalloc (n_subdomains*sizeof(PetscMPIInt),&total_ranks_recv);CHKERRQ(ierr);*/
25170c7d97c5SJed Brown         total_count_recv = (PetscMPIInt*)calloc(size_prec_comm,sizeof(PetscMPIInt));
25180c7d97c5SJed Brown         total_ranks_recv = (PetscMPIInt*)calloc(n_subdomains,sizeof(PetscMPIInt));
25190c7d97c5SJed Brown         /* some initializations */
25200c7d97c5SJed Brown         displacements_recv[0]=0;
2521da1bb401SStefano Zampini         /* PetscMemzero(total_count_recv,size_coarse_comm*sizeof(PetscMPIInt)); not needed -> calloc initializes to zero */
25220c7d97c5SJed Brown         /* count from how many processes the j-th process of the coarse decomposition will receive data */
25230c7d97c5SJed Brown         for(j=0;j<size_coarse_comm;j++)
25243828260eSStefano Zampini           for(i=0;i<size_prec_comm;i++)
25250c7d97c5SJed Brown             if(coarse_subdivision[i]==j)
25260c7d97c5SJed Brown               total_count_recv[j]++;
25270c7d97c5SJed Brown         /* displacements needed for scatterv of total_ranks_recv */
25280c7d97c5SJed Brown         for(i=1;i<size_coarse_comm;i++) displacements_recv[i]=displacements_recv[i-1]+total_count_recv[i-1];
25290c7d97c5SJed Brown         /* Now fill properly total_ranks_recv -> each coarse process will receive the ranks (in prec_comm communicator) of its friend (sending) processes */
25300c7d97c5SJed Brown         ierr = PetscMemzero(total_count_recv,size_coarse_comm*sizeof(PetscMPIInt));CHKERRQ(ierr);
25310c7d97c5SJed Brown         for(j=0;j<size_coarse_comm;j++) {
25323828260eSStefano Zampini           for(i=0;i<size_prec_comm;i++) {
25330c7d97c5SJed Brown             if(coarse_subdivision[i]==j) {
25340c7d97c5SJed Brown               total_ranks_recv[displacements_recv[j]+total_count_recv[j]]=i;
25353828260eSStefano Zampini               total_count_recv[j]+=1;
25360c7d97c5SJed Brown             }
25370c7d97c5SJed Brown           }
25380c7d97c5SJed Brown         }
2539da1bb401SStefano Zampini         /*for(j=0;j<size_coarse_comm;j++) {
25403828260eSStefano Zampini           printf("process %d in new rank will receive from %d processes (original ranks follows)\n",j,total_count_recv[j]);
25413828260eSStefano Zampini           for(i=0;i<total_count_recv[j];i++) {
25423828260eSStefano Zampini             printf("%d ",total_ranks_recv[displacements_recv[j]+i]);
25433828260eSStefano Zampini           }
25443828260eSStefano Zampini           printf("\n");
2545da1bb401SStefano Zampini         }*/
25460c7d97c5SJed Brown 
25470c7d97c5SJed Brown         /* identify new decomposition in terms of ranks in the old communicator */
25483828260eSStefano Zampini         for(i=0;i<n_subdomains;i++) coarse_subdivision[ranks_stretching_ratio*i]=coarse_subdivision[ranks_stretching_ratio*i]*procs_jumps_coarse_comm;
2549da1bb401SStefano Zampini         /*printf("coarse_subdivision in old end new ranks\n");
25500c7d97c5SJed Brown         for(i=0;i<size_prec_comm;i++)
25513828260eSStefano Zampini           if(coarse_subdivision[i]!=MPI_PROC_NULL) {
25523828260eSStefano Zampini             printf("%d=(%d %d), ",i,coarse_subdivision[i],coarse_subdivision[i]/procs_jumps_coarse_comm);
25533828260eSStefano Zampini           } else {
25543828260eSStefano Zampini             printf("%d=(%d %d), ",i,coarse_subdivision[i],coarse_subdivision[i]);
25553828260eSStefano Zampini           }
2556da1bb401SStefano Zampini         printf("\n");*/
25570c7d97c5SJed Brown       }
25580c7d97c5SJed Brown 
25590c7d97c5SJed Brown       /* Scatter new decomposition for send details */
256053cdbc3dSStefano Zampini       ierr = MPI_Scatter(&coarse_subdivision[0],1,MPIU_INT,&rank_coarse_proc_send_to,1,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
25610c7d97c5SJed Brown       /* Scatter receiving details to members of coarse decomposition */
25620c7d97c5SJed Brown       if( coarse_color == 0) {
256353cdbc3dSStefano Zampini         ierr = MPI_Scatter(&total_count_recv[0],1,MPIU_INT,&count_recv,1,MPIU_INT,master_proc,coarse_comm);CHKERRQ(ierr);
25640c7d97c5SJed Brown         ierr = PetscMalloc (count_recv*sizeof(PetscMPIInt),&ranks_recv);CHKERRQ(ierr);
256553cdbc3dSStefano Zampini         ierr = MPI_Scatterv(&total_ranks_recv[0],total_count_recv,displacements_recv,MPIU_INT,&ranks_recv[0],count_recv,MPIU_INT,master_proc,coarse_comm);CHKERRQ(ierr);
25660c7d97c5SJed Brown       }
25670c7d97c5SJed Brown 
2568da1bb401SStefano Zampini       /*printf("I will send my matrix data to proc  %d\n",rank_coarse_proc_send_to);
2569da1bb401SStefano Zampini       if(coarse_color == 0) {
2570da1bb401SStefano Zampini         printf("I will receive some matrix data from %d processes (ranks follows)\n",count_recv);
2571da1bb401SStefano Zampini         for(i=0;i<count_recv;i++)
2572da1bb401SStefano Zampini           printf("%d ",ranks_recv[i]);
2573da1bb401SStefano Zampini         printf("\n");
2574da1bb401SStefano Zampini       }*/
25750c7d97c5SJed Brown 
25760c7d97c5SJed Brown       if(rank_prec_comm == master_proc) {
2577da1bb401SStefano Zampini         /*ierr = PetscFree(coarse_subdivision);CHKERRQ(ierr);
2578da1bb401SStefano Zampini         ierr = PetscFree(total_count_recv);CHKERRQ(ierr);
2579da1bb401SStefano Zampini         ierr = PetscFree(total_ranks_recv);CHKERRQ(ierr);*/
25800c7d97c5SJed Brown         free(coarse_subdivision);
25810c7d97c5SJed Brown         free(total_count_recv);
25820c7d97c5SJed Brown         free(total_ranks_recv);
25830c7d97c5SJed Brown         ierr = PetscFree(displacements_recv);CHKERRQ(ierr);
25840c7d97c5SJed Brown       }
25850c7d97c5SJed Brown       break;
25860c7d97c5SJed Brown     }
25870c7d97c5SJed Brown 
25880c7d97c5SJed Brown     case(REPLICATED_BDDC):
25890c7d97c5SJed Brown 
25900c7d97c5SJed Brown       pcbddc->coarse_communications_type = GATHERS_BDDC;
25910c7d97c5SJed Brown       coarse_mat_type = MATSEQAIJ;
25920c7d97c5SJed Brown       coarse_pc_type  = PCLU;
259353cdbc3dSStefano Zampini       coarse_ksp_type  = KSPPREONLY;
25940c7d97c5SJed Brown       coarse_comm = PETSC_COMM_SELF;
25950c7d97c5SJed Brown       active_rank = rank_prec_comm;
25960c7d97c5SJed Brown       break;
25970c7d97c5SJed Brown 
25980c7d97c5SJed Brown     case(PARALLEL_BDDC):
25990c7d97c5SJed Brown 
26000c7d97c5SJed Brown       pcbddc->coarse_communications_type = SCATTERS_BDDC;
26010c7d97c5SJed Brown       coarse_mat_type = MATMPIAIJ;
26020c7d97c5SJed Brown       coarse_pc_type  = PCREDUNDANT;
260353cdbc3dSStefano Zampini       coarse_ksp_type  = KSPPREONLY;
26040c7d97c5SJed Brown       coarse_comm = prec_comm;
26050c7d97c5SJed Brown       active_rank = rank_prec_comm;
26060c7d97c5SJed Brown       break;
26070c7d97c5SJed Brown 
26080c7d97c5SJed Brown     case(SEQUENTIAL_BDDC):
26090c7d97c5SJed Brown       pcbddc->coarse_communications_type = GATHERS_BDDC;
26100c7d97c5SJed Brown       coarse_mat_type = MATSEQAIJ;
26110c7d97c5SJed Brown       coarse_pc_type = PCLU;
261253cdbc3dSStefano Zampini       coarse_ksp_type  = KSPPREONLY;
26130c7d97c5SJed Brown       coarse_comm = PETSC_COMM_SELF;
26140c7d97c5SJed Brown       active_rank = master_proc;
26150c7d97c5SJed Brown       break;
26160c7d97c5SJed Brown   }
26170c7d97c5SJed Brown 
26180c7d97c5SJed Brown   switch(pcbddc->coarse_communications_type){
26190c7d97c5SJed Brown 
26200c7d97c5SJed Brown     case(SCATTERS_BDDC):
26210c7d97c5SJed Brown       {
26220c7d97c5SJed Brown         if(pcbddc->coarse_problem_type==MULTILEVEL_BDDC) {
26230c7d97c5SJed Brown 
26240c7d97c5SJed Brown           PetscMPIInt send_size;
26250c7d97c5SJed Brown           PetscInt    *aux_ins_indices;
26260c7d97c5SJed Brown           PetscInt    ii,jj;
26270c7d97c5SJed Brown           MPI_Request *requests;
26280c7d97c5SJed Brown 
26290c7d97c5SJed Brown           /* allocate auxiliary space */
26305619798eSStefano Zampini           ierr = PetscMalloc (pcbddc->replicated_primal_size*sizeof(PetscMPIInt),&pcbddc->replicated_local_primal_indices);CHKERRQ(ierr);
26315619798eSStefano Zampini           ierr = MPI_Allgatherv(&pcbddc->local_primal_indices[0],pcbddc->local_primal_size,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,prec_comm);CHKERRQ(ierr);
26320c7d97c5SJed Brown           ierr = PetscMalloc ( pcbddc->coarse_size*sizeof(PetscInt),&aux_ins_indices);CHKERRQ(ierr);
26330c7d97c5SJed Brown           ierr = PetscMemzero(aux_ins_indices,pcbddc->coarse_size*sizeof(PetscInt));CHKERRQ(ierr);
26340c7d97c5SJed Brown           /* allocate storage for message passing */
26350c7d97c5SJed Brown           ierr = PetscMalloc ( (count_recv+1)*sizeof(MPI_Request),&requests);CHKERRQ(ierr);
26360c7d97c5SJed Brown           for(i=0;i<count_recv+1;i++) requests[i]=MPI_REQUEST_NULL;
26370c7d97c5SJed Brown           ierr = PetscMalloc ( count_recv*sizeof(PetscMPIInt),&localsizes2);CHKERRQ(ierr);
26380c7d97c5SJed Brown           ierr = PetscMalloc ( count_recv*sizeof(PetscMPIInt),&localdispl2);CHKERRQ(ierr);
26390c7d97c5SJed Brown           /* fill up quantities */
26400c7d97c5SJed Brown           j=0;
26410c7d97c5SJed Brown           for(i=0;i<count_recv;i++){
26420c7d97c5SJed Brown             ii = ranks_recv[i];
26430c7d97c5SJed Brown             localsizes2[i]=pcbddc->local_primal_sizes[ii]*pcbddc->local_primal_sizes[ii];
26440c7d97c5SJed Brown             localdispl2[i]=j;
26450c7d97c5SJed Brown             j+=localsizes2[i];
26460c7d97c5SJed Brown             jj = pcbddc->local_primal_displacements[ii];
2647da1bb401SStefano Zampini             for(k=0;k<pcbddc->local_primal_sizes[ii];k++) aux_ins_indices[pcbddc->replicated_local_primal_indices[jj+k]]+=1;  /* it counts the coarse subdomains sharing the coarse node */
26480c7d97c5SJed Brown           }
2649da1bb401SStefano Zampini           /*printf("aux_ins_indices 1\n");
2650da1bb401SStefano Zampini           for(i=0;i<pcbddc->coarse_size;i++)
2651da1bb401SStefano Zampini             printf("%d ",aux_ins_indices[i]);
2652da1bb401SStefano Zampini           printf("\n");*/
26530c7d97c5SJed Brown           /* temp_coarse_mat_vals is used to temporarily store received matrix values */
26540c7d97c5SJed Brown           ierr = PetscMalloc ( j*sizeof(PetscScalar),&temp_coarse_mat_vals);CHKERRQ(ierr);
26550c7d97c5SJed Brown           /* evaluate how many values I will insert in coarse mat */
26560c7d97c5SJed Brown           ins_local_primal_size=0;
26570c7d97c5SJed Brown           for(i=0;i<pcbddc->coarse_size;i++)
26580c7d97c5SJed Brown             if(aux_ins_indices[i])
26590c7d97c5SJed Brown               ins_local_primal_size++;
26600c7d97c5SJed Brown           /* evaluate indices I will insert in coarse mat */
26610c7d97c5SJed Brown           ierr = PetscMalloc ( ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr);
26620c7d97c5SJed Brown           j=0;
26630c7d97c5SJed Brown           for(i=0;i<pcbddc->coarse_size;i++)
26640c7d97c5SJed Brown             if(aux_ins_indices[i])
26650c7d97c5SJed Brown               ins_local_primal_indices[j++]=i;
26660c7d97c5SJed Brown           /* use aux_ins_indices to realize a global to local mapping */
26670c7d97c5SJed Brown           j=0;
26680c7d97c5SJed Brown           for(i=0;i<pcbddc->coarse_size;i++){
26690c7d97c5SJed Brown             if(aux_ins_indices[i]==0){
26700c7d97c5SJed Brown               aux_ins_indices[i]=-1;
26710c7d97c5SJed Brown             } else {
26720c7d97c5SJed Brown               aux_ins_indices[i]=j;
26730c7d97c5SJed Brown               j++;
26740c7d97c5SJed Brown             }
26750c7d97c5SJed Brown           }
26760c7d97c5SJed Brown 
2677da1bb401SStefano Zampini           /*printf("New details localsizes2 localdispl2\n");
2678da1bb401SStefano Zampini           for(i=0;i<count_recv;i++)
2679da1bb401SStefano Zampini             printf("(%d %d) ",localsizes2[i],localdispl2[i]);
2680da1bb401SStefano Zampini           printf("\n");
2681da1bb401SStefano Zampini           printf("aux_ins_indices 2\n");
2682da1bb401SStefano Zampini           for(i=0;i<pcbddc->coarse_size;i++)
2683da1bb401SStefano Zampini             printf("%d ",aux_ins_indices[i]);
2684da1bb401SStefano Zampini           printf("\n");
2685da1bb401SStefano Zampini           printf("ins_local_primal_indices\n");
2686da1bb401SStefano Zampini           for(i=0;i<ins_local_primal_size;i++)
2687da1bb401SStefano Zampini             printf("%d ",ins_local_primal_indices[i]);
2688da1bb401SStefano Zampini           printf("\n");
2689da1bb401SStefano Zampini           printf("coarse_submat_vals\n");
2690da1bb401SStefano Zampini           for(i=0;i<pcbddc->local_primal_size;i++)
2691da1bb401SStefano Zampini             for(j=0;j<pcbddc->local_primal_size;j++)
2692da1bb401SStefano Zampini               printf("(%lf %d %d)\n",coarse_submat_vals[j*pcbddc->local_primal_size+i],pcbddc->local_primal_indices[i],pcbddc->local_primal_indices[j]);
2693da1bb401SStefano Zampini           printf("\n");*/
26940c7d97c5SJed Brown 
26950c7d97c5SJed Brown           /* processes participating in the coarse problem receive matrix data from their sending processes */
269653cdbc3dSStefano Zampini           for(i=0;i<count_recv;i++) ierr = MPI_Irecv(&temp_coarse_mat_vals[localdispl2[i]],localsizes2[i],MPIU_SCALAR,ranks_recv[i],666,prec_comm,&requests[i]);CHKERRQ(ierr);
26970c7d97c5SJed Brown           if(rank_coarse_proc_send_to != MPI_PROC_NULL ) {
26980c7d97c5SJed Brown             send_size=pcbddc->local_primal_size*pcbddc->local_primal_size;
269953cdbc3dSStefano Zampini             ierr = MPI_Isend(&coarse_submat_vals[0],send_size,MPIU_SCALAR,rank_coarse_proc_send_to,666,prec_comm,&requests[count_recv]);CHKERRQ(ierr);
27000c7d97c5SJed Brown           }
270153cdbc3dSStefano Zampini           ierr = MPI_Waitall(count_recv+1,requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
27020c7d97c5SJed Brown 
2703da1bb401SStefano Zampini           /*if(coarse_color == 0) {
2704da1bb401SStefano Zampini             printf("temp_coarse_mat_vals\n");
2705da1bb401SStefano Zampini             for(k=0;k<count_recv;k++){
2706da1bb401SStefano Zampini               printf("---- %d ----\n",ranks_recv[k]);
2707da1bb401SStefano Zampini               for(i=0;i<pcbddc->local_primal_sizes[ranks_recv[k]];i++)
2708da1bb401SStefano Zampini                 for(j=0;j<pcbddc->local_primal_sizes[ranks_recv[k]];j++)
2709da1bb401SStefano Zampini                   printf("(%lf %d %d)\n",temp_coarse_mat_vals[localdispl2[k]+j*pcbddc->local_primal_sizes[ranks_recv[k]]+i],pcbddc->replicated_local_primal_indices[pcbddc->local_primal_displacements[ranks_recv[k]]+i],pcbddc->replicated_local_primal_indices[pcbddc->local_primal_displacements[ranks_recv[k]]+j]);
2710da1bb401SStefano Zampini               printf("\n");
2711da1bb401SStefano Zampini             }
2712da1bb401SStefano Zampini           }*/
27130c7d97c5SJed Brown           /* calculate data to insert in coarse mat */
27140c7d97c5SJed Brown           ierr = PetscMalloc ( ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar),&ins_coarse_mat_vals);CHKERRQ(ierr);
27150c7d97c5SJed Brown           PetscMemzero(ins_coarse_mat_vals,ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar));
27160c7d97c5SJed Brown 
27170c7d97c5SJed Brown           PetscMPIInt rr,kk,lps,lpd;
27180c7d97c5SJed Brown           PetscInt row_ind,col_ind;
27190c7d97c5SJed Brown           for(k=0;k<count_recv;k++){
27200c7d97c5SJed Brown             rr = ranks_recv[k];
27210c7d97c5SJed Brown             kk = localdispl2[k];
27220c7d97c5SJed Brown             lps = pcbddc->local_primal_sizes[rr];
27230c7d97c5SJed Brown             lpd = pcbddc->local_primal_displacements[rr];
2724da1bb401SStefano Zampini             /*printf("Inserting the following indices (received from %d)\n",rr);*/
27250c7d97c5SJed Brown             for(j=0;j<lps;j++){
27260c7d97c5SJed Brown               col_ind=aux_ins_indices[pcbddc->replicated_local_primal_indices[lpd+j]];
27270c7d97c5SJed Brown               for(i=0;i<lps;i++){
27280c7d97c5SJed Brown                 row_ind=aux_ins_indices[pcbddc->replicated_local_primal_indices[lpd+i]];
2729da1bb401SStefano Zampini                 /*printf("%d %d\n",row_ind,col_ind);*/
27300c7d97c5SJed Brown                 ins_coarse_mat_vals[col_ind*ins_local_primal_size+row_ind]+=temp_coarse_mat_vals[kk+j*lps+i];
27310c7d97c5SJed Brown               }
27320c7d97c5SJed Brown             }
27330c7d97c5SJed Brown           }
27340c7d97c5SJed Brown           ierr = PetscFree(requests);CHKERRQ(ierr);
27350c7d97c5SJed Brown           ierr = PetscFree(aux_ins_indices);CHKERRQ(ierr);
27360c7d97c5SJed Brown           ierr = PetscFree(temp_coarse_mat_vals);CHKERRQ(ierr);
27370c7d97c5SJed Brown           if(coarse_color == 0) { ierr = PetscFree(ranks_recv);CHKERRQ(ierr); }
27380c7d97c5SJed Brown 
27390c7d97c5SJed Brown           /* create local to global mapping needed by coarse MATIS */
27400c7d97c5SJed Brown           {
27410c7d97c5SJed Brown             IS coarse_IS;
274253cdbc3dSStefano Zampini             if(coarse_comm != MPI_COMM_NULL ) ierr = MPI_Comm_free(&coarse_comm);CHKERRQ(ierr);
27430c7d97c5SJed Brown             coarse_comm = prec_comm;
27440c7d97c5SJed Brown             active_rank=rank_prec_comm;
27450c7d97c5SJed Brown             ierr = ISCreateGeneral(coarse_comm,ins_local_primal_size,ins_local_primal_indices,PETSC_COPY_VALUES,&coarse_IS);CHKERRQ(ierr);
27460c7d97c5SJed Brown             ierr = ISLocalToGlobalMappingCreateIS(coarse_IS,&coarse_ISLG);CHKERRQ(ierr);
27470c7d97c5SJed Brown             ierr = ISDestroy(&coarse_IS);CHKERRQ(ierr);
27480c7d97c5SJed Brown           }
27490c7d97c5SJed Brown         }
27500c7d97c5SJed Brown         if(pcbddc->coarse_problem_type==PARALLEL_BDDC) {
27510c7d97c5SJed Brown           /* arrays for values insertion */
27520c7d97c5SJed Brown           ins_local_primal_size = pcbddc->local_primal_size;
27530c7d97c5SJed Brown           ierr = PetscMalloc ( ins_local_primal_size*sizeof(PetscMPIInt),&ins_local_primal_indices);CHKERRQ(ierr);
27540c7d97c5SJed Brown           ierr = PetscMalloc ( ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar),&ins_coarse_mat_vals);CHKERRQ(ierr);
27550c7d97c5SJed Brown           for(j=0;j<ins_local_primal_size;j++){
27560c7d97c5SJed Brown             ins_local_primal_indices[j]=pcbddc->local_primal_indices[j];
27570c7d97c5SJed Brown             for(i=0;i<ins_local_primal_size;i++) ins_coarse_mat_vals[j*ins_local_primal_size+i]=coarse_submat_vals[j*ins_local_primal_size+i];
27580c7d97c5SJed Brown           }
27590c7d97c5SJed Brown         }
27600c7d97c5SJed Brown         break;
27610c7d97c5SJed Brown 
27620c7d97c5SJed Brown     }
27630c7d97c5SJed Brown 
27640c7d97c5SJed Brown     case(GATHERS_BDDC):
27650c7d97c5SJed Brown       {
27660c7d97c5SJed Brown 
27670c7d97c5SJed Brown         PetscMPIInt mysize,mysize2;
27680c7d97c5SJed Brown 
27690c7d97c5SJed Brown         if(rank_prec_comm==active_rank) {
27700c7d97c5SJed Brown           ierr = PetscMalloc ( pcbddc->replicated_primal_size*sizeof(PetscMPIInt),&pcbddc->replicated_local_primal_indices);CHKERRQ(ierr);
27710c7d97c5SJed Brown           pcbddc->replicated_local_primal_values = (PetscScalar*)calloc(pcbddc->replicated_primal_size,sizeof(PetscScalar));
27720c7d97c5SJed Brown           ierr = PetscMalloc ( size_prec_comm*sizeof(PetscMPIInt),&localsizes2);CHKERRQ(ierr);
27730c7d97c5SJed Brown           ierr = PetscMalloc ( size_prec_comm*sizeof(PetscMPIInt),&localdispl2);CHKERRQ(ierr);
27740c7d97c5SJed Brown           /* arrays for values insertion */
27750c7d97c5SJed Brown           ins_local_primal_size = pcbddc->coarse_size;
27760c7d97c5SJed Brown           ierr = PetscMalloc ( ins_local_primal_size*sizeof(PetscMPIInt),&ins_local_primal_indices);CHKERRQ(ierr);
27770c7d97c5SJed Brown           ierr = PetscMalloc ( ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar),&ins_coarse_mat_vals);CHKERRQ(ierr);
27780c7d97c5SJed Brown           for(i=0;i<size_prec_comm;i++) localsizes2[i]=pcbddc->local_primal_sizes[i]*pcbddc->local_primal_sizes[i];
27790c7d97c5SJed Brown           localdispl2[0]=0;
27800c7d97c5SJed Brown           for(i=1;i<size_prec_comm;i++) localdispl2[i]=localsizes2[i-1]+localdispl2[i-1];
27810c7d97c5SJed Brown           j=0;
27820c7d97c5SJed Brown           for(i=0;i<size_prec_comm;i++) j+=localsizes2[i];
27830c7d97c5SJed Brown           ierr = PetscMalloc ( j*sizeof(PetscScalar),&temp_coarse_mat_vals);CHKERRQ(ierr);
27840c7d97c5SJed Brown         }
27850c7d97c5SJed Brown 
27860c7d97c5SJed Brown         mysize=pcbddc->local_primal_size;
27870c7d97c5SJed Brown         mysize2=pcbddc->local_primal_size*pcbddc->local_primal_size;
27880c7d97c5SJed Brown         if(pcbddc->coarse_problem_type == SEQUENTIAL_BDDC){
278953cdbc3dSStefano Zampini           ierr = MPI_Gatherv(&pcbddc->local_primal_indices[0],mysize,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
279053cdbc3dSStefano Zampini           ierr = MPI_Gatherv(&coarse_submat_vals[0],mysize2,MPIU_SCALAR,&temp_coarse_mat_vals[0],localsizes2,localdispl2,MPIU_SCALAR,master_proc,prec_comm);CHKERRQ(ierr);
27910c7d97c5SJed Brown         } else {
279253cdbc3dSStefano Zampini           ierr = MPI_Allgatherv(&pcbddc->local_primal_indices[0],mysize,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,prec_comm);CHKERRQ(ierr);
279353cdbc3dSStefano Zampini           ierr = MPI_Allgatherv(&coarse_submat_vals[0],mysize2,MPIU_SCALAR,&temp_coarse_mat_vals[0],localsizes2,localdispl2,MPIU_SCALAR,prec_comm);CHKERRQ(ierr);
27940c7d97c5SJed Brown         }
27950c7d97c5SJed Brown 
27960c7d97c5SJed Brown   /* on the active rank(s): set insertion indices and sum the gathered subdomain values into ins_coarse_mat_vals */
27970c7d97c5SJed Brown         if(rank_prec_comm==active_rank) {
27980c7d97c5SJed Brown           PetscInt offset,offset2,row_ind,col_ind;
27990c7d97c5SJed Brown           for(j=0;j<ins_local_primal_size;j++){
28000c7d97c5SJed Brown             ins_local_primal_indices[j]=j;
28010c7d97c5SJed Brown             for(i=0;i<ins_local_primal_size;i++) ins_coarse_mat_vals[j*ins_local_primal_size+i]=0.0;
28020c7d97c5SJed Brown           }
28030c7d97c5SJed Brown           for(k=0;k<size_prec_comm;k++){
28040c7d97c5SJed Brown             offset=pcbddc->local_primal_displacements[k];
28050c7d97c5SJed Brown             offset2=localdispl2[k];
28060c7d97c5SJed Brown             for(j=0;j<pcbddc->local_primal_sizes[k];j++){
28070c7d97c5SJed Brown               col_ind=pcbddc->replicated_local_primal_indices[offset+j];
28080c7d97c5SJed Brown               for(i=0;i<pcbddc->local_primal_sizes[k];i++){
28090c7d97c5SJed Brown                 row_ind=pcbddc->replicated_local_primal_indices[offset+i];
28100c7d97c5SJed Brown                 ins_coarse_mat_vals[col_ind*pcbddc->coarse_size+row_ind]+=temp_coarse_mat_vals[offset2+j*pcbddc->local_primal_sizes[k]+i];
28110c7d97c5SJed Brown               }
28120c7d97c5SJed Brown             }
28130c7d97c5SJed Brown           }
28140c7d97c5SJed Brown         }
28150c7d97c5SJed Brown         break;
2816da1bb401SStefano Zampini       }/* switch on coarse problem and communications associated with finished */
28170c7d97c5SJed Brown   }
28180c7d97c5SJed Brown 
28190c7d97c5SJed Brown   /* Now create and fill up coarse matrix */
28200c7d97c5SJed Brown   if( rank_prec_comm == active_rank ) {
28210c7d97c5SJed Brown     if(pcbddc->coarse_problem_type != MULTILEVEL_BDDC) {
28220c7d97c5SJed Brown       ierr = MatCreate(coarse_comm,&pcbddc->coarse_mat);CHKERRQ(ierr);
28230c7d97c5SJed Brown       ierr = MatSetSizes(pcbddc->coarse_mat,PETSC_DECIDE,PETSC_DECIDE,pcbddc->coarse_size,pcbddc->coarse_size);CHKERRQ(ierr);
28240c7d97c5SJed Brown       ierr = MatSetType(pcbddc->coarse_mat,coarse_mat_type);CHKERRQ(ierr);
28253b03a366Sstefano_zampini       ierr = MatSetUp(pcbddc->coarse_mat);CHKERRQ(ierr);
2826da1bb401SStefano Zampini       ierr = MatSetOption(pcbddc->coarse_mat,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr); /* local values stored in column major */
28273b03a366Sstefano_zampini       ierr = MatSetOption(pcbddc->coarse_mat,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr);
28280c7d97c5SJed Brown     } else {
28290c7d97c5SJed Brown       Mat matis_coarse_local_mat;
2830d3ee2243SStefano Zampini       /* remind bs */
2831d3ee2243SStefano Zampini       ierr = MatCreateIS(coarse_comm,bs,PETSC_DECIDE,PETSC_DECIDE,pcbddc->coarse_size,pcbddc->coarse_size,coarse_ISLG,&pcbddc->coarse_mat);CHKERRQ(ierr);
28323b03a366Sstefano_zampini       ierr = MatSetUp(pcbddc->coarse_mat);CHKERRQ(ierr);
28330c7d97c5SJed Brown       ierr = MatISGetLocalMat(pcbddc->coarse_mat,&matis_coarse_local_mat);CHKERRQ(ierr);
28343b03a366Sstefano_zampini       ierr = MatSetUp(matis_coarse_local_mat);CHKERRQ(ierr);
2835da1bb401SStefano Zampini       ierr = MatSetOption(matis_coarse_local_mat,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr); /* local values stored in column major */
2836a0ba757dSStefano Zampini       ierr = MatSetOption(matis_coarse_local_mat,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr);
28370c7d97c5SJed Brown     }
2838a0ba757dSStefano Zampini     ierr = MatSetOption(pcbddc->coarse_mat,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_FALSE);CHKERRQ(ierr);
28390c7d97c5SJed Brown     ierr = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,ADD_VALUES);CHKERRQ(ierr);
28400c7d97c5SJed Brown     ierr = MatAssemblyBegin(pcbddc->coarse_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
28410c7d97c5SJed Brown     ierr = MatAssemblyEnd(pcbddc->coarse_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
28420c7d97c5SJed Brown 
2843da1bb401SStefano Zampini     /*  PetscViewer view_out;
2844da1bb401SStefano Zampini       ierr = PetscViewerASCIIOpen(PETSC_COMM_SELF,"coarsematfull.m",&view_out);CHKERRQ(ierr);
2845da1bb401SStefano Zampini       ierr = PetscViewerSetFormat(view_out,PETSC_VIEWER_ASCII_MATLAB);CHKERRQ(ierr);
2846da1bb401SStefano Zampini       ierr = MatView(pcbddc->coarse_mat,view_out);CHKERRQ(ierr);
2847da1bb401SStefano Zampini       ierr = PetscViewerDestroy(&view_out);CHKERRQ(ierr);*/
2848da1bb401SStefano Zampini 
28490c7d97c5SJed Brown     ierr = MatGetVecs(pcbddc->coarse_mat,&pcbddc->coarse_vec,&pcbddc->coarse_rhs);CHKERRQ(ierr);
28500c7d97c5SJed Brown     /* Preconditioner for coarse problem */
285153cdbc3dSStefano Zampini     ierr = KSPCreate(coarse_comm,&pcbddc->coarse_ksp);CHKERRQ(ierr);
285253cdbc3dSStefano Zampini     ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->coarse_ksp,(PetscObject)pc,1);CHKERRQ(ierr);
285353cdbc3dSStefano Zampini     ierr = KSPSetOperators(pcbddc->coarse_ksp,pcbddc->coarse_mat,pcbddc->coarse_mat,SAME_PRECONDITIONER);CHKERRQ(ierr);
28543b03a366Sstefano_zampini     ierr = KSPSetTolerances(pcbddc->coarse_ksp,PETSC_DEFAULT,PETSC_DEFAULT,PETSC_DEFAULT,max_it_coarse_ksp);CHKERRQ(ierr);
285553cdbc3dSStefano Zampini     ierr = KSPSetType(pcbddc->coarse_ksp,coarse_ksp_type);CHKERRQ(ierr);
285653cdbc3dSStefano Zampini     ierr = KSPGetPC(pcbddc->coarse_ksp,&pc_temp);CHKERRQ(ierr);
285753cdbc3dSStefano Zampini     ierr = PCSetType(pc_temp,coarse_pc_type);CHKERRQ(ierr);
28580c7d97c5SJed Brown     /* Allow user's customization */
2859da1bb401SStefano Zampini     ierr = KSPSetOptionsPrefix(pcbddc->coarse_ksp,"coarse_");CHKERRQ(ierr);
286053cdbc3dSStefano Zampini     ierr = KSPSetFromOptions(pcbddc->coarse_ksp);CHKERRQ(ierr);
28610c7d97c5SJed Brown     /* Set Up PC for coarse problem BDDC */
286253cdbc3dSStefano Zampini     if(pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
2863e269702eSStefano Zampini       if(dbg_flag) {
2864e269702eSStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"----------------Setting up a new level---------------\n");CHKERRQ(ierr);
2865e269702eSStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
2866e269702eSStefano Zampini       }
286753cdbc3dSStefano Zampini       ierr = PCBDDCSetCoarseProblemType(pc_temp,MULTILEVEL_BDDC);CHKERRQ(ierr);
286853cdbc3dSStefano Zampini     }
286953cdbc3dSStefano Zampini     ierr = KSPSetUp(pcbddc->coarse_ksp);CHKERRQ(ierr);
28705619798eSStefano Zampini     if(pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
28715619798eSStefano Zampini       if(dbg_flag) {
28725619798eSStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"----------------New level set------------------------\n");CHKERRQ(ierr);
28735619798eSStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
28745619798eSStefano Zampini       }
28755619798eSStefano Zampini     }
28760c7d97c5SJed Brown   }
28770c7d97c5SJed Brown   if(pcbddc->coarse_communications_type == SCATTERS_BDDC) {
28780c7d97c5SJed Brown      IS local_IS,global_IS;
28790c7d97c5SJed Brown      ierr = ISCreateStride(PETSC_COMM_SELF,pcbddc->local_primal_size,0,1,&local_IS);CHKERRQ(ierr);
28800c7d97c5SJed Brown      ierr = ISCreateGeneral(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_indices,PETSC_COPY_VALUES,&global_IS);CHKERRQ(ierr);
28810c7d97c5SJed Brown      ierr = VecScatterCreate(pcbddc->vec1_P,local_IS,pcbddc->coarse_vec,global_IS,&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr);
28820c7d97c5SJed Brown      ierr = ISDestroy(&local_IS);CHKERRQ(ierr);
28830c7d97c5SJed Brown      ierr = ISDestroy(&global_IS);CHKERRQ(ierr);
28840c7d97c5SJed Brown   }
28850c7d97c5SJed Brown 
28860c7d97c5SJed Brown 
28873b03a366Sstefano_zampini   /* Evaluate condition number of coarse problem for cheby (and verbose output if requested) */
28883b03a366Sstefano_zampini   if( pcbddc->coarse_problem_type == MULTILEVEL_BDDC && rank_prec_comm == active_rank ) {
28890c7d97c5SJed Brown     PetscScalar m_one=-1.0;
28905619798eSStefano Zampini     PetscReal   infty_error,lambda_min,lambda_max,kappa_2;
28913b03a366Sstefano_zampini     const KSPType check_ksp_type=KSPGMRES;
28920c7d97c5SJed Brown 
28935619798eSStefano Zampini     /* change coarse ksp object to an iterative method suitable for extreme eigenvalues' estimation */
28943b03a366Sstefano_zampini     ierr = KSPSetType(pcbddc->coarse_ksp,check_ksp_type);CHKERRQ(ierr);
2895d49ef151SStefano Zampini     ierr = KSPSetComputeSingularValues(pcbddc->coarse_ksp,PETSC_TRUE);CHKERRQ(ierr);
28965619798eSStefano Zampini     ierr = KSPSetTolerances(pcbddc->coarse_ksp,1.e-8,1.e-8,PETSC_DEFAULT,pcbddc->coarse_size);CHKERRQ(ierr);
28975619798eSStefano Zampini     ierr = KSPSetUp(pcbddc->coarse_ksp);CHKERRQ(ierr);
2898d49ef151SStefano Zampini     ierr = VecSetRandom(pcbddc->coarse_rhs,PETSC_NULL);CHKERRQ(ierr);
2899d49ef151SStefano Zampini     ierr = MatMult(pcbddc->coarse_mat,pcbddc->coarse_rhs,pcbddc->coarse_vec);CHKERRQ(ierr);
2900d49ef151SStefano Zampini     ierr = MatMult(pcbddc->coarse_mat,pcbddc->coarse_vec,pcbddc->coarse_rhs);CHKERRQ(ierr);
2901d49ef151SStefano Zampini     ierr = KSPSolve(pcbddc->coarse_ksp,pcbddc->coarse_rhs,pcbddc->coarse_rhs);CHKERRQ(ierr);
2902d49ef151SStefano Zampini     ierr = KSPComputeExtremeSingularValues(pcbddc->coarse_ksp,&lambda_max,&lambda_min);CHKERRQ(ierr);
29033b03a366Sstefano_zampini     if(dbg_flag) {
29045619798eSStefano Zampini       kappa_2=lambda_max/lambda_min;
29055619798eSStefano Zampini       ierr = KSPGetIterationNumber(pcbddc->coarse_ksp,&k);CHKERRQ(ierr);
2906d49ef151SStefano Zampini       ierr = VecAXPY(pcbddc->coarse_rhs,m_one,pcbddc->coarse_vec);CHKERRQ(ierr);
2907d49ef151SStefano Zampini       ierr = VecNorm(pcbddc->coarse_rhs,NORM_INFINITY,&infty_error);CHKERRQ(ierr);
29083b03a366Sstefano_zampini       ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem condition number estimated with %d iterations of %s is: % 1.14e\n",k,check_ksp_type,kappa_2);CHKERRQ(ierr);
2909e269702eSStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem eigenvalues: % 1.14e %1.14e\n",lambda_min,lambda_max);CHKERRQ(ierr);
2910e269702eSStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem infty_error: %1.14e\n",infty_error);CHKERRQ(ierr);
29113b03a366Sstefano_zampini     }
29125619798eSStefano Zampini     /* restore coarse ksp to default values */
2913d49ef151SStefano Zampini     ierr = KSPSetComputeSingularValues(pcbddc->coarse_ksp,PETSC_FALSE);CHKERRQ(ierr);
29145619798eSStefano Zampini     ierr = KSPSetType(pcbddc->coarse_ksp,coarse_ksp_type);CHKERRQ(ierr);
29156c9de887SHong Zhang     ierr = KSPChebyshevSetEigenvalues(pcbddc->coarse_ksp,lambda_max,lambda_min);CHKERRQ(ierr);
29163b03a366Sstefano_zampini     ierr = KSPSetTolerances(pcbddc->coarse_ksp,PETSC_DEFAULT,PETSC_DEFAULT,PETSC_DEFAULT,max_it_coarse_ksp);CHKERRQ(ierr);
29175619798eSStefano Zampini     ierr = KSPSetFromOptions(pcbddc->coarse_ksp);CHKERRQ(ierr);
29185619798eSStefano Zampini     ierr = KSPSetUp(pcbddc->coarse_ksp);CHKERRQ(ierr);
291953cdbc3dSStefano Zampini   }
29200c7d97c5SJed Brown 
29210c7d97c5SJed Brown   /* free data structures no longer needed */
29220c7d97c5SJed Brown   if(coarse_ISLG)                { ierr = ISLocalToGlobalMappingDestroy(&coarse_ISLG);CHKERRQ(ierr); }
29230c7d97c5SJed Brown   if(ins_local_primal_indices)   { ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr);  }
29240c7d97c5SJed Brown   if(ins_coarse_mat_vals)        { ierr = PetscFree(ins_coarse_mat_vals);CHKERRQ(ierr);}
29250c7d97c5SJed Brown   if(localsizes2)                { ierr = PetscFree(localsizes2);CHKERRQ(ierr);}
29260c7d97c5SJed Brown   if(localdispl2)                { ierr = PetscFree(localdispl2);CHKERRQ(ierr);}
29270c7d97c5SJed Brown   if(temp_coarse_mat_vals)       { ierr = PetscFree(temp_coarse_mat_vals);CHKERRQ(ierr);}
29280c7d97c5SJed Brown 
29290c7d97c5SJed Brown   PetscFunctionReturn(0);
29300c7d97c5SJed Brown }
29310c7d97c5SJed Brown 
29320c7d97c5SJed Brown #undef __FUNCT__
29330c7d97c5SJed Brown #define __FUNCT__ "PCBDDCManageLocalBoundaries"
293453cdbc3dSStefano Zampini static PetscErrorCode PCBDDCManageLocalBoundaries(PC pc)
29350c7d97c5SJed Brown {
29360c7d97c5SJed Brown 
29370c7d97c5SJed Brown   PC_BDDC     *pcbddc = (PC_BDDC*)pc->data;
29380c7d97c5SJed Brown   PC_IS         *pcis = (PC_IS*)pc->data;
29390c7d97c5SJed Brown   Mat_IS      *matis  = (Mat_IS*)pc->pmat->data;
2940da1bb401SStefano Zampini   PCBDDCGraph mat_graph=pcbddc->mat_graph;
2941a0ba757dSStefano Zampini   PetscInt    *queue_in_global_numbering;
29423b03a366Sstefano_zampini   PetscInt    bs,ierr,i,j,s,k,iindex,neumann_bsize,dirichlet_bsize;
2943da1bb401SStefano Zampini   PetscInt    total_counts,nodes_touched,where_values=1,vertex_size;
2944*534831adSStefano Zampini   PetscMPIInt adapt_interface=0,adapt_interface_reduced=0,NEUMANNCNT=0;
2945da1bb401SStefano Zampini   PetscBool   same_set;
2946a0ba757dSStefano Zampini   MPI_Comm    interface_comm=((PetscObject)pc)->comm;
29473b03a366Sstefano_zampini   PetscBool   use_faces=PETSC_FALSE,use_edges=PETSC_FALSE;
29483b03a366Sstefano_zampini   const PetscInt *neumann_nodes;
29493b03a366Sstefano_zampini   const PetscInt *dirichlet_nodes;
295036e030ebSStefano Zampini   IS          used_IS;
2951da1bb401SStefano Zampini   PetscScalar *array;
2952da1bb401SStefano Zampini   PetscScalar *array2;
2953da1bb401SStefano Zampini   PetscViewer viewer=pcbddc->dbg_viewer;
29540c7d97c5SJed Brown 
29550c7d97c5SJed Brown   PetscFunctionBegin;
2956da1bb401SStefano Zampini   /* Setup local adjacency graph */
2957da1bb401SStefano Zampini   mat_graph->nvtxs=pcis->n;
2958*534831adSStefano Zampini   if(!mat_graph->xadj) { NEUMANNCNT = 1; }
2959da1bb401SStefano Zampini   ierr = PCBDDCSetupLocalAdjacencyGraph(pc);CHKERRQ(ierr);
2960a0ba757dSStefano Zampini   i = mat_graph->nvtxs;
2961a0ba757dSStefano Zampini   ierr = PetscMalloc4(i,PetscInt,&mat_graph->where,i,PetscInt,&mat_graph->count,i+1,PetscInt,&mat_graph->cptr,i,PetscInt,&mat_graph->queue);CHKERRQ(ierr);
2962a0ba757dSStefano Zampini   ierr = PetscMalloc3(i,PetscInt,&mat_graph->which_dof,i,PetscBool,&mat_graph->touched,i,PetscInt,&queue_in_global_numbering);CHKERRQ(ierr);
2963a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->where,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
2964a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->count,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
2965a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->which_dof,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
2966a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->queue,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
29673828260eSStefano Zampini   ierr = PetscMemzero(mat_graph->cptr,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr);
2968a0ba757dSStefano Zampini 
29699c0446d6SStefano Zampini   /* Setting dofs splitting in mat_graph->which_dof */
29709c0446d6SStefano Zampini   if(pcbddc->n_ISForDofs) { /* get information about dofs' splitting if provided by the user */
29719c0446d6SStefano Zampini     PetscInt *is_indices;
29729c0446d6SStefano Zampini     PetscInt is_size;
29739c0446d6SStefano Zampini     for(i=0;i<pcbddc->n_ISForDofs;i++) {
29749c0446d6SStefano Zampini       ierr = ISGetSize(pcbddc->ISForDofs[i],&is_size);CHKERRQ(ierr);
29759c0446d6SStefano Zampini       ierr = ISGetIndices(pcbddc->ISForDofs[i],(const PetscInt**)&is_indices);CHKERRQ(ierr);
29769c0446d6SStefano Zampini       for(j=0;j<is_size;j++) {
29779c0446d6SStefano Zampini         mat_graph->which_dof[is_indices[j]]=i;
29789c0446d6SStefano Zampini       }
29799c0446d6SStefano Zampini       ierr = ISRestoreIndices(pcbddc->ISForDofs[i],(const PetscInt**)&is_indices);CHKERRQ(ierr);
29809c0446d6SStefano Zampini     }
29813b03a366Sstefano_zampini     /* use mat block size as vertex size */
29823b03a366Sstefano_zampini     ierr = MatGetBlockSize(matis->A,&vertex_size);CHKERRQ(ierr);
29833b03a366Sstefano_zampini   } else { /* otherwise it assumes a constant block size */
2984a0ba757dSStefano Zampini     ierr = MatGetBlockSize(matis->A,&bs);CHKERRQ(ierr);
29850c7d97c5SJed Brown     for(i=0;i<mat_graph->nvtxs/bs;i++) {
29860c7d97c5SJed Brown       for(s=0;s<bs;s++) {
29870c7d97c5SJed Brown         mat_graph->which_dof[i*bs+s]=s;
29880c7d97c5SJed Brown       }
29890c7d97c5SJed Brown     }
29903b03a366Sstefano_zampini     vertex_size=1;
29919c0446d6SStefano Zampini   }
29923b03a366Sstefano_zampini   /* count number of neigh per node */
29930c7d97c5SJed Brown   total_counts=0;
29943b03a366Sstefano_zampini   for(i=1;i<pcis->n_neigh;i++){
29950c7d97c5SJed Brown     s=pcis->n_shared[i];
29960c7d97c5SJed Brown     total_counts+=s;
299753cdbc3dSStefano Zampini     for(j=0;j<s;j++){
29980c7d97c5SJed Brown       mat_graph->count[pcis->shared[i][j]] += 1;
29990c7d97c5SJed Brown     }
30000c7d97c5SJed Brown   }
3001*534831adSStefano Zampini   /* Take into account Neumann data -> it increments number of sharing subdomains for nodes lying on the interface */
300236e030ebSStefano Zampini   ierr = PCBDDCGetNeumannBoundaries(pc,&used_IS);CHKERRQ(ierr);
3003da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
3004da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
300536e030ebSStefano Zampini   if(used_IS) {
300636e030ebSStefano Zampini     ierr = ISGetSize(used_IS,&neumann_bsize);CHKERRQ(ierr);
300736e030ebSStefano Zampini     ierr = ISGetIndices(used_IS,&neumann_nodes);CHKERRQ(ierr);
300853cdbc3dSStefano Zampini     for(i=0;i<neumann_bsize;i++){
300953cdbc3dSStefano Zampini       iindex = neumann_nodes[i];
3010*534831adSStefano Zampini       if(mat_graph->count[iindex] > NEUMANNCNT && array[iindex]==0.0){
301153cdbc3dSStefano Zampini         mat_graph->count[iindex]+=1;
30120c7d97c5SJed Brown         total_counts++;
3013da1bb401SStefano Zampini         array[iindex]=array[iindex]+1.0;
3014da1bb401SStefano Zampini       } else if(array[iindex]>0.0) {
3015da1bb401SStefano Zampini         SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"Error for neumann nodes provided to BDDC! They must be uniquely listed! Found duplicate node %d\n",iindex);
30160c7d97c5SJed Brown       }
30170c7d97c5SJed Brown     }
30180c7d97c5SJed Brown   }
3019da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3020da1bb401SStefano Zampini   /* allocate space for storing the set of neighbours for each node */
3021da1bb401SStefano Zampini   ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt*),&mat_graph->neighbours_set);CHKERRQ(ierr);
3022da1bb401SStefano Zampini   if(mat_graph->nvtxs) { ierr = PetscMalloc(total_counts*sizeof(PetscInt),&mat_graph->neighbours_set[0]);CHKERRQ(ierr); }
3023da1bb401SStefano Zampini   for(i=1;i<mat_graph->nvtxs;i++) mat_graph->neighbours_set[i]=mat_graph->neighbours_set[i-1]+mat_graph->count[i-1];
3024a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->count,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
30253b03a366Sstefano_zampini   for(i=1;i<pcis->n_neigh;i++){
30260c7d97c5SJed Brown     s=pcis->n_shared[i];
30270c7d97c5SJed Brown     for(j=0;j<s;j++) {
30280c7d97c5SJed Brown       k=pcis->shared[i][j];
3029da1bb401SStefano Zampini       mat_graph->neighbours_set[k][mat_graph->count[k]] = pcis->neigh[i];
30300c7d97c5SJed Brown       mat_graph->count[k]+=1;
30310c7d97c5SJed Brown     }
30320c7d97c5SJed Brown   }
3033da1bb401SStefano Zampini   /* Check consistency of Neumann nodes */
3034da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
3035da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3036da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3037da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3038da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3039da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
30403b03a366Sstefano_zampini   /* set -1 fake neighbour to mimic Neumann boundary */
304136e030ebSStefano Zampini   if(used_IS) {
304253cdbc3dSStefano Zampini     for(i=0;i<neumann_bsize;i++){
304353cdbc3dSStefano Zampini       iindex = neumann_nodes[i];
3044*534831adSStefano Zampini       if(mat_graph->count[iindex] > NEUMANNCNT){
3045da1bb401SStefano Zampini         if(mat_graph->count[iindex]+1 != (PetscInt)array[iindex]) {
3046da1bb401SStefano Zampini           SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_USER,"Neumann nodes provided to BDDC must be consistent among neighbours!\nNode %d: number of sharing subdomains %d != number of subdomains for which it is a neumann node %d\n",iindex,mat_graph->count[iindex]+1,(PetscInt)array[iindex]);
3047da1bb401SStefano Zampini         }
3048da1bb401SStefano Zampini         mat_graph->neighbours_set[iindex][mat_graph->count[iindex]] = -1;
304953cdbc3dSStefano Zampini         mat_graph->count[iindex]+=1;
30500c7d97c5SJed Brown       }
30510c7d97c5SJed Brown     }
305236e030ebSStefano Zampini     ierr = ISRestoreIndices(used_IS,&neumann_nodes);CHKERRQ(ierr);
30530c7d97c5SJed Brown   }
3054da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3055da1bb401SStefano Zampini   /* sort set of sharing subdomains */
3056da1bb401SStefano Zampini   for(i=0;i<mat_graph->nvtxs;i++) { ierr = PetscSortInt(mat_graph->count[i],mat_graph->neighbours_set[i]);CHKERRQ(ierr); }
30573b03a366Sstefano_zampini   /* remove interior nodes and dirichlet boundary nodes from the next search into the graph */
3058da1bb401SStefano Zampini   for(i=0;i<mat_graph->nvtxs;i++){mat_graph->touched[i]=PETSC_FALSE;}
3059da1bb401SStefano Zampini   nodes_touched=0;
306036e030ebSStefano Zampini   ierr = PCBDDCGetDirichletBoundaries(pc,&used_IS);CHKERRQ(ierr);
3061da1bb401SStefano Zampini   ierr = VecSet(pcis->vec2_N,0.0);CHKERRQ(ierr);
3062da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3063da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
3064da1bb401SStefano Zampini   if(used_IS) {
3065da1bb401SStefano Zampini     ierr = ISGetSize(used_IS,&dirichlet_bsize);CHKERRQ(ierr);
3066da1bb401SStefano Zampini     if(dirichlet_bsize && matis->pure_neumann) {
3067da1bb401SStefano Zampini       SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"Dirichlet boundaries are intended to be used with matrices with zeroed rows!\n");
3068da1bb401SStefano Zampini     }
3069da1bb401SStefano Zampini     ierr = ISGetIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
3070da1bb401SStefano Zampini     for(i=0;i<dirichlet_bsize;i++){
3071da1bb401SStefano Zampini       iindex=dirichlet_nodes[i];
3072da1bb401SStefano Zampini       if(mat_graph->count[iindex] && !mat_graph->touched[iindex]) {
3073da1bb401SStefano Zampini         if(array[iindex]>0.0) {
3074da1bb401SStefano Zampini           SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"BDDC cannot have nodes which are marked as Neumann and Dirichlet at the same time! Wrong node %d\n",iindex);
3075da1bb401SStefano Zampini         }
3076da1bb401SStefano Zampini         mat_graph->touched[iindex]=PETSC_TRUE;
3077da1bb401SStefano Zampini         mat_graph->where[iindex]=0;
3078da1bb401SStefano Zampini         nodes_touched++;
3079da1bb401SStefano Zampini         array2[iindex]=array2[iindex]+1.0;
3080da1bb401SStefano Zampini       }
3081da1bb401SStefano Zampini     }
3082da1bb401SStefano Zampini     ierr = ISRestoreIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
3083da1bb401SStefano Zampini   }
3084da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3085da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
3086da1bb401SStefano Zampini   /* Check consistency of Dirichlet nodes */
3087da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_N,1.0);CHKERRQ(ierr);
3088da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
3089da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3090da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3091da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3092da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3093da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
3094da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec2_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3095da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec2_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3096da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3097da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3098da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3099da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
310036e030ebSStefano Zampini   if(used_IS) {
310136e030ebSStefano Zampini     ierr = ISGetSize(used_IS,&dirichlet_bsize);CHKERRQ(ierr);
310236e030ebSStefano Zampini     ierr = ISGetIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
31033b03a366Sstefano_zampini     for(i=0;i<dirichlet_bsize;i++){
3104da1bb401SStefano Zampini       iindex=dirichlet_nodes[i];
3105da1bb401SStefano Zampini       if(array[iindex]>1.0 && array[iindex]!=array2[iindex] ) {
3106da1bb401SStefano Zampini          SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_USER,"Dirichlet nodes provided to BDDC must be consistent among neighbours!\nNode %d: number of sharing subdomains %d != number of subdomains for which it is a neumann node %d\n",iindex,(PetscInt)array[iindex],(PetscInt)array2[iindex]);
3107da1bb401SStefano Zampini       }
31083b03a366Sstefano_zampini     }
310936e030ebSStefano Zampini     ierr = ISRestoreIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
31103b03a366Sstefano_zampini   }
3111da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3112da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
3113da1bb401SStefano Zampini 
31140c7d97c5SJed Brown   for(i=0;i<mat_graph->nvtxs;i++){
31153b03a366Sstefano_zampini     if(!mat_graph->count[i]){  /* interior nodes */
31160c7d97c5SJed Brown       mat_graph->touched[i]=PETSC_TRUE;
31170c7d97c5SJed Brown       mat_graph->where[i]=0;
31180c7d97c5SJed Brown       nodes_touched++;
31190c7d97c5SJed Brown     }
31200c7d97c5SJed Brown   }
31210c7d97c5SJed Brown   mat_graph->ncmps = 0;
3122da1bb401SStefano Zampini   i=0;
31230c7d97c5SJed Brown   while(nodes_touched<mat_graph->nvtxs) {
3124a0ba757dSStefano Zampini     /*  find first untouched node in local ordering */
31250c7d97c5SJed Brown     while(mat_graph->touched[i]) i++;
31260c7d97c5SJed Brown     mat_graph->touched[i]=PETSC_TRUE;
3127a0ba757dSStefano Zampini     mat_graph->where[i]=where_values;
31280c7d97c5SJed Brown     nodes_touched++;
3129a0ba757dSStefano Zampini     /* now find all other nodes having the same set of sharing subdomains */
31300c7d97c5SJed Brown     for(j=i+1;j<mat_graph->nvtxs;j++){
3131a0ba757dSStefano Zampini       /* check for same number of sharing subdomains and dof number */
3132da1bb401SStefano Zampini       if(!mat_graph->touched[j] && mat_graph->count[i]==mat_graph->count[j] && mat_graph->which_dof[i] == mat_graph->which_dof[j] ){
3133a0ba757dSStefano Zampini         /* check for same set of sharing subdomains */
31340c7d97c5SJed Brown         same_set=PETSC_TRUE;
31350c7d97c5SJed Brown         for(k=0;k<mat_graph->count[j];k++){
3136da1bb401SStefano Zampini           if(mat_graph->neighbours_set[i][k]!=mat_graph->neighbours_set[j][k]) {
31370c7d97c5SJed Brown             same_set=PETSC_FALSE;
31380c7d97c5SJed Brown           }
31390c7d97c5SJed Brown         }
3140a0ba757dSStefano Zampini         /* I found a friend of mine */
31410c7d97c5SJed Brown         if(same_set) {
3142a0ba757dSStefano Zampini           mat_graph->where[j]=where_values;
31430c7d97c5SJed Brown           mat_graph->touched[j]=PETSC_TRUE;
31440c7d97c5SJed Brown           nodes_touched++;
31450c7d97c5SJed Brown         }
31460c7d97c5SJed Brown       }
31470c7d97c5SJed Brown     }
3148a0ba757dSStefano Zampini     where_values++;
31490c7d97c5SJed Brown   }
3150a0ba757dSStefano Zampini   where_values--; if(where_values<0) where_values=0;
3151a0ba757dSStefano Zampini   ierr = PetscMalloc(where_values*sizeof(PetscMPIInt),&mat_graph->where_ncmps);CHKERRQ(ierr);
3152a0ba757dSStefano Zampini   /* Find connected components defined on the shared interface */
3153a0ba757dSStefano Zampini   if(where_values) {
3154a0ba757dSStefano Zampini     ierr = PCBDDCFindConnectedComponents(mat_graph, where_values);
31553b03a366Sstefano_zampini     /* For consistency among neighbouring procs, I need to sort (by global ordering) each connected component */
3156a0ba757dSStefano Zampini     for(i=0;i<mat_graph->ncmps;i++) {
3157a0ba757dSStefano Zampini       ierr = ISLocalToGlobalMappingApply(matis->mapping,mat_graph->cptr[i+1]-mat_graph->cptr[i],&mat_graph->queue[mat_graph->cptr[i]],&queue_in_global_numbering[mat_graph->cptr[i]]);CHKERRQ(ierr);
3158a0ba757dSStefano Zampini       ierr = PetscSortIntWithArray(mat_graph->cptr[i+1]-mat_graph->cptr[i],&queue_in_global_numbering[mat_graph->cptr[i]],&mat_graph->queue[mat_graph->cptr[i]]);CHKERRQ(ierr);
3159a0ba757dSStefano Zampini     }
3160a0ba757dSStefano Zampini   }
3161a0ba757dSStefano Zampini   /* check consistency of connected components among neighbouring subdomains -> adapt them if needed */
3162a0ba757dSStefano Zampini   for(i=0;i<where_values;i++) {
31633b03a366Sstefano_zampini     /* We are not sure that two connected components will be the same among subdomains sharing a subset of local interface */
31643b03a366Sstefano_zampini     if(mat_graph->where_ncmps[i]>1) {
3165a0ba757dSStefano Zampini       adapt_interface=1;
3166a0ba757dSStefano Zampini       break;
3167a0ba757dSStefano Zampini     }
3168a0ba757dSStefano Zampini   }
3169a0ba757dSStefano Zampini   ierr = MPI_Allreduce(&adapt_interface,&adapt_interface_reduced,1,MPIU_INT,MPI_LOR,interface_comm);CHKERRQ(ierr);
3170da1bb401SStefano Zampini   if(pcbddc->dbg_flag && adapt_interface_reduced) {
3171da1bb401SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"Interface adapted\n");CHKERRQ(ierr);
3172da1bb401SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
3173da1bb401SStefano Zampini   }
3174a0ba757dSStefano Zampini   if(where_values && adapt_interface_reduced) {
31750c7d97c5SJed Brown 
3176a0ba757dSStefano Zampini     PetscInt sum_requests=0,my_rank;
3177a0ba757dSStefano Zampini     PetscInt buffer_size,start_of_recv,size_of_recv,start_of_send;
3178a0ba757dSStefano Zampini     PetscInt temp_buffer_size,ins_val,global_where_counter;
3179a0ba757dSStefano Zampini     PetscInt *cum_recv_counts;
3180a0ba757dSStefano Zampini     PetscInt *where_to_nodes_indices;
3181a0ba757dSStefano Zampini     PetscInt *petsc_buffer;
3182a0ba757dSStefano Zampini     PetscMPIInt *recv_buffer;
3183a0ba757dSStefano Zampini     PetscMPIInt *recv_buffer_where;
3184a0ba757dSStefano Zampini     PetscMPIInt *send_buffer;
3185a0ba757dSStefano Zampini     PetscMPIInt size_of_send;
3186a0ba757dSStefano Zampini     PetscInt *sizes_of_sends;
3187a0ba757dSStefano Zampini     MPI_Request *send_requests;
3188a0ba757dSStefano Zampini     MPI_Request *recv_requests;
3189a0ba757dSStefano Zampini     PetscInt *where_cc_adapt;
3190a0ba757dSStefano Zampini     PetscInt **temp_buffer;
3191a0ba757dSStefano Zampini     PetscInt *nodes_to_temp_buffer_indices;
3192a0ba757dSStefano Zampini     PetscInt *add_to_where;
3193a0ba757dSStefano Zampini 
3194a0ba757dSStefano Zampini     ierr = MPI_Comm_rank(interface_comm,&my_rank);CHKERRQ(ierr);
3195a0ba757dSStefano Zampini     ierr = PetscMalloc((where_values+1)*sizeof(PetscInt),&cum_recv_counts);CHKERRQ(ierr);
3196a0ba757dSStefano Zampini     ierr = PetscMemzero(cum_recv_counts,(where_values+1)*sizeof(PetscInt));CHKERRQ(ierr);
3197a0ba757dSStefano Zampini     ierr = PetscMalloc(where_values*sizeof(PetscInt),&where_to_nodes_indices);CHKERRQ(ierr);
3198a0ba757dSStefano Zampini     /* first count how many neighbours per connected component I will receive from */
3199a0ba757dSStefano Zampini     cum_recv_counts[0]=0;
3200a0ba757dSStefano Zampini     for(i=1;i<where_values+1;i++){
3201a0ba757dSStefano Zampini       j=0;
3202a0ba757dSStefano Zampini       while(mat_graph->where[j] != i) j++;
3203a0ba757dSStefano Zampini       where_to_nodes_indices[i-1]=j;
3204da1bb401SStefano Zampini       if(mat_graph->neighbours_set[j][0]!=-1) { cum_recv_counts[i]=cum_recv_counts[i-1]+mat_graph->count[j]; } /* We don't want sends/recvs_to/from_self -> here I don't count myself  */
32053b03a366Sstefano_zampini       else { cum_recv_counts[i]=cum_recv_counts[i-1]+mat_graph->count[j]-1; }
3206a0ba757dSStefano Zampini     }
3207a0ba757dSStefano Zampini     buffer_size=2*cum_recv_counts[where_values]+mat_graph->nvtxs;
3208a0ba757dSStefano Zampini     ierr = PetscMalloc(2*cum_recv_counts[where_values]*sizeof(PetscMPIInt),&recv_buffer_where);CHKERRQ(ierr);
3209a0ba757dSStefano Zampini     ierr = PetscMalloc(buffer_size*sizeof(PetscMPIInt),&send_buffer);CHKERRQ(ierr);
3210a0ba757dSStefano Zampini     ierr = PetscMalloc(cum_recv_counts[where_values]*sizeof(MPI_Request),&send_requests);CHKERRQ(ierr);
3211a0ba757dSStefano Zampini     ierr = PetscMalloc(cum_recv_counts[where_values]*sizeof(MPI_Request),&recv_requests);CHKERRQ(ierr);
3212a0ba757dSStefano Zampini     for(i=0;i<cum_recv_counts[where_values];i++) {
3213a0ba757dSStefano Zampini       send_requests[i]=MPI_REQUEST_NULL;
3214a0ba757dSStefano Zampini       recv_requests[i]=MPI_REQUEST_NULL;
3215a0ba757dSStefano Zampini     }
3216a0ba757dSStefano Zampini     /* exchange with my neighbours the number of my connected components on the shared interface */
3217a0ba757dSStefano Zampini     for(i=0;i<where_values;i++){
3218a0ba757dSStefano Zampini       j=where_to_nodes_indices[i];
3219da1bb401SStefano Zampini       k = (mat_graph->neighbours_set[j][0] == -1 ?  1 : 0);
3220a0ba757dSStefano Zampini       for(;k<mat_graph->count[j];k++){
3221da1bb401SStefano Zampini         ierr = MPI_Isend(&mat_graph->where_ncmps[i],1,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr);
3222da1bb401SStefano Zampini         ierr = MPI_Irecv(&recv_buffer_where[sum_requests],1,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr);
3223a0ba757dSStefano Zampini         sum_requests++;
3224a0ba757dSStefano Zampini       }
3225a0ba757dSStefano Zampini     }
3226a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
3227a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
3228a0ba757dSStefano Zampini     /* determine the connected component I need to adapt */
3229a0ba757dSStefano Zampini     ierr = PetscMalloc(where_values*sizeof(PetscInt),&where_cc_adapt);CHKERRQ(ierr);
3230a0ba757dSStefano Zampini     ierr = PetscMemzero(where_cc_adapt,where_values*sizeof(PetscInt));CHKERRQ(ierr);
3231a0ba757dSStefano Zampini     for(i=0;i<where_values;i++){
3232a0ba757dSStefano Zampini       for(j=cum_recv_counts[i];j<cum_recv_counts[i+1];j++){
32333b03a366Sstefano_zampini         /* The first condition is natural (i.e someone has a different number of cc than me), the second one is just to be safe */
32343b03a366Sstefano_zampini         if( mat_graph->where_ncmps[i]!=recv_buffer_where[j] || mat_graph->where_ncmps[i] > 1 ) {
3235a0ba757dSStefano Zampini           where_cc_adapt[i]=PETSC_TRUE;
3236a0ba757dSStefano Zampini           break;
3237a0ba757dSStefano Zampini         }
3238a0ba757dSStefano Zampini       }
3239a0ba757dSStefano Zampini     }
3240a0ba757dSStefano Zampini     /* now get from neighbours their ccs (in global numbering) and adapt them (in case it is needed) */
3241a0ba757dSStefano Zampini     /* first determine how much data to send (size of each queue plus the global indices) and communicate it to neighbours */
3242a0ba757dSStefano Zampini     ierr = PetscMalloc(where_values*sizeof(PetscInt),&sizes_of_sends);CHKERRQ(ierr);
3243a0ba757dSStefano Zampini     ierr = PetscMemzero(sizes_of_sends,where_values*sizeof(PetscInt));CHKERRQ(ierr);
3244a0ba757dSStefano Zampini     sum_requests=0;
3245a0ba757dSStefano Zampini     start_of_send=0;
3246a0ba757dSStefano Zampini     start_of_recv=cum_recv_counts[where_values];
3247a0ba757dSStefano Zampini     for(i=0;i<where_values;i++) {
3248a0ba757dSStefano Zampini       if(where_cc_adapt[i]) {
3249a0ba757dSStefano Zampini         size_of_send=0;
3250a0ba757dSStefano Zampini         for(j=i;j<mat_graph->ncmps;j++) {
3251a0ba757dSStefano Zampini           if(mat_graph->where[mat_graph->queue[mat_graph->cptr[j]]] == i+1) { /* WARNING -> where values goes from 1 to where_values included */
3252a0ba757dSStefano Zampini             send_buffer[start_of_send+size_of_send]=mat_graph->cptr[j+1]-mat_graph->cptr[j];
3253a0ba757dSStefano Zampini             size_of_send+=1;
3254a0ba757dSStefano Zampini             for(k=0;k<mat_graph->cptr[j+1]-mat_graph->cptr[j];k++) {
3255a0ba757dSStefano Zampini               send_buffer[start_of_send+size_of_send+k]=queue_in_global_numbering[mat_graph->cptr[j]+k];
3256a0ba757dSStefano Zampini             }
3257a0ba757dSStefano Zampini             size_of_send=size_of_send+mat_graph->cptr[j+1]-mat_graph->cptr[j];
3258a0ba757dSStefano Zampini           }
3259a0ba757dSStefano Zampini         }
3260a0ba757dSStefano Zampini         j = where_to_nodes_indices[i];
3261da1bb401SStefano Zampini         k = (mat_graph->neighbours_set[j][0] == -1 ?  1 : 0);
326211d8f4c2SStefano Zampini         sizes_of_sends[i]=size_of_send;
3263a0ba757dSStefano Zampini         for(;k<mat_graph->count[j];k++){
326411d8f4c2SStefano Zampini           ierr = MPI_Isend(&sizes_of_sends[i],1,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr);
3265da1bb401SStefano Zampini           ierr = MPI_Irecv(&recv_buffer_where[sum_requests+start_of_recv],1,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr);
3266a0ba757dSStefano Zampini           sum_requests++;
3267a0ba757dSStefano Zampini         }
3268a0ba757dSStefano Zampini         start_of_send+=size_of_send;
3269a0ba757dSStefano Zampini       }
3270a0ba757dSStefano Zampini     }
3271a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
3272a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
3273a0ba757dSStefano Zampini     buffer_size=0;
3274a0ba757dSStefano Zampini     for(k=0;k<sum_requests;k++) { buffer_size+=recv_buffer_where[start_of_recv+k]; }
3275a0ba757dSStefano Zampini     ierr = PetscMalloc(buffer_size*sizeof(PetscMPIInt),&recv_buffer);CHKERRQ(ierr);
3276a0ba757dSStefano Zampini     /* now exchange the data */
3277a0ba757dSStefano Zampini     start_of_recv=0;
3278a0ba757dSStefano Zampini     start_of_send=0;
3279a0ba757dSStefano Zampini     sum_requests=0;
3280a0ba757dSStefano Zampini     for(i=0;i<where_values;i++) {
3281a0ba757dSStefano Zampini       if(where_cc_adapt[i]) {
3282a0ba757dSStefano Zampini         size_of_send = sizes_of_sends[i];
3283a0ba757dSStefano Zampini         j = where_to_nodes_indices[i];
3284da1bb401SStefano Zampini         k = (mat_graph->neighbours_set[j][0] == -1 ?  1 : 0);
3285a0ba757dSStefano Zampini         for(;k<mat_graph->count[j];k++){
3286da1bb401SStefano Zampini           ierr = MPI_Isend(&send_buffer[start_of_send],size_of_send,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr);
3287a0ba757dSStefano Zampini           size_of_recv=recv_buffer_where[cum_recv_counts[where_values]+sum_requests];
3288da1bb401SStefano Zampini           ierr = MPI_Irecv(&recv_buffer[start_of_recv],size_of_recv,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr);
3289a0ba757dSStefano Zampini           start_of_recv+=size_of_recv;
3290a0ba757dSStefano Zampini           sum_requests++;
3291a0ba757dSStefano Zampini         }
3292a0ba757dSStefano Zampini         start_of_send+=size_of_send;
3293a0ba757dSStefano Zampini       }
3294a0ba757dSStefano Zampini     }
3295a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
3296a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
3297a0ba757dSStefano Zampini     ierr = PetscMalloc(buffer_size*sizeof(PetscInt),&petsc_buffer);CHKERRQ(ierr);
3298a0ba757dSStefano Zampini     for(k=0;k<start_of_recv;k++) { petsc_buffer[k]=(PetscInt)recv_buffer[k]; }
3299a0ba757dSStefano Zampini     for(j=0;j<buffer_size;) {
3300a0ba757dSStefano Zampini        ierr = ISGlobalToLocalMappingApply(matis->mapping,IS_GTOLM_MASK,petsc_buffer[j],&petsc_buffer[j+1],&petsc_buffer[j],&petsc_buffer[j+1]);CHKERRQ(ierr);
3301a0ba757dSStefano Zampini        k=petsc_buffer[j]+1;
3302a0ba757dSStefano Zampini        j+=k;
3303a0ba757dSStefano Zampini     }
3304a0ba757dSStefano Zampini     sum_requests=cum_recv_counts[where_values];
3305a0ba757dSStefano Zampini     start_of_recv=0;
3306a0ba757dSStefano Zampini     ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt),&nodes_to_temp_buffer_indices);CHKERRQ(ierr);
3307a0ba757dSStefano Zampini     global_where_counter=0;
3308a0ba757dSStefano Zampini     for(i=0;i<where_values;i++){
3309a0ba757dSStefano Zampini       if(where_cc_adapt[i]){
3310a0ba757dSStefano Zampini         temp_buffer_size=0;
3311a0ba757dSStefano Zampini         /* find nodes on the shared interface we need to adapt */
3312a0ba757dSStefano Zampini         for(j=0;j<mat_graph->nvtxs;j++){
3313a0ba757dSStefano Zampini           if(mat_graph->where[j]==i+1) {
3314a0ba757dSStefano Zampini             nodes_to_temp_buffer_indices[j]=temp_buffer_size;
3315a0ba757dSStefano Zampini             temp_buffer_size++;
3316a0ba757dSStefano Zampini           } else {
3317a0ba757dSStefano Zampini             nodes_to_temp_buffer_indices[j]=-1;
3318a0ba757dSStefano Zampini           }
3319a0ba757dSStefano Zampini         }
3320a0ba757dSStefano Zampini         /* allocate some temporary space */
3321a0ba757dSStefano Zampini         ierr = PetscMalloc(temp_buffer_size*sizeof(PetscInt*),&temp_buffer);CHKERRQ(ierr);
3322a0ba757dSStefano Zampini         ierr = PetscMalloc(temp_buffer_size*(cum_recv_counts[i+1]-cum_recv_counts[i])*sizeof(PetscInt),&temp_buffer[0]);CHKERRQ(ierr);
3323a0ba757dSStefano Zampini         ierr = PetscMemzero(temp_buffer[0],temp_buffer_size*(cum_recv_counts[i+1]-cum_recv_counts[i])*sizeof(PetscInt));CHKERRQ(ierr);
3324a0ba757dSStefano Zampini         for(j=1;j<temp_buffer_size;j++){
3325a0ba757dSStefano Zampini           temp_buffer[j]=temp_buffer[j-1]+cum_recv_counts[i+1]-cum_recv_counts[i];
3326a0ba757dSStefano Zampini         }
3327a0ba757dSStefano Zampini         /* analyze contributions from neighbouring subdomains for i-th conn comp
3328a0ba757dSStefano Zampini            temp buffer structure:
3329a0ba757dSStefano Zampini            supposing part of the interface has dimension 5 (global nodes 0,1,2,3,4)
3330a0ba757dSStefano Zampini            3 neighs procs with structured connected components:
3331a0ba757dSStefano Zampini              neigh 0: [0 1 4], [2 3];  (2 connected components)
3332a0ba757dSStefano Zampini              neigh 1: [0 1], [2 3 4];  (2 connected components)
3333a0ba757dSStefano Zampini              neigh 2: [0 4], [1], [2 3]; (3 connected components)
3334a0ba757dSStefano Zampini            tempbuffer (row-oriented) should be filled as:
3335a0ba757dSStefano Zampini              [ 0, 0, 0;
3336a0ba757dSStefano Zampini                0, 0, 1;
3337a0ba757dSStefano Zampini                1, 1, 2;
3338a0ba757dSStefano Zampini                1, 1, 2;
3339a0ba757dSStefano Zampini                0, 1, 0; ];
3340a0ba757dSStefano Zampini            This way we can simply recover the resulting structure account for possible intersections of ccs among neighs.
3341a0ba757dSStefano Zampini            The mat_graph->where array will be modified to reproduce the following 4 connected components [0], [1], [2 3], [4];
3342a0ba757dSStefano Zampini                                                                                                                                    */
3343a0ba757dSStefano Zampini         for(j=0;j<cum_recv_counts[i+1]-cum_recv_counts[i];j++) {
3344a0ba757dSStefano Zampini           ins_val=0;
3345a0ba757dSStefano Zampini           size_of_recv=recv_buffer_where[sum_requests];  /* total size of recv from neighs */
3346a0ba757dSStefano Zampini           for(buffer_size=0;buffer_size<size_of_recv;) {  /* loop until all data from neighs has been taken into account */
3347a0ba757dSStefano Zampini             for(k=1;k<petsc_buffer[buffer_size+start_of_recv]+1;k++) { /* filling properly temp_buffer using data from a single recv */
3348a0ba757dSStefano Zampini               temp_buffer[ nodes_to_temp_buffer_indices[ petsc_buffer[ start_of_recv+buffer_size+k ] ] ][j]=ins_val;
3349a0ba757dSStefano Zampini             }
3350a0ba757dSStefano Zampini             buffer_size+=k;
3351a0ba757dSStefano Zampini             ins_val++;
3352a0ba757dSStefano Zampini           }
3353a0ba757dSStefano Zampini           start_of_recv+=size_of_recv;
3354a0ba757dSStefano Zampini           sum_requests++;
3355a0ba757dSStefano Zampini         }
3356a0ba757dSStefano Zampini         ierr = PetscMalloc(temp_buffer_size*sizeof(PetscInt),&add_to_where);CHKERRQ(ierr);
3357a0ba757dSStefano Zampini         ierr = PetscMemzero(add_to_where,temp_buffer_size*sizeof(PetscInt));CHKERRQ(ierr);
3358a0ba757dSStefano Zampini         for(j=0;j<temp_buffer_size;j++){
3359a0ba757dSStefano Zampini           if(!add_to_where[j]){ /* found a new cc  */
3360a0ba757dSStefano Zampini             global_where_counter++;
3361a0ba757dSStefano Zampini             add_to_where[j]=global_where_counter;
3362a0ba757dSStefano Zampini             for(k=j+1;k<temp_buffer_size;k++){ /* check for other nodes in new cc */
3363a0ba757dSStefano Zampini               same_set=PETSC_TRUE;
3364a0ba757dSStefano Zampini               for(s=0;s<cum_recv_counts[i+1]-cum_recv_counts[i];s++){
3365a0ba757dSStefano Zampini                 if(temp_buffer[j][s]!=temp_buffer[k][s]) {
3366a0ba757dSStefano Zampini                   same_set=PETSC_FALSE;
3367a0ba757dSStefano Zampini                   break;
3368a0ba757dSStefano Zampini                 }
3369a0ba757dSStefano Zampini               }
3370a0ba757dSStefano Zampini               if(same_set) add_to_where[k]=global_where_counter;
3371a0ba757dSStefano Zampini             }
3372a0ba757dSStefano Zampini           }
3373a0ba757dSStefano Zampini         }
3374a0ba757dSStefano Zampini         /* insert new data in where array */
3375a0ba757dSStefano Zampini         temp_buffer_size=0;
3376a0ba757dSStefano Zampini         for(j=0;j<mat_graph->nvtxs;j++){
3377a0ba757dSStefano Zampini           if(mat_graph->where[j]==i+1) {
3378a0ba757dSStefano Zampini             mat_graph->where[j]=where_values+add_to_where[temp_buffer_size];
3379a0ba757dSStefano Zampini             temp_buffer_size++;
3380a0ba757dSStefano Zampini           }
3381a0ba757dSStefano Zampini         }
3382a0ba757dSStefano Zampini         ierr = PetscFree(temp_buffer[0]);CHKERRQ(ierr);
3383a0ba757dSStefano Zampini         ierr = PetscFree(temp_buffer);CHKERRQ(ierr);
3384a0ba757dSStefano Zampini         ierr = PetscFree(add_to_where);CHKERRQ(ierr);
3385a0ba757dSStefano Zampini       }
3386a0ba757dSStefano Zampini     }
3387a0ba757dSStefano Zampini     ierr = PetscFree(nodes_to_temp_buffer_indices);CHKERRQ(ierr);
3388a0ba757dSStefano Zampini     ierr = PetscFree(sizes_of_sends);CHKERRQ(ierr);
3389a0ba757dSStefano Zampini     ierr = PetscFree(send_requests);CHKERRQ(ierr);
3390a0ba757dSStefano Zampini     ierr = PetscFree(recv_requests);CHKERRQ(ierr);
3391a0ba757dSStefano Zampini     ierr = PetscFree(petsc_buffer);CHKERRQ(ierr);
3392a0ba757dSStefano Zampini     ierr = PetscFree(recv_buffer);CHKERRQ(ierr);
3393a0ba757dSStefano Zampini     ierr = PetscFree(recv_buffer_where);CHKERRQ(ierr);
3394a0ba757dSStefano Zampini     ierr = PetscFree(send_buffer);CHKERRQ(ierr);
3395a0ba757dSStefano Zampini     ierr = PetscFree(cum_recv_counts);CHKERRQ(ierr);
3396a0ba757dSStefano Zampini     ierr = PetscFree(where_to_nodes_indices);CHKERRQ(ierr);
3397a0ba757dSStefano Zampini     /* We are ready to evaluate consistent connected components on each part of the shared interface */
3398a0ba757dSStefano Zampini     if(global_where_counter) {
3399a0ba757dSStefano Zampini       for(i=0;i<mat_graph->nvtxs;i++){ mat_graph->touched[i]=PETSC_FALSE; }
3400a0ba757dSStefano Zampini       global_where_counter=0;
3401a0ba757dSStefano Zampini       for(i=0;i<mat_graph->nvtxs;i++){
3402a0ba757dSStefano Zampini         if(mat_graph->where[i] && !mat_graph->touched[i]) {
3403a0ba757dSStefano Zampini           global_where_counter++;
3404a0ba757dSStefano Zampini           for(j=i+1;j<mat_graph->nvtxs;j++){
3405a0ba757dSStefano Zampini             if(!mat_graph->touched[j] && mat_graph->where[j]==mat_graph->where[i]) {
3406a0ba757dSStefano Zampini               mat_graph->where[j]=global_where_counter;
3407a0ba757dSStefano Zampini               mat_graph->touched[j]=PETSC_TRUE;
3408a0ba757dSStefano Zampini             }
3409a0ba757dSStefano Zampini           }
3410a0ba757dSStefano Zampini           mat_graph->where[i]=global_where_counter;
3411a0ba757dSStefano Zampini           mat_graph->touched[i]=PETSC_TRUE;
3412a0ba757dSStefano Zampini         }
3413a0ba757dSStefano Zampini       }
3414a0ba757dSStefano Zampini       where_values=global_where_counter;
3415a0ba757dSStefano Zampini     }
3416a0ba757dSStefano Zampini     if(global_where_counter) {
3417a0ba757dSStefano Zampini       ierr = PetscMemzero(mat_graph->cptr,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr);
3418a0ba757dSStefano Zampini       ierr = PetscMemzero(mat_graph->queue,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
3419a0ba757dSStefano Zampini       ierr = PetscFree(mat_graph->where_ncmps);CHKERRQ(ierr);
3420a0ba757dSStefano Zampini       ierr = PetscMalloc(where_values*sizeof(PetscMPIInt),&mat_graph->where_ncmps);CHKERRQ(ierr);
3421a0ba757dSStefano Zampini       ierr = PCBDDCFindConnectedComponents(mat_graph, where_values);
3422a0ba757dSStefano Zampini       for(i=0;i<mat_graph->ncmps;i++) {
3423a0ba757dSStefano Zampini         ierr = ISLocalToGlobalMappingApply(matis->mapping,mat_graph->cptr[i+1]-mat_graph->cptr[i],&mat_graph->queue[mat_graph->cptr[i]],&queue_in_global_numbering[mat_graph->cptr[i]]);CHKERRQ(ierr);
3424a0ba757dSStefano Zampini         ierr = PetscSortIntWithArray(mat_graph->cptr[i+1]-mat_graph->cptr[i],&queue_in_global_numbering[mat_graph->cptr[i]],&mat_graph->queue[mat_graph->cptr[i]]);CHKERRQ(ierr);
3425a0ba757dSStefano Zampini       }
3426a0ba757dSStefano Zampini     }
34273b03a366Sstefano_zampini   } /* Finished adapting interface */
34280c7d97c5SJed Brown   PetscInt nfc=0;
34290c7d97c5SJed Brown   PetscInt nec=0;
34300c7d97c5SJed Brown   PetscInt nvc=0;
34313b03a366Sstefano_zampini   PetscBool twodim_flag=PETSC_FALSE;
34320c7d97c5SJed Brown   for (i=0; i<mat_graph->ncmps; i++) {
34333b03a366Sstefano_zampini     if( mat_graph->cptr[i+1]-mat_graph->cptr[i] > vertex_size ){
3434*534831adSStefano Zampini       if(mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]==1){ /* 1 neigh Neumann fake included */
34350c7d97c5SJed Brown         nfc++;
34363b03a366Sstefano_zampini       } else { /* note that nec will be zero in 2d */
34373b03a366Sstefano_zampini         nec++;
34383b03a366Sstefano_zampini       }
34390c7d97c5SJed Brown     } else {
34403b03a366Sstefano_zampini       nvc+=mat_graph->cptr[i+1]-mat_graph->cptr[i];
34413b03a366Sstefano_zampini     }
34423b03a366Sstefano_zampini   }
34433b03a366Sstefano_zampini 
34443b03a366Sstefano_zampini   if(!nec) { /* we are in a 2d case -> no faces, only edges */
34453b03a366Sstefano_zampini     nec = nfc;
34463b03a366Sstefano_zampini     nfc = 0;
34473b03a366Sstefano_zampini     twodim_flag = PETSC_TRUE;
34483b03a366Sstefano_zampini   }
34493b03a366Sstefano_zampini   /* allocate IS arrays for faces, edges. Vertices need a single index set.
34503b03a366Sstefano_zampini      Reusing space allocated in mat_graph->where for creating IS objects */
34513b03a366Sstefano_zampini   if(!pcbddc->vertices_flag && !pcbddc->edges_flag) {
34523b03a366Sstefano_zampini     ierr = PetscMalloc(nfc*sizeof(IS),&pcbddc->ISForFaces);CHKERRQ(ierr);
34533b03a366Sstefano_zampini     use_faces=PETSC_TRUE;
34543b03a366Sstefano_zampini   }
34553b03a366Sstefano_zampini   if(!pcbddc->vertices_flag && !pcbddc->faces_flag) {
34563b03a366Sstefano_zampini     ierr = PetscMalloc(nec*sizeof(IS),&pcbddc->ISForEdges);CHKERRQ(ierr);
34573b03a366Sstefano_zampini     use_edges=PETSC_TRUE;
34583b03a366Sstefano_zampini   }
34593b03a366Sstefano_zampini   nfc=0;
34603b03a366Sstefano_zampini   nec=0;
34613b03a366Sstefano_zampini   for (i=0; i<mat_graph->ncmps; i++) {
34623b03a366Sstefano_zampini     if( mat_graph->cptr[i+1]-mat_graph->cptr[i] > vertex_size ){
34633b03a366Sstefano_zampini       for(j=0;j<mat_graph->cptr[i+1]-mat_graph->cptr[i];j++) {
34643b03a366Sstefano_zampini         mat_graph->where[j]=mat_graph->queue[mat_graph->cptr[i]+j];
34653b03a366Sstefano_zampini       }
34663b03a366Sstefano_zampini       if(mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]==1){
34673b03a366Sstefano_zampini         if(twodim_flag) {
34683b03a366Sstefano_zampini           if(use_edges) {
34693b03a366Sstefano_zampini             ierr = ISCreateGeneral(PETSC_COMM_SELF,j,mat_graph->where,PETSC_COPY_VALUES,&pcbddc->ISForEdges[nec]);CHKERRQ(ierr);
34703b03a366Sstefano_zampini             nec++;
34713b03a366Sstefano_zampini           }
34723b03a366Sstefano_zampini         } else {
34733b03a366Sstefano_zampini           if(use_faces) {
34743b03a366Sstefano_zampini             ierr = ISCreateGeneral(PETSC_COMM_SELF,j,mat_graph->where,PETSC_COPY_VALUES,&pcbddc->ISForFaces[nfc]);CHKERRQ(ierr);
34753b03a366Sstefano_zampini             nfc++;
34763b03a366Sstefano_zampini           }
34773b03a366Sstefano_zampini         }
34783b03a366Sstefano_zampini       } else {
34793b03a366Sstefano_zampini         if(use_edges) {
34803b03a366Sstefano_zampini           ierr = ISCreateGeneral(PETSC_COMM_SELF,j,mat_graph->where,PETSC_COPY_VALUES,&pcbddc->ISForEdges[nec]);CHKERRQ(ierr);
34810c7d97c5SJed Brown           nec++;
34820c7d97c5SJed Brown         }
34830c7d97c5SJed Brown       }
34840c7d97c5SJed Brown     }
34853b03a366Sstefano_zampini   }
34863b03a366Sstefano_zampini   pcbddc->n_ISForFaces=nfc;
34873b03a366Sstefano_zampini   pcbddc->n_ISForEdges=nec;
34883b03a366Sstefano_zampini   nvc=0;
34890c7d97c5SJed Brown   if( !pcbddc->constraints_flag ) {
34903b03a366Sstefano_zampini     for (i=0; i<mat_graph->ncmps; i++) {
34913b03a366Sstefano_zampini       if( mat_graph->cptr[i+1]-mat_graph->cptr[i] <= vertex_size ){
34923b03a366Sstefano_zampini         for( j=mat_graph->cptr[i];j<mat_graph->cptr[i+1];j++) {
34933b03a366Sstefano_zampini           mat_graph->where[nvc]=mat_graph->queue[j];
34940c7d97c5SJed Brown           nvc++;
34950c7d97c5SJed Brown         }
34960c7d97c5SJed Brown       }
34970c7d97c5SJed Brown     }
34980c7d97c5SJed Brown   }
3499a0ba757dSStefano Zampini   /* sort vertex set (by local ordering) */
35003b03a366Sstefano_zampini   ierr = PetscSortInt(nvc,mat_graph->where);CHKERRQ(ierr);
35013b03a366Sstefano_zampini   ierr = ISCreateGeneral(PETSC_COMM_SELF,nvc,mat_graph->where,PETSC_COPY_VALUES,&pcbddc->ISForVertices);CHKERRQ(ierr);
35020c7d97c5SJed Brown 
3503e269702eSStefano Zampini   if(pcbddc->dbg_flag) {
3504e269702eSStefano Zampini 
3505d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr);
3506d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Details from PCBDDCManageLocalBoundaries for subdomain %04d\n",PetscGlobalRank);CHKERRQ(ierr);
3507d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr);
3508a0ba757dSStefano Zampini /*    ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Graph (adjacency structure) of local Neumann mat\n");CHKERRQ(ierr);
3509a0ba757dSStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr);
3510e269702eSStefano Zampini     for(i=0;i<mat_graph->nvtxs;i++) {
3511a0ba757dSStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Nodes connected to node number %d are %d\n",i,mat_graph->xadj[i+1]-mat_graph->xadj[i]);CHKERRQ(ierr);
3512e269702eSStefano Zampini       for(j=mat_graph->xadj[i];j<mat_graph->xadj[i+1];j++){
3513a0ba757dSStefano Zampini         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d ",mat_graph->adjncy[j]);CHKERRQ(ierr);
3514e269702eSStefano Zampini       }
3515a0ba757dSStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n--------------------------------------------------------------\n");CHKERRQ(ierr);
3516da1bb401SStefano Zampini     }*/
3517d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Matrix graph has %d connected components", mat_graph->ncmps);CHKERRQ(ierr);
35180c7d97c5SJed Brown     for(i=0;i<mat_graph->ncmps;i++) {
35193b03a366Sstefano_zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\nDetails for connected component number %02d: size %04d, count %01d. Nodes follow.\n",
35203b03a366Sstefano_zampini              i,mat_graph->cptr[i+1]-mat_graph->cptr[i],mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]);CHKERRQ(ierr);
3521da1bb401SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"subdomains: ");
3522da1bb401SStefano Zampini       for (j=0;j<mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]; j++) {
3523da1bb401SStefano Zampini         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d ",mat_graph->neighbours_set[mat_graph->queue[mat_graph->cptr[i]]][j]);
3524da1bb401SStefano Zampini       }
3525da1bb401SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n");
35260c7d97c5SJed Brown       for (j=mat_graph->cptr[i]; j<mat_graph->cptr[i+1]; j++){
3527da1bb401SStefano Zampini         /* ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d (%d), ",queue_in_global_numbering[j],mat_graph->queue[j]);CHKERRQ(ierr); */
3528da1bb401SStefano Zampini         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d, ",mat_graph->queue[j]);CHKERRQ(ierr);
35290c7d97c5SJed Brown       }
35300c7d97c5SJed Brown     }
3531da1bb401SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n--------------------------------------------------------------\n");CHKERRQ(ierr);
35323b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local vertices\n",PetscGlobalRank,nvc);CHKERRQ(ierr);
35333b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local faces\n",PetscGlobalRank,nfc);CHKERRQ(ierr);
35343b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local edges\n",PetscGlobalRank,nec);CHKERRQ(ierr);
3535d49ef151SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
35360c7d97c5SJed Brown   }
35370c7d97c5SJed Brown 
3538a0ba757dSStefano Zampini   /* Free graph structure */
35390c7d97c5SJed Brown   if(mat_graph->nvtxs){
3540a0ba757dSStefano Zampini     ierr = PetscFree4(mat_graph->where,mat_graph->count,mat_graph->cptr,mat_graph->queue);CHKERRQ(ierr);
3541a0ba757dSStefano Zampini     ierr = PetscFree3(mat_graph->which_dof,mat_graph->touched,queue_in_global_numbering);CHKERRQ(ierr);
3542a0ba757dSStefano Zampini     ierr = PetscFree(mat_graph->where_ncmps);CHKERRQ(ierr);
35430c7d97c5SJed Brown   }
35440c7d97c5SJed Brown 
35450c7d97c5SJed Brown   PetscFunctionReturn(0);
35460c7d97c5SJed Brown 
35470c7d97c5SJed Brown }
35480c7d97c5SJed Brown 
35490c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
35500c7d97c5SJed Brown 
35510c7d97c5SJed Brown /* The following code has been adapted from function IsConnectedSubdomain contained
3552da1bb401SStefano Zampini    in source file contig.c of METIS library (version 5.0.1)
3553da1bb401SStefano Zampini    It finds connected components of each partition labeled from 1 to n_dist  */
35540c7d97c5SJed Brown 
35550c7d97c5SJed Brown #undef __FUNCT__
35560c7d97c5SJed Brown #define __FUNCT__ "PCBDDCFindConnectedComponents"
35579c0446d6SStefano Zampini static PetscErrorCode PCBDDCFindConnectedComponents(PCBDDCGraph graph, PetscInt n_dist )
35580c7d97c5SJed Brown {
35590c7d97c5SJed Brown   PetscInt i, j, k, nvtxs, first, last, nleft, ncmps,pid,cum_queue,n,ncmps_pid;
35600c7d97c5SJed Brown   PetscInt *xadj, *adjncy, *where, *queue;
35610c7d97c5SJed Brown   PetscInt *cptr;
35620c7d97c5SJed Brown   PetscBool *touched;
35630c7d97c5SJed Brown 
35640c7d97c5SJed Brown   PetscFunctionBegin;
35650c7d97c5SJed Brown 
35660c7d97c5SJed Brown   nvtxs   = graph->nvtxs;
35670c7d97c5SJed Brown   xadj    = graph->xadj;
35680c7d97c5SJed Brown   adjncy  = graph->adjncy;
35690c7d97c5SJed Brown   where   = graph->where;
35700c7d97c5SJed Brown   touched = graph->touched;
35710c7d97c5SJed Brown   queue   = graph->queue;
35720c7d97c5SJed Brown   cptr    = graph->cptr;
35730c7d97c5SJed Brown 
35740c7d97c5SJed Brown   for (i=0; i<nvtxs; i++)
35750c7d97c5SJed Brown     touched[i] = PETSC_FALSE;
35760c7d97c5SJed Brown 
35770c7d97c5SJed Brown   cum_queue=0;
35780c7d97c5SJed Brown   ncmps=0;
35790c7d97c5SJed Brown 
35800c7d97c5SJed Brown   for(n=0; n<n_dist; n++) {
3581da1bb401SStefano Zampini     pid = n+1;  /* partition labeled by 0 is discarded */
35820c7d97c5SJed Brown     nleft = 0;
35830c7d97c5SJed Brown     for (i=0; i<nvtxs; i++) {
35840c7d97c5SJed Brown       if (where[i] == pid)
35850c7d97c5SJed Brown         nleft++;
35860c7d97c5SJed Brown     }
35870c7d97c5SJed Brown     for (i=0; i<nvtxs; i++) {
35880c7d97c5SJed Brown       if (where[i] == pid)
35890c7d97c5SJed Brown         break;
35900c7d97c5SJed Brown     }
35910c7d97c5SJed Brown     touched[i] = PETSC_TRUE;
35920c7d97c5SJed Brown     queue[cum_queue] = i;
35930c7d97c5SJed Brown     first = 0; last = 1;
35940c7d97c5SJed Brown     cptr[ncmps] = cum_queue;  /* This actually points to queue */
35950c7d97c5SJed Brown     ncmps_pid = 0;
35960c7d97c5SJed Brown     while (first != nleft) {
35970c7d97c5SJed Brown       if (first == last) { /* Find another starting vertex */
35980c7d97c5SJed Brown         cptr[++ncmps] = first+cum_queue;
35990c7d97c5SJed Brown         ncmps_pid++;
36000c7d97c5SJed Brown         for (i=0; i<nvtxs; i++) {
36010c7d97c5SJed Brown           if (where[i] == pid && !touched[i])
36020c7d97c5SJed Brown             break;
36030c7d97c5SJed Brown         }
36040c7d97c5SJed Brown         queue[cum_queue+last] = i;
36050c7d97c5SJed Brown         last++;
36060c7d97c5SJed Brown         touched[i] = PETSC_TRUE;
36070c7d97c5SJed Brown       }
36080c7d97c5SJed Brown       i = queue[cum_queue+first];
36090c7d97c5SJed Brown       first++;
36100c7d97c5SJed Brown       for (j=xadj[i]; j<xadj[i+1]; j++) {
36110c7d97c5SJed Brown         k = adjncy[j];
36120c7d97c5SJed Brown         if (where[k] == pid && !touched[k]) {
36130c7d97c5SJed Brown           queue[cum_queue+last] = k;
36140c7d97c5SJed Brown           last++;
36150c7d97c5SJed Brown           touched[k] = PETSC_TRUE;
36160c7d97c5SJed Brown         }
36170c7d97c5SJed Brown       }
36180c7d97c5SJed Brown     }
36190c7d97c5SJed Brown     cptr[++ncmps] = first+cum_queue;
36200c7d97c5SJed Brown     ncmps_pid++;
36210c7d97c5SJed Brown     cum_queue=cptr[ncmps];
3622a0ba757dSStefano Zampini     graph->where_ncmps[n] = ncmps_pid;
36230c7d97c5SJed Brown   }
36240c7d97c5SJed Brown   graph->ncmps = ncmps;
36250c7d97c5SJed Brown 
36260c7d97c5SJed Brown   PetscFunctionReturn(0);
36270c7d97c5SJed Brown }
36280c7d97c5SJed Brown 
3629