xref: /petsc/src/ksp/pc/impls/bddc/bddc.c (revision 57a90dec2a89c5037cc64833d7e3012e5a502dc3)
/* TODOLIST
   DofSplitting and DM attached to pc?
   Change SetNeumannBoundaries to SetNeumannBoundariesLocal and provide new SetNeumannBoundaries (same for Dirichlet)
   Exact solvers: Solve local saddle point directly
     - change prec_type to switch_inexact_prec_type
     - add bool solve_exact_saddle_point slot to pcbddc data
   Inexact solvers: global preconditioner application is ready, ask the developers (Jed?) how to best implement Dohrmann's approach (PCSHELL?)
   change how to deal with the coarse problem (PCBDDCSetCoarseEnvironment):
     - mind the problem with coarsening_factor
     - simplify coarse problem structure -> PCBDDC or PCREDUNDANT, nothing else -> same comm for all levels?
     - remove coarse enums and allow use of PCBDDCGetCoarseKSP
     - remove metis dependency -> use MatPartitioning for multilevel -> Assemble serial adjacency in ManageLocalBoundaries?
     - Add levels' slot to bddc data structure and associated Set/Get functions
   code refactoring:
     - pick better names for static functions
   change options structure:
     - insert BDDC into MG framework?
   provide other ops? Ask the developers
   remove all unused printf
   man pages
*/
220c7d97c5SJed Brown 
2353cdbc3dSStefano Zampini /* ----------------------------------------------------------------------------------------------------------------------------------------------
240c7d97c5SJed Brown    Implementation of BDDC preconditioner based on:
250c7d97c5SJed Brown    C. Dohrmann "An approximate BDDC preconditioner", Numerical Linear Algebra with Applications Volume 14, Issue 2, pages 149-168, March 2007
2653cdbc3dSStefano Zampini    ---------------------------------------------------------------------------------------------------------------------------------------------- */
2753cdbc3dSStefano Zampini 
2853cdbc3dSStefano Zampini #include "bddc.h" /*I "petscpc.h" I*/  /* includes for fortran wrappers */
293b03a366Sstefano_zampini #include <petscblaslapack.h>
300c7d97c5SJed Brown 
310c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
320c7d97c5SJed Brown #undef __FUNCT__
330c7d97c5SJed Brown #define __FUNCT__ "PCSetFromOptions_BDDC"
340c7d97c5SJed Brown PetscErrorCode PCSetFromOptions_BDDC(PC pc)
350c7d97c5SJed Brown {
360c7d97c5SJed Brown   PC_BDDC         *pcbddc = (PC_BDDC*)pc->data;
370c7d97c5SJed Brown   PetscErrorCode ierr;
380c7d97c5SJed Brown 
390c7d97c5SJed Brown   PetscFunctionBegin;
400c7d97c5SJed Brown   ierr = PetscOptionsHead("BDDC options");CHKERRQ(ierr);
410c7d97c5SJed Brown   /* Verbose debugging of main data structures */
42e269702eSStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_check_all"       ,"Verbose (debugging) output for PCBDDC"                       ,"none",pcbddc->dbg_flag      ,&pcbddc->dbg_flag      ,PETSC_NULL);CHKERRQ(ierr);
430c7d97c5SJed Brown   /* Some customization for default primal space */
44da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_vertices_only"   ,"Use only vertices in coarse space (i.e. discard constraints)","none",pcbddc->vertices_flag   ,&pcbddc->vertices_flag   ,PETSC_NULL);CHKERRQ(ierr);
45da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_constraints_only","Use only constraints in coarse space (i.e. discard vertices)","none",pcbddc->constraints_flag,&pcbddc->constraints_flag,PETSC_NULL);CHKERRQ(ierr);
46da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_faces_only"      ,"Use only faces among constraints of coarse space (i.e. discard edges)"         ,"none",pcbddc->faces_flag      ,&pcbddc->faces_flag      ,PETSC_NULL);CHKERRQ(ierr);
47da1bb401SStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_edges_only"      ,"Use only edges among constraints of coarse space (i.e. discard faces)"         ,"none",pcbddc->edges_flag      ,&pcbddc->edges_flag      ,PETSC_NULL);CHKERRQ(ierr);
480c7d97c5SJed Brown   /* Coarse solver context */
49da1bb401SStefano Zampini   static const char *avail_coarse_problems[] = {"sequential","replicated","parallel","multilevel",""}; /*order of choiches depends on ENUM defined in bddc.h */
500c7d97c5SJed Brown   ierr = PetscOptionsEnum("-pc_bddc_coarse_problem_type","Set coarse problem type","none",avail_coarse_problems,(PetscEnum)pcbddc->coarse_problem_type,(PetscEnum*)&pcbddc->coarse_problem_type,PETSC_NULL);CHKERRQ(ierr);
510c7d97c5SJed Brown   /* Two different application of BDDC to the whole set of dofs, internal and interface */
520c7d97c5SJed Brown   ierr = PetscOptionsBool("-pc_bddc_switch_preconditioning_type","Switch between M_2 (default) and M_3 preconditioners (as defined by Dohrmann)","none",pcbddc->prec_type,&pcbddc->prec_type,PETSC_NULL);CHKERRQ(ierr);
53534831adSStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_use_change_of_basis","Use change of basis approach for primal space","none",pcbddc->usechangeofbasis,&pcbddc->usechangeofbasis,PETSC_NULL);CHKERRQ(ierr);
54534831adSStefano Zampini   ierr = PetscOptionsBool("-pc_bddc_use_change_on_faces","Use change of basis approach for face constraints","none",pcbddc->usechangeonfaces,&pcbddc->usechangeonfaces,PETSC_NULL);CHKERRQ(ierr);
55534831adSStefano Zampini   pcbddc->usechangeonfaces = pcbddc->usechangeonfaces && pcbddc->usechangeofbasis;
560c7d97c5SJed Brown   ierr = PetscOptionsInt("-pc_bddc_coarsening_ratio","Set coarsening ratio used in multilevel coarsening","none",pcbddc->coarsening_ratio,&pcbddc->coarsening_ratio,PETSC_NULL);CHKERRQ(ierr);
570c7d97c5SJed Brown   ierr = PetscOptionsTail();CHKERRQ(ierr);
580c7d97c5SJed Brown   PetscFunctionReturn(0);
590c7d97c5SJed Brown }
600c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
610c7d97c5SJed Brown EXTERN_C_BEGIN
620c7d97c5SJed Brown #undef __FUNCT__
630c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetCoarseProblemType_BDDC"
6453cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetCoarseProblemType_BDDC(PC pc, CoarseProblemType CPT)
650c7d97c5SJed Brown {
660c7d97c5SJed Brown   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
670c7d97c5SJed Brown 
680c7d97c5SJed Brown   PetscFunctionBegin;
690c7d97c5SJed Brown   pcbddc->coarse_problem_type = CPT;
700c7d97c5SJed Brown   PetscFunctionReturn(0);
710c7d97c5SJed Brown }
720c7d97c5SJed Brown EXTERN_C_END
730c7d97c5SJed Brown #undef __FUNCT__
740c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetCoarseProblemType"
7553cdbc3dSStefano Zampini /*@
769c0446d6SStefano Zampini  PCBDDCSetCoarseProblemType - Set coarse problem type in PCBDDC.
7753cdbc3dSStefano Zampini 
789c0446d6SStefano Zampini    Not collective
7953cdbc3dSStefano Zampini 
8053cdbc3dSStefano Zampini    Input Parameters:
8153cdbc3dSStefano Zampini +  pc - the preconditioning context
8253cdbc3dSStefano Zampini -  CoarseProblemType - pick a better name and explain what this is
8353cdbc3dSStefano Zampini 
8453cdbc3dSStefano Zampini    Level: intermediate
8553cdbc3dSStefano Zampini 
8653cdbc3dSStefano Zampini    Notes:
87da1bb401SStefano Zampini    Not collective but all procs must call with same arguments.
8853cdbc3dSStefano Zampini 
8953cdbc3dSStefano Zampini .seealso: PCBDDC
9053cdbc3dSStefano Zampini @*/
910c7d97c5SJed Brown PetscErrorCode PCBDDCSetCoarseProblemType(PC pc, CoarseProblemType CPT)
920c7d97c5SJed Brown {
930c7d97c5SJed Brown   PetscErrorCode ierr;
940c7d97c5SJed Brown 
950c7d97c5SJed Brown   PetscFunctionBegin;
960c7d97c5SJed Brown   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
970c7d97c5SJed Brown   ierr = PetscTryMethod(pc,"PCBDDCSetCoarseProblemType_C",(PC,CoarseProblemType),(pc,CPT));CHKERRQ(ierr);
980c7d97c5SJed Brown   PetscFunctionReturn(0);
990c7d97c5SJed Brown }
1000c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
1010c7d97c5SJed Brown EXTERN_C_BEGIN
1020c7d97c5SJed Brown #undef __FUNCT__
1033b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCSetDirichletBoundaries_BDDC"
1043b03a366Sstefano_zampini static PetscErrorCode PCBDDCSetDirichletBoundaries_BDDC(PC pc,IS DirichletBoundaries)
1053b03a366Sstefano_zampini {
1063b03a366Sstefano_zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
1073b03a366Sstefano_zampini   PetscErrorCode ierr;
1083b03a366Sstefano_zampini 
1093b03a366Sstefano_zampini   PetscFunctionBegin;
1103b03a366Sstefano_zampini   ierr = ISDestroy(&pcbddc->DirichletBoundaries);CHKERRQ(ierr);
11136e030ebSStefano Zampini   ierr = PetscObjectReference((PetscObject)DirichletBoundaries);CHKERRQ(ierr);
11236e030ebSStefano Zampini   pcbddc->DirichletBoundaries=DirichletBoundaries;
1133b03a366Sstefano_zampini   PetscFunctionReturn(0);
1143b03a366Sstefano_zampini }
1153b03a366Sstefano_zampini EXTERN_C_END
1163b03a366Sstefano_zampini #undef __FUNCT__
1173b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCSetDirichletBoundaries"
1183b03a366Sstefano_zampini /*@
119da1bb401SStefano Zampini  PCBDDCSetDirichletBoundaries - Set index set defining subdomain part (in local ordering)
120da1bb401SStefano Zampini                               of Dirichlet boundaries for the global problem.
1213b03a366Sstefano_zampini 
1223b03a366Sstefano_zampini    Not collective
1233b03a366Sstefano_zampini 
1243b03a366Sstefano_zampini    Input Parameters:
1253b03a366Sstefano_zampini +  pc - the preconditioning context
1263b03a366Sstefano_zampini -  DirichletBoundaries - sequential index set defining the subdomain part of Dirichlet boundaries (can be PETSC_NULL)
1273b03a366Sstefano_zampini 
1283b03a366Sstefano_zampini    Level: intermediate
1293b03a366Sstefano_zampini 
1303b03a366Sstefano_zampini    Notes:
1313b03a366Sstefano_zampini 
1323b03a366Sstefano_zampini .seealso: PCBDDC
1333b03a366Sstefano_zampini @*/
1343b03a366Sstefano_zampini PetscErrorCode PCBDDCSetDirichletBoundaries(PC pc,IS DirichletBoundaries)
1353b03a366Sstefano_zampini {
1363b03a366Sstefano_zampini   PetscErrorCode ierr;
1373b03a366Sstefano_zampini 
1383b03a366Sstefano_zampini   PetscFunctionBegin;
1393b03a366Sstefano_zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
1403b03a366Sstefano_zampini   ierr = PetscTryMethod(pc,"PCBDDCSetDirichletBoundaries_C",(PC,IS),(pc,DirichletBoundaries));CHKERRQ(ierr);
1413b03a366Sstefano_zampini   PetscFunctionReturn(0);
1423b03a366Sstefano_zampini }
1433b03a366Sstefano_zampini /* -------------------------------------------------------------------------- */
1443b03a366Sstefano_zampini EXTERN_C_BEGIN
1453b03a366Sstefano_zampini #undef __FUNCT__
1460c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetNeumannBoundaries_BDDC"
14753cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetNeumannBoundaries_BDDC(PC pc,IS NeumannBoundaries)
1480c7d97c5SJed Brown {
1490c7d97c5SJed Brown   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
15053cdbc3dSStefano Zampini   PetscErrorCode ierr;
1510c7d97c5SJed Brown 
1520c7d97c5SJed Brown   PetscFunctionBegin;
15353cdbc3dSStefano Zampini   ierr = ISDestroy(&pcbddc->NeumannBoundaries);CHKERRQ(ierr);
15436e030ebSStefano Zampini   ierr = PetscObjectReference((PetscObject)NeumannBoundaries);CHKERRQ(ierr);
15536e030ebSStefano Zampini   pcbddc->NeumannBoundaries=NeumannBoundaries;
1560c7d97c5SJed Brown   PetscFunctionReturn(0);
1570c7d97c5SJed Brown }
1580c7d97c5SJed Brown EXTERN_C_END
1590c7d97c5SJed Brown #undef __FUNCT__
1600c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetNeumannBoundaries"
16157527edcSJed Brown /*@
162da1bb401SStefano Zampini  PCBDDCSetNeumannBoundaries - Set index set defining subdomain part (in local ordering)
163da1bb401SStefano Zampini                               of Neumann boundaries for the global problem.
16457527edcSJed Brown 
1659c0446d6SStefano Zampini    Not collective
16657527edcSJed Brown 
16757527edcSJed Brown    Input Parameters:
16857527edcSJed Brown +  pc - the preconditioning context
1699c0446d6SStefano Zampini -  NeumannBoundaries - sequential index set defining the subdomain part of Neumann boundaries (can be PETSC_NULL)
17057527edcSJed Brown 
17157527edcSJed Brown    Level: intermediate
17257527edcSJed Brown 
17357527edcSJed Brown    Notes:
17457527edcSJed Brown 
17557527edcSJed Brown .seealso: PCBDDC
17657527edcSJed Brown @*/
17753cdbc3dSStefano Zampini PetscErrorCode PCBDDCSetNeumannBoundaries(PC pc,IS NeumannBoundaries)
1780c7d97c5SJed Brown {
1790c7d97c5SJed Brown   PetscErrorCode ierr;
1800c7d97c5SJed Brown 
1810c7d97c5SJed Brown   PetscFunctionBegin;
1820c7d97c5SJed Brown   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
18353cdbc3dSStefano Zampini   ierr = PetscTryMethod(pc,"PCBDDCSetNeumannBoundaries_C",(PC,IS),(pc,NeumannBoundaries));CHKERRQ(ierr);
18453cdbc3dSStefano Zampini   PetscFunctionReturn(0);
18553cdbc3dSStefano Zampini }
18653cdbc3dSStefano Zampini /* -------------------------------------------------------------------------- */
18753cdbc3dSStefano Zampini EXTERN_C_BEGIN
18853cdbc3dSStefano Zampini #undef __FUNCT__
189da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCGetDirichletBoundaries_BDDC"
190da1bb401SStefano Zampini static PetscErrorCode PCBDDCGetDirichletBoundaries_BDDC(PC pc,IS *DirichletBoundaries)
191da1bb401SStefano Zampini {
192da1bb401SStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
193da1bb401SStefano Zampini 
194da1bb401SStefano Zampini   PetscFunctionBegin;
195da1bb401SStefano Zampini   *DirichletBoundaries = pcbddc->DirichletBoundaries;
196da1bb401SStefano Zampini   PetscFunctionReturn(0);
197da1bb401SStefano Zampini }
198da1bb401SStefano Zampini EXTERN_C_END
199da1bb401SStefano Zampini #undef __FUNCT__
200da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCGetDirichletBoundaries"
201da1bb401SStefano Zampini /*@
202da1bb401SStefano Zampini  PCBDDCGetDirichletBoundaries - Get index set defining subdomain part (in local ordering)
203da1bb401SStefano Zampini                                 of Dirichlet boundaries for the global problem.
204da1bb401SStefano Zampini 
205da1bb401SStefano Zampini    Not collective
206da1bb401SStefano Zampini 
207da1bb401SStefano Zampini    Input Parameters:
208da1bb401SStefano Zampini +  pc - the preconditioning context
209da1bb401SStefano Zampini 
210da1bb401SStefano Zampini    Output Parameters:
211da1bb401SStefano Zampini +  DirichletBoundaries - index set defining the subdomain part of Dirichlet boundaries
212da1bb401SStefano Zampini 
213da1bb401SStefano Zampini    Level: intermediate
214da1bb401SStefano Zampini 
215da1bb401SStefano Zampini    Notes:
216da1bb401SStefano Zampini 
217da1bb401SStefano Zampini .seealso: PCBDDC
218da1bb401SStefano Zampini @*/
219da1bb401SStefano Zampini PetscErrorCode PCBDDCGetDirichletBoundaries(PC pc,IS *DirichletBoundaries)
220da1bb401SStefano Zampini {
221da1bb401SStefano Zampini   PetscErrorCode ierr;
222da1bb401SStefano Zampini 
223da1bb401SStefano Zampini   PetscFunctionBegin;
224da1bb401SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
225da1bb401SStefano Zampini   ierr = PetscUseMethod(pc,"PCBDDCGetDirichletBoundaries_C",(PC,IS*),(pc,DirichletBoundaries));CHKERRQ(ierr);
226da1bb401SStefano Zampini   PetscFunctionReturn(0);
227da1bb401SStefano Zampini }
228da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
229da1bb401SStefano Zampini EXTERN_C_BEGIN
230da1bb401SStefano Zampini #undef __FUNCT__
23153cdbc3dSStefano Zampini #define __FUNCT__ "PCBDDCGetNeumannBoundaries_BDDC"
23253cdbc3dSStefano Zampini static PetscErrorCode PCBDDCGetNeumannBoundaries_BDDC(PC pc,IS *NeumannBoundaries)
23353cdbc3dSStefano Zampini {
23453cdbc3dSStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
23553cdbc3dSStefano Zampini 
23653cdbc3dSStefano Zampini   PetscFunctionBegin;
23753cdbc3dSStefano Zampini   *NeumannBoundaries = pcbddc->NeumannBoundaries;
23853cdbc3dSStefano Zampini   PetscFunctionReturn(0);
23953cdbc3dSStefano Zampini }
24053cdbc3dSStefano Zampini EXTERN_C_END
24153cdbc3dSStefano Zampini #undef __FUNCT__
24253cdbc3dSStefano Zampini #define __FUNCT__ "PCBDDCGetNeumannBoundaries"
24353cdbc3dSStefano Zampini /*@
244da1bb401SStefano Zampini  PCBDDCGetNeumannBoundaries - Get index set defining subdomain part (in local ordering)
245da1bb401SStefano Zampini                               of Neumann boundaries for the global problem.
24653cdbc3dSStefano Zampini 
2479c0446d6SStefano Zampini    Not collective
24853cdbc3dSStefano Zampini 
24953cdbc3dSStefano Zampini    Input Parameters:
25053cdbc3dSStefano Zampini +  pc - the preconditioning context
25153cdbc3dSStefano Zampini 
25253cdbc3dSStefano Zampini    Output Parameters:
25353cdbc3dSStefano Zampini +  NeumannBoundaries - index set defining the subdomain part of Neumann boundaries
25453cdbc3dSStefano Zampini 
25553cdbc3dSStefano Zampini    Level: intermediate
25653cdbc3dSStefano Zampini 
25753cdbc3dSStefano Zampini    Notes:
25853cdbc3dSStefano Zampini 
25953cdbc3dSStefano Zampini .seealso: PCBDDC
26053cdbc3dSStefano Zampini @*/
26153cdbc3dSStefano Zampini PetscErrorCode PCBDDCGetNeumannBoundaries(PC pc,IS *NeumannBoundaries)
26253cdbc3dSStefano Zampini {
26353cdbc3dSStefano Zampini   PetscErrorCode ierr;
26453cdbc3dSStefano Zampini 
26553cdbc3dSStefano Zampini   PetscFunctionBegin;
26653cdbc3dSStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
26753cdbc3dSStefano Zampini   ierr = PetscUseMethod(pc,"PCBDDCGetNeumannBoundaries_C",(PC,IS*),(pc,NeumannBoundaries));CHKERRQ(ierr);
2680c7d97c5SJed Brown   PetscFunctionReturn(0);
2690c7d97c5SJed Brown }
27036e030ebSStefano Zampini /* -------------------------------------------------------------------------- */
27136e030ebSStefano Zampini EXTERN_C_BEGIN
27236e030ebSStefano Zampini #undef __FUNCT__
273da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetLocalAdjacencyGraph_BDDC"
274da1bb401SStefano Zampini static PetscErrorCode PCBDDCSetLocalAdjacencyGraph_BDDC(PC pc, PetscInt nvtxs, PetscInt xadj[], PetscInt adjncy[], PetscCopyMode copymode)
27536e030ebSStefano Zampini {
27636e030ebSStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
277da1bb401SStefano Zampini   PCBDDCGraph    mat_graph=pcbddc->mat_graph;
278da1bb401SStefano Zampini   PetscErrorCode ierr;
27936e030ebSStefano Zampini 
28036e030ebSStefano Zampini   PetscFunctionBegin;
281da1bb401SStefano Zampini   mat_graph->nvtxs=nvtxs;
282da1bb401SStefano Zampini   ierr = PetscFree(mat_graph->xadj);CHKERRQ(ierr);
283da1bb401SStefano Zampini   ierr = PetscFree(mat_graph->adjncy);CHKERRQ(ierr);
284da1bb401SStefano Zampini   if(copymode == PETSC_COPY_VALUES) {
285da1bb401SStefano Zampini     ierr = PetscMalloc((mat_graph->nvtxs+1)*sizeof(PetscInt),&mat_graph->xadj);CHKERRQ(ierr);
286da1bb401SStefano Zampini     ierr = PetscMalloc(xadj[mat_graph->nvtxs]*sizeof(PetscInt),&mat_graph->adjncy);CHKERRQ(ierr);
287da1bb401SStefano Zampini     ierr = PetscMemcpy(mat_graph->xadj,xadj,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr);
288da1bb401SStefano Zampini     ierr = PetscMemcpy(mat_graph->adjncy,adjncy,xadj[mat_graph->nvtxs]*sizeof(PetscInt));CHKERRQ(ierr);
289da1bb401SStefano Zampini   } else if(copymode == PETSC_OWN_POINTER) {
290da1bb401SStefano Zampini     mat_graph->xadj=xadj;
291da1bb401SStefano Zampini     mat_graph->adjncy=adjncy;
292da1bb401SStefano Zampini   } else {
293da1bb401SStefano Zampini     SETERRQ2(PETSC_COMM_SELF,PETSC_ERR_SUP,"Unsupported copy mode %d in %s\n",copymode,__FUNCT__);
294da1bb401SStefano Zampini   }
29536e030ebSStefano Zampini   PetscFunctionReturn(0);
29636e030ebSStefano Zampini }
29736e030ebSStefano Zampini EXTERN_C_END
29836e030ebSStefano Zampini #undef __FUNCT__
299da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetLocalAdjacencyGraph"
30036e030ebSStefano Zampini /*@
301da1bb401SStefano Zampini  PCBDDCSetLocalAdjacencyGraph - Set CSR graph of local matrix for use of PCBDDC.
30236e030ebSStefano Zampini 
30336e030ebSStefano Zampini    Not collective
30436e030ebSStefano Zampini 
30536e030ebSStefano Zampini    Input Parameters:
30636e030ebSStefano Zampini +  pc - the preconditioning context
307da1bb401SStefano Zampini -  nvtxs - number of local vertices of the graph
308da1bb401SStefano Zampini -  xadj, adjncy - the CSR graph
309da1bb401SStefano Zampini -  copymode - either PETSC_COPY_VALUES or PETSC_OWN_POINTER. In the former case the user must free the array passed in;
310da1bb401SStefano Zampini                                                              in the latter case, memory must be obtained with PetscMalloc.
31136e030ebSStefano Zampini 
31236e030ebSStefano Zampini    Level: intermediate
31336e030ebSStefano Zampini 
31436e030ebSStefano Zampini    Notes:
31536e030ebSStefano Zampini 
31636e030ebSStefano Zampini .seealso: PCBDDC
31736e030ebSStefano Zampini @*/
318da1bb401SStefano Zampini PetscErrorCode PCBDDCSetLocalAdjacencyGraph(PC pc,PetscInt nvtxs,PetscInt xadj[],PetscInt adjncy[], PetscCopyMode copymode)
31936e030ebSStefano Zampini {
320da1bb401SStefano Zampini   PetscInt       nrows,ncols;
321da1bb401SStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
32236e030ebSStefano Zampini   PetscErrorCode ierr;
32336e030ebSStefano Zampini 
32436e030ebSStefano Zampini   PetscFunctionBegin;
32536e030ebSStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
326da1bb401SStefano Zampini   ierr = MatGetSize(matis->A,&nrows,&ncols);CHKERRQ(ierr);
327da1bb401SStefano Zampini   if(nvtxs != nrows) {
328da1bb401SStefano Zampini     SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_ARG_SIZ,"Local adjacency size %d passed in %s differs from local problem size %d!\n",nvtxs,__FUNCT__,nrows);
329da1bb401SStefano Zampini   } else {
330da1bb401SStefano Zampini     ierr = PetscTryMethod(pc,"PCBDDCSetLocalAdjacencyGraph_C",(PC,PetscInt,PetscInt[],PetscInt[],PetscCopyMode),(pc,nvtxs,xadj,adjncy,copymode));CHKERRQ(ierr);
331da1bb401SStefano Zampini   }
33236e030ebSStefano Zampini   PetscFunctionReturn(0);
33336e030ebSStefano Zampini }
3349c0446d6SStefano Zampini /* -------------------------------------------------------------------------- */
3359c0446d6SStefano Zampini EXTERN_C_BEGIN
3369c0446d6SStefano Zampini #undef __FUNCT__
3379c0446d6SStefano Zampini #define __FUNCT__ "PCBDDCSetDofsSplitting_BDDC"
3389c0446d6SStefano Zampini static PetscErrorCode PCBDDCSetDofsSplitting_BDDC(PC pc,PetscInt n_is, IS ISForDofs[])
3399c0446d6SStefano Zampini {
3409c0446d6SStefano Zampini   PC_BDDC  *pcbddc = (PC_BDDC*)pc->data;
3419c0446d6SStefano Zampini   PetscInt i;
3429c0446d6SStefano Zampini   PetscErrorCode ierr;
3439c0446d6SStefano Zampini 
3449c0446d6SStefano Zampini   PetscFunctionBegin;
345da1bb401SStefano Zampini   /* Destroy ISes if they were already set */
3469c0446d6SStefano Zampini   for(i=0;i<pcbddc->n_ISForDofs;i++) {
3479c0446d6SStefano Zampini     ierr = ISDestroy(&pcbddc->ISForDofs[i]);CHKERRQ(ierr);
3489c0446d6SStefano Zampini   }
349d11ae9bbSstefano_zampini   ierr = PetscFree(pcbddc->ISForDofs);CHKERRQ(ierr);
350da1bb401SStefano Zampini   /* allocate space then set */
3519c0446d6SStefano Zampini   ierr = PetscMalloc(n_is*sizeof(IS),&pcbddc->ISForDofs);CHKERRQ(ierr);
3529c0446d6SStefano Zampini   for(i=0;i<n_is;i++) {
353da1bb401SStefano Zampini     ierr = PetscObjectReference((PetscObject)ISForDofs[i]);CHKERRQ(ierr);
354da1bb401SStefano Zampini     pcbddc->ISForDofs[i]=ISForDofs[i];
3559c0446d6SStefano Zampini   }
3569c0446d6SStefano Zampini   pcbddc->n_ISForDofs=n_is;
3579c0446d6SStefano Zampini   PetscFunctionReturn(0);
3589c0446d6SStefano Zampini }
3599c0446d6SStefano Zampini EXTERN_C_END
3609c0446d6SStefano Zampini #undef __FUNCT__
3619c0446d6SStefano Zampini #define __FUNCT__ "PCBDDCSetDofsSplitting"
3629c0446d6SStefano Zampini /*@
363da1bb401SStefano Zampini  PCBDDCSetDofsSplitting - Set index sets defining fields of local mat.
3649c0446d6SStefano Zampini 
3659c0446d6SStefano Zampini    Not collective
3669c0446d6SStefano Zampini 
3679c0446d6SStefano Zampini    Input Parameters:
3689c0446d6SStefano Zampini +  pc - the preconditioning context
369da1bb401SStefano Zampini -  n - number of index sets defining the fields
370da1bb401SStefano Zampini -  IS[] - array of IS describing the fields
3719c0446d6SStefano Zampini 
3729c0446d6SStefano Zampini    Level: intermediate
3739c0446d6SStefano Zampini 
3749c0446d6SStefano Zampini    Notes:
3759c0446d6SStefano Zampini 
3769c0446d6SStefano Zampini .seealso: PCBDDC
3779c0446d6SStefano Zampini @*/
3789c0446d6SStefano Zampini PetscErrorCode PCBDDCSetDofsSplitting(PC pc,PetscInt n_is, IS ISForDofs[])
3799c0446d6SStefano Zampini {
3809c0446d6SStefano Zampini   PetscErrorCode ierr;
3819c0446d6SStefano Zampini 
3829c0446d6SStefano Zampini   PetscFunctionBegin;
3839c0446d6SStefano Zampini   PetscValidHeaderSpecific(pc,PC_CLASSID,1);
3849c0446d6SStefano Zampini   ierr = PetscTryMethod(pc,"PCBDDCSetDofsSplitting_C",(PC,PetscInt,IS[]),(pc,n_is,ISForDofs));CHKERRQ(ierr);
3859c0446d6SStefano Zampini   PetscFunctionReturn(0);
3869c0446d6SStefano Zampini }
387da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
388534831adSStefano Zampini #undef __FUNCT__
389534831adSStefano Zampini #define __FUNCT__ "PCPreSolve_BDDC"
390534831adSStefano Zampini /* -------------------------------------------------------------------------- */
391534831adSStefano Zampini /*
392534831adSStefano Zampini    PCPreSolve_BDDC - Changes the right hand side and (if necessary) the initial
393534831adSStefano Zampini                      guess if a transformation of basis approach has been selected.
3949c0446d6SStefano Zampini 
395534831adSStefano Zampini    Input Parameter:
396534831adSStefano Zampini +  pc - the preconditioner contex
397534831adSStefano Zampini 
398534831adSStefano Zampini    Application Interface Routine: PCPreSolve()
399534831adSStefano Zampini 
400534831adSStefano Zampini    Notes:
401534831adSStefano Zampini    The interface routine PCPreSolve() is not usually called directly by
402534831adSStefano Zampini    the user, but instead is called by KSPSolve().
403534831adSStefano Zampini */
404534831adSStefano Zampini static PetscErrorCode PCPreSolve_BDDC(PC pc, KSP ksp, Vec rhs, Vec x)
405534831adSStefano Zampini {
406534831adSStefano Zampini   PetscErrorCode ierr;
407534831adSStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
408534831adSStefano Zampini   PC_IS          *pcis = (PC_IS*)(pc->data);
409534831adSStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
410534831adSStefano Zampini   Mat            temp_mat;
4113972b0daSStefano Zampini   IS             dirIS;
4123972b0daSStefano Zampini   PetscInt       dirsize,i,*is_indices;
4133972b0daSStefano Zampini   PetscScalar    *array_x,*array_diagonal;
4143972b0daSStefano Zampini   Vec            used_vec;
4153972b0daSStefano Zampini   PetscBool      guess_nonzero;
416534831adSStefano Zampini 
417534831adSStefano Zampini   PetscFunctionBegin;
4183972b0daSStefano Zampini   if(x) {
4193972b0daSStefano Zampini     ierr = PetscObjectReference((PetscObject)x);CHKERRQ(ierr);
4203972b0daSStefano Zampini     used_vec = x;
4213972b0daSStefano Zampini   } else {
4223972b0daSStefano Zampini     ierr = PetscObjectReference((PetscObject)pcbddc->temp_solution);CHKERRQ(ierr);
4233972b0daSStefano Zampini     used_vec = pcbddc->temp_solution;
4243972b0daSStefano Zampini     ierr = VecSet(used_vec,0.0);CHKERRQ(ierr);
4253972b0daSStefano Zampini   }
4263972b0daSStefano Zampini   /* hack into ksp data structure PCPreSolve comes earlier in src/ksp/ksp/interface/itfunc.c */
4273972b0daSStefano Zampini   if (ksp) {
4283972b0daSStefano Zampini     ierr = KSPGetInitialGuessNonzero(ksp,&guess_nonzero);CHKERRQ(ierr);
4293972b0daSStefano Zampini     if( !guess_nonzero ) {
4303972b0daSStefano Zampini       ierr = VecSet(used_vec,0.0);CHKERRQ(ierr);
4313972b0daSStefano Zampini     }
4323972b0daSStefano Zampini   }
4333972b0daSStefano Zampini   /* store the original rhs */
4343972b0daSStefano Zampini   ierr = VecCopy(rhs,pcbddc->original_rhs);CHKERRQ(ierr);
435534831adSStefano Zampini   if(pcbddc->usechangeofbasis) {
436534831adSStefano Zampini     /* swap pointers for local matrices */
437534831adSStefano Zampini     temp_mat = matis->A;
438534831adSStefano Zampini     matis->A = pcbddc->local_mat;
439534831adSStefano Zampini     pcbddc->local_mat = temp_mat;
440534831adSStefano Zampini     /* Get local rhs and apply transformation of basis */
441534831adSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,rhs,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
442534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,rhs,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
443534831adSStefano Zampini     /* from original basis to modified basis */
444534831adSStefano Zampini     ierr = MatMultTranspose(pcbddc->ChangeOfBasisMatrix,pcis->vec1_B,pcis->vec2_B);CHKERRQ(ierr);
445534831adSStefano Zampini     /* put back modified values into the global vec using INSERT_VALUES copy mode */
446534831adSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec2_B,rhs,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
447534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec2_B,rhs,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
448534831adSStefano Zampini   }
4493972b0daSStefano Zampini 
4503972b0daSStefano Zampini   /* Take into account zeroed rows -> change rhs and store solution removed */
4513972b0daSStefano Zampini   ierr = MatGetDiagonal(pc->pmat,pcis->vec1_global);CHKERRQ(ierr);
4523972b0daSStefano Zampini   ierr = VecPointwiseDivide(pcis->vec1_global,rhs,pcis->vec1_global);CHKERRQ(ierr);
4533972b0daSStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4543972b0daSStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4553972b0daSStefano Zampini   ierr = VecScatterBegin(matis->ctx,used_vec,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4563972b0daSStefano Zampini   ierr = VecScatterEnd  (matis->ctx,used_vec,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
4573972b0daSStefano Zampini   ierr = PCBDDCGetDirichletBoundaries(pc,&dirIS);CHKERRQ(ierr);
4583972b0daSStefano Zampini   if(dirIS) {
4593972b0daSStefano Zampini     ierr = ISGetSize(dirIS,&dirsize);CHKERRQ(ierr);
4603972b0daSStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array_x);CHKERRQ(ierr);
4613972b0daSStefano Zampini     ierr = VecGetArray(pcis->vec2_N,&array_diagonal);CHKERRQ(ierr);
4623972b0daSStefano Zampini     ierr = ISGetIndices(dirIS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
4633972b0daSStefano Zampini     for(i=0;i<dirsize;i++) {
4643972b0daSStefano Zampini       array_x[is_indices[i]]=array_diagonal[is_indices[i]];
4653972b0daSStefano Zampini     }
4663972b0daSStefano Zampini     ierr = ISRestoreIndices(dirIS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
4673972b0daSStefano Zampini     ierr = VecRestoreArray(pcis->vec2_N,&array_diagonal);CHKERRQ(ierr);
4683972b0daSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array_x);CHKERRQ(ierr);
4693972b0daSStefano Zampini   }
4703972b0daSStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4713972b0daSStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,used_vec,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
4723972b0daSStefano Zampini   /* remove the computed solution from the rhs */
4733972b0daSStefano Zampini   ierr = VecScale(used_vec,-1.0);CHKERRQ(ierr);
4743972b0daSStefano Zampini   ierr = MatMultAdd(pc->pmat,used_vec,rhs,rhs);CHKERRQ(ierr);
4753972b0daSStefano Zampini   ierr = VecScale(used_vec,-1.0);CHKERRQ(ierr);
4763972b0daSStefano Zampini   if(x) {
4773972b0daSStefano Zampini     /* store partially computed solution and set initial guess to 0 */
4783972b0daSStefano Zampini     ierr = VecCopy(used_vec,pcbddc->temp_solution);CHKERRQ(ierr);
4793972b0daSStefano Zampini     ierr = VecSet(used_vec,0.0);CHKERRQ(ierr);
4803972b0daSStefano Zampini   }
4813972b0daSStefano Zampini   ierr = VecDestroy(&used_vec);CHKERRQ(ierr);
482534831adSStefano Zampini   PetscFunctionReturn(0);
483534831adSStefano Zampini }
484534831adSStefano Zampini /* -------------------------------------------------------------------------- */
485534831adSStefano Zampini #undef __FUNCT__
486534831adSStefano Zampini #define __FUNCT__ "PCPostSolve_BDDC"
487534831adSStefano Zampini /* -------------------------------------------------------------------------- */
488534831adSStefano Zampini /*
489534831adSStefano Zampini    PCPostSolve_BDDC - Changes the computed solution if a transformation of basis
490534831adSStefano Zampini                      approach has been selected. Also, restores rhs to its original state.
491534831adSStefano Zampini 
492534831adSStefano Zampini    Input Parameter:
493534831adSStefano Zampini +  pc - the preconditioner contex
494534831adSStefano Zampini 
495534831adSStefano Zampini    Application Interface Routine: PCPostSolve()
496534831adSStefano Zampini 
497534831adSStefano Zampini    Notes:
498534831adSStefano Zampini    The interface routine PCPostSolve() is not usually called directly by
499534831adSStefano Zampini    the user, but instead is called by KSPSolve().
500534831adSStefano Zampini */
501534831adSStefano Zampini static PetscErrorCode PCPostSolve_BDDC(PC pc, KSP ksp, Vec rhs, Vec x)
502534831adSStefano Zampini {
503534831adSStefano Zampini   PetscErrorCode ierr;
504534831adSStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
505534831adSStefano Zampini   PC_IS          *pcis = (PC_IS*)(pc->data);
506534831adSStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
507534831adSStefano Zampini   Mat            temp_mat;
508534831adSStefano Zampini 
509534831adSStefano Zampini   PetscFunctionBegin;
510534831adSStefano Zampini   if(pcbddc->usechangeofbasis) {
511534831adSStefano Zampini     /* swap pointers for local matrices */
512534831adSStefano Zampini     temp_mat = matis->A;
513534831adSStefano Zampini     matis->A = pcbddc->local_mat;
514534831adSStefano Zampini     pcbddc->local_mat = temp_mat;
515534831adSStefano Zampini     /* restore rhs to its original state */
5163972b0daSStefano Zampini     if(rhs) ierr = VecCopy(pcbddc->original_rhs,rhs);CHKERRQ(ierr);
517534831adSStefano Zampini     /* Get Local boundary and apply transformation of basis to solution vector */
518534831adSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,x,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
519534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,x,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
520534831adSStefano Zampini     /* from modified basis to original basis */
521534831adSStefano Zampini     ierr = MatMult(pcbddc->ChangeOfBasisMatrix,pcis->vec1_B,pcis->vec2_B);CHKERRQ(ierr);
522534831adSStefano Zampini     /* put back modified values into the global vec using INSERT_VALUES copy mode */
523534831adSStefano Zampini     ierr = VecScatterBegin(pcis->global_to_B,pcis->vec2_B,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
524534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec2_B,x,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
525534831adSStefano Zampini   }
5263972b0daSStefano Zampini   /* add solution removed in presolve */
5273972b0daSStefano Zampini   if(x) ierr = VecAXPY(x,1.0,pcbddc->temp_solution);CHKERRQ(ierr);
528534831adSStefano Zampini   PetscFunctionReturn(0);
529534831adSStefano Zampini }
530534831adSStefano Zampini /* -------------------------------------------------------------------------- */
53153cdbc3dSStefano Zampini #undef __FUNCT__
53253cdbc3dSStefano Zampini #define __FUNCT__ "PCSetUp_BDDC"
5330c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
5340c7d97c5SJed Brown /*
5350c7d97c5SJed Brown    PCSetUp_BDDC - Prepares for the use of the BDDC preconditioner
5360c7d97c5SJed Brown                   by setting data structures and options.
5370c7d97c5SJed Brown 
5380c7d97c5SJed Brown    Input Parameter:
53953cdbc3dSStefano Zampini +  pc - the preconditioner context
5400c7d97c5SJed Brown 
5410c7d97c5SJed Brown    Application Interface Routine: PCSetUp()
5420c7d97c5SJed Brown 
5430c7d97c5SJed Brown    Notes:
5440c7d97c5SJed Brown    The interface routine PCSetUp() is not usually called directly by
5450c7d97c5SJed Brown    the user, but instead is called by PCApply() if necessary.
5460c7d97c5SJed Brown */
54753cdbc3dSStefano Zampini PetscErrorCode PCSetUp_BDDC(PC pc)
5480c7d97c5SJed Brown {
5490c7d97c5SJed Brown   PetscErrorCode ierr;
5500c7d97c5SJed Brown   PC_BDDC*       pcbddc   = (PC_BDDC*)pc->data;
5510c7d97c5SJed Brown   PC_IS            *pcis = (PC_IS*)(pc->data);
5520c7d97c5SJed Brown 
5530c7d97c5SJed Brown   PetscFunctionBegin;
5540c7d97c5SJed Brown   if (!pc->setupcalled) {
5553b03a366Sstefano_zampini     /* For BDDC we need to define a local "Neumann" problem different to that defined in PCISSetup
5569c0446d6SStefano Zampini        So, we set to pcnone the Neumann problem of pcis in order to avoid unneeded computation
5570c7d97c5SJed Brown        Also, we decide to directly build the (same) Dirichlet problem */
5580c7d97c5SJed Brown     ierr = PetscOptionsSetValue("-is_localN_pc_type","none");CHKERRQ(ierr);
5590c7d97c5SJed Brown     ierr = PetscOptionsSetValue("-is_localD_pc_type","none");CHKERRQ(ierr);
5600c7d97c5SJed Brown     /* Set up all the "iterative substructuring" common block */
5610c7d97c5SJed Brown     ierr = PCISSetUp(pc);CHKERRQ(ierr);
5623b03a366Sstefano_zampini     /* Get stdout for dbg */
563e269702eSStefano Zampini     if(pcbddc->dbg_flag) {
564e269702eSStefano Zampini       ierr = PetscViewerASCIIGetStdout(((PetscObject)pc)->comm,&pcbddc->dbg_viewer);CHKERRQ(ierr);
565e269702eSStefano Zampini       ierr = PetscViewerASCIISynchronizedAllow(pcbddc->dbg_viewer,PETSC_TRUE);CHKERRQ(ierr);
566e269702eSStefano Zampini     }
5673b03a366Sstefano_zampini     /* TODO MOVE CODE FRAGMENT */
5680c7d97c5SJed Brown     PetscInt im_active=0;
5690c7d97c5SJed Brown     if(pcis->n) im_active = 1;
57053cdbc3dSStefano Zampini     ierr = MPI_Allreduce(&im_active,&pcbddc->active_procs,1,MPIU_INT,MPI_SUM,((PetscObject)pc)->comm);CHKERRQ(ierr);
5713b03a366Sstefano_zampini     /* Analyze local interface */
5720c7d97c5SJed Brown     ierr = PCBDDCManageLocalBoundaries(pc);CHKERRQ(ierr);
5733b03a366Sstefano_zampini     /* Set up local constraint matrix */
5743b03a366Sstefano_zampini     ierr = PCBDDCCreateConstraintMatrix(pc);CHKERRQ(ierr);
5750c7d97c5SJed Brown     /* Create coarse and local stuffs used for evaluating action of preconditioner */
5760c7d97c5SJed Brown     ierr = PCBDDCCoarseSetUp(pc);CHKERRQ(ierr);
5773b03a366Sstefano_zampini     /* Processes fakely involved in multilevel should not call ISLocalToGlobalMappingRestoreInfo */
5783b03a366Sstefano_zampini     if ( !pcis->n_neigh ) pcis->ISLocalToGlobalMappingGetInfoWasCalled=PETSC_FALSE;
5790c7d97c5SJed Brown   }
5800c7d97c5SJed Brown   PetscFunctionReturn(0);
5810c7d97c5SJed Brown }
5820c7d97c5SJed Brown 
5830c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
5840c7d97c5SJed Brown /*
5850c7d97c5SJed Brown    PCApply_BDDC - Applies the BDDC preconditioner to a vector.
5860c7d97c5SJed Brown 
5870c7d97c5SJed Brown    Input Parameters:
5880c7d97c5SJed Brown .  pc - the preconditioner context
5890c7d97c5SJed Brown .  r - input vector (global)
5900c7d97c5SJed Brown 
5910c7d97c5SJed Brown    Output Parameter:
5920c7d97c5SJed Brown .  z - output vector (global)
5930c7d97c5SJed Brown 
5940c7d97c5SJed Brown    Application Interface Routine: PCApply()
5950c7d97c5SJed Brown  */
5960c7d97c5SJed Brown #undef __FUNCT__
5970c7d97c5SJed Brown #define __FUNCT__ "PCApply_BDDC"
59853cdbc3dSStefano Zampini PetscErrorCode PCApply_BDDC(PC pc,Vec r,Vec z)
5990c7d97c5SJed Brown {
6000c7d97c5SJed Brown   PC_IS             *pcis = (PC_IS*)(pc->data);
6010c7d97c5SJed Brown   PC_BDDC           *pcbddc = (PC_BDDC*)(pc->data);
6020c7d97c5SJed Brown   PetscErrorCode    ierr;
6033b03a366Sstefano_zampini   const PetscScalar one = 1.0;
6043b03a366Sstefano_zampini   const PetscScalar m_one = -1.0;
6052617d88aSStefano Zampini   const PetscScalar zero = 0.0;
6060c7d97c5SJed Brown 
6070c7d97c5SJed Brown /* This code is similar to that provided in nn.c for PCNN
6080c7d97c5SJed Brown    NN interface preconditioner changed to BDDC
6090c7d97c5SJed Brown    Added support for M_3 preconditioenr in the reference article (code is active if pcbddc->prec_type = PETSC_TRUE) */
6100c7d97c5SJed Brown 
6110c7d97c5SJed Brown   PetscFunctionBegin;
6120c7d97c5SJed Brown   /* First Dirichlet solve */
6130c7d97c5SJed Brown   ierr = VecScatterBegin(pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
6140c7d97c5SJed Brown   ierr = VecScatterEnd  (pcis->global_to_D,r,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
61553cdbc3dSStefano Zampini   ierr = KSPSolve(pcbddc->ksp_D,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
6160c7d97c5SJed Brown   /*
6170c7d97c5SJed Brown     Assembling right hand side for BDDC operator
6180c7d97c5SJed Brown     - vec1_D for the Dirichlet part (if needed, i.e. prec_flag=PETSC_TRUE)
6190c7d97c5SJed Brown     - the interface part of the global vector z
6200c7d97c5SJed Brown   */
6210c7d97c5SJed Brown   ierr = VecScale(pcis->vec2_D,m_one);CHKERRQ(ierr);
6220c7d97c5SJed Brown   ierr = MatMult(pcis->A_BI,pcis->vec2_D,pcis->vec1_B);CHKERRQ(ierr);
6230c7d97c5SJed Brown   if(pcbddc->prec_type) { ierr = MatMultAdd(pcis->A_II,pcis->vec2_D,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); }
6240c7d97c5SJed Brown   ierr = VecScale(pcis->vec2_D,m_one);CHKERRQ(ierr);
6250c7d97c5SJed Brown   ierr = VecCopy(r,z);CHKERRQ(ierr);
6260c7d97c5SJed Brown   ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
6270c7d97c5SJed Brown   ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
6280c7d97c5SJed Brown 
6292617d88aSStefano Zampini   /* Get Local boundary and apply partition of unity */
6302617d88aSStefano Zampini   ierr = VecScatterBegin(pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
6312617d88aSStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
6322617d88aSStefano Zampini   ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr);
6332617d88aSStefano Zampini 
6342617d88aSStefano Zampini   /* Apply interface preconditioner
6352617d88aSStefano Zampini      input/output vecs: pcis->vec1_B and pcis->vec1_D */
6362617d88aSStefano Zampini   ierr = PCBDDCApplyInterfacePreconditioner(pc);CHKERRQ(ierr);
6372617d88aSStefano Zampini 
6382617d88aSStefano Zampini   /* Apply partition of unity and sum boundary values */
6392617d88aSStefano Zampini   ierr = VecPointwiseMult(pcis->vec1_B,pcis->D,pcis->vec1_B);CHKERRQ(ierr);
6402617d88aSStefano Zampini   ierr = VecSet(z,zero);CHKERRQ(ierr);
6412617d88aSStefano Zampini   ierr = VecScatterBegin(pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
6422617d88aSStefano Zampini   ierr = VecScatterEnd  (pcis->global_to_B,pcis->vec1_B,z,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
6430c7d97c5SJed Brown 
6443b03a366Sstefano_zampini   /* Second Dirichlet solve and assembling of output */
6450c7d97c5SJed Brown   ierr = VecScatterBegin(pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
6460c7d97c5SJed Brown   ierr = VecScatterEnd  (pcis->global_to_B,z,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
6470c7d97c5SJed Brown   ierr = MatMult(pcis->A_IB,pcis->vec1_B,pcis->vec3_D);CHKERRQ(ierr);
6480c7d97c5SJed Brown   if(pcbddc->prec_type) { ierr = MatMultAdd(pcis->A_II,pcis->vec1_D,pcis->vec3_D,pcis->vec3_D);CHKERRQ(ierr); }
64953cdbc3dSStefano Zampini   ierr = KSPSolve(pcbddc->ksp_D,pcis->vec3_D,pcbddc->vec4_D);CHKERRQ(ierr);
6500c7d97c5SJed Brown   ierr = VecScale(pcbddc->vec4_D,m_one);CHKERRQ(ierr);
6510c7d97c5SJed Brown   if(pcbddc->prec_type) { ierr = VecAXPY (pcbddc->vec4_D,one,pcis->vec1_D);CHKERRQ(ierr); }
6520c7d97c5SJed Brown   ierr = VecAXPY (pcis->vec2_D,one,pcbddc->vec4_D);CHKERRQ(ierr);
6530c7d97c5SJed Brown   ierr = VecScatterBegin(pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
6540c7d97c5SJed Brown   ierr = VecScatterEnd  (pcis->global_to_D,pcis->vec2_D,z,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
6550c7d97c5SJed Brown   PetscFunctionReturn(0);
6560c7d97c5SJed Brown 
6570c7d97c5SJed Brown }
658da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
659da1bb401SStefano Zampini #undef __FUNCT__
660da1bb401SStefano Zampini #define __FUNCT__ "PCDestroy_BDDC"
661da1bb401SStefano Zampini PetscErrorCode PCDestroy_BDDC(PC pc)
662da1bb401SStefano Zampini {
663da1bb401SStefano Zampini   PC_BDDC          *pcbddc = (PC_BDDC*)pc->data;
664da1bb401SStefano Zampini   PetscErrorCode ierr;
665da1bb401SStefano Zampini 
666da1bb401SStefano Zampini   PetscFunctionBegin;
667da1bb401SStefano Zampini   /* free data created by PCIS */
668da1bb401SStefano Zampini   ierr = PCISDestroy(pc);CHKERRQ(ierr);
669da1bb401SStefano Zampini   /* free BDDC data  */
6703972b0daSStefano Zampini   ierr = VecDestroy(&pcbddc->temp_solution);CHKERRQ(ierr);
671534831adSStefano Zampini   ierr = VecDestroy(&pcbddc->original_rhs);CHKERRQ(ierr);
672534831adSStefano Zampini   ierr = MatDestroy(&pcbddc->local_mat);CHKERRQ(ierr);
673534831adSStefano Zampini   ierr = MatDestroy(&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr);
674da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->coarse_vec);CHKERRQ(ierr);
675da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->coarse_rhs);CHKERRQ(ierr);
676da1bb401SStefano Zampini   ierr = KSPDestroy(&pcbddc->coarse_ksp);CHKERRQ(ierr);
677da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->coarse_mat);CHKERRQ(ierr);
678da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->coarse_phi_B);CHKERRQ(ierr);
679da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->coarse_phi_D);CHKERRQ(ierr);
680da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec1_P);CHKERRQ(ierr);
681da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec1_C);CHKERRQ(ierr);
682da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->local_auxmat1);CHKERRQ(ierr);
683da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->local_auxmat2);CHKERRQ(ierr);
684da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec1_R);CHKERRQ(ierr);
685da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec2_R);CHKERRQ(ierr);
686da1bb401SStefano Zampini   ierr = VecDestroy(&pcbddc->vec4_D);CHKERRQ(ierr);
687da1bb401SStefano Zampini   ierr = VecScatterDestroy(&pcbddc->R_to_B);CHKERRQ(ierr);
688da1bb401SStefano Zampini   ierr = VecScatterDestroy(&pcbddc->R_to_D);CHKERRQ(ierr);
689da1bb401SStefano Zampini   ierr = VecScatterDestroy(&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr);
690da1bb401SStefano Zampini   ierr = KSPDestroy(&pcbddc->ksp_D);CHKERRQ(ierr);
691da1bb401SStefano Zampini   ierr = KSPDestroy(&pcbddc->ksp_R);CHKERRQ(ierr);
692da1bb401SStefano Zampini   ierr = ISDestroy(&pcbddc->NeumannBoundaries);CHKERRQ(ierr);
693da1bb401SStefano Zampini   ierr = ISDestroy(&pcbddc->DirichletBoundaries);CHKERRQ(ierr);
694da1bb401SStefano Zampini   ierr = MatDestroy(&pcbddc->ConstraintMatrix);CHKERRQ(ierr);
695da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->local_primal_indices);CHKERRQ(ierr);
696da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->replicated_local_primal_indices);CHKERRQ(ierr);
697da1bb401SStefano Zampini   if (pcbddc->replicated_local_primal_values)    { free(pcbddc->replicated_local_primal_values); }
698da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->local_primal_displacements);CHKERRQ(ierr);
699da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->local_primal_sizes);CHKERRQ(ierr);
700da1bb401SStefano Zampini   PetscInt i;
701da1bb401SStefano Zampini   for(i=0;i<pcbddc->n_ISForDofs;i++) { ierr = ISDestroy(&pcbddc->ISForDofs[i]);CHKERRQ(ierr); }
702da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->ISForDofs);CHKERRQ(ierr);
703da1bb401SStefano Zampini   for(i=0;i<pcbddc->n_ISForFaces;i++) { ierr = ISDestroy(&pcbddc->ISForFaces[i]);CHKERRQ(ierr); }
704da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->ISForFaces);CHKERRQ(ierr);
705da1bb401SStefano Zampini   for(i=0;i<pcbddc->n_ISForEdges;i++) { ierr = ISDestroy(&pcbddc->ISForEdges[i]);CHKERRQ(ierr); }
706da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->ISForEdges);CHKERRQ(ierr);
707da1bb401SStefano Zampini   ierr = ISDestroy(&pcbddc->ISForVertices);CHKERRQ(ierr);
7083972b0daSStefano Zampini   /* Free graph structure */
709da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->xadj);CHKERRQ(ierr);
710da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->adjncy);CHKERRQ(ierr);
711da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->neighbours_set[0]);CHKERRQ(ierr);
712da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->neighbours_set);CHKERRQ(ierr);
7133972b0daSStefano Zampini   ierr = PetscFree4(pcbddc->mat_graph->where,pcbddc->mat_graph->count,pcbddc->mat_graph->cptr,pcbddc->mat_graph->queue);CHKERRQ(ierr);
7143972b0daSStefano Zampini   ierr = PetscFree2(pcbddc->mat_graph->which_dof,pcbddc->mat_graph->touched);CHKERRQ(ierr);
7153972b0daSStefano Zampini   ierr = PetscFree(pcbddc->mat_graph->where_ncmps);CHKERRQ(ierr);
716da1bb401SStefano Zampini   ierr = PetscFree(pcbddc->mat_graph);CHKERRQ(ierr);
717da1bb401SStefano Zampini   /* Free the private data structure that was hanging off the PC */
718da1bb401SStefano Zampini   ierr = PetscFree(pcbddc);CHKERRQ(ierr);
719da1bb401SStefano Zampini   PetscFunctionReturn(0);
720da1bb401SStefano Zampini }
7210c7d97c5SJed Brown 
7220c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
723da1bb401SStefano Zampini /*MC
724da1bb401SStefano Zampini    PCBDDC - Balancing Domain Decomposition by Constraints.
7250c7d97c5SJed Brown 
726da1bb401SStefano Zampini    Options Database Keys:
727da1bb401SStefano Zampini .    -pcbddc ??? -
728da1bb401SStefano Zampini 
729da1bb401SStefano Zampini    Level: intermediate
730da1bb401SStefano Zampini 
731da1bb401SStefano Zampini    Notes: The matrix used with this preconditioner must be of type MATIS
732da1bb401SStefano Zampini 
733da1bb401SStefano Zampini           Unlike more 'conventional' interface preconditioners, this iterates over ALL the
734da1bb401SStefano Zampini           degrees of freedom, NOT just those on the interface (this allows the use of approximate solvers
735da1bb401SStefano Zampini           on the subdomains).
736da1bb401SStefano Zampini 
737da1bb401SStefano Zampini           Options for the coarse grid preconditioner can be set with -
738da1bb401SStefano Zampini           Options for the Dirichlet subproblem can be set with -
739da1bb401SStefano Zampini           Options for the Neumann subproblem can be set with -
740da1bb401SStefano Zampini 
741da1bb401SStefano Zampini    Contributed by Stefano Zampini
742da1bb401SStefano Zampini 
743da1bb401SStefano Zampini .seealso:  PCCreate(), PCSetType(), PCType (for list of available types), PC,  MATIS
744da1bb401SStefano Zampini M*/
745da1bb401SStefano Zampini EXTERN_C_BEGIN
746da1bb401SStefano Zampini #undef __FUNCT__
747da1bb401SStefano Zampini #define __FUNCT__ "PCCreate_BDDC"
748da1bb401SStefano Zampini PetscErrorCode PCCreate_BDDC(PC pc)
749da1bb401SStefano Zampini {
750da1bb401SStefano Zampini   PetscErrorCode ierr;
751da1bb401SStefano Zampini   PC_BDDC        *pcbddc;
752da1bb401SStefano Zampini   PCBDDCGraph    mat_graph;
753da1bb401SStefano Zampini 
754da1bb401SStefano Zampini   PetscFunctionBegin;
755da1bb401SStefano Zampini   /* Creates the private data structure for this preconditioner and attach it to the PC object. */
756da1bb401SStefano Zampini   ierr      = PetscNewLog(pc,PC_BDDC,&pcbddc);CHKERRQ(ierr);
757da1bb401SStefano Zampini   pc->data  = (void*)pcbddc;
758da1bb401SStefano Zampini 
759da1bb401SStefano Zampini   /* create PCIS data structure */
760da1bb401SStefano Zampini   ierr = PCISCreate(pc);CHKERRQ(ierr);
761da1bb401SStefano Zampini 
762da1bb401SStefano Zampini   /* BDDC specific */
7633972b0daSStefano Zampini   pcbddc->temp_solution              = 0;
764534831adSStefano Zampini   pcbddc->original_rhs               = 0;
765534831adSStefano Zampini   pcbddc->local_mat                  = 0;
766534831adSStefano Zampini   pcbddc->ChangeOfBasisMatrix        = 0;
767534831adSStefano Zampini   pcbddc->usechangeofbasis           = PETSC_TRUE;
768534831adSStefano Zampini   pcbddc->usechangeonfaces           = PETSC_FALSE;
769da1bb401SStefano Zampini   pcbddc->coarse_vec                 = 0;
770da1bb401SStefano Zampini   pcbddc->coarse_rhs                 = 0;
771da1bb401SStefano Zampini   pcbddc->coarse_ksp                 = 0;
772da1bb401SStefano Zampini   pcbddc->coarse_phi_B               = 0;
773da1bb401SStefano Zampini   pcbddc->coarse_phi_D               = 0;
774da1bb401SStefano Zampini   pcbddc->vec1_P                     = 0;
775da1bb401SStefano Zampini   pcbddc->vec1_R                     = 0;
776da1bb401SStefano Zampini   pcbddc->vec2_R                     = 0;
777da1bb401SStefano Zampini   pcbddc->local_auxmat1              = 0;
778da1bb401SStefano Zampini   pcbddc->local_auxmat2              = 0;
779da1bb401SStefano Zampini   pcbddc->R_to_B                     = 0;
780da1bb401SStefano Zampini   pcbddc->R_to_D                     = 0;
781da1bb401SStefano Zampini   pcbddc->ksp_D                      = 0;
782da1bb401SStefano Zampini   pcbddc->ksp_R                      = 0;
783da1bb401SStefano Zampini   pcbddc->local_primal_indices       = 0;
784da1bb401SStefano Zampini   pcbddc->prec_type                  = PETSC_FALSE;
785da1bb401SStefano Zampini   pcbddc->NeumannBoundaries          = 0;
786da1bb401SStefano Zampini   pcbddc->ISForDofs                  = 0;
787da1bb401SStefano Zampini   pcbddc->ISForVertices              = 0;
788da1bb401SStefano Zampini   pcbddc->n_ISForFaces               = 0;
789da1bb401SStefano Zampini   pcbddc->n_ISForEdges               = 0;
790da1bb401SStefano Zampini   pcbddc->ConstraintMatrix           = 0;
791da1bb401SStefano Zampini   pcbddc->use_nnsp_true              = PETSC_FALSE;
792da1bb401SStefano Zampini   pcbddc->local_primal_sizes         = 0;
793da1bb401SStefano Zampini   pcbddc->local_primal_displacements = 0;
794da1bb401SStefano Zampini   pcbddc->replicated_local_primal_indices = 0;
795da1bb401SStefano Zampini   pcbddc->replicated_local_primal_values  = 0;
796da1bb401SStefano Zampini   pcbddc->coarse_loc_to_glob         = 0;
797da1bb401SStefano Zampini   pcbddc->dbg_flag                   = PETSC_FALSE;
798da1bb401SStefano Zampini   pcbddc->coarsening_ratio           = 8;
799da1bb401SStefano Zampini 
800da1bb401SStefano Zampini   /* allocate and initialize needed graph structure */
801da1bb401SStefano Zampini   ierr = PetscMalloc(sizeof(*mat_graph),&pcbddc->mat_graph);CHKERRQ(ierr);
802da1bb401SStefano Zampini   pcbddc->mat_graph->xadj            = 0;
803da1bb401SStefano Zampini   pcbddc->mat_graph->adjncy          = 0;
804da1bb401SStefano Zampini 
805da1bb401SStefano Zampini   /* function pointers */
806da1bb401SStefano Zampini   pc->ops->apply               = PCApply_BDDC;
807da1bb401SStefano Zampini   pc->ops->applytranspose      = 0;
808da1bb401SStefano Zampini   pc->ops->setup               = PCSetUp_BDDC;
809da1bb401SStefano Zampini   pc->ops->destroy             = PCDestroy_BDDC;
810da1bb401SStefano Zampini   pc->ops->setfromoptions      = PCSetFromOptions_BDDC;
811da1bb401SStefano Zampini   pc->ops->view                = 0;
812da1bb401SStefano Zampini   pc->ops->applyrichardson     = 0;
813da1bb401SStefano Zampini   pc->ops->applysymmetricleft  = 0;
814da1bb401SStefano Zampini   pc->ops->applysymmetricright = 0;
815534831adSStefano Zampini   pc->ops->presolve            = PCPreSolve_BDDC;
816534831adSStefano Zampini   pc->ops->postsolve           = PCPostSolve_BDDC;
817da1bb401SStefano Zampini 
818da1bb401SStefano Zampini   /* composing function */
819da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDirichletBoundaries_C","PCBDDCSetDirichletBoundaries_BDDC",
820da1bb401SStefano Zampini                     PCBDDCSetDirichletBoundaries_BDDC);CHKERRQ(ierr);
821da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetNeumannBoundaries_C","PCBDDCSetNeumannBoundaries_BDDC",
822da1bb401SStefano Zampini                     PCBDDCSetNeumannBoundaries_BDDC);CHKERRQ(ierr);
823da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetDirichletBoundaries_C","PCBDDCGetDirichletBoundaries_BDDC",
824da1bb401SStefano Zampini                     PCBDDCGetDirichletBoundaries_BDDC);CHKERRQ(ierr);
825da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCGetNeumannBoundaries_C","PCBDDCGetNeumannBoundaries_BDDC",
826da1bb401SStefano Zampini                     PCBDDCGetNeumannBoundaries_BDDC);CHKERRQ(ierr);
827da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetCoarseProblemType_C","PCBDDCSetCoarseProblemType_BDDC",
828da1bb401SStefano Zampini                     PCBDDCSetCoarseProblemType_BDDC);CHKERRQ(ierr);
829da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetDofsSplitting_C","PCBDDCSetDofsSplitting_BDDC",
830da1bb401SStefano Zampini                     PCBDDCSetDofsSplitting_BDDC);CHKERRQ(ierr);
831da1bb401SStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCBDDCSetLocalAdjacencyGraph_C","PCBDDCSetLocalAdjacencyGraph_BDDC",
832da1bb401SStefano Zampini                     PCBDDCSetLocalAdjacencyGraph_BDDC);CHKERRQ(ierr);
833534831adSStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPreSolve_C","PCPreSolve_BDDC",
834534831adSStefano Zampini                     PCPreSolve_BDDC);CHKERRQ(ierr);
835534831adSStefano Zampini   ierr = PetscObjectComposeFunctionDynamic((PetscObject)pc,"PCPostSolve_C","PCPostSolve_BDDC",
836534831adSStefano Zampini                     PCPostSolve_BDDC);CHKERRQ(ierr);
837da1bb401SStefano Zampini   PetscFunctionReturn(0);
838da1bb401SStefano Zampini }
839da1bb401SStefano Zampini EXTERN_C_END
840da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
841da1bb401SStefano Zampini /* All static functions from now on                                           */
842da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
843da1bb401SStefano Zampini #undef __FUNCT__
844da1bb401SStefano Zampini #define __FUNCT__ "PCBDDCSetupLocalAdjacencyGraph"
845da1bb401SStefano Zampini static PetscErrorCode PCBDDCSetupLocalAdjacencyGraph(PC pc)
846da1bb401SStefano Zampini {
847da1bb401SStefano Zampini   PC_BDDC        *pcbddc = (PC_BDDC*)pc->data;
848da1bb401SStefano Zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
849da1bb401SStefano Zampini   PetscInt       nvtxs,*xadj,*adjncy;
850da1bb401SStefano Zampini   Mat            mat_adj;
851da1bb401SStefano Zampini   PetscBool      symmetrize_rowij=PETSC_TRUE,compressed_rowij=PETSC_FALSE,flg_row=PETSC_TRUE;
852da1bb401SStefano Zampini   PCBDDCGraph    mat_graph=pcbddc->mat_graph;
853da1bb401SStefano Zampini   PetscErrorCode ierr;
854da1bb401SStefano Zampini 
855da1bb401SStefano Zampini   PetscFunctionBegin;
856da1bb401SStefano Zampini   /* get CSR adjacency from local matrix if user has not yet provided local graph using PCBDDCSetLocalAdjacencyGraph function */
857da1bb401SStefano Zampini   if(!mat_graph->xadj) {
858da1bb401SStefano Zampini     ierr = MatConvert(matis->A,MATMPIADJ,MAT_INITIAL_MATRIX,&mat_adj);CHKERRQ(ierr);
859da1bb401SStefano Zampini     ierr = MatGetRowIJ(mat_adj,0,symmetrize_rowij,compressed_rowij,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr);
860da1bb401SStefano Zampini     if(!flg_row) {
861da1bb401SStefano Zampini       SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in MatGetRowIJ called in %s\n",__FUNCT__);
862da1bb401SStefano Zampini     }
863da1bb401SStefano Zampini     /* Get adjacency into BDDC workspace */
864da1bb401SStefano Zampini     ierr = PCBDDCSetLocalAdjacencyGraph(pc,nvtxs,xadj,adjncy,PETSC_COPY_VALUES);CHKERRQ(ierr);
865da1bb401SStefano Zampini     ierr = MatRestoreRowIJ(mat_adj,0,symmetrize_rowij,compressed_rowij,&nvtxs,&xadj,&adjncy,&flg_row);CHKERRQ(ierr);
866da1bb401SStefano Zampini     if(!flg_row) {
867da1bb401SStefano Zampini       SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_PLIB,"Error in MatRestoreRowIJ called in %s\n",__FUNCT__);
868da1bb401SStefano Zampini     }
869da1bb401SStefano Zampini     ierr = MatDestroy(&mat_adj);CHKERRQ(ierr);
870da1bb401SStefano Zampini   }
871da1bb401SStefano Zampini   PetscFunctionReturn(0);
872da1bb401SStefano Zampini }
873da1bb401SStefano Zampini /* -------------------------------------------------------------------------- */
8740c7d97c5SJed Brown #undef __FUNCT__
8750c7d97c5SJed Brown #define __FUNCT__ "PCBDDCApplyInterfacePreconditioner"
8762617d88aSStefano Zampini static PetscErrorCode  PCBDDCApplyInterfacePreconditioner(PC pc)
8770c7d97c5SJed Brown {
8780c7d97c5SJed Brown   PetscErrorCode ierr;
8790c7d97c5SJed Brown   PC_BDDC*        pcbddc = (PC_BDDC*)(pc->data);
8800c7d97c5SJed Brown   PC_IS*            pcis = (PC_IS*)  (pc->data);
8813b03a366Sstefano_zampini   const PetscScalar zero = 0.0;
8820c7d97c5SJed Brown 
8830c7d97c5SJed Brown   PetscFunctionBegin;
8840c7d97c5SJed Brown   /* Application of PHI^T  */
8850c7d97c5SJed Brown   ierr = MatMultTranspose(pcbddc->coarse_phi_B,pcis->vec1_B,pcbddc->vec1_P);CHKERRQ(ierr);
8860c7d97c5SJed Brown   if(pcbddc->prec_type) { ierr = MatMultTransposeAdd(pcbddc->coarse_phi_D,pcis->vec1_D,pcbddc->vec1_P,pcbddc->vec1_P);CHKERRQ(ierr); }
8870c7d97c5SJed Brown 
8880c7d97c5SJed Brown   /* Scatter data of coarse_rhs */
8890c7d97c5SJed Brown   if(pcbddc->coarse_rhs) ierr = VecSet(pcbddc->coarse_rhs,zero);CHKERRQ(ierr);
8900c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->vec1_P,pcbddc->coarse_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
8910c7d97c5SJed Brown 
8920c7d97c5SJed Brown   /* Local solution on R nodes */
8930c7d97c5SJed Brown   ierr = VecSet(pcbddc->vec1_R,zero);CHKERRQ(ierr);
8940c7d97c5SJed Brown   ierr = VecScatterBegin(pcbddc->R_to_B,pcis->vec1_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8950c7d97c5SJed Brown   ierr = VecScatterEnd  (pcbddc->R_to_B,pcis->vec1_B,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8960c7d97c5SJed Brown   if(pcbddc->prec_type) {
8970c7d97c5SJed Brown     ierr = VecScatterBegin(pcbddc->R_to_D,pcis->vec1_D,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8980c7d97c5SJed Brown     ierr = VecScatterEnd  (pcbddc->R_to_D,pcis->vec1_D,pcbddc->vec1_R,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
8990c7d97c5SJed Brown   }
9000c7d97c5SJed Brown   ierr = PCBDDCSolveSaddlePoint(pc);CHKERRQ(ierr);
9010c7d97c5SJed Brown   ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr);
9020c7d97c5SJed Brown   ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec2_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9030c7d97c5SJed Brown   ierr = VecScatterEnd  (pcbddc->R_to_B,pcbddc->vec2_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9040c7d97c5SJed Brown   if(pcbddc->prec_type) {
9050c7d97c5SJed Brown     ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec2_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9060c7d97c5SJed Brown     ierr = VecScatterEnd  (pcbddc->R_to_D,pcbddc->vec2_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
9070c7d97c5SJed Brown   }
9080c7d97c5SJed Brown 
9090c7d97c5SJed Brown   /* Coarse solution */
9100c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataEnd(pc,pcbddc->vec1_P,pcbddc->coarse_rhs,ADD_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
91153cdbc3dSStefano Zampini   if(pcbddc->coarse_rhs) ierr = KSPSolve(pcbddc->coarse_ksp,pcbddc->coarse_rhs,pcbddc->coarse_vec);CHKERRQ(ierr);
9120c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataBegin(pc,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
9130c7d97c5SJed Brown   ierr = PCBDDCScatterCoarseDataEnd  (pc,pcbddc->coarse_vec,pcbddc->vec1_P,INSERT_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
9140c7d97c5SJed Brown 
9150c7d97c5SJed Brown   /* Sum contributions from two levels */
9160c7d97c5SJed Brown   ierr = MatMultAdd(pcbddc->coarse_phi_B,pcbddc->vec1_P,pcis->vec1_B,pcis->vec1_B);CHKERRQ(ierr);
9170c7d97c5SJed Brown   if(pcbddc->prec_type) { ierr = MatMultAdd(pcbddc->coarse_phi_D,pcbddc->vec1_P,pcis->vec1_D,pcis->vec1_D);CHKERRQ(ierr); }
9180c7d97c5SJed Brown   PetscFunctionReturn(0);
9190c7d97c5SJed Brown }
9200c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
9210c7d97c5SJed Brown #undef __FUNCT__
9220c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSolveSaddlePoint"
92353cdbc3dSStefano Zampini static PetscErrorCode  PCBDDCSolveSaddlePoint(PC pc)
9240c7d97c5SJed Brown {
9250c7d97c5SJed Brown   PetscErrorCode ierr;
9260c7d97c5SJed Brown   PC_BDDC*       pcbddc = (PC_BDDC*)(pc->data);
9270c7d97c5SJed Brown 
9280c7d97c5SJed Brown   PetscFunctionBegin;
92953cdbc3dSStefano Zampini   ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
930534831adSStefano Zampini   if(pcbddc->local_auxmat1) {
9310c7d97c5SJed Brown     ierr = MatMult(pcbddc->local_auxmat1,pcbddc->vec2_R,pcbddc->vec1_C);CHKERRQ(ierr);
9320c7d97c5SJed Brown     ierr = MatMultAdd(pcbddc->local_auxmat2,pcbddc->vec1_C,pcbddc->vec2_R,pcbddc->vec2_R);CHKERRQ(ierr);
9330c7d97c5SJed Brown   }
9340c7d97c5SJed Brown   PetscFunctionReturn(0);
9350c7d97c5SJed Brown }
9360c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
9370c7d97c5SJed Brown #undef __FUNCT__
9380c7d97c5SJed Brown #define __FUNCT__ "PCBDDCScatterCoarseDataBegin"
93953cdbc3dSStefano Zampini static PetscErrorCode  PCBDDCScatterCoarseDataBegin(PC pc,Vec vec_from, Vec vec_to, InsertMode imode, ScatterMode smode)
9400c7d97c5SJed Brown {
9410c7d97c5SJed Brown   PetscErrorCode ierr;
9420c7d97c5SJed Brown   PC_BDDC*       pcbddc = (PC_BDDC*)(pc->data);
9430c7d97c5SJed Brown 
9440c7d97c5SJed Brown   PetscFunctionBegin;
9450c7d97c5SJed Brown   switch(pcbddc->coarse_communications_type){
9460c7d97c5SJed Brown     case SCATTERS_BDDC:
9470c7d97c5SJed Brown       ierr = VecScatterBegin(pcbddc->coarse_loc_to_glob,vec_from,vec_to,imode,smode);CHKERRQ(ierr);
9480c7d97c5SJed Brown       break;
9490c7d97c5SJed Brown     case GATHERS_BDDC:
9500c7d97c5SJed Brown       break;
9510c7d97c5SJed Brown   }
9520c7d97c5SJed Brown   PetscFunctionReturn(0);
9530c7d97c5SJed Brown }
9540c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
9550c7d97c5SJed Brown #undef __FUNCT__
9560c7d97c5SJed Brown #define __FUNCT__ "PCBDDCScatterCoarseDataEnd"
95753cdbc3dSStefano Zampini static PetscErrorCode  PCBDDCScatterCoarseDataEnd(PC pc,Vec vec_from, Vec vec_to, InsertMode imode, ScatterMode smode)
9580c7d97c5SJed Brown {
9590c7d97c5SJed Brown   PetscErrorCode ierr;
9600c7d97c5SJed Brown   PC_BDDC*       pcbddc = (PC_BDDC*)(pc->data);
9610c7d97c5SJed Brown   PetscScalar*   array_to;
9620c7d97c5SJed Brown   PetscScalar*   array_from;
9630c7d97c5SJed Brown   MPI_Comm       comm=((PetscObject)pc)->comm;
9640c7d97c5SJed Brown   PetscInt i;
9650c7d97c5SJed Brown 
9660c7d97c5SJed Brown   PetscFunctionBegin;
9670c7d97c5SJed Brown 
9680c7d97c5SJed Brown   switch(pcbddc->coarse_communications_type){
9690c7d97c5SJed Brown     case SCATTERS_BDDC:
9700c7d97c5SJed Brown       ierr = VecScatterEnd(pcbddc->coarse_loc_to_glob,vec_from,vec_to,imode,smode);CHKERRQ(ierr);
9710c7d97c5SJed Brown       break;
9720c7d97c5SJed Brown     case GATHERS_BDDC:
9730c7d97c5SJed Brown       if(vec_from) VecGetArray(vec_from,&array_from);
9740c7d97c5SJed Brown       if(vec_to)   VecGetArray(vec_to,&array_to);
9750c7d97c5SJed Brown       switch(pcbddc->coarse_problem_type){
9760c7d97c5SJed Brown         case SEQUENTIAL_BDDC:
9770c7d97c5SJed Brown           if(smode == SCATTER_FORWARD) {
97853cdbc3dSStefano Zampini             ierr = MPI_Gatherv(&array_from[0],pcbddc->local_primal_size,MPIU_SCALAR,&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,0,comm);CHKERRQ(ierr);
9790c7d97c5SJed Brown             if(vec_to) {
9800c7d97c5SJed Brown               for(i=0;i<pcbddc->replicated_primal_size;i++)
9810c7d97c5SJed Brown                 array_to[pcbddc->replicated_local_primal_indices[i]]+=pcbddc->replicated_local_primal_values[i];
9820c7d97c5SJed Brown             }
9830c7d97c5SJed Brown           } else {
9840c7d97c5SJed Brown             if(vec_from)
9850c7d97c5SJed Brown               for(i=0;i<pcbddc->replicated_primal_size;i++)
9860c7d97c5SJed Brown                 pcbddc->replicated_local_primal_values[i]=array_from[pcbddc->replicated_local_primal_indices[i]];
98753cdbc3dSStefano Zampini             ierr = MPI_Scatterv(&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,&array_to[0],pcbddc->local_primal_size,MPIU_SCALAR,0,comm);CHKERRQ(ierr);
9880c7d97c5SJed Brown           }
9890c7d97c5SJed Brown           break;
9900c7d97c5SJed Brown         case REPLICATED_BDDC:
9910c7d97c5SJed Brown           if(smode == SCATTER_FORWARD) {
99253cdbc3dSStefano Zampini             ierr = MPI_Allgatherv(&array_from[0],pcbddc->local_primal_size,MPIU_SCALAR,&pcbddc->replicated_local_primal_values[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_SCALAR,comm);CHKERRQ(ierr);
9930c7d97c5SJed Brown             for(i=0;i<pcbddc->replicated_primal_size;i++)
9940c7d97c5SJed Brown               array_to[pcbddc->replicated_local_primal_indices[i]]+=pcbddc->replicated_local_primal_values[i];
9950c7d97c5SJed Brown           } else { /* no communications needed for SCATTER_REVERSE since needed data is already present */
9960c7d97c5SJed Brown             for(i=0;i<pcbddc->local_primal_size;i++)
9970c7d97c5SJed Brown               array_to[i]=array_from[pcbddc->local_primal_indices[i]];
9980c7d97c5SJed Brown           }
9990c7d97c5SJed Brown           break;
100053cdbc3dSStefano Zampini         case MULTILEVEL_BDDC:
100153cdbc3dSStefano Zampini           break;
100253cdbc3dSStefano Zampini         case PARALLEL_BDDC:
100353cdbc3dSStefano Zampini           break;
10040c7d97c5SJed Brown       }
10050c7d97c5SJed Brown       if(vec_from) VecRestoreArray(vec_from,&array_from);
10060c7d97c5SJed Brown       if(vec_to)   VecRestoreArray(vec_to,&array_to);
10070c7d97c5SJed Brown       break;
10080c7d97c5SJed Brown   }
10090c7d97c5SJed Brown   PetscFunctionReturn(0);
10100c7d97c5SJed Brown }
10110c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
/*
   When BDDC_USE_POD is defined and PETSC_MISSING_LAPACK_GESVD is not already
   defined, define PETSC_MISSING_LAPACK_GESVD here so that the code guarded by it
   is selected. UNDEF_PETSC_MISSING_LAPACK_GESVD records that the definition was
   made in this file rather than inherited from the configuration.
*/
#if defined(BDDC_USE_POD) && !defined(PETSC_MISSING_LAPACK_GESVD)
#define PETSC_MISSING_LAPACK_GESVD 1
#define UNDEF_PETSC_MISSING_LAPACK_GESVD 1
#endif
10183b03a366Sstefano_zampini 
10193b03a366Sstefano_zampini #undef __FUNCT__
10203b03a366Sstefano_zampini #define __FUNCT__ "PCBDDCCreateConstraintMatrix"
10213b03a366Sstefano_zampini static PetscErrorCode PCBDDCCreateConstraintMatrix(PC pc)
10223b03a366Sstefano_zampini {
10233b03a366Sstefano_zampini   PetscErrorCode ierr;
10243b03a366Sstefano_zampini   PC_IS*         pcis = (PC_IS*)(pc->data);
10253b03a366Sstefano_zampini   PC_BDDC*       pcbddc = (PC_BDDC*)pc->data;
10263b03a366Sstefano_zampini   Mat_IS         *matis = (Mat_IS*)pc->pmat->data;
102723d4d1a5SStefano Zampini   PetscInt       *nnz,*is_indices;
10283b03a366Sstefano_zampini   PetscScalar    *temp_quadrature_constraint;
1029534831adSStefano Zampini   PetscInt       *temp_indices,*temp_indices_to_constraint,*temp_indices_to_constraint_B,*local_to_B;
10303b03a366Sstefano_zampini   PetscInt       local_primal_size,i,j,k,total_counts,max_size_of_constraint;
10313b03a366Sstefano_zampini   PetscInt       n_constraints,n_vertices,size_of_constraint;
1032534831adSStefano Zampini   PetscScalar    quad_value;
10333b03a366Sstefano_zampini   PetscBool      nnsp_has_cnst=PETSC_FALSE,use_nnsp_true=pcbddc->use_nnsp_true;
10343b03a366Sstefano_zampini   PetscInt       nnsp_size=0,nnsp_addone=0,temp_constraints,temp_start_ptr;
10353b03a366Sstefano_zampini   IS             *used_IS;
10363b03a366Sstefano_zampini   const MatType  impMatType=MATSEQAIJ;
10373b03a366Sstefano_zampini   PetscBLASInt   Bs,Bt,lwork,lierr;
10383b03a366Sstefano_zampini   PetscReal      tol=1.0e-8;
1039fcda91b4SJed Brown   MatNullSpace   nearnullsp;
1040fcda91b4SJed Brown   const Vec      *nearnullvecs;
10413b03a366Sstefano_zampini   Vec            *localnearnullsp;
10423b03a366Sstefano_zampini   PetscScalar    *work,*temp_basis,*array_vector,*correlation_mat;
10433b03a366Sstefano_zampini   PetscReal      *rwork,*singular_vals;
1044534831adSStefano Zampini   PetscBLASInt   Bone=1,*ipiv;
1045534831adSStefano Zampini   Vec            temp_vec;
1046534831adSStefano Zampini   Mat            temp_mat;
1047534831adSStefano Zampini   KSP            temp_ksp;
1048534831adSStefano Zampini   PetscInt       s,start_constraint,dual_dofs;
1049534831adSStefano Zampini   PetscBool      compute_submatrix,useksp=PETSC_FALSE;
1050534831adSStefano Zampini   PetscInt       *aux_primal_permutation,*aux_primal_numbering;
1051534831adSStefano Zampini   PetscBool      boolforface,*change_basis;
1052de534f79Sstefano_zampini /* some ugly conditional declarations */
10533b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
10543b03a366Sstefano_zampini   PetscScalar    dot_result;
10553b03a366Sstefano_zampini   PetscScalar    one=1.0,zero=0.0;
10563b03a366Sstefano_zampini   PetscInt       ii;
10573b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
10583b03a366Sstefano_zampini   PetscScalar    val1,val2;
10593b03a366Sstefano_zampini #endif
10603b03a366Sstefano_zampini #else
10613b03a366Sstefano_zampini   PetscBLASInt   dummy_int;
10623b03a366Sstefano_zampini   PetscScalar    dummy_scalar;
10633b03a366Sstefano_zampini #endif
10643b03a366Sstefano_zampini 
10653b03a366Sstefano_zampini   PetscFunctionBegin;
10663b03a366Sstefano_zampini   /* check if near null space is attached to global mat */
1067fcda91b4SJed Brown   ierr = MatGetNearNullSpace(pc->pmat,&nearnullsp);CHKERRQ(ierr);
1068fcda91b4SJed Brown   if (nearnullsp) {
1069fcda91b4SJed Brown     ierr = MatNullSpaceGetVecs(nearnullsp,&nnsp_has_cnst,&nnsp_size,&nearnullvecs);CHKERRQ(ierr);
10703b03a366Sstefano_zampini   } else { /* if near null space is not provided it uses constants */
10713b03a366Sstefano_zampini     nnsp_has_cnst = PETSC_TRUE;
10723b03a366Sstefano_zampini     use_nnsp_true = PETSC_TRUE;
10733b03a366Sstefano_zampini   }
10743b03a366Sstefano_zampini   if(nnsp_has_cnst) {
10753b03a366Sstefano_zampini     nnsp_addone = 1;
10763b03a366Sstefano_zampini   }
  /*
       Evaluate maximum storage size needed by the procedure
       - temp_indices will contain start index of each constraint stored as follows
       - temp_indices_to_constraint  [temp_indices[i],...,temp_indices[i+1]-1] will contain the indices (in local numbering) on which the constraint acts
       - temp_indices_to_constraint_B[temp_indices[i],...,temp_indices[i+1]-1] will contain the indices (in boundary numbering) on which the constraint acts
       - temp_quadrature_constraint  [temp_indices[i],...,temp_indices[i+1]-1] will contain the scalars representing the constraint itself
                                                                                                                                                         */
1084da1bb401SStefano Zampini 
10853b03a366Sstefano_zampini   total_counts = pcbddc->n_ISForFaces+pcbddc->n_ISForEdges;
10863b03a366Sstefano_zampini   total_counts *= (nnsp_addone+nnsp_size);
1087da1bb401SStefano Zampini   ierr = ISGetSize(pcbddc->ISForVertices,&n_vertices);CHKERRQ(ierr);
1088da1bb401SStefano Zampini   total_counts += n_vertices;
10893b03a366Sstefano_zampini   ierr = PetscMalloc((total_counts+1)*sizeof(PetscInt),&temp_indices);CHKERRQ(ierr);
1090534831adSStefano Zampini   ierr = PetscMalloc((total_counts+1)*sizeof(PetscBool),&change_basis);CHKERRQ(ierr);
10913b03a366Sstefano_zampini   total_counts = 0;
10923b03a366Sstefano_zampini   max_size_of_constraint = 0;
10933b03a366Sstefano_zampini   for(i=0;i<pcbddc->n_ISForEdges+pcbddc->n_ISForFaces;i++){
10943b03a366Sstefano_zampini     if(i<pcbddc->n_ISForEdges){
10953b03a366Sstefano_zampini       used_IS = &pcbddc->ISForEdges[i];
10963b03a366Sstefano_zampini     } else {
10973b03a366Sstefano_zampini       used_IS = &pcbddc->ISForFaces[i-pcbddc->n_ISForEdges];
10983b03a366Sstefano_zampini     }
10993b03a366Sstefano_zampini     ierr = ISGetSize(*used_IS,&j);CHKERRQ(ierr);
11003b03a366Sstefano_zampini     total_counts += j;
11013b03a366Sstefano_zampini     if(j>max_size_of_constraint) max_size_of_constraint=j;
11023b03a366Sstefano_zampini   }
11033b03a366Sstefano_zampini   total_counts *= (nnsp_addone+nnsp_size);
1104da1bb401SStefano Zampini   total_counts += n_vertices;
11053b03a366Sstefano_zampini   ierr = PetscMalloc(total_counts*sizeof(PetscScalar),&temp_quadrature_constraint);CHKERRQ(ierr);
11063b03a366Sstefano_zampini   ierr = PetscMalloc(total_counts*sizeof(PetscInt),&temp_indices_to_constraint);CHKERRQ(ierr);
1107534831adSStefano Zampini   ierr = PetscMalloc(total_counts*sizeof(PetscInt),&temp_indices_to_constraint_B);CHKERRQ(ierr);
1108534831adSStefano Zampini   ierr = PetscMalloc(pcis->n*sizeof(PetscInt),&local_to_B);CHKERRQ(ierr);
1109534831adSStefano Zampini   ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
1110534831adSStefano Zampini   for(i=0;i<pcis->n;i++) {
1111534831adSStefano Zampini     local_to_B[i]=-1;
1112534831adSStefano Zampini   }
1113534831adSStefano Zampini   for(i=0;i<pcis->n_B;i++) {
1114534831adSStefano Zampini     local_to_B[is_indices[i]]=i;
1115534831adSStefano Zampini   }
1116534831adSStefano Zampini   ierr = ISRestoreIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
1117534831adSStefano Zampini 
11183b03a366Sstefano_zampini   /* First we issue queries to allocate optimal workspace for LAPACKgesvd or LAPACKsyev/LAPACKheev */
11193b03a366Sstefano_zampini   rwork = 0;
11203b03a366Sstefano_zampini   work = 0;
11213b03a366Sstefano_zampini   singular_vals = 0;
11223b03a366Sstefano_zampini   temp_basis = 0;
11233b03a366Sstefano_zampini   correlation_mat = 0;
11243b03a366Sstefano_zampini   if(!pcbddc->use_nnsp_true) {
11253b03a366Sstefano_zampini     PetscScalar temp_work;
11263b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
11273b03a366Sstefano_zampini     /* POD */
11283b03a366Sstefano_zampini     PetscInt max_n;
11293b03a366Sstefano_zampini     max_n = nnsp_addone+nnsp_size;
11303b03a366Sstefano_zampini     /* using some techniques borrowed from Proper Orthogonal Decomposition */
11313b03a366Sstefano_zampini     ierr = PetscMalloc(max_n*max_n*sizeof(PetscScalar),&correlation_mat);CHKERRQ(ierr);
11323b03a366Sstefano_zampini     ierr = PetscMalloc(max_n*sizeof(PetscReal),&singular_vals);CHKERRQ(ierr);
11333b03a366Sstefano_zampini     ierr = PetscMalloc(max_size_of_constraint*(nnsp_addone+nnsp_size)*sizeof(PetscScalar),&temp_basis);CHKERRQ(ierr);
11343b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
11353b03a366Sstefano_zampini     ierr = PetscMalloc(3*max_n*sizeof(PetscReal),&rwork);CHKERRQ(ierr);
11363b03a366Sstefano_zampini #endif
11373b03a366Sstefano_zampini     /* now we evaluate the optimal workspace using query with lwork=-1 */
11383b03a366Sstefano_zampini     Bt = PetscBLASIntCast(max_n);
11393b03a366Sstefano_zampini     lwork=-1;
11403b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
11413b03a366Sstefano_zampini     LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,&temp_work,&lwork,&lierr);
11423b03a366Sstefano_zampini #else
11433b03a366Sstefano_zampini     LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,&temp_work,&lwork,rwork,&lierr);
11443b03a366Sstefano_zampini #endif
11453b03a366Sstefano_zampini #else /* on missing GESVD */
11463b03a366Sstefano_zampini     /* SVD */
11473b03a366Sstefano_zampini     PetscInt max_n,min_n;
11483b03a366Sstefano_zampini     max_n = max_size_of_constraint;
11493b03a366Sstefano_zampini     min_n = nnsp_addone+nnsp_size;
11503b03a366Sstefano_zampini     if(max_size_of_constraint < ( nnsp_addone+nnsp_size ) ) {
11513b03a366Sstefano_zampini       min_n = max_size_of_constraint;
11523b03a366Sstefano_zampini       max_n = nnsp_addone+nnsp_size;
11533b03a366Sstefano_zampini     }
11543b03a366Sstefano_zampini     ierr = PetscMalloc(min_n*sizeof(PetscReal),&singular_vals);CHKERRQ(ierr);
11553b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
11563b03a366Sstefano_zampini     ierr = PetscMalloc(5*min_n*sizeof(PetscReal),&rwork);CHKERRQ(ierr);
11573b03a366Sstefano_zampini #endif
11583b03a366Sstefano_zampini     /* now we evaluate the optimal workspace using query with lwork=-1 */
11593b03a366Sstefano_zampini     lwork=-1;
11603b03a366Sstefano_zampini     Bs = PetscBLASIntCast(max_n);
11613b03a366Sstefano_zampini     Bt = PetscBLASIntCast(min_n);
11623b03a366Sstefano_zampini     dummy_int = Bs;
1163670f3ff9SJed Brown     ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
11643b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
11653b03a366Sstefano_zampini     LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[0],&Bs,singular_vals,
11663b03a366Sstefano_zampini                  &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,&temp_work,&lwork,&lierr);
11673b03a366Sstefano_zampini #else
11683b03a366Sstefano_zampini     LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[0],&Bs,singular_vals,
11693b03a366Sstefano_zampini                  &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,&temp_work,&lwork,rwork,&lierr);
11703b03a366Sstefano_zampini #endif
11713b03a366Sstefano_zampini     if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in query to SVD Lapack routine %d",(int)lierr);
1172670f3ff9SJed Brown     ierr = PetscFPTrapPop();CHKERRQ(ierr);
11733b03a366Sstefano_zampini #endif
11743b03a366Sstefano_zampini     /* Allocate optimal workspace */
11753b03a366Sstefano_zampini     lwork = PetscBLASIntCast((PetscInt)PetscRealPart(temp_work));
11763b03a366Sstefano_zampini     total_counts = (PetscInt)lwork;
11773b03a366Sstefano_zampini     ierr = PetscMalloc(total_counts*sizeof(PetscScalar),&work);CHKERRQ(ierr);
11783b03a366Sstefano_zampini   }
11793b03a366Sstefano_zampini   /* get local part of global near null space vectors */
11803b03a366Sstefano_zampini   ierr = PetscMalloc(nnsp_size*sizeof(Vec),&localnearnullsp);CHKERRQ(ierr);
11813b03a366Sstefano_zampini   for(k=0;k<nnsp_size;k++) {
11823b03a366Sstefano_zampini     ierr = VecDuplicate(pcis->vec1_N,&localnearnullsp[k]);CHKERRQ(ierr);
1183fcda91b4SJed Brown     ierr = VecScatterBegin(matis->ctx,nearnullvecs[k],localnearnullsp[k],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1184fcda91b4SJed Brown     ierr = VecScatterEnd  (matis->ctx,nearnullvecs[k],localnearnullsp[k],INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
11853b03a366Sstefano_zampini   }
11863b03a366Sstefano_zampini   /* Now we can loop on constraining sets */
11873b03a366Sstefano_zampini   total_counts=0;
11883b03a366Sstefano_zampini   temp_indices[0]=0;
1189da1bb401SStefano Zampini   /* vertices */
1190da1bb401SStefano Zampini   PetscBool used_vertex;
1191da1bb401SStefano Zampini   ierr = ISGetIndices(pcbddc->ISForVertices,(const PetscInt**)&is_indices);CHKERRQ(ierr);
1192da1bb401SStefano Zampini   if(nnsp_has_cnst) { /* consider all vertices */
1193da1bb401SStefano Zampini     for(i=0;i<n_vertices;i++) {
1194da1bb401SStefano Zampini       temp_indices_to_constraint[temp_indices[total_counts]]=is_indices[i];
1195534831adSStefano Zampini       temp_indices_to_constraint_B[temp_indices[total_counts]]=local_to_B[is_indices[i]];
1196da1bb401SStefano Zampini       temp_quadrature_constraint[temp_indices[total_counts]]=1.0;
1197da1bb401SStefano Zampini       temp_indices[total_counts+1]=temp_indices[total_counts]+1;
1198534831adSStefano Zampini       change_basis[total_counts]=PETSC_FALSE;
1199da1bb401SStefano Zampini       total_counts++;
1200da1bb401SStefano Zampini     }
1201da1bb401SStefano Zampini   } else { /* consider vertices for which exist at least a localnearnullsp which is not null there */
1202da1bb401SStefano Zampini     for(i=0;i<n_vertices;i++) {
1203da1bb401SStefano Zampini       used_vertex=PETSC_FALSE;
1204da1bb401SStefano Zampini       k=0;
1205da1bb401SStefano Zampini       while(!used_vertex && k<nnsp_size) {
1206da1bb401SStefano Zampini         ierr = VecGetArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
1207da1bb401SStefano Zampini         if(PetscAbsScalar(array_vector[is_indices[i]])>0.0) {
1208da1bb401SStefano Zampini           temp_indices_to_constraint[temp_indices[total_counts]]=is_indices[i];
1209534831adSStefano Zampini           temp_indices_to_constraint_B[temp_indices[total_counts]]=local_to_B[is_indices[i]];
1210da1bb401SStefano Zampini           temp_quadrature_constraint[temp_indices[total_counts]]=1.0;
1211da1bb401SStefano Zampini           temp_indices[total_counts+1]=temp_indices[total_counts]+1;
1212534831adSStefano Zampini           change_basis[total_counts]=PETSC_FALSE;
1213da1bb401SStefano Zampini           total_counts++;
1214da1bb401SStefano Zampini           used_vertex=PETSC_TRUE;
1215da1bb401SStefano Zampini         }
1216da1bb401SStefano Zampini         ierr = VecRestoreArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
1217da1bb401SStefano Zampini         k++;
1218da1bb401SStefano Zampini       }
1219da1bb401SStefano Zampini     }
1220da1bb401SStefano Zampini   }
1221da1bb401SStefano Zampini   ierr = ISRestoreIndices(pcbddc->ISForVertices,(const PetscInt**)&is_indices);CHKERRQ(ierr);
1222da1bb401SStefano Zampini   n_vertices=total_counts;
1223da1bb401SStefano Zampini   /* edges and faces */
12243b03a366Sstefano_zampini   for(i=0;i<pcbddc->n_ISForEdges+pcbddc->n_ISForFaces;i++){
12253b03a366Sstefano_zampini     if(i<pcbddc->n_ISForEdges){
12263b03a366Sstefano_zampini       used_IS = &pcbddc->ISForEdges[i];
1227534831adSStefano Zampini       boolforface = pcbddc->usechangeofbasis;
12283b03a366Sstefano_zampini     } else {
12293b03a366Sstefano_zampini       used_IS = &pcbddc->ISForFaces[i-pcbddc->n_ISForEdges];
1230534831adSStefano Zampini       boolforface = pcbddc->usechangeonfaces;
12313b03a366Sstefano_zampini     }
12323b03a366Sstefano_zampini     temp_constraints = 0;          /* zero the number of constraints I have on this conn comp */
12333b03a366Sstefano_zampini     temp_start_ptr = total_counts; /* need to know the starting index of constraints stored */
12343b03a366Sstefano_zampini     ierr = ISGetSize(*used_IS,&size_of_constraint);CHKERRQ(ierr);
12353b03a366Sstefano_zampini     ierr = ISGetIndices(*used_IS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
12363b03a366Sstefano_zampini     if(nnsp_has_cnst) {
12373b03a366Sstefano_zampini       temp_constraints++;
1238534831adSStefano Zampini       quad_value = (PetscScalar) (1.0/PetscSqrtReal((PetscReal)size_of_constraint));
12393b03a366Sstefano_zampini       for(j=0;j<size_of_constraint;j++) {
12403b03a366Sstefano_zampini         temp_indices_to_constraint[temp_indices[total_counts]+j]=is_indices[j];
1241534831adSStefano Zampini         temp_indices_to_constraint_B[temp_indices[total_counts]+j]=local_to_B[is_indices[j]];
12423b03a366Sstefano_zampini         temp_quadrature_constraint[temp_indices[total_counts]+j]=quad_value;
12433b03a366Sstefano_zampini       }
12443b03a366Sstefano_zampini       temp_indices[total_counts+1]=temp_indices[total_counts]+size_of_constraint;  /* store new starting point */
1245534831adSStefano Zampini       change_basis[total_counts]=boolforface;
12463b03a366Sstefano_zampini       total_counts++;
12473b03a366Sstefano_zampini     }
12483b03a366Sstefano_zampini     for(k=0;k<nnsp_size;k++) {
12493b03a366Sstefano_zampini       ierr = VecGetArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
12503b03a366Sstefano_zampini       for(j=0;j<size_of_constraint;j++) {
12513b03a366Sstefano_zampini         temp_indices_to_constraint[temp_indices[total_counts]+j]=is_indices[j];
1252534831adSStefano Zampini         temp_indices_to_constraint_B[temp_indices[total_counts]+j]=local_to_B[is_indices[j]];
12533b03a366Sstefano_zampini         temp_quadrature_constraint[temp_indices[total_counts]+j]=array_vector[is_indices[j]];
12543b03a366Sstefano_zampini       }
12553b03a366Sstefano_zampini       ierr = VecRestoreArrayRead(localnearnullsp[k],(const PetscScalar**)&array_vector);CHKERRQ(ierr);
1256de534f79Sstefano_zampini       quad_value = 1.0;
1257de534f79Sstefano_zampini       if( use_nnsp_true ) { /* check if array is null on the connected component in case use_nnsp_true has been requested */
1258de534f79Sstefano_zampini         Bs = PetscBLASIntCast(size_of_constraint);
1259de534f79Sstefano_zampini         quad_value = BLASasum_(&Bs,&temp_quadrature_constraint[temp_indices[total_counts]],&Bone);
1260de534f79Sstefano_zampini       }
1261de534f79Sstefano_zampini       if ( quad_value > 0.0 ) { /* keep indices and values */
1262de534f79Sstefano_zampini         temp_constraints++;
12633b03a366Sstefano_zampini         temp_indices[total_counts+1]=temp_indices[total_counts]+size_of_constraint;  /* store new starting point */
1264534831adSStefano Zampini         change_basis[total_counts]=boolforface;
12653b03a366Sstefano_zampini         total_counts++;
12663b03a366Sstefano_zampini       }
1267de534f79Sstefano_zampini     }
12683b03a366Sstefano_zampini     ierr = ISRestoreIndices(*used_IS,(const PetscInt**)&is_indices);CHKERRQ(ierr);
    /* perform SVD on the constraint if use_nnsp_true has not been requested by the user */
12703b03a366Sstefano_zampini     if(!use_nnsp_true) {
1271de534f79Sstefano_zampini 
12723b03a366Sstefano_zampini       Bs = PetscBLASIntCast(size_of_constraint);
12733b03a366Sstefano_zampini       Bt = PetscBLASIntCast(temp_constraints);
1274de534f79Sstefano_zampini 
12753b03a366Sstefano_zampini #if defined(PETSC_MISSING_LAPACK_GESVD)
12763b03a366Sstefano_zampini       ierr = PetscMemzero(correlation_mat,Bt*Bt*sizeof(PetscScalar));CHKERRQ(ierr);
12773b03a366Sstefano_zampini       /* Store upper triangular part of correlation matrix */
12783b03a366Sstefano_zampini       for(j=0;j<temp_constraints;j++) {
12793b03a366Sstefano_zampini         for(k=0;k<j+1;k++) {
12803b03a366Sstefano_zampini #if defined(PETSC_USE_COMPLEX)
12813b03a366Sstefano_zampini           /* hand made complex dot product */
12823b03a366Sstefano_zampini           dot_result = 0.0;
12833b03a366Sstefano_zampini           for (ii=0; ii<size_of_constraint; ii++) {
12843b03a366Sstefano_zampini             val1 = temp_quadrature_constraint[temp_indices[temp_start_ptr+j]+ii];
12853b03a366Sstefano_zampini             val2 = temp_quadrature_constraint[temp_indices[temp_start_ptr+k]+ii];
12863b03a366Sstefano_zampini             dot_result += val1*PetscConj(val2);
12873b03a366Sstefano_zampini           }
12883b03a366Sstefano_zampini #else
12893b03a366Sstefano_zampini           dot_result = BLASdot_(&Bs,&temp_quadrature_constraint[temp_indices[temp_start_ptr+j]],&Bone,
12903b03a366Sstefano_zampini                                     &temp_quadrature_constraint[temp_indices[temp_start_ptr+k]],&Bone);
12913b03a366Sstefano_zampini #endif
12923b03a366Sstefano_zampini           correlation_mat[j*temp_constraints+k]=dot_result;
12933b03a366Sstefano_zampini         }
12943b03a366Sstefano_zampini       }
12953b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
12963b03a366Sstefano_zampini       LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,work,&lwork,&lierr);
12973b03a366Sstefano_zampini #else
12983b03a366Sstefano_zampini       LAPACKsyev_("V","U",&Bt,correlation_mat,&Bt,singular_vals,work,&lwork,rwork,&lierr);
12993b03a366Sstefano_zampini #endif
13003b03a366Sstefano_zampini       if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in EV Lapack routine %d",(int)lierr);
13013b03a366Sstefano_zampini       /* retain eigenvalues greater than tol: note that lapack SYEV gives eigs in ascending order */
13023b03a366Sstefano_zampini       j=0;
13033b03a366Sstefano_zampini       while( j < Bt && singular_vals[j] < tol) j++;
13043b03a366Sstefano_zampini       total_counts=total_counts-j;
13053b03a366Sstefano_zampini       if(j<temp_constraints) {
13063b03a366Sstefano_zampini         for(k=j;k<Bt;k++) { singular_vals[k]=1.0/PetscSqrtReal(singular_vals[k]); }
13073b03a366Sstefano_zampini         BLASgemm_("N","N",&Bs,&Bt,&Bt,&one,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,correlation_mat,&Bt,&zero,temp_basis,&Bs);
13083b03a366Sstefano_zampini         /* copy POD basis into used quadrature memory */
13093b03a366Sstefano_zampini         for(k=0;k<Bt-j;k++) {
13103b03a366Sstefano_zampini           for(ii=0;ii<size_of_constraint;ii++) {
13113b03a366Sstefano_zampini             temp_quadrature_constraint[temp_indices[temp_start_ptr+k]+ii]=singular_vals[Bt-1-k]*temp_basis[(Bt-1-k)*size_of_constraint+ii];
13123b03a366Sstefano_zampini           }
13133b03a366Sstefano_zampini         }
13143b03a366Sstefano_zampini       }
1315de534f79Sstefano_zampini 
13163b03a366Sstefano_zampini #else  /* on missing GESVD */
1317de534f79Sstefano_zampini 
13183b03a366Sstefano_zampini       PetscInt min_n = temp_constraints;
13193b03a366Sstefano_zampini       if(min_n > size_of_constraint) min_n = size_of_constraint;
13203b03a366Sstefano_zampini       dummy_int = Bs;
1321670f3ff9SJed Brown       ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
13223b03a366Sstefano_zampini #if !defined(PETSC_USE_COMPLEX)
13233b03a366Sstefano_zampini       LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,singular_vals,
13243b03a366Sstefano_zampini                    &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,work,&lwork,&lierr);
13253b03a366Sstefano_zampini #else
13263b03a366Sstefano_zampini       LAPACKgesvd_("O","N",&Bs,&Bt,&temp_quadrature_constraint[temp_indices[temp_start_ptr]],&Bs,singular_vals,
13273b03a366Sstefano_zampini                    &dummy_scalar,&dummy_int,&dummy_scalar,&dummy_int,work,&lwork,rwork,&lierr);
13283b03a366Sstefano_zampini #endif
13293b03a366Sstefano_zampini       if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in SVD Lapack routine %d",(int)lierr);
1330670f3ff9SJed Brown       ierr = PetscFPTrapPop();CHKERRQ(ierr);
13313b03a366Sstefano_zampini       /* retain eigenvalues greater than tol: note that lapack SVD gives eigs in descending order */
13323b03a366Sstefano_zampini       j=0;
13333b03a366Sstefano_zampini       while( j < min_n && singular_vals[min_n-j-1] < tol) j++;
13343b03a366Sstefano_zampini       total_counts = total_counts-(PetscInt)Bt+(min_n-j);
13353b03a366Sstefano_zampini #endif
13363b03a366Sstefano_zampini     }
13373b03a366Sstefano_zampini   }
1338534831adSStefano Zampini 
1339da1bb401SStefano Zampini   n_constraints=total_counts-n_vertices;
1340da1bb401SStefano Zampini   local_primal_size = total_counts;
13413b03a366Sstefano_zampini   /* set quantities in pcbddc data structure */
13423b03a366Sstefano_zampini   pcbddc->n_vertices = n_vertices;
13433b03a366Sstefano_zampini   pcbddc->n_constraints = n_constraints;
1344da1bb401SStefano Zampini   pcbddc->local_primal_size = local_primal_size;
1345534831adSStefano Zampini 
1346534831adSStefano Zampini   /* Create constraint matrix */
1347534831adSStefano Zampini   /* The constraint matrix is used to compute the l2g map of primal dofs */
1348534831adSStefano Zampini   /* so we need to set it up properly either with or without change of basis */
1349534831adSStefano Zampini   ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->ConstraintMatrix);CHKERRQ(ierr);
1350534831adSStefano Zampini   ierr = MatSetType(pcbddc->ConstraintMatrix,impMatType);CHKERRQ(ierr);
1351534831adSStefano Zampini   ierr = MatSetSizes(pcbddc->ConstraintMatrix,local_primal_size,pcis->n,local_primal_size,pcis->n);CHKERRQ(ierr);
1352534831adSStefano Zampini   /* compute a local numbering of constraints : vertices first then constraints */
1353534831adSStefano Zampini   ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
1354534831adSStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array_vector);CHKERRQ(ierr);
1355534831adSStefano Zampini   ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&aux_primal_numbering);CHKERRQ(ierr);
1356534831adSStefano Zampini   ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&aux_primal_permutation);CHKERRQ(ierr);
1357534831adSStefano Zampini   total_counts=0;
1358534831adSStefano Zampini   /* find vertices: subdomain corners plus dofs with basis changed */
1359534831adSStefano Zampini   for(i=0;i<local_primal_size;i++) {
1360534831adSStefano Zampini     size_of_constraint=temp_indices[i+1]-temp_indices[i];
1361534831adSStefano Zampini     if(change_basis[i] || size_of_constraint == 1) {
1362534831adSStefano Zampini       k=0;
1363534831adSStefano Zampini       while(k < size_of_constraint && array_vector[temp_indices_to_constraint[temp_indices[i]+size_of_constraint-k-1]] != 0.0) {
1364534831adSStefano Zampini         k=k+1;
1365534831adSStefano Zampini       }
1366534831adSStefano Zampini       j=temp_indices_to_constraint[temp_indices[i]+size_of_constraint-k-1];
1367534831adSStefano Zampini       array_vector[j] = 1.0;
1368534831adSStefano Zampini       aux_primal_numbering[total_counts]=j;
1369534831adSStefano Zampini       aux_primal_permutation[total_counts]=total_counts;
1370534831adSStefano Zampini       total_counts++;
1371534831adSStefano Zampini     }
1372534831adSStefano Zampini   }
1373534831adSStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array_vector);CHKERRQ(ierr);
1374534831adSStefano Zampini   /* permute indices in order to have a sorted set of vertices */
1375534831adSStefano Zampini   ierr = PetscSortIntWithPermutation(total_counts,aux_primal_numbering,aux_primal_permutation);
1376534831adSStefano Zampini   /* nonzero structure */
1377534831adSStefano Zampini   ierr = PetscMalloc(local_primal_size*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
1378534831adSStefano Zampini   for(i=0;i<total_counts;i++) {
1379534831adSStefano Zampini     nnz[i]=1;
1380534831adSStefano Zampini   }
1381534831adSStefano Zampini   j=total_counts;
1382534831adSStefano Zampini   for(i=n_vertices;i<local_primal_size;i++) {
1383534831adSStefano Zampini     if(!change_basis[i]) {
1384534831adSStefano Zampini       nnz[j]=temp_indices[i+1]-temp_indices[i];
1385534831adSStefano Zampini       j++;
1386534831adSStefano Zampini     }
1387534831adSStefano Zampini   }
1388534831adSStefano Zampini   ierr = MatSeqAIJSetPreallocation(pcbddc->ConstraintMatrix,0,nnz);CHKERRQ(ierr);
1389534831adSStefano Zampini   ierr = PetscFree(nnz);CHKERRQ(ierr);
1390534831adSStefano Zampini   /* set values in constraint matrix */
1391534831adSStefano Zampini   for(i=0;i<total_counts;i++) {
1392534831adSStefano Zampini     j = aux_primal_permutation[i];
1393534831adSStefano Zampini     k = aux_primal_numbering[j];
1394534831adSStefano Zampini     ierr = MatSetValue(pcbddc->ConstraintMatrix,i,k,1.0,INSERT_VALUES);CHKERRQ(ierr);
1395534831adSStefano Zampini   }
1396534831adSStefano Zampini   for(i=n_vertices;i<local_primal_size;i++) {
1397534831adSStefano Zampini     if(!change_basis[i]) {
1398534831adSStefano Zampini       size_of_constraint=temp_indices[i+1]-temp_indices[i];
1399534831adSStefano Zampini       ierr = MatSetValues(pcbddc->ConstraintMatrix,1,&total_counts,size_of_constraint,&temp_indices_to_constraint[temp_indices[i]],&temp_quadrature_constraint[temp_indices[i]],INSERT_VALUES);CHKERRQ(ierr);
1400534831adSStefano Zampini       total_counts++;
1401534831adSStefano Zampini     }
1402534831adSStefano Zampini   }
1403534831adSStefano Zampini   ierr = PetscFree(aux_primal_numbering);CHKERRQ(ierr);
1404534831adSStefano Zampini   ierr = PetscFree(aux_primal_permutation);CHKERRQ(ierr);
1405534831adSStefano Zampini   /* assembling */
1406534831adSStefano Zampini   ierr = MatAssemblyBegin(pcbddc->ConstraintMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1407534831adSStefano Zampini   ierr = MatAssemblyEnd(pcbddc->ConstraintMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1408534831adSStefano Zampini 
1409534831adSStefano Zampini   /* Create matrix for change of basis. We don't need it in case pcbddc->usechangeofbasis is FALSE */
1410534831adSStefano Zampini   if(pcbddc->usechangeofbasis) {
1411534831adSStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->ChangeOfBasisMatrix);CHKERRQ(ierr);
1412534831adSStefano Zampini     ierr = MatSetType(pcbddc->ChangeOfBasisMatrix,impMatType);CHKERRQ(ierr);
1413534831adSStefano Zampini     ierr = MatSetSizes(pcbddc->ChangeOfBasisMatrix,pcis->n_B,pcis->n_B,pcis->n_B,pcis->n_B);CHKERRQ(ierr);
1414534831adSStefano Zampini     /* work arrays */
1415534831adSStefano Zampini     /* we need to reuse these arrays, so we free them */
1416534831adSStefano Zampini     ierr = PetscFree(temp_basis);CHKERRQ(ierr);
1417534831adSStefano Zampini     ierr = PetscFree(work);CHKERRQ(ierr);
1418534831adSStefano Zampini     ierr = PetscMalloc(pcis->n_B*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
1419534831adSStefano Zampini     ierr = PetscMalloc((nnsp_addone+nnsp_size)*(nnsp_addone+nnsp_size)*sizeof(PetscScalar),&temp_basis);CHKERRQ(ierr);
1420534831adSStefano Zampini     ierr = PetscMalloc((nnsp_addone+nnsp_size)*sizeof(PetscScalar),&work);CHKERRQ(ierr);
1421534831adSStefano Zampini     ierr = PetscMalloc((nnsp_addone+nnsp_size)*sizeof(PetscBLASInt),&ipiv);CHKERRQ(ierr);
1422534831adSStefano Zampini     for(i=0;i<pcis->n_B;i++) {
1423534831adSStefano Zampini       nnz[i]=1;
1424534831adSStefano Zampini     }
1425534831adSStefano Zampini     /* Overestimated nonzeros per row */
1426534831adSStefano Zampini     k=1;
1427534831adSStefano Zampini     for(i=pcbddc->n_vertices;i<local_primal_size;i++) {
1428534831adSStefano Zampini       if(change_basis[i]) {
1429534831adSStefano Zampini         size_of_constraint = temp_indices[i+1]-temp_indices[i];
1430534831adSStefano Zampini         if(k < size_of_constraint) {
1431534831adSStefano Zampini           k = size_of_constraint;
1432534831adSStefano Zampini         }
1433534831adSStefano Zampini         for(j=0;j<size_of_constraint;j++) {
1434534831adSStefano Zampini           nnz[temp_indices_to_constraint_B[temp_indices[i]+j]] = size_of_constraint;
1435534831adSStefano Zampini         }
1436534831adSStefano Zampini       }
1437534831adSStefano Zampini     }
1438534831adSStefano Zampini     ierr = MatSeqAIJSetPreallocation(pcbddc->ChangeOfBasisMatrix,0,nnz);CHKERRQ(ierr);
1439534831adSStefano Zampini     ierr = PetscFree(nnz);CHKERRQ(ierr);
1440534831adSStefano Zampini     /* Temporary array to store indices */
1441534831adSStefano Zampini     ierr = PetscMalloc(k*sizeof(PetscInt),&is_indices);CHKERRQ(ierr);
1442534831adSStefano Zampini     /* Set initial identity in the matrix */
1443534831adSStefano Zampini     for(i=0;i<pcis->n_B;i++) {
1444534831adSStefano Zampini       ierr = MatSetValue(pcbddc->ChangeOfBasisMatrix,i,i,1.0,INSERT_VALUES);CHKERRQ(ierr);
1445534831adSStefano Zampini     }
1446534831adSStefano Zampini     /* Now we loop on the constraints which need a change of basis */
1447534831adSStefano Zampini     /* Change of basis matrix is evaluated as the FIRST APPROACH in */
1448534831adSStefano Zampini     /* Klawonn and Widlund, Dual-primal FETI-DP methods for linear elasticity, (6.2.1) */
1449534831adSStefano Zampini     temp_constraints = 0;
1450534831adSStefano Zampini     temp_start_ptr = temp_indices_to_constraint_B[temp_indices[pcbddc->n_vertices]];
1451534831adSStefano Zampini     for(i=pcbddc->n_vertices;i<local_primal_size;i++) {
1452534831adSStefano Zampini       if(change_basis[i]) {
1453534831adSStefano Zampini         compute_submatrix = PETSC_FALSE;
1454534831adSStefano Zampini         useksp = PETSC_FALSE;
1455534831adSStefano Zampini         if(temp_start_ptr == temp_indices_to_constraint_B[temp_indices[i]]) {
1456534831adSStefano Zampini           temp_constraints++;
1457534831adSStefano Zampini           if(temp_start_ptr != temp_indices_to_constraint_B[temp_indices[i+1]]) {
1458534831adSStefano Zampini             compute_submatrix = PETSC_TRUE;
1459534831adSStefano Zampini           }
1460534831adSStefano Zampini         }
1461534831adSStefano Zampini         if(compute_submatrix) {
1462534831adSStefano Zampini           if(temp_constraints > 1 || pcbddc->use_nnsp_true) {
1463534831adSStefano Zampini             useksp = PETSC_TRUE;
1464534831adSStefano Zampini           }
1465534831adSStefano Zampini           size_of_constraint = temp_indices[i+1]-temp_indices[i];
1466534831adSStefano Zampini           if(useksp) { /* experimental */
1467534831adSStefano Zampini             ierr = MatCreate(PETSC_COMM_SELF,&temp_mat);CHKERRQ(ierr);
1468534831adSStefano Zampini             ierr = MatSetType(temp_mat,impMatType);CHKERRQ(ierr);
1469534831adSStefano Zampini             ierr = MatSetSizes(temp_mat,size_of_constraint,size_of_constraint,size_of_constraint,size_of_constraint);CHKERRQ(ierr);
1470534831adSStefano Zampini             ierr = MatSeqAIJSetPreallocation(temp_mat,size_of_constraint,PETSC_NULL);CHKERRQ(ierr);
1471534831adSStefano Zampini           }
1472534831adSStefano Zampini           /* First _size_of_constraint-temp_constraints_ columns */
1473534831adSStefano Zampini           dual_dofs = size_of_constraint-temp_constraints;
1474534831adSStefano Zampini           start_constraint = i+1-temp_constraints;
1475534831adSStefano Zampini           for(s=0;s<dual_dofs;s++) {
1476534831adSStefano Zampini             is_indices[0] = s;
1477534831adSStefano Zampini             for(j=0;j<temp_constraints;j++) {
1478534831adSStefano Zampini               for(k=0;k<temp_constraints;k++) {
1479534831adSStefano Zampini                 temp_basis[j*temp_constraints+k]=temp_quadrature_constraint[temp_indices[start_constraint+k]+s+j+1];
1480534831adSStefano Zampini               }
1481534831adSStefano Zampini               work[j]=-temp_quadrature_constraint[temp_indices[start_constraint+j]+s];
1482534831adSStefano Zampini               is_indices[j+1]=s+j+1;
1483534831adSStefano Zampini             }
1484534831adSStefano Zampini             Bt = temp_constraints;
1485534831adSStefano Zampini             ierr = PetscFPTrapPush(PETSC_FP_TRAP_OFF);CHKERRQ(ierr);
1486534831adSStefano Zampini             LAPACKgesv_(&Bt,&Bone,temp_basis,&Bt,ipiv,work,&Bt,&lierr);
1487534831adSStefano Zampini             if ( lierr ) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in GESV Lapack routine %d",(int)lierr);
1488534831adSStefano Zampini             ierr = PetscFPTrapPop();CHKERRQ(ierr);
1489534831adSStefano Zampini             j = temp_indices_to_constraint_B[temp_indices[start_constraint]+s];
1490534831adSStefano Zampini             ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,temp_constraints,&temp_indices_to_constraint_B[temp_indices[start_constraint]+s+1],1,&j,work,INSERT_VALUES);CHKERRQ(ierr);
1491534831adSStefano Zampini             if(useksp) {
1492534831adSStefano Zampini               /* temp mat with transposed rows and columns */
1493534831adSStefano Zampini               ierr = MatSetValues(temp_mat,1,&s,temp_constraints,&is_indices[1],work,INSERT_VALUES);CHKERRQ(ierr);
1494534831adSStefano Zampini               ierr = MatSetValue(temp_mat,is_indices[0],is_indices[0],1.0,INSERT_VALUES);CHKERRQ(ierr);
1495534831adSStefano Zampini             }
1496534831adSStefano Zampini           }
1497534831adSStefano Zampini           if(useksp) {
1498534831adSStefano Zampini             /* last rows of temp_mat */
1499534831adSStefano Zampini             for(j=0;j<size_of_constraint;j++) {
1500534831adSStefano Zampini               is_indices[j] = j;
1501534831adSStefano Zampini             }
1502534831adSStefano Zampini             for(s=0;s<temp_constraints;s++) {
1503534831adSStefano Zampini               k = s + dual_dofs;
1504534831adSStefano Zampini               ierr = MatSetValues(temp_mat,1,&k,size_of_constraint,is_indices,&temp_quadrature_constraint[temp_indices[start_constraint+s]],INSERT_VALUES);CHKERRQ(ierr);
1505534831adSStefano Zampini             }
1506534831adSStefano Zampini             ierr = MatAssemblyBegin(temp_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1507534831adSStefano Zampini             ierr = MatAssemblyEnd(temp_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1508534831adSStefano Zampini             ierr = MatGetVecs(temp_mat,&temp_vec,PETSC_NULL);CHKERRQ(ierr);
1509534831adSStefano Zampini             ierr = KSPCreate(PETSC_COMM_SELF,&temp_ksp);CHKERRQ(ierr);
1510534831adSStefano Zampini             ierr = KSPSetOperators(temp_ksp,temp_mat,temp_mat,SAME_PRECONDITIONER);CHKERRQ(ierr);
1511534831adSStefano Zampini             ierr = KSPSetType(temp_ksp,KSPPREONLY);CHKERRQ(ierr);
1512534831adSStefano Zampini             ierr = KSPSetUp(temp_ksp);CHKERRQ(ierr);
1513534831adSStefano Zampini             for(s=0;s<temp_constraints;s++) {
1514534831adSStefano Zampini               ierr = VecSet(temp_vec,0.0);CHKERRQ(ierr);
1515534831adSStefano Zampini               ierr = VecSetValue(temp_vec,s+dual_dofs,1.0,INSERT_VALUES);CHKERRQ(ierr);
1516534831adSStefano Zampini               ierr = VecAssemblyBegin(temp_vec);CHKERRQ(ierr);
1517534831adSStefano Zampini               ierr = VecAssemblyEnd(temp_vec);CHKERRQ(ierr);
1518534831adSStefano Zampini               ierr = KSPSolve(temp_ksp,temp_vec,temp_vec);CHKERRQ(ierr);
1519534831adSStefano Zampini               ierr = VecGetArray(temp_vec,&array_vector);CHKERRQ(ierr);
1520534831adSStefano Zampini               j = temp_indices_to_constraint_B[temp_indices[start_constraint+s]+size_of_constraint-s-1];
1521534831adSStefano Zampini               /* last columns of change of basis matrix associated to new primal dofs */
1522534831adSStefano Zampini               ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,size_of_constraint,&temp_indices_to_constraint_B[temp_indices[start_constraint+s]],1,&j,array_vector,INSERT_VALUES);CHKERRQ(ierr);
1523534831adSStefano Zampini               ierr = VecRestoreArray(temp_vec,&array_vector);CHKERRQ(ierr);
1524534831adSStefano Zampini             }
1525534831adSStefano Zampini             ierr = MatDestroy(&temp_mat);CHKERRQ(ierr);
1526534831adSStefano Zampini             ierr = KSPDestroy(&temp_ksp);CHKERRQ(ierr);
1527534831adSStefano Zampini             ierr = VecDestroy(&temp_vec);CHKERRQ(ierr);
1528534831adSStefano Zampini           } else {
1529534831adSStefano Zampini             /* last columns of change of basis matrix associated to new primal dofs */
1530534831adSStefano Zampini             for(s=0;s<temp_constraints;s++) {
1531534831adSStefano Zampini               j = temp_indices_to_constraint_B[temp_indices[start_constraint+s]+size_of_constraint-s-1];
1532534831adSStefano Zampini               ierr = MatSetValues(pcbddc->ChangeOfBasisMatrix,size_of_constraint,&temp_indices_to_constraint_B[temp_indices[start_constraint+s]],1,&j,&temp_quadrature_constraint[temp_indices[start_constraint+s]],INSERT_VALUES);CHKERRQ(ierr);
1533534831adSStefano Zampini             }
1534534831adSStefano Zampini           }
1535534831adSStefano Zampini           /* prepare for the next cycle */
1536534831adSStefano Zampini           temp_constraints = 0;
1537534831adSStefano Zampini           temp_start_ptr = temp_indices_to_constraint_B[temp_indices[i+1]];
1538534831adSStefano Zampini         }
1539534831adSStefano Zampini       }
1540534831adSStefano Zampini     }
1541534831adSStefano Zampini     /* assembling */
1542534831adSStefano Zampini     ierr = MatAssemblyBegin(pcbddc->ChangeOfBasisMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1543534831adSStefano Zampini     ierr = MatAssemblyEnd(pcbddc->ChangeOfBasisMatrix,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1544534831adSStefano Zampini     ierr = PetscFree(ipiv);CHKERRQ(ierr);
1545534831adSStefano Zampini     ierr = PetscFree(is_indices);CHKERRQ(ierr);
1546534831adSStefano Zampini   }
15473b03a366Sstefano_zampini   /* free workspace no longer needed */
15483b03a366Sstefano_zampini   ierr = PetscFree(rwork);CHKERRQ(ierr);
15493b03a366Sstefano_zampini   ierr = PetscFree(work);CHKERRQ(ierr);
15503b03a366Sstefano_zampini   ierr = PetscFree(temp_basis);CHKERRQ(ierr);
15513b03a366Sstefano_zampini   ierr = PetscFree(singular_vals);CHKERRQ(ierr);
15523b03a366Sstefano_zampini   ierr = PetscFree(correlation_mat);CHKERRQ(ierr);
15533b03a366Sstefano_zampini   ierr = PetscFree(temp_indices);CHKERRQ(ierr);
1554534831adSStefano Zampini   ierr = PetscFree(change_basis);CHKERRQ(ierr);
15553b03a366Sstefano_zampini   ierr = PetscFree(temp_indices_to_constraint);CHKERRQ(ierr);
1556534831adSStefano Zampini   ierr = PetscFree(temp_indices_to_constraint_B);CHKERRQ(ierr);
1557534831adSStefano Zampini   ierr = PetscFree(local_to_B);CHKERRQ(ierr);
15583b03a366Sstefano_zampini   ierr = PetscFree(temp_quadrature_constraint);CHKERRQ(ierr);
1559da1bb401SStefano Zampini   for(k=0;k<nnsp_size;k++) {
1560da1bb401SStefano Zampini     ierr = VecDestroy(&localnearnullsp[k]);CHKERRQ(ierr);
1561da1bb401SStefano Zampini   }
15623b03a366Sstefano_zampini   ierr = PetscFree(localnearnullsp);CHKERRQ(ierr);
15633b03a366Sstefano_zampini   PetscFunctionReturn(0);
15643b03a366Sstefano_zampini }
1565de534f79Sstefano_zampini #ifdef UNDEF_PETSC_MISSING_LAPACK_GESVD
15663b03a366Sstefano_zampini #undef PETSC_MISSING_LAPACK_GESVD
15673b03a366Sstefano_zampini #endif
15683b03a366Sstefano_zampini /* -------------------------------------------------------------------------- */
15690c7d97c5SJed Brown #undef __FUNCT__
15700c7d97c5SJed Brown #define __FUNCT__ "PCBDDCCoarseSetUp"
157153cdbc3dSStefano Zampini static PetscErrorCode PCBDDCCoarseSetUp(PC pc)
15720c7d97c5SJed Brown {
15730c7d97c5SJed Brown   PetscErrorCode  ierr;
15740c7d97c5SJed Brown 
15750c7d97c5SJed Brown   PC_IS*            pcis = (PC_IS*)(pc->data);
15760c7d97c5SJed Brown   PC_BDDC*          pcbddc = (PC_BDDC*)pc->data;
15770c7d97c5SJed Brown   Mat_IS            *matis = (Mat_IS*)pc->pmat->data;
1578534831adSStefano Zampini   Mat               change_mat_all;
15790c7d97c5SJed Brown   IS                is_R_local;
15800c7d97c5SJed Brown   IS                is_V_local;
15810c7d97c5SJed Brown   IS                is_C_local;
15820c7d97c5SJed Brown   IS                is_aux1;
15830c7d97c5SJed Brown   IS                is_aux2;
15840c7d97c5SJed Brown   const VecType     impVecType;
15850c7d97c5SJed Brown   const MatType     impMatType;
15860c7d97c5SJed Brown   PetscInt          n_R=0;
15870c7d97c5SJed Brown   PetscInt          n_D=0;
15880c7d97c5SJed Brown   PetscInt          n_B=0;
15890c7d97c5SJed Brown   PetscScalar       zero=0.0;
15900c7d97c5SJed Brown   PetscScalar       one=1.0;
15910c7d97c5SJed Brown   PetscScalar       m_one=-1.0;
15920c7d97c5SJed Brown   PetscScalar*      array;
15930c7d97c5SJed Brown   PetscScalar       *coarse_submat_vals;
15940c7d97c5SJed Brown   PetscInt          *idx_R_local;
15950c7d97c5SJed Brown   PetscInt          *idx_V_B;
15960c7d97c5SJed Brown   PetscScalar       *coarsefunctions_errors;
15970c7d97c5SJed Brown   PetscScalar       *constraints_errors;
15980c7d97c5SJed Brown   /* auxiliary indices */
1599534831adSStefano Zampini   PetscInt i,j,k;
1600e269702eSStefano Zampini   /* for verbose output of bddc */
1601e269702eSStefano Zampini   PetscViewer       viewer=pcbddc->dbg_viewer;
1602e269702eSStefano Zampini   PetscBool         dbg_flag=pcbddc->dbg_flag;
1603a0ba757dSStefano Zampini   /* for counting coarse dofs */
1604534831adSStefano Zampini   PetscInt          n_vertices,n_constraints;
16053b03a366Sstefano_zampini   PetscInt          size_of_constraint;
16063b03a366Sstefano_zampini   PetscInt          *row_cmat_indices;
16073b03a366Sstefano_zampini   PetscScalar       *row_cmat_values;
1608534831adSStefano Zampini   PetscInt          *vertices,*nnz,*is_indices,*temp_indices;
16090c7d97c5SJed Brown 
16100c7d97c5SJed Brown   PetscFunctionBegin;
16110c7d97c5SJed Brown   /* Set Non-overlapping dimensions */
16120c7d97c5SJed Brown   n_B = pcis->n_B; n_D = pcis->n - n_B;
1613534831adSStefano Zampini   /* Set types for local objects needed by BDDC preconditioner */
1614534831adSStefano Zampini   impMatType = MATSEQDENSE;
1615534831adSStefano Zampini   impVecType = VECSEQ;
1616da1bb401SStefano Zampini   /* get vertex indices from constraint matrix */
1617534831adSStefano Zampini   ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscInt),&vertices);CHKERRQ(ierr);
1618534831adSStefano Zampini   n_vertices=0;
1619da1bb401SStefano Zampini   for(i=0;i<pcbddc->local_primal_size;i++) {
1620da1bb401SStefano Zampini     ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
1621da1bb401SStefano Zampini     if(size_of_constraint == 1) {
1622534831adSStefano Zampini       vertices[n_vertices]=row_cmat_indices[0];
1623534831adSStefano Zampini       n_vertices++;
1624a0ba757dSStefano Zampini     }
1625da1bb401SStefano Zampini     ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
1626a0ba757dSStefano Zampini   }
1627534831adSStefano Zampini   /* Set number of constraints */
1628534831adSStefano Zampini   n_constraints = pcbddc->local_primal_size-n_vertices;
1629534831adSStefano Zampini 
1630534831adSStefano Zampini   /* vertices in boundary numbering */
1631534831adSStefano Zampini   if(n_vertices) {
1632534831adSStefano Zampini     ierr = VecSet(pcis->vec1_N,m_one);CHKERRQ(ierr);
1633534831adSStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1634534831adSStefano Zampini     for (i=0; i<n_vertices; i++) { array[ vertices[i] ] = i; }
1635534831adSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1636534831adSStefano Zampini     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1637534831adSStefano Zampini     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
1638534831adSStefano Zampini     ierr = PetscMalloc(n_vertices*sizeof(PetscInt),&idx_V_B);CHKERRQ(ierr);
1639534831adSStefano Zampini     ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
1640534831adSStefano Zampini     for (i=0; i<n_vertices; i++) {
1641534831adSStefano Zampini       j=0;
1642534831adSStefano Zampini       while (array[j] != i ) {j++;}
1643534831adSStefano Zampini       idx_V_B[i]=j;
1644534831adSStefano Zampini     }
1645534831adSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
1646534831adSStefano Zampini   }
1647534831adSStefano Zampini 
1648534831adSStefano Zampini   /* transform local matrices if needed */
1649534831adSStefano Zampini   if(pcbddc->usechangeofbasis) {
1650534831adSStefano Zampini     ierr = PetscMalloc(pcis->n*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
1651534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
1652534831adSStefano Zampini     for(i=0;i<n_D;i++) {
1653534831adSStefano Zampini       nnz[is_indices[i]]=1;
1654534831adSStefano Zampini     }
1655534831adSStefano Zampini     ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
1656534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
1657534831adSStefano Zampini     k=1;
1658534831adSStefano Zampini     for(i=0;i<n_B;i++) {
1659534831adSStefano Zampini       ierr = MatGetRow(pcbddc->ChangeOfBasisMatrix,i,&j,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr);
1660534831adSStefano Zampini       nnz[is_indices[i]]=j;
1661534831adSStefano Zampini       if( k < j) {
1662534831adSStefano Zampini         k = j;
1663534831adSStefano Zampini       }
1664534831adSStefano Zampini       ierr = MatRestoreRow(pcbddc->ChangeOfBasisMatrix,i,&j,PETSC_NULL,PETSC_NULL);CHKERRQ(ierr);
1665534831adSStefano Zampini     }
1666534831adSStefano Zampini     ierr = ISRestoreIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
1667534831adSStefano Zampini     /* assemble change of basis matrix on the whole set of local dofs */
1668534831adSStefano Zampini     ierr = PetscMalloc(k*sizeof(PetscInt),&temp_indices);CHKERRQ(ierr);
1669534831adSStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&change_mat_all);CHKERRQ(ierr);
1670534831adSStefano Zampini     ierr = MatSetSizes(change_mat_all,pcis->n,pcis->n,pcis->n,pcis->n);CHKERRQ(ierr);
1671534831adSStefano Zampini     ierr = MatSetType(change_mat_all,MATSEQAIJ);CHKERRQ(ierr);
1672534831adSStefano Zampini     ierr = MatSeqAIJSetPreallocation(change_mat_all,0,nnz);CHKERRQ(ierr);
1673534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
1674534831adSStefano Zampini     for(i=0;i<n_D;i++) {
1675534831adSStefano Zampini       ierr = MatSetValue(change_mat_all,is_indices[i],is_indices[i],1.0,INSERT_VALUES);CHKERRQ(ierr);
1676534831adSStefano Zampini     }
1677534831adSStefano Zampini     ierr = ISRestoreIndices(pcis->is_I_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
1678534831adSStefano Zampini     ierr = ISGetIndices(pcis->is_B_local,(const PetscInt**)&is_indices);CHKERRQ(ierr);
1679534831adSStefano Zampini     for(i=0;i<n_B;i++) {
1680534831adSStefano Zampini       ierr = MatGetRow(pcbddc->ChangeOfBasisMatrix,i,&j,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
1681534831adSStefano Zampini       for(k=0;k<j;k++) {
1682534831adSStefano Zampini         temp_indices[k]=is_indices[row_cmat_indices[k]];
1683534831adSStefano Zampini       }
1684534831adSStefano Zampini       ierr = MatSetValues(change_mat_all,1,&is_indices[i],j,temp_indices,row_cmat_values,INSERT_VALUES);CHKERRQ(ierr);
1685534831adSStefano Zampini       ierr = MatRestoreRow(pcbddc->ChangeOfBasisMatrix,i,&j,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
1686534831adSStefano Zampini     }
1687534831adSStefano Zampini     ierr = MatAssemblyBegin(change_mat_all,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1688534831adSStefano Zampini     ierr = MatAssemblyEnd(change_mat_all,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
1689534831adSStefano Zampini     ierr = MatPtAP(matis->A,change_mat_all,MAT_INITIAL_MATRIX,1.0,&pcbddc->local_mat);CHKERRQ(ierr);
1690534831adSStefano Zampini     ierr = MatDestroy(&pcis->A_IB);CHKERRQ(ierr);
1691534831adSStefano Zampini     ierr = MatDestroy(&pcis->A_BI);CHKERRQ(ierr);
1692534831adSStefano Zampini     ierr = MatDestroy(&pcis->A_BB);CHKERRQ(ierr);
1693534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_I_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&pcis->A_IB);CHKERRQ(ierr);
1694534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_B_local,pcis->is_I_local,MAT_INITIAL_MATRIX,&pcis->A_BI);CHKERRQ(ierr);
1695534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,pcis->is_B_local,pcis->is_B_local,MAT_INITIAL_MATRIX,&pcis->A_BB);CHKERRQ(ierr);
1696534831adSStefano Zampini     ierr = MatDestroy(&change_mat_all);CHKERRQ(ierr);
1697534831adSStefano Zampini     ierr = PetscFree(nnz);CHKERRQ(ierr);
1698534831adSStefano Zampini     ierr = PetscFree(temp_indices);CHKERRQ(ierr);
1699534831adSStefano Zampini   } else {
1700534831adSStefano Zampini     /* without change of basis, the local matrix is unchanged */
1701534831adSStefano Zampini     ierr = PetscObjectReference((PetscObject)matis->A);CHKERRQ(ierr);
1702534831adSStefano Zampini     pcbddc->local_mat = matis->A;
1703534831adSStefano Zampini   }
1704a0ba757dSStefano Zampini 
17050c7d97c5SJed Brown   /* Dohrmann's notation: dofs split into R (Remaining: all dofs but the vertices) and V (Vertices) */
17060c7d97c5SJed Brown   ierr = VecSet(pcis->vec1_N,one);CHKERRQ(ierr);
17070c7d97c5SJed Brown   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
17083b03a366Sstefano_zampini   for (i=0;i<n_vertices;i++) { array[ vertices[i] ] = zero; }
17093b03a366Sstefano_zampini   ierr = PetscMalloc(( pcis->n - n_vertices )*sizeof(PetscInt),&idx_R_local);CHKERRQ(ierr);
17100c7d97c5SJed Brown   for (i=0, n_R=0; i<pcis->n; i++) { if (array[i] == one) { idx_R_local[n_R] = i; n_R++; } }
17110c7d97c5SJed Brown   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1712e269702eSStefano Zampini   if(dbg_flag) {
17130c7d97c5SJed Brown     ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
17140c7d97c5SJed Brown     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
17150c7d97c5SJed Brown     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d local dimensions\n",PetscGlobalRank);CHKERRQ(ierr);
17160c7d97c5SJed Brown     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local_size = %d, dirichlet_size = %d, boundary_size = %d\n",pcis->n,n_D,n_B);CHKERRQ(ierr);
17173b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"r_size = %d, v_size = %d, constraints = %d, local_primal_size = %d\n",n_R,n_vertices,n_constraints,pcbddc->local_primal_size);CHKERRQ(ierr);
1718534831adSStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"pcbddc->n_vertices = %d, pcbddc->n_constraints = %d\n",pcbddc->n_vertices,pcbddc->n_constraints);CHKERRQ(ierr);
17190c7d97c5SJed Brown     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
17200c7d97c5SJed Brown   }
1721534831adSStefano Zampini 
17220c7d97c5SJed Brown   /* Allocate needed vectors */
1723534831adSStefano Zampini   ierr = VecDuplicate(pcis->vec1_global,&pcbddc->original_rhs);CHKERRQ(ierr);
17243972b0daSStefano Zampini   ierr = VecDuplicate(pcis->vec1_global,&pcbddc->temp_solution);CHKERRQ(ierr);
17250c7d97c5SJed Brown   ierr = VecDuplicate(pcis->vec1_D,&pcbddc->vec4_D);CHKERRQ(ierr);
17260c7d97c5SJed Brown   ierr = VecCreate(PETSC_COMM_SELF,&pcbddc->vec1_R);CHKERRQ(ierr);
17270c7d97c5SJed Brown   ierr = VecSetSizes(pcbddc->vec1_R,n_R,n_R);CHKERRQ(ierr);
17280c7d97c5SJed Brown   ierr = VecSetType(pcbddc->vec1_R,impVecType);CHKERRQ(ierr);
1729d49ef151SStefano Zampini   ierr = VecDuplicate(pcbddc->vec1_R,&pcbddc->vec2_R);CHKERRQ(ierr);
17300c7d97c5SJed Brown   ierr = VecCreate(PETSC_COMM_SELF,&pcbddc->vec1_P);CHKERRQ(ierr);
17310c7d97c5SJed Brown   ierr = VecSetSizes(pcbddc->vec1_P,pcbddc->local_primal_size,pcbddc->local_primal_size);CHKERRQ(ierr);
17320c7d97c5SJed Brown   ierr = VecSetType(pcbddc->vec1_P,impVecType);CHKERRQ(ierr);
17330c7d97c5SJed Brown 
17340c7d97c5SJed Brown   /* Creating some index sets needed  */
17350c7d97c5SJed Brown   /* For submatrices */
1736da1bb401SStefano Zampini   ierr = ISCreateGeneral(PETSC_COMM_SELF,n_R,idx_R_local,PETSC_OWN_POINTER,&is_R_local);CHKERRQ(ierr);
17373b03a366Sstefano_zampini   if(n_vertices)    {
1738da1bb401SStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,n_vertices,vertices,PETSC_OWN_POINTER,&is_V_local);CHKERRQ(ierr);
17393b03a366Sstefano_zampini   }
1740da1bb401SStefano Zampini   if(n_constraints) {
1741da1bb401SStefano Zampini     ierr = ISCreateStride(PETSC_COMM_SELF,n_constraints,n_vertices,1,&is_C_local);CHKERRQ(ierr);
1742da1bb401SStefano Zampini   }
1743da1bb401SStefano Zampini 
17440c7d97c5SJed Brown   /* For VecScatters pcbddc->R_to_B and (optionally) pcbddc->R_to_D */
17450c7d97c5SJed Brown   {
17460c7d97c5SJed Brown     PetscInt   *aux_array1;
17470c7d97c5SJed Brown     PetscInt   *aux_array2;
17480c7d97c5SJed Brown 
17493b03a366Sstefano_zampini     ierr = PetscMalloc( (pcis->n_B-n_vertices)*sizeof(PetscInt),&aux_array1);CHKERRQ(ierr);
17503b03a366Sstefano_zampini     ierr = PetscMalloc( (pcis->n_B-n_vertices)*sizeof(PetscInt),&aux_array2);CHKERRQ(ierr);
17510c7d97c5SJed Brown 
1752d49ef151SStefano Zampini     ierr = VecSet(pcis->vec1_global,zero);CHKERRQ(ierr);
17530c7d97c5SJed Brown     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
17540c7d97c5SJed Brown     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
17550c7d97c5SJed Brown     ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
17560c7d97c5SJed Brown     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
17570c7d97c5SJed Brown     ierr = VecScatterBegin(pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
17580c7d97c5SJed Brown     ierr = VecScatterEnd  (pcis->N_to_B,pcis->vec1_N,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
17590c7d97c5SJed Brown     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1760da1bb401SStefano Zampini     for (i=0, j=0; i<n_R; i++) { if (array[idx_R_local[i]] > one) { aux_array1[j] = i; j++; } }
17610c7d97c5SJed Brown     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1762da1bb401SStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_COPY_VALUES,&is_aux1);CHKERRQ(ierr);
17630c7d97c5SJed Brown     ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
1764da1bb401SStefano Zampini     for (i=0, j=0; i<n_B; i++) { if (array[i] > one) { aux_array2[j] = i; j++; } }
17653828260eSStefano Zampini     ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
1766da1bb401SStefano Zampini     ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array2,PETSC_COPY_VALUES,&is_aux2);CHKERRQ(ierr);
17670c7d97c5SJed Brown     ierr = VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_B,is_aux2,&pcbddc->R_to_B);CHKERRQ(ierr);
17680c7d97c5SJed Brown     ierr = PetscFree(aux_array1);CHKERRQ(ierr);
17690c7d97c5SJed Brown     ierr = PetscFree(aux_array2);CHKERRQ(ierr);
17700c7d97c5SJed Brown     ierr = ISDestroy(&is_aux1);CHKERRQ(ierr);
17710c7d97c5SJed Brown     ierr = ISDestroy(&is_aux2);CHKERRQ(ierr);
17720c7d97c5SJed Brown 
1773e269702eSStefano Zampini     if(pcbddc->prec_type || dbg_flag ) {
17740c7d97c5SJed Brown       ierr = PetscMalloc(n_D*sizeof(PetscInt),&aux_array1);CHKERRQ(ierr);
17750c7d97c5SJed Brown       ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1776da1bb401SStefano Zampini       for (i=0, j=0; i<n_R; i++) { if (array[idx_R_local[i]] == one) { aux_array1[j] = i; j++; } }
17770c7d97c5SJed Brown       ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
1778da1bb401SStefano Zampini       ierr = ISCreateGeneral(PETSC_COMM_SELF,j,aux_array1,PETSC_COPY_VALUES,&is_aux1);CHKERRQ(ierr);
17790c7d97c5SJed Brown       ierr = VecScatterCreate(pcbddc->vec1_R,is_aux1,pcis->vec1_D,(IS)0,&pcbddc->R_to_D);CHKERRQ(ierr);
17800c7d97c5SJed Brown       ierr = PetscFree(aux_array1);CHKERRQ(ierr);
17810c7d97c5SJed Brown       ierr = ISDestroy(&is_aux1);CHKERRQ(ierr);
17820c7d97c5SJed Brown     }
17830c7d97c5SJed Brown   }
17840c7d97c5SJed Brown 
17850c7d97c5SJed Brown   /* Creating PC contexts for local Dirichlet and Neumann problems */
17860c7d97c5SJed Brown   {
17870c7d97c5SJed Brown     Mat  A_RR;
178853cdbc3dSStefano Zampini     PC   pc_temp;
17890c7d97c5SJed Brown     /* Matrix for Dirichlet problem is A_II -> we already have it from pcis.c code */
179053cdbc3dSStefano Zampini     ierr = KSPCreate(PETSC_COMM_SELF,&pcbddc->ksp_D);CHKERRQ(ierr);
179153cdbc3dSStefano Zampini     ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->ksp_D,(PetscObject)pc,1);CHKERRQ(ierr);
179253cdbc3dSStefano Zampini     ierr = KSPSetOperators(pcbddc->ksp_D,pcis->A_II,pcis->A_II,SAME_PRECONDITIONER);CHKERRQ(ierr);
179353cdbc3dSStefano Zampini     ierr = KSPSetType(pcbddc->ksp_D,KSPPREONLY);CHKERRQ(ierr);
1794da1bb401SStefano Zampini     ierr = KSPSetOptionsPrefix(pcbddc->ksp_D,"dirichlet_");CHKERRQ(ierr);
17950c7d97c5SJed Brown     /* default */
179653cdbc3dSStefano Zampini     ierr = KSPGetPC(pcbddc->ksp_D,&pc_temp);CHKERRQ(ierr);
179753cdbc3dSStefano Zampini     ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr);
17980c7d97c5SJed Brown     /* Allow user's customization */
179953cdbc3dSStefano Zampini     ierr = KSPSetFromOptions(pcbddc->ksp_D);CHKERRQ(ierr);
180053cdbc3dSStefano Zampini     /* Set Up KSP for Dirichlet problem of BDDC */
180153cdbc3dSStefano Zampini     ierr = KSPSetUp(pcbddc->ksp_D);CHKERRQ(ierr);
18023972b0daSStefano Zampini     /* set ksp_D into pcis data */
18033972b0daSStefano Zampini     ierr = KSPDestroy(&pcis->ksp_D);CHKERRQ(ierr);
18043972b0daSStefano Zampini     ierr = PetscObjectReference((PetscObject)pcbddc->ksp_D);CHKERRQ(ierr);
18053972b0daSStefano Zampini     pcis->ksp_D = pcbddc->ksp_D;
1806da1bb401SStefano Zampini     if(pcbddc->dbg_flag) ierr = KSPView(pcbddc->ksp_D,PETSC_VIEWER_STDOUT_SELF);
18070c7d97c5SJed Brown     /* Matrix for Neumann problem is A_RR -> we need to create it */
1808534831adSStefano Zampini     ierr = MatGetSubMatrix(pcbddc->local_mat,is_R_local,is_R_local,MAT_INITIAL_MATRIX,&A_RR);CHKERRQ(ierr);
180953cdbc3dSStefano Zampini     ierr = KSPCreate(PETSC_COMM_SELF,&pcbddc->ksp_R);CHKERRQ(ierr);
181053cdbc3dSStefano Zampini     ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->ksp_R,(PetscObject)pc,1);CHKERRQ(ierr);
181153cdbc3dSStefano Zampini     ierr = KSPSetOperators(pcbddc->ksp_R,A_RR,A_RR,SAME_PRECONDITIONER);CHKERRQ(ierr);
181253cdbc3dSStefano Zampini     ierr = KSPSetType(pcbddc->ksp_R,KSPPREONLY);CHKERRQ(ierr);
1813da1bb401SStefano Zampini     ierr = KSPSetOptionsPrefix(pcbddc->ksp_R,"neumann_");CHKERRQ(ierr);
18140c7d97c5SJed Brown     /* default */
181553cdbc3dSStefano Zampini     ierr = KSPGetPC(pcbddc->ksp_R,&pc_temp);CHKERRQ(ierr);
181653cdbc3dSStefano Zampini     ierr = PCSetType(pc_temp,PCLU);CHKERRQ(ierr);
18170c7d97c5SJed Brown     /* Allow user's customization */
181853cdbc3dSStefano Zampini     ierr = KSPSetFromOptions(pcbddc->ksp_R);CHKERRQ(ierr);
181953cdbc3dSStefano Zampini     /* Set Up KSP for Neumann problem of BDDC */
182053cdbc3dSStefano Zampini     ierr = KSPSetUp(pcbddc->ksp_R);CHKERRQ(ierr);
1821da1bb401SStefano Zampini     if(pcbddc->dbg_flag) ierr = KSPView(pcbddc->ksp_R,PETSC_VIEWER_STDOUT_SELF);
1822a0ba757dSStefano Zampini     /* check Dirichlet and Neumann solvers */
1823e269702eSStefano Zampini     if(pcbddc->dbg_flag) {
18240c7d97c5SJed Brown       Vec temp_vec;
18250c7d97c5SJed Brown       PetscScalar value;
18260c7d97c5SJed Brown 
1827a0ba757dSStefano Zampini       ierr = VecDuplicate(pcis->vec1_D,&temp_vec);CHKERRQ(ierr);
1828a0ba757dSStefano Zampini       ierr = VecSetRandom(pcis->vec1_D,PETSC_NULL);CHKERRQ(ierr);
1829a0ba757dSStefano Zampini       ierr = MatMult(pcis->A_II,pcis->vec1_D,pcis->vec2_D);CHKERRQ(ierr);
1830a0ba757dSStefano Zampini       ierr = KSPSolve(pcbddc->ksp_D,pcis->vec2_D,temp_vec);CHKERRQ(ierr);
1831a0ba757dSStefano Zampini       ierr = VecAXPY(temp_vec,m_one,pcis->vec1_D);CHKERRQ(ierr);
1832a0ba757dSStefano Zampini       ierr = VecNorm(temp_vec,NORM_INFINITY,&value);CHKERRQ(ierr);
1833a0ba757dSStefano Zampini       ierr = VecDestroy(&temp_vec);CHKERRQ(ierr);
1834a0ba757dSStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
1835a0ba757dSStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
1836a0ba757dSStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Checking solution of Dirichlet and Neumann problems\n");CHKERRQ(ierr);
1837a0ba757dSStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d infinity error for Dirichlet solve = % 1.14e \n",PetscGlobalRank,value);CHKERRQ(ierr);
1838d49ef151SStefano Zampini       ierr = VecDuplicate(pcbddc->vec1_R,&temp_vec);CHKERRQ(ierr);
1839d49ef151SStefano Zampini       ierr = VecSetRandom(pcbddc->vec1_R,PETSC_NULL);CHKERRQ(ierr);
1840d49ef151SStefano Zampini       ierr = MatMult(A_RR,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
1841d49ef151SStefano Zampini       ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec2_R,temp_vec);CHKERRQ(ierr);
1842d49ef151SStefano Zampini       ierr = VecAXPY(temp_vec,m_one,pcbddc->vec1_R);CHKERRQ(ierr);
1843d49ef151SStefano Zampini       ierr = VecNorm(temp_vec,NORM_INFINITY,&value);CHKERRQ(ierr);
1844e269702eSStefano Zampini       ierr = VecDestroy(&temp_vec);CHKERRQ(ierr);
18450c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d infinity error for  Neumann  solve = % 1.14e \n",PetscGlobalRank,value);CHKERRQ(ierr);
1846d49ef151SStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
18470c7d97c5SJed Brown     }
18480c7d97c5SJed Brown     /* free Neumann problem's matrix */
18490c7d97c5SJed Brown     ierr = MatDestroy(&A_RR);CHKERRQ(ierr);
18500c7d97c5SJed Brown   }
18510c7d97c5SJed Brown 
18520c7d97c5SJed Brown   /* Assemble all remaining stuff needed to apply BDDC  */
18530c7d97c5SJed Brown   {
18540c7d97c5SJed Brown     Mat          A_RV,A_VR,A_VV;
18550c7d97c5SJed Brown     Mat          M1,M2;
18560c7d97c5SJed Brown     Mat          C_CR;
18573b03a366Sstefano_zampini     Mat          AUXMAT;
18580c7d97c5SJed Brown     Vec          vec1_C;
18590c7d97c5SJed Brown     Vec          vec2_C;
18600c7d97c5SJed Brown     Vec          vec1_V;
18610c7d97c5SJed Brown     Vec          vec2_V;
18620c7d97c5SJed Brown     PetscInt     *nnz;
18630c7d97c5SJed Brown     PetscInt     *auxindices;
186453cdbc3dSStefano Zampini     PetscInt     index;
18650c7d97c5SJed Brown     PetscScalar* array2;
18660c7d97c5SJed Brown     MatFactorInfo matinfo;
18670c7d97c5SJed Brown 
18680c7d97c5SJed Brown     /* Allocating some extra storage just to be safe */
18690c7d97c5SJed Brown     ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&nnz);CHKERRQ(ierr);
18700c7d97c5SJed Brown     ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&auxindices);CHKERRQ(ierr);
18710c7d97c5SJed Brown     for(i=0;i<pcis->n;i++) {auxindices[i]=i;}
18720c7d97c5SJed Brown 
18730c7d97c5SJed Brown     /* some work vectors on vertices and/or constraints */
18743b03a366Sstefano_zampini     if(n_vertices) {
18750c7d97c5SJed Brown       ierr = VecCreate(PETSC_COMM_SELF,&vec1_V);CHKERRQ(ierr);
18763b03a366Sstefano_zampini       ierr = VecSetSizes(vec1_V,n_vertices,n_vertices);CHKERRQ(ierr);
18770c7d97c5SJed Brown       ierr = VecSetType(vec1_V,impVecType);CHKERRQ(ierr);
18780c7d97c5SJed Brown       ierr = VecDuplicate(vec1_V,&vec2_V);CHKERRQ(ierr);
18790c7d97c5SJed Brown     }
1880534831adSStefano Zampini     if(n_constraints) {
18810c7d97c5SJed Brown       ierr = VecCreate(PETSC_COMM_SELF,&vec1_C);CHKERRQ(ierr);
1882534831adSStefano Zampini       ierr = VecSetSizes(vec1_C,n_constraints,n_constraints);CHKERRQ(ierr);
18830c7d97c5SJed Brown       ierr = VecSetType(vec1_C,impVecType);CHKERRQ(ierr);
18840c7d97c5SJed Brown       ierr = VecDuplicate(vec1_C,&vec2_C);CHKERRQ(ierr);
18850c7d97c5SJed Brown       ierr = VecDuplicate(vec1_C,&pcbddc->vec1_C);CHKERRQ(ierr);
18860c7d97c5SJed Brown     }
18870c7d97c5SJed Brown     /* Precompute stuffs needed for preprocessing and application of BDDC*/
18883b03a366Sstefano_zampini     if(n_constraints) {
18890c7d97c5SJed Brown       ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->local_auxmat2);CHKERRQ(ierr);
18903b03a366Sstefano_zampini       ierr = MatSetSizes(pcbddc->local_auxmat2,n_R,n_constraints,n_R,n_constraints);CHKERRQ(ierr);
18910c7d97c5SJed Brown       ierr = MatSetType(pcbddc->local_auxmat2,impMatType);CHKERRQ(ierr);
18923b03a366Sstefano_zampini       ierr = MatSeqDenseSetPreallocation(pcbddc->local_auxmat2,PETSC_NULL);CHKERRQ(ierr);
18930c7d97c5SJed Brown 
1894*57a90decSStefano Zampini       /* Create Constraint matrix on R nodes: C_{CR}  */
1895*57a90decSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->ConstraintMatrix,is_C_local,is_R_local,MAT_INITIAL_MATRIX,&C_CR);CHKERRQ(ierr);
1896*57a90decSStefano Zampini       ierr = ISDestroy(&is_C_local);CHKERRQ(ierr);
1897*57a90decSStefano Zampini 
18980c7d97c5SJed Brown       /* Assemble local_auxmat2 = - A_{RR}^{-1} C^T_{CR} needed by BDDC application */
18993b03a366Sstefano_zampini       for(i=0;i<n_constraints;i++) {
19003b03a366Sstefano_zampini         ierr = VecSet(pcbddc->vec1_R,zero);CHKERRQ(ierr);
19013b03a366Sstefano_zampini         /* Get row of constraint matrix in R numbering */
1902*57a90decSStefano Zampini         ierr = VecGetArray(pcbddc->vec1_R,&array);CHKERRQ(ierr);
1903*57a90decSStefano Zampini         ierr = MatGetRow(C_CR,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
19043b03a366Sstefano_zampini         for(j=0;j<size_of_constraint;j++) { array[ row_cmat_indices[j] ] = - row_cmat_values[j]; }
1905*57a90decSStefano Zampini         ierr = MatRestoreRow(C_CR,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,(const PetscScalar**)&row_cmat_values);CHKERRQ(ierr);
1906*57a90decSStefano Zampini         ierr = VecRestoreArray(pcbddc->vec1_R,&array);CHKERRQ(ierr);
19073b03a366Sstefano_zampini         /* Solve for row of constraint matrix in R numbering */
190853cdbc3dSStefano Zampini         ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
19093b03a366Sstefano_zampini         /* Set values */
19100c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec2_R,&array);CHKERRQ(ierr);
19113b03a366Sstefano_zampini         ierr = MatSetValues(pcbddc->local_auxmat2,n_R,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
19120c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec2_R,&array);CHKERRQ(ierr);
19130c7d97c5SJed Brown       }
19140c7d97c5SJed Brown       ierr = MatAssemblyBegin(pcbddc->local_auxmat2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
19150c7d97c5SJed Brown       ierr = MatAssemblyEnd(pcbddc->local_auxmat2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
19160c7d97c5SJed Brown 
19170c7d97c5SJed Brown       /* Assemble AUXMAT = ( LUFactor )( -C_{CR} A_{RR}^{-1} C^T_{CR} )^{-1} */
19180c7d97c5SJed Brown       ierr = MatMatMult(C_CR,pcbddc->local_auxmat2,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&AUXMAT);CHKERRQ(ierr);
1919d49ef151SStefano Zampini       ierr = MatFactorInfoInitialize(&matinfo);CHKERRQ(ierr);
19203b03a366Sstefano_zampini       ierr = ISCreateStride(PETSC_COMM_SELF,n_constraints,0,1,&is_aux1);CHKERRQ(ierr);
19210c7d97c5SJed Brown       ierr = MatLUFactor(AUXMAT,is_aux1,is_aux1,&matinfo);CHKERRQ(ierr);
19220c7d97c5SJed Brown       ierr = ISDestroy(&is_aux1);CHKERRQ(ierr);
19230c7d97c5SJed Brown 
19243b03a366Sstefano_zampini       /* Assemble explicitly M1 = ( C_{CR} A_{RR}^{-1} C^T_{CR} )^{-1} needed in preproc  */
1925d49ef151SStefano Zampini       ierr = MatCreate(PETSC_COMM_SELF,&M1);CHKERRQ(ierr);
19263b03a366Sstefano_zampini       ierr = MatSetSizes(M1,n_constraints,n_constraints,n_constraints,n_constraints);CHKERRQ(ierr);
19270c7d97c5SJed Brown       ierr = MatSetType(M1,impMatType);CHKERRQ(ierr);
19283b03a366Sstefano_zampini       ierr = MatSeqDenseSetPreallocation(M1,PETSC_NULL);CHKERRQ(ierr);
19293b03a366Sstefano_zampini       for(i=0;i<n_constraints;i++) {
19300c7d97c5SJed Brown         ierr = VecSet(vec1_C,zero);CHKERRQ(ierr);
19310c7d97c5SJed Brown         ierr = VecSetValue(vec1_C,i,one,INSERT_VALUES);CHKERRQ(ierr);
19320c7d97c5SJed Brown         ierr = VecAssemblyBegin(vec1_C);CHKERRQ(ierr);
19330c7d97c5SJed Brown         ierr = VecAssemblyEnd(vec1_C);CHKERRQ(ierr);
19340c7d97c5SJed Brown         ierr = MatSolve(AUXMAT,vec1_C,vec2_C);CHKERRQ(ierr);
19350c7d97c5SJed Brown         ierr = VecScale(vec2_C,m_one);CHKERRQ(ierr);
19360c7d97c5SJed Brown         ierr = VecGetArray(vec2_C,&array);CHKERRQ(ierr);
19373b03a366Sstefano_zampini         ierr = MatSetValues(M1,n_constraints,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
19380c7d97c5SJed Brown         ierr = VecRestoreArray(vec2_C,&array);CHKERRQ(ierr);
19390c7d97c5SJed Brown       }
19400c7d97c5SJed Brown       ierr = MatAssemblyBegin(M1,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
19410c7d97c5SJed Brown       ierr = MatAssemblyEnd(M1,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
19420c7d97c5SJed Brown       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
19430c7d97c5SJed Brown       /* Assemble local_auxmat1 = M1*C_{CR} needed by BDDC application in KSP and in preproc */
19440c7d97c5SJed Brown       ierr = MatMatMult(M1,C_CR,MAT_INITIAL_MATRIX,PETSC_DEFAULT,&pcbddc->local_auxmat1);CHKERRQ(ierr);
19450c7d97c5SJed Brown 
19460c7d97c5SJed Brown     }
19470c7d97c5SJed Brown 
19480c7d97c5SJed Brown     /* Get submatrices from subdomain matrix */
19493b03a366Sstefano_zampini     if(n_vertices){
1950534831adSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->local_mat,is_R_local,is_V_local,MAT_INITIAL_MATRIX,&A_RV);CHKERRQ(ierr);
1951534831adSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->local_mat,is_V_local,is_R_local,MAT_INITIAL_MATRIX,&A_VR);CHKERRQ(ierr);
1952534831adSStefano Zampini       ierr = MatGetSubMatrix(pcbddc->local_mat,is_V_local,is_V_local,MAT_INITIAL_MATRIX,&A_VV);CHKERRQ(ierr);
19530c7d97c5SJed Brown       /* Assemble M2 = A_RR^{-1}A_RV */
1954d49ef151SStefano Zampini       ierr = MatCreate(PETSC_COMM_SELF,&M2);CHKERRQ(ierr);
19553b03a366Sstefano_zampini       ierr = MatSetSizes(M2,n_R,n_vertices,n_R,n_vertices);CHKERRQ(ierr);
19560c7d97c5SJed Brown       ierr = MatSetType(M2,impMatType);CHKERRQ(ierr);
19573b03a366Sstefano_zampini       ierr = MatSeqDenseSetPreallocation(M2,PETSC_NULL);CHKERRQ(ierr);
19583b03a366Sstefano_zampini       for(i=0;i<n_vertices;i++) {
19590c7d97c5SJed Brown         ierr = VecSet(vec1_V,zero);CHKERRQ(ierr);
19600c7d97c5SJed Brown         ierr = VecSetValue(vec1_V,i,one,INSERT_VALUES);CHKERRQ(ierr);
19610c7d97c5SJed Brown         ierr = VecAssemblyBegin(vec1_V);CHKERRQ(ierr);
19620c7d97c5SJed Brown         ierr = VecAssemblyEnd(vec1_V);CHKERRQ(ierr);
19630c7d97c5SJed Brown         ierr = MatMult(A_RV,vec1_V,pcbddc->vec1_R);CHKERRQ(ierr);
196453cdbc3dSStefano Zampini         ierr = KSPSolve(pcbddc->ksp_R,pcbddc->vec1_R,pcbddc->vec2_R);CHKERRQ(ierr);
19650c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec2_R,&array);CHKERRQ(ierr);
19663b03a366Sstefano_zampini         ierr = MatSetValues(M2,n_R,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
19670c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec2_R,&array);CHKERRQ(ierr);
19680c7d97c5SJed Brown       }
19690c7d97c5SJed Brown       ierr = MatAssemblyBegin(M2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
19700c7d97c5SJed Brown       ierr = MatAssemblyEnd(M2,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
19710c7d97c5SJed Brown     }
19720c7d97c5SJed Brown 
19730c7d97c5SJed Brown     /* Matrix of coarse basis functions (local) */
1974d49ef151SStefano Zampini     ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->coarse_phi_B);CHKERRQ(ierr);
19750c7d97c5SJed Brown     ierr = MatSetSizes(pcbddc->coarse_phi_B,n_B,pcbddc->local_primal_size,n_B,pcbddc->local_primal_size);CHKERRQ(ierr);
19760c7d97c5SJed Brown     ierr = MatSetType(pcbddc->coarse_phi_B,impMatType);CHKERRQ(ierr);
19773b03a366Sstefano_zampini     ierr = MatSeqDenseSetPreallocation(pcbddc->coarse_phi_B,PETSC_NULL);CHKERRQ(ierr);
1978e269702eSStefano Zampini     if(pcbddc->prec_type || dbg_flag ) {
1979d49ef151SStefano Zampini       ierr = MatCreate(PETSC_COMM_SELF,&pcbddc->coarse_phi_D);CHKERRQ(ierr);
19800c7d97c5SJed Brown       ierr = MatSetSizes(pcbddc->coarse_phi_D,n_D,pcbddc->local_primal_size,n_D,pcbddc->local_primal_size);CHKERRQ(ierr);
19810c7d97c5SJed Brown       ierr = MatSetType(pcbddc->coarse_phi_D,impMatType);CHKERRQ(ierr);
19823b03a366Sstefano_zampini       ierr = MatSeqDenseSetPreallocation(pcbddc->coarse_phi_D,PETSC_NULL);CHKERRQ(ierr);
19830c7d97c5SJed Brown     }
19840c7d97c5SJed Brown 
1985e269702eSStefano Zampini     if(dbg_flag) {
19860c7d97c5SJed Brown       ierr = PetscMalloc( pcbddc->local_primal_size*sizeof(PetscScalar),&coarsefunctions_errors);CHKERRQ(ierr);
19870c7d97c5SJed Brown       ierr = PetscMalloc( pcbddc->local_primal_size*sizeof(PetscScalar),&constraints_errors);CHKERRQ(ierr);
19880c7d97c5SJed Brown     }
19893b03a366Sstefano_zampini     /* Subdomain contribution (Non-overlapping) to coarse matrix  */
19900c7d97c5SJed Brown     ierr = PetscMalloc ((pcbddc->local_primal_size)*(pcbddc->local_primal_size)*sizeof(PetscScalar),&coarse_submat_vals);CHKERRQ(ierr);
19910c7d97c5SJed Brown 
19920c7d97c5SJed Brown     /* We are now ready to evaluate coarse basis functions and subdomain contribution to coarse problem */
19933b03a366Sstefano_zampini     for(i=0;i<n_vertices;i++){
19940c7d97c5SJed Brown       ierr = VecSet(vec1_V,zero);CHKERRQ(ierr);
19950c7d97c5SJed Brown       ierr = VecSetValue(vec1_V,i,one,INSERT_VALUES);CHKERRQ(ierr);
19960c7d97c5SJed Brown       ierr = VecAssemblyBegin(vec1_V);CHKERRQ(ierr);
19970c7d97c5SJed Brown       ierr = VecAssemblyEnd(vec1_V);CHKERRQ(ierr);
19980c7d97c5SJed Brown       /* solution of saddle point problem */
19990c7d97c5SJed Brown       ierr = MatMult(M2,vec1_V,pcbddc->vec1_R);CHKERRQ(ierr);
20000c7d97c5SJed Brown       ierr = VecScale(pcbddc->vec1_R,m_one);CHKERRQ(ierr);
20013b03a366Sstefano_zampini       if(n_constraints) {
20020c7d97c5SJed Brown         ierr = MatMult(pcbddc->local_auxmat1,pcbddc->vec1_R,vec1_C);CHKERRQ(ierr);
20030c7d97c5SJed Brown         ierr = MatMultAdd(pcbddc->local_auxmat2,vec1_C,pcbddc->vec1_R,pcbddc->vec1_R);CHKERRQ(ierr);
20040c7d97c5SJed Brown         ierr = VecScale(vec1_C,m_one);CHKERRQ(ierr);
20050c7d97c5SJed Brown       }
20060c7d97c5SJed Brown       ierr = MatMult(A_VR,pcbddc->vec1_R,vec2_V);CHKERRQ(ierr);
20070c7d97c5SJed Brown       ierr = MatMultAdd(A_VV,vec1_V,vec2_V,vec2_V);CHKERRQ(ierr);
20080c7d97c5SJed Brown 
20090c7d97c5SJed Brown       /* Set values in coarse basis function and subdomain part of coarse_mat */
20100c7d97c5SJed Brown       /* coarse basis functions */
20110c7d97c5SJed Brown       ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr);
20120c7d97c5SJed Brown       ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20130c7d97c5SJed Brown       ierr = VecScatterEnd  (pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20140c7d97c5SJed Brown       ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
20153b03a366Sstefano_zampini       ierr = MatSetValues(pcbddc->coarse_phi_B,n_B,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
20160c7d97c5SJed Brown       ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
20170c7d97c5SJed Brown       ierr = MatSetValue(pcbddc->coarse_phi_B,idx_V_B[i],i,one,INSERT_VALUES);CHKERRQ(ierr);
2018e269702eSStefano Zampini       if( pcbddc->prec_type || dbg_flag  ) {
20190c7d97c5SJed Brown         ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20200c7d97c5SJed Brown         ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20210c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_D,&array);CHKERRQ(ierr);
20223b03a366Sstefano_zampini         ierr = MatSetValues(pcbddc->coarse_phi_D,n_D,auxindices,1,&i,array,INSERT_VALUES);CHKERRQ(ierr);
20230c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_D,&array);CHKERRQ(ierr);
20240c7d97c5SJed Brown       }
20250c7d97c5SJed Brown       /* subdomain contribution to coarse matrix */
20260c7d97c5SJed Brown       ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
2027da1bb401SStefano Zampini       for(j=0;j<n_vertices;j++) { coarse_submat_vals[i*pcbddc->local_primal_size+j] = array[j]; } /* WARNING -> column major ordering */
20280c7d97c5SJed Brown       ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
20293b03a366Sstefano_zampini       if(n_constraints) {
20300c7d97c5SJed Brown         ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
2031da1bb401SStefano Zampini         for(j=0;j<n_constraints;j++) { coarse_submat_vals[i*pcbddc->local_primal_size+j+n_vertices] = array[j]; } /* WARNING -> column major ordering */
20320c7d97c5SJed Brown         ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
20330c7d97c5SJed Brown       }
20340c7d97c5SJed Brown 
2035e269702eSStefano Zampini       if( dbg_flag ) {
20360c7d97c5SJed Brown         /* assemble subdomain vector on nodes */
2037d49ef151SStefano Zampini         ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr);
20380c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
20390c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
20400c7d97c5SJed Brown         for(j=0;j<n_R;j++) { array[idx_R_local[j]] = array2[j]; }
20413b03a366Sstefano_zampini         array[ vertices[i] ] = one;
20420c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
20430c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
20440c7d97c5SJed Brown         /* assemble subdomain vector of lagrange multipliers (i.e. primal nodes) */
2045d49ef151SStefano Zampini         ierr = VecSet(pcbddc->vec1_P,zero);CHKERRQ(ierr);
20460c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
20470c7d97c5SJed Brown         ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
20483b03a366Sstefano_zampini         for(j=0;j<n_vertices;j++) { array2[j]=array[j]; }
20490c7d97c5SJed Brown         ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
20503b03a366Sstefano_zampini         if(n_constraints) {
20510c7d97c5SJed Brown           ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
20523b03a366Sstefano_zampini           for(j=0;j<n_constraints;j++) { array2[j+n_vertices]=array[j]; }
20530c7d97c5SJed Brown           ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
20540c7d97c5SJed Brown         }
20550c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
20560c7d97c5SJed Brown         ierr = VecScale(pcbddc->vec1_P,m_one);CHKERRQ(ierr);
20570c7d97c5SJed Brown         /* check saddle point solution */
2058534831adSStefano Zampini         ierr = MatMult(pcbddc->local_mat,pcis->vec1_N,pcis->vec2_N);CHKERRQ(ierr);
20593b03a366Sstefano_zampini         ierr = MatMultTransposeAdd(pcbddc->ConstraintMatrix,pcbddc->vec1_P,pcis->vec2_N,pcis->vec2_N);CHKERRQ(ierr);
20603b03a366Sstefano_zampini         ierr = VecNorm(pcis->vec2_N,NORM_INFINITY,&coarsefunctions_errors[i]);CHKERRQ(ierr);
20613b03a366Sstefano_zampini         ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr);
20620c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
20633b03a366Sstefano_zampini         array[i]=array[i]+m_one;  /* shift by the identity matrix */
20640c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
20653b03a366Sstefano_zampini         ierr = VecNorm(pcbddc->vec1_P,NORM_INFINITY,&constraints_errors[i]);CHKERRQ(ierr);
20660c7d97c5SJed Brown       }
20670c7d97c5SJed Brown     }
20680c7d97c5SJed Brown 
20693b03a366Sstefano_zampini     for(i=0;i<n_constraints;i++){
2070d49ef151SStefano Zampini       ierr = VecSet(vec2_C,zero);CHKERRQ(ierr);
20710c7d97c5SJed Brown       ierr = VecSetValue(vec2_C,i,m_one,INSERT_VALUES);CHKERRQ(ierr);
20720c7d97c5SJed Brown       ierr = VecAssemblyBegin(vec2_C);CHKERRQ(ierr);
20730c7d97c5SJed Brown       ierr = VecAssemblyEnd(vec2_C);CHKERRQ(ierr);
20740c7d97c5SJed Brown       /* solution of saddle point problem */
20750c7d97c5SJed Brown       ierr = MatMult(M1,vec2_C,vec1_C);CHKERRQ(ierr);
20760c7d97c5SJed Brown       ierr = MatMult(pcbddc->local_auxmat2,vec1_C,pcbddc->vec1_R);CHKERRQ(ierr);
20770c7d97c5SJed Brown       ierr = VecScale(vec1_C,m_one);CHKERRQ(ierr);
20783b03a366Sstefano_zampini       if(n_vertices) { ierr = MatMult(A_VR,pcbddc->vec1_R,vec2_V);CHKERRQ(ierr); }
20790c7d97c5SJed Brown       /* Set values in coarse basis function and subdomain part of coarse_mat */
20800c7d97c5SJed Brown       /* coarse basis functions */
20813b03a366Sstefano_zampini       index=i+n_vertices;
20820c7d97c5SJed Brown       ierr = VecSet(pcis->vec1_B,zero);CHKERRQ(ierr);
20830c7d97c5SJed Brown       ierr = VecScatterBegin(pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20840c7d97c5SJed Brown       ierr = VecScatterEnd  (pcbddc->R_to_B,pcbddc->vec1_R,pcis->vec1_B,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20850c7d97c5SJed Brown       ierr = VecGetArray(pcis->vec1_B,&array);CHKERRQ(ierr);
208653cdbc3dSStefano Zampini       ierr = MatSetValues(pcbddc->coarse_phi_B,n_B,auxindices,1,&index,array,INSERT_VALUES);CHKERRQ(ierr);
20870c7d97c5SJed Brown       ierr = VecRestoreArray(pcis->vec1_B,&array);CHKERRQ(ierr);
2088e269702eSStefano Zampini       if( pcbddc->prec_type || dbg_flag ) {
20890c7d97c5SJed Brown         ierr = VecScatterBegin(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20900c7d97c5SJed Brown         ierr = VecScatterEnd(pcbddc->R_to_D,pcbddc->vec1_R,pcis->vec1_D,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
20910c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_D,&array);CHKERRQ(ierr);
209253cdbc3dSStefano Zampini         ierr = MatSetValues(pcbddc->coarse_phi_D,n_D,auxindices,1,&index,array,INSERT_VALUES);CHKERRQ(ierr);
20930c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_D,&array);CHKERRQ(ierr);
20940c7d97c5SJed Brown       }
20950c7d97c5SJed Brown       /* subdomain contribution to coarse matrix */
20963b03a366Sstefano_zampini       if(n_vertices) {
20970c7d97c5SJed Brown         ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
2098da1bb401SStefano Zampini         for(j=0;j<n_vertices;j++) {coarse_submat_vals[index*pcbddc->local_primal_size+j]=array[j];} /* WARNING -> column major ordering */
20990c7d97c5SJed Brown         ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
21000c7d97c5SJed Brown       }
21010c7d97c5SJed Brown       ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
2102da1bb401SStefano Zampini       for(j=0;j<n_constraints;j++) {coarse_submat_vals[index*pcbddc->local_primal_size+j+n_vertices]=array[j];} /* WARNING -> column major ordering */
21030c7d97c5SJed Brown       ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
21040c7d97c5SJed Brown 
2105e269702eSStefano Zampini       if( dbg_flag ) {
21060c7d97c5SJed Brown         /* assemble subdomain vector on nodes */
210753cdbc3dSStefano Zampini         ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr);
21080c7d97c5SJed Brown         ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
21090c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
21100c7d97c5SJed Brown         for(j=0;j<n_R;j++){ array[ idx_R_local[j] ] = array2[j]; }
21110c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_R,&array2);CHKERRQ(ierr);
21120c7d97c5SJed Brown         ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
21130c7d97c5SJed Brown         /* assemble subdomain vector of lagrange multipliers */
211453cdbc3dSStefano Zampini         ierr = VecSet(pcbddc->vec1_P,zero);CHKERRQ(ierr);
21150c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
21163b03a366Sstefano_zampini         if( n_vertices) {
21170c7d97c5SJed Brown           ierr = VecGetArray(vec2_V,&array);CHKERRQ(ierr);
21183b03a366Sstefano_zampini           for(j=0;j<n_vertices;j++) {array2[j]=-array[j];}
21190c7d97c5SJed Brown           ierr = VecRestoreArray(vec2_V,&array);CHKERRQ(ierr);
21200c7d97c5SJed Brown         }
21210c7d97c5SJed Brown         ierr = VecGetArray(vec1_C,&array);CHKERRQ(ierr);
21223b03a366Sstefano_zampini         for(j=0;j<n_constraints;j++) {array2[j+n_vertices]=-array[j];}
21230c7d97c5SJed Brown         ierr = VecRestoreArray(vec1_C,&array);CHKERRQ(ierr);
21240c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array2);CHKERRQ(ierr);
21253972b0daSStefano Zampini         /* check saddle point solution */
2126534831adSStefano Zampini         ierr = MatMult(pcbddc->local_mat,pcis->vec1_N,pcis->vec2_N);CHKERRQ(ierr);
21273b03a366Sstefano_zampini         ierr = MatMultTransposeAdd(pcbddc->ConstraintMatrix,pcbddc->vec1_P,pcis->vec2_N,pcis->vec2_N);CHKERRQ(ierr);
212853cdbc3dSStefano Zampini         ierr = VecNorm(pcis->vec2_N,NORM_INFINITY,&coarsefunctions_errors[index]);CHKERRQ(ierr);
21293b03a366Sstefano_zampini         ierr = MatMult(pcbddc->ConstraintMatrix,pcis->vec1_N,pcbddc->vec1_P);CHKERRQ(ierr);
21300c7d97c5SJed Brown         ierr = VecGetArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
213153cdbc3dSStefano Zampini         array[index]=array[index]+m_one; /* shift by the identity matrix */
21320c7d97c5SJed Brown         ierr = VecRestoreArray(pcbddc->vec1_P,&array);CHKERRQ(ierr);
213353cdbc3dSStefano Zampini         ierr = VecNorm(pcbddc->vec1_P,NORM_INFINITY,&constraints_errors[index]);CHKERRQ(ierr);
21340c7d97c5SJed Brown       }
21350c7d97c5SJed Brown     }
21360c7d97c5SJed Brown     ierr = MatAssemblyBegin(pcbddc->coarse_phi_B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
21370c7d97c5SJed Brown     ierr = MatAssemblyEnd  (pcbddc->coarse_phi_B,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
2138e269702eSStefano Zampini     if( pcbddc->prec_type || dbg_flag ) {
21390c7d97c5SJed Brown       ierr = MatAssemblyBegin(pcbddc->coarse_phi_D,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
21400c7d97c5SJed Brown       ierr = MatAssemblyEnd  (pcbddc->coarse_phi_D,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
21410c7d97c5SJed Brown     }
21420c7d97c5SJed Brown     /* Checking coarse_sub_mat and coarse basis functions */
21430c7d97c5SJed Brown     /* It should be \Phi^{(j)^T} A^{(j)} \Phi^{(j)}=coarse_sub_mat */
21449d2fce94SStefano Zampini     if(dbg_flag) {
21450c7d97c5SJed Brown 
21460c7d97c5SJed Brown       Mat coarse_sub_mat;
21470c7d97c5SJed Brown       Mat TM1,TM2,TM3,TM4;
21480c7d97c5SJed Brown       Mat coarse_phi_D,coarse_phi_B,A_II,A_BB,A_IB,A_BI;
2149a0ba757dSStefano Zampini       const MatType checkmattype=MATSEQAIJ;
21500c7d97c5SJed Brown       PetscScalar      value;
21510c7d97c5SJed Brown 
2152c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_II,checkmattype,MAT_INITIAL_MATRIX,&A_II);CHKERRQ(ierr);
2153c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_IB,checkmattype,MAT_INITIAL_MATRIX,&A_IB);CHKERRQ(ierr);
2154c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_BI,checkmattype,MAT_INITIAL_MATRIX,&A_BI);CHKERRQ(ierr);
2155c042a7c3SStefano Zampini       ierr = MatConvert(pcis->A_BB,checkmattype,MAT_INITIAL_MATRIX,&A_BB);CHKERRQ(ierr);
2156c042a7c3SStefano Zampini       ierr = MatConvert(pcbddc->coarse_phi_D,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_D);CHKERRQ(ierr);
2157c042a7c3SStefano Zampini       ierr = MatConvert(pcbddc->coarse_phi_B,checkmattype,MAT_INITIAL_MATRIX,&coarse_phi_B);CHKERRQ(ierr);
2158c042a7c3SStefano Zampini       ierr = MatCreateSeqDense(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_size,coarse_submat_vals,&coarse_sub_mat);CHKERRQ(ierr);
2159c042a7c3SStefano Zampini       ierr = MatConvert(coarse_sub_mat,checkmattype,MAT_REUSE_MATRIX,&coarse_sub_mat);CHKERRQ(ierr);
21600c7d97c5SJed Brown 
2161da1bb401SStefano Zampini       /*PetscViewer view_out;
2162da1bb401SStefano Zampini       PetscMPIInt myrank;
2163da1bb401SStefano Zampini       char filename[256];
2164da1bb401SStefano Zampini       MPI_Comm_rank(((PetscObject)pc)->comm,&myrank);
2165da1bb401SStefano Zampini       sprintf(filename,"coarsesubmat_%04d.m",myrank);
2166da1bb401SStefano Zampini       ierr = PetscViewerASCIIOpen(PETSC_COMM_SELF,filename,&view_out);CHKERRQ(ierr);
2167da1bb401SStefano Zampini       ierr = PetscViewerSetFormat(view_out,PETSC_VIEWER_ASCII_MATLAB);CHKERRQ(ierr);
2168da1bb401SStefano Zampini       ierr = MatView(coarse_sub_mat,view_out);CHKERRQ(ierr);
2169da1bb401SStefano Zampini       ierr = PetscViewerDestroy(&view_out);CHKERRQ(ierr);*/
2170da1bb401SStefano Zampini 
21710c7d97c5SJed Brown       ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
21720c7d97c5SJed Brown       ierr = PetscViewerASCIIPrintf(viewer,"Check coarse sub mat and local basis functions\n");CHKERRQ(ierr);
21730c7d97c5SJed Brown       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
217453cdbc3dSStefano Zampini       ierr = MatPtAP(A_II,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&TM1);CHKERRQ(ierr);
217553cdbc3dSStefano Zampini       ierr = MatPtAP(A_BB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&TM2);CHKERRQ(ierr);
217653cdbc3dSStefano Zampini       ierr = MatMatMult(A_IB,coarse_phi_B,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr);
2177c042a7c3SStefano Zampini       ierr = MatTransposeMatMult(coarse_phi_D,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM3);CHKERRQ(ierr);
217853cdbc3dSStefano Zampini       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
217953cdbc3dSStefano Zampini       ierr = MatMatMult(A_BI,coarse_phi_D,MAT_INITIAL_MATRIX,1.0,&AUXMAT);CHKERRQ(ierr);
2180c042a7c3SStefano Zampini       ierr = MatTransposeMatMult(coarse_phi_B,AUXMAT,MAT_INITIAL_MATRIX,1.0,&TM4);CHKERRQ(ierr);
218153cdbc3dSStefano Zampini       ierr = MatDestroy(&AUXMAT);CHKERRQ(ierr);
218253cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,one,TM2,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
218353cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,one,TM3,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
218453cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,one,TM4,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
218553cdbc3dSStefano Zampini       ierr = MatAXPY(TM1,m_one,coarse_sub_mat,DIFFERENT_NONZERO_PATTERN);CHKERRQ(ierr);
218653cdbc3dSStefano Zampini       ierr = MatNorm(TM1,NORM_INFINITY,&value);CHKERRQ(ierr);
21870c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"----------------------------------\n");CHKERRQ(ierr);
21880c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d \n",PetscGlobalRank);CHKERRQ(ierr);
21890c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"matrix error = % 1.14e\n",value);CHKERRQ(ierr);
21900c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"coarse functions errors\n");CHKERRQ(ierr);
219153cdbc3dSStefano Zampini       for(i=0;i<pcbddc->local_primal_size;i++) { ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local %02d-th function error = % 1.14e\n",i,coarsefunctions_errors[i]);CHKERRQ(ierr); }
21920c7d97c5SJed Brown       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"constraints errors\n");CHKERRQ(ierr);
219353cdbc3dSStefano Zampini       for(i=0;i<pcbddc->local_primal_size;i++) { ierr = PetscViewerASCIISynchronizedPrintf(viewer,"local %02d-th function error = % 1.14e\n",i,constraints_errors[i]);CHKERRQ(ierr); }
21940c7d97c5SJed Brown       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
219553cdbc3dSStefano Zampini       ierr = MatDestroy(&A_II);CHKERRQ(ierr);
219653cdbc3dSStefano Zampini       ierr = MatDestroy(&A_BB);CHKERRQ(ierr);
219753cdbc3dSStefano Zampini       ierr = MatDestroy(&A_IB);CHKERRQ(ierr);
219853cdbc3dSStefano Zampini       ierr = MatDestroy(&A_BI);CHKERRQ(ierr);
219953cdbc3dSStefano Zampini       ierr = MatDestroy(&TM1);CHKERRQ(ierr);
220053cdbc3dSStefano Zampini       ierr = MatDestroy(&TM2);CHKERRQ(ierr);
220153cdbc3dSStefano Zampini       ierr = MatDestroy(&TM3);CHKERRQ(ierr);
220253cdbc3dSStefano Zampini       ierr = MatDestroy(&TM4);CHKERRQ(ierr);
220353cdbc3dSStefano Zampini       ierr = MatDestroy(&coarse_phi_D);CHKERRQ(ierr);
220453cdbc3dSStefano Zampini       ierr = MatDestroy(&coarse_sub_mat);CHKERRQ(ierr);
220553cdbc3dSStefano Zampini       ierr = MatDestroy(&coarse_phi_B);CHKERRQ(ierr);
22060c7d97c5SJed Brown       ierr = PetscFree(coarsefunctions_errors);CHKERRQ(ierr);
22070c7d97c5SJed Brown       ierr = PetscFree(constraints_errors);CHKERRQ(ierr);
22080c7d97c5SJed Brown     }
22090c7d97c5SJed Brown 
22100c7d97c5SJed Brown     /* create coarse matrix and data structures for message passing associated actual choice of coarse problem type */
22110c7d97c5SJed Brown     ierr = PCBDDCSetupCoarseEnvironment(pc,coarse_submat_vals);CHKERRQ(ierr);
22120c7d97c5SJed Brown     /* free memory */
22130c7d97c5SJed Brown     ierr = PetscFree(coarse_submat_vals);CHKERRQ(ierr);
22140c7d97c5SJed Brown     ierr = PetscFree(auxindices);CHKERRQ(ierr);
22150c7d97c5SJed Brown     ierr = PetscFree(nnz);CHKERRQ(ierr);
22163b03a366Sstefano_zampini     if(n_vertices) {
22170c7d97c5SJed Brown       ierr = VecDestroy(&vec1_V);CHKERRQ(ierr);
22180c7d97c5SJed Brown       ierr = VecDestroy(&vec2_V);CHKERRQ(ierr);
22190c7d97c5SJed Brown       ierr = MatDestroy(&M2);CHKERRQ(ierr);
22200c7d97c5SJed Brown       ierr = MatDestroy(&A_RV);CHKERRQ(ierr);
22210c7d97c5SJed Brown       ierr = MatDestroy(&A_VR);CHKERRQ(ierr);
22220c7d97c5SJed Brown       ierr = MatDestroy(&A_VV);CHKERRQ(ierr);
22230c7d97c5SJed Brown     }
2224534831adSStefano Zampini     if(n_constraints) {
22250c7d97c5SJed Brown       ierr = VecDestroy(&vec1_C);CHKERRQ(ierr);
22260c7d97c5SJed Brown       ierr = VecDestroy(&vec2_C);CHKERRQ(ierr);
22270c7d97c5SJed Brown       ierr = MatDestroy(&M1);CHKERRQ(ierr);
22280c7d97c5SJed Brown       ierr = MatDestroy(&C_CR);CHKERRQ(ierr);
22290c7d97c5SJed Brown     }
22300c7d97c5SJed Brown   }
22310c7d97c5SJed Brown   /* free memory */
22323b03a366Sstefano_zampini   if(n_vertices) {
22330c7d97c5SJed Brown     ierr = PetscFree(idx_V_B);CHKERRQ(ierr);
22340c7d97c5SJed Brown     ierr = ISDestroy(&is_V_local);CHKERRQ(ierr);
22350c7d97c5SJed Brown   }
22360c7d97c5SJed Brown   ierr = ISDestroy(&is_R_local);CHKERRQ(ierr);
22370c7d97c5SJed Brown 
22380c7d97c5SJed Brown   PetscFunctionReturn(0);
22390c7d97c5SJed Brown }
22400c7d97c5SJed Brown 
22410c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
22420c7d97c5SJed Brown 
22430c7d97c5SJed Brown #undef __FUNCT__
22440c7d97c5SJed Brown #define __FUNCT__ "PCBDDCSetupCoarseEnvironment"
224553cdbc3dSStefano Zampini static PetscErrorCode PCBDDCSetupCoarseEnvironment(PC pc,PetscScalar* coarse_submat_vals)
22460c7d97c5SJed Brown {
22470c7d97c5SJed Brown 
22480c7d97c5SJed Brown 
22490c7d97c5SJed Brown   Mat_IS    *matis    = (Mat_IS*)pc->pmat->data;
22500c7d97c5SJed Brown   PC_BDDC   *pcbddc   = (PC_BDDC*)pc->data;
22510c7d97c5SJed Brown   PC_IS     *pcis     = (PC_IS*)pc->data;
22520c7d97c5SJed Brown   MPI_Comm  prec_comm = ((PetscObject)pc)->comm;
22530c7d97c5SJed Brown   MPI_Comm  coarse_comm;
22540c7d97c5SJed Brown 
22550c7d97c5SJed Brown   /* common to all choices */
22560c7d97c5SJed Brown   PetscScalar *temp_coarse_mat_vals;
22570c7d97c5SJed Brown   PetscScalar *ins_coarse_mat_vals;
22580c7d97c5SJed Brown   PetscInt    *ins_local_primal_indices;
22590c7d97c5SJed Brown   PetscMPIInt *localsizes2,*localdispl2;
22600c7d97c5SJed Brown   PetscMPIInt size_prec_comm;
22610c7d97c5SJed Brown   PetscMPIInt rank_prec_comm;
22620c7d97c5SJed Brown   PetscMPIInt active_rank=MPI_PROC_NULL;
22630c7d97c5SJed Brown   PetscMPIInt master_proc=0;
22640c7d97c5SJed Brown   PetscInt    ins_local_primal_size;
22650c7d97c5SJed Brown   /* specific to MULTILEVEL_BDDC */
22660c7d97c5SJed Brown   PetscMPIInt *ranks_recv;
22670c7d97c5SJed Brown   PetscMPIInt count_recv=0;
22680c7d97c5SJed Brown   PetscMPIInt rank_coarse_proc_send_to;
22690c7d97c5SJed Brown   PetscMPIInt coarse_color = MPI_UNDEFINED;
22700c7d97c5SJed Brown   ISLocalToGlobalMapping coarse_ISLG;
22710c7d97c5SJed Brown   /* some other variables */
22720c7d97c5SJed Brown   PetscErrorCode ierr;
22730c7d97c5SJed Brown   const MatType coarse_mat_type;
22740c7d97c5SJed Brown   const PCType  coarse_pc_type;
227553cdbc3dSStefano Zampini   const KSPType  coarse_ksp_type;
227653cdbc3dSStefano Zampini   PC pc_temp;
22770c7d97c5SJed Brown   PetscInt i,j,k,bs;
22783b03a366Sstefano_zampini   PetscInt max_it_coarse_ksp=1;  /* don't increase this value */
2279e269702eSStefano Zampini   /* verbose output viewer */
2280e269702eSStefano Zampini   PetscViewer viewer=pcbddc->dbg_viewer;
2281e269702eSStefano Zampini   PetscBool   dbg_flag=pcbddc->dbg_flag;
22820c7d97c5SJed Brown 
22830c7d97c5SJed Brown   PetscFunctionBegin;
22840c7d97c5SJed Brown 
22850c7d97c5SJed Brown   ins_local_primal_indices = 0;
22860c7d97c5SJed Brown   ins_coarse_mat_vals      = 0;
22870c7d97c5SJed Brown   localsizes2              = 0;
22880c7d97c5SJed Brown   localdispl2              = 0;
22890c7d97c5SJed Brown   temp_coarse_mat_vals     = 0;
22900c7d97c5SJed Brown   coarse_ISLG              = 0;
22910c7d97c5SJed Brown 
229253cdbc3dSStefano Zampini   ierr = MPI_Comm_size(prec_comm,&size_prec_comm);CHKERRQ(ierr);
229353cdbc3dSStefano Zampini   ierr = MPI_Comm_rank(prec_comm,&rank_prec_comm);CHKERRQ(ierr);
22940c7d97c5SJed Brown   ierr = MatGetBlockSize(matis->A,&bs);CHKERRQ(ierr);
22950c7d97c5SJed Brown 
2296beed3852SStefano Zampini   /* Assign global numbering to coarse dofs */
2297beed3852SStefano Zampini   {
2298a0ba757dSStefano Zampini     PetscScalar    one=1.,zero=0.;
2299beed3852SStefano Zampini     PetscScalar    *array;
2300beed3852SStefano Zampini     PetscMPIInt    *auxlocal_primal;
2301beed3852SStefano Zampini     PetscMPIInt    *auxglobal_primal;
2302beed3852SStefano Zampini     PetscMPIInt    *all_auxglobal_primal;
2303beed3852SStefano Zampini     PetscMPIInt    *all_auxglobal_primal_dummy;
2304beed3852SStefano Zampini     PetscMPIInt    mpi_local_primal_size = (PetscMPIInt)pcbddc->local_primal_size;
2305da1bb401SStefano Zampini     PetscInt       *row_cmat_indices;
23063b03a366Sstefano_zampini     PetscInt       size_of_constraint;
2307da1bb401SStefano Zampini     PetscScalar    coarsesum;
2308beed3852SStefano Zampini 
2309beed3852SStefano Zampini     /* Construct needed data structures for message passing */
2310beed3852SStefano Zampini     ierr = PetscMalloc(mpi_local_primal_size*sizeof(PetscMPIInt),&pcbddc->local_primal_indices);CHKERRQ(ierr);
2311beed3852SStefano Zampini     ierr = PetscMalloc(size_prec_comm*sizeof(PetscMPIInt),&pcbddc->local_primal_sizes);CHKERRQ(ierr);
2312beed3852SStefano Zampini     ierr = PetscMalloc(size_prec_comm*sizeof(PetscMPIInt),&pcbddc->local_primal_displacements);CHKERRQ(ierr);
2313beed3852SStefano Zampini     /* Gather local_primal_size information for all processes  */
23145619798eSStefano Zampini     ierr = MPI_Allgather(&mpi_local_primal_size,1,MPIU_INT,&pcbddc->local_primal_sizes[0],1,MPIU_INT,prec_comm);CHKERRQ(ierr);
2315beed3852SStefano Zampini     pcbddc->replicated_primal_size = 0;
2316beed3852SStefano Zampini     for (i=0; i<size_prec_comm; i++) {
2317beed3852SStefano Zampini       pcbddc->local_primal_displacements[i] = pcbddc->replicated_primal_size ;
2318beed3852SStefano Zampini       pcbddc->replicated_primal_size += pcbddc->local_primal_sizes[i];
2319beed3852SStefano Zampini     }
23205619798eSStefano Zampini     if(rank_prec_comm == 0) {
2321beed3852SStefano Zampini       /* allocate some auxiliary space */
2322beed3852SStefano Zampini       ierr = PetscMalloc(pcbddc->replicated_primal_size*sizeof(*all_auxglobal_primal),&all_auxglobal_primal);CHKERRQ(ierr);
2323beed3852SStefano Zampini       ierr = PetscMalloc(pcbddc->replicated_primal_size*sizeof(*all_auxglobal_primal_dummy),&all_auxglobal_primal_dummy);CHKERRQ(ierr);
2324beed3852SStefano Zampini     }
2325beed3852SStefano Zampini     ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscMPIInt),&auxlocal_primal);CHKERRQ(ierr);
2326beed3852SStefano Zampini     ierr = PetscMalloc(pcbddc->local_primal_size*sizeof(PetscMPIInt),&auxglobal_primal);CHKERRQ(ierr);
2327beed3852SStefano Zampini 
2328da1bb401SStefano Zampini     /* First let's count coarse dofs.
2329beed3852SStefano Zampini        This code fragment assumes that the number of local constraints per connected component
2330beed3852SStefano Zampini        is not greater than the number of nodes defined for the connected component
2331beed3852SStefano Zampini        (otherwise we will surely have linear dependence between constraints and thus a singular coarse problem) */
23323b03a366Sstefano_zampini     /* auxlocal_primal      : primal indices in local nodes numbering (internal and interface) with complete queue sorted by global ordering */
2333beed3852SStefano Zampini     ierr = VecSet(pcis->vec1_N,zero);CHKERRQ(ierr);
2334beed3852SStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2335da1bb401SStefano Zampini     for(i=0;i<pcbddc->local_primal_size;i++) {
2336da1bb401SStefano Zampini       ierr = MatGetRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
23373b03a366Sstefano_zampini       for (j=0; j<size_of_constraint; j++) {
23383b03a366Sstefano_zampini         k = row_cmat_indices[j];
2339beed3852SStefano Zampini         if( array[k] == zero ) {
2340beed3852SStefano Zampini           array[k] = one;
2341da1bb401SStefano Zampini           auxlocal_primal[i] = k;
2342beed3852SStefano Zampini           break;
2343beed3852SStefano Zampini         }
2344beed3852SStefano Zampini       }
2345da1bb401SStefano Zampini       ierr = MatRestoreRow(pcbddc->ConstraintMatrix,i,&size_of_constraint,(const PetscInt**)&row_cmat_indices,PETSC_NULL);CHKERRQ(ierr);
2346beed3852SStefano Zampini     }
2347beed3852SStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2348da1bb401SStefano Zampini     ierr = VecSet(pcis->vec1_global,zero);CHKERRQ(ierr);
2349da1bb401SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
2350da1bb401SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
2351da1bb401SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
2352da1bb401SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
2353da1bb401SStefano Zampini     ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2354da1bb401SStefano Zampini     for(i=0;i<pcis->n;i++) { if( array[i] > zero) array[i] = one/array[i]; }
2355da1bb401SStefano Zampini     ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
2356da1bb401SStefano Zampini     ierr = VecSet(pcis->vec1_global,zero);CHKERRQ(ierr);
2357da1bb401SStefano Zampini     ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
2358da1bb401SStefano Zampini     ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
2359da1bb401SStefano Zampini     ierr = VecSum(pcis->vec1_global,&coarsesum);CHKERRQ(ierr);
2360da1bb401SStefano Zampini     pcbddc->coarse_size = (PetscInt) coarsesum;
2361a0ba757dSStefano Zampini 
2362beed3852SStefano Zampini     /* Now assign them a global numbering */
2363beed3852SStefano Zampini     /* auxglobal_primal contains indices in global nodes numbering (internal and interface) */
2364beed3852SStefano Zampini     ierr = ISLocalToGlobalMappingApply(matis->mapping,pcbddc->local_primal_size,auxlocal_primal,auxglobal_primal);CHKERRQ(ierr);
2365beed3852SStefano Zampini     /* all_auxglobal_primal contains all primal nodes indices in global nodes numbering (internal and interface) */
2366beed3852SStefano Zampini     ierr = MPI_Gatherv(&auxglobal_primal[0],pcbddc->local_primal_size,MPIU_INT,&all_auxglobal_primal[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,0,prec_comm);CHKERRQ(ierr);
2367beed3852SStefano Zampini 
2368beed3852SStefano Zampini     /* After this block all_auxglobal_primal should contain one copy of each primal node's indices in global nodes numbering */
2369beed3852SStefano Zampini     /* It implements a function similar to PetscSortRemoveDupsInt */
2370beed3852SStefano Zampini     if(rank_prec_comm==0) {
2371beed3852SStefano Zampini       /* dummy argument since PetscSortMPIInt doesn't exist! */
2372beed3852SStefano Zampini       ierr = PetscSortMPIIntWithArray(pcbddc->replicated_primal_size,all_auxglobal_primal,all_auxglobal_primal_dummy);CHKERRQ(ierr);
2373beed3852SStefano Zampini       k=1;
2374beed3852SStefano Zampini       j=all_auxglobal_primal[0];  /* first dof in global numbering */
2375beed3852SStefano Zampini       for(i=1;i< pcbddc->replicated_primal_size ;i++) {
2376beed3852SStefano Zampini         if(j != all_auxglobal_primal[i] ) {
2377beed3852SStefano Zampini           all_auxglobal_primal[k]=all_auxglobal_primal[i];
2378beed3852SStefano Zampini           k++;
2379beed3852SStefano Zampini           j=all_auxglobal_primal[i];
2380beed3852SStefano Zampini         }
2381beed3852SStefano Zampini       }
2382beed3852SStefano Zampini     } else {
2383beed3852SStefano Zampini       ierr = PetscMalloc(pcbddc->coarse_size*sizeof(PetscMPIInt),&all_auxglobal_primal);CHKERRQ(ierr);
2384beed3852SStefano Zampini     }
23855619798eSStefano Zampini     /* We only need to broadcast the indices from 0 to pcbddc->coarse_size. Remaining elements of array all_auxglobal_primal are garbage. */
2386beed3852SStefano Zampini     ierr = MPI_Bcast(all_auxglobal_primal,pcbddc->coarse_size,MPIU_INT,0,prec_comm);CHKERRQ(ierr);
2387beed3852SStefano Zampini 
2388beed3852SStefano Zampini     /* Now get global coarse numbering of local primal nodes */
2389beed3852SStefano Zampini     for(i=0;i<pcbddc->local_primal_size;i++) {
2390beed3852SStefano Zampini       k=0;
2391beed3852SStefano Zampini       while( all_auxglobal_primal[k] != auxglobal_primal[i] ) { k++;}
2392beed3852SStefano Zampini       pcbddc->local_primal_indices[i]=k;
2393beed3852SStefano Zampini     }
2394e269702eSStefano Zampini     if(dbg_flag) {
2395e269702eSStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"--------------------------------------------------\n");CHKERRQ(ierr);
2396da1bb401SStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Size of coarse problem %d\n",pcbddc->coarse_size);CHKERRQ(ierr);
2397e269702eSStefano Zampini       ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
2398e269702eSStefano Zampini     }
2399beed3852SStefano Zampini     /* free allocated memory */
2400beed3852SStefano Zampini     ierr = PetscFree(auxlocal_primal);CHKERRQ(ierr);
2401beed3852SStefano Zampini     ierr = PetscFree(auxglobal_primal);CHKERRQ(ierr);
2402beed3852SStefano Zampini     ierr = PetscFree(all_auxglobal_primal);CHKERRQ(ierr);
2403e269702eSStefano Zampini     if(rank_prec_comm == 0) {
2404beed3852SStefano Zampini       ierr = PetscFree(all_auxglobal_primal_dummy);CHKERRQ(ierr);
2405beed3852SStefano Zampini     }
2406e269702eSStefano Zampini   }
2407beed3852SStefano Zampini 
24080c7d97c5SJed Brown   /* adapt coarse problem type */
24090c7d97c5SJed Brown   if(pcbddc->coarse_problem_type == MULTILEVEL_BDDC && pcbddc->active_procs < MIN_PROCS_FOR_BDDC )
24100c7d97c5SJed Brown     pcbddc->coarse_problem_type = PARALLEL_BDDC;
24110c7d97c5SJed Brown 
24120c7d97c5SJed Brown   switch(pcbddc->coarse_problem_type){
24130c7d97c5SJed Brown 
2414da1bb401SStefano Zampini     case(MULTILEVEL_BDDC):   /* we define a coarse mesh where subdomains are elements */
24150c7d97c5SJed Brown     {
24160c7d97c5SJed Brown       /* we need additional variables */
24170c7d97c5SJed Brown       MetisInt   n_subdomains,n_parts,objval,ncon,faces_nvtxs;
24180c7d97c5SJed Brown       MetisInt   *metis_coarse_subdivision;
24190c7d97c5SJed Brown       MetisInt   options[METIS_NOPTIONS];
24200c7d97c5SJed Brown       PetscMPIInt size_coarse_comm,rank_coarse_comm;
24210c7d97c5SJed Brown       PetscMPIInt procs_jumps_coarse_comm;
24220c7d97c5SJed Brown       PetscMPIInt *coarse_subdivision;
24230c7d97c5SJed Brown       PetscMPIInt *total_count_recv;
24240c7d97c5SJed Brown       PetscMPIInt *total_ranks_recv;
24250c7d97c5SJed Brown       PetscMPIInt *displacements_recv;
24260c7d97c5SJed Brown       PetscMPIInt *my_faces_connectivity;
24270c7d97c5SJed Brown       PetscMPIInt *petsc_faces_adjncy;
24280c7d97c5SJed Brown       MetisInt    *faces_adjncy;
24290c7d97c5SJed Brown       MetisInt    *faces_xadj;
24300c7d97c5SJed Brown       PetscMPIInt *number_of_faces;
24310c7d97c5SJed Brown       PetscMPIInt *faces_displacements;
24320c7d97c5SJed Brown       PetscInt    *array_int;
24330c7d97c5SJed Brown       PetscMPIInt my_faces=0;
24340c7d97c5SJed Brown       PetscMPIInt total_faces=0;
24353828260eSStefano Zampini       PetscInt    ranks_stretching_ratio;
24360c7d97c5SJed Brown 
24370c7d97c5SJed Brown       /* define some quantities */
24380c7d97c5SJed Brown       pcbddc->coarse_communications_type = SCATTERS_BDDC;
24390c7d97c5SJed Brown       coarse_mat_type = MATIS;
24400c7d97c5SJed Brown       coarse_pc_type  = PCBDDC;
24416c9de887SHong Zhang       coarse_ksp_type  = KSPCHEBYSHEV;
24420c7d97c5SJed Brown 
24430c7d97c5SJed Brown       /* details of coarse decomposition */
24440c7d97c5SJed Brown       n_subdomains = pcbddc->active_procs;
24450c7d97c5SJed Brown       n_parts      = n_subdomains/pcbddc->coarsening_ratio;
24463828260eSStefano Zampini       ranks_stretching_ratio = size_prec_comm/pcbddc->active_procs;
24473828260eSStefano Zampini       procs_jumps_coarse_comm = pcbddc->coarsening_ratio*ranks_stretching_ratio;
24483828260eSStefano Zampini 
2449da1bb401SStefano Zampini       /*printf("Coarse algorithm details: \n");
2450da1bb401SStefano Zampini       printf("n_subdomains %d, n_parts %d\nstretch %d,jumps %d,coarse_ratio %d\nlevel should be log_%d(%d)\n",n_subdomains,n_parts,ranks_stretching_ratio,procs_jumps_coarse_comm,pcbddc->coarsening_ratio,pcbddc->coarsening_ratio,(ranks_stretching_ratio/pcbddc->coarsening_ratio+1));*/
24510c7d97c5SJed Brown 
24520c7d97c5SJed Brown       /* build CSR graph of subdomains' connectivity through faces */
24530c7d97c5SJed Brown       ierr = PetscMalloc (pcis->n*sizeof(PetscInt),&array_int);CHKERRQ(ierr);
24543828260eSStefano Zampini       ierr = PetscMemzero(array_int,pcis->n*sizeof(PetscInt));CHKERRQ(ierr);
24550c7d97c5SJed Brown       for(i=1;i<pcis->n_neigh;i++){/* i=1 so I don't count myself -> faces nodes counts to 1 */
24560c7d97c5SJed Brown         for(j=0;j<pcis->n_shared[i];j++){
24570c7d97c5SJed Brown           array_int[ pcis->shared[i][j] ]+=1;
24580c7d97c5SJed Brown         }
24590c7d97c5SJed Brown       }
24600c7d97c5SJed Brown       for(i=1;i<pcis->n_neigh;i++){
24610c7d97c5SJed Brown         for(j=0;j<pcis->n_shared[i];j++){
24620c7d97c5SJed Brown           if(array_int[ pcis->shared[i][j] ] == 1 ){
24630c7d97c5SJed Brown             my_faces++;
24640c7d97c5SJed Brown             break;
24650c7d97c5SJed Brown           }
24660c7d97c5SJed Brown         }
24670c7d97c5SJed Brown       }
24680c7d97c5SJed Brown 
246953cdbc3dSStefano Zampini       ierr = MPI_Reduce(&my_faces,&total_faces,1,MPIU_INT,MPI_SUM,master_proc,prec_comm);CHKERRQ(ierr);
24700c7d97c5SJed Brown       ierr = PetscMalloc (my_faces*sizeof(PetscInt),&my_faces_connectivity);CHKERRQ(ierr);
24710c7d97c5SJed Brown       my_faces=0;
24720c7d97c5SJed Brown       for(i=1;i<pcis->n_neigh;i++){
24730c7d97c5SJed Brown         for(j=0;j<pcis->n_shared[i];j++){
24740c7d97c5SJed Brown           if(array_int[ pcis->shared[i][j] ] == 1 ){
24750c7d97c5SJed Brown             my_faces_connectivity[my_faces]=pcis->neigh[i];
24760c7d97c5SJed Brown             my_faces++;
24770c7d97c5SJed Brown             break;
24780c7d97c5SJed Brown           }
24790c7d97c5SJed Brown         }
24800c7d97c5SJed Brown       }
24810c7d97c5SJed Brown       if(rank_prec_comm == master_proc) {
24820c7d97c5SJed Brown         ierr = PetscMalloc (total_faces*sizeof(PetscMPIInt),&petsc_faces_adjncy);CHKERRQ(ierr);
24830c7d97c5SJed Brown         ierr = PetscMalloc (size_prec_comm*sizeof(PetscMPIInt),&number_of_faces);CHKERRQ(ierr);
24840c7d97c5SJed Brown         ierr = PetscMalloc (total_faces*sizeof(MetisInt),&faces_adjncy);CHKERRQ(ierr);
24850c7d97c5SJed Brown         ierr = PetscMalloc ((n_subdomains+1)*sizeof(MetisInt),&faces_xadj);CHKERRQ(ierr);
24860c7d97c5SJed Brown         ierr = PetscMalloc ((size_prec_comm+1)*sizeof(PetscMPIInt),&faces_displacements);CHKERRQ(ierr);
24870c7d97c5SJed Brown       }
248853cdbc3dSStefano Zampini       ierr = MPI_Gather(&my_faces,1,MPIU_INT,&number_of_faces[0],1,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
24890c7d97c5SJed Brown       if(rank_prec_comm == master_proc) {
24900c7d97c5SJed Brown         faces_xadj[0]=0;
24910c7d97c5SJed Brown         faces_displacements[0]=0;
24920c7d97c5SJed Brown         j=0;
24930c7d97c5SJed Brown         for(i=1;i<size_prec_comm+1;i++) {
24940c7d97c5SJed Brown           faces_displacements[i]=faces_displacements[i-1]+number_of_faces[i-1];
24950c7d97c5SJed Brown           if(number_of_faces[i-1]) {
24960c7d97c5SJed Brown             j++;
24970c7d97c5SJed Brown             faces_xadj[j]=faces_xadj[j-1]+number_of_faces[i-1];
24980c7d97c5SJed Brown           }
24990c7d97c5SJed Brown         }
2500da1bb401SStefano Zampini         /*printf("The J I count is %d and should be %d\n",j,n_subdomains);
2501da1bb401SStefano Zampini         printf("Total faces seem %d and should be %d\n",faces_xadj[j],total_faces);*/
25020c7d97c5SJed Brown       }
250353cdbc3dSStefano Zampini       ierr = MPI_Gatherv(&my_faces_connectivity[0],my_faces,MPIU_INT,&petsc_faces_adjncy[0],number_of_faces,faces_displacements,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
25040c7d97c5SJed Brown       ierr = PetscFree(my_faces_connectivity);CHKERRQ(ierr);
25050c7d97c5SJed Brown       ierr = PetscFree(array_int);CHKERRQ(ierr);
25060c7d97c5SJed Brown       if(rank_prec_comm == master_proc) {
25073828260eSStefano Zampini         for(i=0;i<total_faces;i++) faces_adjncy[i]=(MetisInt)(petsc_faces_adjncy[i]/ranks_stretching_ratio); /* cast to MetisInt */
2508da1bb401SStefano Zampini         /*printf("This is the face connectivity (actual ranks)\n");
25090c7d97c5SJed Brown         for(i=0;i<n_subdomains;i++){
25100c7d97c5SJed Brown           printf("proc %d is connected with \n",i);
25110c7d97c5SJed Brown           for(j=faces_xadj[i];j<faces_xadj[i+1];j++)
25120c7d97c5SJed Brown             printf("%d ",faces_adjncy[j]);
25130c7d97c5SJed Brown           printf("\n");
2514da1bb401SStefano Zampini         }*/
25150c7d97c5SJed Brown         ierr = PetscFree(faces_displacements);CHKERRQ(ierr);
25160c7d97c5SJed Brown         ierr = PetscFree(number_of_faces);CHKERRQ(ierr);
25170c7d97c5SJed Brown         ierr = PetscFree(petsc_faces_adjncy);CHKERRQ(ierr);
25180c7d97c5SJed Brown       }
25190c7d97c5SJed Brown 
25200c7d97c5SJed Brown       if( rank_prec_comm == master_proc ) {
25210c7d97c5SJed Brown 
25223828260eSStefano Zampini         PetscInt heuristic_for_metis=3;
25233828260eSStefano Zampini 
25240c7d97c5SJed Brown         ncon=1;
25250c7d97c5SJed Brown         faces_nvtxs=n_subdomains;
25260c7d97c5SJed Brown         /* partition graph induced by face connectivity */
25270c7d97c5SJed Brown         ierr = PetscMalloc (n_subdomains*sizeof(MetisInt),&metis_coarse_subdivision);CHKERRQ(ierr);
25280c7d97c5SJed Brown         ierr = METIS_SetDefaultOptions(options);
25290c7d97c5SJed Brown         /* we need a contiguous partition of the coarse mesh */
25300c7d97c5SJed Brown         options[METIS_OPTION_CONTIG]=1;
25310c7d97c5SJed Brown         options[METIS_OPTION_DBGLVL]=1;
25320c7d97c5SJed Brown         options[METIS_OPTION_NITER]=30;
25333828260eSStefano Zampini         if(n_subdomains>n_parts*heuristic_for_metis) {
25343828260eSStefano Zampini           options[METIS_OPTION_IPTYPE]=METIS_IPTYPE_EDGE;
25353828260eSStefano Zampini           options[METIS_OPTION_OBJTYPE]=METIS_OBJTYPE_CUT;
25360c7d97c5SJed Brown           ierr = METIS_PartGraphKway(&faces_nvtxs,&ncon,faces_xadj,faces_adjncy,NULL,NULL,NULL,&n_parts,NULL,NULL,options,&objval,metis_coarse_subdivision);
25373828260eSStefano Zampini         } else {
25383828260eSStefano Zampini           ierr = METIS_PartGraphRecursive(&faces_nvtxs,&ncon,faces_xadj,faces_adjncy,NULL,NULL,NULL,&n_parts,NULL,NULL,options,&objval,metis_coarse_subdivision);
25393828260eSStefano Zampini         }
25400c7d97c5SJed Brown         if(ierr != METIS_OK) SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_LIB,"Error in METIS_PartGraphKway (metis error code %D) called from PCBDDCSetupCoarseEnvironment\n",ierr);
25410c7d97c5SJed Brown         ierr = PetscFree(faces_xadj);CHKERRQ(ierr);
25420c7d97c5SJed Brown         ierr = PetscFree(faces_adjncy);CHKERRQ(ierr);
25430c7d97c5SJed Brown         coarse_subdivision = (PetscMPIInt*)calloc(size_prec_comm,sizeof(PetscMPIInt)); /* calloc for contiguous memory since we need to scatter these values later */
25440c7d97c5SJed Brown         /* copy/cast values avoiding possible type conflicts between PETSc, MPI and METIS */
25453828260eSStefano Zampini         for(i=0;i<size_prec_comm;i++) coarse_subdivision[i]=MPI_PROC_NULL;
25463828260eSStefano Zampini         for(i=0;i<n_subdomains;i++)   coarse_subdivision[ranks_stretching_ratio*i]=(PetscInt)(metis_coarse_subdivision[i]);
25470c7d97c5SJed Brown         ierr = PetscFree(metis_coarse_subdivision);CHKERRQ(ierr);
25480c7d97c5SJed Brown       }
25490c7d97c5SJed Brown 
25500c7d97c5SJed Brown       /* Create new communicator for coarse problem splitting the old one */
25510c7d97c5SJed Brown       if( !(rank_prec_comm%procs_jumps_coarse_comm) && rank_prec_comm < procs_jumps_coarse_comm*n_parts ){
2552da1bb401SStefano Zampini         coarse_color=0;              /* for communicator splitting */
2553da1bb401SStefano Zampini         active_rank=rank_prec_comm;  /* for insertion of matrix values */
25540c7d97c5SJed Brown       }
2555da1bb401SStefano Zampini       /* procs with coarse_color = MPI_UNDEFINED will have coarse_comm = MPI_COMM_NULL (from mpi standards)
2556da1bb401SStefano Zampini          key = rank_prec_comm -> keep same ordering of ranks from the old to the new communicator */
255753cdbc3dSStefano Zampini       ierr = MPI_Comm_split(prec_comm,coarse_color,rank_prec_comm,&coarse_comm);CHKERRQ(ierr);
25580c7d97c5SJed Brown 
25590c7d97c5SJed Brown       if( coarse_color == 0 ) {
256053cdbc3dSStefano Zampini         ierr = MPI_Comm_size(coarse_comm,&size_coarse_comm);CHKERRQ(ierr);
256153cdbc3dSStefano Zampini         ierr = MPI_Comm_rank(coarse_comm,&rank_coarse_comm);CHKERRQ(ierr);
2562da1bb401SStefano Zampini         /*printf("Details of coarse comm\n");
25633828260eSStefano Zampini         printf("size = %d, myrank = %d\n",size_coarse_comm,rank_coarse_comm);
2564da1bb401SStefano Zampini         printf("jumps = %d, coarse_color = %d, n_parts = %d\n",procs_jumps_coarse_comm,coarse_color,n_parts);*/
25650c7d97c5SJed Brown       } else {
25660c7d97c5SJed Brown         rank_coarse_comm = MPI_PROC_NULL;
25670c7d97c5SJed Brown       }
25680c7d97c5SJed Brown 
25690c7d97c5SJed Brown       /* master proc takes care of arranging and distributing coarse information */
25700c7d97c5SJed Brown       if(rank_coarse_comm == master_proc) {
25710c7d97c5SJed Brown         ierr = PetscMalloc (size_coarse_comm*sizeof(PetscMPIInt),&displacements_recv);CHKERRQ(ierr);
2572da1bb401SStefano Zampini         /*ierr = PetscMalloc (size_coarse_comm*sizeof(PetscMPIInt),&total_count_recv);CHKERRQ(ierr);
2573da1bb401SStefano Zampini           ierr = PetscMalloc (n_subdomains*sizeof(PetscMPIInt),&total_ranks_recv);CHKERRQ(ierr);*/
25740c7d97c5SJed Brown         total_count_recv = (PetscMPIInt*)calloc(size_prec_comm,sizeof(PetscMPIInt));
25750c7d97c5SJed Brown         total_ranks_recv = (PetscMPIInt*)calloc(n_subdomains,sizeof(PetscMPIInt));
25760c7d97c5SJed Brown         /* some initializations */
25770c7d97c5SJed Brown         displacements_recv[0]=0;
2578da1bb401SStefano Zampini         /* PetscMemzero(total_count_recv,size_coarse_comm*sizeof(PetscMPIInt)); not needed -> calloc initializes to zero */
25790c7d97c5SJed Brown         /* count from how many processes the j-th process of the coarse decomposition will receive data */
25800c7d97c5SJed Brown         for(j=0;j<size_coarse_comm;j++)
25813828260eSStefano Zampini           for(i=0;i<size_prec_comm;i++)
25820c7d97c5SJed Brown             if(coarse_subdivision[i]==j)
25830c7d97c5SJed Brown               total_count_recv[j]++;
25840c7d97c5SJed Brown         /* displacements needed for scatterv of total_ranks_recv */
25850c7d97c5SJed Brown         for(i=1;i<size_coarse_comm;i++) displacements_recv[i]=displacements_recv[i-1]+total_count_recv[i-1];
25860c7d97c5SJed Brown         /* Now fill properly total_ranks_recv -> each coarse process will receive the ranks (in prec_comm communicator) of its friend (sending) processes */
25870c7d97c5SJed Brown         ierr = PetscMemzero(total_count_recv,size_coarse_comm*sizeof(PetscMPIInt));CHKERRQ(ierr);
25880c7d97c5SJed Brown         for(j=0;j<size_coarse_comm;j++) {
25893828260eSStefano Zampini           for(i=0;i<size_prec_comm;i++) {
25900c7d97c5SJed Brown             if(coarse_subdivision[i]==j) {
25910c7d97c5SJed Brown               total_ranks_recv[displacements_recv[j]+total_count_recv[j]]=i;
25923828260eSStefano Zampini               total_count_recv[j]+=1;
25930c7d97c5SJed Brown             }
25940c7d97c5SJed Brown           }
25950c7d97c5SJed Brown         }
2596da1bb401SStefano Zampini         /*for(j=0;j<size_coarse_comm;j++) {
25973828260eSStefano Zampini           printf("process %d in new rank will receive from %d processes (original ranks follows)\n",j,total_count_recv[j]);
25983828260eSStefano Zampini           for(i=0;i<total_count_recv[j];i++) {
25993828260eSStefano Zampini             printf("%d ",total_ranks_recv[displacements_recv[j]+i]);
26003828260eSStefano Zampini           }
26013828260eSStefano Zampini           printf("\n");
2602da1bb401SStefano Zampini         }*/
26030c7d97c5SJed Brown 
26040c7d97c5SJed Brown         /* identify new decomposition in terms of ranks in the old communicator */
26053828260eSStefano Zampini         for(i=0;i<n_subdomains;i++) coarse_subdivision[ranks_stretching_ratio*i]=coarse_subdivision[ranks_stretching_ratio*i]*procs_jumps_coarse_comm;
2606da1bb401SStefano Zampini         /*printf("coarse_subdivision in old end new ranks\n");
26070c7d97c5SJed Brown         for(i=0;i<size_prec_comm;i++)
26083828260eSStefano Zampini           if(coarse_subdivision[i]!=MPI_PROC_NULL) {
26093828260eSStefano Zampini             printf("%d=(%d %d), ",i,coarse_subdivision[i],coarse_subdivision[i]/procs_jumps_coarse_comm);
26103828260eSStefano Zampini           } else {
26113828260eSStefano Zampini             printf("%d=(%d %d), ",i,coarse_subdivision[i],coarse_subdivision[i]);
26123828260eSStefano Zampini           }
2613da1bb401SStefano Zampini         printf("\n");*/
26140c7d97c5SJed Brown       }
26150c7d97c5SJed Brown 
26160c7d97c5SJed Brown       /* Scatter new decomposition for send details */
261753cdbc3dSStefano Zampini       ierr = MPI_Scatter(&coarse_subdivision[0],1,MPIU_INT,&rank_coarse_proc_send_to,1,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
26180c7d97c5SJed Brown       /* Scatter receiving details to members of coarse decomposition */
26190c7d97c5SJed Brown       if( coarse_color == 0) {
262053cdbc3dSStefano Zampini         ierr = MPI_Scatter(&total_count_recv[0],1,MPIU_INT,&count_recv,1,MPIU_INT,master_proc,coarse_comm);CHKERRQ(ierr);
26210c7d97c5SJed Brown         ierr = PetscMalloc (count_recv*sizeof(PetscMPIInt),&ranks_recv);CHKERRQ(ierr);
262253cdbc3dSStefano Zampini         ierr = MPI_Scatterv(&total_ranks_recv[0],total_count_recv,displacements_recv,MPIU_INT,&ranks_recv[0],count_recv,MPIU_INT,master_proc,coarse_comm);CHKERRQ(ierr);
26230c7d97c5SJed Brown       }
26240c7d97c5SJed Brown 
2625da1bb401SStefano Zampini       /*printf("I will send my matrix data to proc  %d\n",rank_coarse_proc_send_to);
2626da1bb401SStefano Zampini       if(coarse_color == 0) {
2627da1bb401SStefano Zampini         printf("I will receive some matrix data from %d processes (ranks follows)\n",count_recv);
2628da1bb401SStefano Zampini         for(i=0;i<count_recv;i++)
2629da1bb401SStefano Zampini           printf("%d ",ranks_recv[i]);
2630da1bb401SStefano Zampini         printf("\n");
2631da1bb401SStefano Zampini       }*/
26320c7d97c5SJed Brown 
26330c7d97c5SJed Brown       if(rank_prec_comm == master_proc) {
2634da1bb401SStefano Zampini         /*ierr = PetscFree(coarse_subdivision);CHKERRQ(ierr);
2635da1bb401SStefano Zampini         ierr = PetscFree(total_count_recv);CHKERRQ(ierr);
2636da1bb401SStefano Zampini         ierr = PetscFree(total_ranks_recv);CHKERRQ(ierr);*/
26370c7d97c5SJed Brown         free(coarse_subdivision);
26380c7d97c5SJed Brown         free(total_count_recv);
26390c7d97c5SJed Brown         free(total_ranks_recv);
26400c7d97c5SJed Brown         ierr = PetscFree(displacements_recv);CHKERRQ(ierr);
26410c7d97c5SJed Brown       }
26420c7d97c5SJed Brown       break;
26430c7d97c5SJed Brown     }
26440c7d97c5SJed Brown 
26450c7d97c5SJed Brown     case(REPLICATED_BDDC):
26460c7d97c5SJed Brown 
26470c7d97c5SJed Brown       pcbddc->coarse_communications_type = GATHERS_BDDC;
26480c7d97c5SJed Brown       coarse_mat_type = MATSEQAIJ;
26490c7d97c5SJed Brown       coarse_pc_type  = PCLU;
265053cdbc3dSStefano Zampini       coarse_ksp_type  = KSPPREONLY;
26510c7d97c5SJed Brown       coarse_comm = PETSC_COMM_SELF;
26520c7d97c5SJed Brown       active_rank = rank_prec_comm;
26530c7d97c5SJed Brown       break;
26540c7d97c5SJed Brown 
26550c7d97c5SJed Brown     case(PARALLEL_BDDC):
26560c7d97c5SJed Brown 
26570c7d97c5SJed Brown       pcbddc->coarse_communications_type = SCATTERS_BDDC;
26580c7d97c5SJed Brown       coarse_mat_type = MATMPIAIJ;
26590c7d97c5SJed Brown       coarse_pc_type  = PCREDUNDANT;
266053cdbc3dSStefano Zampini       coarse_ksp_type  = KSPPREONLY;
26610c7d97c5SJed Brown       coarse_comm = prec_comm;
26620c7d97c5SJed Brown       active_rank = rank_prec_comm;
26630c7d97c5SJed Brown       break;
26640c7d97c5SJed Brown 
26650c7d97c5SJed Brown     case(SEQUENTIAL_BDDC):
26660c7d97c5SJed Brown       pcbddc->coarse_communications_type = GATHERS_BDDC;
26670c7d97c5SJed Brown       coarse_mat_type = MATSEQAIJ;
26680c7d97c5SJed Brown       coarse_pc_type = PCLU;
266953cdbc3dSStefano Zampini       coarse_ksp_type  = KSPPREONLY;
26700c7d97c5SJed Brown       coarse_comm = PETSC_COMM_SELF;
26710c7d97c5SJed Brown       active_rank = master_proc;
26720c7d97c5SJed Brown       break;
26730c7d97c5SJed Brown   }
26740c7d97c5SJed Brown 
26750c7d97c5SJed Brown   switch(pcbddc->coarse_communications_type){
26760c7d97c5SJed Brown 
26770c7d97c5SJed Brown     case(SCATTERS_BDDC):
26780c7d97c5SJed Brown       {
26790c7d97c5SJed Brown         if(pcbddc->coarse_problem_type==MULTILEVEL_BDDC) {
26800c7d97c5SJed Brown 
26810c7d97c5SJed Brown           PetscMPIInt send_size;
26820c7d97c5SJed Brown           PetscInt    *aux_ins_indices;
26830c7d97c5SJed Brown           PetscInt    ii,jj;
26840c7d97c5SJed Brown           MPI_Request *requests;
26850c7d97c5SJed Brown 
26860c7d97c5SJed Brown           /* allocate auxiliary space */
26875619798eSStefano Zampini           ierr = PetscMalloc (pcbddc->replicated_primal_size*sizeof(PetscMPIInt),&pcbddc->replicated_local_primal_indices);CHKERRQ(ierr);
26885619798eSStefano Zampini           ierr = MPI_Allgatherv(&pcbddc->local_primal_indices[0],pcbddc->local_primal_size,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,prec_comm);CHKERRQ(ierr);
26890c7d97c5SJed Brown           ierr = PetscMalloc ( pcbddc->coarse_size*sizeof(PetscInt),&aux_ins_indices);CHKERRQ(ierr);
26900c7d97c5SJed Brown           ierr = PetscMemzero(aux_ins_indices,pcbddc->coarse_size*sizeof(PetscInt));CHKERRQ(ierr);
26910c7d97c5SJed Brown           /* allocate storage for message passing */
26920c7d97c5SJed Brown           ierr = PetscMalloc ( (count_recv+1)*sizeof(MPI_Request),&requests);CHKERRQ(ierr);
26930c7d97c5SJed Brown           for(i=0;i<count_recv+1;i++) requests[i]=MPI_REQUEST_NULL;
26940c7d97c5SJed Brown           ierr = PetscMalloc ( count_recv*sizeof(PetscMPIInt),&localsizes2);CHKERRQ(ierr);
26950c7d97c5SJed Brown           ierr = PetscMalloc ( count_recv*sizeof(PetscMPIInt),&localdispl2);CHKERRQ(ierr);
26960c7d97c5SJed Brown           /* fill up quantities */
26970c7d97c5SJed Brown           j=0;
26980c7d97c5SJed Brown           for(i=0;i<count_recv;i++){
26990c7d97c5SJed Brown             ii = ranks_recv[i];
27000c7d97c5SJed Brown             localsizes2[i]=pcbddc->local_primal_sizes[ii]*pcbddc->local_primal_sizes[ii];
27010c7d97c5SJed Brown             localdispl2[i]=j;
27020c7d97c5SJed Brown             j+=localsizes2[i];
27030c7d97c5SJed Brown             jj = pcbddc->local_primal_displacements[ii];
2704da1bb401SStefano Zampini             for(k=0;k<pcbddc->local_primal_sizes[ii];k++) aux_ins_indices[pcbddc->replicated_local_primal_indices[jj+k]]+=1;  /* it counts the coarse subdomains sharing the coarse node */
27050c7d97c5SJed Brown           }
2706da1bb401SStefano Zampini           /*printf("aux_ins_indices 1\n");
2707da1bb401SStefano Zampini           for(i=0;i<pcbddc->coarse_size;i++)
2708da1bb401SStefano Zampini             printf("%d ",aux_ins_indices[i]);
2709da1bb401SStefano Zampini           printf("\n");*/
27100c7d97c5SJed Brown           /* temp_coarse_mat_vals used to store temporarily received matrix values */
27110c7d97c5SJed Brown           ierr = PetscMalloc ( j*sizeof(PetscScalar),&temp_coarse_mat_vals);CHKERRQ(ierr);
27120c7d97c5SJed Brown           /* evaluate how many values I will insert in coarse mat */
27130c7d97c5SJed Brown           ins_local_primal_size=0;
27140c7d97c5SJed Brown           for(i=0;i<pcbddc->coarse_size;i++)
27150c7d97c5SJed Brown             if(aux_ins_indices[i])
27160c7d97c5SJed Brown               ins_local_primal_size++;
27170c7d97c5SJed Brown           /* evaluate indices I will insert in coarse mat */
27180c7d97c5SJed Brown           ierr = PetscMalloc ( ins_local_primal_size*sizeof(PetscInt),&ins_local_primal_indices);CHKERRQ(ierr);
27190c7d97c5SJed Brown           j=0;
27200c7d97c5SJed Brown           for(i=0;i<pcbddc->coarse_size;i++)
27210c7d97c5SJed Brown             if(aux_ins_indices[i])
27220c7d97c5SJed Brown               ins_local_primal_indices[j++]=i;
27230c7d97c5SJed Brown           /* use aux_ins_indices to realize a global to local mapping */
27240c7d97c5SJed Brown           j=0;
27250c7d97c5SJed Brown           for(i=0;i<pcbddc->coarse_size;i++){
27260c7d97c5SJed Brown             if(aux_ins_indices[i]==0){
27270c7d97c5SJed Brown               aux_ins_indices[i]=-1;
27280c7d97c5SJed Brown             } else {
27290c7d97c5SJed Brown               aux_ins_indices[i]=j;
27300c7d97c5SJed Brown               j++;
27310c7d97c5SJed Brown             }
27320c7d97c5SJed Brown           }
27330c7d97c5SJed Brown 
2734da1bb401SStefano Zampini           /*printf("New details localsizes2 localdispl2\n");
2735da1bb401SStefano Zampini           for(i=0;i<count_recv;i++)
2736da1bb401SStefano Zampini             printf("(%d %d) ",localsizes2[i],localdispl2[i]);
2737da1bb401SStefano Zampini           printf("\n");
2738da1bb401SStefano Zampini           printf("aux_ins_indices 2\n");
2739da1bb401SStefano Zampini           for(i=0;i<pcbddc->coarse_size;i++)
2740da1bb401SStefano Zampini             printf("%d ",aux_ins_indices[i]);
2741da1bb401SStefano Zampini           printf("\n");
2742da1bb401SStefano Zampini           printf("ins_local_primal_indices\n");
2743da1bb401SStefano Zampini           for(i=0;i<ins_local_primal_size;i++)
2744da1bb401SStefano Zampini             printf("%d ",ins_local_primal_indices[i]);
2745da1bb401SStefano Zampini           printf("\n");
2746da1bb401SStefano Zampini           printf("coarse_submat_vals\n");
2747da1bb401SStefano Zampini           for(i=0;i<pcbddc->local_primal_size;i++)
2748da1bb401SStefano Zampini             for(j=0;j<pcbddc->local_primal_size;j++)
2749da1bb401SStefano Zampini               printf("(%lf %d %d)\n",coarse_submat_vals[j*pcbddc->local_primal_size+i],pcbddc->local_primal_indices[i],pcbddc->local_primal_indices[j]);
2750da1bb401SStefano Zampini           printf("\n");*/
27510c7d97c5SJed Brown 
27520c7d97c5SJed Brown           /* processes participating in coarse problem receive matrix data from their friends */
275353cdbc3dSStefano Zampini           for(i=0;i<count_recv;i++) ierr = MPI_Irecv(&temp_coarse_mat_vals[localdispl2[i]],localsizes2[i],MPIU_SCALAR,ranks_recv[i],666,prec_comm,&requests[i]);CHKERRQ(ierr);
27540c7d97c5SJed Brown           if(rank_coarse_proc_send_to != MPI_PROC_NULL ) {
27550c7d97c5SJed Brown             send_size=pcbddc->local_primal_size*pcbddc->local_primal_size;
275653cdbc3dSStefano Zampini             ierr = MPI_Isend(&coarse_submat_vals[0],send_size,MPIU_SCALAR,rank_coarse_proc_send_to,666,prec_comm,&requests[count_recv]);CHKERRQ(ierr);
27570c7d97c5SJed Brown           }
275853cdbc3dSStefano Zampini           ierr = MPI_Waitall(count_recv+1,requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
27590c7d97c5SJed Brown 
2760da1bb401SStefano Zampini           /*if(coarse_color == 0) {
2761da1bb401SStefano Zampini             printf("temp_coarse_mat_vals\n");
2762da1bb401SStefano Zampini             for(k=0;k<count_recv;k++){
2763da1bb401SStefano Zampini               printf("---- %d ----\n",ranks_recv[k]);
2764da1bb401SStefano Zampini               for(i=0;i<pcbddc->local_primal_sizes[ranks_recv[k]];i++)
2765da1bb401SStefano Zampini                 for(j=0;j<pcbddc->local_primal_sizes[ranks_recv[k]];j++)
2766da1bb401SStefano Zampini                   printf("(%lf %d %d)\n",temp_coarse_mat_vals[localdispl2[k]+j*pcbddc->local_primal_sizes[ranks_recv[k]]+i],pcbddc->replicated_local_primal_indices[pcbddc->local_primal_displacements[ranks_recv[k]]+i],pcbddc->replicated_local_primal_indices[pcbddc->local_primal_displacements[ranks_recv[k]]+j]);
2767da1bb401SStefano Zampini               printf("\n");
2768da1bb401SStefano Zampini             }
2769da1bb401SStefano Zampini           }*/
27700c7d97c5SJed Brown           /* calculate data to insert in coarse mat */
27710c7d97c5SJed Brown           ierr = PetscMalloc ( ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar),&ins_coarse_mat_vals);CHKERRQ(ierr);
27720c7d97c5SJed Brown           PetscMemzero(ins_coarse_mat_vals,ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar));
27730c7d97c5SJed Brown 
27740c7d97c5SJed Brown           PetscMPIInt rr,kk,lps,lpd;
27750c7d97c5SJed Brown           PetscInt row_ind,col_ind;
27760c7d97c5SJed Brown           for(k=0;k<count_recv;k++){
27770c7d97c5SJed Brown             rr = ranks_recv[k];
27780c7d97c5SJed Brown             kk = localdispl2[k];
27790c7d97c5SJed Brown             lps = pcbddc->local_primal_sizes[rr];
27800c7d97c5SJed Brown             lpd = pcbddc->local_primal_displacements[rr];
2781da1bb401SStefano Zampini             /*printf("Inserting the following indices (received from %d)\n",rr);*/
27820c7d97c5SJed Brown             for(j=0;j<lps;j++){
27830c7d97c5SJed Brown               col_ind=aux_ins_indices[pcbddc->replicated_local_primal_indices[lpd+j]];
27840c7d97c5SJed Brown               for(i=0;i<lps;i++){
27850c7d97c5SJed Brown                 row_ind=aux_ins_indices[pcbddc->replicated_local_primal_indices[lpd+i]];
2786da1bb401SStefano Zampini                 /*printf("%d %d\n",row_ind,col_ind);*/
27870c7d97c5SJed Brown                 ins_coarse_mat_vals[col_ind*ins_local_primal_size+row_ind]+=temp_coarse_mat_vals[kk+j*lps+i];
27880c7d97c5SJed Brown               }
27890c7d97c5SJed Brown             }
27900c7d97c5SJed Brown           }
27910c7d97c5SJed Brown           ierr = PetscFree(requests);CHKERRQ(ierr);
27920c7d97c5SJed Brown           ierr = PetscFree(aux_ins_indices);CHKERRQ(ierr);
27930c7d97c5SJed Brown           ierr = PetscFree(temp_coarse_mat_vals);CHKERRQ(ierr);
27940c7d97c5SJed Brown           if(coarse_color == 0) { ierr = PetscFree(ranks_recv);CHKERRQ(ierr); }
27950c7d97c5SJed Brown 
27960c7d97c5SJed Brown           /* create local to global mapping needed by coarse MATIS */
27970c7d97c5SJed Brown           {
27980c7d97c5SJed Brown             IS coarse_IS;
279953cdbc3dSStefano Zampini             if(coarse_comm != MPI_COMM_NULL ) ierr = MPI_Comm_free(&coarse_comm);CHKERRQ(ierr);
28000c7d97c5SJed Brown             coarse_comm = prec_comm;
28010c7d97c5SJed Brown             active_rank=rank_prec_comm;
28020c7d97c5SJed Brown             ierr = ISCreateGeneral(coarse_comm,ins_local_primal_size,ins_local_primal_indices,PETSC_COPY_VALUES,&coarse_IS);CHKERRQ(ierr);
28030c7d97c5SJed Brown             ierr = ISLocalToGlobalMappingCreateIS(coarse_IS,&coarse_ISLG);CHKERRQ(ierr);
28040c7d97c5SJed Brown             ierr = ISDestroy(&coarse_IS);CHKERRQ(ierr);
28050c7d97c5SJed Brown           }
28060c7d97c5SJed Brown         }
28070c7d97c5SJed Brown         if(pcbddc->coarse_problem_type==PARALLEL_BDDC) {
28080c7d97c5SJed Brown           /* arrays for values insertion */
28090c7d97c5SJed Brown           ins_local_primal_size = pcbddc->local_primal_size;
28100c7d97c5SJed Brown           ierr = PetscMalloc ( ins_local_primal_size*sizeof(PetscMPIInt),&ins_local_primal_indices);CHKERRQ(ierr);
28110c7d97c5SJed Brown           ierr = PetscMalloc ( ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar),&ins_coarse_mat_vals);CHKERRQ(ierr);
28120c7d97c5SJed Brown           for(j=0;j<ins_local_primal_size;j++){
28130c7d97c5SJed Brown             ins_local_primal_indices[j]=pcbddc->local_primal_indices[j];
28140c7d97c5SJed Brown             for(i=0;i<ins_local_primal_size;i++) ins_coarse_mat_vals[j*ins_local_primal_size+i]=coarse_submat_vals[j*ins_local_primal_size+i];
28150c7d97c5SJed Brown           }
28160c7d97c5SJed Brown         }
28170c7d97c5SJed Brown         break;
28180c7d97c5SJed Brown 
28190c7d97c5SJed Brown     }
28200c7d97c5SJed Brown 
28210c7d97c5SJed Brown     case(GATHERS_BDDC):
28220c7d97c5SJed Brown       {
28230c7d97c5SJed Brown 
28240c7d97c5SJed Brown         PetscMPIInt mysize,mysize2;
28250c7d97c5SJed Brown 
28260c7d97c5SJed Brown         if(rank_prec_comm==active_rank) {
28270c7d97c5SJed Brown           ierr = PetscMalloc ( pcbddc->replicated_primal_size*sizeof(PetscMPIInt),&pcbddc->replicated_local_primal_indices);CHKERRQ(ierr);
28280c7d97c5SJed Brown           pcbddc->replicated_local_primal_values = (PetscScalar*)calloc(pcbddc->replicated_primal_size,sizeof(PetscScalar));
28290c7d97c5SJed Brown           ierr = PetscMalloc ( size_prec_comm*sizeof(PetscMPIInt),&localsizes2);CHKERRQ(ierr);
28300c7d97c5SJed Brown           ierr = PetscMalloc ( size_prec_comm*sizeof(PetscMPIInt),&localdispl2);CHKERRQ(ierr);
28310c7d97c5SJed Brown           /* arrays for values insertion */
28320c7d97c5SJed Brown           ins_local_primal_size = pcbddc->coarse_size;
28330c7d97c5SJed Brown           ierr = PetscMalloc ( ins_local_primal_size*sizeof(PetscMPIInt),&ins_local_primal_indices);CHKERRQ(ierr);
28340c7d97c5SJed Brown           ierr = PetscMalloc ( ins_local_primal_size*ins_local_primal_size*sizeof(PetscScalar),&ins_coarse_mat_vals);CHKERRQ(ierr);
28350c7d97c5SJed Brown           for(i=0;i<size_prec_comm;i++) localsizes2[i]=pcbddc->local_primal_sizes[i]*pcbddc->local_primal_sizes[i];
28360c7d97c5SJed Brown           localdispl2[0]=0;
28370c7d97c5SJed Brown           for(i=1;i<size_prec_comm;i++) localdispl2[i]=localsizes2[i-1]+localdispl2[i-1];
28380c7d97c5SJed Brown           j=0;
28390c7d97c5SJed Brown           for(i=0;i<size_prec_comm;i++) j+=localsizes2[i];
28400c7d97c5SJed Brown           ierr = PetscMalloc ( j*sizeof(PetscScalar),&temp_coarse_mat_vals);CHKERRQ(ierr);
28410c7d97c5SJed Brown         }
28420c7d97c5SJed Brown 
28430c7d97c5SJed Brown         mysize=pcbddc->local_primal_size;
28440c7d97c5SJed Brown         mysize2=pcbddc->local_primal_size*pcbddc->local_primal_size;
28450c7d97c5SJed Brown         if(pcbddc->coarse_problem_type == SEQUENTIAL_BDDC){
284653cdbc3dSStefano Zampini           ierr = MPI_Gatherv(&pcbddc->local_primal_indices[0],mysize,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,master_proc,prec_comm);CHKERRQ(ierr);
284753cdbc3dSStefano Zampini           ierr = MPI_Gatherv(&coarse_submat_vals[0],mysize2,MPIU_SCALAR,&temp_coarse_mat_vals[0],localsizes2,localdispl2,MPIU_SCALAR,master_proc,prec_comm);CHKERRQ(ierr);
28480c7d97c5SJed Brown         } else {
284953cdbc3dSStefano Zampini           ierr = MPI_Allgatherv(&pcbddc->local_primal_indices[0],mysize,MPIU_INT,&pcbddc->replicated_local_primal_indices[0],pcbddc->local_primal_sizes,pcbddc->local_primal_displacements,MPIU_INT,prec_comm);CHKERRQ(ierr);
285053cdbc3dSStefano Zampini           ierr = MPI_Allgatherv(&coarse_submat_vals[0],mysize2,MPIU_SCALAR,&temp_coarse_mat_vals[0],localsizes2,localdispl2,MPIU_SCALAR,prec_comm);CHKERRQ(ierr);
28510c7d97c5SJed Brown         }
28520c7d97c5SJed Brown 
28530c7d97c5SJed Brown   /* free data structures no longer needed and allocate some space which will be needed in BDDC application */
28540c7d97c5SJed Brown         if(rank_prec_comm==active_rank) {
28550c7d97c5SJed Brown           PetscInt offset,offset2,row_ind,col_ind;
28560c7d97c5SJed Brown           for(j=0;j<ins_local_primal_size;j++){
28570c7d97c5SJed Brown             ins_local_primal_indices[j]=j;
28580c7d97c5SJed Brown             for(i=0;i<ins_local_primal_size;i++) ins_coarse_mat_vals[j*ins_local_primal_size+i]=0.0;
28590c7d97c5SJed Brown           }
28600c7d97c5SJed Brown           for(k=0;k<size_prec_comm;k++){
28610c7d97c5SJed Brown             offset=pcbddc->local_primal_displacements[k];
28620c7d97c5SJed Brown             offset2=localdispl2[k];
28630c7d97c5SJed Brown             for(j=0;j<pcbddc->local_primal_sizes[k];j++){
28640c7d97c5SJed Brown               col_ind=pcbddc->replicated_local_primal_indices[offset+j];
28650c7d97c5SJed Brown               for(i=0;i<pcbddc->local_primal_sizes[k];i++){
28660c7d97c5SJed Brown                 row_ind=pcbddc->replicated_local_primal_indices[offset+i];
28670c7d97c5SJed Brown                 ins_coarse_mat_vals[col_ind*pcbddc->coarse_size+row_ind]+=temp_coarse_mat_vals[offset2+j*pcbddc->local_primal_sizes[k]+i];
28680c7d97c5SJed Brown               }
28690c7d97c5SJed Brown             }
28700c7d97c5SJed Brown           }
28710c7d97c5SJed Brown         }
28720c7d97c5SJed Brown         break;
2873da1bb401SStefano Zampini       }/* switch on coarse problem and communications associated with finished */
28740c7d97c5SJed Brown   }
28750c7d97c5SJed Brown 
28760c7d97c5SJed Brown   /* Now create and fill up coarse matrix */
28770c7d97c5SJed Brown   if( rank_prec_comm == active_rank ) {
28780c7d97c5SJed Brown     if(pcbddc->coarse_problem_type != MULTILEVEL_BDDC) {
28790c7d97c5SJed Brown       ierr = MatCreate(coarse_comm,&pcbddc->coarse_mat);CHKERRQ(ierr);
28800c7d97c5SJed Brown       ierr = MatSetSizes(pcbddc->coarse_mat,PETSC_DECIDE,PETSC_DECIDE,pcbddc->coarse_size,pcbddc->coarse_size);CHKERRQ(ierr);
28810c7d97c5SJed Brown       ierr = MatSetType(pcbddc->coarse_mat,coarse_mat_type);CHKERRQ(ierr);
28823b03a366Sstefano_zampini       ierr = MatSetUp(pcbddc->coarse_mat);CHKERRQ(ierr);
2883da1bb401SStefano Zampini       ierr = MatSetOption(pcbddc->coarse_mat,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr); /* local values stored in column major */
28843b03a366Sstefano_zampini       ierr = MatSetOption(pcbddc->coarse_mat,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr);
28850c7d97c5SJed Brown     } else {
28860c7d97c5SJed Brown       Mat matis_coarse_local_mat;
2887d3ee2243SStefano Zampini       /* remind bs */
2888d3ee2243SStefano Zampini       ierr = MatCreateIS(coarse_comm,bs,PETSC_DECIDE,PETSC_DECIDE,pcbddc->coarse_size,pcbddc->coarse_size,coarse_ISLG,&pcbddc->coarse_mat);CHKERRQ(ierr);
28893b03a366Sstefano_zampini       ierr = MatSetUp(pcbddc->coarse_mat);CHKERRQ(ierr);
28900c7d97c5SJed Brown       ierr = MatISGetLocalMat(pcbddc->coarse_mat,&matis_coarse_local_mat);CHKERRQ(ierr);
28913b03a366Sstefano_zampini       ierr = MatSetUp(matis_coarse_local_mat);CHKERRQ(ierr);
2892da1bb401SStefano Zampini       ierr = MatSetOption(matis_coarse_local_mat,MAT_ROW_ORIENTED,PETSC_FALSE);CHKERRQ(ierr); /* local values stored in column major */
2893a0ba757dSStefano Zampini       ierr = MatSetOption(matis_coarse_local_mat,MAT_IGNORE_ZERO_ENTRIES,PETSC_TRUE);CHKERRQ(ierr);
28940c7d97c5SJed Brown     }
2895a0ba757dSStefano Zampini     ierr = MatSetOption(pcbddc->coarse_mat,MAT_NEW_NONZERO_LOCATION_ERR,PETSC_FALSE);CHKERRQ(ierr);
28960c7d97c5SJed Brown     ierr = MatSetValues(pcbddc->coarse_mat,ins_local_primal_size,ins_local_primal_indices,ins_local_primal_size,ins_local_primal_indices,ins_coarse_mat_vals,ADD_VALUES);CHKERRQ(ierr);
28970c7d97c5SJed Brown     ierr = MatAssemblyBegin(pcbddc->coarse_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
28980c7d97c5SJed Brown     ierr = MatAssemblyEnd(pcbddc->coarse_mat,MAT_FINAL_ASSEMBLY);CHKERRQ(ierr);
28990c7d97c5SJed Brown 
2900da1bb401SStefano Zampini     /*  PetscViewer view_out;
2901da1bb401SStefano Zampini       ierr = PetscViewerASCIIOpen(PETSC_COMM_SELF,"coarsematfull.m",&view_out);CHKERRQ(ierr);
2902da1bb401SStefano Zampini       ierr = PetscViewerSetFormat(view_out,PETSC_VIEWER_ASCII_MATLAB);CHKERRQ(ierr);
2903da1bb401SStefano Zampini       ierr = MatView(pcbddc->coarse_mat,view_out);CHKERRQ(ierr);
2904da1bb401SStefano Zampini       ierr = PetscViewerDestroy(&view_out);CHKERRQ(ierr);*/
2905da1bb401SStefano Zampini 
29060c7d97c5SJed Brown     ierr = MatGetVecs(pcbddc->coarse_mat,&pcbddc->coarse_vec,&pcbddc->coarse_rhs);CHKERRQ(ierr);
29070c7d97c5SJed Brown     /* Preconditioner for coarse problem */
290853cdbc3dSStefano Zampini     ierr = KSPCreate(coarse_comm,&pcbddc->coarse_ksp);CHKERRQ(ierr);
290953cdbc3dSStefano Zampini     ierr = PetscObjectIncrementTabLevel((PetscObject)pcbddc->coarse_ksp,(PetscObject)pc,1);CHKERRQ(ierr);
291053cdbc3dSStefano Zampini     ierr = KSPSetOperators(pcbddc->coarse_ksp,pcbddc->coarse_mat,pcbddc->coarse_mat,SAME_PRECONDITIONER);CHKERRQ(ierr);
29113b03a366Sstefano_zampini     ierr = KSPSetTolerances(pcbddc->coarse_ksp,PETSC_DEFAULT,PETSC_DEFAULT,PETSC_DEFAULT,max_it_coarse_ksp);CHKERRQ(ierr);
291253cdbc3dSStefano Zampini     ierr = KSPSetType(pcbddc->coarse_ksp,coarse_ksp_type);CHKERRQ(ierr);
291353cdbc3dSStefano Zampini     ierr = KSPGetPC(pcbddc->coarse_ksp,&pc_temp);CHKERRQ(ierr);
291453cdbc3dSStefano Zampini     ierr = PCSetType(pc_temp,coarse_pc_type);CHKERRQ(ierr);
29150c7d97c5SJed Brown     /* Allow user's customization */
2916da1bb401SStefano Zampini     ierr = KSPSetOptionsPrefix(pcbddc->coarse_ksp,"coarse_");CHKERRQ(ierr);
291753cdbc3dSStefano Zampini     ierr = KSPSetFromOptions(pcbddc->coarse_ksp);CHKERRQ(ierr);
29180c7d97c5SJed Brown     /* Set Up PC for coarse problem BDDC */
291953cdbc3dSStefano Zampini     if(pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
2920e269702eSStefano Zampini       if(dbg_flag) {
2921e269702eSStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"----------------Setting up a new level---------------\n");CHKERRQ(ierr);
2922e269702eSStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
2923e269702eSStefano Zampini       }
292453cdbc3dSStefano Zampini       ierr = PCBDDCSetCoarseProblemType(pc_temp,MULTILEVEL_BDDC);CHKERRQ(ierr);
292553cdbc3dSStefano Zampini     }
292653cdbc3dSStefano Zampini     ierr = KSPSetUp(pcbddc->coarse_ksp);CHKERRQ(ierr);
29275619798eSStefano Zampini     if(pcbddc->coarse_problem_type == MULTILEVEL_BDDC) {
29285619798eSStefano Zampini       if(dbg_flag) {
29295619798eSStefano Zampini         ierr = PetscViewerASCIIPrintf(viewer,"----------------New level set------------------------\n");CHKERRQ(ierr);
29305619798eSStefano Zampini         ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
29315619798eSStefano Zampini       }
29325619798eSStefano Zampini     }
29330c7d97c5SJed Brown   }
29340c7d97c5SJed Brown   if(pcbddc->coarse_communications_type == SCATTERS_BDDC) {
29350c7d97c5SJed Brown      IS local_IS,global_IS;
29360c7d97c5SJed Brown      ierr = ISCreateStride(PETSC_COMM_SELF,pcbddc->local_primal_size,0,1,&local_IS);CHKERRQ(ierr);
29370c7d97c5SJed Brown      ierr = ISCreateGeneral(PETSC_COMM_SELF,pcbddc->local_primal_size,pcbddc->local_primal_indices,PETSC_COPY_VALUES,&global_IS);CHKERRQ(ierr);
29380c7d97c5SJed Brown      ierr = VecScatterCreate(pcbddc->vec1_P,local_IS,pcbddc->coarse_vec,global_IS,&pcbddc->coarse_loc_to_glob);CHKERRQ(ierr);
29390c7d97c5SJed Brown      ierr = ISDestroy(&local_IS);CHKERRQ(ierr);
29400c7d97c5SJed Brown      ierr = ISDestroy(&global_IS);CHKERRQ(ierr);
29410c7d97c5SJed Brown   }
29420c7d97c5SJed Brown 
29430c7d97c5SJed Brown 
29443b03a366Sstefano_zampini   /* Evaluate condition number of coarse problem for cheby (and verbose output if requested) */
29453b03a366Sstefano_zampini   if( pcbddc->coarse_problem_type == MULTILEVEL_BDDC && rank_prec_comm == active_rank ) {
29460c7d97c5SJed Brown     PetscScalar m_one=-1.0;
29475619798eSStefano Zampini     PetscReal   infty_error,lambda_min,lambda_max,kappa_2;
29483b03a366Sstefano_zampini     const KSPType check_ksp_type=KSPGMRES;
29490c7d97c5SJed Brown 
29505619798eSStefano Zampini     /* change coarse ksp object to an iterative method suitable for extreme eigenvalues' estimation */
29513b03a366Sstefano_zampini     ierr = KSPSetType(pcbddc->coarse_ksp,check_ksp_type);CHKERRQ(ierr);
2952d49ef151SStefano Zampini     ierr = KSPSetComputeSingularValues(pcbddc->coarse_ksp,PETSC_TRUE);CHKERRQ(ierr);
29535619798eSStefano Zampini     ierr = KSPSetTolerances(pcbddc->coarse_ksp,1.e-8,1.e-8,PETSC_DEFAULT,pcbddc->coarse_size);CHKERRQ(ierr);
29545619798eSStefano Zampini     ierr = KSPSetUp(pcbddc->coarse_ksp);CHKERRQ(ierr);
2955d49ef151SStefano Zampini     ierr = VecSetRandom(pcbddc->coarse_rhs,PETSC_NULL);CHKERRQ(ierr);
2956d49ef151SStefano Zampini     ierr = MatMult(pcbddc->coarse_mat,pcbddc->coarse_rhs,pcbddc->coarse_vec);CHKERRQ(ierr);
2957d49ef151SStefano Zampini     ierr = MatMult(pcbddc->coarse_mat,pcbddc->coarse_vec,pcbddc->coarse_rhs);CHKERRQ(ierr);
2958d49ef151SStefano Zampini     ierr = KSPSolve(pcbddc->coarse_ksp,pcbddc->coarse_rhs,pcbddc->coarse_rhs);CHKERRQ(ierr);
2959d49ef151SStefano Zampini     ierr = KSPComputeExtremeSingularValues(pcbddc->coarse_ksp,&lambda_max,&lambda_min);CHKERRQ(ierr);
29603b03a366Sstefano_zampini     if(dbg_flag) {
29615619798eSStefano Zampini       kappa_2=lambda_max/lambda_min;
29625619798eSStefano Zampini       ierr = KSPGetIterationNumber(pcbddc->coarse_ksp,&k);CHKERRQ(ierr);
2963d49ef151SStefano Zampini       ierr = VecAXPY(pcbddc->coarse_rhs,m_one,pcbddc->coarse_vec);CHKERRQ(ierr);
2964d49ef151SStefano Zampini       ierr = VecNorm(pcbddc->coarse_rhs,NORM_INFINITY,&infty_error);CHKERRQ(ierr);
29653b03a366Sstefano_zampini       ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem condition number estimated with %d iterations of %s is: % 1.14e\n",k,check_ksp_type,kappa_2);CHKERRQ(ierr);
2966e269702eSStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem eigenvalues: % 1.14e %1.14e\n",lambda_min,lambda_max);CHKERRQ(ierr);
2967e269702eSStefano Zampini       ierr = PetscViewerASCIIPrintf(viewer,"Coarse problem infty_error: %1.14e\n",infty_error);CHKERRQ(ierr);
29683b03a366Sstefano_zampini     }
29695619798eSStefano Zampini     /* restore coarse ksp to default values */
2970d49ef151SStefano Zampini     ierr = KSPSetComputeSingularValues(pcbddc->coarse_ksp,PETSC_FALSE);CHKERRQ(ierr);
29715619798eSStefano Zampini     ierr = KSPSetType(pcbddc->coarse_ksp,coarse_ksp_type);CHKERRQ(ierr);
29726c9de887SHong Zhang     ierr = KSPChebyshevSetEigenvalues(pcbddc->coarse_ksp,lambda_max,lambda_min);CHKERRQ(ierr);
29733b03a366Sstefano_zampini     ierr = KSPSetTolerances(pcbddc->coarse_ksp,PETSC_DEFAULT,PETSC_DEFAULT,PETSC_DEFAULT,max_it_coarse_ksp);CHKERRQ(ierr);
29745619798eSStefano Zampini     ierr = KSPSetFromOptions(pcbddc->coarse_ksp);CHKERRQ(ierr);
29755619798eSStefano Zampini     ierr = KSPSetUp(pcbddc->coarse_ksp);CHKERRQ(ierr);
297653cdbc3dSStefano Zampini   }
29770c7d97c5SJed Brown 
29780c7d97c5SJed Brown   /* free data structures no longer needed */
29790c7d97c5SJed Brown   if(coarse_ISLG)                { ierr = ISLocalToGlobalMappingDestroy(&coarse_ISLG);CHKERRQ(ierr); }
29800c7d97c5SJed Brown   if(ins_local_primal_indices)   { ierr = PetscFree(ins_local_primal_indices);CHKERRQ(ierr);  }
29810c7d97c5SJed Brown   if(ins_coarse_mat_vals)        { ierr = PetscFree(ins_coarse_mat_vals);CHKERRQ(ierr);}
29820c7d97c5SJed Brown   if(localsizes2)                { ierr = PetscFree(localsizes2);CHKERRQ(ierr);}
29830c7d97c5SJed Brown   if(localdispl2)                { ierr = PetscFree(localdispl2);CHKERRQ(ierr);}
29840c7d97c5SJed Brown   if(temp_coarse_mat_vals)       { ierr = PetscFree(temp_coarse_mat_vals);CHKERRQ(ierr);}
29850c7d97c5SJed Brown 
29860c7d97c5SJed Brown   PetscFunctionReturn(0);
29870c7d97c5SJed Brown }
29880c7d97c5SJed Brown 
29890c7d97c5SJed Brown #undef __FUNCT__
29900c7d97c5SJed Brown #define __FUNCT__ "PCBDDCManageLocalBoundaries"
299153cdbc3dSStefano Zampini static PetscErrorCode PCBDDCManageLocalBoundaries(PC pc)
29920c7d97c5SJed Brown {
29930c7d97c5SJed Brown 
29940c7d97c5SJed Brown   PC_BDDC     *pcbddc = (PC_BDDC*)pc->data;
29950c7d97c5SJed Brown   PC_IS         *pcis = (PC_IS*)pc->data;
29960c7d97c5SJed Brown   Mat_IS      *matis  = (Mat_IS*)pc->pmat->data;
2997da1bb401SStefano Zampini   PCBDDCGraph mat_graph=pcbddc->mat_graph;
29983972b0daSStefano Zampini   PetscInt    *queue_in_global_numbering,*is_indices,*auxis;
29993b03a366Sstefano_zampini   PetscInt    bs,ierr,i,j,s,k,iindex,neumann_bsize,dirichlet_bsize;
3000da1bb401SStefano Zampini   PetscInt    total_counts,nodes_touched,where_values=1,vertex_size;
3001534831adSStefano Zampini   PetscMPIInt adapt_interface=0,adapt_interface_reduced=0,NEUMANNCNT=0;
3002da1bb401SStefano Zampini   PetscBool   same_set;
3003a0ba757dSStefano Zampini   MPI_Comm    interface_comm=((PetscObject)pc)->comm;
30043b03a366Sstefano_zampini   PetscBool   use_faces=PETSC_FALSE,use_edges=PETSC_FALSE;
30053b03a366Sstefano_zampini   const PetscInt *neumann_nodes;
30063b03a366Sstefano_zampini   const PetscInt *dirichlet_nodes;
3007a81d60d8SStefano Zampini   IS          used_IS,*custom_ISForDofs;
3008da1bb401SStefano Zampini   PetscScalar *array;
3009da1bb401SStefano Zampini   PetscScalar *array2;
3010da1bb401SStefano Zampini   PetscViewer viewer=pcbddc->dbg_viewer;
30110c7d97c5SJed Brown 
30120c7d97c5SJed Brown   PetscFunctionBegin;
3013da1bb401SStefano Zampini   /* Setup local adjacency graph */
3014da1bb401SStefano Zampini   mat_graph->nvtxs=pcis->n;
3015534831adSStefano Zampini   if(!mat_graph->xadj) { NEUMANNCNT = 1; }
3016da1bb401SStefano Zampini   ierr = PCBDDCSetupLocalAdjacencyGraph(pc);CHKERRQ(ierr);
3017a0ba757dSStefano Zampini   i = mat_graph->nvtxs;
3018a0ba757dSStefano Zampini   ierr = PetscMalloc4(i,PetscInt,&mat_graph->where,i,PetscInt,&mat_graph->count,i+1,PetscInt,&mat_graph->cptr,i,PetscInt,&mat_graph->queue);CHKERRQ(ierr);
30193972b0daSStefano Zampini   ierr = PetscMalloc2(i,PetscInt,&mat_graph->which_dof,i,PetscBool,&mat_graph->touched);CHKERRQ(ierr);
30203972b0daSStefano Zampini   ierr = PetscMalloc(i*sizeof(PetscInt),&queue_in_global_numbering);CHKERRQ(ierr);
3021a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->where,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
3022a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->count,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
3023a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->which_dof,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
3024a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->queue,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
30253828260eSStefano Zampini   ierr = PetscMemzero(mat_graph->cptr,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr);
3026a0ba757dSStefano Zampini 
3027a81d60d8SStefano Zampini   /* Setting dofs splitting in mat_graph->which_dof
3028a81d60d8SStefano Zampini      Get information about dofs' splitting if provided by the user
3029a81d60d8SStefano Zampini      Otherwise it assumes a constant block size */
3030a81d60d8SStefano Zampini   vertex_size=0;
3031a81d60d8SStefano Zampini   if(!pcbddc->n_ISForDofs) {
3032a81d60d8SStefano Zampini     ierr = MatGetBlockSize(matis->A,&bs);CHKERRQ(ierr);
3033a81d60d8SStefano Zampini     ierr = PetscMalloc(bs*sizeof(IS),&custom_ISForDofs);CHKERRQ(ierr);
3034a81d60d8SStefano Zampini     for(i=0;i<bs;i++) {
3035a81d60d8SStefano Zampini       ierr = ISCreateStride(PETSC_COMM_SELF,pcis->n/bs,i,bs,&custom_ISForDofs[i]);CHKERRQ(ierr);
3036a81d60d8SStefano Zampini     }
3037a81d60d8SStefano Zampini     ierr = PCBDDCSetDofsSplitting(pc,bs,custom_ISForDofs);CHKERRQ(ierr);
3038a81d60d8SStefano Zampini     vertex_size=1;
3039a81d60d8SStefano Zampini     /* remove my references to IS objects */
3040a81d60d8SStefano Zampini     for(i=0;i<bs;i++) {
3041a81d60d8SStefano Zampini       ierr = ISDestroy(&custom_ISForDofs[i]);CHKERRQ(ierr);
3042a81d60d8SStefano Zampini     }
3043a81d60d8SStefano Zampini     ierr = PetscFree(custom_ISForDofs);CHKERRQ(ierr);
3044a81d60d8SStefano Zampini   }
30459c0446d6SStefano Zampini   for(i=0;i<pcbddc->n_ISForDofs;i++) {
3046a81d60d8SStefano Zampini     ierr = ISGetSize(pcbddc->ISForDofs[i],&k);CHKERRQ(ierr);
30479c0446d6SStefano Zampini     ierr = ISGetIndices(pcbddc->ISForDofs[i],(const PetscInt**)&is_indices);CHKERRQ(ierr);
3048a81d60d8SStefano Zampini     for(j=0;j<k;j++) {
30499c0446d6SStefano Zampini       mat_graph->which_dof[is_indices[j]]=i;
30509c0446d6SStefano Zampini     }
30519c0446d6SStefano Zampini     ierr = ISRestoreIndices(pcbddc->ISForDofs[i],(const PetscInt**)&is_indices);CHKERRQ(ierr);
30529c0446d6SStefano Zampini   }
3053a81d60d8SStefano Zampini   /* use mat block size as vertex size if it has not yet been set */
3054a81d60d8SStefano Zampini   if(!vertex_size) {
30553b03a366Sstefano_zampini     ierr = MatGetBlockSize(matis->A,&vertex_size);CHKERRQ(ierr);
30560c7d97c5SJed Brown   }
3057a81d60d8SStefano Zampini 
30583b03a366Sstefano_zampini   /* count number of neigh per node */
30590c7d97c5SJed Brown   total_counts=0;
30603b03a366Sstefano_zampini   for(i=1;i<pcis->n_neigh;i++){
30610c7d97c5SJed Brown     s=pcis->n_shared[i];
30620c7d97c5SJed Brown     total_counts+=s;
306353cdbc3dSStefano Zampini     for(j=0;j<s;j++){
30640c7d97c5SJed Brown       mat_graph->count[pcis->shared[i][j]] += 1;
30650c7d97c5SJed Brown     }
30660c7d97c5SJed Brown   }
3067534831adSStefano Zampini   /* Take into account Neumann data -> it increments number of sharing subdomains for nodes lying on the interface */
306836e030ebSStefano Zampini   ierr = PCBDDCGetNeumannBoundaries(pc,&used_IS);CHKERRQ(ierr);
3069da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_N,0.0);CHKERRQ(ierr);
3070da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
307136e030ebSStefano Zampini   if(used_IS) {
307236e030ebSStefano Zampini     ierr = ISGetSize(used_IS,&neumann_bsize);CHKERRQ(ierr);
307336e030ebSStefano Zampini     ierr = ISGetIndices(used_IS,&neumann_nodes);CHKERRQ(ierr);
307453cdbc3dSStefano Zampini     for(i=0;i<neumann_bsize;i++){
307553cdbc3dSStefano Zampini       iindex = neumann_nodes[i];
3076534831adSStefano Zampini       if(mat_graph->count[iindex] > NEUMANNCNT && array[iindex]==0.0){
307753cdbc3dSStefano Zampini         mat_graph->count[iindex]+=1;
30780c7d97c5SJed Brown         total_counts++;
3079da1bb401SStefano Zampini         array[iindex]=array[iindex]+1.0;
3080da1bb401SStefano Zampini       } else if(array[iindex]>0.0) {
3081da1bb401SStefano Zampini         SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"Error for neumann nodes provided to BDDC! They must be uniquely listed! Found duplicate node %d\n",iindex);
30820c7d97c5SJed Brown       }
30830c7d97c5SJed Brown     }
30840c7d97c5SJed Brown   }
3085da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3086da1bb401SStefano Zampini   /* allocate space for storing the set of neighbours for each node */
3087da1bb401SStefano Zampini   ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt*),&mat_graph->neighbours_set);CHKERRQ(ierr);
3088da1bb401SStefano Zampini   if(mat_graph->nvtxs) { ierr = PetscMalloc(total_counts*sizeof(PetscInt),&mat_graph->neighbours_set[0]);CHKERRQ(ierr); }
3089da1bb401SStefano Zampini   for(i=1;i<mat_graph->nvtxs;i++) mat_graph->neighbours_set[i]=mat_graph->neighbours_set[i-1]+mat_graph->count[i-1];
3090a0ba757dSStefano Zampini   ierr = PetscMemzero(mat_graph->count,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
30913b03a366Sstefano_zampini   for(i=1;i<pcis->n_neigh;i++){
30920c7d97c5SJed Brown     s=pcis->n_shared[i];
30930c7d97c5SJed Brown     for(j=0;j<s;j++) {
30940c7d97c5SJed Brown       k=pcis->shared[i][j];
3095da1bb401SStefano Zampini       mat_graph->neighbours_set[k][mat_graph->count[k]] = pcis->neigh[i];
30960c7d97c5SJed Brown       mat_graph->count[k]+=1;
30970c7d97c5SJed Brown     }
30980c7d97c5SJed Brown   }
3099da1bb401SStefano Zampini   /* Check consistency of Neumann nodes */
3100da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
3101da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3102da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3103da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3104da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3105da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
31063b03a366Sstefano_zampini   /* set -1 fake neighbour to mimic Neumann boundary */
310736e030ebSStefano Zampini   if(used_IS) {
310853cdbc3dSStefano Zampini     for(i=0;i<neumann_bsize;i++){
310953cdbc3dSStefano Zampini       iindex = neumann_nodes[i];
3110534831adSStefano Zampini       if(mat_graph->count[iindex] > NEUMANNCNT){
3111da1bb401SStefano Zampini         if(mat_graph->count[iindex]+1 != (PetscInt)array[iindex]) {
3112da1bb401SStefano Zampini           SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_USER,"Neumann nodes provided to BDDC must be consistent among neighbours!\nNode %d: number of sharing subdomains %d != number of subdomains for which it is a neumann node %d\n",iindex,mat_graph->count[iindex]+1,(PetscInt)array[iindex]);
3113da1bb401SStefano Zampini         }
3114da1bb401SStefano Zampini         mat_graph->neighbours_set[iindex][mat_graph->count[iindex]] = -1;
311553cdbc3dSStefano Zampini         mat_graph->count[iindex]+=1;
31160c7d97c5SJed Brown       }
31170c7d97c5SJed Brown     }
311836e030ebSStefano Zampini     ierr = ISRestoreIndices(used_IS,&neumann_nodes);CHKERRQ(ierr);
31190c7d97c5SJed Brown   }
3120da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3121da1bb401SStefano Zampini   /* sort set of sharing subdomains */
3122da1bb401SStefano Zampini   for(i=0;i<mat_graph->nvtxs;i++) { ierr = PetscSortInt(mat_graph->count[i],mat_graph->neighbours_set[i]);CHKERRQ(ierr); }
31233b03a366Sstefano_zampini   /* remove interior nodes and dirichlet boundary nodes from the next search into the graph */
3124da1bb401SStefano Zampini   for(i=0;i<mat_graph->nvtxs;i++){mat_graph->touched[i]=PETSC_FALSE;}
3125da1bb401SStefano Zampini   nodes_touched=0;
312636e030ebSStefano Zampini   ierr = PCBDDCGetDirichletBoundaries(pc,&used_IS);CHKERRQ(ierr);
3127da1bb401SStefano Zampini   ierr = VecSet(pcis->vec2_N,0.0);CHKERRQ(ierr);
3128da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3129da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
3130da1bb401SStefano Zampini   if(used_IS) {
3131da1bb401SStefano Zampini     ierr = ISGetSize(used_IS,&dirichlet_bsize);CHKERRQ(ierr);
3132da1bb401SStefano Zampini     if(dirichlet_bsize && matis->pure_neumann) {
3133da1bb401SStefano Zampini       SETERRQ(PETSC_COMM_SELF,PETSC_ERR_USER,"Dirichlet boundaries are intended to be used with matrices with zeroed rows!\n");
3134da1bb401SStefano Zampini     }
3135da1bb401SStefano Zampini     ierr = ISGetIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
3136da1bb401SStefano Zampini     for(i=0;i<dirichlet_bsize;i++){
3137da1bb401SStefano Zampini       iindex=dirichlet_nodes[i];
3138da1bb401SStefano Zampini       if(mat_graph->count[iindex] && !mat_graph->touched[iindex]) {
3139da1bb401SStefano Zampini         if(array[iindex]>0.0) {
3140da1bb401SStefano Zampini           SETERRQ1(PETSC_COMM_SELF,PETSC_ERR_USER,"BDDC cannot have nodes which are marked as Neumann and Dirichlet at the same time! Wrong node %d\n",iindex);
3141da1bb401SStefano Zampini         }
3142da1bb401SStefano Zampini         mat_graph->touched[iindex]=PETSC_TRUE;
3143da1bb401SStefano Zampini         mat_graph->where[iindex]=0;
3144da1bb401SStefano Zampini         nodes_touched++;
3145da1bb401SStefano Zampini         array2[iindex]=array2[iindex]+1.0;
3146da1bb401SStefano Zampini       }
3147da1bb401SStefano Zampini     }
3148da1bb401SStefano Zampini     ierr = ISRestoreIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
3149da1bb401SStefano Zampini   }
3150da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3151da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
3152da1bb401SStefano Zampini   /* Check consistency of Dirichlet nodes */
3153da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_N,1.0);CHKERRQ(ierr);
3154da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
3155da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3156da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3157da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3158da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec1_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3159da1bb401SStefano Zampini   ierr = VecSet(pcis->vec1_global,0.0);CHKERRQ(ierr);
3160da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec2_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3161da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec2_N,pcis->vec1_global,ADD_VALUES,SCATTER_REVERSE);CHKERRQ(ierr);
3162da1bb401SStefano Zampini   ierr = VecScatterBegin(matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3163da1bb401SStefano Zampini   ierr = VecScatterEnd  (matis->ctx,pcis->vec1_global,pcis->vec2_N,INSERT_VALUES,SCATTER_FORWARD);CHKERRQ(ierr);
3164da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3165da1bb401SStefano Zampini   ierr = VecGetArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
316636e030ebSStefano Zampini   if(used_IS) {
316736e030ebSStefano Zampini     ierr = ISGetSize(used_IS,&dirichlet_bsize);CHKERRQ(ierr);
316836e030ebSStefano Zampini     ierr = ISGetIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
31693b03a366Sstefano_zampini     for(i=0;i<dirichlet_bsize;i++){
3170da1bb401SStefano Zampini       iindex=dirichlet_nodes[i];
3171da1bb401SStefano Zampini       if(array[iindex]>1.0 && array[iindex]!=array2[iindex] ) {
3172da1bb401SStefano Zampini          SETERRQ3(PETSC_COMM_SELF,PETSC_ERR_USER,"Dirichlet nodes provided to BDDC must be consistent among neighbours!\nNode %d: number of sharing subdomains %d != number of subdomains for which it is a neumann node %d\n",iindex,(PetscInt)array[iindex],(PetscInt)array2[iindex]);
3173da1bb401SStefano Zampini       }
31743b03a366Sstefano_zampini     }
317536e030ebSStefano Zampini     ierr = ISRestoreIndices(used_IS,&dirichlet_nodes);CHKERRQ(ierr);
31763b03a366Sstefano_zampini   }
3177da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec1_N,&array);CHKERRQ(ierr);
3178da1bb401SStefano Zampini   ierr = VecRestoreArray(pcis->vec2_N,&array2);CHKERRQ(ierr);
3179da1bb401SStefano Zampini 
31800c7d97c5SJed Brown   for(i=0;i<mat_graph->nvtxs;i++){
31813b03a366Sstefano_zampini     if(!mat_graph->count[i]){  /* interior nodes */
31820c7d97c5SJed Brown       mat_graph->touched[i]=PETSC_TRUE;
31830c7d97c5SJed Brown       mat_graph->where[i]=0;
31840c7d97c5SJed Brown       nodes_touched++;
31850c7d97c5SJed Brown     }
31860c7d97c5SJed Brown   }
31870c7d97c5SJed Brown   mat_graph->ncmps = 0;
3188da1bb401SStefano Zampini   i=0;
31890c7d97c5SJed Brown   while(nodes_touched<mat_graph->nvtxs) {
3190a0ba757dSStefano Zampini     /*  find first untouched node in local ordering */
31910c7d97c5SJed Brown     while(mat_graph->touched[i]) i++;
31920c7d97c5SJed Brown     mat_graph->touched[i]=PETSC_TRUE;
3193a0ba757dSStefano Zampini     mat_graph->where[i]=where_values;
31940c7d97c5SJed Brown     nodes_touched++;
3195a0ba757dSStefano Zampini     /* now find all other nodes having the same set of sharing subdomains */
31960c7d97c5SJed Brown     for(j=i+1;j<mat_graph->nvtxs;j++){
3197a0ba757dSStefano Zampini       /* check for same number of sharing subdomains and dof number */
3198da1bb401SStefano Zampini       if(!mat_graph->touched[j] && mat_graph->count[i]==mat_graph->count[j] && mat_graph->which_dof[i] == mat_graph->which_dof[j] ){
3199a0ba757dSStefano Zampini         /* check for same set of sharing subdomains */
32000c7d97c5SJed Brown         same_set=PETSC_TRUE;
32010c7d97c5SJed Brown         for(k=0;k<mat_graph->count[j];k++){
3202da1bb401SStefano Zampini           if(mat_graph->neighbours_set[i][k]!=mat_graph->neighbours_set[j][k]) {
32030c7d97c5SJed Brown             same_set=PETSC_FALSE;
32040c7d97c5SJed Brown           }
32050c7d97c5SJed Brown         }
3206a0ba757dSStefano Zampini         /* I found a friend of mine */
32070c7d97c5SJed Brown         if(same_set) {
3208a0ba757dSStefano Zampini           mat_graph->where[j]=where_values;
32090c7d97c5SJed Brown           mat_graph->touched[j]=PETSC_TRUE;
32100c7d97c5SJed Brown           nodes_touched++;
32110c7d97c5SJed Brown         }
32120c7d97c5SJed Brown       }
32130c7d97c5SJed Brown     }
3214a0ba757dSStefano Zampini     where_values++;
32150c7d97c5SJed Brown   }
3216a0ba757dSStefano Zampini   where_values--; if(where_values<0) where_values=0;
3217a0ba757dSStefano Zampini   ierr = PetscMalloc(where_values*sizeof(PetscMPIInt),&mat_graph->where_ncmps);CHKERRQ(ierr);
3218a0ba757dSStefano Zampini   /* Find connected components defined on the shared interface */
3219a0ba757dSStefano Zampini   if(where_values) {
3220a0ba757dSStefano Zampini     ierr = PCBDDCFindConnectedComponents(mat_graph, where_values);
32213b03a366Sstefano_zampini     /* For consistency among neughbouring procs, I need to sort (by global ordering) each connected component */
3222a0ba757dSStefano Zampini     for(i=0;i<mat_graph->ncmps;i++) {
3223a0ba757dSStefano Zampini       ierr = ISLocalToGlobalMappingApply(matis->mapping,mat_graph->cptr[i+1]-mat_graph->cptr[i],&mat_graph->queue[mat_graph->cptr[i]],&queue_in_global_numbering[mat_graph->cptr[i]]);CHKERRQ(ierr);
3224a0ba757dSStefano Zampini       ierr = PetscSortIntWithArray(mat_graph->cptr[i+1]-mat_graph->cptr[i],&queue_in_global_numbering[mat_graph->cptr[i]],&mat_graph->queue[mat_graph->cptr[i]]);CHKERRQ(ierr);
3225a0ba757dSStefano Zampini     }
3226a0ba757dSStefano Zampini   }
3227a0ba757dSStefano Zampini   /* check consistency of connected components among neighbouring subdomains -> adapt them in case it is needed */
3228a0ba757dSStefano Zampini   for(i=0;i<where_values;i++) {
32293b03a366Sstefano_zampini     /* We are not sure that two connected components will be the same among subdomains sharing a subset of local interface */
32303b03a366Sstefano_zampini     if(mat_graph->where_ncmps[i]>1) {
3231a0ba757dSStefano Zampini       adapt_interface=1;
3232a0ba757dSStefano Zampini       break;
3233a0ba757dSStefano Zampini     }
3234a0ba757dSStefano Zampini   }
3235a0ba757dSStefano Zampini   ierr = MPI_Allreduce(&adapt_interface,&adapt_interface_reduced,1,MPIU_INT,MPI_LOR,interface_comm);CHKERRQ(ierr);
3236da1bb401SStefano Zampini   if(pcbddc->dbg_flag && adapt_interface_reduced) {
3237da1bb401SStefano Zampini     ierr = PetscViewerASCIIPrintf(viewer,"Interface adapted\n");CHKERRQ(ierr);
3238da1bb401SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
3239da1bb401SStefano Zampini   }
3240a0ba757dSStefano Zampini   if(where_values && adapt_interface_reduced) {
32410c7d97c5SJed Brown 
3242a0ba757dSStefano Zampini     PetscInt sum_requests=0,my_rank;
3243a0ba757dSStefano Zampini     PetscInt buffer_size,start_of_recv,size_of_recv,start_of_send;
3244a0ba757dSStefano Zampini     PetscInt temp_buffer_size,ins_val,global_where_counter;
3245a0ba757dSStefano Zampini     PetscInt *cum_recv_counts;
3246a0ba757dSStefano Zampini     PetscInt *where_to_nodes_indices;
3247a0ba757dSStefano Zampini     PetscInt *petsc_buffer;
3248a0ba757dSStefano Zampini     PetscMPIInt *recv_buffer;
3249a0ba757dSStefano Zampini     PetscMPIInt *recv_buffer_where;
3250a0ba757dSStefano Zampini     PetscMPIInt *send_buffer;
3251a0ba757dSStefano Zampini     PetscMPIInt size_of_send;
3252a0ba757dSStefano Zampini     PetscInt *sizes_of_sends;
3253a0ba757dSStefano Zampini     MPI_Request *send_requests;
3254a0ba757dSStefano Zampini     MPI_Request *recv_requests;
3255a0ba757dSStefano Zampini     PetscInt *where_cc_adapt;
3256a0ba757dSStefano Zampini     PetscInt **temp_buffer;
3257a0ba757dSStefano Zampini     PetscInt *nodes_to_temp_buffer_indices;
3258a0ba757dSStefano Zampini     PetscInt *add_to_where;
3259a0ba757dSStefano Zampini 
3260a0ba757dSStefano Zampini     ierr = MPI_Comm_rank(interface_comm,&my_rank);CHKERRQ(ierr);
3261a0ba757dSStefano Zampini     ierr = PetscMalloc((where_values+1)*sizeof(PetscInt),&cum_recv_counts);CHKERRQ(ierr);
3262a0ba757dSStefano Zampini     ierr = PetscMemzero(cum_recv_counts,(where_values+1)*sizeof(PetscInt));CHKERRQ(ierr);
3263a0ba757dSStefano Zampini     ierr = PetscMalloc(where_values*sizeof(PetscInt),&where_to_nodes_indices);CHKERRQ(ierr);
3264a0ba757dSStefano Zampini     /* first count how many neighbours per connected component I will receive from */
3265a0ba757dSStefano Zampini     cum_recv_counts[0]=0;
3266a0ba757dSStefano Zampini     for(i=1;i<where_values+1;i++){
3267a0ba757dSStefano Zampini       j=0;
3268a0ba757dSStefano Zampini       while(mat_graph->where[j] != i) j++;
3269a0ba757dSStefano Zampini       where_to_nodes_indices[i-1]=j;
3270da1bb401SStefano Zampini       if(mat_graph->neighbours_set[j][0]!=-1) { cum_recv_counts[i]=cum_recv_counts[i-1]+mat_graph->count[j]; } /* We don't want sends/recvs_to/from_self -> here I don't count myself  */
32713b03a366Sstefano_zampini       else { cum_recv_counts[i]=cum_recv_counts[i-1]+mat_graph->count[j]-1; }
3272a0ba757dSStefano Zampini     }
3273a0ba757dSStefano Zampini     buffer_size=2*cum_recv_counts[where_values]+mat_graph->nvtxs;
3274a0ba757dSStefano Zampini     ierr = PetscMalloc(2*cum_recv_counts[where_values]*sizeof(PetscMPIInt),&recv_buffer_where);CHKERRQ(ierr);
3275a0ba757dSStefano Zampini     ierr = PetscMalloc(buffer_size*sizeof(PetscMPIInt),&send_buffer);CHKERRQ(ierr);
3276a0ba757dSStefano Zampini     ierr = PetscMalloc(cum_recv_counts[where_values]*sizeof(MPI_Request),&send_requests);CHKERRQ(ierr);
3277a0ba757dSStefano Zampini     ierr = PetscMalloc(cum_recv_counts[where_values]*sizeof(MPI_Request),&recv_requests);CHKERRQ(ierr);
3278a0ba757dSStefano Zampini     for(i=0;i<cum_recv_counts[where_values];i++) {
3279a0ba757dSStefano Zampini       send_requests[i]=MPI_REQUEST_NULL;
3280a0ba757dSStefano Zampini       recv_requests[i]=MPI_REQUEST_NULL;
3281a0ba757dSStefano Zampini     }
3282a0ba757dSStefano Zampini     /* exchange with my neighbours the number of my connected components on the shared interface */
3283a0ba757dSStefano Zampini     for(i=0;i<where_values;i++){
3284a0ba757dSStefano Zampini       j=where_to_nodes_indices[i];
3285da1bb401SStefano Zampini       k = (mat_graph->neighbours_set[j][0] == -1 ?  1 : 0);
3286a0ba757dSStefano Zampini       for(;k<mat_graph->count[j];k++){
3287da1bb401SStefano Zampini         ierr = MPI_Isend(&mat_graph->where_ncmps[i],1,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr);
3288da1bb401SStefano Zampini         ierr = MPI_Irecv(&recv_buffer_where[sum_requests],1,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr);
3289a0ba757dSStefano Zampini         sum_requests++;
3290a0ba757dSStefano Zampini       }
3291a0ba757dSStefano Zampini     }
3292a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
3293a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
3294a0ba757dSStefano Zampini     /* determine the connected component I need to adapt */
3295a0ba757dSStefano Zampini     ierr = PetscMalloc(where_values*sizeof(PetscInt),&where_cc_adapt);CHKERRQ(ierr);
3296a0ba757dSStefano Zampini     ierr = PetscMemzero(where_cc_adapt,where_values*sizeof(PetscInt));CHKERRQ(ierr);
3297a0ba757dSStefano Zampini     for(i=0;i<where_values;i++){
3298a0ba757dSStefano Zampini       for(j=cum_recv_counts[i];j<cum_recv_counts[i+1];j++){
32993b03a366Sstefano_zampini         /* The first condition is natural (i.e someone has a different number of cc than me), the second one is just to be safe */
33003b03a366Sstefano_zampini         if( mat_graph->where_ncmps[i]!=recv_buffer_where[j] || mat_graph->where_ncmps[i] > 1 ) {
3301a0ba757dSStefano Zampini           where_cc_adapt[i]=PETSC_TRUE;
3302a0ba757dSStefano Zampini           break;
3303a0ba757dSStefano Zampini         }
3304a0ba757dSStefano Zampini       }
3305a0ba757dSStefano Zampini     }
3306a0ba757dSStefano Zampini     /* now get from neighbours their ccs (in global numbering) and adapt them (in case it is needed) */
3307a0ba757dSStefano Zampini     /* first determine how much data to send (size of each queue plus the global indices) and communicate it to neighbours */
3308a0ba757dSStefano Zampini     ierr = PetscMalloc(where_values*sizeof(PetscInt),&sizes_of_sends);CHKERRQ(ierr);
3309a0ba757dSStefano Zampini     ierr = PetscMemzero(sizes_of_sends,where_values*sizeof(PetscInt));CHKERRQ(ierr);
3310a0ba757dSStefano Zampini     sum_requests=0;
3311a0ba757dSStefano Zampini     start_of_send=0;
3312a0ba757dSStefano Zampini     start_of_recv=cum_recv_counts[where_values];
3313a0ba757dSStefano Zampini     for(i=0;i<where_values;i++) {
3314a0ba757dSStefano Zampini       if(where_cc_adapt[i]) {
3315a0ba757dSStefano Zampini         size_of_send=0;
3316a0ba757dSStefano Zampini         for(j=i;j<mat_graph->ncmps;j++) {
3317a0ba757dSStefano Zampini           if(mat_graph->where[mat_graph->queue[mat_graph->cptr[j]]] == i+1) { /* WARNING -> where values goes from 1 to where_values included */
3318a0ba757dSStefano Zampini             send_buffer[start_of_send+size_of_send]=mat_graph->cptr[j+1]-mat_graph->cptr[j];
3319a0ba757dSStefano Zampini             size_of_send+=1;
3320a0ba757dSStefano Zampini             for(k=0;k<mat_graph->cptr[j+1]-mat_graph->cptr[j];k++) {
3321a0ba757dSStefano Zampini               send_buffer[start_of_send+size_of_send+k]=queue_in_global_numbering[mat_graph->cptr[j]+k];
3322a0ba757dSStefano Zampini             }
3323a0ba757dSStefano Zampini             size_of_send=size_of_send+mat_graph->cptr[j+1]-mat_graph->cptr[j];
3324a0ba757dSStefano Zampini           }
3325a0ba757dSStefano Zampini         }
3326a0ba757dSStefano Zampini         j = where_to_nodes_indices[i];
3327da1bb401SStefano Zampini         k = (mat_graph->neighbours_set[j][0] == -1 ?  1 : 0);
332811d8f4c2SStefano Zampini         sizes_of_sends[i]=size_of_send;
3329a0ba757dSStefano Zampini         for(;k<mat_graph->count[j];k++){
333011d8f4c2SStefano Zampini           ierr = MPI_Isend(&sizes_of_sends[i],1,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr);
3331da1bb401SStefano Zampini           ierr = MPI_Irecv(&recv_buffer_where[sum_requests+start_of_recv],1,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr);
3332a0ba757dSStefano Zampini           sum_requests++;
3333a0ba757dSStefano Zampini         }
3334a0ba757dSStefano Zampini         start_of_send+=size_of_send;
3335a0ba757dSStefano Zampini       }
3336a0ba757dSStefano Zampini     }
3337a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
3338a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
3339a0ba757dSStefano Zampini     buffer_size=0;
3340a0ba757dSStefano Zampini     for(k=0;k<sum_requests;k++) { buffer_size+=recv_buffer_where[start_of_recv+k]; }
3341a0ba757dSStefano Zampini     ierr = PetscMalloc(buffer_size*sizeof(PetscMPIInt),&recv_buffer);CHKERRQ(ierr);
3342a0ba757dSStefano Zampini     /* now exchange the data */
3343a0ba757dSStefano Zampini     start_of_recv=0;
3344a0ba757dSStefano Zampini     start_of_send=0;
3345a0ba757dSStefano Zampini     sum_requests=0;
3346a0ba757dSStefano Zampini     for(i=0;i<where_values;i++) {
3347a0ba757dSStefano Zampini       if(where_cc_adapt[i]) {
3348a0ba757dSStefano Zampini         size_of_send = sizes_of_sends[i];
3349a0ba757dSStefano Zampini         j = where_to_nodes_indices[i];
3350da1bb401SStefano Zampini         k = (mat_graph->neighbours_set[j][0] == -1 ?  1 : 0);
3351a0ba757dSStefano Zampini         for(;k<mat_graph->count[j];k++){
3352da1bb401SStefano Zampini           ierr = MPI_Isend(&send_buffer[start_of_send],size_of_send,MPIU_INT,mat_graph->neighbours_set[j][k],(my_rank+1)*mat_graph->count[j],interface_comm,&send_requests[sum_requests]);CHKERRQ(ierr);
3353a0ba757dSStefano Zampini           size_of_recv=recv_buffer_where[cum_recv_counts[where_values]+sum_requests];
3354da1bb401SStefano Zampini           ierr = MPI_Irecv(&recv_buffer[start_of_recv],size_of_recv,MPIU_INT,mat_graph->neighbours_set[j][k],(mat_graph->neighbours_set[j][k]+1)*mat_graph->count[j],interface_comm,&recv_requests[sum_requests]);CHKERRQ(ierr);
3355a0ba757dSStefano Zampini           start_of_recv+=size_of_recv;
3356a0ba757dSStefano Zampini           sum_requests++;
3357a0ba757dSStefano Zampini         }
3358a0ba757dSStefano Zampini         start_of_send+=size_of_send;
3359a0ba757dSStefano Zampini       }
3360a0ba757dSStefano Zampini     }
3361a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,recv_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
3362a0ba757dSStefano Zampini     ierr = MPI_Waitall(sum_requests,send_requests,MPI_STATUSES_IGNORE);CHKERRQ(ierr);
3363a0ba757dSStefano Zampini     ierr = PetscMalloc(buffer_size*sizeof(PetscInt),&petsc_buffer);CHKERRQ(ierr);
3364a0ba757dSStefano Zampini     for(k=0;k<start_of_recv;k++) { petsc_buffer[k]=(PetscInt)recv_buffer[k]; }
3365a0ba757dSStefano Zampini     for(j=0;j<buffer_size;) {
3366a0ba757dSStefano Zampini        ierr = ISGlobalToLocalMappingApply(matis->mapping,IS_GTOLM_MASK,petsc_buffer[j],&petsc_buffer[j+1],&petsc_buffer[j],&petsc_buffer[j+1]);CHKERRQ(ierr);
3367a0ba757dSStefano Zampini        k=petsc_buffer[j]+1;
3368a0ba757dSStefano Zampini        j+=k;
3369a0ba757dSStefano Zampini     }
3370a0ba757dSStefano Zampini     sum_requests=cum_recv_counts[where_values];
3371a0ba757dSStefano Zampini     start_of_recv=0;
3372a0ba757dSStefano Zampini     ierr = PetscMalloc(mat_graph->nvtxs*sizeof(PetscInt),&nodes_to_temp_buffer_indices);CHKERRQ(ierr);
3373a0ba757dSStefano Zampini     global_where_counter=0;
3374a0ba757dSStefano Zampini     for(i=0;i<where_values;i++){
3375a0ba757dSStefano Zampini       if(where_cc_adapt[i]){
3376a0ba757dSStefano Zampini         temp_buffer_size=0;
3377a0ba757dSStefano Zampini         /* find nodes on the shared interface we need to adapt */
3378a0ba757dSStefano Zampini         for(j=0;j<mat_graph->nvtxs;j++){
3379a0ba757dSStefano Zampini           if(mat_graph->where[j]==i+1) {
3380a0ba757dSStefano Zampini             nodes_to_temp_buffer_indices[j]=temp_buffer_size;
3381a0ba757dSStefano Zampini             temp_buffer_size++;
3382a0ba757dSStefano Zampini           } else {
3383a0ba757dSStefano Zampini             nodes_to_temp_buffer_indices[j]=-1;
3384a0ba757dSStefano Zampini           }
3385a0ba757dSStefano Zampini         }
3386a0ba757dSStefano Zampini         /* allocate some temporary space */
3387a0ba757dSStefano Zampini         ierr = PetscMalloc(temp_buffer_size*sizeof(PetscInt*),&temp_buffer);CHKERRQ(ierr);
3388a0ba757dSStefano Zampini         ierr = PetscMalloc(temp_buffer_size*(cum_recv_counts[i+1]-cum_recv_counts[i])*sizeof(PetscInt),&temp_buffer[0]);CHKERRQ(ierr);
3389a0ba757dSStefano Zampini         ierr = PetscMemzero(temp_buffer[0],temp_buffer_size*(cum_recv_counts[i+1]-cum_recv_counts[i])*sizeof(PetscInt));CHKERRQ(ierr);
3390a0ba757dSStefano Zampini         for(j=1;j<temp_buffer_size;j++){
3391a0ba757dSStefano Zampini           temp_buffer[j]=temp_buffer[j-1]+cum_recv_counts[i+1]-cum_recv_counts[i];
3392a0ba757dSStefano Zampini         }
3393a0ba757dSStefano Zampini         /* analyze contributions from neighbouring subdomains for i-th conn comp
3394a0ba757dSStefano Zampini            temp buffer structure:
3395a0ba757dSStefano Zampini            supposing part of the interface has dimension 5 (global nodes 0,1,2,3,4)
3396a0ba757dSStefano Zampini            3 neighs procs with structured connected components:
3397a0ba757dSStefano Zampini              neigh 0: [0 1 4], [2 3];  (2 connected components)
3398a0ba757dSStefano Zampini              neigh 1: [0 1], [2 3 4];  (2 connected components)
3399a0ba757dSStefano Zampini              neigh 2: [0 4], [1], [2 3]; (3 connected components)
3400a0ba757dSStefano Zampini            tempbuffer (row-oriented) should be filled as:
3401a0ba757dSStefano Zampini              [ 0, 0, 0;
3402a0ba757dSStefano Zampini                0, 0, 1;
3403a0ba757dSStefano Zampini                1, 1, 2;
3404a0ba757dSStefano Zampini                1, 1, 2;
3405a0ba757dSStefano Zampini                0, 1, 0; ];
3406a0ba757dSStefano Zampini            This way we can simply recover the resulting structure account for possible intersections of ccs among neighs.
3407a0ba757dSStefano Zampini            The mat_graph->where array will be modified to reproduce the following 4 connected components [0], [1], [2 3], [4];
3408a0ba757dSStefano Zampini                                                                                                                                    */
3409a0ba757dSStefano Zampini         for(j=0;j<cum_recv_counts[i+1]-cum_recv_counts[i];j++) {
3410a0ba757dSStefano Zampini           ins_val=0;
3411a0ba757dSStefano Zampini           size_of_recv=recv_buffer_where[sum_requests];  /* total size of recv from neighs */
3412a0ba757dSStefano Zampini           for(buffer_size=0;buffer_size<size_of_recv;) {  /* loop until all data from neighs has been taken into account */
3413a0ba757dSStefano Zampini             for(k=1;k<petsc_buffer[buffer_size+start_of_recv]+1;k++) { /* filling properly temp_buffer using data from a single recv */
3414a0ba757dSStefano Zampini               temp_buffer[ nodes_to_temp_buffer_indices[ petsc_buffer[ start_of_recv+buffer_size+k ] ] ][j]=ins_val;
3415a0ba757dSStefano Zampini             }
3416a0ba757dSStefano Zampini             buffer_size+=k;
3417a0ba757dSStefano Zampini             ins_val++;
3418a0ba757dSStefano Zampini           }
3419a0ba757dSStefano Zampini           start_of_recv+=size_of_recv;
3420a0ba757dSStefano Zampini           sum_requests++;
3421a0ba757dSStefano Zampini         }
3422a0ba757dSStefano Zampini         ierr = PetscMalloc(temp_buffer_size*sizeof(PetscInt),&add_to_where);CHKERRQ(ierr);
3423a0ba757dSStefano Zampini         ierr = PetscMemzero(add_to_where,temp_buffer_size*sizeof(PetscInt));CHKERRQ(ierr);
3424a0ba757dSStefano Zampini         for(j=0;j<temp_buffer_size;j++){
3425a0ba757dSStefano Zampini           if(!add_to_where[j]){ /* found a new cc  */
3426a0ba757dSStefano Zampini             global_where_counter++;
3427a0ba757dSStefano Zampini             add_to_where[j]=global_where_counter;
3428a0ba757dSStefano Zampini             for(k=j+1;k<temp_buffer_size;k++){ /* check for other nodes in new cc */
3429a0ba757dSStefano Zampini               same_set=PETSC_TRUE;
3430a0ba757dSStefano Zampini               for(s=0;s<cum_recv_counts[i+1]-cum_recv_counts[i];s++){
3431a0ba757dSStefano Zampini                 if(temp_buffer[j][s]!=temp_buffer[k][s]) {
3432a0ba757dSStefano Zampini                   same_set=PETSC_FALSE;
3433a0ba757dSStefano Zampini                   break;
3434a0ba757dSStefano Zampini                 }
3435a0ba757dSStefano Zampini               }
3436a0ba757dSStefano Zampini               if(same_set) add_to_where[k]=global_where_counter;
3437a0ba757dSStefano Zampini             }
3438a0ba757dSStefano Zampini           }
3439a0ba757dSStefano Zampini         }
3440a0ba757dSStefano Zampini         /* insert new data in where array */
3441a0ba757dSStefano Zampini         temp_buffer_size=0;
3442a0ba757dSStefano Zampini         for(j=0;j<mat_graph->nvtxs;j++){
3443a0ba757dSStefano Zampini           if(mat_graph->where[j]==i+1) {
3444a0ba757dSStefano Zampini             mat_graph->where[j]=where_values+add_to_where[temp_buffer_size];
3445a0ba757dSStefano Zampini             temp_buffer_size++;
3446a0ba757dSStefano Zampini           }
3447a0ba757dSStefano Zampini         }
3448a0ba757dSStefano Zampini         ierr = PetscFree(temp_buffer[0]);CHKERRQ(ierr);
3449a0ba757dSStefano Zampini         ierr = PetscFree(temp_buffer);CHKERRQ(ierr);
3450a0ba757dSStefano Zampini         ierr = PetscFree(add_to_where);CHKERRQ(ierr);
3451a0ba757dSStefano Zampini       }
3452a0ba757dSStefano Zampini     }
3453a0ba757dSStefano Zampini     ierr = PetscFree(nodes_to_temp_buffer_indices);CHKERRQ(ierr);
3454a0ba757dSStefano Zampini     ierr = PetscFree(sizes_of_sends);CHKERRQ(ierr);
3455a0ba757dSStefano Zampini     ierr = PetscFree(send_requests);CHKERRQ(ierr);
3456a0ba757dSStefano Zampini     ierr = PetscFree(recv_requests);CHKERRQ(ierr);
3457a0ba757dSStefano Zampini     ierr = PetscFree(petsc_buffer);CHKERRQ(ierr);
3458a0ba757dSStefano Zampini     ierr = PetscFree(recv_buffer);CHKERRQ(ierr);
3459a0ba757dSStefano Zampini     ierr = PetscFree(recv_buffer_where);CHKERRQ(ierr);
3460a0ba757dSStefano Zampini     ierr = PetscFree(send_buffer);CHKERRQ(ierr);
3461a0ba757dSStefano Zampini     ierr = PetscFree(cum_recv_counts);CHKERRQ(ierr);
3462a0ba757dSStefano Zampini     ierr = PetscFree(where_to_nodes_indices);CHKERRQ(ierr);
346323d4d1a5SStefano Zampini     ierr = PetscFree(where_cc_adapt);CHKERRQ(ierr);
3464a0ba757dSStefano Zampini     /* We are ready to evaluate consistent connected components on each part of the shared interface */
3465a0ba757dSStefano Zampini     if(global_where_counter) {
3466a0ba757dSStefano Zampini       for(i=0;i<mat_graph->nvtxs;i++){ mat_graph->touched[i]=PETSC_FALSE; }
3467a0ba757dSStefano Zampini       global_where_counter=0;
3468a0ba757dSStefano Zampini       for(i=0;i<mat_graph->nvtxs;i++){
3469a0ba757dSStefano Zampini         if(mat_graph->where[i] && !mat_graph->touched[i]) {
3470a0ba757dSStefano Zampini           global_where_counter++;
3471a0ba757dSStefano Zampini           for(j=i+1;j<mat_graph->nvtxs;j++){
3472a0ba757dSStefano Zampini             if(!mat_graph->touched[j] && mat_graph->where[j]==mat_graph->where[i]) {
3473a0ba757dSStefano Zampini               mat_graph->where[j]=global_where_counter;
3474a0ba757dSStefano Zampini               mat_graph->touched[j]=PETSC_TRUE;
3475a0ba757dSStefano Zampini             }
3476a0ba757dSStefano Zampini           }
3477a0ba757dSStefano Zampini           mat_graph->where[i]=global_where_counter;
3478a0ba757dSStefano Zampini           mat_graph->touched[i]=PETSC_TRUE;
3479a0ba757dSStefano Zampini         }
3480a0ba757dSStefano Zampini       }
3481a0ba757dSStefano Zampini       where_values=global_where_counter;
3482a0ba757dSStefano Zampini     }
3483a0ba757dSStefano Zampini     if(global_where_counter) {
3484a0ba757dSStefano Zampini       ierr = PetscMemzero(mat_graph->cptr,(mat_graph->nvtxs+1)*sizeof(PetscInt));CHKERRQ(ierr);
3485a0ba757dSStefano Zampini       ierr = PetscMemzero(mat_graph->queue,mat_graph->nvtxs*sizeof(PetscInt));CHKERRQ(ierr);
3486a0ba757dSStefano Zampini       ierr = PetscFree(mat_graph->where_ncmps);CHKERRQ(ierr);
3487a0ba757dSStefano Zampini       ierr = PetscMalloc(where_values*sizeof(PetscMPIInt),&mat_graph->where_ncmps);CHKERRQ(ierr);
3488a0ba757dSStefano Zampini       ierr = PCBDDCFindConnectedComponents(mat_graph, where_values);
3489a0ba757dSStefano Zampini       for(i=0;i<mat_graph->ncmps;i++) {
3490a0ba757dSStefano Zampini         ierr = ISLocalToGlobalMappingApply(matis->mapping,mat_graph->cptr[i+1]-mat_graph->cptr[i],&mat_graph->queue[mat_graph->cptr[i]],&queue_in_global_numbering[mat_graph->cptr[i]]);CHKERRQ(ierr);
3491a0ba757dSStefano Zampini         ierr = PetscSortIntWithArray(mat_graph->cptr[i+1]-mat_graph->cptr[i],&queue_in_global_numbering[mat_graph->cptr[i]],&mat_graph->queue[mat_graph->cptr[i]]);CHKERRQ(ierr);
3492a0ba757dSStefano Zampini       }
3493a0ba757dSStefano Zampini     }
34943b03a366Sstefano_zampini   } /* Finished adapting interface */
34950c7d97c5SJed Brown   PetscInt nfc=0;
34960c7d97c5SJed Brown   PetscInt nec=0;
34970c7d97c5SJed Brown   PetscInt nvc=0;
34983b03a366Sstefano_zampini   PetscBool twodim_flag=PETSC_FALSE;
34990c7d97c5SJed Brown   for (i=0; i<mat_graph->ncmps; i++) {
35003b03a366Sstefano_zampini     if( mat_graph->cptr[i+1]-mat_graph->cptr[i] > vertex_size ){
3501534831adSStefano Zampini       if(mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]==1){ /* 1 neigh Neumann fake included */
35020c7d97c5SJed Brown         nfc++;
35033b03a366Sstefano_zampini       } else { /* note that nec will be zero in 2d */
35043b03a366Sstefano_zampini         nec++;
35053b03a366Sstefano_zampini       }
35060c7d97c5SJed Brown     } else {
35073b03a366Sstefano_zampini       nvc+=mat_graph->cptr[i+1]-mat_graph->cptr[i];
35083b03a366Sstefano_zampini     }
35093b03a366Sstefano_zampini   }
35103b03a366Sstefano_zampini 
35113b03a366Sstefano_zampini   if(!nec) { /* we are in a 2d case -> no faces, only edges */
35123b03a366Sstefano_zampini     nec = nfc;
35133b03a366Sstefano_zampini     nfc = 0;
35143b03a366Sstefano_zampini     twodim_flag = PETSC_TRUE;
35153b03a366Sstefano_zampini   }
35163972b0daSStefano Zampini   /* allocate IS arrays for faces, edges. Vertices need a single index set. */
35173972b0daSStefano Zampini   k=0;
35183972b0daSStefano Zampini   for (i=0; i<mat_graph->ncmps; i++) {
35193972b0daSStefano Zampini     j=mat_graph->cptr[i+1]-mat_graph->cptr[i];
35203972b0daSStefano Zampini     if( j > k) {
35213972b0daSStefano Zampini       k=j;
35223972b0daSStefano Zampini     }
35233972b0daSStefano Zampini   }
35243972b0daSStefano Zampini   ierr = PetscMalloc(k*sizeof(PetscInt),&auxis);CHKERRQ(ierr);
35253972b0daSStefano Zampini 
35263b03a366Sstefano_zampini   if(!pcbddc->vertices_flag && !pcbddc->edges_flag) {
35273b03a366Sstefano_zampini     ierr = PetscMalloc(nfc*sizeof(IS),&pcbddc->ISForFaces);CHKERRQ(ierr);
35283b03a366Sstefano_zampini     use_faces=PETSC_TRUE;
35293b03a366Sstefano_zampini   }
35303b03a366Sstefano_zampini   if(!pcbddc->vertices_flag && !pcbddc->faces_flag) {
35313b03a366Sstefano_zampini     ierr = PetscMalloc(nec*sizeof(IS),&pcbddc->ISForEdges);CHKERRQ(ierr);
35323b03a366Sstefano_zampini     use_edges=PETSC_TRUE;
35333b03a366Sstefano_zampini   }
35343b03a366Sstefano_zampini   nfc=0;
35353b03a366Sstefano_zampini   nec=0;
35363b03a366Sstefano_zampini   for (i=0; i<mat_graph->ncmps; i++) {
35373b03a366Sstefano_zampini     if( mat_graph->cptr[i+1]-mat_graph->cptr[i] > vertex_size ){
35383b03a366Sstefano_zampini       for(j=0;j<mat_graph->cptr[i+1]-mat_graph->cptr[i];j++) {
35393972b0daSStefano Zampini         auxis[j]=mat_graph->queue[mat_graph->cptr[i]+j];
35403b03a366Sstefano_zampini       }
35413b03a366Sstefano_zampini       if(mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]==1){
35423b03a366Sstefano_zampini         if(twodim_flag) {
35433b03a366Sstefano_zampini           if(use_edges) {
35443972b0daSStefano Zampini             ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForEdges[nec]);CHKERRQ(ierr);
35453b03a366Sstefano_zampini             nec++;
35463b03a366Sstefano_zampini           }
35473b03a366Sstefano_zampini         } else {
35483b03a366Sstefano_zampini           if(use_faces) {
35493972b0daSStefano Zampini             ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForFaces[nfc]);CHKERRQ(ierr);
35503b03a366Sstefano_zampini             nfc++;
35513b03a366Sstefano_zampini           }
35523b03a366Sstefano_zampini         }
35533b03a366Sstefano_zampini       } else {
35543b03a366Sstefano_zampini         if(use_edges) {
35553972b0daSStefano Zampini           ierr = ISCreateGeneral(PETSC_COMM_SELF,j,auxis,PETSC_COPY_VALUES,&pcbddc->ISForEdges[nec]);CHKERRQ(ierr);
35560c7d97c5SJed Brown           nec++;
35570c7d97c5SJed Brown         }
35580c7d97c5SJed Brown       }
35590c7d97c5SJed Brown     }
35603b03a366Sstefano_zampini   }
35613b03a366Sstefano_zampini   pcbddc->n_ISForFaces=nfc;
35623b03a366Sstefano_zampini   pcbddc->n_ISForEdges=nec;
35633b03a366Sstefano_zampini   nvc=0;
35640c7d97c5SJed Brown   if( !pcbddc->constraints_flag ) {
35653b03a366Sstefano_zampini     for (i=0; i<mat_graph->ncmps; i++) {
35663b03a366Sstefano_zampini       if( mat_graph->cptr[i+1]-mat_graph->cptr[i] <= vertex_size ){
35673b03a366Sstefano_zampini         for( j=mat_graph->cptr[i];j<mat_graph->cptr[i+1];j++) {
35683972b0daSStefano Zampini           auxis[nvc]=mat_graph->queue[j];
35690c7d97c5SJed Brown           nvc++;
35700c7d97c5SJed Brown         }
35710c7d97c5SJed Brown       }
35720c7d97c5SJed Brown     }
35730c7d97c5SJed Brown   }
3574a0ba757dSStefano Zampini   /* sort vertex set (by local ordering) */
35753972b0daSStefano Zampini   ierr = PetscSortInt(nvc,auxis);CHKERRQ(ierr);
35763972b0daSStefano Zampini   ierr = ISCreateGeneral(PETSC_COMM_SELF,nvc,auxis,PETSC_COPY_VALUES,&pcbddc->ISForVertices);CHKERRQ(ierr);
35770c7d97c5SJed Brown 
3578e269702eSStefano Zampini   if(pcbddc->dbg_flag) {
3579e269702eSStefano Zampini 
3580d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr);
3581d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Details from PCBDDCManageLocalBoundaries for subdomain %04d\n",PetscGlobalRank);CHKERRQ(ierr);
3582d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr);
3583a0ba757dSStefano Zampini /*    ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Graph (adjacency structure) of local Neumann mat\n");CHKERRQ(ierr);
3584a0ba757dSStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"--------------------------------------------------------------\n");CHKERRQ(ierr);
3585e269702eSStefano Zampini     for(i=0;i<mat_graph->nvtxs;i++) {
3586a0ba757dSStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Nodes connected to node number %d are %d\n",i,mat_graph->xadj[i+1]-mat_graph->xadj[i]);CHKERRQ(ierr);
3587e269702eSStefano Zampini       for(j=mat_graph->xadj[i];j<mat_graph->xadj[i+1];j++){
3588a0ba757dSStefano Zampini         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d ",mat_graph->adjncy[j]);CHKERRQ(ierr);
3589e269702eSStefano Zampini       }
3590a0ba757dSStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n--------------------------------------------------------------\n");CHKERRQ(ierr);
3591da1bb401SStefano Zampini     }*/
3592d49ef151SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Matrix graph has %d connected components", mat_graph->ncmps);CHKERRQ(ierr);
35930c7d97c5SJed Brown     for(i=0;i<mat_graph->ncmps;i++) {
35943b03a366Sstefano_zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\nDetails for connected component number %02d: size %04d, count %01d. Nodes follow.\n",
35953b03a366Sstefano_zampini              i,mat_graph->cptr[i+1]-mat_graph->cptr[i],mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]);CHKERRQ(ierr);
3596da1bb401SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"subdomains: ");
3597da1bb401SStefano Zampini       for (j=0;j<mat_graph->count[mat_graph->queue[mat_graph->cptr[i]]]; j++) {
3598da1bb401SStefano Zampini         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d ",mat_graph->neighbours_set[mat_graph->queue[mat_graph->cptr[i]]][j]);
3599da1bb401SStefano Zampini       }
3600da1bb401SStefano Zampini       ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n");
36010c7d97c5SJed Brown       for (j=mat_graph->cptr[i]; j<mat_graph->cptr[i+1]; j++){
3602da1bb401SStefano Zampini         /* ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d (%d), ",queue_in_global_numbering[j],mat_graph->queue[j]);CHKERRQ(ierr); */
3603da1bb401SStefano Zampini         ierr = PetscViewerASCIISynchronizedPrintf(viewer,"%d, ",mat_graph->queue[j]);CHKERRQ(ierr);
36040c7d97c5SJed Brown       }
36050c7d97c5SJed Brown     }
3606da1bb401SStefano Zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"\n--------------------------------------------------------------\n");CHKERRQ(ierr);
36073b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local vertices\n",PetscGlobalRank,nvc);CHKERRQ(ierr);
36083b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local faces\n",PetscGlobalRank,nfc);CHKERRQ(ierr);
36093b03a366Sstefano_zampini     ierr = PetscViewerASCIISynchronizedPrintf(viewer,"Subdomain %04d detected %02d local edges\n",PetscGlobalRank,nec);CHKERRQ(ierr);
3610d49ef151SStefano Zampini     ierr = PetscViewerFlush(viewer);CHKERRQ(ierr);
36110c7d97c5SJed Brown   }
36120c7d97c5SJed Brown 
36133972b0daSStefano Zampini   ierr = PetscFree(queue_in_global_numbering);CHKERRQ(ierr);
36143972b0daSStefano Zampini   ierr = PetscFree(auxis);CHKERRQ(ierr);
36150c7d97c5SJed Brown   PetscFunctionReturn(0);
36160c7d97c5SJed Brown 
36170c7d97c5SJed Brown }
36180c7d97c5SJed Brown 
36190c7d97c5SJed Brown /* -------------------------------------------------------------------------- */
36200c7d97c5SJed Brown 
36210c7d97c5SJed Brown /* The following code has been adapted from function IsConnectedSubdomain contained
3622da1bb401SStefano Zampini    in source file contig.c of METIS library (version 5.0.1)
3623da1bb401SStefano Zampini    It finds connected components of each partition labeled from 1 to n_dist  */
36240c7d97c5SJed Brown 
36250c7d97c5SJed Brown #undef __FUNCT__
36260c7d97c5SJed Brown #define __FUNCT__ "PCBDDCFindConnectedComponents"
36279c0446d6SStefano Zampini static PetscErrorCode PCBDDCFindConnectedComponents(PCBDDCGraph graph, PetscInt n_dist )
36280c7d97c5SJed Brown {
36290c7d97c5SJed Brown   PetscInt i, j, k, nvtxs, first, last, nleft, ncmps,pid,cum_queue,n,ncmps_pid;
36300c7d97c5SJed Brown   PetscInt *xadj, *adjncy, *where, *queue;
36310c7d97c5SJed Brown   PetscInt *cptr;
36320c7d97c5SJed Brown   PetscBool *touched;
36330c7d97c5SJed Brown 
36340c7d97c5SJed Brown   PetscFunctionBegin;
36350c7d97c5SJed Brown 
36360c7d97c5SJed Brown   nvtxs   = graph->nvtxs;
36370c7d97c5SJed Brown   xadj    = graph->xadj;
36380c7d97c5SJed Brown   adjncy  = graph->adjncy;
36390c7d97c5SJed Brown   where   = graph->where;
36400c7d97c5SJed Brown   touched = graph->touched;
36410c7d97c5SJed Brown   queue   = graph->queue;
36420c7d97c5SJed Brown   cptr    = graph->cptr;
36430c7d97c5SJed Brown 
36440c7d97c5SJed Brown   for (i=0; i<nvtxs; i++)
36450c7d97c5SJed Brown     touched[i] = PETSC_FALSE;
36460c7d97c5SJed Brown 
36470c7d97c5SJed Brown   cum_queue=0;
36480c7d97c5SJed Brown   ncmps=0;
36490c7d97c5SJed Brown 
36500c7d97c5SJed Brown   for(n=0; n<n_dist; n++) {
3651da1bb401SStefano Zampini     pid = n+1;  /* partition labeled by 0 is discarded */
36520c7d97c5SJed Brown     nleft = 0;
36530c7d97c5SJed Brown     for (i=0; i<nvtxs; i++) {
36540c7d97c5SJed Brown       if (where[i] == pid)
36550c7d97c5SJed Brown         nleft++;
36560c7d97c5SJed Brown     }
36570c7d97c5SJed Brown     for (i=0; i<nvtxs; i++) {
36580c7d97c5SJed Brown       if (where[i] == pid)
36590c7d97c5SJed Brown         break;
36600c7d97c5SJed Brown     }
36610c7d97c5SJed Brown     touched[i] = PETSC_TRUE;
36620c7d97c5SJed Brown     queue[cum_queue] = i;
36630c7d97c5SJed Brown     first = 0; last = 1;
36640c7d97c5SJed Brown     cptr[ncmps] = cum_queue;  /* This actually points to queue */
36650c7d97c5SJed Brown     ncmps_pid = 0;
36660c7d97c5SJed Brown     while (first != nleft) {
36670c7d97c5SJed Brown       if (first == last) { /* Find another starting vertex */
36680c7d97c5SJed Brown         cptr[++ncmps] = first+cum_queue;
36690c7d97c5SJed Brown         ncmps_pid++;
36700c7d97c5SJed Brown         for (i=0; i<nvtxs; i++) {
36710c7d97c5SJed Brown           if (where[i] == pid && !touched[i])
36720c7d97c5SJed Brown             break;
36730c7d97c5SJed Brown         }
36740c7d97c5SJed Brown         queue[cum_queue+last] = i;
36750c7d97c5SJed Brown         last++;
36760c7d97c5SJed Brown         touched[i] = PETSC_TRUE;
36770c7d97c5SJed Brown       }
36780c7d97c5SJed Brown       i = queue[cum_queue+first];
36790c7d97c5SJed Brown       first++;
36800c7d97c5SJed Brown       for (j=xadj[i]; j<xadj[i+1]; j++) {
36810c7d97c5SJed Brown         k = adjncy[j];
36820c7d97c5SJed Brown         if (where[k] == pid && !touched[k]) {
36830c7d97c5SJed Brown           queue[cum_queue+last] = k;
36840c7d97c5SJed Brown           last++;
36850c7d97c5SJed Brown           touched[k] = PETSC_TRUE;
36860c7d97c5SJed Brown         }
36870c7d97c5SJed Brown       }
36880c7d97c5SJed Brown     }
36890c7d97c5SJed Brown     cptr[++ncmps] = first+cum_queue;
36900c7d97c5SJed Brown     ncmps_pid++;
36910c7d97c5SJed Brown     cum_queue=cptr[ncmps];
3692a0ba757dSStefano Zampini     graph->where_ncmps[n] = ncmps_pid;
36930c7d97c5SJed Brown   }
36940c7d97c5SJed Brown   graph->ncmps = ncmps;
36950c7d97c5SJed Brown 
36960c7d97c5SJed Brown   PetscFunctionReturn(0);
36970c7d97c5SJed Brown }
3698